[v3,9/9] fuse: allow parallel dio writes with FUSE_DIRECT_IO_ALLOW_MMAP

Message ID	20240208170603.2078871-10-amir73il@gmail.com (mailing list archive)
State	New, archived
Headers	show Received: from mail-wm1-f43.google.com (mail-wm1-f43.google.com [209.85.128.43]) (using TLSv1.2 with cipher ECDHE-RSA-AES128-GCM-SHA256 (128/128 bits)) (No client certificate requested) by smtp.subspace.kernel.org (Postfix) with ESMTPS id 6E42F1272D9 for <linux-fsdevel@vger.kernel.org>; Thu, 8 Feb 2024 17:09:24 +0000 (UTC) From: Amir Goldstein <amir73il@gmail.com> To: Miklos Szeredi <miklos@szeredi.hu> Cc: Bernd Schubert <bernd.schubert@fastmail.fm>, linux-fsdevel@vger.kernel.org, Bernd Schubert <bschubert@ddn.com> Subject: [PATCH v3 9/9] fuse: allow parallel dio writes with FUSE_DIRECT_IO_ALLOW_MMAP Date: Thu, 8 Feb 2024 19:06:03 +0200 Message-Id: <20240208170603.2078871-10-amir73il@gmail.com> In-Reply-To: <20240208170603.2078871-1-amir73il@gmail.com> References: <20240208170603.2078871-1-amir73il@gmail.com> Precedence: bulk MIME-Version: 1.0 Content-Transfer-Encoding: 8bit
Series	fuse: inode IO modes and mmap + parallel dio \| expand [v3,0/9] fuse: inode IO modes and mmap + parallel dio [v3,1/9] fuse: Fix VM_MAYSHARE and direct_io_allow_mmap [v3,2/9] fuse: Create helper function if DIO write needs exclusive lock [v3,3/9] fuse: Add fuse_dio_lock/unlock helper functions [v3,4/9] fuse: factor out helper fuse_truncate_update_attr() [v3,5/9] fuse: allocate ff->release_args only if release is needed [v3,6/9] fuse: break up fuse_open_common() [v3,7/9] fuse: prepare for failing open response [v3,8/9] fuse: introduce inode io modes [v3,9/9] fuse: allow parallel dio writes with FUSE_DIRECT_IO_ALLOW_MMAP

diff --git a/fs/fuse/file.c b/fs/fuse/file.c index 29e18e5a6f6c..eb226457c4bd 100644 --- a/fs/fuse/file.c +++ b/fs/fuse/file.c @@ -1335,6 +1335,7 @@ static bool fuse_dio_wr_exclusive_lock(struct kiocb *iocb, struct iov_iter *from struct file *file = iocb->ki_filp; struct fuse_file *ff = file->private_data; struct inode *inode = file_inode(iocb->ki_filp); + struct fuse_inode *fi = get_fuse_inode(inode); /* server side has to advise that it supports parallel dio writes */ if (!(ff->open_flags & FOPEN_PARALLEL_DIRECT_WRITES)) @@ -1346,11 +1347,9 @@ static bool fuse_dio_wr_exclusive_lock(struct kiocb *iocb, struct iov_iter *from if (iocb->ki_flags & IOCB_APPEND) return true; - /* combination opf page access and direct-io difficult, shared - * locks actually introduce a conflict. - */ - if (get_fuse_conn(inode)->direct_io_allow_mmap) - return true; + /* shared locks are not allowed with parallel page cache IO */ + if (test_bit(FUSE_I_CACHE_IO_MODE, &fi->state)) + return false; /* parallel dio beyond eof is at least for now not supported */ if (fuse_io_past_eof(iocb, from)) @@ -1370,10 +1369,14 @@ static void fuse_dio_lock(struct kiocb *iocb, struct iov_iter *from, } else { inode_lock_shared(inode); /* - * Previous check was without inode lock and might have raced, - * check again. + * New parallel dio allowed only if inode is not in caching + * mode and denies new opens in caching mode. This check + * should be performed only after taking shared inode lock. + * Previous past eof check was without inode lock and might + * have raced, so check it again. 
 */ - if (fuse_io_past_eof(iocb, from)) { + if (fuse_io_past_eof(iocb, from) || + fuse_file_uncached_io_start(inode) != 0) { inode_unlock_shared(inode); inode_lock(inode); *exclusive = true; @@ -1386,6 +1389,8 @@ static void fuse_dio_unlock(struct inode *inode, bool exclusive) if (exclusive) { inode_unlock(inode); } else { + /* Allow opens in caching mode after last parallel dio end */ + fuse_file_uncached_io_end(inode); inode_unlock_shared(inode); } } @@ -2521,6 +2526,10 @@ static int fuse_file_mmap(struct file *file, struct vm_area_struct *vma) if (FUSE_IS_DAX(file_inode(file))) return fuse_dax_mmap(file, vma); + /* + * FOPEN_DIRECT_IO handling is special compared to O_DIRECT, + * as it does not allow MAP_SHARED mmap without FUSE_DIRECT_IO_ALLOW_MMAP. + */ if (ff->open_flags & FOPEN_DIRECT_IO) { /* * Can't provide the coherency needed for MAP_SHARED @@ -2533,6 +2542,8 @@ static int fuse_file_mmap(struct file *file, struct vm_area_struct *vma) /* * First mmap of direct_io file enters caching inode io mode. + * Also waits for parallel dio writers to go into serial mode + * (exclusive instead of shared lock). 
*/ rc = fuse_file_io_mmap(ff, file_inode(file)); if (rc) @@ -3312,6 +3323,7 @@ void fuse_init_file_inode(struct inode *inode, unsigned int flags) fi->writectr = 0; fi->iocachectr = 0; init_waitqueue_head(&fi->page_waitq); + init_waitqueue_head(&fi->direct_io_waitq); fi->writepages = RB_ROOT; if (IS_ENABLED(CONFIG_FUSE_DAX)) diff --git a/fs/fuse/fuse_i.h b/fs/fuse/fuse_i.h index 5e5465f6a1ac..dede4378c719 100644 --- a/fs/fuse/fuse_i.h +++ b/fs/fuse/fuse_i.h @@ -129,6 +129,9 @@ struct fuse_inode { /* Waitq for writepage completion */ wait_queue_head_t page_waitq; + /* waitq for direct-io completion */ + wait_queue_head_t direct_io_waitq; + /* List of writepage requestst (pending or sent) */ struct rb_root writepages; }; diff --git a/fs/fuse/iomode.c b/fs/fuse/iomode.c index 13faae77aec4..acd0833ae873 100644 --- a/fs/fuse/iomode.c +++ b/fs/fuse/iomode.c @@ -12,18 +12,45 @@ #include <linux/file.h> #include <linux/fs.h> +/* + * Return true if need to wait for new opens in caching mode. + */ +static inline bool fuse_is_io_cache_wait(struct fuse_inode *fi) +{ + return READ_ONCE(fi->iocachectr) < 0; +} + /* * Request an open in caching mode. + * Blocks new parallel dio writes and waits for the in-progress parallel dio + * writes to complete. * Return 0 if in caching mode. */ static int fuse_inode_get_io_cache(struct fuse_inode *fi) { + int err = 0; + assert_spin_locked(&fi->lock); - if (fi->iocachectr < 0) - return -ETXTBSY; - if (fi->iocachectr++ == 0) - set_bit(FUSE_I_CACHE_IO_MODE, &fi->state); - return 0; + /* + * Setting the bit advises new direct-io writes to use an exclusive + * lock - without it the wait below might be forever. 
+ */ + set_bit(FUSE_I_CACHE_IO_MODE, &fi->state); + while (!err && fuse_is_io_cache_wait(fi)) { + spin_unlock(&fi->lock); + err = wait_event_killable(fi->direct_io_waitq, + !fuse_is_io_cache_wait(fi)); + spin_lock(&fi->lock); + } + /* + * Enter caching mode or clear the FUSE_I_CACHE_IO_MODE bit if we + * failed to enter caching mode and no other caching open exists. + */ + if (!err) + fi->iocachectr++; + else if (fi->iocachectr <= 0) + clear_bit(FUSE_I_CACHE_IO_MODE, &fi->state); + return err; } /* @@ -102,10 +129,13 @@ int fuse_file_uncached_io_start(struct inode *inode) void fuse_file_uncached_io_end(struct inode *inode) { struct fuse_inode *fi = get_fuse_inode(inode); + int uncached_io; spin_lock(&fi->lock); - fuse_inode_allow_io_cache(fi); + uncached_io = fuse_inode_allow_io_cache(fi); spin_unlock(&fi->lock); + if (!uncached_io) + wake_up(&fi->direct_io_waitq); } /* Open flags to determine regular file io mode */ @@ -155,13 +185,10 @@ int fuse_file_io_open(struct file *file, struct inode *inode) /* * First caching file open enters caching inode io mode. - * First parallel dio open denies caching inode io mode. */ err = 0; if (ff->open_flags & FOPEN_CACHE_IO) err = fuse_file_cached_io_start(inode); - else if (ff->open_flags & FOPEN_PARALLEL_DIRECT_WRITES) - err = fuse_file_uncached_io_start(inode); if (err) goto fail;

[v3,9/9] fuse: allow parallel dio writes with FUSE_DIRECT_IO_ALLOW_MMAP

Commit Message

Comments

Patch