diff mbox series

[3/6] fs: Split fcntl_rw_hint()

Message ID 20240131205237.3540210-4-bvanassche@acm.org (mailing list archive)
State New, archived
Headers show
Series Restore data lifetime support | expand

Commit Message

Bart Van Assche Jan. 31, 2024, 8:52 p.m. UTC
Split fcntl_rw_hint() such that there is one helper function per fcntl. No
functionality is changed by this patch.

Reviewed-by: Christoph Hellwig <hch@lst.de>
Suggested-by: Christoph Hellwig <hch@lst.de>
Reviewed-by: Kanchan Joshi <joshi.k@samsung.com>
Cc: Jeff Layton <jlayton@kernel.org>
Cc: Chuck Lever <chuck.lever@oracle.com>
Cc: Jens Axboe <axboe@kernel.dk>
Cc: Stephen Rothwell <sfr@canb.auug.org.au>
Signed-off-by: Bart Van Assche <bvanassche@acm.org>
---
 fs/fcntl.c | 47 ++++++++++++++++++++++++++---------------------
 1 file changed, 26 insertions(+), 21 deletions(-)

Comments

Dave Chinner Jan. 31, 2024, 9:07 p.m. UTC | #1
On Wed, Jan 31, 2024 at 12:52:34PM -0800, Bart Van Assche wrote:
> Split fcntl_rw_hint() such that there is one helper function per fcntl. No
> functionality is changed by this patch.
> 
> Reviewed-by: Christoph Hellwig <hch@lst.de>
> Suggested-by: Christoph Hellwig <hch@lst.de>
> Reviewed-by: Kanchan Joshi <joshi.k@samsung.com>
> Cc: Jeff Layton <jlayton@kernel.org>
> Cc: Chuck Lever <chuck.lever@oracle.com>
> Cc: Jens Axboe <axboe@kernel.dk>
> Cc: Stephen Rothwell <sfr@canb.auug.org.au>
> Signed-off-by: Bart Van Assche <bvanassche@acm.org>
> ---
>  fs/fcntl.c | 47 ++++++++++++++++++++++++++---------------------
>  1 file changed, 26 insertions(+), 21 deletions(-)
> 
> diff --git a/fs/fcntl.c b/fs/fcntl.c
> index f3bc4662455f..5fa2d95114bf 100644
> --- a/fs/fcntl.c
> +++ b/fs/fcntl.c
> @@ -290,32 +290,35 @@ static bool rw_hint_valid(u64 hint)
>  	}
>  }
>  
> -static long fcntl_rw_hint(struct file *file, unsigned int cmd,
> -			  unsigned long arg)
> +static long fcntl_get_rw_hint(struct file *file, unsigned int cmd,
> +			      unsigned long arg)
>  {
>  	struct inode *inode = file_inode(file);
>  	u64 __user *argp = (u64 __user *)arg;
> -	u64 hint;
> +	u64 hint = inode->i_write_hint;
>  
> -	switch (cmd) {
> -	case F_GET_RW_HINT:
> -		hint = inode->i_write_hint;
> -		if (copy_to_user(argp, &hint, sizeof(*argp)))
> -			return -EFAULT;
> -		return 0;
> -	case F_SET_RW_HINT:
> -		if (copy_from_user(&hint, argp, sizeof(hint)))
> -			return -EFAULT;
> -		if (!rw_hint_valid(hint))
> -			return -EINVAL;
> +	if (copy_to_user(argp, &hint, sizeof(*argp)))
> +		return -EFAULT;
> +	return 0;
> +}
>  
> -		inode_lock(inode);
> -		inode->i_write_hint = hint;
> -		inode_unlock(inode);
> -		return 0;
> -	default:
> +static long fcntl_set_rw_hint(struct file *file, unsigned int cmd,
> +			      unsigned long arg)
> +{
> +	struct inode *inode = file_inode(file);
> +	u64 __user *argp = (u64 __user *)arg;
> +	u64 hint;
> +
> +	if (copy_from_user(&hint, argp, sizeof(hint)))
> +		return -EFAULT;
> +	if (!rw_hint_valid(hint))
>  		return -EINVAL;
> -	}
> +
> +	inode_lock(inode);
> +	inode->i_write_hint = hint;
> +	inode_unlock(inode);

What is this locking serialising against? The inode may or may not
be locked when we access this in IO path, so why isn't this just
WRITE_ONCE() here and READ_ONCE() in the IO paths?

-Dave.
Bart Van Assche Feb. 1, 2024, 5:38 p.m. UTC | #2
On 1/31/24 13:07, Dave Chinner wrote:
> On Wed, Jan 31, 2024 at 12:52:34PM -0800, Bart Van Assche wrote:
>> +	inode_lock(inode);
>> +	inode->i_write_hint = hint;
>> +	inode_unlock(inode);
> 
> What is this locking serialising against? The inode may or may not
> be locked when we access this in IO path, so why isn't this just
> WRITE_ONCE() here and READ_ONCE() in the IO paths?

How about using WRITE_ONCE()/READ_ONCE() in the fcntl implementations and
regular reads in the I/O paths? Using F_SET_RW_HINT while I/O is ongoing
is racy - there are no guarantees about how F_SET_RW_HINT will affect I/O
that has already been submitted. Hence, I think that it is acceptable to
use regular reads for i_write_hint in the I/O paths.

Thanks,

Bart.
diff mbox series

Patch

diff --git a/fs/fcntl.c b/fs/fcntl.c
index f3bc4662455f..5fa2d95114bf 100644
--- a/fs/fcntl.c
+++ b/fs/fcntl.c
@@ -290,32 +290,35 @@  static bool rw_hint_valid(u64 hint)
 	}
 }
 
-static long fcntl_rw_hint(struct file *file, unsigned int cmd,
-			  unsigned long arg)
+static long fcntl_get_rw_hint(struct file *file, unsigned int cmd,
+			      unsigned long arg)
 {
 	struct inode *inode = file_inode(file);
 	u64 __user *argp = (u64 __user *)arg;
-	u64 hint;
+	u64 hint = inode->i_write_hint;
 
-	switch (cmd) {
-	case F_GET_RW_HINT:
-		hint = inode->i_write_hint;
-		if (copy_to_user(argp, &hint, sizeof(*argp)))
-			return -EFAULT;
-		return 0;
-	case F_SET_RW_HINT:
-		if (copy_from_user(&hint, argp, sizeof(hint)))
-			return -EFAULT;
-		if (!rw_hint_valid(hint))
-			return -EINVAL;
+	if (copy_to_user(argp, &hint, sizeof(*argp)))
+		return -EFAULT;
+	return 0;
+}
 
-		inode_lock(inode);
-		inode->i_write_hint = hint;
-		inode_unlock(inode);
-		return 0;
-	default:
+static long fcntl_set_rw_hint(struct file *file, unsigned int cmd,
+			      unsigned long arg)
+{
+	struct inode *inode = file_inode(file);
+	u64 __user *argp = (u64 __user *)arg;
+	u64 hint;
+
+	if (copy_from_user(&hint, argp, sizeof(hint)))
+		return -EFAULT;
+	if (!rw_hint_valid(hint))
 		return -EINVAL;
-	}
+
+	inode_lock(inode);
+	inode->i_write_hint = hint;
+	inode_unlock(inode);
+
+	return 0;
 }
 
 static long do_fcntl(int fd, unsigned int cmd, unsigned long arg,
@@ -421,8 +424,10 @@  static long do_fcntl(int fd, unsigned int cmd, unsigned long arg,
 		err = memfd_fcntl(filp, cmd, argi);
 		break;
 	case F_GET_RW_HINT:
+		err = fcntl_get_rw_hint(filp, cmd, arg);
+		break;
 	case F_SET_RW_HINT:
-		err = fcntl_rw_hint(filp, cmd, arg);
+		err = fcntl_set_rw_hint(filp, cmd, arg);
 		break;
 	default:
 		break;