diff mbox series

xfs: dax: facilitate EXPERIMENTAL warning for dax=inode case

Message ID 20210826173012.273932-1-bodonnel@redhat.com (mailing list archive)
State Deferred, archived
Headers show
Series xfs: dax: facilitate EXPERIMENTAL warning for dax=inode case | expand

Commit Message

Bill O'Donnell Aug. 26, 2021, 5:30 p.m. UTC
When the dax mount mode became tri-state with the addition of the dax=inode
case, the EXPERIMENTAL warning on mount was missed for that case. Add logic
to emit the warning in the same way as for the 'dax=always' case.

Signed-off-by: Bill O'Donnell <bodonnel@redhat.com>
---
 fs/xfs/xfs_mount.h | 2 ++
 fs/xfs/xfs_super.c | 8 +++++---
 2 files changed, 7 insertions(+), 3 deletions(-)

Comments

Darrick J. Wong Aug. 26, 2021, 6:09 p.m. UTC | #1
On Thu, Aug 26, 2021 at 12:30:12PM -0500, Bill O'Donnell wrote:
> When dax-mode was tri-stated by adding dax=inode case, the EXPERIMENTAL
> warning on mount was missed for the case. Add logic to handle the
> warning similar to that of the 'dax=always' case.
> 
> Signed-off-by: Bill O'Donnell <bodonnel@redhat.com>
> ---
>  fs/xfs/xfs_mount.h | 2 ++
>  fs/xfs/xfs_super.c | 8 +++++---
>  2 files changed, 7 insertions(+), 3 deletions(-)
> 
> diff --git a/fs/xfs/xfs_mount.h b/fs/xfs/xfs_mount.h
> index e091f3b3fa15..c9243a1b8d05 100644
> --- a/fs/xfs/xfs_mount.h
> +++ b/fs/xfs/xfs_mount.h
> @@ -277,6 +277,7 @@ typedef struct xfs_mount {
>  #define XFS_FEAT_NEEDSREPAIR	(1ULL << 25)	/* needs xfs_repair */
>  
>  /* Mount features */
> +#define XFS_FEAT_DAX_INODE	(1ULL << 47)	/* DAX enabled */
>  #define XFS_FEAT_NOATTR2	(1ULL << 48)	/* disable attr2 creation */
>  #define XFS_FEAT_NOALIGN	(1ULL << 49)	/* ignore alignment */
>  #define XFS_FEAT_ALLOCSIZE	(1ULL << 50)	/* user specified allocation size */
> @@ -359,6 +360,7 @@ __XFS_HAS_FEAT(swalloc, SWALLOC)
>  __XFS_HAS_FEAT(filestreams, FILESTREAMS)
>  __XFS_HAS_FEAT(dax_always, DAX_ALWAYS)
>  __XFS_HAS_FEAT(dax_never, DAX_NEVER)
> +__XFS_HAS_FEAT(dax_inode, DAX_INODE)
>  __XFS_HAS_FEAT(norecovery, NORECOVERY)
>  __XFS_HAS_FEAT(nouuid, NOUUID)
>  
> diff --git a/fs/xfs/xfs_super.c b/fs/xfs/xfs_super.c
> index 5e73ac78bf2f..f73f3687f0a8 100644
> --- a/fs/xfs/xfs_super.c
> +++ b/fs/xfs/xfs_super.c
> @@ -84,15 +84,16 @@ xfs_mount_set_dax_mode(
>  {
>  	switch (mode) {
>  	case XFS_DAX_INODE:
> +		mp->m_features |= XFS_FEAT_DAX_INODE;
>  		mp->m_features &= ~(XFS_FEAT_DAX_ALWAYS | XFS_FEAT_DAX_NEVER);
>  		break;
>  	case XFS_DAX_ALWAYS:
>  		mp->m_features |= XFS_FEAT_DAX_ALWAYS;
> -		mp->m_features &= ~XFS_FEAT_DAX_NEVER;
> +		mp->m_features &= ~(XFS_FEAT_DAX_NEVER | XFS_FEAT_DAX_INODE);
>  		break;
>  	case XFS_DAX_NEVER:
>  		mp->m_features |= XFS_FEAT_DAX_NEVER;
> -		mp->m_features &= ~XFS_FEAT_DAX_ALWAYS;
> +		mp->m_features &= ~(XFS_FEAT_DAX_ALWAYS | XFS_FEAT_DAX_INODE);
>  		break;
>  	}
>  }
> @@ -189,6 +190,7 @@ xfs_fs_show_options(
>  		{ XFS_FEAT_LARGE_IOSIZE,	",largeio" },
>  		{ XFS_FEAT_DAX_ALWAYS,		",dax=always" },
>  		{ XFS_FEAT_DAX_NEVER,		",dax=never" },
> +		{ XFS_FEAT_DAX_INODE,		",dax=inode" },
>  		{ 0, NULL }
>  	};
>  	struct xfs_mount	*mp = XFS_M(root->d_sb);
> @@ -1584,7 +1586,7 @@ xfs_fs_fill_super(
>  	if (xfs_has_crc(mp))
>  		sb->s_flags |= SB_I_VERSION;
>  
> -	if (xfs_has_dax_always(mp)) {
> +	if (xfs_has_dax_always(mp) || xfs_has_dax_inode(mp)) {

Er... can't this be done without burning another feature bit by:

	if (xfs_has_dax_always(mp) || (!xfs_has_dax_always(mp) &&
				       !xfs_has_dax_never(mp))) {
		...
		xfs_warn(mp, "DAX IS EXPERIMENTAL");
	}

--D

>  		bool rtdev_is_dax = false, datadev_is_dax;
>  
>  		xfs_warn(mp,
> -- 
> 2.31.1
>
Bill O'Donnell Aug. 26, 2021, 6:14 p.m. UTC | #2
On Thu, Aug 26, 2021 at 11:09:47AM -0700, Darrick J. Wong wrote:
> On Thu, Aug 26, 2021 at 12:30:12PM -0500, Bill O'Donnell wrote:
> > When dax-mode was tri-stated by adding dax=inode case, the EXPERIMENTAL
> > warning on mount was missed for the case. Add logic to handle the
> > warning similar to that of the 'dax=always' case.
> > 
> > Signed-off-by: Bill O'Donnell <bodonnel@redhat.com>
> > ---
> >  fs/xfs/xfs_mount.h | 2 ++
> >  fs/xfs/xfs_super.c | 8 +++++---
> >  2 files changed, 7 insertions(+), 3 deletions(-)
> > 
> > diff --git a/fs/xfs/xfs_mount.h b/fs/xfs/xfs_mount.h
> > index e091f3b3fa15..c9243a1b8d05 100644
> > --- a/fs/xfs/xfs_mount.h
> > +++ b/fs/xfs/xfs_mount.h
> > @@ -277,6 +277,7 @@ typedef struct xfs_mount {
> >  #define XFS_FEAT_NEEDSREPAIR	(1ULL << 25)	/* needs xfs_repair */
> >  
> >  /* Mount features */
> > +#define XFS_FEAT_DAX_INODE	(1ULL << 47)	/* DAX enabled */
> >  #define XFS_FEAT_NOATTR2	(1ULL << 48)	/* disable attr2 creation */
> >  #define XFS_FEAT_NOALIGN	(1ULL << 49)	/* ignore alignment */
> >  #define XFS_FEAT_ALLOCSIZE	(1ULL << 50)	/* user specified allocation size */
> > @@ -359,6 +360,7 @@ __XFS_HAS_FEAT(swalloc, SWALLOC)
> >  __XFS_HAS_FEAT(filestreams, FILESTREAMS)
> >  __XFS_HAS_FEAT(dax_always, DAX_ALWAYS)
> >  __XFS_HAS_FEAT(dax_never, DAX_NEVER)
> > +__XFS_HAS_FEAT(dax_inode, DAX_INODE)
> >  __XFS_HAS_FEAT(norecovery, NORECOVERY)
> >  __XFS_HAS_FEAT(nouuid, NOUUID)
> >  
> > diff --git a/fs/xfs/xfs_super.c b/fs/xfs/xfs_super.c
> > index 5e73ac78bf2f..f73f3687f0a8 100644
> > --- a/fs/xfs/xfs_super.c
> > +++ b/fs/xfs/xfs_super.c
> > @@ -84,15 +84,16 @@ xfs_mount_set_dax_mode(
> >  {
> >  	switch (mode) {
> >  	case XFS_DAX_INODE:
> > +		mp->m_features |= XFS_FEAT_DAX_INODE;
> >  		mp->m_features &= ~(XFS_FEAT_DAX_ALWAYS | XFS_FEAT_DAX_NEVER);
> >  		break;
> >  	case XFS_DAX_ALWAYS:
> >  		mp->m_features |= XFS_FEAT_DAX_ALWAYS;
> > -		mp->m_features &= ~XFS_FEAT_DAX_NEVER;
> > +		mp->m_features &= ~(XFS_FEAT_DAX_NEVER | XFS_FEAT_DAX_INODE);
> >  		break;
> >  	case XFS_DAX_NEVER:
> >  		mp->m_features |= XFS_FEAT_DAX_NEVER;
> > -		mp->m_features &= ~XFS_FEAT_DAX_ALWAYS;
> > +		mp->m_features &= ~(XFS_FEAT_DAX_ALWAYS | XFS_FEAT_DAX_INODE);
> >  		break;
> >  	}
> >  }
> > @@ -189,6 +190,7 @@ xfs_fs_show_options(
> >  		{ XFS_FEAT_LARGE_IOSIZE,	",largeio" },
> >  		{ XFS_FEAT_DAX_ALWAYS,		",dax=always" },
> >  		{ XFS_FEAT_DAX_NEVER,		",dax=never" },
> > +		{ XFS_FEAT_DAX_INODE,		",dax=inode" },
> >  		{ 0, NULL }
> >  	};
> >  	struct xfs_mount	*mp = XFS_M(root->d_sb);
> > @@ -1584,7 +1586,7 @@ xfs_fs_fill_super(
> >  	if (xfs_has_crc(mp))
> >  		sb->s_flags |= SB_I_VERSION;
> >  
> > -	if (xfs_has_dax_always(mp)) {
> > +	if (xfs_has_dax_always(mp) || xfs_has_dax_inode(mp)) {
> 
> Er... can't this be done without burning another feature bit by:
> 
> 	if (xfs_has_dax_always(mp) || (!xfs_has_dax_always(mp) &&
> 				       !xfs_has_dax_never(mp))) {
> 		...
> 		xfs_warn(mp, "DAX IS EXPERIMENTAL");
> 	}
> 

Good idea. I'll send a v2.
Thanks-
Bill


> --D
> 
> >  		bool rtdev_is_dax = false, datadev_is_dax;
> >  
> >  		xfs_warn(mp,
> > -- 
> > 2.31.1
> > 
>
Eric Sandeen Aug. 26, 2021, 6:16 p.m. UTC | #3
On 8/26/21 1:09 PM, Darrick J. Wong wrote:
> On Thu, Aug 26, 2021 at 12:30:12PM -0500, Bill O'Donnell wrote:

>> @@ -1584,7 +1586,7 @@ xfs_fs_fill_super(
>>   	if (xfs_has_crc(mp))
>>   		sb->s_flags |= SB_I_VERSION;
>>   
>> -	if (xfs_has_dax_always(mp)) {
>> +	if (xfs_has_dax_always(mp) || xfs_has_dax_inode(mp)) {
> 
> Er... can't this be done without burning another feature bit by:
> 
> 	if (xfs_has_dax_always(mp) || (!xfs_has_dax_always(mp) &&
> 				       !xfs_has_dax_never(mp))) {
> 		...
> 		xfs_warn(mp, "DAX IS EXPERIMENTAL");
> 	}

changing this conditional in this way will also fail dax=inode mounts on
reflink-capable (i.e. default) filesystems, no?

-	if (xfs_has_dax_always(mp)) {
+	if (xfs_has_dax_always(mp) || $NEW_DAX_INODE_TEST) {

...
                 if (xfs_has_reflink(mp)) {
                         xfs_alert(mp,
                 "DAX and reflink cannot be used together!");
                         error = -EINVAL;
                         goto out_filestream_unmount;
                 }
         }

-Eric
Bill O'Donnell Aug. 26, 2021, 10:08 p.m. UTC | #4
On Thu, Aug 26, 2021 at 01:16:22PM -0500, Eric Sandeen wrote:
> 
> On 8/26/21 1:09 PM, Darrick J. Wong wrote:
> > On Thu, Aug 26, 2021 at 12:30:12PM -0500, Bill O'Donnell wrote:
> 
> > > @@ -1584,7 +1586,7 @@ xfs_fs_fill_super(
> > >   	if (xfs_has_crc(mp))
> > >   		sb->s_flags |= SB_I_VERSION;
> > > -	if (xfs_has_dax_always(mp)) {
> > > +	if (xfs_has_dax_always(mp) || xfs_has_dax_inode(mp)) {
> > 
> > Er... can't this be done without burning another feature bit by:
> > 
> > 	if (xfs_has_dax_always(mp) || (!xfs_has_dax_always(mp) &&
> > 				       !xfs_has_dax_never(mp))) {
> > 		...
> > 		xfs_warn(mp, "DAX IS EXPERIMENTAL");
> > 	}
> 
> changing this conditional in this way will also fail dax=inode mounts on
> reflink-capable (i.e. default) filesystems, no?

Correct. My original patch tests fine, and still handles the reflink and dax
incompatibility. The new suggested logic is problematic. 
-Bill

> 
> -	if (xfs_has_dax_always(mp)) {
> +	if (xfs_has_dax_always(mp) || $NEW_DAX_INODE_TEST) {
> 
> ...
>                 if (xfs_has_reflink(mp)) {
>                         xfs_alert(mp,
>                 "DAX and reflink cannot be used together!");
>                         error = -EINVAL;
>                         goto out_filestream_unmount;
>                 }
>         }
> 
> -Eric
>
Eric Sandeen Aug. 26, 2021, 11:43 p.m. UTC | #5
On 8/26/21 5:08 PM, Bill O'Donnell wrote:
> On Thu, Aug 26, 2021 at 01:16:22PM -0500, Eric Sandeen wrote:
>>
>> On 8/26/21 1:09 PM, Darrick J. Wong wrote:
>>> On Thu, Aug 26, 2021 at 12:30:12PM -0500, Bill O'Donnell wrote:
>>
>>>> @@ -1584,7 +1586,7 @@ xfs_fs_fill_super(
>>>>    	if (xfs_has_crc(mp))
>>>>    		sb->s_flags |= SB_I_VERSION;
>>>> -	if (xfs_has_dax_always(mp)) {
>>>> +	if (xfs_has_dax_always(mp) || xfs_has_dax_inode(mp)) {
>>>
>>> Er... can't this be done without burning another feature bit by:
>>>
>>> 	if (xfs_has_dax_always(mp) || (!xfs_has_dax_always(mp) &&
>>> 				       !xfs_has_dax_never(mp))) {
>>> 		...
>>> 		xfs_warn(mp, "DAX IS EXPERIMENTAL");
>>> 	}
>>
>> changing this conditional in this way will also fail dax=inode mounts on
>> reflink-capable (i.e. default) filesystems, no?
> 
> Correct. My original patch tests fine, and still handles the reflink and dax
> incompatibility. The new suggested logic is problematic.
> -Bill

I think that both your proposed patch and Darrick's suggestion have this problem.

"mount -o dax=inode" makes your new xfs_has_dax_inode(mp) true, and in that
conditional, if the filesystem has reflink enabled, mount fails:

# mkfs.xfs -f /dev/pmem0p1
meta-data=/dev/pmem0p1           isize=512    agcount=4, agsize=4194304 blks
          =                       sectsz=4096  attr=2, projid32bit=1
          =                       crc=1        finobt=1, sparse=1, rmapbt=0
          =                       reflink=1    bigtime=0 inobtcount=0
data     =                       bsize=4096   blocks=16777216, imaxpct=25
          =                       sunit=0      swidth=0 blks
naming   =version 2              bsize=4096   ascii-ci=0, ftype=1
log      =internal log           bsize=4096   blocks=8192, version=2
          =                       sectsz=4096  sunit=1 blks, lazy-count=1
realtime =none                   extsz=4096   blocks=0, rtextents=0

# mount -o dax=inode /dev/pmem0p1 /mnt/test
mount: wrong fs type, bad option, bad superblock on /dev/pmem0p1,
        missing codepage or helper program, or other error

        In some cases useful info is found in syslog - try
        dmesg | tail or so.

# dmesg | tail -n 2
[  192.691733] XFS (pmem0p1): DAX enabled. Warning: EXPERIMENTAL, use at your own risk
[  192.700300] XFS (pmem0p1): DAX and reflink cannot be used together!
Bill O'Donnell Aug. 27, 2021, 2:03 p.m. UTC | #6
On Thu, Aug 26, 2021 at 06:43:44PM -0500, Eric Sandeen wrote:
> On 8/26/21 5:08 PM, Bill O'Donnell wrote:
> > On Thu, Aug 26, 2021 at 01:16:22PM -0500, Eric Sandeen wrote:
> > > 
> > > On 8/26/21 1:09 PM, Darrick J. Wong wrote:
> > > > On Thu, Aug 26, 2021 at 12:30:12PM -0500, Bill O'Donnell wrote:
> > > 
> > > > > @@ -1584,7 +1586,7 @@ xfs_fs_fill_super(
> > > > >    	if (xfs_has_crc(mp))
> > > > >    		sb->s_flags |= SB_I_VERSION;
> > > > > -	if (xfs_has_dax_always(mp)) {
> > > > > +	if (xfs_has_dax_always(mp) || xfs_has_dax_inode(mp)) {
> > > > 
> > > > Er... can't this be done without burning another feature bit by:
> > > > 
> > > > 	if (xfs_has_dax_always(mp) || (!xfs_has_dax_always(mp) &&
> > > > 				       !xfs_has_dax_never(mp))) {
> > > > 		...
> > > > 		xfs_warn(mp, "DAX IS EXPERIMENTAL");
> > > > 	}
> > > 
> > > changing this conditional in this way will also fail dax=inode mounts on
> > > reflink-capable (i.e. default) filesystems, no?
> > 
> > Correct. My original patch tests fine, and still handles the reflink and dax
> > incompatibility. The new suggested logic is problematic.
> > -Bill
> 
> I think that both your proposed patch and Darrick's suggestion have this problem.
> 
> "mount -o dax=inode" makes your new xfs_has_dax_inode(mp) true, and in that
> conditional, if the filesystem has reflink enabled, mount fails:
> 
> # mkfs.xfs -f /dev/pmem0p1
> meta-data=/dev/pmem0p1           isize=512    agcount=4, agsize=4194304 blks
>          =                       sectsz=4096  attr=2, projid32bit=1
>          =                       crc=1        finobt=1, sparse=1, rmapbt=0
>          =                       reflink=1    bigtime=0 inobtcount=0
> data     =                       bsize=4096   blocks=16777216, imaxpct=25
>          =                       sunit=0      swidth=0 blks
> naming   =version 2              bsize=4096   ascii-ci=0, ftype=1
> log      =internal log           bsize=4096   blocks=8192, version=2
>          =                       sectsz=4096  sunit=1 blks, lazy-count=1
> realtime =none                   extsz=4096   blocks=0, rtextents=0
> 
> # mount -o dax=inode /dev/pmem0p1 /mnt/test
> mount: wrong fs type, bad option, bad superblock on /dev/pmem0p1,
>        missing codepage or helper program, or other error
> 
>        In some cases useful info is found in syslog - try
>        dmesg | tail or so.
> 
> # dmesg | tail -n 2
> [  192.691733] XFS (pmem0p1): DAX enabled. Warning: EXPERIMENTAL, use at your own risk
> [  192.700300] XFS (pmem0p1): DAX and reflink cannot be used together!
> 

So, the "DAX enabled" message is a misnomer in this case. However, the incompatibility of DAX and reflink is
reflected in the next message, and indeed the mount fails. Is it now a matter of fixing
the message output so that it does not indicate "DAX enabled..."?

Thanks-
Bill
Eric Sandeen Aug. 27, 2021, 2:18 p.m. UTC | #7
On 8/27/21 9:03 AM, Bill O'Donnell wrote:
> On Thu, Aug 26, 2021 at 06:43:44PM -0500, Eric Sandeen wrote:
>> On 8/26/21 5:08 PM, Bill O'Donnell wrote:
>>> On Thu, Aug 26, 2021 at 01:16:22PM -0500, Eric Sandeen wrote:
>>>>
>>>> On 8/26/21 1:09 PM, Darrick J. Wong wrote:
>>>>> On Thu, Aug 26, 2021 at 12:30:12PM -0500, Bill O'Donnell wrote:
>>>>
>>>>>> @@ -1584,7 +1586,7 @@ xfs_fs_fill_super(
>>>>>>     	if (xfs_has_crc(mp))
>>>>>>     		sb->s_flags |= SB_I_VERSION;
>>>>>> -	if (xfs_has_dax_always(mp)) {
>>>>>> +	if (xfs_has_dax_always(mp) || xfs_has_dax_inode(mp)) {
>>>>>
>>>>> Er... can't this be done without burning another feature bit by:
>>>>>
>>>>> 	if (xfs_has_dax_always(mp) || (!xfs_has_dax_always(mp) &&
>>>>> 				       !xfs_has_dax_never(mp))) {
>>>>> 		...
>>>>> 		xfs_warn(mp, "DAX IS EXPERIMENTAL");
>>>>> 	}
>>>>
>>>> changing this conditional in this way will also fail dax=inode mounts on
>>>> reflink-capable (i.e. default) filesystems, no?
>>>
>>> Correct. My original patch tests fine, and still handles the reflink and dax
>>> incompatibility. The new suggested logic is problematic.
>>> -Bill
>>
>> I think that both your proposed patch and Darrick's suggestion have this problem.
>>
>> "mount -o dax=inode" makes your new xfs_has_dax_inode(mp) true, and in that
>> conditional, if the filesystem has reflink enabled, mount fails:
>>
>> # mkfs.xfs -f /dev/pmem0p1
>> meta-data=/dev/pmem0p1           isize=512    agcount=4, agsize=4194304 blks
>>           =                       sectsz=4096  attr=2, projid32bit=1
>>           =                       crc=1        finobt=1, sparse=1, rmapbt=0
>>           =                       reflink=1    bigtime=0 inobtcount=0
>> data     =                       bsize=4096   blocks=16777216, imaxpct=25
>>           =                       sunit=0      swidth=0 blks
>> naming   =version 2              bsize=4096   ascii-ci=0, ftype=1
>> log      =internal log           bsize=4096   blocks=8192, version=2
>>           =                       sectsz=4096  sunit=1 blks, lazy-count=1
>> realtime =none                   extsz=4096   blocks=0, rtextents=0
>>
>> # mount -o dax=inode /dev/pmem0p1 /mnt/test
>> mount: wrong fs type, bad option, bad superblock on /dev/pmem0p1,
>>         missing codepage or helper program, or other error
>>
>>         In some cases useful info is found in syslog - try
>>         dmesg | tail or so.
>>
>> # dmesg | tail -n 2
>> [  192.691733] XFS (pmem0p1): DAX enabled. Warning: EXPERIMENTAL, use at your own risk
>> [  192.700300] XFS (pmem0p1): DAX and reflink cannot be used together!
>>
> 
> So, the "DAX enabled" is a misnomer in this case. However the incompatibility of DAX and reflink is
> reflected in the next message, and indeed the mount fails. Is it now a matter of fixing
> the message output so as not to indicate "DAX enabled..."?

The mount should not fail, and it does not fail prior to your change.

In the past, we did not allow any mixing of a reflink-capable
filesystem with dax in any way.  Now, with per-inode dax, dax-enabled inodes and
reflink-enabled inodes can exist on the same filesystem, you just cannot have an
inode which is both dax-enabled and reflinked at the same time.

-Eric
Bill O'Donnell Aug. 27, 2021, 2:25 p.m. UTC | #8
On Fri, Aug 27, 2021 at 09:18:32AM -0500, Eric Sandeen wrote:
> On 8/27/21 9:03 AM, Bill O'Donnell wrote:
> > On Thu, Aug 26, 2021 at 06:43:44PM -0500, Eric Sandeen wrote:
> > > On 8/26/21 5:08 PM, Bill O'Donnell wrote:
> > > > On Thu, Aug 26, 2021 at 01:16:22PM -0500, Eric Sandeen wrote:
> > > > > 
> > > > > On 8/26/21 1:09 PM, Darrick J. Wong wrote:
> > > > > > On Thu, Aug 26, 2021 at 12:30:12PM -0500, Bill O'Donnell wrote:
> > > > > 
> > > > > > > @@ -1584,7 +1586,7 @@ xfs_fs_fill_super(
> > > > > > >     	if (xfs_has_crc(mp))
> > > > > > >     		sb->s_flags |= SB_I_VERSION;
> > > > > > > -	if (xfs_has_dax_always(mp)) {
> > > > > > > +	if (xfs_has_dax_always(mp) || xfs_has_dax_inode(mp)) {
> > > > > > 
> > > > > > Er... can't this be done without burning another feature bit by:
> > > > > > 
> > > > > > 	if (xfs_has_dax_always(mp) || (!xfs_has_dax_always(mp) &&
> > > > > > 				       !xfs_has_dax_never(mp))) {
> > > > > > 		...
> > > > > > 		xfs_warn(mp, "DAX IS EXPERIMENTAL");
> > > > > > 	}
> > > > > 
> > > > > changing this conditional in this way will also fail dax=inode mounts on
> > > > > reflink-capable (i.e. default) filesystems, no?
> > > > 
> > > > Correct. My original patch tests fine, and still handles the reflink and dax
> > > > incompatibility. The new suggested logic is problematic.
> > > > -Bill
> > > 
> > > I think that both your proposed patch and Darrick's suggestion have this problem.
> > > 
> > > "mount -o dax=inode" makes your new xfs_has_dax_inode(mp) true, and in that
> > > conditional, if the filesystem has reflink enabled, mount fails:
> > > 
> > > # mkfs.xfs -f /dev/pmem0p1
> > > meta-data=/dev/pmem0p1           isize=512    agcount=4, agsize=4194304 blks
> > >           =                       sectsz=4096  attr=2, projid32bit=1
> > >           =                       crc=1        finobt=1, sparse=1, rmapbt=0
> > >           =                       reflink=1    bigtime=0 inobtcount=0
> > > data     =                       bsize=4096   blocks=16777216, imaxpct=25
> > >           =                       sunit=0      swidth=0 blks
> > > naming   =version 2              bsize=4096   ascii-ci=0, ftype=1
> > > log      =internal log           bsize=4096   blocks=8192, version=2
> > >           =                       sectsz=4096  sunit=1 blks, lazy-count=1
> > > realtime =none                   extsz=4096   blocks=0, rtextents=0
> > > 
> > > # mount -o dax=inode /dev/pmem0p1 /mnt/test
> > > mount: wrong fs type, bad option, bad superblock on /dev/pmem0p1,
> > >         missing codepage or helper program, or other error
> > > 
> > >         In some cases useful info is found in syslog - try
> > >         dmesg | tail or so.
> > > 
> > > # dmesg | tail -n 2
> > > [  192.691733] XFS (pmem0p1): DAX enabled. Warning: EXPERIMENTAL, use at your own risk
> > > [  192.700300] XFS (pmem0p1): DAX and reflink cannot be used together!
> > > 
> > 
> > So, the "DAX enabled" is a misnomer in this case. However the incompatibility of DAX and reflink is
> > reflected in the next message, and indeed the mount fails. Is it now a matter of fixing
> > the message output so as not to indicate "DAX enabled..."?
> 
> The mount should not fail, and it does not fail prior to your change.
> 
> In the past, we did not allow any mixing of a reflink-capable
> filesystem with dax in any way.  Now, with per-inode dax, dax-enabled inodes and
> reflink-enabled inodes can exist on the same filesystem, you just cannot have an
> inode which is both dax-enabled and reflinked at the same time.

Ah. I missed that nuance. I had thought the incompatibility was
absolute. :/

The manpage for mkfs.xfs may need updating for the inode mode
(unless mine is old):
----------------snip------------------
"Note: the filesystem DAX mount option ( -o dax ) is incompatible
with reflink-enabled XFS filesystems. To use filesystem DAX with
XFS, specify the -m reflink=0 option to mkfs.xfs to disable the
reflink feature."
-------------------------------------
Thanks-
Bill
Eric Sandeen Aug. 27, 2021, 3:35 p.m. UTC | #9
On 8/27/21 9:25 AM, Bill O'Donnell wrote:
> On Fri, Aug 27, 2021 at 09:18:32AM -0500, Eric Sandeen wrote:
>> On 8/27/21 9:03 AM, Bill O'Donnell wrote:
>>> On Thu, Aug 26, 2021 at 06:43:44PM -0500, Eric Sandeen wrote:
>>>> On 8/26/21 5:08 PM, Bill O'Donnell wrote:
>>>>> On Thu, Aug 26, 2021 at 01:16:22PM -0500, Eric Sandeen wrote:
>>>>>>
>>>>>> On 8/26/21 1:09 PM, Darrick J. Wong wrote:
>>>>>>> On Thu, Aug 26, 2021 at 12:30:12PM -0500, Bill O'Donnell wrote:
>>>>>>
>>>>>>>> @@ -1584,7 +1586,7 @@ xfs_fs_fill_super(
>>>>>>>>      	if (xfs_has_crc(mp))
>>>>>>>>      		sb->s_flags |= SB_I_VERSION;
>>>>>>>> -	if (xfs_has_dax_always(mp)) {
>>>>>>>> +	if (xfs_has_dax_always(mp) || xfs_has_dax_inode(mp)) {
>>>>>>>
>>>>>>> Er... can't this be done without burning another feature bit by:
>>>>>>>
>>>>>>> 	if (xfs_has_dax_always(mp) || (!xfs_has_dax_always(mp) &&
>>>>>>> 				       !xfs_has_dax_never(mp))) {
>>>>>>> 		...
>>>>>>> 		xfs_warn(mp, "DAX IS EXPERIMENTAL");
>>>>>>> 	}
>>>>>>
>>>>>> changing this conditional in this way will also fail dax=inode mounts on
>>>>>> reflink-capable (i.e. default) filesystems, no?
>>>>>
>>>>> Correct. My original patch tests fine, and still handles the reflink and dax
>>>>> incompatibility. The new suggested logic is problematic.
>>>>> -Bill
>>>>
>>>> I think that both your proposed patch and Darrick's suggestion have this problem.
>>>>
>>>> "mount -o dax=inode" makes your new xfs_has_dax_inode(mp) true, and in that
>>>> conditional, if the filesystem has reflink enabled, mount fails:
>>>>
>>>> # mkfs.xfs -f /dev/pmem0p1
>>>> meta-data=/dev/pmem0p1           isize=512    agcount=4, agsize=4194304 blks
>>>>            =                       sectsz=4096  attr=2, projid32bit=1
>>>>            =                       crc=1        finobt=1, sparse=1, rmapbt=0
>>>>            =                       reflink=1    bigtime=0 inobtcount=0
>>>> data     =                       bsize=4096   blocks=16777216, imaxpct=25
>>>>            =                       sunit=0      swidth=0 blks
>>>> naming   =version 2              bsize=4096   ascii-ci=0, ftype=1
>>>> log      =internal log           bsize=4096   blocks=8192, version=2
>>>>            =                       sectsz=4096  sunit=1 blks, lazy-count=1
>>>> realtime =none                   extsz=4096   blocks=0, rtextents=0
>>>>
>>>> # mount -o dax=inode /dev/pmem0p1 /mnt/test
>>>> mount: wrong fs type, bad option, bad superblock on /dev/pmem0p1,
>>>>          missing codepage or helper program, or other error
>>>>
>>>>          In some cases useful info is found in syslog - try
>>>>          dmesg | tail or so.
>>>>
>>>> # dmesg | tail -n 2
>>>> [  192.691733] XFS (pmem0p1): DAX enabled. Warning: EXPERIMENTAL, use at your own risk
>>>> [  192.700300] XFS (pmem0p1): DAX and reflink cannot be used together!
>>>>
>>>
>>> So, the "DAX enabled" is a misnomer in this case. However the incompatibility of DAX and reflink is
>>> reflected in the next message, and indeed the mount fails. Is it now a matter of fixing
>>> the message output so as not to indicate "DAX enabled..."?
>>
>> The mount should not fail, and it does not fail prior to your change.
>>
>> In the past, we did not allow any mixing of a reflink-capable
>> filesystem with dax in any way.  Now, with per-inode dax, dax-enabled inodes and
>> reflink-enabled inodes can exist on the same filesystem, you just cannot have an
>> inode which is both dax-enabled and reflinked at the same time.
> 
> Ah. I missed that nuance. I had thought the incompatibility was
> absolute. :/
> 
> The manpage for mkfs.xfs may need updating for the inode mode
> (unless mine is old):
> ----------------snip------------------
> "Note:  the  filesystem DAX mount option ( -o dax ) is incom‐
> patible  with  reflink-enabled  XFS  filesystems.   To   use
> filesystem  DAX with XFS, specify the -m reflink=0 option to
> mkfs.xfs to disable the reflink feature."
> -------------------------------------

Hm, looks like the xfs(5) manpage got updated, but it seems mkfs.xfs(8) did not.

        dax=value
               Set  CPU  direct  access (DAX) behavior for the current filesystem.
               This mount option accepts the following values:

               "dax=inode"  DAX  will  be  enabled  only  on  regular  files  with
               FS_XFLAG_DAX applied.

               "dax=never"  DAX  will  not  be enabled for any files. FS_XFLAG_DAX
               will be ignored.

               "dax=always" DAX will be enabled for all regular files,  regardless
               of the FS_XFLAG_DAX state.

               If  no  option  is  used when mounting a filesystem stored on a DAX
               capable device, dax=inode will be used as default.

               For details regarding DAX behavior in kernel, please refer to
               kernel's documentation

I'll send a patch to fix up the mkfs manpage, thanks.

Thanks,
-Eric
Bill O'Donnell Aug. 27, 2021, 3:41 p.m. UTC | #10
On Fri, Aug 27, 2021 at 10:35:56AM -0500, Eric Sandeen wrote:
> On 8/27/21 9:25 AM, Bill O'Donnell wrote:
> > On Fri, Aug 27, 2021 at 09:18:32AM -0500, Eric Sandeen wrote:
> > > On 8/27/21 9:03 AM, Bill O'Donnell wrote:
> > > > On Thu, Aug 26, 2021 at 06:43:44PM -0500, Eric Sandeen wrote:
> > > > > On 8/26/21 5:08 PM, Bill O'Donnell wrote:
> > > > > > On Thu, Aug 26, 2021 at 01:16:22PM -0500, Eric Sandeen wrote:
> > > > > > > 
> > > > > > > On 8/26/21 1:09 PM, Darrick J. Wong wrote:
> > > > > > > > On Thu, Aug 26, 2021 at 12:30:12PM -0500, Bill O'Donnell wrote:
> > > > > > > 
> > > > > > > > > @@ -1584,7 +1586,7 @@ xfs_fs_fill_super(
> > > > > > > > >      	if (xfs_has_crc(mp))
> > > > > > > > >      		sb->s_flags |= SB_I_VERSION;
> > > > > > > > > -	if (xfs_has_dax_always(mp)) {
> > > > > > > > > +	if (xfs_has_dax_always(mp) || xfs_has_dax_inode(mp)) {
> > > > > > > > 
> > > > > > > > Er... can't this be done without burning another feature bit by:
> > > > > > > > 
> > > > > > > > 	if (xfs_has_dax_always(mp) || (!xfs_has_dax_always(mp) &&
> > > > > > > > 				       !xfs_has_dax_never(mp))) {
> > > > > > > > 		...
> > > > > > > > 		xfs_warn(mp, "DAX IS EXPERIMENTAL");
> > > > > > > > 	}
> > > > > > > 
> > > > > > > changing this conditional in this way will also fail dax=inode mounts on
> > > > > > > reflink-capable (i.e. default) filesystems, no?
> > > > > > 
> > > > > > Correct. My original patch tests fine, and still handles the reflink and dax
> > > > > > incompatibility. The new suggested logic is problematic.
> > > > > > -Bill
> > > > > 
> > > > > I think that both your proposed patch and Darrick's suggestion have this problem.
> > > > > 
> > > > > "mount -o dax=inode" makes your new xfs_has_dax_inode(mp) true, and in that
> > > > > conditional, if the filesystem has reflink enabled, mount fails:
> > > > > 
> > > > > # mkfs.xfs -f /dev/pmem0p1
> > > > > meta-data=/dev/pmem0p1           isize=512    agcount=4, agsize=4194304 blks
> > > > >            =                       sectsz=4096  attr=2, projid32bit=1
> > > > >            =                       crc=1        finobt=1, sparse=1, rmapbt=0
> > > > >            =                       reflink=1    bigtime=0 inobtcount=0
> > > > > data     =                       bsize=4096   blocks=16777216, imaxpct=25
> > > > >            =                       sunit=0      swidth=0 blks
> > > > > naming   =version 2              bsize=4096   ascii-ci=0, ftype=1
> > > > > log      =internal log           bsize=4096   blocks=8192, version=2
> > > > >            =                       sectsz=4096  sunit=1 blks, lazy-count=1
> > > > > realtime =none                   extsz=4096   blocks=0, rtextents=0
> > > > > 
> > > > > # mount -o dax=inode /dev/pmem0p1 /mnt/test
> > > > > mount: wrong fs type, bad option, bad superblock on /dev/pmem0p1,
> > > > >          missing codepage or helper program, or other error
> > > > > 
> > > > >          In some cases useful info is found in syslog - try
> > > > >          dmesg | tail or so.
> > > > > 
> > > > > # dmesg | tail -n 2
> > > > > [  192.691733] XFS (pmem0p1): DAX enabled. Warning: EXPERIMENTAL, use at your own risk
> > > > > [  192.700300] XFS (pmem0p1): DAX and reflink cannot be used together!
> > > > > 
> > > > 
> > > > So, the "DAX enabled" is a misnomer in this case. However the incompatibility of DAX and reflink is
> > > > reflected in the next message, and indeed the mount fails. Is it now a matter of fixing
> > > > the message output so as not to indicate "DAX enabled..."?
> > > 
> > > The mount should not fail, and it does not fail prior to your change.
> > > 
> > > In the past, we did not allow any mixing of a reflink-capable
> > > filesystem with dax in any way.  Now, with per-inode dax, dax-enabled inodes and
> > > reflink-enabled inodes can exist on the same filesystem, you just cannot have an
> > > inode which is both dax-enabled and reflinked at the same time.
> > 
> > Ah. I missed that nuance. I had thought the incompatibility was
> > absolute. :/
> > 
> > The manpage for mkfs.xfs may need updating for the inode mode
> > (unless mine is old):
> > ----------------snip------------------
> > "Note:  the  filesystem DAX mount option ( -o dax ) is incom‐
> > patible  with  reflink-enabled  XFS  filesystems.   To   use
> > filesystem  DAX with XFS, specify the -m reflink=0 option to
> > mkfs.xfs to disable the reflink feature."
> > -------------------------------------
> 
> Hm, looks like the xfs(5) manpage got updated, but it seems mkfs.xfs(8) did not.
> 
>        dax=value
>               Set  CPU  direct  access (DAX) behavior for the current filesystem.
>               This mount option accepts the following values:
> 
>               "dax=inode"  DAX  will  be  enabled  only  on  regular  files  with
>               FS_XFLAG_DAX applied.
> 
>               "dax=never"  DAX  will  not  be enabled for any files. FS_XFLAG_DAX
>               will be ignored.
> 
>               "dax=always" DAX will be enabled for all regular files,  regardless
>               of the FS_XFLAG_DAX state.
> 
>               If  no  option  is  used when mounting a filesystem stored on a DAX
>               capable device, dax=inode will be used as default.

The documentation here, https://www.kernel.org/doc/Documentation/filesystems/dax.txt
adds to the confusion.
   "-o dax"        is a legacy option which is an alias for "dax=always".
		    This may be removed in the future so "-o dax=always" is
		    the preferred method for specifying this behavior.



> 
>               For details regarding DAX behavior in kernel, please refer to  ker‐
>               nel's documentation
> 
> I'll send a patch to fix up the mkfs manpage, thanks.
> 
> Thanks,
> -Eric
>
Bill O'Donnell Aug. 30, 2021, 3:55 p.m. UTC | #11
On Thu, Aug 26, 2021 at 11:09:47AM -0700, Darrick J. Wong wrote:
> On Thu, Aug 26, 2021 at 12:30:12PM -0500, Bill O'Donnell wrote:
> > When dax-mode was tri-stated by adding dax=inode case, the EXPERIMENTAL
> > warning on mount was missed for the case. Add logic to handle the
> > warning similar to that of the 'dax=always' case.
> > 
> > Signed-off-by: Bill O'Donnell <bodonnel@redhat.com>
> > ---
> >  fs/xfs/xfs_mount.h | 2 ++
> >  fs/xfs/xfs_super.c | 8 +++++---
> >  2 files changed, 7 insertions(+), 3 deletions(-)
... 

> > -	if (xfs_has_dax_always(mp)) {
> > +	if (xfs_has_dax_always(mp) || xfs_has_dax_inode(mp)) {
> 
> Er... can't this be done without burning another feature bit by:
> 
> 	if (xfs_has_dax_always(mp) || (!xfs_has_dax_always(mp) &&
> 				       !xfs_has_dax_never(mp))) {
> 		...
> 		xfs_warn(mp, "DAX IS EXPERIMENTAL");
> 	}

Not quite. That condition is already true at initialization, when neither the
dax=always nor the dax=never feature bit has been set.
-Bill
diff mbox series

Patch

diff --git a/fs/xfs/xfs_mount.h b/fs/xfs/xfs_mount.h
index e091f3b3fa15..c9243a1b8d05 100644
--- a/fs/xfs/xfs_mount.h
+++ b/fs/xfs/xfs_mount.h
@@ -277,6 +277,7 @@  typedef struct xfs_mount {
 #define XFS_FEAT_NEEDSREPAIR	(1ULL << 25)	/* needs xfs_repair */
 
 /* Mount features */
+#define XFS_FEAT_DAX_INODE	(1ULL << 47)	/* DAX enabled */
 #define XFS_FEAT_NOATTR2	(1ULL << 48)	/* disable attr2 creation */
 #define XFS_FEAT_NOALIGN	(1ULL << 49)	/* ignore alignment */
 #define XFS_FEAT_ALLOCSIZE	(1ULL << 50)	/* user specified allocation size */
@@ -359,6 +360,7 @@  __XFS_HAS_FEAT(swalloc, SWALLOC)
 __XFS_HAS_FEAT(filestreams, FILESTREAMS)
 __XFS_HAS_FEAT(dax_always, DAX_ALWAYS)
 __XFS_HAS_FEAT(dax_never, DAX_NEVER)
+__XFS_HAS_FEAT(dax_inode, DAX_INODE)
 __XFS_HAS_FEAT(norecovery, NORECOVERY)
 __XFS_HAS_FEAT(nouuid, NOUUID)
 
diff --git a/fs/xfs/xfs_super.c b/fs/xfs/xfs_super.c
index 5e73ac78bf2f..f73f3687f0a8 100644
--- a/fs/xfs/xfs_super.c
+++ b/fs/xfs/xfs_super.c
@@ -84,15 +84,16 @@  xfs_mount_set_dax_mode(
 {
 	switch (mode) {
 	case XFS_DAX_INODE:
+		mp->m_features |= XFS_FEAT_DAX_INODE;
 		mp->m_features &= ~(XFS_FEAT_DAX_ALWAYS | XFS_FEAT_DAX_NEVER);
 		break;
 	case XFS_DAX_ALWAYS:
 		mp->m_features |= XFS_FEAT_DAX_ALWAYS;
-		mp->m_features &= ~XFS_FEAT_DAX_NEVER;
+		mp->m_features &= ~(XFS_FEAT_DAX_NEVER | XFS_FEAT_DAX_INODE);
 		break;
 	case XFS_DAX_NEVER:
 		mp->m_features |= XFS_FEAT_DAX_NEVER;
-		mp->m_features &= ~XFS_FEAT_DAX_ALWAYS;
+		mp->m_features &= ~(XFS_FEAT_DAX_ALWAYS | XFS_FEAT_DAX_INODE);
 		break;
 	}
 }
@@ -189,6 +190,7 @@  xfs_fs_show_options(
 		{ XFS_FEAT_LARGE_IOSIZE,	",largeio" },
 		{ XFS_FEAT_DAX_ALWAYS,		",dax=always" },
 		{ XFS_FEAT_DAX_NEVER,		",dax=never" },
+		{ XFS_FEAT_DAX_INODE,		",dax=inode" },
 		{ 0, NULL }
 	};
 	struct xfs_mount	*mp = XFS_M(root->d_sb);
@@ -1584,7 +1586,7 @@  xfs_fs_fill_super(
 	if (xfs_has_crc(mp))
 		sb->s_flags |= SB_I_VERSION;
 
-	if (xfs_has_dax_always(mp)) {
+	if (xfs_has_dax_always(mp) || xfs_has_dax_inode(mp)) {
 		bool rtdev_is_dax = false, datadev_is_dax;
 
 		xfs_warn(mp,