xfs: truncate pagecache before writeback in xfs_setattr_size()

author Eryu Guan <eguan@redhat.com>

Thu, 2 Nov 2017 04:43:50 +0000 (21:43 -0700)

committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Wed, 20 Dec 2017 09:10:26 +0000 (10:10 +0100)
author Eryu Guan <eguan@redhat.com>
Thu, 2 Nov 2017 04:43:50 +0000 (21:43 -0700)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Wed, 20 Dec 2017 09:10:26 +0000 (10:10 +0100)
diff --git a/fs/xfs/xfs_iops.c b/fs/xfs/xfs_iops.c

index 17081c7..f24e5b6 100644 (file)
--- a/fs/xfs/xfs_iops.c
+++ b/fs/xfs/xfs_iops.c
@@ -886,22 +886,6 @@ xfs_setattr_size(
                 return error;
  
         /*
-        * We are going to log the inode size change in this transaction so
-        * any previous writes that are beyond the on disk EOF and the new
-        * EOF that have not been written out need to be written here.  If we
-        * do not write the data out, we expose ourselves to the null files
-        * problem. Note that this includes any block zeroing we did above;
-        * otherwise those blocks may not be zeroed after a crash.
-        */
-       if (did_zeroing ||
-           (newsize > ip->i_d.di_size && oldsize != ip->i_d.di_size)) {
-               error = filemap_write_and_wait_range(VFS_I(ip)->i_mapping,
-                                                     ip->i_d.di_size, newsize);
-               if (error)
-                       return error;
-       }
-
-       /*
          * We've already locked out new page faults, so now we can safely remove
          * pages from the page cache knowing they won't get refaulted until we
          * drop the XFS_MMAP_EXCL lock after the extent manipulations are
@@ -917,9 +901,29 @@ xfs_setattr_size(
          * user visible changes). There's not much we can do about this, except
          * to hope that the caller sees ENOMEM and retries the truncate
          * operation.
+        *
+        * We also update in-core i_size and truncate page cache beyond newsize
+        * before writing back [di_size, newsize), so we're guaranteed
+        * not to write stale data past the new EOF on truncate down.
          */
         truncate_setsize(inode, newsize);
  
+       /*
+        * We are going to log the inode size change in this transaction so
+        * any previous writes that lie between the on-disk EOF and the new
+        * EOF that have not been written out need to be written here.  If we
+        * do not write the data out, we expose ourselves to the null files
+        * problem. Note that this includes any block zeroing we did above;
+        * otherwise those blocks may not be zeroed after a crash.
+        */
+       if (did_zeroing ||
+           (newsize > ip->i_d.di_size && oldsize != ip->i_d.di_size)) {
+               error = filemap_write_and_wait_range(VFS_I(ip)->i_mapping,
+                                               ip->i_d.di_size, newsize - 1);
+               if (error)
+                       return error;
+       }
+
         error = xfs_trans_alloc(mp, &M_RES(mp)->tr_itruncate, 0, 0, 0, &tp);
         if (error)
                 return error;
author	Eryu Guan <eguan@redhat.com>
	Thu, 2 Nov 2017 04:43:50 +0000 (21:43 -0700)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Wed, 20 Dec 2017 09:10:26 +0000 (10:10 +0100)