btrfs: support subpage for extent buffer page release

author Qu Wenruo <wqu@suse.com>

Tue, 26 Jan 2021 08:33:50 +0000 (16:33 +0800)

committer David Sterba <dsterba@suse.com>

Mon, 8 Feb 2021 21:59:02 +0000 (22:59 +0100)
author Qu Wenruo <wqu@suse.com>
Tue, 26 Jan 2021 08:33:50 +0000 (16:33 +0800)
committer David Sterba <dsterba@suse.com>
Mon, 8 Feb 2021 21:59:02 +0000 (22:59 +0100)
diff --git a/fs/btrfs/extent_io.c b/fs/btrfs/extent_io.c

index 133ff453147200d1cb8a1a43e7791f4ad33e1e02..1812813bdf63fb87a3f14c29f8ed65512835e32f 100644 (file)
--- a/fs/btrfs/extent_io.c
+++ b/fs/btrfs/extent_io.c
@@ -4995,25 +4995,39 @@ int extent_buffer_under_io(const struct extent_buffer *eb)
                 test_bit(EXTENT_BUFFER_DIRTY, &eb->bflags));
  }
  
-/*
- * Release all pages attached to the extent buffer.
- */
-static void btrfs_release_extent_buffer_pages(struct extent_buffer *eb)
+static bool page_range_has_eb(struct btrfs_fs_info *fs_info, struct page *page)
  {
-       int i;
-       int num_pages;
-       int mapped = !test_bit(EXTENT_BUFFER_UNMAPPED, &eb->bflags);
+       struct btrfs_subpage *subpage;
  
-       BUG_ON(extent_buffer_under_io(eb));
+       lockdep_assert_held(&page->mapping->private_lock);
  
-       num_pages = num_extent_pages(eb);
-       for (i = 0; i < num_pages; i++) {
-               struct page *page = eb->pages[i];
+       if (PagePrivate(page)) {
+               subpage = (struct btrfs_subpage *)page->private;
+               if (atomic_read(&subpage->eb_refs))
+                       return true;
+       }
+       return false;
+}
  
-               if (!page)
-                       continue;
+static void detach_extent_buffer_page(struct extent_buffer *eb, struct page *page)
+{
+       struct btrfs_fs_info *fs_info = eb->fs_info;
+       const bool mapped = !test_bit(EXTENT_BUFFER_UNMAPPED, &eb->bflags);
+
+       /*
+        * For mapped eb, we're going to change the page private, which should
+        * be done under the private_lock.
+        */
+       if (mapped)
+               spin_lock(&page->mapping->private_lock);
+
+       if (!PagePrivate(page)) {
                 if (mapped)
-                       spin_lock(&page->mapping->private_lock);
+                       spin_unlock(&page->mapping->private_lock);
+               return;
+       }
+
+       if (fs_info->sectorsize == PAGE_SIZE) {
                 /*
                  * We do this since we'll remove the pages after we've
                  * removed the eb from the radix tree, so we could race
@@ -5032,9 +5046,49 @@ static void btrfs_release_extent_buffer_pages(struct extent_buffer *eb)
                          */
                         detach_page_private(page);
                 }
-
                 if (mapped)
                         spin_unlock(&page->mapping->private_lock);
+               return;
+       }
+
+       /*
+        * For subpage, we can have dummy eb with page private.  In this case,
+        * we can directly detach the private as such page is only attached to
+        * one dummy eb, no sharing.
+        */
+       if (!mapped) {
+               btrfs_detach_subpage(fs_info, page);
+               return;
+       }
+
+       btrfs_page_dec_eb_refs(fs_info, page);
+
+       /*
+        * We can only detach the page private if there are no other ebs in the
+        * page range.
+        */
+       if (!page_range_has_eb(fs_info, page))
+               btrfs_detach_subpage(fs_info, page);
+
+       spin_unlock(&page->mapping->private_lock);
+}
+
+/* Release all pages attached to the extent buffer */
+static void btrfs_release_extent_buffer_pages(struct extent_buffer *eb)
+{
+       int i;
+       int num_pages;
+
+       ASSERT(!extent_buffer_under_io(eb));
+
+       num_pages = num_extent_pages(eb);
+       for (i = 0; i < num_pages; i++) {
+               struct page *page = eb->pages[i];
+
+               if (!page)
+                       continue;
+
+               detach_extent_buffer_page(eb, page);
  
                 /* One for when we allocated the page */
                 put_page(page);
@@ -5394,6 +5448,16 @@ struct extent_buffer *alloc_extent_buffer(struct btrfs_fs_info *fs_info,
                 /* Should not fail, as we have preallocated the memory */
                 ret = attach_extent_buffer_page(eb, p, prealloc);
                 ASSERT(!ret);
+               /*
+                * Signal that one more eb is under allocation, so that
+                * detach_extent_buffer_page() won't release the page private
+                * while the eb hasn't yet been inserted into the radix tree.
+                *
+                * The ref will be decreased when the eb releases the page, in
+                * detach_extent_buffer_page().
+                * Thus no special handling is needed in the error path.
+                */
+               btrfs_page_inc_eb_refs(fs_info, p);
                 spin_unlock(&mapping->private_lock);
  
                 WARN_ON(PageDirty(p));
diff --git a/fs/btrfs/subpage.c b/fs/btrfs/subpage.c

index 61b28dfca20cbbbe96015fe690603fcf46142c10..a2a21fa0ea35ad23ddbe868f3468cde346f41686 100644 (file)
--- a/fs/btrfs/subpage.c
+++ b/fs/btrfs/subpage.c
@@ -52,6 +52,8 @@ int btrfs_alloc_subpage(const struct btrfs_fs_info *fs_info,
         if (!*ret)
                 return -ENOMEM;
         spin_lock_init(&(*ret)->lock);
+       if (type == BTRFS_SUBPAGE_METADATA)
+               atomic_set(&(*ret)->eb_refs, 0);
         return 0;
  }
  
@@ -59,3 +61,43 @@ void btrfs_free_subpage(struct btrfs_subpage *subpage)
  {
         kfree(subpage);
  }
+
+/*
+ * Increase the eb_refs of the subpage structure attached to @page.
+ *
+ * This matters during eb allocation, to prevent a race with the last eb of
+ * the same page being freed.
+ * With eb_refs increased before the eb is inserted into the radix tree,
+ * detach_extent_buffer_page() won't detach the page private while we're still
+ * allocating the extent buffer.
+ *
+ * Does nothing when sectorsize equals PAGE_SIZE.  Otherwise the page must
+ * have private set and a mapping, and the caller must hold
+ * page->mapping->private_lock.
+ */
+void btrfs_page_inc_eb_refs(const struct btrfs_fs_info *fs_info,
+                           struct page *page)
+{
+       struct btrfs_subpage *subpage;
+
+       if (fs_info->sectorsize == PAGE_SIZE)
+               return;
+
+       ASSERT(PagePrivate(page) && page->mapping);
+       lockdep_assert_held(&page->mapping->private_lock);
+
+       subpage = (struct btrfs_subpage *)page->private;
+       atomic_inc(&subpage->eb_refs);
+}
+
+void btrfs_page_dec_eb_refs(const struct btrfs_fs_info *fs_info,
+                           struct page *page)
+{      /* Drop one eb reference from the subpage structure attached to @page. */
+       struct btrfs_subpage *subpage;
+
+       if (fs_info->sectorsize == PAGE_SIZE)
+               return; /* Nothing to do when sectorsize equals PAGE_SIZE */
+
+       ASSERT(PagePrivate(page) && page->mapping);
+       lockdep_assert_held(&page->mapping->private_lock); /* Caller must hold the lock */
+
+       subpage = (struct btrfs_subpage *)page->private;
+       ASSERT(atomic_read(&subpage->eb_refs)); /* Must be non-zero before the decrement */
+       atomic_dec(&subpage->eb_refs);
+}
diff --git a/fs/btrfs/subpage.h b/fs/btrfs/subpage.h

index 7ba544bcc9c6b15945113247360622d9accac71a..fe51cc237a6678c7b9fa1da4c07d28b170382a48 100644 (file)
--- a/fs/btrfs/subpage.h
+++ b/fs/btrfs/subpage.h
@@ -19,7 +19,13 @@ struct btrfs_subpage {
         /* Common members for both data and metadata pages */
         spinlock_t lock;
         union {
-               /* Structures only used by metadata */
+               /*
+                * Structures only used by metadata
+                *
+                * @eb_refs should only be modified under private_lock, as it
+                * determines whether the subpage can be detached.
+                */
+               atomic_t eb_refs;
                 /* Structures only used by data */
         };
  };
@@ -40,4 +46,9 @@ int btrfs_alloc_subpage(const struct btrfs_fs_info *fs_info,
                         enum btrfs_subpage_type type);
  void btrfs_free_subpage(struct btrfs_subpage *subpage);
  
+void btrfs_page_inc_eb_refs(const struct btrfs_fs_info *fs_info,
+                           struct page *page);
+void btrfs_page_dec_eb_refs(const struct btrfs_fs_info *fs_info,
+                           struct page *page);
+
  #endif
author	Qu Wenruo <wqu@suse.com>
	Tue, 26 Jan 2021 08:33:50 +0000 (16:33 +0800)
committer	David Sterba <dsterba@suse.com>
	Mon, 8 Feb 2021 21:59:02 +0000 (22:59 +0100)
fs/btrfs/extent_io.c		patch \| blob \| history
fs/btrfs/subpage.c		patch \| blob \| history
fs/btrfs/subpage.h		patch \| blob \| history