btrfs: zoned: do not zone finish data relocation block group

author Naohiro Aota <naohiro.aota@wdc.com>

Fri, 21 Jul 2023 07:42:14 +0000 (16:42 +0900)

committer David Sterba <dsterba@suse.com>

Mon, 21 Aug 2023 12:54:47 +0000 (14:54 +0200)
author Naohiro Aota <naohiro.aota@wdc.com>
Fri, 21 Jul 2023 07:42:14 +0000 (16:42 +0900)
committer David Sterba <dsterba@suse.com>
Mon, 21 Aug 2023 12:54:47 +0000 (14:54 +0200)
diff --git a/fs/btrfs/extent-tree.c b/fs/btrfs/extent-tree.c

index ba22790..e050811 100644 (file)
--- a/fs/btrfs/extent-tree.c
+++ b/fs/btrfs/extent-tree.c
@@ -3738,7 +3738,8 @@ static int do_allocation_zoned(struct btrfs_block_group *block_group,
                fs_info->data_reloc_bg == 0);
  
         if (block_group->ro ||
-           test_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC, &block_group->runtime_flags)) {
+           (!ffe_ctl->for_data_reloc &&
+            test_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC, &block_group->runtime_flags))) {
                 ret = 1;
                 goto out;
         }
@@ -3781,8 +3782,26 @@ static int do_allocation_zoned(struct btrfs_block_group *block_group,
         if (ffe_ctl->for_treelog && !fs_info->treelog_bg)
                 fs_info->treelog_bg = block_group->start;
  
-       if (ffe_ctl->for_data_reloc && !fs_info->data_reloc_bg)
-               fs_info->data_reloc_bg = block_group->start;
+       if (ffe_ctl->for_data_reloc) {
+               if (!fs_info->data_reloc_bg)
+                       fs_info->data_reloc_bg = block_group->start;
+               /*
+                * Do not allow allocations from this block group, unless it is
+                * for data relocation. Compared to increasing ->ro, setting the
+                * BLOCK_GROUP_FLAG_ZONED_DATA_RELOC flag still allows nocow
+                * writers to come in. See btrfs_inc_nocow_writers().
+                *
+                * We need to disable allocation to avoid allocating a regular
+                * (non-relocation data) extent. With a mix of relocation
+                * extents and regular extents, we can dispatch WRITE commands
+                * (for relocation extents) and ZONE APPEND commands (for
+                * regular extents) at the same time to the same zone, which
+                * easily breaks the write pointer.
+                *
+                * Also, this flag prevents zone finishing of this block group.
+                */
+               set_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC, &block_group->runtime_flags);
+       }
  
         ffe_ctl->found_offset = start + block_group->alloc_offset;
         block_group->alloc_offset += num_bytes;
@@ -3800,24 +3819,8 @@ static int do_allocation_zoned(struct btrfs_block_group *block_group,
  out:
         if (ret && ffe_ctl->for_treelog)
                 fs_info->treelog_bg = 0;
-       if (ret && ffe_ctl->for_data_reloc &&
-           fs_info->data_reloc_bg == block_group->start) {
-               /*
-                * Do not allow further allocations from this block group.
-                * Compared to increasing the ->ro, setting the
-                * ->zoned_data_reloc_ongoing flag still allows nocow
-                *  writers to come in. See btrfs_inc_nocow_writers().
-                *
-                * We need to disable an allocation to avoid an allocation of
-                * regular (non-relocation data) extent. With mix of relocation
-                * extents and regular extents, we can dispatch WRITE commands
-                * (for relocation extents) and ZONE APPEND commands (for
-                * regular extents) at the same time to the same zone, which
-                * easily break the write pointer.
-                */
-               set_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC, &block_group->runtime_flags);
+       if (ret && ffe_ctl->for_data_reloc)
                 fs_info->data_reloc_bg = 0;
-       }
         spin_unlock(&fs_info->relocation_bg_lock);
         spin_unlock(&fs_info->treelog_bg_lock);
         spin_unlock(&block_group->lock);
diff --git a/fs/btrfs/zoned.c b/fs/btrfs/zoned.c

index 52f49b0..a2f8e74 100644 (file)
--- a/fs/btrfs/zoned.c
+++ b/fs/btrfs/zoned.c
@@ -2091,6 +2091,10 @@ static int do_zone_finish(struct btrfs_block_group *block_group, bool fully_writ
          * and block_group->meta_write_pointer for metadata.
          */
         if (!fully_written) {
+               if (test_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC, &block_group->runtime_flags)) {
+                       spin_unlock(&block_group->lock);
+                       return -EAGAIN;
+               }
                 spin_unlock(&block_group->lock);
  
                 ret = btrfs_inc_block_group_ro(block_group, false);
@@ -2119,7 +2123,9 @@ static int do_zone_finish(struct btrfs_block_group *block_group, bool fully_writ
                         return 0;
                 }
  
-               if (block_group->reserved) {
+               if (block_group->reserved ||
+                   test_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC,
+                            &block_group->runtime_flags)) {
                         spin_unlock(&block_group->lock);
                         btrfs_dec_block_group_ro(block_group);
                         return -EAGAIN;
@@ -2362,7 +2368,10 @@ void btrfs_zoned_release_data_reloc_bg(struct btrfs_fs_info *fs_info, u64 logica
  
         /* All relocation extents are written. */
         if (block_group->start + block_group->alloc_offset == logical + length) {
-               /* Now, release this block group for further allocations. */
+               /*
+                * Now, release this block group for further allocations and
+                * zone finish.
+                */
                 clear_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC,
                           &block_group->runtime_flags);
         }
@@ -2386,7 +2395,8 @@ int btrfs_zone_finish_one_bg(struct btrfs_fs_info *fs_info)
  
                 spin_lock(&block_group->lock);
                 if (block_group->reserved || block_group->alloc_offset == 0 ||
-                   (block_group->flags & BTRFS_BLOCK_GROUP_SYSTEM)) {
+                   (block_group->flags & BTRFS_BLOCK_GROUP_SYSTEM) ||
+                   test_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC, &block_group->runtime_flags)) {
                         spin_unlock(&block_group->lock);
                         continue;
                 }
author	Naohiro Aota <naohiro.aota@wdc.com>
	Fri, 21 Jul 2023 07:42:14 +0000 (16:42 +0900)
committer	David Sterba <dsterba@suse.com>
	Mon, 21 Aug 2023 12:54:47 +0000 (14:54 +0200)
fs/btrfs/extent-tree.c		patch \| blob \| history
fs/btrfs/zoned.c		patch \| blob \| history