btrfs: zoned: do not zone finish data relocation block group

author Naohiro Aota <naohiro.aota@wdc.com>

Fri, 21 Jul 2023 07:42:14 +0000 (16:42 +0900)

committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Tue, 19 Sep 2023 10:28:05 +0000 (12:28 +0200)
author Naohiro Aota <naohiro.aota@wdc.com>
Fri, 21 Jul 2023 07:42:14 +0000 (16:42 +0900)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Tue, 19 Sep 2023 10:28:05 +0000 (12:28 +0200)
diff --git a/fs/btrfs/extent-tree.c b/fs/btrfs/extent-tree.c

index f2ee70c03f0d532bb1cb9b8729b710dbf309b17f..0640ef59fe6606b4e6de1ad909c67593cf791e51 100644 (file)
--- a/fs/btrfs/extent-tree.c
+++ b/fs/btrfs/extent-tree.c
@@ -3810,7 +3810,8 @@ static int do_allocation_zoned(struct btrfs_block_group *block_group,
                fs_info->data_reloc_bg == 0);
  
         if (block_group->ro ||
-           test_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC, &block_group->runtime_flags)) {
+           (!ffe_ctl->for_data_reloc &&
+            test_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC, &block_group->runtime_flags))) {
                 ret = 1;
                 goto out;
         }
@@ -3853,8 +3854,26 @@ static int do_allocation_zoned(struct btrfs_block_group *block_group,
         if (ffe_ctl->for_treelog && !fs_info->treelog_bg)
                 fs_info->treelog_bg = block_group->start;
  
-       if (ffe_ctl->for_data_reloc && !fs_info->data_reloc_bg)
-               fs_info->data_reloc_bg = block_group->start;
+       if (ffe_ctl->for_data_reloc) {
+               if (!fs_info->data_reloc_bg)
+                       fs_info->data_reloc_bg = block_group->start;
+               /*
+                * Do not allow allocations from this block group, unless it is
+                * for data relocation. Compared to increasing the ->ro, setting
+                * the ->zoned_data_reloc_ongoing flag still allows nocow
+                * writers to come in. See btrfs_inc_nocow_writers().
+                *
+                * We need to disable an allocation to avoid an allocation of
+                * regular (non-relocation data) extent. With mix of relocation
+                * extents and regular extents, we can dispatch WRITE commands
+                * (for relocation extents) and ZONE APPEND commands (for
+                * regular extents) at the same time to the same zone, which
+                * easily break the write pointer.
+                *
+                * Also, this flag avoids this block group to be zone finished.
+                */
+               set_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC, &block_group->runtime_flags);
+       }
  
         ffe_ctl->found_offset = start + block_group->alloc_offset;
         block_group->alloc_offset += num_bytes;
@@ -3872,24 +3891,8 @@ static int do_allocation_zoned(struct btrfs_block_group *block_group,
  out:
         if (ret && ffe_ctl->for_treelog)
                 fs_info->treelog_bg = 0;
-       if (ret && ffe_ctl->for_data_reloc &&
-           fs_info->data_reloc_bg == block_group->start) {
-               /*
-                * Do not allow further allocations from this block group.
-                * Compared to increasing the ->ro, setting the
-                * ->zoned_data_reloc_ongoing flag still allows nocow
-                *  writers to come in. See btrfs_inc_nocow_writers().
-                *
-                * We need to disable an allocation to avoid an allocation of
-                * regular (non-relocation data) extent. With mix of relocation
-                * extents and regular extents, we can dispatch WRITE commands
-                * (for relocation extents) and ZONE APPEND commands (for
-                * regular extents) at the same time to the same zone, which
-                * easily break the write pointer.
-                */
-               set_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC, &block_group->runtime_flags);
+       if (ret && ffe_ctl->for_data_reloc)
                 fs_info->data_reloc_bg = 0;
-       }
         spin_unlock(&fs_info->relocation_bg_lock);
         spin_unlock(&fs_info->treelog_bg_lock);
         spin_unlock(&block_group->lock);
diff --git a/fs/btrfs/zoned.c b/fs/btrfs/zoned.c

index 9bc7ac06c51775c6b14eaf90a27a8207d3436bc9..675dbed075d8e980021b2608671eea32a3aa7608 100644 (file)
--- a/fs/btrfs/zoned.c
+++ b/fs/btrfs/zoned.c
@@ -2009,6 +2009,10 @@ static int do_zone_finish(struct btrfs_block_group *block_group, bool fully_writ
          * and block_group->meta_write_pointer for metadata.
          */
         if (!fully_written) {
+               if (test_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC, &block_group->runtime_flags)) {
+                       spin_unlock(&block_group->lock);
+                       return -EAGAIN;
+               }
                 spin_unlock(&block_group->lock);
  
                 ret = btrfs_inc_block_group_ro(block_group, false);
@@ -2037,7 +2041,9 @@ static int do_zone_finish(struct btrfs_block_group *block_group, bool fully_writ
                         return 0;
                 }
  
-               if (block_group->reserved) {
+               if (block_group->reserved ||
+                   test_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC,
+                            &block_group->runtime_flags)) {
                         spin_unlock(&block_group->lock);
                         btrfs_dec_block_group_ro(block_group);
                         return -EAGAIN;
@@ -2268,7 +2274,10 @@ void btrfs_zoned_release_data_reloc_bg(struct btrfs_fs_info *fs_info, u64 logica
  
         /* All relocation extents are written. */
         if (block_group->start + block_group->alloc_offset == logical + length) {
-               /* Now, release this block group for further allocations. */
+               /*
+                * Now, release this block group for further allocations and
+                * zone finish.
+                */
                 clear_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC,
                           &block_group->runtime_flags);
         }
@@ -2292,7 +2301,8 @@ int btrfs_zone_finish_one_bg(struct btrfs_fs_info *fs_info)
  
                 spin_lock(&block_group->lock);
                 if (block_group->reserved || block_group->alloc_offset == 0 ||
-                   (block_group->flags & BTRFS_BLOCK_GROUP_SYSTEM)) {
+                   (block_group->flags & BTRFS_BLOCK_GROUP_SYSTEM) ||
+                   test_bit(BLOCK_GROUP_FLAG_ZONED_DATA_RELOC, &block_group->runtime_flags)) {
                         spin_unlock(&block_group->lock);
                         continue;
                 }
author	Naohiro Aota <naohiro.aota@wdc.com>
	Fri, 21 Jul 2023 07:42:14 +0000 (16:42 +0900)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Tue, 19 Sep 2023 10:28:05 +0000 (12:28 +0200)
fs/btrfs/extent-tree.c		patch | blob | history
fs/btrfs/zoned.c		patch | blob | history