btrfs: do not create raid sysfs entries under any locks

author Josef Bacik <josef@toxicpanda.com>

Tue, 1 Sep 2020 21:40:38 +0000 (17:40 -0400)

committer David Sterba <dsterba@suse.com>

Wed, 7 Oct 2020 10:13:19 +0000 (12:13 +0200)
author Josef Bacik <josef@toxicpanda.com>
Tue, 1 Sep 2020 21:40:38 +0000 (17:40 -0400)
committer David Sterba <dsterba@suse.com>
Wed, 7 Oct 2020 10:13:19 +0000 (12:13 +0200)
diff --git a/fs/btrfs/block-group.c b/fs/btrfs/block-group.c

index a3b2720..c0f1d68 100644 (file)
--- a/fs/btrfs/block-group.c
+++ b/fs/btrfs/block-group.c
@@ -1766,16 +1766,10 @@ static void link_block_group(struct btrfs_block_group *cache)
  {
         struct btrfs_space_info *space_info = cache->space_info;
         int index = btrfs_bg_flags_to_raid_index(cache->flags);
-       bool first = false;
  
         down_write(&space_info->groups_sem);
-       if (list_empty(&space_info->block_groups[index]))
-               first = true;
         list_add_tail(&cache->list, &space_info->block_groups[index]);
         up_write(&space_info->groups_sem);
-
-       if (first)
-               btrfs_sysfs_add_block_group_type(cache);
  }
  
  static struct btrfs_block_group *btrfs_create_block_group_cache(
@@ -2032,6 +2026,17 @@ int btrfs_read_block_groups(struct btrfs_fs_info *info)
         }
  
         list_for_each_entry(space_info, &info->space_info, list) {
+               int i;
+
+               for (i = 0; i < BTRFS_NR_RAID_TYPES; i++) {
+                       if (list_empty(&space_info->block_groups[i]))
+                               continue;
+                       cache = list_first_entry(&space_info->block_groups[i],
+                                                struct btrfs_block_group,
+                                                list);
+                       btrfs_sysfs_add_block_group_type(cache);
+               }
+
                 if (!(btrfs_get_alloc_profile(info, space_info->flags) &
                       (BTRFS_BLOCK_GROUP_RAID10 |
                        BTRFS_BLOCK_GROUP_RAID1_MASK |
@@ -2091,12 +2096,16 @@ void btrfs_create_pending_block_groups(struct btrfs_trans_handle *trans)
                 return;
  
         while (!list_empty(&trans->new_bgs)) {
+               int index;
+
                 block_group = list_first_entry(&trans->new_bgs,
                                                struct btrfs_block_group,
                                                bg_list);
                 if (ret)
                         goto next;
  
+               index = btrfs_bg_flags_to_raid_index(block_group->flags);
+
                 ret = insert_block_group_item(trans, block_group);
                 if (ret)
                         btrfs_abort_transaction(trans, ret);
@@ -2105,6 +2114,16 @@ void btrfs_create_pending_block_groups(struct btrfs_trans_handle *trans)
                 if (ret)
                         btrfs_abort_transaction(trans, ret);
                 add_block_group_free_space(trans, block_group);
+
+               /*
+                * If we restriped during balance, we may have added a new raid
+                * type, so now add the sysfs entries when it is safe to do so.
+                * We don't have to worry about locking here as it's handled in
+                * btrfs_sysfs_add_block_group_type.
+                */
+               if (block_group->space_info->block_group_kobjs[index] == NULL)
+                       btrfs_sysfs_add_block_group_type(block_group);
+
                 /* Already aborted the transaction if it failed. */
  next:
                 btrfs_delayed_refs_rsv_release(fs_info, 1);
diff --git a/fs/btrfs/sysfs.c b/fs/btrfs/sysfs.c

index 13354de..279d926 100644 (file)
--- a/fs/btrfs/sysfs.c
+++ b/fs/btrfs/sysfs.c
@@ -1137,17 +1137,38 @@ void btrfs_sysfs_add_block_group_type(struct btrfs_block_group *cache)
  
         rkobj->flags = cache->flags;
         kobject_init(&rkobj->kobj, &btrfs_raid_ktype);
+
+       /*
+        * We call this either on mount, or if we've created a block group for a
+        * new index type while running (i.e. when restriping).  The running
+        * case is tricky because we could race with other threads, so we need
+        * to have this check to make sure we didn't already init the kobject.
+        *
+        * We don't have to protect on the free side because it only happens on
+        * unmount.
+        */
+       spin_lock(&space_info->lock);
+       if (space_info->block_group_kobjs[index]) {
+               spin_unlock(&space_info->lock);
+               kobject_put(&rkobj->kobj);
+               return;
+       } else {
+               space_info->block_group_kobjs[index] = &rkobj->kobj;
+       }
+       spin_unlock(&space_info->lock);
+
         ret = kobject_add(&rkobj->kobj, &space_info->kobj, "%s",
                           btrfs_bg_type_to_raid_name(rkobj->flags));
         memalloc_nofs_restore(nofs_flag);
         if (ret) {
+               spin_lock(&space_info->lock);
+               space_info->block_group_kobjs[index] = NULL;
+               spin_unlock(&space_info->lock);
                 kobject_put(&rkobj->kobj);
                 btrfs_warn(fs_info,
                         "failed to add kobject for block cache, ignoring");
                 return;
         }
-
-       space_info->block_group_kobjs[index] = &rkobj->kobj;
  }
  
  /*
author	Josef Bacik <josef@toxicpanda.com>
	Tue, 1 Sep 2020 21:40:38 +0000 (17:40 -0400)
committer	David Sterba <dsterba@suse.com>
	Wed, 7 Oct 2020 10:13:19 +0000 (12:13 +0200)
fs/btrfs/block-group.c		patch | blob | history
fs/btrfs/sysfs.c		patch | blob | history