f2fs: give priority to select unpinned section for foreground GC
authorChao Yu <chao@kernel.org>
Fri, 6 May 2022 10:30:31 +0000 (18:30 +0800)
committerJaegeuk Kim <jaegeuk@kernel.org>
Fri, 6 May 2022 21:26:33 +0000 (14:26 -0700)
Previously, during foreground GC, if a victim contained data of a pinned file,
migration of that data would fail, and meanwhile i_gc_failures of that
pinned file could increase; once it exceeded the threshold, GC would unpin
the file, breaking pinfile's semantics.

In order to mitigate this condition, let's record and skip sections that
contain pinned files' data and give priority to selecting unpinned ones.

Signed-off-by: Chao Yu <chao.yu@oppo.com>
Signed-off-by: Jaegeuk Kim <jaegeuk@kernel.org>
fs/f2fs/gc.c
fs/f2fs/segment.c
fs/f2fs/segment.h

index a193862..3009c0a 100644 (file)
@@ -646,6 +646,54 @@ static void release_victim_entry(struct f2fs_sb_info *sbi)
        f2fs_bug_on(sbi, !list_empty(&am->victim_list));
 }
 
+static bool f2fs_pin_section(struct f2fs_sb_info *sbi, unsigned int segno) /* record segno's section in pinned_secmap; returns false when pinning is disabled */
+{
+       struct dirty_seglist_info *dirty_i = DIRTY_I(sbi);
+       unsigned int secno = GET_SEC_FROM_SEG(sbi, segno);
+
+       if (!dirty_i->enable_pin_section)
+               return false;
+       if (!test_and_set_bit(secno, dirty_i->pinned_secmap)) /* bump the count only when the bit was not already set */
+               dirty_i->pinned_secmap_cnt++;
+       return true;
+}
+
+static bool f2fs_pinned_section_exists(struct dirty_seglist_info *dirty_i) /* true when pinned_secmap_cnt is nonzero */
+{
+       return dirty_i->pinned_secmap_cnt; /* unsigned count converts to bool: nonzero -> true */
+}
+
+static bool f2fs_section_is_pinned(struct dirty_seglist_info *dirty_i, /* true only if pinning is enabled and secno's bit is set in pinned_secmap */
+                                               unsigned int secno)
+{
+       return dirty_i->enable_pin_section &&
+               f2fs_pinned_section_exists(dirty_i) && /* short-circuits the bitmap lookup when no section is recorded */
+               test_bit(secno, dirty_i->pinned_secmap);
+}
+
+static void f2fs_unpin_all_sections(struct f2fs_sb_info *sbi, bool enable) /* clear all recorded sections, then set enable_pin_section to @enable */
+{
+       unsigned int bitmap_size = f2fs_bitmap_size(MAIN_SECS(sbi));
+
+       if (f2fs_pinned_section_exists(DIRTY_I(sbi))) { /* skip the wipe when the count is already zero */
+               memset(DIRTY_I(sbi)->pinned_secmap, 0, bitmap_size);
+               DIRTY_I(sbi)->pinned_secmap_cnt = 0;
+       }
+       DIRTY_I(sbi)->enable_pin_section = enable; /* written unconditionally, even if nothing was cleared */
+}
+
+static int f2fs_gc_pinned_control(struct inode *inode, int gc_type, /* returns 0 if inode is not pinned, -EBUSY if pinned and gc_type != FG_GC, else -EAGAIN */
+                                                       unsigned int segno)
+{
+       if (!f2fs_is_pinned_file(inode))
+               return 0;
+       if (gc_type != FG_GC)
+               return -EBUSY;
+       if (!f2fs_pin_section(F2FS_I_SB(inode), segno)) /* section pinning disabled: fall back to f2fs_pin_file_control() */
+               f2fs_pin_file_control(inode, true);
+       return -EAGAIN;
+}
+
 /*
  * This function is called from two paths.
  * One is garbage collection and the other is SSR segment selection.
@@ -787,6 +835,9 @@ retry:
                if (gc_type == BG_GC && test_bit(secno, dirty_i->victim_secmap))
                        goto next;
 
+               if (gc_type == FG_GC && f2fs_section_is_pinned(dirty_i, secno))
+                       goto next;
+
                if (is_atgc) {
                        add_victim_entry(sbi, &p, segno);
                        goto next;
@@ -1201,12 +1252,9 @@ static int move_data_block(struct inode *inode, block_t bidx,
                goto out;
        }
 
-       if (f2fs_is_pinned_file(inode)) {
-               if (gc_type == FG_GC)
-                       f2fs_pin_file_control(inode, true);
-               err = -EAGAIN;
+       err = f2fs_gc_pinned_control(inode, gc_type, segno);
+       if (err)
                goto out;
-       }
 
        set_new_dnode(&dn, inode, NULL, NULL, 0);
        err = f2fs_get_dnode_of_data(&dn, bidx, LOOKUP_NODE);
@@ -1351,12 +1399,9 @@ static int move_data_page(struct inode *inode, block_t bidx, int gc_type,
                err = -EAGAIN;
                goto out;
        }
-       if (f2fs_is_pinned_file(inode)) {
-               if (gc_type == FG_GC)
-                       f2fs_pin_file_control(inode, true);
-               err = -EAGAIN;
+       err = f2fs_gc_pinned_control(inode, gc_type, segno);
+       if (err)
                goto out;
-       }
 
        if (gc_type == BG_GC) {
                if (PageWriteback(page)) {
@@ -1476,14 +1521,15 @@ next_step:
                ofs_in_node = le16_to_cpu(entry->ofs_in_node);
 
                if (phase == 3) {
+                       int err;
+
                        inode = f2fs_iget(sb, dni.ino);
                        if (IS_ERR(inode) || is_bad_inode(inode) ||
                                        special_file(inode->i_mode))
                                continue;
 
-                       if (is_inode_flag_set(inode, FI_PIN_FILE) &&
-                                                       gc_type == FG_GC) {
-                               f2fs_pin_file_control(inode, true);
+                       err = f2fs_gc_pinned_control(inode, gc_type, segno);
+                       if (err == -EAGAIN) {
                                iput(inode);
                                return submitted;
                        }
@@ -1766,9 +1812,17 @@ gc_more:
                ret = -EINVAL;
                goto stop;
        }
+retry:
        ret = __get_victim(sbi, &segno, gc_type);
-       if (ret)
+       if (ret) {
+               /* allow searching for a victim among sections that have pinned data */
+               if (ret == -ENODATA && gc_type == FG_GC &&
+                               f2fs_pinned_section_exists(DIRTY_I(sbi))) {
+                       f2fs_unpin_all_sections(sbi, false);
+                       goto retry;
+               }
                goto stop;
+       }
 
        seg_freed = do_garbage_collect(sbi, segno, &gc_list, gc_type, force);
        if (gc_type == FG_GC &&
@@ -1819,6 +1873,9 @@ stop:
        SIT_I(sbi)->last_victim[ALLOC_NEXT] = 0;
        SIT_I(sbi)->last_victim[FLUSH_DEVICE] = init_segno;
 
+       if (gc_type == FG_GC)
+               f2fs_unpin_all_sections(sbi, true);
+
        trace_f2fs_gc_end(sbi->sb, ret, total_freed, sec_freed,
                                get_pages(sbi, F2FS_DIRTY_NODES),
                                get_pages(sbi, F2FS_DIRTY_DENTS),
index 388bedc..87ff2b3 100644 (file)
@@ -4654,6 +4654,13 @@ static int init_victim_secmap(struct f2fs_sb_info *sbi)
        dirty_i->victim_secmap = f2fs_kvzalloc(sbi, bitmap_size, GFP_KERNEL);
        if (!dirty_i->victim_secmap)
                return -ENOMEM;
+
+       dirty_i->pinned_secmap = f2fs_kvzalloc(sbi, bitmap_size, GFP_KERNEL);
+       if (!dirty_i->pinned_secmap)
+               return -ENOMEM;
+
+       dirty_i->pinned_secmap_cnt = 0;
+       dirty_i->enable_pin_section = true;
        return 0;
 }
 
@@ -5242,6 +5249,7 @@ static void destroy_victim_secmap(struct f2fs_sb_info *sbi)
 {
        struct dirty_seglist_info *dirty_i = DIRTY_I(sbi);
 
+       kvfree(dirty_i->pinned_secmap);
        kvfree(dirty_i->victim_secmap);
 }
 
index 1fa26a9..8fbc9f6 100644 (file)
@@ -295,6 +295,9 @@ struct dirty_seglist_info {
        struct mutex seglist_lock;              /* lock for segment bitmaps */
        int nr_dirty[NR_DIRTY_TYPE];            /* # of dirty segments */
        unsigned long *victim_secmap;           /* background GC victims */
+       unsigned long *pinned_secmap;           /* pinned victims from foreground GC */
+       unsigned int pinned_secmap_cnt;         /* count of victims which have pinned data */
+       bool enable_pin_section;                /* enable pinning section */
 };
 
 /* victim selection function for cleaning and SSR */