git.ipfire.org Git - thirdparty/kernel/stable.git/commitdiff
f2fs: add a sysfs entry to reclaim POSIX_FADV_NOREUSE pages
author: Jaegeuk Kim <jaegeuk@kernel.org>
Fri, 31 Jan 2025 22:27:57 +0000 (22:27 +0000)
committer: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Thu, 18 Dec 2025 12:55:15 +0000 (13:55 +0100)
[ Upstream commit a907f3a68ee26ba493a08a958809208d17f3347e ]

1. fadvise(fd1, POSIX_FADV_NOREUSE, {0,3});
2. fadvise(fd2, POSIX_FADV_NOREUSE, {1,2});
3. fadvise(fd3, POSIX_FADV_NOREUSE, {3,1});
4. echo 1024 > /sys/fs/f2fs/tuning/reclaim_caches_kb

This gives a way to reclaim file-backed pages by iterating over all f2fs mounts
until 1MB of the page cache ranges registered by #1, #2, and #3 is reclaimed.

5. cat /sys/fs/f2fs/tuning/reclaim_caches_kb
-> gives total number of registered file ranges.

Reviewed-by: Chao Yu <chao@kernel.org>
Signed-off-by: Jaegeuk Kim <jaegeuk@kernel.org>
Stable-dep-of: e462fc48ceb8 ("f2fs: maintain one time GC mode is enabled during whole zoned GC cycle")
Signed-off-by: Sasha Levin <sashal@kernel.org>
Documentation/ABI/testing/sysfs-fs-f2fs
fs/f2fs/f2fs.h
fs/f2fs/shrinker.c
fs/f2fs/sysfs.c

index 3e1630c70d8ae70456de35a627afde1211c8882c..81deae2af84d2a6b7b2999dfb3c86c9a246f3131 100644 (file)
@@ -828,3 +828,10 @@ Date:              November 2024
 Contact:       "Chao Yu" <chao@kernel.org>
 Description:   It controls max read extent count for per-inode, the value of threshold
                is 10240 by default.
+
+What:          /sys/fs/f2fs/tuning/reclaim_caches_kb
+Date:          February 2025
+Contact:       "Jaegeuk Kim" <jaegeuk@kernel.org>
+Description:   It reclaims the given number of KBs of file-backed pages
+               registered by ioctl(F2FS_IOC_DONATE_RANGE).
+               For example, writing N tries to drop N KBs of page cache from the LRU.
index 7ced2e2c6574606ea815c94d7bc79c05d6fe81f3..f2f3e02b6fd4c845221ed5cfaf8202940b453e9d 100644 (file)
@@ -4271,6 +4271,8 @@ unsigned long f2fs_shrink_count(struct shrinker *shrink,
                        struct shrink_control *sc);
 unsigned long f2fs_shrink_scan(struct shrinker *shrink,
                        struct shrink_control *sc);
+unsigned int f2fs_donate_files(void);
+void f2fs_reclaim_caches(unsigned int reclaim_caches_kb);
 void f2fs_join_shrinker(struct f2fs_sb_info *sbi);
 void f2fs_leave_shrinker(struct f2fs_sb_info *sbi);
 
index 83d6fb97dcae0f84ff6bd76ad389198a5660a5c7..45efff635d8e41fcad01c6bd0291ef92c46b0fed 100644 (file)
@@ -130,6 +130,96 @@ unsigned long f2fs_shrink_scan(struct shrinker *shrink,
        return freed;
 }
 
+/*
+ * Sum the donate_files counters of the f2fs instances on f2fs_list.
+ *
+ * An instance whose umount_mutex cannot be taken without blocking is
+ * skipped, so the result only covers the instances that could be locked.
+ *
+ * Returns the accumulated count.
+ */
+unsigned int f2fs_donate_files(void)
+{
+       struct list_head *pos;
+       unsigned int total = 0;
+
+       spin_lock(&f2fs_list_lock);
+       for (pos = f2fs_list.next; pos != &f2fs_list; ) {
+               struct f2fs_sb_info *sbi =
+                       list_entry(pos, struct f2fs_sb_info, s_list);
+
+               /* stop f2fs_put_super */
+               if (mutex_trylock(&sbi->umount_mutex)) {
+                       /* the counter is read without the list spinlock held */
+                       spin_unlock(&f2fs_list_lock);
+
+                       total += sbi->donate_files;
+
+                       /* advance under the list lock, then release the mutex */
+                       spin_lock(&f2fs_list_lock);
+                       pos = pos->next;
+                       mutex_unlock(&sbi->umount_mutex);
+               } else {
+                       pos = pos->next;
+               }
+       }
+       spin_unlock(&f2fs_list_lock);
+
+       return total;
+}
+
+/*
+ * Invalidate donated page-cache ranges of one f2fs instance.
+ *
+ * @sbi: instance whose DONATE_INODE list is walked
+ * @reclaim_caches_kb: amount to reclaim, in KB
+ *
+ * Visits at most sbi->donate_files entries. Each visited entry is taken from
+ * the head of the DONATE_INODE list and rotated to its tail; its whole
+ * [donate_start, donate_end] range is charged against the page budget and
+ * then invalidated.
+ *
+ * Returns the part of the budget that is left over, converted back to KB.
+ */
+static unsigned int do_reclaim_caches(struct f2fs_sb_info *sbi,
+                               unsigned int reclaim_caches_kb)
+{
+       const int kb_to_pages_shift = PAGE_SHIFT - 10;
+       pgoff_t budget = reclaim_caches_kb >> kb_to_pages_shift;
+       unsigned int files_left = sbi->donate_files;
+
+       while (budget != 0 && files_left-- != 0) {
+               struct f2fs_inode_info *fi;
+               struct inode *inode;
+               pgoff_t range_pages;
+
+               spin_lock(&sbi->inode_lock[DONATE_INODE]);
+               if (list_empty(&sbi->inode_list[DONATE_INODE])) {
+                       spin_unlock(&sbi->inode_lock[DONATE_INODE]);
+                       break;
+               }
+               fi = list_first_entry(&sbi->inode_list[DONATE_INODE],
+                                       struct f2fs_inode_info, gdonate_list);
+               /* rotate the entry so the next iteration sees a different head */
+               list_move_tail(&fi->gdonate_list, &sbi->inode_list[DONATE_INODE]);
+               inode = igrab(&fi->vfs_inode);
+               spin_unlock(&sbi->inode_lock[DONATE_INODE]);
+
+               /* igrab() returned no inode: move on to the next entry */
+               if (!inode)
+                       continue;
+
+               range_pages = fi->donate_end - fi->donate_start + 1;
+               if (budget < range_pages)
+                       budget = 0;
+               else
+                       budget -= range_pages;
+               invalidate_inode_pages2_range(inode->i_mapping,
+                                       fi->donate_start, fi->donate_end);
+               iput(inode);
+               cond_resched();
+       }
+       return budget << kb_to_pages_shift;
+}
+
+/*
+ * Reclaim donated page cache across the f2fs instances on f2fs_list.
+ *
+ * @reclaim_caches_kb: total amount to reclaim, in KB
+ *
+ * Every instance whose umount_mutex can be taken without blocking is handed
+ * to do_reclaim_caches(), whose return value becomes the remaining request.
+ * The walk ends when the list is exhausted or nothing is left to reclaim.
+ */
+void f2fs_reclaim_caches(unsigned int reclaim_caches_kb)
+{
+       struct list_head *pos;
+
+       spin_lock(&f2fs_list_lock);
+       for (pos = f2fs_list.next;
+            pos != &f2fs_list && reclaim_caches_kb; ) {
+               struct f2fs_sb_info *sbi =
+                       list_entry(pos, struct f2fs_sb_info, s_list);
+
+               /* stop f2fs_put_super */
+               if (mutex_trylock(&sbi->umount_mutex)) {
+                       /* reclaim runs without the list spinlock held */
+                       spin_unlock(&f2fs_list_lock);
+
+                       reclaim_caches_kb =
+                               do_reclaim_caches(sbi, reclaim_caches_kb);
+
+                       /* advance under the list lock, then release the mutex */
+                       spin_lock(&f2fs_list_lock);
+                       pos = pos->next;
+                       mutex_unlock(&sbi->umount_mutex);
+               } else {
+                       pos = pos->next;
+               }
+       }
+       spin_unlock(&f2fs_list_lock);
+}
+
 void f2fs_join_shrinker(struct f2fs_sb_info *sbi)
 {
        spin_lock(&f2fs_list_lock);
index b3c04ecc3a2711d35d97b9a22b60903e6cfd3012..5c4fd0f3acab729eea2477e187fb57fe4832860e 100644 (file)
@@ -939,6 +939,39 @@ static struct f2fs_base_attr f2fs_base_attr_##_name = {            \
        .show   = f2fs_feature_show,                            \
 }
 
+/*
+ * Show handler installed by F2FS_TUNE_RW_ATTR().
+ *
+ * For "reclaim_caches_kb" it prints the value of f2fs_donate_files();
+ * for any other attribute name it prints 0.
+ *
+ * Returns whatever sysfs_emit() returns.
+ */
+static ssize_t f2fs_tune_show(struct f2fs_base_attr *a, char *buf)
+{
+       unsigned int value;
+
+       if (strcmp(a->attr.name, "reclaim_caches_kb") == 0)
+               value = f2fs_donate_files();
+       else
+               value = 0;
+
+       return sysfs_emit(buf, "%u\n", value);
+}
+
+/*
+ * Store handler installed by F2FS_TUNE_RW_ATTR().
+ *
+ * @a: attribute being written
+ * @buf: user-supplied text; leading whitespace is skipped before parsing
+ * @count: number of bytes written
+ *
+ * The value is parsed as an unsigned int because f2fs_reclaim_caches()
+ * takes an unsigned int: parsing into a wider type would let an
+ * out-of-range request be truncated silently instead of being rejected.
+ *
+ * Returns @count on success, or the error code from kstrtouint() when the
+ * input cannot be parsed as an unsigned int.
+ */
+static ssize_t f2fs_tune_store(struct f2fs_base_attr *a,
+                       const char *buf, size_t count)
+{
+       unsigned int t;
+       int ret;
+
+       ret = kstrtouint(skip_spaces(buf), 0, &t);
+       if (ret)
+               return ret;
+
+       if (!strcmp(a->attr.name, "reclaim_caches_kb"))
+               f2fs_reclaim_caches(t);
+
+       return count;
+}
+
+#define F2FS_TUNE_RW_ATTR(_name)       /* defines f2fs_base_attr_<_name> */    \
+static struct f2fs_base_attr f2fs_base_attr_##_name = {                \
+       .attr = {.name = __stringify(_name), .mode = 0644 },    /* file name is the stringified _name */ \
+       .show   = f2fs_tune_show,       /* read handler */      \
+       .store  = f2fs_tune_store,      /* write handler */     \
+}
+
 static ssize_t f2fs_sb_feature_show(struct f2fs_attr *a,
                struct f2fs_sb_info *sbi, char *buf)
 {
@@ -1389,6 +1422,14 @@ static struct attribute *f2fs_sb_feat_attrs[] = {
 };
 ATTRIBUTE_GROUPS(f2fs_sb_feat);
 
+F2FS_TUNE_RW_ATTR(reclaim_caches_kb);  /* defines f2fs_base_attr_reclaim_caches_kb */
+
+static struct attribute *f2fs_tune_attrs[] = { /* NULL-terminated attribute list */
+       BASE_ATTR_LIST(reclaim_caches_kb),      /* the only entry in this list */
+       NULL,
+};
+ATTRIBUTE_GROUPS(f2fs_tune);   /* presumably provides f2fs_tune_groups used by f2fs_tune_ktype; confirm */
+
 static const struct sysfs_ops f2fs_attr_ops = {
        .show   = f2fs_attr_show,
        .store  = f2fs_attr_store,
@@ -1422,6 +1463,20 @@ static struct kobject f2fs_feat = {
        .kset   = &f2fs_kset,
 };
 
+static const struct sysfs_ops f2fs_tune_attr_ops = {   /* sysfs callbacks used by f2fs_tune_ktype */
+       .show   = f2fs_base_attr_show,  /* presumably forwards to the attribute's own .show; confirm */
+       .store  = f2fs_base_attr_store, /* presumably forwards to the attribute's own .store; confirm */
+};
+
+static const struct kobj_type f2fs_tune_ktype = {      /* kobject type given to kobject_init_and_add() for f2fs_tune */
+       .default_groups = f2fs_tune_groups,
+       .sysfs_ops      = &f2fs_tune_attr_ops,
+};
+
+static struct kobject f2fs_tune = {     /* added under the name "tuning" by f2fs_init_sysfs() */
+       .kset   = &f2fs_kset,
+};
+
 static ssize_t f2fs_stat_attr_show(struct kobject *kobj,
                                struct attribute *attr, char *buf)
 {
@@ -1660,6 +1715,11 @@ int __init f2fs_init_sysfs(void)
        if (ret)
                goto put_kobject;
 
+       ret = kobject_init_and_add(&f2fs_tune, &f2fs_tune_ktype,
+                                  NULL, "tuning");
+       if (ret)
+               goto put_kobject;
+
        f2fs_proc_root = proc_mkdir("fs/f2fs", NULL);
        if (!f2fs_proc_root) {
                ret = -ENOMEM;
@@ -1667,7 +1727,9 @@ int __init f2fs_init_sysfs(void)
        }
 
        return 0;
+
 put_kobject:
+       kobject_put(&f2fs_tune);
        kobject_put(&f2fs_feat);
        kset_unregister(&f2fs_kset);
        return ret;
@@ -1675,6 +1737,7 @@ put_kobject:
 
 void f2fs_exit_sysfs(void)
 {
+       kobject_put(&f2fs_tune);
        kobject_put(&f2fs_feat);
        kset_unregister(&f2fs_kset);
        remove_proc_entry("fs/f2fs", NULL);