]> git.ipfire.org Git - thirdparty/linux.git/commitdiff
mm/mglru: scan and count the exact number of folios
author Kairui Song <kasong@tencent.com>
Mon, 27 Apr 2026 18:06:56 +0000 (02:06 +0800)
committer Andrew Morton <akpm@linux-foundation.org>
Thu, 4 Jun 2026 21:45:04 +0000 (14:45 -0700)
Make the scan helpers return the exact number of folios being scanned or
isolated.  Since the reclaim loop now has a natural scan budget that
controls the scan progress, returning the scan number and consuming the
budget makes the scan more accurate and easier to follow.

The number of scanned folios for each iteration is always larger than 0,
unless the reclaim must stop for a forced aging, so there is no more need
for any special handling when there is no progress made:

- `return isolated || !remaining ?  scanned : 0` in scan_folios: both
  the function and its caller now just return the exact scan count, which,
  combined with the scan budget introduced in the previous commit, avoids
  livelock or under-scanning.

- `scanned += try_to_inc_min_seq` in evict_folios: adding a bool as a
  scan count was confusing and is no longer needed, as the scan number
  should never be zero as long as there are still evictable gens.  We may
  encounter an empty old gen that returns a scan count of 0; to avoid that,
  call try_to_inc_min_seq before isolation, which has little to no overhead
  in most cases.

- `evictable_min_seq + MIN_NR_GENS > max_seq` guard in evict_folios: the
  per-type get_nr_gens == MIN_NR_GENS check in scan_folios naturally
  returns 0 when only two gens remain and breaks the loop.

Also change try_to_inc_min_seq to return void, as its return value is no
longer used by any caller.  Call it before isolate_folios to flush any
empty gens left by external folio freeing, and again after isolate_folios
when scanning moved or protected folios may have emptied the oldest gen.

The scan still stops if only two gens are left, as the scan number will be
zero.  This matches the previous behavior.  This forced gen protection may
be removed or softened later to improve reclaim further.

Link: https://lore.kernel.org/20260428-mglru-reclaim-v7-5-02fabb92dc43@tencent.com
Signed-off-by: Kairui Song <kasong@tencent.com>
Reviewed-by: Axel Rasmussen <axelrasmussen@google.com>
Reviewed-by: Chen Ridong <chenridong@huaweicloud.com>
Reviewed-by: Baolin Wang <baolin.wang@linux.alibaba.com>
Cc: Barry Song <baohua@kernel.org>
Cc: Chris Li <chrisl@kernel.org>
Cc: David Hildenbrand <david@kernel.org>
Cc: David Stevens <stevensd@google.com>
Cc: Johannes Weiner <hannes@cmpxchg.org>
Cc: Kalesh Singh <kaleshsingh@google.com>
Cc: Leno Hou <lenohou@gmail.com>
Cc: Lorenzo Stoakes <ljs@kernel.org>
Cc: Michal Hocko <mhocko@kernel.org>
Cc: Shakeel Butt <shakeel.butt@linux.dev>
Cc: Suren Baghdasaryan <surenb@google.com>
Cc: Vernon Yang <vernon2gm@gmail.com>
Cc: Wei Xu <weixugc@google.com>
Cc: Yafang <laoar.shao@gmail.com>
Cc: Yuanchu Xie <yuanchu@google.com>
Cc: Yu Zhao <yuzhao@google.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
mm/vmscan.c

index 66ddf211e3ca9269785b411dbd6df21be7e2392e..adfe3e6645d661b6ded076ed719a7caaae2ae320 100644 (file)
@@ -3882,10 +3882,9 @@ done:
        return true;
 }
 
-static bool try_to_inc_min_seq(struct lruvec *lruvec, int swappiness)
+static void try_to_inc_min_seq(struct lruvec *lruvec, int swappiness)
 {
        int gen, type, zone;
-       bool success = false;
        bool seq_inc_flag = false;
        struct lru_gen_folio *lrugen = &lruvec->lrugen;
        DEFINE_MIN_SEQ(lruvec);
@@ -3911,11 +3910,10 @@ next:
 
        /*
         * If min_seq[type] of both anonymous and file is not increased,
-        * we can directly return false to avoid unnecessary checking
-        * overhead later.
+        * return here to avoid unnecessary checking overhead later.
         */
        if (!seq_inc_flag)
-               return success;
+               return;
 
        /* see the comment on lru_gen_folio */
        if (swappiness && swappiness <= MAX_SWAPPINESS) {
@@ -3933,10 +3931,7 @@ next:
 
                reset_ctrl_pos(lruvec, type, true);
                WRITE_ONCE(lrugen->min_seq[type], min_seq[type]);
-               success = true;
        }
-
-       return success;
 }
 
 static bool inc_max_seq(struct lruvec *lruvec, unsigned long seq, int swappiness)
@@ -4690,7 +4685,7 @@ static bool isolate_folio(struct lruvec *lruvec, struct folio *folio, struct sca
 
 static int scan_folios(unsigned long nr_to_scan, struct lruvec *lruvec,
                       struct scan_control *sc, int type, int tier,
-                      struct list_head *list)
+                      struct list_head *list, int *isolatedp)
 {
        int i;
        int gen;
@@ -4760,11 +4755,9 @@ static int scan_folios(unsigned long nr_to_scan, struct lruvec *lruvec,
                                type ? LRU_INACTIVE_FILE : LRU_INACTIVE_ANON);
        if (type == LRU_GEN_FILE)
                sc->nr.file_taken += isolated;
-       /*
-        * There might not be eligible folios due to reclaim_idx. Check the
-        * remaining to prevent livelock if it's not making progress.
-        */
-       return isolated || !remaining ? scanned : 0;
+
+       *isolatedp = isolated;
+       return scanned;
 }
 
 static int get_tier_idx(struct lruvec *lruvec, int type)
@@ -4808,33 +4801,36 @@ static int get_type_to_scan(struct lruvec *lruvec, int swappiness)
 
 static int isolate_folios(unsigned long nr_to_scan, struct lruvec *lruvec,
                          struct scan_control *sc, int swappiness,
-                         int *type_scanned, struct list_head *list)
+                         struct list_head *list, int *isolated,
+                         int *isolate_type, int *isolate_scanned)
 {
        int i;
+       int total_scanned = 0;
        int type = get_type_to_scan(lruvec, swappiness);
 
        for_each_evictable_type(i, swappiness) {
                int scanned;
                int tier = get_tier_idx(lruvec, type);
 
-               *type_scanned = type;
+               scanned = scan_folios(nr_to_scan, lruvec, sc,
+                                     type, tier, list, isolated);
 
-               scanned = scan_folios(nr_to_scan, lruvec, sc, type, tier, list);
-               if (scanned)
-                       return scanned;
+               total_scanned += scanned;
+               if (*isolated) {
+                       *isolate_type = type;
+                       *isolate_scanned = scanned;
+                       break;
+               }
 
                type = !type;
        }
 
-       return 0;
+       return total_scanned;
 }
 
 static int evict_folios(unsigned long nr_to_scan, struct lruvec *lruvec,
                        struct scan_control *sc, int swappiness)
 {
-       int type;
-       int scanned;
-       int reclaimed;
        LIST_HEAD(list);
        LIST_HEAD(clean);
        struct folio *folio;
@@ -4842,19 +4838,23 @@ static int evict_folios(unsigned long nr_to_scan, struct lruvec *lruvec,
        enum node_stat_item item;
        struct reclaim_stat stat;
        struct lru_gen_mm_walk *walk;
+       int scanned, reclaimed;
+       int isolated = 0, type, type_scanned;
        bool skip_retry = false;
-       struct lru_gen_folio *lrugen = &lruvec->lrugen;
        struct mem_cgroup *memcg = lruvec_memcg(lruvec);
        struct pglist_data *pgdat = lruvec_pgdat(lruvec);
 
        lruvec_lock_irq(lruvec);
 
-       scanned = isolate_folios(nr_to_scan, lruvec, sc, swappiness, &type, &list);
+       /* In case folio deletion left empty old gens, flush them */
+       try_to_inc_min_seq(lruvec, swappiness);
 
-       scanned += try_to_inc_min_seq(lruvec, swappiness);
+       scanned = isolate_folios(nr_to_scan, lruvec, sc, swappiness,
+                                &list, &isolated, &type, &type_scanned);
 
-       if (evictable_min_seq(lrugen->min_seq, swappiness) + MIN_NR_GENS > lrugen->max_seq)
-               scanned = 0;
+       /* Scanning may have emptied the oldest gen, flush it */
+       if (scanned)
+               try_to_inc_min_seq(lruvec, swappiness);
 
        lruvec_unlock_irq(lruvec);
 
@@ -4865,7 +4865,7 @@ retry:
        sc->nr.unqueued_dirty += stat.nr_unqueued_dirty;
        sc->nr_reclaimed += reclaimed;
        trace_mm_vmscan_lru_shrink_inactive(pgdat->node_id,
-                       scanned, reclaimed, &stat, sc->priority,
+                       type_scanned, reclaimed, &stat, sc->priority,
                        type ? LRU_INACTIVE_FILE : LRU_INACTIVE_ANON);
 
        list_for_each_entry_safe_reverse(folio, next, &list, lru) {