mm/vmscan: unify writeback reclaim statistic and throttling

author Kairui Song <kasong@tencent.com>

Mon, 27 Apr 2026 18:07:06 +0000 (02:07 +0800)

committer Andrew Morton <akpm@linux-foundation.org>

Thu, 4 Jun 2026 21:45:05 +0000 (14:45 -0700)
author Kairui Song <kasong@tencent.com>
Mon, 27 Apr 2026 18:07:06 +0000 (02:07 +0800)
committer Andrew Morton <akpm@linux-foundation.org>
Thu, 4 Jun 2026 21:45:05 +0000 (14:45 -0700)
diff --git a/mm/vmscan.c b/mm/vmscan.c

index 7494ac73e3f19344ec00753d3d0cae009d0eac12..e8a90911bf88fba6279daee1d2b59f4db2346316 100644 (file)
--- a/mm/vmscan.c
+++ b/mm/vmscan.c
@@ -1946,6 +1946,44 @@ static int current_may_throttle(void)
         return !(current->flags & PF_LOCAL_THROTTLE);
  }
  
+static void handle_reclaim_writeback(unsigned long nr_taken,
+                                    struct pglist_data *pgdat,
+                                    struct scan_control *sc,
+                                    struct reclaim_stat *stat)
+{
+       /*
+        * If dirty folios are scanned that are not queued for IO, it
+        * implies that flushers are not doing their job. This can
+        * happen when memory pressure pushes dirty folios to the end of
+        * the LRU before the dirty limits are breached and the dirty
+        * data has expired. It can also happen when the proportion of
+        * dirty folios grows not through writes but through memory
+        * pressure reclaiming all the clean cache. And in some cases,
+        * the flushers simply cannot keep up with the allocation
+        * rate. Nudge the flusher threads in case they are asleep.
+        */
+       if (stat->nr_unqueued_dirty == nr_taken) {
+               wakeup_flusher_threads(WB_REASON_VMSCAN);
+               /*
+                * For cgroupv1 dirty throttling is achieved by waking up
+                * the kernel flusher here and later waiting on folios
+                * which are in writeback to finish (see shrink_folio_list()).
+                *
+                * Flusher may not be able to issue writeback quickly
+                * enough for cgroupv1 writeback throttling to work
+                * on a large system.
+                */
+               if (!writeback_throttling_sane(sc))
+                       reclaim_throttle(pgdat, VMSCAN_THROTTLE_WRITEBACK);
+       }
+
+       sc->nr.dirty += stat->nr_dirty;
+       sc->nr.congested += stat->nr_congested;
+       sc->nr.writeback += stat->nr_writeback;
+       sc->nr.immediate += stat->nr_immediate;
+       sc->nr.taken += nr_taken;
+}
+
  /*
   * shrink_inactive_list() is a helper for shrink_node().  It returns the number
   * of reclaimed pages
@@ -2009,39 +2047,7 @@ static unsigned long shrink_inactive_list(unsigned long nr_to_scan,
         lruvec_lock_irq(lruvec);
         lru_note_cost_unlock_irq(lruvec, file, stat.nr_pageout,
                                         nr_scanned - nr_reclaimed);
-
-       /*
-        * If dirty folios are scanned that are not queued for IO, it
-        * implies that flushers are not doing their job. This can
-        * happen when memory pressure pushes dirty folios to the end of
-        * the LRU before the dirty limits are breached and the dirty
-        * data has expired. It can also happen when the proportion of
-        * dirty folios grows not through writes but through memory
-        * pressure reclaiming all the clean cache. And in some cases,
-        * the flushers simply cannot keep up with the allocation
-        * rate. Nudge the flusher threads in case they are asleep.
-        */
-       if (stat.nr_unqueued_dirty == nr_taken) {
-               wakeup_flusher_threads(WB_REASON_VMSCAN);
-               /*
-                * For cgroupv1 dirty throttling is achieved by waking up
-                * the kernel flusher here and later waiting on folios
-                * which are in writeback to finish (see shrink_folio_list()).
-                *
-                * Flusher may not be able to issue writeback quickly
-                * enough for cgroupv1 writeback throttling to work
-                * on a large system.
-                */
-               if (!writeback_throttling_sane(sc))
-                       reclaim_throttle(pgdat, VMSCAN_THROTTLE_WRITEBACK);
-       }
-
-       sc->nr.dirty += stat.nr_dirty;
-       sc->nr.congested += stat.nr_congested;
-       sc->nr.writeback += stat.nr_writeback;
-       sc->nr.immediate += stat.nr_immediate;
-       sc->nr.taken += nr_taken;
-
+       handle_reclaim_writeback(nr_taken, pgdat, sc, &stat);
         trace_mm_vmscan_lru_shrink_inactive(pgdat->node_id,
                         nr_scanned, nr_reclaimed, &stat, sc->priority, file);
         return nr_reclaimed;
@@ -4833,26 +4839,13 @@ static int evict_folios(unsigned long nr_to_scan, struct lruvec *lruvec,
  retry:
         reclaimed = shrink_folio_list(&list, pgdat, sc, &stat, false, memcg);
         sc->nr_reclaimed += reclaimed;
+       /* Retry pass is only meant for clean folios without new isolation */
+       if (isolated)
+               handle_reclaim_writeback(isolated, pgdat, sc, &stat);
         trace_mm_vmscan_lru_shrink_inactive(pgdat->node_id,
                         type_scanned, reclaimed, &stat, sc->priority,
                         type ? LRU_INACTIVE_FILE : LRU_INACTIVE_ANON);
  
-       /*
-        * If too many file cache in the coldest generation can't be evicted
-        * due to being dirty, wake up the flusher.
-        */
-       if (stat.nr_unqueued_dirty == isolated) {
-               wakeup_flusher_threads(WB_REASON_VMSCAN);
-
-               /*
-                * For cgroupv1 dirty throttling is achieved by waking up
-                * the kernel flusher here and later waiting on folios
-                * which are in writeback to finish (see shrink_folio_list()).
-                */
-               if (!writeback_throttling_sane(sc))
-                       reclaim_throttle(pgdat, VMSCAN_THROTTLE_WRITEBACK);
-       }
-
         list_for_each_entry_safe_reverse(folio, next, &list, lru) {
                 DEFINE_MIN_SEQ(lruvec);
  
@@ -4895,6 +4888,7 @@ retry:
  
         if (!list_empty(&list)) {
                 skip_retry = true;
+               isolated = 0;
                 goto retry;
         }
author	Kairui Song <kasong@tencent.com>
	Mon, 27 Apr 2026 18:07:06 +0000 (02:07 +0800)
committer	Andrew Morton <akpm@linux-foundation.org>
	Thu, 4 Jun 2026 21:45:05 +0000 (14:45 -0700)