memcg: introduce non-blocking limit setting option

author Shakeel Butt <shakeel.butt@linux.dev>

Sat, 19 Apr 2025 18:35:45 +0000 (11:35 -0700)

committer Andrew Morton <akpm@linux-foundation.org>

Tue, 13 May 2025 06:50:35 +0000 (23:50 -0700)
author Shakeel Butt <shakeel.butt@linux.dev>
Sat, 19 Apr 2025 18:35:45 +0000 (11:35 -0700)
committer Andrew Morton <akpm@linux-foundation.org>
Tue, 13 May 2025 06:50:35 +0000 (23:50 -0700)
diff --git a/Documentation/admin-guide/cgroup-v2.rst b/Documentation/admin-guide/cgroup-v2.rst

index 1a16ce68a4d7f6f8c9070be89c4975dbfa79077e..b34f1dd969e016284c2df0ed01535f48db98f8b1 100644 (file)
--- a/Documentation/admin-guide/cgroup-v2.rst
+++ b/Documentation/admin-guide/cgroup-v2.rst
@@ -1299,6 +1299,13 @@ PAGE_SIZE multiple when read back.
         monitors the limited cgroup to alleviate heavy reclaim
         pressure.
  
+        If memory.high is opened with O_NONBLOCK, then the synchronous
+        reclaim is bypassed. This is useful for admin processes that
+        need to dynamically adjust the job's memory limits without
+        expending their own CPU resources on memory reclamation. The
+        job will trigger the reclaim and/or get throttled on its
+        next charge request.
+
    memory.max
         A read-write single value file which exists on non-root
         cgroups.  The default is "max".
@@ -1316,6 +1323,13 @@ PAGE_SIZE multiple when read back.
         Caller could retry them differently, return into userspace
         as -ENOMEM or silently ignore in cases like disk readahead.
  
+        If memory.max is opened with O_NONBLOCK, then the synchronous
+        reclaim and oom-kill are bypassed. This is useful for admin
+        processes that need to dynamically adjust the job's memory limits
+        without expending their own CPU resources on memory reclamation.
+        The job will trigger the reclaim and/or oom-kill on its next
+        charge request.
+
    memory.reclaim
         A write-only nested-keyed file which exists for all cgroups.
  
diff --git a/mm/memcontrol.c b/mm/memcontrol.c

index 8ed265852423f391731609ee73b63ad9d66c65b6..d3b6f50e00d47fcdf26d199e7daa7cc526288147 100644 (file)
--- a/mm/memcontrol.c
+++ b/mm/memcontrol.c
@@ -4269,6 +4269,9 @@ static ssize_t memory_high_write(struct kernfs_open_file *of,
  
         page_counter_set_high(&memcg->memory, high);
  
+       if (of->file->f_flags & O_NONBLOCK)
+               goto out;
+
         for (;;) {
                 unsigned long nr_pages = page_counter_read(&memcg->memory);
                 unsigned long reclaimed;
@@ -4291,7 +4294,7 @@ static ssize_t memory_high_write(struct kernfs_open_file *of,
                 if (!reclaimed && !nr_retries--)
                         break;
         }
-
+out:
         memcg_wb_domain_size_changed(memcg);
         return nbytes;
  }
@@ -4318,6 +4321,9 @@ static ssize_t memory_max_write(struct kernfs_open_file *of,
  
         xchg(&memcg->memory.max, max);
  
+       if (of->file->f_flags & O_NONBLOCK)
+               goto out;
+
         for (;;) {
                 unsigned long nr_pages = page_counter_read(&memcg->memory);
  
@@ -4345,7 +4351,7 @@ static ssize_t memory_max_write(struct kernfs_open_file *of,
                         break;
                 cond_resched();
         }
-
+out:
         memcg_wb_domain_size_changed(memcg);
         return nbytes;
  }
author	Shakeel Butt <shakeel.butt@linux.dev>
	Sat, 19 Apr 2025 18:35:45 +0000 (11:35 -0700)
committer	Andrew Morton <akpm@linux-foundation.org>
	Tue, 13 May 2025 06:50:35 +0000 (23:50 -0700)
Documentation/admin-guide/cgroup-v2.rst		patch | blob | blame | history
mm/memcontrol.c		patch | blob | blame | history