]> git.ipfire.org Git - thirdparty/kernel/stable.git/blame - include/linux/memcontrol.h
mm, memcontrol: move swap charge handling into get_swap_page()
[thirdparty/kernel/stable.git] / include / linux / memcontrol.h
CommitLineData
8cdea7c0
BS
1/* memcontrol.h - Memory Controller
2 *
3 * Copyright IBM Corporation, 2007
4 * Author Balbir Singh <balbir@linux.vnet.ibm.com>
5 *
78fb7466
PE
6 * Copyright 2007 OpenVZ SWsoft Inc
7 * Author: Pavel Emelianov <xemul@openvz.org>
8 *
8cdea7c0
BS
9 * This program is free software; you can redistribute it and/or modify
10 * it under the terms of the GNU General Public License as published by
11 * the Free Software Foundation; either version 2 of the License, or
12 * (at your option) any later version.
13 *
14 * This program is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 * GNU General Public License for more details.
18 */
19
20#ifndef _LINUX_MEMCONTROL_H
21#define _LINUX_MEMCONTROL_H
f8d66542 22#include <linux/cgroup.h>
456f998e 23#include <linux/vm_event_item.h>
7ae1e1d0 24#include <linux/hardirq.h>
a8964b9b 25#include <linux/jump_label.h>
33398cf2
MH
26#include <linux/page_counter.h>
27#include <linux/vmpressure.h>
28#include <linux/eventfd.h>
00f3ca2c
JW
29#include <linux/mm.h>
30#include <linux/vmstat.h>
33398cf2 31#include <linux/writeback.h>
fdf1cdb9 32#include <linux/page-flags.h>
456f998e 33
78fb7466 34struct mem_cgroup;
8697d331
BS
35struct page;
36struct mm_struct;
2633d7a0 37struct kmem_cache;
78fb7466 38
71cd3113
JW
39/* Cgroup-specific page state, on top of universal node page state */
40enum memcg_stat_item {
41 MEMCG_CACHE = NR_VM_NODE_STAT_ITEMS,
42 MEMCG_RSS,
43 MEMCG_RSS_HUGE,
44 MEMCG_SWAP,
45 MEMCG_SOCK,
46 /* XXX: why are these zone and not node counters? */
47 MEMCG_KERNEL_STACK_KB,
b2807f07 48 MEMCG_NR_STAT,
2a7106f2
GT
49};
50
e27be240
JW
51enum memcg_memory_event {
52 MEMCG_LOW,
71cd3113
JW
53 MEMCG_HIGH,
54 MEMCG_MAX,
55 MEMCG_OOM,
e27be240 56 MEMCG_NR_MEMORY_EVENTS,
71cd3113
JW
57};
58
5660048c 59struct mem_cgroup_reclaim_cookie {
ef8f2327 60 pg_data_t *pgdat;
5660048c
JW
61 int priority;
62 unsigned int generation;
63};
64
71cd3113
JW
65#ifdef CONFIG_MEMCG
66
67#define MEM_CGROUP_ID_SHIFT 16
68#define MEM_CGROUP_ID_MAX USHRT_MAX
69
70struct mem_cgroup_id {
71 int id;
72 atomic_t ref;
73};
74
33398cf2
MH
75/*
76 * Per memcg event counter is incremented at every pagein/pageout. With THP,
77 * it will be incremented by the number of pages. This counter is used
78 * to trigger some periodic events. This is straightforward and better
79 * than using jiffies etc. to handle periodic memcg event.
80 */
81enum mem_cgroup_events_target {
82 MEM_CGROUP_TARGET_THRESH,
83 MEM_CGROUP_TARGET_SOFTLIMIT,
84 MEM_CGROUP_TARGET_NUMAINFO,
85 MEM_CGROUP_NTARGETS,
86};
87
33398cf2 88struct mem_cgroup_stat_cpu {
b2807f07 89 long count[MEMCG_NR_STAT];
e27be240 90 unsigned long events[NR_VM_EVENT_ITEMS];
33398cf2
MH
91 unsigned long nr_page_events;
92 unsigned long targets[MEM_CGROUP_NTARGETS];
93};
94
95struct mem_cgroup_reclaim_iter {
96 struct mem_cgroup *position;
97 /* scan generation, increased every round-trip */
98 unsigned int generation;
99};
100
00f3ca2c
JW
101struct lruvec_stat {
102 long count[NR_VM_NODE_STAT_ITEMS];
103};
104
33398cf2
MH
105/*
106 * per-node information in memory controller.
107 */
ef8f2327 108struct mem_cgroup_per_node {
33398cf2 109 struct lruvec lruvec;
a983b5eb
JW
110
111 struct lruvec_stat __percpu *lruvec_stat_cpu;
112 atomic_long_t lruvec_stat[NR_VM_NODE_STAT_ITEMS];
113
b4536f0c 114 unsigned long lru_zone_size[MAX_NR_ZONES][NR_LRU_LISTS];
33398cf2
MH
115
116 struct mem_cgroup_reclaim_iter iter[DEF_PRIORITY + 1];
117
118 struct rb_node tree_node; /* RB tree node */
119 unsigned long usage_in_excess;/* Set to the value by which */
120 /* the soft limit is exceeded*/
121 bool on_tree;
e3c1ac58
AR
122 bool congested; /* memcg has many dirty pages */
123 /* backed by a congested BDI */
124
33398cf2
MH
125 struct mem_cgroup *memcg; /* Back pointer, we cannot */
126 /* use container_of */
127};
128
33398cf2
MH
/* One registered threshold: the eventfd context paired with its value. */
struct mem_cgroup_threshold {
	struct eventfd_ctx *eventfd;
	unsigned long threshold;
};

/*
 * For threshold
 *
 * Variable-length array of thresholds. @entries is a C99 flexible array
 * member, so the structure must be allocated with room for @size trailing
 * elements, e.g. sizeof(*ary) + size * sizeof(struct mem_cgroup_threshold).
 */
struct mem_cgroup_threshold_ary {
	/* An array index points to threshold just below or equal to usage. */
	int current_threshold;
	/* Size of entries[] */
	unsigned int size;
	/* Array of thresholds */
	struct mem_cgroup_threshold entries[];
};
143
144struct mem_cgroup_thresholds {
145 /* Primary thresholds array */
146 struct mem_cgroup_threshold_ary *primary;
147 /*
148 * Spare threshold array.
149 * This is needed to make mem_cgroup_unregister_event() "never fail".
150 * It must be able to store at least primary->size - 1 entries.
151 */
152 struct mem_cgroup_threshold_ary *spare;
153};
154
567e9ab2
JW
155enum memcg_kmem_state {
156 KMEM_NONE,
157 KMEM_ALLOCATED,
158 KMEM_ONLINE,
159};
160
33398cf2
MH
161/*
162 * The memory controller data structure. The memory controller controls both
163 * page cache and RSS per cgroup. We would eventually like to provide
164 * statistics based on the statistics developed by Rik Van Riel for clock-pro,
165 * to help the administrator determine what knobs to tune.
166 */
167struct mem_cgroup {
168 struct cgroup_subsys_state css;
169
73f576c0
JW
170 /* Private memcg ID. Used to ID objects that outlive the cgroup */
171 struct mem_cgroup_id id;
172
33398cf2
MH
173 /* Accounted resources */
174 struct page_counter memory;
37e84351 175 struct page_counter swap;
0db15298
JW
176
177 /* Legacy consumer-oriented counters */
33398cf2
MH
178 struct page_counter memsw;
179 struct page_counter kmem;
0db15298 180 struct page_counter tcpmem;
33398cf2
MH
181
182 /* Normal memory consumption range */
183 unsigned long low;
184 unsigned long high;
185
f7e1cb6e
JW
186 /* Range enforcement for interrupt charges */
187 struct work_struct high_work;
188
33398cf2
MH
189 unsigned long soft_limit;
190
191 /* vmpressure notifications */
192 struct vmpressure vmpressure;
193
33398cf2
MH
194 /*
195 * Should the accounting and control be hierarchical, per subtree?
196 */
197 bool use_hierarchy;
198
199 /* protected by memcg_oom_lock */
200 bool oom_lock;
201 int under_oom;
202
203 int swappiness;
204 /* OOM-Killer disable */
205 int oom_kill_disable;
206
e27be240
JW
207 /* memory.events */
208 atomic_long_t memory_events[MEMCG_NR_MEMORY_EVENTS];
472912a2
TH
209 struct cgroup_file events_file;
210
33398cf2
MH
211 /* protect arrays of thresholds */
212 struct mutex thresholds_lock;
213
214 /* thresholds for memory usage. RCU-protected */
215 struct mem_cgroup_thresholds thresholds;
216
217 /* thresholds for mem+swap usage. RCU-protected */
218 struct mem_cgroup_thresholds memsw_thresholds;
219
220 /* For oom notifier event fd */
221 struct list_head oom_notify;
222
223 /*
224 * Should we move charges of a task when a task is moved into this
225 * mem_cgroup ? And what type of charges should we move ?
226 */
227 unsigned long move_charge_at_immigrate;
228 /*
229 * set > 0 if pages under this cgroup are moving to other cgroup.
230 */
231 atomic_t moving_account;
232 /* taken only while moving_account > 0 */
233 spinlock_t move_lock;
234 struct task_struct *move_lock_task;
235 unsigned long move_lock_flags;
a983b5eb 236
e27be240 237 /* memory.stat */
a983b5eb
JW
238 struct mem_cgroup_stat_cpu __percpu *stat_cpu;
239 atomic_long_t stat[MEMCG_NR_STAT];
e27be240 240 atomic_long_t events[NR_VM_EVENT_ITEMS];
33398cf2 241
d886f4e4
JW
242 unsigned long socket_pressure;
243
244 /* Legacy tcp memory accounting */
0db15298
JW
245 bool tcpmem_active;
246 int tcpmem_pressure;
d886f4e4 247
127424c8 248#ifndef CONFIG_SLOB
33398cf2
MH
249 /* Index in the kmem_cache->memcg_params.memcg_caches array */
250 int kmemcg_id;
567e9ab2 251 enum memcg_kmem_state kmem_state;
bc2791f8 252 struct list_head kmem_caches;
33398cf2
MH
253#endif
254
255 int last_scanned_node;
256#if MAX_NUMNODES > 1
257 nodemask_t scan_nodes;
258 atomic_t numainfo_events;
259 atomic_t numainfo_updating;
260#endif
261
262#ifdef CONFIG_CGROUP_WRITEBACK
263 struct list_head cgwb_list;
264 struct wb_domain cgwb_domain;
265#endif
266
267 /* List of events which userspace want to receive */
268 struct list_head event_list;
269 spinlock_t event_list_lock;
270
271 struct mem_cgroup_per_node *nodeinfo[0];
272 /* WARNING: nodeinfo must be the last member here */
273};
7d828602 274
a983b5eb
JW
275/*
276 * size of first charge trial. "32" comes from vmscan.c's magic value.
277 * TODO: maybe necessary to use big numbers in big irons.
278 */
279#define MEMCG_CHARGE_BATCH 32U
280
7d828602 281extern struct mem_cgroup *root_mem_cgroup;
56161634 282
23047a96
JW
283static inline bool mem_cgroup_disabled(void)
284{
285 return !cgroup_subsys_enabled(memory_cgrp_subsys);
286}
287
241994ed
JW
288bool mem_cgroup_low(struct mem_cgroup *root, struct mem_cgroup *memcg);
289
00501b53 290int mem_cgroup_try_charge(struct page *page, struct mm_struct *mm,
f627c2f5
KS
291 gfp_t gfp_mask, struct mem_cgroup **memcgp,
292 bool compound);
00501b53 293void mem_cgroup_commit_charge(struct page *page, struct mem_cgroup *memcg,
f627c2f5
KS
294 bool lrucare, bool compound);
295void mem_cgroup_cancel_charge(struct page *page, struct mem_cgroup *memcg,
296 bool compound);
0a31bc97 297void mem_cgroup_uncharge(struct page *page);
747db954 298void mem_cgroup_uncharge_list(struct list_head *page_list);
569b846d 299
6a93ca8f 300void mem_cgroup_migrate(struct page *oldpage, struct page *newpage);
569b846d 301
ef8f2327
MG
302static struct mem_cgroup_per_node *
303mem_cgroup_nodeinfo(struct mem_cgroup *memcg, int nid)
55779ec7 304{
ef8f2327 305 return memcg->nodeinfo[nid];
55779ec7
JW
306}
307
308/**
a9dd0a83
MG
309 * mem_cgroup_lruvec - get the lru list vector for a node or a memcg zone
310 * @node: node of the wanted lruvec
55779ec7
JW
311 * @memcg: memcg of the wanted lruvec
312 *
a9dd0a83
MG
313 * Returns the lru list vector holding pages for a given @node or a given
314 * @memcg and @zone. This can be the node lruvec, if the memory controller
55779ec7
JW
315 * is disabled.
316 */
a9dd0a83 317static inline struct lruvec *mem_cgroup_lruvec(struct pglist_data *pgdat,
ef8f2327 318 struct mem_cgroup *memcg)
55779ec7 319{
ef8f2327 320 struct mem_cgroup_per_node *mz;
55779ec7
JW
321 struct lruvec *lruvec;
322
323 if (mem_cgroup_disabled()) {
a9dd0a83 324 lruvec = node_lruvec(pgdat);
55779ec7
JW
325 goto out;
326 }
327
ef8f2327 328 mz = mem_cgroup_nodeinfo(memcg, pgdat->node_id);
55779ec7
JW
329 lruvec = &mz->lruvec;
330out:
331 /*
332 * Since a node can be onlined after the mem_cgroup was created,
599d0c95 333 * we have to be prepared to initialize lruvec->pgdat here;
55779ec7
JW
334 * and if offlined then reonlined, we need to reinitialize it.
335 */
ef8f2327
MG
336 if (unlikely(lruvec->pgdat != pgdat))
337 lruvec->pgdat = pgdat;
55779ec7
JW
338 return lruvec;
339}
340
599d0c95 341struct lruvec *mem_cgroup_page_lruvec(struct page *, struct pglist_data *);
c9b0ed51 342
2314b42d 343bool task_in_mem_cgroup(struct task_struct *task, struct mem_cgroup *memcg);
64219994 344struct mem_cgroup *mem_cgroup_from_task(struct task_struct *p);
e993d905 345
33398cf2
MH
346static inline
347struct mem_cgroup *mem_cgroup_from_css(struct cgroup_subsys_state *css){
348 return css ? container_of(css, struct mem_cgroup, css) : NULL;
349}
350
8e8ae645
JW
351#define mem_cgroup_from_counter(counter, member) \
352 container_of(counter, struct mem_cgroup, member)
353
33398cf2
MH
354struct mem_cgroup *mem_cgroup_iter(struct mem_cgroup *,
355 struct mem_cgroup *,
356 struct mem_cgroup_reclaim_cookie *);
357void mem_cgroup_iter_break(struct mem_cgroup *, struct mem_cgroup *);
7c5f64f8
VD
358int mem_cgroup_scan_tasks(struct mem_cgroup *,
359 int (*)(struct task_struct *, void *), void *);
33398cf2 360
23047a96
JW
361static inline unsigned short mem_cgroup_id(struct mem_cgroup *memcg)
362{
363 if (mem_cgroup_disabled())
364 return 0;
365
73f576c0 366 return memcg->id.id;
23047a96 367}
73f576c0 368struct mem_cgroup *mem_cgroup_from_id(unsigned short id);
23047a96 369
2262185c
RG
370static inline struct mem_cgroup *lruvec_memcg(struct lruvec *lruvec)
371{
372 struct mem_cgroup_per_node *mz;
373
374 if (mem_cgroup_disabled())
375 return NULL;
376
377 mz = container_of(lruvec, struct mem_cgroup_per_node, lruvec);
378 return mz->memcg;
379}
380
8e8ae645
JW
381/**
382 * parent_mem_cgroup - find the accounting parent of a memcg
383 * @memcg: memcg whose parent to find
384 *
385 * Returns the parent memcg, or NULL if this is the root or the memory
386 * controller is in legacy no-hierarchy mode.
387 */
388static inline struct mem_cgroup *parent_mem_cgroup(struct mem_cgroup *memcg)
389{
390 if (!memcg->memory.parent)
391 return NULL;
392 return mem_cgroup_from_counter(memcg->memory.parent, memory);
393}
394
33398cf2
MH
395static inline bool mem_cgroup_is_descendant(struct mem_cgroup *memcg,
396 struct mem_cgroup *root)
397{
398 if (root == memcg)
399 return true;
400 if (!root->use_hierarchy)
401 return false;
402 return cgroup_is_descendant(memcg->css.cgroup, root->css.cgroup);
403}
e1aab161 404
2314b42d
JW
405static inline bool mm_match_cgroup(struct mm_struct *mm,
406 struct mem_cgroup *memcg)
2e4d4091 407{
587af308 408 struct mem_cgroup *task_memcg;
413918bb 409 bool match = false;
c3ac9a8a 410
2e4d4091 411 rcu_read_lock();
587af308 412 task_memcg = mem_cgroup_from_task(rcu_dereference(mm->owner));
413918bb 413 if (task_memcg)
2314b42d 414 match = mem_cgroup_is_descendant(task_memcg, memcg);
2e4d4091 415 rcu_read_unlock();
c3ac9a8a 416 return match;
2e4d4091 417}
8a9f3ccd 418
64219994 419struct cgroup_subsys_state *mem_cgroup_css_from_page(struct page *page);
2fc04524 420ino_t page_cgroup_ino(struct page *page);
d324236b 421
eb01aaab
VD
422static inline bool mem_cgroup_online(struct mem_cgroup *memcg)
423{
424 if (mem_cgroup_disabled())
425 return true;
426 return !!(memcg->css.flags & CSS_ONLINE);
427}
428
58ae83db
KH
429/*
430 * For memory reclaim.
431 */
889976db 432int mem_cgroup_select_victim_node(struct mem_cgroup *memcg);
33398cf2
MH
433
434void mem_cgroup_update_lru_size(struct lruvec *lruvec, enum lru_list lru,
b4536f0c 435 int zid, int nr_pages);
33398cf2 436
0a6b76dd
VD
437unsigned long mem_cgroup_node_nr_lru_pages(struct mem_cgroup *memcg,
438 int nid, unsigned int lru_mask);
439
33398cf2
MH
440static inline
441unsigned long mem_cgroup_get_lru_size(struct lruvec *lruvec, enum lru_list lru)
442{
ef8f2327 443 struct mem_cgroup_per_node *mz;
b4536f0c
MH
444 unsigned long nr_pages = 0;
445 int zid;
33398cf2 446
ef8f2327 447 mz = container_of(lruvec, struct mem_cgroup_per_node, lruvec);
b4536f0c
MH
448 for (zid = 0; zid < MAX_NR_ZONES; zid++)
449 nr_pages += mz->lru_zone_size[zid][lru];
450 return nr_pages;
451}
452
453static inline
454unsigned long mem_cgroup_get_zone_lru_size(struct lruvec *lruvec,
455 enum lru_list lru, int zone_idx)
456{
457 struct mem_cgroup_per_node *mz;
458
459 mz = container_of(lruvec, struct mem_cgroup_per_node, lruvec);
460 return mz->lru_zone_size[zone_idx][lru];
33398cf2
MH
461}
462
b23afb93
TH
463void mem_cgroup_handle_over_high(void);
464
7c5f64f8
VD
465unsigned long mem_cgroup_get_limit(struct mem_cgroup *memcg);
466
64219994
MH
467void mem_cgroup_print_oom_info(struct mem_cgroup *memcg,
468 struct task_struct *p);
58ae83db 469
49426420 470static inline void mem_cgroup_oom_enable(void)
519e5247 471{
626ebc41
TH
472 WARN_ON(current->memcg_may_oom);
473 current->memcg_may_oom = 1;
519e5247
JW
474}
475
49426420 476static inline void mem_cgroup_oom_disable(void)
519e5247 477{
626ebc41
TH
478 WARN_ON(!current->memcg_may_oom);
479 current->memcg_may_oom = 0;
519e5247
JW
480}
481
3812c8c8
JW
482static inline bool task_in_memcg_oom(struct task_struct *p)
483{
626ebc41 484 return p->memcg_in_oom;
3812c8c8
JW
485}
486
49426420 487bool mem_cgroup_oom_synchronize(bool wait);
3812c8c8 488
c255a458 489#ifdef CONFIG_MEMCG_SWAP
c077719b
KH
490extern int do_swap_account;
491#endif
f8d66542 492
739f79fc
JW
493struct mem_cgroup *lock_page_memcg(struct page *page);
494void __unlock_page_memcg(struct mem_cgroup *memcg);
62cccb8c 495void unlock_page_memcg(struct page *page);
d7365e78 496
04fecbf5 497/* idx can be of type enum memcg_stat_item or node_stat_item */
ccda7f43 498static inline unsigned long memcg_page_state(struct mem_cgroup *memcg,
04fecbf5 499 int idx)
2a2e4885 500{
a983b5eb
JW
501 long x = atomic_long_read(&memcg->stat[idx]);
502#ifdef CONFIG_SMP
503 if (x < 0)
504 x = 0;
505#endif
506 return x;
2a2e4885
JW
507}
508
04fecbf5 509/* idx can be of type enum memcg_stat_item or node_stat_item */
00f3ca2c 510static inline void __mod_memcg_state(struct mem_cgroup *memcg,
04fecbf5 511 int idx, int val)
2a2e4885 512{
a983b5eb
JW
513 long x;
514
515 if (mem_cgroup_disabled())
516 return;
517
518 x = val + __this_cpu_read(memcg->stat_cpu->count[idx]);
519 if (unlikely(abs(x) > MEMCG_CHARGE_BATCH)) {
520 atomic_long_add(x, &memcg->stat[idx]);
521 x = 0;
522 }
523 __this_cpu_write(memcg->stat_cpu->count[idx], x);
2a2e4885
JW
524}
525
04fecbf5 526/* idx can be of type enum memcg_stat_item or node_stat_item */
00f3ca2c 527static inline void mod_memcg_state(struct mem_cgroup *memcg,
04fecbf5 528 int idx, int val)
2a2e4885 529{
c3cc3911
JW
530 unsigned long flags;
531
532 local_irq_save(flags);
a983b5eb 533 __mod_memcg_state(memcg, idx, val);
c3cc3911 534 local_irq_restore(flags);
2a2e4885
JW
535}
536
33398cf2 537/**
ccda7f43 538 * mod_memcg_page_state - update page state statistics
62cccb8c 539 * @page: the page
33398cf2
MH
540 * @idx: page state item to account
541 * @val: number of pages (positive or negative)
542 *
fdf1cdb9
JW
543 * The @page must be locked or the caller must use lock_page_memcg()
544 * to prevent double accounting when the page is concurrently being
545 * moved to another memcg:
81f8c3a4 546 *
fdf1cdb9 547 * lock_page(page) or lock_page_memcg(page)
81f8c3a4 548 * if (TestClearPageState(page))
ccda7f43 549 * mod_memcg_page_state(page, state, -1);
fdf1cdb9 550 * unlock_page(page) or unlock_page_memcg(page)
2a2e4885
JW
551 *
552 * Kernel pages are an exception to this, since they'll never move.
33398cf2 553 */
00f3ca2c 554static inline void __mod_memcg_page_state(struct page *page,
04fecbf5 555 int idx, int val)
00f3ca2c
JW
556{
557 if (page->mem_cgroup)
558 __mod_memcg_state(page->mem_cgroup, idx, val);
559}
560
ccda7f43 561static inline void mod_memcg_page_state(struct page *page,
04fecbf5 562 int idx, int val)
33398cf2 563{
62cccb8c 564 if (page->mem_cgroup)
ccda7f43 565 mod_memcg_state(page->mem_cgroup, idx, val);
33398cf2
MH
566}
567
00f3ca2c
JW
568static inline unsigned long lruvec_page_state(struct lruvec *lruvec,
569 enum node_stat_item idx)
2a7106f2 570{
00f3ca2c 571 struct mem_cgroup_per_node *pn;
a983b5eb 572 long x;
00f3ca2c
JW
573
574 if (mem_cgroup_disabled())
575 return node_page_state(lruvec_pgdat(lruvec), idx);
576
577 pn = container_of(lruvec, struct mem_cgroup_per_node, lruvec);
a983b5eb
JW
578 x = atomic_long_read(&pn->lruvec_stat[idx]);
579#ifdef CONFIG_SMP
580 if (x < 0)
581 x = 0;
582#endif
583 return x;
2a7106f2
GT
584}
585
00f3ca2c
JW
586static inline void __mod_lruvec_state(struct lruvec *lruvec,
587 enum node_stat_item idx, int val)
2a7106f2 588{
00f3ca2c 589 struct mem_cgroup_per_node *pn;
a983b5eb 590 long x;
00f3ca2c 591
28454265 592 /* Update node */
00f3ca2c 593 __mod_node_page_state(lruvec_pgdat(lruvec), idx, val);
28454265 594
00f3ca2c
JW
595 if (mem_cgroup_disabled())
596 return;
28454265 597
00f3ca2c 598 pn = container_of(lruvec, struct mem_cgroup_per_node, lruvec);
28454265
JW
599
600 /* Update memcg */
00f3ca2c 601 __mod_memcg_state(pn->memcg, idx, val);
28454265
JW
602
603 /* Update lruvec */
a983b5eb
JW
604 x = val + __this_cpu_read(pn->lruvec_stat_cpu->count[idx]);
605 if (unlikely(abs(x) > MEMCG_CHARGE_BATCH)) {
606 atomic_long_add(x, &pn->lruvec_stat[idx]);
607 x = 0;
608 }
609 __this_cpu_write(pn->lruvec_stat_cpu->count[idx], x);
00f3ca2c
JW
610}
611
612static inline void mod_lruvec_state(struct lruvec *lruvec,
613 enum node_stat_item idx, int val)
614{
c3cc3911
JW
615 unsigned long flags;
616
617 local_irq_save(flags);
28454265 618 __mod_lruvec_state(lruvec, idx, val);
c3cc3911 619 local_irq_restore(flags);
00f3ca2c
JW
620}
621
622static inline void __mod_lruvec_page_state(struct page *page,
623 enum node_stat_item idx, int val)
624{
28454265
JW
625 pg_data_t *pgdat = page_pgdat(page);
626 struct lruvec *lruvec;
00f3ca2c 627
28454265
JW
628 /* Untracked pages have no memcg, no lruvec. Update only the node */
629 if (!page->mem_cgroup) {
630 __mod_node_page_state(pgdat, idx, val);
00f3ca2c 631 return;
28454265
JW
632 }
633
634 lruvec = mem_cgroup_lruvec(pgdat, page->mem_cgroup);
635 __mod_lruvec_state(lruvec, idx, val);
00f3ca2c
JW
636}
637
638static inline void mod_lruvec_page_state(struct page *page,
639 enum node_stat_item idx, int val)
640{
c3cc3911
JW
641 unsigned long flags;
642
643 local_irq_save(flags);
28454265 644 __mod_lruvec_page_state(page, idx, val);
c3cc3911 645 local_irq_restore(flags);
2a7106f2
GT
646}
647
ef8f2327 648unsigned long mem_cgroup_soft_limit_reclaim(pg_data_t *pgdat, int order,
0608f43d
AM
649 gfp_t gfp_mask,
650 unsigned long *total_scanned);
a63d83f4 651
c9019e9b 652static inline void __count_memcg_events(struct mem_cgroup *memcg,
e27be240
JW
653 enum vm_event_item idx,
654 unsigned long count)
c9019e9b 655{
a983b5eb
JW
656 unsigned long x;
657
658 if (mem_cgroup_disabled())
659 return;
660
661 x = count + __this_cpu_read(memcg->stat_cpu->events[idx]);
662 if (unlikely(x > MEMCG_CHARGE_BATCH)) {
663 atomic_long_add(x, &memcg->events[idx]);
664 x = 0;
665 }
666 __this_cpu_write(memcg->stat_cpu->events[idx], x);
c9019e9b
JW
667}
668
2262185c 669static inline void count_memcg_events(struct mem_cgroup *memcg,
e27be240
JW
670 enum vm_event_item idx,
671 unsigned long count)
2262185c 672{
c3cc3911
JW
673 unsigned long flags;
674
675 local_irq_save(flags);
a983b5eb 676 __count_memcg_events(memcg, idx, count);
c3cc3911 677 local_irq_restore(flags);
2262185c
RG
678}
679
680static inline void count_memcg_page_event(struct page *page,
e27be240 681 enum vm_event_item idx)
2262185c
RG
682{
683 if (page->mem_cgroup)
684 count_memcg_events(page->mem_cgroup, idx, 1);
685}
686
687static inline void count_memcg_event_mm(struct mm_struct *mm,
688 enum vm_event_item idx)
68ae564b 689{
33398cf2
MH
690 struct mem_cgroup *memcg;
691
68ae564b
DR
692 if (mem_cgroup_disabled())
693 return;
33398cf2
MH
694
695 rcu_read_lock();
696 memcg = mem_cgroup_from_task(rcu_dereference(mm->owner));
8e675f7a 697 if (likely(memcg)) {
c9019e9b 698 count_memcg_events(memcg, idx, 1);
8e675f7a
KK
699 if (idx == OOM_KILL)
700 cgroup_file_notify(&memcg->events_file);
701 }
33398cf2 702 rcu_read_unlock();
68ae564b 703}
c9019e9b 704
e27be240
JW
705static inline void memcg_memory_event(struct mem_cgroup *memcg,
706 enum memcg_memory_event event)
c9019e9b 707{
e27be240 708 atomic_long_inc(&memcg->memory_events[event]);
c9019e9b
JW
709 cgroup_file_notify(&memcg->events_file);
710}
711
ca3e0214 712#ifdef CONFIG_TRANSPARENT_HUGEPAGE
e94c8a9c 713void mem_cgroup_split_huge_fixup(struct page *head);
ca3e0214
KH
714#endif
715
c255a458 716#else /* CONFIG_MEMCG */
23047a96
JW
717
718#define MEM_CGROUP_ID_SHIFT 0
719#define MEM_CGROUP_ID_MAX 0
720
7a81b88c
KH
721struct mem_cgroup;
722
23047a96
JW
723static inline bool mem_cgroup_disabled(void)
724{
725 return true;
726}
727
e27be240
JW
728static inline void memcg_memory_event(struct mem_cgroup *memcg,
729 enum memcg_memory_event event)
241994ed
JW
730{
731}
732
733static inline bool mem_cgroup_low(struct mem_cgroup *root,
734 struct mem_cgroup *memcg)
735{
736 return false;
737}
738
00501b53
JW
739static inline int mem_cgroup_try_charge(struct page *page, struct mm_struct *mm,
740 gfp_t gfp_mask,
f627c2f5
KS
741 struct mem_cgroup **memcgp,
742 bool compound)
7a81b88c 743{
00501b53 744 *memcgp = NULL;
7a81b88c
KH
745 return 0;
746}
747
00501b53
JW
748static inline void mem_cgroup_commit_charge(struct page *page,
749 struct mem_cgroup *memcg,
f627c2f5 750 bool lrucare, bool compound)
7a81b88c
KH
751{
752}
753
00501b53 754static inline void mem_cgroup_cancel_charge(struct page *page,
f627c2f5
KS
755 struct mem_cgroup *memcg,
756 bool compound)
7a81b88c
KH
757{
758}
759
0a31bc97 760static inline void mem_cgroup_uncharge(struct page *page)
569b846d
KH
761{
762}
763
747db954 764static inline void mem_cgroup_uncharge_list(struct list_head *page_list)
8a9f3ccd
BS
765{
766}
767
6a93ca8f 768static inline void mem_cgroup_migrate(struct page *old, struct page *new)
69029cd5
KH
769{
770}
771
a9dd0a83 772static inline struct lruvec *mem_cgroup_lruvec(struct pglist_data *pgdat,
ef8f2327 773 struct mem_cgroup *memcg)
08e552c6 774{
a9dd0a83 775 return node_lruvec(pgdat);
08e552c6
KH
776}
777
fa9add64 778static inline struct lruvec *mem_cgroup_page_lruvec(struct page *page,
599d0c95 779 struct pglist_data *pgdat)
66e1707b 780{
599d0c95 781 return &pgdat->lruvec;
66e1707b
BS
782}
783
587af308 784static inline bool mm_match_cgroup(struct mm_struct *mm,
c0ff4b85 785 struct mem_cgroup *memcg)
bed7161a 786{
587af308 787 return true;
bed7161a
BS
788}
789
ffbdccf5
DR
790static inline bool task_in_mem_cgroup(struct task_struct *task,
791 const struct mem_cgroup *memcg)
4c4a2214 792{
ffbdccf5 793 return true;
4c4a2214
DR
794}
795
5660048c
JW
796static inline struct mem_cgroup *
797mem_cgroup_iter(struct mem_cgroup *root,
798 struct mem_cgroup *prev,
799 struct mem_cgroup_reclaim_cookie *reclaim)
800{
801 return NULL;
802}
803
804static inline void mem_cgroup_iter_break(struct mem_cgroup *root,
805 struct mem_cgroup *prev)
806{
807}
808
7c5f64f8
VD
809static inline int mem_cgroup_scan_tasks(struct mem_cgroup *memcg,
810 int (*fn)(struct task_struct *, void *), void *arg)
811{
812 return 0;
813}
814
23047a96 815static inline unsigned short mem_cgroup_id(struct mem_cgroup *memcg)
f8d66542 816{
23047a96
JW
817 return 0;
818}
819
820static inline struct mem_cgroup *mem_cgroup_from_id(unsigned short id)
821{
822 WARN_ON_ONCE(id);
823 /* XXX: This should always return root_mem_cgroup */
824 return NULL;
f8d66542 825}
a636b327 826
2262185c
RG
827static inline struct mem_cgroup *lruvec_memcg(struct lruvec *lruvec)
828{
829 return NULL;
830}
831
eb01aaab 832static inline bool mem_cgroup_online(struct mem_cgroup *memcg)
14797e23 833{
13308ca9 834 return true;
14797e23
KM
835}
836
a3d8e054 837static inline unsigned long
4d7dcca2 838mem_cgroup_get_lru_size(struct lruvec *lruvec, enum lru_list lru)
a3d8e054
KM
839{
840 return 0;
841}
b4536f0c
MH
842static inline
843unsigned long mem_cgroup_get_zone_lru_size(struct lruvec *lruvec,
844 enum lru_list lru, int zone_idx)
845{
846 return 0;
847}
a3d8e054 848
0a6b76dd
VD
849static inline unsigned long
850mem_cgroup_node_nr_lru_pages(struct mem_cgroup *memcg,
851 int nid, unsigned int lru_mask)
852{
853 return 0;
854}
855
7c5f64f8
VD
856static inline unsigned long mem_cgroup_get_limit(struct mem_cgroup *memcg)
857{
858 return 0;
859}
860
e222432b
BS
861static inline void
862mem_cgroup_print_oom_info(struct mem_cgroup *memcg, struct task_struct *p)
863{
864}
865
739f79fc
JW
866static inline struct mem_cgroup *lock_page_memcg(struct page *page)
867{
868 return NULL;
869}
870
871static inline void __unlock_page_memcg(struct mem_cgroup *memcg)
89c06bd5
KH
872{
873}
874
62cccb8c 875static inline void unlock_page_memcg(struct page *page)
89c06bd5
KH
876{
877}
878
b23afb93
TH
879static inline void mem_cgroup_handle_over_high(void)
880{
881}
882
49426420 883static inline void mem_cgroup_oom_enable(void)
519e5247
JW
884{
885}
886
49426420 887static inline void mem_cgroup_oom_disable(void)
519e5247
JW
888{
889}
890
3812c8c8
JW
891static inline bool task_in_memcg_oom(struct task_struct *p)
892{
893 return false;
894}
895
49426420 896static inline bool mem_cgroup_oom_synchronize(bool wait)
3812c8c8
JW
897{
898 return false;
899}
900
ccda7f43 901static inline unsigned long memcg_page_state(struct mem_cgroup *memcg,
04fecbf5 902 int idx)
2a2e4885
JW
903{
904 return 0;
905}
906
00f3ca2c 907static inline void __mod_memcg_state(struct mem_cgroup *memcg,
04fecbf5 908 int idx,
00f3ca2c 909 int nr)
2a2e4885
JW
910{
911}
912
00f3ca2c 913static inline void mod_memcg_state(struct mem_cgroup *memcg,
04fecbf5 914 int idx,
00f3ca2c 915 int nr)
2a2e4885
JW
916{
917}
918
00f3ca2c 919static inline void __mod_memcg_page_state(struct page *page,
04fecbf5 920 int idx,
00f3ca2c 921 int nr)
2a2e4885
JW
922{
923}
924
ccda7f43 925static inline void mod_memcg_page_state(struct page *page,
04fecbf5 926 int idx,
ccda7f43 927 int nr)
553af430
JW
928{
929}
930
00f3ca2c
JW
931static inline unsigned long lruvec_page_state(struct lruvec *lruvec,
932 enum node_stat_item idx)
2a7106f2 933{
00f3ca2c 934 return node_page_state(lruvec_pgdat(lruvec), idx);
2a7106f2
GT
935}
936
00f3ca2c
JW
937static inline void __mod_lruvec_state(struct lruvec *lruvec,
938 enum node_stat_item idx, int val)
d69b042f 939{
00f3ca2c
JW
940 __mod_node_page_state(lruvec_pgdat(lruvec), idx, val);
941}
942
943static inline void mod_lruvec_state(struct lruvec *lruvec,
944 enum node_stat_item idx, int val)
945{
946 mod_node_page_state(lruvec_pgdat(lruvec), idx, val);
947}
948
949static inline void __mod_lruvec_page_state(struct page *page,
950 enum node_stat_item idx, int val)
951{
952 __mod_node_page_state(page_pgdat(page), idx, val);
953}
954
955static inline void mod_lruvec_page_state(struct page *page,
956 enum node_stat_item idx, int val)
957{
958 mod_node_page_state(page_pgdat(page), idx, val);
d69b042f
BS
959}
960
4e416953 961static inline
ef8f2327 962unsigned long mem_cgroup_soft_limit_reclaim(pg_data_t *pgdat, int order,
0608f43d
AM
963 gfp_t gfp_mask,
964 unsigned long *total_scanned)
4e416953 965{
0608f43d 966 return 0;
4e416953
BS
967}
968
e94c8a9c 969static inline void mem_cgroup_split_huge_fixup(struct page *head)
ca3e0214
KH
970{
971}
972
2262185c
RG
973static inline void count_memcg_events(struct mem_cgroup *memcg,
974 enum vm_event_item idx,
975 unsigned long count)
976{
977}
978
979static inline void count_memcg_page_event(struct page *page,
04fecbf5 980 int idx)
2262185c
RG
981{
982}
983
456f998e 984static inline
2262185c 985void count_memcg_event_mm(struct mm_struct *mm, enum vm_event_item idx)
456f998e
YH
986{
987}
c255a458 988#endif /* CONFIG_MEMCG */
78fb7466 989
04fecbf5 990/* idx can be of type enum memcg_stat_item or node_stat_item */
00f3ca2c 991static inline void __inc_memcg_state(struct mem_cgroup *memcg,
04fecbf5 992 int idx)
00f3ca2c
JW
993{
994 __mod_memcg_state(memcg, idx, 1);
995}
996
04fecbf5 997/* idx can be of type enum memcg_stat_item or node_stat_item */
00f3ca2c 998static inline void __dec_memcg_state(struct mem_cgroup *memcg,
04fecbf5 999 int idx)
00f3ca2c
JW
1000{
1001 __mod_memcg_state(memcg, idx, -1);
1002}
1003
04fecbf5 1004/* idx can be of type enum memcg_stat_item or node_stat_item */
00f3ca2c 1005static inline void __inc_memcg_page_state(struct page *page,
04fecbf5 1006 int idx)
00f3ca2c
JW
1007{
1008 __mod_memcg_page_state(page, idx, 1);
1009}
1010
04fecbf5 1011/* idx can be of type enum memcg_stat_item or node_stat_item */
00f3ca2c 1012static inline void __dec_memcg_page_state(struct page *page,
04fecbf5 1013 int idx)
00f3ca2c
JW
1014{
1015 __mod_memcg_page_state(page, idx, -1);
1016}
1017
1018static inline void __inc_lruvec_state(struct lruvec *lruvec,
1019 enum node_stat_item idx)
1020{
1021 __mod_lruvec_state(lruvec, idx, 1);
1022}
1023
1024static inline void __dec_lruvec_state(struct lruvec *lruvec,
1025 enum node_stat_item idx)
1026{
1027 __mod_lruvec_state(lruvec, idx, -1);
1028}
1029
1030static inline void __inc_lruvec_page_state(struct page *page,
1031 enum node_stat_item idx)
1032{
1033 __mod_lruvec_page_state(page, idx, 1);
1034}
1035
1036static inline void __dec_lruvec_page_state(struct page *page,
1037 enum node_stat_item idx)
1038{
1039 __mod_lruvec_page_state(page, idx, -1);
1040}
1041
/*
 * Apply a delta of +1 to item @idx of @memcg through mod_memcg_state().
 *
 * idx can be of type enum memcg_stat_item or node_stat_item
 */
static inline void inc_memcg_state(struct mem_cgroup *memcg,
				   int idx)
{
	mod_memcg_state(memcg, idx, 1);
}
1048
/*
 * Apply a delta of -1 to item @idx of @memcg through mod_memcg_state().
 *
 * idx can be of type enum memcg_stat_item or node_stat_item
 */
static inline void dec_memcg_state(struct mem_cgroup *memcg,
				   int idx)
{
	mod_memcg_state(memcg, idx, -1);
}
1055
/*
 * Apply a delta of +1 to item @idx for @page through mod_memcg_page_state().
 *
 * idx can be of type enum memcg_stat_item or node_stat_item
 */
static inline void inc_memcg_page_state(struct page *page,
					int idx)
{
	mod_memcg_page_state(page, idx, 1);
}
1062
/*
 * Apply a delta of -1 to item @idx for @page through mod_memcg_page_state().
 *
 * idx can be of type enum memcg_stat_item or node_stat_item
 */
static inline void dec_memcg_page_state(struct page *page,
					int idx)
{
	mod_memcg_page_state(page, idx, -1);
}
1069
1070static inline void inc_lruvec_state(struct lruvec *lruvec,
1071 enum node_stat_item idx)
1072{
1073 mod_lruvec_state(lruvec, idx, 1);
1074}
1075
1076static inline void dec_lruvec_state(struct lruvec *lruvec,
1077 enum node_stat_item idx)
1078{
1079 mod_lruvec_state(lruvec, idx, -1);
1080}
1081
1082static inline void inc_lruvec_page_state(struct page *page,
1083 enum node_stat_item idx)
1084{
1085 mod_lruvec_page_state(page, idx, 1);
1086}
1087
1088static inline void dec_lruvec_page_state(struct page *page,
1089 enum node_stat_item idx)
1090{
1091 mod_lruvec_page_state(page, idx, -1);
1092}
1093
52ebea74 1094#ifdef CONFIG_CGROUP_WRITEBACK
841710aa 1095
/*
 * Writeback-related memcg interfaces; only declared here, the definitions
 * live outside this header.
 */
struct list_head *mem_cgroup_cgwb_list(struct mem_cgroup *memcg);
struct wb_domain *mem_cgroup_wb_domain(struct bdi_writeback *wb);
void mem_cgroup_wb_stats(struct bdi_writeback *wb, unsigned long *pfilepages,
			 unsigned long *pheadroom, unsigned long *pdirty,
			 unsigned long *pwriteback);
841710aa
TH
1101
1102#else /* CONFIG_CGROUP_WRITEBACK */
1103
/* Stub: ignores @wb and always returns NULL. */
static inline struct wb_domain *mem_cgroup_wb_domain(struct bdi_writeback *wb)
{
	return NULL;
}
1108
/*
 * Empty stub: none of the output pointers (@pfilepages, @pheadroom, @pdirty,
 * @pwriteback) is written, so whatever the caller stored there beforehand is
 * left as it was.
 */
static inline void mem_cgroup_wb_stats(struct bdi_writeback *wb,
				       unsigned long *pfilepages,
				       unsigned long *pheadroom,
				       unsigned long *pdirty,
				       unsigned long *pwriteback)
{
}
1116
841710aa 1117#endif /* CONFIG_CGROUP_WRITEBACK */
52ebea74 1118
/* Forward declaration; only pointers to struct sock are used below. */
struct sock;
/* Socket-memory charge/uncharge entry points, defined outside this header. */
bool mem_cgroup_charge_skmem(struct mem_cgroup *memcg, unsigned int nr_pages);
void mem_cgroup_uncharge_skmem(struct mem_cgroup *memcg, unsigned int nr_pages);
d886f4e4 1122#ifdef CONFIG_MEMCG
ef12947c
JW
/* Static key tested by mem_cgroup_sockets_enabled; defined elsewhere. */
extern struct static_key_false memcg_sockets_enabled_key;
/* Evaluates the key through static_branch_unlikely(). */
#define mem_cgroup_sockets_enabled static_branch_unlikely(&memcg_sockets_enabled_key)
void mem_cgroup_sk_alloc(struct sock *sk);
void mem_cgroup_sk_free(struct sock *sk);
baac50bb 1127static inline bool mem_cgroup_under_socket_pressure(struct mem_cgroup *memcg)
e805605c 1128{
0db15298 1129 if (!cgroup_subsys_on_dfl(memory_cgrp_subsys) && memcg->tcpmem_pressure)
8e8ae645 1130 return true;
8e8ae645
JW
1131 do {
1132 if (time_before(jiffies, memcg->socket_pressure))
1133 return true;
1134 } while ((memcg = parent_mem_cgroup(memcg)));
1135 return false;
e805605c
JW
1136}
1137#else
/* Stub: the socket accounting check is a compile-time constant 0 here. */
#define mem_cgroup_sockets_enabled 0
/* Empty stubs: @sk is accepted and ignored. */
static inline void mem_cgroup_sk_alloc(struct sock *sk) { }
static inline void mem_cgroup_sk_free(struct sock *sk) { }
/* Stub: ignores @memcg and always reports false. */
static inline bool mem_cgroup_under_socket_pressure(struct mem_cgroup *memcg)
{
	return false;
}
1145#endif
7ae1e1d0 1146
45264778
VD
1147struct kmem_cache *memcg_kmem_get_cache(struct kmem_cache *cachep);
1148void memcg_kmem_put_cache(struct kmem_cache *cachep);
1149int memcg_kmem_charge_memcg(struct page *page, gfp_t gfp, int order,
1150 struct mem_cgroup *memcg);
1151int memcg_kmem_charge(struct page *page, gfp_t gfp, int order);
1152void memcg_kmem_uncharge(struct page *page, int order);
1153
127424c8 1154#if defined(CONFIG_MEMCG) && !defined(CONFIG_SLOB)
/* Static key tested by memcg_kmem_enabled(); defined elsewhere. */
extern struct static_key_false memcg_kmem_enabled_key;
extern struct workqueue_struct *memcg_kmem_cache_wq;

/* Exclusive upper bound used by for_each_memcg_cache_index(). */
extern int memcg_nr_cache_ids;
void memcg_get_cache_ids(void);
void memcg_put_cache_ids(void);
ebe945c2
GC
1161
/*
 * Helper macro to loop through all memcg-specific caches. Callers must still
 * check if the cache is valid (it is either valid or NULL).
 * The slab_mutex must be held when looping through those caches.
 *
 * @_idx is assigned 0 and then incremented while it is below
 * memcg_nr_cache_ids; it must be a modifiable lvalue.
 */
#define for_each_memcg_cache_index(_idx)	\
	for ((_idx) = 0; (_idx) < memcg_nr_cache_ids; (_idx)++)
749c5415 1169
7ae1e1d0
GC
1170static inline bool memcg_kmem_enabled(void)
1171{
ef12947c 1172 return static_branch_unlikely(&memcg_kmem_enabled_key);
7ae1e1d0
GC
1173}
1174
33398cf2 1175/*
9f706d68 1176 * helper for accessing a memcg's index. It will be used as an index in the
33398cf2
MH
1177 * child cache array in kmem_cache, and also to derive its name. This function
1178 * will return -1 when this is not a kmem-limited memcg.
1179 */
1180static inline int memcg_cache_id(struct mem_cgroup *memcg)
1181{
1182 return memcg ? memcg->kmemcg_id : -1;
1183}
5722d094 1184
7ae1e1d0 1185#else
749c5415
GC
/*
 * Stub: the loop condition is constant false, so the statement that follows
 * the macro never executes and @_idx is neither read nor written.
 */
#define for_each_memcg_cache_index(_idx)	\
	for (; 0; )
1188
b9ce5ef4
GC
/* Stub: always reports false. */
static inline bool memcg_kmem_enabled(void)
{
	return false;
}
1193
2633d7a0
GC
/* Stub: ignores @memcg and always returns -1. */
static inline int memcg_cache_id(struct mem_cgroup *memcg)
{
	return -1;
}
1198
05257a1a
VD
/* Empty stub: takes no arguments and does nothing. */
static inline void memcg_get_cache_ids(void)
{
}
1202
/* Empty stub: takes no arguments and does nothing. */
static inline void memcg_put_cache_ids(void)
{
}
1206
127424c8
JW
1207#endif /* CONFIG_MEMCG && !CONFIG_SLOB */
1208
8cdea7c0 1209#endif /* _LINUX_MEMCONTROL_H */