/* memcontrol.h - Memory Controller
 *
 * Copyright IBM Corporation, 2007
 * Author Balbir Singh <balbir@linux.vnet.ibm.com>
 *
 * Copyright 2007 OpenVZ SWsoft Inc
 * Author: Pavel Emelianov <xemul@openvz.org>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 */

#ifndef _LINUX_MEMCONTROL_H
#define _LINUX_MEMCONTROL_H
#include <linux/cgroup.h>
#include <linux/vm_event_item.h>
#include <linux/hardirq.h>
#include <linux/jump_label.h>

struct mem_cgroup;
struct page_cgroup;
struct page;
struct mm_struct;
struct kmem_cache;

/*
 * The corresponding mem_cgroup_stat_names is defined in mm/memcontrol.c,
 * and these two lists should be kept in accord with each other.
 */
enum mem_cgroup_stat_index {
        /*
         * For MEM_CONTAINER_TYPE_ALL, usage = pagecache + rss.
         */
        MEM_CGROUP_STAT_CACHE,          /* # of pages charged as cache */
        MEM_CGROUP_STAT_RSS,            /* # of pages charged as anon rss */
        MEM_CGROUP_STAT_RSS_HUGE,       /* # of pages charged as anon huge */
        MEM_CGROUP_STAT_FILE_MAPPED,    /* # of pages charged as file rss */
        MEM_CGROUP_STAT_WRITEBACK,      /* # of pages under writeback */
        MEM_CGROUP_STAT_SWAP,           /* # of pages, swapped out */
        MEM_CGROUP_STAT_NSTATS,
};

struct mem_cgroup_reclaim_cookie {
        struct zone *zone;
        int priority;
        unsigned int generation;
};

#ifdef CONFIG_MEMCG
int mem_cgroup_try_charge(struct page *page, struct mm_struct *mm,
                          gfp_t gfp_mask, struct mem_cgroup **memcgp);
void mem_cgroup_commit_charge(struct page *page, struct mem_cgroup *memcg,
                              bool lrucare);
void mem_cgroup_cancel_charge(struct page *page, struct mem_cgroup *memcg);
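
/*
 * Example (illustrative sketch, not part of this header): charging is
 * a two-step protocol so the charge can be backed out if the page
 * never becomes visible.  A fault handler would use it roughly like
 * this, where map_the_page() is a hypothetical stand-in for the
 * caller's real work:
 *
 *      struct mem_cgroup *memcg;
 *
 *      if (mem_cgroup_try_charge(page, mm, GFP_KERNEL, &memcg))
 *              goto fail;
 *      if (map_the_page(page, vma)) {
 *              mem_cgroup_cancel_charge(page, memcg);
 *              goto fail;
 *      }
 *      mem_cgroup_commit_charge(page, memcg, false);  // not on LRU yet
 */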

void mem_cgroup_uncharge(struct page *page);

/* Batched uncharging */
void mem_cgroup_uncharge_start(void);
void mem_cgroup_uncharge_end(void);
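
/*
 * Example (illustrative sketch): callers that free many pages at once
 * can bracket the loop with the start/end pair so that the individual
 * uncharges are coalesced instead of hitting the counters one page at
 * a time:
 *
 *      mem_cgroup_uncharge_start();
 *      for (i = 0; i < nr; i++)
 *              put_page(pages[i]);     // uncharged on the final put
 *      mem_cgroup_uncharge_end();
 */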

void mem_cgroup_migrate(struct page *oldpage, struct page *newpage,
                        bool lrucare);

struct lruvec *mem_cgroup_zone_lruvec(struct zone *, struct mem_cgroup *);
struct lruvec *mem_cgroup_page_lruvec(struct page *, struct zone *);
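
/*
 * Example (illustrative sketch): LRU maintenance looks up the lruvec a
 * page belongs to and operates on it under the zone's lru_lock:
 *
 *      struct zone *zone = page_zone(page);
 *      struct lruvec *lruvec;
 *
 *      spin_lock_irq(&zone->lru_lock);
 *      lruvec = mem_cgroup_page_lruvec(page, zone);
 *      mem_cgroup_update_lru_size(lruvec, page_lru(page),
 *                                 hpage_nr_pages(page));
 *      spin_unlock_irq(&zone->lru_lock);
 */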

bool __mem_cgroup_same_or_subtree(const struct mem_cgroup *root_memcg,
                                  struct mem_cgroup *memcg);
bool task_in_mem_cgroup(struct task_struct *task,
                        const struct mem_cgroup *memcg);

extern struct mem_cgroup *try_get_mem_cgroup_from_page(struct page *page);
extern struct mem_cgroup *mem_cgroup_from_task(struct task_struct *p);

extern struct mem_cgroup *parent_mem_cgroup(struct mem_cgroup *memcg);
extern struct mem_cgroup *mem_cgroup_from_css(struct cgroup_subsys_state *css);

static inline
bool mm_match_cgroup(const struct mm_struct *mm, const struct mem_cgroup *memcg)
{
        struct mem_cgroup *task_memcg;
        bool match;

        rcu_read_lock();
        task_memcg = mem_cgroup_from_task(rcu_dereference(mm->owner));
        match = __mem_cgroup_same_or_subtree(memcg, task_memcg);
        rcu_read_unlock();
        return match;
}

extern struct cgroup_subsys_state *mem_cgroup_css(struct mem_cgroup *memcg);

struct mem_cgroup *mem_cgroup_iter(struct mem_cgroup *,
                                   struct mem_cgroup *,
                                   struct mem_cgroup_reclaim_cookie *);
void mem_cgroup_iter_break(struct mem_cgroup *, struct mem_cgroup *);
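
/*
 * Example (illustrative sketch): mem_cgroup_iter() visits every memcg
 * in the hierarchy below @root.  should_stop() is a hypothetical
 * predicate; note that leaving the loop early without calling
 * mem_cgroup_iter_break() would leak the reference the iterator holds
 * on the current position:
 *
 *      struct mem_cgroup *memcg = mem_cgroup_iter(root, NULL, NULL);
 *
 *      while (memcg) {
 *              if (should_stop(memcg)) {
 *                      mem_cgroup_iter_break(root, memcg);
 *                      break;
 *              }
 *              memcg = mem_cgroup_iter(root, memcg, NULL);
 *      }
 */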

/*
 * For memory reclaim.
 */
int mem_cgroup_inactive_anon_is_low(struct lruvec *lruvec);
int mem_cgroup_select_victim_node(struct mem_cgroup *memcg);
unsigned long mem_cgroup_get_lru_size(struct lruvec *lruvec, enum lru_list);
void mem_cgroup_update_lru_size(struct lruvec *, enum lru_list, int);
extern void mem_cgroup_print_oom_info(struct mem_cgroup *memcg,
                                      struct task_struct *p);

static inline void mem_cgroup_oom_enable(void)
{
        WARN_ON(current->memcg_oom.may_oom);
        current->memcg_oom.may_oom = 1;
}

static inline void mem_cgroup_oom_disable(void)
{
        WARN_ON(!current->memcg_oom.may_oom);
        current->memcg_oom.may_oom = 0;
}

static inline bool task_in_memcg_oom(struct task_struct *p)
{
        return p->memcg_oom.memcg;
}

bool mem_cgroup_oom_synchronize(bool wait);
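
/*
 * Example (illustrative sketch): the page fault path arms memcg OOM
 * handling around the fault and only deals with a recorded OOM
 * situation once the fault stack, and the locks it holds, have been
 * unwound; do_the_fault() is a hypothetical stand-in:
 *
 *      mem_cgroup_oom_enable();
 *      ret = do_the_fault(...);
 *      mem_cgroup_oom_disable();
 *
 *      if (task_in_memcg_oom(current) && !(ret & VM_FAULT_OOM))
 *              mem_cgroup_oom_synchronize(true);
 */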

#ifdef CONFIG_MEMCG_SWAP
extern int do_swap_account;
#endif

static inline bool mem_cgroup_disabled(void)
{
        if (memory_cgrp_subsys.disabled)
                return true;
        return false;
}

void __mem_cgroup_begin_update_page_stat(struct page *page, bool *locked,
                                         unsigned long *flags);

extern atomic_t memcg_moving;

static inline void mem_cgroup_begin_update_page_stat(struct page *page,
                                        bool *locked, unsigned long *flags)
{
        if (mem_cgroup_disabled())
                return;
        rcu_read_lock();
        *locked = false;
        if (atomic_read(&memcg_moving))
                __mem_cgroup_begin_update_page_stat(page, locked, flags);
}

void __mem_cgroup_end_update_page_stat(struct page *page,
                                       unsigned long *flags);
static inline void mem_cgroup_end_update_page_stat(struct page *page,
                                        bool *locked, unsigned long *flags)
{
        if (mem_cgroup_disabled())
                return;
        if (*locked)
                __mem_cgroup_end_update_page_stat(page, flags);
        rcu_read_unlock();
}
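
/*
 * Example (illustrative sketch): a page-state statistics update that
 * must not race with the page moving to another memcg is bracketed by
 * the begin/end pair; the common case costs only rcu_read_lock():
 *
 *      bool locked;
 *      unsigned long flags;
 *
 *      mem_cgroup_begin_update_page_stat(page, &locked, &flags);
 *      if (page_mapped(page))  // stands in for the caller's real test
 *              mem_cgroup_inc_page_stat(page, MEM_CGROUP_STAT_FILE_MAPPED);
 *      mem_cgroup_end_update_page_stat(page, &locked, &flags);
 */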

void mem_cgroup_update_page_stat(struct page *page,
                                 enum mem_cgroup_stat_index idx,
                                 int val);

static inline void mem_cgroup_inc_page_stat(struct page *page,
                                            enum mem_cgroup_stat_index idx)
{
        mem_cgroup_update_page_stat(page, idx, 1);
}

static inline void mem_cgroup_dec_page_stat(struct page *page,
                                            enum mem_cgroup_stat_index idx)
{
        mem_cgroup_update_page_stat(page, idx, -1);
}

unsigned long mem_cgroup_soft_limit_reclaim(struct zone *zone, int order,
                                            gfp_t gfp_mask,
                                            unsigned long *total_scanned);

void __mem_cgroup_count_vm_event(struct mm_struct *mm, enum vm_event_item idx);
static inline void mem_cgroup_count_vm_event(struct mm_struct *mm,
                                             enum vm_event_item idx)
{
        if (mem_cgroup_disabled())
                return;
        __mem_cgroup_count_vm_event(mm, idx);
}
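
/*
 * Example (illustrative sketch): per-memcg event counting reuses the
 * global vm_event_item namespace, so a major fault can be accounted to
 * the faulting mm's memcg with:
 *
 *      mem_cgroup_count_vm_event(vma->vm_mm, PGMAJFAULT);
 */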

#ifdef CONFIG_TRANSPARENT_HUGEPAGE
void mem_cgroup_split_huge_fixup(struct page *head);
#endif

#ifdef CONFIG_DEBUG_VM
bool mem_cgroup_bad_page_check(struct page *page);
void mem_cgroup_print_bad_page(struct page *page);
#endif
#else /* CONFIG_MEMCG */
struct mem_cgroup;

static inline int mem_cgroup_try_charge(struct page *page, struct mm_struct *mm,
                                        gfp_t gfp_mask,
                                        struct mem_cgroup **memcgp)
{
        *memcgp = NULL;
        return 0;
}

static inline void mem_cgroup_commit_charge(struct page *page,
                                            struct mem_cgroup *memcg,
                                            bool lrucare)
{
}

static inline void mem_cgroup_cancel_charge(struct page *page,
                                            struct mem_cgroup *memcg)
{
}

static inline void mem_cgroup_uncharge(struct page *page)
{
}

static inline void mem_cgroup_uncharge_start(void)
{
}

static inline void mem_cgroup_uncharge_end(void)
{
}

static inline void mem_cgroup_migrate(struct page *oldpage,
                                      struct page *newpage,
                                      bool lrucare)
{
}

static inline struct lruvec *mem_cgroup_zone_lruvec(struct zone *zone,
                                                    struct mem_cgroup *memcg)
{
        return &zone->lruvec;
}

static inline struct lruvec *mem_cgroup_page_lruvec(struct page *page,
                                                    struct zone *zone)
{
        return &zone->lruvec;
}

static inline struct mem_cgroup *try_get_mem_cgroup_from_page(struct page *page)
{
        return NULL;
}

static inline bool mm_match_cgroup(struct mm_struct *mm,
                                   struct mem_cgroup *memcg)
{
        return true;
}

static inline bool task_in_mem_cgroup(struct task_struct *task,
                                      const struct mem_cgroup *memcg)
{
        return true;
}

static inline struct cgroup_subsys_state
                *mem_cgroup_css(struct mem_cgroup *memcg)
{
        return NULL;
}

static inline struct mem_cgroup *
mem_cgroup_iter(struct mem_cgroup *root,
                struct mem_cgroup *prev,
                struct mem_cgroup_reclaim_cookie *reclaim)
{
        return NULL;
}

static inline void mem_cgroup_iter_break(struct mem_cgroup *root,
                                         struct mem_cgroup *prev)
{
}

static inline bool mem_cgroup_disabled(void)
{
        return true;
}

static inline int
mem_cgroup_inactive_anon_is_low(struct lruvec *lruvec)
{
        return 1;
}

static inline unsigned long
mem_cgroup_get_lru_size(struct lruvec *lruvec, enum lru_list lru)
{
        return 0;
}

static inline void
mem_cgroup_update_lru_size(struct lruvec *lruvec, enum lru_list lru,
                           int increment)
{
}

static inline void
mem_cgroup_print_oom_info(struct mem_cgroup *memcg, struct task_struct *p)
{
}

static inline void mem_cgroup_begin_update_page_stat(struct page *page,
                                        bool *locked, unsigned long *flags)
{
}

static inline void mem_cgroup_end_update_page_stat(struct page *page,
                                        bool *locked, unsigned long *flags)
{
}

static inline void mem_cgroup_oom_enable(void)
{
}

static inline void mem_cgroup_oom_disable(void)
{
}

static inline bool task_in_memcg_oom(struct task_struct *p)
{
        return false;
}

static inline bool mem_cgroup_oom_synchronize(bool wait)
{
        return false;
}

static inline void mem_cgroup_inc_page_stat(struct page *page,
                                            enum mem_cgroup_stat_index idx)
{
}

static inline void mem_cgroup_dec_page_stat(struct page *page,
                                            enum mem_cgroup_stat_index idx)
{
}

static inline
unsigned long mem_cgroup_soft_limit_reclaim(struct zone *zone, int order,
                                            gfp_t gfp_mask,
                                            unsigned long *total_scanned)
{
        return 0;
}

static inline void mem_cgroup_split_huge_fixup(struct page *head)
{
}

static inline
void mem_cgroup_count_vm_event(struct mm_struct *mm, enum vm_event_item idx)
{
}
#endif /* CONFIG_MEMCG */

#if !defined(CONFIG_MEMCG) || !defined(CONFIG_DEBUG_VM)
static inline bool
mem_cgroup_bad_page_check(struct page *page)
{
        return false;
}

static inline void
mem_cgroup_print_bad_page(struct page *page)
{
}
#endif

enum {
        UNDER_LIMIT,
        SOFT_LIMIT,
        OVER_LIMIT,
};

struct sock;
#if defined(CONFIG_INET) && defined(CONFIG_MEMCG_KMEM)
void sock_update_memcg(struct sock *sk);
void sock_release_memcg(struct sock *sk);
#else
static inline void sock_update_memcg(struct sock *sk)
{
}
static inline void sock_release_memcg(struct sock *sk)
{
}
#endif /* CONFIG_INET && CONFIG_MEMCG_KMEM */

#ifdef CONFIG_MEMCG_KMEM
extern struct static_key memcg_kmem_enabled_key;

extern int memcg_limited_groups_array_size;

/*
 * Helper macro to loop through all memcg-specific caches. Callers must still
 * check if the cache is valid (it is either valid or NULL).
 * The slab_mutex must be held when looping through those caches.
 */
#define for_each_memcg_cache_index(_idx)        \
        for ((_idx) = 0; (_idx) < memcg_limited_groups_array_size; (_idx)++)
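
/*
 * Example (illustrative sketch): walking a root cache's per-memcg
 * child caches; cache_from_memcg_idx() is assumed to be the slab
 * internals' index-to-cache lookup:
 *
 *      struct kmem_cache *c;
 *      int i;
 *
 *      mutex_lock(&slab_mutex);
 *      for_each_memcg_cache_index(i) {
 *              c = cache_from_memcg_idx(root_cache, i);
 *              if (!c)
 *                      continue;
 *              // operate on the child cache
 *      }
 *      mutex_unlock(&slab_mutex);
 */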

static inline bool memcg_kmem_enabled(void)
{
        return static_key_false(&memcg_kmem_enabled_key);
}

/*
 * In general, we'll do everything in our power not to incur any overhead
 * for non-memcg users of the kmem functions. Not even a function call, if we
 * can avoid it.
 *
 * Therefore, we'll inline all those functions so that in the best case, we'll
 * see that kmemcg is off for everybody and proceed quickly. If it is on,
 * we'll still do most of the flag checking inline. We check a lot of
 * conditions, but because they are pretty simple, they are expected to be
 * fast.
 */
bool __memcg_kmem_newpage_charge(gfp_t gfp, struct mem_cgroup **memcg,
                                 int order);
void __memcg_kmem_commit_charge(struct page *page,
                                struct mem_cgroup *memcg, int order);
void __memcg_kmem_uncharge_pages(struct page *page, int order);

int memcg_cache_id(struct mem_cgroup *memcg);

int memcg_alloc_cache_params(struct mem_cgroup *memcg, struct kmem_cache *s,
                             struct kmem_cache *root_cache);
void memcg_free_cache_params(struct kmem_cache *s);

int memcg_update_cache_size(struct kmem_cache *s, int num_groups);
void memcg_update_array_size(int num_groups);

struct kmem_cache *
__memcg_kmem_get_cache(struct kmem_cache *cachep, gfp_t gfp);

int __memcg_charge_slab(struct kmem_cache *cachep, gfp_t gfp, int order);
void __memcg_uncharge_slab(struct kmem_cache *cachep, int order);

int __memcg_cleanup_cache_params(struct kmem_cache *s);

/**
 * memcg_kmem_newpage_charge: verify if a new kmem allocation is allowed.
 * @gfp: the gfp allocation flags.
 * @memcg: a pointer to the memcg this was charged against.
 * @order: allocation order.
 *
 * returns true if the memcg to which the current task belongs can hold this
 * allocation.
 *
 * We return true automatically if this allocation is not to be accounted to
 * any memcg.
 */
static inline bool
memcg_kmem_newpage_charge(gfp_t gfp, struct mem_cgroup **memcg, int order)
{
        if (!memcg_kmem_enabled())
                return true;

        /*
         * __GFP_NOFAIL allocations will move on even if charging is not
         * possible. Therefore we don't even try, and have this allocation
         * unaccounted. We could in theory charge it with
         * res_counter_charge_nofail, but we hope those allocations are rare,
         * and won't be worth the trouble.
         */
        if (gfp & __GFP_NOFAIL)
                return true;
        if (in_interrupt() || (!current->mm) || (current->flags & PF_KTHREAD))
                return true;

        /* If the task is dying, just let it go. */
        if (unlikely(fatal_signal_pending(current)))
                return true;

        return __memcg_kmem_newpage_charge(gfp, memcg, order);
}

/**
 * memcg_kmem_uncharge_pages: uncharge pages from memcg
 * @page: pointer to struct page being freed
 * @order: allocation order.
 *
 * There is no need to specify the memcg here, since it is embedded in the
 * page_cgroup.
 */
static inline void
memcg_kmem_uncharge_pages(struct page *page, int order)
{
        if (memcg_kmem_enabled())
                __memcg_kmem_uncharge_pages(page, order);
}

/**
 * memcg_kmem_commit_charge: embeds correct memcg in a page
 * @page: pointer to struct page recently allocated
 * @memcg: the memcg structure we charged against
 * @order: allocation order.
 *
 * Needs to be called after memcg_kmem_newpage_charge, regardless of success or
 * failure of the allocation. If @page is NULL, this function will revert the
 * charges. Otherwise, it will commit @memcg to the corresponding page_cgroup.
 */
static inline void
memcg_kmem_commit_charge(struct page *page, struct mem_cgroup *memcg, int order)
{
        if (memcg_kmem_enabled() && memcg)
                __memcg_kmem_commit_charge(page, memcg, order);
}
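
/*
 * Example (illustrative sketch): an accounted page allocation asks
 * permission first, allocates, then commits; committing a NULL page
 * reverts the charge taken at the first step:
 *
 *      struct page *page;
 *      struct mem_cgroup *memcg = NULL;
 *
 *      if (!memcg_kmem_newpage_charge(gfp_mask, &memcg, order))
 *              return NULL;
 *      page = alloc_pages(gfp_mask, order);
 *      memcg_kmem_commit_charge(page, memcg, order);
 *      return page;
 *
 * The matching free path calls memcg_kmem_uncharge_pages(page, order)
 * before returning the page to the allocator.
 */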

/**
 * memcg_kmem_get_cache: selects the correct per-memcg cache for allocation
 * @cachep: the original global kmem cache
 * @gfp: allocation flags.
 *
 * All memory allocated from a per-memcg cache is charged to the owner memcg.
 */
static __always_inline struct kmem_cache *
memcg_kmem_get_cache(struct kmem_cache *cachep, gfp_t gfp)
{
        if (!memcg_kmem_enabled())
                return cachep;
        if (gfp & __GFP_NOFAIL)
                return cachep;
        if (in_interrupt() || (!current->mm) || (current->flags & PF_KTHREAD))
                return cachep;
        if (unlikely(fatal_signal_pending(current)))
                return cachep;

        return __memcg_kmem_get_cache(cachep, gfp);
}
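
/*
 * Example (illustrative sketch): a slab allocator's hot path reroutes
 * the allocation to the current task's per-memcg child cache, falling
 * back to the global cache in the untracked cases above:
 *
 *      static void *slab_alloc(struct kmem_cache *cachep, gfp_t flags)
 *      {
 *              cachep = memcg_kmem_get_cache(cachep, flags);
 *              ...     // allocate from cachep as usual
 *      }
 */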
#else
#define for_each_memcg_cache_index(_idx)        \
        for (; NULL; )

static inline bool memcg_kmem_enabled(void)
{
        return false;
}

static inline bool
memcg_kmem_newpage_charge(gfp_t gfp, struct mem_cgroup **memcg, int order)
{
        return true;
}

static inline void memcg_kmem_uncharge_pages(struct page *page, int order)
{
}

static inline void
memcg_kmem_commit_charge(struct page *page, struct mem_cgroup *memcg, int order)
{
}

static inline int memcg_cache_id(struct mem_cgroup *memcg)
{
        return -1;
}

static inline int memcg_alloc_cache_params(struct mem_cgroup *memcg,
                struct kmem_cache *s, struct kmem_cache *root_cache)
{
        return 0;
}

static inline void memcg_free_cache_params(struct kmem_cache *s)
{
}

static inline struct kmem_cache *
memcg_kmem_get_cache(struct kmem_cache *cachep, gfp_t gfp)
{
        return cachep;
}
#endif /* CONFIG_MEMCG_KMEM */
#endif /* _LINUX_MEMCONTROL_H */