/* memcontrol.h - Memory Controller
 *
 * Copyright IBM Corporation, 2007
 * Author Balbir Singh <balbir@linux.vnet.ibm.com>
 *
 * Copyright 2007 OpenVZ SWsoft Inc
 * Author: Pavel Emelianov <xemul@openvz.org>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 */

#ifndef _LINUX_MEMCONTROL_H
#define _LINUX_MEMCONTROL_H
#include <linux/cgroup.h>
#include <linux/vm_event_item.h>
#include <linux/hardirq.h>
#include <linux/jump_label.h>

struct mem_cgroup;
struct page_cgroup;
struct page;
struct mm_struct;
struct kmem_cache;

/* Stats that can be updated by kernel. */
enum mem_cgroup_page_stat_item {
	MEMCG_NR_FILE_MAPPED, /* # of pages charged as file rss */
};

struct mem_cgroup_reclaim_cookie {
	struct zone *zone;
	int priority;
	unsigned int generation;
};

#ifdef CONFIG_MEMCG
/*
 * All "charge" functions taking a gfp_mask should use GFP_KERNEL or
 * (gfp_mask & GFP_RECLAIM_MASK). In the current implementation, memcg does
 * not allocate memory itself but reclaims memory from all available zones,
 * so the "where do I want memory from" bits of gfp_mask have no meaning.
 * Any bits of that field could therefore be passed, but having a rule avoids
 * ambiguity: a charge function's gfp_mask should be set to either GFP_KERNEL
 * or (gfp_mask & GFP_RECLAIM_MASK).
 * (Of course, if memcg does allocate memory in the future, GFP_KERNEL is sane.)
 */
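
/*
 * A minimal sketch of the rule above (illustrative only, not a real kernel
 * call site; "page", "mm" and "gfp_mask" stand in for a caller's own state):
 *
 *	error = mem_cgroup_newpage_charge(page, mm, GFP_KERNEL);
 *	error = mem_cgroup_cache_charge(page, mm, gfp_mask & GFP_RECLAIM_MASK);
 *
 * Either form keeps the placement bits of the mask out of the charge path.
 */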

extern int mem_cgroup_newpage_charge(struct page *page, struct mm_struct *mm,
				gfp_t gfp_mask);
/* for swap handling */
extern int mem_cgroup_try_charge_swapin(struct mm_struct *mm,
		struct page *page, gfp_t mask, struct mem_cgroup **memcgp);
extern void mem_cgroup_commit_charge_swapin(struct page *page,
					struct mem_cgroup *memcg);
extern void mem_cgroup_cancel_charge_swapin(struct mem_cgroup *memcg);

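/*
 * The swap-in charge is two-phase: try first, then either commit against the
 * page or cancel. A rough sketch of the expected call order in a fault path
 * (error handling and locking elided; "memcg" and "ret" are hypothetical
 * local names of the caller):
 *
 *	struct mem_cgroup *memcg = NULL;
 *
 *	if (mem_cgroup_try_charge_swapin(mm, page, GFP_KERNEL, &memcg)) {
 *		ret = VM_FAULT_OOM;
 *		goto out;
 *	}
 *	... map the page ...
 *	mem_cgroup_commit_charge_swapin(page, memcg);
 *	... or, if the fault is aborted: mem_cgroup_cancel_charge_swapin(memcg);
 */
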
extern int mem_cgroup_cache_charge(struct page *page, struct mm_struct *mm,
					gfp_t gfp_mask);

struct lruvec *mem_cgroup_zone_lruvec(struct zone *, struct mem_cgroup *);
struct lruvec *mem_cgroup_page_lruvec(struct page *, struct zone *);

/* For coalescing uncharges, to reduce memcg overhead */
extern void mem_cgroup_uncharge_start(void);
extern void mem_cgroup_uncharge_end(void);

extern void mem_cgroup_uncharge_page(struct page *page);
extern void mem_cgroup_uncharge_cache_page(struct page *page);

bool __mem_cgroup_same_or_subtree(const struct mem_cgroup *root_memcg,
				  struct mem_cgroup *memcg);
int task_in_mem_cgroup(struct task_struct *task, const struct mem_cgroup *memcg);

extern struct mem_cgroup *try_get_mem_cgroup_from_page(struct page *page);
extern struct mem_cgroup *mem_cgroup_from_task(struct task_struct *p);
extern struct mem_cgroup *try_get_mem_cgroup_from_mm(struct mm_struct *mm);

extern struct mem_cgroup *parent_mem_cgroup(struct mem_cgroup *memcg);
extern struct mem_cgroup *mem_cgroup_from_cont(struct cgroup *cont);

static inline
bool mm_match_cgroup(const struct mm_struct *mm, const struct mem_cgroup *memcg)
{
	struct mem_cgroup *task_memcg;
	bool match;

	rcu_read_lock();
	task_memcg = mem_cgroup_from_task(rcu_dereference(mm->owner));
	match = __mem_cgroup_same_or_subtree(memcg, task_memcg);
	rcu_read_unlock();
	return match;
}

extern struct cgroup_subsys_state *mem_cgroup_css(struct mem_cgroup *memcg);

extern void
mem_cgroup_prepare_migration(struct page *page, struct page *newpage,
			     struct mem_cgroup **memcgp);
extern void mem_cgroup_end_migration(struct mem_cgroup *memcg,
	struct page *oldpage, struct page *newpage, bool migration_ok);

struct mem_cgroup *mem_cgroup_iter(struct mem_cgroup *,
				   struct mem_cgroup *,
				   struct mem_cgroup_reclaim_cookie *);
void mem_cgroup_iter_break(struct mem_cgroup *, struct mem_cgroup *);

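/*
 * mem_cgroup_iter() walks the hierarchy below @root; feeding the previous
 * return value back in advances the walk, and NULL ends it. A sketch of the
 * usual reclaim-style loop (all local names are illustrative):
 *
 *	struct mem_cgroup_reclaim_cookie reclaim = {
 *		.zone = zone,
 *		.priority = prio,
 *	};
 *	struct mem_cgroup *memcg;
 *
 *	memcg = mem_cgroup_iter(root, NULL, &reclaim);
 *	do {
 *		... shrink the lruvecs belonging to memcg ...
 *		memcg = mem_cgroup_iter(root, memcg, &reclaim);
 *	} while (memcg);
 *
 * mem_cgroup_iter_break(root, memcg) is the way to bail out early, so that
 * the reference held on the last returned memcg is dropped.
 */
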
/*
 * For memory reclaim.
 */
int mem_cgroup_inactive_anon_is_low(struct lruvec *lruvec);
int mem_cgroup_inactive_file_is_low(struct lruvec *lruvec);
int mem_cgroup_select_victim_node(struct mem_cgroup *memcg);
unsigned long mem_cgroup_get_lru_size(struct lruvec *lruvec, enum lru_list);
void mem_cgroup_update_lru_size(struct lruvec *, enum lru_list, int);
extern void mem_cgroup_print_oom_info(struct mem_cgroup *memcg,
				      struct task_struct *p);
extern void mem_cgroup_replace_page_cache(struct page *oldpage,
					  struct page *newpage);

#ifdef CONFIG_MEMCG_SWAP
extern int do_swap_account;
#endif

static inline bool mem_cgroup_disabled(void)
{
	if (mem_cgroup_subsys.disabled)
		return true;
	return false;
}

void __mem_cgroup_begin_update_page_stat(struct page *page, bool *locked,
					 unsigned long *flags);

extern atomic_t memcg_moving;

static inline void mem_cgroup_begin_update_page_stat(struct page *page,
					bool *locked, unsigned long *flags)
{
	if (mem_cgroup_disabled())
		return;
	rcu_read_lock();
	*locked = false;
	if (atomic_read(&memcg_moving))
		__mem_cgroup_begin_update_page_stat(page, locked, flags);
}

void __mem_cgroup_end_update_page_stat(struct page *page,
				       unsigned long *flags);
static inline void mem_cgroup_end_update_page_stat(struct page *page,
					bool *locked, unsigned long *flags)
{
	if (mem_cgroup_disabled())
		return;
	if (*locked)
		__mem_cgroup_end_update_page_stat(page, flags);
	rcu_read_unlock();
}

void mem_cgroup_update_page_stat(struct page *page,
				 enum mem_cgroup_page_stat_item idx,
				 int val);

static inline void mem_cgroup_inc_page_stat(struct page *page,
					    enum mem_cgroup_page_stat_item idx)
{
	mem_cgroup_update_page_stat(page, idx, 1);
}

static inline void mem_cgroup_dec_page_stat(struct page *page,
					    enum mem_cgroup_page_stat_item idx)
{
	mem_cgroup_update_page_stat(page, idx, -1);
}

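/*
 * The begin/end pair above brackets a page state change so the statistic
 * update cannot race with the page being moved between memcgs. A sketch of
 * the expected pattern, roughly how a file-rmap style update would look
 * (the local variables are illustrative):
 *
 *	bool locked;
 *	unsigned long flags;
 *
 *	mem_cgroup_begin_update_page_stat(page, &locked, &flags);
 *	if (... the page state actually changed ...)
 *		mem_cgroup_inc_page_stat(page, MEMCG_NR_FILE_MAPPED);
 *	mem_cgroup_end_update_page_stat(page, &locked, &flags);
 */
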
unsigned long mem_cgroup_soft_limit_reclaim(struct zone *zone, int order,
					    gfp_t gfp_mask,
					    unsigned long *total_scanned);

void __mem_cgroup_count_vm_event(struct mm_struct *mm, enum vm_event_item idx);
static inline void mem_cgroup_count_vm_event(struct mm_struct *mm,
					     enum vm_event_item idx)
{
	if (mem_cgroup_disabled())
		return;
	__mem_cgroup_count_vm_event(mm, idx);
}
#ifdef CONFIG_TRANSPARENT_HUGEPAGE
void mem_cgroup_split_huge_fixup(struct page *head);
#endif

#ifdef CONFIG_DEBUG_VM
bool mem_cgroup_bad_page_check(struct page *page);
void mem_cgroup_print_bad_page(struct page *page);
#endif
#else /* CONFIG_MEMCG */
struct mem_cgroup;

static inline int mem_cgroup_newpage_charge(struct page *page,
					struct mm_struct *mm, gfp_t gfp_mask)
{
	return 0;
}

static inline int mem_cgroup_cache_charge(struct page *page,
					struct mm_struct *mm, gfp_t gfp_mask)
{
	return 0;
}

static inline int mem_cgroup_try_charge_swapin(struct mm_struct *mm,
		struct page *page, gfp_t gfp_mask, struct mem_cgroup **memcgp)
{
	return 0;
}

static inline void mem_cgroup_commit_charge_swapin(struct page *page,
					struct mem_cgroup *memcg)
{
}

static inline void mem_cgroup_cancel_charge_swapin(struct mem_cgroup *memcg)
{
}

static inline void mem_cgroup_uncharge_start(void)
{
}

static inline void mem_cgroup_uncharge_end(void)
{
}

static inline void mem_cgroup_uncharge_page(struct page *page)
{
}

static inline void mem_cgroup_uncharge_cache_page(struct page *page)
{
}

static inline struct lruvec *mem_cgroup_zone_lruvec(struct zone *zone,
						    struct mem_cgroup *memcg)
{
	return &zone->lruvec;
}

static inline struct lruvec *mem_cgroup_page_lruvec(struct page *page,
						    struct zone *zone)
{
	return &zone->lruvec;
}

static inline struct mem_cgroup *try_get_mem_cgroup_from_page(struct page *page)
{
	return NULL;
}

static inline struct mem_cgroup *try_get_mem_cgroup_from_mm(struct mm_struct *mm)
{
	return NULL;
}

static inline bool mm_match_cgroup(struct mm_struct *mm,
				   struct mem_cgroup *memcg)
{
	return true;
}

static inline int task_in_mem_cgroup(struct task_struct *task,
				     const struct mem_cgroup *memcg)
{
	return 1;
}

static inline struct cgroup_subsys_state
		*mem_cgroup_css(struct mem_cgroup *memcg)
{
	return NULL;
}

static inline void
mem_cgroup_prepare_migration(struct page *page, struct page *newpage,
			     struct mem_cgroup **memcgp)
{
}

static inline void mem_cgroup_end_migration(struct mem_cgroup *memcg,
		struct page *oldpage, struct page *newpage, bool migration_ok)
{
}

static inline struct mem_cgroup *
mem_cgroup_iter(struct mem_cgroup *root,
		struct mem_cgroup *prev,
		struct mem_cgroup_reclaim_cookie *reclaim)
{
	return NULL;
}

static inline void mem_cgroup_iter_break(struct mem_cgroup *root,
					 struct mem_cgroup *prev)
{
}

static inline bool mem_cgroup_disabled(void)
{
	return true;
}

static inline int
mem_cgroup_inactive_anon_is_low(struct lruvec *lruvec)
{
	return 1;
}

static inline int
mem_cgroup_inactive_file_is_low(struct lruvec *lruvec)
{
	return 1;
}

static inline unsigned long
mem_cgroup_get_lru_size(struct lruvec *lruvec, enum lru_list lru)
{
	return 0;
}

static inline void
mem_cgroup_update_lru_size(struct lruvec *lruvec, enum lru_list lru,
			   int increment)
{
}

static inline void
mem_cgroup_print_oom_info(struct mem_cgroup *memcg, struct task_struct *p)
{
}

static inline void mem_cgroup_begin_update_page_stat(struct page *page,
					bool *locked, unsigned long *flags)
{
}

static inline void mem_cgroup_end_update_page_stat(struct page *page,
					bool *locked, unsigned long *flags)
{
}

static inline void mem_cgroup_inc_page_stat(struct page *page,
					    enum mem_cgroup_page_stat_item idx)
{
}

static inline void mem_cgroup_dec_page_stat(struct page *page,
					    enum mem_cgroup_page_stat_item idx)
{
}

static inline
unsigned long mem_cgroup_soft_limit_reclaim(struct zone *zone, int order,
					    gfp_t gfp_mask,
					    unsigned long *total_scanned)
{
	return 0;
}

static inline void mem_cgroup_split_huge_fixup(struct page *head)
{
}

static inline
void mem_cgroup_count_vm_event(struct mm_struct *mm, enum vm_event_item idx)
{
}
static inline void mem_cgroup_replace_page_cache(struct page *oldpage,
						 struct page *newpage)
{
}
#endif /* CONFIG_MEMCG */

#if !defined(CONFIG_MEMCG) || !defined(CONFIG_DEBUG_VM)
static inline bool
mem_cgroup_bad_page_check(struct page *page)
{
	return false;
}

static inline void
mem_cgroup_print_bad_page(struct page *page)
{
}
#endif

enum {
	UNDER_LIMIT,
	SOFT_LIMIT,
	OVER_LIMIT,
};

struct sock;
#if defined(CONFIG_INET) && defined(CONFIG_MEMCG_KMEM)
void sock_update_memcg(struct sock *sk);
void sock_release_memcg(struct sock *sk);
#else
static inline void sock_update_memcg(struct sock *sk)
{
}
static inline void sock_release_memcg(struct sock *sk)
{
}
#endif /* CONFIG_INET && CONFIG_MEMCG_KMEM */

#ifdef CONFIG_MEMCG_KMEM
extern struct static_key memcg_kmem_enabled_key;
static inline bool memcg_kmem_enabled(void)
{
	return static_key_false(&memcg_kmem_enabled_key);
}

/*
 * In general, we'll do everything in our power not to incur any overhead
 * from the kmem functions for non-memcg users. Not even a function call,
 * if we can avoid it.
 *
 * Therefore, we'll inline all those functions so that in the best case, we'll
 * see that kmemcg is off for everybody and proceed quickly. If it is on,
 * we'll still do most of the flag checking inline. We check a lot of
 * conditions, but because they are pretty simple, they are expected to be
 * fast.
 */
bool __memcg_kmem_newpage_charge(gfp_t gfp, struct mem_cgroup **memcg,
					int order);
void __memcg_kmem_commit_charge(struct page *page,
				struct mem_cgroup *memcg, int order);
void __memcg_kmem_uncharge_pages(struct page *page, int order);

int memcg_cache_id(struct mem_cgroup *memcg);
int memcg_register_cache(struct mem_cgroup *memcg, struct kmem_cache *s);
void memcg_release_cache(struct kmem_cache *cachep);
void memcg_cache_list_add(struct mem_cgroup *memcg, struct kmem_cache *cachep);

int memcg_update_cache_size(struct kmem_cache *s, int num_groups);
void memcg_update_array_size(int num_groups);

struct kmem_cache *
__memcg_kmem_get_cache(struct kmem_cache *cachep, gfp_t gfp);

/**
 * memcg_kmem_newpage_charge: verify if a new kmem allocation is allowed.
 * @gfp: the gfp allocation flags.
 * @memcg: a pointer to the memcg this was charged against.
 * @order: allocation order.
 *
 * Returns true if the memcg to which the current task belongs can hold this
 * allocation.
 *
 * We return true automatically if this allocation is not to be accounted to
 * any memcg.
 */
static inline bool
memcg_kmem_newpage_charge(gfp_t gfp, struct mem_cgroup **memcg, int order)
{
	if (!memcg_kmem_enabled())
		return true;

	/*
	 * __GFP_NOFAIL allocations will move on even if charging is not
	 * possible. Therefore we don't even try, and have this allocation
	 * unaccounted. We could in theory charge it with
	 * res_counter_charge_nofail, but we hope those allocations are rare,
	 * and won't be worth the trouble.
	 */
	if (!(gfp & __GFP_KMEMCG) || (gfp & __GFP_NOFAIL))
		return true;
	if (in_interrupt() || (!current->mm) || (current->flags & PF_KTHREAD))
		return true;

	/* If the task is dying, just let it go. */
	if (unlikely(fatal_signal_pending(current)))
		return true;

	return __memcg_kmem_newpage_charge(gfp, memcg, order);
}

/**
 * memcg_kmem_uncharge_pages: uncharge pages from memcg
 * @page: pointer to struct page being freed
 * @order: allocation order.
 *
 * There is no need to specify the memcg here, since it is embedded in the
 * page_cgroup.
 */
static inline void
memcg_kmem_uncharge_pages(struct page *page, int order)
{
	if (memcg_kmem_enabled())
		__memcg_kmem_uncharge_pages(page, order);
}

/**
 * memcg_kmem_commit_charge: embeds correct memcg in a page
 * @page: pointer to struct page recently allocated
 * @memcg: the memcg structure we charged against
 * @order: allocation order.
 *
 * Needs to be called after memcg_kmem_newpage_charge, regardless of success or
 * failure of the allocation. If @page is NULL, this function will revert the
 * charges. Otherwise, it will commit @memcg to the corresponding page_cgroup.
 */
static inline void
memcg_kmem_commit_charge(struct page *page, struct mem_cgroup *memcg, int order)
{
	if (memcg_kmem_enabled() && memcg)
		__memcg_kmem_commit_charge(page, memcg, order);
}

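/*
 * How the three helpers above are meant to be paired around a page
 * allocation; a sketch of the accounting flow rather than the allocator's
 * exact code ("page", "gfp" and "order" belong to the hypothetical caller):
 *
 *	struct mem_cgroup *memcg = NULL;
 *
 *	if (!memcg_kmem_newpage_charge(gfp, &memcg, order))
 *		return NULL;				   // charge refused
 *	page = alloc_pages(gfp, order);
 *	memcg_kmem_commit_charge(page, memcg, order);	   // reverts if !page
 *	...
 *	memcg_kmem_uncharge_pages(page, order);		   // at free time
 */
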
/**
 * memcg_kmem_get_cache: selects the correct per-memcg cache for allocation
 * @cachep: the original global kmem cache
 * @gfp: allocation flags.
 *
 * This function assumes that the task allocating, which determines the memcg
 * in the page allocator, belongs to the same cgroup throughout the whole
 * process. Misaccounting can happen if the task calls memcg_kmem_get_cache()
 * while belonging to a cgroup, and later on changes cgroups. This is
 * considered acceptable, and should only happen upon task migration.
 *
 * Before the cache is created by the memcg core, there is also a possible
 * imbalance: the task belongs to a memcg, but the cache being allocated from
 * is the global cache, since the child cache is not yet guaranteed to be
 * ready. This case is also fine, since in this case GFP_KMEMCG will not be
 * passed and the page allocator will not attempt any cgroup accounting.
 */
static __always_inline struct kmem_cache *
memcg_kmem_get_cache(struct kmem_cache *cachep, gfp_t gfp)
{
	if (!memcg_kmem_enabled())
		return cachep;
	if (gfp & __GFP_NOFAIL)
		return cachep;
	if (in_interrupt() || (!current->mm) || (current->flags & PF_KTHREAD))
		return cachep;
	if (unlikely(fatal_signal_pending(current)))
		return cachep;

	return __memcg_kmem_get_cache(cachep, gfp);
}
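
/*
 * A sketch of how an allocation path is expected to use this: swap the global
 * cache for the task's per-memcg copy before allocating from it. Illustrative
 * only; this is roughly what the slab allocators are expected to do
 * internally, not a call users make themselves:
 *
 *	cachep = memcg_kmem_get_cache(cachep, flags);
 *	objp = kmem_cache_alloc(cachep, flags);
 */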
#else
static inline bool memcg_kmem_enabled(void)
{
	return false;
}

static inline bool
memcg_kmem_newpage_charge(gfp_t gfp, struct mem_cgroup **memcg, int order)
{
	return true;
}

static inline void memcg_kmem_uncharge_pages(struct page *page, int order)
{
}

static inline void
memcg_kmem_commit_charge(struct page *page, struct mem_cgroup *memcg, int order)
{
}

static inline int memcg_cache_id(struct mem_cgroup *memcg)
{
	return -1;
}

static inline int memcg_register_cache(struct mem_cgroup *memcg,
					struct kmem_cache *s)
{
	return 0;
}

static inline void memcg_release_cache(struct kmem_cache *cachep)
{
}

static inline void memcg_cache_list_add(struct mem_cgroup *memcg,
					struct kmem_cache *s)
{
}

static inline struct kmem_cache *
memcg_kmem_get_cache(struct kmem_cache *cachep, gfp_t gfp)
{
	return cachep;
}
#endif /* CONFIG_MEMCG_KMEM */
#endif /* _LINUX_MEMCONTROL_H */