diff --git a/mm/slab_common.c b/mm/slab_common.c
index ae323841adb1ac76052eb6536aa2a3acc36b88e3..09d0e849b07f47d82f5d9a5cda4862517d297cb2 100644
--- a/mm/slab_common.c
+++ b/mm/slab_common.c
@@ -30,6 +30,11 @@ LIST_HEAD(slab_caches);
 DEFINE_MUTEX(slab_mutex);
 struct kmem_cache *kmem_cache;
 
+static LIST_HEAD(slab_caches_to_rcu_destroy);
+static void slab_caches_to_rcu_destroy_workfn(struct work_struct *work);
+static DECLARE_WORK(slab_caches_to_rcu_destroy_work,
+                   slab_caches_to_rcu_destroy_workfn);
+
 /*
  * Set of flags that will prevent slab merging
  */
@@ -133,11 +138,14 @@ int __kmem_cache_alloc_bulk(struct kmem_cache *s, gfp_t flags, size_t nr,
 }
 
 #if defined(CONFIG_MEMCG) && !defined(CONFIG_SLOB)
+
+LIST_HEAD(slab_root_caches);
+
 void slab_init_memcg_params(struct kmem_cache *s)
 {
-       s->memcg_params.is_root_cache = true;
-       INIT_LIST_HEAD(&s->memcg_params.list);
+       s->memcg_params.root_cache = NULL;
        RCU_INIT_POINTER(s->memcg_params.memcg_caches, NULL);
+       INIT_LIST_HEAD(&s->memcg_params.children);
 }
 
 static int init_memcg_params(struct kmem_cache *s,
@@ -145,10 +153,11 @@ static int init_memcg_params(struct kmem_cache *s,
 {
        struct memcg_cache_array *arr;
 
-       if (memcg) {
-               s->memcg_params.is_root_cache = false;
-               s->memcg_params.memcg = memcg;
+       if (root_cache) {
                s->memcg_params.root_cache = root_cache;
+               s->memcg_params.memcg = memcg;
+               INIT_LIST_HEAD(&s->memcg_params.children_node);
+               INIT_LIST_HEAD(&s->memcg_params.kmem_caches_node);
                return 0;
        }
 
@@ -177,9 +186,6 @@ static int update_memcg_params(struct kmem_cache *s, int new_array_size)
 {
        struct memcg_cache_array *old, *new;
 
-       if (!is_root_cache(s))
-               return 0;
-
        new = kzalloc(sizeof(struct memcg_cache_array) +
                      new_array_size * sizeof(void *), GFP_KERNEL);
        if (!new)
@@ -203,7 +209,7 @@ int memcg_update_all_caches(int num_memcgs)
        int ret = 0;
 
        mutex_lock(&slab_mutex);
-       list_for_each_entry(s, &slab_caches, list) {
+       list_for_each_entry(s, &slab_root_caches, root_caches_node) {
                ret = update_memcg_params(s, num_memcgs);
                /*
                 * Instead of freeing the memory, we'll just leave the caches
@@ -215,6 +221,28 @@ int memcg_update_all_caches(int num_memcgs)
        mutex_unlock(&slab_mutex);
        return ret;
 }
+
+void memcg_link_cache(struct kmem_cache *s)
+{
+       if (is_root_cache(s)) {
+               list_add(&s->root_caches_node, &slab_root_caches);
+       } else {
+               list_add(&s->memcg_params.children_node,
+                        &s->memcg_params.root_cache->memcg_params.children);
+               list_add(&s->memcg_params.kmem_caches_node,
+                        &s->memcg_params.memcg->kmem_caches);
+       }
+}
+
+static void memcg_unlink_cache(struct kmem_cache *s)
+{
+       if (is_root_cache(s)) {
+               list_del(&s->root_caches_node);
+       } else {
+               list_del(&s->memcg_params.children_node);
+               list_del(&s->memcg_params.kmem_caches_node);
+       }
+}
 #else
 static inline int init_memcg_params(struct kmem_cache *s,
                struct mem_cgroup *memcg, struct kmem_cache *root_cache)
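
With memcg_link_cache()/memcg_unlink_cache() above, a root cache sits on the global slab_root_caches list, while each per-memcg child is linked both into its root's memcg_params.children list and into its owning memcg's kmem_caches list. A minimal sketch of how the two linkages can be walked under slab_mutex, assuming the mm/slab.h internals visible inside mm/ and a CONFIG_MEMCG && !CONFIG_SLOB build (illustration only, not part of the patch):

	static void walk_memcg_cache_links(void)
	{
		struct kmem_cache *root, *child;

		mutex_lock(&slab_mutex);
		/* every root cache is on slab_root_caches ... */
		list_for_each_entry(root, &slab_root_caches, root_caches_node) {
			/* ... and its per-memcg children hang off memcg_params.children */
			list_for_each_entry(child, &root->memcg_params.children,
					    memcg_params.children_node)
				pr_info("%s is a child of %s\n",
					child->name, root->name);
		}
		mutex_unlock(&slab_mutex);
	}
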
@@ -225,6 +253,10 @@ static inline int init_memcg_params(struct kmem_cache *s,
 static inline void destroy_memcg_params(struct kmem_cache *s)
 {
 }
+
+static inline void memcg_unlink_cache(struct kmem_cache *s)
+{
+}
 #endif /* CONFIG_MEMCG && !CONFIG_SLOB */
 
 /*
@@ -255,7 +287,7 @@ struct kmem_cache *find_mergeable(size_t size, size_t align,
 {
        struct kmem_cache *s;
 
-       if (slab_nomerge || (flags & SLAB_NEVER_MERGE))
+       if (slab_nomerge)
                return NULL;
 
        if (ctor)
@@ -266,7 +298,10 @@ struct kmem_cache *find_mergeable(size_t size, size_t align,
        size = ALIGN(size, align);
        flags = kmem_cache_flags(size, flags, name, NULL);
 
-       list_for_each_entry_reverse(s, &slab_caches, list) {
+       if (flags & SLAB_NEVER_MERGE)
+               return NULL;
+
+       list_for_each_entry_reverse(s, &slab_root_caches, root_caches_node) {
                if (slab_unmergeable(s))
                        continue;
 
@@ -350,6 +385,7 @@ static struct kmem_cache *create_cache(const char *name,
 
        s->refcount = 1;
        list_add(&s->list, &slab_caches);
+       memcg_link_cache(s);
 out:
        if (err)
                return ERR_PTR(err);
@@ -458,33 +494,61 @@ out_unlock:
 }
 EXPORT_SYMBOL(kmem_cache_create);
 
-static int shutdown_cache(struct kmem_cache *s,
-               struct list_head *release, bool *need_rcu_barrier)
+static void slab_caches_to_rcu_destroy_workfn(struct work_struct *work)
 {
-       if (__kmem_cache_shutdown(s) != 0)
-               return -EBUSY;
+       LIST_HEAD(to_destroy);
+       struct kmem_cache *s, *s2;
+
+       /*
+        * On destruction, SLAB_DESTROY_BY_RCU kmem_caches are put on the
+        * @slab_caches_to_rcu_destroy list.  The slab pages are freed
+        * through RCU and the associated kmem_cache is dereferenced
+        * while freeing the pages, so the kmem_caches should be freed only
+        * after the pending RCU operations are finished.  As rcu_barrier()
+        * is a pretty slow operation, we batch all pending destructions
+        * asynchronously.
+        */
+       mutex_lock(&slab_mutex);
+       list_splice_init(&slab_caches_to_rcu_destroy, &to_destroy);
+       mutex_unlock(&slab_mutex);
+
+       if (list_empty(&to_destroy))
+               return;
 
-       if (s->flags & SLAB_DESTROY_BY_RCU)
-               *need_rcu_barrier = true;
+       rcu_barrier();
 
-       list_move(&s->list, release);
-       return 0;
+       list_for_each_entry_safe(s, s2, &to_destroy, list) {
+#ifdef SLAB_SUPPORTS_SYSFS
+               sysfs_slab_release(s);
+#else
+               slab_kmem_cache_release(s);
+#endif
+       }
 }
 
-static void release_caches(struct list_head *release, bool need_rcu_barrier)
+static int shutdown_cache(struct kmem_cache *s)
 {
-       struct kmem_cache *s, *s2;
+       /* free asan quarantined objects */
+       kasan_cache_shutdown(s);
 
-       if (need_rcu_barrier)
-               rcu_barrier();
+       if (__kmem_cache_shutdown(s) != 0)
+               return -EBUSY;
 
-       list_for_each_entry_safe(s, s2, release, list) {
+       memcg_unlink_cache(s);
+       list_del(&s->list);
+
+       if (s->flags & SLAB_DESTROY_BY_RCU) {
+               list_add_tail(&s->list, &slab_caches_to_rcu_destroy);
+               schedule_work(&slab_caches_to_rcu_destroy_work);
+       } else {
 #ifdef SLAB_SUPPORTS_SYSFS
-               sysfs_slab_remove(s);
+               sysfs_slab_release(s);
 #else
                slab_kmem_cache_release(s);
 #endif
        }
+
+       return 0;
 }
 
 #if defined(CONFIG_MEMCG) && !defined(CONFIG_SLOB)
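
shutdown_cache() above now handles the whole teardown: non-RCU caches are released immediately, while SLAB_DESTROY_BY_RCU caches are parked on slab_caches_to_rcu_destroy and released from the work item, so a single rcu_barrier() covers an entire batch instead of one barrier per cache. The generic shape of that batching, sketched with a hypothetical struct foo (illustration only, not part of the patch):

	#include <linux/list.h>
	#include <linux/mutex.h>
	#include <linux/rcupdate.h>
	#include <linux/slab.h>
	#include <linux/workqueue.h>

	struct foo {
		struct list_head node;
	};

	static LIST_HEAD(foo_to_destroy);
	static DEFINE_MUTEX(foo_lock);
	static void foo_destroy_workfn(struct work_struct *work);
	static DECLARE_WORK(foo_destroy_work, foo_destroy_workfn);

	static void foo_destroy_workfn(struct work_struct *work)
	{
		LIST_HEAD(batch);
		struct foo *f, *tmp;

		/* grab everything queued so far */
		mutex_lock(&foo_lock);
		list_splice_init(&foo_to_destroy, &batch);
		mutex_unlock(&foo_lock);

		if (list_empty(&batch))
			return;

		/*
		 * One barrier for the whole batch: every RCU callback queued
		 * before these objects were parked here has now finished.
		 */
		rcu_barrier();

		list_for_each_entry_safe(f, tmp, &batch, node)
			kfree(f);
	}

	/* defer freeing @f until pending RCU callbacks are done */
	static void foo_destroy_deferred(struct foo *f)
	{
		mutex_lock(&foo_lock);
		list_add_tail(&f->node, &foo_to_destroy);
		mutex_unlock(&foo_lock);
		schedule_work(&foo_destroy_work);
	}
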
@@ -551,8 +615,6 @@ void memcg_create_kmem_cache(struct mem_cgroup *memcg,
                goto out_unlock;
        }
 
-       list_add(&s->memcg_params.list, &root_cache->memcg_params.list);
-
        /*
         * Since readers won't lock (see cache_from_memcg_idx()), we need a
         * barrier here to ensure nobody will see the kmem_cache partially
@@ -568,6 +630,66 @@ out_unlock:
        put_online_cpus();
 }
 
+static void kmemcg_deactivate_workfn(struct work_struct *work)
+{
+       struct kmem_cache *s = container_of(work, struct kmem_cache,
+                                           memcg_params.deact_work);
+
+       get_online_cpus();
+       get_online_mems();
+
+       mutex_lock(&slab_mutex);
+
+       s->memcg_params.deact_fn(s);
+
+       mutex_unlock(&slab_mutex);
+
+       put_online_mems();
+       put_online_cpus();
+
+       /* done, put the ref from slab_deactivate_memcg_cache_rcu_sched() */
+       css_put(&s->memcg_params.memcg->css);
+}
+
+static void kmemcg_deactivate_rcufn(struct rcu_head *head)
+{
+       struct kmem_cache *s = container_of(head, struct kmem_cache,
+                                           memcg_params.deact_rcu_head);
+
+       /*
+        * We need to grab blocking locks.  Bounce to ->deact_work.  The
+        * work item shares the space with the RCU head and can't be
+        * initialized earlier.
+        */
+       INIT_WORK(&s->memcg_params.deact_work, kmemcg_deactivate_workfn);
+       queue_work(memcg_kmem_cache_wq, &s->memcg_params.deact_work);
+}
+
+/**
+ * slab_deactivate_memcg_cache_rcu_sched - schedule deactivation after a
+ *                                        sched RCU grace period
+ * @s: target kmem_cache
+ * @deact_fn: deactivation function to call
+ *
+ * Schedule @deact_fn to be invoked with online cpus, mems and slab_mutex
+ * held after a sched RCU grace period.  The slab is guaranteed to stay
+ * alive until @deact_fn is finished.  This is to be used from
+ * __kmemcg_cache_deactivate().
+ */
+void slab_deactivate_memcg_cache_rcu_sched(struct kmem_cache *s,
+                                          void (*deact_fn)(struct kmem_cache *))
+{
+       if (WARN_ON_ONCE(is_root_cache(s)) ||
+           WARN_ON_ONCE(s->memcg_params.deact_fn))
+               return;
+
+       /* pin memcg so that @s doesn't get destroyed in the middle */
+       css_get(&s->memcg_params.memcg->css);
+
+       s->memcg_params.deact_fn = deact_fn;
+       call_rcu_sched(&s->memcg_params.deact_rcu_head, kmemcg_deactivate_rcufn);
+}
+
 void memcg_deactivate_kmem_caches(struct mem_cgroup *memcg)
 {
        int idx;
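
slab_deactivate_memcg_cache_rcu_sched() above uses a common two-stage release: the RCU callback runs in a context that must not block, so it only converts itself into a work item, and the blocking part (here, taking slab_mutex plus the cpu/memory hotplug locks) runs from the workqueue. The patch overlays the work_struct on the rcu_head and uses call_rcu_sched(); the stand-alone sketch below keeps the two fields separate and uses plain call_rcu(), with a hypothetical struct foo (illustration only, not part of the patch):

	#include <linux/rcupdate.h>
	#include <linux/slab.h>
	#include <linux/workqueue.h>

	struct foo {
		struct rcu_head rcu;
		struct work_struct work;
		/* payload ... */
	};

	static void foo_workfn(struct work_struct *work)
	{
		struct foo *f = container_of(work, struct foo, work);

		/* process context: blocking locks, allocations etc. are fine */
		kfree(f);
	}

	static void foo_rcufn(struct rcu_head *head)
	{
		struct foo *f = container_of(head, struct foo, rcu);

		/* atomic context: just bounce to a workqueue */
		INIT_WORK(&f->work, foo_workfn);
		schedule_work(&f->work);
	}

	/* run the blocking part of the release after a grace period */
	static void foo_release_after_grace_period(struct foo *f)
	{
		call_rcu(&f->rcu, foo_rcufn);
	}
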
@@ -579,41 +701,15 @@ void memcg_deactivate_kmem_caches(struct mem_cgroup *memcg)
        get_online_cpus();
        get_online_mems();
 
-#ifdef CONFIG_SLUB
-       /*
-        * In case of SLUB, we need to disable empty slab caching to
-        * avoid pinning the offline memory cgroup by freeable kmem
-        * pages charged to it. SLAB doesn't need this, as it
-        * periodically purges unused slabs.
-        */
-       mutex_lock(&slab_mutex);
-       list_for_each_entry(s, &slab_caches, list) {
-               c = is_root_cache(s) ? cache_from_memcg_idx(s, idx) : NULL;
-               if (c) {
-                       c->cpu_partial = 0;
-                       c->min_partial = 0;
-               }
-       }
-       mutex_unlock(&slab_mutex);
-       /*
-        * kmem_cache->cpu_partial is checked locklessly (see
-        * put_cpu_partial()). Make sure the change is visible.
-        */
-       synchronize_sched();
-#endif
-
        mutex_lock(&slab_mutex);
-       list_for_each_entry(s, &slab_caches, list) {
-               if (!is_root_cache(s))
-                       continue;
-
+       list_for_each_entry(s, &slab_root_caches, root_caches_node) {
                arr = rcu_dereference_protected(s->memcg_params.memcg_caches,
                                                lockdep_is_held(&slab_mutex));
                c = arr->entries[idx];
                if (!c)
                        continue;
 
-               __kmem_cache_shrink(c);
+               __kmemcg_cache_deactivate(c);
                arr->entries[idx] = NULL;
        }
        mutex_unlock(&slab_mutex);
@@ -622,47 +718,29 @@ void memcg_deactivate_kmem_caches(struct mem_cgroup *memcg)
        put_online_cpus();
 }
 
-static int __shutdown_memcg_cache(struct kmem_cache *s,
-               struct list_head *release, bool *need_rcu_barrier)
-{
-       BUG_ON(is_root_cache(s));
-
-       if (shutdown_cache(s, release, need_rcu_barrier))
-               return -EBUSY;
-
-       list_del(&s->memcg_params.list);
-       return 0;
-}
-
 void memcg_destroy_kmem_caches(struct mem_cgroup *memcg)
 {
-       LIST_HEAD(release);
-       bool need_rcu_barrier = false;
        struct kmem_cache *s, *s2;
 
        get_online_cpus();
        get_online_mems();
 
        mutex_lock(&slab_mutex);
-       list_for_each_entry_safe(s, s2, &slab_caches, list) {
-               if (is_root_cache(s) || s->memcg_params.memcg != memcg)
-                       continue;
+       list_for_each_entry_safe(s, s2, &memcg->kmem_caches,
+                                memcg_params.kmem_caches_node) {
                /*
                 * The cgroup is about to be freed and therefore has no charges
                 * left. Hence, all its caches must be empty by now.
                 */
-               BUG_ON(__shutdown_memcg_cache(s, &release, &need_rcu_barrier));
+               BUG_ON(shutdown_cache(s));
        }
        mutex_unlock(&slab_mutex);
 
        put_online_mems();
        put_online_cpus();
-
-       release_caches(&release, need_rcu_barrier);
 }
 
-static int shutdown_memcg_caches(struct kmem_cache *s,
-               struct list_head *release, bool *need_rcu_barrier)
+static int shutdown_memcg_caches(struct kmem_cache *s)
 {
        struct memcg_cache_array *arr;
        struct kmem_cache *c, *c2;
@@ -681,13 +759,13 @@ static int shutdown_memcg_caches(struct kmem_cache *s,
                c = arr->entries[i];
                if (!c)
                        continue;
-               if (__shutdown_memcg_cache(c, release, need_rcu_barrier))
+               if (shutdown_cache(c))
                        /*
                         * The cache still has objects. Move it to a temporary
                         * list so as not to try to destroy it for a second
                         * time while iterating over inactive caches below.
                         */
-                       list_move(&c->memcg_params.list, &busy);
+                       list_move(&c->memcg_params.children_node, &busy);
                else
                        /*
                         * The cache is empty and will be destroyed soon. Clear
@@ -702,23 +780,22 @@ static int shutdown_memcg_caches(struct kmem_cache *s,
         * Second, shutdown all caches left from memory cgroups that are now
         * offline.
         */
-       list_for_each_entry_safe(c, c2, &s->memcg_params.list,
-                                memcg_params.list)
-               __shutdown_memcg_cache(c, release, need_rcu_barrier);
+       list_for_each_entry_safe(c, c2, &s->memcg_params.children,
+                                memcg_params.children_node)
+               shutdown_cache(c);
 
-       list_splice(&busy, &s->memcg_params.list);
+       list_splice(&busy, &s->memcg_params.children);
 
        /*
         * A cache being destroyed must be empty. In particular, this means
         * that all per memcg caches attached to it must be empty too.
         */
-       if (!list_empty(&s->memcg_params.list))
+       if (!list_empty(&s->memcg_params.children))
                return -EBUSY;
        return 0;
 }
 #else
-static inline int shutdown_memcg_caches(struct kmem_cache *s,
-               struct list_head *release, bool *need_rcu_barrier)
+static inline int shutdown_memcg_caches(struct kmem_cache *s)
 {
        return 0;
 }
@@ -734,8 +811,6 @@ void slab_kmem_cache_release(struct kmem_cache *s)
 
 void kmem_cache_destroy(struct kmem_cache *s)
 {
-       LIST_HEAD(release);
-       bool need_rcu_barrier = false;
        int err;
 
        if (unlikely(!s))
@@ -744,16 +819,15 @@ void kmem_cache_destroy(struct kmem_cache *s)
        get_online_cpus();
        get_online_mems();
 
-       kasan_cache_destroy(s);
        mutex_lock(&slab_mutex);
 
        s->refcount--;
        if (s->refcount)
                goto out_unlock;
 
-       err = shutdown_memcg_caches(s, &release, &need_rcu_barrier);
+       err = shutdown_memcg_caches(s);
        if (!err)
-               err = shutdown_cache(s, &release, &need_rcu_barrier);
+               err = shutdown_cache(s);
 
        if (err) {
                pr_err("kmem_cache_destroy %s: Slab cache still has objects\n",
@@ -765,8 +839,6 @@ out_unlock:
 
        put_online_mems();
        put_online_cpus();
-
-       release_caches(&release, need_rcu_barrier);
 }
 EXPORT_SYMBOL(kmem_cache_destroy);
 
@@ -828,6 +900,7 @@ struct kmem_cache *__init create_kmalloc_cache(const char *name, size_t size,
 
        create_boot_cache(s, name, size, flags);
        list_add(&s->list, &slab_caches);
+       memcg_link_cache(s);
        s->refcount = 1;
        return s;
 }
@@ -912,10 +985,7 @@ struct kmem_cache *kmalloc_slab(size_t size, gfp_t flags)
  * kmalloc_index() supports up to 2^26=64MB, so the final entry of the table is
  * kmalloc-67108864.
  */
-static struct {
-       const char *name;
-       unsigned long size;
-} const kmalloc_info[] __initconst = {
+const struct kmalloc_info_struct kmalloc_info[] __initconst = {
        {NULL,                      0},         {"kmalloc-96",             96},
        {"kmalloc-192",           192},         {"kmalloc-8",               8},
        {"kmalloc-16",             16},         {"kmalloc-32",             32},
@@ -1138,12 +1208,12 @@ static void print_slabinfo_header(struct seq_file *m)
 void *slab_start(struct seq_file *m, loff_t *pos)
 {
        mutex_lock(&slab_mutex);
-       return seq_list_start(&slab_caches, *pos);
+       return seq_list_start(&slab_root_caches, *pos);
 }
 
 void *slab_next(struct seq_file *m, void *p, loff_t *pos)
 {
-       return seq_list_next(p, &slab_caches, pos);
+       return seq_list_next(p, &slab_root_caches, pos);
 }
 
 void slab_stop(struct seq_file *m, void *p)
@@ -1195,25 +1265,44 @@ static void cache_show(struct kmem_cache *s, struct seq_file *m)
 
 static int slab_show(struct seq_file *m, void *p)
 {
-       struct kmem_cache *s = list_entry(p, struct kmem_cache, list);
+       struct kmem_cache *s = list_entry(p, struct kmem_cache, root_caches_node);
 
-       if (p == slab_caches.next)
+       if (p == slab_root_caches.next)
                print_slabinfo_header(m);
-       if (is_root_cache(s))
-               cache_show(s, m);
+       cache_show(s, m);
        return 0;
 }
 
 #if defined(CONFIG_MEMCG) && !defined(CONFIG_SLOB)
+void *memcg_slab_start(struct seq_file *m, loff_t *pos)
+{
+       struct mem_cgroup *memcg = mem_cgroup_from_css(seq_css(m));
+
+       mutex_lock(&slab_mutex);
+       return seq_list_start(&memcg->kmem_caches, *pos);
+}
+
+void *memcg_slab_next(struct seq_file *m, void *p, loff_t *pos)
+{
+       struct mem_cgroup *memcg = mem_cgroup_from_css(seq_css(m));
+
+       return seq_list_next(p, &memcg->kmem_caches, pos);
+}
+
+void memcg_slab_stop(struct seq_file *m, void *p)
+{
+       mutex_unlock(&slab_mutex);
+}
+
 int memcg_slab_show(struct seq_file *m, void *p)
 {
-       struct kmem_cache *s = list_entry(p, struct kmem_cache, list);
+       struct kmem_cache *s = list_entry(p, struct kmem_cache,
+                                         memcg_params.kmem_caches_node);
        struct mem_cgroup *memcg = mem_cgroup_from_css(seq_css(m));
 
-       if (p == slab_caches.next)
+       if (p == memcg->kmem_caches.next)
                print_slabinfo_header(m);
-       if (!is_root_cache(s) && s->memcg_params.memcg == memcg)
-               cache_show(s, m);
+       cache_show(s, m);
        return 0;
 }
 #endif
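
The new memcg_slab_start/next/stop/show helpers follow the standard seq_file list-iteration idiom: take the lock in ->start, translate positions with seq_list_start()/seq_list_next(), and drop the lock in ->stop. A self-contained sketch of that idiom, with a hypothetical demo list and mutex standing in for memcg->kmem_caches and slab_mutex (illustration only, not part of the patch):

	#include <linux/list.h>
	#include <linux/mutex.h>
	#include <linux/seq_file.h>

	struct demo_cache {
		const char *name;
		struct list_head node;		/* on demo_caches */
	};

	static LIST_HEAD(demo_caches);
	static DEFINE_MUTEX(demo_mutex);

	static void *demo_start(struct seq_file *m, loff_t *pos)
	{
		mutex_lock(&demo_mutex);
		return seq_list_start(&demo_caches, *pos);
	}

	static void *demo_next(struct seq_file *m, void *p, loff_t *pos)
	{
		return seq_list_next(p, &demo_caches, pos);
	}

	static void demo_stop(struct seq_file *m, void *p)
	{
		mutex_unlock(&demo_mutex);
	}

	static int demo_show(struct seq_file *m, void *p)
	{
		struct demo_cache *c = list_entry(p, struct demo_cache, node);

		seq_printf(m, "%s\n", c->name);
		return 0;
	}

	static const struct seq_operations demo_seq_ops = {
		.start	= demo_start,
		.next	= demo_next,
		.stop	= demo_stop,
		.show	= demo_show,
	};

Hooking demo_seq_ops up to a /proc or debugfs file is omitted here.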