memcg, slab: simplify synchronization scheme

author Vladimir Davydov <vdavydov@parallels.com>

Wed, 4 Jun 2014 23:07:40 +0000 (16:07 -0700)

committer Linus Torvalds <torvalds@linux-foundation.org>

Wed, 4 Jun 2014 23:54:01 +0000 (16:54 -0700)
author Vladimir Davydov <vdavydov@parallels.com>
Wed, 4 Jun 2014 23:07:40 +0000 (16:07 -0700)
committer Linus Torvalds <torvalds@linux-foundation.org>
Wed, 4 Jun 2014 23:54:01 +0000 (16:54 -0700)
diff --git a/include/linux/memcontrol.h b/include/linux/memcontrol.h

index d38d190f4cecbfdfb4e8ccfd2e55153d49ff831e..1fa23244fe37669fd12a76bc020c94334c32a88a 100644 (file)
--- a/include/linux/memcontrol.h
+++ b/include/linux/memcontrol.h
@@ -497,8 +497,6 @@ char *memcg_create_cache_name(struct mem_cgroup *memcg,
  int memcg_alloc_cache_params(struct mem_cgroup *memcg, struct kmem_cache *s,
                              struct kmem_cache *root_cache);
  void memcg_free_cache_params(struct kmem_cache *s);
-void memcg_register_cache(struct kmem_cache *s);
-void memcg_unregister_cache(struct kmem_cache *s);
  
  int memcg_update_cache_size(struct kmem_cache *s, int num_groups);
  void memcg_update_array_size(int num_groups);
@@ -640,14 +638,6 @@ static inline void memcg_free_cache_params(struct kmem_cache *s)
  {
  }
  
-static inline void memcg_register_cache(struct kmem_cache *s)
-{
-}
-
-static inline void memcg_unregister_cache(struct kmem_cache *s)
-{
-}
-
  static inline struct kmem_cache *
  memcg_kmem_get_cache(struct kmem_cache *cachep, gfp_t gfp)
  {
diff --git a/include/linux/slab.h b/include/linux/slab.h

index 905541dd37783e4bb1cd78eb7e6945b1d5b5d788..ecbec9ccb80d6b5bf3eeb240cfba2cd35bc767ad 100644 (file)
--- a/include/linux/slab.h
+++ b/include/linux/slab.h
@@ -116,7 +116,8 @@ struct kmem_cache *kmem_cache_create(const char *, size_t, size_t,
                         unsigned long,
                         void (*)(void *));
  #ifdef CONFIG_MEMCG_KMEM
-void kmem_cache_create_memcg(struct mem_cgroup *, struct kmem_cache *);
+struct kmem_cache *kmem_cache_create_memcg(struct mem_cgroup *,
+                                          struct kmem_cache *);
  #endif
  void kmem_cache_destroy(struct kmem_cache *);
  int kmem_cache_shrink(struct kmem_cache *);
@@ -525,8 +526,6 @@ static __always_inline void *kmalloc_node(size_t size, gfp_t flags, int node)
   * @list: list_head for the list of all caches in this memcg
   * @root_cache: pointer to the global, root cache, this cache was derived from
   * @nr_pages: number of pages that belongs to this cache.
- * @destroy: worker to be called whenever we are ready, or believe we may be
- *           ready, to destroy this cache.
   */
  struct memcg_cache_params {
         bool is_root_cache;
@@ -540,7 +539,6 @@ struct memcg_cache_params {
                         struct list_head list;
                         struct kmem_cache *root_cache;
                         atomic_t nr_pages;
-                       struct work_struct destroy;
                 };
         };
  };
diff --git a/mm/memcontrol.c b/mm/memcontrol.c

index 86a2078805e5ca0d7f3bdeb8f6d803ee285519e4..6b448881422b387f525b7b2399233eec1d73c14e 100644 (file)
--- a/mm/memcontrol.c
+++ b/mm/memcontrol.c
@@ -357,10 +357,9 @@ struct mem_cgroup {
         struct cg_proto tcp_mem;
  #endif
  #if defined(CONFIG_MEMCG_KMEM)
-       /* analogous to slab_common's slab_caches list. per-memcg */
+       /* analogous to slab_common's slab_caches list, but per-memcg;
+        * protected by memcg_slab_mutex */
         struct list_head memcg_slab_caches;
-       /* Not a spinlock, we can take a lot of time walking the list */
-       struct mutex slab_caches_mutex;
          /* Index in the kmem_cache->memcg_params->memcg_caches array */
         int kmemcg_id;
  #endif
@@ -2913,6 +2912,12 @@ static void __mem_cgroup_commit_charge(struct mem_cgroup *memcg,
  static DEFINE_MUTEX(set_limit_mutex);
  
  #ifdef CONFIG_MEMCG_KMEM
+/*
+ * The memcg_slab_mutex is held whenever a per memcg kmem cache is created or
+ * destroyed. It protects memcg_caches arrays and memcg_slab_caches lists.
+ */
+static DEFINE_MUTEX(memcg_slab_mutex);
+
  static DEFINE_MUTEX(activate_kmem_mutex);
  
  static inline bool memcg_can_account_kmem(struct mem_cgroup *memcg)
@@ -2945,10 +2950,10 @@ static int mem_cgroup_slabinfo_read(struct seq_file *m, void *v)
  
         print_slabinfo_header(m);
  
-       mutex_lock(&memcg->slab_caches_mutex);
+       mutex_lock(&memcg_slab_mutex);
         list_for_each_entry(params, &memcg->memcg_slab_caches, list)
                 cache_show(memcg_params_to_cache(params), m);
-       mutex_unlock(&memcg->slab_caches_mutex);
+       mutex_unlock(&memcg_slab_mutex);
  
         return 0;
  }
@@ -3050,8 +3055,6 @@ void memcg_update_array_size(int num)
                 memcg_limited_groups_array_size = memcg_caches_array_size(num);
  }
  
-static void kmem_cache_destroy_work_func(struct work_struct *w);
-
  int memcg_update_cache_size(struct kmem_cache *s, int num_groups)
  {
         struct memcg_cache_params *cur_params = s->memcg_params;
@@ -3148,8 +3151,6 @@ int memcg_alloc_cache_params(struct mem_cgroup *memcg, struct kmem_cache *s,
         if (memcg) {
                 s->memcg_params->memcg = memcg;
                 s->memcg_params->root_cache = root_cache;
-               INIT_WORK(&s->memcg_params->destroy,
-                               kmem_cache_destroy_work_func);
                 css_get(&memcg->css);
         } else
                 s->memcg_params->is_root_cache = true;
@@ -3166,24 +3167,34 @@ void memcg_free_cache_params(struct kmem_cache *s)
         kfree(s->memcg_params);
  }
  
-void memcg_register_cache(struct kmem_cache *s)
+static void memcg_kmem_create_cache(struct mem_cgroup *memcg,
+                                   struct kmem_cache *root_cache)
  {
-       struct kmem_cache *root;
-       struct mem_cgroup *memcg;
+       struct kmem_cache *cachep;
         int id;
  
-       if (is_root_cache(s))
+       lockdep_assert_held(&memcg_slab_mutex);
+
+       id = memcg_cache_id(memcg);
+
+       /*
+        * Since per-memcg caches are created asynchronously on first
+        * allocation (see memcg_kmem_get_cache()), several threads can try to
+        * create the same cache, but only one of them may succeed.
+        */
+       if (cache_from_memcg_idx(root_cache, id))
                 return;
  
+       cachep = kmem_cache_create_memcg(memcg, root_cache);
         /*
-        * Holding the slab_mutex assures nobody will touch the memcg_caches
-        * array while we are modifying it.
+        * If we could not create a memcg cache, do not complain, because
+        * that's not critical at all as we can always proceed with the root
+        * cache.
          */
-       lockdep_assert_held(&slab_mutex);
+       if (!cachep)
+               return;
  
-       root = s->memcg_params->root_cache;
-       memcg = s->memcg_params->memcg;
-       id = memcg_cache_id(memcg);
+       list_add(&cachep->memcg_params->list, &memcg->memcg_slab_caches);
  
         /*
          * Since readers won't lock (see cache_from_memcg_idx()), we need a
@@ -3192,49 +3203,30 @@ void memcg_register_cache(struct kmem_cache *s)
          */
         smp_wmb();
  
-       /*
-        * Initialize the pointer to this cache in its parent's memcg_params
-        * before adding it to the memcg_slab_caches list, otherwise we can
-        * fail to convert memcg_params_to_cache() while traversing the list.
-        */
-       VM_BUG_ON(root->memcg_params->memcg_caches[id]);
-       root->memcg_params->memcg_caches[id] = s;
-
-       mutex_lock(&memcg->slab_caches_mutex);
-       list_add(&s->memcg_params->list, &memcg->memcg_slab_caches);
-       mutex_unlock(&memcg->slab_caches_mutex);
+       BUG_ON(root_cache->memcg_params->memcg_caches[id]);
+       root_cache->memcg_params->memcg_caches[id] = cachep;
  }
  
-void memcg_unregister_cache(struct kmem_cache *s)
+static void memcg_kmem_destroy_cache(struct kmem_cache *cachep)
  {
-       struct kmem_cache *root;
+       struct kmem_cache *root_cache;
         struct mem_cgroup *memcg;
         int id;
  
-       if (is_root_cache(s))
-               return;
+       lockdep_assert_held(&memcg_slab_mutex);
  
-       /*
-        * Holding the slab_mutex assures nobody will touch the memcg_caches
-        * array while we are modifying it.
-        */
-       lockdep_assert_held(&slab_mutex);
+       BUG_ON(is_root_cache(cachep));
  
-       root = s->memcg_params->root_cache;
-       memcg = s->memcg_params->memcg;
+       root_cache = cachep->memcg_params->root_cache;
+       memcg = cachep->memcg_params->memcg;
         id = memcg_cache_id(memcg);
  
-       mutex_lock(&memcg->slab_caches_mutex);
-       list_del(&s->memcg_params->list);
-       mutex_unlock(&memcg->slab_caches_mutex);
+       BUG_ON(root_cache->memcg_params->memcg_caches[id] != cachep);
+       root_cache->memcg_params->memcg_caches[id] = NULL;
  
-       /*
-        * Clear the pointer to this cache in its parent's memcg_params only
-        * after removing it from the memcg_slab_caches list, otherwise we can
-        * fail to convert memcg_params_to_cache() while traversing the list.
-        */
-       VM_BUG_ON(root->memcg_params->memcg_caches[id] != s);
-       root->memcg_params->memcg_caches[id] = NULL;
+       list_del(&cachep->memcg_params->list);
+
+       kmem_cache_destroy(cachep);
  }
  
  /*
@@ -3268,70 +3260,42 @@ static inline void memcg_resume_kmem_account(void)
         current->memcg_kmem_skip_account--;
  }
  
-static void kmem_cache_destroy_work_func(struct work_struct *w)
-{
-       struct kmem_cache *cachep;
-       struct memcg_cache_params *p;
-
-       p = container_of(w, struct memcg_cache_params, destroy);
-
-       cachep = memcg_params_to_cache(p);
-
-       kmem_cache_shrink(cachep);
-       if (atomic_read(&cachep->memcg_params->nr_pages) == 0)
-               kmem_cache_destroy(cachep);
-}
-
  int __kmem_cache_destroy_memcg_children(struct kmem_cache *s)
  {
         struct kmem_cache *c;
         int i, failed = 0;
  
-       /*
-        * If the cache is being destroyed, we trust that there is no one else
-        * requesting objects from it. Even if there are, the sanity checks in
-        * kmem_cache_destroy should caught this ill-case.
-        *
-        * Still, we don't want anyone else freeing memcg_caches under our
-        * noses, which can happen if a new memcg comes to life. As usual,
-        * we'll take the activate_kmem_mutex to protect ourselves against
-        * this.
-        */
-       mutex_lock(&activate_kmem_mutex);
+       mutex_lock(&memcg_slab_mutex);
         for_each_memcg_cache_index(i) {
                 c = cache_from_memcg_idx(s, i);
                 if (!c)
                         continue;
  
-               /*
-                * We will now manually delete the caches, so to avoid races
-                * we need to cancel all pending destruction workers and
-                * proceed with destruction ourselves.
-                */
-               cancel_work_sync(&c->memcg_params->destroy);
-               kmem_cache_destroy(c);
+               memcg_kmem_destroy_cache(c);
  
                 if (cache_from_memcg_idx(s, i))
                         failed++;
         }
-       mutex_unlock(&activate_kmem_mutex);
+       mutex_unlock(&memcg_slab_mutex);
         return failed;
  }
  
  static void mem_cgroup_destroy_all_caches(struct mem_cgroup *memcg)
  {
         struct kmem_cache *cachep;
-       struct memcg_cache_params *params;
+       struct memcg_cache_params *params, *tmp;
  
         if (!memcg_kmem_is_active(memcg))
                 return;
  
-       mutex_lock(&memcg->slab_caches_mutex);
-       list_for_each_entry(params, &memcg->memcg_slab_caches, list) {
+       mutex_lock(&memcg_slab_mutex);
+       list_for_each_entry_safe(params, tmp, &memcg->memcg_slab_caches, list) {
                 cachep = memcg_params_to_cache(params);
-               schedule_work(&cachep->memcg_params->destroy);
+               kmem_cache_shrink(cachep);
+               if (atomic_read(&cachep->memcg_params->nr_pages) == 0)
+                       memcg_kmem_destroy_cache(cachep);
         }
-       mutex_unlock(&memcg->slab_caches_mutex);
+       mutex_unlock(&memcg_slab_mutex);
  }
  
  struct create_work {
@@ -3346,7 +3310,10 @@ static void memcg_create_cache_work_func(struct work_struct *w)
         struct mem_cgroup *memcg = cw->memcg;
         struct kmem_cache *cachep = cw->cachep;
  
-       kmem_cache_create_memcg(memcg, cachep);
+       mutex_lock(&memcg_slab_mutex);
+       memcg_kmem_create_cache(memcg, cachep);
+       mutex_unlock(&memcg_slab_mutex);
+
         css_put(&memcg->css);
         kfree(cw);
  }
@@ -5022,13 +4989,14 @@ static int __memcg_activate_kmem(struct mem_cgroup *memcg,
          * Make sure we have enough space for this cgroup in each root cache's
          * memcg_params.
          */
+       mutex_lock(&memcg_slab_mutex);
         err = memcg_update_all_caches(memcg_id + 1);
+       mutex_unlock(&memcg_slab_mutex);
         if (err)
                 goto out_rmid;
  
         memcg->kmemcg_id = memcg_id;
         INIT_LIST_HEAD(&memcg->memcg_slab_caches);
-       mutex_init(&memcg->slab_caches_mutex);
  
         /*
          * We couldn't have accounted to this cgroup, because it hasn't got the
diff --git a/mm/slab_common.c b/mm/slab_common.c

index 2dd920dc3776aff43399f8992916b68790aa168c..7e348cff814d898fee50d41ab7f14935be0d0e35 100644 (file)
--- a/mm/slab_common.c
+++ b/mm/slab_common.c
@@ -160,7 +160,6 @@ do_kmem_cache_create(char *name, size_t object_size, size_t size, size_t align,
  
         s->refcount = 1;
         list_add(&s->list, &slab_caches);
-       memcg_register_cache(s);
  out:
         if (err)
                 return ERR_PTR(err);
@@ -270,9 +269,10 @@ EXPORT_SYMBOL(kmem_cache_create);
   * requests going from @memcg to @root_cache. The new cache inherits properties
   * from its parent.
   */
-void kmem_cache_create_memcg(struct mem_cgroup *memcg, struct kmem_cache *root_cache)
+struct kmem_cache *kmem_cache_create_memcg(struct mem_cgroup *memcg,
+                                          struct kmem_cache *root_cache)
  {
-       struct kmem_cache *s;
+       struct kmem_cache *s = NULL;
         char *cache_name;
  
         get_online_cpus();
@@ -280,14 +280,6 @@ void kmem_cache_create_memcg(struct mem_cgroup *memcg, struct kmem_cache *root_c
  
         mutex_lock(&slab_mutex);
  
-       /*
-        * Since per-memcg caches are created asynchronously on first
-        * allocation (see memcg_kmem_get_cache()), several threads can try to
-        * create the same cache, but only one of them may succeed.
-        */
-       if (cache_from_memcg_idx(root_cache, memcg_cache_id(memcg)))
-               goto out_unlock;
-
         cache_name = memcg_create_cache_name(memcg, root_cache);
         if (!cache_name)
                 goto out_unlock;
@@ -296,14 +288,18 @@ void kmem_cache_create_memcg(struct mem_cgroup *memcg, struct kmem_cache *root_c
                                  root_cache->size, root_cache->align,
                                  root_cache->flags, root_cache->ctor,
                                  memcg, root_cache);
-       if (IS_ERR(s))
+       if (IS_ERR(s)) {
                 kfree(cache_name);
+               s = NULL;
+       }
  
  out_unlock:
         mutex_unlock(&slab_mutex);
  
         put_online_mems();
         put_online_cpus();
+
+       return s;
  }
  
  static int kmem_cache_destroy_memcg_children(struct kmem_cache *s)
@@ -348,11 +344,8 @@ void kmem_cache_destroy(struct kmem_cache *s)
                 goto out_unlock;
  
         list_del(&s->list);
-       memcg_unregister_cache(s);
-
         if (__kmem_cache_shutdown(s) != 0) {
                 list_add(&s->list, &slab_caches);
-               memcg_register_cache(s);
                 printk(KERN_ERR "kmem_cache_destroy %s: "
                        "Slab cache still has objects\n", s->name);
                 dump_stack();
author	Vladimir Davydov <vdavydov@parallels.com>
	Wed, 4 Jun 2014 23:07:40 +0000 (16:07 -0700)
committer	Linus Torvalds <torvalds@linux-foundation.org>
	Wed, 4 Jun 2014 23:54:01 +0000 (16:54 -0700)
include/linux/memcontrol.h		patch \| blob \| blame \| history
include/linux/slab.h		patch \| blob \| blame \| history
mm/memcontrol.c		patch \| blob \| blame \| history
mm/slab_common.c		patch \| blob \| blame \| history