Merge branch 'for-upstream' of git://git.kernel.org/pub/scm/linux/kernel/git/bluetoot...

[deliverable/linux.git] / mm / memcontrol.c
diff --git a/mm/memcontrol.c b/mm/memcontrol.c

index 78cb3b05a9fac6be7488acb8b4b3376109a8b613..ef91e856c7e456a0674e7b76e15cbd771a6c9acb 100644 (file)
--- a/mm/memcontrol.c
+++ b/mm/memcontrol.c
@@ -51,7 +51,7 @@
  #include <linux/seq_file.h>
  #include <linux/vmpressure.h>
  #include <linux/mm_inline.h>
-#include <linux/page_cgroup.h>
+#include <linux/swap_cgroup.h>
  #include <linux/cpu.h>
  #include <linux/oom.h>
  #include <linux/lockdep.h>
@@ -296,7 +296,6 @@ struct mem_cgroup {
          * Should the accounting and control be hierarchical, per subtree?
          */
         bool use_hierarchy;
-       unsigned long kmem_account_flags; /* See KMEM_ACCOUNTED_*, below */
  
         bool            oom_lock;
         atomic_t        under_oom;
@@ -366,22 +365,11 @@ struct mem_cgroup {
         /* WARNING: nodeinfo must be the last member here */
  };
  
-/* internal only representation about the status of kmem accounting. */
-enum {
-       KMEM_ACCOUNTED_ACTIVE, /* accounted by this cgroup itself */
-};
-
  #ifdef CONFIG_MEMCG_KMEM
-static inline void memcg_kmem_set_active(struct mem_cgroup *memcg)
-{
-       set_bit(KMEM_ACCOUNTED_ACTIVE, &memcg->kmem_account_flags);
-}
-
  static bool memcg_kmem_is_active(struct mem_cgroup *memcg)
  {
-       return test_bit(KMEM_ACCOUNTED_ACTIVE, &memcg->kmem_account_flags);
+       return memcg->kmemcg_id >= 0;
  }
-
  #endif
  
  /* Stuffs for move charges at task migration. */
@@ -1274,7 +1262,6 @@ struct lruvec *mem_cgroup_page_lruvec(struct page *page, struct zone *zone)
  {
         struct mem_cgroup_per_zone *mz;
         struct mem_cgroup *memcg;
-       struct page_cgroup *pc;
         struct lruvec *lruvec;
  
         if (mem_cgroup_disabled()) {
@@ -1282,8 +1269,7 @@ struct lruvec *mem_cgroup_page_lruvec(struct page *page, struct zone *zone)
                 goto out;
         }
  
-       pc = lookup_page_cgroup(page);
-       memcg = pc->mem_cgroup;
+       memcg = page->mem_cgroup;
         /*
          * Swapcache readahead pages are added to the LRU - and
          * possibly migrated - before they are charged.
@@ -1573,7 +1559,7 @@ static void mem_cgroup_out_of_memory(struct mem_cgroup *memcg, gfp_t gfp_mask,
          * select it.  The goal is to allow it to allocate so that it may
          * quickly exit and free its memory.
          */
-       if (fatal_signal_pending(current) || current->flags & PF_EXITING) {
+       if (fatal_signal_pending(current) || task_will_free_mem(current)) {
                 set_thread_flag(TIF_MEMDIE);
                 return;
         }
@@ -1630,6 +1616,8 @@ static void mem_cgroup_out_of_memory(struct mem_cgroup *memcg, gfp_t gfp_mask,
                          NULL, "Memory cgroup out of memory");
  }
  
+#if MAX_NUMNODES > 1
+
  /**
   * test_mem_cgroup_node_reclaimable
   * @memcg: the target memcg
@@ -1652,7 +1640,6 @@ static bool test_mem_cgroup_node_reclaimable(struct mem_cgroup *memcg,
         return false;
  
  }
-#if MAX_NUMNODES > 1
  
  /*
   * Always updating the nodemask is not very good - even if we have an empty
@@ -2020,16 +2007,13 @@ struct mem_cgroup *mem_cgroup_begin_page_stat(struct page *page,
                                               unsigned long *flags)
  {
         struct mem_cgroup *memcg;
-       struct page_cgroup *pc;
  
         rcu_read_lock();
  
         if (mem_cgroup_disabled())
                 return NULL;
-
-       pc = lookup_page_cgroup(page);
  again:
-       memcg = pc->mem_cgroup;
+       memcg = page->mem_cgroup;
         if (unlikely(!memcg))
                 return NULL;
  
@@ -2038,7 +2022,7 @@ again:
                 return memcg;
  
         spin_lock_irqsave(&memcg->move_lock, *flags);
-       if (memcg != pc->mem_cgroup) {
+       if (memcg != page->mem_cgroup) {
                 spin_unlock_irqrestore(&memcg->move_lock, *flags);
                 goto again;
         }
@@ -2405,15 +2389,12 @@ static struct mem_cgroup *mem_cgroup_lookup(unsigned short id)
  struct mem_cgroup *try_get_mem_cgroup_from_page(struct page *page)
  {
         struct mem_cgroup *memcg;
-       struct page_cgroup *pc;
         unsigned short id;
         swp_entry_t ent;
  
         VM_BUG_ON_PAGE(!PageLocked(page), page);
  
-       pc = lookup_page_cgroup(page);
-       memcg = pc->mem_cgroup;
-
+       memcg = page->mem_cgroup;
         if (memcg) {
                 if (!css_tryget_online(&memcg->css))
                         memcg = NULL;
@@ -2463,10 +2444,9 @@ static void unlock_page_lru(struct page *page, int isolated)
  static void commit_charge(struct page *page, struct mem_cgroup *memcg,
                           bool lrucare)
  {
-       struct page_cgroup *pc = lookup_page_cgroup(page);
         int isolated;
  
-       VM_BUG_ON_PAGE(pc->mem_cgroup, page);
+       VM_BUG_ON_PAGE(page->mem_cgroup, page);
  
         /*
          * In some cases, SwapCache and FUSE(splice_buf->radixtree), the page
@@ -2477,7 +2457,7 @@ static void commit_charge(struct page *page, struct mem_cgroup *memcg,
  
         /*
          * Nobody should be changing or seriously looking at
-        * pc->mem_cgroup at this point:
+        * page->mem_cgroup at this point:
          *
          * - the page is uncharged
          *
@@ -2489,7 +2469,7 @@ static void commit_charge(struct page *page, struct mem_cgroup *memcg,
          * - a page cache insertion, a swapin fault, or a migration
          *   have the page locked
          */
-       pc->mem_cgroup = memcg;
+       page->mem_cgroup = memcg;
  
         if (lrucare)
                 unlock_page_lru(page, isolated);
@@ -2655,7 +2635,6 @@ static void memcg_register_cache(struct mem_cgroup *memcg,
         if (!cachep)
                 return;
  
-       css_get(&memcg->css);
         list_add(&cachep->memcg_params->list, &memcg->memcg_slab_caches);
  
         /*
@@ -2689,40 +2668,6 @@ static void memcg_unregister_cache(struct kmem_cache *cachep)
         list_del(&cachep->memcg_params->list);
  
         kmem_cache_destroy(cachep);
-
-       /* drop the reference taken in memcg_register_cache */
-       css_put(&memcg->css);
-}
-
-/*
- * During the creation a new cache, we need to disable our accounting mechanism
- * altogether. This is true even if we are not creating, but rather just
- * enqueing new caches to be created.
- *
- * This is because that process will trigger allocations; some visible, like
- * explicit kmallocs to auxiliary data structures, name strings and internal
- * cache structures; some well concealed, like INIT_WORK() that can allocate
- * objects during debug.
- *
- * If any allocation happens during memcg_kmem_get_cache, we will recurse back
- * to it. This may not be a bounded recursion: since the first cache creation
- * failed to complete (waiting on the allocation), we'll just try to create the
- * cache again, failing at the same point.
- *
- * memcg_kmem_get_cache is prepared to abort after seeing a positive count of
- * memcg_kmem_skip_account. So we enclose anything that might allocate memory
- * inside the following two functions.
- */
-static inline void memcg_stop_kmem_account(void)
-{
-       VM_BUG_ON(!current->mm);
-       current->memcg_kmem_skip_account++;
-}
-
-static inline void memcg_resume_kmem_account(void)
-{
-       VM_BUG_ON(!current->mm);
-       current->memcg_kmem_skip_account--;
  }
  
  int __memcg_cleanup_cache_params(struct kmem_cache *s)
@@ -2756,9 +2701,7 @@ static void memcg_unregister_all_caches(struct mem_cgroup *memcg)
         mutex_lock(&memcg_slab_mutex);
         list_for_each_entry_safe(params, tmp, &memcg->memcg_slab_caches, list) {
                 cachep = memcg_params_to_cache(params);
-               kmem_cache_shrink(cachep);
-               if (atomic_read(&cachep->memcg_params->nr_pages) == 0)
-                       memcg_unregister_cache(cachep);
+               memcg_unregister_cache(cachep);
         }
         mutex_unlock(&memcg_slab_mutex);
  }
@@ -2793,10 +2736,10 @@ static void __memcg_schedule_register_cache(struct mem_cgroup *memcg,
         struct memcg_register_cache_work *cw;
  
         cw = kmalloc(sizeof(*cw), GFP_NOWAIT);
-       if (cw == NULL) {
-               css_put(&memcg->css);
+       if (!cw)
                 return;
-       }
+
+       css_get(&memcg->css);
  
         cw->memcg = memcg;
         cw->cachep = cachep;
@@ -2819,20 +2762,16 @@ static void memcg_schedule_register_cache(struct mem_cgroup *memcg,
          * this point we can't allow ourselves back into memcg_kmem_get_cache,
          * the safest choice is to do it like this, wrapping the whole function.
          */
-       memcg_stop_kmem_account();
+       current->memcg_kmem_skip_account = 1;
         __memcg_schedule_register_cache(memcg, cachep);
-       memcg_resume_kmem_account();
+       current->memcg_kmem_skip_account = 0;
  }
  
  int __memcg_charge_slab(struct kmem_cache *cachep, gfp_t gfp, int order)
  {
         unsigned int nr_pages = 1 << order;
-       int res;
  
-       res = memcg_charge_kmem(cachep->memcg_params->memcg, gfp, nr_pages);
-       if (!res)
-               atomic_add(nr_pages, &cachep->memcg_params->nr_pages);
-       return res;
+       return memcg_charge_kmem(cachep->memcg_params->memcg, gfp, nr_pages);
  }
  
  void __memcg_uncharge_slab(struct kmem_cache *cachep, int order)
@@ -2840,7 +2779,6 @@ void __memcg_uncharge_slab(struct kmem_cache *cachep, int order)
         unsigned int nr_pages = 1 << order;
  
         memcg_uncharge_kmem(cachep->memcg_params->memcg, nr_pages);
-       atomic_sub(nr_pages, &cachep->memcg_params->nr_pages);
  }
  
  /*
@@ -2856,8 +2794,7 @@ void __memcg_uncharge_slab(struct kmem_cache *cachep, int order)
   * Can't be called in interrupt context or from kernel threads.
   * This function needs to be called with rcu_read_lock() held.
   */
-struct kmem_cache *__memcg_kmem_get_cache(struct kmem_cache *cachep,
-                                         gfp_t gfp)
+struct kmem_cache *__memcg_kmem_get_cache(struct kmem_cache *cachep)
  {
         struct mem_cgroup *memcg;
         struct kmem_cache *memcg_cachep;
@@ -2865,25 +2802,16 @@ struct kmem_cache *__memcg_kmem_get_cache(struct kmem_cache *cachep,
         VM_BUG_ON(!cachep->memcg_params);
         VM_BUG_ON(!cachep->memcg_params->is_root_cache);
  
-       if (!current->mm || current->memcg_kmem_skip_account)
+       if (current->memcg_kmem_skip_account)
                 return cachep;
  
-       rcu_read_lock();
-       memcg = mem_cgroup_from_task(rcu_dereference(current->mm->owner));
-
+       memcg = get_mem_cgroup_from_mm(current->mm);
         if (!memcg_kmem_is_active(memcg))
                 goto out;
  
         memcg_cachep = cache_from_memcg_idx(cachep, memcg_cache_id(memcg));
-       if (likely(memcg_cachep)) {
-               cachep = memcg_cachep;
-               goto out;
-       }
-
-       /* The corresponding put will be done in the workqueue. */
-       if (!css_tryget_online(&memcg->css))
-               goto out;
-       rcu_read_unlock();
+       if (likely(memcg_cachep))
+               return memcg_cachep;
  
         /*
          * If we are in a safe context (can wait, and not in interrupt
@@ -2898,12 +2826,17 @@ struct kmem_cache *__memcg_kmem_get_cache(struct kmem_cache *cachep,
          * defer everything.
          */
         memcg_schedule_register_cache(memcg, cachep);
-       return cachep;
  out:
-       rcu_read_unlock();
+       css_put(&memcg->css);
         return cachep;
  }
  
+void __memcg_kmem_put_cache(struct kmem_cache *cachep)
+{
+       if (!is_root_cache(cachep))
+               css_put(&cachep->memcg_params->memcg->css);
+}
+
  /*
   * We need to verify if the allocation against current->mm->owner's memcg is
   * possible for the given order. But the page is not allocated yet, so we'll
@@ -2926,34 +2859,6 @@ __memcg_kmem_newpage_charge(gfp_t gfp, struct mem_cgroup **_memcg, int order)
  
         *_memcg = NULL;
  
-       /*
-        * Disabling accounting is only relevant for some specific memcg
-        * internal allocations. Therefore we would initially not have such
-        * check here, since direct calls to the page allocator that are
-        * accounted to kmemcg (alloc_kmem_pages and friends) only happen
-        * outside memcg core. We are mostly concerned with cache allocations,
-        * and by having this test at memcg_kmem_get_cache, we are already able
-        * to relay the allocation to the root cache and bypass the memcg cache
-        * altogether.
-        *
-        * There is one exception, though: the SLUB allocator does not create
-        * large order caches, but rather service large kmallocs directly from
-        * the page allocator. Therefore, the following sequence when backed by
-        * the SLUB allocator:
-        *
-        *      memcg_stop_kmem_account();
-        *      kmalloc(<large_number>)
-        *      memcg_resume_kmem_account();
-        *
-        * would effectively ignore the fact that we should skip accounting,
-        * since it will drive us directly to this function without passing
-        * through the cache selector memcg_kmem_get_cache. Such large
-        * allocations are extremely rare but can happen, for instance, for the
-        * cache arrays. We bring this test here.
-        */
-       if (!current->mm || current->memcg_kmem_skip_account)
-               return true;
-
         memcg = get_mem_cgroup_from_mm(current->mm);
  
         if (!memcg_kmem_is_active(memcg)) {
@@ -2972,8 +2877,6 @@ __memcg_kmem_newpage_charge(gfp_t gfp, struct mem_cgroup **_memcg, int order)
  void __memcg_kmem_commit_charge(struct page *page, struct mem_cgroup *memcg,
                               int order)
  {
-       struct page_cgroup *pc;
-
         VM_BUG_ON(mem_cgroup_is_root(memcg));
  
         /* The page allocation failed. Revert */
@@ -2981,14 +2884,12 @@ void __memcg_kmem_commit_charge(struct page *page, struct mem_cgroup *memcg,
                 memcg_uncharge_kmem(memcg, 1 << order);
                 return;
         }
-       pc = lookup_page_cgroup(page);
-       pc->mem_cgroup = memcg;
+       page->mem_cgroup = memcg;
  }
  
  void __memcg_kmem_uncharge_pages(struct page *page, int order)
  {
-       struct page_cgroup *pc = lookup_page_cgroup(page);
-       struct mem_cgroup *memcg = pc->mem_cgroup;
+       struct mem_cgroup *memcg = page->mem_cgroup;
  
         if (!memcg)
                 return;
@@ -2996,11 +2897,7 @@ void __memcg_kmem_uncharge_pages(struct page *page, int order)
         VM_BUG_ON_PAGE(mem_cgroup_is_root(memcg), page);
  
         memcg_uncharge_kmem(memcg, 1 << order);
-       pc->mem_cgroup = NULL;
-}
-#else
-static inline void memcg_unregister_all_caches(struct mem_cgroup *memcg)
-{
+       page->mem_cgroup = NULL;
  }
  #endif /* CONFIG_MEMCG_KMEM */
  
@@ -3014,16 +2911,15 @@ static inline void memcg_unregister_all_caches(struct mem_cgroup *memcg)
   */
  void mem_cgroup_split_huge_fixup(struct page *head)
  {
-       struct page_cgroup *pc = lookup_page_cgroup(head);
         int i;
  
         if (mem_cgroup_disabled())
                 return;
  
         for (i = 1; i < HPAGE_PMD_NR; i++)
-               pc[i].mem_cgroup = pc[0].mem_cgroup;
+               head[i].mem_cgroup = head->mem_cgroup;
  
-       __this_cpu_sub(pc[0].mem_cgroup->stat->count[MEM_CGROUP_STAT_RSS_HUGE],
+       __this_cpu_sub(head->mem_cgroup->stat->count[MEM_CGROUP_STAT_RSS_HUGE],
                        HPAGE_PMD_NR);
  }
  #endif /* CONFIG_TRANSPARENT_HUGEPAGE */
@@ -3032,7 +2928,6 @@ void mem_cgroup_split_huge_fixup(struct page *head)
   * mem_cgroup_move_account - move account of the page
   * @page: the page
   * @nr_pages: number of regular pages (>1 for huge pages)
- * @pc:        page_cgroup of the page.
   * @from: mem_cgroup which the page is moved from.
   * @to:        mem_cgroup which the page is moved to. @from != @to.
   *
@@ -3045,7 +2940,6 @@ void mem_cgroup_split_huge_fixup(struct page *head)
   */
  static int mem_cgroup_move_account(struct page *page,
                                    unsigned int nr_pages,
-                                  struct page_cgroup *pc,
                                    struct mem_cgroup *from,
                                    struct mem_cgroup *to)
  {
@@ -3065,7 +2959,7 @@ static int mem_cgroup_move_account(struct page *page,
                 goto out;
  
         /*
-        * Prevent mem_cgroup_migrate() from looking at pc->mem_cgroup
+        * Prevent mem_cgroup_migrate() from looking at page->mem_cgroup
          * of its source page while we change it: page migration takes
          * both pages off the LRU, but page cache replacement doesn't.
          */
@@ -3073,7 +2967,7 @@ static int mem_cgroup_move_account(struct page *page,
                 goto out;
  
         ret = -EINVAL;
-       if (pc->mem_cgroup != from)
+       if (page->mem_cgroup != from)
                 goto out_unlock;
  
         spin_lock_irqsave(&from->move_lock, flags);
@@ -3093,13 +2987,13 @@ static int mem_cgroup_move_account(struct page *page,
         }
  
         /*
-        * It is safe to change pc->mem_cgroup here because the page
+        * It is safe to change page->mem_cgroup here because the page
          * is referenced, charged, and isolated - we can't race with
          * uncharging, charging, migration, or LRU putback.
          */
  
         /* caller should have done css_get */
-       pc->mem_cgroup = to;
+       page->mem_cgroup = to;
         spin_unlock_irqrestore(&from->move_lock, flags);
  
         ret = 0;
@@ -3173,40 +3067,6 @@ static inline int mem_cgroup_move_swap_account(swp_entry_t entry,
  }
  #endif
  
-#ifdef CONFIG_DEBUG_VM
-static struct page_cgroup *lookup_page_cgroup_used(struct page *page)
-{
-       struct page_cgroup *pc;
-
-       pc = lookup_page_cgroup(page);
-       /*
-        * Can be NULL while feeding pages into the page allocator for
-        * the first time, i.e. during boot or memory hotplug;
-        * or when mem_cgroup_disabled().
-        */
-       if (likely(pc) && pc->mem_cgroup)
-               return pc;
-       return NULL;
-}
-
-bool mem_cgroup_bad_page_check(struct page *page)
-{
-       if (mem_cgroup_disabled())
-               return false;
-
-       return lookup_page_cgroup_used(page) != NULL;
-}
-
-void mem_cgroup_print_bad_page(struct page *page)
-{
-       struct page_cgroup *pc;
-
-       pc = lookup_page_cgroup_used(page);
-       if (pc)
-               pr_alert("pc:%p pc->mem_cgroup:%p\n", pc, pc->mem_cgroup);
-}
-#endif
-
  static DEFINE_MUTEX(memcg_limit_mutex);
  
  static int mem_cgroup_resize_limit(struct mem_cgroup *memcg,
@@ -3588,12 +3448,6 @@ static int memcg_activate_kmem(struct mem_cgroup *memcg,
         if (memcg_kmem_is_active(memcg))
                 return 0;
  
-       /*
-        * We are going to allocate memory for data shared by all memory
-        * cgroups so let's stop accounting here.
-        */
-       memcg_stop_kmem_account();
-
         /*
          * For simplicity, we won't allow this to be disabled.  It also can't
          * be changed if the cgroup has children already, or if tasks had
@@ -3620,25 +3474,22 @@ static int memcg_activate_kmem(struct mem_cgroup *memcg,
                 goto out;
         }
  
-       memcg->kmemcg_id = memcg_id;
-       INIT_LIST_HEAD(&memcg->memcg_slab_caches);
-
         /*
-        * We couldn't have accounted to this cgroup, because it hasn't got the
-        * active bit set yet, so this should succeed.
+        * We couldn't have accounted to this cgroup, because it hasn't got
+        * activated yet, so this should succeed.
          */
         err = page_counter_limit(&memcg->kmem, nr_pages);
         VM_BUG_ON(err);
  
         static_key_slow_inc(&memcg_kmem_enabled_key);
         /*
-        * Setting the active bit after enabling static branching will
+        * A memory cgroup is considered kmem-active as soon as it gets
+        * kmemcg_id. Setting the id after enabling static branching will
          * guarantee no one starts accounting before all call sites are
          * patched.
          */
-       memcg_kmem_set_active(memcg);
+       memcg->kmemcg_id = memcg_id;
  out:
-       memcg_resume_kmem_account();
         return err;
  }
  
@@ -3841,11 +3692,6 @@ static int memcg_numa_stat_show(struct seq_file *m, void *v)
  }
  #endif /* CONFIG_NUMA */
  
-static inline void mem_cgroup_lru_names_not_uptodate(void)
-{
-       BUILD_BUG_ON(ARRAY_SIZE(mem_cgroup_lru_names) != NR_LRU_LISTS);
-}
-
  static int memcg_stat_show(struct seq_file *m, void *v)
  {
         struct mem_cgroup *memcg = mem_cgroup_from_css(seq_css(m));
@@ -3853,6 +3699,8 @@ static int memcg_stat_show(struct seq_file *m, void *v)
         struct mem_cgroup *mi;
         unsigned int i;
  
+       BUILD_BUG_ON(ARRAY_SIZE(mem_cgroup_lru_names) != NR_LRU_LISTS);
+
         for (i = 0; i < MEM_CGROUP_STAT_NSTATS; i++) {
                 if (i == MEM_CGROUP_STAT_SWAP && !do_swap_account)
                         continue;
@@ -4309,7 +4157,6 @@ static int memcg_init_kmem(struct mem_cgroup *memcg, struct cgroup_subsys *ss)
  {
         int ret;
  
-       memcg->kmemcg_id = -1;
         ret = memcg_propagate_kmem(memcg);
         if (ret)
                 return ret;
@@ -4319,6 +4166,7 @@ static int memcg_init_kmem(struct mem_cgroup *memcg, struct cgroup_subsys *ss)
  
  static void memcg_destroy_kmem(struct mem_cgroup *memcg)
  {
+       memcg_unregister_all_caches(memcg);
         mem_cgroup_sockets_destroy(memcg);
  }
  #else
@@ -4492,7 +4340,7 @@ static ssize_t memcg_write_event_control(struct kernfs_open_file *of,
          *
          * DO NOT ADD NEW FILES.
          */
-       name = cfile.file->f_dentry->d_name.name;
+       name = cfile.file->f_path.dentry->d_name.name;
  
         if (!strcmp(name, "memory.usage_in_bytes")) {
                 event->register_event = mem_cgroup_usage_register_event;
@@ -4516,7 +4364,7 @@ static ssize_t memcg_write_event_control(struct kernfs_open_file *of,
          * automatically removed on cgroup destruction but the removal is
          * asynchronous, so take an extra ref on @css.
          */
-       cfile_css = css_tryget_online_from_dir(cfile.file->f_dentry->d_parent,
+       cfile_css = css_tryget_online_from_dir(cfile.file->f_path.dentry->d_parent,
                                                &memory_cgrp_subsys);
         ret = -EINVAL;
         if (IS_ERR(cfile_css))
@@ -4774,17 +4622,6 @@ static void __mem_cgroup_free(struct mem_cgroup *memcg)
  
         free_percpu(memcg->stat);
  
-       /*
-        * We need to make sure that (at least for now), the jump label
-        * destruction code runs outside of the cgroup lock. This is because
-        * get_online_cpus(), which is called from the static_branch update,
-        * can't be called inside the cgroup_lock. cpusets are the ones
-        * enforcing this dependency, so if they ever change, we might as well.
-        *
-        * schedule_work() will guarantee this happens. Be careful if you need
-        * to move this code around, and make sure it is outside
-        * the cgroup_lock.
-        */
         disarm_static_keys(memcg);
         kfree(memcg);
  }
@@ -4854,6 +4691,10 @@ mem_cgroup_css_alloc(struct cgroup_subsys_state *parent_css)
         vmpressure_init(&memcg->vmpressure);
         INIT_LIST_HEAD(&memcg->event_list);
         spin_lock_init(&memcg->event_list_lock);
+#ifdef CONFIG_MEMCG_KMEM
+       memcg->kmemcg_id = -1;
+       INIT_LIST_HEAD(&memcg->memcg_slab_caches);
+#endif
  
         return &memcg->css;
  
@@ -4935,7 +4776,6 @@ static void mem_cgroup_css_offline(struct cgroup_subsys_state *css)
         }
         spin_unlock(&memcg->event_list_lock);
  
-       memcg_unregister_all_caches(memcg);
         vmpressure_cleanup(&memcg->vmpressure);
  }
  
@@ -5123,7 +4963,6 @@ static enum mc_target_type get_mctgt_type(struct vm_area_struct *vma,
                 unsigned long addr, pte_t ptent, union mc_target *target)
  {
         struct page *page = NULL;
-       struct page_cgroup *pc;
         enum mc_target_type ret = MC_TARGET_NONE;
         swp_entry_t ent = { .val = 0 };
  
@@ -5137,13 +4976,12 @@ static enum mc_target_type get_mctgt_type(struct vm_area_struct *vma,
         if (!page && !ent.val)
                 return ret;
         if (page) {
-               pc = lookup_page_cgroup(page);
                 /*
                  * Do only loose check w/o serialization.
-                * mem_cgroup_move_account() checks the pc is valid or
+                * mem_cgroup_move_account() checks the page is valid or
                  * not under LRU exclusion.
                  */
-               if (pc->mem_cgroup == mc.from) {
+               if (page->mem_cgroup == mc.from) {
                         ret = MC_TARGET_PAGE;
                         if (target)
                                 target->page = page;
@@ -5171,15 +5009,13 @@ static enum mc_target_type get_mctgt_type_thp(struct vm_area_struct *vma,
                 unsigned long addr, pmd_t pmd, union mc_target *target)
  {
         struct page *page = NULL;
-       struct page_cgroup *pc;
         enum mc_target_type ret = MC_TARGET_NONE;
  
         page = pmd_page(pmd);
         VM_BUG_ON_PAGE(!page || !PageHead(page), page);
         if (!move_anon())
                 return ret;
-       pc = lookup_page_cgroup(page);
-       if (pc->mem_cgroup == mc.from) {
+       if (page->mem_cgroup == mc.from) {
                 ret = MC_TARGET_PAGE;
                 if (target) {
                         get_page(page);
@@ -5378,7 +5214,6 @@ static int mem_cgroup_move_charge_pte_range(pmd_t *pmd,
         enum mc_target_type target_type;
         union mc_target target;
         struct page *page;
-       struct page_cgroup *pc;
  
         /*
          * We don't take compound_lock() here but no race with splitting thp
@@ -5399,9 +5234,8 @@ static int mem_cgroup_move_charge_pte_range(pmd_t *pmd,
                 if (target_type == MC_TARGET_PAGE) {
                         page = target.page;
                         if (!isolate_lru_page(page)) {
-                               pc = lookup_page_cgroup(page);
                                 if (!mem_cgroup_move_account(page, HPAGE_PMD_NR,
-                                                       pc, mc.from, mc.to)) {
+                                                            mc.from, mc.to)) {
                                         mc.precharge -= HPAGE_PMD_NR;
                                         mc.moved_charge += HPAGE_PMD_NR;
                                 }
@@ -5429,9 +5263,7 @@ retry:
                         page = target.page;
                         if (isolate_lru_page(page))
                                 goto put;
-                       pc = lookup_page_cgroup(page);
-                       if (!mem_cgroup_move_account(page, 1, pc,
-                                                    mc.from, mc.to)) {
+                       if (!mem_cgroup_move_account(page, 1, mc.from, mc.to)) {
                                 mc.precharge--;
                                 /* we uncharge from mc.from later. */
                                 mc.moved_charge++;
@@ -5619,7 +5451,6 @@ static void __init enable_swap_cgroup(void)
  void mem_cgroup_swapout(struct page *page, swp_entry_t entry)
  {
         struct mem_cgroup *memcg;
-       struct page_cgroup *pc;
         unsigned short oldid;
  
         VM_BUG_ON_PAGE(PageLRU(page), page);
@@ -5628,8 +5459,7 @@ void mem_cgroup_swapout(struct page *page, swp_entry_t entry)
         if (!do_swap_account)
                 return;
  
-       pc = lookup_page_cgroup(page);
-       memcg = pc->mem_cgroup;
+       memcg = page->mem_cgroup;
  
         /* Readahead page, never charged */
         if (!memcg)
@@ -5639,7 +5469,7 @@ void mem_cgroup_swapout(struct page *page, swp_entry_t entry)
         VM_BUG_ON_PAGE(oldid, page);
         mem_cgroup_swap_statistics(memcg, true);
  
-       pc->mem_cgroup = NULL;
+       page->mem_cgroup = NULL;
  
         if (!mem_cgroup_is_root(memcg))
                 page_counter_uncharge(&memcg->memory, 1);
@@ -5706,7 +5536,6 @@ int mem_cgroup_try_charge(struct page *page, struct mm_struct *mm,
                 goto out;
  
         if (PageSwapCache(page)) {
-               struct page_cgroup *pc = lookup_page_cgroup(page);
                 /*
                  * Every swap fault against a single page tries to charge the
                  * page, bail as early as possible.  shmem_unuse() encounters
@@ -5714,7 +5543,7 @@ int mem_cgroup_try_charge(struct page *page, struct mm_struct *mm,
                  * the page lock, which serializes swap cache removal, which
                  * in turn serializes uncharging.
                  */
-               if (pc->mem_cgroup)
+               if (page->mem_cgroup)
                         goto out;
         }
  
@@ -5867,7 +5696,6 @@ static void uncharge_list(struct list_head *page_list)
         next = page_list->next;
         do {
                 unsigned int nr_pages = 1;
-               struct page_cgroup *pc;
  
                 page = list_entry(next, struct page, lru);
                 next = page->lru.next;
@@ -5875,23 +5703,22 @@ static void uncharge_list(struct list_head *page_list)
                 VM_BUG_ON_PAGE(PageLRU(page), page);
                 VM_BUG_ON_PAGE(page_count(page), page);
  
-               pc = lookup_page_cgroup(page);
-               if (!pc->mem_cgroup)
+               if (!page->mem_cgroup)
                         continue;
  
                 /*
                  * Nobody should be changing or seriously looking at
-                * pc->mem_cgroup at this point, we have fully
+                * page->mem_cgroup at this point, we have fully
                  * exclusive access to the page.
                  */
  
-               if (memcg != pc->mem_cgroup) {
+               if (memcg != page->mem_cgroup) {
                         if (memcg) {
                                 uncharge_batch(memcg, pgpgout, nr_anon, nr_file,
                                                nr_huge, page);
                                 pgpgout = nr_anon = nr_file = nr_huge = 0;
                         }
-                       memcg = pc->mem_cgroup;
+                       memcg = page->mem_cgroup;
                 }
  
                 if (PageTransHuge(page)) {
@@ -5905,7 +5732,7 @@ static void uncharge_list(struct list_head *page_list)
                 else
                         nr_file += nr_pages;
  
-               pc->mem_cgroup = NULL;
+               page->mem_cgroup = NULL;
  
                 pgpgout++;
         } while (next != page_list);
@@ -5924,14 +5751,11 @@ static void uncharge_list(struct list_head *page_list)
   */
  void mem_cgroup_uncharge(struct page *page)
  {
-       struct page_cgroup *pc;
-
         if (mem_cgroup_disabled())
                 return;
  
         /* Don't touch page->lru of any random page, pre-check: */
-       pc = lookup_page_cgroup(page);
-       if (!pc->mem_cgroup)
+       if (!page->mem_cgroup)
                 return;
  
         INIT_LIST_HEAD(&page->lru);
@@ -5968,7 +5792,6 @@ void mem_cgroup_migrate(struct page *oldpage, struct page *newpage,
                         bool lrucare)
  {
         struct mem_cgroup *memcg;
-       struct page_cgroup *pc;
         int isolated;
  
         VM_BUG_ON_PAGE(!PageLocked(oldpage), oldpage);
@@ -5983,8 +5806,7 @@ void mem_cgroup_migrate(struct page *oldpage, struct page *newpage,
                 return;
  
         /* Page cache replacement: new page already charged? */
-       pc = lookup_page_cgroup(newpage);
-       if (pc->mem_cgroup)
+       if (newpage->mem_cgroup)
                 return;
  
         /*
@@ -5993,15 +5815,14 @@ void mem_cgroup_migrate(struct page *oldpage, struct page *newpage,
          * uncharged page when the PFN walker finds a page that
          * reclaim just put back on the LRU but has not released yet.
          */
-       pc = lookup_page_cgroup(oldpage);
-       memcg = pc->mem_cgroup;
+       memcg = oldpage->mem_cgroup;
         if (!memcg)
                 return;
  
         if (lrucare)
                 lock_page_lru(oldpage, &isolated);
  
-       pc->mem_cgroup = NULL;
+       oldpage->mem_cgroup = NULL;
  
         if (lrucare)
                 unlock_page_lru(oldpage, isolated);