mm: memcontrol: flush percpu slab vmstats on kmem offlining

author Roman Gushchin <guro@fb.com>

Fri, 30 Aug 2019 23:04:32 +0000 (16:04 -0700)

committer Linus Torvalds <torvalds@linux-foundation.org>

Sat, 31 Aug 2019 01:00:50 +0000 (18:00 -0700)
author Roman Gushchin <guro@fb.com>
Fri, 30 Aug 2019 23:04:32 +0000 (16:04 -0700)
committer Linus Torvalds <torvalds@linux-foundation.org>
Sat, 31 Aug 2019 01:00:50 +0000 (18:00 -0700)
diff --git a/include/linux/mmzone.h b/include/linux/mmzone.h

index d77d717c620cbe3362b5787086b546f08b938f46..3f38c30d2f13d1e3b86408a6edf1e0eb8ef52778 100644 (file)
--- a/include/linux/mmzone.h
+++ b/include/linux/mmzone.h
@@ -215,8 +215,9 @@ enum node_stat_item {
         NR_INACTIVE_FILE,       /*  "     "     "   "       "         */
         NR_ACTIVE_FILE,         /*  "     "     "   "       "         */
         NR_UNEVICTABLE,         /*  "     "     "   "       "         */
-       NR_SLAB_RECLAIMABLE,
-       NR_SLAB_UNRECLAIMABLE,
+       NR_SLAB_RECLAIMABLE,    /* Please do not reorder this item */
+       NR_SLAB_UNRECLAIMABLE,  /* and this one without looking at
+                                * memcg_flush_percpu_vmstats() first. */
         NR_ISOLATED_ANON,       /* Temporary isolated pages from anon lru */
         NR_ISOLATED_FILE,       /* Temporary isolated pages from file lru */
         WORKINGSET_NODES,
diff --git a/mm/memcontrol.c b/mm/memcontrol.c

index 26e2999af608d3776e609b213d522345fc793792..1f585d6c77c138d45cda49ec112595e1244d4f52 100644 (file)
--- a/mm/memcontrol.c
+++ b/mm/memcontrol.c
@@ -3260,37 +3260,49 @@ static u64 mem_cgroup_read_u64(struct cgroup_subsys_state *css,
         }
  }
  
-static void memcg_flush_percpu_vmstats(struct mem_cgroup *memcg)
+static void memcg_flush_percpu_vmstats(struct mem_cgroup *memcg, bool slab_only)
  {
         unsigned long stat[MEMCG_NR_STAT];
         struct mem_cgroup *mi;
         int node, cpu, i;
+       int min_idx, max_idx;   /* half-open range [min_idx, max_idx) of items to flush */
  
-       for (i = 0; i < MEMCG_NR_STAT; i++)
+       if (slab_only) {
+               min_idx = NR_SLAB_RECLAIMABLE;
+               max_idx = NR_SLAB_UNRECLAIMABLE + 1;    /* exclusive bound: include both slab items */
+       } else {
+               min_idx = 0;
+               max_idx = MEMCG_NR_STAT;
+       }
+
+       for (i = min_idx; i < max_idx; i++)
                 stat[i] = 0;
  
         for_each_online_cpu(cpu)
-               for (i = 0; i < MEMCG_NR_STAT; i++)
-                       stat[i] += raw_cpu_read(memcg->vmstats_percpu->stat[i]);
+               for (i = min_idx; i < max_idx; i++)
+                       stat[i] += per_cpu(memcg->vmstats_percpu->stat[i], cpu);
  
         for (mi = memcg; mi; mi = parent_mem_cgroup(mi))
-               for (i = 0; i < MEMCG_NR_STAT; i++)
+               for (i = min_idx; i < max_idx; i++)
                         atomic_long_add(stat[i], &mi->vmstats[i]);
  
+       if (!slab_only)         /* per-node counters span NR_VM_NODE_STAT_ITEMS entries */
+               max_idx = NR_VM_NODE_STAT_ITEMS;
+
         for_each_node(node) {
                 struct mem_cgroup_per_node *pn = memcg->nodeinfo[node];
                 struct mem_cgroup_per_node *pi;
  
-               for (i = 0; i < NR_VM_NODE_STAT_ITEMS; i++)
+               for (i = min_idx; i < max_idx; i++)
                         stat[i] = 0;
  
                 for_each_online_cpu(cpu)
-                       for (i = 0; i < NR_VM_NODE_STAT_ITEMS; i++)
-                               stat[i] += raw_cpu_read(
-                                       pn->lruvec_stat_cpu->count[i]);
+                       for (i = min_idx; i < max_idx; i++)
+                               stat[i] += per_cpu(
+                                       pn->lruvec_stat_cpu->count[i], cpu);
  
                 for (pi = pn; pi; pi = parent_nodeinfo(pi, node))
-                       for (i = 0; i < NR_VM_NODE_STAT_ITEMS; i++)
+                       for (i = min_idx; i < max_idx; i++)
                                 atomic_long_add(stat[i], &pi->lruvec_stat[i]);
         }
  }
@@ -3363,7 +3375,14 @@ static void memcg_offline_kmem(struct mem_cgroup *memcg)
         if (!parent)
                 parent = root_mem_cgroup;
  
+       /*
+        * Deactivate and reparent kmem_caches. Then flush percpu
+        * slab statistics to have precise values at the parent and
+        * all ancestor levels. It's required to keep slab stats
+        * accurate after the reparenting of kmem_caches.
+        */
         memcg_deactivate_kmem_caches(memcg, parent);
+       memcg_flush_percpu_vmstats(memcg, true);
  
         kmemcg_id = memcg->kmemcg_id;
         BUG_ON(kmemcg_id < 0);
@@ -4740,7 +4759,7 @@ static void __mem_cgroup_free(struct mem_cgroup *memcg)
          * Flush percpu vmstats and vmevents to guarantee the value correctness
          * on parent's and all ancestor levels.
          */
-       memcg_flush_percpu_vmstats(memcg);
+       memcg_flush_percpu_vmstats(memcg, false);
         memcg_flush_percpu_vmevents(memcg);
         for_each_node(node)
                 free_mem_cgroup_per_node_info(memcg, node);
author	Roman Gushchin <guro@fb.com>
	Fri, 30 Aug 2019 23:04:32 +0000 (16:04 -0700)
committer	Linus Torvalds <torvalds@linux-foundation.org>
	Sat, 31 Aug 2019 01:00:50 +0000 (18:00 -0700)
include/linux/mmzone.h		patch \| blob \| history
mm/memcontrol.c		patch \| blob \| history