memcg: add mlock statistic in memory.stat

author Ying Han <yinghan@google.com>

Thu, 3 May 2012 05:44:01 +0000 (15:44 +1000)

committer Stephen Rothwell <sfr@canb.auug.org.au>

Thu, 3 May 2012 05:46:36 +0000 (15:46 +1000)
author Ying Han <yinghan@google.com>
Thu, 3 May 2012 05:44:01 +0000 (15:44 +1000)
committer Stephen Rothwell <sfr@canb.auug.org.au>
Thu, 3 May 2012 05:46:36 +0000 (15:46 +1000)
diff --git a/Documentation/cgroups/memory.txt b/Documentation/cgroups/memory.txt

index 9f6b3b0d6a15b43250d051d0a267822eb9a56b21..730e222accedf6b0f13bab6c13a559e71a583baf 100644 (file)
--- a/Documentation/cgroups/memory.txt
+++ b/Documentation/cgroups/memory.txt
@@ -428,6 +428,7 @@ memory.stat file includes following statistics
  cache          - # of bytes of page cache memory.
  rss            - # of bytes of anonymous and swap cache memory.
  mapped_file    - # of bytes of mapped file (includes tmpfs/shmem)
+mlock          - # of bytes of mlocked memory.
  pgpgin         - # of charging events to the memory cgroup. The charging
                 event happens each time a page is accounted as either mapped
                 anon page(RSS) or cache page(Page Cache) to the cgroup.
diff --git a/include/linux/memcontrol.h b/include/linux/memcontrol.h

index b33fd64156a212d9adba714a1749035207126abe..94c0cdabb855d20a6165bb72896e3adad6719ae7 100644 (file)
--- a/include/linux/memcontrol.h
+++ b/include/linux/memcontrol.h
@@ -30,6 +30,7 @@ struct mm_struct;
  /* Stats that can be updated by kernel. */
  enum mem_cgroup_page_stat_item {
         MEMCG_NR_FILE_MAPPED, /* # of pages charged as file rss */
+       MEMCG_NR_MLOCK, /* # of pages charged as mlock */
  };
  
  struct mem_cgroup_reclaim_cookie {
diff --git a/mm/internal.h b/mm/internal.h

index 8b0fc8da802893d1f7be5892345950032b42d51f..dfe0a7da9c007557669c43636162287c17a06143 100644 (file)
--- a/mm/internal.h
+++ b/mm/internal.h
@@ -12,6 +12,7 @@
  #define __MM_INTERNAL_H
  
  #include <linux/mm.h>
+#include <linux/memcontrol.h>
  
  void free_pgtables(struct mmu_gather *tlb, struct vm_area_struct *start_vma,
                 unsigned long floor, unsigned long ceiling);
@@ -167,15 +168,22 @@ static inline void munlock_vma_pages_all(struct vm_area_struct *vma)
  static inline int mlocked_vma_newpage(struct vm_area_struct *vma,
                                     struct page *page)
  {
+       bool locked;
+       unsigned long flags;
+
         VM_BUG_ON(PageLRU(page));
  
         if (likely((vma->vm_flags & (VM_LOCKED | VM_SPECIAL)) != VM_LOCKED))
                 return 0;
  
+       mem_cgroup_begin_update_page_stat(page, &locked, &flags);
         if (!TestSetPageMlocked(page)) {
                 inc_zone_page_state(page, NR_MLOCK);
+               mem_cgroup_inc_page_stat(page, MEMCG_NR_MLOCK);
                 count_vm_event(UNEVICTABLE_PGMLOCKED);
         }
+       mem_cgroup_end_update_page_stat(page, &locked, &flags);
+
         return 1;
  }
  
@@ -197,8 +205,13 @@ extern void munlock_vma_page(struct page *page);
  extern void __clear_page_mlock(struct page *page);
  static inline void clear_page_mlock(struct page *page)
  {
+       bool locked;
+       unsigned long flags;
+
+       mem_cgroup_begin_update_page_stat(page, &locked, &flags);
         if (unlikely(TestClearPageMlocked(page)))
                 __clear_page_mlock(page);
+       mem_cgroup_end_update_page_stat(page, &locked, &flags);
  }
  
  /*
@@ -207,6 +220,11 @@ static inline void clear_page_mlock(struct page *page)
   */
  static inline void mlock_migrate_page(struct page *newpage, struct page *page)
  {
+       /*
+        * Strictly, the old page's memcg mlock stat should be decremented and
+        * the new page's incremented here. Since page and newpage are always
+        * charged to the same memcg, the two updates cancel out; nothing to do.
+        */
         if (TestClearPageMlocked(page)) {
                 unsigned long flags;
  
diff --git a/mm/memcontrol.c b/mm/memcontrol.c

index bbae7af36cc7cd3bec762d648db44f77628e67d4..f9ce39f09da8a5e85d6591a546541a4144af5a28 100644 (file)
--- a/mm/memcontrol.c
+++ b/mm/memcontrol.c
@@ -97,6 +97,7 @@ enum mem_cgroup_stat_index {
         MEM_CGROUP_STAT_CACHE,     /* # of pages charged as cache */
         MEM_CGROUP_STAT_RSS,       /* # of pages charged as anon rss */
         MEM_CGROUP_STAT_FILE_MAPPED,  /* # of pages charged as file rss */
+       MEM_CGROUP_STAT_MLOCK, /* # of pages charged as mlock()ed */
         MEM_CGROUP_STAT_SWAPOUT, /* # of pages, swapped out */
         MEM_CGROUP_STAT_DATA, /* end of data requires synchronization */
         MEM_CGROUP_STAT_NSTATS,
@@ -1989,6 +1990,9 @@ void mem_cgroup_update_page_stat(struct page *page,
         case MEMCG_NR_FILE_MAPPED:
                 idx = MEM_CGROUP_STAT_FILE_MAPPED;
                 break;
+       case MEMCG_NR_MLOCK:
+               idx = MEM_CGROUP_STAT_MLOCK;
+               break;
         default:
                 BUG();
         }
@@ -2641,6 +2645,14 @@ static int mem_cgroup_move_account(struct page *page,
                 __this_cpu_inc(to->stat->count[MEM_CGROUP_STAT_FILE_MAPPED]);
                 preempt_enable();
         }
+
+       if (PageMlocked(page)) {
+               /* Update mlocked data for mem_cgroup */
+               preempt_disable();
+               __this_cpu_dec(from->stat->count[MEM_CGROUP_STAT_MLOCK]);
+               __this_cpu_inc(to->stat->count[MEM_CGROUP_STAT_MLOCK]);
+               preempt_enable();
+       }
         mem_cgroup_charge_statistics(from, anon, -nr_pages);
         if (uncharge)
                 /* This is not "cancel", but cancel_charge does all we need. */
@@ -4244,6 +4256,7 @@ enum {
         MCS_CACHE,
         MCS_RSS,
         MCS_FILE_MAPPED,
+       MCS_MLOCK,
         MCS_PGPGIN,
         MCS_PGPGOUT,
         MCS_SWAP,
@@ -4268,6 +4281,7 @@ static struct {
         {"cache", "total_cache"},
         {"rss", "total_rss"},
         {"mapped_file", "total_mapped_file"},
+       {"mlock", "total_mlock"},
         {"pgpgin", "total_pgpgin"},
         {"pgpgout", "total_pgpgout"},
         {"swap", "total_swap"},
@@ -4293,6 +4307,8 @@ mem_cgroup_get_local_stat(struct mem_cgroup *memcg, struct mcs_total_stat *s)
         s->stat[MCS_RSS] += val * PAGE_SIZE;
         val = mem_cgroup_read_stat(memcg, MEM_CGROUP_STAT_FILE_MAPPED);
         s->stat[MCS_FILE_MAPPED] += val * PAGE_SIZE;
+       val = mem_cgroup_read_stat(memcg, MEM_CGROUP_STAT_MLOCK);
+       s->stat[MCS_MLOCK] += val * PAGE_SIZE;
         val = mem_cgroup_read_events(memcg, MEM_CGROUP_EVENTS_PGPGIN);
         s->stat[MCS_PGPGIN] += val;
         val = mem_cgroup_read_events(memcg, MEM_CGROUP_EVENTS_PGPGOUT);
diff --git a/mm/mlock.c b/mm/mlock.c

index ef726e8aa8e9ca56c0713abfa4b621f44a210d4c..cef020158aae9b0a792d03204c50d3d9b135aa21 100644 (file)
--- a/mm/mlock.c
+++ b/mm/mlock.c
@@ -50,6 +50,8 @@ EXPORT_SYMBOL(can_do_mlock);
  
  /*
   *  LRU accounting for clear_page_mlock()
+ *  Callers must wrap this in mem_cgroup_{begin,end}_update_page_stat(),
+ *  otherwise there is a race between "move" and "page stat accounting".
   */
  void __clear_page_mlock(struct page *page)
  {
@@ -60,6 +62,7 @@ void __clear_page_mlock(struct page *page)
         }
  
         dec_zone_page_state(page, NR_MLOCK);
+       mem_cgroup_dec_page_stat(page, MEMCG_NR_MLOCK);
         count_vm_event(UNEVICTABLE_PGCLEARED);
         if (!isolate_lru_page(page)) {
                 putback_lru_page(page);
@@ -78,14 +81,20 @@ void __clear_page_mlock(struct page *page)
   */
  void mlock_vma_page(struct page *page)
  {
+       bool locked;
+       unsigned long flags;
+
         BUG_ON(!PageLocked(page));
  
+       mem_cgroup_begin_update_page_stat(page, &locked, &flags);
         if (!TestSetPageMlocked(page)) {
                 inc_zone_page_state(page, NR_MLOCK);
+               mem_cgroup_inc_page_stat(page, MEMCG_NR_MLOCK);
                 count_vm_event(UNEVICTABLE_PGMLOCKED);
                 if (!isolate_lru_page(page))
                         putback_lru_page(page);
         }
+       mem_cgroup_end_update_page_stat(page, &locked, &flags);
  }
  
  /**
@@ -105,10 +114,15 @@ void mlock_vma_page(struct page *page)
   */
  void munlock_vma_page(struct page *page)
  {
+       bool locked;
+       unsigned long flags;
+
         BUG_ON(!PageLocked(page));
  
+       mem_cgroup_begin_update_page_stat(page, &locked, &flags);
         if (TestClearPageMlocked(page)) {
                 dec_zone_page_state(page, NR_MLOCK);
+               mem_cgroup_dec_page_stat(page, MEMCG_NR_MLOCK);
                 if (!isolate_lru_page(page)) {
                         int ret = SWAP_AGAIN;
  
@@ -141,6 +155,7 @@ void munlock_vma_page(struct page *page)
                                 count_vm_event(UNEVICTABLE_PGMUNLOCKED);
                 }
         }
+       mem_cgroup_end_update_page_stat(page, &locked, &flags);
  }
  
  /**
diff --git a/mm/page_alloc.c b/mm/page_alloc.c

index 3a1c648ec7999a707d2cf5f621a785812b3d0f1b..3537be3b5bbe923e3db2429c6d9a915f7d80507b 100644 (file)
--- a/mm/page_alloc.c
+++ b/mm/page_alloc.c
@@ -723,6 +723,11 @@ static void __free_pages_ok(struct page *page, unsigned int order)
                 return;
  
         local_irq_save(flags);
+       /*
+        * Note: the page memcg's mlock stat is not updated here, since an
+        * mlocked page is not expected to get this far. If that assumption
+        * is wrong, a warn_once would tell us.
+        */
         if (unlikely(wasMlocked))
                 free_page_mlock(page);
         __count_vm_events(PGFREE, 1 << order);
@@ -1298,6 +1303,11 @@ void free_hot_cold_page(struct page *page, int cold)
         migratetype = get_pageblock_migratetype(page);
         set_page_private(page, migratetype);
         local_irq_save(flags);
+       /*
+        * Note: the page memcg's mlock stat is not updated here, since an
+        * mlocked page is not expected to get this far. If that assumption
+        * is wrong, a warn_once would tell us.
+        */
         if (unlikely(wasMlocked))
                 free_page_mlock(page);
         __count_vm_event(PGFREE);
author	Ying Han <yinghan@google.com>
	Thu, 3 May 2012 05:44:01 +0000 (15:44 +1000)
committer	Stephen Rothwell <sfr@canb.auug.org.au>
	Thu, 3 May 2012 05:46:36 +0000 (15:46 +1000)
Documentation/cgroups/memory.txt		patch \| blob \| history
include/linux/memcontrol.h		patch \| blob \| history
mm/internal.h		patch \| blob \| history
mm/memcontrol.c		patch \| blob \| history
mm/mlock.c		patch \| blob \| history
mm/page_alloc.c		patch \| blob \| history