mirror of
				https://git.kernel.org/pub/scm/linux/kernel/git/chenhuacai/linux-loongson
				synced 2025-10-25 17:45:25 +00:00 
			
		
		
		
	 8725d54162
			
		
	
	
		8725d54162
		
	
	
	
	
		
			
			Presently, memcg's FILE_MAPPED accounting has following race with
move_account (happens at rmdir()).
    increment page->mapcount (rmap.c)
    mem_cgroup_update_file_mapped()           move_account()
					      lock_page_cgroup()
					      check page_mapped() if
					      page_mapped(page)>1 {
						FILE_MAPPED -1 from old memcg
						FILE_MAPPED +1 to old memcg
					      }
					      .....
					      overwrite pc->mem_cgroup
					      unlock_page_cgroup()
    lock_page_cgroup()
    FILE_MAPPED + 1 to pc->mem_cgroup
    unlock_page_cgroup()
Then,
	old memcg (-1 file mapped)
	new memcg (+2 file mapped)
This happens because move_account see page_mapped() which is not guarded
by lock_page_cgroup().  This patch adds FILE_MAPPED flag to page_cgroup
and move account information based on it.  Now, all checks are synchronous
with lock_page_cgroup().
Signed-off-by: KAMEZAWA Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com>
Reviewed-by: Balbir Singh <balbir@in.ibm.com>
Reviewed-by: Daisuke Nishimura <nishimura@mxp.nes.nec.co.jp>
Cc: Andrea Righi <arighi@develer.com>
Cc: Andrea Arcangeli <aarcange@redhat.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
		
	
			
		
			
				
	
	
		
			160 lines
		
	
	
		
			3.7 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			160 lines
		
	
	
		
			3.7 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| #ifndef __LINUX_PAGE_CGROUP_H
 | |
| #define __LINUX_PAGE_CGROUP_H
 | |
| 
 | |
| #ifdef CONFIG_CGROUP_MEM_RES_CTLR
 | |
| #include <linux/bit_spinlock.h>
 | |
| /*
 | |
|  * Page Cgroup can be considered as an extended mem_map.
 | |
|  * A page_cgroup page is associated with every page descriptor. The
 | |
|  * page_cgroup helps us identify information about the cgroup
 | |
|  * All page cgroups are allocated at boot or memory hotplug event,
 | |
|  * then the page cgroup for pfn always exists.
 | |
|  */
 | |
| struct page_cgroup {
 | |
| 	unsigned long flags;
 | |
| 	struct mem_cgroup *mem_cgroup;
 | |
| 	struct page *page;
 | |
| 	struct list_head lru;		/* per cgroup LRU list */
 | |
| };
 | |
| 
 | |
| void __meminit pgdat_page_cgroup_init(struct pglist_data *pgdat);
 | |
| 
 | |
| #ifdef CONFIG_SPARSEMEM
 | |
| static inline void __init page_cgroup_init_flatmem(void)
 | |
| {
 | |
| }
 | |
| extern void __init page_cgroup_init(void);
 | |
| #else
 | |
| void __init page_cgroup_init_flatmem(void);
 | |
| static inline void __init page_cgroup_init(void)
 | |
| {
 | |
| }
 | |
| #endif
 | |
| 
 | |
| struct page_cgroup *lookup_page_cgroup(struct page *page);
 | |
| 
 | |
| enum {
 | |
| 	/* flags for mem_cgroup */
 | |
| 	PCG_LOCK,  /* page cgroup is locked */
 | |
| 	PCG_CACHE, /* charged as cache */
 | |
| 	PCG_USED, /* this object is in use. */
 | |
| 	PCG_ACCT_LRU, /* page has been accounted for */
 | |
| 	PCG_FILE_MAPPED, /* page is accounted as "mapped" */
 | |
| };
 | |
| 
 | |
| #define TESTPCGFLAG(uname, lname)			\
 | |
| static inline int PageCgroup##uname(struct page_cgroup *pc)	\
 | |
| 	{ return test_bit(PCG_##lname, &pc->flags); }
 | |
| 
 | |
| #define SETPCGFLAG(uname, lname)			\
 | |
| static inline void SetPageCgroup##uname(struct page_cgroup *pc)\
 | |
| 	{ set_bit(PCG_##lname, &pc->flags);  }
 | |
| 
 | |
| #define CLEARPCGFLAG(uname, lname)			\
 | |
| static inline void ClearPageCgroup##uname(struct page_cgroup *pc)	\
 | |
| 	{ clear_bit(PCG_##lname, &pc->flags);  }
 | |
| 
 | |
| #define TESTCLEARPCGFLAG(uname, lname)			\
 | |
| static inline int TestClearPageCgroup##uname(struct page_cgroup *pc)	\
 | |
| 	{ return test_and_clear_bit(PCG_##lname, &pc->flags);  }
 | |
| 
 | |
| TESTPCGFLAG(Locked, LOCK)
 | |
| 
 | |
| /* Cache flag is set only once (at allocation) */
 | |
| TESTPCGFLAG(Cache, CACHE)
 | |
| CLEARPCGFLAG(Cache, CACHE)
 | |
| SETPCGFLAG(Cache, CACHE)
 | |
| 
 | |
| TESTPCGFLAG(Used, USED)
 | |
| CLEARPCGFLAG(Used, USED)
 | |
| SETPCGFLAG(Used, USED)
 | |
| 
 | |
| SETPCGFLAG(AcctLRU, ACCT_LRU)
 | |
| CLEARPCGFLAG(AcctLRU, ACCT_LRU)
 | |
| TESTPCGFLAG(AcctLRU, ACCT_LRU)
 | |
| TESTCLEARPCGFLAG(AcctLRU, ACCT_LRU)
 | |
| 
 | |
| 
 | |
| SETPCGFLAG(FileMapped, FILE_MAPPED)
 | |
| CLEARPCGFLAG(FileMapped, FILE_MAPPED)
 | |
| TESTPCGFLAG(FileMapped, FILE_MAPPED)
 | |
| 
 | |
| static inline int page_cgroup_nid(struct page_cgroup *pc)
 | |
| {
 | |
| 	return page_to_nid(pc->page);
 | |
| }
 | |
| 
 | |
| static inline enum zone_type page_cgroup_zid(struct page_cgroup *pc)
 | |
| {
 | |
| 	return page_zonenum(pc->page);
 | |
| }
 | |
| 
 | |
| static inline void lock_page_cgroup(struct page_cgroup *pc)
 | |
| {
 | |
| 	bit_spin_lock(PCG_LOCK, &pc->flags);
 | |
| }
 | |
| 
 | |
| static inline void unlock_page_cgroup(struct page_cgroup *pc)
 | |
| {
 | |
| 	bit_spin_unlock(PCG_LOCK, &pc->flags);
 | |
| }
 | |
| 
 | |
| #else /* CONFIG_CGROUP_MEM_RES_CTLR */
 | |
| struct page_cgroup;
 | |
| 
 | |
| static inline void __meminit pgdat_page_cgroup_init(struct pglist_data *pgdat)
 | |
| {
 | |
| }
 | |
| 
 | |
| static inline struct page_cgroup *lookup_page_cgroup(struct page *page)
 | |
| {
 | |
| 	return NULL;
 | |
| }
 | |
| 
 | |
| static inline void page_cgroup_init(void)
 | |
| {
 | |
| }
 | |
| 
 | |
| static inline void __init page_cgroup_init_flatmem(void)
 | |
| {
 | |
| }
 | |
| 
 | |
| #endif
 | |
| 
 | |
| #include <linux/swap.h>
 | |
| 
 | |
| #ifdef CONFIG_CGROUP_MEM_RES_CTLR_SWAP
 | |
| extern unsigned short swap_cgroup_cmpxchg(swp_entry_t ent,
 | |
| 					unsigned short old, unsigned short new);
 | |
| extern unsigned short swap_cgroup_record(swp_entry_t ent, unsigned short id);
 | |
| extern unsigned short lookup_swap_cgroup(swp_entry_t ent);
 | |
| extern int swap_cgroup_swapon(int type, unsigned long max_pages);
 | |
| extern void swap_cgroup_swapoff(int type);
 | |
| #else
 | |
| 
 | |
| static inline
 | |
| unsigned short swap_cgroup_record(swp_entry_t ent, unsigned short id)
 | |
| {
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static inline
 | |
| unsigned short lookup_swap_cgroup(swp_entry_t ent)
 | |
| {
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static inline int
 | |
| swap_cgroup_swapon(int type, unsigned long max_pages)
 | |
| {
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static inline void swap_cgroup_swapoff(int type)
 | |
| {
 | |
| 	return;
 | |
| }
 | |
| 
 | |
| #endif
 | |
| #endif
 |