| Home » Mailing lists » Devel » Re: [PATCH v2 07/13] memcg: Slab accounting. Goto Forum:
	| 
		
			| Re: [PATCH v2 07/13] memcg: Slab accounting. [message #45452] | Sun, 11 March 2012 10:25  |  
			| 
				
				
					|  Glauber Costa Messages: 916
 Registered: October 2011
 | Senior Member |  |  |  
	| On 03/10/2012 12:39 AM, Suleiman Souhlal wrote: > Introduce per-cgroup kmem_caches for memcg slab accounting, that
 > get created asynchronously the first time we do an allocation of
 > that type in the cgroup.
 > The cgroup cache gets used in subsequent allocations, and permits
 > accounting of slab on a per-page basis.
 >
 > For a slab type to getaccounted, the SLAB_MEMCG_ACCT flag has to be
 > passed to kmem_cache_create().
 >
 > The per-cgroup kmem_caches get looked up at slab allocation time,
 > in a MAX_KMEM_CACHE_TYPES-sized array in the memcg structure, based
 > on the original kmem_cache's id, which gets allocated when the original
 > cache gets created.
 >
 > Only allocations that can be attributed to a cgroup get charged.
 >
 > Each cgroup kmem_cache has a refcount that dictates the lifetime
 > of the cache: We destroy a cgroup cache when its cgroup has been
 > destroyed and there are no more active objects in the cache.
 >
 > Signed-off-by: Suleiman Souhlal<suleiman@google.com>
 > ---
 >   include/linux/memcontrol.h |   30 +++++-
 >   include/linux/slab.h       |   41 ++++++
 >   include/linux/slab_def.h   |   72 +++++++++++-
 >   include/linux/slub_def.h   |    3 +
 >   init/Kconfig               |    2 +-
 >   mm/memcontrol.c            |  290 ++++++++++++++++++++++++++++++++++++++++++++
 >   mm/slab.c                  |  248 ++++++++++++++++++++++++++++++++++---
 >   7 files changed, 663 insertions(+), 23 deletions(-)
 >
 > diff --git a/include/linux/memcontrol.h b/include/linux/memcontrol.h
 > index b80de52..b6b8388 100644
 > --- a/include/linux/memcontrol.h
 > +++ b/include/linux/memcontrol.h
 > @@ -416,13 +416,41 @@ struct sock;
 >   #ifdef CONFIG_CGROUP_MEM_RES_CTLR_KMEM
 >   void sock_update_memcg(struct sock *sk);
 >   void sock_release_memcg(struct sock *sk);
 > -#else
 > +struct kmem_cache *mem_cgroup_get_kmem_cache(struct kmem_cache *cachep,
 > +    gfp_t gfp);
 > +bool mem_cgroup_charge_slab(struct kmem_cache *cachep, gfp_t gfp, size_t size);
 > +void mem_cgroup_uncharge_slab(struct kmem_cache *cachep, size_t size);
 > +void mem_cgroup_flush_cache_create_queue(void);
 > +void mem_cgroup_remove_child_kmem_cache(struct kmem_cache *cachep, int id);
 > +#else /* CONFIG_CGROUP_MEM_RES_CTLR_KMEM */
 >   static inline void sock_update_memcg(struct sock *sk)
 >   {
 >   }
 >   static inline void sock_release_memcg(struct sock *sk)
 >   {
 >   }
 > +
 > +static inline bool
 > +mem_cgroup_charge_slab(struct kmem_cache *cachep, gfp_t gfp, size_t size)
 > +{
 > +	return true;
 > +}
 > +
 > +static inline void
 > +mem_cgroup_uncharge_slab(struct kmem_cache *cachep, size_t size)
 > +{
 > +}
 > +
 > +static inline struct kmem_cache *
 > +mem_cgroup_get_kmem_cache(struct kmem_cache *cachep, gfp_t gfp)
 > +{
 > +	return cachep;
 > +}
 > +
 > +static inline void
 > +mem_cgroup_flush_cache_create_queue(void)
 > +{
 > +}
 >   #endif /* CONFIG_CGROUP_MEM_RES_CTLR_KMEM */
 >   #endif /* _LINUX_MEMCONTROL_H */
 >
 > diff --git a/include/linux/slab.h b/include/linux/slab.h
 > index 573c809..bc9f87f 100644
 > --- a/include/linux/slab.h
 > +++ b/include/linux/slab.h
 > @@ -21,6 +21,7 @@
 >   #define SLAB_POISON		0x00000800UL	/* DEBUG: Poison objects */
 >   #define SLAB_HWCACHE_ALIGN	0x00002000UL	/* Align objs on cache lines */
 >   #define SLAB_CACHE_DMA		0x00004000UL	/* Use GFP_DMA memory */
 > +#define SLAB_MEMCG_ACCT		0x00008000UL	/* Accounted by memcg */
 >   #define SLAB_STORE_USER		0x00010000UL	/* DEBUG: Store the last owner for bug hunting */
 >   #define SLAB_PANIC		0x00040000UL	/* Panic if kmem_cache_create() fails */
 >   /*
 > @@ -153,6 +154,21 @@ unsigned int kmem_cache_size(struct kmem_cache *);
 >   #define ARCH_SLAB_MINALIGN __alignof__(unsigned long long)
 >   #endif
 >
 > +#ifdef CONFIG_CGROUP_MEM_RES_CTLR_KMEM
 > +struct mem_cgroup_cache_params {
 > +	struct mem_cgroup *memcg;
 > +	int id;
 > +	int obj_size;
 > +
 > +	/* Original cache parameters, used when creating a memcg cache */
 > +	size_t orig_align;
 > +	unsigned long orig_flags;
 > +	struct kmem_cache *orig_cache;
 > +
 > +	struct list_head destroyed_list; /* Used when deleting cpuset cache */
 > +};
 > +#endif
 > +
 >   /*
 >    * Common kmalloc functions provided by all allocators
 >    */
 > @@ -353,4 +369,29 @@ static inline void *kzalloc_node(size_t size, gfp_t flags, int node)
 >
 >   void __init kmem_cache_init_late(void);
 >
 > +#if defined(CONFIG_CGROUP_MEM_RES_CTLR_KMEM)&&  defined(CONFIG_SLAB)
 > +
 > +#define MAX_KMEM_CACHE_TYPES 400
 > +
 > +struct kmem_cache *kmem_cache_create_memcg(struct kmem_cache *cachep,
 > +    char *name);
 > +void kmem_cache_drop_ref(struct kmem_cache *cachep);
 > +
 > +#else /* !CONFIG_CGROUP_MEM_RES_CTLR_KMEM || !CONFIG_SLAB */
 
 
 > +#define MAX_KMEM_CACHE_TYPES 0
 > +
 > +static inline struct kmem_cache *
 > +kmem_cache_create_memcg(struct kmem_cache *cachep,
 > +    char *name)
 > +{
 > +	return NULL;
 > +}
 > +
 > +static inline void
 > +kmem_cache_drop_ref(struct kmem_cache *cachep)
 > +{
 > +}
 > +#endif /* CONFIG_CGROUP_MEM_RES_CTLR_KMEM&&  CONFIG_SLAB */
 > +
 >   #endif	/* _LINUX_SLAB_H */
 > diff --git a/include/linux/slab_def.h b/include/linux/slab_def.h
 > index 25f9a6a..248b8a9 100644
 > --- a/include/linux/slab_def.h
 > +++ b/include/linux/slab_def.h
 > @@ -51,7 +51,7 @@ struct kmem_cache {
 >   	void (*ctor)(void *obj);
 >
 >   /* 4) cache creation/removal */
 > -	const char *name;
 > +	char *name;
 >   	struct list_head next;
 >
 >   /* 5) statistics */
 > @@ -81,6 +81,12 @@ struct kmem_cache {
 >   	int obj_size;
 >   #endif /* CONFIG_DEBUG_SLAB */
 >
 > +#ifdef CONFIG_CGROUP_MEM_RES_CTLR_KMEM
 > +	struct mem_cgroup_cache_params memcg_params;
 > +
 Can't we have memcg pointer + id here, and then get
 the rest of this data from memcg->slab_params[id] ?
 
 I don't think we'll ever access this on hot paths - since we're
 allocating pages anyway when we do, and then we have less bloat on
 the slab structure.
 
 Sure, we're just moving the bloat away somewhere else, since this data
 has to exist anyway, but at least it's not here bothering the slab when
 memcg is disabled...
 
 But I don't really have the final word here, this is just my preference
 - Would any of the slabmasters comment here, on what's your preferred
 way between those?
 
 > +	atomic_t refcnt;
 > +#endif /* CONFIG_CGROUP_MEM_RES_CTLR_KMEM */
 > +
 >   /* 6) per-cpu/per-node data, touched during every alloc/free */
 >   	/*
 >   	 * We put array[] at the end of kmem_cache, because we want to size
 > @@ -218,4 +224,68 @@ found:
 >
 >   #endif	/* CONFIG_NUMA */
 >
 > +#ifdef CONFIG_CGROUP_MEM_RES_CTLR_KMEM
 > +
 > +void kmem_cache_drop_ref(struct kmem_cache *cachep);
 > +
 > +static inline void
 > +kmem_cache_get_ref(struct kmem_cache *cachep)
 > +{
 > +	if (cachep->memcg_params.id == -1&&
 > +	    unlikely(!atomic_add_unless(&cachep->refcnt, 1, 0)))
 > +		BUG();
 > +}
 > +
 > +static inline void
 > +mem_cgroup_put_kmem_cache(struct kmem_cache *cachep)
 > +{
 > +	rcu_read_unlock();
 > +}
 > +
 > +static inline void
 > +mem_cgroup_kmem_cache_prepare_sleep(struct kmem_cache *cachep)
 > +{
 > +	/*
 > +	 * Make sure the cache doesn't get freed while we have interrupts
 > +	 * enabled.
 > +	 */
 > +	kmem_cache_get_ref(cachep);
 > +	rcu_read_unlock();
 > +}
 
 Is this really needed ? After this function call in slab.c, the slab
 code itself accesses cachep a thousand times. If it could be freed, it
 would already explode today for other reasons?
 Am I missing something here?
 
 > +static inline void
 > +mem_cgroup_kmem_cache_finish_sleep(struct kmem_cache *cachep)
 > +{
 > +	rcu_read_lock();
 > +	kmem_cache_drop_ref(cachep);
 > +}
 > +
 > +#else /* CONFIG_CGROUP_MEM_RES_CTLR_KMEM */
 > +
 > +static inline void
 > +kmem_cache_get_ref(struct kmem_cache *cachep)
 > +{
 > +}
 > +
 > +static inline void
 > +kmem_cache_drop_ref(struct kmem_cache *cachep)
 > +{
 > +}
 > +
 > +static inline void
 > +mem_cgroup_put_kmem_cache(struct kmem_cache *cachep)
 > +{
 > +}
 > +
 > +static inline void
 > +mem_cgroup_kmem_cache_prepare_sleep(struct kmem_cache *cachep)
 > +{
 > +}
 > +
 > +static inline void
 > +mem_cgroup_kmem_cache_finish_sleep(struct kmem_cache *cachep)
 > +{
 > +}
 > +#endif /* CONFIG_CGROUP_MEM_RES_CTLR_KMEM */
 > +
 >   #endif	/* _LINUX_SLAB_DEF_H */
 > diff --git a/include/linux/slub_def.h b/include/linux/slub_def.h
 > index 5911d81..09b602d 100644
 > --- a/include/linux/slub_def.h
 > +++ b/include/linux/slub_def.h
 > @@ -99,6 +99,9 @@ struct kmem_cache {
 >   #ifdef CONFIG_SYSFS
 >   	struct kobject kobj;	/* For sysfs */
 >   #endif
 > +#ifdef CONFIG_CGROUP_MEM_RES_CTLR_KMEM
 > +	struct mem_cgroup_cache_params memcg_params;
 > +#endif
 >
 >   #ifdef CONFIG_NUMA
 >   	/*
 > diff --git a/init/Kconfig b/init/Kconfig
 > index 3f42cd6..e7eb652 100644
 > --- a/init/Kconfig
 > +++ b/init/Kconfig
 > @@ -705,7 +705,7 @@ config CGROUP_MEM_RES_CTLR_SWAP_ENABLED
 >   	  then swapaccount=0 does the trick).
 >   config CGROUP_MEM_RES_CTLR_KMEM
 >   	bool "Memory Resource Controller Kernel Memory accounting (EXPERIMENTAL)"
 > -	depends on CGROUP_MEM_RES_CTLR&&  EXPERIMENTAL
 > +	depends on CGROUP_MEM_RES_CTLR&&  EXPERIMENTAL&&  !SLOB
 
 Orthogonal question: Will we ever want this (SLOB) ?
 
 >   	default n
 >   	help
 >   	  The Kernel Memory extension for Memory Resource Controller can limit
 > diff --git a/mm/memcontrol.c b/mm/memcontrol.c
 > index 2576
...
 
 
 |  
	|  |  | 
 
 Current Time: Sun Oct 26 22:23:45 GMT 2025 
 Total time taken to generate the page: 0.12191 seconds |