| Home » Mailing lists » Devel » [PATCH, v4 0/2] Timer slack cgroup subsystem Goto Forum:
	| 
		
			| [PATCH, v4 0/2] Timer slack cgroup subsystem [message #41514] | Thu, 03 February 2011 14:34  |  
			| 
				
				
					|  Kirill A. Shutsemov Messages: 32
 Registered: February 2011
 | Member |  |  |  
	| From: Kirill A. Shutemov <kirill@shutemov.name> 
 Changelog:
 v4:
 - hierarchy support
 - drop dummy_timer_slack_check()
 - workaround lockdep false (?) positive
 - allow 0 as timer slack value
 v3:
 - rework interface
 - s/EXPORT_SYMBOL/EXPORT_SYMBOL_GPL/
 v2:
 - fixed with CONFIG_CGROUP_TIMER_SLACK=y
 v1:
 - initial revision
 
 Kirill A. Shutemov (2):
 cgroups: export cgroup_iter_{start,next,end}
 cgroups: introduce timer slack subsystem
 
 include/linux/cgroup_subsys.h |    6 +
 include/linux/init_task.h     |    4 +-
 init/Kconfig                  |   10 ++
 kernel/Makefile               |    1 +
 kernel/cgroup.c               |    3 +
 kernel/cgroup_timer_slack.c   |  262 +++++++++++++++++++++++++++++++++++++++++
 kernel/sys.c                  |   19 ++-
 7 files changed, 298 insertions(+), 7 deletions(-)
 create mode 100644 kernel/cgroup_timer_slack.c
 
 --
 1.7.3.5
 
 _______________________________________________
 Containers mailing list
 Containers@lists.linux-foundation.org
 https://lists.linux-foundation.org/mailman/listinfo/containe rs
 |  
	|  |  |  
	| 
		
			| [PATCH, v4 1/2] cgroups: export cgroup_iter_{start, next, end} [message #41515 is a reply to message #41514] | Thu, 03 February 2011 14:34   |  
			| 
				
				
					|  Kirill A. Shutsemov Messages: 32
 Registered: February 2011
 | Member |  |  |  
	| From: Kirill A. Shutemov <kirill@shutemov.name> 
 Signed-off-by: Kirill A. Shutemov <kirill@shutemov.name>
 ---
 kernel/cgroup.c |    3 +++
 1 files changed, 3 insertions(+), 0 deletions(-)
 
 diff --git a/kernel/cgroup.c b/kernel/cgroup.c
 index b24d702..8234daa 100644
 --- a/kernel/cgroup.c
 +++ b/kernel/cgroup.c
 @@ -2443,6 +2443,7 @@ void cgroup_iter_start(struct cgroup *cgrp, struct cgroup_iter *it)
 it->cg_link = &cgrp->css_sets;
 cgroup_advance_iter(cgrp, it);
 }
 +EXPORT_SYMBOL_GPL(cgroup_iter_start);
 
 struct task_struct *cgroup_iter_next(struct cgroup *cgrp,
 struct cgroup_iter *it)
 @@ -2467,11 +2468,13 @@ struct task_struct *cgroup_iter_next(struct cgroup *cgrp,
 }
 return res;
 }
 +EXPORT_SYMBOL_GPL(cgroup_iter_next);
 
 void cgroup_iter_end(struct cgroup *cgrp, struct cgroup_iter *it)
 {
 read_unlock(&css_set_lock);
 }
 +EXPORT_SYMBOL_GPL(cgroup_iter_end);
 
 static inline int started_after_time(struct task_struct *t1,
 struct timespec *time,
 --
 1.7.3.5
 
 _______________________________________________
 Containers mailing list
 Containers@lists.linux-foundation.org
 https://lists.linux-foundation.org/mailman/listinfo/containe rs
 |  
	|  |  |  
	| 
		
			| [PATCH, v4 2/2] cgroups: introduce timer slack subsystem [message #41516 is a reply to message #41514] | Thu, 03 February 2011 14:34   |  
			| 
				
				
					|  Kirill A. Shutsemov Messages: 32
 Registered: February 2011
 | Member |  |  |  
	| From: Kirill A. Shutemov <kirill@shutemov.name> 
 Provides a way of tasks grouping by timer slack value. Introduces per
 cgroup max and min timer slack value. When a task attaches to a cgroup,
 its timer slack value adjusts (if needed) to fit min-max range.
 
 It also provides a way to set timer slack value for all tasks in the
 cgroup at once.
 
 This functionality is useful in mobile devices where certain background
 apps are attached to a cgroup and minimum wakeups are desired.
 
 Signed-off-by: Kirill A. Shutemov <kirill@shutemov.name>
 Idea-by: Jacob Pan <jacob.jun.pan@linux.intel.com>
 Signed-off-by: Kirill A. Shutemov <kirill@shutemov.name>
 ---
 include/linux/cgroup_subsys.h |    6 +
 include/linux/init_task.h     |    4 +-
 init/Kconfig                  |   10 ++
 kernel/Makefile               |    1 +
 kernel/cgroup_timer_slack.c   |  262 +++++++++++++++++++++++++++++++++++++++++
 kernel/sys.c                  |   19 ++-
 6 files changed, 295 insertions(+), 7 deletions(-)
 create mode 100644 kernel/cgroup_timer_slack.c
 
 diff --git a/include/linux/cgroup_subsys.h b/include/linux/cgroup_subsys.h
 index ccefff0..e399228 100644
 --- a/include/linux/cgroup_subsys.h
 +++ b/include/linux/cgroup_subsys.h
 @@ -66,3 +66,9 @@ SUBSYS(blkio)
 #endif
 
 /* */
 +
 +#ifdef CONFIG_CGROUP_TIMER_SLACK
 +SUBSYS(timer_slack)
 +#endif
 +
 +/* */
 diff --git a/include/linux/init_task.h b/include/linux/init_task.h
 index caa151f..48eca8f 100644
 --- a/include/linux/init_task.h
 +++ b/include/linux/init_task.h
 @@ -124,6 +124,8 @@ extern struct cred init_cred;
 # define INIT_PERF_EVENTS(tsk)
 #endif
 
 +#define TIMER_SLACK_NS_DEFAULT 50000
 +
 /*
 *  INIT_TASK is used to set up the first task table, touch at
 * your own risk!. Base=0, limit=0x1fffff (=2MB)
 @@ -177,7 +179,7 @@ extern struct cred init_cred;
 .cpu_timers	= INIT_CPU_TIMERS(tsk.cpu_timers),		\
 .fs_excl	= ATOMIC_INIT(0),				\
 .pi_lock	= __RAW_SPIN_LOCK_UNLOCKED(tsk.pi_lock),	\
 -	.timer_slack_ns = 50000, /* 50 usec default slack */		\
 +	.timer_slack_ns = TIMER_SLACK_NS_DEFAULT,			\
 .pids = {							\
 [PIDTYPE_PID]  = INIT_PID_LINK(PIDTYPE_PID),		\
 [PIDTYPE_PGID] = INIT_PID_LINK(PIDTYPE_PGID),		\
 diff --git a/init/Kconfig b/init/Kconfig
 index be788c0..6cf465f 100644
 --- a/init/Kconfig
 +++ b/init/Kconfig
 @@ -596,6 +596,16 @@ config CGROUP_FREEZER
 Provides a way to freeze and unfreeze all tasks in a
 cgroup.
 
 +config CGROUP_TIMER_SLACK
 +	tristate "Timer slack cgroup subsystem"
 +	help
 +	  Provides a way of tasks grouping by timer slack value.
 +	  Introduces per cgroup timer slack value which will override
 +	  the default timer slack value once a task is attached to a
 +	  cgroup.
 +	  It's useful in mobile devices where certain background apps
 +	  are attached to a cgroup and combined wakeups are desired.
 +
 config CGROUP_DEVICE
 bool "Device controller for cgroups"
 help
 diff --git a/kernel/Makefile b/kernel/Makefile
 index 353d3fe..0b60239 100644
 --- a/kernel/Makefile
 +++ b/kernel/Makefile
 @@ -61,6 +61,7 @@ obj-$(CONFIG_BACKTRACE_SELF_TEST) += backtracetest.o
 obj-$(CONFIG_COMPAT) += compat.o
 obj-$(CONFIG_CGROUPS) += cgroup.o
 obj-$(CONFIG_CGROUP_FREEZER) += cgroup_freezer.o
 +obj-$(CONFIG_CGROUP_TIMER_SLACK) += cgroup_timer_slack.o
 obj-$(CONFIG_CPUSETS) += cpuset.o
 obj-$(CONFIG_CGROUP_NS) += ns_cgroup.o
 obj-$(CONFIG_UTS_NS) += utsname.o
 diff --git a/kernel/cgroup_timer_slack.c b/kernel/cgroup_timer_slack.c
 new file mode 100644
 index 0000000..affd33a
 --- /dev/null
 +++ b/kernel/cgroup_timer_slack.c
 @@ -0,0 +1,262 @@
 +/*
 + * cgroup_timer_slack.c - control group timer slack subsystem
 + *
 + * Copyright Nokia Corparation, 2011
 + * Author: Kirill A. Shutemov
 + *
 + * This program is free software; you can redistribute it and/or modify
 + * it under the terms of the GNU General Public License as published by
 + * the Free Software Foundation; either version 2 of the License, or
 + * (at your option) any later version.
 + *
 + * This program is distributed in the hope that it will be useful,
 + * but WITHOUT ANY WARRANTY; without even the implied warranty of
 + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 + * GNU General Public License for more details.
 + */
 +#include <linux/cgroup.h>
 +#include <linux/init_task.h>
 +#include <linux/module.h>
 +#include <linux/slab.h>
 +#include <linux/rcupdate.h>
 +
 +struct cgroup_subsys timer_slack_subsys;
 +struct timer_slack_cgroup {
 +	struct cgroup_subsys_state css;
 +	unsigned long min_slack_ns;
 +	unsigned long max_slack_ns;
 +};
 +
 +enum {
 +	TIMER_SLACK_MIN,
 +	TIMER_SLACK_MAX,
 +};
 +
 +extern int (*timer_slack_check)(struct task_struct *task,
 +		unsigned long slack_ns);
 +
 +static struct timer_slack_cgroup *cgroup_to_tslack_cgroup(struct cgroup *cgroup)
 +{
 +	struct cgroup_subsys_state *css;
 +
 +	css = cgroup_subsys_state(cgroup, timer_slack_subsys.subsys_id);
 +	return container_of(css, struct timer_slack_cgroup, css);
 +}
 +
 +static int is_timer_slack_allowed(struct timer_slack_cgroup *tslack_cgroup,
 +		unsigned long slack_ns)
 +{
 +	if (slack_ns < tslack_cgroup->min_slack_ns ||
 +			slack_ns > tslack_cgroup->max_slack_ns)
 +		return false;
 +	return true;
 +}
 +
 +static int cgroup_timer_slack_check(struct task_struct *task,
 +		unsigned long slack_ns)
 +{
 +	struct cgroup_subsys_state *css;
 +	struct timer_slack_cgroup *tslack_cgroup;
 +
 +	/* XXX: lockdep false positive? */
 +	rcu_read_lock();
 +	css = task_subsys_state(task, timer_slack_subsys.subsys_id);
 +	tslack_cgroup = container_of(css, struct timer_slack_cgroup, css);
 +	rcu_read_unlock();
 +
 +	if (!is_timer_slack_allowed(tslack_cgroup, slack_ns))
 +		return -EPERM;
 +	return 0;
 +}
 +
 +static struct cgroup_subsys_state *
 +tslack_cgroup_create(struct cgroup_subsys *subsys, struct cgroup *cgroup)
 +{
 +	struct timer_slack_cgroup *tslack_cgroup;
 +
 +	tslack_cgroup = kmalloc(sizeof(*tslack_cgroup), GFP_KERNEL);
 +	if (!tslack_cgroup)
 +		return ERR_PTR(-ENOMEM);
 +
 +	if (cgroup->parent) {
 +		struct timer_slack_cgroup *parent;
 +		parent = cgroup_to_tslack_cgroup(cgroup->parent);
 +		tslack_cgroup->min_slack_ns = parent->min_slack_ns;
 +		tslack_cgroup->max_slack_ns = parent->max_slack_ns;
 +	} else {
 +		tslack_cgroup->min_slack_ns = 0UL;
 +		tslack_cgroup->max_slack_ns = ULONG_MAX;
 +	}
 +
 +	return &tslack_cgroup->css;
 +}
 +
 +static void tslack_cgroup_destroy(struct cgroup_subsys *subsys,
 +		struct cgroup *cgroup)
 +{
 +	kfree(cgroup_to_tslack_cgroup(cgroup));
 +}
 +
 +/*
 + * Adjust ->timer_slack_ns and ->default_max_slack_ns of the task to fit
 + * limits of the cgroup.
 + */
 +static void tslack_adjust_task(struct timer_slack_cgroup *tslack_cgroup,
 +		struct task_struct *tsk)
 +{
 +	if (tslack_cgroup->min_slack_ns > tsk->timer_slack_ns)
 +		tsk->timer_slack_ns = tslack_cgroup->min_slack_ns;
 +	else if (tslack_cgroup->max_slack_ns < tsk->timer_slack_ns)
 +		tsk->timer_slack_ns = tslack_cgroup->max_slack_ns;
 +
 +	if (tslack_cgroup->min_slack_ns > tsk->default_timer_slack_ns)
 +		tsk->default_timer_slack_ns = tslack_cgroup->min_slack_ns;
 +	else if (tslack_cgroup->max_slack_ns < tsk->default_timer_slack_ns)
 +		tsk->default_timer_slack_ns = tslack_cgroup->max_slack_ns;
 +}
 +
 +static void tslack_cgroup_attach(struct cgroup_subsys *subsys,
 +		struct cgroup *cgroup, struct cgroup *prev,
 +		struct task_struct *tsk, bool threadgroup)
 +{
 +	tslack_adjust_task(cgroup_to_tslack_cgroup(cgroup), tsk);
 +}
 +
 +static int tslack_write_set_slack_ns(struct cgroup *cgroup, struct cftype *cft,
 +		u64 val)
 +{
 +	struct timer_slack_cgroup *tslack_cgroup;
 +	struct cgroup_iter it;
 +	struct task_struct *task;
 +
 +	tslack_cgroup = cgroup_to_tslack_cgroup(cgroup);
 +	if (!is_timer_slack_allowed(cgroup_to_tslack_cgroup(cgroup), val))
 +		return -EPERM;
 +
 +	/* Change timer slack value for all tasks in the cgroup */
 +	cgroup_iter_start(cgroup, &it);
 +	while ((task = cgroup_iter_next(cgroup, &it)))
 +		task->timer_slack_ns = val;
 +	cgroup_iter_end(cgroup, &it);
 +
 +	return 0;
 +}
 +
 +static u64 tslack_read_range(struct cgroup *cgroup, struct cftype *cft)
 +{
 +	struct timer_slack_cgroup *tslack_cgroup;
 +
 +	tslack_cgroup = cgroup_to_tslack_cgroup(cgroup);
 +	switch (cft->private) {
 +	case TIMER_SLACK_MIN:
 +		return tslack_cgroup->min_slack_ns;
 +	case TIMER_SLACK_MAX:
 +		return tslack_cgroup->max_slack_ns;
 +	default:
 +		BUG();
 +	};
 +}
 +
 +static int tslack_write_range(struct cgroup *cgroup, struct cftype *cft,
 +		u64 val)
 +{
 +	struct timer_slack_cgroup *tslack_cgroup;
 +	struct cgroup_iter it;
 +	struct task_struct *task;
 +
 +	if (cgroup->parent) {
 +		struct timer_slack_cgroup *parent;
 +		parent = cgroup_to_tslack_cgroup(cgroup->parent);
 +		if (!is_timer_slack_allowed(parent, val))
 +			return -EPERM;
 +	}
 +
 +	tslack_cgroup = cgroup_to_tslack_cgroup(cgroup);
 +	switch (cft->private) {
 +	case TIMER_SLACK_MIN:
 +		if (val > tslack_cgroup->max_slack_ns)
 +			return -EINVAL;
 +		tslack_cgroup->min_slack_ns = val;
 +		break;
 +	case TIMER_SLACK_MAX:
 +		if (val < tslack_cgroup->min_slack_ns)
 +			return -EINVAL;
 +		tslack_cgroup->max_slack_ns = val;
 +		break;
 +	default:
 +		BUG();
 +	}
 +
 +	/*
 +	 * Adjust timer slack value for all tasks in the cgroup to fit
 +	 * min-max range.
 +	 */
 +	cgroup_iter_start(cgroup, &it);
 +	while ((task = cgroup_iter_next(cgroup, &it)))
 +		tslack_adjust_task(tslack_cgroup, task);
 +	cgroup_iter_end(cgroup, &it);
 +
 +	return 0;
 +}
 +
 +static struct cftype files[] = {
 +	{
 +		.name = "set_slack_ns",
 +		.write_u64 = tslack_write_set_slack_ns,
 +	},
 +	{
 +		.name = "min_slack_ns",
 +		.private = TIMER_SLACK_MIN,
 +		.read_u64 = tslack_read_range,
 +		.write_u64 = tslack_write_range,
 +	},
 +	{
 +		.name = "max_slack_ns",
 +		.private = TIMER_SLACK_MAX,
 +		.read_u64 = tslack_read_range,
 +		.write_u64 = tslack_write_range,
 +	},
 +};
 +
 +static int tslack_cgroup_populate(struct cgroup_subsys *subsys,
 +		struct cgr
...
 
 
 |  
	|  |  |  
	| 
		
			| Re: [PATCH, v4 2/2] cgroups: introduce timer slack subsystem [message #41587 is a reply to message #41516] | Tue, 08 February 2011 23:08   |  
			| 
				
				
					|  akpm Messages: 224
 Registered: March 2007
 | Senior Member |  |  |  
	| On Thu,  3 Feb 2011 16:34:14 +0200 "Kirill A. Shutsemov" <kirill@shutemov.name> wrote:
 
 > From: Kirill A. Shutemov <kirill@shutemov.name>
 >
 > Provides a way of tasks grouping by timer slack value. Introduces per
 > cgroup max and min timer slack value. When a task attaches to a cgroup,
 > its timer slack value adjusts (if needed) to fit min-max range.
 >
 > It also provides a way to set timer slack value for all tasks in the
 > cgroup at once.
 >
 > This functionality is useful in mobile devices where certain background
 > apps are attached to a cgroup and minimum wakeups are desired.
 
 This description is quite scanty.  It doesn't explain what the benefit
 is, when one might want to use it, how to use it, etc.  A nice
 description under Documentation/cgroups/ would be appropriate.
 
 I read this and come away with no sense of how useful or desirable this
 code is.
 
 >
 > ...
 >
 > --- a/include/linux/init_task.h
 > +++ b/include/linux/init_task.h
 > @@ -124,6 +124,8 @@ extern struct cred init_cred;
 >  # define INIT_PERF_EVENTS(tsk)
 >  #endif
 >
 > +#define TIMER_SLACK_NS_DEFAULT 50000
 
 Seems to be an unrelated cleanup.  And given that this #define is only
 used in a single place, its cleanliness is questionable.
 
 >  /*
 >   *  INIT_TASK is used to set up the first task table, touch at
 >   * your own risk!. Base=0, limit=0x1fffff (=2MB)
 > @@ -177,7 +179,7 @@ extern struct cred init_cred;
 >  	.cpu_timers	= INIT_CPU_TIMERS(tsk.cpu_timers),		\
 >  	.fs_excl	= ATOMIC_INIT(0),				\
 >  	.pi_lock	= __RAW_SPIN_LOCK_UNLOCKED(tsk.pi_lock),	\
 > -	.timer_slack_ns = 50000, /* 50 usec default slack */		\
 > +	.timer_slack_ns = TIMER_SLACK_NS_DEFAULT,			\
 >  	.pids = {							\
 >  		[PIDTYPE_PID]  = INIT_PID_LINK(PIDTYPE_PID),		\
 >  		[PIDTYPE_PGID] = INIT_PID_LINK(PIDTYPE_PGID),		\
 >
 > ...
 >
 > +extern int (*timer_slack_check)(struct task_struct *task,
 > +		unsigned long slack_ns);
 
 Nope.  Please put this in a header file so we can be sure that callers
 see the same prototype as does the definition.
 
 >
 > ...
 >
 > +/*
 > + * Adjust ->timer_slack_ns and ->default_max_slack_ns of the task to fit
 > + * limits of the cgroup.
 > + */
 > +static void tslack_adjust_task(struct timer_slack_cgroup *tslack_cgroup,
 > +		struct task_struct *tsk)
 > +{
 > +	if (tslack_cgroup->min_slack_ns > tsk->timer_slack_ns)
 > +		tsk->timer_slack_ns = tslack_cgroup->min_slack_ns;
 > +	else if (tslack_cgroup->max_slack_ns < tsk->timer_slack_ns)
 > +		tsk->timer_slack_ns = tslack_cgroup->max_slack_ns;
 > +
 > +	if (tslack_cgroup->min_slack_ns > tsk->default_timer_slack_ns)
 > +		tsk->default_timer_slack_ns = tslack_cgroup->min_slack_ns;
 > +	else if (tslack_cgroup->max_slack_ns < tsk->default_timer_slack_ns)
 > +		tsk->default_timer_slack_ns = tslack_cgroup->max_slack_ns;
 > +}
 > +
 > +static void tslack_cgroup_attach(struct cgroup_subsys *subsys,
 > +		struct cgroup *cgroup, struct cgroup *prev,
 > +		struct task_struct *tsk, bool threadgroup)
 > +{
 > +	tslack_adjust_task(cgroup_to_tslack_cgroup(cgroup), tsk);
 > +}
 > +
 > +static int tslack_write_set_slack_ns(struct cgroup *cgroup, struct cftype *cft,
 > +		u64 val)
 > +{
 > +	struct timer_slack_cgroup *tslack_cgroup;
 > +	struct cgroup_iter it;
 > +	struct task_struct *task;
 > +
 > +	tslack_cgroup = cgroup_to_tslack_cgroup(cgroup);
 > +	if (!is_timer_slack_allowed(cgroup_to_tslack_cgroup(cgroup), val))
 > +		return -EPERM;
 > +
 > +	/* Change timer slack value for all tasks in the cgroup */
 > +	cgroup_iter_start(cgroup, &it);
 > +	while ((task = cgroup_iter_next(cgroup, &it)))
 > +		task->timer_slack_ns = val;
 > +	cgroup_iter_end(cgroup, &it);
 > +
 > +	return 0;
 > +}
 > +
 > +static u64 tslack_read_range(struct cgroup *cgroup, struct cftype *cft)
 > +{
 > +	struct timer_slack_cgroup *tslack_cgroup;
 > +
 > +	tslack_cgroup = cgroup_to_tslack_cgroup(cgroup);
 > +	switch (cft->private) {
 > +	case TIMER_SLACK_MIN:
 > +		return tslack_cgroup->min_slack_ns;
 > +	case TIMER_SLACK_MAX:
 > +		return tslack_cgroup->max_slack_ns;
 > +	default:
 > +		BUG();
 > +	};
 
 Extraneous ";".
 
 > +}
 
 These proposed new userspace interfaces should be documented somewhere,
 please.  They are the most important part of the patch.
 
 >
 > ...
 >
 > +struct cgroup_subsys timer_slack_subsys = {
 > +	.name = "timer_slack",
 > +	.module = THIS_MODULE,
 > +#ifdef CONFIG_CGROUP_TIMER_SLACK
 
 Confused.  This file won't even be compiled if
 CONFIG_CGROUP_TIMER_SLACK=n?
 
 > +	.subsys_id = timer_slack_subsys_id,
 > +#endif
 > +	.create = tslack_cgroup_create,
 > +	.destroy = tslack_cgroup_destroy,
 > +	.attach = tslack_cgroup_attach,
 > +	.populate = tslack_cgroup_populate,
 > +};
 > +
 >
 > ...
 >
 > @@ -1694,12 +1698,15 @@ SYSCALL_DEFINE5(prctl, int, option, unsigned long, arg2, unsigned long, arg3,
 >  			error = current->timer_slack_ns;
 >  			break;
 >  		case PR_SET_TIMERSLACK:
 > -			if (arg2 <= 0)
 > -				current->timer_slack_ns =
 > -					current->default_timer_slack_ns;
 > -			else
 > -				current->timer_slack_ns = arg2;
 > -			error = 0;
 > +			if (arg2 <= 0) {
 > +				me->timer_slack_ns = me->default_timer_slack_ns;
 > +				break;
 > +			}
 > +
 > +			error = timer_slack_check ?
 > +				timer_slack_check(me, arg2) : 0;
 
 This is racy against init_cgroup_timer_slack().  And against
 exit_cgroup_timer_slack().
 
 This whole scheme of using a single hook to a single "check" function
 is rather grubby.  I guess that using a notifier_call_chain() would fix
 things: support multiple "check" functions and hopefully fix the races.
 
 > +			if (!error)
 > +				me->timer_slack_ns = arg2;
 >  			break;
 >  		case PR_MCE_KILL:
 >  			if (arg4 | arg5)
 
 I don't know whether PR_SET_TIMERSLACK is presently documented in the
 manpages.
 
 Please cc linux-api@vger.kernel.org on future versions of this work and
 ensure that the patch (via changelog, Documentation or code comments)
 has sufficient information for the manpages maintainers to be able to
 easily update the manpages.
 
 
 _______________________________________________
 Containers mailing list
 Containers@lists.linux-foundation.org
 https://lists.linux-foundation.org/mailman/listinfo/containe rs
 |  
	|  |  |  
	| 
		
			| Re: [PATCH, v4 2/2] cgroups: introduce timer slack subsystem [message #41597 is a reply to message #41587] | Wed, 09 February 2011 13:23  |  
			| 
				
				
					|  Kirill A. Shutsemov Messages: 32
 Registered: February 2011
 | Member |  |  |  
	| On Tue, Feb 08, 2011 at 03:08:35PM -0800, Andrew Morton wrote: > On Thu,  3 Feb 2011 16:34:14 +0200
 > "Kirill A. Shutsemov" <kirill@shutemov.name> wrote:
 >
 > > From: Kirill A. Shutemov <kirill@shutemov.name>
 > >
 > > Provides a way of tasks grouping by timer slack value. Introduces per
 > > cgroup max and min timer slack value. When a task attaches to a cgroup,
 > > its timer slack value adjusts (if needed) to fit min-max range.
 > >
 > > It also provides a way to set timer slack value for all tasks in the
 > > cgroup at once.
 > >
 > > This functionality is useful in mobile devices where certain background
 > > apps are attached to a cgroup and minimum wakeups are desired.
 >
 > This description is quite scanty.  It doesn't explain what the benefit
 > is, when one might want to use it, how to use it, etc.  A nice
 > description under Documentation/cgroups/ would be appropriate.
 >
 > I read this and come away with no sense of how useful or desirable this
 > code is.
 
 Ok, I'll add file to Documentation/cgroups/ and extend description.
 
 > >
 > > ...
 > >
 > > --- a/include/linux/init_task.h
 > > +++ b/include/linux/init_task.h
 > > @@ -124,6 +124,8 @@ extern struct cred init_cred;
 > >  # define INIT_PERF_EVENTS(tsk)
 > >  #endif
 > >
 > > +#define TIMER_SLACK_NS_DEFAULT 50000
 >
 > Seems to be an unrelated cleanup.  And given that this #define is only
 > used in a single place, its cleanliness is questionable.
 
 I used it in previous patch revision. I'll remove it.
 
 > >  /*
 > >   *  INIT_TASK is used to set up the first task table, touch at
 > >   * your own risk!. Base=0, limit=0x1fffff (=2MB)
 > > @@ -177,7 +179,7 @@ extern struct cred init_cred;
 > >  	.cpu_timers	= INIT_CPU_TIMERS(tsk.cpu_timers),		\
 > >  	.fs_excl	= ATOMIC_INIT(0),				\
 > >  	.pi_lock	= __RAW_SPIN_LOCK_UNLOCKED(tsk.pi_lock),	\
 > > -	.timer_slack_ns = 50000, /* 50 usec default slack */		\
 > > +	.timer_slack_ns = TIMER_SLACK_NS_DEFAULT,			\
 > >  	.pids = {							\
 > >  		[PIDTYPE_PID]  = INIT_PID_LINK(PIDTYPE_PID),		\
 > >  		[PIDTYPE_PGID] = INIT_PID_LINK(PIDTYPE_PGID),		\
 > >
 > > ...
 > >
 > > +extern int (*timer_slack_check)(struct task_struct *task,
 > > +		unsigned long slack_ns);
 >
 > Nope.  Please put this in a header file so we can be sure that callers
 > see the same prototype as does the definition.
 
 Ok.
 
 > >
 > > ...
 > >
 > > +/*
 > > + * Adjust ->timer_slack_ns and ->default_max_slack_ns of the task to fit
 > > + * limits of the cgroup.
 > > + */
 > > +static void tslack_adjust_task(struct timer_slack_cgroup *tslack_cgroup,
 > > +		struct task_struct *tsk)
 > > +{
 > > +	if (tslack_cgroup->min_slack_ns > tsk->timer_slack_ns)
 > > +		tsk->timer_slack_ns = tslack_cgroup->min_slack_ns;
 > > +	else if (tslack_cgroup->max_slack_ns < tsk->timer_slack_ns)
 > > +		tsk->timer_slack_ns = tslack_cgroup->max_slack_ns;
 > > +
 > > +	if (tslack_cgroup->min_slack_ns > tsk->default_timer_slack_ns)
 > > +		tsk->default_timer_slack_ns = tslack_cgroup->min_slack_ns;
 > > +	else if (tslack_cgroup->max_slack_ns < tsk->default_timer_slack_ns)
 > > +		tsk->default_timer_slack_ns = tslack_cgroup->max_slack_ns;
 > > +}
 > > +
 > > +static void tslack_cgroup_attach(struct cgroup_subsys *subsys,
 > > +		struct cgroup *cgroup, struct cgroup *prev,
 > > +		struct task_struct *tsk, bool threadgroup)
 > > +{
 > > +	tslack_adjust_task(cgroup_to_tslack_cgroup(cgroup), tsk);
 > > +}
 > > +
 > > +static int tslack_write_set_slack_ns(struct cgroup *cgroup, struct cftype *cft,
 > > +		u64 val)
 > > +{
 > > +	struct timer_slack_cgroup *tslack_cgroup;
 > > +	struct cgroup_iter it;
 > > +	struct task_struct *task;
 > > +
 > > +	tslack_cgroup = cgroup_to_tslack_cgroup(cgroup);
 > > +	if (!is_timer_slack_allowed(cgroup_to_tslack_cgroup(cgroup), val))
 > > +		return -EPERM;
 > > +
 > > +	/* Change timer slack value for all tasks in the cgroup */
 > > +	cgroup_iter_start(cgroup, &it);
 > > +	while ((task = cgroup_iter_next(cgroup, &it)))
 > > +		task->timer_slack_ns = val;
 > > +	cgroup_iter_end(cgroup, &it);
 > > +
 > > +	return 0;
 > > +}
 > > +
 > > +static u64 tslack_read_range(struct cgroup *cgroup, struct cftype *cft)
 > > +{
 > > +	struct timer_slack_cgroup *tslack_cgroup;
 > > +
 > > +	tslack_cgroup = cgroup_to_tslack_cgroup(cgroup);
 > > +	switch (cft->private) {
 > > +	case TIMER_SLACK_MIN:
 > > +		return tslack_cgroup->min_slack_ns;
 > > +	case TIMER_SLACK_MAX:
 > > +		return tslack_cgroup->max_slack_ns;
 > > +	default:
 > > +		BUG();
 > > +	};
 >
 > Extraneous ";".
 >
 > > +}
 >
 > These proposed new userspace interfaces should be documented somewhere,
 > please.  They are the most important part of the patch.
 >
 > >
 > > ...
 > >
 > > +struct cgroup_subsys timer_slack_subsys = {
 > > +	.name = "timer_slack",
 > > +	.module = THIS_MODULE,
 > > +#ifdef CONFIG_CGROUP_TIMER_SLACK
 >
 > Confused.  This file won't even be compiled if
 > CONFIG_CGROUP_TIMER_SLACK=n?
 
 Timer slack cgroup subsystem can be compiled as module. In this case
 CONFIG_CGROUP_TIMER_SLACK_MODULE defined, not CONFIG_CGROUP_TIMER_SLACK.
 I'll replace it with
 
 #ifndef CONFIG_CGROUP_TIMER_SLACK_MODULE
 
 to avoid confusion.
 
 > > +	.subsys_id = timer_slack_subsys_id,
 > > +#endif
 > > +	.create = tslack_cgroup_create,
 > > +	.destroy = tslack_cgroup_destroy,
 > > +	.attach = tslack_cgroup_attach,
 > > +	.populate = tslack_cgroup_populate,
 > > +};
 > > +
 > >
 > > ...
 > >
 > > @@ -1694,12 +1698,15 @@ SYSCALL_DEFINE5(prctl, int, option, unsigned long, arg2, unsigned long, arg3,
 > >  			error = current->timer_slack_ns;
 > >  			break;
 > >  		case PR_SET_TIMERSLACK:
 > > -			if (arg2 <= 0)
 > > -				current->timer_slack_ns =
 > > -					current->default_timer_slack_ns;
 > > -			else
 > > -				current->timer_slack_ns = arg2;
 > > -			error = 0;
 > > +			if (arg2 <= 0) {
 > > +				me->timer_slack_ns = me->default_timer_slack_ns;
 > > +				break;
 > > +			}
 > > +
 > > +			error = timer_slack_check ?
 > > +				timer_slack_check(me, arg2) : 0;
 >
 > This is racy against init_cgroup_timer_slack().  And against
 > exit_cgroup_timer_slack().
 >
 > This whole scheme of using a single hook to a single "check" function
 > is rather grubby.  I guess that using a notifier_call_chain() would fix
 > things: support multiple "check" functions and hopefully fix the races.
 
 Ok, I'll rewrite it using blocking_notifier_call_chain().
 
 > > +			if (!error)
 > > +				me->timer_slack_ns = arg2;
 > >  			break;
 > >  		case PR_MCE_KILL:
 > >  			if (arg4 | arg5)
 >
 > I don't know whether PR_SET_TIMERSLACK is presently documented in the
 > manpages.
 
 It's in todo list:
 
 http://git.kernel.org/?p=docs/man-pages/man-pages.git;a=blob;f=man2/prctl.2#l42
 
 > Please cc linux-api@vger.kernel.org on future versions of this work and
 > ensure that the patch (via changelog, Documentation or code comments)
 > has sufficient information for the manpages maintainers to be able to
 > easily update the manpages.
 
 Ok.
 
 Thank you for reviewing.
 
 --
 Kirill A. Shutemov
 _______________________________________________
 Containers mailing list
 Containers@lists.linux-foundation.org
 https://lists.linux-foundation.org/mailman/listinfo/containe rs
 |  
	|  |  | 
 
 
 Current Time: Sun Oct 26 11:41:57 GMT 2025 
 Total time taken to generate the page: 0.08643 seconds |