diff options
author | Peter Zijlstra <a.p.zijlstra@chello.nl> | 2008-02-13 09:45:39 -0500 |
---|---|---|
committer | Ingo Molnar <mingo@elte.hu> | 2008-02-13 09:45:39 -0500 |
commit | 8ed3699682be75fd68281239c202ad3830f9c72d (patch) | |
tree | 5af86fb155e475e906e14dc6aa5aa5a890cca7a2 /kernel/sched.c | |
parent | 720a2592cf1b9af86f30c44e8d89348826c03372 (diff) |
sched: fair-group: separate tg->shares from task_group_lock
On Mon, 2008-02-11 at 15:09 +0300, Denis V. Lunev wrote:
> BUG: sleeping function called from invalid context
> at /home/den/src/linux-netns26/kernel/mutex.c:209
> in_atomic():1, irqs_disabled():0
> no locks held by swapper/0.
> Pid: 0, comm: swapper Not tainted 2.6.24 #304
>
> Call Trace:
> <IRQ> [<ffffffff80252d1e>] ? __debug_show_held_locks+0x15/0x27
> [<ffffffff8022c2a8>] __might_sleep+0xc0/0xdf
> [<ffffffff8049f1df>] mutex_lock_nested+0x28/0x2a9
> [<ffffffff80231294>] sched_destroy_group+0x18/0xea
> [<ffffffff8023e835>] sched_destroy_user+0xd/0xf
> [<ffffffff8023e8c1>] free_uid+0x8a/0xab
> [<ffffffff80233e24>] __put_task_struct+0x3f/0xd3
> [<ffffffff80236708>] delayed_put_task_struct+0x23/0x25
> [<ffffffff8026fda7>] __rcu_process_callbacks+0x8d/0x215
> [<ffffffff8026ff52>] rcu_process_callbacks+0x23/0x44
> [<ffffffff8023a2ae>] __do_softirq+0x79/0xf8
> [<ffffffff8020f8c3>] ? profile_pc+0x2a/0x67
> [<ffffffff8020d38c>] call_softirq+0x1c/0x30
> [<ffffffff8020f689>] do_softirq+0x61/0x9c
> [<ffffffff8023a233>] irq_exit+0x51/0x53
> [<ffffffff8021bd1a>] smp_apic_timer_interrupt+0x77/0xad
> [<ffffffff8020ce3b>] apic_timer_interrupt+0x6b/0x70
> <EOI> [<ffffffff8020b0dd>] ? default_idle+0x43/0x76
> [<ffffffff8020b0db>] ? default_idle+0x41/0x76
> [<ffffffff8020b09a>] ? default_idle+0x0/0x76
> [<ffffffff8020b186>] ? cpu_idle+0x76/0x98
separate the tg->shares protection from the task_group lock.
Reported-by: Denis V. Lunev <den@openvz.org>
Tested-by: Denis V. Lunev <den@openvz.org>
Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Diffstat (limited to 'kernel/sched.c')
-rw-r--r-- | kernel/sched.c | 37 |
1 files changed, 17 insertions, 20 deletions
diff --git a/kernel/sched.c b/kernel/sched.c index 3eedd5260907..6b02276baaa6 100644 --- a/kernel/sched.c +++ b/kernel/sched.c | |||
@@ -232,10 +232,10 @@ static struct cfs_rq *init_cfs_rq_p[NR_CPUS]; | |||
232 | static struct sched_rt_entity *init_sched_rt_entity_p[NR_CPUS]; | 232 | static struct sched_rt_entity *init_sched_rt_entity_p[NR_CPUS]; |
233 | static struct rt_rq *init_rt_rq_p[NR_CPUS]; | 233 | static struct rt_rq *init_rt_rq_p[NR_CPUS]; |
234 | 234 | ||
235 | /* task_group_mutex serializes add/remove of task groups and also changes to | 235 | /* task_group_lock serializes add/remove of task groups and also changes to |
236 | * a task group's cpu shares. | 236 | * a task group's cpu shares. |
237 | */ | 237 | */ |
238 | static DEFINE_MUTEX(task_group_mutex); | 238 | static DEFINE_SPINLOCK(task_group_lock); |
239 | 239 | ||
240 | /* doms_cur_mutex serializes access to doms_cur[] array */ | 240 | /* doms_cur_mutex serializes access to doms_cur[] array */ |
241 | static DEFINE_MUTEX(doms_cur_mutex); | 241 | static DEFINE_MUTEX(doms_cur_mutex); |
@@ -295,16 +295,6 @@ static inline void set_task_rq(struct task_struct *p, unsigned int cpu) | |||
295 | p->rt.parent = task_group(p)->rt_se[cpu]; | 295 | p->rt.parent = task_group(p)->rt_se[cpu]; |
296 | } | 296 | } |
297 | 297 | ||
298 | static inline void lock_task_group_list(void) | ||
299 | { | ||
300 | mutex_lock(&task_group_mutex); | ||
301 | } | ||
302 | |||
303 | static inline void unlock_task_group_list(void) | ||
304 | { | ||
305 | mutex_unlock(&task_group_mutex); | ||
306 | } | ||
307 | |||
308 | static inline void lock_doms_cur(void) | 298 | static inline void lock_doms_cur(void) |
309 | { | 299 | { |
310 | mutex_lock(&doms_cur_mutex); | 300 | mutex_lock(&doms_cur_mutex); |
@@ -318,8 +308,6 @@ static inline void unlock_doms_cur(void) | |||
318 | #else | 308 | #else |
319 | 309 | ||
320 | static inline void set_task_rq(struct task_struct *p, unsigned int cpu) { } | 310 | static inline void set_task_rq(struct task_struct *p, unsigned int cpu) { } |
321 | static inline void lock_task_group_list(void) { } | ||
322 | static inline void unlock_task_group_list(void) { } | ||
323 | static inline void lock_doms_cur(void) { } | 311 | static inline void lock_doms_cur(void) { } |
324 | static inline void unlock_doms_cur(void) { } | 312 | static inline void unlock_doms_cur(void) { } |
325 | 313 | ||
@@ -7571,6 +7559,7 @@ struct task_group *sched_create_group(void) | |||
7571 | struct rt_rq *rt_rq; | 7559 | struct rt_rq *rt_rq; |
7572 | struct sched_rt_entity *rt_se; | 7560 | struct sched_rt_entity *rt_se; |
7573 | struct rq *rq; | 7561 | struct rq *rq; |
7562 | unsigned long flags; | ||
7574 | int i; | 7563 | int i; |
7575 | 7564 | ||
7576 | tg = kzalloc(sizeof(*tg), GFP_KERNEL); | 7565 | tg = kzalloc(sizeof(*tg), GFP_KERNEL); |
@@ -7620,7 +7609,7 @@ struct task_group *sched_create_group(void) | |||
7620 | init_tg_rt_entry(rq, tg, rt_rq, rt_se, i, 0); | 7609 | init_tg_rt_entry(rq, tg, rt_rq, rt_se, i, 0); |
7621 | } | 7610 | } |
7622 | 7611 | ||
7623 | lock_task_group_list(); | 7612 | spin_lock_irqsave(&task_group_lock, flags); |
7624 | for_each_possible_cpu(i) { | 7613 | for_each_possible_cpu(i) { |
7625 | rq = cpu_rq(i); | 7614 | rq = cpu_rq(i); |
7626 | cfs_rq = tg->cfs_rq[i]; | 7615 | cfs_rq = tg->cfs_rq[i]; |
@@ -7629,7 +7618,7 @@ struct task_group *sched_create_group(void) | |||
7629 | list_add_rcu(&rt_rq->leaf_rt_rq_list, &rq->leaf_rt_rq_list); | 7618 | list_add_rcu(&rt_rq->leaf_rt_rq_list, &rq->leaf_rt_rq_list); |
7630 | } | 7619 | } |
7631 | list_add_rcu(&tg->list, &task_groups); | 7620 | list_add_rcu(&tg->list, &task_groups); |
7632 | unlock_task_group_list(); | 7621 | spin_unlock_irqrestore(&task_group_lock, flags); |
7633 | 7622 | ||
7634 | return tg; | 7623 | return tg; |
7635 | 7624 | ||
@@ -7650,9 +7639,10 @@ void sched_destroy_group(struct task_group *tg) | |||
7650 | { | 7639 | { |
7651 | struct cfs_rq *cfs_rq = NULL; | 7640 | struct cfs_rq *cfs_rq = NULL; |
7652 | struct rt_rq *rt_rq = NULL; | 7641 | struct rt_rq *rt_rq = NULL; |
7642 | unsigned long flags; | ||
7653 | int i; | 7643 | int i; |
7654 | 7644 | ||
7655 | lock_task_group_list(); | 7645 | spin_lock_irqsave(&task_group_lock, flags); |
7656 | for_each_possible_cpu(i) { | 7646 | for_each_possible_cpu(i) { |
7657 | cfs_rq = tg->cfs_rq[i]; | 7647 | cfs_rq = tg->cfs_rq[i]; |
7658 | list_del_rcu(&cfs_rq->leaf_cfs_rq_list); | 7648 | list_del_rcu(&cfs_rq->leaf_cfs_rq_list); |
@@ -7660,7 +7650,7 @@ void sched_destroy_group(struct task_group *tg) | |||
7660 | list_del_rcu(&rt_rq->leaf_rt_rq_list); | 7650 | list_del_rcu(&rt_rq->leaf_rt_rq_list); |
7661 | } | 7651 | } |
7662 | list_del_rcu(&tg->list); | 7652 | list_del_rcu(&tg->list); |
7663 | unlock_task_group_list(); | 7653 | spin_unlock_irqrestore(&task_group_lock, flags); |
7664 | 7654 | ||
7665 | BUG_ON(!cfs_rq); | 7655 | BUG_ON(!cfs_rq); |
7666 | 7656 | ||
@@ -7728,13 +7718,16 @@ static void set_se_shares(struct sched_entity *se, unsigned long shares) | |||
7728 | } | 7718 | } |
7729 | } | 7719 | } |
7730 | 7720 | ||
7721 | static DEFINE_MUTEX(shares_mutex); | ||
7722 | |||
7731 | int sched_group_set_shares(struct task_group *tg, unsigned long shares) | 7723 | int sched_group_set_shares(struct task_group *tg, unsigned long shares) |
7732 | { | 7724 | { |
7733 | int i; | 7725 | int i; |
7734 | struct cfs_rq *cfs_rq; | 7726 | struct cfs_rq *cfs_rq; |
7735 | struct rq *rq; | 7727 | struct rq *rq; |
7728 | unsigned long flags; | ||
7736 | 7729 | ||
7737 | lock_task_group_list(); | 7730 | mutex_lock(&shares_mutex); |
7738 | if (tg->shares == shares) | 7731 | if (tg->shares == shares) |
7739 | goto done; | 7732 | goto done; |
7740 | 7733 | ||
@@ -7746,10 +7739,12 @@ int sched_group_set_shares(struct task_group *tg, unsigned long shares) | |||
7746 | * load_balance_fair) from referring to this group first, | 7739 | * load_balance_fair) from referring to this group first, |
7747 | * by taking it off the rq->leaf_cfs_rq_list on each cpu. | 7740 | * by taking it off the rq->leaf_cfs_rq_list on each cpu. |
7748 | */ | 7741 | */ |
7742 | spin_lock_irqsave(&task_group_lock, flags); | ||
7749 | for_each_possible_cpu(i) { | 7743 | for_each_possible_cpu(i) { |
7750 | cfs_rq = tg->cfs_rq[i]; | 7744 | cfs_rq = tg->cfs_rq[i]; |
7751 | list_del_rcu(&cfs_rq->leaf_cfs_rq_list); | 7745 | list_del_rcu(&cfs_rq->leaf_cfs_rq_list); |
7752 | } | 7746 | } |
7747 | spin_unlock_irqrestore(&task_group_lock, flags); | ||
7753 | 7748 | ||
7754 | /* wait for any ongoing reference to this group to finish */ | 7749 | /* wait for any ongoing reference to this group to finish */ |
7755 | synchronize_sched(); | 7750 | synchronize_sched(); |
@@ -7769,13 +7764,15 @@ int sched_group_set_shares(struct task_group *tg, unsigned long shares) | |||
7769 | * Enable load balance activity on this group, by inserting it back on | 7764 | * Enable load balance activity on this group, by inserting it back on |
7770 | * each cpu's rq->leaf_cfs_rq_list. | 7765 | * each cpu's rq->leaf_cfs_rq_list. |
7771 | */ | 7766 | */ |
7767 | spin_lock_irqsave(&task_group_lock, flags); | ||
7772 | for_each_possible_cpu(i) { | 7768 | for_each_possible_cpu(i) { |
7773 | rq = cpu_rq(i); | 7769 | rq = cpu_rq(i); |
7774 | cfs_rq = tg->cfs_rq[i]; | 7770 | cfs_rq = tg->cfs_rq[i]; |
7775 | list_add_rcu(&cfs_rq->leaf_cfs_rq_list, &rq->leaf_cfs_rq_list); | 7771 | list_add_rcu(&cfs_rq->leaf_cfs_rq_list, &rq->leaf_cfs_rq_list); |
7776 | } | 7772 | } |
7773 | spin_unlock_irqrestore(&task_group_lock, flags); | ||
7777 | done: | 7774 | done: |
7778 | unlock_task_group_list(); | 7775 | mutex_unlock(&shares_mutex); |
7779 | return 0; | 7776 | return 0; |
7780 | } | 7777 | } |
7781 | 7778 | ||