aboutsummaryrefslogtreecommitdiffstats
path: root/kernel
diff options
context:
space:
mode:
authorPaul Turner <pjt@google.com>2011-07-21 12:43:27 -0400
committerIngo Molnar <mingo@elte.hu>2011-08-14 06:01:13 -0400
commit953bfcd10e6f3697233e8e5128c611d275da39c1 (patch)
treea3ca8136bb9e992bb40945c5eee2a8dcc0fd0b57 /kernel
parent5710f15b52664ae0bfa60a66d75464769d297b2b (diff)
sched: Implement hierarchical task accounting for SCHED_OTHER
Introduce hierarchical task accounting for the group scheduling case in CFS, as well as promoting the responsibility for maintaining rq->nr_running to the scheduling classes. The primary motivation for this is that with scheduling classes supporting bandwidth throttling it is possible for entities participating in throttled sub-trees to not have root visible changes in rq->nr_running across activate and de-activate operations. This in turn leads to incorrect idle and weight-per-task load balance decisions. This also allows us to make a small fixlet to the fastpath in pick_next_task() under group scheduling. Note: this issue also exists with the existing sched_rt throttling mechanism. This patch does not address that. Signed-off-by: Paul Turner <pjt@google.com> Reviewed-by: Hidetoshi Seto <seto.hidetoshi@jp.fujitsu.com> Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl> Link: http://lkml.kernel.org/r/20110721184756.878333391@google.com Signed-off-by: Ingo Molnar <mingo@elte.hu>
Diffstat (limited to 'kernel')
-rw-r--r--kernel/sched.c6
-rw-r--r--kernel/sched_fair.c6
-rw-r--r--kernel/sched_rt.c5
-rw-r--r--kernel/sched_stoptask.c2
4 files changed, 14 insertions, 5 deletions
diff --git a/kernel/sched.c b/kernel/sched.c
index cf427bb2b65e..cd1a531ca8ff 100644
--- a/kernel/sched.c
+++ b/kernel/sched.c
@@ -311,7 +311,7 @@ struct task_group root_task_group;
311/* CFS-related fields in a runqueue */ 311/* CFS-related fields in a runqueue */
312struct cfs_rq { 312struct cfs_rq {
313 struct load_weight load; 313 struct load_weight load;
314 unsigned long nr_running; 314 unsigned long nr_running, h_nr_running;
315 315
316 u64 exec_clock; 316 u64 exec_clock;
317 u64 min_vruntime; 317 u64 min_vruntime;
@@ -1802,7 +1802,6 @@ static void activate_task(struct rq *rq, struct task_struct *p, int flags)
1802 rq->nr_uninterruptible--; 1802 rq->nr_uninterruptible--;
1803 1803
1804 enqueue_task(rq, p, flags); 1804 enqueue_task(rq, p, flags);
1805 inc_nr_running(rq);
1806} 1805}
1807 1806
1808/* 1807/*
@@ -1814,7 +1813,6 @@ static void deactivate_task(struct rq *rq, struct task_struct *p, int flags)
1814 rq->nr_uninterruptible++; 1813 rq->nr_uninterruptible++;
1815 1814
1816 dequeue_task(rq, p, flags); 1815 dequeue_task(rq, p, flags);
1817 dec_nr_running(rq);
1818} 1816}
1819 1817
1820#ifdef CONFIG_IRQ_TIME_ACCOUNTING 1818#ifdef CONFIG_IRQ_TIME_ACCOUNTING
@@ -4258,7 +4256,7 @@ pick_next_task(struct rq *rq)
4258 * Optimization: we know that if all tasks are in 4256 * Optimization: we know that if all tasks are in
4259 * the fair class we can call that function directly: 4257 * the fair class we can call that function directly:
4260 */ 4258 */
4261 if (likely(rq->nr_running == rq->cfs.nr_running)) { 4259 if (likely(rq->nr_running == rq->cfs.h_nr_running)) {
4262 p = fair_sched_class.pick_next_task(rq); 4260 p = fair_sched_class.pick_next_task(rq);
4263 if (likely(p)) 4261 if (likely(p))
4264 return p; 4262 return p;
diff --git a/kernel/sched_fair.c b/kernel/sched_fair.c
index f4b732a3552b..f86b0cb5eb29 100644
--- a/kernel/sched_fair.c
+++ b/kernel/sched_fair.c
@@ -1310,16 +1310,19 @@ enqueue_task_fair(struct rq *rq, struct task_struct *p, int flags)
1310 break; 1310 break;
1311 cfs_rq = cfs_rq_of(se); 1311 cfs_rq = cfs_rq_of(se);
1312 enqueue_entity(cfs_rq, se, flags); 1312 enqueue_entity(cfs_rq, se, flags);
1313 cfs_rq->h_nr_running++;
1313 flags = ENQUEUE_WAKEUP; 1314 flags = ENQUEUE_WAKEUP;
1314 } 1315 }
1315 1316
1316 for_each_sched_entity(se) { 1317 for_each_sched_entity(se) {
1317 cfs_rq = cfs_rq_of(se); 1318 cfs_rq = cfs_rq_of(se);
1319 cfs_rq->h_nr_running++;
1318 1320
1319 update_cfs_load(cfs_rq, 0); 1321 update_cfs_load(cfs_rq, 0);
1320 update_cfs_shares(cfs_rq); 1322 update_cfs_shares(cfs_rq);
1321 } 1323 }
1322 1324
1325 inc_nr_running(rq);
1323 hrtick_update(rq); 1326 hrtick_update(rq);
1324} 1327}
1325 1328
@@ -1339,6 +1342,7 @@ static void dequeue_task_fair(struct rq *rq, struct task_struct *p, int flags)
1339 for_each_sched_entity(se) { 1342 for_each_sched_entity(se) {
1340 cfs_rq = cfs_rq_of(se); 1343 cfs_rq = cfs_rq_of(se);
1341 dequeue_entity(cfs_rq, se, flags); 1344 dequeue_entity(cfs_rq, se, flags);
1345 cfs_rq->h_nr_running--;
1342 1346
1343 /* Don't dequeue parent if it has other entities besides us */ 1347 /* Don't dequeue parent if it has other entities besides us */
1344 if (cfs_rq->load.weight) { 1348 if (cfs_rq->load.weight) {
@@ -1358,11 +1362,13 @@ static void dequeue_task_fair(struct rq *rq, struct task_struct *p, int flags)
1358 1362
1359 for_each_sched_entity(se) { 1363 for_each_sched_entity(se) {
1360 cfs_rq = cfs_rq_of(se); 1364 cfs_rq = cfs_rq_of(se);
1365 cfs_rq->h_nr_running--;
1361 1366
1362 update_cfs_load(cfs_rq, 0); 1367 update_cfs_load(cfs_rq, 0);
1363 update_cfs_shares(cfs_rq); 1368 update_cfs_shares(cfs_rq);
1364 } 1369 }
1365 1370
1371 dec_nr_running(rq);
1366 hrtick_update(rq); 1372 hrtick_update(rq);
1367} 1373}
1368 1374
diff --git a/kernel/sched_rt.c b/kernel/sched_rt.c
index a8c207ff3492..a9d3c6bc684a 100644
--- a/kernel/sched_rt.c
+++ b/kernel/sched_rt.c
@@ -936,6 +936,8 @@ enqueue_task_rt(struct rq *rq, struct task_struct *p, int flags)
936 936
937 if (!task_current(rq, p) && p->rt.nr_cpus_allowed > 1) 937 if (!task_current(rq, p) && p->rt.nr_cpus_allowed > 1)
938 enqueue_pushable_task(rq, p); 938 enqueue_pushable_task(rq, p);
939
940 inc_nr_running(rq);
939} 941}
940 942
941static void dequeue_task_rt(struct rq *rq, struct task_struct *p, int flags) 943static void dequeue_task_rt(struct rq *rq, struct task_struct *p, int flags)
@@ -946,6 +948,8 @@ static void dequeue_task_rt(struct rq *rq, struct task_struct *p, int flags)
946 dequeue_rt_entity(rt_se); 948 dequeue_rt_entity(rt_se);
947 949
948 dequeue_pushable_task(rq, p); 950 dequeue_pushable_task(rq, p);
951
952 dec_nr_running(rq);
949} 953}
950 954
951/* 955/*
@@ -1841,4 +1845,3 @@ static void print_rt_stats(struct seq_file *m, int cpu)
1841 rcu_read_unlock(); 1845 rcu_read_unlock();
1842} 1846}
1843#endif /* CONFIG_SCHED_DEBUG */ 1847#endif /* CONFIG_SCHED_DEBUG */
1844
diff --git a/kernel/sched_stoptask.c b/kernel/sched_stoptask.c
index 6f437632afab..8b44e7fa7fb3 100644
--- a/kernel/sched_stoptask.c
+++ b/kernel/sched_stoptask.c
@@ -34,11 +34,13 @@ static struct task_struct *pick_next_task_stop(struct rq *rq)
34static void 34static void
35enqueue_task_stop(struct rq *rq, struct task_struct *p, int flags) 35enqueue_task_stop(struct rq *rq, struct task_struct *p, int flags)
36{ 36{
37 inc_nr_running(rq);
37} 38}
38 39
39static void 40static void
40dequeue_task_stop(struct rq *rq, struct task_struct *p, int flags) 41dequeue_task_stop(struct rq *rq, struct task_struct *p, int flags)
41{ 42{
43 dec_nr_running(rq);
42} 44}
43 45
44static void yield_task_stop(struct rq *rq) 46static void yield_task_stop(struct rq *rq)