diff options
author | Mike Galbraith <bitbucket@online.de> | 2013-01-28 06:19:25 -0500 |
---|---|---|
committer | Ingo Molnar <mingo@kernel.org> | 2013-02-04 14:07:24 -0500 |
commit | e0a79f529d5ba2507486d498b25da40911d95cf6 (patch) | |
tree | 469947cd4407877ba69aa474cdfed0f2bda61d92 /kernel/sched | |
parent | 60334caf37dc7c59120b21faa625534a6fffead0 (diff) |
sched: Fix select_idle_sibling() bouncing cow syndrome
If the previous CPU is cache affine and idle, select it.
The current implementation simply traverses the sd_llc domain,
taking the first idle CPU encountered, which walks buddy pairs
hand in hand over the package, inflicting excruciating pain.
1 tbench pair (worst case) in a 10 core + SMT package:
pre 15.22 MB/sec 1 procs
post 252.01 MB/sec 1 procs
Signed-off-by: Mike Galbraith <bitbucket@online.de>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1359371965.5783.127.camel@marge.simpson.net
Signed-off-by: Ingo Molnar <mingo@kernel.org>
Diffstat (limited to 'kernel/sched')
-rw-r--r-- | kernel/sched/fair.c | 21 |
1 files changed, 7 insertions, 14 deletions
diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c index 8dbee9f4ceb2..ed18c74db017 100644 --- a/kernel/sched/fair.c +++ b/kernel/sched/fair.c | |||
@@ -3252,25 +3252,18 @@ find_idlest_cpu(struct sched_group *group, struct task_struct *p, int this_cpu) | |||
3252 | */ | 3252 | */ |
3253 | static int select_idle_sibling(struct task_struct *p, int target) | 3253 | static int select_idle_sibling(struct task_struct *p, int target) |
3254 | { | 3254 | { |
3255 | int cpu = smp_processor_id(); | ||
3256 | int prev_cpu = task_cpu(p); | ||
3257 | struct sched_domain *sd; | 3255 | struct sched_domain *sd; |
3258 | struct sched_group *sg; | 3256 | struct sched_group *sg; |
3259 | int i; | 3257 | int i = task_cpu(p); |
3260 | 3258 | ||
3261 | /* | 3259 | if (idle_cpu(target)) |
3262 | * If the task is going to be woken-up on this cpu and if it is | 3260 | return target; |
3263 | * already idle, then it is the right target. | ||
3264 | */ | ||
3265 | if (target == cpu && idle_cpu(cpu)) | ||
3266 | return cpu; | ||
3267 | 3261 | ||
3268 | /* | 3262 | /* |
3269 | * If the task is going to be woken-up on the cpu where it previously | 3263 | * If the prevous cpu is cache affine and idle, don't be stupid. |
3270 | * ran and if it is currently idle, then it the right target. | ||
3271 | */ | 3264 | */ |
3272 | if (target == prev_cpu && idle_cpu(prev_cpu)) | 3265 | if (i != target && cpus_share_cache(i, target) && idle_cpu(i)) |
3273 | return prev_cpu; | 3266 | return i; |
3274 | 3267 | ||
3275 | /* | 3268 | /* |
3276 | * Otherwise, iterate the domains and find an elegible idle cpu. | 3269 | * Otherwise, iterate the domains and find an elegible idle cpu. |
@@ -3284,7 +3277,7 @@ static int select_idle_sibling(struct task_struct *p, int target) | |||
3284 | goto next; | 3277 | goto next; |
3285 | 3278 | ||
3286 | for_each_cpu(i, sched_group_cpus(sg)) { | 3279 | for_each_cpu(i, sched_group_cpus(sg)) { |
3287 | if (!idle_cpu(i)) | 3280 | if (i == target || !idle_cpu(i)) |
3288 | goto next; | 3281 | goto next; |
3289 | } | 3282 | } |
3290 | 3283 | ||