summary | refs | log | tree | commit | diff | stats
path: root/kernel/sched/fair.c
diff options
context:
space:
mode:
author: Joonsoo Kim <iamjoonsoo.kim@lge.com> 2013-04-23 04:27:42 -0400
committer: Ingo Molnar <mingo@kernel.org> 2013-04-24 02:52:46 -0400
commit: e02e60c109ca70935bad1131976bdbf5160cf576 (patch)
tree: 56295c7eacea90fb95a2febf178ea287664e4407 /kernel/sched/fair.c
parent: e6252c3ef4b9cd251b53f7b68035f395d20b044e (diff)
sched: Prevent to re-select dst-cpu in load_balance()
Commit 88b8dac0 makes load_balance() consider other cpus in its group. However, that commit has no code to prevent dst-cpu from being re-selected, so the same dst-cpu can be selected over and over. This patch adds functionality to load_balance() to exclude a cpu once it has been selected. We prevent re-selection of dst_cpu via env's cpus, so env's cpus is now a candidate mask not only for src_cpus but also for dst_cpus. With this patch, we can remove lb_iterations and max_lb_iterations, because we decide whether we can go ahead or not via env's cpus. Signed-off-by: Joonsoo Kim <iamjoonsoo.kim@lge.com> Acked-by: Peter Zijlstra <a.p.zijlstra@chello.nl> Tested-by: Jason Low <jason.low2@hp.com> Cc: Srivatsa Vaddagiri <vatsa@linux.vnet.ibm.com> Cc: Davidlohr Bueso <davidlohr.bueso@hp.com> Cc: Peter Zijlstra <peterz@infradead.org> Link: http://lkml.kernel.org/r/1366705662-3587-7-git-send-email-iamjoonsoo.kim@lge.com Signed-off-by: Ingo Molnar <mingo@kernel.org>
Diffstat (limited to 'kernel/sched/fair.c')
-rw-r--r-- kernel/sched/fair.c 33
1 files changed, 15 insertions, 18 deletions
diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c
index 5b1e96687b49..acaf567a03d2 100644
--- a/kernel/sched/fair.c
+++ b/kernel/sched/fair.c
@@ -3905,7 +3905,7 @@ int can_migrate_task(struct task_struct *p, struct lb_env *env)
3905 return 0; 3905 return 0;
3906 3906
3907 if (!cpumask_test_cpu(env->dst_cpu, tsk_cpus_allowed(p))) { 3907 if (!cpumask_test_cpu(env->dst_cpu, tsk_cpus_allowed(p))) {
3908 int new_dst_cpu; 3908 int cpu;
3909 3909
3910 schedstat_inc(p, se.statistics.nr_failed_migrations_affine); 3910 schedstat_inc(p, se.statistics.nr_failed_migrations_affine);
3911 3911
@@ -3920,12 +3920,15 @@ int can_migrate_task(struct task_struct *p, struct lb_env *env)
3920 if (!env->dst_grpmask || (env->flags & LBF_SOME_PINNED)) 3920 if (!env->dst_grpmask || (env->flags & LBF_SOME_PINNED))
3921 return 0; 3921 return 0;
3922 3922
3923 new_dst_cpu = cpumask_first_and(env->dst_grpmask, 3923 /* Prevent to re-select dst_cpu via env's cpus */
3924 tsk_cpus_allowed(p)); 3924 for_each_cpu_and(cpu, env->dst_grpmask, env->cpus) {
3925 if (new_dst_cpu < nr_cpu_ids) { 3925 if (cpumask_test_cpu(cpu, tsk_cpus_allowed(p))) {
3926 env->flags |= LBF_SOME_PINNED; 3926 env->flags |= LBF_SOME_PINNED;
3927 env->new_dst_cpu = new_dst_cpu; 3927 env->new_dst_cpu = cpu;
3928 break;
3929 }
3928 } 3930 }
3931
3929 return 0; 3932 return 0;
3930 } 3933 }
3931 3934
@@ -5008,7 +5011,6 @@ static int load_balance(int this_cpu, struct rq *this_rq,
5008 int *balance) 5011 int *balance)
5009{ 5012{
5010 int ld_moved, cur_ld_moved, active_balance = 0; 5013 int ld_moved, cur_ld_moved, active_balance = 0;
5011 int lb_iterations, max_lb_iterations;
5012 struct sched_group *group; 5014 struct sched_group *group;
5013 struct rq *busiest; 5015 struct rq *busiest;
5014 unsigned long flags; 5016 unsigned long flags;
@@ -5028,15 +5030,8 @@ static int load_balance(int this_cpu, struct rq *this_rq,
5028 * For NEWLY_IDLE load_balancing, we don't need to consider 5030 * For NEWLY_IDLE load_balancing, we don't need to consider
5029 * other cpus in our group 5031 * other cpus in our group
5030 */ 5032 */
5031 if (idle == CPU_NEWLY_IDLE) { 5033 if (idle == CPU_NEWLY_IDLE)
5032 env.dst_grpmask = NULL; 5034 env.dst_grpmask = NULL;
5033 /*
5034 * we don't care max_lb_iterations in this case,
5035 * in following patch, this will be removed
5036 */
5037 max_lb_iterations = 0;
5038 } else
5039 max_lb_iterations = cpumask_weight(env.dst_grpmask);
5040 5035
5041 cpumask_copy(cpus, cpu_active_mask); 5036 cpumask_copy(cpus, cpu_active_mask);
5042 5037
@@ -5064,7 +5059,6 @@ redo:
5064 schedstat_add(sd, lb_imbalance[idle], env.imbalance); 5059 schedstat_add(sd, lb_imbalance[idle], env.imbalance);
5065 5060
5066 ld_moved = 0; 5061 ld_moved = 0;
5067 lb_iterations = 1;
5068 if (busiest->nr_running > 1) { 5062 if (busiest->nr_running > 1) {
5069 /* 5063 /*
5070 * Attempt to move tasks. If find_busiest_group has found 5064 * Attempt to move tasks. If find_busiest_group has found
@@ -5121,14 +5115,17 @@ more_balance:
5121 * moreover subsequent load balance cycles should correct the 5115 * moreover subsequent load balance cycles should correct the
5122 * excess load moved. 5116 * excess load moved.
5123 */ 5117 */
5124 if ((env.flags & LBF_SOME_PINNED) && env.imbalance > 0 && 5118 if ((env.flags & LBF_SOME_PINNED) && env.imbalance > 0) {
5125 lb_iterations++ < max_lb_iterations) {
5126 5119
5127 env.dst_rq = cpu_rq(env.new_dst_cpu); 5120 env.dst_rq = cpu_rq(env.new_dst_cpu);
5128 env.dst_cpu = env.new_dst_cpu; 5121 env.dst_cpu = env.new_dst_cpu;
5129 env.flags &= ~LBF_SOME_PINNED; 5122 env.flags &= ~LBF_SOME_PINNED;
5130 env.loop = 0; 5123 env.loop = 0;
5131 env.loop_break = sched_nr_migrate_break; 5124 env.loop_break = sched_nr_migrate_break;
5125
5126 /* Prevent to re-select dst_cpu via env's cpus */
5127 cpumask_clear_cpu(env.dst_cpu, env.cpus);
5128
5132 /* 5129 /*
5133 * Go back to "more_balance" rather than "redo" since we 5130 * Go back to "more_balance" rather than "redo" since we
5134 * need to continue with same src_cpu. 5131 * need to continue with same src_cpu.