diff options
author | Preeti U Murthy <preeti@linux.vnet.ibm.com> | 2013-10-29 23:12:52 -0400 |
---|---|---|
committer | Ingo Molnar <mingo@kernel.org> | 2013-11-06 06:37:55 -0500 |
commit | 37dc6b50cee97954c4e6edcd5b1fa614b76038ee (patch) | |
tree | f317a2532d134b113c088bdf5026fb4aef1423c4 | |
parent | 2042abe7977222ef606306faa2dce8fd51e98e65 (diff) |
sched: Remove unnecessary iteration over sched domains to update nr_busy_cpus
nr_busy_cpus parameter is used by nohz_kick_needed() to find out the
number of busy cpus in a sched domain which has SD_SHARE_PKG_RESOURCES
flag set. Therefore instead of updating nr_busy_cpus at every level
of sched domain, since it is irrelevant, we can update this parameter
only at the parent domain of the sd which has this flag set. Introduce
a per-cpu parameter sd_busy which represents this parent domain.
In nohz_kick_needed() we directly query the nr_busy_cpus parameter
associated with the groups of sd_busy.
By associating sd_busy with the highest domain which has
SD_SHARE_PKG_RESOURCES flag set, we cover all lower level domains
which could have this flag set and trigger nohz_idle_balancing if any
of the levels have more than one busy cpu.
sd_busy is irrelevant for asymmetric load balancing. However sd_asym
has been introduced to represent the highest sched domain which has
SD_ASYM_PACKING flag set so that it can be queried directly when
required.
While we are at it, we might as well change the nohz_idle parameter to
be updated at the sd_busy domain level alone and not the base domain
level of a CPU. This will unify the concept of busy cpus at just one
level of sched domain where it is currently used.
Signed-off-by: Preeti U Murthy<preeti@linux.vnet.ibm.com>
Signed-off-by: Peter Zijlstra <peterz@infradead.org>
Cc: svaidy@linux.vnet.ibm.com
Cc: vincent.guittot@linaro.org
Cc: bitbucket@online.de
Cc: benh@kernel.crashing.org
Cc: anton@samba.org
Cc: Morten.Rasmussen@arm.com
Cc: pjt@google.com
Cc: peterz@infradead.org
Cc: mikey@neuling.org
Link: http://lkml.kernel.org/r/20131030031252.23426.4417.stgit@preeti.in.ibm.com
Signed-off-by: Ingo Molnar <mingo@kernel.org>
-rw-r--r-- | kernel/sched/core.c | 6 | ||||
-rw-r--r-- | kernel/sched/fair.c | 38 | ||||
-rw-r--r-- | kernel/sched/sched.h | 2 |
3 files changed, 28 insertions, 18 deletions
diff --git a/kernel/sched/core.c b/kernel/sched/core.c index aa066f306be2..1deccd78be98 100644 --- a/kernel/sched/core.c +++ b/kernel/sched/core.c | |||
@@ -4883,6 +4883,8 @@ DEFINE_PER_CPU(struct sched_domain *, sd_llc); | |||
4883 | DEFINE_PER_CPU(int, sd_llc_size); | 4883 | DEFINE_PER_CPU(int, sd_llc_size); |
4884 | DEFINE_PER_CPU(int, sd_llc_id); | 4884 | DEFINE_PER_CPU(int, sd_llc_id); |
4885 | DEFINE_PER_CPU(struct sched_domain *, sd_numa); | 4885 | DEFINE_PER_CPU(struct sched_domain *, sd_numa); |
4886 | DEFINE_PER_CPU(struct sched_domain *, sd_busy); | ||
4887 | DEFINE_PER_CPU(struct sched_domain *, sd_asym); | ||
4886 | 4888 | ||
4887 | static void update_top_cache_domain(int cpu) | 4889 | static void update_top_cache_domain(int cpu) |
4888 | { | 4890 | { |
@@ -4894,6 +4896,7 @@ static void update_top_cache_domain(int cpu) | |||
4894 | if (sd) { | 4896 | if (sd) { |
4895 | id = cpumask_first(sched_domain_span(sd)); | 4897 | id = cpumask_first(sched_domain_span(sd)); |
4896 | size = cpumask_weight(sched_domain_span(sd)); | 4898 | size = cpumask_weight(sched_domain_span(sd)); |
4899 | rcu_assign_pointer(per_cpu(sd_busy, cpu), sd->parent); | ||
4897 | } | 4900 | } |
4898 | 4901 | ||
4899 | rcu_assign_pointer(per_cpu(sd_llc, cpu), sd); | 4902 | rcu_assign_pointer(per_cpu(sd_llc, cpu), sd); |
@@ -4902,6 +4905,9 @@ static void update_top_cache_domain(int cpu) | |||
4902 | 4905 | ||
4903 | sd = lowest_flag_domain(cpu, SD_NUMA); | 4906 | sd = lowest_flag_domain(cpu, SD_NUMA); |
4904 | rcu_assign_pointer(per_cpu(sd_numa, cpu), sd); | 4907 | rcu_assign_pointer(per_cpu(sd_numa, cpu), sd); |
4908 | |||
4909 | sd = highest_flag_domain(cpu, SD_ASYM_PACKING); | ||
4910 | rcu_assign_pointer(per_cpu(sd_asym, cpu), sd); | ||
4905 | } | 4911 | } |
4906 | 4912 | ||
4907 | /* | 4913 | /* |
diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c index 074551a792f7..df77c605c7a6 100644 --- a/kernel/sched/fair.c +++ b/kernel/sched/fair.c | |||
@@ -6534,16 +6534,16 @@ static inline void nohz_balance_exit_idle(int cpu) | |||
6534 | static inline void set_cpu_sd_state_busy(void) | 6534 | static inline void set_cpu_sd_state_busy(void) |
6535 | { | 6535 | { |
6536 | struct sched_domain *sd; | 6536 | struct sched_domain *sd; |
6537 | int cpu = smp_processor_id(); | ||
6537 | 6538 | ||
6538 | rcu_read_lock(); | 6539 | rcu_read_lock(); |
6539 | sd = rcu_dereference_check_sched_domain(this_rq()->sd); | 6540 | sd = rcu_dereference(per_cpu(sd_busy, cpu)); |
6540 | 6541 | ||
6541 | if (!sd || !sd->nohz_idle) | 6542 | if (!sd || !sd->nohz_idle) |
6542 | goto unlock; | 6543 | goto unlock; |
6543 | sd->nohz_idle = 0; | 6544 | sd->nohz_idle = 0; |
6544 | 6545 | ||
6545 | for (; sd; sd = sd->parent) | 6546 | atomic_inc(&sd->groups->sgp->nr_busy_cpus); |
6546 | atomic_inc(&sd->groups->sgp->nr_busy_cpus); | ||
6547 | unlock: | 6547 | unlock: |
6548 | rcu_read_unlock(); | 6548 | rcu_read_unlock(); |
6549 | } | 6549 | } |
@@ -6551,16 +6551,16 @@ unlock: | |||
6551 | void set_cpu_sd_state_idle(void) | 6551 | void set_cpu_sd_state_idle(void) |
6552 | { | 6552 | { |
6553 | struct sched_domain *sd; | 6553 | struct sched_domain *sd; |
6554 | int cpu = smp_processor_id(); | ||
6554 | 6555 | ||
6555 | rcu_read_lock(); | 6556 | rcu_read_lock(); |
6556 | sd = rcu_dereference_check_sched_domain(this_rq()->sd); | 6557 | sd = rcu_dereference(per_cpu(sd_busy, cpu)); |
6557 | 6558 | ||
6558 | if (!sd || sd->nohz_idle) | 6559 | if (!sd || sd->nohz_idle) |
6559 | goto unlock; | 6560 | goto unlock; |
6560 | sd->nohz_idle = 1; | 6561 | sd->nohz_idle = 1; |
6561 | 6562 | ||
6562 | for (; sd; sd = sd->parent) | 6563 | atomic_dec(&sd->groups->sgp->nr_busy_cpus); |
6563 | atomic_dec(&sd->groups->sgp->nr_busy_cpus); | ||
6564 | unlock: | 6564 | unlock: |
6565 | rcu_read_unlock(); | 6565 | rcu_read_unlock(); |
6566 | } | 6566 | } |
@@ -6767,6 +6767,8 @@ static inline int nohz_kick_needed(struct rq *rq, int cpu) | |||
6767 | { | 6767 | { |
6768 | unsigned long now = jiffies; | 6768 | unsigned long now = jiffies; |
6769 | struct sched_domain *sd; | 6769 | struct sched_domain *sd; |
6770 | struct sched_group_power *sgp; | ||
6771 | int nr_busy; | ||
6770 | 6772 | ||
6771 | if (unlikely(idle_cpu(cpu))) | 6773 | if (unlikely(idle_cpu(cpu))) |
6772 | return 0; | 6774 | return 0; |
@@ -6792,22 +6794,22 @@ static inline int nohz_kick_needed(struct rq *rq, int cpu) | |||
6792 | goto need_kick; | 6794 | goto need_kick; |
6793 | 6795 | ||
6794 | rcu_read_lock(); | 6796 | rcu_read_lock(); |
6795 | for_each_domain(cpu, sd) { | 6797 | sd = rcu_dereference(per_cpu(sd_busy, cpu)); |
6796 | struct sched_group *sg = sd->groups; | ||
6797 | struct sched_group_power *sgp = sg->sgp; | ||
6798 | int nr_busy = atomic_read(&sgp->nr_busy_cpus); | ||
6799 | 6798 | ||
6800 | if (sd->flags & SD_SHARE_PKG_RESOURCES && nr_busy > 1) | 6799 | if (sd) { |
6801 | goto need_kick_unlock; | 6800 | sgp = sd->groups->sgp; |
6801 | nr_busy = atomic_read(&sgp->nr_busy_cpus); | ||
6802 | 6802 | ||
6803 | if (sd->flags & SD_ASYM_PACKING | 6803 | if (nr_busy > 1) |
6804 | && (cpumask_first_and(nohz.idle_cpus_mask, | ||
6805 | sched_domain_span(sd)) < cpu)) | ||
6806 | goto need_kick_unlock; | 6804 | goto need_kick_unlock; |
6807 | |||
6808 | if (!(sd->flags & (SD_SHARE_PKG_RESOURCES | SD_ASYM_PACKING))) | ||
6809 | break; | ||
6810 | } | 6805 | } |
6806 | |||
6807 | sd = rcu_dereference(per_cpu(sd_asym, cpu)); | ||
6808 | |||
6809 | if (sd && (cpumask_first_and(nohz.idle_cpus_mask, | ||
6810 | sched_domain_span(sd)) < cpu)) | ||
6811 | goto need_kick_unlock; | ||
6812 | |||
6811 | rcu_read_unlock(); | 6813 | rcu_read_unlock(); |
6812 | return 0; | 6814 | return 0; |
6813 | 6815 | ||
diff --git a/kernel/sched/sched.h b/kernel/sched/sched.h index 4e650acffed7..88c85b21d633 100644 --- a/kernel/sched/sched.h +++ b/kernel/sched/sched.h | |||
@@ -623,6 +623,8 @@ DECLARE_PER_CPU(struct sched_domain *, sd_llc); | |||
623 | DECLARE_PER_CPU(int, sd_llc_size); | 623 | DECLARE_PER_CPU(int, sd_llc_size); |
624 | DECLARE_PER_CPU(int, sd_llc_id); | 624 | DECLARE_PER_CPU(int, sd_llc_id); |
625 | DECLARE_PER_CPU(struct sched_domain *, sd_numa); | 625 | DECLARE_PER_CPU(struct sched_domain *, sd_numa); |
626 | DECLARE_PER_CPU(struct sched_domain *, sd_busy); | ||
627 | DECLARE_PER_CPU(struct sched_domain *, sd_asym); | ||
626 | 628 | ||
627 | struct sched_group_power { | 629 | struct sched_group_power { |
628 | atomic_t ref; | 630 | atomic_t ref; |