author		Linus Torvalds <torvalds@linux-foundation.org>	2012-05-22 21:27:32 -0400
committer	Linus Torvalds <torvalds@linux-foundation.org>	2012-05-22 21:27:32 -0400
commit		d79ee93de909dfb252279b9a95978bbda9a814a9 (patch)
tree		bfccca60fd36259ff4bcc5e78a2c272fbd680065 /arch/x86/kernel/smpboot.c
parent		2ff2b289a695807e291e1ed9f639d8a3ba5f4254 (diff)
parent		1c2927f18576d65631d8e0ddd19e1d023183222e (diff)
Merge branch 'sched-core-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip
Pull scheduler changes from Ingo Molnar:
"The biggest change is the cleanup/simplification of the load-balancer:
instead of the current practice of architectures twiddling scheduler
internal data structures and providing the scheduler domains in
colorfully inconsistent ways, we now have generic scheduler code in
kernel/sched/core.c:sched_init_numa() that looks at the architecture's
node_distance() parameters and (while not fully trusting them) deduces a
NUMA topology from them.
This inevitably changes balancing behavior - hopefully for the better.
There are various smaller optimizations, cleanups and fixlets as well"
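
A minimal sketch of the deduction described above, in plain userspace C
(illustration only, not the actual sched_init_numa() code: the 4-node
SLIT-style distance table and the level-building loop are assumptions
made for this example). The idea: collect the distinct node_distance()
values, then build one topology level per distance, grouping each node
with every node no further away than that distance.

/*
 * Sketch: deduce NUMA topology levels from a node_distance() table.
 * Hypothetical data and simplified logic; the kernel's real version
 * lives in kernel/sched/core.c:sched_init_numa().
 */
#include <stdio.h>

#define NR_NODES 4

/* Hypothetical SLIT-style table: 10 = local node. */
static const int node_distance[NR_NODES][NR_NODES] = {
	{ 10, 20, 20, 30 },
	{ 20, 10, 30, 20 },
	{ 20, 30, 10, 20 },
	{ 30, 20, 20, 10 },
};

int main(void)
{
	int dists[NR_NODES * NR_NODES], nr_dists = 0;

	/* Collect the distinct distances... */
	for (int i = 0; i < NR_NODES; i++)
		for (int j = 0; j < NR_NODES; j++) {
			int d = node_distance[i][j], k;

			for (k = 0; k < nr_dists && dists[k] != d; k++)
				;
			if (k == nr_dists)
				dists[nr_dists++] = d;
		}

	/* ...and sort them ascending (tiny table, insertion sort). */
	for (int i = 1; i < nr_dists; i++)
		for (int j = i; j > 0 && dists[j] < dists[j - 1]; j--) {
			int t = dists[j];

			dists[j] = dists[j - 1];
			dists[j - 1] = t;
		}

	/*
	 * One topology level per distance: a node's group at a level
	 * is every node no further away than that level's distance.
	 */
	for (int l = 0; l < nr_dists; l++) {
		printf("level %d (distance <= %d):\n", l, dists[l]);
		for (int i = 0; i < NR_NODES; i++) {
			printf("  node %d: {", i);
			for (int j = 0; j < NR_NODES; j++)
				if (node_distance[i][j] <= dists[l])
					printf(" %d", j);
			printf(" }\n");
		}
	}
	return 0;
}

In the generic code each such level then becomes a candidate NUMA
scheduling domain, which is what replaces the per-architecture setup.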
* 'sched-core-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip:
sched: Taint kernel with TAINT_WARN after sleep-in-atomic bug
sched: Remove stale power aware scheduling remnants and dysfunctional knobs
sched/debug: Fix printing large integers on 32-bit platforms
sched/fair: Improve the ->group_imb logic
sched/nohz: Fix rq->cpu_load[] calculations
sched/numa: Don't scale the imbalance
sched/fair: Revert sched-domain iteration breakage
sched/x86: Rewrite set_cpu_sibling_map()
sched/numa: Fix the new NUMA topology bits
sched/numa: Rewrite the CONFIG_NUMA sched domain support
sched/fair: Propagate 'struct lb_env' usage into find_busiest_group
sched/fair: Add some serialization to the sched_domain load-balance walk
sched/fair: Let minimally loaded cpu balance the group
sched: Change rq->nr_running to unsigned int
x86/numa: Check for nonsensical topologies on real hw as well
x86/numa: Hard partition cpu topology masks on node boundaries
x86/numa: Allow specifying node_distance() for numa=fake
x86/sched: Make mwait_usable() heed to "idle=" kernel parameters properly
sched: Update documentation and comments
sched_rt: Avoid unnecessary dequeue and enqueue of pushable tasks in set_cpus_allowed_rt()
Diffstat (limited to 'arch/x86/kernel/smpboot.c')
-rw-r--r--	arch/x86/kernel/smpboot.c	108
1 file changed, 69 insertions(+), 39 deletions(-)
diff --git a/arch/x86/kernel/smpboot.c b/arch/x86/kernel/smpboot.c
index 3acaf51dfddb..433529e29be4 100644
--- a/arch/x86/kernel/smpboot.c
+++ b/arch/x86/kernel/smpboot.c
@@ -299,59 +299,90 @@ void __cpuinit smp_store_cpu_info(int id)
 	identify_secondary_cpu(c);
 }
 
-static void __cpuinit link_thread_siblings(int cpu1, int cpu2)
+static bool __cpuinit
+topology_sane(struct cpuinfo_x86 *c, struct cpuinfo_x86 *o, const char *name)
 {
-	cpumask_set_cpu(cpu1, cpu_sibling_mask(cpu2));
-	cpumask_set_cpu(cpu2, cpu_sibling_mask(cpu1));
-	cpumask_set_cpu(cpu1, cpu_core_mask(cpu2));
-	cpumask_set_cpu(cpu2, cpu_core_mask(cpu1));
-	cpumask_set_cpu(cpu1, cpu_llc_shared_mask(cpu2));
-	cpumask_set_cpu(cpu2, cpu_llc_shared_mask(cpu1));
+	int cpu1 = c->cpu_index, cpu2 = o->cpu_index;
+
+	return !WARN_ONCE(cpu_to_node(cpu1) != cpu_to_node(cpu2),
+		"sched: CPU #%d's %s-sibling CPU #%d is not on the same node! "
+		"[node: %d != %d]. Ignoring dependency.\n",
+		cpu1, name, cpu2, cpu_to_node(cpu1), cpu_to_node(cpu2));
 }
 
+#define link_mask(_m, c1, c2)						\
+do {									\
+	cpumask_set_cpu((c1), cpu_##_m##_mask(c2));			\
+	cpumask_set_cpu((c2), cpu_##_m##_mask(c1));			\
+} while (0)
+
+static bool __cpuinit match_smt(struct cpuinfo_x86 *c, struct cpuinfo_x86 *o)
+{
+	if (cpu_has(c, X86_FEATURE_TOPOEXT)) {
+		int cpu1 = c->cpu_index, cpu2 = o->cpu_index;
+
+		if (c->phys_proc_id == o->phys_proc_id &&
+		    per_cpu(cpu_llc_id, cpu1) == per_cpu(cpu_llc_id, cpu2) &&
+		    c->compute_unit_id == o->compute_unit_id)
+			return topology_sane(c, o, "smt");
+
+	} else if (c->phys_proc_id == o->phys_proc_id &&
+		   c->cpu_core_id == o->cpu_core_id) {
+		return topology_sane(c, o, "smt");
+	}
+
+	return false;
+}
+
+static bool __cpuinit match_llc(struct cpuinfo_x86 *c, struct cpuinfo_x86 *o)
+{
+	int cpu1 = c->cpu_index, cpu2 = o->cpu_index;
+
+	if (per_cpu(cpu_llc_id, cpu1) != BAD_APICID &&
+	    per_cpu(cpu_llc_id, cpu1) == per_cpu(cpu_llc_id, cpu2))
+		return topology_sane(c, o, "llc");
+
+	return false;
+}
+
+static bool __cpuinit match_mc(struct cpuinfo_x86 *c, struct cpuinfo_x86 *o)
+{
+	if (c->phys_proc_id == o->phys_proc_id)
+		return topology_sane(c, o, "mc");
+
+	return false;
+}
 
 void __cpuinit set_cpu_sibling_map(int cpu)
 {
-	int i;
+	bool has_mc = boot_cpu_data.x86_max_cores > 1;
+	bool has_smt = smp_num_siblings > 1;
 	struct cpuinfo_x86 *c = &cpu_data(cpu);
+	struct cpuinfo_x86 *o;
+	int i;
 
 	cpumask_set_cpu(cpu, cpu_sibling_setup_mask);
 
-	if (smp_num_siblings > 1) {
-		for_each_cpu(i, cpu_sibling_setup_mask) {
-			struct cpuinfo_x86 *o = &cpu_data(i);
-
-			if (cpu_has(c, X86_FEATURE_TOPOEXT)) {
-				if (c->phys_proc_id == o->phys_proc_id &&
-				    per_cpu(cpu_llc_id, cpu) == per_cpu(cpu_llc_id, i) &&
-				    c->compute_unit_id == o->compute_unit_id)
-					link_thread_siblings(cpu, i);
-			} else if (c->phys_proc_id == o->phys_proc_id &&
-				   c->cpu_core_id == o->cpu_core_id) {
-				link_thread_siblings(cpu, i);
-			}
-		}
-	} else {
+	if (!has_smt && !has_mc) {
 		cpumask_set_cpu(cpu, cpu_sibling_mask(cpu));
-	}
-
-	cpumask_set_cpu(cpu, cpu_llc_shared_mask(cpu));
-
-	if (__this_cpu_read(cpu_info.x86_max_cores) == 1) {
-		cpumask_copy(cpu_core_mask(cpu), cpu_sibling_mask(cpu));
+		cpumask_set_cpu(cpu, cpu_llc_shared_mask(cpu));
+		cpumask_set_cpu(cpu, cpu_core_mask(cpu));
 		c->booted_cores = 1;
 		return;
 	}
 
 	for_each_cpu(i, cpu_sibling_setup_mask) {
-		if (per_cpu(cpu_llc_id, cpu) != BAD_APICID &&
-		    per_cpu(cpu_llc_id, cpu) == per_cpu(cpu_llc_id, i)) {
-			cpumask_set_cpu(i, cpu_llc_shared_mask(cpu));
-			cpumask_set_cpu(cpu, cpu_llc_shared_mask(i));
-		}
-		if (c->phys_proc_id == cpu_data(i).phys_proc_id) {
-			cpumask_set_cpu(i, cpu_core_mask(cpu));
-			cpumask_set_cpu(cpu, cpu_core_mask(i));
+		o = &cpu_data(i);
+
+		if ((i == cpu) || (has_smt && match_smt(c, o)))
+			link_mask(sibling, cpu, i);
+
+		if ((i == cpu) || (has_mc && match_llc(c, o)))
+			link_mask(llc_shared, cpu, i);
+
+		if ((i == cpu) || (has_mc && match_mc(c, o))) {
+			link_mask(core, cpu, i);
+
 			/*
 			 * Does this new cpu bringup a new core?
 			 */
@@ -382,8 +413,7 @@ const struct cpumask *cpu_coregroup_mask(int cpu)
 	 * For perf, we return last level cache shared map.
 	 * And for power savings, we return cpu_core_map
 	 */
-	if ((sched_mc_power_savings || sched_smt_power_savings) &&
-	    !(cpu_has(c, X86_FEATURE_AMD_DCM)))
+	if (!(cpu_has(c, X86_FEATURE_AMD_DCM)))
 		return cpu_core_mask(cpu);
 	else
 		return cpu_llc_shared_mask(cpu);
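
A note on the link_mask() macro added above: the cpu_##_m##_mask token
pasting selects a mask accessor by name, so link_mask(sibling, cpu, i)
expands to a symmetric pair of cpumask_set_cpu() calls on
cpu_sibling_mask(). Below is a self-contained sketch of the same
pattern (the mask storage, NR_CPUS, and the cpu_*_mask() accessors are
simplified stand-ins for the kernel's cpumask API, made up for this
example):

/*
 * Stand-in masks: one bitmask per CPU, bit j set means "CPU j is
 * linked to this CPU". Not the kernel's struct cpumask.
 */
#include <stdio.h>

#define NR_CPUS 4

static unsigned int sibling_mask[NR_CPUS];
static unsigned int core_mask[NR_CPUS];

static unsigned int *cpu_sibling_mask(int cpu) { return &sibling_mask[cpu]; }
static unsigned int *cpu_core_mask(int cpu)    { return &core_mask[cpu]; }

static void cpumask_set_cpu(int cpu, unsigned int *mask)
{
	*mask |= 1u << cpu;
}

/* Same shape as the kernel macro: _m picks the accessor by pasting. */
#define link_mask(_m, c1, c2)					\
do {								\
	cpumask_set_cpu((c1), cpu_##_m##_mask(c2));		\
	cpumask_set_cpu((c2), cpu_##_m##_mask(c1));		\
} while (0)

int main(void)
{
	link_mask(sibling, 0, 1);	/* uses cpu_sibling_mask() */
	link_mask(core, 0, 2);		/* uses cpu_core_mask() */

	printf("sibling_mask[0]=0x%x sibling_mask[1]=0x%x\n",
	       sibling_mask[0], sibling_mask[1]);
	printf("core_mask[0]=0x%x core_mask[2]=0x%x\n",
	       core_mask[0], core_mask[2]);
	return 0;
}

The symmetric pair of cpumask_set_cpu() calls is what the old
link_thread_siblings() did three times by hand; each match_*() helper
in the rewritten code routes candidate links through topology_sane(),
which WARN_ONCE()s and drops any sibling link whose two CPUs sit on
different NUMA nodes.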