author    Brian Gerst <brgerst@gmail.com>    2009-01-26 22:56:47 -0500
committer Tejun Heo <tj@kernel.org>          2009-01-26 22:56:47 -0500
commit    6470aff619fbb9dff8dfe8afa5033084cd55ca20
tree      c5734a7afc33ef665b1cacc3a715ab7e0c85787a
parent    0d77e7f04d5da160307f4f5c030a171e004f602b
x86: move 64-bit NUMA code
Impact: Code movement, no functional change.

Move the 64-bit NUMA code from setup_percpu.c to numa_64.c.

Signed-off-by: Brian Gerst <brgerst@gmail.com>
Signed-off-by: Tejun Heo <tj@kernel.org>
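[Editorial note: the data structure at the heart of the moved code is node_to_cpumask_map, one CPU bitmask per possible NUMA node, allocated in a single block once the number of node IDs is known. The following is a minimal userspace C sketch of that allocate-then-index pattern; every name, type, and size here is hypothetical, a stand-in for the kernel's cpumask_t machinery rather than a reproduction of it.]

#include <stdio.h>
#include <stdlib.h>

typedef unsigned long cpumask;		/* stand-in for cpumask_t; assumes <= 64 CPUs */

static cpumask *node_to_cpumask_map;	/* one mask per node, as in the patch */
static int nr_node_ids;

/* Mirror of setup_node_to_cpumask_map(): derive nr_node_ids from the
 * highest possible node id, then allocate the whole array at once. */
static void setup_map(const int *possible_nodes, int n)
{
	int i, highest = 0;

	for (i = 0; i < n; i++)
		if (possible_nodes[i] > highest)
			highest = possible_nodes[i];
	nr_node_ids = highest + 1;
	node_to_cpumask_map = calloc(nr_node_ids, sizeof(cpumask));
}

/* Rough analogues of numa_add_cpu()/numa_remove_cpu(): set or clear one
 * CPU's bit in the mask of the node that CPU belongs to. */
static void add_cpu(int cpu, int node)
{
	node_to_cpumask_map[node] |= 1UL << cpu;
}

static void remove_cpu(int cpu, int node)
{
	node_to_cpumask_map[node] &= ~(1UL << cpu);
}

int main(void)
{
	int possible[] = { 0, 1 };

	setup_map(possible, 2);
	add_cpu(0, 0);
	add_cpu(1, 0);
	add_cpu(2, 1);
	remove_cpu(1, 0);
	printf("node 0 mask: %#lx\n", node_to_cpumask_map[0]);	/* prints 0x1 */
	printf("node 1 mask: %#lx\n", node_to_cpumask_map[1]);	/* prints 0x4 */
	return 0;
}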
 arch/x86/include/asm/topology.h |   6
 arch/x86/kernel/setup_percpu.c  | 237
 arch/x86/mm/numa_64.c           | 217
 3 files changed, 228 insertions(+), 232 deletions(-)
diff --git a/arch/x86/include/asm/topology.h b/arch/x86/include/asm/topology.h
index 10022ed3a4b6..77cfb2cfb386 100644
--- a/arch/x86/include/asm/topology.h
+++ b/arch/x86/include/asm/topology.h
@@ -74,6 +74,8 @@ static inline const struct cpumask *cpumask_of_node(int node)
 	return &node_to_cpumask_map[node];
 }
 
+static inline void setup_node_to_cpumask_map(void) { }
+
 #else /* CONFIG_X86_64 */
 
 /* Mappings between node number and cpus on that node. */
@@ -120,6 +122,8 @@ static inline cpumask_t node_to_cpumask(int node)
 
 #endif /* !CONFIG_DEBUG_PER_CPU_MAPS */
 
+extern void setup_node_to_cpumask_map(void);
+
 /*
  * Replace default node_to_cpumask_ptr with optimized version
  * Deprecated: use "const struct cpumask *mask = cpumask_of_node(node)"
@@ -218,6 +222,8 @@ static inline int node_to_first_cpu(int node)
 	return first_cpu(cpu_online_map);
 }
 
+static inline void setup_node_to_cpumask_map(void) { }
+
 /*
  * Replace default node_to_cpumask_ptr with optimized version
  * Deprecated: use "const struct cpumask *mask = cpumask_of_node(node)"
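
[Editorial note: the topology.h hunks above use the usual kernel stub-vs-prototype idiom: the configuration that has a real implementation gets an extern prototype, and every other configuration gets an empty static inline with the same signature, so call sites never need an #ifdef. A minimal sketch of that idiom, with a hypothetical feature name:]

/* feature.h (hypothetical) */
#ifdef CONFIG_FEATURE
extern void feature_setup(void);		/* real version defined in feature.c */
#else
static inline void feature_setup(void) { }	/* compiles to nothing when disabled */
#endif

[Callers invoke feature_setup() unconditionally; when the feature is disabled, the empty inline is optimized away at no cost.]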
diff --git a/arch/x86/kernel/setup_percpu.c b/arch/x86/kernel/setup_percpu.c
index d0b1476490a7..cb6d622520be 100644
--- a/arch/x86/kernel/setup_percpu.c
+++ b/arch/x86/kernel/setup_percpu.c
@@ -51,32 +51,6 @@ DEFINE_EARLY_PER_CPU(u16, x86_bios_cpu_apicid, BAD_APICID);
 EXPORT_EARLY_PER_CPU_SYMBOL(x86_cpu_to_apicid);
 EXPORT_EARLY_PER_CPU_SYMBOL(x86_bios_cpu_apicid);
 
-#if defined(CONFIG_NUMA) && defined(CONFIG_X86_64)
-#define X86_64_NUMA 1	/* (used later) */
-DEFINE_PER_CPU(int, node_number) = 0;
-EXPORT_PER_CPU_SYMBOL(node_number);
-
-/*
- * Map cpu index to node index
- */
-DEFINE_EARLY_PER_CPU(int, x86_cpu_to_node_map, NUMA_NO_NODE);
-EXPORT_EARLY_PER_CPU_SYMBOL(x86_cpu_to_node_map);
-
-/*
- * Which logical CPUs are on which nodes
- */
-cpumask_t *node_to_cpumask_map;
-EXPORT_SYMBOL(node_to_cpumask_map);
-
-/*
- * Setup node_to_cpumask_map
- */
-static void __init setup_node_to_cpumask_map(void);
-
-#else
-static inline void setup_node_to_cpumask_map(void) { }
-#endif
-
 #ifdef CONFIG_X86_64
 
 /* correctly size the local cpu masks */
@@ -163,13 +137,13 @@ void __init setup_per_cpu_areas(void)
 			early_per_cpu_map(x86_cpu_to_apicid, cpu);
 		per_cpu(x86_bios_cpu_apicid, cpu) =
 			early_per_cpu_map(x86_bios_cpu_apicid, cpu);
-#ifdef X86_64_NUMA
-		per_cpu(x86_cpu_to_node_map, cpu) =
-			early_per_cpu_map(x86_cpu_to_node_map, cpu);
-#endif
 #ifdef CONFIG_X86_64
 		per_cpu(irq_stack_ptr, cpu) =
 			per_cpu(irq_stack_union.irq_stack, cpu) + IRQ_STACK_SIZE - 64;
+#ifdef CONFIG_NUMA
+		per_cpu(x86_cpu_to_node_map, cpu) =
+			early_per_cpu_map(x86_cpu_to_node_map, cpu);
+#endif
 		/*
 		 * Up to this point, CPU0 has been using .data.init
 		 * area. Reload %gs offset for CPU0.
@@ -184,7 +158,7 @@ void __init setup_per_cpu_areas(void)
 	/* indicate the early static arrays will soon be gone */
 	early_per_cpu_ptr(x86_cpu_to_apicid) = NULL;
 	early_per_cpu_ptr(x86_bios_cpu_apicid) = NULL;
-#ifdef X86_64_NUMA
+#if defined(CONFIG_X86_64) && defined(CONFIG_NUMA)
 	early_per_cpu_ptr(x86_cpu_to_node_map) = NULL;
 #endif
 
@@ -197,204 +171,3 @@ void __init setup_per_cpu_areas(void)
 
 #endif
 
-#ifdef X86_64_NUMA
-
-/*
- * Allocate node_to_cpumask_map based on number of available nodes
- * Requires node_possible_map to be valid.
- *
- * Note: node_to_cpumask() is not valid until after this is done.
- * (Use CONFIG_DEBUG_PER_CPU_MAPS to check this.)
- */
-static void __init setup_node_to_cpumask_map(void)
-{
-	unsigned int node, num = 0;
-	cpumask_t *map;
-
-	/* setup nr_node_ids if not done yet */
-	if (nr_node_ids == MAX_NUMNODES) {
-		for_each_node_mask(node, node_possible_map)
-			num = node;
-		nr_node_ids = num + 1;
-	}
-
-	/* allocate the map */
-	map = alloc_bootmem_low(nr_node_ids * sizeof(cpumask_t));
-	DBG("node_to_cpumask_map at %p for %d nodes\n", map, nr_node_ids);
-
-	pr_debug("Node to cpumask map at %p for %d nodes\n",
-		 map, nr_node_ids);
-
-	/* node_to_cpumask() will now work */
-	node_to_cpumask_map = map;
-}
-
-void __cpuinit numa_set_node(int cpu, int node)
-{
-	int *cpu_to_node_map = early_per_cpu_ptr(x86_cpu_to_node_map);
-
-	/* early setting, no percpu area yet */
-	if (cpu_to_node_map) {
-		cpu_to_node_map[cpu] = node;
-		return;
-	}
-
-#ifdef CONFIG_DEBUG_PER_CPU_MAPS
-	if (cpu >= nr_cpu_ids || !per_cpu_offset(cpu)) {
-		printk(KERN_ERR "numa_set_node: invalid cpu# (%d)\n", cpu);
-		dump_stack();
-		return;
-	}
-#endif
-	per_cpu(x86_cpu_to_node_map, cpu) = node;
-
-	if (node != NUMA_NO_NODE)
-		per_cpu(node_number, cpu) = node;
-}
-
-void __cpuinit numa_clear_node(int cpu)
-{
-	numa_set_node(cpu, NUMA_NO_NODE);
-}
-
-#ifndef CONFIG_DEBUG_PER_CPU_MAPS
-
-void __cpuinit numa_add_cpu(int cpu)
-{
-	cpu_set(cpu, node_to_cpumask_map[early_cpu_to_node(cpu)]);
-}
-
-void __cpuinit numa_remove_cpu(int cpu)
-{
-	cpu_clear(cpu, node_to_cpumask_map[early_cpu_to_node(cpu)]);
-}
-
-#else /* CONFIG_DEBUG_PER_CPU_MAPS */
-
-/*
- * --------- debug versions of the numa functions ---------
- */
-static void __cpuinit numa_set_cpumask(int cpu, int enable)
-{
-	int node = early_cpu_to_node(cpu);
-	cpumask_t *mask;
-	char buf[64];
-
-	if (node_to_cpumask_map == NULL) {
-		printk(KERN_ERR "node_to_cpumask_map NULL\n");
-		dump_stack();
-		return;
-	}
-
-	mask = &node_to_cpumask_map[node];
-	if (enable)
-		cpu_set(cpu, *mask);
-	else
-		cpu_clear(cpu, *mask);
-
-	cpulist_scnprintf(buf, sizeof(buf), mask);
-	printk(KERN_DEBUG "%s cpu %d node %d: mask now %s\n",
-		enable ? "numa_add_cpu" : "numa_remove_cpu", cpu, node, buf);
-}
-
-void __cpuinit numa_add_cpu(int cpu)
-{
-	numa_set_cpumask(cpu, 1);
-}
-
-void __cpuinit numa_remove_cpu(int cpu)
-{
-	numa_set_cpumask(cpu, 0);
-}
-
-int cpu_to_node(int cpu)
-{
-	if (early_per_cpu_ptr(x86_cpu_to_node_map)) {
-		printk(KERN_WARNING
-			"cpu_to_node(%d): usage too early!\n", cpu);
-		dump_stack();
-		return early_per_cpu_ptr(x86_cpu_to_node_map)[cpu];
-	}
-	return per_cpu(x86_cpu_to_node_map, cpu);
-}
-EXPORT_SYMBOL(cpu_to_node);
-
-/*
- * Same function as cpu_to_node() but used if called before the
- * per_cpu areas are setup.
- */
-int early_cpu_to_node(int cpu)
-{
-	if (early_per_cpu_ptr(x86_cpu_to_node_map))
-		return early_per_cpu_ptr(x86_cpu_to_node_map)[cpu];
-
-	if (!per_cpu_offset(cpu)) {
-		printk(KERN_WARNING
-			"early_cpu_to_node(%d): no per_cpu area!\n", cpu);
-		dump_stack();
-		return NUMA_NO_NODE;
-	}
-	return per_cpu(x86_cpu_to_node_map, cpu);
-}
-
-
-/* empty cpumask */
-static const cpumask_t cpu_mask_none;
-
-/*
- * Returns a pointer to the bitmask of CPUs on Node 'node'.
- */
-const cpumask_t *cpumask_of_node(int node)
-{
-	if (node_to_cpumask_map == NULL) {
-		printk(KERN_WARNING
-			"cpumask_of_node(%d): no node_to_cpumask_map!\n",
-			node);
-		dump_stack();
-		return (const cpumask_t *)&cpu_online_map;
-	}
-	if (node >= nr_node_ids) {
-		printk(KERN_WARNING
-			"cpumask_of_node(%d): node > nr_node_ids(%d)\n",
-			node, nr_node_ids);
-		dump_stack();
-		return &cpu_mask_none;
-	}
-	return &node_to_cpumask_map[node];
-}
-EXPORT_SYMBOL(cpumask_of_node);
-
-/*
- * Returns a bitmask of CPUs on Node 'node'.
- *
- * Side note: this function creates the returned cpumask on the stack
- * so with a high NR_CPUS count, excessive stack space is used. The
- * node_to_cpumask_ptr function should be used whenever possible.
- */
-cpumask_t node_to_cpumask(int node)
-{
-	if (node_to_cpumask_map == NULL) {
-		printk(KERN_WARNING
-			"node_to_cpumask(%d): no node_to_cpumask_map!\n", node);
-		dump_stack();
-		return cpu_online_map;
-	}
-	if (node >= nr_node_ids) {
-		printk(KERN_WARNING
-			"node_to_cpumask(%d): node > nr_node_ids(%d)\n",
-			node, nr_node_ids);
-		dump_stack();
-		return cpu_mask_none;
-	}
-	return node_to_cpumask_map[node];
-}
-EXPORT_SYMBOL(node_to_cpumask);
-
-/*
- * --------- end of debug versions of the numa functions ---------
- */
-
-#endif /* CONFIG_DEBUG_PER_CPU_MAPS */
-
-#endif /* X86_64_NUMA */
-
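
[Editorial note: the numa_set_node() logic removed above (and re-added in numa_64.c below) handles a boot-ordering problem: cpu-to-node assignments can arrive before the per-CPU areas exist, so early writes go to a static array whose pointer is later NULLed once setup_per_cpu_areas() has copied it into the real per-CPU variables. A standalone C sketch of that two-phase store, with hypothetical names in place of the early_per_cpu machinery:]

#define NR_CPUS 8			/* hypothetical CPU limit */

static int early_map[NR_CPUS];		/* static storage used before percpu setup */
static int *early_ptr = early_map;	/* set to NULL once percpu areas are live */
static int percpu_map[NR_CPUS];		/* stand-in for per_cpu(x86_cpu_to_node_map) */

void set_node(int cpu, int node)
{
	if (early_ptr) {		/* early boot: percpu area not ready yet */
		early_ptr[cpu] = node;
		return;
	}
	percpu_map[cpu] = node;		/* normal path after percpu setup */
}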
diff --git a/arch/x86/mm/numa_64.c b/arch/x86/mm/numa_64.c
index 71a14f89f89e..08d140fbc31b 100644
--- a/arch/x86/mm/numa_64.c
+++ b/arch/x86/mm/numa_64.c
@@ -20,6 +20,12 @@
 #include <asm/acpi.h>
 #include <asm/k8.h>
 
+#ifdef CONFIG_DEBUG_PER_CPU_MAPS
+# define DBG(x...) printk(KERN_DEBUG x)
+#else
+# define DBG(x...)
+#endif
+
 struct pglist_data *node_data[MAX_NUMNODES] __read_mostly;
 EXPORT_SYMBOL(node_data);
 
@@ -33,6 +39,21 @@ int numa_off __initdata;
 static unsigned long __initdata nodemap_addr;
 static unsigned long __initdata nodemap_size;
 
+DEFINE_PER_CPU(int, node_number) = 0;
+EXPORT_PER_CPU_SYMBOL(node_number);
+
+/*
+ * Map cpu index to node index
+ */
+DEFINE_EARLY_PER_CPU(int, x86_cpu_to_node_map, NUMA_NO_NODE);
+EXPORT_EARLY_PER_CPU_SYMBOL(x86_cpu_to_node_map);
+
+/*
+ * Which logical CPUs are on which nodes
+ */
+cpumask_t *node_to_cpumask_map;
+EXPORT_SYMBOL(node_to_cpumask_map);
+
 /*
  * Given a shift value, try to populate memnodemap[]
  * Returns :
@@ -640,3 +661,199 @@ void __init init_cpu_to_node(void)
 #endif
 
 
+/*
+ * Allocate node_to_cpumask_map based on number of available nodes
+ * Requires node_possible_map to be valid.
+ *
+ * Note: node_to_cpumask() is not valid until after this is done.
+ * (Use CONFIG_DEBUG_PER_CPU_MAPS to check this.)
+ */
+void __init setup_node_to_cpumask_map(void)
+{
+	unsigned int node, num = 0;
+	cpumask_t *map;
+
+	/* setup nr_node_ids if not done yet */
+	if (nr_node_ids == MAX_NUMNODES) {
+		for_each_node_mask(node, node_possible_map)
+			num = node;
+		nr_node_ids = num + 1;
+	}
+
+	/* allocate the map */
+	map = alloc_bootmem_low(nr_node_ids * sizeof(cpumask_t));
+	DBG("node_to_cpumask_map at %p for %d nodes\n", map, nr_node_ids);
+
+	pr_debug("Node to cpumask map at %p for %d nodes\n",
+		 map, nr_node_ids);
+
+	/* node_to_cpumask() will now work */
+	node_to_cpumask_map = map;
+}
+
+void __cpuinit numa_set_node(int cpu, int node)
+{
+	int *cpu_to_node_map = early_per_cpu_ptr(x86_cpu_to_node_map);
+
+	/* early setting, no percpu area yet */
+	if (cpu_to_node_map) {
+		cpu_to_node_map[cpu] = node;
+		return;
+	}
+
+#ifdef CONFIG_DEBUG_PER_CPU_MAPS
+	if (cpu >= nr_cpu_ids || !per_cpu_offset(cpu)) {
+		printk(KERN_ERR "numa_set_node: invalid cpu# (%d)\n", cpu);
+		dump_stack();
+		return;
+	}
+#endif
+	per_cpu(x86_cpu_to_node_map, cpu) = node;
+
+	if (node != NUMA_NO_NODE)
+		per_cpu(node_number, cpu) = node;
+}
+
+void __cpuinit numa_clear_node(int cpu)
+{
+	numa_set_node(cpu, NUMA_NO_NODE);
+}
+
+#ifndef CONFIG_DEBUG_PER_CPU_MAPS
+
+void __cpuinit numa_add_cpu(int cpu)
+{
+	cpu_set(cpu, node_to_cpumask_map[early_cpu_to_node(cpu)]);
+}
+
+void __cpuinit numa_remove_cpu(int cpu)
+{
+	cpu_clear(cpu, node_to_cpumask_map[early_cpu_to_node(cpu)]);
+}
+
+#else /* CONFIG_DEBUG_PER_CPU_MAPS */
+
+/*
+ * --------- debug versions of the numa functions ---------
+ */
+static void __cpuinit numa_set_cpumask(int cpu, int enable)
+{
+	int node = early_cpu_to_node(cpu);
+	cpumask_t *mask;
+	char buf[64];
+
+	if (node_to_cpumask_map == NULL) {
+		printk(KERN_ERR "node_to_cpumask_map NULL\n");
+		dump_stack();
+		return;
+	}
+
+	mask = &node_to_cpumask_map[node];
+	if (enable)
+		cpu_set(cpu, *mask);
+	else
+		cpu_clear(cpu, *mask);
+
+	cpulist_scnprintf(buf, sizeof(buf), mask);
+	printk(KERN_DEBUG "%s cpu %d node %d: mask now %s\n",
+		enable ? "numa_add_cpu" : "numa_remove_cpu", cpu, node, buf);
+}
+
+void __cpuinit numa_add_cpu(int cpu)
+{
+	numa_set_cpumask(cpu, 1);
+}
+
+void __cpuinit numa_remove_cpu(int cpu)
+{
+	numa_set_cpumask(cpu, 0);
+}
+
+int cpu_to_node(int cpu)
+{
+	if (early_per_cpu_ptr(x86_cpu_to_node_map)) {
+		printk(KERN_WARNING
+			"cpu_to_node(%d): usage too early!\n", cpu);
+		dump_stack();
+		return early_per_cpu_ptr(x86_cpu_to_node_map)[cpu];
+	}
+	return per_cpu(x86_cpu_to_node_map, cpu);
+}
+EXPORT_SYMBOL(cpu_to_node);
+
+/*
+ * Same function as cpu_to_node() but used if called before the
+ * per_cpu areas are setup.
+ */
+int early_cpu_to_node(int cpu)
+{
+	if (early_per_cpu_ptr(x86_cpu_to_node_map))
+		return early_per_cpu_ptr(x86_cpu_to_node_map)[cpu];
+
+	if (!per_cpu_offset(cpu)) {
+		printk(KERN_WARNING
+			"early_cpu_to_node(%d): no per_cpu area!\n", cpu);
+		dump_stack();
+		return NUMA_NO_NODE;
+	}
+	return per_cpu(x86_cpu_to_node_map, cpu);
+}
+
+
+/* empty cpumask */
+static const cpumask_t cpu_mask_none;
+
+/*
+ * Returns a pointer to the bitmask of CPUs on Node 'node'.
+ */
+const cpumask_t *cpumask_of_node(int node)
+{
+	if (node_to_cpumask_map == NULL) {
+		printk(KERN_WARNING
+			"cpumask_of_node(%d): no node_to_cpumask_map!\n",
+			node);
+		dump_stack();
+		return (const cpumask_t *)&cpu_online_map;
+	}
+	if (node >= nr_node_ids) {
+		printk(KERN_WARNING
+			"cpumask_of_node(%d): node > nr_node_ids(%d)\n",
+			node, nr_node_ids);
+		dump_stack();
+		return &cpu_mask_none;
+	}
+	return &node_to_cpumask_map[node];
+}
+EXPORT_SYMBOL(cpumask_of_node);
+
+/*
+ * Returns a bitmask of CPUs on Node 'node'.
+ *
+ * Side note: this function creates the returned cpumask on the stack
+ * so with a high NR_CPUS count, excessive stack space is used. The
+ * node_to_cpumask_ptr function should be used whenever possible.
+ */
+cpumask_t node_to_cpumask(int node)
+{
+	if (node_to_cpumask_map == NULL) {
+		printk(KERN_WARNING
+			"node_to_cpumask(%d): no node_to_cpumask_map!\n", node);
+		dump_stack();
+		return cpu_online_map;
+	}
+	if (node >= nr_node_ids) {
+		printk(KERN_WARNING
+			"node_to_cpumask(%d): node > nr_node_ids(%d)\n",
+			node, nr_node_ids);
+		dump_stack();
+		return cpu_mask_none;
+	}
+	return node_to_cpumask_map[node];
+}
+EXPORT_SYMBOL(node_to_cpumask);
+
+/*
+ * --------- end of debug versions of the numa functions ---------
+ */
+
+#endif /* CONFIG_DEBUG_PER_CPU_MAPS */
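
[Editorial note: one small idiom worth highlighting from the numa_64.c side: DBG() expands to printk(KERN_DEBUG ...) only under CONFIG_DEBUG_PER_CPU_MAPS and to nothing otherwise, so the debug call sites vanish from production builds. The same variadic-macro pattern in a standalone, compilable form; the config symbol below is hypothetical:]

#include <stdio.h>

/* #define DEBUG_MAPS */		/* define to enable debug output */

#ifdef DEBUG_MAPS
# define DBG(x...) fprintf(stderr, x)	/* GNU-style variadic macro, as in the patch */
#else
# define DBG(x...)			/* expands to nothing: zero cost when disabled */
#endif

int main(void)
{
	DBG("node_to_cpumask_map at %p for %d nodes\n", (void *)0, 2);
	return 0;
}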