aboutsummaryrefslogtreecommitdiffstats
path: root/arch/s390/kernel/smp.c
diff options
context:
space:
mode:
authorLinus Torvalds <torvalds@linux-foundation.org>2012-03-22 21:15:32 -0400
committerLinus Torvalds <torvalds@linux-foundation.org>2012-03-22 21:15:32 -0400
commitdb1417967959569599da2a4bd0ffb93b17ad795f (patch)
tree08751414d5f4a9e264af924154ed3543a8e573a9 /arch/s390/kernel/smp.c
parent48aab2f79dfc1357c48ce22ff5c989b52a590069 (diff)
parentc6da39f26cfe475704ec521723192e520e8f51b8 (diff)
Merge branch 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/s390/linux
Pull s390 patches from Martin Schwidefsky: "The biggest patch is the rework of the smp code, something I wanted to do for some time. There are some patches for our various dump methods and one new thing: z/VM LGR detection. LGR stands for linux-guest- relocation and is the guest migration feature of z/VM. For debugging purposes we keep a log of the systems where a specific guest has lived." Fix up trivial conflict in arch/s390/kernel/smp.c due to the scheduler cleanup having removed some code next to removed s390 code. * 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/s390/linux: [S390] kernel: Pass correct stack for smp_call_ipl_cpu() [S390] Ensure that vmcore_info pointer is never accessed directly [S390] dasd: prevent validate server for offline devices [S390] Remove monolithic build option for zcrypt driver. [S390] stack dump: fix indentation in output [S390] kernel: Add OS info memory interface [S390] Use block_sigmask() [S390] kernel: Add z/VM LGR detection [S390] irq: external interrupt code passing [S390] irq: set __ARCH_IRQ_EXIT_IRQS_DISABLED [S390] zfcpdump: Implement async sdias event processing [S390] Use copy_to_absolute_zero() instead of "stura/sturg" [S390] rework idle code [S390] rework smp code [S390] rename lowcore field [S390] Fix gcc 4.6.0 compile warning
Diffstat (limited to 'arch/s390/kernel/smp.c')
-rw-r--r--arch/s390/kernel/smp.c1147
1 files changed, 577 insertions, 570 deletions
diff --git a/arch/s390/kernel/smp.c b/arch/s390/kernel/smp.c
index b0e28c47ab83..a8bf9994b086 100644
--- a/arch/s390/kernel/smp.c
+++ b/arch/s390/kernel/smp.c
@@ -1,23 +1,18 @@
1/* 1/*
2 * arch/s390/kernel/smp.c 2 * SMP related functions
3 * 3 *
4 * Copyright IBM Corp. 1999, 2009 4 * Copyright IBM Corp. 1999,2012
5 * Author(s): Denis Joseph Barrow (djbarrow@de.ibm.com,barrow_dj@yahoo.com), 5 * Author(s): Denis Joseph Barrow,
6 * Martin Schwidefsky (schwidefsky@de.ibm.com) 6 * Martin Schwidefsky <schwidefsky@de.ibm.com>,
7 * Heiko Carstens (heiko.carstens@de.ibm.com) 7 * Heiko Carstens <heiko.carstens@de.ibm.com>,
8 * 8 *
9 * based on other smp stuff by 9 * based on other smp stuff by
10 * (c) 1995 Alan Cox, CymruNET Ltd <alan@cymru.net> 10 * (c) 1995 Alan Cox, CymruNET Ltd <alan@cymru.net>
11 * (c) 1998 Ingo Molnar 11 * (c) 1998 Ingo Molnar
12 * 12 *
13 * We work with logical cpu numbering everywhere we can. The only 13 * The code outside of smp.c uses logical cpu numbers, only smp.c does
14 * functions using the real cpu address (got from STAP) are the sigp 14 * the translation of logical to physical cpu ids. All new code that
15 * functions. For all other functions we use the identity mapping. 15 * operates on physical cpu numbers needs to go into smp.c.
16 * That means that cpu_number_map[i] == i for every cpu. cpu_number_map is
17 * used e.g. to find the idle task belonging to a logical cpu. Every array
18 * in the kernel is sorted by the logical cpu number and not by the physical
19 * one which is causing all the confusion with __cpu_logical_map and
20 * cpu_number_map in other architectures.
21 */ 16 */
22 17
23#define KMSG_COMPONENT "cpu" 18#define KMSG_COMPONENT "cpu"
@@ -31,198 +26,433 @@
31#include <linux/spinlock.h> 26#include <linux/spinlock.h>
32#include <linux/kernel_stat.h> 27#include <linux/kernel_stat.h>
33#include <linux/delay.h> 28#include <linux/delay.h>
34#include <linux/cache.h>
35#include <linux/interrupt.h> 29#include <linux/interrupt.h>
36#include <linux/irqflags.h> 30#include <linux/irqflags.h>
37#include <linux/cpu.h> 31#include <linux/cpu.h>
38#include <linux/timex.h>
39#include <linux/bootmem.h>
40#include <linux/slab.h> 32#include <linux/slab.h>
41#include <linux/crash_dump.h> 33#include <linux/crash_dump.h>
42#include <asm/asm-offsets.h> 34#include <asm/asm-offsets.h>
43#include <asm/ipl.h> 35#include <asm/ipl.h>
44#include <asm/setup.h> 36#include <asm/setup.h>
45#include <asm/sigp.h>
46#include <asm/pgalloc.h>
47#include <asm/irq.h> 37#include <asm/irq.h>
48#include <asm/cpcmd.h>
49#include <asm/tlbflush.h> 38#include <asm/tlbflush.h>
50#include <asm/timer.h> 39#include <asm/timer.h>
51#include <asm/lowcore.h> 40#include <asm/lowcore.h>
52#include <asm/sclp.h> 41#include <asm/sclp.h>
53#include <asm/cputime.h>
54#include <asm/vdso.h> 42#include <asm/vdso.h>
55#include <asm/cpu.h> 43#include <asm/debug.h>
44#include <asm/os_info.h>
56#include "entry.h" 45#include "entry.h"
57 46
58/* logical cpu to cpu address */ 47enum {
59unsigned short __cpu_logical_map[NR_CPUS]; 48 sigp_sense = 1,
49 sigp_external_call = 2,
50 sigp_emergency_signal = 3,
51 sigp_start = 4,
52 sigp_stop = 5,
53 sigp_restart = 6,
54 sigp_stop_and_store_status = 9,
55 sigp_initial_cpu_reset = 11,
56 sigp_cpu_reset = 12,
57 sigp_set_prefix = 13,
58 sigp_store_status_at_address = 14,
59 sigp_store_extended_status_at_address = 15,
60 sigp_set_architecture = 18,
61 sigp_conditional_emergency_signal = 19,
62 sigp_sense_running = 21,
63};
60 64
61static struct task_struct *current_set[NR_CPUS]; 65enum {
66 sigp_order_code_accepted = 0,
67 sigp_status_stored = 1,
68 sigp_busy = 2,
69 sigp_not_operational = 3,
70};
62 71
63static u8 smp_cpu_type; 72enum {
64static int smp_use_sigp_detection; 73 ec_schedule = 0,
74 ec_call_function,
75 ec_call_function_single,
76 ec_stop_cpu,
77};
65 78
66enum s390_cpu_state { 79enum {
67 CPU_STATE_STANDBY, 80 CPU_STATE_STANDBY,
68 CPU_STATE_CONFIGURED, 81 CPU_STATE_CONFIGURED,
69}; 82};
70 83
84struct pcpu {
85 struct cpu cpu;
86 struct task_struct *idle; /* idle process for the cpu */
87 struct _lowcore *lowcore; /* lowcore page(s) for the cpu */
88 unsigned long async_stack; /* async stack for the cpu */
89 unsigned long panic_stack; /* panic stack for the cpu */
90 unsigned long ec_mask; /* bit mask for ec_xxx functions */
91 int state; /* physical cpu state */
92 u32 status; /* last status received via sigp */
93 u16 address; /* physical cpu address */
94};
95
96static u8 boot_cpu_type;
97static u16 boot_cpu_address;
98static struct pcpu pcpu_devices[NR_CPUS];
99
71DEFINE_MUTEX(smp_cpu_state_mutex); 100DEFINE_MUTEX(smp_cpu_state_mutex);
72static int smp_cpu_state[NR_CPUS];
73 101
74static DEFINE_PER_CPU(struct cpu, cpu_devices); 102/*
103 * Signal processor helper functions.
104 */
105static inline int __pcpu_sigp(u16 addr, u8 order, u32 parm, u32 *status)
106{
107 register unsigned int reg1 asm ("1") = parm;
108 int cc;
75 109
76static void smp_ext_bitcall(int, int); 110 asm volatile(
111 " sigp %1,%2,0(%3)\n"
112 " ipm %0\n"
113 " srl %0,28\n"
114 : "=d" (cc), "+d" (reg1) : "d" (addr), "a" (order) : "cc");
115 if (status && cc == 1)
116 *status = reg1;
117 return cc;
118}
77 119
78static int raw_cpu_stopped(int cpu) 120static inline int __pcpu_sigp_relax(u16 addr, u8 order, u32 parm, u32 *status)
79{ 121{
80 u32 status; 122 int cc;
81 123
82 switch (raw_sigp_ps(&status, 0, cpu, sigp_sense)) { 124 while (1) {
83 case sigp_status_stored: 125 cc = __pcpu_sigp(addr, order, parm, status);
84 /* Check for stopped and check stop state */ 126 if (cc != sigp_busy)
85 if (status & 0x50) 127 return cc;
86 return 1; 128 cpu_relax();
87 break;
88 default:
89 break;
90 } 129 }
91 return 0;
92} 130}
93 131
94static inline int cpu_stopped(int cpu) 132static int pcpu_sigp_retry(struct pcpu *pcpu, u8 order, u32 parm)
133{
134 int cc, retry;
135
136 for (retry = 0; ; retry++) {
137 cc = __pcpu_sigp(pcpu->address, order, parm, &pcpu->status);
138 if (cc != sigp_busy)
139 break;
140 if (retry >= 3)
141 udelay(10);
142 }
143 return cc;
144}
145
146static inline int pcpu_stopped(struct pcpu *pcpu)
147{
148 if (__pcpu_sigp(pcpu->address, sigp_sense,
149 0, &pcpu->status) != sigp_status_stored)
150 return 0;
151 /* Check for stopped and check stop state */
152 return !!(pcpu->status & 0x50);
153}
154
155static inline int pcpu_running(struct pcpu *pcpu)
95{ 156{
96 return raw_cpu_stopped(cpu_logical_map(cpu)); 157 if (__pcpu_sigp(pcpu->address, sigp_sense_running,
158 0, &pcpu->status) != sigp_status_stored)
159 return 1;
160 /* Check for running status */
161 return !(pcpu->status & 0x400);
97} 162}
98 163
99/* 164/*
100 * Ensure that PSW restart is done on an online CPU 165 * Find struct pcpu by cpu address.
101 */ 166 */
102void smp_restart_with_online_cpu(void) 167static struct pcpu *pcpu_find_address(const struct cpumask *mask, int address)
103{ 168{
104 int cpu; 169 int cpu;
105 170
106 for_each_online_cpu(cpu) { 171 for_each_cpu(cpu, mask)
107 if (stap() == __cpu_logical_map[cpu]) { 172 if (pcpu_devices[cpu].address == address)
108 /* We are online: Enable DAT again and return */ 173 return pcpu_devices + cpu;
109 __load_psw_mask(psw_kernel_bits | PSW_MASK_DAT); 174 return NULL;
110 return; 175}
111 } 176
177static void pcpu_ec_call(struct pcpu *pcpu, int ec_bit)
178{
179 int order;
180
181 set_bit(ec_bit, &pcpu->ec_mask);
182 order = pcpu_running(pcpu) ?
183 sigp_external_call : sigp_emergency_signal;
184 pcpu_sigp_retry(pcpu, order, 0);
185}
186
187static int __cpuinit pcpu_alloc_lowcore(struct pcpu *pcpu, int cpu)
188{
189 struct _lowcore *lc;
190
191 if (pcpu != &pcpu_devices[0]) {
192 pcpu->lowcore = (struct _lowcore *)
193 __get_free_pages(GFP_KERNEL | GFP_DMA, LC_ORDER);
194 pcpu->async_stack = __get_free_pages(GFP_KERNEL, ASYNC_ORDER);
195 pcpu->panic_stack = __get_free_page(GFP_KERNEL);
196 if (!pcpu->lowcore || !pcpu->panic_stack || !pcpu->async_stack)
197 goto out;
112 } 198 }
113 /* We are not online: Do PSW restart on an online CPU */ 199 lc = pcpu->lowcore;
114 while (sigp(cpu, sigp_restart) == sigp_busy) 200 memcpy(lc, &S390_lowcore, 512);
115 cpu_relax(); 201 memset((char *) lc + 512, 0, sizeof(*lc) - 512);
116 /* And stop ourself */ 202 lc->async_stack = pcpu->async_stack + ASYNC_SIZE;
117 while (raw_sigp(stap(), sigp_stop) == sigp_busy) 203 lc->panic_stack = pcpu->panic_stack + PAGE_SIZE;
118 cpu_relax(); 204 lc->cpu_nr = cpu;
119 for (;;); 205#ifndef CONFIG_64BIT
206 if (MACHINE_HAS_IEEE) {
207 lc->extended_save_area_addr = get_zeroed_page(GFP_KERNEL);
208 if (!lc->extended_save_area_addr)
209 goto out;
210 }
211#else
212 if (vdso_alloc_per_cpu(lc))
213 goto out;
214#endif
215 lowcore_ptr[cpu] = lc;
216 pcpu_sigp_retry(pcpu, sigp_set_prefix, (u32)(unsigned long) lc);
217 return 0;
218out:
219 if (pcpu != &pcpu_devices[0]) {
220 free_page(pcpu->panic_stack);
221 free_pages(pcpu->async_stack, ASYNC_ORDER);
222 free_pages((unsigned long) pcpu->lowcore, LC_ORDER);
223 }
224 return -ENOMEM;
120} 225}
121 226
122void smp_switch_to_ipl_cpu(void (*func)(void *), void *data) 227static void pcpu_free_lowcore(struct pcpu *pcpu)
123{ 228{
124 struct _lowcore *lc, *current_lc; 229 pcpu_sigp_retry(pcpu, sigp_set_prefix, 0);
125 struct stack_frame *sf; 230 lowcore_ptr[pcpu - pcpu_devices] = NULL;
126 struct pt_regs *regs; 231#ifndef CONFIG_64BIT
127 unsigned long sp; 232 if (MACHINE_HAS_IEEE) {
128 233 struct _lowcore *lc = pcpu->lowcore;
129 if (smp_processor_id() == 0) 234
130 func(data); 235 free_page((unsigned long) lc->extended_save_area_addr);
131 __load_psw_mask(PSW_DEFAULT_KEY | PSW_MASK_BASE | 236 lc->extended_save_area_addr = 0;
132 PSW_MASK_EA | PSW_MASK_BA); 237 }
133 /* Disable lowcore protection */ 238#else
134 __ctl_clear_bit(0, 28); 239 vdso_free_per_cpu(pcpu->lowcore);
135 current_lc = lowcore_ptr[smp_processor_id()]; 240#endif
136 lc = lowcore_ptr[0]; 241 if (pcpu != &pcpu_devices[0]) {
137 if (!lc) 242 free_page(pcpu->panic_stack);
138 lc = current_lc; 243 free_pages(pcpu->async_stack, ASYNC_ORDER);
139 lc->restart_psw.mask = 244 free_pages((unsigned long) pcpu->lowcore, LC_ORDER);
140 PSW_DEFAULT_KEY | PSW_MASK_BASE | PSW_MASK_EA | PSW_MASK_BA; 245 }
141 lc->restart_psw.addr = PSW_ADDR_AMODE | (unsigned long) smp_restart_cpu; 246}
142 if (!cpu_online(0)) 247
143 smp_switch_to_cpu(func, data, 0, stap(), __cpu_logical_map[0]); 248static void pcpu_prepare_secondary(struct pcpu *pcpu, int cpu)
144 while (sigp(0, sigp_stop_and_store_status) == sigp_busy) 249{
145 cpu_relax(); 250 struct _lowcore *lc = pcpu->lowcore;
146 sp = lc->panic_stack; 251
147 sp -= sizeof(struct pt_regs); 252 atomic_inc(&init_mm.context.attach_count);
148 regs = (struct pt_regs *) sp; 253 lc->cpu_nr = cpu;
149 memcpy(&regs->gprs, &current_lc->gpregs_save_area, sizeof(regs->gprs)); 254 lc->percpu_offset = __per_cpu_offset[cpu];
150 regs->psw = current_lc->psw_save_area; 255 lc->kernel_asce = S390_lowcore.kernel_asce;
151 sp -= STACK_FRAME_OVERHEAD; 256 lc->machine_flags = S390_lowcore.machine_flags;
152 sf = (struct stack_frame *) sp; 257 lc->ftrace_func = S390_lowcore.ftrace_func;
153 sf->back_chain = 0; 258 lc->user_timer = lc->system_timer = lc->steal_timer = 0;
154 smp_switch_to_cpu(func, data, sp, stap(), __cpu_logical_map[0]); 259 __ctl_store(lc->cregs_save_area, 0, 15);
260 save_access_regs((unsigned int *) lc->access_regs_save_area);
261 memcpy(lc->stfle_fac_list, S390_lowcore.stfle_fac_list,
262 MAX_FACILITY_BIT/8);
263}
264
265static void pcpu_attach_task(struct pcpu *pcpu, struct task_struct *tsk)
266{
267 struct _lowcore *lc = pcpu->lowcore;
268 struct thread_info *ti = task_thread_info(tsk);
269
270 lc->kernel_stack = (unsigned long) task_stack_page(tsk) + THREAD_SIZE;
271 lc->thread_info = (unsigned long) task_thread_info(tsk);
272 lc->current_task = (unsigned long) tsk;
273 lc->user_timer = ti->user_timer;
274 lc->system_timer = ti->system_timer;
275 lc->steal_timer = 0;
276}
277
278static void pcpu_start_fn(struct pcpu *pcpu, void (*func)(void *), void *data)
279{
280 struct _lowcore *lc = pcpu->lowcore;
281
282 lc->restart_stack = lc->kernel_stack;
283 lc->restart_fn = (unsigned long) func;
284 lc->restart_data = (unsigned long) data;
285 lc->restart_source = -1UL;
286 pcpu_sigp_retry(pcpu, sigp_restart, 0);
287}
288
289/*
290 * Call function via PSW restart on pcpu and stop the current cpu.
291 */
292static void pcpu_delegate(struct pcpu *pcpu, void (*func)(void *),
293 void *data, unsigned long stack)
294{
295 struct _lowcore *lc = pcpu->lowcore;
296 unsigned short this_cpu;
297
298 __load_psw_mask(psw_kernel_bits);
299 this_cpu = stap();
300 if (pcpu->address == this_cpu)
301 func(data); /* should not return */
302 /* Stop target cpu (if func returns this stops the current cpu). */
303 pcpu_sigp_retry(pcpu, sigp_stop, 0);
304 /* Restart func on the target cpu and stop the current cpu. */
305 lc->restart_stack = stack;
306 lc->restart_fn = (unsigned long) func;
307 lc->restart_data = (unsigned long) data;
308 lc->restart_source = (unsigned long) this_cpu;
309 asm volatile(
310 "0: sigp 0,%0,6 # sigp restart to target cpu\n"
311 " brc 2,0b # busy, try again\n"
312 "1: sigp 0,%1,5 # sigp stop to current cpu\n"
313 " brc 2,1b # busy, try again\n"
314 : : "d" (pcpu->address), "d" (this_cpu) : "0", "1", "cc");
315 for (;;) ;
316}
317
318/*
319 * Call function on an online CPU.
320 */
321void smp_call_online_cpu(void (*func)(void *), void *data)
322{
323 struct pcpu *pcpu;
324
325 /* Use the current cpu if it is online. */
326 pcpu = pcpu_find_address(cpu_online_mask, stap());
327 if (!pcpu)
328 /* Use the first online cpu. */
329 pcpu = pcpu_devices + cpumask_first(cpu_online_mask);
330 pcpu_delegate(pcpu, func, data, (unsigned long) restart_stack);
331}
332
333/*
334 * Call function on the ipl CPU.
335 */
336void smp_call_ipl_cpu(void (*func)(void *), void *data)
337{
338 pcpu_delegate(&pcpu_devices[0], func, data,
339 pcpu_devices->panic_stack + PAGE_SIZE);
340}
341
342int smp_find_processor_id(u16 address)
343{
344 int cpu;
345
346 for_each_present_cpu(cpu)
347 if (pcpu_devices[cpu].address == address)
348 return cpu;
349 return -1;
350}
351
352int smp_vcpu_scheduled(int cpu)
353{
354 return pcpu_running(pcpu_devices + cpu);
355}
356
357void smp_yield(void)
358{
359 if (MACHINE_HAS_DIAG44)
360 asm volatile("diag 0,0,0x44");
155} 361}
156 362
157static void smp_stop_cpu(void) 363void smp_yield_cpu(int cpu)
158{ 364{
159 while (sigp(smp_processor_id(), sigp_stop) == sigp_busy) 365 if (MACHINE_HAS_DIAG9C)
366 asm volatile("diag %0,0,0x9c"
367 : : "d" (pcpu_devices[cpu].address));
368 else if (MACHINE_HAS_DIAG44)
369 asm volatile("diag 0,0,0x44");
370}
371
372/*
373 * Send cpus emergency shutdown signal. This gives the cpus the
374 * opportunity to complete outstanding interrupts.
375 */
376void smp_emergency_stop(cpumask_t *cpumask)
377{
378 u64 end;
379 int cpu;
380
381 end = get_clock() + (1000000UL << 12);
382 for_each_cpu(cpu, cpumask) {
383 struct pcpu *pcpu = pcpu_devices + cpu;
384 set_bit(ec_stop_cpu, &pcpu->ec_mask);
385 while (__pcpu_sigp(pcpu->address, sigp_emergency_signal,
386 0, NULL) == sigp_busy &&
387 get_clock() < end)
388 cpu_relax();
389 }
390 while (get_clock() < end) {
391 for_each_cpu(cpu, cpumask)
392 if (pcpu_stopped(pcpu_devices + cpu))
393 cpumask_clear_cpu(cpu, cpumask);
394 if (cpumask_empty(cpumask))
395 break;
160 cpu_relax(); 396 cpu_relax();
397 }
161} 398}
162 399
400/*
401 * Stop all cpus but the current one.
402 */
163void smp_send_stop(void) 403void smp_send_stop(void)
164{ 404{
165 cpumask_t cpumask; 405 cpumask_t cpumask;
166 int cpu; 406 int cpu;
167 u64 end;
168 407
169 /* Disable all interrupts/machine checks */ 408 /* Disable all interrupts/machine checks */
170 __load_psw_mask(psw_kernel_bits | PSW_MASK_DAT); 409 __load_psw_mask(psw_kernel_bits | PSW_MASK_DAT);
171 trace_hardirqs_off(); 410 trace_hardirqs_off();
172 411
412 debug_set_critical();
173 cpumask_copy(&cpumask, cpu_online_mask); 413 cpumask_copy(&cpumask, cpu_online_mask);
174 cpumask_clear_cpu(smp_processor_id(), &cpumask); 414 cpumask_clear_cpu(smp_processor_id(), &cpumask);
175 415
176 if (oops_in_progress) { 416 if (oops_in_progress)
177 /* 417 smp_emergency_stop(&cpumask);
178 * Give the other cpus the opportunity to complete
179 * outstanding interrupts before stopping them.
180 */
181 end = get_clock() + (1000000UL << 12);
182 for_each_cpu(cpu, &cpumask) {
183 set_bit(ec_stop_cpu, (unsigned long *)
184 &lowcore_ptr[cpu]->ext_call_fast);
185 while (sigp(cpu, sigp_emergency_signal) == sigp_busy &&
186 get_clock() < end)
187 cpu_relax();
188 }
189 while (get_clock() < end) {
190 for_each_cpu(cpu, &cpumask)
191 if (cpu_stopped(cpu))
192 cpumask_clear_cpu(cpu, &cpumask);
193 if (cpumask_empty(&cpumask))
194 break;
195 cpu_relax();
196 }
197 }
198 418
199 /* stop all processors */ 419 /* stop all processors */
200 for_each_cpu(cpu, &cpumask) { 420 for_each_cpu(cpu, &cpumask) {
201 while (sigp(cpu, sigp_stop) == sigp_busy) 421 struct pcpu *pcpu = pcpu_devices + cpu;
202 cpu_relax(); 422 pcpu_sigp_retry(pcpu, sigp_stop, 0);
203 while (!cpu_stopped(cpu)) 423 while (!pcpu_stopped(pcpu))
204 cpu_relax(); 424 cpu_relax();
205 } 425 }
206} 426}
207 427
208/* 428/*
429 * Stop the current cpu.
430 */
431void smp_stop_cpu(void)
432{
433 pcpu_sigp_retry(pcpu_devices + smp_processor_id(), sigp_stop, 0);
434 for (;;) ;
435}
436
437/*
209 * This is the main routine where commands issued by other 438 * This is the main routine where commands issued by other
210 * cpus are handled. 439 * cpus are handled.
211 */ 440 */
212 441static void do_ext_call_interrupt(struct ext_code ext_code,
213static void do_ext_call_interrupt(unsigned int ext_int_code,
214 unsigned int param32, unsigned long param64) 442 unsigned int param32, unsigned long param64)
215{ 443{
216 unsigned long bits; 444 unsigned long bits;
445 int cpu;
217 446
218 if ((ext_int_code & 0xffff) == 0x1202) 447 cpu = smp_processor_id();
219 kstat_cpu(smp_processor_id()).irqs[EXTINT_EXC]++; 448 if (ext_code.code == 0x1202)
449 kstat_cpu(cpu).irqs[EXTINT_EXC]++;
220 else 450 else
221 kstat_cpu(smp_processor_id()).irqs[EXTINT_EMS]++; 451 kstat_cpu(cpu).irqs[EXTINT_EMS]++;
222 /* 452 /*
223 * handle bit signal external calls 453 * handle bit signal external calls
224 */ 454 */
225 bits = xchg(&S390_lowcore.ext_call_fast, 0); 455 bits = xchg(&pcpu_devices[cpu].ec_mask, 0);
226 456
227 if (test_bit(ec_stop_cpu, &bits)) 457 if (test_bit(ec_stop_cpu, &bits))
228 smp_stop_cpu(); 458 smp_stop_cpu();
@@ -238,38 +468,17 @@ static void do_ext_call_interrupt(unsigned int ext_int_code,
238 468
239} 469}
240 470
241/*
242 * Send an external call sigp to another cpu and return without waiting
243 * for its completion.
244 */
245static void smp_ext_bitcall(int cpu, int sig)
246{
247 int order;
248
249 /*
250 * Set signaling bit in lowcore of target cpu and kick it
251 */
252 set_bit(sig, (unsigned long *) &lowcore_ptr[cpu]->ext_call_fast);
253 while (1) {
254 order = smp_vcpu_scheduled(cpu) ?
255 sigp_external_call : sigp_emergency_signal;
256 if (sigp(cpu, order) != sigp_busy)
257 break;
258 udelay(10);
259 }
260}
261
262void arch_send_call_function_ipi_mask(const struct cpumask *mask) 471void arch_send_call_function_ipi_mask(const struct cpumask *mask)
263{ 472{
264 int cpu; 473 int cpu;
265 474
266 for_each_cpu(cpu, mask) 475 for_each_cpu(cpu, mask)
267 smp_ext_bitcall(cpu, ec_call_function); 476 pcpu_ec_call(pcpu_devices + cpu, ec_call_function);
268} 477}
269 478
270void arch_send_call_function_single_ipi(int cpu) 479void arch_send_call_function_single_ipi(int cpu)
271{ 480{
272 smp_ext_bitcall(cpu, ec_call_function_single); 481 pcpu_ec_call(pcpu_devices + cpu, ec_call_function_single);
273} 482}
274 483
275#ifndef CONFIG_64BIT 484#ifndef CONFIG_64BIT
@@ -295,15 +504,16 @@ EXPORT_SYMBOL(smp_ptlb_all);
295 */ 504 */
296void smp_send_reschedule(int cpu) 505void smp_send_reschedule(int cpu)
297{ 506{
298 smp_ext_bitcall(cpu, ec_schedule); 507 pcpu_ec_call(pcpu_devices + cpu, ec_schedule);
299} 508}
300 509
301/* 510/*
302 * parameter area for the set/clear control bit callbacks 511 * parameter area for the set/clear control bit callbacks
303 */ 512 */
304struct ec_creg_mask_parms { 513struct ec_creg_mask_parms {
305 unsigned long orvals[16]; 514 unsigned long orval;
306 unsigned long andvals[16]; 515 unsigned long andval;
516 int cr;
307}; 517};
308 518
309/* 519/*
@@ -313,11 +523,9 @@ static void smp_ctl_bit_callback(void *info)
313{ 523{
314 struct ec_creg_mask_parms *pp = info; 524 struct ec_creg_mask_parms *pp = info;
315 unsigned long cregs[16]; 525 unsigned long cregs[16];
316 int i;
317 526
318 __ctl_store(cregs, 0, 15); 527 __ctl_store(cregs, 0, 15);
319 for (i = 0; i <= 15; i++) 528 cregs[pp->cr] = (cregs[pp->cr] & pp->andval) | pp->orval;
320 cregs[i] = (cregs[i] & pp->andvals[i]) | pp->orvals[i];
321 __ctl_load(cregs, 0, 15); 529 __ctl_load(cregs, 0, 15);
322} 530}
323 531
@@ -326,11 +534,8 @@ static void smp_ctl_bit_callback(void *info)
326 */ 534 */
327void smp_ctl_set_bit(int cr, int bit) 535void smp_ctl_set_bit(int cr, int bit)
328{ 536{
329 struct ec_creg_mask_parms parms; 537 struct ec_creg_mask_parms parms = { 1UL << bit, -1UL, cr };
330 538
331 memset(&parms.orvals, 0, sizeof(parms.orvals));
332 memset(&parms.andvals, 0xff, sizeof(parms.andvals));
333 parms.orvals[cr] = 1UL << bit;
334 on_each_cpu(smp_ctl_bit_callback, &parms, 1); 539 on_each_cpu(smp_ctl_bit_callback, &parms, 1);
335} 540}
336EXPORT_SYMBOL(smp_ctl_set_bit); 541EXPORT_SYMBOL(smp_ctl_set_bit);
@@ -340,220 +545,178 @@ EXPORT_SYMBOL(smp_ctl_set_bit);
340 */ 545 */
341void smp_ctl_clear_bit(int cr, int bit) 546void smp_ctl_clear_bit(int cr, int bit)
342{ 547{
343 struct ec_creg_mask_parms parms; 548 struct ec_creg_mask_parms parms = { 0, ~(1UL << bit), cr };
344 549
345 memset(&parms.orvals, 0, sizeof(parms.orvals));
346 memset(&parms.andvals, 0xff, sizeof(parms.andvals));
347 parms.andvals[cr] = ~(1UL << bit);
348 on_each_cpu(smp_ctl_bit_callback, &parms, 1); 550 on_each_cpu(smp_ctl_bit_callback, &parms, 1);
349} 551}
350EXPORT_SYMBOL(smp_ctl_clear_bit); 552EXPORT_SYMBOL(smp_ctl_clear_bit);
351 553
352#if defined(CONFIG_ZFCPDUMP) || defined(CONFIG_CRASH_DUMP) 554#if defined(CONFIG_ZFCPDUMP) || defined(CONFIG_CRASH_DUMP)
353 555
354static void __init smp_get_save_area(unsigned int cpu, unsigned int phy_cpu) 556struct save_area *zfcpdump_save_areas[NR_CPUS + 1];
557EXPORT_SYMBOL_GPL(zfcpdump_save_areas);
558
559static void __init smp_get_save_area(int cpu, u16 address)
355{ 560{
356 if (ipl_info.type != IPL_TYPE_FCP_DUMP && !OLDMEM_BASE) 561 void *lc = pcpu_devices[0].lowcore;
357 return; 562 struct save_area *save_area;
563
358 if (is_kdump_kernel()) 564 if (is_kdump_kernel())
359 return; 565 return;
566 if (!OLDMEM_BASE && (address == boot_cpu_address ||
567 ipl_info.type != IPL_TYPE_FCP_DUMP))
568 return;
360 if (cpu >= NR_CPUS) { 569 if (cpu >= NR_CPUS) {
361 pr_warning("CPU %i exceeds the maximum %i and is excluded from " 570 pr_warning("CPU %i exceeds the maximum %i and is excluded "
362 "the dump\n", cpu, NR_CPUS - 1); 571 "from the dump\n", cpu, NR_CPUS - 1);
363 return; 572 return;
364 } 573 }
365 zfcpdump_save_areas[cpu] = kmalloc(sizeof(struct save_area), GFP_KERNEL); 574 save_area = kmalloc(sizeof(struct save_area), GFP_KERNEL);
366 while (raw_sigp(phy_cpu, sigp_stop_and_store_status) == sigp_busy) 575 if (!save_area)
367 cpu_relax(); 576 panic("could not allocate memory for save area\n");
368 memcpy_real(zfcpdump_save_areas[cpu], 577 zfcpdump_save_areas[cpu] = save_area;
369 (void *)(unsigned long) store_prefix() + SAVE_AREA_BASE, 578#ifdef CONFIG_CRASH_DUMP
370 sizeof(struct save_area)); 579 if (address == boot_cpu_address) {
580 /* Copy the registers of the boot cpu. */
581 copy_oldmem_page(1, (void *) save_area, sizeof(*save_area),
582 SAVE_AREA_BASE - PAGE_SIZE, 0);
583 return;
584 }
585#endif
586 /* Get the registers of a non-boot cpu. */
587 __pcpu_sigp_relax(address, sigp_stop_and_store_status, 0, NULL);
588 memcpy_real(save_area, lc + SAVE_AREA_BASE, sizeof(*save_area));
371} 589}
372 590
373struct save_area *zfcpdump_save_areas[NR_CPUS + 1]; 591int smp_store_status(int cpu)
374EXPORT_SYMBOL_GPL(zfcpdump_save_areas);
375
376#else
377
378static inline void smp_get_save_area(unsigned int cpu, unsigned int phy_cpu) { }
379
380#endif /* CONFIG_ZFCPDUMP */
381
382static int cpu_known(int cpu_id)
383{ 592{
384 int cpu; 593 struct pcpu *pcpu;
385 594
386 for_each_present_cpu(cpu) { 595 pcpu = pcpu_devices + cpu;
387 if (__cpu_logical_map[cpu] == cpu_id) 596 if (__pcpu_sigp_relax(pcpu->address, sigp_stop_and_store_status,
388 return 1; 597 0, NULL) != sigp_order_code_accepted)
389 } 598 return -EIO;
390 return 0; 599 return 0;
391} 600}
392 601
393static int smp_rescan_cpus_sigp(cpumask_t avail) 602#else /* CONFIG_ZFCPDUMP || CONFIG_CRASH_DUMP */
394{
395 int cpu_id, logical_cpu;
396 603
397 logical_cpu = cpumask_first(&avail); 604static inline void smp_get_save_area(int cpu, u16 address) { }
398 if (logical_cpu >= nr_cpu_ids)
399 return 0;
400 for (cpu_id = 0; cpu_id <= MAX_CPU_ADDRESS; cpu_id++) {
401 if (cpu_known(cpu_id))
402 continue;
403 __cpu_logical_map[logical_cpu] = cpu_id;
404 cpu_set_polarization(logical_cpu, POLARIZATION_UNKNOWN);
405 if (!cpu_stopped(logical_cpu))
406 continue;
407 set_cpu_present(logical_cpu, true);
408 smp_cpu_state[logical_cpu] = CPU_STATE_CONFIGURED;
409 logical_cpu = cpumask_next(logical_cpu, &avail);
410 if (logical_cpu >= nr_cpu_ids)
411 break;
412 }
413 return 0;
414}
415 605
416static int smp_rescan_cpus_sclp(cpumask_t avail) 606#endif /* CONFIG_ZFCPDUMP || CONFIG_CRASH_DUMP */
607
608static struct sclp_cpu_info *smp_get_cpu_info(void)
417{ 609{
610 static int use_sigp_detection;
418 struct sclp_cpu_info *info; 611 struct sclp_cpu_info *info;
419 int cpu_id, logical_cpu, cpu; 612 int address;
420 int rc; 613
421 614 info = kzalloc(sizeof(*info), GFP_KERNEL);
422 logical_cpu = cpumask_first(&avail); 615 if (info && (use_sigp_detection || sclp_get_cpu_info(info))) {
423 if (logical_cpu >= nr_cpu_ids) 616 use_sigp_detection = 1;
424 return 0; 617 for (address = 0; address <= MAX_CPU_ADDRESS; address++) {
425 info = kmalloc(sizeof(*info), GFP_KERNEL); 618 if (__pcpu_sigp_relax(address, sigp_sense, 0, NULL) ==
426 if (!info) 619 sigp_not_operational)
427 return -ENOMEM; 620 continue;
428 rc = sclp_get_cpu_info(info); 621 info->cpu[info->configured].address = address;
429 if (rc) 622 info->configured++;
430 goto out; 623 }
431 for (cpu = 0; cpu < info->combined; cpu++) { 624 info->combined = info->configured;
432 if (info->has_cpu_type && info->cpu[cpu].type != smp_cpu_type)
433 continue;
434 cpu_id = info->cpu[cpu].address;
435 if (cpu_known(cpu_id))
436 continue;
437 __cpu_logical_map[logical_cpu] = cpu_id;
438 cpu_set_polarization(logical_cpu, POLARIZATION_UNKNOWN);
439 set_cpu_present(logical_cpu, true);
440 if (cpu >= info->configured)
441 smp_cpu_state[logical_cpu] = CPU_STATE_STANDBY;
442 else
443 smp_cpu_state[logical_cpu] = CPU_STATE_CONFIGURED;
444 logical_cpu = cpumask_next(logical_cpu, &avail);
445 if (logical_cpu >= nr_cpu_ids)
446 break;
447 } 625 }
448out: 626 return info;
449 kfree(info);
450 return rc;
451} 627}
452 628
453static int __smp_rescan_cpus(void) 629static int __devinit smp_add_present_cpu(int cpu);
630
631static int __devinit __smp_rescan_cpus(struct sclp_cpu_info *info,
632 int sysfs_add)
454{ 633{
634 struct pcpu *pcpu;
455 cpumask_t avail; 635 cpumask_t avail;
636 int cpu, nr, i;
456 637
638 nr = 0;
457 cpumask_xor(&avail, cpu_possible_mask, cpu_present_mask); 639 cpumask_xor(&avail, cpu_possible_mask, cpu_present_mask);
458 if (smp_use_sigp_detection) 640 cpu = cpumask_first(&avail);
459 return smp_rescan_cpus_sigp(avail); 641 for (i = 0; (i < info->combined) && (cpu < nr_cpu_ids); i++) {
460 else 642 if (info->has_cpu_type && info->cpu[i].type != boot_cpu_type)
461 return smp_rescan_cpus_sclp(avail); 643 continue;
644 if (pcpu_find_address(cpu_present_mask, info->cpu[i].address))
645 continue;
646 pcpu = pcpu_devices + cpu;
647 pcpu->address = info->cpu[i].address;
648 pcpu->state = (cpu >= info->configured) ?
649 CPU_STATE_STANDBY : CPU_STATE_CONFIGURED;
650 cpu_set_polarization(cpu, POLARIZATION_UNKNOWN);
651 set_cpu_present(cpu, true);
652 if (sysfs_add && smp_add_present_cpu(cpu) != 0)
653 set_cpu_present(cpu, false);
654 else
655 nr++;
656 cpu = cpumask_next(cpu, &avail);
657 }
658 return nr;
462} 659}
463 660
464static void __init smp_detect_cpus(void) 661static void __init smp_detect_cpus(void)
465{ 662{
466 unsigned int cpu, c_cpus, s_cpus; 663 unsigned int cpu, c_cpus, s_cpus;
467 struct sclp_cpu_info *info; 664 struct sclp_cpu_info *info;
468 u16 boot_cpu_addr, cpu_addr;
469 665
470 c_cpus = 1; 666 info = smp_get_cpu_info();
471 s_cpus = 0;
472 boot_cpu_addr = __cpu_logical_map[0];
473 info = kmalloc(sizeof(*info), GFP_KERNEL);
474 if (!info) 667 if (!info)
475 panic("smp_detect_cpus failed to allocate memory\n"); 668 panic("smp_detect_cpus failed to allocate memory\n");
476#ifdef CONFIG_CRASH_DUMP
477 if (OLDMEM_BASE && !is_kdump_kernel()) {
478 struct save_area *save_area;
479
480 save_area = kmalloc(sizeof(*save_area), GFP_KERNEL);
481 if (!save_area)
482 panic("could not allocate memory for save area\n");
483 copy_oldmem_page(1, (void *) save_area, sizeof(*save_area),
484 0x200, 0);
485 zfcpdump_save_areas[0] = save_area;
486 }
487#endif
488 /* Use sigp detection algorithm if sclp doesn't work. */
489 if (sclp_get_cpu_info(info)) {
490 smp_use_sigp_detection = 1;
491 for (cpu = 0; cpu <= MAX_CPU_ADDRESS; cpu++) {
492 if (cpu == boot_cpu_addr)
493 continue;
494 if (!raw_cpu_stopped(cpu))
495 continue;
496 smp_get_save_area(c_cpus, cpu);
497 c_cpus++;
498 }
499 goto out;
500 }
501
502 if (info->has_cpu_type) { 669 if (info->has_cpu_type) {
503 for (cpu = 0; cpu < info->combined; cpu++) { 670 for (cpu = 0; cpu < info->combined; cpu++) {
504 if (info->cpu[cpu].address == boot_cpu_addr) { 671 if (info->cpu[cpu].address != boot_cpu_address)
505 smp_cpu_type = info->cpu[cpu].type; 672 continue;
506 break; 673 /* The boot cpu dictates the cpu type. */
507 } 674 boot_cpu_type = info->cpu[cpu].type;
675 break;
508 } 676 }
509 } 677 }
510 678 c_cpus = s_cpus = 0;
511 for (cpu = 0; cpu < info->combined; cpu++) { 679 for (cpu = 0; cpu < info->combined; cpu++) {
512 if (info->has_cpu_type && info->cpu[cpu].type != smp_cpu_type) 680 if (info->has_cpu_type && info->cpu[cpu].type != boot_cpu_type)
513 continue; 681 continue;
514 cpu_addr = info->cpu[cpu].address; 682 if (cpu < info->configured) {
515 if (cpu_addr == boot_cpu_addr) 683 smp_get_save_area(c_cpus, info->cpu[cpu].address);
516 continue; 684 c_cpus++;
517 if (!raw_cpu_stopped(cpu_addr)) { 685 } else
518 s_cpus++; 686 s_cpus++;
519 continue;
520 }
521 smp_get_save_area(c_cpus, cpu_addr);
522 c_cpus++;
523 } 687 }
524out:
525 kfree(info);
526 pr_info("%d configured CPUs, %d standby CPUs\n", c_cpus, s_cpus); 688 pr_info("%d configured CPUs, %d standby CPUs\n", c_cpus, s_cpus);
527 get_online_cpus(); 689 get_online_cpus();
528 __smp_rescan_cpus(); 690 __smp_rescan_cpus(info, 0);
529 put_online_cpus(); 691 put_online_cpus();
692 kfree(info);
530} 693}
531 694
532/* 695/*
533 * Activate a secondary processor. 696 * Activate a secondary processor.
534 */ 697 */
535int __cpuinit start_secondary(void *cpuvoid) 698static void __cpuinit smp_start_secondary(void *cpuvoid)
536{ 699{
700 S390_lowcore.last_update_clock = get_clock();
701 S390_lowcore.restart_stack = (unsigned long) restart_stack;
702 S390_lowcore.restart_fn = (unsigned long) do_restart;
703 S390_lowcore.restart_data = 0;
704 S390_lowcore.restart_source = -1UL;
705 restore_access_regs(S390_lowcore.access_regs_save_area);
706 __ctl_load(S390_lowcore.cregs_save_area, 0, 15);
707 __load_psw_mask(psw_kernel_bits | PSW_MASK_DAT);
537 cpu_init(); 708 cpu_init();
538 preempt_disable(); 709 preempt_disable();
539 init_cpu_timer(); 710 init_cpu_timer();
540 init_cpu_vtimer(); 711 init_cpu_vtimer();
541 pfault_init(); 712 pfault_init();
542
543 notify_cpu_starting(smp_processor_id()); 713 notify_cpu_starting(smp_processor_id());
544 ipi_call_lock(); 714 ipi_call_lock();
545 set_cpu_online(smp_processor_id(), true); 715 set_cpu_online(smp_processor_id(), true);
546 ipi_call_unlock(); 716 ipi_call_unlock();
547 __ctl_clear_bit(0, 28); /* Disable lowcore protection */
548 S390_lowcore.restart_psw.mask =
549 PSW_DEFAULT_KEY | PSW_MASK_BASE | PSW_MASK_EA | PSW_MASK_BA;
550 S390_lowcore.restart_psw.addr =
551 PSW_ADDR_AMODE | (unsigned long) psw_restart_int_handler;
552 __ctl_set_bit(0, 28); /* Enable lowcore protection */
553 local_irq_enable(); 717 local_irq_enable();
554 /* cpu_idle will call schedule for us */ 718 /* cpu_idle will call schedule for us */
555 cpu_idle(); 719 cpu_idle();
556 return 0;
557} 720}
558 721
559struct create_idle { 722struct create_idle {
@@ -572,82 +735,20 @@ static void __cpuinit smp_fork_idle(struct work_struct *work)
572 complete(&c_idle->done); 735 complete(&c_idle->done);
573} 736}
574 737
575static int __cpuinit smp_alloc_lowcore(int cpu)
576{
577 unsigned long async_stack, panic_stack;
578 struct _lowcore *lowcore;
579
580 lowcore = (void *) __get_free_pages(GFP_KERNEL | GFP_DMA, LC_ORDER);
581 if (!lowcore)
582 return -ENOMEM;
583 async_stack = __get_free_pages(GFP_KERNEL, ASYNC_ORDER);
584 panic_stack = __get_free_page(GFP_KERNEL);
585 if (!panic_stack || !async_stack)
586 goto out;
587 memcpy(lowcore, &S390_lowcore, 512);
588 memset((char *)lowcore + 512, 0, sizeof(*lowcore) - 512);
589 lowcore->async_stack = async_stack + ASYNC_SIZE;
590 lowcore->panic_stack = panic_stack + PAGE_SIZE;
591 lowcore->restart_psw.mask =
592 PSW_DEFAULT_KEY | PSW_MASK_BASE | PSW_MASK_EA | PSW_MASK_BA;
593 lowcore->restart_psw.addr =
594 PSW_ADDR_AMODE | (unsigned long) restart_int_handler;
595 if (user_mode != HOME_SPACE_MODE)
596 lowcore->restart_psw.mask |= PSW_ASC_HOME;
597#ifndef CONFIG_64BIT
598 if (MACHINE_HAS_IEEE) {
599 unsigned long save_area;
600
601 save_area = get_zeroed_page(GFP_KERNEL);
602 if (!save_area)
603 goto out;
604 lowcore->extended_save_area_addr = (u32) save_area;
605 }
606#else
607 if (vdso_alloc_per_cpu(cpu, lowcore))
608 goto out;
609#endif
610 lowcore_ptr[cpu] = lowcore;
611 return 0;
612
613out:
614 free_page(panic_stack);
615 free_pages(async_stack, ASYNC_ORDER);
616 free_pages((unsigned long) lowcore, LC_ORDER);
617 return -ENOMEM;
618}
619
620static void smp_free_lowcore(int cpu)
621{
622 struct _lowcore *lowcore;
623
624 lowcore = lowcore_ptr[cpu];
625#ifndef CONFIG_64BIT
626 if (MACHINE_HAS_IEEE)
627 free_page((unsigned long) lowcore->extended_save_area_addr);
628#else
629 vdso_free_per_cpu(cpu, lowcore);
630#endif
631 free_page(lowcore->panic_stack - PAGE_SIZE);
632 free_pages(lowcore->async_stack - ASYNC_SIZE, ASYNC_ORDER);
633 free_pages((unsigned long) lowcore, LC_ORDER);
634 lowcore_ptr[cpu] = NULL;
635}
636
637/* Upping and downing of CPUs */ 738/* Upping and downing of CPUs */
638int __cpuinit __cpu_up(unsigned int cpu) 739int __cpuinit __cpu_up(unsigned int cpu)
639{ 740{
640 struct _lowcore *cpu_lowcore;
641 struct create_idle c_idle; 741 struct create_idle c_idle;
642 struct task_struct *idle; 742 struct pcpu *pcpu;
643 struct stack_frame *sf; 743 int rc;
644 u32 lowcore;
645 int ccode;
646 744
647 if (smp_cpu_state[cpu] != CPU_STATE_CONFIGURED) 745 pcpu = pcpu_devices + cpu;
746 if (pcpu->state != CPU_STATE_CONFIGURED)
747 return -EIO;
748 if (pcpu_sigp_retry(pcpu, sigp_initial_cpu_reset, 0) !=
749 sigp_order_code_accepted)
648 return -EIO; 750 return -EIO;
649 idle = current_set[cpu]; 751 if (!pcpu->idle) {
650 if (!idle) {
651 c_idle.done = COMPLETION_INITIALIZER_ONSTACK(c_idle.done); 752 c_idle.done = COMPLETION_INITIALIZER_ONSTACK(c_idle.done);
652 INIT_WORK_ONSTACK(&c_idle.work, smp_fork_idle); 753 INIT_WORK_ONSTACK(&c_idle.work, smp_fork_idle);
653 c_idle.cpu = cpu; 754 c_idle.cpu = cpu;
@@ -655,68 +756,28 @@ int __cpuinit __cpu_up(unsigned int cpu)
655 wait_for_completion(&c_idle.done); 756 wait_for_completion(&c_idle.done);
656 if (IS_ERR(c_idle.idle)) 757 if (IS_ERR(c_idle.idle))
657 return PTR_ERR(c_idle.idle); 758 return PTR_ERR(c_idle.idle);
658 idle = c_idle.idle; 759 pcpu->idle = c_idle.idle;
659 current_set[cpu] = c_idle.idle;
660 } 760 }
661 init_idle(idle, cpu); 761 init_idle(pcpu->idle, cpu);
662 if (smp_alloc_lowcore(cpu)) 762 rc = pcpu_alloc_lowcore(pcpu, cpu);
663 return -ENOMEM; 763 if (rc)
664 do { 764 return rc;
665 ccode = sigp(cpu, sigp_initial_cpu_reset); 765 pcpu_prepare_secondary(pcpu, cpu);
666 if (ccode == sigp_busy) 766 pcpu_attach_task(pcpu, pcpu->idle);
667 udelay(10); 767 pcpu_start_fn(pcpu, smp_start_secondary, NULL);
668 if (ccode == sigp_not_operational)
669 goto err_out;
670 } while (ccode == sigp_busy);
671
672 lowcore = (u32)(unsigned long)lowcore_ptr[cpu];
673 while (sigp_p(lowcore, cpu, sigp_set_prefix) == sigp_busy)
674 udelay(10);
675
676 cpu_lowcore = lowcore_ptr[cpu];
677 cpu_lowcore->kernel_stack = (unsigned long)
678 task_stack_page(idle) + THREAD_SIZE;
679 cpu_lowcore->thread_info = (unsigned long) task_thread_info(idle);
680 sf = (struct stack_frame *) (cpu_lowcore->kernel_stack
681 - sizeof(struct pt_regs)
682 - sizeof(struct stack_frame));
683 memset(sf, 0, sizeof(struct stack_frame));
684 sf->gprs[9] = (unsigned long) sf;
685 cpu_lowcore->gpregs_save_area[15] = (unsigned long) sf;
686 __ctl_store(cpu_lowcore->cregs_save_area, 0, 15);
687 atomic_inc(&init_mm.context.attach_count);
688 asm volatile(
689 " stam 0,15,0(%0)"
690 : : "a" (&cpu_lowcore->access_regs_save_area) : "memory");
691 cpu_lowcore->percpu_offset = __per_cpu_offset[cpu];
692 cpu_lowcore->current_task = (unsigned long) idle;
693 cpu_lowcore->cpu_nr = cpu;
694 cpu_lowcore->kernel_asce = S390_lowcore.kernel_asce;
695 cpu_lowcore->machine_flags = S390_lowcore.machine_flags;
696 cpu_lowcore->ftrace_func = S390_lowcore.ftrace_func;
697 memcpy(cpu_lowcore->stfle_fac_list, S390_lowcore.stfle_fac_list,
698 MAX_FACILITY_BIT/8);
699 eieio();
700
701 while (sigp(cpu, sigp_restart) == sigp_busy)
702 udelay(10);
703
704 while (!cpu_online(cpu)) 768 while (!cpu_online(cpu))
705 cpu_relax(); 769 cpu_relax();
706 return 0; 770 return 0;
707
708err_out:
709 smp_free_lowcore(cpu);
710 return -EIO;
711} 771}
712 772
713static int __init setup_possible_cpus(char *s) 773static int __init setup_possible_cpus(char *s)
714{ 774{
715 int pcpus, cpu; 775 int max, cpu;
716 776
717 pcpus = simple_strtoul(s, NULL, 0); 777 if (kstrtoint(s, 0, &max) < 0)
778 return 0;
718 init_cpu_possible(cpumask_of(0)); 779 init_cpu_possible(cpumask_of(0));
719 for (cpu = 1; cpu < pcpus && cpu < nr_cpu_ids; cpu++) 780 for (cpu = 1; cpu < max && cpu < nr_cpu_ids; cpu++)
720 set_cpu_possible(cpu, true); 781 set_cpu_possible(cpu, true);
721 return 0; 782 return 0;
722} 783}
@@ -726,113 +787,79 @@ early_param("possible_cpus", setup_possible_cpus);
726 787
727int __cpu_disable(void) 788int __cpu_disable(void)
728{ 789{
729 struct ec_creg_mask_parms cr_parms; 790 unsigned long cregs[16];
730 int cpu = smp_processor_id();
731
732 set_cpu_online(cpu, false);
733 791
734 /* Disable pfault pseudo page faults on this cpu. */ 792 set_cpu_online(smp_processor_id(), false);
793 /* Disable pseudo page faults on this cpu. */
735 pfault_fini(); 794 pfault_fini();
736 795 /* Disable interrupt sources via control register. */
737 memset(&cr_parms.orvals, 0, sizeof(cr_parms.orvals)); 796 __ctl_store(cregs, 0, 15);
738 memset(&cr_parms.andvals, 0xff, sizeof(cr_parms.andvals)); 797 cregs[0] &= ~0x0000ee70UL; /* disable all external interrupts */
739 798 cregs[6] &= ~0xff000000UL; /* disable all I/O interrupts */
740 /* disable all external interrupts */ 799 cregs[14] &= ~0x1f000000UL; /* disable most machine checks */
741 cr_parms.orvals[0] = 0; 800 __ctl_load(cregs, 0, 15);
742 cr_parms.andvals[0] = ~(1 << 15 | 1 << 14 | 1 << 13 | 1 << 11 |
743 1 << 10 | 1 << 9 | 1 << 6 | 1 << 5 |
744 1 << 4);
745 /* disable all I/O interrupts */
746 cr_parms.orvals[6] = 0;
747 cr_parms.andvals[6] = ~(1 << 31 | 1 << 30 | 1 << 29 | 1 << 28 |
748 1 << 27 | 1 << 26 | 1 << 25 | 1 << 24);
749 /* disable most machine checks */
750 cr_parms.orvals[14] = 0;
751 cr_parms.andvals[14] = ~(1 << 28 | 1 << 27 | 1 << 26 |
752 1 << 25 | 1 << 24);
753
754 smp_ctl_bit_callback(&cr_parms);
755
756 return 0; 801 return 0;
757} 802}
758 803
759void __cpu_die(unsigned int cpu) 804void __cpu_die(unsigned int cpu)
760{ 805{
806 struct pcpu *pcpu;
807
761 /* Wait until target cpu is down */ 808 /* Wait until target cpu is down */
762 while (!cpu_stopped(cpu)) 809 pcpu = pcpu_devices + cpu;
810 while (!pcpu_stopped(pcpu))
763 cpu_relax(); 811 cpu_relax();
764 while (sigp_p(0, cpu, sigp_set_prefix) == sigp_busy) 812 pcpu_free_lowcore(pcpu);
765 udelay(10);
766 smp_free_lowcore(cpu);
767 atomic_dec(&init_mm.context.attach_count); 813 atomic_dec(&init_mm.context.attach_count);
768} 814}
769 815
770void __noreturn cpu_die(void) 816void __noreturn cpu_die(void)
771{ 817{
772 idle_task_exit(); 818 idle_task_exit();
773 while (sigp(smp_processor_id(), sigp_stop) == sigp_busy) 819 pcpu_sigp_retry(pcpu_devices + smp_processor_id(), sigp_stop, 0);
774 cpu_relax(); 820 for (;;) ;
775 for (;;);
776} 821}
777 822
778#endif /* CONFIG_HOTPLUG_CPU */ 823#endif /* CONFIG_HOTPLUG_CPU */
779 824
780void __init smp_prepare_cpus(unsigned int max_cpus) 825static void smp_call_os_info_init_fn(void)
781{ 826{
782#ifndef CONFIG_64BIT 827 int (*init_fn)(void);
783 unsigned long save_area = 0; 828 unsigned long size;
784#endif
785 unsigned long async_stack, panic_stack;
786 struct _lowcore *lowcore;
787 829
788 smp_detect_cpus(); 830 init_fn = os_info_old_entry(OS_INFO_INIT_FN, &size);
831 if (!init_fn)
832 return;
833 init_fn();
834}
789 835
836void __init smp_prepare_cpus(unsigned int max_cpus)
837{
790 /* request the 0x1201 emergency signal external interrupt */ 838 /* request the 0x1201 emergency signal external interrupt */
791 if (register_external_interrupt(0x1201, do_ext_call_interrupt) != 0) 839 if (register_external_interrupt(0x1201, do_ext_call_interrupt) != 0)
792 panic("Couldn't request external interrupt 0x1201"); 840 panic("Couldn't request external interrupt 0x1201");
793 /* request the 0x1202 external call external interrupt */ 841 /* request the 0x1202 external call external interrupt */
794 if (register_external_interrupt(0x1202, do_ext_call_interrupt) != 0) 842 if (register_external_interrupt(0x1202, do_ext_call_interrupt) != 0)
795 panic("Couldn't request external interrupt 0x1202"); 843 panic("Couldn't request external interrupt 0x1202");
796 844 smp_call_os_info_init_fn();
797 /* Reallocate current lowcore, but keep its contents. */ 845 smp_detect_cpus();
798 lowcore = (void *) __get_free_pages(GFP_KERNEL | GFP_DMA, LC_ORDER);
799 panic_stack = __get_free_page(GFP_KERNEL);
800 async_stack = __get_free_pages(GFP_KERNEL, ASYNC_ORDER);
801 BUG_ON(!lowcore || !panic_stack || !async_stack);
802#ifndef CONFIG_64BIT
803 if (MACHINE_HAS_IEEE)
804 save_area = get_zeroed_page(GFP_KERNEL);
805#endif
806 local_irq_disable();
807 local_mcck_disable();
808 lowcore_ptr[smp_processor_id()] = lowcore;
809 *lowcore = S390_lowcore;
810 lowcore->panic_stack = panic_stack + PAGE_SIZE;
811 lowcore->async_stack = async_stack + ASYNC_SIZE;
812#ifndef CONFIG_64BIT
813 if (MACHINE_HAS_IEEE)
814 lowcore->extended_save_area_addr = (u32) save_area;
815#endif
816 set_prefix((u32)(unsigned long) lowcore);
817 local_mcck_enable();
818 local_irq_enable();
819#ifdef CONFIG_64BIT
820 if (vdso_alloc_per_cpu(smp_processor_id(), &S390_lowcore))
821 BUG();
822#endif
823} 846}
824 847
825void __init smp_prepare_boot_cpu(void) 848void __init smp_prepare_boot_cpu(void)
826{ 849{
827 BUG_ON(smp_processor_id() != 0); 850 struct pcpu *pcpu = pcpu_devices;
828 851
829 current_thread_info()->cpu = 0; 852 boot_cpu_address = stap();
830 set_cpu_present(0, true); 853 pcpu->idle = current;
831 set_cpu_online(0, true); 854 pcpu->state = CPU_STATE_CONFIGURED;
855 pcpu->address = boot_cpu_address;
856 pcpu->lowcore = (struct _lowcore *)(unsigned long) store_prefix();
857 pcpu->async_stack = S390_lowcore.async_stack - ASYNC_SIZE;
858 pcpu->panic_stack = S390_lowcore.panic_stack - PAGE_SIZE;
832 S390_lowcore.percpu_offset = __per_cpu_offset[0]; 859 S390_lowcore.percpu_offset = __per_cpu_offset[0];
833 current_set[0] = current;
834 smp_cpu_state[0] = CPU_STATE_CONFIGURED;
835 cpu_set_polarization(0, POLARIZATION_UNKNOWN); 860 cpu_set_polarization(0, POLARIZATION_UNKNOWN);
861 set_cpu_present(0, true);
862 set_cpu_online(0, true);
836} 863}
837 864
838void __init smp_cpus_done(unsigned int max_cpus) 865void __init smp_cpus_done(unsigned int max_cpus)
@@ -842,7 +869,6 @@ void __init smp_cpus_done(unsigned int max_cpus)
842void __init smp_setup_processor_id(void) 869void __init smp_setup_processor_id(void)
843{ 870{
844 S390_lowcore.cpu_nr = 0; 871 S390_lowcore.cpu_nr = 0;
845 __cpu_logical_map[0] = stap();
846} 872}
847 873
848/* 874/*
@@ -858,56 +884,57 @@ int setup_profiling_timer(unsigned int multiplier)
858 884
859#ifdef CONFIG_HOTPLUG_CPU 885#ifdef CONFIG_HOTPLUG_CPU
860static ssize_t cpu_configure_show(struct device *dev, 886static ssize_t cpu_configure_show(struct device *dev,
861 struct device_attribute *attr, char *buf) 887 struct device_attribute *attr, char *buf)
862{ 888{
863 ssize_t count; 889 ssize_t count;
864 890
865 mutex_lock(&smp_cpu_state_mutex); 891 mutex_lock(&smp_cpu_state_mutex);
866 count = sprintf(buf, "%d\n", smp_cpu_state[dev->id]); 892 count = sprintf(buf, "%d\n", pcpu_devices[dev->id].state);
867 mutex_unlock(&smp_cpu_state_mutex); 893 mutex_unlock(&smp_cpu_state_mutex);
868 return count; 894 return count;
869} 895}
870 896
871static ssize_t cpu_configure_store(struct device *dev, 897static ssize_t cpu_configure_store(struct device *dev,
872 struct device_attribute *attr, 898 struct device_attribute *attr,
873 const char *buf, size_t count) 899 const char *buf, size_t count)
874{ 900{
875 int cpu = dev->id; 901 struct pcpu *pcpu;
876 int val, rc; 902 int cpu, val, rc;
877 char delim; 903 char delim;
878 904
879 if (sscanf(buf, "%d %c", &val, &delim) != 1) 905 if (sscanf(buf, "%d %c", &val, &delim) != 1)
880 return -EINVAL; 906 return -EINVAL;
881 if (val != 0 && val != 1) 907 if (val != 0 && val != 1)
882 return -EINVAL; 908 return -EINVAL;
883
884 get_online_cpus(); 909 get_online_cpus();
885 mutex_lock(&smp_cpu_state_mutex); 910 mutex_lock(&smp_cpu_state_mutex);
886 rc = -EBUSY; 911 rc = -EBUSY;
887 /* disallow configuration changes of online cpus and cpu 0 */ 912 /* disallow configuration changes of online cpus and cpu 0 */
913 cpu = dev->id;
888 if (cpu_online(cpu) || cpu == 0) 914 if (cpu_online(cpu) || cpu == 0)
889 goto out; 915 goto out;
916 pcpu = pcpu_devices + cpu;
890 rc = 0; 917 rc = 0;
891 switch (val) { 918 switch (val) {
892 case 0: 919 case 0:
893 if (smp_cpu_state[cpu] == CPU_STATE_CONFIGURED) { 920 if (pcpu->state != CPU_STATE_CONFIGURED)
894 rc = sclp_cpu_deconfigure(__cpu_logical_map[cpu]); 921 break;
895 if (!rc) { 922 rc = sclp_cpu_deconfigure(pcpu->address);
896 smp_cpu_state[cpu] = CPU_STATE_STANDBY; 923 if (rc)
897 cpu_set_polarization(cpu, POLARIZATION_UNKNOWN); 924 break;
898 topology_expect_change(); 925 pcpu->state = CPU_STATE_STANDBY;
899 } 926 cpu_set_polarization(cpu, POLARIZATION_UNKNOWN);
900 } 927 topology_expect_change();
901 break; 928 break;
902 case 1: 929 case 1:
903 if (smp_cpu_state[cpu] == CPU_STATE_STANDBY) { 930 if (pcpu->state != CPU_STATE_STANDBY)
904 rc = sclp_cpu_configure(__cpu_logical_map[cpu]); 931 break;
905 if (!rc) { 932 rc = sclp_cpu_configure(pcpu->address);
906 smp_cpu_state[cpu] = CPU_STATE_CONFIGURED; 933 if (rc)
907 cpu_set_polarization(cpu, POLARIZATION_UNKNOWN); 934 break;
908 topology_expect_change(); 935 pcpu->state = CPU_STATE_CONFIGURED;
909 } 936 cpu_set_polarization(cpu, POLARIZATION_UNKNOWN);
910 } 937 topology_expect_change();
911 break; 938 break;
912 default: 939 default:
913 break; 940 break;
@@ -923,7 +950,7 @@ static DEVICE_ATTR(configure, 0644, cpu_configure_show, cpu_configure_store);
923static ssize_t show_cpu_address(struct device *dev, 950static ssize_t show_cpu_address(struct device *dev,
924 struct device_attribute *attr, char *buf) 951 struct device_attribute *attr, char *buf)
925{ 952{
926 return sprintf(buf, "%d\n", __cpu_logical_map[dev->id]); 953 return sprintf(buf, "%d\n", pcpu_devices[dev->id].address);
927} 954}
928static DEVICE_ATTR(address, 0444, show_cpu_address, NULL); 955static DEVICE_ATTR(address, 0444, show_cpu_address, NULL);
929 956
@@ -955,22 +982,16 @@ static DEVICE_ATTR(capability, 0444, show_capability, NULL);
955static ssize_t show_idle_count(struct device *dev, 982static ssize_t show_idle_count(struct device *dev,
956 struct device_attribute *attr, char *buf) 983 struct device_attribute *attr, char *buf)
957{ 984{
958 struct s390_idle_data *idle; 985 struct s390_idle_data *idle = &per_cpu(s390_idle, dev->id);
959 unsigned long long idle_count; 986 unsigned long long idle_count;
960 unsigned int sequence; 987 unsigned int sequence;
961 988
962 idle = &per_cpu(s390_idle, dev->id); 989 do {
963repeat: 990 sequence = ACCESS_ONCE(idle->sequence);
964 sequence = idle->sequence; 991 idle_count = ACCESS_ONCE(idle->idle_count);
965 smp_rmb(); 992 if (ACCESS_ONCE(idle->idle_enter))
966 if (sequence & 1) 993 idle_count++;
967 goto repeat; 994 } while ((sequence & 1) || (idle->sequence != sequence));
968 idle_count = idle->idle_count;
969 if (idle->idle_enter)
970 idle_count++;
971 smp_rmb();
972 if (idle->sequence != sequence)
973 goto repeat;
974 return sprintf(buf, "%llu\n", idle_count); 995 return sprintf(buf, "%llu\n", idle_count);
975} 996}
976static DEVICE_ATTR(idle_count, 0444, show_idle_count, NULL); 997static DEVICE_ATTR(idle_count, 0444, show_idle_count, NULL);
@@ -978,24 +999,18 @@ static DEVICE_ATTR(idle_count, 0444, show_idle_count, NULL);
978static ssize_t show_idle_time(struct device *dev, 999static ssize_t show_idle_time(struct device *dev,
979 struct device_attribute *attr, char *buf) 1000 struct device_attribute *attr, char *buf)
980{ 1001{
981 struct s390_idle_data *idle; 1002 struct s390_idle_data *idle = &per_cpu(s390_idle, dev->id);
982 unsigned long long now, idle_time, idle_enter; 1003 unsigned long long now, idle_time, idle_enter, idle_exit;
983 unsigned int sequence; 1004 unsigned int sequence;
984 1005
985 idle = &per_cpu(s390_idle, dev->id); 1006 do {
986 now = get_clock(); 1007 now = get_clock();
987repeat: 1008 sequence = ACCESS_ONCE(idle->sequence);
988 sequence = idle->sequence; 1009 idle_time = ACCESS_ONCE(idle->idle_time);
989 smp_rmb(); 1010 idle_enter = ACCESS_ONCE(idle->idle_enter);
990 if (sequence & 1) 1011 idle_exit = ACCESS_ONCE(idle->idle_exit);
991 goto repeat; 1012 } while ((sequence & 1) || (idle->sequence != sequence));
992 idle_time = idle->idle_time; 1013 idle_time += idle_enter ? ((idle_exit ? : now) - idle_enter) : 0;
993 idle_enter = idle->idle_enter;
994 if (idle_enter != 0ULL && idle_enter < now)
995 idle_time += now - idle_enter;
996 smp_rmb();
997 if (idle->sequence != sequence)
998 goto repeat;
999 return sprintf(buf, "%llu\n", idle_time >> 12); 1014 return sprintf(buf, "%llu\n", idle_time >> 12);
1000} 1015}
1001static DEVICE_ATTR(idle_time_us, 0444, show_idle_time, NULL); 1016static DEVICE_ATTR(idle_time_us, 0444, show_idle_time, NULL);
@@ -1015,7 +1030,7 @@ static int __cpuinit smp_cpu_notify(struct notifier_block *self,
1015 unsigned long action, void *hcpu) 1030 unsigned long action, void *hcpu)
1016{ 1031{
1017 unsigned int cpu = (unsigned int)(long)hcpu; 1032 unsigned int cpu = (unsigned int)(long)hcpu;
1018 struct cpu *c = &per_cpu(cpu_devices, cpu); 1033 struct cpu *c = &pcpu_devices[cpu].cpu;
1019 struct device *s = &c->dev; 1034 struct device *s = &c->dev;
1020 struct s390_idle_data *idle; 1035 struct s390_idle_data *idle;
1021 int err = 0; 1036 int err = 0;
@@ -1041,7 +1056,7 @@ static struct notifier_block __cpuinitdata smp_cpu_nb = {
1041 1056
1042static int __devinit smp_add_present_cpu(int cpu) 1057static int __devinit smp_add_present_cpu(int cpu)
1043{ 1058{
1044 struct cpu *c = &per_cpu(cpu_devices, cpu); 1059 struct cpu *c = &pcpu_devices[cpu].cpu;
1045 struct device *s = &c->dev; 1060 struct device *s = &c->dev;
1046 int rc; 1061 int rc;
1047 1062
@@ -1079,29 +1094,21 @@ out:
1079 1094
1080int __ref smp_rescan_cpus(void) 1095int __ref smp_rescan_cpus(void)
1081{ 1096{
1082 cpumask_t newcpus; 1097 struct sclp_cpu_info *info;
1083 int cpu; 1098 int nr;
1084 int rc;
1085 1099
1100 info = smp_get_cpu_info();
1101 if (!info)
1102 return -ENOMEM;
1086 get_online_cpus(); 1103 get_online_cpus();
1087 mutex_lock(&smp_cpu_state_mutex); 1104 mutex_lock(&smp_cpu_state_mutex);
1088 cpumask_copy(&newcpus, cpu_present_mask); 1105 nr = __smp_rescan_cpus(info, 1);
1089 rc = __smp_rescan_cpus();
1090 if (rc)
1091 goto out;
1092 cpumask_andnot(&newcpus, cpu_present_mask, &newcpus);
1093 for_each_cpu(cpu, &newcpus) {
1094 rc = smp_add_present_cpu(cpu);
1095 if (rc)
1096 set_cpu_present(cpu, false);
1097 }
1098 rc = 0;
1099out:
1100 mutex_unlock(&smp_cpu_state_mutex); 1106 mutex_unlock(&smp_cpu_state_mutex);
1101 put_online_cpus(); 1107 put_online_cpus();
1102 if (!cpumask_empty(&newcpus)) 1108 kfree(info);
1109 if (nr)
1103 topology_schedule_update(); 1110 topology_schedule_update();
1104 return rc; 1111 return 0;
1105} 1112}
1106 1113
1107static ssize_t __ref rescan_store(struct device *dev, 1114static ssize_t __ref rescan_store(struct device *dev,