]> bbs.cooldavid.org Git - net-next-2.6.git/blame - arch/s390/kernel/smp.c
[S390] cpu topology support for s390.
[net-next-2.6.git] / arch / s390 / kernel / smp.c
CommitLineData
1da177e4
LT
1/*
2 * arch/s390/kernel/smp.c
3 *
39ce010d 4 * Copyright IBM Corp. 1999,2007
1da177e4 5 * Author(s): Denis Joseph Barrow (djbarrow@de.ibm.com,barrow_dj@yahoo.com),
39ce010d
HC
6 * Martin Schwidefsky (schwidefsky@de.ibm.com)
7 * Heiko Carstens (heiko.carstens@de.ibm.com)
1da177e4 8 *
39ce010d 9 * based on other smp stuff by
1da177e4
LT
10 * (c) 1995 Alan Cox, CymruNET Ltd <alan@cymru.net>
11 * (c) 1998 Ingo Molnar
12 *
13 * We work with logical cpu numbering everywhere we can. The only
14 * functions using the real cpu address (got from STAP) are the sigp
15 * functions. For all other functions we use the identity mapping.
16 * That means that cpu_number_map[i] == i for every cpu. cpu_number_map is
17 * used e.g. to find the idle task belonging to a logical cpu. Every array
18 * in the kernel is sorted by the logical cpu number and not by the physical
19 * one which is causing all the confusion with __cpu_logical_map and
20 * cpu_number_map in other architectures.
21 */
22
23#include <linux/module.h>
24#include <linux/init.h>
1da177e4 25#include <linux/mm.h>
4e950f6f 26#include <linux/err.h>
1da177e4
LT
27#include <linux/spinlock.h>
28#include <linux/kernel_stat.h>
1da177e4
LT
29#include <linux/delay.h>
30#include <linux/cache.h>
31#include <linux/interrupt.h>
32#include <linux/cpu.h>
2b67fc46 33#include <linux/timex.h>
411ed322 34#include <linux/bootmem.h>
46b05d26 35#include <asm/ipl.h>
2b67fc46 36#include <asm/setup.h>
1da177e4
LT
37#include <asm/sigp.h>
38#include <asm/pgalloc.h>
39#include <asm/irq.h>
40#include <asm/s390_ext.h>
41#include <asm/cpcmd.h>
42#include <asm/tlbflush.h>
2b67fc46 43#include <asm/timer.h>
411ed322 44#include <asm/lowcore.h>
08d07968 45#include <asm/sclp.h>
fae8b22d 46#include <asm/cpu.h>
1da177e4 47
1da177e4
LT
48/*
49 * An array with a pointer the lowcore of every CPU.
50 */
1da177e4 51struct _lowcore *lowcore_ptr[NR_CPUS];
39ce010d 52EXPORT_SYMBOL(lowcore_ptr);
1da177e4 53
255acee7 54cpumask_t cpu_online_map = CPU_MASK_NONE;
39ce010d
HC
55EXPORT_SYMBOL(cpu_online_map);
56
48483b32 57cpumask_t cpu_possible_map = CPU_MASK_ALL;
39ce010d 58EXPORT_SYMBOL(cpu_possible_map);
1da177e4
LT
59
60static struct task_struct *current_set[NR_CPUS];
61
08d07968
HC
62static u8 smp_cpu_type;
63static int smp_use_sigp_detection;
64
65enum s390_cpu_state {
66 CPU_STATE_STANDBY,
67 CPU_STATE_CONFIGURED,
68};
69
dbd70fb4 70DEFINE_MUTEX(smp_cpu_state_mutex);
08d07968
HC
71static int smp_cpu_state[NR_CPUS];
72
73static DEFINE_PER_CPU(struct cpu, cpu_devices);
74DEFINE_PER_CPU(struct s390_idle_data, s390_idle);
75
1da177e4 76static void smp_ext_bitcall(int, ec_bit_sig);
1da177e4
LT
77
78/*
63db6e8d
JG
79 * Structure and data for __smp_call_function_map(). This is designed to
80 * minimise static memory requirements. It also looks cleaner.
1da177e4
LT
81 */
82static DEFINE_SPINLOCK(call_lock);
83
84struct call_data_struct {
85 void (*func) (void *info);
86 void *info;
63db6e8d
JG
87 cpumask_t started;
88 cpumask_t finished;
1da177e4
LT
89 int wait;
90};
91
39ce010d 92static struct call_data_struct *call_data;
1da177e4
LT
93
94/*
95 * 'Call function' interrupt callback
96 */
97static void do_call_function(void)
98{
99 void (*func) (void *info) = call_data->func;
100 void *info = call_data->info;
101 int wait = call_data->wait;
102
63db6e8d 103 cpu_set(smp_processor_id(), call_data->started);
1da177e4
LT
104 (*func)(info);
105 if (wait)
63db6e8d 106 cpu_set(smp_processor_id(), call_data->finished);;
1da177e4
LT
107}
108
63db6e8d
JG
109static void __smp_call_function_map(void (*func) (void *info), void *info,
110 int nonatomic, int wait, cpumask_t map)
1da177e4
LT
111{
112 struct call_data_struct data;
63db6e8d 113 int cpu, local = 0;
1da177e4 114
63db6e8d 115 /*
25864162 116 * Can deadlock when interrupts are disabled or if in wrong context.
63db6e8d 117 */
25864162 118 WARN_ON(irqs_disabled() || in_irq());
1da177e4 119
63db6e8d
JG
120 /*
121 * Check for local function call. We have to have the same call order
122 * as in on_each_cpu() because of machine_restart_smp().
123 */
124 if (cpu_isset(smp_processor_id(), map)) {
125 local = 1;
126 cpu_clear(smp_processor_id(), map);
127 }
128
129 cpus_and(map, map, cpu_online_map);
130 if (cpus_empty(map))
131 goto out;
1da177e4
LT
132
133 data.func = func;
134 data.info = info;
63db6e8d 135 data.started = CPU_MASK_NONE;
1da177e4
LT
136 data.wait = wait;
137 if (wait)
63db6e8d 138 data.finished = CPU_MASK_NONE;
1da177e4 139
8da1aecd 140 spin_lock(&call_lock);
1da177e4 141 call_data = &data;
63db6e8d
JG
142
143 for_each_cpu_mask(cpu, map)
144 smp_ext_bitcall(cpu, ec_call_function);
1da177e4
LT
145
146 /* Wait for response */
63db6e8d 147 while (!cpus_equal(map, data.started))
1da177e4 148 cpu_relax();
1da177e4 149 if (wait)
63db6e8d 150 while (!cpus_equal(map, data.finished))
1da177e4 151 cpu_relax();
8da1aecd 152 spin_unlock(&call_lock);
63db6e8d 153out:
8da1aecd
HC
154 if (local) {
155 local_irq_disable();
63db6e8d 156 func(info);
8da1aecd
HC
157 local_irq_enable();
158 }
1da177e4
LT
159}
160
161/*
63db6e8d
JG
162 * smp_call_function:
163 * @func: the function to run; this must be fast and non-blocking
164 * @info: an arbitrary pointer to pass to the function
165 * @nonatomic: unused
166 * @wait: if true, wait (atomically) until function has completed on other CPUs
1da177e4 167 *
63db6e8d 168 * Run a function on all other CPUs.
1da177e4 169 *
39ce010d
HC
170 * You must not call this function with disabled interrupts, from a
171 * hardware interrupt handler or from a bottom half.
1da177e4 172 */
63db6e8d
JG
173int smp_call_function(void (*func) (void *info), void *info, int nonatomic,
174 int wait)
1da177e4 175{
63db6e8d 176 cpumask_t map;
1da177e4 177
25864162 178 preempt_disable();
63db6e8d
JG
179 map = cpu_online_map;
180 cpu_clear(smp_processor_id(), map);
181 __smp_call_function_map(func, info, nonatomic, wait, map);
25864162 182 preempt_enable();
63db6e8d
JG
183 return 0;
184}
185EXPORT_SYMBOL(smp_call_function);
1da177e4 186
63db6e8d 187/*
3bb447fc
HC
188 * smp_call_function_single:
189 * @cpu: the CPU where func should run
63db6e8d
JG
190 * @func: the function to run; this must be fast and non-blocking
191 * @info: an arbitrary pointer to pass to the function
192 * @nonatomic: unused
193 * @wait: if true, wait (atomically) until function has completed on other CPUs
63db6e8d
JG
194 *
195 * Run a function on one processor.
196 *
39ce010d
HC
197 * You must not call this function with disabled interrupts, from a
198 * hardware interrupt handler or from a bottom half.
63db6e8d 199 */
3bb447fc
HC
200int smp_call_function_single(int cpu, void (*func) (void *info), void *info,
201 int nonatomic, int wait)
63db6e8d 202{
25864162 203 preempt_disable();
3bb447fc
HC
204 __smp_call_function_map(func, info, nonatomic, wait,
205 cpumask_of_cpu(cpu));
25864162 206 preempt_enable();
1da177e4
LT
207 return 0;
208}
3bb447fc 209EXPORT_SYMBOL(smp_call_function_single);
1da177e4 210
dab5209c
CO
211/**
212 * smp_call_function_mask(): Run a function on a set of other CPUs.
213 * @mask: The set of cpus to run on. Must not include the current cpu.
214 * @func: The function to run. This must be fast and non-blocking.
215 * @info: An arbitrary pointer to pass to the function.
216 * @wait: If true, wait (atomically) until function has completed on other CPUs.
217 *
218 * Returns 0 on success, else a negative status code.
219 *
220 * If @wait is true, then returns once @func has returned; otherwise
221 * it returns just before the target cpu calls @func.
222 *
223 * You must not call this function with disabled interrupts or from a
224 * hardware interrupt handler or from a bottom half handler.
225 */
37c5f719
HC
226int smp_call_function_mask(cpumask_t mask, void (*func)(void *), void *info,
227 int wait)
dab5209c
CO
228{
229 preempt_disable();
37c5f719 230 cpu_clear(smp_processor_id(), mask);
dab5209c
CO
231 __smp_call_function_map(func, info, 0, wait, mask);
232 preempt_enable();
233 return 0;
234}
235EXPORT_SYMBOL(smp_call_function_mask);
236
677d7623 237void smp_send_stop(void)
1da177e4 238{
39ce010d 239 int cpu, rc;
1da177e4 240
677d7623
HC
241 /* Disable all interrupts/machine checks */
242 __load_psw_mask(psw_kernel_bits & ~PSW_MASK_MCHECK);
1da177e4 243
677d7623
HC
244 /* write magic number to zero page (absolute 0) */
245 lowcore_ptr[smp_processor_id()]->panic_magic = __PANIC_MAGIC;
1da177e4 246
677d7623 247 /* stop all processors */
1da177e4
LT
248 for_each_online_cpu(cpu) {
249 if (cpu == smp_processor_id())
250 continue;
251 do {
677d7623 252 rc = signal_processor(cpu, sigp_stop);
39ce010d 253 } while (rc == sigp_busy);
1da177e4 254
39ce010d 255 while (!smp_cpu_not_running(cpu))
c6b5b847
HC
256 cpu_relax();
257 }
258}
259
1da177e4
LT
260/*
261 * This is the main routine where commands issued by other
262 * cpus are handled.
263 */
264
2b67fc46 265static void do_ext_call_interrupt(__u16 code)
1da177e4 266{
39ce010d 267 unsigned long bits;
1da177e4 268
39ce010d
HC
269 /*
270 * handle bit signal external calls
271 *
272 * For the ec_schedule signal we have to do nothing. All the work
273 * is done automatically when we return from the interrupt.
274 */
1da177e4
LT
275 bits = xchg(&S390_lowcore.ext_call_fast, 0);
276
39ce010d 277 if (test_bit(ec_call_function, &bits))
1da177e4
LT
278 do_call_function();
279}
280
281/*
282 * Send an external call sigp to another cpu and return without waiting
283 * for its completion.
284 */
285static void smp_ext_bitcall(int cpu, ec_bit_sig sig)
286{
39ce010d
HC
287 /*
288 * Set signaling bit in lowcore of target cpu and kick it
289 */
1da177e4 290 set_bit(sig, (unsigned long *) &lowcore_ptr[cpu]->ext_call_fast);
39ce010d 291 while (signal_processor(cpu, sigp_emergency_signal) == sigp_busy)
1da177e4
LT
292 udelay(10);
293}
294
347a8dc3 295#ifndef CONFIG_64BIT
1da177e4
LT
/*
 * Callback run on every cpu by smp_ptlb_all(): flush the local TLB.
 * The info argument is not used.
 */
void smp_ptlb_callback(void *info)
{
	__tlb_flush_local();
}
303
304void smp_ptlb_all(void)
305{
39ce010d 306 on_each_cpu(smp_ptlb_callback, NULL, 0, 1);
1da177e4
LT
307}
308EXPORT_SYMBOL(smp_ptlb_all);
347a8dc3 309#endif /* ! CONFIG_64BIT */
1da177e4
LT
310
311/*
312 * this function sends a 'reschedule' IPI to another CPU.
313 * it goes straight through and wastes no time serializing
314 * anything. Worst case is that we lose a reschedule ...
315 */
316void smp_send_reschedule(int cpu)
317{
39ce010d 318 smp_ext_bitcall(cpu, ec_schedule);
1da177e4
LT
319}
320
/*
 * Parameter area for the set/clear control bit callbacks: one and-mask
 * and one or-mask for each of the 16 control registers.
 */
struct ec_creg_mask_parms {
	unsigned long orvals[16];	/* bits to set */
	unsigned long andvals[16];	/* bits to keep */
};
1da177e4
LT
328
329/*
330 * callback for setting/clearing control bits
331 */
39ce010d
HC
332static void smp_ctl_bit_callback(void *info)
333{
94c12cc7 334 struct ec_creg_mask_parms *pp = info;
1da177e4
LT
335 unsigned long cregs[16];
336 int i;
39ce010d 337
94c12cc7
MS
338 __ctl_store(cregs, 0, 15);
339 for (i = 0; i <= 15; i++)
1da177e4 340 cregs[i] = (cregs[i] & pp->andvals[i]) | pp->orvals[i];
94c12cc7 341 __ctl_load(cregs, 0, 15);
1da177e4
LT
342}
343
344/*
345 * Set a bit in a control register of all cpus
346 */
94c12cc7
MS
347void smp_ctl_set_bit(int cr, int bit)
348{
349 struct ec_creg_mask_parms parms;
1da177e4 350
94c12cc7
MS
351 memset(&parms.orvals, 0, sizeof(parms.orvals));
352 memset(&parms.andvals, 0xff, sizeof(parms.andvals));
1da177e4 353 parms.orvals[cr] = 1 << bit;
94c12cc7 354 on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
1da177e4 355}
39ce010d 356EXPORT_SYMBOL(smp_ctl_set_bit);
1da177e4
LT
357
358/*
359 * Clear a bit in a control register of all cpus
360 */
94c12cc7
MS
361void smp_ctl_clear_bit(int cr, int bit)
362{
363 struct ec_creg_mask_parms parms;
1da177e4 364
94c12cc7
MS
365 memset(&parms.orvals, 0, sizeof(parms.orvals));
366 memset(&parms.andvals, 0xff, sizeof(parms.andvals));
1da177e4 367 parms.andvals[cr] = ~(1L << bit);
94c12cc7 368 on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
1da177e4 369}
39ce010d 370EXPORT_SYMBOL(smp_ctl_clear_bit);
1da177e4 371
08d07968
HC
372/*
373 * In early ipl state a temporary logical cpu number is needed, so the sigp
374 * functions can be used to sense other cpus. Since NR_CPUS is >= 2 on
375 * CONFIG_SMP and the ipl cpu is logical cpu 0, it must be 1.
376 */
377#define CPU_INIT_NO 1
378
411ed322
MH
379#if defined(CONFIG_ZFCPDUMP) || defined(CONFIG_ZFCPDUMP_MODULE)
380
381/*
382 * zfcpdump_prefix_array holds prefix registers for the following scenario:
383 * 64 bit zfcpdump kernel and 31 bit kernel which is to be dumped. We have to
384 * save its prefix registers, since they get lost, when switching from 31 bit
385 * to 64 bit.
386 */
387unsigned int zfcpdump_prefix_array[NR_CPUS + 1] \
388 __attribute__((__section__(".data")));
389
285f6722 390static void __init smp_get_save_area(unsigned int cpu, unsigned int phy_cpu)
411ed322 391{
411ed322
MH
392 if (ipl_info.type != IPL_TYPE_FCP_DUMP)
393 return;
285f6722
HC
394 if (cpu >= NR_CPUS) {
395 printk(KERN_WARNING "Registers for cpu %i not saved since dump "
396 "kernel was compiled with NR_CPUS=%i\n", cpu, NR_CPUS);
397 return;
411ed322 398 }
48483b32 399 zfcpdump_save_areas[cpu] = kmalloc(sizeof(union save_area), GFP_KERNEL);
08d07968
HC
400 __cpu_logical_map[CPU_INIT_NO] = (__u16) phy_cpu;
401 while (signal_processor(CPU_INIT_NO, sigp_stop_and_store_status) ==
402 sigp_busy)
285f6722
HC
403 cpu_relax();
404 memcpy(zfcpdump_save_areas[cpu],
405 (void *)(unsigned long) store_prefix() + SAVE_AREA_BASE,
406 SAVE_AREA_SIZE);
407#ifdef CONFIG_64BIT
408 /* copy original prefix register */
409 zfcpdump_save_areas[cpu]->s390x.pref_reg = zfcpdump_prefix_array[cpu];
410#endif
411ed322
MH
411}
412
413union save_area *zfcpdump_save_areas[NR_CPUS + 1];
414EXPORT_SYMBOL_GPL(zfcpdump_save_areas);
415
416#else
285f6722
HC
417
/* Without zfcpdump support there is nothing to save. */
static inline void smp_get_save_area(unsigned int cpu, unsigned int phy_cpu)
{
}
419
420#endif /* CONFIG_ZFCPDUMP || CONFIG_ZFCPDUMP_MODULE */
411ed322 421
08d07968
HC
422static int cpu_stopped(int cpu)
423{
424 __u32 status;
425
426 /* Check for stopped state */
427 if (signal_processor_ps(&status, 0, cpu, sigp_sense) ==
428 sigp_status_stored) {
429 if (status & 0x40)
430 return 1;
431 }
432 return 0;
433}
434
08d07968
HC
435static int cpu_known(int cpu_id)
436{
437 int cpu;
438
439 for_each_present_cpu(cpu) {
440 if (__cpu_logical_map[cpu] == cpu_id)
441 return 1;
442 }
443 return 0;
444}
445
446static int smp_rescan_cpus_sigp(cpumask_t avail)
447{
448 int cpu_id, logical_cpu;
449
450 logical_cpu = first_cpu(avail);
451 if (logical_cpu == NR_CPUS)
452 return 0;
453 for (cpu_id = 0; cpu_id <= 65535; cpu_id++) {
454 if (cpu_known(cpu_id))
455 continue;
456 __cpu_logical_map[logical_cpu] = cpu_id;
457 if (!cpu_stopped(logical_cpu))
458 continue;
459 cpu_set(logical_cpu, cpu_present_map);
460 smp_cpu_state[logical_cpu] = CPU_STATE_CONFIGURED;
461 logical_cpu = next_cpu(logical_cpu, avail);
462 if (logical_cpu == NR_CPUS)
463 break;
464 }
465 return 0;
466}
467
48483b32 468static int smp_rescan_cpus_sclp(cpumask_t avail)
08d07968
HC
469{
470 struct sclp_cpu_info *info;
471 int cpu_id, logical_cpu, cpu;
472 int rc;
473
474 logical_cpu = first_cpu(avail);
475 if (logical_cpu == NR_CPUS)
476 return 0;
48483b32 477 info = kmalloc(sizeof(*info), GFP_KERNEL);
08d07968
HC
478 if (!info)
479 return -ENOMEM;
480 rc = sclp_get_cpu_info(info);
481 if (rc)
482 goto out;
483 for (cpu = 0; cpu < info->combined; cpu++) {
484 if (info->has_cpu_type && info->cpu[cpu].type != smp_cpu_type)
485 continue;
486 cpu_id = info->cpu[cpu].address;
487 if (cpu_known(cpu_id))
488 continue;
489 __cpu_logical_map[logical_cpu] = cpu_id;
490 cpu_set(logical_cpu, cpu_present_map);
491 if (cpu >= info->configured)
492 smp_cpu_state[logical_cpu] = CPU_STATE_STANDBY;
493 else
494 smp_cpu_state[logical_cpu] = CPU_STATE_CONFIGURED;
495 logical_cpu = next_cpu(logical_cpu, avail);
496 if (logical_cpu == NR_CPUS)
497 break;
498 }
499out:
48483b32 500 kfree(info);
08d07968
HC
501 return rc;
502}
503
504static int smp_rescan_cpus(void)
505{
506 cpumask_t avail;
507
48483b32 508 cpus_xor(avail, cpu_possible_map, cpu_present_map);
08d07968
HC
509 if (smp_use_sigp_detection)
510 return smp_rescan_cpus_sigp(avail);
511 else
512 return smp_rescan_cpus_sclp(avail);
1da177e4
LT
513}
514
48483b32
HC
515static void __init smp_detect_cpus(void)
516{
517 unsigned int cpu, c_cpus, s_cpus;
518 struct sclp_cpu_info *info;
519 u16 boot_cpu_addr, cpu_addr;
520
521 c_cpus = 1;
522 s_cpus = 0;
523 boot_cpu_addr = S390_lowcore.cpu_data.cpu_addr;
524 info = kmalloc(sizeof(*info), GFP_KERNEL);
525 if (!info)
526 panic("smp_detect_cpus failed to allocate memory\n");
527 /* Use sigp detection algorithm if sclp doesn't work. */
528 if (sclp_get_cpu_info(info)) {
529 smp_use_sigp_detection = 1;
530 for (cpu = 0; cpu <= 65535; cpu++) {
531 if (cpu == boot_cpu_addr)
532 continue;
533 __cpu_logical_map[CPU_INIT_NO] = cpu;
534 if (!cpu_stopped(CPU_INIT_NO))
535 continue;
536 smp_get_save_area(c_cpus, cpu);
537 c_cpus++;
538 }
539 goto out;
540 }
541
542 if (info->has_cpu_type) {
543 for (cpu = 0; cpu < info->combined; cpu++) {
544 if (info->cpu[cpu].address == boot_cpu_addr) {
545 smp_cpu_type = info->cpu[cpu].type;
546 break;
547 }
548 }
549 }
550
551 for (cpu = 0; cpu < info->combined; cpu++) {
552 if (info->has_cpu_type && info->cpu[cpu].type != smp_cpu_type)
553 continue;
554 cpu_addr = info->cpu[cpu].address;
555 if (cpu_addr == boot_cpu_addr)
556 continue;
557 __cpu_logical_map[CPU_INIT_NO] = cpu_addr;
558 if (!cpu_stopped(CPU_INIT_NO)) {
559 s_cpus++;
560 continue;
561 }
562 smp_get_save_area(c_cpus, cpu_addr);
563 c_cpus++;
564 }
565out:
566 kfree(info);
567 printk(KERN_INFO "CPUs: %d configured, %d standby\n", c_cpus, s_cpus);
9d40d2e3 568 get_online_cpus();
48483b32 569 smp_rescan_cpus();
9d40d2e3 570 put_online_cpus();
48483b32
HC
571}
572
1da177e4 573/*
39ce010d 574 * Activate a secondary processor.
1da177e4 575 */
ea1f4eec 576int __cpuinit start_secondary(void *cpuvoid)
1da177e4 577{
39ce010d
HC
578 /* Setup the cpu */
579 cpu_init();
5bfb5d69 580 preempt_disable();
d54853ef 581 /* Enable TOD clock interrupts on the secondary cpu. */
39ce010d 582 init_cpu_timer();
1da177e4 583#ifdef CONFIG_VIRT_TIMER
d54853ef 584 /* Enable cpu timer interrupts on the secondary cpu. */
39ce010d 585 init_cpu_vtimer();
1da177e4 586#endif
1da177e4 587 /* Enable pfault pseudo page faults on this cpu. */
29b08d2b
HC
588 pfault_init();
589
1da177e4
LT
590 /* Mark this cpu as online */
591 cpu_set(smp_processor_id(), cpu_online_map);
592 /* Switch on interrupts */
593 local_irq_enable();
39ce010d
HC
594 /* Print info about this processor */
595 print_cpu_info(&S390_lowcore.cpu_data);
596 /* cpu_idle will call schedule for us */
597 cpu_idle();
598 return 0;
1da177e4
LT
599}
600
601static void __init smp_create_idle(unsigned int cpu)
602{
603 struct task_struct *p;
604
605 /*
606 * don't care about the psw and regs settings since we'll never
607 * reschedule the forked task.
608 */
609 p = fork_idle(cpu);
610 if (IS_ERR(p))
611 panic("failed fork for CPU %u: %li", cpu, PTR_ERR(p));
612 current_set[cpu] = p;
fae8b22d 613 spin_lock_init(&(&per_cpu(s390_idle, cpu))->lock);
1da177e4
LT
614}
615
1cb6bb4b
HC
616static int __cpuinit smp_alloc_lowcore(int cpu)
617{
618 unsigned long async_stack, panic_stack;
619 struct _lowcore *lowcore;
620 int lc_order;
621
622 lc_order = sizeof(long) == 8 ? 1 : 0;
623 lowcore = (void *) __get_free_pages(GFP_KERNEL | GFP_DMA, lc_order);
624 if (!lowcore)
625 return -ENOMEM;
626 async_stack = __get_free_pages(GFP_KERNEL, ASYNC_ORDER);
1cb6bb4b 627 panic_stack = __get_free_page(GFP_KERNEL);
591bb4f6
HC
628 if (!panic_stack || !async_stack)
629 goto out;
98c7b388
HC
630 memcpy(lowcore, &S390_lowcore, 512);
631 memset((char *)lowcore + 512, 0, sizeof(*lowcore) - 512);
1cb6bb4b
HC
632 lowcore->async_stack = async_stack + ASYNC_SIZE;
633 lowcore->panic_stack = panic_stack + PAGE_SIZE;
634
635#ifndef CONFIG_64BIT
636 if (MACHINE_HAS_IEEE) {
637 unsigned long save_area;
638
639 save_area = get_zeroed_page(GFP_KERNEL);
640 if (!save_area)
641 goto out_save_area;
642 lowcore->extended_save_area_addr = (u32) save_area;
643 }
644#endif
645 lowcore_ptr[cpu] = lowcore;
646 return 0;
647
648#ifndef CONFIG_64BIT
649out_save_area:
650 free_page(panic_stack);
651#endif
591bb4f6 652out:
1cb6bb4b 653 free_pages(async_stack, ASYNC_ORDER);
1cb6bb4b
HC
654 free_pages((unsigned long) lowcore, lc_order);
655 return -ENOMEM;
656}
657
658#ifdef CONFIG_HOTPLUG_CPU
659static void smp_free_lowcore(int cpu)
660{
661 struct _lowcore *lowcore;
662 int lc_order;
663
664 lc_order = sizeof(long) == 8 ? 1 : 0;
665 lowcore = lowcore_ptr[cpu];
666#ifndef CONFIG_64BIT
667 if (MACHINE_HAS_IEEE)
668 free_page((unsigned long) lowcore->extended_save_area_addr);
669#endif
670 free_page(lowcore->panic_stack - PAGE_SIZE);
671 free_pages(lowcore->async_stack - ASYNC_SIZE, ASYNC_ORDER);
672 free_pages((unsigned long) lowcore, lc_order);
673 lowcore_ptr[cpu] = NULL;
674}
675#endif /* CONFIG_HOTPLUG_CPU */
676
1da177e4 677/* Upping and downing of CPUs */
1cb6bb4b 678int __cpuinit __cpu_up(unsigned int cpu)
1da177e4
LT
679{
680 struct task_struct *idle;
39ce010d 681 struct _lowcore *cpu_lowcore;
1da177e4 682 struct stack_frame *sf;
39ce010d 683 sigp_ccode ccode;
1da177e4 684
08d07968
HC
685 if (smp_cpu_state[cpu] != CPU_STATE_CONFIGURED)
686 return -EIO;
1cb6bb4b
HC
687 if (smp_alloc_lowcore(cpu))
688 return -ENOMEM;
1da177e4
LT
689
690 ccode = signal_processor_p((__u32)(unsigned long)(lowcore_ptr[cpu]),
691 cpu, sigp_set_prefix);
39ce010d 692 if (ccode) {
1da177e4
LT
693 printk("sigp_set_prefix failed for cpu %d "
694 "with condition code %d\n",
695 (int) cpu, (int) ccode);
696 return -EIO;
697 }
698
699 idle = current_set[cpu];
39ce010d 700 cpu_lowcore = lowcore_ptr[cpu];
1da177e4 701 cpu_lowcore->kernel_stack = (unsigned long)
39ce010d 702 task_stack_page(idle) + THREAD_SIZE;
1cb6bb4b 703 cpu_lowcore->thread_info = (unsigned long) task_thread_info(idle);
1da177e4
LT
704 sf = (struct stack_frame *) (cpu_lowcore->kernel_stack
705 - sizeof(struct pt_regs)
706 - sizeof(struct stack_frame));
707 memset(sf, 0, sizeof(struct stack_frame));
708 sf->gprs[9] = (unsigned long) sf;
709 cpu_lowcore->save_area[15] = (unsigned long) sf;
710 __ctl_store(cpu_lowcore->cregs_save_area[0], 0, 15);
94c12cc7
MS
711 asm volatile(
712 " stam 0,15,0(%0)"
713 : : "a" (&cpu_lowcore->access_regs_save_area) : "memory");
1da177e4 714 cpu_lowcore->percpu_offset = __per_cpu_offset[cpu];
39ce010d
HC
715 cpu_lowcore->current_task = (unsigned long) idle;
716 cpu_lowcore->cpu_data.cpu_nr = cpu;
591bb4f6
HC
717 cpu_lowcore->kernel_asce = S390_lowcore.kernel_asce;
718 cpu_lowcore->ipl_device = S390_lowcore.ipl_device;
1da177e4 719 eieio();
699ff13f 720
39ce010d 721 while (signal_processor(cpu, sigp_restart) == sigp_busy)
699ff13f 722 udelay(10);
1da177e4
LT
723
724 while (!cpu_online(cpu))
725 cpu_relax();
726 return 0;
727}
728
48483b32 729static int __init setup_possible_cpus(char *s)
255acee7 730{
48483b32 731 int pcpus, cpu;
255acee7 732
48483b32
HC
733 pcpus = simple_strtoul(s, NULL, 0);
734 cpu_possible_map = cpumask_of_cpu(0);
735 for (cpu = 1; cpu < pcpus && cpu < NR_CPUS; cpu++)
255acee7 736 cpu_set(cpu, cpu_possible_map);
37a33026
HC
737 return 0;
738}
739early_param("possible_cpus", setup_possible_cpus);
740
48483b32
HC
741#ifdef CONFIG_HOTPLUG_CPU
742
39ce010d 743int __cpu_disable(void)
1da177e4 744{
94c12cc7 745 struct ec_creg_mask_parms cr_parms;
f3705136 746 int cpu = smp_processor_id();
1da177e4 747
f3705136 748 cpu_clear(cpu, cpu_online_map);
1da177e4 749
1da177e4 750 /* Disable pfault pseudo page faults on this cpu. */
29b08d2b 751 pfault_fini();
1da177e4 752
94c12cc7
MS
753 memset(&cr_parms.orvals, 0, sizeof(cr_parms.orvals));
754 memset(&cr_parms.andvals, 0xff, sizeof(cr_parms.andvals));
1da177e4 755
94c12cc7 756 /* disable all external interrupts */
1da177e4 757 cr_parms.orvals[0] = 0;
39ce010d
HC
758 cr_parms.andvals[0] = ~(1 << 15 | 1 << 14 | 1 << 13 | 1 << 12 |
759 1 << 11 | 1 << 10 | 1 << 6 | 1 << 4);
1da177e4 760 /* disable all I/O interrupts */
1da177e4 761 cr_parms.orvals[6] = 0;
39ce010d
HC
762 cr_parms.andvals[6] = ~(1 << 31 | 1 << 30 | 1 << 29 | 1 << 28 |
763 1 << 27 | 1 << 26 | 1 << 25 | 1 << 24);
1da177e4 764 /* disable most machine checks */
1da177e4 765 cr_parms.orvals[14] = 0;
39ce010d
HC
766 cr_parms.andvals[14] = ~(1 << 28 | 1 << 27 | 1 << 26 |
767 1 << 25 | 1 << 24);
94c12cc7 768
1da177e4
LT
769 smp_ctl_bit_callback(&cr_parms);
770
1da177e4
LT
771 return 0;
772}
773
39ce010d 774void __cpu_die(unsigned int cpu)
1da177e4
LT
775{
776 /* Wait until target cpu is down */
777 while (!smp_cpu_not_running(cpu))
778 cpu_relax();
1cb6bb4b 779 smp_free_lowcore(cpu);
08d07968 780 printk(KERN_INFO "Processor %d spun down\n", cpu);
1da177e4
LT
781}
782
39ce010d 783void cpu_die(void)
1da177e4
LT
784{
785 idle_task_exit();
786 signal_processor(smp_processor_id(), sigp_stop);
787 BUG();
39ce010d 788 for (;;);
1da177e4
LT
789}
790
255acee7
HC
791#endif /* CONFIG_HOTPLUG_CPU */
792
1da177e4
LT
793void __init smp_prepare_cpus(unsigned int max_cpus)
794{
591bb4f6
HC
795#ifndef CONFIG_64BIT
796 unsigned long save_area = 0;
797#endif
798 unsigned long async_stack, panic_stack;
799 struct _lowcore *lowcore;
1da177e4 800 unsigned int cpu;
591bb4f6 801 int lc_order;
39ce010d 802
48483b32
HC
803 smp_detect_cpus();
804
39ce010d
HC
805 /* request the 0x1201 emergency signal external interrupt */
806 if (register_external_interrupt(0x1201, do_ext_call_interrupt) != 0)
807 panic("Couldn't request external interrupt 0x1201");
1da177e4
LT
808 print_cpu_info(&S390_lowcore.cpu_data);
809
591bb4f6
HC
810 /* Reallocate current lowcore, but keep its contents. */
811 lc_order = sizeof(long) == 8 ? 1 : 0;
812 lowcore = (void *) __get_free_pages(GFP_KERNEL | GFP_DMA, lc_order);
813 panic_stack = __get_free_page(GFP_KERNEL);
814 async_stack = __get_free_pages(GFP_KERNEL, ASYNC_ORDER);
347a8dc3 815#ifndef CONFIG_64BIT
77fa2245 816 if (MACHINE_HAS_IEEE)
591bb4f6 817 save_area = get_zeroed_page(GFP_KERNEL);
77fa2245 818#endif
591bb4f6
HC
819 local_irq_disable();
820 local_mcck_disable();
821 lowcore_ptr[smp_processor_id()] = lowcore;
822 *lowcore = S390_lowcore;
823 lowcore->panic_stack = panic_stack + PAGE_SIZE;
824 lowcore->async_stack = async_stack + ASYNC_SIZE;
825#ifndef CONFIG_64BIT
826 if (MACHINE_HAS_IEEE)
827 lowcore->extended_save_area_addr = (u32) save_area;
828#endif
829 set_prefix((u32)(unsigned long) lowcore);
830 local_mcck_enable();
831 local_irq_enable();
97db7fbf 832 for_each_possible_cpu(cpu)
1da177e4
LT
833 if (cpu != smp_processor_id())
834 smp_create_idle(cpu);
835}
836
ea1f4eec 837void __init smp_prepare_boot_cpu(void)
1da177e4
LT
838{
839 BUG_ON(smp_processor_id() != 0);
840
48483b32
HC
841 current_thread_info()->cpu = 0;
842 cpu_set(0, cpu_present_map);
1da177e4 843 cpu_set(0, cpu_online_map);
1da177e4
LT
844 S390_lowcore.percpu_offset = __per_cpu_offset[0];
845 current_set[0] = current;
08d07968 846 smp_cpu_state[0] = CPU_STATE_CONFIGURED;
fae8b22d 847 spin_lock_init(&(&__get_cpu_var(s390_idle))->lock);
1da177e4
LT
848}
849
ea1f4eec 850void __init smp_cpus_done(unsigned int max_cpus)
1da177e4 851{
1da177e4
LT
852}
853
/*
 * The frequency of the profiling timer can be changed by writing a
 * multiplier value into /proc/profile. This implementation ignores the
 * multiplier and always reports success (0).
 */
int setup_profiling_timer(unsigned int multiplier)
{
	(void) multiplier;
	return 0;
}
864
08d07968
HC
865#ifdef CONFIG_HOTPLUG_CPU
866static ssize_t cpu_configure_show(struct sys_device *dev, char *buf)
867{
868 ssize_t count;
869
870 mutex_lock(&smp_cpu_state_mutex);
871 count = sprintf(buf, "%d\n", smp_cpu_state[dev->id]);
872 mutex_unlock(&smp_cpu_state_mutex);
873 return count;
874}
875
876static ssize_t cpu_configure_store(struct sys_device *dev, const char *buf,
877 size_t count)
878{
879 int cpu = dev->id;
880 int val, rc;
881 char delim;
882
883 if (sscanf(buf, "%d %c", &val, &delim) != 1)
884 return -EINVAL;
885 if (val != 0 && val != 1)
886 return -EINVAL;
887
888 mutex_lock(&smp_cpu_state_mutex);
9d40d2e3 889 get_online_cpus();
08d07968
HC
890 rc = -EBUSY;
891 if (cpu_online(cpu))
892 goto out;
893 rc = 0;
894 switch (val) {
895 case 0:
896 if (smp_cpu_state[cpu] == CPU_STATE_CONFIGURED) {
897 rc = sclp_cpu_deconfigure(__cpu_logical_map[cpu]);
898 if (!rc)
899 smp_cpu_state[cpu] = CPU_STATE_STANDBY;
900 }
901 break;
902 case 1:
903 if (smp_cpu_state[cpu] == CPU_STATE_STANDBY) {
904 rc = sclp_cpu_configure(__cpu_logical_map[cpu]);
905 if (!rc)
906 smp_cpu_state[cpu] = CPU_STATE_CONFIGURED;
907 }
908 break;
909 default:
910 break;
911 }
912out:
9d40d2e3 913 put_online_cpus();
08d07968
HC
914 mutex_unlock(&smp_cpu_state_mutex);
915 return rc ? rc : count;
916}
917static SYSDEV_ATTR(configure, 0644, cpu_configure_show, cpu_configure_store);
918#endif /* CONFIG_HOTPLUG_CPU */
919
920static ssize_t show_cpu_address(struct sys_device *dev, char *buf)
921{
922 return sprintf(buf, "%d\n", __cpu_logical_map[dev->id]);
923}
924static SYSDEV_ATTR(address, 0444, show_cpu_address, NULL);
925
926
927static struct attribute *cpu_common_attrs[] = {
928#ifdef CONFIG_HOTPLUG_CPU
929 &attr_configure.attr,
930#endif
931 &attr_address.attr,
932 NULL,
933};
934
935static struct attribute_group cpu_common_attr_group = {
936 .attrs = cpu_common_attrs,
937};
1da177e4 938
2fc2d1e9
HC
939static ssize_t show_capability(struct sys_device *dev, char *buf)
940{
941 unsigned int capability;
942 int rc;
943
944 rc = get_cpu_capability(&capability);
945 if (rc)
946 return rc;
947 return sprintf(buf, "%u\n", capability);
948}
949static SYSDEV_ATTR(capability, 0444, show_capability, NULL);
950
fae8b22d
HC
951static ssize_t show_idle_count(struct sys_device *dev, char *buf)
952{
953 struct s390_idle_data *idle;
954 unsigned long long idle_count;
955
956 idle = &per_cpu(s390_idle, dev->id);
957 spin_lock_irq(&idle->lock);
958 idle_count = idle->idle_count;
959 spin_unlock_irq(&idle->lock);
960 return sprintf(buf, "%llu\n", idle_count);
961}
962static SYSDEV_ATTR(idle_count, 0444, show_idle_count, NULL);
963
964static ssize_t show_idle_time(struct sys_device *dev, char *buf)
965{
966 struct s390_idle_data *idle;
967 unsigned long long new_time;
968
969 idle = &per_cpu(s390_idle, dev->id);
970 spin_lock_irq(&idle->lock);
971 if (idle->in_idle) {
972 new_time = get_clock();
973 idle->idle_time += new_time - idle->idle_enter;
974 idle->idle_enter = new_time;
975 }
976 new_time = idle->idle_time;
977 spin_unlock_irq(&idle->lock);
69d39d66 978 return sprintf(buf, "%llu\n", new_time >> 12);
fae8b22d 979}
69d39d66 980static SYSDEV_ATTR(idle_time_us, 0444, show_idle_time, NULL);
fae8b22d 981
08d07968 982static struct attribute *cpu_online_attrs[] = {
fae8b22d
HC
983 &attr_capability.attr,
984 &attr_idle_count.attr,
69d39d66 985 &attr_idle_time_us.attr,
fae8b22d
HC
986 NULL,
987};
988
08d07968
HC
989static struct attribute_group cpu_online_attr_group = {
990 .attrs = cpu_online_attrs,
fae8b22d
HC
991};
992
2fc2d1e9
HC
993static int __cpuinit smp_cpu_notify(struct notifier_block *self,
994 unsigned long action, void *hcpu)
995{
996 unsigned int cpu = (unsigned int)(long)hcpu;
997 struct cpu *c = &per_cpu(cpu_devices, cpu);
998 struct sys_device *s = &c->sysdev;
fae8b22d 999 struct s390_idle_data *idle;
2fc2d1e9
HC
1000
1001 switch (action) {
1002 case CPU_ONLINE:
8bb78442 1003 case CPU_ONLINE_FROZEN:
fae8b22d
HC
1004 idle = &per_cpu(s390_idle, cpu);
1005 spin_lock_irq(&idle->lock);
1006 idle->idle_enter = 0;
1007 idle->idle_time = 0;
1008 idle->idle_count = 0;
1009 spin_unlock_irq(&idle->lock);
08d07968 1010 if (sysfs_create_group(&s->kobj, &cpu_online_attr_group))
2fc2d1e9
HC
1011 return NOTIFY_BAD;
1012 break;
1013 case CPU_DEAD:
8bb78442 1014 case CPU_DEAD_FROZEN:
08d07968 1015 sysfs_remove_group(&s->kobj, &cpu_online_attr_group);
2fc2d1e9
HC
1016 break;
1017 }
1018 return NOTIFY_OK;
1019}
1020
1021static struct notifier_block __cpuinitdata smp_cpu_nb = {
39ce010d 1022 .notifier_call = smp_cpu_notify,
2fc2d1e9
HC
1023};
1024
2bc89b5e 1025static int __devinit smp_add_present_cpu(int cpu)
08d07968
HC
1026{
1027 struct cpu *c = &per_cpu(cpu_devices, cpu);
1028 struct sys_device *s = &c->sysdev;
1029 int rc;
1030
1031 c->hotpluggable = 1;
1032 rc = register_cpu(c, cpu);
1033 if (rc)
1034 goto out;
1035 rc = sysfs_create_group(&s->kobj, &cpu_common_attr_group);
1036 if (rc)
1037 goto out_cpu;
1038 if (!cpu_online(cpu))
1039 goto out;
1040 rc = sysfs_create_group(&s->kobj, &cpu_online_attr_group);
1041 if (!rc)
1042 return 0;
1043 sysfs_remove_group(&s->kobj, &cpu_common_attr_group);
1044out_cpu:
1045#ifdef CONFIG_HOTPLUG_CPU
1046 unregister_cpu(c);
1047#endif
1048out:
1049 return rc;
1050}
1051
1052#ifdef CONFIG_HOTPLUG_CPU
2bc89b5e
HC
1053static ssize_t __ref rescan_store(struct sys_device *dev,
1054 const char *buf, size_t count)
08d07968
HC
1055{
1056 cpumask_t newcpus;
1057 int cpu;
1058 int rc;
1059
1060 mutex_lock(&smp_cpu_state_mutex);
9d40d2e3 1061 get_online_cpus();
08d07968
HC
1062 newcpus = cpu_present_map;
1063 rc = smp_rescan_cpus();
1064 if (rc)
1065 goto out;
1066 cpus_andnot(newcpus, cpu_present_map, newcpus);
1067 for_each_cpu_mask(cpu, newcpus) {
1068 rc = smp_add_present_cpu(cpu);
1069 if (rc)
1070 cpu_clear(cpu, cpu_present_map);
1071 }
1072 rc = 0;
1073out:
9d40d2e3 1074 put_online_cpus();
08d07968
HC
1075 mutex_unlock(&smp_cpu_state_mutex);
1076 return rc ? rc : count;
1077}
1078static SYSDEV_ATTR(rescan, 0200, NULL, rescan_store);
1079#endif /* CONFIG_HOTPLUG_CPU */
1080
1da177e4
LT
1081static int __init topology_init(void)
1082{
1083 int cpu;
fae8b22d 1084 int rc;
2fc2d1e9
HC
1085
1086 register_cpu_notifier(&smp_cpu_nb);
1da177e4 1087
08d07968
HC
1088#ifdef CONFIG_HOTPLUG_CPU
1089 rc = sysfs_create_file(&cpu_sysdev_class.kset.kobj,
1090 &attr_rescan.attr);
1091 if (rc)
1092 return rc;
1093#endif
1094 for_each_present_cpu(cpu) {
1095 rc = smp_add_present_cpu(cpu);
fae8b22d
HC
1096 if (rc)
1097 return rc;
1da177e4
LT
1098 }
1099 return 0;
1100}
1da177e4 1101subsys_initcall(topology_init);