smp.c 19.2 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3
/*
 *  arch/s390/kernel/smp.c
 *
 *    Copyright IBM Corp. 1999,2007
 *    Author(s): Denis Joseph Barrow (djbarrow@de.ibm.com,barrow_dj@yahoo.com),
 *		 Martin Schwidefsky (schwidefsky@de.ibm.com)
 *		 Heiko Carstens (heiko.carstens@de.ibm.com)
 *
 *  based on other smp stuff by
 *    (c) 1995 Alan Cox, CymruNET Ltd  <alan@cymru.net>
 *    (c) 1998 Ingo Molnar
 *
 * We work with logical cpu numbering everywhere we can. The only
 * functions using the real cpu address (got from STAP) are the sigp
 * functions. For all other functions we use the identity mapping.
 * That means that cpu_number_map[i] == i for every cpu. cpu_number_map is
 * used e.g. to find the idle task belonging to a logical cpu. Every array
 * in the kernel is sorted by the logical cpu number and not by the physical
 * one which is causing all the confusion with __cpu_logical_map and
 * cpu_number_map in other architectures.
 */

#include <linux/module.h>
#include <linux/init.h>
#include <linux/mm.h>
#include <linux/spinlock.h>
#include <linux/kernel_stat.h>
#include <linux/delay.h>
#include <linux/cache.h>
#include <linux/interrupt.h>
#include <linux/cpu.h>
32
#include <linux/timex.h>
M
Michael Holzheu 已提交
33
#include <linux/bootmem.h>
M
Michael Holzheu 已提交
34
#include <asm/ipl.h>
35
#include <asm/setup.h>
L
Linus Torvalds 已提交
36 37 38 39 40 41
#include <asm/sigp.h>
#include <asm/pgalloc.h>
#include <asm/irq.h>
#include <asm/s390_ext.h>
#include <asm/cpcmd.h>
#include <asm/tlbflush.h>
42
#include <asm/timer.h>
M
Michael Holzheu 已提交
43
#include <asm/lowcore.h>
L
Linus Torvalds 已提交
44 45 46 47 48

/*
 * An array with a pointer to the lowcore of every CPU.
 */
struct _lowcore *lowcore_ptr[NR_CPUS];
49
EXPORT_SYMBOL(lowcore_ptr);
L
Linus Torvalds 已提交
50

51
cpumask_t cpu_online_map = CPU_MASK_NONE;
52 53
EXPORT_SYMBOL(cpu_online_map);

54
cpumask_t cpu_possible_map = CPU_MASK_NONE;
55
EXPORT_SYMBOL(cpu_possible_map);
L
Linus Torvalds 已提交
56 57 58 59 60 61

static struct task_struct *current_set[NR_CPUS];

static void smp_ext_bitcall(int, ec_bit_sig);

/*
 * Structure and data for __smp_call_function_map(). This is designed to
 * minimise static memory requirements. It also looks cleaner.
 */
static DEFINE_SPINLOCK(call_lock);

struct call_data_struct {
	void (*func) (void *info);
	void *info;
J
Jan Glauber 已提交
70 71
	cpumask_t started;
	cpumask_t finished;
L
Linus Torvalds 已提交
72 73 74
	int wait;
};

75
static struct call_data_struct *call_data;
L
Linus Torvalds 已提交
76 77 78 79 80 81 82 83 84 85

/*
 * 'Call function' interrupt callback
 *
 * Runs the function published through call_data on the current cpu and
 * records progress in the started/finished cpu masks.
 */
static void do_call_function(void)
{
	/*
	 * Copy everything out of call_data before setting our bit in
	 * 'started': the structure lives on the initiator's stack and the
	 * initiator only keeps waiting (for 'finished') when wait is set.
	 */
	void (*func) (void *info) = call_data->func;
	void *info = call_data->info;
	int wait = call_data->wait;

	cpu_set(smp_processor_id(), call_data->started);
	(*func)(info);
	if (wait)
		cpu_set(smp_processor_id(), call_data->finished);
}

J
Jan Glauber 已提交
92 93
/*
 * __smp_call_function_map:
 * @func: the function to run
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait until func has completed on the other cpus
 * @map: cpus on which func should run
 *
 * Runs func on every online cpu contained in map. Remote cpus are kicked
 * with an ec_call_function bit call while call_lock is held; the caller
 * spins until every remote cpu has started (and, if wait is set, finished)
 * the call. If the calling cpu itself is part of map, func is run locally
 * with interrupts disabled after the remote cpus have been handled.
 */
static void __smp_call_function_map(void (*func) (void *info), void *info,
				    int nonatomic, int wait, cpumask_t map)
{
	struct call_data_struct data;
	int cpu, local = 0;

	/*
	 * Can deadlock when interrupts are disabled or if in wrong context.
	 */
	WARN_ON(irqs_disabled() || in_irq());

	/*
	 * Check for local function call. We have to have the same call order
	 * as in on_each_cpu() because of machine_restart_smp().
	 */
	if (cpu_isset(smp_processor_id(), map)) {
		local = 1;
		cpu_clear(smp_processor_id(), map);
	}

	/* Only online cpus can answer; nothing to signal if none is left. */
	cpus_and(map, map, cpu_online_map);
	if (cpus_empty(map))
		goto out;

	data.func = func;
	data.info = info;
	data.started = CPU_MASK_NONE;
	data.wait = wait;
	if (wait)
		data.finished = CPU_MASK_NONE;

	spin_lock_bh(&call_lock);
	call_data = &data;

	for_each_cpu_mask(cpu, map)
		smp_ext_bitcall(cpu, ec_call_function);

	/* Wait for response */
	while (!cpus_equal(map, data.started))
		cpu_relax();

	if (wait)
		while (!cpus_equal(map, data.finished))
			cpu_relax();

	spin_unlock_bh(&call_lock);

out:
	local_irq_disable();
	if (local)
		func(info);
	local_irq_enable();
}

/*
J
Jan Glauber 已提交
147 148 149 150 151
 * smp_call_function:
 * @func: the function to run; this must be fast and non-blocking
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait (atomically) until function has completed on other CPUs
L
Linus Torvalds 已提交
152
 *
J
Jan Glauber 已提交
153
 * Run a function on all other CPUs.
L
Linus Torvalds 已提交
154
 *
155 156
 * You must not call this function with disabled interrupts, from a
 * hardware interrupt handler or from a bottom half.
L
Linus Torvalds 已提交
157
 */
J
Jan Glauber 已提交
158 159
int smp_call_function(void (*func) (void *info), void *info, int nonatomic,
		      int wait)
L
Linus Torvalds 已提交
160
{
J
Jan Glauber 已提交
161
	cpumask_t map;
L
Linus Torvalds 已提交
162

163
	preempt_disable();
J
Jan Glauber 已提交
164 165 166
	map = cpu_online_map;
	cpu_clear(smp_processor_id(), map);
	__smp_call_function_map(func, info, nonatomic, wait, map);
167
	preempt_enable();
J
Jan Glauber 已提交
168 169 170
	return 0;
}
EXPORT_SYMBOL(smp_call_function);
L
Linus Torvalds 已提交
171

J
Jan Glauber 已提交
172 173 174 175 176 177 178 179 180 181
/*
 * smp_call_function_on:
 * @func: the function to run; this must be fast and non-blocking
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait (atomically) until function has completed on other CPUs
 * @cpu: the CPU where func should run
 *
 * Run a function on one processor.
 *
182 183
 * You must not call this function with disabled interrupts, from a
 * hardware interrupt handler or from a bottom half.
J
Jan Glauber 已提交
184 185
 */
int smp_call_function_on(void (*func) (void *info), void *info, int nonatomic,
186
			 int wait, int cpu)
J
Jan Glauber 已提交
187 188
{
	cpumask_t map = CPU_MASK_NONE;
L
Linus Torvalds 已提交
189

190
	preempt_disable();
J
Jan Glauber 已提交
191 192
	cpu_set(cpu, map);
	__smp_call_function_map(func, info, nonatomic, wait, map);
193
	preempt_enable();
L
Linus Torvalds 已提交
194 195 196 197
	return 0;
}
EXPORT_SYMBOL(smp_call_function_on);

198
static void do_send_stop(void)
L
Linus Torvalds 已提交
199
{
200
	int cpu, rc;
L
Linus Torvalds 已提交
201

202
	/* stop all processors */
L
Linus Torvalds 已提交
203 204 205 206 207 208 209 210 211
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		do {
			rc = signal_processor(cpu, sigp_stop);
		} while (rc == sigp_busy);
	}
}

212
static void do_store_status(void)
L
Linus Torvalds 已提交
213
{
214
	int cpu, rc;
L
Linus Torvalds 已提交
215

216
	/* store status of all processors in their lowcores (real 0) */
L
Linus Torvalds 已提交
217 218 219 220 221 222 223
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		do {
			rc = signal_processor_p(
				(__u32)(unsigned long) lowcore_ptr[cpu], cpu,
				sigp_store_status_at_address);
224 225
		} while (rc == sigp_busy);
	}
L
Linus Torvalds 已提交
226 227
}

228
static void do_wait_for_stop(void)
H
Heiko Carstens 已提交
229 230 231 232 233 234 235
{
	int cpu;

	/* Wait for all other cpus to enter stopped state */
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
236
		while (!smp_cpu_not_running(cpu))
H
Heiko Carstens 已提交
237 238 239 240
			cpu_relax();
	}
}

L
Linus Torvalds 已提交
241 242 243 244 245 246
/*
 * this function sends a 'stop' sigp to all other CPUs in the system.
 * it goes straight through.
 */
void smp_send_stop(void)
{
H
Heiko Carstens 已提交
247
	/* Disable all interrupts/machine checks */
G
Gerald Schaefer 已提交
248
	__load_psw_mask(psw_kernel_bits & ~PSW_MASK_MCHECK);
H
Heiko Carstens 已提交
249

250
	/* write magic number to zero page (absolute 0) */
L
Linus Torvalds 已提交
251 252 253 254 255
	lowcore_ptr[smp_processor_id()]->panic_magic = __PANIC_MAGIC;

	/* stop other processors. */
	do_send_stop();

H
Heiko Carstens 已提交
256 257 258
	/* wait until other processors are stopped */
	do_wait_for_stop();

L
Linus Torvalds 已提交
259 260 261 262 263 264 265
	/* store status of other processors. */
	do_store_status();
}

/*
 * Reboot, halt and power_off routines for SMP.
 */
266
/*
 * Restart the machine: stop all other cpus, then re-ipl via do_reipl().
 * The string argument is not used.
 */
void machine_restart_smp(char *__unused)
{
	smp_send_stop();
	do_reipl();
}

/*
 * Halt the machine: stop all other cpus, issue vmhalt_cmd through
 * __cpcmd() when running under VM and a command is configured, then stop
 * the calling cpu with sigp_stop_and_store_status.
 */
void machine_halt_smp(void)
{
	smp_send_stop();
	if (MACHINE_IS_VM && strlen(vmhalt_cmd) > 0)
		__cpcmd(vmhalt_cmd, NULL, 0, NULL);
	signal_processor(smp_processor_id(), sigp_stop_and_store_status);
	/* Spin in case execution continues past the stop order. */
	for (;;);
}

/*
 * Power off the machine: stop all other cpus, issue vmpoff_cmd through
 * __cpcmd() when running under VM and a command is configured, then stop
 * the calling cpu with sigp_stop_and_store_status.
 */
void machine_power_off_smp(void)
{
	smp_send_stop();
	if (MACHINE_IS_VM && strlen(vmpoff_cmd) > 0)
		__cpcmd(vmpoff_cmd, NULL, 0, NULL);
	signal_processor(smp_processor_id(), sigp_stop_and_store_status);
	/* Spin in case execution continues past the stop order. */
	for (;;);
}

/*
 * This is the main routine where commands issued by other
 * cpus are handled.
 */

295
/*
 * External interrupt handler for bit signal calls; registered for
 * external interrupt code 0x1201 in smp_prepare_cpus().
 * @code: interrupt code (not used here)
 */
static void do_ext_call_interrupt(__u16 code)
{
	unsigned long bits;

	/*
	 * handle bit signal external calls
	 *
	 * For the ec_schedule signal we have to do nothing. All the work
	 * is done automatically when we return from the interrupt.
	 */
	/* Fetch and clear all pending signal bits in one atomic exchange. */
	bits = xchg(&S390_lowcore.ext_call_fast, 0);

	if (test_bit(ec_call_function, &bits))
		do_call_function();
}

/*
 * Send an external call sigp to another cpu and return without waiting
 * for its completion.
 * @cpu: target cpu
 * @sig: signal bit to set in the target's lowcore ext_call_fast word
 *
 * The target is kicked with a sigp_emergency_signal order, which is
 * retried every 10 microseconds while it is answered with sigp_busy.
 */
static void smp_ext_bitcall(int cpu, ec_bit_sig sig)
{
	/*
	 * Set signaling bit in lowcore of target cpu and kick it
	 */
	set_bit(sig, (unsigned long *) &lowcore_ptr[cpu]->ext_call_fast);
	while (signal_processor(cpu, sigp_emergency_signal) == sigp_busy)
		udelay(10);
}

325
#ifndef CONFIG_64BIT
L
Linus Torvalds 已提交
326 327 328 329 330 331 332 333 334 335
/*
 * Callback used by smp_ptlb_all(): calls local_flush_tlb() on the cpu it
 * is executed on.
 * @info: not used
 */
void smp_ptlb_callback(void *info)
{
	local_flush_tlb();
}

void smp_ptlb_all(void)
{
336
	on_each_cpu(smp_ptlb_callback, NULL, 0, 1);
L
Linus Torvalds 已提交
337 338
}
EXPORT_SYMBOL(smp_ptlb_all);
339
#endif /* ! CONFIG_64BIT */
L
Linus Torvalds 已提交
340 341 342 343 344 345 346 347

/*
 * this function sends a 'reschedule' IPI to another CPU.
 * it goes straight through and wastes no time serializing
 * anything. Worst case is that we lose a reschedule ...
 */
void smp_send_reschedule(int cpu)
{
348
	smp_ext_bitcall(cpu, ec_schedule);
L
Linus Torvalds 已提交
349 350 351 352 353
}

/*
 * parameter area for the set/clear control bit callbacks
 */
354
/*
 * Per control register masks consumed by smp_ctl_bit_callback():
 * new value = (old value & andvals[i]) | orvals[i] for registers 0..15.
 */
struct ec_creg_mask_parms {
	unsigned long orvals[16];	/* bits to set */
	unsigned long andvals[16];	/* bits to keep (cleared bits get reset) */
};
L
Linus Torvalds 已提交
358 359 360 361

/*
 * callback for setting/clearing control bits
 */
362 363
static void smp_ctl_bit_callback(void *info)
{
364
	struct ec_creg_mask_parms *pp = info;
L
Linus Torvalds 已提交
365 366
	unsigned long cregs[16];
	int i;
367

368 369
	__ctl_store(cregs, 0, 15);
	for (i = 0; i <= 15; i++)
L
Linus Torvalds 已提交
370
		cregs[i] = (cregs[i] & pp->andvals[i]) | pp->orvals[i];
371
	__ctl_load(cregs, 0, 15);
L
Linus Torvalds 已提交
372 373 374 375 376
}

/*
 * Set a bit in a control register of all cpus
 */
377 378 379
void smp_ctl_set_bit(int cr, int bit)
{
	struct ec_creg_mask_parms parms;
L
Linus Torvalds 已提交
380

381 382
	memset(&parms.orvals, 0, sizeof(parms.orvals));
	memset(&parms.andvals, 0xff, sizeof(parms.andvals));
L
Linus Torvalds 已提交
383
	parms.orvals[cr] = 1 << bit;
384
	on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
L
Linus Torvalds 已提交
385
}
386
EXPORT_SYMBOL(smp_ctl_set_bit);
L
Linus Torvalds 已提交
387 388 389 390

/*
 * Clear a bit in a control register of all cpus
 */
391 392 393
void smp_ctl_clear_bit(int cr, int bit)
{
	struct ec_creg_mask_parms parms;
L
Linus Torvalds 已提交
394

395 396
	memset(&parms.orvals, 0, sizeof(parms.orvals));
	memset(&parms.andvals, 0xff, sizeof(parms.andvals));
L
Linus Torvalds 已提交
397
	parms.andvals[cr] = ~(1L << bit);
398
	on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
L
Linus Torvalds 已提交
399
}
400
EXPORT_SYMBOL(smp_ctl_clear_bit);
L
Linus Torvalds 已提交
401

M
Michael Holzheu 已提交
402 403 404 405 406 407 408 409 410 411 412
#if defined(CONFIG_ZFCPDUMP) || defined(CONFIG_ZFCPDUMP_MODULE)

/*
 * zfcpdump_prefix_array holds prefix registers for the following scenario:
 * 64 bit zfcpdump kernel and 31 bit kernel which is to be dumped. We have to
 * save its prefix registers, since they get lost, when switching from 31 bit
 * to 64 bit.
 */
unsigned int zfcpdump_prefix_array[NR_CPUS + 1] \
	__attribute__((__section__(".data")));

413
/*
 * Capture the register save area of a detected cpu for zfcpdump.
 * @cpu: index into zfcpdump_save_areas[] for this cpu
 * @phy_cpu: physical address of the cpu
 *
 * Does nothing unless the system was ipl'ed as an FCP dump. Logical cpu
 * slot 1 is temporarily mapped to @phy_cpu so the cpu can be sent a
 * sigp_stop_and_store_status order; SAVE_AREA_SIZE bytes are then copied
 * from SAVE_AREA_BASE relative to the address returned by store_prefix().
 */
static void __init smp_get_save_area(unsigned int cpu, unsigned int phy_cpu)
{
	if (ipl_info.type != IPL_TYPE_FCP_DUMP)
		return;
	if (cpu >= NR_CPUS) {
		printk(KERN_WARNING "Registers for cpu %i not saved since dump "
		       "kernel was compiled with NR_CPUS=%i\n", cpu, NR_CPUS);
		return;
	}
	zfcpdump_save_areas[cpu] = alloc_bootmem(sizeof(union save_area));
	__cpu_logical_map[1] = (__u16) phy_cpu;
	while (signal_processor(1, sigp_stop_and_store_status) == sigp_busy)
		cpu_relax();
	memcpy(zfcpdump_save_areas[cpu],
	       (void *)(unsigned long) store_prefix() + SAVE_AREA_BASE,
	       SAVE_AREA_SIZE);
#ifdef CONFIG_64BIT
	/* copy original prefix register */
	zfcpdump_save_areas[cpu]->s390x.pref_reg = zfcpdump_prefix_array[cpu];
#endif
}

union save_area *zfcpdump_save_areas[NR_CPUS + 1];
EXPORT_SYMBOL_GPL(zfcpdump_save_areas);

#else
439 440 441 442

static inline void smp_get_save_area(unsigned int cpu, unsigned int phy_cpu) { }

#endif /* CONFIG_ZFCPDUMP || CONFIG_ZFCPDUMP_MODULE */
M
Michael Holzheu 已提交
443

L
Linus Torvalds 已提交
444 445 446
/*
 * Let's check how many CPUs we have.
 */
447
/*
 * Probe all 65536 possible cpu addresses and count the cpus that answer.
 *
 * Logical cpu slot 1 is used as a scratch mapping: each candidate address
 * is stored there and probed with sigp_sense; addresses answering with
 * sigp_not_operational are skipped. The boot cpu is counted up front and
 * not probed. For every cpu found smp_get_save_area() is called.
 *
 * Returns the number of cpus detected, including the boot cpu.
 */
static unsigned int __init smp_count_cpus(void)
{
	unsigned int cpu, num_cpus;
	__u16 boot_cpu_addr;

	/*
	 * cpu 0 is the boot cpu. See smp_prepare_boot_cpu.
	 */
	boot_cpu_addr = S390_lowcore.cpu_data.cpu_addr;
	current_thread_info()->cpu = 0;
	num_cpus = 1;
	for (cpu = 0; cpu <= 65535; cpu++) {
		if ((__u16) cpu == boot_cpu_addr)
			continue;
		__cpu_logical_map[1] = (__u16) cpu;
		if (signal_processor(1, sigp_sense) == sigp_not_operational)
			continue;
		smp_get_save_area(num_cpus, cpu);
		num_cpus++;
	}
	printk("Detected %d CPU's\n", (int) num_cpus);
	printk("Boot cpu address %2X\n", boot_cpu_addr);
	return num_cpus;
}

/*
473
 *	Activate a secondary processor.
L
Linus Torvalds 已提交
474
 */
H
Heiko Carstens 已提交
475
/*
 * Entry point of a secondary cpu: initialise the cpu and its timers,
 * mark it online, enable interrupts and enter the idle loop.
 * @cpuvoid: not used
 *
 * The return statement follows the call to cpu_idle().
 */
int __cpuinit start_secondary(void *cpuvoid)
{
	/* Setup the cpu */
	cpu_init();
	preempt_disable();
	/* Enable TOD clock interrupts on the secondary cpu. */
	init_cpu_timer();
#ifdef CONFIG_VIRT_TIMER
	/* Enable cpu timer interrupts on the secondary cpu. */
	init_cpu_vtimer();
#endif
	/* Enable pfault pseudo page faults on this cpu. */
	pfault_init();

	/* Mark this cpu as online */
	cpu_set(smp_processor_id(), cpu_online_map);
	/* Switch on interrupts */
	local_irq_enable();
	/* Print info about this processor */
	print_cpu_info(&S390_lowcore.cpu_data);
	/* cpu_idle will call schedule for us */
	cpu_idle();
	return 0;
}

/*
 * Fork the idle task for @cpu and remember it in current_set[].
 * Panics when the fork fails.
 */
static void __init smp_create_idle(unsigned int cpu)
{
	/*
	 *  The psw and regs settings of the forked task do not matter,
	 *  since it will never be rescheduled.
	 */
	struct task_struct *idle_task = fork_idle(cpu);

	if (!IS_ERR(idle_task)) {
		current_set[cpu] = idle_task;
		return;
	}
	panic("failed fork for CPU %u: %li", cpu, PTR_ERR(idle_task));
}

514
static int cpu_stopped(int cpu)
L
Linus Torvalds 已提交
515 516 517 518
{
	__u32 status;

	/* Check for stopped state */
519 520
	if (signal_processor_ps(&status, 0, cpu, sigp_sense) ==
	    sigp_status_stored) {
L
Linus Torvalds 已提交
521 522 523 524 525 526 527 528
		if (status & 0x40)
			return 1;
	}
	return 0;
}

/* Upping and downing of CPUs */

529
int __cpu_up(unsigned int cpu)
L
Linus Torvalds 已提交
530 531
{
	struct task_struct *idle;
532
	struct _lowcore *cpu_lowcore;
L
Linus Torvalds 已提交
533
	struct stack_frame *sf;
534 535
	sigp_ccode ccode;
	int curr_cpu;
L
Linus Torvalds 已提交
536 537 538 539 540 541 542 543 544 545 546 547

	for (curr_cpu = 0; curr_cpu <= 65535; curr_cpu++) {
		__cpu_logical_map[cpu] = (__u16) curr_cpu;
		if (cpu_stopped(cpu))
			break;
	}

	if (!cpu_stopped(cpu))
		return -ENODEV;

	ccode = signal_processor_p((__u32)(unsigned long)(lowcore_ptr[cpu]),
				   cpu, sigp_set_prefix);
548
	if (ccode) {
L
Linus Torvalds 已提交
549 550 551 552 553 554 555
		printk("sigp_set_prefix failed for cpu %d "
		       "with condition code %d\n",
		       (int) cpu, (int) ccode);
		return -EIO;
	}

	idle = current_set[cpu];
556
	cpu_lowcore = lowcore_ptr[cpu];
L
Linus Torvalds 已提交
557
	cpu_lowcore->kernel_stack = (unsigned long)
558
		task_stack_page(idle) + THREAD_SIZE;
L
Linus Torvalds 已提交
559 560 561 562 563 564 565
	sf = (struct stack_frame *) (cpu_lowcore->kernel_stack
				     - sizeof(struct pt_regs)
				     - sizeof(struct stack_frame));
	memset(sf, 0, sizeof(struct stack_frame));
	sf->gprs[9] = (unsigned long) sf;
	cpu_lowcore->save_area[15] = (unsigned long) sf;
	__ctl_store(cpu_lowcore->cregs_save_area[0], 0, 15);
566 567 568
	asm volatile(
		"	stam	0,15,0(%0)"
		: : "a" (&cpu_lowcore->access_regs_save_area) : "memory");
L
Linus Torvalds 已提交
569
	cpu_lowcore->percpu_offset = __per_cpu_offset[cpu];
570 571
	cpu_lowcore->current_task = (unsigned long) idle;
	cpu_lowcore->cpu_data.cpu_nr = cpu;
L
Linus Torvalds 已提交
572
	eieio();
M
Michael Ryan 已提交
573

574
	while (signal_processor(cpu, sigp_restart) == sigp_busy)
M
Michael Ryan 已提交
575
		udelay(10);
L
Linus Torvalds 已提交
576 577 578 579 580 581

	while (!cpu_online(cpu))
		cpu_relax();
	return 0;
}

582
static unsigned int __initdata additional_cpus;
583
static unsigned int __initdata possible_cpus;
584 585 586

/*
 * Fill cpu_possible_map and cpu_present_map.
 *
 * The number of possible cpus is the number of detected cpus plus
 * additional_cpus, unless possible_cpus is non-zero, in which case that
 * value is used instead; either way it is capped at NR_CPUS. The present
 * map covers the detected cpus, limited to the number of possible cpus.
 */
void __init smp_setup_cpu_possible_map(void)
{
	unsigned int phy_cpus, pos_cpus, cpu;

	phy_cpus = smp_count_cpus();
	pos_cpus = min(phy_cpus + additional_cpus, (unsigned int) NR_CPUS);

	if (possible_cpus)
		pos_cpus = min(possible_cpus, (unsigned int) NR_CPUS);

	for (cpu = 0; cpu < pos_cpus; cpu++)
		cpu_set(cpu, cpu_possible_map);

	phy_cpus = min(phy_cpus, pos_cpus);

	for (cpu = 0; cpu < phy_cpus; cpu++)
		cpu_set(cpu, cpu_present_map);
}

#ifdef CONFIG_HOTPLUG_CPU

/*
 * Handler for the "additional_cpus" early parameter: converts the value
 * with simple_strtoul() (base 0) and stores it in additional_cpus.
 * Always returns 0.
 */
static int __init setup_additional_cpus(char *s)
{
	unsigned int requested = simple_strtoul(s, NULL, 0);

	additional_cpus = requested;
	return 0;
}
early_param("additional_cpus", setup_additional_cpus);

613 614 615 616 617 618 619
/*
 * Handler for the "possible_cpus" early parameter: converts the value
 * with simple_strtoul() (base 0) and stores it in possible_cpus.
 * Always returns 0.
 */
static int __init setup_possible_cpus(char *s)
{
	unsigned int requested = simple_strtoul(s, NULL, 0);

	possible_cpus = requested;
	return 0;
}
early_param("possible_cpus", setup_possible_cpus);

620
int __cpu_disable(void)
L
Linus Torvalds 已提交
621
{
622
	struct ec_creg_mask_parms cr_parms;
Z
Zwane Mwaikambo 已提交
623
	int cpu = smp_processor_id();
L
Linus Torvalds 已提交
624

Z
Zwane Mwaikambo 已提交
625
	cpu_clear(cpu, cpu_online_map);
L
Linus Torvalds 已提交
626 627

	/* Disable pfault pseudo page faults on this cpu. */
H
Heiko Carstens 已提交
628
	pfault_fini();
L
Linus Torvalds 已提交
629

630 631
	memset(&cr_parms.orvals, 0, sizeof(cr_parms.orvals));
	memset(&cr_parms.andvals, 0xff, sizeof(cr_parms.andvals));
L
Linus Torvalds 已提交
632

633
	/* disable all external interrupts */
L
Linus Torvalds 已提交
634
	cr_parms.orvals[0] = 0;
635 636
	cr_parms.andvals[0] = ~(1 << 15 | 1 << 14 | 1 << 13 | 1 << 12 |
				1 << 11 | 1 << 10 | 1 <<  6 | 1 <<  4);
L
Linus Torvalds 已提交
637 638
	/* disable all I/O interrupts */
	cr_parms.orvals[6] = 0;
639 640
	cr_parms.andvals[6] = ~(1 << 31 | 1 << 30 | 1 << 29 | 1 << 28 |
				1 << 27 | 1 << 26 | 1 << 25 | 1 << 24);
L
Linus Torvalds 已提交
641 642
	/* disable most machine checks */
	cr_parms.orvals[14] = 0;
643 644
	cr_parms.andvals[14] = ~(1 << 28 | 1 << 27 | 1 << 26 |
				 1 << 25 | 1 << 24);
645

L
Linus Torvalds 已提交
646 647 648 649 650
	smp_ctl_bit_callback(&cr_parms);

	return 0;
}

651
/*
 * Busy-wait until smp_cpu_not_running() reports true for @cpu, then log
 * that the processor has spun down.
 */
void __cpu_die(unsigned int cpu)
{
	/* Wait until target cpu is down */
	while (!smp_cpu_not_running(cpu))
		cpu_relax();
	printk("Processor %d spun down\n", cpu);
}

659
void cpu_die(void)
L
Linus Torvalds 已提交
660 661 662 663
{
	idle_task_exit();
	signal_processor(smp_processor_id(), sigp_stop);
	BUG();
664
	for (;;);
L
Linus Torvalds 已提交
665 666
}

667 668
#endif /* CONFIG_HOTPLUG_CPU */

L
Linus Torvalds 已提交
669 670 671 672 673 674 675 676
/*
 *	Cycle through the processors and setup structures.
 */

/*
 * Register the emergency signal interrupt handler and allocate a lowcore,
 * an async stack and a panic stack for every possible cpu, then create
 * the idle tasks for all cpus except the calling one.
 * @max_cpus: not used
 *
 * Panics if the interrupt cannot be registered or memory is exhausted.
 */
void __init smp_prepare_cpus(unsigned int max_cpus)
{
	unsigned long stack;
	unsigned int cpu;
	int i;

	/* request the 0x1201 emergency signal external interrupt */
	if (register_external_interrupt(0x1201, do_ext_call_interrupt) != 0)
		panic("Couldn't request external interrupt 0x1201");
	memset(lowcore_ptr, 0, sizeof(lowcore_ptr));
	print_cpu_info(&S390_lowcore.cpu_data);

	/*
	 *  Initialize prefix pages and stacks for all possible cpus
	 */
	for_each_possible_cpu(i) {
		/* Allocation order 1 when pointers are 8 bytes, 0 otherwise. */
		lowcore_ptr[i] = (struct _lowcore *)
			__get_free_pages(GFP_KERNEL | GFP_DMA,
					 sizeof(void*) == 8 ? 1 : 0);
		stack = __get_free_pages(GFP_KERNEL, ASYNC_ORDER);
		if (!lowcore_ptr[i] || !stack)
			panic("smp_boot_cpus failed to allocate memory\n");

		/* Start from a copy of the current cpu's lowcore. */
		*(lowcore_ptr[i]) = S390_lowcore;
		lowcore_ptr[i]->async_stack = stack + ASYNC_SIZE;
		stack = __get_free_pages(GFP_KERNEL, 0);
		if (!stack)
			panic("smp_boot_cpus failed to allocate memory\n");
		lowcore_ptr[i]->panic_stack = stack + PAGE_SIZE;
#ifndef CONFIG_64BIT
		if (MACHINE_HAS_IEEE) {
			lowcore_ptr[i]->extended_save_area_addr =
				(__u32) __get_free_pages(GFP_KERNEL, 0);
			if (!lowcore_ptr[i]->extended_save_area_addr)
				panic("smp_boot_cpus failed to "
				      "allocate memory\n");
		}
#endif
	}
#ifndef CONFIG_64BIT
	if (MACHINE_HAS_IEEE)
		ctl_set_bit(14, 29); /* enable extended save area */
#endif
	/* Switch the calling cpu over to its newly allocated lowcore. */
	set_prefix((u32)(unsigned long) lowcore_ptr[smp_processor_id()]);

	for_each_possible_cpu(cpu)
		if (cpu != smp_processor_id())
			smp_create_idle(cpu);
}

H
Heiko Carstens 已提交
723
/*
 * Set up the boot cpu, which must be logical cpu 0: mark it online, set
 * its per-cpu offset in the lowcore and record the current task in
 * current_set[0].
 */
void __init smp_prepare_boot_cpu(void)
{
	BUG_ON(smp_processor_id() != 0);

	cpu_set(0, cpu_online_map);
	S390_lowcore.percpu_offset = __per_cpu_offset[0];
	current_set[0] = current;
}

H
Heiko Carstens 已提交
732
/*
 * Copy cpu_possible_map into cpu_present_map.
 * @max_cpus: not used
 */
void __init smp_cpus_done(unsigned int max_cpus)
{
	cpu_present_map = cpu_possible_map;
}

/*
 * the frequency of the profiling timer can be changed
 * by writing a multiplier value into /proc/profile.
 *
 * usually you want to run this on all CPUs ;)
 *
 * This implementation ignores @multiplier and always returns 0.
 */
int setup_profiling_timer(unsigned int multiplier)
{
	return 0;
}

static DEFINE_PER_CPU(struct cpu, cpu_devices);

750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770
/*
 * sysfs show routine of the read-only (0444) "capability" attribute.
 * Prints the value obtained from get_cpu_capability() as an unsigned
 * decimal followed by a newline into @buf.
 *
 * Returns the sprintf() result, or the non-zero return code of
 * get_cpu_capability() if that call fails.
 */
static ssize_t show_capability(struct sys_device *dev, char *buf)
{
	unsigned int cap_value;
	int err = get_cpu_capability(&cap_value);

	return err ? err : sprintf(buf, "%u\n", cap_value);
}
static SYSDEV_ATTR(capability, 0444, show_capability, NULL);

/*
 * Cpu notifier callback: creates the "capability" sysdev attribute file
 * when a cpu comes online and removes it when a cpu is dead.
 * @self: notifier block (not used)
 * @action: notifier event
 * @hcpu: logical cpu number, passed as a pointer value
 *
 * Returns NOTIFY_BAD if the attribute file cannot be created, NOTIFY_OK
 * otherwise (including for all events that are not handled here).
 */
static int __cpuinit smp_cpu_notify(struct notifier_block *self,
				    unsigned long action, void *hcpu)
{
	unsigned int cpu = (unsigned int)(long)hcpu;
	struct cpu *c = &per_cpu(cpu_devices, cpu);
	struct sys_device *s = &c->sysdev;

	switch (action) {
	case CPU_ONLINE:
	case CPU_ONLINE_FROZEN:
		if (sysdev_create_file(s, &attr_capability))
			return NOTIFY_BAD;
		break;
	case CPU_DEAD:
	case CPU_DEAD_FROZEN:
		sysdev_remove_file(s, &attr_capability);
		break;
	}
	return NOTIFY_OK;
}

/* Notifier block that hooks smp_cpu_notify() into the cpu notifier chain. */
static struct notifier_block __cpuinitdata smp_cpu_nb = {
	.notifier_call = smp_cpu_notify,
};

L
Linus Torvalds 已提交
787 788 789
/*
 * Register the cpu notifier and a hotpluggable cpu device for every
 * possible cpu; cpus that are already online also get their "capability"
 * attribute file created here.
 *
 * NOTE: the return values of register_cpu() and sysdev_create_file() are
 * not checked. Always returns 0.
 */
static int __init topology_init(void)
{
	int cpu;

	register_cpu_notifier(&smp_cpu_nb);

	for_each_possible_cpu(cpu) {
		struct cpu *c = &per_cpu(cpu_devices, cpu);
		struct sys_device *s = &c->sysdev;

		c->hotpluggable = 1;
		register_cpu(c, cpu);
		if (!cpu_online(cpu))
			continue;
		sysdev_create_file(s, &attr_capability);
	}
	return 0;
}
subsys_initcall(topology_init);