smp.c 19.2 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3
/*
 *  arch/s390/kernel/smp.c
 *
4
 *    Copyright IBM Corp. 1999,2007
L
Linus Torvalds 已提交
5
 *    Author(s): Denis Joseph Barrow (djbarrow@de.ibm.com,barrow_dj@yahoo.com),
6 7
 *		 Martin Schwidefsky (schwidefsky@de.ibm.com)
 *		 Heiko Carstens (heiko.carstens@de.ibm.com)
L
Linus Torvalds 已提交
8
 *
9
 *  based on other smp stuff by
L
Linus Torvalds 已提交
10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31
 *    (c) 1995 Alan Cox, CymruNET Ltd  <alan@cymru.net>
 *    (c) 1998 Ingo Molnar
 *
 * We work with logical cpu numbering everywhere we can. The only
 * functions using the real cpu address (got from STAP) are the sigp
 * functions. For all other functions we use the identity mapping.
 * That means that cpu_number_map[i] == i for every cpu. cpu_number_map is
 * used e.g. to find the idle task belonging to a logical cpu. Every array
 * in the kernel is sorted by the logical cpu number and not by the physical
 * one which is causing all the confusion with __cpu_logical_map and
 * cpu_number_map in other architectures.
 */

#include <linux/module.h>
#include <linux/init.h>
#include <linux/mm.h>
#include <linux/spinlock.h>
#include <linux/kernel_stat.h>
#include <linux/delay.h>
#include <linux/cache.h>
#include <linux/interrupt.h>
#include <linux/cpu.h>
32
#include <linux/timex.h>
M
Michael Holzheu 已提交
33
#include <linux/bootmem.h>
M
Michael Holzheu 已提交
34
#include <asm/ipl.h>
35
#include <asm/setup.h>
L
Linus Torvalds 已提交
36 37 38 39 40 41
#include <asm/sigp.h>
#include <asm/pgalloc.h>
#include <asm/irq.h>
#include <asm/s390_ext.h>
#include <asm/cpcmd.h>
#include <asm/tlbflush.h>
42
#include <asm/timer.h>
M
Michael Holzheu 已提交
43
#include <asm/lowcore.h>
L
Linus Torvalds 已提交
44 45 46 47 48

/*
 * An array with a pointer to the lowcore of every CPU.
 */
struct _lowcore *lowcore_ptr[NR_CPUS];
49
EXPORT_SYMBOL(lowcore_ptr);
L
Linus Torvalds 已提交
50

51
cpumask_t cpu_online_map = CPU_MASK_NONE;
52 53
EXPORT_SYMBOL(cpu_online_map);

54
cpumask_t cpu_possible_map = CPU_MASK_NONE;
55
EXPORT_SYMBOL(cpu_possible_map);
L
Linus Torvalds 已提交
56 57 58 59 60 61

static struct task_struct *current_set[NR_CPUS];

static void smp_ext_bitcall(int, ec_bit_sig);

/*
J
Jan Glauber 已提交
62 63
 * Structure and data for __smp_call_function_map(). This is designed to
 * minimise static memory requirements. It also looks cleaner.
L
Linus Torvalds 已提交
64 65 66 67 68 69
 */
static DEFINE_SPINLOCK(call_lock);

struct call_data_struct {
	void (*func) (void *info);
	void *info;
J
Jan Glauber 已提交
70 71
	cpumask_t started;
	cpumask_t finished;
L
Linus Torvalds 已提交
72 73 74
	int wait;
};

75
static struct call_data_struct *call_data;
L
Linus Torvalds 已提交
76 77 78 79 80 81 82 83 84 85

/*
 * 'Call function' interrupt callback
 */
static void do_call_function(void)
{
	void (*func) (void *info) = call_data->func;
	void *info = call_data->info;
	int wait = call_data->wait;

J
Jan Glauber 已提交
86
	cpu_set(smp_processor_id(), call_data->started);
L
Linus Torvalds 已提交
87 88
	(*func)(info);
	if (wait)
J
Jan Glauber 已提交
89
		cpu_set(smp_processor_id(), call_data->finished);;
L
Linus Torvalds 已提交
90 91
}

J
Jan Glauber 已提交
92 93
/*
 * __smp_call_function_map:
 * @func: the function to run
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait until @func has completed on the other cpus
 * @map: set of cpus that should run @func
 *
 * Runs @func on all online cpus contained in @map. Remote cpus are kicked
 * via the ec_call_function external call and run @func from
 * do_call_function(); if the calling cpu is part of @map it runs @func
 * itself, with interrupts disabled, after the remote cpus have been handled.
 */
static void __smp_call_function_map(void (*func) (void *info), void *info,
				    int nonatomic, int wait, cpumask_t map)
{
	struct call_data_struct data;
	int cpu, local = 0;

	/*
	 * Can deadlock when interrupts are disabled or if in wrong context.
	 */
	WARN_ON(irqs_disabled() || in_irq());

	/*
	 * Check for local function call. We have to have the same call order
	 * as in on_each_cpu() because of machine_restart_smp().
	 */
	if (cpu_isset(smp_processor_id(), map)) {
		local = 1;
		cpu_clear(smp_processor_id(), map);
	}

	/* Only cpus that are online can answer the external call */
	cpus_and(map, map, cpu_online_map);
	if (cpus_empty(map))
		goto out;

	data.func = func;
	data.info = info;
	data.started = CPU_MASK_NONE;
	data.wait = wait;
	if (wait)
		data.finished = CPU_MASK_NONE;

	/* call_lock serialises users of the single global call_data slot */
	spin_lock_bh(&call_lock);
	call_data = &data;

	for_each_cpu_mask(cpu, map)
		smp_ext_bitcall(cpu, ec_call_function);

	/*
	 * Wait until every target has picked up the request; data lives on
	 * this stack frame and must not go away before that.
	 */
	while (!cpus_equal(map, data.started))
		cpu_relax();

	if (wait)
		while (!cpus_equal(map, data.finished))
			cpu_relax();

	spin_unlock_bh(&call_lock);

out:
	/*
	 * Touch the interrupt state only when there really is a local call
	 * to make; otherwise leave the caller's interrupt state alone.
	 */
	if (local) {
		local_irq_disable();
		func(info);
		local_irq_enable();
	}
}

/*
J
Jan Glauber 已提交
147 148 149 150 151
 * smp_call_function:
 * @func: the function to run; this must be fast and non-blocking
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait (atomically) until function has completed on other CPUs
L
Linus Torvalds 已提交
152
 *
J
Jan Glauber 已提交
153
 * Run a function on all other CPUs.
L
Linus Torvalds 已提交
154
 *
155 156
 * You must not call this function with disabled interrupts, from a
 * hardware interrupt handler or from a bottom half.
L
Linus Torvalds 已提交
157
 */
J
Jan Glauber 已提交
158 159
int smp_call_function(void (*func) (void *info), void *info, int nonatomic,
		      int wait)
L
Linus Torvalds 已提交
160
{
J
Jan Glauber 已提交
161
	cpumask_t map;
L
Linus Torvalds 已提交
162

163
	preempt_disable();
J
Jan Glauber 已提交
164 165 166
	map = cpu_online_map;
	cpu_clear(smp_processor_id(), map);
	__smp_call_function_map(func, info, nonatomic, wait, map);
167
	preempt_enable();
J
Jan Glauber 已提交
168 169 170
	return 0;
}
EXPORT_SYMBOL(smp_call_function);
L
Linus Torvalds 已提交
171

J
Jan Glauber 已提交
172
/*
173 174
 * smp_call_function_single:
 * @cpu: the CPU where func should run
J
Jan Glauber 已提交
175 176 177 178 179 180 181
 * @func: the function to run; this must be fast and non-blocking
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait (atomically) until function has completed on other CPUs
 *
 * Run a function on one processor.
 *
182 183
 * You must not call this function with disabled interrupts, from a
 * hardware interrupt handler or from a bottom half.
J
Jan Glauber 已提交
184
 */
185 186
int smp_call_function_single(int cpu, void (*func) (void *info), void *info,
			     int nonatomic, int wait)
J
Jan Glauber 已提交
187
{
188
	preempt_disable();
189 190
	__smp_call_function_map(func, info, nonatomic, wait,
				cpumask_of_cpu(cpu));
191
	preempt_enable();
L
Linus Torvalds 已提交
192 193
	return 0;
}
194
EXPORT_SYMBOL(smp_call_function_single);
L
Linus Torvalds 已提交
195

196
static void do_send_stop(void)
L
Linus Torvalds 已提交
197
{
198
	int cpu, rc;
L
Linus Torvalds 已提交
199

200
	/* stop all processors */
L
Linus Torvalds 已提交
201 202 203 204 205 206 207 208 209
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		do {
			rc = signal_processor(cpu, sigp_stop);
		} while (rc == sigp_busy);
	}
}

210
static void do_store_status(void)
L
Linus Torvalds 已提交
211
{
212
	int cpu, rc;
L
Linus Torvalds 已提交
213

214
	/* store status of all processors in their lowcores (real 0) */
L
Linus Torvalds 已提交
215 216 217 218 219 220 221
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		do {
			rc = signal_processor_p(
				(__u32)(unsigned long) lowcore_ptr[cpu], cpu,
				sigp_store_status_at_address);
222 223
		} while (rc == sigp_busy);
	}
L
Linus Torvalds 已提交
224 225
}

226
static void do_wait_for_stop(void)
H
Heiko Carstens 已提交
227 228 229 230 231 232 233
{
	int cpu;

	/* Wait for all other cpus to enter stopped state */
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
234
		while (!smp_cpu_not_running(cpu))
H
Heiko Carstens 已提交
235 236 237 238
			cpu_relax();
	}
}

L
Linus Torvalds 已提交
239 240 241 242 243 244
/*
 * this function sends a 'stop' sigp to all other CPUs in the system.
 * it goes straight through.
 */
void smp_send_stop(void)
{
H
Heiko Carstens 已提交
245
	/* Disable all interrupts/machine checks */
G
Gerald Schaefer 已提交
246
	__load_psw_mask(psw_kernel_bits & ~PSW_MASK_MCHECK);
H
Heiko Carstens 已提交
247

248
	/* write magic number to zero page (absolute 0) */
L
Linus Torvalds 已提交
249 250 251 252 253
	lowcore_ptr[smp_processor_id()]->panic_magic = __PANIC_MAGIC;

	/* stop other processors. */
	do_send_stop();

H
Heiko Carstens 已提交
254 255 256
	/* wait until other processors are stopped */
	do_wait_for_stop();

L
Linus Torvalds 已提交
257 258 259 260 261 262 263
	/* store status of other processors. */
	do_store_status();
}

/*
 * Reboot, halt and power_off routines for SMP.
 */
264
void machine_restart_smp(char *__unused)
{
	/* Quiesce all other cpus first, then re-IPL from this one */
	smp_send_stop();
	do_reipl();
}

void machine_halt_smp(void)
{
	smp_send_stop();

	/* Under VM, issue the configured halt command if there is one */
	if (MACHINE_IS_VM) {
		if (strlen(vmhalt_cmd) > 0)
			__cpcmd(vmhalt_cmd, NULL, 0, NULL);
	}

	/* Finally stop this cpu as well; loop in case we get past the sigp */
	signal_processor(smp_processor_id(), sigp_stop_and_store_status);
	while (1)
		;
}

void machine_power_off_smp(void)
{
	smp_send_stop();

	/* Under VM, issue the configured power-off command if there is one */
	if (MACHINE_IS_VM) {
		if (strlen(vmpoff_cmd) > 0)
			__cpcmd(vmpoff_cmd, NULL, 0, NULL);
	}

	/* Finally stop this cpu as well; loop in case we get past the sigp */
	signal_processor(smp_processor_id(), sigp_stop_and_store_status);
	while (1)
		;
}

/*
 * This is the main routine where commands issued by other
 * cpus are handled.
 */

293
static void do_ext_call_interrupt(__u16 code)
{
	unsigned long pending;

	/*
	 * Atomically fetch and clear the signal bits other cpus have set in
	 * our lowcore.
	 *
	 * Nothing needs to be done here for ec_schedule: the work happens
	 * automatically on return from the interrupt.
	 */
	pending = xchg(&S390_lowcore.ext_call_fast, 0);

	if (!test_bit(ec_call_function, &pending))
		return;
	do_call_function();
}

/*
 * Send an external call sigp to another cpu and return without waiting
 * for its completion.
 */
static void smp_ext_bitcall(int cpu, ec_bit_sig sig)
{
	unsigned long *pending =
		(unsigned long *) &lowcore_ptr[cpu]->ext_call_fast;

	/* Flag the request in the target's lowcore first ... */
	set_bit(sig, pending);

	/* ... then kick the target, backing off 10us whenever sigp is busy */
	for (;;) {
		if (signal_processor(cpu, sigp_emergency_signal) != sigp_busy)
			break;
		udelay(10);
	}
}

323
#ifndef CONFIG_64BIT
L
Linus Torvalds 已提交
324 325 326 327 328 329 330 331 332 333
/*
 * callback for smp_ptlb_all(): purges the TLB of the cpu it runs on.
 */
void smp_ptlb_callback(void *info)
{
	/* @info is not used; only the executing cpu's TLB is flushed */
	local_flush_tlb();
}

void smp_ptlb_all(void)
{
334
	on_each_cpu(smp_ptlb_callback, NULL, 0, 1);
L
Linus Torvalds 已提交
335 336
}
EXPORT_SYMBOL(smp_ptlb_all);
337
#endif /* ! CONFIG_64BIT */
L
Linus Torvalds 已提交
338 339 340 341 342 343 344 345

/*
 * this function sends a 'reschedule' IPI to another CPU.
 * it goes straight through and wastes no time serializing
 * anything. Worst case is that we lose a reschedule ...
 */
void smp_send_reschedule(int cpu)
{
346
	smp_ext_bitcall(cpu, ec_schedule);
L
Linus Torvalds 已提交
347 348 349 350 351
}

/*
 * parameter area for the set/clear control bit callbacks
 */
352
struct ec_creg_mask_parms {
	/* per control register: bits OR-ed in after the AND mask is applied */
	unsigned long orvals[16];
	/* per control register: mask AND-ed with the current value */
	unsigned long andvals[16];
};
L
Linus Torvalds 已提交
356 357 358 359

/*
 * callback for setting/clearing control bits
 */
360 361
static void smp_ctl_bit_callback(void *info)
{
362
	struct ec_creg_mask_parms *pp = info;
L
Linus Torvalds 已提交
363 364
	unsigned long cregs[16];
	int i;
365

366 367
	__ctl_store(cregs, 0, 15);
	for (i = 0; i <= 15; i++)
L
Linus Torvalds 已提交
368
		cregs[i] = (cregs[i] & pp->andvals[i]) | pp->orvals[i];
369
	__ctl_load(cregs, 0, 15);
L
Linus Torvalds 已提交
370 371 372 373 374
}

/*
 * Set a bit in a control register of all cpus
 */
375 376 377
void smp_ctl_set_bit(int cr, int bit)
{
	struct ec_creg_mask_parms parms;
L
Linus Torvalds 已提交
378

379 380
	memset(&parms.orvals, 0, sizeof(parms.orvals));
	memset(&parms.andvals, 0xff, sizeof(parms.andvals));
L
Linus Torvalds 已提交
381
	parms.orvals[cr] = 1 << bit;
382
	on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
L
Linus Torvalds 已提交
383
}
384
EXPORT_SYMBOL(smp_ctl_set_bit);
L
Linus Torvalds 已提交
385 386 387 388

/*
 * Clear a bit in a control register of all cpus
 */
389 390 391
void smp_ctl_clear_bit(int cr, int bit)
{
	struct ec_creg_mask_parms parms;
L
Linus Torvalds 已提交
392

393 394
	memset(&parms.orvals, 0, sizeof(parms.orvals));
	memset(&parms.andvals, 0xff, sizeof(parms.andvals));
L
Linus Torvalds 已提交
395
	parms.andvals[cr] = ~(1L << bit);
396
	on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
L
Linus Torvalds 已提交
397
}
398
EXPORT_SYMBOL(smp_ctl_clear_bit);
L
Linus Torvalds 已提交
399

M
Michael Holzheu 已提交
400 401 402 403 404 405 406 407 408 409 410
#if defined(CONFIG_ZFCPDUMP) || defined(CONFIG_ZFCPDUMP_MODULE)

/*
 * zfcpdump_prefix_array holds prefix registers for the following scenario:
 * 64 bit zfcpdump kernel and 31 bit kernel which is to be dumped. We have to
 * save its prefix registers, since they get lost, when switching from 31 bit
 * to 64 bit.
 */
unsigned int zfcpdump_prefix_array[NR_CPUS + 1] \
	__attribute__((__section__(".data")));

411
static void __init smp_get_save_area(unsigned int cpu, unsigned int phy_cpu)
{
	union save_area *area;

	/* Register save areas are only collected for an FCP dump IPL */
	if (ipl_info.type != IPL_TYPE_FCP_DUMP)
		return;
	if (cpu >= NR_CPUS) {
		printk(KERN_WARNING "Registers for cpu %i not saved since dump "
		       "kernel was compiled with NR_CPUS=%i\n", cpu, NR_CPUS);
		return;
	}

	area = alloc_bootmem(sizeof(union save_area));
	zfcpdump_save_areas[cpu] = area;

	/* Logical cpu 1 is borrowed to address the physical cpu via sigp */
	__cpu_logical_map[1] = (__u16) phy_cpu;
	while (signal_processor(1, sigp_stop_and_store_status) == sigp_busy)
		cpu_relax();

	/* Copy the save area found at SAVE_AREA_BASE behind our prefix */
	memcpy(area,
	       (void *)(unsigned long) store_prefix() + SAVE_AREA_BASE,
	       SAVE_AREA_SIZE);
#ifdef CONFIG_64BIT
	/* copy original prefix register */
	area->s390x.pref_reg = zfcpdump_prefix_array[cpu];
#endif
}

union save_area *zfcpdump_save_areas[NR_CPUS + 1];
EXPORT_SYMBOL_GPL(zfcpdump_save_areas);

#else
437 438 439 440

static inline void smp_get_save_area(unsigned int cpu, unsigned int phy_cpu) { }

#endif /* CONFIG_ZFCPDUMP || CONFIG_ZFCPDUMP_MODULE */
M
Michael Holzheu 已提交
441

L
Linus Torvalds 已提交
442 443 444
/*
 * Let's check how many CPUs we have.
 */
445
static unsigned int __init smp_count_cpus(void)
{
	unsigned int addr, found;
	__u16 boot_addr;

	/*
	 * cpu 0 is the boot cpu. See smp_prepare_boot_cpu.
	 */
	boot_addr = S390_lowcore.cpu_data.cpu_addr;
	current_thread_info()->cpu = 0;
	found = 1;

	/* Probe every possible 16 bit cpu address except our own */
	for (addr = 0; addr <= 65535; addr++) {
		if ((__u16) addr == boot_addr)
			continue;
		/* Logical cpu 1 is borrowed to sense the candidate address */
		__cpu_logical_map[1] = (__u16) addr;
		if (signal_processor(1, sigp_sense) != sigp_not_operational) {
			smp_get_save_area(found, addr);
			found++;
		}
	}
	printk("Detected %d CPU's\n", (int) found);
	printk("Boot cpu address %2X\n", boot_addr);
	return found;
}

/*
471
 *	Activate a secondary processor.
L
Linus Torvalds 已提交
472
 */
H
Heiko Carstens 已提交
473
int __cpuinit start_secondary(void *cpuvoid)
{
	/* Basic per-cpu setup; @cpuvoid is not used */
	cpu_init();
	preempt_disable();

	/* TOD clock interrupts for this cpu */
	init_cpu_timer();
#ifdef CONFIG_VIRT_TIMER
	/* cpu timer interrupts for this cpu */
	init_cpu_vtimer();
#endif
	/* pfault pseudo page faults for this cpu */
	pfault_init();

	/* Announce ourselves; __cpu_up() spins until this bit is visible */
	cpu_set(smp_processor_id(), cpu_online_map);

	/* From now on interrupts may be taken */
	local_irq_enable();

	print_cpu_info(&S390_lowcore.cpu_data);

	/* cpu_idle will call schedule for us */
	cpu_idle();
	return 0;
}

static void __init smp_create_idle(unsigned int cpu)
{
	/*
	 * The psw and register contents of the forked task do not matter:
	 * it is never rescheduled.
	 */
	struct task_struct *idle = fork_idle(cpu);

	if (IS_ERR(idle))
		panic("failed fork for CPU %u: %li", cpu, PTR_ERR(idle));

	/* Remember the idle task; __cpu_up() picks it up from here */
	current_set[cpu] = idle;
}

512
static int cpu_stopped(int cpu)
L
Linus Torvalds 已提交
513 514 515 516
{
	__u32 status;

	/* Check for stopped state */
517 518
	if (signal_processor_ps(&status, 0, cpu, sigp_sense) ==
	    sigp_status_stored) {
L
Linus Torvalds 已提交
519 520 521 522 523 524 525 526
		if (status & 0x40)
			return 1;
	}
	return 0;
}

/* Upping and downing of CPUs */

527
int __cpu_up(unsigned int cpu)
L
Linus Torvalds 已提交
528 529
{
	struct task_struct *idle;
530
	struct _lowcore *cpu_lowcore;
L
Linus Torvalds 已提交
531
	struct stack_frame *sf;
532 533
	sigp_ccode ccode;
	int curr_cpu;
L
Linus Torvalds 已提交
534 535 536 537 538 539 540 541 542 543 544 545

	for (curr_cpu = 0; curr_cpu <= 65535; curr_cpu++) {
		__cpu_logical_map[cpu] = (__u16) curr_cpu;
		if (cpu_stopped(cpu))
			break;
	}

	if (!cpu_stopped(cpu))
		return -ENODEV;

	ccode = signal_processor_p((__u32)(unsigned long)(lowcore_ptr[cpu]),
				   cpu, sigp_set_prefix);
546
	if (ccode) {
L
Linus Torvalds 已提交
547 548 549 550 551 552 553
		printk("sigp_set_prefix failed for cpu %d "
		       "with condition code %d\n",
		       (int) cpu, (int) ccode);
		return -EIO;
	}

	idle = current_set[cpu];
554
	cpu_lowcore = lowcore_ptr[cpu];
L
Linus Torvalds 已提交
555
	cpu_lowcore->kernel_stack = (unsigned long)
556
		task_stack_page(idle) + THREAD_SIZE;
L
Linus Torvalds 已提交
557 558 559 560 561 562 563
	sf = (struct stack_frame *) (cpu_lowcore->kernel_stack
				     - sizeof(struct pt_regs)
				     - sizeof(struct stack_frame));
	memset(sf, 0, sizeof(struct stack_frame));
	sf->gprs[9] = (unsigned long) sf;
	cpu_lowcore->save_area[15] = (unsigned long) sf;
	__ctl_store(cpu_lowcore->cregs_save_area[0], 0, 15);
564 565 566
	asm volatile(
		"	stam	0,15,0(%0)"
		: : "a" (&cpu_lowcore->access_regs_save_area) : "memory");
L
Linus Torvalds 已提交
567
	cpu_lowcore->percpu_offset = __per_cpu_offset[cpu];
568 569
	cpu_lowcore->current_task = (unsigned long) idle;
	cpu_lowcore->cpu_data.cpu_nr = cpu;
L
Linus Torvalds 已提交
570
	eieio();
M
Michael Ryan 已提交
571

572
	while (signal_processor(cpu, sigp_restart) == sigp_busy)
M
Michael Ryan 已提交
573
		udelay(10);
L
Linus Torvalds 已提交
574 575 576 577 578 579

	while (!cpu_online(cpu))
		cpu_relax();
	return 0;
}

580
static unsigned int __initdata additional_cpus;
581
static unsigned int __initdata possible_cpus;
582 583 584

void __init smp_setup_cpu_possible_map(void)
{
	unsigned int detected, limit, cpu;

	detected = smp_count_cpus();

	/*
	 * An explicit possible_cpus value overrides "detected plus
	 * additional_cpus"; either way NR_CPUS is the upper bound.
	 */
	limit = possible_cpus ? possible_cpus : detected + additional_cpus;
	limit = min(limit, (unsigned int) NR_CPUS);

	/*
	 * Cpus [0, limit) are possible; of those, the ones below the
	 * detected count are also present.
	 */
	for (cpu = 0; cpu < limit; cpu++) {
		cpu_set(cpu, cpu_possible_map);
		if (cpu < detected)
			cpu_set(cpu, cpu_present_map);
	}
}

#ifdef CONFIG_HOTPLUG_CPU

static int __init setup_additional_cpus(char *s)
{
	/* Base 0: simple_strtoul picks the radix from the string's prefix */
	unsigned long count = simple_strtoul(s, NULL, 0);

	additional_cpus = count;
	return 0;
}
early_param("additional_cpus", setup_additional_cpus);

611 612 613 614 615 616 617
static int __init setup_possible_cpus(char *s)
{
	/* Base 0: simple_strtoul picks the radix from the string's prefix */
	unsigned long count = simple_strtoul(s, NULL, 0);

	possible_cpus = count;
	return 0;
}
early_param("possible_cpus", setup_possible_cpus);

618
int __cpu_disable(void)
L
Linus Torvalds 已提交
619
{
620
	struct ec_creg_mask_parms cr_parms;
Z
Zwane Mwaikambo 已提交
621
	int cpu = smp_processor_id();
L
Linus Torvalds 已提交
622

Z
Zwane Mwaikambo 已提交
623
	cpu_clear(cpu, cpu_online_map);
L
Linus Torvalds 已提交
624 625

	/* Disable pfault pseudo page faults on this cpu. */
H
Heiko Carstens 已提交
626
	pfault_fini();
L
Linus Torvalds 已提交
627

628 629
	memset(&cr_parms.orvals, 0, sizeof(cr_parms.orvals));
	memset(&cr_parms.andvals, 0xff, sizeof(cr_parms.andvals));
L
Linus Torvalds 已提交
630

631
	/* disable all external interrupts */
L
Linus Torvalds 已提交
632
	cr_parms.orvals[0] = 0;
633 634
	cr_parms.andvals[0] = ~(1 << 15 | 1 << 14 | 1 << 13 | 1 << 12 |
				1 << 11 | 1 << 10 | 1 <<  6 | 1 <<  4);
L
Linus Torvalds 已提交
635 636
	/* disable all I/O interrupts */
	cr_parms.orvals[6] = 0;
637 638
	cr_parms.andvals[6] = ~(1 << 31 | 1 << 30 | 1 << 29 | 1 << 28 |
				1 << 27 | 1 << 26 | 1 << 25 | 1 << 24);
L
Linus Torvalds 已提交
639 640
	/* disable most machine checks */
	cr_parms.orvals[14] = 0;
641 642
	cr_parms.andvals[14] = ~(1 << 28 | 1 << 27 | 1 << 26 |
				 1 << 25 | 1 << 24);
643

L
Linus Torvalds 已提交
644 645 646 647 648
	smp_ctl_bit_callback(&cr_parms);

	return 0;
}

649
void __cpu_die(unsigned int cpu)
{
	/* Busy-wait until the target cpu is reported as not running */
	for (;;) {
		if (smp_cpu_not_running(cpu))
			break;
		cpu_relax();
	}
	printk("Processor %d spun down\n", cpu);
}

657
void cpu_die(void)
L
Linus Torvalds 已提交
658 659 660 661
{
	idle_task_exit();
	signal_processor(smp_processor_id(), sigp_stop);
	BUG();
662
	for (;;);
L
Linus Torvalds 已提交
663 664
}

665 666
#endif /* CONFIG_HOTPLUG_CPU */

L
Linus Torvalds 已提交
667 668 669 670 671 672 673 674
/*
 *	Cycle through the processors and setup structures.
 */

void __init smp_prepare_cpus(unsigned int max_cpus)
{
	struct _lowcore *lc;
	unsigned long stack;
	unsigned int cpu;

	/* request the 0x1201 emergency signal external interrupt */
	if (register_external_interrupt(0x1201, do_ext_call_interrupt) != 0)
		panic("Couldn't request external interrupt 0x1201");
	memset(lowcore_ptr, 0, sizeof(lowcore_ptr));
	print_cpu_info(&S390_lowcore.cpu_data);

	/*
	 * Give every possible cpu a lowcore (a copy of the current one), an
	 * async stack and a panic stack. Any allocation failure is fatal.
	 */
	for_each_possible_cpu(cpu) {
		/* order 1 when pointers are 8 bytes wide, order 0 otherwise */
		lc = (struct _lowcore *)
			__get_free_pages(GFP_KERNEL | GFP_DMA,
					 sizeof(void*) == 8 ? 1 : 0);
		lowcore_ptr[cpu] = lc;
		stack = __get_free_pages(GFP_KERNEL, ASYNC_ORDER);
		if (!lc || !stack)
			panic("smp_boot_cpus failed to allocate memory\n");

		*lc = S390_lowcore;
		/* stack pointers are set to the end of their allocation */
		lc->async_stack = stack + ASYNC_SIZE;
		stack = __get_free_pages(GFP_KERNEL, 0);
		if (!stack)
			panic("smp_boot_cpus failed to allocate memory\n");
		lc->panic_stack = stack + PAGE_SIZE;
#ifndef CONFIG_64BIT
		if (MACHINE_HAS_IEEE) {
			lc->extended_save_area_addr =
				(__u32) __get_free_pages(GFP_KERNEL, 0);
			if (!lc->extended_save_area_addr)
				panic("smp_boot_cpus failed to "
				      "allocate memory\n");
		}
#endif
	}
#ifndef CONFIG_64BIT
	if (MACHINE_HAS_IEEE)
		ctl_set_bit(14, 29); /* enable extended save area */
#endif
	/* Switch the running cpu over to its newly allocated lowcore */
	set_prefix((u32)(unsigned long) lowcore_ptr[smp_processor_id()]);

	/* Every possible cpu but the current one needs an idle task */
	for_each_possible_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		smp_create_idle(cpu);
	}
}

H
Heiko Carstens 已提交
721
void __init smp_prepare_boot_cpu(void)
{
	/* The boot cpu must be logical cpu 0 */
	BUG_ON(smp_processor_id() != 0);

	cpu_set(0, cpu_online_map);
	S390_lowcore.percpu_offset = __per_cpu_offset[0];

	/* The task currently running is recorded as cpu 0's entry */
	current_set[0] = current;
}

H
Heiko Carstens 已提交
730
void __init smp_cpus_done(unsigned int max_cpus)
{
	/* @max_cpus is not used: every possible cpu is marked present */
	cpu_present_map = cpu_possible_map;
}

/*
 * the frequency of the profiling timer can be changed
 * by writing a multiplier value into /proc/profile.
 *
 * usually you want to run this on all CPUs ;)
 */
int setup_profiling_timer(unsigned int multiplier)
{
	/* @multiplier is ignored; success is reported unconditionally */
	return 0;
}

static DEFINE_PER_CPU(struct cpu, cpu_devices);

748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768
static ssize_t show_capability(struct sys_device *dev, char *buf)
{
	unsigned int cap;
	int err = get_cpu_capability(&cap);

	/*
	 * Pass a non-zero get_cpu_capability() result straight through,
	 * otherwise print the value and return the number of characters.
	 */
	return err ? err : sprintf(buf, "%u\n", cap);
}
static SYSDEV_ATTR(capability, 0444, show_capability, NULL);

static int __cpuinit smp_cpu_notify(struct notifier_block *self,
				    unsigned long action, void *hcpu)
{
	unsigned int cpu = (unsigned int)(long)hcpu;
	struct sys_device *s = &per_cpu(cpu_devices, cpu).sysdev;

	/* The "capability" attribute exists only while the cpu is online */
	if (action == CPU_ONLINE || action == CPU_ONLINE_FROZEN) {
		if (sysdev_create_file(s, &attr_capability))
			return NOTIFY_BAD;
	} else if (action == CPU_DEAD || action == CPU_DEAD_FROZEN) {
		sysdev_remove_file(s, &attr_capability);
	}
	/* All other actions are of no interest here */
	return NOTIFY_OK;
}

/* Notifier block registered by topology_init(); dispatches to smp_cpu_notify */
static struct notifier_block __cpuinitdata smp_cpu_nb = {
	.notifier_call = smp_cpu_notify,
};

L
Linus Torvalds 已提交
785 786 787
static int __init topology_init(void)
{
	int cpu;

	/* Later online/dead transitions are handled by smp_cpu_notify() */
	register_cpu_notifier(&smp_cpu_nb);

	for_each_possible_cpu(cpu) {
		struct cpu *c = &per_cpu(cpu_devices, cpu);

		/* Every possible cpu is registered as hotpluggable */
		c->hotpluggable = 1;
		register_cpu(c, cpu);

		/* Cpus that are already online get the attribute right away */
		if (cpu_online(cpu))
			sysdev_create_file(&c->sysdev, &attr_capability);
	}
	return 0;
}
subsys_initcall(topology_init);