smp.c 19.2 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3
/*
 *  arch/s390/kernel/smp.c
 *
4
 *    Copyright IBM Corp. 1999,2007
L
Linus Torvalds 已提交
5
 *    Author(s): Denis Joseph Barrow (djbarrow@de.ibm.com,barrow_dj@yahoo.com),
6 7
 *		 Martin Schwidefsky (schwidefsky@de.ibm.com)
 *		 Heiko Carstens (heiko.carstens@de.ibm.com)
L
Linus Torvalds 已提交
8
 *
9
 *  based on other smp stuff by
L
Linus Torvalds 已提交
10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31
 *    (c) 1995 Alan Cox, CymruNET Ltd  <alan@cymru.net>
 *    (c) 1998 Ingo Molnar
 *
 * We work with logical cpu numbering everywhere we can. The only
 * functions using the real cpu address (got from STAP) are the sigp
 * functions. For all other functions we use the identity mapping.
 * That means that cpu_number_map[i] == i for every cpu. cpu_number_map is
 * used e.g. to find the idle task belonging to a logical cpu. Every array
 * in the kernel is sorted by the logical cpu number and not by the physical
 * one which is causing all the confusion with __cpu_logical_map and
 * cpu_number_map in other architectures.
 */

#include <linux/module.h>
#include <linux/init.h>
#include <linux/mm.h>
#include <linux/spinlock.h>
#include <linux/kernel_stat.h>
#include <linux/delay.h>
#include <linux/cache.h>
#include <linux/interrupt.h>
#include <linux/cpu.h>
32
#include <linux/timex.h>
M
Michael Holzheu 已提交
33
#include <linux/bootmem.h>
M
Michael Holzheu 已提交
34
#include <asm/ipl.h>
35
#include <asm/setup.h>
L
Linus Torvalds 已提交
36 37 38 39 40 41
#include <asm/sigp.h>
#include <asm/pgalloc.h>
#include <asm/irq.h>
#include <asm/s390_ext.h>
#include <asm/cpcmd.h>
#include <asm/tlbflush.h>
42
#include <asm/timer.h>
M
Michael Holzheu 已提交
43
#include <asm/lowcore.h>
L
Linus Torvalds 已提交
44 45 46 47 48

/*
 * An array with a pointer to the lowcore of every CPU.
 */
struct _lowcore *lowcore_ptr[NR_CPUS];
49
EXPORT_SYMBOL(lowcore_ptr);
L
Linus Torvalds 已提交
50

51
cpumask_t cpu_online_map = CPU_MASK_NONE;
52 53
EXPORT_SYMBOL(cpu_online_map);

54
cpumask_t cpu_possible_map = CPU_MASK_NONE;
55
EXPORT_SYMBOL(cpu_possible_map);
L
Linus Torvalds 已提交
56 57 58 59 60 61

static struct task_struct *current_set[NR_CPUS];

static void smp_ext_bitcall(int, ec_bit_sig);

/*
J
Jan Glauber 已提交
62 63
 * Structure and data for __smp_call_function_map(). This is designed to
 * minimise static memory requirements. It also looks cleaner.
L
Linus Torvalds 已提交
64 65 66 67 68 69
 */
static DEFINE_SPINLOCK(call_lock);

struct call_data_struct {
	void (*func) (void *info);
	void *info;
J
Jan Glauber 已提交
70 71
	cpumask_t started;
	cpumask_t finished;
L
Linus Torvalds 已提交
72 73 74
	int wait;
};

75
static struct call_data_struct *call_data;
L
Linus Torvalds 已提交
76 77 78 79 80 81 82 83 84 85

/*
 * 'Call function' interrupt callback
 */
static void do_call_function(void)
{
	/*
	 * Fetch the request into locals first. The descriptor lives on the
	 * stack of the cpu running __smp_call_function_map(); with wait == 0
	 * that cpu stops waiting as soon as every target has set its
	 * 'started' bit, so call_data must not be read after that point.
	 */
	void (*fn) (void *info) = call_data->func;
	void *arg = call_data->info;
	int ack_completion = call_data->wait;

	cpu_set(smp_processor_id(), call_data->started);
	(*fn)(arg);
	if (ack_completion)
		cpu_set(smp_processor_id(), call_data->finished);
}

J
Jan Glauber 已提交
92 93
/*
 * Run func(info) on every online cpu contained in map.
 *
 * Remote cpus are signalled with ec_call_function and waited for (always
 * until they have started, and until they have finished when wait is set).
 * If the calling cpu is part of map, func is run locally afterwards with
 * interrupts disabled. The nonatomic argument is not used here.
 */
static void __smp_call_function_map(void (*func) (void *info), void *info,
				    int nonatomic, int wait, cpumask_t map)
{
	struct call_data_struct data;
	int cpu, run_local;

	/* Can deadlock when interrupts are disabled or if in wrong context. */
	WARN_ON(irqs_disabled() || in_irq());

	/*
	 * Remember whether the local cpu was requested and take it out of
	 * the set of cpus to signal. We have to have the same call order
	 * as in on_each_cpu() because of machine_restart_smp().
	 */
	run_local = cpu_isset(smp_processor_id(), map) ? 1 : 0;
	if (run_local)
		cpu_clear(smp_processor_id(), map);

	cpus_and(map, map, cpu_online_map);
	if (!cpus_empty(map)) {
		data.func = func;
		data.info = info;
		data.started = CPU_MASK_NONE;
		data.wait = wait;
		if (wait)
			data.finished = CPU_MASK_NONE;

		spin_lock(&call_lock);
		call_data = &data;

		for_each_cpu_mask(cpu, map)
			smp_ext_bitcall(cpu, ec_call_function);

		/* Wait until every signalled cpu has picked up the request */
		while (!cpus_equal(map, data.started))
			cpu_relax();
		/* ... and, if requested, until every one has completed it */
		while (wait && !cpus_equal(map, data.finished))
			cpu_relax();
		spin_unlock(&call_lock);
	}

	if (run_local) {
		local_irq_disable();
		func(info);
		local_irq_enable();
	}
}

/*
J
Jan Glauber 已提交
145 146 147 148 149
 * smp_call_function:
 * @func: the function to run; this must be fast and non-blocking
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait (atomically) until function has completed on other CPUs
L
Linus Torvalds 已提交
150
 *
J
Jan Glauber 已提交
151
 * Run a function on all other CPUs.
L
Linus Torvalds 已提交
152
 *
153 154
 * You must not call this function with disabled interrupts, from a
 * hardware interrupt handler or from a bottom half.
L
Linus Torvalds 已提交
155
 */
J
Jan Glauber 已提交
156 157
int smp_call_function(void (*func) (void *info), void *info, int nonatomic,
		      int wait)
L
Linus Torvalds 已提交
158
{
J
Jan Glauber 已提交
159
	cpumask_t map;
L
Linus Torvalds 已提交
160

161
	preempt_disable();
J
Jan Glauber 已提交
162 163 164
	map = cpu_online_map;
	cpu_clear(smp_processor_id(), map);
	__smp_call_function_map(func, info, nonatomic, wait, map);
165
	preempt_enable();
J
Jan Glauber 已提交
166 167 168
	return 0;
}
EXPORT_SYMBOL(smp_call_function);
L
Linus Torvalds 已提交
169

J
Jan Glauber 已提交
170
/*
171 172
 * smp_call_function_single:
 * @cpu: the CPU where func should run
J
Jan Glauber 已提交
173 174 175 176 177 178 179
 * @func: the function to run; this must be fast and non-blocking
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait (atomically) until function has completed on other CPUs
 *
 * Run a function on one processor.
 *
180 181
 * You must not call this function with disabled interrupts, from a
 * hardware interrupt handler or from a bottom half.
J
Jan Glauber 已提交
182
 */
183 184
int smp_call_function_single(int cpu, void (*func) (void *info), void *info,
			     int nonatomic, int wait)
J
Jan Glauber 已提交
185
{
186
	preempt_disable();
187 188
	__smp_call_function_map(func, info, nonatomic, wait,
				cpumask_of_cpu(cpu));
189
	preempt_enable();
L
Linus Torvalds 已提交
190 191
	return 0;
}
192
EXPORT_SYMBOL(smp_call_function_single);
L
Linus Torvalds 已提交
193

194
static void do_send_stop(void)
L
Linus Torvalds 已提交
195
{
196
	int cpu, rc;
L
Linus Torvalds 已提交
197

198
	/* stop all processors */
L
Linus Torvalds 已提交
199 200 201 202 203 204 205 206 207
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		do {
			rc = signal_processor(cpu, sigp_stop);
		} while (rc == sigp_busy);
	}
}

208
static void do_store_status(void)
L
Linus Torvalds 已提交
209
{
210
	int cpu, rc;
L
Linus Torvalds 已提交
211

212
	/* store status of all processors in their lowcores (real 0) */
L
Linus Torvalds 已提交
213 214 215 216 217 218 219
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		do {
			rc = signal_processor_p(
				(__u32)(unsigned long) lowcore_ptr[cpu], cpu,
				sigp_store_status_at_address);
220 221
		} while (rc == sigp_busy);
	}
L
Linus Torvalds 已提交
222 223
}

224
static void do_wait_for_stop(void)
H
Heiko Carstens 已提交
225 226 227 228 229 230 231
{
	int cpu;

	/* Wait for all other cpus to enter stopped state */
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
232
		while (!smp_cpu_not_running(cpu))
H
Heiko Carstens 已提交
233 234 235 236
			cpu_relax();
	}
}

L
Linus Torvalds 已提交
237 238 239 240 241 242
/*
 * this function sends a 'stop' sigp to all other CPUs in the system.
 * it goes straight through.
 */
void smp_send_stop(void)
{
H
Heiko Carstens 已提交
243
	/* Disable all interrupts/machine checks */
G
Gerald Schaefer 已提交
244
	__load_psw_mask(psw_kernel_bits & ~PSW_MASK_MCHECK);
H
Heiko Carstens 已提交
245

246
	/* write magic number to zero page (absolute 0) */
L
Linus Torvalds 已提交
247 248 249 250 251
	lowcore_ptr[smp_processor_id()]->panic_magic = __PANIC_MAGIC;

	/* stop other processors. */
	do_send_stop();

H
Heiko Carstens 已提交
252 253 254
	/* wait until other processors are stopped */
	do_wait_for_stop();

L
Linus Torvalds 已提交
255 256 257 258 259 260 261
	/* store status of other processors. */
	do_store_status();
}

/*
 * Reboot, halt and power_off routines for SMP.
 */
262
void machine_restart_smp(char *__unused)
{
	/* Stop all other cpus first, then hand over to do_reipl(). */
	smp_send_stop();
	do_reipl();
}

void machine_halt_smp(void)
{
	smp_send_stop();
	/* Under VM, issue the halt command if one has been configured. */
	if (MACHINE_IS_VM && vmhalt_cmd[0] != '\0')
		__cpcmd(vmhalt_cmd, NULL, 0, NULL);
	/* Finally stop the calling cpu itself, storing its status. */
	signal_processor(smp_processor_id(), sigp_stop_and_store_status);
	while (1)
		;
}

void machine_power_off_smp(void)
{
	smp_send_stop();
	/* Under VM, issue the power-off command if one has been configured. */
	if (MACHINE_IS_VM && vmpoff_cmd[0] != '\0')
		__cpcmd(vmpoff_cmd, NULL, 0, NULL);
	/* Finally stop the calling cpu itself, storing its status. */
	signal_processor(smp_processor_id(), sigp_stop_and_store_status);
	while (1)
		;
}

/*
 * This is the main routine where commands issued by other
 * cpus are handled.
 */

291
static void do_ext_call_interrupt(__u16 code)
{
	unsigned long pending;

	/*
	 * Atomically fetch and reset the bit signals posted for this cpu.
	 *
	 * For the ec_schedule signal we have to do nothing. All the work
	 * is done automatically when we return from the interrupt.
	 */
	pending = xchg(&S390_lowcore.ext_call_fast, 0);

	if (!test_bit(ec_call_function, &pending))
		return;
	do_call_function();
}

/*
 * Send an external call sigp to another cpu and return without waiting
 * for its completion.
 */
static void smp_ext_bitcall(int cpu, ec_bit_sig sig)
{
	/* Word in the target cpu's lowcore that collects pending signals. */
	unsigned long *pending =
		(unsigned long *) &lowcore_ptr[cpu]->ext_call_fast;

	/* Post the signal bit first, then kick the target cpu. */
	set_bit(sig, pending);
	while (signal_processor(cpu, sigp_emergency_signal) == sigp_busy)
		udelay(10);
}

321
#ifndef CONFIG_64BIT
L
Linus Torvalds 已提交
322 323 324 325 326 327 328 329 330 331
/*
 * this function sends a 'purge tlb' signal to another CPU.
 */
void smp_ptlb_callback(void *info)
{
	/* info is not used; the work is done by local_flush_tlb(). */
	local_flush_tlb();
}

void smp_ptlb_all(void)
{
332
	on_each_cpu(smp_ptlb_callback, NULL, 0, 1);
L
Linus Torvalds 已提交
333 334
}
EXPORT_SYMBOL(smp_ptlb_all);
335
#endif /* ! CONFIG_64BIT */
L
Linus Torvalds 已提交
336 337 338 339 340 341 342 343

/*
 * this function sends a 'reschedule' IPI to another CPU.
 * it goes straight through and wastes no time serializing
 * anything. Worst case is that we lose a reschedule ...
 */
void smp_send_reschedule(int cpu)
{
344
	smp_ext_bitcall(cpu, ec_schedule);
L
Linus Torvalds 已提交
345 346 347 348 349
}

/*
 * parameter area for the set/clear control bit callbacks
 */
350
struct ec_creg_mask_parms {
	/* per control register: bits ORed into the register value */
	unsigned long orvals[16];
	/* per control register: mask ANDed with the register value */
	unsigned long andvals[16];
};
L
Linus Torvalds 已提交
354 355 356 357

/*
 * callback for setting/clearing control bits
 */
358 359
static void smp_ctl_bit_callback(void *info)
{
360
	struct ec_creg_mask_parms *pp = info;
L
Linus Torvalds 已提交
361 362
	unsigned long cregs[16];
	int i;
363

364 365
	__ctl_store(cregs, 0, 15);
	for (i = 0; i <= 15; i++)
L
Linus Torvalds 已提交
366
		cregs[i] = (cregs[i] & pp->andvals[i]) | pp->orvals[i];
367
	__ctl_load(cregs, 0, 15);
L
Linus Torvalds 已提交
368 369 370 371 372
}

/*
 * Set a bit in a control register of all cpus
 */
373 374 375
void smp_ctl_set_bit(int cr, int bit)
{
	struct ec_creg_mask_parms parms;
L
Linus Torvalds 已提交
376

377 378
	memset(&parms.orvals, 0, sizeof(parms.orvals));
	memset(&parms.andvals, 0xff, sizeof(parms.andvals));
L
Linus Torvalds 已提交
379
	parms.orvals[cr] = 1 << bit;
380
	on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
L
Linus Torvalds 已提交
381
}
382
EXPORT_SYMBOL(smp_ctl_set_bit);
L
Linus Torvalds 已提交
383 384 385 386

/*
 * Clear a bit in a control register of all cpus
 */
387 388 389
void smp_ctl_clear_bit(int cr, int bit)
{
	struct ec_creg_mask_parms parms;
L
Linus Torvalds 已提交
390

391 392
	memset(&parms.orvals, 0, sizeof(parms.orvals));
	memset(&parms.andvals, 0xff, sizeof(parms.andvals));
L
Linus Torvalds 已提交
393
	parms.andvals[cr] = ~(1L << bit);
394
	on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
L
Linus Torvalds 已提交
395
}
396
EXPORT_SYMBOL(smp_ctl_clear_bit);
L
Linus Torvalds 已提交
397

M
Michael Holzheu 已提交
398 399 400 401 402 403 404 405 406 407 408
#if defined(CONFIG_ZFCPDUMP) || defined(CONFIG_ZFCPDUMP_MODULE)

/*
 * zfcpdump_prefix_array holds prefix registers for the following scenario:
 * 64 bit zfcpdump kernel and 31 bit kernel which is to be dumped. We have to
 * save its prefix registers, since they get lost, when switching from 31 bit
 * to 64 bit.
 */
unsigned int zfcpdump_prefix_array[NR_CPUS + 1] \
	__attribute__((__section__(".data")));

409
/*
 * Capture the register save area of one detected cpu for zfcpdump.
 * @cpu:     index into zfcpdump_save_areas[] under which the data is kept
 * @phy_cpu: cpu address that gets stopped and asked to store its status
 *
 * Does nothing unless the system was IPLed as an FCP dump
 * (ipl_info.type == IPL_TYPE_FCP_DUMP).
 */
static void __init smp_get_save_area(unsigned int cpu, unsigned int phy_cpu)
{
	if (ipl_info.type != IPL_TYPE_FCP_DUMP)
		return;
	if (cpu >= NR_CPUS) {
		/* cpu is unsigned, so print it with %u */
		printk(KERN_WARNING "Registers for cpu %u not saved since dump "
		       "kernel was compiled with NR_CPUS=%i\n", cpu, NR_CPUS);
		return;
	}
	zfcpdump_save_areas[cpu] = alloc_bootmem(sizeof(union save_area));
	/* Logical cpu 1 is temporarily mapped to phy_cpu to address it. */
	__cpu_logical_map[1] = (__u16) phy_cpu;
	while (signal_processor(1, sigp_stop_and_store_status) == sigp_busy)
		cpu_relax();
	/* Copy the stored status out of the save area. */
	memcpy(zfcpdump_save_areas[cpu],
	       (void *)(unsigned long) store_prefix() + SAVE_AREA_BASE,
	       SAVE_AREA_SIZE);
#ifdef CONFIG_64BIT
	/* copy original prefix register */
	zfcpdump_save_areas[cpu]->s390x.pref_reg = zfcpdump_prefix_array[cpu];
#endif
}

union save_area *zfcpdump_save_areas[NR_CPUS + 1];
EXPORT_SYMBOL_GPL(zfcpdump_save_areas);

#else
435 436 437 438

static inline void smp_get_save_area(unsigned int cpu, unsigned int phy_cpu) { }

#endif /* CONFIG_ZFCPDUMP || CONFIG_ZFCPDUMP_MODULE */
M
Michael Holzheu 已提交
439

L
Linus Torvalds 已提交
440 441 442
/*
 * Let's check how many CPUs we have.
 */
443
static unsigned int __init smp_count_cpus(void)
{
	unsigned int addr, found;
	__u16 boot_cpu_addr;

	/*
	 * cpu 0 is the boot cpu. See smp_prepare_boot_cpu.
	 */
	boot_cpu_addr = S390_lowcore.cpu_data.cpu_addr;
	current_thread_info()->cpu = 0;
	found = 1;

	/* Probe every 16 bit cpu address except the boot cpu's own. */
	for (addr = 0; addr <= 65535; addr++) {
		if ((__u16) addr == boot_cpu_addr)
			continue;
		/* Logical cpu 1 serves as a scratch slot for the probe. */
		__cpu_logical_map[1] = (__u16) addr;
		if (signal_processor(1, sigp_sense) != sigp_not_operational) {
			smp_get_save_area(found, addr);
			found++;
		}
	}
	printk("Detected %d CPU's\n", (int) found);
	printk("Boot cpu address %2X\n", boot_cpu_addr);
	return found;
}

/*
469
 *	Activate a secondary processor.
L
Linus Torvalds 已提交
470
 */
H
Heiko Carstens 已提交
471
int __cpuinit start_secondary(void *cpuvoid)
{
	/* Basic per-cpu setup; cpuvoid is not used. */
	cpu_init();
	preempt_disable();

	/* Enable TOD clock interrupts on the secondary cpu. */
	init_cpu_timer();
#ifdef CONFIG_VIRT_TIMER
	/* Enable cpu timer interrupts on the secondary cpu. */
	init_cpu_vtimer();
#endif
	/* Enable pfault pseudo page faults on this cpu. */
	pfault_init();

	/*
	 * Announce this cpu as online; __cpu_up() on the starting cpu
	 * spins until it sees this bit.
	 */
	cpu_set(smp_processor_id(), cpu_online_map);
	/* From here on interrupts may be taken. */
	local_irq_enable();
	/* Print info about this processor */
	print_cpu_info(&S390_lowcore.cpu_data);
	/* cpu_idle will call schedule for us */
	cpu_idle();
	return 0;
}

/* Fork the idle task for @cpu and record it in current_set[]. */
static void __init smp_create_idle(unsigned int cpu)
{
	/*
	 *  don't care about the psw and regs settings since we'll never
	 *  reschedule the forked task.
	 */
	struct task_struct *idle = fork_idle(cpu);

	if (IS_ERR(idle))
		panic("failed fork for CPU %u: %li", cpu, PTR_ERR(idle));
	current_set[cpu] = idle;
}

510
static int cpu_stopped(int cpu)
L
Linus Torvalds 已提交
511 512 513 514
{
	__u32 status;

	/* Check for stopped state */
515 516
	if (signal_processor_ps(&status, 0, cpu, sigp_sense) ==
	    sigp_status_stored) {
L
Linus Torvalds 已提交
517 518 519 520 521 522 523 524
		if (status & 0x40)
			return 1;
	}
	return 0;
}

/* Upping and downing of CPUs */

525
int __cpu_up(unsigned int cpu)
L
Linus Torvalds 已提交
526 527
{
	struct task_struct *idle;
528
	struct _lowcore *cpu_lowcore;
L
Linus Torvalds 已提交
529
	struct stack_frame *sf;
530 531
	sigp_ccode ccode;
	int curr_cpu;
L
Linus Torvalds 已提交
532 533 534 535 536 537 538 539 540 541 542 543

	for (curr_cpu = 0; curr_cpu <= 65535; curr_cpu++) {
		__cpu_logical_map[cpu] = (__u16) curr_cpu;
		if (cpu_stopped(cpu))
			break;
	}

	if (!cpu_stopped(cpu))
		return -ENODEV;

	ccode = signal_processor_p((__u32)(unsigned long)(lowcore_ptr[cpu]),
				   cpu, sigp_set_prefix);
544
	if (ccode) {
L
Linus Torvalds 已提交
545 546 547 548 549 550 551
		printk("sigp_set_prefix failed for cpu %d "
		       "with condition code %d\n",
		       (int) cpu, (int) ccode);
		return -EIO;
	}

	idle = current_set[cpu];
552
	cpu_lowcore = lowcore_ptr[cpu];
L
Linus Torvalds 已提交
553
	cpu_lowcore->kernel_stack = (unsigned long)
554
		task_stack_page(idle) + THREAD_SIZE;
L
Linus Torvalds 已提交
555 556 557 558 559 560 561
	sf = (struct stack_frame *) (cpu_lowcore->kernel_stack
				     - sizeof(struct pt_regs)
				     - sizeof(struct stack_frame));
	memset(sf, 0, sizeof(struct stack_frame));
	sf->gprs[9] = (unsigned long) sf;
	cpu_lowcore->save_area[15] = (unsigned long) sf;
	__ctl_store(cpu_lowcore->cregs_save_area[0], 0, 15);
562 563 564
	asm volatile(
		"	stam	0,15,0(%0)"
		: : "a" (&cpu_lowcore->access_regs_save_area) : "memory");
L
Linus Torvalds 已提交
565
	cpu_lowcore->percpu_offset = __per_cpu_offset[cpu];
566 567
	cpu_lowcore->current_task = (unsigned long) idle;
	cpu_lowcore->cpu_data.cpu_nr = cpu;
L
Linus Torvalds 已提交
568
	eieio();
M
Michael Ryan 已提交
569

570
	while (signal_processor(cpu, sigp_restart) == sigp_busy)
M
Michael Ryan 已提交
571
		udelay(10);
L
Linus Torvalds 已提交
572 573 574 575 576 577

	while (!cpu_online(cpu))
		cpu_relax();
	return 0;
}

578
static unsigned int __initdata additional_cpus;
579
static unsigned int __initdata possible_cpus;
580 581 582

/*
 * Fill cpu_possible_map and cpu_present_map from the number of detected
 * cpus and the additional_cpus / possible_cpus settings.
 */
void __init smp_setup_cpu_possible_map(void)
{
	unsigned int detected, limit, nr;

	detected = smp_count_cpus();

	/* An explicit possible_cpus value overrides detected + additional. */
	if (possible_cpus)
		limit = min(possible_cpus, (unsigned int) NR_CPUS);
	else
		limit = min(detected + additional_cpus,
			    (unsigned int) NR_CPUS);

	for (nr = 0; nr < limit; nr++)
		cpu_set(nr, cpu_possible_map);

	/* Never mark more cpus present than are possible. */
	detected = min(detected, limit);

	for (nr = 0; nr < detected; nr++)
		cpu_set(nr, cpu_present_map);
}

#ifdef CONFIG_HOTPLUG_CPU

/*
 * Handler for the "additional_cpus" early parameter: stores the numeric
 * value of @s in additional_cpus. Trailing characters after the number are
 * not examined (no end pointer is requested). Always returns 0.
 */
static int __init setup_additional_cpus(char *s)
{
	additional_cpus = simple_strtoul(s, NULL, 0);
	return 0;
}
early_param("additional_cpus", setup_additional_cpus);

609 610 611 612 613 614 615
/*
 * Handler for the "possible_cpus" early parameter: stores the numeric
 * value of @s in possible_cpus. Trailing characters after the number are
 * not examined (no end pointer is requested). Always returns 0.
 */
static int __init setup_possible_cpus(char *s)
{
	possible_cpus = simple_strtoul(s, NULL, 0);
	return 0;
}
early_param("possible_cpus", setup_possible_cpus);

616
int __cpu_disable(void)
L
Linus Torvalds 已提交
617
{
618
	struct ec_creg_mask_parms cr_parms;
Z
Zwane Mwaikambo 已提交
619
	int cpu = smp_processor_id();
L
Linus Torvalds 已提交
620

Z
Zwane Mwaikambo 已提交
621
	cpu_clear(cpu, cpu_online_map);
L
Linus Torvalds 已提交
622 623

	/* Disable pfault pseudo page faults on this cpu. */
H
Heiko Carstens 已提交
624
	pfault_fini();
L
Linus Torvalds 已提交
625

626 627
	memset(&cr_parms.orvals, 0, sizeof(cr_parms.orvals));
	memset(&cr_parms.andvals, 0xff, sizeof(cr_parms.andvals));
L
Linus Torvalds 已提交
628

629
	/* disable all external interrupts */
L
Linus Torvalds 已提交
630
	cr_parms.orvals[0] = 0;
631 632
	cr_parms.andvals[0] = ~(1 << 15 | 1 << 14 | 1 << 13 | 1 << 12 |
				1 << 11 | 1 << 10 | 1 <<  6 | 1 <<  4);
L
Linus Torvalds 已提交
633 634
	/* disable all I/O interrupts */
	cr_parms.orvals[6] = 0;
635 636
	cr_parms.andvals[6] = ~(1 << 31 | 1 << 30 | 1 << 29 | 1 << 28 |
				1 << 27 | 1 << 26 | 1 << 25 | 1 << 24);
L
Linus Torvalds 已提交
637 638
	/* disable most machine checks */
	cr_parms.orvals[14] = 0;
639 640
	cr_parms.andvals[14] = ~(1 << 28 | 1 << 27 | 1 << 26 |
				 1 << 25 | 1 << 24);
641

L
Linus Torvalds 已提交
642 643 644 645 646
	smp_ctl_bit_callback(&cr_parms);

	return 0;
}

647
void __cpu_die(unsigned int cpu)
{
	/* Poll until the target cpu is reported as no longer running. */
	for (;;) {
		if (smp_cpu_not_running(cpu))
			break;
		cpu_relax();
	}
	printk("Processor %d spun down\n", cpu);
}

655
void cpu_die(void)
L
Linus Torvalds 已提交
656 657 658 659
{
	idle_task_exit();
	signal_processor(smp_processor_id(), sigp_stop);
	BUG();
660
	for (;;);
L
Linus Torvalds 已提交
661 662
}

663 664
#endif /* CONFIG_HOTPLUG_CPU */

L
Linus Torvalds 已提交
665 666 667 668 669 670 671 672
/*
 *	Cycle through the processors and setup structures.
 */

void __init smp_prepare_cpus(unsigned int max_cpus)
{
	/* lowcore allocation order: one page, or two with 8 byte pointers */
	const int lc_order = sizeof(void*) == 8 ? 1 : 0;
	struct _lowcore *lc;
	unsigned long stack;
	unsigned int cpu;
	int i;

	/* request the 0x1201 emergency signal external interrupt */
	if (register_external_interrupt(0x1201, do_ext_call_interrupt) != 0)
		panic("Couldn't request external interrupt 0x1201");
	memset(lowcore_ptr, 0, sizeof(lowcore_ptr));

	print_cpu_info(&S390_lowcore.cpu_data);

	/*
	 *  Initialize prefix pages and stacks for all possible cpus
	 */
	for_each_possible_cpu(i) {
		lc = (struct _lowcore *)
			__get_free_pages(GFP_KERNEL | GFP_DMA, lc_order);
		lowcore_ptr[i] = lc;
		stack = __get_free_pages(GFP_KERNEL, ASYNC_ORDER);
		if (!lc || !stack)
			panic("smp_boot_cpus failed to allocate memory\n");

		/* Every lowcore starts out as a copy of the current one. */
		*lc = S390_lowcore;
		lc->async_stack = stack + ASYNC_SIZE;
		stack = __get_free_pages(GFP_KERNEL, 0);
		if (!stack)
			panic("smp_boot_cpus failed to allocate memory\n");
		lc->panic_stack = stack + PAGE_SIZE;
#ifndef CONFIG_64BIT
		if (MACHINE_HAS_IEEE) {
			lc->extended_save_area_addr =
				(__u32) __get_free_pages(GFP_KERNEL, 0);
			if (!lc->extended_save_area_addr)
				panic("smp_boot_cpus failed to "
				      "allocate memory\n");
		}
#endif
	}
#ifndef CONFIG_64BIT
	if (MACHINE_HAS_IEEE)
		ctl_set_bit(14, 29); /* enable extended save area */
#endif
	/* Switch the calling cpu over to its newly allocated lowcore. */
	set_prefix((u32)(unsigned long) lowcore_ptr[smp_processor_id()]);

	/* Every other possible cpu gets an idle task. */
	for_each_possible_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		smp_create_idle(cpu);
	}
}

H
Heiko Carstens 已提交
719
void __init smp_prepare_boot_cpu(void)
{
	/* The boot cpu must be logical cpu 0. */
	BUG_ON(smp_processor_id() != 0);

	/* Mark it online and set up its per-cpu offset and current task. */
	cpu_set(0, cpu_online_map);
	S390_lowcore.percpu_offset = __per_cpu_offset[0];
	current_set[0] = current;
}

H
Heiko Carstens 已提交
728
void __init smp_cpus_done(unsigned int max_cpus)
{
	/* From now on every possible cpu is treated as present. */
	cpu_present_map = cpu_possible_map;
}

/*
 * the frequency of the profiling timer can be changed
 * by writing a multiplier value into /proc/profile.
 *
 * usually you want to run this on all CPUs ;)
 */
int setup_profiling_timer(unsigned int multiplier)
{
	/* The multiplier is ignored here; success is reported regardless. */
	return 0;
}

static DEFINE_PER_CPU(struct cpu, cpu_devices);

746 747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766
/*
 * sysfs show handler for the "capability" attribute: writes the value
 * obtained from get_cpu_capability() as a decimal line into @buf.
 * Returns the sprintf() result, or the error from get_cpu_capability().
 */
static ssize_t show_capability(struct sys_device *dev, char *buf)
{
	unsigned int cap;
	int err = get_cpu_capability(&cap);

	if (err)
		return err;
	return sprintf(buf, "%u\n", cap);
}
static SYSDEV_ATTR(capability, 0444, show_capability, NULL);

/*
 * Cpu notifier: create the capability attribute when a cpu comes online
 * and remove it again when the cpu is dead. All other actions are ignored.
 */
static int __cpuinit smp_cpu_notify(struct notifier_block *self,
				    unsigned long action, void *hcpu)
{
	unsigned int cpu = (unsigned int)(long)hcpu;
	struct cpu *c = &per_cpu(cpu_devices, cpu);

	if (action == CPU_ONLINE || action == CPU_ONLINE_FROZEN) {
		if (sysdev_create_file(&c->sysdev, &attr_capability))
			return NOTIFY_BAD;
	} else if (action == CPU_DEAD || action == CPU_DEAD_FROZEN) {
		sysdev_remove_file(&c->sysdev, &attr_capability);
	}
	return NOTIFY_OK;
}

static struct notifier_block __cpuinitdata smp_cpu_nb = {
780
	.notifier_call = smp_cpu_notify,
781 782
};

L
Linus Torvalds 已提交
783 784 785
/*
 * Register a cpu device for every possible cpu and create the capability
 * attribute for those that are already online.
 *
 * Returns 0 on success, or the first error reported by register_cpu() or
 * sysdev_create_file().
 */
static int __init topology_init(void)
{
	int cpu;
	int rc;

	register_cpu_notifier(&smp_cpu_nb);

	for_each_possible_cpu(cpu) {
		struct cpu *c = &per_cpu(cpu_devices, cpu);

		c->hotpluggable = 1;
		rc = register_cpu(c, cpu);
		if (rc)
			return rc;
		/* Offline cpus get the attribute from smp_cpu_notify(). */
		if (!cpu_online(cpu))
			continue;
		rc = sysdev_create_file(&c->sysdev, &attr_capability);
		if (rc)
			return rc;
	}
	return 0;
}
subsys_initcall(topology_init);