smp.c 19.5 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3
/*
 *  arch/s390/kernel/smp.c
 *
 *    Copyright IBM Corp. 1999,2007
 *    Author(s): Denis Joseph Barrow (djbarrow@de.ibm.com,barrow_dj@yahoo.com),
 *		 Martin Schwidefsky (schwidefsky@de.ibm.com)
 *		 Heiko Carstens (heiko.carstens@de.ibm.com)
 *
 *  based on other smp stuff by
 *    (c) 1995 Alan Cox, CymruNET Ltd  <alan@cymru.net>
 *    (c) 1998 Ingo Molnar
 *
 * We work with logical cpu numbering everywhere we can. The only
 * functions using the real cpu address (got from STAP) are the sigp
 * functions. For all other functions we use the identity mapping.
 * That means that cpu_number_map[i] == i for every cpu. cpu_number_map is
 * used e.g. to find the idle task belonging to a logical cpu. Every array
 * in the kernel is sorted by the logical cpu number and not by the physical
 * one which is causing all the confusion with __cpu_logical_map and
 * cpu_number_map in other architectures.
 */

#include <linux/module.h>
#include <linux/init.h>
#include <linux/mm.h>
#include <linux/spinlock.h>
#include <linux/kernel_stat.h>
#include <linux/delay.h>
#include <linux/cache.h>
#include <linux/interrupt.h>
#include <linux/cpu.h>
32
#include <linux/timex.h>
M
Michael Holzheu 已提交
33
#include <linux/bootmem.h>
M
Michael Holzheu 已提交
34
#include <asm/ipl.h>
35
#include <asm/setup.h>
L
Linus Torvalds 已提交
36 37 38 39 40 41
#include <asm/sigp.h>
#include <asm/pgalloc.h>
#include <asm/irq.h>
#include <asm/s390_ext.h>
#include <asm/cpcmd.h>
#include <asm/tlbflush.h>
42
#include <asm/timer.h>
M
Michael Holzheu 已提交
43
#include <asm/lowcore.h>
L
Linus Torvalds 已提交
44 45 46 47 48

/*
 * An array with a pointer to the lowcore of every CPU.
 */
struct _lowcore *lowcore_ptr[NR_CPUS];
49
EXPORT_SYMBOL(lowcore_ptr);
L
Linus Torvalds 已提交
50

51
cpumask_t cpu_online_map = CPU_MASK_NONE;
52 53
EXPORT_SYMBOL(cpu_online_map);

54
cpumask_t cpu_possible_map = CPU_MASK_NONE;
55
EXPORT_SYMBOL(cpu_possible_map);
L
Linus Torvalds 已提交
56 57 58 59 60 61

static struct task_struct *current_set[NR_CPUS];

static void smp_ext_bitcall(int, ec_bit_sig);

/*
 * Structure and data for __smp_call_function_map(). This is designed to
 * minimise static memory requirements. It also looks cleaner.
 */
static DEFINE_SPINLOCK(call_lock);

struct call_data_struct {
	void (*func) (void *info);
	void *info;
J
Jan Glauber 已提交
70 71
	cpumask_t started;
	cpumask_t finished;
L
Linus Torvalds 已提交
72 73 74
	int wait;
};

75
static struct call_data_struct *call_data;
L
Linus Torvalds 已提交
76 77 78 79 80 81 82 83 84 85

/*
 * 'Call function' interrupt callback
 */
static void do_call_function(void)
{
	/*
	 * Copy the request out of call_data before announcing that we have
	 * started: the descriptor lives on the initiator's stack and, when
	 * wait is zero, the initiator only waits for the started mask.
	 */
	void (*func) (void *info) = call_data->func;
	void *info = call_data->info;
	int wait = call_data->wait;

	cpu_set(smp_processor_id(), call_data->started);
	(*func)(info);
	if (wait)
		cpu_set(smp_processor_id(), call_data->finished);
}

J
Jan Glauber 已提交
92 93
/*
 * Run func(info) on every online cpu contained in map.
 *
 * @func: function to run
 * @info: argument passed to func
 * @nonatomic: not used by this function
 * @wait: if non-zero, also wait until func has finished on the other cpus
 * @map: cpus to run on; may include the calling cpu
 *
 * Remote cpus are signalled first; if the calling cpu is part of map,
 * func is run locally afterwards with interrupts disabled.
 */
static void __smp_call_function_map(void (*func) (void *info), void *info,
				    int nonatomic, int wait, cpumask_t map)
{
	struct call_data_struct req;
	int target;
	int run_local = 0;

	/*
	 * Can deadlock when interrupts are disabled or if in wrong context.
	 */
	WARN_ON(irqs_disabled() || in_irq());

	/*
	 * Check for local function call. We have to have the same call order
	 * as in on_each_cpu() because of machine_restart_smp().
	 */
	if (cpu_isset(smp_processor_id(), map)) {
		run_local = 1;
		cpu_clear(smp_processor_id(), map);
	}

	/* Only online cpus can answer the signal. */
	cpus_and(map, map, cpu_online_map);
	if (!cpus_empty(map)) {
		req.func = func;
		req.info = info;
		req.started = CPU_MASK_NONE;
		req.wait = wait;
		if (wait)
			req.finished = CPU_MASK_NONE;

		/* call_lock serialises use of the single call_data pointer. */
		spin_lock_bh(&call_lock);
		call_data = &req;

		for_each_cpu_mask(target, map)
			smp_ext_bitcall(target, ec_call_function);

		/* Wait until every target has picked up the request ... */
		while (!cpus_equal(map, req.started))
			cpu_relax();

		/* ... and, if asked to, until every target is done. */
		if (wait) {
			while (!cpus_equal(map, req.finished))
				cpu_relax();
		}

		spin_unlock_bh(&call_lock);
	}

	local_irq_disable();
	if (run_local)
		func(info);
	local_irq_enable();
}

/*
J
Jan Glauber 已提交
147 148 149 150 151
 * smp_call_function:
 * @func: the function to run; this must be fast and non-blocking
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait (atomically) until function has completed on other CPUs
L
Linus Torvalds 已提交
152
 *
J
Jan Glauber 已提交
153
 * Run a function on all other CPUs.
L
Linus Torvalds 已提交
154
 *
155 156
 * You must not call this function with disabled interrupts, from a
 * hardware interrupt handler or from a bottom half.
L
Linus Torvalds 已提交
157
 */
J
Jan Glauber 已提交
158 159
int smp_call_function(void (*func) (void *info), void *info, int nonatomic,
		      int wait)
L
Linus Torvalds 已提交
160
{
J
Jan Glauber 已提交
161
	cpumask_t map;
L
Linus Torvalds 已提交
162

163
	preempt_disable();
J
Jan Glauber 已提交
164 165 166
	map = cpu_online_map;
	cpu_clear(smp_processor_id(), map);
	__smp_call_function_map(func, info, nonatomic, wait, map);
167
	preempt_enable();
J
Jan Glauber 已提交
168 169 170
	return 0;
}
EXPORT_SYMBOL(smp_call_function);
L
Linus Torvalds 已提交
171

J
Jan Glauber 已提交
172 173 174 175 176 177 178 179 180 181
/*
 * smp_call_function_on:
 * @func: the function to run; this must be fast and non-blocking
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait (atomically) until function has completed on other CPUs
 * @cpu: the CPU where func should run
 *
 * Run a function on one processor.
 *
182 183
 * You must not call this function with disabled interrupts, from a
 * hardware interrupt handler or from a bottom half.
J
Jan Glauber 已提交
184 185
 */
int smp_call_function_on(void (*func) (void *info), void *info, int nonatomic,
186
			 int wait, int cpu)
J
Jan Glauber 已提交
187 188
{
	cpumask_t map = CPU_MASK_NONE;
L
Linus Torvalds 已提交
189

190
	preempt_disable();
J
Jan Glauber 已提交
191 192
	cpu_set(cpu, map);
	__smp_call_function_map(func, info, nonatomic, wait, map);
193
	preempt_enable();
L
Linus Torvalds 已提交
194 195 196 197
	return 0;
}
EXPORT_SYMBOL(smp_call_function_on);

198
static void do_send_stop(void)
L
Linus Torvalds 已提交
199
{
200
	int cpu, rc;
L
Linus Torvalds 已提交
201

202
	/* stop all processors */
L
Linus Torvalds 已提交
203 204 205 206 207 208 209 210 211
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		do {
			rc = signal_processor(cpu, sigp_stop);
		} while (rc == sigp_busy);
	}
}

212
static void do_store_status(void)
L
Linus Torvalds 已提交
213
{
214
	int cpu, rc;
L
Linus Torvalds 已提交
215

216
	/* store status of all processors in their lowcores (real 0) */
L
Linus Torvalds 已提交
217 218 219 220 221 222 223
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		do {
			rc = signal_processor_p(
				(__u32)(unsigned long) lowcore_ptr[cpu], cpu,
				sigp_store_status_at_address);
224 225
		} while (rc == sigp_busy);
	}
L
Linus Torvalds 已提交
226 227
}

228
static void do_wait_for_stop(void)
H
Heiko Carstens 已提交
229 230 231 232 233 234 235
{
	int cpu;

	/* Wait for all other cpus to enter stopped state */
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
236
		while (!smp_cpu_not_running(cpu))
H
Heiko Carstens 已提交
237 238 239 240
			cpu_relax();
	}
}

L
Linus Torvalds 已提交
241 242 243 244 245 246
/*
 * this function sends a 'stop' sigp to all other CPUs in the system.
 * it goes straight through.
 */
void smp_send_stop(void)
{
H
Heiko Carstens 已提交
247
	/* Disable all interrupts/machine checks */
G
Gerald Schaefer 已提交
248
	__load_psw_mask(psw_kernel_bits & ~PSW_MASK_MCHECK);
H
Heiko Carstens 已提交
249

250
	/* write magic number to zero page (absolute 0) */
L
Linus Torvalds 已提交
251 252 253 254 255
	lowcore_ptr[smp_processor_id()]->panic_magic = __PANIC_MAGIC;

	/* stop other processors. */
	do_send_stop();

H
Heiko Carstens 已提交
256 257 258
	/* wait until other processors are stopped */
	do_wait_for_stop();

L
Linus Torvalds 已提交
259 260 261 262 263 264 265
	/* store status of other processors. */
	do_store_status();
}

/*
 * Reboot, halt and power_off routines for SMP.
 */
266
/*
 * Restart: stop all other cpus, then hand over to do_reipl().
 * The argument is not used.
 */
void machine_restart_smp(char *__unused)
{
	smp_send_stop();
	do_reipl();
}

/*
 * Halt: stop all other cpus, run the configured vmhalt command when running
 * under VM and a command is set, then stop the calling cpu as well.
 */
void machine_halt_smp(void)
{
	smp_send_stop();
	if (MACHINE_IS_VM) {
		if (strlen(vmhalt_cmd) > 0)
			__cpcmd(vmhalt_cmd, NULL, 0, NULL);
	}
	signal_processor(smp_processor_id(), sigp_stop_and_store_status);
	/* Spin forever in case the stop order has not taken effect. */
	while (1)
		;
}

/*
 * Power off: stop all other cpus, run the configured vmpoff command when
 * running under VM and a command is set, then stop the calling cpu as well.
 */
void machine_power_off_smp(void)
{
	smp_send_stop();
	if (MACHINE_IS_VM) {
		if (strlen(vmpoff_cmd) > 0)
			__cpcmd(vmpoff_cmd, NULL, 0, NULL);
	}
	signal_processor(smp_processor_id(), sigp_stop_and_store_status);
	/* Spin forever in case the stop order has not taken effect. */
	while (1)
		;
}

/*
 * This is the main routine where commands issued by other
 * cpus are handled.
 */

295
static void do_ext_call_interrupt(__u16 code)
L
Linus Torvalds 已提交
296
{
297
	unsigned long bits;
L
Linus Torvalds 已提交
298

299 300 301 302 303 304
	/*
	 * handle bit signal external calls
	 *
	 * For the ec_schedule signal we have to do nothing. All the work
	 * is done automatically when we return from the interrupt.
	 */
L
Linus Torvalds 已提交
305 306
	bits = xchg(&S390_lowcore.ext_call_fast, 0);

307
	if (test_bit(ec_call_function, &bits))
L
Linus Torvalds 已提交
308 309 310 311 312 313 314 315 316
		do_call_function();
}

/*
 * Send an external call sigp to another cpu and return without waiting
 * for its completion.
 *
 * @cpu: logical number of the target cpu
 * @sig: bit signal to raise on the target
 */
static void smp_ext_bitcall(int cpu, ec_bit_sig sig)
{
	unsigned long *pending;

	/* Set signaling bit in lowcore of target cpu ... */
	pending = (unsigned long *) &lowcore_ptr[cpu]->ext_call_fast;
	set_bit(sig, pending);

	/* ... and kick it, retrying every 10us while the order is busy. */
	while (signal_processor(cpu, sigp_emergency_signal) == sigp_busy)
		udelay(10);
}

325
#ifndef CONFIG_64BIT
L
Linus Torvalds 已提交
326 327 328 329 330 331 332 333 334 335
/*
 * Callback handed to on_each_cpu() by smp_ptlb_all(): calls
 * local_flush_tlb() on the cpu it runs on. The info argument is not used.
 */
void smp_ptlb_callback(void *info)
{
	local_flush_tlb();
}

void smp_ptlb_all(void)
{
336
	on_each_cpu(smp_ptlb_callback, NULL, 0, 1);
L
Linus Torvalds 已提交
337 338
}
EXPORT_SYMBOL(smp_ptlb_all);
339
#endif /* ! CONFIG_64BIT */
L
Linus Torvalds 已提交
340 341 342 343 344 345 346 347

/*
 * this function sends a 'reschedule' IPI to another CPU.
 * it goes straight through and wastes no time serializing
 * anything. Worst case is that we lose a reschedule ...
 */
void smp_send_reschedule(int cpu)
{
348
	smp_ext_bitcall(cpu, ec_schedule);
L
Linus Torvalds 已提交
349 350 351 352 353
}

/*
 * parameter area for the set/clear control bit callbacks
 *
 * One entry per control register 0..15; smp_ctl_bit_callback() computes
 * new = (old & andvals[i]) | orvals[i] for each register.
 */
struct ec_creg_mask_parms {
	unsigned long orvals[16];	/* bits to set */
	unsigned long andvals[16];	/* bits to keep (cleared bits are dropped) */
};
L
Linus Torvalds 已提交
358 359 360 361

/*
 * callback for setting/clearing control bits
 */
362 363
static void smp_ctl_bit_callback(void *info)
{
364
	struct ec_creg_mask_parms *pp = info;
L
Linus Torvalds 已提交
365 366
	unsigned long cregs[16];
	int i;
367

368 369
	__ctl_store(cregs, 0, 15);
	for (i = 0; i <= 15; i++)
L
Linus Torvalds 已提交
370
		cregs[i] = (cregs[i] & pp->andvals[i]) | pp->orvals[i];
371
	__ctl_load(cregs, 0, 15);
L
Linus Torvalds 已提交
372 373 374 375 376
}

/*
 * Set a bit in a control register of all cpus
 */
377 378 379
void smp_ctl_set_bit(int cr, int bit)
{
	struct ec_creg_mask_parms parms;
L
Linus Torvalds 已提交
380

381 382
	memset(&parms.orvals, 0, sizeof(parms.orvals));
	memset(&parms.andvals, 0xff, sizeof(parms.andvals));
L
Linus Torvalds 已提交
383
	parms.orvals[cr] = 1 << bit;
384
	on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
L
Linus Torvalds 已提交
385
}
386
EXPORT_SYMBOL(smp_ctl_set_bit);
L
Linus Torvalds 已提交
387 388 389 390

/*
 * Clear a bit in a control register of all cpus
 */
391 392 393
void smp_ctl_clear_bit(int cr, int bit)
{
	struct ec_creg_mask_parms parms;
L
Linus Torvalds 已提交
394

395 396
	memset(&parms.orvals, 0, sizeof(parms.orvals));
	memset(&parms.andvals, 0xff, sizeof(parms.andvals));
L
Linus Torvalds 已提交
397
	parms.andvals[cr] = ~(1L << bit);
398
	on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
L
Linus Torvalds 已提交
399
}
400
EXPORT_SYMBOL(smp_ctl_clear_bit);
L
Linus Torvalds 已提交
401

M
Michael Holzheu 已提交
402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460
#if defined(CONFIG_ZFCPDUMP) || defined(CONFIG_ZFCPDUMP_MODULE)

/*
 * zfcpdump_prefix_array holds prefix registers for the following scenario:
 * 64 bit zfcpdump kernel and 31 bit kernel which is to be dumped. We have to
 * save its prefix registers, since they get lost, when switching from 31 bit
 * to 64 bit.
 */
unsigned int zfcpdump_prefix_array[NR_CPUS + 1] \
	__attribute__((__section__(".data")));

/*
 * For an FCP dump IPL, collect the register save areas of all cpus other
 * than the boot cpu into zfcpdump_save_areas[1..]. Does nothing for any
 * other IPL type.
 *
 * Every possible 16 bit cpu address is probed through logical cpu slot 1.
 * A cpu that answers is stopped with sigp_stop_and_store_status and its
 * save area is copied into freshly allocated boot memory.
 */
static void __init smp_get_save_areas(void)
{
	unsigned int cpu, cpu_num, rc;
	__u16 boot_cpu_addr;

	if (ipl_info.type != IPL_TYPE_FCP_DUMP)
		return;
	boot_cpu_addr = S390_lowcore.cpu_data.cpu_addr;
	cpu_num = 1;
	for (cpu = 0; cpu <= 65535; cpu++) {
		if ((__u16) cpu == boot_cpu_addr)
			continue;
		/* Temporarily map logical cpu 1 to the address being probed. */
		__cpu_logical_map[1] = (__u16) cpu;
		if (signal_processor(1, sigp_sense) == sigp_not_operational)
			continue;
		if (cpu_num >= NR_CPUS) {
			printk("WARNING: Registers for cpu %u are not "
			       "saved, since dump kernel was compiled with "
			       "NR_CPUS=%i!\n", cpu_num, NR_CPUS);
			continue;
		}
		zfcpdump_save_areas[cpu_num] =
			alloc_bootmem(sizeof(union save_area));
		/* Retry the stop-and-store order for as long as it is busy. */
		while (1) {
			rc = signal_processor(1, sigp_stop_and_store_status);
			if (rc != sigp_busy)
				break;
			cpu_relax();
		}
		memcpy(zfcpdump_save_areas[cpu_num],
		       (void *)(unsigned long) store_prefix() +
		       SAVE_AREA_BASE, SAVE_AREA_SIZE);
#ifdef __s390x__
		/* copy original prefix register */
		zfcpdump_save_areas[cpu_num]->s390x.pref_reg =
			zfcpdump_prefix_array[cpu_num];
#endif
		cpu_num++;
	}
}

union save_area *zfcpdump_save_areas[NR_CPUS + 1];
EXPORT_SYMBOL_GPL(zfcpdump_save_areas);

#else
#define smp_get_save_areas() do { } while (0)
#endif

L
Linus Torvalds 已提交
461 462 463 464
/*
 * Lets check how many CPUs we have.
 */

465
static unsigned int __init smp_count_cpus(void)
L
Linus Torvalds 已提交
466
{
467
	unsigned int cpu, num_cpus;
L
Linus Torvalds 已提交
468 469 470 471 472 473 474 475 476
	__u16 boot_cpu_addr;

	/*
	 * cpu 0 is the boot cpu. See smp_prepare_boot_cpu.
	 */

	boot_cpu_addr = S390_lowcore.cpu_data.cpu_addr;
	current_thread_info()->cpu = 0;
	num_cpus = 1;
477
	for (cpu = 0; cpu <= 65535; cpu++) {
L
Linus Torvalds 已提交
478 479
		if ((__u16) cpu == boot_cpu_addr)
			continue;
480
		__cpu_logical_map[1] = (__u16) cpu;
481
		if (signal_processor(1, sigp_sense) == sigp_not_operational)
L
Linus Torvalds 已提交
482 483 484 485
			continue;
		num_cpus++;
	}

486
	printk("Detected %d CPU's\n", (int) num_cpus);
L
Linus Torvalds 已提交
487
	printk("Boot cpu address %2X\n", boot_cpu_addr);
488 489

	return num_cpus;
L
Linus Torvalds 已提交
490 491 492
}

/*
 *	Activate a secondary processor.
 *
 *	Sets up the cpu and its timers, marks it online, enables interrupts
 *	and enters the idle loop. The cpuvoid argument is not used.
 */
int __devinit start_secondary(void *cpuvoid)
{
	/* Setup the cpu */
	cpu_init();
	preempt_disable();
	/* Enable TOD clock interrupts on the secondary cpu. */
	init_cpu_timer();
#ifdef CONFIG_VIRT_TIMER
	/* Enable cpu timer interrupts on the secondary cpu. */
	init_cpu_vtimer();
#endif
	/* Enable pfault pseudo page faults on this cpu. */
	pfault_init();

	/* Mark this cpu as online; __cpu_up() spins until it sees this. */
	cpu_set(smp_processor_id(), cpu_online_map);
	/* Switch on interrupts */
	local_irq_enable();
	/* Print info about this processor */
	print_cpu_info(&S390_lowcore.cpu_data);
	/* cpu_idle will call schedule for us */
	cpu_idle();
	return 0;
}

/*
 * Fork the idle task for the given cpu and remember it in current_set[].
 * Panics if the fork fails.
 */
static void __init smp_create_idle(unsigned int cpu)
{
	/*
	 *  don't care about the psw and regs settings since we'll never
	 *  reschedule the forked task.
	 */
	struct task_struct *idle = fork_idle(cpu);

	if (IS_ERR(idle))
		panic("failed fork for CPU %u: %li", cpu, PTR_ERR(idle));
	current_set[cpu] = idle;
}

534
static int cpu_stopped(int cpu)
L
Linus Torvalds 已提交
535 536 537 538
{
	__u32 status;

	/* Check for stopped state */
539 540
	if (signal_processor_ps(&status, 0, cpu, sigp_sense) ==
	    sigp_status_stored) {
L
Linus Torvalds 已提交
541 542 543 544 545 546 547 548
		if (status & 0x40)
			return 1;
	}
	return 0;
}

/* Upping and downing of CPUs */

549
int __cpu_up(unsigned int cpu)
L
Linus Torvalds 已提交
550 551
{
	struct task_struct *idle;
552
	struct _lowcore *cpu_lowcore;
L
Linus Torvalds 已提交
553
	struct stack_frame *sf;
554 555
	sigp_ccode ccode;
	int curr_cpu;
L
Linus Torvalds 已提交
556 557 558 559 560 561 562 563 564 565 566 567

	for (curr_cpu = 0; curr_cpu <= 65535; curr_cpu++) {
		__cpu_logical_map[cpu] = (__u16) curr_cpu;
		if (cpu_stopped(cpu))
			break;
	}

	if (!cpu_stopped(cpu))
		return -ENODEV;

	ccode = signal_processor_p((__u32)(unsigned long)(lowcore_ptr[cpu]),
				   cpu, sigp_set_prefix);
568
	if (ccode) {
L
Linus Torvalds 已提交
569 570 571 572 573 574 575
		printk("sigp_set_prefix failed for cpu %d "
		       "with condition code %d\n",
		       (int) cpu, (int) ccode);
		return -EIO;
	}

	idle = current_set[cpu];
576
	cpu_lowcore = lowcore_ptr[cpu];
L
Linus Torvalds 已提交
577
	cpu_lowcore->kernel_stack = (unsigned long)
578
		task_stack_page(idle) + THREAD_SIZE;
L
Linus Torvalds 已提交
579 580 581 582 583 584 585
	sf = (struct stack_frame *) (cpu_lowcore->kernel_stack
				     - sizeof(struct pt_regs)
				     - sizeof(struct stack_frame));
	memset(sf, 0, sizeof(struct stack_frame));
	sf->gprs[9] = (unsigned long) sf;
	cpu_lowcore->save_area[15] = (unsigned long) sf;
	__ctl_store(cpu_lowcore->cregs_save_area[0], 0, 15);
586 587 588
	asm volatile(
		"	stam	0,15,0(%0)"
		: : "a" (&cpu_lowcore->access_regs_save_area) : "memory");
L
Linus Torvalds 已提交
589
	cpu_lowcore->percpu_offset = __per_cpu_offset[cpu];
590 591
	cpu_lowcore->current_task = (unsigned long) idle;
	cpu_lowcore->cpu_data.cpu_nr = cpu;
L
Linus Torvalds 已提交
592
	eieio();
M
Michael Ryan 已提交
593

594
	while (signal_processor(cpu, sigp_restart) == sigp_busy)
M
Michael Ryan 已提交
595
		udelay(10);
L
Linus Torvalds 已提交
596 597 598 599 600 601

	while (!cpu_online(cpu))
		cpu_relax();
	return 0;
}

602
static unsigned int __initdata additional_cpus;
603
static unsigned int __initdata possible_cpus;
604 605 606

/*
 * Fill cpu_possible_map and cpu_present_map.
 *
 * The number of possible cpus is the detected count plus additional_cpus,
 * unless possible_cpus is non-zero, in which case that value is used; both
 * are capped at NR_CPUS. The present cpus are the detected ones, limited to
 * the number of possible cpus.
 */
void __init smp_setup_cpu_possible_map(void)
{
	unsigned int detected, limit, nr;

	smp_get_save_areas();
	detected = smp_count_cpus();

	if (possible_cpus)
		limit = min(possible_cpus, (unsigned int) NR_CPUS);
	else
		limit = min(detected + additional_cpus,
			    (unsigned int) NR_CPUS);

	for (nr = 0; nr < limit; nr++)
		cpu_set(nr, cpu_possible_map);

	detected = min(detected, limit);

	for (nr = 0; nr < detected; nr++)
		cpu_set(nr, cpu_present_map);
}

#ifdef CONFIG_HOTPLUG_CPU

/*
 * Parse the value of the "additional_cpus" early parameter and store it in
 * additional_cpus. Always returns 0.
 */
static int __init setup_additional_cpus(char *s)
{
	additional_cpus = simple_strtoul(s, NULL, 0);
	return 0;
}
early_param("additional_cpus", setup_additional_cpus);

634 635 636 637 638 639 640
/*
 * Parse the value of the "possible_cpus" early parameter and store it in
 * possible_cpus. Always returns 0.
 */
static int __init setup_possible_cpus(char *s)
{
	possible_cpus = simple_strtoul(s, NULL, 0);
	return 0;
}
early_param("possible_cpus", setup_possible_cpus);

641
int __cpu_disable(void)
L
Linus Torvalds 已提交
642
{
643
	struct ec_creg_mask_parms cr_parms;
Z
Zwane Mwaikambo 已提交
644
	int cpu = smp_processor_id();
L
Linus Torvalds 已提交
645

Z
Zwane Mwaikambo 已提交
646
	cpu_clear(cpu, cpu_online_map);
L
Linus Torvalds 已提交
647 648

	/* Disable pfault pseudo page faults on this cpu. */
H
Heiko Carstens 已提交
649
	pfault_fini();
L
Linus Torvalds 已提交
650

651 652
	memset(&cr_parms.orvals, 0, sizeof(cr_parms.orvals));
	memset(&cr_parms.andvals, 0xff, sizeof(cr_parms.andvals));
L
Linus Torvalds 已提交
653

654
	/* disable all external interrupts */
L
Linus Torvalds 已提交
655
	cr_parms.orvals[0] = 0;
656 657
	cr_parms.andvals[0] = ~(1 << 15 | 1 << 14 | 1 << 13 | 1 << 12 |
				1 << 11 | 1 << 10 | 1 <<  6 | 1 <<  4);
L
Linus Torvalds 已提交
658 659
	/* disable all I/O interrupts */
	cr_parms.orvals[6] = 0;
660 661
	cr_parms.andvals[6] = ~(1 << 31 | 1 << 30 | 1 << 29 | 1 << 28 |
				1 << 27 | 1 << 26 | 1 << 25 | 1 << 24);
L
Linus Torvalds 已提交
662 663
	/* disable most machine checks */
	cr_parms.orvals[14] = 0;
664 665
	cr_parms.andvals[14] = ~(1 << 28 | 1 << 27 | 1 << 26 |
				 1 << 25 | 1 << 24);
666

L
Linus Torvalds 已提交
667 668 669 670 671
	smp_ctl_bit_callback(&cr_parms);

	return 0;
}

672
/*
 * Wait for the given cpu to stop running and log that it is down.
 */
void __cpu_die(unsigned int cpu)
{
	/* Wait until target cpu is down */
	while (!smp_cpu_not_running(cpu))
		cpu_relax();
	/* cpu is unsigned, so print it with %u. */
	printk("Processor %u spun down\n", cpu);
}

680
void cpu_die(void)
L
Linus Torvalds 已提交
681 682 683 684
{
	idle_task_exit();
	signal_processor(smp_processor_id(), sigp_stop);
	BUG();
685
	for (;;);
L
Linus Torvalds 已提交
686 687
}

688 689
#endif /* CONFIG_HOTPLUG_CPU */

L
Linus Torvalds 已提交
690 691 692 693 694 695 696 697
/*
 *	Cycle through the processors and setup structures.
 *
 *	Registers the emergency signal handler, allocates a lowcore plus
 *	async and panic stacks for every possible cpu, switches the calling
 *	cpu to its new lowcore and forks idle tasks for all other cpus.
 *	Panics if any allocation fails. max_cpus is not used.
 */
void __init smp_prepare_cpus(unsigned int max_cpus)
{
	struct _lowcore *lc;
	unsigned long stack;
	unsigned int cpu;
	int i;

	/* request the 0x1201 emergency signal external interrupt */
	if (register_external_interrupt(0x1201, do_ext_call_interrupt) != 0)
		panic("Couldn't request external interrupt 0x1201");
	memset(lowcore_ptr, 0, sizeof(lowcore_ptr));
	print_cpu_info(&S390_lowcore.cpu_data);

	/*
	 *  Initialize prefix pages and stacks for all possible cpus
	 */
	for_each_possible_cpu(i) {
		/* Two pages when pointers are 8 bytes wide, one page otherwise. */
		lc = (struct _lowcore *)
			__get_free_pages(GFP_KERNEL | GFP_DMA,
					 sizeof(void*) == 8 ? 1 : 0);
		lowcore_ptr[i] = lc;
		stack = __get_free_pages(GFP_KERNEL, ASYNC_ORDER);
		if (!lc || !stack)
			panic("smp_boot_cpus failed to allocate memory\n");

		/* Start from a copy of the current lowcore. */
		*lc = S390_lowcore;
		lc->async_stack = stack + ASYNC_SIZE;

		stack = __get_free_pages(GFP_KERNEL, 0);
		if (!stack)
			panic("smp_boot_cpus failed to allocate memory\n");
		lc->panic_stack = stack + PAGE_SIZE;
#ifndef CONFIG_64BIT
		if (MACHINE_HAS_IEEE) {
			lc->extended_save_area_addr =
				(__u32) __get_free_pages(GFP_KERNEL, 0);
			if (!lc->extended_save_area_addr)
				panic("smp_boot_cpus failed to "
				      "allocate memory\n");
		}
#endif
	}
#ifndef CONFIG_64BIT
	if (MACHINE_HAS_IEEE)
		ctl_set_bit(14, 29); /* enable extended save area */
#endif
	/* Switch the calling cpu over to its freshly allocated lowcore. */
	set_prefix((u32)(unsigned long) lowcore_ptr[smp_processor_id()]);

	for_each_possible_cpu(cpu) {
		if (cpu != smp_processor_id())
			smp_create_idle(cpu);
	}
}

/*
 * Register the boot cpu as logical cpu 0: mark it online, set its per-cpu
 * offset in the lowcore and record the current task in current_set[0].
 */
void __devinit smp_prepare_boot_cpu(void)
{
	/* The boot cpu must be logical cpu 0 (see smp_count_cpus). */
	BUG_ON(smp_processor_id() != 0);

	cpu_set(0, cpu_online_map);
	S390_lowcore.percpu_offset = __per_cpu_offset[0];
	current_set[0] = current;
}

void smp_cpus_done(unsigned int max_cpus)
{
755
	cpu_present_map = cpu_possible_map;
L
Linus Torvalds 已提交
756 757 758 759 760 761 762 763 764 765
}

/*
 * the frequency of the profiling timer can be changed
 * by writing a multiplier value into /proc/profile.
 *
 * usually you want to run this on all CPUs ;)
 */
int setup_profiling_timer(unsigned int multiplier)
{
	/* The multiplier is ignored here; the function only returns 0. */
	return 0;
}

static DEFINE_PER_CPU(struct cpu, cpu_devices);

771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791
/*
 * sysfs show routine for the "capability" attribute: prints the value
 * obtained from get_cpu_capability() as an unsigned decimal followed by a
 * newline. Returns the sprintf() result, or the error code from
 * get_cpu_capability() if that call fails.
 */
static ssize_t show_capability(struct sys_device *dev, char *buf)
{
	unsigned int capability;
	int rc = get_cpu_capability(&capability);

	return rc ? rc : sprintf(buf, "%u\n", capability);
}
static SYSDEV_ATTR(capability, 0444, show_capability, NULL);

/*
 * cpu hotplug notifier: create the "capability" sysfs file when a cpu
 * comes online and remove it when the cpu is dead. Returns NOTIFY_BAD if
 * the file cannot be created, NOTIFY_OK in all other cases.
 */
static int __cpuinit smp_cpu_notify(struct notifier_block *self,
				    unsigned long action, void *hcpu)
{
	unsigned int cpu = (unsigned int)(long)hcpu;
	struct sys_device *s = &per_cpu(cpu_devices, cpu).sysdev;

	if (action == CPU_ONLINE || action == CPU_ONLINE_FROZEN) {
		if (sysdev_create_file(s, &attr_capability))
			return NOTIFY_BAD;
	} else if (action == CPU_DEAD || action == CPU_DEAD_FROZEN) {
		sysdev_remove_file(s, &attr_capability);
	}
	return NOTIFY_OK;
}

/* Notifier block registered by topology_init() for cpu hotplug events. */
static struct notifier_block __cpuinitdata smp_cpu_nb = {
	.notifier_call = smp_cpu_notify,
};

L
Linus Torvalds 已提交
808 809 810
/*
 * Register the hotplug notifier and a cpu device for every possible cpu.
 * Cpus that are already online also get their "capability" sysfs file
 * here; for the others smp_cpu_notify() creates it when they come online.
 * Always returns 0.
 */
static int __init topology_init(void)
{
	int cpu;

	register_cpu_notifier(&smp_cpu_nb);

	for_each_possible_cpu(cpu) {
		struct cpu *c = &per_cpu(cpu_devices, cpu);

		c->hotpluggable = 1;
		/* No sysfs file for a device that failed to register. */
		if (register_cpu(c, cpu))
			continue;
		if (!cpu_online(cpu))
			continue;
		sysdev_create_file(&c->sysdev, &attr_capability);
	}
	return 0;
}
subsys_initcall(topology_init);