smp.c 19.9 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3
/*
 *  arch/s390/kernel/smp.c
 *
4
 *    Copyright IBM Corp. 1999,2007
L
Linus Torvalds 已提交
5
 *    Author(s): Denis Joseph Barrow (djbarrow@de.ibm.com,barrow_dj@yahoo.com),
6 7
 *		 Martin Schwidefsky (schwidefsky@de.ibm.com)
 *		 Heiko Carstens (heiko.carstens@de.ibm.com)
L
Linus Torvalds 已提交
8
 *
9
 *  based on other smp stuff by
L
Linus Torvalds 已提交
10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25
 *    (c) 1995 Alan Cox, CymruNET Ltd  <alan@cymru.net>
 *    (c) 1998 Ingo Molnar
 *
 * We work with logical cpu numbering everywhere we can. The only
 * functions using the real cpu address (got from STAP) are the sigp
 * functions. For all other functions we use the identity mapping.
 * That means that cpu_number_map[i] == i for every cpu. cpu_number_map is
 * used e.g. to find the idle task belonging to a logical cpu. Every array
 * in the kernel is sorted by the logical cpu number and not by the physical
 * one which is causing all the confusion with __cpu_logical_map and
 * cpu_number_map in other architectures.
 */

#include <linux/module.h>
#include <linux/init.h>
#include <linux/mm.h>
A
Alexey Dobriyan 已提交
26
#include <linux/err.h>
L
Linus Torvalds 已提交
27 28 29 30 31 32
#include <linux/spinlock.h>
#include <linux/kernel_stat.h>
#include <linux/delay.h>
#include <linux/cache.h>
#include <linux/interrupt.h>
#include <linux/cpu.h>
33
#include <linux/timex.h>
M
Michael Holzheu 已提交
34
#include <linux/bootmem.h>
M
Michael Holzheu 已提交
35
#include <asm/ipl.h>
36
#include <asm/setup.h>
L
Linus Torvalds 已提交
37 38 39 40 41 42
#include <asm/sigp.h>
#include <asm/pgalloc.h>
#include <asm/irq.h>
#include <asm/s390_ext.h>
#include <asm/cpcmd.h>
#include <asm/tlbflush.h>
43
#include <asm/timer.h>
M
Michael Holzheu 已提交
44
#include <asm/lowcore.h>
45
#include <asm/cpu.h>
L
Linus Torvalds 已提交
46 47 48 49 50

/*
 * An array with a pointer the lowcore of every CPU.
 */
struct _lowcore *lowcore_ptr[NR_CPUS];
51
EXPORT_SYMBOL(lowcore_ptr);
L
Linus Torvalds 已提交
52

53
cpumask_t cpu_online_map = CPU_MASK_NONE;
54 55
EXPORT_SYMBOL(cpu_online_map);

56
cpumask_t cpu_possible_map = CPU_MASK_NONE;
57
EXPORT_SYMBOL(cpu_possible_map);
L
Linus Torvalds 已提交
58 59 60 61 62 63

static struct task_struct *current_set[NR_CPUS];

static void smp_ext_bitcall(int, ec_bit_sig);

/*
J
Jan Glauber 已提交
64 65
 * Structure and data for __smp_call_function_map(). This is designed to
 * minimise static memory requirements. It also looks cleaner.
L
Linus Torvalds 已提交
66 67 68 69 70 71
 */
static DEFINE_SPINLOCK(call_lock);

struct call_data_struct {
	void (*func) (void *info);
	void *info;
J
Jan Glauber 已提交
72 73
	cpumask_t started;
	cpumask_t finished;
L
Linus Torvalds 已提交
74 75 76
	int wait;
};

77
static struct call_data_struct *call_data;
L
Linus Torvalds 已提交
78 79 80 81 82 83 84 85 86 87

/*
 * 'Call function' interrupt callback
 *
 * The request is copied out of call_data before this cpu marks itself in
 * the 'started' mask: the sender keeps the request on its stack and, when
 * it does not wait for completion, stops looking at it once every target
 * has set its 'started' bit.
 */
static void do_call_function(void)
{
	void (*func) (void *info) = call_data->func;
	void *info = call_data->info;
	int wait = call_data->wait;

	cpu_set(smp_processor_id(), call_data->started);
	(*func)(info);
	if (wait)
		cpu_set(smp_processor_id(), call_data->finished);
}

J
Jan Glauber 已提交
94 95
/*
 * __smp_call_function_map:
 * @func: the function to run on the selected cpus
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait until function has completed on the remote cpus
 * @map: the cpus to run @func on; may contain the calling cpu
 *
 * Remote cpus in @map that are online are kicked with an ec_call_function
 * external call and find the request through call_data. If the calling cpu
 * is part of @map it runs @func itself, with interrupts disabled, after the
 * remote cpus have been handled. The callers in this file invoke this with
 * preemption disabled.
 */
static void __smp_call_function_map(void (*func) (void *info), void *info,
				    int nonatomic, int wait, cpumask_t map)
{
	struct call_data_struct data;
	int cpu, local = 0;

	/*
	 * Can deadlock when interrupts are disabled or if in wrong context.
	 */
	WARN_ON(irqs_disabled() || in_irq());

	/*
	 * Check for local function call. We have to have the same call order
	 * as in on_each_cpu() because of machine_restart_smp().
	 */
	if (cpu_isset(smp_processor_id(), map)) {
		local = 1;
		cpu_clear(smp_processor_id(), map);
	}

	/* Only online remote cpus can answer the external call. */
	cpus_and(map, map, cpu_online_map);
	if (cpus_empty(map))
		goto out;

	data.func = func;
	data.info = info;
	data.started = CPU_MASK_NONE;
	data.wait = wait;
	if (wait)
		data.finished = CPU_MASK_NONE;

	/* call_lock serializes senders: there is only one call_data slot. */
	spin_lock(&call_lock);
	call_data = &data;

	for_each_cpu_mask(cpu, map)
		smp_ext_bitcall(cpu, ec_call_function);

	/* Wait for response */
	while (!cpus_equal(map, data.started))
		cpu_relax();
	if (wait)
		while (!cpus_equal(map, data.finished))
			cpu_relax();
	spin_unlock(&call_lock);
out:
	if (local) {
		local_irq_disable();
		func(info);
		local_irq_enable();
	}
}

/*
J
Jan Glauber 已提交
147 148 149 150 151
 * smp_call_function:
 * @func: the function to run; this must be fast and non-blocking
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait (atomically) until function has completed on other CPUs
L
Linus Torvalds 已提交
152
 *
J
Jan Glauber 已提交
153
 * Run a function on all other CPUs.
L
Linus Torvalds 已提交
154
 *
155 156
 * You must not call this function with disabled interrupts, from a
 * hardware interrupt handler or from a bottom half.
L
Linus Torvalds 已提交
157
 */
J
Jan Glauber 已提交
158 159
int smp_call_function(void (*func) (void *info), void *info, int nonatomic,
		      int wait)
L
Linus Torvalds 已提交
160
{
J
Jan Glauber 已提交
161
	cpumask_t map;
L
Linus Torvalds 已提交
162

163
	preempt_disable();
J
Jan Glauber 已提交
164 165 166
	map = cpu_online_map;
	cpu_clear(smp_processor_id(), map);
	__smp_call_function_map(func, info, nonatomic, wait, map);
167
	preempt_enable();
J
Jan Glauber 已提交
168 169 170
	return 0;
}
EXPORT_SYMBOL(smp_call_function);
L
Linus Torvalds 已提交
171

J
Jan Glauber 已提交
172
/*
 * smp_call_function_single:
 * @cpu: the CPU where func should run
 * @func: the function to run; this must be fast and non-blocking
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait (atomically) until function has completed on @cpu
 *
 * Run a function on one processor. Always returns 0.
 *
 * You must not call this function with disabled interrupts, from a
 * hardware interrupt handler or from a bottom half.
 */
int smp_call_function_single(int cpu, void (*func) (void *info), void *info,
			     int nonatomic, int wait)
{
	preempt_disable();
	__smp_call_function_map(func, info, nonatomic, wait,
				cpumask_of_cpu(cpu));
	preempt_enable();
	return 0;
}
EXPORT_SYMBOL(smp_call_function_single);
L
Linus Torvalds 已提交
195

196
void smp_send_stop(void)
L
Linus Torvalds 已提交
197
{
198
	int cpu, rc;
L
Linus Torvalds 已提交
199

200 201
	/* Disable all interrupts/machine checks */
	__load_psw_mask(psw_kernel_bits & ~PSW_MASK_MCHECK);
L
Linus Torvalds 已提交
202

203 204
	/* write magic number to zero page (absolute 0) */
	lowcore_ptr[smp_processor_id()]->panic_magic = __PANIC_MAGIC;
L
Linus Torvalds 已提交
205

206
	/* stop all processors */
L
Linus Torvalds 已提交
207 208 209 210
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		do {
211
			rc = signal_processor(cpu, sigp_stop);
212
		} while (rc == sigp_busy);
L
Linus Torvalds 已提交
213

214
		while (!smp_cpu_not_running(cpu))
H
Heiko Carstens 已提交
215 216 217 218
			cpu_relax();
	}
}

L
Linus Torvalds 已提交
219 220 221
/*
 * Reboot, halt and power_off routines for SMP.
 */

/* Stop the other cpus, then re-IPL through do_reipl(). */
void machine_restart_smp(char *__unused)
{
	smp_send_stop();
	do_reipl();
}

/*
 * Halt the machine: stop the other cpus, issue the configured vmhalt_cmd
 * when running under VM and a command is set, then stop this cpu with
 * sigp_stop_and_store_status. Does not return.
 */
void machine_halt_smp(void)
{
	smp_send_stop();
	if (MACHINE_IS_VM && strlen(vmhalt_cmd) > 0)
		__cpcmd(vmhalt_cmd, NULL, 0, NULL);
	signal_processor(smp_processor_id(), sigp_stop_and_store_status);
	for (;;);
}

/*
 * Power off the machine: stop the other cpus, issue the configured
 * vmpoff_cmd when running under VM and a command is set, then stop this
 * cpu with sigp_stop_and_store_status. Does not return.
 */
void machine_power_off_smp(void)
{
	smp_send_stop();
	if (MACHINE_IS_VM && strlen(vmpoff_cmd) > 0)
		__cpcmd(vmpoff_cmd, NULL, 0, NULL);
	signal_processor(smp_processor_id(), sigp_stop_and_store_status);
	for (;;);
}

/*
 * This is the main routine where commands issued by other
 * cpus are handled.
 */

251
static void do_ext_call_interrupt(__u16 code)
L
Linus Torvalds 已提交
252
{
253
	unsigned long bits;
L
Linus Torvalds 已提交
254

255 256 257 258 259 260
	/*
	 * handle bit signal external calls
	 *
	 * For the ec_schedule signal we have to do nothing. All the work
	 * is done automatically when we return from the interrupt.
	 */
L
Linus Torvalds 已提交
261 262
	bits = xchg(&S390_lowcore.ext_call_fast, 0);

263
	if (test_bit(ec_call_function, &bits))
L
Linus Torvalds 已提交
264 265 266 267 268 269 270 271 272
		do_call_function();
}

/*
 * Send an external call sigp to another cpu and return without waiting
 * for its completion.
 *
 * @cpu: logical number of the target cpu
 * @sig: request bit to set in the target's ext_call_fast word
 */
static void smp_ext_bitcall(int cpu, ec_bit_sig sig)
{
	/*
	 * Set signaling bit in lowcore of target cpu and kick it
	 */
	set_bit(sig, (unsigned long *) &lowcore_ptr[cpu]->ext_call_fast);
	/* Retry with a short delay for as long as the target reports busy. */
	while (signal_processor(cpu, sigp_emergency_signal) == sigp_busy)
		udelay(10);
}

281
#ifndef CONFIG_64BIT
L
Linus Torvalds 已提交
282 283 284 285 286
/*
 * this function sends a 'purge tlb' signal to another CPU.
 */
void smp_ptlb_callback(void *info)
{
M
Martin Schwidefsky 已提交
287
	__tlb_flush_local();
L
Linus Torvalds 已提交
288 289 290 291
}

void smp_ptlb_all(void)
{
292
	on_each_cpu(smp_ptlb_callback, NULL, 0, 1);
L
Linus Torvalds 已提交
293 294
}
EXPORT_SYMBOL(smp_ptlb_all);
295
#endif /* ! CONFIG_64BIT */
L
Linus Torvalds 已提交
296 297 298 299 300 301 302 303

/*
 * this function sends a 'reschedule' IPI to another CPU.
 * it goes straight through and wastes no time serializing
 * anything. Worst case is that we lose a reschedule ...
 */
void smp_send_reschedule(int cpu)
{
304
	smp_ext_bitcall(cpu, ec_schedule);
L
Linus Torvalds 已提交
305 306 307 308 309
}

/*
 * parameter area for the set/clear control bit callbacks
 *
 * smp_ctl_bit_callback() computes, for each control register i,
 * (value & andvals[i]) | orvals[i].
 */
struct ec_creg_mask_parms {
	unsigned long orvals[16];
	unsigned long andvals[16];
};
L
Linus Torvalds 已提交
314 315 316 317

/*
 * callback for setting/clearing control bits
 */
318 319
static void smp_ctl_bit_callback(void *info)
{
320
	struct ec_creg_mask_parms *pp = info;
L
Linus Torvalds 已提交
321 322
	unsigned long cregs[16];
	int i;
323

324 325
	__ctl_store(cregs, 0, 15);
	for (i = 0; i <= 15; i++)
L
Linus Torvalds 已提交
326
		cregs[i] = (cregs[i] & pp->andvals[i]) | pp->orvals[i];
327
	__ctl_load(cregs, 0, 15);
L
Linus Torvalds 已提交
328 329 330 331 332
}

/*
 * Set a bit in a control register of all cpus
 */
333 334 335
void smp_ctl_set_bit(int cr, int bit)
{
	struct ec_creg_mask_parms parms;
L
Linus Torvalds 已提交
336

337 338
	memset(&parms.orvals, 0, sizeof(parms.orvals));
	memset(&parms.andvals, 0xff, sizeof(parms.andvals));
L
Linus Torvalds 已提交
339
	parms.orvals[cr] = 1 << bit;
340
	on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
L
Linus Torvalds 已提交
341
}
342
EXPORT_SYMBOL(smp_ctl_set_bit);
L
Linus Torvalds 已提交
343 344 345 346

/*
 * Clear a bit in a control register of all cpus
 */
347 348 349
void smp_ctl_clear_bit(int cr, int bit)
{
	struct ec_creg_mask_parms parms;
L
Linus Torvalds 已提交
350

351 352
	memset(&parms.orvals, 0, sizeof(parms.orvals));
	memset(&parms.andvals, 0xff, sizeof(parms.andvals));
L
Linus Torvalds 已提交
353
	parms.andvals[cr] = ~(1L << bit);
354
	on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
L
Linus Torvalds 已提交
355
}
356
EXPORT_SYMBOL(smp_ctl_clear_bit);
L
Linus Torvalds 已提交
357

M
Michael Holzheu 已提交
358 359 360 361 362 363 364 365 366 367 368
#if defined(CONFIG_ZFCPDUMP) || defined(CONFIG_ZFCPDUMP_MODULE)

/*
 * zfcpdump_prefix_array holds prefix registers for the following scenario:
 * 64 bit zfcpdump kernel and 31 bit kernel which is to be dumped. We have to
 * save its prefix registers, since they get lost, when switching from 31 bit
 * to 64 bit.
 */
unsigned int zfcpdump_prefix_array[NR_CPUS + 1] \
	__attribute__((__section__(".data")));

/*
 * Save the register status of a cpu for zfcpdump.
 *
 * @cpu: index under which the save area is stored
 * @phy_cpu: cpu address to collect the status from
 *
 * Does nothing unless the system was IPLed as an FCP dump. Logical cpu 1 is
 * temporarily mapped to @phy_cpu so that sigp_stop_and_store_status can be
 * sent to it; the stored status is then copied from this cpu's prefix area
 * into a bootmem-allocated save area.
 */
static void __init smp_get_save_area(unsigned int cpu, unsigned int phy_cpu)
{
	if (ipl_info.type != IPL_TYPE_FCP_DUMP)
		return;
	if (cpu >= NR_CPUS) {
		printk(KERN_WARNING "Registers for cpu %i not saved since dump "
		       "kernel was compiled with NR_CPUS=%i\n", cpu, NR_CPUS);
		return;
	}
	zfcpdump_save_areas[cpu] = alloc_bootmem(sizeof(union save_area));
	__cpu_logical_map[1] = (__u16) phy_cpu;
	while (signal_processor(1, sigp_stop_and_store_status) == sigp_busy)
		cpu_relax();
	memcpy(zfcpdump_save_areas[cpu],
	       (void *)(unsigned long) store_prefix() + SAVE_AREA_BASE,
	       SAVE_AREA_SIZE);
#ifdef CONFIG_64BIT
	/* copy original prefix register */
	zfcpdump_save_areas[cpu]->s390x.pref_reg = zfcpdump_prefix_array[cpu];
#endif
}

union save_area *zfcpdump_save_areas[NR_CPUS + 1];
EXPORT_SYMBOL_GPL(zfcpdump_save_areas);

#else

/* Without zfcpdump support there is nothing to save. */
static inline void smp_get_save_area(unsigned int cpu, unsigned int phy_cpu) { }

#endif /* CONFIG_ZFCPDUMP || CONFIG_ZFCPDUMP_MODULE */
M
Michael Holzheu 已提交
399

L
Linus Torvalds 已提交
400 401 402
/*
 * Lets check how many CPUs we have.
 */
403
static unsigned int __init smp_count_cpus(void)
L
Linus Torvalds 已提交
404
{
405
	unsigned int cpu, num_cpus;
L
Linus Torvalds 已提交
406 407 408 409 410 411 412 413
	__u16 boot_cpu_addr;

	/*
	 * cpu 0 is the boot cpu. See smp_prepare_boot_cpu.
	 */
	boot_cpu_addr = S390_lowcore.cpu_data.cpu_addr;
	current_thread_info()->cpu = 0;
	num_cpus = 1;
414
	for (cpu = 0; cpu <= 65535; cpu++) {
L
Linus Torvalds 已提交
415 416
		if ((__u16) cpu == boot_cpu_addr)
			continue;
417
		__cpu_logical_map[1] = (__u16) cpu;
418
		if (signal_processor(1, sigp_sense) == sigp_not_operational)
L
Linus Torvalds 已提交
419
			continue;
420
		smp_get_save_area(num_cpus, cpu);
L
Linus Torvalds 已提交
421 422
		num_cpus++;
	}
423
	printk("Detected %d CPU's\n", (int) num_cpus);
L
Linus Torvalds 已提交
424
	printk("Boot cpu address %2X\n", boot_cpu_addr);
425
	return num_cpus;
L
Linus Torvalds 已提交
426 427 428
}

/*
429
 *	Activate a secondary processor.
L
Linus Torvalds 已提交
430
 */
H
Heiko Carstens 已提交
431
int __cpuinit start_secondary(void *cpuvoid)
L
Linus Torvalds 已提交
432
{
433 434
	/* Setup the cpu */
	cpu_init();
435
	preempt_disable();
M
Martin Schwidefsky 已提交
436
	/* Enable TOD clock interrupts on the secondary cpu. */
437
	init_cpu_timer();
L
Linus Torvalds 已提交
438
#ifdef CONFIG_VIRT_TIMER
M
Martin Schwidefsky 已提交
439
	/* Enable cpu timer interrupts on the secondary cpu. */
440
	init_cpu_vtimer();
L
Linus Torvalds 已提交
441 442
#endif
	/* Enable pfault pseudo page faults on this cpu. */
H
Heiko Carstens 已提交
443 444
	pfault_init();

L
Linus Torvalds 已提交
445 446 447 448
	/* Mark this cpu as online */
	cpu_set(smp_processor_id(), cpu_online_map);
	/* Switch on interrupts */
	local_irq_enable();
449 450 451 452 453
	/* Print info about this processor */
	print_cpu_info(&S390_lowcore.cpu_data);
	/* cpu_idle will call schedule for us */
	cpu_idle();
	return 0;
L
Linus Torvalds 已提交
454 455
}

456 457
DEFINE_PER_CPU(struct s390_idle_data, s390_idle);

L
Linus Torvalds 已提交
458 459 460 461 462 463 464 465 466 467 468 469
static void __init smp_create_idle(unsigned int cpu)
{
	struct task_struct *p;

	/*
	 *  don't care about the psw and regs settings since we'll never
	 *  reschedule the forked task.
	 */
	p = fork_idle(cpu);
	if (IS_ERR(p))
		panic("failed fork for CPU %u: %li", cpu, PTR_ERR(p));
	current_set[cpu] = p;
470
	spin_lock_init(&(&per_cpu(s390_idle, cpu))->lock);
L
Linus Torvalds 已提交
471 472
}

473
static int cpu_stopped(int cpu)
L
Linus Torvalds 已提交
474 475 476 477
{
	__u32 status;

	/* Check for stopped state */
478 479
	if (signal_processor_ps(&status, 0, cpu, sigp_sense) ==
	    sigp_status_stored) {
L
Linus Torvalds 已提交
480 481 482 483 484 485 486 487
		if (status & 0x40)
			return 1;
	}
	return 0;
}

/* Upping and downing of CPUs */

488
int __cpu_up(unsigned int cpu)
L
Linus Torvalds 已提交
489 490
{
	struct task_struct *idle;
491
	struct _lowcore *cpu_lowcore;
L
Linus Torvalds 已提交
492
	struct stack_frame *sf;
493 494
	sigp_ccode ccode;
	int curr_cpu;
L
Linus Torvalds 已提交
495 496 497 498 499 500 501 502 503 504 505 506

	for (curr_cpu = 0; curr_cpu <= 65535; curr_cpu++) {
		__cpu_logical_map[cpu] = (__u16) curr_cpu;
		if (cpu_stopped(cpu))
			break;
	}

	if (!cpu_stopped(cpu))
		return -ENODEV;

	ccode = signal_processor_p((__u32)(unsigned long)(lowcore_ptr[cpu]),
				   cpu, sigp_set_prefix);
507
	if (ccode) {
L
Linus Torvalds 已提交
508 509 510 511 512 513 514
		printk("sigp_set_prefix failed for cpu %d "
		       "with condition code %d\n",
		       (int) cpu, (int) ccode);
		return -EIO;
	}

	idle = current_set[cpu];
515
	cpu_lowcore = lowcore_ptr[cpu];
L
Linus Torvalds 已提交
516
	cpu_lowcore->kernel_stack = (unsigned long)
517
		task_stack_page(idle) + THREAD_SIZE;
L
Linus Torvalds 已提交
518 519 520 521 522 523 524
	sf = (struct stack_frame *) (cpu_lowcore->kernel_stack
				     - sizeof(struct pt_regs)
				     - sizeof(struct stack_frame));
	memset(sf, 0, sizeof(struct stack_frame));
	sf->gprs[9] = (unsigned long) sf;
	cpu_lowcore->save_area[15] = (unsigned long) sf;
	__ctl_store(cpu_lowcore->cregs_save_area[0], 0, 15);
525 526 527
	asm volatile(
		"	stam	0,15,0(%0)"
		: : "a" (&cpu_lowcore->access_regs_save_area) : "memory");
L
Linus Torvalds 已提交
528
	cpu_lowcore->percpu_offset = __per_cpu_offset[cpu];
529 530
	cpu_lowcore->current_task = (unsigned long) idle;
	cpu_lowcore->cpu_data.cpu_nr = cpu;
L
Linus Torvalds 已提交
531
	eieio();
M
Michael Ryan 已提交
532

533
	while (signal_processor(cpu, sigp_restart) == sigp_busy)
M
Michael Ryan 已提交
534
		udelay(10);
L
Linus Torvalds 已提交
535 536 537 538 539 540

	while (!cpu_online(cpu))
		cpu_relax();
	return 0;
}

541
static unsigned int __initdata additional_cpus;
542
static unsigned int __initdata possible_cpus;
543 544 545

void __init smp_setup_cpu_possible_map(void)
{
546
	unsigned int phy_cpus, pos_cpus, cpu;
547

548 549
	phy_cpus = smp_count_cpus();
	pos_cpus = min(phy_cpus + additional_cpus, (unsigned int) NR_CPUS);
550

551
	if (possible_cpus)
552
		pos_cpus = min(possible_cpus, (unsigned int) NR_CPUS);
553

554
	for (cpu = 0; cpu < pos_cpus; cpu++)
555 556
		cpu_set(cpu, cpu_possible_map);

557 558 559 560
	phy_cpus = min(phy_cpus, pos_cpus);

	for (cpu = 0; cpu < phy_cpus; cpu++)
		cpu_set(cpu, cpu_present_map);
561 562 563 564 565 566 567 568 569 570 571
}

#ifdef CONFIG_HOTPLUG_CPU

/*
 * Parse the "additional_cpus=" kernel parameter into additional_cpus.
 * The base is auto-detected by simple_strtoul(); always returns 0.
 */
static int __init setup_additional_cpus(char *s)
{
	unsigned long requested;

	requested = simple_strtoul(s, NULL, 0);
	additional_cpus = requested;

	return 0;
}
early_param("additional_cpus", setup_additional_cpus);

572 573 574 575 576 577 578
/*
 * Parse the "possible_cpus=" kernel parameter into possible_cpus.
 * The base is auto-detected by simple_strtoul(); always returns 0.
 */
static int __init setup_possible_cpus(char *s)
{
	unsigned long requested;

	requested = simple_strtoul(s, NULL, 0);
	possible_cpus = requested;

	return 0;
}
early_param("possible_cpus", setup_possible_cpus);

579
int __cpu_disable(void)
L
Linus Torvalds 已提交
580
{
581
	struct ec_creg_mask_parms cr_parms;
Z
Zwane Mwaikambo 已提交
582
	int cpu = smp_processor_id();
L
Linus Torvalds 已提交
583

Z
Zwane Mwaikambo 已提交
584
	cpu_clear(cpu, cpu_online_map);
L
Linus Torvalds 已提交
585 586

	/* Disable pfault pseudo page faults on this cpu. */
H
Heiko Carstens 已提交
587
	pfault_fini();
L
Linus Torvalds 已提交
588

589 590
	memset(&cr_parms.orvals, 0, sizeof(cr_parms.orvals));
	memset(&cr_parms.andvals, 0xff, sizeof(cr_parms.andvals));
L
Linus Torvalds 已提交
591

592
	/* disable all external interrupts */
L
Linus Torvalds 已提交
593
	cr_parms.orvals[0] = 0;
594 595
	cr_parms.andvals[0] = ~(1 << 15 | 1 << 14 | 1 << 13 | 1 << 12 |
				1 << 11 | 1 << 10 | 1 <<  6 | 1 <<  4);
L
Linus Torvalds 已提交
596 597
	/* disable all I/O interrupts */
	cr_parms.orvals[6] = 0;
598 599
	cr_parms.andvals[6] = ~(1 << 31 | 1 << 30 | 1 << 29 | 1 << 28 |
				1 << 27 | 1 << 26 | 1 << 25 | 1 << 24);
L
Linus Torvalds 已提交
600 601
	/* disable most machine checks */
	cr_parms.orvals[14] = 0;
602 603
	cr_parms.andvals[14] = ~(1 << 28 | 1 << 27 | 1 << 26 |
				 1 << 25 | 1 << 24);
604

L
Linus Torvalds 已提交
605 606 607 608 609
	smp_ctl_bit_callback(&cr_parms);

	return 0;
}

610
/*
 * Spin until smp_cpu_not_running() reports @cpu as down, then log it.
 */
void __cpu_die(unsigned int cpu)
{
	/* Wait until target cpu is down */
	while (!smp_cpu_not_running(cpu))
		cpu_relax();
	printk("Processor %d spun down\n", cpu);
}

618
void cpu_die(void)
L
Linus Torvalds 已提交
619 620 621 622
{
	idle_task_exit();
	signal_processor(smp_processor_id(), sigp_stop);
	BUG();
623
	for (;;);
L
Linus Torvalds 已提交
624 625
}

626 627
#endif /* CONFIG_HOTPLUG_CPU */

L
Linus Torvalds 已提交
628 629 630 631 632 633 634 635
/*
 *	Cycle through the processors and setup structures.
 *
 *	Registers the emergency signal handler, allocates a lowcore, an async
 *	stack and a panic stack for every possible cpu, switches the calling
 *	cpu to its own lowcore and creates idle tasks for all other possible
 *	cpus. Panics if an allocation or the interrupt registration fails.
 *	@max_cpus is not used.
 */

void __init smp_prepare_cpus(unsigned int max_cpus)
{
	unsigned long stack;
	unsigned int cpu;
	int i;

	/* request the 0x1201 emergency signal external interrupt */
	if (register_external_interrupt(0x1201, do_ext_call_interrupt) != 0)
		panic("Couldn't request external interrupt 0x1201");
	memset(lowcore_ptr, 0, sizeof(lowcore_ptr));
	print_cpu_info(&S390_lowcore.cpu_data);

	/*
	 *  Initialize prefix pages and stacks for all possible cpus
	 */
	for_each_possible_cpu(i) {
		/* Order 1 (two pages) when pointers are 8 bytes, else one. */
		lowcore_ptr[i] = (struct _lowcore *)
			__get_free_pages(GFP_KERNEL | GFP_DMA,
					 sizeof(void*) == 8 ? 1 : 0);
		stack = __get_free_pages(GFP_KERNEL, ASYNC_ORDER);
		if (!lowcore_ptr[i] || !stack)
			panic("smp_boot_cpus failed to allocate memory\n");

		/* Start every lowcore as a copy of the current one. */
		*(lowcore_ptr[i]) = S390_lowcore;
		lowcore_ptr[i]->async_stack = stack + ASYNC_SIZE;
		stack = __get_free_pages(GFP_KERNEL, 0);
		if (!stack)
			panic("smp_boot_cpus failed to allocate memory\n");
		lowcore_ptr[i]->panic_stack = stack + PAGE_SIZE;
#ifndef CONFIG_64BIT
		if (MACHINE_HAS_IEEE) {
			lowcore_ptr[i]->extended_save_area_addr =
				(__u32) __get_free_pages(GFP_KERNEL, 0);
			if (!lowcore_ptr[i]->extended_save_area_addr)
				panic("smp_boot_cpus failed to "
				      "allocate memory\n");
		}
#endif
	}
#ifndef CONFIG_64BIT
	if (MACHINE_HAS_IEEE)
		ctl_set_bit(14, 29); /* enable extended save area */
#endif
	set_prefix((u32)(unsigned long) lowcore_ptr[smp_processor_id()]);

	for_each_possible_cpu(cpu)
		if (cpu != smp_processor_id())
			smp_create_idle(cpu);
}

H
Heiko Carstens 已提交
682
/*
 * Set up the boot cpu, which must be logical cpu 0: mark it online, set
 * its per-cpu offset, record the current task for it and initialize the
 * lock of its idle statistics.
 */
void __init smp_prepare_boot_cpu(void)
{
	BUG_ON(smp_processor_id() != 0);

	cpu_set(0, cpu_online_map);
	S390_lowcore.percpu_offset = __per_cpu_offset[0];
	current_set[0] = current;
	spin_lock_init(&(&__get_cpu_var(s390_idle))->lock);
}

H
Heiko Carstens 已提交
692
/*
 * Called once the cpus are up: from here on every possible cpu is treated
 * as present. @max_cpus is not used.
 */
void __init smp_cpus_done(unsigned int max_cpus)
{
	cpu_present_map = cpu_possible_map;
}

/*
 * the frequency of the profiling timer can be changed
 * by writing a multiplier value into /proc/profile.
 *
 * usually you want to run this on all CPUs ;)
 *
 * This implementation ignores @multiplier and always returns 0.
 */
int setup_profiling_timer(unsigned int multiplier)
{
	return 0;
}

static DEFINE_PER_CPU(struct cpu, cpu_devices);

710 711 712 713 714 715 716 717 718 719 720 721
static ssize_t show_capability(struct sys_device *dev, char *buf)
{
	unsigned int capability;
	int rc;

	rc = get_cpu_capability(&capability);
	if (rc)
		return rc;
	return sprintf(buf, "%u\n", capability);
}
static SYSDEV_ATTR(capability, 0444, show_capability, NULL);

722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748
static ssize_t show_idle_count(struct sys_device *dev, char *buf)
{
	struct s390_idle_data *idle;
	unsigned long long idle_count;

	idle = &per_cpu(s390_idle, dev->id);
	spin_lock_irq(&idle->lock);
	idle_count = idle->idle_count;
	spin_unlock_irq(&idle->lock);
	return sprintf(buf, "%llu\n", idle_count);
}
static SYSDEV_ATTR(idle_count, 0444, show_idle_count, NULL);

static ssize_t show_idle_time(struct sys_device *dev, char *buf)
{
	struct s390_idle_data *idle;
	unsigned long long new_time;

	idle = &per_cpu(s390_idle, dev->id);
	spin_lock_irq(&idle->lock);
	if (idle->in_idle) {
		new_time = get_clock();
		idle->idle_time += new_time - idle->idle_enter;
		idle->idle_enter = new_time;
	}
	new_time = idle->idle_time;
	spin_unlock_irq(&idle->lock);
749
	return sprintf(buf, "%llu\n", new_time >> 12);
750
}
751
static SYSDEV_ATTR(idle_time_us, 0444, show_idle_time, NULL);
752 753 754 755

static struct attribute *cpu_attrs[] = {
	&attr_capability.attr,
	&attr_idle_count.attr,
756
	&attr_idle_time_us.attr,
757 758 759 760 761 762 763
	NULL,
};

static struct attribute_group cpu_attr_group = {
	.attrs = cpu_attrs,
};

764 765 766 767 768 769
/*
 * cpu hotplug notifier.
 *
 * When a cpu comes online its idle statistics are reset and the sysfs
 * attribute group is created; when a cpu is dead the group is removed.
 * Returns NOTIFY_BAD if the group cannot be created, NOTIFY_OK otherwise.
 */
static int __cpuinit smp_cpu_notify(struct notifier_block *self,
				    unsigned long action, void *hcpu)
{
	unsigned int cpu = (unsigned int)(long)hcpu;
	struct cpu *c = &per_cpu(cpu_devices, cpu);
	struct sys_device *s = &c->sysdev;
	struct s390_idle_data *idle;

	switch (action) {
	case CPU_ONLINE:
	case CPU_ONLINE_FROZEN:
		idle = &per_cpu(s390_idle, cpu);
		spin_lock_irq(&idle->lock);
		idle->idle_enter = 0;
		idle->idle_time = 0;
		idle->idle_count = 0;
		spin_unlock_irq(&idle->lock);
		if (sysfs_create_group(&s->kobj, &cpu_attr_group))
			return NOTIFY_BAD;
		break;
	case CPU_DEAD:
	case CPU_DEAD_FROZEN:
		sysfs_remove_group(&s->kobj, &cpu_attr_group);
		break;
	}
	return NOTIFY_OK;
}

/* Notifier block that hooks smp_cpu_notify() into cpu hotplug events. */
static struct notifier_block __cpuinitdata smp_cpu_nb = {
	.notifier_call = smp_cpu_notify,
};

L
Linus Torvalds 已提交
796 797 798
/*
 * Register the hotplug notifier and a hotpluggable sysfs cpu device for
 * every possible cpu. Cpus that are already online also get the attribute
 * group; the first failure to create it is returned.
 */
static int __init topology_init(void)
{
	int cpu;
	int rc;

	register_cpu_notifier(&smp_cpu_nb);

	for_each_possible_cpu(cpu) {
		struct cpu *c = &per_cpu(cpu_devices, cpu);
		struct sys_device *s = &c->sysdev;

		c->hotpluggable = 1;
		register_cpu(c, cpu);
		/* Offline cpus get their attributes from the notifier later. */
		if (!cpu_online(cpu))
			continue;
		rc = sysfs_create_group(&s->kobj, &cpu_attr_group);
		if (rc)
			return rc;
	}
	return 0;
}
subsys_initcall(topology_init);