smp.c 26.3 KB
Newer Older
L
Linus Torvalds 已提交
1
/*
M
Martin Schwidefsky 已提交
2
 *  SMP related functions
L
Linus Torvalds 已提交
3
 *
M
Martin Schwidefsky 已提交
4 5 6 7
 *    Copyright IBM Corp. 1999,2012
 *    Author(s): Denis Joseph Barrow,
 *		 Martin Schwidefsky <schwidefsky@de.ibm.com>,
 *		 Heiko Carstens <heiko.carstens@de.ibm.com>,
L
Linus Torvalds 已提交
8
 *
9
 *  based on other smp stuff by
L
Linus Torvalds 已提交
10 11 12
 *    (c) 1995 Alan Cox, CymruNET Ltd  <alan@cymru.net>
 *    (c) 1998 Ingo Molnar
 *
M
Martin Schwidefsky 已提交
13 14 15
 * The code outside of smp.c uses logical cpu numbers, only smp.c does
 * the translation of logical to physical cpu ids. All new code that
 * operates on physical cpu numbers needs to go into smp.c.
L
Linus Torvalds 已提交
16 17
 */

18 19 20
#define KMSG_COMPONENT "cpu"
#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt

21
#include <linux/workqueue.h>
L
Linus Torvalds 已提交
22 23 24
#include <linux/module.h>
#include <linux/init.h>
#include <linux/mm.h>
A
Alexey Dobriyan 已提交
25
#include <linux/err.h>
L
Linus Torvalds 已提交
26 27 28 29
#include <linux/spinlock.h>
#include <linux/kernel_stat.h>
#include <linux/delay.h>
#include <linux/interrupt.h>
30
#include <linux/irqflags.h>
L
Linus Torvalds 已提交
31
#include <linux/cpu.h>
32
#include <linux/slab.h>
M
Michael Holzheu 已提交
33
#include <linux/crash_dump.h>
34
#include <asm/asm-offsets.h>
35 36
#include <asm/switch_to.h>
#include <asm/facility.h>
M
Michael Holzheu 已提交
37
#include <asm/ipl.h>
38
#include <asm/setup.h>
L
Linus Torvalds 已提交
39 40
#include <asm/irq.h>
#include <asm/tlbflush.h>
41
#include <asm/timer.h>
M
Michael Holzheu 已提交
42
#include <asm/lowcore.h>
43
#include <asm/sclp.h>
44
#include <asm/vdso.h>
45
#include <asm/debug.h>
46
#include <asm/os_info.h>
47
#include "entry.h"
L
Linus Torvalds 已提交
48

M
Martin Schwidefsky 已提交
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65
/*
 * SIGP order codes. These are the values passed as the "order" argument
 * of __pcpu_sigp() and its wrappers.
 */
enum {
	sigp_sense = 1,
	sigp_external_call = 2,
	sigp_emergency_signal = 3,
	sigp_start = 4,
	sigp_stop = 5,
	sigp_restart = 6,
	sigp_stop_and_store_status = 9,
	sigp_initial_cpu_reset = 11,
	sigp_cpu_reset = 12,
	sigp_set_prefix = 13,
	sigp_store_status_at_address = 14,
	sigp_store_extended_status_at_address = 15,
	sigp_set_architecture = 18,
	sigp_conditional_emergency_signal = 19,
	sigp_sense_running = 21,
};
66

M
Martin Schwidefsky 已提交
67 68 69 70 71 72
/*
 * Condition codes of the sigp instruction, i.e. the possible return
 * values of __pcpu_sigp().
 */
enum {
	sigp_order_code_accepted = 0,
	sigp_status_stored = 1,
	sigp_busy = 2,
	sigp_not_operational = 3,
};
L
Linus Torvalds 已提交
73

M
Martin Schwidefsky 已提交
74 75 76 77 78 79
/*
 * Bit numbers within pcpu->ec_mask. A sender sets one of these bits
 * before signalling the target cpu; do_ext_call_interrupt() on the
 * target fetches and clears the mask and acts on every bit found.
 */
enum {
	ec_schedule		= 0,
	ec_call_function	= 1,
	ec_call_function_single	= 2,
	ec_stop_cpu		= 3,
};
80

M
Martin Schwidefsky 已提交
81
/*
 * Values of pcpu->state. The numeric value is what the sysfs "configure"
 * attribute prints.
 */
enum {
	CPU_STATE_STANDBY	= 0,
	CPU_STATE_CONFIGURED	= 1,
};

M
Martin Schwidefsky 已提交
86 87 88 89 90 91 92 93 94 95 96 97 98 99 100
/*
 * Per-cpu bookkeeping private to smp.c. One entry per logical cpu lives
 * in pcpu_devices[]; it ties the logical cpu number to the physical cpu
 * address and holds the resources needed to start and stop the cpu.
 */
struct pcpu {
	struct cpu cpu;
	struct _lowcore *lowcore;	/* lowcore page(s) for the cpu */
	unsigned long async_stack;	/* async stack for the cpu */
	unsigned long panic_stack;	/* panic stack for the cpu */
	unsigned long ec_mask;		/* bit mask for ec_xxx functions */
	int state;			/* physical cpu state */
	u32 status;			/* last status received via sigp */
	u16 address;			/* physical cpu address */
};

/* cpu type of the boot cpu; set by smp_detect_cpus() from the cpu info */
static u8 boot_cpu_type;
/* physical address of the boot cpu; set by smp_prepare_boot_cpu() */
static u16 boot_cpu_address;
/* per-cpu data, indexed by logical cpu number */
static struct pcpu pcpu_devices[NR_CPUS];

101
DEFINE_MUTEX(smp_cpu_state_mutex);
102

M
Martin Schwidefsky 已提交
103 104 105 106 107 108 109
/*
 * Signal processor helper functions.
 */

/*
 * Issue a single sigp instruction with the given order code and
 * parameter to the cpu with physical address addr.
 *
 * Returns the condition code of the instruction. If the condition code
 * is sigp_status_stored and status is not NULL, the content of register 1
 * after the instruction is written to *status.
 */
static inline int __pcpu_sigp(u16 addr, u8 order, u32 parm, u32 *status)
{
	/* Register 1 carries the parameter in and the status back out. */
	register unsigned int parm_reg asm ("1") = parm;
	int cond;

	asm volatile(
		"	sigp	%1,%2,0(%3)\n"
		"	ipm	%0\n"
		"	srl	%0,28\n"
		: "=d" (cond), "+d" (parm_reg) : "d" (addr), "a" (order) : "cc");
	if (cond == sigp_status_stored && status)
		*status = parm_reg;
	return cond;
}
L
Linus Torvalds 已提交
120

M
Martin Schwidefsky 已提交
121
/*
 * Like __pcpu_sigp(), but repeat the order for as long as the target
 * answers with sigp_busy, calling cpu_relax() between attempts.
 * Returns the first condition code that is not sigp_busy.
 */
static inline int __pcpu_sigp_relax(u16 addr, u8 order, u32 parm, u32 *status)
{
	int cond;

	while ((cond = __pcpu_sigp(addr, order, parm, status)) == sigp_busy)
		cpu_relax();
	return cond;
}

M
Martin Schwidefsky 已提交
133
/*
 * Send a sigp order to pcpu and retry while the target is busy. The
 * status word, if any, ends up in pcpu->status. From the fourth busy
 * answer on, each retry is preceded by a udelay(10).
 * Returns the first condition code that is not sigp_busy.
 */
static int pcpu_sigp_retry(struct pcpu *pcpu, u8 order, u32 parm)
{
	int attempts = 0;
	int cond;

	while ((cond = __pcpu_sigp(pcpu->address, order, parm,
				   &pcpu->status)) == sigp_busy) {
		if (attempts >= 3)
			udelay(10);
		attempts++;
	}
	return cond;
}

/*
 * Sense the cpu once. Returns 1 if the sense order stored a status with
 * the stopped or check stop bit (mask 0x50) set, 0 otherwise - including
 * the case that no status was stored at all.
 */
static inline int pcpu_stopped(struct pcpu *pcpu)
{
	int cond;

	cond = __pcpu_sigp(pcpu->address, sigp_sense, 0, &pcpu->status);
	if (cond != sigp_status_stored)
		return 0;
	/* Check for stopped and check stop state */
	return (pcpu->status & 0x50) != 0;
}

static inline int pcpu_running(struct pcpu *pcpu)
H
Heiko Carstens 已提交
157
{
M
Martin Schwidefsky 已提交
158 159 160 161 162
	if (__pcpu_sigp(pcpu->address, sigp_sense_running,
			0, &pcpu->status) != sigp_status_stored)
		return 1;
	/* Check for running status */
	return !(pcpu->status & 0x400);
H
Heiko Carstens 已提交
163 164
}

165
/*
M
Martin Schwidefsky 已提交
166
 * Find struct pcpu by cpu address.
167
 */
M
Martin Schwidefsky 已提交
168
static struct pcpu *pcpu_find_address(const struct cpumask *mask, int address)
169 170 171
{
	int cpu;

M
Martin Schwidefsky 已提交
172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198
	for_each_cpu(cpu, mask)
		if (pcpu_devices[cpu].address == address)
			return pcpu_devices + cpu;
	return NULL;
}

/*
 * Post the request bit ec_bit in the ec_mask of pcpu and signal the cpu.
 * The signal is an external call if pcpu_running() reports the cpu as
 * running and an emergency signal otherwise.
 */
static void pcpu_ec_call(struct pcpu *pcpu, int ec_bit)
{
	int order;

	/* The bit must be visible before the target takes the interrupt. */
	set_bit(ec_bit, &pcpu->ec_mask);
	if (pcpu_running(pcpu))
		order = sigp_external_call;
	else
		order = sigp_emergency_signal;
	pcpu_sigp_retry(pcpu, order, 0);
}

/*
 * Set up the lowcore of a cpu that is about to be started.
 *
 * For every cpu except pcpu_devices[0] the lowcore pages, the async
 * stack and the panic stack are allocated here; pcpu_devices[0] keeps
 * the ones recorded by smp_prepare_boot_cpu(). The first 512 bytes of
 * the new lowcore are copied from the current cpu's lowcore, the rest is
 * cleared. Finally the lowcore is published in lowcore_ptr[] and made the
 * prefix area of the target cpu.
 *
 * Returns 0 on success or -ENOMEM if an allocation failed.
 */
static int __cpuinit pcpu_alloc_lowcore(struct pcpu *pcpu, int cpu)
{
	const int is_first = (pcpu == &pcpu_devices[0]);
	struct _lowcore *lc;

	if (!is_first) {
		pcpu->lowcore = (struct _lowcore *)
			__get_free_pages(GFP_KERNEL | GFP_DMA, LC_ORDER);
		pcpu->async_stack = __get_free_pages(GFP_KERNEL, ASYNC_ORDER);
		pcpu->panic_stack = __get_free_page(GFP_KERNEL);
		if (!(pcpu->lowcore && pcpu->panic_stack && pcpu->async_stack))
			goto out_free;
	}

	lc = pcpu->lowcore;
	memcpy(lc, &S390_lowcore, 512);
	memset((char *) lc + 512, 0, sizeof(*lc) - 512);
	/* The lowcore stores the top of each stack. */
	lc->async_stack = pcpu->async_stack + ASYNC_SIZE;
	lc->panic_stack = pcpu->panic_stack + PAGE_SIZE;
	lc->cpu_nr = cpu;
#ifndef CONFIG_64BIT
	if (MACHINE_HAS_IEEE) {
		lc->extended_save_area_addr = get_zeroed_page(GFP_KERNEL);
		if (!lc->extended_save_area_addr)
			goto out_free;
	}
#else
	if (vdso_alloc_per_cpu(lc))
		goto out_free;
#endif
	lowcore_ptr[cpu] = lc;
	pcpu_sigp_retry(pcpu, sigp_set_prefix, (u32)(unsigned long) lc);
	return 0;

out_free:
	if (!is_first) {
		free_page(pcpu->panic_stack);
		free_pages(pcpu->async_stack, ASYNC_ORDER);
		free_pages((unsigned long) pcpu->lowcore, LC_ORDER);
	}
	return -ENOMEM;
}

228 229
#ifdef CONFIG_HOTPLUG_CPU

M
Martin Schwidefsky 已提交
230
static void pcpu_free_lowcore(struct pcpu *pcpu)
231
{
M
Martin Schwidefsky 已提交
232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250
	pcpu_sigp_retry(pcpu, sigp_set_prefix, 0);
	lowcore_ptr[pcpu - pcpu_devices] = NULL;
#ifndef CONFIG_64BIT
	if (MACHINE_HAS_IEEE) {
		struct _lowcore *lc = pcpu->lowcore;

		free_page((unsigned long) lc->extended_save_area_addr);
		lc->extended_save_area_addr = 0;
	}
#else
	vdso_free_per_cpu(pcpu->lowcore);
#endif
	if (pcpu != &pcpu_devices[0]) {
		free_page(pcpu->panic_stack);
		free_pages(pcpu->async_stack, ASYNC_ORDER);
		free_pages((unsigned long) pcpu->lowcore, LC_ORDER);
	}
}

251 252
#endif /* CONFIG_HOTPLUG_CPU */

M
Martin Schwidefsky 已提交
253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299
/*
 * Fill the lowcore of a secondary cpu with the values it needs at
 * startup. Most of them are inherited from the calling cpu: kernel asce,
 * machine flags, ftrace function, facility list and the current control
 * and access register contents. Also takes a reference on
 * init_mm.context.attach_count, which __cpu_die() drops again.
 */
static void pcpu_prepare_secondary(struct pcpu *pcpu, int cpu)
{
	struct _lowcore *target = pcpu->lowcore;

	atomic_inc(&init_mm.context.attach_count);

	target->cpu_nr = cpu;
	target->percpu_offset = __per_cpu_offset[cpu];

	/* Inherited from the cpu that runs this code. */
	target->kernel_asce = S390_lowcore.kernel_asce;
	target->machine_flags = S390_lowcore.machine_flags;
	target->ftrace_func = S390_lowcore.ftrace_func;

	/* The new cpu starts with clean accounting. */
	target->steal_timer = 0;
	target->system_timer = 0;
	target->user_timer = 0;

	__ctl_store(target->cregs_save_area, 0, 15);
	save_access_regs((unsigned int *) target->access_regs_save_area);
	memcpy(target->stfle_fac_list, S390_lowcore.stfle_fac_list,
	       MAX_FACILITY_BIT/8);
}

/*
 * Make tsk the task the cpu starts with: point the kernel stack,
 * thread_info and current task fields of the cpu's lowcore at it and
 * take over the user/system timer values stored in its thread_info.
 */
static void pcpu_attach_task(struct pcpu *pcpu, struct task_struct *tsk)
{
	struct thread_info *ti = task_thread_info(tsk);
	struct _lowcore *lc = pcpu->lowcore;

	/* kernel_stack holds the top of the task's stack area. */
	lc->kernel_stack = (unsigned long) task_stack_page(tsk) + THREAD_SIZE;
	lc->thread_info = (unsigned long) ti;
	lc->current_task = (unsigned long) tsk;

	lc->user_timer = ti->user_timer;
	lc->system_timer = ti->system_timer;
	lc->steal_timer = 0;
}

/*
 * Start func(data) on pcpu: store the function, its argument and the
 * stack to use (the cpu's kernel stack) in the restart fields of the
 * cpu's lowcore, then send a sigp restart order.
 */
static void pcpu_start_fn(struct pcpu *pcpu, void (*func)(void *), void *data)
{
	struct _lowcore *target = pcpu->lowcore;

	target->restart_stack = target->kernel_stack;
	target->restart_fn = (unsigned long) func;
	target->restart_data = (unsigned long) data;
	target->restart_source = -1UL;

	/* All restart parameters are in place, kick the cpu. */
	pcpu_sigp_retry(pcpu, sigp_restart, 0);
}

/*
 * Call function via PSW restart on pcpu and stop the current cpu.
 */
static void pcpu_delegate(struct pcpu *pcpu, void (*func)(void *),
			  void *data, unsigned long stack)
{
300 301 302 303 304 305 306
	struct _lowcore *lc = lowcore_ptr[pcpu - pcpu_devices];
	struct {
		unsigned long	stack;
		void		*func;
		void		*data;
		unsigned long	source;
	} restart = { stack, func, data, stap() };
M
Martin Schwidefsky 已提交
307 308

	__load_psw_mask(psw_kernel_bits);
309
	if (pcpu->address == restart.source)
M
Martin Schwidefsky 已提交
310 311 312 313
		func(data);	/* should not return */
	/* Stop target cpu (if func returns this stops the current cpu). */
	pcpu_sigp_retry(pcpu, sigp_stop, 0);
	/* Restart func on the target cpu and stop the current cpu. */
314
	memcpy_absolute(&lc->restart_stack, &restart, sizeof(restart));
M
Martin Schwidefsky 已提交
315 316 317 318 319
	asm volatile(
		"0:	sigp	0,%0,6	# sigp restart to target cpu\n"
		"	brc	2,0b	# busy, try again\n"
		"1:	sigp	0,%1,5	# sigp stop to current cpu\n"
		"	brc	2,1b	# busy, try again\n"
320
		: : "d" (pcpu->address), "d" (restart.source) : "0", "1", "cc");
M
Martin Schwidefsky 已提交
321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343
	for (;;) ;
}

/*
 * Call function on an online CPU.
 */
void smp_call_online_cpu(void (*func)(void *), void *data)
{
	struct pcpu *pcpu;

	/* Use the current cpu if it is online. */
	pcpu = pcpu_find_address(cpu_online_mask, stap());
	if (!pcpu)
		/* Use the first online cpu. */
		pcpu = pcpu_devices + cpumask_first(cpu_online_mask);
	pcpu_delegate(pcpu, func, data, (unsigned long) restart_stack);
}

/*
 * Call function on the ipl CPU.
 */
void smp_call_ipl_cpu(void (*func)(void *), void *data)
{
344 345
	pcpu_delegate(&pcpu_devices[0], func, data,
		      pcpu_devices->panic_stack + PAGE_SIZE);
M
Martin Schwidefsky 已提交
346 347 348 349 350 351 352 353 354 355
}

/*
 * Translate a physical cpu address into the logical cpu number of a
 * present cpu. Returns -1 if no present cpu has that address.
 */
int smp_find_processor_id(u16 address)
{
	int cpu;

	for_each_present_cpu(cpu) {
		if (pcpu_devices[cpu].address != address)
			continue;
		return cpu;
	}
	return -1;
}

M
Martin Schwidefsky 已提交
358
int smp_vcpu_scheduled(int cpu)
359
{
M
Martin Schwidefsky 已提交
360 361 362 363 364 365 366
	return pcpu_running(pcpu_devices + cpu);
}

/*
 * Issue diagnose 0x44 if the machine provides it; otherwise do nothing.
 */
void smp_yield(void)
{
	if (!MACHINE_HAS_DIAG44)
		return;
	asm volatile("diag 0,0,0x44");
}

M
Martin Schwidefsky 已提交
369
void smp_yield_cpu(int cpu)
370
{
M
Martin Schwidefsky 已提交
371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401
	if (MACHINE_HAS_DIAG9C)
		asm volatile("diag %0,0,0x9c"
			     : : "d" (pcpu_devices[cpu].address));
	else if (MACHINE_HAS_DIAG44)
		asm volatile("diag 0,0,0x44");
}

/*
 * Send cpus emergency shutdown signal. This gives the cpus the
 * opportunity to complete outstanding interrupts.
 *
 * Cpus that are found stopped are removed from cpumask. The whole
 * procedure is bounded by a deadline of 1000000 << 12 clock units
 * (presumably one second - TODO confirm the clock resolution), so cpus
 * may be left in cpumask when it returns.
 */
void smp_emergency_stop(cpumask_t *cpumask)
{
	u64 deadline;
	int cpu;

	deadline = get_clock() + (1000000UL << 12);

	/* Post the stop request and signal each cpu. */
	for_each_cpu(cpu, cpumask) {
		struct pcpu *target = &pcpu_devices[cpu];

		set_bit(ec_stop_cpu, &target->ec_mask);
		while (__pcpu_sigp(target->address, sigp_emergency_signal,
				   0, NULL) == sigp_busy &&
		       get_clock() < deadline)
			cpu_relax();
	}

	/* Poll until every cpu has stopped or time is up. */
	while (get_clock() < deadline) {
		for_each_cpu(cpu, cpumask) {
			if (pcpu_stopped(&pcpu_devices[cpu]))
				cpumask_clear_cpu(cpu, cpumask);
		}
		if (cpumask_empty(cpumask))
			break;
		cpu_relax();
	}
}

M
Martin Schwidefsky 已提交
406 407 408
/*
 * Stop all cpus but the current one.
 */
409
void smp_send_stop(void)
L
Linus Torvalds 已提交
410
{
411 412
	cpumask_t cpumask;
	int cpu;
L
Linus Torvalds 已提交
413

414
	/* Disable all interrupts/machine checks */
415
	__load_psw_mask(psw_kernel_bits | PSW_MASK_DAT);
416
	trace_hardirqs_off();
L
Linus Torvalds 已提交
417

418
	debug_set_critical();
419 420 421
	cpumask_copy(&cpumask, cpu_online_mask);
	cpumask_clear_cpu(smp_processor_id(), &cpumask);

M
Martin Schwidefsky 已提交
422 423
	if (oops_in_progress)
		smp_emergency_stop(&cpumask);
L
Linus Torvalds 已提交
424

425 426
	/* stop all processors */
	for_each_cpu(cpu, &cpumask) {
M
Martin Schwidefsky 已提交
427 428 429
		struct pcpu *pcpu = pcpu_devices + cpu;
		pcpu_sigp_retry(pcpu, sigp_stop, 0);
		while (!pcpu_stopped(pcpu))
H
Heiko Carstens 已提交
430 431 432 433
			cpu_relax();
	}
}

M
Martin Schwidefsky 已提交
434 435 436 437 438 439 440 441 442
/*
 * Stop the current cpu.
 *
 * Sends a sigp stop order to the cpu itself and then spins forever.
 */
void smp_stop_cpu(void)
{
	struct pcpu *self = &pcpu_devices[smp_processor_id()];

	pcpu_sigp_retry(self, sigp_stop, 0);
	while (1)
		;
}

L
Linus Torvalds 已提交
443 444 445 446
/*
 * This is the main routine where commands issued by other
 * cpus are handled.
 */
447
static void do_ext_call_interrupt(struct ext_code ext_code,
448
				  unsigned int param32, unsigned long param64)
L
Linus Torvalds 已提交
449
{
450
	unsigned long bits;
M
Martin Schwidefsky 已提交
451
	int cpu;
L
Linus Torvalds 已提交
452

M
Martin Schwidefsky 已提交
453
	cpu = smp_processor_id();
454
	if (ext_code.code == 0x1202)
M
Martin Schwidefsky 已提交
455
		kstat_cpu(cpu).irqs[EXTINT_EXC]++;
456
	else
M
Martin Schwidefsky 已提交
457
		kstat_cpu(cpu).irqs[EXTINT_EMS]++;
458 459 460
	/*
	 * handle bit signal external calls
	 */
M
Martin Schwidefsky 已提交
461
	bits = xchg(&pcpu_devices[cpu].ec_mask, 0);
L
Linus Torvalds 已提交
462

463 464 465
	if (test_bit(ec_stop_cpu, &bits))
		smp_stop_cpu();

466 467 468
	if (test_bit(ec_schedule, &bits))
		scheduler_ipi();

469
	if (test_bit(ec_call_function, &bits))
470 471 472 473
		generic_smp_call_function_interrupt();

	if (test_bit(ec_call_function_single, &bits))
		generic_smp_call_function_single_interrupt();
474

L
Linus Torvalds 已提交
475 476
}

477
void arch_send_call_function_ipi_mask(const struct cpumask *mask)
478 479 480
{
	int cpu;

481
	for_each_cpu(cpu, mask)
M
Martin Schwidefsky 已提交
482
		pcpu_ec_call(pcpu_devices + cpu, ec_call_function);
483 484 485 486
}

void arch_send_call_function_single_ipi(int cpu)
{
M
Martin Schwidefsky 已提交
487
	pcpu_ec_call(pcpu_devices + cpu, ec_call_function_single);
488 489
}

490
#ifndef CONFIG_64BIT
L
Linus Torvalds 已提交
491 492 493
/*
 * Per-cpu callback of smp_ptlb_all(): flush the TLB of the cpu it runs
 * on. The info argument is unused.
 */
static void smp_ptlb_callback(void *info)
{
	(void) info;
	__tlb_flush_local();
}

void smp_ptlb_all(void)
{
501
	on_each_cpu(smp_ptlb_callback, NULL, 1);
L
Linus Torvalds 已提交
502 503
}
EXPORT_SYMBOL(smp_ptlb_all);
504
#endif /* ! CONFIG_64BIT */
L
Linus Torvalds 已提交
505 506 507 508 509 510 511 512

/*
 * this function sends a 'reschedule' IPI to another CPU.
 * it goes straight through and wastes no time serializing
 * anything. Worst case is that we lose a reschedule ...
 */
void smp_send_reschedule(int cpu)
{
M
Martin Schwidefsky 已提交
513
	pcpu_ec_call(pcpu_devices + cpu, ec_schedule);
L
Linus Torvalds 已提交
514 515 516 517 518
}

/*
 * parameter area for the set/clear control bit callbacks
 *
 * smp_ctl_bit_callback() computes
 *	creg[cr] = (creg[cr] & andval) | orval
 */
struct ec_creg_mask_parms {
	unsigned long orval;	/* bits to set */
	unsigned long andval;	/* mask of bits to keep */
	int cr;			/* number of the control register */
};
L
Linus Torvalds 已提交
524 525 526 527

/*
 * callback for setting/clearing control bits
 */
528 529
static void smp_ctl_bit_callback(void *info)
{
530
	struct ec_creg_mask_parms *pp = info;
L
Linus Torvalds 已提交
531
	unsigned long cregs[16];
532

533
	__ctl_store(cregs, 0, 15);
M
Martin Schwidefsky 已提交
534
	cregs[pp->cr] = (cregs[pp->cr] & pp->andval) | pp->orval;
535
	__ctl_load(cregs, 0, 15);
L
Linus Torvalds 已提交
536 537 538 539 540
}

/*
 * Set a bit in a control register of all cpus
 */
541 542
void smp_ctl_set_bit(int cr, int bit)
{
M
Martin Schwidefsky 已提交
543
	struct ec_creg_mask_parms parms = { 1UL << bit, -1UL, cr };
L
Linus Torvalds 已提交
544

545
	on_each_cpu(smp_ctl_bit_callback, &parms, 1);
L
Linus Torvalds 已提交
546
}
547
EXPORT_SYMBOL(smp_ctl_set_bit);
L
Linus Torvalds 已提交
548 549 550 551

/*
 * Clear a bit in a control register of all cpus
 */
552 553
void smp_ctl_clear_bit(int cr, int bit)
{
M
Martin Schwidefsky 已提交
554
	struct ec_creg_mask_parms parms = { 0, ~(1UL << bit), cr };
L
Linus Torvalds 已提交
555

556
	on_each_cpu(smp_ctl_bit_callback, &parms, 1);
L
Linus Torvalds 已提交
557
}
558
EXPORT_SYMBOL(smp_ctl_clear_bit);
L
Linus Torvalds 已提交
559

M
Michael Holzheu 已提交
560
#if defined(CONFIG_ZFCPDUMP) || defined(CONFIG_CRASH_DUMP)
M
Michael Holzheu 已提交
561

M
Martin Schwidefsky 已提交
562 563 564 565
/*
 * Register save areas allocated by smp_get_save_area(), indexed by the
 * cpu number passed to that function.
 */
struct save_area *zfcpdump_save_areas[NR_CPUS + 1];
EXPORT_SYMBOL_GPL(zfcpdump_save_areas);

/*
 * Allocate a save area for cpu and fill it with the register contents
 * of the cpu with physical address "address".
 *
 * Nothing is done in a kdump kernel. Without OLDMEM_BASE nothing is done
 * either for the boot cpu or if the system was not ipl'ed for an FCP
 * dump. For the boot cpu (CONFIG_CRASH_DUMP only) the registers are
 * copied from old memory; for any other cpu a stop and store status
 * order is issued and the result is copied out of the lowcore of
 * pcpu_devices[0].
 */
static void __init smp_get_save_area(int cpu, u16 address)
{
	void *boot_lc = pcpu_devices[0].lowcore;
	struct save_area *area;

	if (is_kdump_kernel())
		return;
	if (!OLDMEM_BASE && (address == boot_cpu_address ||
			     ipl_info.type != IPL_TYPE_FCP_DUMP))
		return;
	if (cpu >= NR_CPUS) {
		pr_warning("CPU %i exceeds the maximum %i and is excluded "
			   "from the dump\n", cpu, NR_CPUS - 1);
		return;
	}

	area = kmalloc(sizeof(*area), GFP_KERNEL);
	if (area == NULL)
		panic("could not allocate memory for save area\n");
	zfcpdump_save_areas[cpu] = area;
#ifdef CONFIG_CRASH_DUMP
	if (address == boot_cpu_address) {
		/* Copy the registers of the boot cpu. */
		copy_oldmem_page(1, (void *) area, sizeof(*area),
				 SAVE_AREA_BASE - PAGE_SIZE, 0);
		return;
	}
#endif
	/* Get the registers of a non-boot cpu. */
	__pcpu_sigp_relax(address, sigp_stop_and_store_status, 0, NULL);
	memcpy_real(area, boot_lc + SAVE_AREA_BASE, sizeof(*area));
}

M
Martin Schwidefsky 已提交
597
int smp_store_status(int cpu)
598
{
M
Martin Schwidefsky 已提交
599
	struct pcpu *pcpu;
600

M
Martin Schwidefsky 已提交
601 602 603 604
	pcpu = pcpu_devices + cpu;
	if (__pcpu_sigp_relax(pcpu->address, sigp_stop_and_store_status,
			      0, NULL) != sigp_order_code_accepted)
		return -EIO;
605 606 607
	return 0;
}

M
Martin Schwidefsky 已提交
608
#else /* CONFIG_ZFCPDUMP || CONFIG_CRASH_DUMP */
609

M
Martin Schwidefsky 已提交
610
static inline void smp_get_save_area(int cpu, u16 address) { }
611

M
Martin Schwidefsky 已提交
612
#endif /* CONFIG_ZFCPDUMP || CONFIG_CRASH_DUMP */
613

M
Martin Schwidefsky 已提交
614
static struct sclp_cpu_info *smp_get_cpu_info(void)
615
{
M
Martin Schwidefsky 已提交
616
	static int use_sigp_detection;
617
	struct sclp_cpu_info *info;
M
Martin Schwidefsky 已提交
618 619 620 621 622 623 624 625 626 627 628 629 630
	int address;

	info = kzalloc(sizeof(*info), GFP_KERNEL);
	if (info && (use_sigp_detection || sclp_get_cpu_info(info))) {
		use_sigp_detection = 1;
		for (address = 0; address <= MAX_CPU_ADDRESS; address++) {
			if (__pcpu_sigp_relax(address, sigp_sense, 0, NULL) ==
			    sigp_not_operational)
				continue;
			info->cpu[info->configured].address = address;
			info->configured++;
		}
		info->combined = info->configured;
631
	}
M
Martin Schwidefsky 已提交
632
	return info;
633 634
}

M
Martin Schwidefsky 已提交
635 636 637 638
static int __devinit smp_add_present_cpu(int cpu);

/*
 * Assign logical cpu numbers to the cpus listed in info that are not
 * present yet.
 *
 * Entries with a cpu type different from the boot cpu's type and entries
 * whose address already belongs to a present cpu are skipped. Every other
 * entry gets the next logical cpu number that is possible but not
 * present, until either the entries or the free numbers run out. If
 * sysfs_add is set, smp_add_present_cpu() is called for each new cpu; a
 * cpu for which that fails is marked not present again and not counted.
 *
 * Returns the number of cpus that were added.
 */
static int __devinit __smp_rescan_cpus(struct sclp_cpu_info *info,
				       int sysfs_add)
{
	struct pcpu *pcpu;
	cpumask_t avail;
	int cpu, nr, i;

	nr = 0;
	cpumask_xor(&avail, cpu_possible_mask, cpu_present_mask);
	cpu = cpumask_first(&avail);
	for (i = 0; (i < info->combined) && (cpu < nr_cpu_ids); i++) {
		if (info->has_cpu_type && info->cpu[i].type != boot_cpu_type)
			continue;
		if (pcpu_find_address(cpu_present_mask, info->cpu[i].address))
			continue;
		pcpu = pcpu_devices + cpu;
		pcpu->address = info->cpu[i].address;
		/*
		 * Whether a cpu is configured or standby depends on the
		 * position of its entry in info->cpu[] (the first
		 * info->configured entries are the configured ones, the
		 * same rule smp_detect_cpus() applies), not on the logical
		 * cpu number it happens to get. The two differ as soon as
		 * an entry is skipped above.
		 */
		pcpu->state = (i >= info->configured) ?
			CPU_STATE_STANDBY : CPU_STATE_CONFIGURED;
		cpu_set_polarization(cpu, POLARIZATION_UNKNOWN);
		set_cpu_present(cpu, true);
		if (sysfs_add && smp_add_present_cpu(cpu) != 0)
			set_cpu_present(cpu, false);
		else
			nr++;
		cpu = cpumask_next(cpu, &avail);
	}
	return nr;
}

667 668 669 670 671
/*
 * Boot time cpu detection: determine the cpu type of the boot cpu, count
 * the configured and standby cpus of that type (collecting a save area
 * for every configured one), report the numbers and register the cpus
 * via __smp_rescan_cpus(). Panics if the cpu info cannot be allocated.
 */
static void __init smp_detect_cpus(void)
{
	unsigned int idx, c_cpus = 0, s_cpus = 0;
	struct sclp_cpu_info *info;

	info = smp_get_cpu_info();
	if (!info)
		panic("smp_detect_cpus failed to allocate memory\n");

	if (info->has_cpu_type) {
		for (idx = 0; idx < info->combined; idx++) {
			if (info->cpu[idx].address == boot_cpu_address) {
				/* The boot cpu dictates the cpu type. */
				boot_cpu_type = info->cpu[idx].type;
				break;
			}
		}
	}

	for (idx = 0; idx < info->combined; idx++) {
		if (info->has_cpu_type &&
		    info->cpu[idx].type != boot_cpu_type)
			continue;
		if (idx >= info->configured) {
			s_cpus++;
			continue;
		}
		smp_get_save_area(c_cpus, info->cpu[idx].address);
		c_cpus++;
	}
	pr_info("%d configured CPUs, %d standby CPUs\n", c_cpus, s_cpus);

	get_online_cpus();
	__smp_rescan_cpus(info, 0);
	put_online_cpus();
	kfree(info);
}

L
Linus Torvalds 已提交
701
/*
702
 *	Activate a secondary processor.
L
Linus Torvalds 已提交
703
 */
M
Martin Schwidefsky 已提交
704
static void __cpuinit smp_start_secondary(void *cpuvoid)
L
Linus Torvalds 已提交
705
{
M
Martin Schwidefsky 已提交
706 707 708 709 710 711 712 713
	S390_lowcore.last_update_clock = get_clock();
	S390_lowcore.restart_stack = (unsigned long) restart_stack;
	S390_lowcore.restart_fn = (unsigned long) do_restart;
	S390_lowcore.restart_data = 0;
	S390_lowcore.restart_source = -1UL;
	restore_access_regs(S390_lowcore.access_regs_save_area);
	__ctl_load(S390_lowcore.cregs_save_area, 0, 15);
	__load_psw_mask(psw_kernel_bits | PSW_MASK_DAT);
714
	cpu_init();
715
	preempt_disable();
716 717
	init_cpu_timer();
	init_cpu_vtimer();
H
Heiko Carstens 已提交
718
	pfault_init();
719
	notify_cpu_starting(smp_processor_id());
720
	ipi_call_lock();
721
	set_cpu_online(smp_processor_id(), true);
722
	ipi_call_unlock();
L
Linus Torvalds 已提交
723
	local_irq_enable();
724 725
	/* cpu_idle will call schedule for us */
	cpu_idle();
L
Linus Torvalds 已提交
726 727 728
}

/* Upping and downing of CPUs */
729
int __cpuinit __cpu_up(unsigned int cpu, struct task_struct *tidle)
L
Linus Torvalds 已提交
730
{
M
Martin Schwidefsky 已提交
731 732
	struct pcpu *pcpu;
	int rc;
L
Linus Torvalds 已提交
733

M
Martin Schwidefsky 已提交
734 735
	pcpu = pcpu_devices + cpu;
	if (pcpu->state != CPU_STATE_CONFIGURED)
736
		return -EIO;
M
Martin Schwidefsky 已提交
737 738
	if (pcpu_sigp_retry(pcpu, sigp_initial_cpu_reset, 0) !=
	    sigp_order_code_accepted)
739
		return -EIO;
740

M
Martin Schwidefsky 已提交
741 742 743 744
	rc = pcpu_alloc_lowcore(pcpu, cpu);
	if (rc)
		return rc;
	pcpu_prepare_secondary(pcpu, cpu);
745
	pcpu_attach_task(pcpu, tidle);
M
Martin Schwidefsky 已提交
746
	pcpu_start_fn(pcpu, smp_start_secondary, NULL);
L
Linus Torvalds 已提交
747 748 749 750 751
	while (!cpu_online(cpu))
		cpu_relax();
	return 0;
}

752
/*
 * Handler for the "possible_cpus=" early parameter: restrict the set of
 * possible cpus to cpu 0 plus cpus 1 .. max-1, capped at nr_cpu_ids.
 * A value that cannot be parsed as an integer is ignored.
 */
static int __init setup_possible_cpus(char *s)
{
	int limit, cpu;

	if (kstrtoint(s, 0, &limit) < 0)
		return 0;

	/* cpu 0 is always possible */
	init_cpu_possible(cpumask_of(0));
	cpu = 1;
	while (cpu < limit && cpu < nr_cpu_ids) {
		set_cpu_possible(cpu, true);
		cpu++;
	}
	return 0;
}
early_param("possible_cpus", setup_possible_cpus);

765 766
#ifdef CONFIG_HOTPLUG_CPU

767
int __cpu_disable(void)
L
Linus Torvalds 已提交
768
{
M
Martin Schwidefsky 已提交
769
	unsigned long cregs[16];
L
Linus Torvalds 已提交
770

M
Martin Schwidefsky 已提交
771 772
	set_cpu_online(smp_processor_id(), false);
	/* Disable pseudo page faults on this cpu. */
H
Heiko Carstens 已提交
773
	pfault_fini();
M
Martin Schwidefsky 已提交
774 775 776 777 778 779
	/* Disable interrupt sources via control register. */
	__ctl_store(cregs, 0, 15);
	cregs[0]  &= ~0x0000ee70UL;	/* disable all external interrupts */
	cregs[6]  &= ~0xff000000UL;	/* disable all I/O interrupts */
	cregs[14] &= ~0x1f000000UL;	/* disable most machine checks */
	__ctl_load(cregs, 0, 15);
L
Linus Torvalds 已提交
780 781 782
	return 0;
}

783
void __cpu_die(unsigned int cpu)
L
Linus Torvalds 已提交
784
{
M
Martin Schwidefsky 已提交
785 786
	struct pcpu *pcpu;

L
Linus Torvalds 已提交
787
	/* Wait until target cpu is down */
M
Martin Schwidefsky 已提交
788 789
	pcpu = pcpu_devices + cpu;
	while (!pcpu_stopped(pcpu))
L
Linus Torvalds 已提交
790
		cpu_relax();
M
Martin Schwidefsky 已提交
791
	pcpu_free_lowcore(pcpu);
792
	atomic_dec(&init_mm.context.attach_count);
L
Linus Torvalds 已提交
793 794
}

795
/*
 * Final step of taking the current cpu offline: leave the idle task,
 * send a sigp stop order to the cpu itself and spin. Does not return.
 */
void __noreturn cpu_die(void)
{
	struct pcpu *self;

	idle_task_exit();
	self = &pcpu_devices[smp_processor_id()];
	pcpu_sigp_retry(self, sigp_stop, 0);
	while (1)
		;
}

802 803
#endif /* CONFIG_HOTPLUG_CPU */

L
Linus Torvalds 已提交
804 805
/*
 * Register do_ext_call_interrupt() for the emergency signal and external
 * call interrupts and detect the cpus of the machine. Panics if either
 * registration fails. max_cpus is not used.
 */
void __init smp_prepare_cpus(unsigned int max_cpus)
{
	int rc;

	/* request the 0x1201 emergency signal external interrupt */
	rc = register_external_interrupt(0x1201, do_ext_call_interrupt);
	if (rc != 0)
		panic("Couldn't request external interrupt 0x1201");
	/* request the 0x1202 external call external interrupt */
	rc = register_external_interrupt(0x1202, do_ext_call_interrupt);
	if (rc != 0)
		panic("Couldn't request external interrupt 0x1202");
	smp_detect_cpus();
}

H
Heiko Carstens 已提交
815
/*
 * Fill pcpu_devices[0] for the boot cpu from the state the cpu is
 * already running with (cpu address, prefix, stacks from its lowcore)
 * and mark logical cpu 0 present and online.
 */
void __init smp_prepare_boot_cpu(void)
{
	struct pcpu *boot = &pcpu_devices[0];

	boot_cpu_address = stap();
	boot->address = boot_cpu_address;
	boot->state = CPU_STATE_CONFIGURED;
	boot->lowcore = (struct _lowcore *)(unsigned long) store_prefix();
	/* The lowcore holds the stack tops, struct pcpu the stack bases. */
	boot->async_stack = S390_lowcore.async_stack - ASYNC_SIZE;
	boot->panic_stack = S390_lowcore.panic_stack - PAGE_SIZE;
	S390_lowcore.percpu_offset = __per_cpu_offset[0];
	cpu_set_polarization(0, POLARIZATION_UNKNOWN);
	set_cpu_present(0, true);
	set_cpu_online(0, true);
}

H
Heiko Carstens 已提交
831
/*
 * Intentionally empty; max_cpus is not used.
 */
void __init smp_cpus_done(unsigned int max_cpus)
{
	/* nothing to do */
}

835 836 837 838 839
/*
 * Set the logical cpu number stored in the current cpu's lowcore to 0.
 */
void __init smp_setup_processor_id(void)
{
	S390_lowcore.cpu_nr = 0;
}

L
Linus Torvalds 已提交
840 841 842 843 844 845 846 847
/*
 * the frequency of the profiling timer can be changed
 * by writing a multiplier value into /proc/profile.
 *
 * usually you want to run this on all CPUs ;)
 *
 * This implementation ignores the multiplier and always returns 0.
 */
int setup_profiling_timer(unsigned int multiplier)
{
	(void) multiplier;
	return 0;
}

851
#ifdef CONFIG_HOTPLUG_CPU
852
static ssize_t cpu_configure_show(struct device *dev,
M
Martin Schwidefsky 已提交
853
				  struct device_attribute *attr, char *buf)
854 855 856 857
{
	ssize_t count;

	mutex_lock(&smp_cpu_state_mutex);
M
Martin Schwidefsky 已提交
858
	count = sprintf(buf, "%d\n", pcpu_devices[dev->id].state);
859 860 861 862
	mutex_unlock(&smp_cpu_state_mutex);
	return count;
}

863
/*
 * sysfs store routine of the "configure" attribute.
 *
 * Writing 0 deconfigures a configured cpu, writing 1 configures a
 * standby cpu; a cpu that already is in the requested state is left
 * alone. Anything but a single 0 or 1 yields -EINVAL, an online cpu or
 * cpu 0 yields -EBUSY, and a failure of the sclp call is passed on.
 * Returns count on success.
 */
static ssize_t cpu_configure_store(struct device *dev,
				   struct device_attribute *attr,
				   const char *buf, size_t count)
{
	struct pcpu *pcpu;
	int cpu, val, rc;
	char delim;

	if (sscanf(buf, "%d %c", &val, &delim) != 1)
		return -EINVAL;
	if (val != 0 && val != 1)
		return -EINVAL;

	get_online_cpus();
	mutex_lock(&smp_cpu_state_mutex);
	cpu = dev->id;
	/* disallow configuration changes of online cpus and cpu 0 */
	if (cpu_online(cpu) || cpu == 0) {
		rc = -EBUSY;
		goto out;
	}
	pcpu = &pcpu_devices[cpu];
	rc = 0;
	if (val == 0) {
		if (pcpu->state != CPU_STATE_CONFIGURED)
			goto out;
		rc = sclp_cpu_deconfigure(pcpu->address);
		if (rc)
			goto out;
		pcpu->state = CPU_STATE_STANDBY;
	} else {
		if (pcpu->state != CPU_STATE_STANDBY)
			goto out;
		rc = sclp_cpu_configure(pcpu->address);
		if (rc)
			goto out;
		pcpu->state = CPU_STATE_CONFIGURED;
	}
	/* Common tail of a successful state change. */
	cpu_set_polarization(cpu, POLARIZATION_UNKNOWN);
	topology_expect_change();
out:
	mutex_unlock(&smp_cpu_state_mutex);
	put_online_cpus();
	return rc ? rc : count;
}
913
static DEVICE_ATTR(configure, 0644, cpu_configure_show, cpu_configure_store);
914 915
#endif /* CONFIG_HOTPLUG_CPU */

916 917
static ssize_t show_cpu_address(struct device *dev,
				struct device_attribute *attr, char *buf)
918
{
M
Martin Schwidefsky 已提交
919
	return sprintf(buf, "%d\n", pcpu_devices[dev->id].address);
920
}
921
static DEVICE_ATTR(address, 0444, show_cpu_address, NULL);
922 923 924

static struct attribute *cpu_common_attrs[] = {
#ifdef CONFIG_HOTPLUG_CPU
925
	&dev_attr_configure.attr,
926
#endif
927
	&dev_attr_address.attr,
928 929 930 931 932 933
	NULL,
};

/* Attribute group made up of the entries of cpu_common_attrs[]. */
static struct attribute_group cpu_common_attr_group = {
	.attrs = cpu_common_attrs,
};
L
Linus Torvalds 已提交
934

935 936
static ssize_t show_idle_count(struct device *dev,
				struct device_attribute *attr, char *buf)
937
{
M
Martin Schwidefsky 已提交
938
	struct s390_idle_data *idle = &per_cpu(s390_idle, dev->id);
939
	unsigned long long idle_count;
940
	unsigned int sequence;
941

M
Martin Schwidefsky 已提交
942 943 944 945 946 947
	do {
		sequence = ACCESS_ONCE(idle->sequence);
		idle_count = ACCESS_ONCE(idle->idle_count);
		if (ACCESS_ONCE(idle->idle_enter))
			idle_count++;
	} while ((sequence & 1) || (idle->sequence != sequence));
948 949
	return sprintf(buf, "%llu\n", idle_count);
}
950
static DEVICE_ATTR(idle_count, 0444, show_idle_count, NULL);
951

952 953
static ssize_t show_idle_time(struct device *dev,
				struct device_attribute *attr, char *buf)
954
{
M
Martin Schwidefsky 已提交
955 956
	struct s390_idle_data *idle = &per_cpu(s390_idle, dev->id);
	unsigned long long now, idle_time, idle_enter, idle_exit;
957
	unsigned int sequence;
958

M
Martin Schwidefsky 已提交
959 960 961 962 963 964 965 966
	do {
		now = get_clock();
		sequence = ACCESS_ONCE(idle->sequence);
		idle_time = ACCESS_ONCE(idle->idle_time);
		idle_enter = ACCESS_ONCE(idle->idle_enter);
		idle_exit = ACCESS_ONCE(idle->idle_exit);
	} while ((sequence & 1) || (idle->sequence != sequence));
	idle_time += idle_enter ? ((idle_exit ? : now) - idle_enter) : 0;
967
	return sprintf(buf, "%llu\n", idle_time >> 12);
968
}
969
static DEVICE_ATTR(idle_time_us, 0444, show_idle_time, NULL);
970

971
static struct attribute *cpu_online_attrs[] = {
972 973
	&dev_attr_idle_count.attr,
	&dev_attr_idle_time_us.attr,
974 975 976
	NULL,
};

977 978
/*
 * Attribute group built from cpu_online_attrs. It is created when a cpu
 * is online (smp_add_present_cpu(), smp_cpu_notify() on CPU_ONLINE) and
 * removed again on CPU_DEAD.
 */
static struct attribute_group cpu_online_attr_group = {
	.attrs = cpu_online_attrs,
};

981 982 983 984
/*
 * CPU hotplug notifier callback.
 *
 * @self:   notifier block (unused)
 * @action: hotplug event
 * @hcpu:   cpu number, passed as a pointer-sized value
 *
 * CPU_ONLINE[_FROZEN]: clears the cpu's per-cpu s390_idle data and creates
 * the cpu_online_attr_group sysfs group on the cpu device.
 * CPU_DEAD[_FROZEN]: removes that sysfs group again.
 * All other actions are ignored.
 *
 * Returns the sysfs_create_group() result (0 if it was not called),
 * translated by notifier_from_errno().
 */
static int __cpuinit smp_cpu_notify(struct notifier_block *self,
				    unsigned long action, void *hcpu)
{
	unsigned int cpu = (unsigned int)(long)hcpu;
	struct cpu *c = &pcpu_devices[cpu].cpu;
	struct device *s = &c->dev;
	struct s390_idle_data *idle;
	int err = 0;

	switch (action) {
	case CPU_ONLINE:
	case CPU_ONLINE_FROZEN:
		idle = &per_cpu(s390_idle, cpu);
		memset(idle, 0, sizeof(struct s390_idle_data));
		err = sysfs_create_group(&s->kobj, &cpu_online_attr_group);
		break;
	case CPU_DEAD:
	case CPU_DEAD_FROZEN:
		sysfs_remove_group(&s->kobj, &cpu_online_attr_group);
		break;
	}
	return notifier_from_errno(err);
}

/* Notifier block that routes cpu hotplug events to smp_cpu_notify(). */
static struct notifier_block __cpuinitdata smp_cpu_nb = {
	.notifier_call = smp_cpu_notify,
};

1009
/*
 * Register the cpu device for logical cpu @cpu and create its sysfs
 * entries.
 *
 * Marks the cpu hotpluggable, registers it, creates the common attribute
 * group, creates the online attribute group if the cpu is currently
 * online, and finally calls topology_cpu_init().
 *
 * On failure the steps already done are undone in reverse order; the
 * cpu is only unregistered when CONFIG_HOTPLUG_CPU is set.
 *
 * Returns 0 on success or the error code of the step that failed.
 */
static int __devinit smp_add_present_cpu(int cpu)
{
	struct cpu *c = &pcpu_devices[cpu].cpu;
	struct device *s = &c->dev;
	int rc;

	c->hotpluggable = 1;
	rc = register_cpu(c, cpu);
	if (rc)
		goto out;
	rc = sysfs_create_group(&s->kobj, &cpu_common_attr_group);
	if (rc)
		goto out_cpu;
	if (cpu_online(cpu)) {
		rc = sysfs_create_group(&s->kobj, &cpu_online_attr_group);
		if (rc)
			goto out_online;
	}
	rc = topology_cpu_init(c);
	if (rc)
		goto out_topology;
	return 0;

out_topology:
	if (cpu_online(cpu))
		sysfs_remove_group(&s->kobj, &cpu_online_attr_group);
out_online:
	sysfs_remove_group(&s->kobj, &cpu_common_attr_group);
out_cpu:
#ifdef CONFIG_HOTPLUG_CPU
	unregister_cpu(c);
#endif
out:
	return rc;
}

#ifdef CONFIG_HOTPLUG_CPU
1046

1047
/*
 * Rescan the machine for cpus.
 *
 * Fetches the cpu info via smp_get_cpu_info() and runs __smp_rescan_cpus()
 * on it while holding the online-cpus reference and smp_cpu_state_mutex.
 * The info buffer is freed afterwards. If the rescan returned a non-zero
 * value (presumably the number of cpus added - confirm against
 * __smp_rescan_cpus()), a topology update is scheduled.
 *
 * Returns 0 on success, -ENOMEM if the cpu info could not be obtained.
 */
int __ref smp_rescan_cpus(void)
{
	struct sclp_cpu_info *info;
	int nr;

	info = smp_get_cpu_info();
	if (!info)
		return -ENOMEM;
	get_online_cpus();
	mutex_lock(&smp_cpu_state_mutex);
	nr = __smp_rescan_cpus(info, 1);
	mutex_unlock(&smp_cpu_state_mutex);
	put_online_cpus();
	kfree(info);
	if (nr)
		topology_schedule_update();
	return 0;
}

1066 1067
static ssize_t __ref rescan_store(struct device *dev,
				  struct device_attribute *attr,
1068
				  const char *buf,
1069 1070 1071 1072 1073
				  size_t count)
{
	int rc;

	rc = smp_rescan_cpus();
1074 1075
	return rc ? rc : count;
}
1076
static DEVICE_ATTR(rescan, 0200, NULL, rescan_store);
1077 1078
#endif /* CONFIG_HOTPLUG_CPU */

1079
/*
 * Initcall that sets up the cpu sysfs interface.
 *
 * Registers the cpu hotplug notifier, creates the "rescan" file on the
 * cpu subsystem root device (CONFIG_HOTPLUG_CPU only) and registers every
 * present cpu via smp_add_present_cpu().
 *
 * Returns 0 on success or the first error encountered.
 *
 * NOTE(review): the early-return error paths leave smp_cpu_nb registered
 * (and, for a failure inside the loop, the rescan file and the cpus added
 * so far in place) - confirm that this is acceptable for a failed initcall.
 */
static int __init s390_smp_init(void)
{
	int cpu, rc;

	register_cpu_notifier(&smp_cpu_nb);
#ifdef CONFIG_HOTPLUG_CPU
	rc = device_create_file(cpu_subsys.dev_root, &dev_attr_rescan);
	if (rc)
		return rc;
#endif
	for_each_present_cpu(cpu) {
		rc = smp_add_present_cpu(cpu);
		if (rc)
			return rc;
	}
	return 0;
}
subsys_initcall(s390_smp_init);