smp.c 26.6 KB
Newer Older
L
Linus Torvalds 已提交
1
/*
 *  SMP related functions
 *
 *    Copyright IBM Corp. 1999,2012
 *    Author(s): Denis Joseph Barrow,
 *		 Martin Schwidefsky <schwidefsky@de.ibm.com>,
 *		 Heiko Carstens <heiko.carstens@de.ibm.com>,
 *
 *  based on other smp stuff by
 *    (c) 1995 Alan Cox, CymruNET Ltd  <alan@cymru.net>
 *    (c) 1998 Ingo Molnar
 *
 * The code outside of smp.c uses logical cpu numbers, only smp.c does
 * the translation of logical to physical cpu ids. All new code that
 * operates on physical cpu numbers needs to go into smp.c.
 */

18 19 20
#define KMSG_COMPONENT "cpu"
#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt

21
#include <linux/workqueue.h>
L
Linus Torvalds 已提交
22 23 24
#include <linux/module.h>
#include <linux/init.h>
#include <linux/mm.h>
A
Alexey Dobriyan 已提交
25
#include <linux/err.h>
L
Linus Torvalds 已提交
26 27 28 29
#include <linux/spinlock.h>
#include <linux/kernel_stat.h>
#include <linux/delay.h>
#include <linux/interrupt.h>
30
#include <linux/irqflags.h>
L
Linus Torvalds 已提交
31
#include <linux/cpu.h>
32
#include <linux/slab.h>
M
Michael Holzheu 已提交
33
#include <linux/crash_dump.h>
34
#include <asm/asm-offsets.h>
35 36
#include <asm/switch_to.h>
#include <asm/facility.h>
M
Michael Holzheu 已提交
37
#include <asm/ipl.h>
38
#include <asm/setup.h>
L
Linus Torvalds 已提交
39 40
#include <asm/irq.h>
#include <asm/tlbflush.h>
41
#include <asm/timer.h>
M
Michael Holzheu 已提交
42
#include <asm/lowcore.h>
43
#include <asm/sclp.h>
44
#include <asm/vdso.h>
45
#include <asm/debug.h>
46
#include <asm/os_info.h>
47
#include "entry.h"
L
Linus Torvalds 已提交
48

M
Martin Schwidefsky 已提交
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65
/*
 * Order codes handed to __pcpu_sigp() / pcpu_sigp_retry() as the "order"
 * argument of the sigp instruction.
 */
enum {
	sigp_sense = 1,
	sigp_external_call = 2,
	sigp_emergency_signal = 3,
	sigp_start = 4,
	sigp_stop = 5,
	sigp_restart = 6,
	sigp_stop_and_store_status = 9,
	sigp_initial_cpu_reset = 11,
	sigp_cpu_reset = 12,
	sigp_set_prefix = 13,
	sigp_store_status_at_address = 14,
	sigp_store_extended_status_at_address = 15,
	sigp_set_architecture = 18,
	sigp_conditional_emergency_signal = 19,
	sigp_sense_running = 21,
};
66

M
Martin Schwidefsky 已提交
67 68 69 70 71 72
/*
 * Condition codes returned by __pcpu_sigp(). The status word is only
 * handed back to the caller for sigp_status_stored.
 */
enum {
	sigp_order_code_accepted = 0,
	sigp_status_stored = 1,
	sigp_busy = 2,
	sigp_not_operational = 3,
};
L
Linus Torvalds 已提交
73

M
Martin Schwidefsky 已提交
74 75 76 77 78 79
/*
 * Bit numbers in pcpu->ec_mask. A sender sets the bit before signalling
 * the target cpu, do_ext_call_interrupt() on the target fetches and
 * clears the mask and acts on every bit that was set.
 */
enum {
	ec_schedule = 0,
	ec_call_function,
	ec_call_function_single,
	ec_stop_cpu,
};
80

M
Martin Schwidefsky 已提交
81
/*
 * Values stored in pcpu->state. __cpu_up() only starts cpus that are in
 * CPU_STATE_CONFIGURED.
 */
enum {
	CPU_STATE_STANDBY,
	CPU_STATE_CONFIGURED,
};

M
Martin Schwidefsky 已提交
86 87 88 89 90 91 92 93 94 95 96 97 98 99 100
/*
 * Per-cpu bookkeeping used by this file. One entry exists for every
 * logical cpu in pcpu_devices[]; "address" is the physical cpu address
 * that is passed to the sigp instruction.
 */
struct pcpu {
	struct cpu cpu;
	struct _lowcore *lowcore;	/* lowcore page(s) for the cpu */
	unsigned long async_stack;	/* async stack for the cpu */
	unsigned long panic_stack;	/* panic stack for the cpu */
	unsigned long ec_mask;		/* bit mask for ec_xxx functions */
	int state;			/* physical cpu state */
	u32 status;			/* last status received via sigp */
	u16 address;			/* physical cpu address */
};

/* cpu type of the boot cpu, picked up from the cpu info in smp_detect_cpus() */
static u8 boot_cpu_type;
/* physical address of the boot cpu, read via stap() in smp_prepare_boot_cpu() */
static u16 boot_cpu_address;
/* per-cpu state, indexed by logical cpu number */
static struct pcpu pcpu_devices[NR_CPUS];

101
DEFINE_MUTEX(smp_cpu_state_mutex);
102

M
Martin Schwidefsky 已提交
103 104 105 106 107 108 109
/*
 * Signal processor helper functions.
 */
/*
 * Issue one sigp instruction to the cpu with physical address @addr.
 *
 * @order:  sigp order code (one of the sigp_xxx order values)
 * @parm:   parameter for the order, passed in register 1
 * @status: if not NULL, receives the contents of register 1 after the
 *	    instruction, but only when the condition code is 1
 *	    (sigp_status_stored)
 *
 * Returns the condition code of the sigp instruction. The function does
 * not retry on sigp_busy, that is up to the caller.
 */
static inline int __pcpu_sigp(u16 addr, u8 order, u32 parm, u32 *status)
{
	register unsigned int reg1 asm ("1") = parm;
	int cc;

	asm volatile(
		"	sigp	%1,%2,0(%3)\n"
		"	ipm	%0\n"
		"	srl	%0,28\n"
		: "=d" (cc), "+d" (reg1) : "d" (addr), "a" (order) : "cc");
	if (status && cc == 1)
		*status = reg1;
	return cc;
}
L
Linus Torvalds 已提交
120

M
Martin Schwidefsky 已提交
121
/*
 * Like __pcpu_sigp() but repeat the order for as long as the target
 * reports sigp_busy, calling cpu_relax() between attempts. There is no
 * upper bound on the number of attempts.
 *
 * Returns the first condition code that is not sigp_busy.
 */
static inline int __pcpu_sigp_relax(u16 addr, u8 order, u32 parm, u32 *status)
{
	int cc;

	while (1) {
		cc = __pcpu_sigp(addr, order, parm, status);
		if (cc != sigp_busy)
			return cc;
		cpu_relax();
	}
}

M
Martin Schwidefsky 已提交
133
/*
 * Send @order with parameter @parm to @pcpu and retry while the target
 * is busy. The status returned by the target, if any, is stored in
 * pcpu->status.
 *
 * The first attempts are issued back to back; once three retries have
 * been used up each further attempt is preceded by a 10 usec delay.
 *
 * Returns the final (non-busy) condition code.
 */
static int pcpu_sigp_retry(struct pcpu *pcpu, u8 order, u32 parm)
{
	int cc, retry;

	for (retry = 0; ; retry++) {
		cc = __pcpu_sigp(pcpu->address, order, parm, &pcpu->status);
		if (cc != sigp_busy)
			break;
		if (retry >= 3)
			udelay(10);
	}
	return cc;
}

/*
 * Sense @pcpu and report whether it is stopped.
 *
 * Returns 1 if the sense order stored a status with the stopped or the
 * check stop bit set, 0 in every other case (including a sense order
 * that did not store a status). pcpu->status is updated as a side effect
 * when a status was stored.
 */
static inline int pcpu_stopped(struct pcpu *pcpu)
{
	int cc;

	cc = __pcpu_sigp(pcpu->address, sigp_sense, 0, &pcpu->status);
	if (cc == sigp_status_stored) {
		/* Check for stopped and check stop state */
		return (pcpu->status & 0x50) != 0;
	}
	return 0;
}

static inline int pcpu_running(struct pcpu *pcpu)
H
Heiko Carstens 已提交
157
{
M
Martin Schwidefsky 已提交
158 159 160 161 162
	if (__pcpu_sigp(pcpu->address, sigp_sense_running,
			0, &pcpu->status) != sigp_status_stored)
		return 1;
	/* Check for running status */
	return !(pcpu->status & 0x400);
H
Heiko Carstens 已提交
163 164
}

165
/*
M
Martin Schwidefsky 已提交
166
 * Find struct pcpu by cpu address.
167
 */
M
Martin Schwidefsky 已提交
168
static struct pcpu *pcpu_find_address(const struct cpumask *mask, int address)
169 170 171
{
	int cpu;

M
Martin Schwidefsky 已提交
172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198
	for_each_cpu(cpu, mask)
		if (pcpu_devices[cpu].address == address)
			return pcpu_devices + cpu;
	return NULL;
}

/*
 * Post request @ec_bit (one of the ec_xxx values) to @pcpu.
 *
 * The bit is set in the target's ec_mask first, then the target is
 * signalled: with an external call if pcpu_running() reports it as
 * running, with an emergency signal otherwise.
 */
static void pcpu_ec_call(struct pcpu *pcpu, int ec_bit)
{
	int order = sigp_emergency_signal;

	set_bit(ec_bit, &pcpu->ec_mask);
	if (pcpu_running(pcpu))
		order = sigp_external_call;
	pcpu_sigp_retry(pcpu, order, 0);
}

/*
 * Set up the lowcore and the stacks for logical cpu @cpu.
 *
 * For every cpu except pcpu_devices[0] the lowcore pages, the async
 * stack and the panic stack are allocated here; entry 0 keeps the
 * values assigned in smp_prepare_boot_cpu(). The first 512 bytes of the
 * new lowcore are copied from the current cpu's lowcore, the remainder
 * is cleared. Finally the lowcore is registered in lowcore_ptr[] and
 * made the prefix area of the target cpu.
 *
 * Returns 0 on success or -ENOMEM if an allocation failed, in which
 * case the pages allocated by this function have been freed again.
 */
static int __cpuinit pcpu_alloc_lowcore(struct pcpu *pcpu, int cpu)
{
	struct _lowcore *lc;

	if (pcpu != &pcpu_devices[0]) {
		pcpu->lowcore =	(struct _lowcore *)
			__get_free_pages(GFP_KERNEL | GFP_DMA, LC_ORDER);
		pcpu->async_stack = __get_free_pages(GFP_KERNEL, ASYNC_ORDER);
		pcpu->panic_stack = __get_free_page(GFP_KERNEL);
		if (!pcpu->lowcore || !pcpu->panic_stack || !pcpu->async_stack)
			goto out;
	}
	lc = pcpu->lowcore;
	memcpy(lc, &S390_lowcore, 512);
	memset((char *) lc + 512, 0, sizeof(*lc) - 512);
	/* The lowcore holds the end of each stack area. */
	lc->async_stack = pcpu->async_stack + ASYNC_SIZE;
	lc->panic_stack = pcpu->panic_stack + PAGE_SIZE;
	lc->cpu_nr = cpu;
#ifndef CONFIG_64BIT
	if (MACHINE_HAS_IEEE) {
		lc->extended_save_area_addr = get_zeroed_page(GFP_KERNEL);
		if (!lc->extended_save_area_addr)
			goto out;
	}
#else
	if (vdso_alloc_per_cpu(lc))
		goto out;
#endif
	lowcore_ptr[cpu] = lc;
	pcpu_sigp_retry(pcpu, sigp_set_prefix, (u32)(unsigned long) lc);
	return 0;
out:
	if (pcpu != &pcpu_devices[0]) {
		free_page(pcpu->panic_stack);
		free_pages(pcpu->async_stack, ASYNC_ORDER);
		free_pages((unsigned long) pcpu->lowcore, LC_ORDER);
	}
	return -ENOMEM;
}

228 229
#ifdef CONFIG_HOTPLUG_CPU

M
Martin Schwidefsky 已提交
230
static void pcpu_free_lowcore(struct pcpu *pcpu)
231
{
M
Martin Schwidefsky 已提交
232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250
	pcpu_sigp_retry(pcpu, sigp_set_prefix, 0);
	lowcore_ptr[pcpu - pcpu_devices] = NULL;
#ifndef CONFIG_64BIT
	if (MACHINE_HAS_IEEE) {
		struct _lowcore *lc = pcpu->lowcore;

		free_page((unsigned long) lc->extended_save_area_addr);
		lc->extended_save_area_addr = 0;
	}
#else
	vdso_free_per_cpu(pcpu->lowcore);
#endif
	if (pcpu != &pcpu_devices[0]) {
		free_page(pcpu->panic_stack);
		free_pages(pcpu->async_stack, ASYNC_ORDER);
		free_pages((unsigned long) pcpu->lowcore, LC_ORDER);
	}
}

251 252
#endif /* CONFIG_HOTPLUG_CPU */

M
Martin Schwidefsky 已提交
253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342
/*
 * Fill the lowcore of @pcpu with the state a secondary cpu needs before
 * it is started as logical cpu @cpu.
 *
 * Values that are the same on all cpus are copied from the lowcore of
 * the calling cpu, the accounting timers are reset and the control and
 * access registers of the calling cpu are stored into the save areas of
 * the target lowcore. The attach count of init_mm is raised by one;
 * __cpu_die() drops it again.
 */
static void pcpu_prepare_secondary(struct pcpu *pcpu, int cpu)
{
	struct _lowcore *lowcore = pcpu->lowcore;

	atomic_inc(&init_mm.context.attach_count);
	lowcore->cpu_nr = cpu;
	lowcore->percpu_offset = __per_cpu_offset[cpu];
	/* Inherit the cpu independent settings from the current cpu. */
	lowcore->kernel_asce = S390_lowcore.kernel_asce;
	lowcore->machine_flags = S390_lowcore.machine_flags;
	lowcore->ftrace_func = S390_lowcore.ftrace_func;
	/* Start accounting from scratch. */
	lowcore->steal_timer = 0;
	lowcore->system_timer = 0;
	lowcore->user_timer = 0;
	__ctl_store(lowcore->cregs_save_area, 0, 15);
	save_access_regs((unsigned int *) lowcore->access_regs_save_area);
	memcpy(lowcore->stfle_fac_list, S390_lowcore.stfle_fac_list,
	       MAX_FACILITY_BIT/8);
}

/*
 * Make @tsk the task the cpu described by @pcpu will run on: record the
 * task, its thread_info and the top of its kernel stack in the cpu's
 * lowcore and take over the task's user/system timer values. The steal
 * timer is reset to 0.
 */
static void pcpu_attach_task(struct pcpu *pcpu, struct task_struct *tsk)
{
	struct thread_info *info = task_thread_info(tsk);
	struct _lowcore *lowcore = pcpu->lowcore;
	unsigned long stack_top;

	stack_top = (unsigned long) task_stack_page(tsk) + THREAD_SIZE;
	lowcore->kernel_stack = stack_top;
	lowcore->thread_info = (unsigned long) info;
	lowcore->current_task = (unsigned long) tsk;
	lowcore->user_timer = info->user_timer;
	lowcore->system_timer = info->system_timer;
	lowcore->steal_timer = 0;
}

/*
 * Start @func(@data) on the cpu described by @pcpu.
 *
 * The restart parameters are placed in the target's lowcore, using the
 * kernel stack already recorded there as restart stack and -1UL as
 * restart source, then a restart order is sent to the target.
 */
static void pcpu_start_fn(struct pcpu *pcpu, void (*func)(void *), void *data)
{
	struct _lowcore *lowcore = pcpu->lowcore;

	lowcore->restart_fn = (unsigned long) func;
	lowcore->restart_data = (unsigned long) data;
	lowcore->restart_stack = lowcore->kernel_stack;
	lowcore->restart_source = -1UL;
	pcpu_sigp_retry(pcpu, sigp_restart, 0);
}

/*
 * Call function via PSW restart on pcpu and stop the current cpu.
 *
 * @pcpu:  cpu that is to execute @func
 * @func:  function to call, it is not expected to return
 * @data:  argument passed to @func
 * @stack: value stored as restart stack in the target's lowcore
 *
 * If @pcpu is the calling cpu, @func is simply called directly.
 * Otherwise the target is stopped, its lowcore is loaded with the
 * restart parameters (restart_source is the physical address of the
 * calling cpu) and the final asm block sends a restart order to the
 * target followed by a stop order to the calling cpu itself. This
 * function never returns to its caller.
 */
static void pcpu_delegate(struct pcpu *pcpu, void (*func)(void *),
			  void *data, unsigned long stack)
{
	struct _lowcore *lc = pcpu->lowcore;
	unsigned short this_cpu;

	__load_psw_mask(psw_kernel_bits);
	this_cpu = stap();
	if (pcpu->address == this_cpu)
		func(data);	/* should not return */
	/* Stop target cpu (if func returns this stops the current cpu). */
	pcpu_sigp_retry(pcpu, sigp_stop, 0);
	/* Restart func on the target cpu and stop the current cpu. */
	lc->restart_stack = stack;
	lc->restart_fn = (unsigned long) func;
	lc->restart_data = (unsigned long) data;
	lc->restart_source = (unsigned long) this_cpu;
	/* Order codes 6 and 5 below are sigp_restart and sigp_stop. */
	asm volatile(
		"0:	sigp	0,%0,6	# sigp restart to target cpu\n"
		"	brc	2,0b	# busy, try again\n"
		"1:	sigp	0,%1,5	# sigp stop to current cpu\n"
		"	brc	2,1b	# busy, try again\n"
		: : "d" (pcpu->address), "d" (this_cpu) : "0", "1", "cc");
	/* Spin until the stop order takes effect. */
	for (;;) ;
}

/*
 * Call function on an online CPU.
 */
void smp_call_online_cpu(void (*func)(void *), void *data)
{
	struct pcpu *pcpu;

	/* Use the current cpu if it is online. */
	pcpu = pcpu_find_address(cpu_online_mask, stap());
	if (!pcpu)
		/* Use the first online cpu. */
		pcpu = pcpu_devices + cpumask_first(cpu_online_mask);
	pcpu_delegate(pcpu, func, data, (unsigned long) restart_stack);
}

/*
 * Call function on the ipl CPU.
 */
void smp_call_ipl_cpu(void (*func)(void *), void *data)
{
343 344
	pcpu_delegate(&pcpu_devices[0], func, data,
		      pcpu_devices->panic_stack + PAGE_SIZE);
M
Martin Schwidefsky 已提交
345 346 347 348 349 350 351 352 353 354
}

/*
 * Translate the physical cpu address @address into a logical cpu
 * number. Only present cpus are considered.
 *
 * Returns the logical cpu number or -1 if no present cpu has that
 * address.
 */
int smp_find_processor_id(u16 address)
{
	int cpu;

	for_each_present_cpu(cpu)
		if (pcpu_devices[cpu].address == address)
			return cpu;
	return -1;
}

M
Martin Schwidefsky 已提交
357
int smp_vcpu_scheduled(int cpu)
358
{
M
Martin Schwidefsky 已提交
359 360 361 362 363 364 365
	return pcpu_running(pcpu_devices + cpu);
}

/*
 * Give up the cpu by issuing diagnose 0x44, if the machine provides it.
 * Does nothing on machines without diagnose 0x44.
 */
void smp_yield(void)
{
	if (MACHINE_HAS_DIAG44)
		asm volatile("diag 0,0,0x44");
}

M
Martin Schwidefsky 已提交
368
void smp_yield_cpu(int cpu)
369
{
M
Martin Schwidefsky 已提交
370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400
	if (MACHINE_HAS_DIAG9C)
		asm volatile("diag %0,0,0x9c"
			     : : "d" (pcpu_devices[cpu].address));
	else if (MACHINE_HAS_DIAG44)
		asm volatile("diag 0,0,0x44");
}

/*
 * Send cpus emergency shutdown signal. This gives the cpus the
 * opportunity to complete outstanding interrupts.
 */
void smp_emergency_stop(cpumask_t *cpumask)
{
	u64 end;
	int cpu;

	/*
	 * Deadline for the whole operation, in get_clock() units.
	 * NOTE(review): 1000000UL << 12 looks like one second (the idle
	 * time code shifts clock values right by 12 to get usecs) -
	 * confirm.
	 */
	end = get_clock() + (1000000UL << 12);
	/* Request a stop on every cpu in the mask. */
	for_each_cpu(cpu, cpumask) {
		struct pcpu *pcpu = pcpu_devices + cpu;
		set_bit(ec_stop_cpu, &pcpu->ec_mask);
		while (__pcpu_sigp(pcpu->address, sigp_emergency_signal,
				   0, NULL) == sigp_busy &&
		       get_clock() < end)
			cpu_relax();
	}
	/*
	 * Wait until the deadline for the cpus to stop. Cpus that have
	 * stopped are removed from the caller's mask, so the cpus left
	 * in it on return are the ones that did not stop in time.
	 */
	while (get_clock() < end) {
		for_each_cpu(cpu, cpumask)
			if (pcpu_stopped(pcpu_devices + cpu))
				cpumask_clear_cpu(cpu, cpumask);
		if (cpumask_empty(cpumask))
			break;
		cpu_relax();
	}
}

M
Martin Schwidefsky 已提交
405 406 407
/*
 * Stop all cpus but the current one.
 */
408
void smp_send_stop(void)
L
Linus Torvalds 已提交
409
{
410 411
	cpumask_t cpumask;
	int cpu;
L
Linus Torvalds 已提交
412

413
	/* Disable all interrupts/machine checks */
414
	__load_psw_mask(psw_kernel_bits | PSW_MASK_DAT);
415
	trace_hardirqs_off();
L
Linus Torvalds 已提交
416

417
	debug_set_critical();
418 419 420
	cpumask_copy(&cpumask, cpu_online_mask);
	cpumask_clear_cpu(smp_processor_id(), &cpumask);

M
Martin Schwidefsky 已提交
421 422
	if (oops_in_progress)
		smp_emergency_stop(&cpumask);
L
Linus Torvalds 已提交
423

424 425
	/* stop all processors */
	for_each_cpu(cpu, &cpumask) {
M
Martin Schwidefsky 已提交
426 427 428
		struct pcpu *pcpu = pcpu_devices + cpu;
		pcpu_sigp_retry(pcpu, sigp_stop, 0);
		while (!pcpu_stopped(pcpu))
H
Heiko Carstens 已提交
429 430 431 432
			cpu_relax();
	}
}

M
Martin Schwidefsky 已提交
433 434 435 436 437 438 439 440 441
/*
 * Stop the current cpu.
 */
void smp_stop_cpu(void)
{
	struct pcpu *self = pcpu_devices + smp_processor_id();

	/* Send the stop order to ourselves and wait for it to hit. */
	pcpu_sigp_retry(self, sigp_stop, 0);
	while (1)
		;
}

L
Linus Torvalds 已提交
442 443 444 445
/*
 * This is the main routine where commands issued by other
 * cpus are handled.
 */
446
static void do_ext_call_interrupt(struct ext_code ext_code,
447
				  unsigned int param32, unsigned long param64)
L
Linus Torvalds 已提交
448
{
449
	unsigned long bits;
M
Martin Schwidefsky 已提交
450
	int cpu;
L
Linus Torvalds 已提交
451

M
Martin Schwidefsky 已提交
452
	cpu = smp_processor_id();
453
	if (ext_code.code == 0x1202)
M
Martin Schwidefsky 已提交
454
		kstat_cpu(cpu).irqs[EXTINT_EXC]++;
455
	else
M
Martin Schwidefsky 已提交
456
		kstat_cpu(cpu).irqs[EXTINT_EMS]++;
457 458 459
	/*
	 * handle bit signal external calls
	 */
M
Martin Schwidefsky 已提交
460
	bits = xchg(&pcpu_devices[cpu].ec_mask, 0);
L
Linus Torvalds 已提交
461

462 463 464
	if (test_bit(ec_stop_cpu, &bits))
		smp_stop_cpu();

465 466 467
	if (test_bit(ec_schedule, &bits))
		scheduler_ipi();

468
	if (test_bit(ec_call_function, &bits))
469 470 471 472
		generic_smp_call_function_interrupt();

	if (test_bit(ec_call_function_single, &bits))
		generic_smp_call_function_single_interrupt();
473

L
Linus Torvalds 已提交
474 475
}

476
void arch_send_call_function_ipi_mask(const struct cpumask *mask)
477 478 479
{
	int cpu;

480
	for_each_cpu(cpu, mask)
M
Martin Schwidefsky 已提交
481
		pcpu_ec_call(pcpu_devices + cpu, ec_call_function);
482 483 484 485
}

void arch_send_call_function_single_ipi(int cpu)
{
M
Martin Schwidefsky 已提交
486
	pcpu_ec_call(pcpu_devices + cpu, ec_call_function_single);
487 488
}

489
#ifndef CONFIG_64BIT
L
Linus Torvalds 已提交
490 491 492
/*
 * this function sends a 'purge tlb' signal to another CPU.
 */
493
/* on_each_cpu() callback: flush the TLB of the executing cpu. @info is unused. */
static void smp_ptlb_callback(void *info)
{
	__tlb_flush_local();
}

void smp_ptlb_all(void)
{
500
	on_each_cpu(smp_ptlb_callback, NULL, 1);
L
Linus Torvalds 已提交
501 502
}
EXPORT_SYMBOL(smp_ptlb_all);
503
#endif /* ! CONFIG_64BIT */
L
Linus Torvalds 已提交
504 505 506 507 508 509 510 511

/*
 * this function sends a 'reschedule' IPI to another CPU.
 * it goes straight through and wastes no time serializing
 * anything. Worst case is that we lose a reschedule ...
 */
void smp_send_reschedule(int cpu)
{
M
Martin Schwidefsky 已提交
512
	pcpu_ec_call(pcpu_devices + cpu, ec_schedule);
L
Linus Torvalds 已提交
513 514 515 516 517
}

/*
 * parameter area for the set/clear control bit callbacks
 */
518
/*
 * smp_ctl_bit_callback() computes
 *	creg[cr] = (creg[cr] & andval) | orval
 * on every cpu.
 */
struct ec_creg_mask_parms {
	unsigned long orval;	/* bits to set */
	unsigned long andval;	/* bits to keep */
	int cr;			/* number of the control register */
};
L
Linus Torvalds 已提交
523 524 525 526

/*
 * callback for setting/clearing control bits
 */
527 528
static void smp_ctl_bit_callback(void *info)
{
529
	struct ec_creg_mask_parms *pp = info;
L
Linus Torvalds 已提交
530
	unsigned long cregs[16];
531

532
	__ctl_store(cregs, 0, 15);
M
Martin Schwidefsky 已提交
533
	cregs[pp->cr] = (cregs[pp->cr] & pp->andval) | pp->orval;
534
	__ctl_load(cregs, 0, 15);
L
Linus Torvalds 已提交
535 536 537 538 539
}

/*
 * Set a bit in a control register of all cpus
 */
540 541
void smp_ctl_set_bit(int cr, int bit)
{
M
Martin Schwidefsky 已提交
542
	struct ec_creg_mask_parms parms = { 1UL << bit, -1UL, cr };
L
Linus Torvalds 已提交
543

544
	on_each_cpu(smp_ctl_bit_callback, &parms, 1);
L
Linus Torvalds 已提交
545
}
546
EXPORT_SYMBOL(smp_ctl_set_bit);
L
Linus Torvalds 已提交
547 548 549 550

/*
 * Clear a bit in a control register of all cpus
 */
551 552
void smp_ctl_clear_bit(int cr, int bit)
{
M
Martin Schwidefsky 已提交
553
	struct ec_creg_mask_parms parms = { 0, ~(1UL << bit), cr };
L
Linus Torvalds 已提交
554

555
	on_each_cpu(smp_ctl_bit_callback, &parms, 1);
L
Linus Torvalds 已提交
556
}
557
EXPORT_SYMBOL(smp_ctl_clear_bit);
L
Linus Torvalds 已提交
558

M
Michael Holzheu 已提交
559
#if defined(CONFIG_ZFCPDUMP) || defined(CONFIG_CRASH_DUMP)
M
Michael Holzheu 已提交
560

M
Martin Schwidefsky 已提交
561 562 563 564
/*
 * Register save areas collected by smp_get_save_area(), indexed by the
 * cpu number passed to that function.
 */
struct save_area *zfcpdump_save_areas[NR_CPUS + 1];
EXPORT_SYMBOL_GPL(zfcpdump_save_areas);

/*
 * Collect the register contents of the cpu with physical address
 * @address into a newly allocated save area and store it in
 * zfcpdump_save_areas[@cpu].
 *
 * Nothing is done in a kdump kernel. Without OLDMEM_BASE nothing is
 * done for the boot cpu either, or when the system was not ipl'ed as
 * FCP dump. A @cpu beyond NR_CPUS - 1 is reported and skipped. Failure
 * to allocate the save area is fatal.
 */
static void __init smp_get_save_area(int cpu, u16 address)
{
	void *lc = pcpu_devices[0].lowcore;
	struct save_area *save_area;

	if (is_kdump_kernel())
		return;
	if (!OLDMEM_BASE && (address == boot_cpu_address ||
			     ipl_info.type != IPL_TYPE_FCP_DUMP))
		return;
	if (cpu >= NR_CPUS) {
		pr_warning("CPU %i exceeds the maximum %i and is excluded "
			   "from the dump\n", cpu, NR_CPUS - 1);
		return;
	}
	save_area = kmalloc(sizeof(struct save_area), GFP_KERNEL);
	if (!save_area)
		panic("could not allocate memory for save area\n");
	zfcpdump_save_areas[cpu] = save_area;
#ifdef CONFIG_CRASH_DUMP
	if (address == boot_cpu_address) {
		/* Copy the registers of the boot cpu. */
		copy_oldmem_page(1, (void *) save_area, sizeof(*save_area),
				 SAVE_AREA_BASE - PAGE_SIZE, 0);
		return;
	}
#endif
	/* Get the registers of a non-boot cpu. */
	__pcpu_sigp_relax(address, sigp_stop_and_store_status, 0, NULL);
	/*
	 * The copy source is SAVE_AREA_BASE within the lowcore of logical
	 * cpu 0.
	 * NOTE(review): presumably that is where the order above leaves
	 * the status because the target still has prefix 0 - confirm.
	 */
	memcpy_real(save_area, lc + SAVE_AREA_BASE, sizeof(*save_area));
}

M
Martin Schwidefsky 已提交
596
int smp_store_status(int cpu)
597
{
M
Martin Schwidefsky 已提交
598
	struct pcpu *pcpu;
599

M
Martin Schwidefsky 已提交
600 601 602 603
	pcpu = pcpu_devices + cpu;
	if (__pcpu_sigp_relax(pcpu->address, sigp_stop_and_store_status,
			      0, NULL) != sigp_order_code_accepted)
		return -EIO;
604 605 606
	return 0;
}

M
Martin Schwidefsky 已提交
607
#else /* CONFIG_ZFCPDUMP || CONFIG_CRASH_DUMP */
608

M
Martin Schwidefsky 已提交
609
/* No dump support configured: there are no save areas to fill. */
static inline void smp_get_save_area(int cpu, u16 address) { }
610

M
Martin Schwidefsky 已提交
611
#endif /* CONFIG_ZFCPDUMP || CONFIG_CRASH_DUMP */
612

M
Martin Schwidefsky 已提交
613
static struct sclp_cpu_info *smp_get_cpu_info(void)
614
{
M
Martin Schwidefsky 已提交
615
	static int use_sigp_detection;
616
	struct sclp_cpu_info *info;
M
Martin Schwidefsky 已提交
617 618 619 620 621 622 623 624 625 626 627 628 629
	int address;

	info = kzalloc(sizeof(*info), GFP_KERNEL);
	if (info && (use_sigp_detection || sclp_get_cpu_info(info))) {
		use_sigp_detection = 1;
		for (address = 0; address <= MAX_CPU_ADDRESS; address++) {
			if (__pcpu_sigp_relax(address, sigp_sense, 0, NULL) ==
			    sigp_not_operational)
				continue;
			info->cpu[info->configured].address = address;
			info->configured++;
		}
		info->combined = info->configured;
630
	}
M
Martin Schwidefsky 已提交
631
	return info;
632 633
}

M
Martin Schwidefsky 已提交
634 635 636 637
static int __devinit smp_add_present_cpu(int cpu);

/*
 * Assign logical cpu numbers to the cpus listed in @info that are not
 * present yet.
 *
 * Free logical cpu numbers are the possible cpus that are not present.
 * Entries of @info whose type differs from the boot cpu type (if the
 * info carries types) and entries whose address already belongs to a
 * present cpu are skipped. Each remaining entry gets the next free
 * logical cpu number and is marked present. With @sysfs_add set,
 * smp_add_present_cpu() is called for the cpu and the cpu is taken out
 * of the present mask again if that fails.
 *
 * Returns the number of cpus that were added.
 */
static int __devinit __smp_rescan_cpus(struct sclp_cpu_info *info,
				       int sysfs_add)
{
	struct pcpu *pcpu;
	cpumask_t avail;
	int cpu, nr, i;

	nr = 0;
	cpumask_xor(&avail, cpu_possible_mask, cpu_present_mask);
	cpu = cpumask_first(&avail);
	for (i = 0; (i < info->combined) && (cpu < nr_cpu_ids); i++) {
		if (info->has_cpu_type && info->cpu[i].type != boot_cpu_type)
			continue;
		if (pcpu_find_address(cpu_present_mask, info->cpu[i].address))
			continue;
		pcpu = pcpu_devices + cpu;
		pcpu->address = info->cpu[i].address;
		/*
		 * Whether an entry is configured or standby depends on its
		 * position in info->cpu[] (the first info->configured
		 * entries are configured, see smp_detect_cpus()), not on
		 * the logical cpu number it happens to get: the two differ
		 * as soon as an entry has been skipped above.
		 */
		pcpu->state = (i >= info->configured) ?
			CPU_STATE_STANDBY : CPU_STATE_CONFIGURED;
		cpu_set_polarization(cpu, POLARIZATION_UNKNOWN);
		set_cpu_present(cpu, true);
		if (sysfs_add && smp_add_present_cpu(cpu) != 0)
			set_cpu_present(cpu, false);
		else
			nr++;
		cpu = cpumask_next(cpu, &avail);
	}
	return nr;
}

666 667 668 669 670
/*
 * Boot time cpu detection: find out the type of the boot cpu, count the
 * configured and standby cpus of that type, collect the save areas of
 * the configured ones and make the detected cpus present. Failure to
 * get the cpu info block is fatal.
 */
static void __init smp_detect_cpus(void)
{
	unsigned int cpu, c_cpus, s_cpus;
	struct sclp_cpu_info *info;

	info = smp_get_cpu_info();
	if (!info)
		panic("smp_detect_cpus failed to allocate memory\n");
	if (info->has_cpu_type) {
		for (cpu = 0; cpu < info->combined; cpu++) {
			if (info->cpu[cpu].address != boot_cpu_address)
				continue;
			/* The boot cpu dictates the cpu type. */
			boot_cpu_type = info->cpu[cpu].type;
			break;
		}
	}
	c_cpus = s_cpus = 0;
	for (cpu = 0; cpu < info->combined; cpu++) {
		if (info->has_cpu_type && info->cpu[cpu].type != boot_cpu_type)
			continue;
		/* The first info->configured entries are the configured cpus. */
		if (cpu < info->configured) {
			smp_get_save_area(c_cpus, info->cpu[cpu].address);
			c_cpus++;
		} else
			s_cpus++;
	}
	pr_info("%d configured CPUs, %d standby CPUs\n", c_cpus, s_cpus);
	get_online_cpus();
	__smp_rescan_cpus(info, 0);
	put_online_cpus();
	kfree(info);
}

L
Linus Torvalds 已提交
700
/*
701
 *	Activate a secondary processor.
L
Linus Torvalds 已提交
702
 */
M
Martin Schwidefsky 已提交
703
static void __cpuinit smp_start_secondary(void *cpuvoid)
L
Linus Torvalds 已提交
704
{
M
Martin Schwidefsky 已提交
705 706 707 708 709 710 711 712
	S390_lowcore.last_update_clock = get_clock();
	S390_lowcore.restart_stack = (unsigned long) restart_stack;
	S390_lowcore.restart_fn = (unsigned long) do_restart;
	S390_lowcore.restart_data = 0;
	S390_lowcore.restart_source = -1UL;
	restore_access_regs(S390_lowcore.access_regs_save_area);
	__ctl_load(S390_lowcore.cregs_save_area, 0, 15);
	__load_psw_mask(psw_kernel_bits | PSW_MASK_DAT);
713
	cpu_init();
714
	preempt_disable();
715 716
	init_cpu_timer();
	init_cpu_vtimer();
H
Heiko Carstens 已提交
717
	pfault_init();
718
	notify_cpu_starting(smp_processor_id());
719
	ipi_call_lock();
720
	set_cpu_online(smp_processor_id(), true);
721
	ipi_call_unlock();
L
Linus Torvalds 已提交
722
	local_irq_enable();
723 724
	/* cpu_idle will call schedule for us */
	cpu_idle();
L
Linus Torvalds 已提交
725 726 727
}

/* Upping and downing of CPUs */
728
/*
 * Bring logical cpu @cpu online with @tidle as its idle task.
 *
 * Returns -EIO if the cpu is not in configured state or does not accept
 * the initial cpu reset, or the error from pcpu_alloc_lowcore().
 * Otherwise the cpu is started in smp_start_secondary() and this
 * function returns 0 once the cpu has marked itself online; the wait
 * has no timeout.
 */
int __cpuinit __cpu_up(unsigned int cpu, struct task_struct *tidle)
{
	struct pcpu *pcpu;
	int rc;

	pcpu = pcpu_devices + cpu;
	if (pcpu->state != CPU_STATE_CONFIGURED)
		return -EIO;
	if (pcpu_sigp_retry(pcpu, sigp_initial_cpu_reset, 0) !=
	    sigp_order_code_accepted)
		return -EIO;

	rc = pcpu_alloc_lowcore(pcpu, cpu);
	if (rc)
		return rc;
	pcpu_prepare_secondary(pcpu, cpu);
	pcpu_attach_task(pcpu, tidle);
	pcpu_start_fn(pcpu, smp_start_secondary, NULL);
	while (!cpu_online(cpu))
		cpu_relax();
	return 0;
}

751
/*
 * Handler for the "possible_cpus=" kernel parameter.
 *
 * The possible mask is reset to cpu 0 only and then extended with cpus
 * 1 to max - 1, limited by nr_cpu_ids. A value that kstrtoint() cannot
 * parse is ignored and leaves the mask untouched. Always returns 0.
 */
static int __init setup_possible_cpus(char *s)
{
	int max, cpu;

	if (kstrtoint(s, 0, &max) < 0)
		return 0;
	init_cpu_possible(cpumask_of(0));
	for (cpu = 1; cpu < max && cpu < nr_cpu_ids; cpu++)
		set_cpu_possible(cpu, true);
	return 0;
}
early_param("possible_cpus", setup_possible_cpus);

764 765
#ifdef CONFIG_HOTPLUG_CPU

766
int __cpu_disable(void)
L
Linus Torvalds 已提交
767
{
M
Martin Schwidefsky 已提交
768
	unsigned long cregs[16];
L
Linus Torvalds 已提交
769

M
Martin Schwidefsky 已提交
770 771
	set_cpu_online(smp_processor_id(), false);
	/* Disable pseudo page faults on this cpu. */
H
Heiko Carstens 已提交
772
	pfault_fini();
M
Martin Schwidefsky 已提交
773 774 775 776 777 778
	/* Disable interrupt sources via control register. */
	__ctl_store(cregs, 0, 15);
	cregs[0]  &= ~0x0000ee70UL;	/* disable all external interrupts */
	cregs[6]  &= ~0xff000000UL;	/* disable all I/O interrupts */
	cregs[14] &= ~0x1f000000UL;	/* disable most machine checks */
	__ctl_load(cregs, 0, 15);
L
Linus Torvalds 已提交
779 780 781
	return 0;
}

782
void __cpu_die(unsigned int cpu)
L
Linus Torvalds 已提交
783
{
M
Martin Schwidefsky 已提交
784 785
	struct pcpu *pcpu;

L
Linus Torvalds 已提交
786
	/* Wait until target cpu is down */
M
Martin Schwidefsky 已提交
787 788
	pcpu = pcpu_devices + cpu;
	while (!pcpu_stopped(pcpu))
L
Linus Torvalds 已提交
789
		cpu_relax();
M
Martin Schwidefsky 已提交
790
	pcpu_free_lowcore(pcpu);
791
	atomic_dec(&init_mm.context.attach_count);
L
Linus Torvalds 已提交
792 793
}

794
/*
 * Final step of taking the calling cpu offline: leave the idle task
 * context and send a stop order to ourselves. Does not return.
 */
void __noreturn cpu_die(void)
{
	idle_task_exit();
	pcpu_sigp_retry(pcpu_devices + smp_processor_id(), sigp_stop, 0);
	/* Spin until the stop order takes effect. */
	for (;;) ;
}

801 802
#endif /* CONFIG_HOTPLUG_CPU */

L
Linus Torvalds 已提交
803 804
/*
 * Register do_ext_call_interrupt() for both inter-processor interrupt
 * codes and detect the cpus of the machine. @max_cpus is not used.
 * A failing registration is fatal.
 */
void __init smp_prepare_cpus(unsigned int max_cpus)
{
	/* request the 0x1201 emergency signal external interrupt */
	if (register_external_interrupt(0x1201, do_ext_call_interrupt) != 0)
		panic("Couldn't request external interrupt 0x1201");
	/* request the 0x1202 external call external interrupt */
	if (register_external_interrupt(0x1202, do_ext_call_interrupt) != 0)
		panic("Couldn't request external interrupt 0x1202");
	smp_detect_cpus();
}

H
Heiko Carstens 已提交
814
/*
 * Initialize pcpu_devices[0] for the boot cpu from the state the cpu is
 * already running with (cpu address, prefix, stacks) and mark logical
 * cpu 0 present and online.
 */
void __init smp_prepare_boot_cpu(void)
{
	struct pcpu *pcpu = pcpu_devices;

	boot_cpu_address = stap();
	pcpu->state = CPU_STATE_CONFIGURED;
	pcpu->address = boot_cpu_address;
	pcpu->lowcore = (struct _lowcore *)(unsigned long) store_prefix();
	/*
	 * The lowcore holds the end of each stack area, struct pcpu the
	 * start (see pcpu_alloc_lowcore() for the reverse calculation).
	 */
	pcpu->async_stack = S390_lowcore.async_stack - ASYNC_SIZE;
	pcpu->panic_stack = S390_lowcore.panic_stack - PAGE_SIZE;
	S390_lowcore.percpu_offset = __per_cpu_offset[0];
	cpu_set_polarization(0, POLARIZATION_UNKNOWN);
	set_cpu_present(0, true);
	set_cpu_online(0, true);
}

H
Heiko Carstens 已提交
830
/* Nothing to do here; @max_cpus is ignored. */
void __init smp_cpus_done(unsigned int max_cpus)
{
}

834 835 836 837 838
/* Record logical cpu number 0 in the lowcore of the calling cpu. */
void __init smp_setup_processor_id(void)
{
	S390_lowcore.cpu_nr = 0;
}

L
Linus Torvalds 已提交
839 840 841 842 843 844 845 846
/*
 * the frequency of the profiling timer can be changed
 * by writing a multiplier value into /proc/profile.
 *
 * usually you want to run this on all CPUs ;)
 */
int setup_profiling_timer(unsigned int multiplier)
{
	/* @multiplier is accepted but not acted upon. */
	return 0;
}

850
#ifdef CONFIG_HOTPLUG_CPU
851
static ssize_t cpu_configure_show(struct device *dev,
M
Martin Schwidefsky 已提交
852
				  struct device_attribute *attr, char *buf)
853 854 855 856
{
	ssize_t count;

	mutex_lock(&smp_cpu_state_mutex);
M
Martin Schwidefsky 已提交
857
	count = sprintf(buf, "%d\n", pcpu_devices[dev->id].state);
858 859 860 861
	mutex_unlock(&smp_cpu_state_mutex);
	return count;
}

862
static ssize_t cpu_configure_store(struct device *dev,
M
Martin Schwidefsky 已提交
863 864
				   struct device_attribute *attr,
				   const char *buf, size_t count)
865
{
M
Martin Schwidefsky 已提交
866 867
	struct pcpu *pcpu;
	int cpu, val, rc;
868 869 870 871 872 873
	char delim;

	if (sscanf(buf, "%d %c", &val, &delim) != 1)
		return -EINVAL;
	if (val != 0 && val != 1)
		return -EINVAL;
874
	get_online_cpus();
H
Heiko Carstens 已提交
875
	mutex_lock(&smp_cpu_state_mutex);
876
	rc = -EBUSY;
877
	/* disallow configuration changes of online cpus and cpu 0 */
M
Martin Schwidefsky 已提交
878
	cpu = dev->id;
879
	if (cpu_online(cpu) || cpu == 0)
880
		goto out;
M
Martin Schwidefsky 已提交
881
	pcpu = pcpu_devices + cpu;
882 883 884
	rc = 0;
	switch (val) {
	case 0:
M
Martin Schwidefsky 已提交
885 886 887 888 889 890 891 892
		if (pcpu->state != CPU_STATE_CONFIGURED)
			break;
		rc = sclp_cpu_deconfigure(pcpu->address);
		if (rc)
			break;
		pcpu->state = CPU_STATE_STANDBY;
		cpu_set_polarization(cpu, POLARIZATION_UNKNOWN);
		topology_expect_change();
893 894
		break;
	case 1:
M
Martin Schwidefsky 已提交
895 896 897 898 899 900 901 902
		if (pcpu->state != CPU_STATE_STANDBY)
			break;
		rc = sclp_cpu_configure(pcpu->address);
		if (rc)
			break;
		pcpu->state = CPU_STATE_CONFIGURED;
		cpu_set_polarization(cpu, POLARIZATION_UNKNOWN);
		topology_expect_change();
903 904 905 906 907 908
		break;
	default:
		break;
	}
out:
	mutex_unlock(&smp_cpu_state_mutex);
H
Heiko Carstens 已提交
909
	put_online_cpus();
910 911
	return rc ? rc : count;
}
912
static DEVICE_ATTR(configure, 0644, cpu_configure_show, cpu_configure_store);
913 914
#endif /* CONFIG_HOTPLUG_CPU */

915 916
static ssize_t show_cpu_address(struct device *dev,
				struct device_attribute *attr, char *buf)
917
{
M
Martin Schwidefsky 已提交
918
	return sprintf(buf, "%d\n", pcpu_devices[dev->id].address);
919
}
920
static DEVICE_ATTR(address, 0444, show_cpu_address, NULL);
921 922 923

static struct attribute *cpu_common_attrs[] = {
#ifdef CONFIG_HOTPLUG_CPU
924
	&dev_attr_configure.attr,
925
#endif
926
	&dev_attr_address.attr,
927 928 929 930 931 932
	NULL,
};

/* sysfs group made up of the cpu_common_attrs[] attributes */
static struct attribute_group cpu_common_attr_group = {
	.attrs = cpu_common_attrs,
};
L
Linus Torvalds 已提交
933

934 935
static ssize_t show_capability(struct device *dev,
				struct device_attribute *attr, char *buf)
936 937 938 939 940 941 942 943 944
{
	unsigned int capability;
	int rc;

	rc = get_cpu_capability(&capability);
	if (rc)
		return rc;
	return sprintf(buf, "%u\n", capability);
}
945
static DEVICE_ATTR(capability, 0444, show_capability, NULL);
946

947 948
static ssize_t show_idle_count(struct device *dev,
				struct device_attribute *attr, char *buf)
949
{
M
Martin Schwidefsky 已提交
950
	struct s390_idle_data *idle = &per_cpu(s390_idle, dev->id);
951
	unsigned long long idle_count;
952
	unsigned int sequence;
953

M
Martin Schwidefsky 已提交
954 955 956 957 958 959
	do {
		sequence = ACCESS_ONCE(idle->sequence);
		idle_count = ACCESS_ONCE(idle->idle_count);
		if (ACCESS_ONCE(idle->idle_enter))
			idle_count++;
	} while ((sequence & 1) || (idle->sequence != sequence));
960 961
	return sprintf(buf, "%llu\n", idle_count);
}
962
/* Read-only (0444) "idle_count" device attribute served by show_idle_count(). */
static DEVICE_ATTR(idle_count, 0444, show_idle_count, NULL);
963

964 965
static ssize_t show_idle_time(struct device *dev,
				struct device_attribute *attr, char *buf)
966
{
M
Martin Schwidefsky 已提交
967 968
	struct s390_idle_data *idle = &per_cpu(s390_idle, dev->id);
	unsigned long long now, idle_time, idle_enter, idle_exit;
969
	unsigned int sequence;
970

M
Martin Schwidefsky 已提交
971 972 973 974 975 976 977 978
	do {
		now = get_clock();
		sequence = ACCESS_ONCE(idle->sequence);
		idle_time = ACCESS_ONCE(idle->idle_time);
		idle_enter = ACCESS_ONCE(idle->idle_enter);
		idle_exit = ACCESS_ONCE(idle->idle_exit);
	} while ((sequence & 1) || (idle->sequence != sequence));
	idle_time += idle_enter ? ((idle_exit ? : now) - idle_enter) : 0;
979
	return sprintf(buf, "%llu\n", idle_time >> 12);
980
}
981
/* Read-only (0444) "idle_time_us" device attribute served by show_idle_time(). */
static DEVICE_ATTR(idle_time_us, 0444, show_idle_time, NULL);
982

983
static struct attribute *cpu_online_attrs[] = {
984 985 986
	&dev_attr_capability.attr,
	&dev_attr_idle_count.attr,
	&dev_attr_idle_time_us.attr,
987 988 989
	NULL,
};

990 991
/*
 * Attribute group wrapping cpu_online_attrs. It is created for cpus that
 * are online and removed again from the cpu notifier on CPU_DEAD.
 */
static struct attribute_group cpu_online_attr_group = {
	.attrs = cpu_online_attrs,
};

994 995 996 997
/*
 * CPU notifier callback.
 *
 * CPU_ONLINE / CPU_ONLINE_FROZEN: clear the per-cpu s390_idle data of the
 * cpu and create the cpu_online_attr_group on its device.
 * CPU_DEAD / CPU_DEAD_FROZEN: remove that group again.
 * All other actions are ignored.
 *
 * @hcpu carries the cpu number. The result of the group creation (0 for
 * every other action) is translated with notifier_from_errno().
 */
static int __cpuinit smp_cpu_notify(struct notifier_block *self,
				    unsigned long action, void *hcpu)
{
	unsigned int cpu = (unsigned int)(long)hcpu;
	struct device *dev = &pcpu_devices[cpu].cpu.dev;
	int rc = 0;

	if (action == CPU_ONLINE || action == CPU_ONLINE_FROZEN) {
		/* Start with fresh idle statistics for this cpu. */
		memset(&per_cpu(s390_idle, cpu), 0,
		       sizeof(struct s390_idle_data));
		rc = sysfs_create_group(&dev->kobj, &cpu_online_attr_group);
	} else if (action == CPU_DEAD || action == CPU_DEAD_FROZEN) {
		sysfs_remove_group(&dev->kobj, &cpu_online_attr_group);
	}
	return notifier_from_errno(rc);
}

/* Notifier block that hooks smp_cpu_notify() into the cpu notifier chain. */
static struct notifier_block __cpuinitdata smp_cpu_nb = {
	.notifier_call = smp_cpu_notify,
};

1022
/*
 * Register the cpu device for @cpu and create its sysfs attributes.
 *
 * The cpu is marked hotpluggable and registered. The common attribute
 * group is always created; the online attribute group only if the cpu is
 * online. Finally topology_cpu_init() is called for the cpu.
 *
 * Returns 0 on success. On failure everything set up so far is undone in
 * reverse order (unregister_cpu() only with CONFIG_HOTPLUG_CPU) and the
 * error code of the failing step is returned.
 */
static int __devinit smp_add_present_cpu(int cpu)
{
	struct cpu *cpu_dev = &pcpu_devices[cpu].cpu;
	struct device *dev = &cpu_dev->dev;
	int err;

	cpu_dev->hotpluggable = 1;
	err = register_cpu(cpu_dev, cpu);
	if (err)
		return err;
	err = sysfs_create_group(&dev->kobj, &cpu_common_attr_group);
	if (err)
		goto undo_register;
	if (cpu_online(cpu)) {
		err = sysfs_create_group(&dev->kobj, &cpu_online_attr_group);
		if (err)
			goto undo_common;
	}
	err = topology_cpu_init(cpu_dev);
	if (!err)
		return 0;

	/* Topology setup failed: drop the online group if it was created. */
	if (cpu_online(cpu))
		sysfs_remove_group(&dev->kobj, &cpu_online_attr_group);
undo_common:
	sysfs_remove_group(&dev->kobj, &cpu_common_attr_group);
undo_register:
#ifdef CONFIG_HOTPLUG_CPU
	unregister_cpu(cpu_dev);
#endif
	return err;
}

#ifdef CONFIG_HOTPLUG_CPU
1059

1060
/*
 * Rescan the cpu configuration.
 *
 * Fetches the cpu info via smp_get_cpu_info() and hands it to
 * __smp_rescan_cpus() while holding the cpu hotplug reference and
 * smp_cpu_state_mutex. A non-zero result of the rescan triggers
 * topology_schedule_update().
 *
 * Returns 0, or -ENOMEM if no cpu info could be obtained.
 */
int __ref smp_rescan_cpus(void)
{
	struct sclp_cpu_info *cpu_info = smp_get_cpu_info();
	int changed;

	if (!cpu_info)
		return -ENOMEM;

	get_online_cpus();
	mutex_lock(&smp_cpu_state_mutex);
	changed = __smp_rescan_cpus(cpu_info, 1);
	mutex_unlock(&smp_cpu_state_mutex);
	put_online_cpus();

	kfree(cpu_info);
	if (changed)
		topology_schedule_update();
	return 0;
}

1079 1080
/*
 * sysfs "rescan" store handler.
 *
 * Any write triggers smp_rescan_cpus(); the written data itself is not
 * looked at.
 *
 * Returns @count on success, otherwise the error code returned by
 * smp_rescan_cpus().
 */
static ssize_t __ref rescan_store(struct device *dev,
				  struct device_attribute *attr,
				  const char *buf,
				  size_t count)
{
	int err = smp_rescan_cpus();

	if (err)
		return err;
	return count;
}
1089
/* Write-only (0200) "rescan" device attribute handled by rescan_store(). */
static DEVICE_ATTR(rescan, 0200, NULL, rescan_store);
1090 1091
#endif /* CONFIG_HOTPLUG_CPU */

1092
/*
 * Init call: set up the sysfs side of the cpu handling.
 *
 * Registers the cpu notifier, creates the "rescan" attribute on the cpu
 * subsystem root device (CONFIG_HOTPLUG_CPU only) and adds every present
 * cpu via smp_add_present_cpu().
 *
 * Returns 0 on success or the error code of the first step that failed;
 * steps that already succeeded are not undone.
 */
static int __init s390_smp_init(void)
{
	int cpu, rc = 0;

	register_cpu_notifier(&smp_cpu_nb);
#ifdef CONFIG_HOTPLUG_CPU
	rc = device_create_file(cpu_subsys.dev_root, &dev_attr_rescan);
	if (rc)
		return rc;
#endif
	for_each_present_cpu(cpu) {
		rc = smp_add_present_cpu(cpu);
		if (rc)
			break;
	}
	return rc;
}
1109
/* Run s390_smp_init() as a subsys-level initcall. */
subsys_initcall(s390_smp_init);