smp.c 21.0 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3
/*
 *  arch/s390/kernel/smp.c
 *
4
 *    Copyright (C) IBM Corp. 1999,2006
L
Linus Torvalds 已提交
5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32
 *    Author(s): Denis Joseph Barrow (djbarrow@de.ibm.com,barrow_dj@yahoo.com),
 *               Martin Schwidefsky (schwidefsky@de.ibm.com)
 *               Heiko Carstens (heiko.carstens@de.ibm.com)
 *
 *  based on other smp stuff by 
 *    (c) 1995 Alan Cox, CymruNET Ltd  <alan@cymru.net>
 *    (c) 1998 Ingo Molnar
 *
 * We work with logical cpu numbering everywhere we can. The only
 * functions using the real cpu address (got from STAP) are the sigp
 * functions. For all other functions we use the identity mapping.
 * That means that cpu_number_map[i] == i for every cpu. cpu_number_map is
 * used e.g. to find the idle task belonging to a logical cpu. Every array
 * in the kernel is sorted by the logical cpu number and not by the physical
 * one which is causing all the confusion with __cpu_logical_map and
 * cpu_number_map in other architectures.
 */

#include <linux/module.h>
#include <linux/init.h>
#include <linux/mm.h>
#include <linux/spinlock.h>
#include <linux/kernel_stat.h>
#include <linux/smp_lock.h>
#include <linux/delay.h>
#include <linux/cache.h>
#include <linux/interrupt.h>
#include <linux/cpu.h>
33
#include <linux/timex.h>
M
Michael Holzheu 已提交
34
#include <linux/bootmem.h>
M
Michael Holzheu 已提交
35
#include <asm/ipl.h>
36
#include <asm/setup.h>
L
Linus Torvalds 已提交
37 38 39 40 41 42
#include <asm/sigp.h>
#include <asm/pgalloc.h>
#include <asm/irq.h>
#include <asm/s390_ext.h>
#include <asm/cpcmd.h>
#include <asm/tlbflush.h>
43
#include <asm/timer.h>
M
Michael Holzheu 已提交
44
#include <asm/lowcore.h>
L
Linus Torvalds 已提交
45 46 47 48 49 50 51 52 53

extern volatile int __cpu_logical_map[];

/*
 * An array with a pointer to the lowcore of every CPU.
 */

struct _lowcore *lowcore_ptr[NR_CPUS];

54 55
/*
 * CPUs that are currently online. In this file bits are set by
 * smp_prepare_boot_cpu() and start_secondary() and cleared by
 * __cpu_disable().
 */
cpumask_t cpu_online_map = CPU_MASK_NONE;
/*
 * CPU numbers for which smp_prepare_cpus() allocates a lowcore and an idle
 * task; filled in by smp_setup_cpu_possible_map().
 */
cpumask_t cpu_possible_map = CPU_MASK_NONE;
L
Linus Torvalds 已提交
56 57 58 59 60 61

static struct task_struct *current_set[NR_CPUS];

static void smp_ext_bitcall(int, ec_bit_sig);

/*
J
Jan Glauber 已提交
62 63
 * Structure and data for __smp_call_function_map(). This is designed to
 * minimise static memory requirements. It also looks cleaner.
L
Linus Torvalds 已提交
64 65 66 67 68 69
 */
static DEFINE_SPINLOCK(call_lock);

struct call_data_struct {
	void (*func) (void *info);
	void *info;
J
Jan Glauber 已提交
70 71
	cpumask_t started;
	cpumask_t finished;
L
Linus Torvalds 已提交
72 73 74 75 76 77 78 79 80 81 82 83 84 85
	int wait;
};

/*
 * Request currently being distributed; assigned by __smp_call_function_map()
 * while call_lock is held and read by do_call_function() on the targets.
 */
static struct call_data_struct * call_data;

/*
 * 'Call function' interrupt callback
 */
static void do_call_function(void)
{
	void (*func) (void *info);
	void *info;
	int wait;

	/*
	 * Take private copies before announcing ourselves in ->started: the
	 * request lives on the initiator's stack and, if the initiator does
	 * not wait for completion, it may go away once all targets started.
	 */
	func = call_data->func;
	info = call_data->info;
	wait = call_data->wait;
	cpu_set(smp_processor_id(), call_data->started);

	func(info);

	if (!wait)
		return;
	/* The initiator is polling ->finished, so the request is still live. */
	cpu_set(smp_processor_id(), call_data->finished);
}

J
Jan Glauber 已提交
92 93
/*
 * Run func(info) on every online CPU contained in map. Remote CPUs are
 * signalled first; if the calling CPU is part of map the function is run
 * locally afterwards with interrupts disabled. The nonatomic argument is not
 * used. With wait set, the remote calls are complete before the local one
 * starts.
 */
static void __smp_call_function_map(void (*func) (void *info), void *info,
				    int nonatomic, int wait, cpumask_t map)
{
	struct call_data_struct data;
	int target;
	int run_local = 0;

	/*
	 * Can deadlock when interrupts are disabled or if in wrong context.
	 */
	WARN_ON(irqs_disabled() || in_irq());

	/*
	 * The local call is split off from the remote ones. We have to have
	 * the same call order as in on_each_cpu() because of
	 * machine_restart_smp().
	 */
	if (cpu_isset(smp_processor_id(), map)) {
		run_local = 1;
		cpu_clear(smp_processor_id(), map);
	}

	/* Only CPUs that are online can be signalled. */
	cpus_and(map, map, cpu_online_map);
	if (!cpus_empty(map)) {
		data.func = func;
		data.info = info;
		data.started = CPU_MASK_NONE;
		data.wait = wait;
		if (wait)
			data.finished = CPU_MASK_NONE;

		spin_lock_bh(&call_lock);
		call_data = &data;

		for_each_cpu_mask(target, map)
			smp_ext_bitcall(target, ec_call_function);

		/* Every target must have copied the request ... */
		while (!cpus_equal(map, data.started))
			cpu_relax();

		/* ... and, if requested, must have finished running it. */
		if (wait) {
			while (!cpus_equal(map, data.finished))
				cpu_relax();
		}

		spin_unlock_bh(&call_lock);
	}

	local_irq_disable();
	if (run_local)
		func(info);
	local_irq_enable();
}

/*
J
Jan Glauber 已提交
147 148 149 150 151
 * smp_call_function:
 * @func: the function to run; this must be fast and non-blocking
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait (atomically) until function has completed on other CPUs
L
Linus Torvalds 已提交
152
 *
J
Jan Glauber 已提交
153
 * Run a function on all other CPUs.
L
Linus Torvalds 已提交
154
 *
J
Jan Glauber 已提交
155
 * You must not call this function with disabled interrupts or from a
156
 * hardware interrupt handler. You may call it from a bottom half.
L
Linus Torvalds 已提交
157
 */
J
Jan Glauber 已提交
158 159
int smp_call_function(void (*func) (void *info), void *info, int nonatomic,
		      int wait)
L
Linus Torvalds 已提交
160
{
J
Jan Glauber 已提交
161
	cpumask_t map;
L
Linus Torvalds 已提交
162

163
	preempt_disable();
J
Jan Glauber 已提交
164 165 166
	map = cpu_online_map;
	cpu_clear(smp_processor_id(), map);
	__smp_call_function_map(func, info, nonatomic, wait, map);
167
	preempt_enable();
J
Jan Glauber 已提交
168 169 170
	return 0;
}
EXPORT_SYMBOL(smp_call_function);
L
Linus Torvalds 已提交
171

J
Jan Glauber 已提交
172 173 174 175 176 177 178 179 180 181 182
/*
 * smp_call_function_on:
 * @func: the function to run; this must be fast and non-blocking
 * @info: an arbitrary pointer to pass to the function
 * @nonatomic: unused
 * @wait: if true, wait (atomically) until function has completed on other CPUs
 * @cpu: the CPU where func should run
 *
 * Run a function on one processor.
 *
 * You must not call this function with disabled interrupts or from a
183
 * hardware interrupt handler. You may call it from a bottom half.
J
Jan Glauber 已提交
184 185 186 187 188
 */
int smp_call_function_on(void (*func) (void *info), void *info, int nonatomic,
			  int wait, int cpu)
{
	cpumask_t target;

	/* Build a mask that contains nothing but the requested CPU. */
	target = CPU_MASK_NONE;
	cpu_set(cpu, target);

	preempt_disable();
	__smp_call_function_map(func, info, nonatomic, wait, target);
	preempt_enable();

	/* Always reports success. */
	return 0;
}
EXPORT_SYMBOL(smp_call_function_on);

198
static void do_send_stop(void)
L
Linus Torvalds 已提交
199 200 201 202 203 204 205 206 207 208 209 210 211
{
        int cpu, rc;

        /* stop all processors */
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		do {
			rc = signal_processor(cpu, sigp_stop);
		} while (rc == sigp_busy);
	}
}

212
static void do_store_status(void)
L
Linus Torvalds 已提交
213 214 215 216 217 218 219 220 221 222 223 224 225 226 227
{
        int cpu, rc;

        /* store status of all processors in their lowcores (real 0) */
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		do {
			rc = signal_processor_p(
				(__u32)(unsigned long) lowcore_ptr[cpu], cpu,
				sigp_store_status_at_address);
		} while(rc == sigp_busy);
        }
}

228
static void do_wait_for_stop(void)
H
Heiko Carstens 已提交
229 230 231 232 233 234 235 236 237 238 239 240
{
	int cpu;

	/* Wait for all other cpus to enter stopped state */
	for_each_online_cpu(cpu) {
		if (cpu == smp_processor_id())
			continue;
		while(!smp_cpu_not_running(cpu))
			cpu_relax();
	}
}

L
Linus Torvalds 已提交
241 242 243 244 245 246
/*
 * this function sends a 'stop' sigp to all other CPUs in the system.
 * it goes straight through.
 */
void smp_send_stop(void)
{
H
Heiko Carstens 已提交
247
	/* Disable all interrupts/machine checks */
G
Gerald Schaefer 已提交
248
	__load_psw_mask(psw_kernel_bits & ~PSW_MASK_MCHECK);
H
Heiko Carstens 已提交
249

L
Linus Torvalds 已提交
250 251 252 253 254 255
        /* write magic number to zero page (absolute 0) */
	lowcore_ptr[smp_processor_id()]->panic_magic = __PANIC_MAGIC;

	/* stop other processors. */
	do_send_stop();

H
Heiko Carstens 已提交
256 257 258
	/* wait until other processors are stopped */
	do_wait_for_stop();

L
Linus Torvalds 已提交
259 260 261 262 263 264 265 266 267 268
	/* store status of other processors. */
	do_store_status();
}

/*
 * Reboot, halt and power_off routines for SMP.
 */

void machine_restart_smp(char * __unused)
{
	/* Stop all other CPUs first, then re-IPL from the calling CPU. */
	smp_send_stop();
	do_reipl();
}

void machine_halt_smp(void)
{
	smp_send_stop();

	/* Under VM, issue the configured halt command if there is one. */
	if (MACHINE_IS_VM) {
		if (strlen(vmhalt_cmd) > 0)
			__cpcmd(vmhalt_cmd, NULL, 0, NULL);
	}

	/* Finally stop the calling CPU itself and never return. */
	signal_processor(smp_processor_id(), sigp_stop_and_store_status);
	while (1)
		;
}

void machine_power_off_smp(void)
{
	smp_send_stop();

	/* Under VM, issue the configured power-off command if there is one. */
	if (MACHINE_IS_VM) {
		if (strlen(vmpoff_cmd) > 0)
			__cpcmd(vmpoff_cmd, NULL, 0, NULL);
	}

	/* Finally stop the calling CPU itself and never return. */
	signal_processor(smp_processor_id(), sigp_stop_and_store_status);
	while (1)
		;
}

/*
 * This is the main routine where commands issued by other
 * cpus are handled.
 */

296
static void do_ext_call_interrupt(__u16 code)
{
	unsigned long pending;

	/*
	 * Fetch and clear the pending bit signals in one step.
	 *
	 * Nothing has to be done for ec_schedule: all the work happens
	 * automatically on return from the interrupt.
	 */
	pending = xchg(&S390_lowcore.ext_call_fast, 0);

	if (!test_bit(ec_call_function, &pending))
		return;
	do_call_function();
}

/*
 * Send an external call sigp to another cpu and return without waiting
 * for its completion.
 */
static void smp_ext_bitcall(int cpu, ec_bit_sig sig)
{
	unsigned long *pending;

	/* Post the signal bit in the lowcore of the target cpu ... */
	pending = (unsigned long *) &lowcore_ptr[cpu]->ext_call_fast;
	set_bit(sig, pending);

	/* ... then kick it, backing off 10us whenever it reports busy. */
	for (;;) {
		if (signal_processor(cpu, sigp_emergency_signal) != sigp_busy)
			break;
		udelay(10);
	}
}

326
#ifndef CONFIG_64BIT
L
Linus Torvalds 已提交
327 328 329 330 331 332 333 334 335 336 337 338 339
/*
 * this function sends a 'purge tlb' signal to another CPU.
 */
void smp_ptlb_callback(void *info)
{
	/* Per-cpu worker for smp_ptlb_all(); info is not used. */
	local_flush_tlb();
}

void smp_ptlb_all(void)
{
        /* Run smp_ptlb_callback() on each cpu; last argument 1 = wait. */
        on_each_cpu(smp_ptlb_callback, NULL, 0, 1);
}
EXPORT_SYMBOL(smp_ptlb_all);
340
#endif /* ! CONFIG_64BIT */
L
Linus Torvalds 已提交
341 342 343 344 345 346 347 348 349 350 351 352 353 354

/*
 * this function sends a 'reschedule' IPI to another CPU.
 * it goes straight through and wastes no time serializing
 * anything. Worst case is that we lose a reschedule ...
 */
void smp_send_reschedule(int cpu)
{
        /*
         * Only the ec_schedule bit is posted; do_ext_call_interrupt() has no
         * explicit handling for it.
         */
        smp_ext_bitcall(cpu, ec_schedule);
}

/*
 * parameter area for the set/clear control bit callbacks
 */
355
struct ec_creg_mask_parms {
	/* per control register: bits to be switched on */
	unsigned long orvals[16];
	/* per control register: bits to be kept (cleared where zero) */
	unsigned long andvals[16];
};
L
Linus Torvalds 已提交
359 360 361 362

/*
 * callback for setting/clearing control bits
 */
363
static void smp_ctl_bit_callback(void *info) {
364
	struct ec_creg_mask_parms *pp = info;
L
Linus Torvalds 已提交
365 366 367
	unsigned long cregs[16];
	int i;
	
368 369
	__ctl_store(cregs, 0, 15);
	for (i = 0; i <= 15; i++)
L
Linus Torvalds 已提交
370
		cregs[i] = (cregs[i] & pp->andvals[i]) | pp->orvals[i];
371
	__ctl_load(cregs, 0, 15);
L
Linus Torvalds 已提交
372 373 374 375 376
}

/*
 * Set a bit in a control register of all cpus
 */
377 378 379
void smp_ctl_set_bit(int cr, int bit)
{
	struct ec_creg_mask_parms parms;
L
Linus Torvalds 已提交
380

381 382
	memset(&parms.orvals, 0, sizeof(parms.orvals));
	memset(&parms.andvals, 0xff, sizeof(parms.andvals));
L
Linus Torvalds 已提交
383
	parms.orvals[cr] = 1 << bit;
384
	on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
L
Linus Torvalds 已提交
385 386 387 388 389
}

/*
 * Clear a bit in a control register of all cpus
 */
390 391 392
void smp_ctl_clear_bit(int cr, int bit)
{
	struct ec_creg_mask_parms parms;
L
Linus Torvalds 已提交
393

394 395
	memset(&parms.orvals, 0, sizeof(parms.orvals));
	memset(&parms.andvals, 0xff, sizeof(parms.andvals));
L
Linus Torvalds 已提交
396
	parms.andvals[cr] = ~(1L << bit);
397
	on_each_cpu(smp_ctl_bit_callback, &parms, 0, 1);
L
Linus Torvalds 已提交
398 399
}

M
Michael Holzheu 已提交
400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458
#if defined(CONFIG_ZFCPDUMP) || defined(CONFIG_ZFCPDUMP_MODULE)

/*
 * zfcpdump_prefix_array holds prefix registers for the following scenario:
 * 64 bit zfcpdump kernel and 31 bit kernel which is to be dumped. We have to
 * save its prefix registers, since they get lost, when switching from 31 bit
 * to 64 bit.
 */
unsigned int zfcpdump_prefix_array[NR_CPUS + 1] \
	__attribute__((__section__(".data")));

/*
 * Collect the register save areas of all cpus other than the boot cpu.
 * Does nothing unless the system was IPLed as an FCP dump.
 *
 * Every possible cpu address is probed through logical cpu 1. Each cpu that
 * is operational is stopped with "stop and store status", and the stored
 * area is copied into a freshly allocated zfcpdump_save_areas[] slot. Slots
 * are handed out starting at index 1.
 */
static void __init smp_get_save_areas(void)
{
	unsigned int cpu, cpu_num, rc;
	__u16 boot_cpu_addr;

	if (ipl_info.type != IPL_TYPE_FCP_DUMP)
		return;
	boot_cpu_addr = S390_lowcore.cpu_data.cpu_addr;
	cpu_num = 1;
	for (cpu = 0; cpu <= 65535; cpu++) {
		if ((u16) cpu == boot_cpu_addr)
			continue;
		/* Temporarily map logical cpu 1 to the probed address. */
		__cpu_logical_map[1] = (__u16) cpu;
		if (signal_processor(1, sigp_sense) == sigp_not_operational)
			continue;
		if (cpu_num >= NR_CPUS) {
			/* No slot left: report it and keep scanning. */
			printk("WARNING: Registers for cpu %u are not "
			       "saved, since dump kernel was compiled with "
			       "NR_CPUS=%i!\n", cpu_num, NR_CPUS);
			continue;
		}
		zfcpdump_save_areas[cpu_num] =
			alloc_bootmem(sizeof(union save_area));
		/* Retry the order for as long as the cpu reports busy. */
		while (1) {
			rc = signal_processor(1, sigp_stop_and_store_status);
			if (rc != sigp_busy)
				break;
			cpu_relax();
		}
		/* The source is SAVE_AREA_BASE relative to store_prefix(). */
		memcpy(zfcpdump_save_areas[cpu_num],
		       (void *)(unsigned long) store_prefix() +
		       SAVE_AREA_BASE, SAVE_AREA_SIZE);
#ifdef __s390x__
		/* copy original prefix register */
		zfcpdump_save_areas[cpu_num]->s390x.pref_reg =
			zfcpdump_prefix_array[cpu_num];
#endif
		cpu_num++;
	}
}

union save_area *zfcpdump_save_areas[NR_CPUS + 1];
EXPORT_SYMBOL_GPL(zfcpdump_save_areas);

#else
#define smp_get_save_areas() do { } while (0)
#endif

L
Linus Torvalds 已提交
459 460 461 462
/*
 * Let's check how many CPUs we have.
 */

463 464
static unsigned int __init smp_count_cpus(void)
{
	unsigned int addr, found;
	__u16 boot_cpu_addr;

	/*
	 * cpu 0 is the boot cpu. See smp_prepare_boot_cpu.
	 */
	boot_cpu_addr = S390_lowcore.cpu_data.cpu_addr;
	current_thread_info()->cpu = 0;

	/*
	 * The boot cpu counts as the first one. Every other address is probed
	 * by temporarily mapping logical cpu 1 to it and sensing that cpu.
	 */
	found = 1;
	for (addr = 0; addr <= 65535; addr++) {
		if ((__u16) addr == boot_cpu_addr)
			continue;
		__cpu_logical_map[1] = (__u16) addr;
		if (signal_processor(1, sigp_sense) != sigp_not_operational)
			found++;
	}

	printk("Detected %d CPU's\n",(int) found);
	printk("Boot cpu address %2X\n", boot_cpu_addr);

	return found;
}

/*
 *      Activate a secondary processor.
 */
int __devinit start_secondary(void *cpuvoid)
{
	/* Basic per-cpu setup; preemption is switched off right after it. */
	cpu_init();
	preempt_disable();

	/* Enable TOD clock interrupts on the secondary cpu. */
	init_cpu_timer();
#ifdef CONFIG_VIRT_TIMER
	/* Enable cpu timer interrupts on the secondary cpu. */
	init_cpu_vtimer();
#endif
	/* Enable pfault pseudo page faults on this cpu. */
	pfault_init();

	/* __cpu_up() spins until this cpu shows up in cpu_online_map. */
	cpu_set(smp_processor_id(), cpu_online_map);
	/* Switch on interrupts */
	local_irq_enable();
	/* Print info about this processor */
	print_cpu_info(&S390_lowcore.cpu_data);
	/* cpu_idle will call schedule for us */
	cpu_idle();
	return 0;
}

/*
 * Fork the idle task for the given cpu and remember it in current_set[].
 * Panics if the fork fails.
 */
static void __init smp_create_idle(unsigned int cpu)
{
	struct task_struct *idle;

	/*
	 * The psw and regs settings of the forked task do not matter since
	 * it is never rescheduled.
	 */
	idle = fork_idle(cpu);
	if (IS_ERR(idle))
		panic("failed fork for CPU %u: %li", cpu, PTR_ERR(idle));

	current_set[cpu] = idle;
}

/* Reserving and releasing of CPUs */

/* Protects smp_cpu_reserved[]. */
static DEFINE_SPINLOCK(smp_reserve_lock);
/*
 * Per-cpu reservation counter: incremented by smp_get_cpu(), decremented by
 * smp_put_cpu(); __cpu_disable() refuses with -EBUSY while it is non-zero.
 */
static int smp_cpu_reserved[NR_CPUS];

/*
 * Reserve one cpu out of cpu_mask and return its number, or -ENODEV if the
 * mask contains neither an already reserved nor an online cpu. A cpu that is
 * already reserved is preferred over reserving a new one.
 */
int
smp_get_cpu(cpumask_t cpu_mask)
{
	unsigned long flags;
	int cpu;
	int chosen = -ENODEV;

	spin_lock_irqsave(&smp_reserve_lock, flags);

	/* First choice: a cpu somebody else has reserved already. */
	for_each_cpu_mask(cpu, cpu_mask) {
		if (smp_cpu_reserved[cpu] == 0)
			continue;
		chosen = cpu;
		break;
	}

	/* Otherwise take the first online cpu of the mask. */
	if (chosen < 0) {
		for_each_cpu_mask(cpu, cpu_mask) {
			if (!cpu_online(cpu))
				continue;
			chosen = cpu;
			break;
		}
	}

	if (chosen >= 0)
		smp_cpu_reserved[chosen]++;

	spin_unlock_irqrestore(&smp_reserve_lock, flags);
	return chosen;
}

/*
 * Drop one reservation of the given cpu (counterpart of smp_get_cpu()).
 * The cpu number is used as an array index without a range check and the
 * counter is decremented unconditionally.
 */
void
smp_put_cpu(int cpu)
{
	unsigned long flags;

	spin_lock_irqsave(&smp_reserve_lock, flags);
	smp_cpu_reserved[cpu]--;
	spin_unlock_irqrestore(&smp_reserve_lock, flags);
}

577
static int
L
Linus Torvalds 已提交
578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621
cpu_stopped(int cpu)
{
	__u32 status;

	/* Check for stopped state */
	if (signal_processor_ps(&status, 0, cpu, sigp_sense) == sigp_status_stored) {
		if (status & 0x40)
			return 1;
	}
	return 0;
}

/* Upping and downing of CPUs */

int
__cpu_up(unsigned int cpu)
{
	struct task_struct *idle;
        struct _lowcore    *cpu_lowcore;
	struct stack_frame *sf;
        sigp_ccode          ccode;
	int                 curr_cpu;

	for (curr_cpu = 0; curr_cpu <= 65535; curr_cpu++) {
		__cpu_logical_map[cpu] = (__u16) curr_cpu;
		if (cpu_stopped(cpu))
			break;
	}

	if (!cpu_stopped(cpu))
		return -ENODEV;

	ccode = signal_processor_p((__u32)(unsigned long)(lowcore_ptr[cpu]),
				   cpu, sigp_set_prefix);
	if (ccode){
		printk("sigp_set_prefix failed for cpu %d "
		       "with condition code %d\n",
		       (int) cpu, (int) ccode);
		return -EIO;
	}

	idle = current_set[cpu];
        cpu_lowcore = lowcore_ptr[cpu];
	cpu_lowcore->kernel_stack = (unsigned long)
A
Al Viro 已提交
622
		task_stack_page(idle) + (THREAD_SIZE);
L
Linus Torvalds 已提交
623 624 625 626 627 628 629
	sf = (struct stack_frame *) (cpu_lowcore->kernel_stack
				     - sizeof(struct pt_regs)
				     - sizeof(struct stack_frame));
	memset(sf, 0, sizeof(struct stack_frame));
	sf->gprs[9] = (unsigned long) sf;
	cpu_lowcore->save_area[15] = (unsigned long) sf;
	__ctl_store(cpu_lowcore->cregs_save_area[0], 0, 15);
630 631 632
	asm volatile(
		"	stam	0,15,0(%0)"
		: : "a" (&cpu_lowcore->access_regs_save_area) : "memory");
L
Linus Torvalds 已提交
633 634 635 636
	cpu_lowcore->percpu_offset = __per_cpu_offset[cpu];
        cpu_lowcore->current_task = (unsigned long) idle;
        cpu_lowcore->cpu_data.cpu_nr = cpu;
	eieio();
M
Michael Ryan 已提交
637 638 639

	while (signal_processor(cpu,sigp_restart) == sigp_busy)
		udelay(10);
L
Linus Torvalds 已提交
640 641 642 643 644 645

	while (!cpu_online(cpu))
		cpu_relax();
	return 0;
}

646
static unsigned int __initdata additional_cpus;
647
static unsigned int __initdata possible_cpus;
648 649 650

/*
 * Fill cpu_possible_map and cpu_present_map.
 *
 * possible = possible_cpus if that is non-zero, otherwise the number of
 * detected cpus plus additional_cpus; both are capped at NR_CPUS.
 * present  = detected cpus, capped at the number of possible cpus.
 */
void __init smp_setup_cpu_possible_map(void)
{
	unsigned int detected, limit, present, cpu;

	smp_get_save_areas();
	detected = smp_count_cpus();

	if (possible_cpus)
		limit = min(possible_cpus, (unsigned int) NR_CPUS);
	else
		limit = min(detected + additional_cpus,
			    (unsigned int) NR_CPUS);

	for (cpu = 0; cpu < limit; cpu++)
		cpu_set(cpu, cpu_possible_map);

	present = min(detected, limit);
	for (cpu = 0; cpu < present; cpu++)
		cpu_set(cpu, cpu_present_map);
}

#ifdef CONFIG_HOTPLUG_CPU

/*
 * Handler for the "additional_cpus" early parameter: stores the value parsed
 * by simple_strtoul() (base argument 0) in additional_cpus. Always returns 0;
 * the input is not validated here.
 */
static int __init setup_additional_cpus(char *s)
{
	additional_cpus = simple_strtoul(s, NULL, 0);
	return 0;
}
early_param("additional_cpus", setup_additional_cpus);

678 679 680 681 682 683 684
/*
 * Handler for the "possible_cpus" early parameter: stores the value parsed
 * by simple_strtoul() (base argument 0) in possible_cpus. Always returns 0;
 * the input is not validated here.
 */
static int __init setup_possible_cpus(char *s)
{
	possible_cpus = simple_strtoul(s, NULL, 0);
	return 0;
}
early_param("possible_cpus", setup_possible_cpus);

L
Linus Torvalds 已提交
685 686 687 688
int
__cpu_disable(void)
{
	unsigned long flags;
689
	struct ec_creg_mask_parms cr_parms;
Z
Zwane Mwaikambo 已提交
690
	int cpu = smp_processor_id();
L
Linus Torvalds 已提交
691 692

	spin_lock_irqsave(&smp_reserve_lock, flags);
Z
Zwane Mwaikambo 已提交
693
	if (smp_cpu_reserved[cpu] != 0) {
L
Linus Torvalds 已提交
694 695 696
		spin_unlock_irqrestore(&smp_reserve_lock, flags);
		return -EBUSY;
	}
Z
Zwane Mwaikambo 已提交
697
	cpu_clear(cpu, cpu_online_map);
L
Linus Torvalds 已提交
698 699

	/* Disable pfault pseudo page faults on this cpu. */
H
Heiko Carstens 已提交
700
	pfault_fini();
L
Linus Torvalds 已提交
701

702 703
	memset(&cr_parms.orvals, 0, sizeof(cr_parms.orvals));
	memset(&cr_parms.andvals, 0xff, sizeof(cr_parms.andvals));
L
Linus Torvalds 已提交
704

705
	/* disable all external interrupts */
L
Linus Torvalds 已提交
706 707 708 709 710 711 712 713 714 715
	cr_parms.orvals[0] = 0;
	cr_parms.andvals[0] = ~(1<<15 | 1<<14 | 1<<13 | 1<<12 |
				1<<11 | 1<<10 | 1<< 6 | 1<< 4);
	/* disable all I/O interrupts */
	cr_parms.orvals[6] = 0;
	cr_parms.andvals[6] = ~(1<<31 | 1<<30 | 1<<29 | 1<<28 |
				1<<27 | 1<<26 | 1<<25 | 1<<24);
	/* disable most machine checks */
	cr_parms.orvals[14] = 0;
	cr_parms.andvals[14] = ~(1<<28 | 1<<27 | 1<<26 | 1<<25 | 1<<24);
716

L
Linus Torvalds 已提交
717 718 719 720 721 722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740
	smp_ctl_bit_callback(&cr_parms);

	spin_unlock_irqrestore(&smp_reserve_lock, flags);
	return 0;
}

/*
 * Busy-wait until smp_cpu_not_running() reports the given cpu as no longer
 * running, then log that it has spun down. There is no timeout.
 */
void
__cpu_die(unsigned int cpu)
{
	/* Wait until target cpu is down */
	while (!smp_cpu_not_running(cpu))
		cpu_relax();
	printk("Processor %d spun down\n", cpu);
}

/*
 * Final step on a cpu that goes offline: leave the idle task context and
 * send a stop order to ourselves.
 */
void
cpu_die(void)
{
	idle_task_exit();
	signal_processor(smp_processor_id(), sigp_stop);
	/* NOTE(review): presumably only reached if the stop order failed. */
	BUG();
	for(;;);
}

741 742
#endif /* CONFIG_HOTPLUG_CPU */

L
Linus Torvalds 已提交
743 744 745 746 747 748 749 750 751 752
/*
 *	Cycle through the processors and setup structures.
 */

void __init smp_prepare_cpus(unsigned int max_cpus)
{
	unsigned long stack;
	unsigned int cpu;
	int lc_order;

	/* request the 0x1201 emergency signal external interrupt */
	if (register_external_interrupt(0x1201, do_ext_call_interrupt) != 0)
		panic("Couldn't request external interrupt 0x1201");

	memset(lowcore_ptr, 0, sizeof(lowcore_ptr));
	print_cpu_info(&S390_lowcore.cpu_data);

	/* A lowcore takes two pages with 8 byte pointers, one otherwise. */
	lc_order = sizeof(void *) == 8 ? 1 : 0;

	/*
	 *  Initialize prefix pages and stacks for all possible cpus
	 */
	for_each_possible_cpu(cpu) {
		struct _lowcore *lc;

		lc = (struct _lowcore *)
			__get_free_pages(GFP_KERNEL|GFP_DMA, lc_order);
		lowcore_ptr[cpu] = lc;
		stack = __get_free_pages(GFP_KERNEL,ASYNC_ORDER);
		if (lc == NULL || stack == 0ULL)
			panic("smp_boot_cpus failed to allocate memory\n");

		/* Start from a copy of the boot cpu's lowcore. */
		*lc = S390_lowcore;
		lc->async_stack = stack + (ASYNC_SIZE);

		stack = __get_free_pages(GFP_KERNEL,0);
		if (stack == 0ULL)
			panic("smp_boot_cpus failed to allocate memory\n");
		lc->panic_stack = stack + (PAGE_SIZE);
#ifndef CONFIG_64BIT
		if (MACHINE_HAS_IEEE) {
			lc->extended_save_area_addr =
				(__u32) __get_free_pages(GFP_KERNEL,0);
			if (lc->extended_save_area_addr == 0)
				panic("smp_boot_cpus failed to "
				      "allocate memory\n");
		}
#endif
	}
#ifndef CONFIG_64BIT
	if (MACHINE_HAS_IEEE)
		ctl_set_bit(14, 29); /* enable extended save area */
#endif
	/* From here on the calling cpu runs on its freshly allocated lowcore. */
	set_prefix((u32)(unsigned long) lowcore_ptr[smp_processor_id()]);

	/* Every other possible cpu gets its idle task right away. */
	for_each_possible_cpu(cpu) {
		if (cpu != smp_processor_id())
			smp_create_idle(cpu);
	}
}

/*
 * Register the boot cpu: it must be logical cpu 0 (BUG otherwise). Marks it
 * online, sets its per-cpu offset in the lowcore and records the current
 * task as current_set[0].
 */
void __devinit smp_prepare_boot_cpu(void)
{
	BUG_ON(smp_processor_id() != 0);

	cpu_set(0, cpu_online_map);
	S390_lowcore.percpu_offset = __per_cpu_offset[0];
	current_set[0] = current;
}

void smp_cpus_done(unsigned int max_cpus)
{
808
	cpu_present_map = cpu_possible_map;
L
Linus Torvalds 已提交
809 810 811 812 813 814 815 816 817 818 819 820 821 822 823
}

/*
 * the frequency of the profiling timer can be changed
 * by writing a multiplier value into /proc/profile.
 *
 * usually you want to run this on all CPUs ;)
 */
int setup_profiling_timer(unsigned int multiplier)
{
	/* The multiplier is accepted but has no effect here. */
	(void) multiplier;
	return 0;
}

static DEFINE_PER_CPU(struct cpu, cpu_devices);

824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858
/*
 * sysfs show routine for the "capability" attribute: prints the value
 * obtained from get_cpu_capability() as an unsigned decimal followed by a
 * newline, or returns the error code of that call.
 */
static ssize_t show_capability(struct sys_device *dev, char *buf)
{
	unsigned int capability;
	int rc = get_cpu_capability(&capability);

	return rc ? rc : sprintf(buf, "%u\n", capability);
}
static SYSDEV_ATTR(capability, 0444, show_capability, NULL);

/*
 * Cpu notifier: creates the capability attribute when a cpu comes online and
 * removes it again when the cpu is dead. All other actions are ignored.
 * Returns NOTIFY_BAD only if creating the attribute fails.
 */
static int __cpuinit smp_cpu_notify(struct notifier_block *self,
				    unsigned long action, void *hcpu)
{
	unsigned int cpu = (unsigned int)(long)hcpu;
	struct cpu *c = &per_cpu(cpu_devices, cpu);
	struct sys_device *s = &c->sysdev;

	if (action == CPU_ONLINE) {
		if (sysdev_create_file(s, &attr_capability))
			return NOTIFY_BAD;
	} else if (action == CPU_DEAD) {
		sysdev_remove_file(s, &attr_capability);
	}
	return NOTIFY_OK;
}

/* Notifier block for smp_cpu_notify(); registered in topology_init(). */
static struct notifier_block __cpuinitdata smp_cpu_nb = {
	.notifier_call	= smp_cpu_notify,
};

L
Linus Torvalds 已提交
859 860 861
/*
 * Register the cpu notifier and a hotpluggable cpu device for every possible
 * cpu. Cpus that are already online get their capability attribute here;
 * the others receive it from smp_cpu_notify() once they come online.
 * The return values of the registration calls are not checked.
 */
static int __init topology_init(void)
{
	int cpu;

	register_cpu_notifier(&smp_cpu_nb);

	for_each_possible_cpu(cpu) {
		struct cpu *c = &per_cpu(cpu_devices, cpu);

		c->hotpluggable = 1;
		register_cpu(c, cpu);
		if (cpu_online(cpu))
			sysdev_create_file(&c->sysdev, &attr_capability);
	}
	return 0;
}

subsys_initcall(topology_init);

881
EXPORT_SYMBOL(cpu_online_map);
L
Linus Torvalds 已提交
882 883 884 885 886 887
EXPORT_SYMBOL(cpu_possible_map);
EXPORT_SYMBOL(lowcore_ptr);
EXPORT_SYMBOL(smp_ctl_set_bit);
EXPORT_SYMBOL(smp_ctl_clear_bit);
EXPORT_SYMBOL(smp_get_cpu);
EXPORT_SYMBOL(smp_put_cpu);