x2apic_uv_x.c 21.2 KB
Newer Older
J
Jack Steiner 已提交
1 2 3 4 5 6 7
/*
 * This file is subject to the terms and conditions of the GNU General Public
 * License.  See the file "COPYING" in the main directory of this archive
 * for more details.
 *
 * SGI UV APIC functions (note: not an Intel compatible APIC)
 *
8
 * Copyright (C) 2007-2010 Silicon Graphics, Inc. All rights reserved.
J
Jack Steiner 已提交
9 10
 */
#include <linux/cpumask.h>
11 12 13 14 15
#include <linux/hardirq.h>
#include <linux/proc_fs.h>
#include <linux/threads.h>
#include <linux/kernel.h>
#include <linux/module.h>
J
Jack Steiner 已提交
16 17 18
#include <linux/string.h>
#include <linux/ctype.h>
#include <linux/sched.h>
19
#include <linux/timer.h>
20
#include <linux/slab.h>
21 22
#include <linux/cpu.h>
#include <linux/init.h>
23
#include <linux/io.h>
24
#include <linux/pci.h>
25
#include <linux/kdebug.h>
26
#include <linux/delay.h>
C
Cliff Wickman 已提交
27
#include <linux/crash_dump.h>
28

J
Jack Steiner 已提交
29 30
#include <asm/uv/uv_mmrs.h>
#include <asm/uv/uv_hub.h>
31 32
#include <asm/current.h>
#include <asm/pgtable.h>
33
#include <asm/uv/bios.h>
34 35 36 37
#include <asm/uv/uv.h>
#include <asm/apic.h>
#include <asm/ipi.h>
#include <asm/smp.h>
38
#include <asm/x86_init.h>
C
Cliff Wickman 已提交
39
#include <asm/emergency-restart.h>
J
Jack Steiner 已提交
40

41 42
DEFINE_PER_CPU(int, x2apic_extra_bits);

43 44
#define PR_DEVEL(fmt, args...)	pr_devel("%s: " fmt, __func__, args)

45
static enum uv_system_type uv_system_type;
46
static u64 gru_start_paddr, gru_end_paddr;
47
static union uvh_apicid uvh_apicid;
48 49
int uv_min_hub_revision_id;
EXPORT_SYMBOL_GPL(uv_min_hub_revision_id);
50 51
unsigned int uv_apicid_hibits;
EXPORT_SYMBOL_GPL(uv_apicid_hibits);
52
static DEFINE_SPINLOCK(uv_nmi_lock);
53

54 55 56 57 58 59 60 61 62 63
/*
 * Read one local hub MMR before the permanent MMR mappings exist.
 *
 * @addr: MMR offset, OR'ed with UV_LOCAL_MMR_BASE to form the address
 *
 * The register is mapped with early_ioremap() just long enough to read
 * it. Returns the value read.
 */
static unsigned long __init uv_early_read_mmr(unsigned long addr)
{
	unsigned long *mmr_va;
	unsigned long mmr_val;

	mmr_va = early_ioremap(UV_LOCAL_MMR_BASE | addr, sizeof(*mmr_va));
	mmr_val = *mmr_va;
	early_iounmap(mmr_va, sizeof(*mmr_va));

	return mmr_val;
}

64
/*
 * Return true when [start, end] lies entirely inside the GRU physical
 * address range recorded in gru_start_paddr/gru_end_paddr.
 */
static inline bool is_GRU_range(u64 start, u64 end)
{
	return start >= gru_start_paddr && end <= gru_end_paddr;
}

69
/*
 * x86_platform.is_untracked_pat_range hook for UV: a range is untracked
 * when it is an ISA range or falls inside the GRU range.
 */
static bool uv_is_untracked_pat_range(u64 start, u64 end)
{
	return is_ISA_range(start, end) || is_GRU_range(start, end);
}
73

74
/*
 * Read the hub's node id early in boot.
 *
 * Side effect: records the hub revision in uv_min_hub_revision_id.
 * Returns the pnode, i.e. the node id shifted right by one and masked to
 * n_skt bits (n_skt taken from UVH_RH_GAM_CONFIG_MMR).
 */
static int __init early_get_pnodeid(void)
{
	union uvh_node_id_u node_id;
	union uvh_rh_gam_config_mmr_u  m_n_config;
	int pnode;

	/* Currently, all blades have same revision number */
	node_id.v = uv_early_read_mmr(UVH_NODE_ID);
	m_n_config.v = uv_early_read_mmr(UVH_RH_GAM_CONFIG_MMR);
	uv_min_hub_revision_id = node_id.s.revision;

	pnode = (node_id.s.node_id >> 1) & ((1 << m_n_config.s.n_skt) - 1);
	return pnode;
}

89
/*
 * Load the UVH_APICID MMR into uvh_apicid. A value of zero is treated as
 * an old bios, and the default UV_APIC_PNODE_SHIFT is used instead.
 */
static void __init early_get_apic_pnode_shift(void)
{
	uvh_apicid.v = uv_early_read_mmr(UVH_APICID);
	if (!uvh_apicid.v)
		/*
		 * Old bios, use default value
		 */
		uvh_apicid.s.pnode_shift = UV_APIC_PNODE_SHIFT;
}

99 100 101 102 103 104 105 106 107
/*
 * Add an extra bit as dictated by bios to the destination apicid of
 * interrupts potentially passing through the UV HUB.  This prevents
 * a deadlock between interrupts and IO port operations.
 *
 * The bits are read from UVH_LB_TARGET_PHYSICAL_APIC_ID_MASK, masked with
 * UV_APICID_HIBIT_MASK and stored in uv_apicid_hibits.
 */
static void __init uv_set_apicid_hibit(void)
{
	union uvh_lb_target_physical_apic_id_mask_u apicid_mask;

	apicid_mask.v = uv_early_read_mmr(UVH_LB_TARGET_PHYSICAL_APIC_ID_MASK);
	uv_apicid_hibits = apicid_mask.s.bit_enables & UV_APICID_HIBIT_MASK;
}

112
/*
 * MADT OEM check for the UV apic driver.
 *
 * @oem_id:       OEM id string from the MADT; only "SGI" is handled
 * @oem_table_id: OEM table id; selects the UV system type
 *
 * For an SGI system this reads the pnode id and pnode shift, installs the
 * UV platform hooks and records the system type. Returns 1 only for the
 * "UVH" table id (after setting the boot cpu's extra apicid bits and the
 * apicid high bits); returns 0 in every other case.
 */
static int __init uv_acpi_madt_oem_check(char *oem_id, char *oem_table_id)
{
	int pnodeid;

	if (strcmp(oem_id, "SGI"))
		return 0;

	pnodeid = early_get_pnodeid();
	early_get_apic_pnode_shift();
	x86_platform.is_untracked_pat_range =  uv_is_untracked_pat_range;
	x86_platform.nmi_init = uv_nmi_init;

	if (!strcmp(oem_table_id, "UVL")) {
		uv_system_type = UV_LEGACY_APIC;
	} else if (!strcmp(oem_table_id, "UVX")) {
		uv_system_type = UV_X2APIC;
	} else if (!strcmp(oem_table_id, "UVH")) {
		__this_cpu_write(x2apic_extra_bits,
			pnodeid << uvh_apicid.s.pnode_shift);
		uv_system_type = UV_NON_UNIQUE_APIC;
		uv_set_apicid_hibit();
		return 1;
	}

	return 0;
}

enum uv_system_type get_uv_system_type(void)
{
	return uv_system_type;
}

/* Return nonzero when a UV system type has been detected. */
int is_uv_system(void)
{
	return uv_system_type != UV_NONE;
}
EXPORT_SYMBOL_GPL(is_uv_system);
146

J
Jack Steiner 已提交
147 148 149 150 151 152 153 154 155 156 157 158 159 160 161
/* Per-cpu hub information, filled in by uv_system_init(). */
DEFINE_PER_CPU(struct uv_hub_info_s, __uv_hub_info);
EXPORT_PER_CPU_SYMBOL_GPL(__uv_hub_info);

/* One entry per possible blade; allocated in uv_system_init(). */
struct uv_blade_info *uv_blade_info;
EXPORT_SYMBOL_GPL(uv_blade_info);

/* Node id -> blade number; allocated in uv_system_init(). */
short *uv_node_to_blade;
EXPORT_SYMBOL_GPL(uv_node_to_blade);

/* Cpu number -> blade number; allocated in uv_system_init(). */
short *uv_cpu_to_blade;
EXPORT_SYMBOL_GPL(uv_cpu_to_blade);

/* Number of bits set in the node present table. */
short uv_possible_blades;
EXPORT_SYMBOL_GPL(uv_possible_blades);

/* RTC frequency determined (or guessed) by uv_rtc_init(). */
unsigned long sn_rtc_cycles_per_second;
EXPORT_SYMBOL(sn_rtc_cycles_per_second);

165
static const struct cpumask *uv_target_cpus(void)
J
Jack Steiner 已提交
166
{
167
	return cpu_online_mask;
J
Jack Steiner 已提交
168 169
}

170
/*
 * apic->vector_allocation_domain hook: the domain of @cpu is the cpu
 * itself, so @retmask is cleared and then only @cpu is set in it.
 */
static void uv_vector_allocation_domain(int cpu, struct cpumask *retmask)
{
	cpumask_clear(retmask);
	cpumask_set_cpu(cpu, retmask);
}

176
/*
 * Wake a secondary cpu by writing INIT and then STARTUP requests to the
 * UVH_IPI_INT MMR of the hub that owns it.
 *
 * @phys_apicid: physical apicid of the cpu to start
 * @start_rip:   physical start address; it is shifted so that its page
 *               number lands in the vector field of UVH_IPI_INT
 *
 * Always returns 0. Without CONFIG_SMP nothing is sent.
 */
static int __cpuinit uv_wakeup_secondary(int phys_apicid, unsigned long start_rip)
{
#ifdef CONFIG_SMP
	unsigned long val, apicid;
	int pnode;

	pnode = uv_apicid_to_pnode(phys_apicid);

	/*
	 * Widen before shifting: the apicid (including the bios supplied
	 * high bits) must not overflow or sign-extend as a 32-bit int when
	 * it is moved into the APIC_ID field of the 64-bit MMR value.
	 */
	apicid = (unsigned int)phys_apicid | uv_apicid_hibits;

	val = (1UL << UVH_IPI_INT_SEND_SHFT) |
	    (apicid << UVH_IPI_INT_APIC_ID_SHFT) |
	    ((start_rip << UVH_IPI_INT_VECTOR_SHFT) >> 12) |
	    APIC_DM_INIT;
	uv_write_global_mmr64(pnode, UVH_IPI_INT, val);
	mdelay(10);

	val = (1UL << UVH_IPI_INT_SEND_SHFT) |
	    (apicid << UVH_IPI_INT_APIC_ID_SHFT) |
	    ((start_rip << UVH_IPI_INT_VECTOR_SHFT) >> 12) |
	    APIC_DM_STARTUP;
	uv_write_global_mmr64(pnode, UVH_IPI_INT, val);

	atomic_set(&init_deasserted, 1);
#endif
	return 0;
}

static void uv_send_IPI_one(int cpu, int vector)
{
204
	unsigned long apicid;
205
	int pnode;
J
Jack Steiner 已提交
206

207
	apicid = per_cpu(x86_cpu_to_apicid, cpu);
208
	pnode = uv_apicid_to_pnode(apicid);
209
	uv_hub_send_ipi(pnode, apicid, vector);
J
Jack Steiner 已提交
210 211
}

212
static void uv_send_IPI_mask(const struct cpumask *mask, int vector)
J
Jack Steiner 已提交
213 214 215
{
	unsigned int cpu;

216
	for_each_cpu(cpu, mask)
217 218 219
		uv_send_IPI_one(cpu, vector);
}

220
static void uv_send_IPI_mask_allbutself(const struct cpumask *mask, int vector)
221 222
{
	unsigned int this_cpu = smp_processor_id();
223
	unsigned int cpu;
224

225
	for_each_cpu(cpu, mask) {
226
		if (cpu != this_cpu)
J
Jack Steiner 已提交
227
			uv_send_IPI_one(cpu, vector);
228
	}
J
Jack Steiner 已提交
229 230 231 232
}

static void uv_send_IPI_allbutself(int vector)
{
233
	unsigned int this_cpu = smp_processor_id();
234
	unsigned int cpu;
J
Jack Steiner 已提交
235

236
	for_each_online_cpu(cpu) {
237 238
		if (cpu != this_cpu)
			uv_send_IPI_one(cpu, vector);
239
	}
J
Jack Steiner 已提交
240 241 242 243
}

static void uv_send_IPI_all(int vector)
{
244
	uv_send_IPI_mask(cpu_online_mask, vector);
J
Jack Steiner 已提交
245 246 247 248 249 250 251
}

/* apic->apic_id_registered hook: unconditionally reports success (1). */
static int uv_apic_id_registered(void)
{
	const int registered = 1;

	return registered;
}

252
/* apic->init_apic_ldr hook: intentionally does nothing on UV. */
static void uv_init_apic_ldr(void)
{
}

256
static unsigned int uv_cpu_mask_to_apicid(const struct cpumask *cpumask)
J
Jack Steiner 已提交
257 258 259 260 261
{
	/*
	 * We're using fixed IRQ delivery, can only return one phys APIC ID.
	 * May as well be the first.
	 */
262 263
	int cpu = cpumask_first(cpumask);

264
	if ((unsigned)cpu < nr_cpu_ids)
265
		return per_cpu(x86_cpu_to_apicid, cpu) | uv_apicid_hibits;
J
Jack Steiner 已提交
266 267 268 269
	else
		return BAD_APICID;
}

270 271 272
static unsigned int
uv_cpu_mask_to_apicid_and(const struct cpumask *cpumask,
			  const struct cpumask *andmask)
M
Mike Travis 已提交
273 274 275 276 277 278 279
{
	int cpu;

	/*
	 * We're using fixed IRQ delivery, can only return one phys APIC ID.
	 * May as well be the first.
	 */
280
	for_each_cpu_and(cpu, cpumask, andmask) {
281 282
		if (cpumask_test_cpu(cpu, cpu_online_mask))
			break;
283
	}
284
	return per_cpu(x86_cpu_to_apicid, cpu) | uv_apicid_hibits;
M
Mike Travis 已提交
285 286
}

287
static unsigned int x2apic_get_apic_id(unsigned long x)
288 289 290 291
{
	unsigned int id;

	WARN_ON(preemptible() && num_online_cpus() > 1);
T
Tejun Heo 已提交
292
	id = x | __this_cpu_read(x2apic_extra_bits);
293 294 295 296

	return id;
}

297
/*
 * apic->set_apic_id hook: convert an apicid into the value to write to
 * the APIC ID register. Currently an identity conversion.
 */
static unsigned long set_apic_id(unsigned int id)
{
	unsigned long x;

	/* maskout x2apic_extra_bits ? */
	x = id;
	return x;
}

static unsigned int uv_read_apic_id(void)
{

309
	return x2apic_get_apic_id(apic_read(APIC_ID));
Y
Yinghai Lu 已提交
310 311
}

I
Ingo Molnar 已提交
312
/*
 * apic->phys_pkg_id hook: the package id is the calling cpu's apicid
 * shifted right by @index_msb. @initial_apicid is not used.
 */
static int uv_phys_pkg_id(int initial_apicid, int index_msb)
{
	return uv_read_apic_id() >> index_msb;
}

/* Send @vector to the calling cpu by writing the APIC_SELF_IPI register. */
static void uv_send_IPI_self(int vector)
{
	const int self_vector = vector;

	apic_write(APIC_SELF_IPI, self_vector);
}

322
/*
 * APIC driver operations for SGI UV systems. Interrupts use fixed
 * delivery in physical destination mode; IPIs are sent through the UV
 * hub (uv_send_IPI_*) and register access uses the native x2apic MSR
 * helpers.
 */
struct apic __refdata apic_x2apic_uv_x = {

	.name				= "UV large system",
	.probe				= NULL,
	.acpi_madt_oem_check		= uv_acpi_madt_oem_check,
	.apic_id_registered		= uv_apic_id_registered,

	.irq_delivery_mode		= dest_Fixed,
	.irq_dest_mode			= 0, /* physical */

	.target_cpus			= uv_target_cpus,
	.disable_esr			= 0,
	.dest_logical			= APIC_DEST_LOGICAL,
	.check_apicid_used		= NULL,
	.check_apicid_present		= NULL,

	.vector_allocation_domain	= uv_vector_allocation_domain,
	.init_apic_ldr			= uv_init_apic_ldr,

	.ioapic_phys_id_map		= NULL,
	.setup_apic_routing		= NULL,
	.multi_timer_check		= NULL,
	.cpu_present_to_apicid		= default_cpu_present_to_apicid,
	.apicid_to_cpu_present		= NULL,
	.setup_portio_remap		= NULL,
	.check_phys_apicid_present	= default_check_phys_apicid_present,
	.enable_apic_mode		= NULL,
	.phys_pkg_id			= uv_phys_pkg_id,
	.mps_oem_check			= NULL,

	.get_apic_id			= x2apic_get_apic_id,
	.set_apic_id			= set_apic_id,
	.apic_id_mask			= 0xFFFFFFFFu,

	.cpu_mask_to_apicid		= uv_cpu_mask_to_apicid,
	.cpu_mask_to_apicid_and		= uv_cpu_mask_to_apicid_and,

	.send_IPI_mask			= uv_send_IPI_mask,
	.send_IPI_mask_allbutself	= uv_send_IPI_mask_allbutself,
	.send_IPI_allbutself		= uv_send_IPI_allbutself,
	.send_IPI_all			= uv_send_IPI_all,
	.send_IPI_self			= uv_send_IPI_self,

	.wakeup_secondary_cpu		= uv_wakeup_secondary,
	.trampoline_phys_low		= DEFAULT_TRAMPOLINE_PHYS_LOW,
	.trampoline_phys_high		= DEFAULT_TRAMPOLINE_PHYS_HIGH,
	.wait_for_init_deassert		= NULL,
	.smp_callin_clear_local_apic	= NULL,
	.inquire_remote_apic		= NULL,

	.read				= native_apic_msr_read,
	.write				= native_apic_msr_write,
	.icr_read			= native_x2apic_icr_read,
	.icr_write			= native_x2apic_icr_write,
	.wait_icr_idle			= native_x2apic_wait_icr_idle,
	.safe_wait_icr_idle		= native_safe_x2apic_wait_icr_idle,
};

380
static __cpuinit void set_x2apic_extra_bits(int pnode)
J
Jack Steiner 已提交
381
{
382
	__this_cpu_write(x2apic_extra_bits, pnode << uvh_apicid.s.pnode_shift);
J
Jack Steiner 已提交
383 384 385 386 387
}

/*
 * Called on boot cpu.
 */
388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405
static __init int boot_pnode_to_blade(int pnode)
{
	int blade;

	for (blade = 0; blade < uv_num_possible_blades(); blade++)
		if (pnode == uv_blade_info[blade].pnode)
			return blade;
	BUG();
}

struct redir_addr {
	unsigned long redirect;
	unsigned long alias;
};

#define DEST_SHIFT UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_0_MMR_DEST_BASE_SHFT

static __initdata struct redir_addr redir_addrs[] = {
406 407 408
	{UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_0_MMR, UVH_RH_GAM_ALIAS210_OVERLAY_CONFIG_0_MMR},
	{UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_1_MMR, UVH_RH_GAM_ALIAS210_OVERLAY_CONFIG_1_MMR},
	{UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_2_MMR, UVH_RH_GAM_ALIAS210_OVERLAY_CONFIG_2_MMR},
409 410 411 412
};

static __init void get_lowmem_redirect(unsigned long *base, unsigned long *size)
{
413
	union uvh_rh_gam_alias210_overlay_config_2_mmr_u alias;
414 415 416 417 418
	union uvh_rh_gam_alias210_redirect_config_2_mmr_u redirect;
	int i;

	for (i = 0; i < ARRAY_SIZE(redir_addrs); i++) {
		alias.v = uv_read_local_mmr(redir_addrs[i].alias);
419
		if (alias.s.enable && alias.s.base == 0) {
420 421 422 423 424 425
			*size = (1UL << alias.s.m_alias);
			redirect.v = uv_read_local_mmr(redir_addrs[i].redirect);
			*base = (unsigned long)redirect.s.dest_base << DEST_SHIFT;
			return;
		}
	}
426
	*base = *size = 0;
427 428
}

429 430
/* Mapping kind requested from map_high(). */
enum map_type {
	map_wb,	/* mapped with init_extra_mapping_wb() */
	map_uc	/* mapped with init_extra_mapping_uc() */
};

431 432
static __init void map_high(char *id, unsigned long base, int pshift,
			int bshift, int max_pnode, enum map_type map_type)
433 434 435
{
	unsigned long bytes, paddr;

436 437
	paddr = base << pshift;
	bytes = (1UL << bshift) * (max_pnode + 1);
438
	printk(KERN_INFO "UV: Map %s_HI 0x%lx - 0x%lx\n", id, paddr,
439
						paddr + bytes);
440 441 442 443 444 445 446 447 448 449 450 451
	if (map_type == map_uc)
		init_extra_mapping_uc(paddr, bytes);
	else
		init_extra_mapping_wb(paddr, bytes);

}
static __init void map_gru_high(int max_pnode)
{
	union uvh_rh_gam_gru_overlay_config_mmr_u gru;
	int shift = UVH_RH_GAM_GRU_OVERLAY_CONFIG_MMR_BASE_SHFT;

	gru.v = uv_read_local_mmr(UVH_RH_GAM_GRU_OVERLAY_CONFIG_MMR);
452
	if (gru.s.enable) {
453
		map_high("GRU", gru.s.base, shift, shift, max_pnode, map_wb);
454 455 456 457
		gru_start_paddr = ((u64)gru.s.base << shift);
		gru_end_paddr = gru_start_paddr + (1UL << shift) * (max_pnode + 1);

	}
458 459
}

460 461 462 463 464 465 466
static __init void map_mmr_high(int max_pnode)
{
	union uvh_rh_gam_mmr_overlay_config_mmr_u mmr;
	int shift = UVH_RH_GAM_MMR_OVERLAY_CONFIG_MMR_BASE_SHFT;

	mmr.v = uv_read_local_mmr(UVH_RH_GAM_MMR_OVERLAY_CONFIG_MMR);
	if (mmr.s.enable)
467
		map_high("MMR", mmr.s.base, shift, shift, max_pnode, map_uc);
468 469
}

470 471 472 473 474 475 476
static __init void map_mmioh_high(int max_pnode)
{
	union uvh_rh_gam_mmioh_overlay_config_mmr_u mmioh;
	int shift = UVH_RH_GAM_MMIOH_OVERLAY_CONFIG_MMR_BASE_SHFT;

	mmioh.v = uv_read_local_mmr(UVH_RH_GAM_MMIOH_OVERLAY_CONFIG_MMR);
	if (mmioh.s.enable)
477 478
		map_high("MMIOH", mmioh.s.base, shift, mmioh.s.m_io,
			max_pnode, map_uc);
479 480
}

J
Jack Steiner 已提交
481 482 483 484 485 486
/* Create uncached mappings for the global 32-bit and the local MMR ranges. */
static __init void map_low_mmrs(void)
{
	/* global MMRs first, then the local ones */
	init_extra_mapping_uc(UV_GLOBAL_MMR32_BASE,
			      UV_GLOBAL_MMR32_SIZE);
	init_extra_mapping_uc(UV_LOCAL_MMR_BASE,
			      UV_LOCAL_MMR_SIZE);
}

487 488
static __init void uv_rtc_init(void)
{
R
Russ Anderson 已提交
489 490
	long status;
	u64 ticks_per_sec;
491

R
Russ Anderson 已提交
492 493 494
	status = uv_bios_freq_base(BIOS_FREQ_BASE_REALTIME_CLOCK,
					&ticks_per_sec);
	if (status != BIOS_STATUS_SUCCESS || ticks_per_sec < 100000) {
495 496 497 498 499 500 501 502 503
		printk(KERN_WARNING
			"unable to determine platform RTC clock frequency, "
			"guessing.\n");
		/* BIOS gives wrong value for clock freq. so guess */
		sn_rtc_cycles_per_second = 1000000000000UL / 30000UL;
	} else
		sn_rtc_cycles_per_second = ticks_per_sec;
}

504 505 506 507 508 509 510 511 512 513 514
/*
 * percpu heartbeat timer
 */
static void uv_heartbeat(unsigned long ignored)
{
	struct timer_list *timer = &uv_hub_info->scir.timer;
	unsigned char bits = uv_hub_info->scir.state;

	/* flip heartbeat bit */
	bits ^= SCIR_CPU_HEARTBEAT;

515 516
	/* is this cpu idle? */
	if (idle_cpu(raw_smp_processor_id()))
517 518 519 520 521 522 523 524
		bits &= ~SCIR_CPU_ACTIVITY;
	else
		bits |= SCIR_CPU_ACTIVITY;

	/* update system controller interface reg */
	uv_set_scir_bits(bits);

	/* enable next timer period */
525
	mod_timer_pinned(timer, jiffies + SCIR_CPU_HB_INTERVAL);
526 527 528 529
}

/*
 * Start the heartbeat timer on @cpu if it is not already running.
 *
 * After enabling @cpu the loop switches to cpu 0, so the boot cpu's
 * heartbeat is started as well; the loop ends as soon as it meets a cpu
 * that is already enabled.
 */
static void __cpuinit uv_heartbeat_enable(int cpu)
{
	while (!uv_cpu_hub_info(cpu)->scir.enabled) {
		struct timer_list *timer = &uv_cpu_hub_info(cpu)->scir.timer;

		uv_set_cpu_scir_bits(cpu, SCIR_CPU_HEARTBEAT|SCIR_CPU_ACTIVITY);
		setup_timer(timer, uv_heartbeat, cpu);
		timer->expires = jiffies + SCIR_CPU_HB_INTERVAL;
		add_timer_on(timer, cpu);
		uv_cpu_hub_info(cpu)->scir.enabled = 1;

		/* also ensure that boot cpu is enabled */
		cpu = 0;
	}
}

544
#ifdef CONFIG_HOTPLUG_CPU
545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599
/*
 * Stop the heartbeat timer of @cpu if it is running, then write 0xff to
 * the cpu's system controller interface register bits.
 */
static void __cpuinit uv_heartbeat_disable(int cpu)
{
	struct timer_list *timer = &uv_cpu_hub_info(cpu)->scir.timer;

	if (uv_cpu_hub_info(cpu)->scir.enabled) {
		uv_cpu_hub_info(cpu)->scir.enabled = 0;
		del_timer(timer);
	}

	uv_set_cpu_scir_bits(cpu, 0xff);
}

/*
 * cpu hotplug notifier
 *
 * Starts the heartbeat when a cpu comes online and stops it before a cpu
 * goes down. All other actions are ignored. Always returns NOTIFY_OK.
 */
static __cpuinit int uv_scir_cpu_notify(struct notifier_block *self,
				       unsigned long action, void *hcpu)
{
	long target_cpu = (long)hcpu;

	if (action == CPU_ONLINE)
		uv_heartbeat_enable(target_cpu);
	else if (action == CPU_DOWN_PREPARE)
		uv_heartbeat_disable(target_cpu);

	return NOTIFY_OK;
}

/* Register uv_scir_cpu_notify() as a cpu hotplug notifier (priority 0). */
static __init void uv_scir_register_cpu_notifier(void)
{
	hotcpu_notifier(uv_scir_cpu_notify,
			0);
}

#else /* !CONFIG_HOTPLUG_CPU */

/* Without cpu hotplug there is no notifier to register. */
static __init void uv_scir_register_cpu_notifier(void)
{
	/* nothing to do */
}

/*
 * Late initcall used when cpu hotplug is not configured: on a UV system,
 * start the heartbeat on every online cpu. Always returns 0.
 */
static __init int uv_init_heartbeat(void)
{
	int cpu;

	if (!is_uv_system())
		return 0;

	for_each_online_cpu(cpu)
		uv_heartbeat_enable(cpu);

	return 0;
}

late_initcall(uv_init_heartbeat);

#endif /* !CONFIG_HOTPLUG_CPU */

600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623
/*
 * Direct Legacy VGA I/O traffic to designated IOH
 *
 * @pdev:          VGA device whose bus/domain selects the target
 * @decode:        passed through to the bios call
 * @command_bits:  PCI command bits; nothing is done unless PCI_COMMAND_IO
 *                 is set
 * @change_bridge: nothing is done unless this is true
 *
 * Returns 0 when no change is required, otherwise the result of
 * uv_bios_set_legacy_vga_target().
 */
int uv_set_vga_state(struct pci_dev *pdev, bool decode,
		      unsigned int command_bits, bool change_bridge)
{
	int domain, bus, rc;

	PR_DEVEL("devfn %x decode %d cmd %x chg_brdg %d\n",
			pdev->devfn, decode, command_bits, change_bridge);

	/* only bridge changes that involve I/O decoding are of interest */
	if (!change_bridge || !(command_bits & PCI_COMMAND_IO))
		return 0;

	bus = pdev->bus->number;
	domain = pci_domain_nr(pdev->bus);

	rc = uv_bios_set_legacy_vga_target(decode, domain, bus);
	PR_DEVEL("vga decode %d %x:%x, rc: %d\n", decode, domain, bus, rc);

	return rc;
}

624 625
/*
 * Called on each cpu to initialize the per_cpu UV data area.
 * FIXME: hotplug not supported yet
 *
 * Counts the cpu as online on its blade and, on systems with non-unique
 * apicids, sets the cpu's extra apicid bits from its pnode.
 */
void __cpuinit uv_cpu_init(void)
{
	/* CPU 0 initialization will be done via uv_system_init. */
	if (!uv_blade_info)
		return;

	uv_blade_info[uv_numa_blade_id()].nr_online_cpus++;

	if (get_uv_system_type() == UV_NON_UNIQUE_APIC)
		set_x2apic_extra_bits(uv_hub_info->pnode);
}

640 641 642 643 644
/*
 * When NMI is received, print a stack trace.
 */
int uv_handle_nmi(struct notifier_block *self, unsigned long reason, void *data)
{
645
	if (reason != DIE_NMIUNKNOWN)
646
		return NOTIFY_OK;
647 648 649 650

	if (in_crash_kexec)
		/* do nothing if entering the crash kernel */
		return NOTIFY_OK;
651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683
	/*
	 * Use a lock so only one cpu prints at a time
	 * to prevent intermixed output.
	 */
	spin_lock(&uv_nmi_lock);
	pr_info("NMI stack dump cpu %u:\n", smp_processor_id());
	dump_stack();
	spin_unlock(&uv_nmi_lock);

	return NOTIFY_STOP;
}

/* Die-notifier block that routes notifications to uv_handle_nmi(). */
static struct notifier_block uv_dump_stack_nmi_nb = {
	.notifier_call	= uv_handle_nmi,
};

/* Register the UV NMI die notifier; a failure is logged, not returned. */
void uv_register_nmi_notifier(void)
{
	int err = register_die_notifier(&uv_dump_stack_nmi_nb);

	if (err)
		printk(KERN_WARNING "UV NMI handler failed to register\n");
}

/*
 * Program LVT1 of the calling cpu's local APIC for NMI delivery and clear
 * its mask bit.
 */
void uv_nmi_init(void)
{
	unsigned int lvt1;

	/*
	 * Unmask NMI on all cpus
	 */
	lvt1 = apic_read(APIC_LVT1);
	lvt1 |= APIC_DM_NMI;
	lvt1 &= ~APIC_LVT_MASKED;
	apic_write(APIC_LVT1, lvt1);
}
684 685

/*
 * One-time UV platform setup, run during boot.
 *
 * Reads the hub configuration MMRs, builds the blade tables
 * (uv_blade_info, uv_node_to_blade, uv_cpu_to_blade), fills in the
 * per-cpu hub info of every present cpu, maps the high GRU/MMR/MMIOH
 * ranges and registers the heartbeat, NMI and VGA handlers.
 */
void __init uv_system_init(void)
{
	union uvh_rh_gam_config_mmr_u  m_n_config;
	union uvh_rh_gam_mmioh_overlay_config_mmr_u mmioh;
	union uvh_node_id_u node_id;
	unsigned long gnode_upper, lowmem_redir_base, lowmem_redir_size;
	int bytes, nid, cpu, lcpu, pnode, blade, i, j, m_val, n_val, n_io;
	int gnode_extra, max_pnode = 0;
	unsigned long mmr_base, present, paddr;
	unsigned short pnode_mask, pnode_io_mask;

	map_low_mmrs();

	/* Hub address layout: M/N socket bits, IO node bits, MMR base */
	m_n_config.v = uv_read_local_mmr(UVH_RH_GAM_CONFIG_MMR);
	m_val = m_n_config.s.m_skt;
	n_val = m_n_config.s.n_skt;
	mmioh.v = uv_read_local_mmr(UVH_RH_GAM_MMIOH_OVERLAY_CONFIG_MMR);
	n_io = mmioh.s.n_io;
	mmr_base =
	    uv_read_local_mmr(UVH_RH_GAM_MMR_OVERLAY_CONFIG_MMR) &
	    ~UV_MMR_ENABLE;
	pnode_mask = (1 << n_val) - 1;
	pnode_io_mask = (1 << n_io) - 1;

	node_id.v = uv_read_local_mmr(UVH_NODE_ID);
	gnode_extra = (node_id.s.node_id & ~((1 << n_val) - 1)) >> 1;
	gnode_upper = ((unsigned long)gnode_extra  << m_val);
	printk(KERN_INFO "UV: N %d, M %d, N_IO: %d, gnode_upper 0x%lx, gnode_extra 0x%x, pnode_mask 0x%x, pnode_io_mask 0x%x\n",
			n_val, m_val, n_io, gnode_upper, gnode_extra, pnode_mask, pnode_io_mask);

	printk(KERN_DEBUG "UV: global MMR base 0x%lx\n", mmr_base);

	/* Each bit set in the node present table is one possible blade */
	for (i = 0; i < UVH_NODE_PRESENT_TABLE_DEPTH; i++)
		uv_possible_blades +=
		  hweight64(uv_read_local_mmr(UVH_NODE_PRESENT_TABLE + i * 8));
	printk(KERN_DEBUG "UV: Found %d blades\n", uv_num_possible_blades());

	bytes = sizeof(struct uv_blade_info) * uv_num_possible_blades();
	uv_blade_info = kmalloc(bytes, GFP_KERNEL);
	BUG_ON(!uv_blade_info);
	for (blade = 0; blade < uv_num_possible_blades(); blade++)
		uv_blade_info[blade].memory_nid = -1;

	get_lowmem_redirect(&lowmem_redir_base, &lowmem_redir_size);

	/* Both lookup tables start out as all-ones, i.e. -1 per entry */
	bytes = sizeof(uv_node_to_blade[0]) * num_possible_nodes();
	uv_node_to_blade = kmalloc(bytes, GFP_KERNEL);
	BUG_ON(!uv_node_to_blade);
	memset(uv_node_to_blade, 255, bytes);

	bytes = sizeof(uv_cpu_to_blade[0]) * num_possible_cpus();
	uv_cpu_to_blade = kmalloc(bytes, GFP_KERNEL);
	BUG_ON(!uv_cpu_to_blade);
	memset(uv_cpu_to_blade, 255, bytes);

	/* Assign blade numbers in node-present-table order */
	blade = 0;
	for (i = 0; i < UVH_NODE_PRESENT_TABLE_DEPTH; i++) {
		present = uv_read_local_mmr(UVH_NODE_PRESENT_TABLE + i * 8);
		for (j = 0; j < 64; j++) {
			if (!test_bit(j, &present))
				continue;
			pnode = (i * 64 + j) & pnode_mask;
			uv_blade_info[blade].pnode = pnode;
			uv_blade_info[blade].nr_possible_cpus = 0;
			uv_blade_info[blade].nr_online_cpus = 0;
			max_pnode = max(pnode, max_pnode);
			blade++;
		}
	}

	uv_bios_init();
	uv_bios_get_sn_info(0, &uv_type, &sn_partition_id, &sn_coherency_id,
			    &sn_region_size, &system_serial_number);
	uv_rtc_init();

	for_each_present_cpu(cpu) {
		int apicid = per_cpu(x86_cpu_to_apicid, cpu);

		nid = cpu_to_node(cpu);
		/*
		 * apic_pnode_shift must be set before calling uv_apicid_to_pnode();
		 */
		uv_cpu_hub_info(cpu)->pnode_mask = pnode_mask;
		uv_cpu_hub_info(cpu)->apic_pnode_shift = uvh_apicid.s.pnode_shift;
		pnode = uv_apicid_to_pnode(apicid);
		blade = boot_pnode_to_blade(pnode);
		lcpu = uv_blade_info[blade].nr_possible_cpus;
		uv_blade_info[blade].nr_possible_cpus++;

		/* Any node on the blade, else will contain -1. */
		uv_blade_info[blade].memory_nid = nid;

		uv_cpu_hub_info(cpu)->lowmem_remap_base = lowmem_redir_base;
		uv_cpu_hub_info(cpu)->lowmem_remap_top = lowmem_redir_size;
		uv_cpu_hub_info(cpu)->m_val = m_val;
		uv_cpu_hub_info(cpu)->n_val = n_val;
		uv_cpu_hub_info(cpu)->numa_blade_id = blade;
		uv_cpu_hub_info(cpu)->blade_processor_id = lcpu;
		uv_cpu_hub_info(cpu)->pnode = pnode;
		uv_cpu_hub_info(cpu)->gpa_mask = (1UL << (m_val + n_val)) - 1;
		uv_cpu_hub_info(cpu)->gnode_upper = gnode_upper;
		uv_cpu_hub_info(cpu)->gnode_extra = gnode_extra;
		uv_cpu_hub_info(cpu)->global_mmr_base = mmr_base;
		uv_cpu_hub_info(cpu)->coherency_domain_number = sn_coherency_id;
		uv_cpu_hub_info(cpu)->scir.offset = uv_scir_offset(apicid);
		uv_node_to_blade[nid] = blade;
		uv_cpu_to_blade[cpu] = blade;
	}

	/* Add blade/pnode info for nodes without cpus */
	for_each_online_node(nid) {
		if (uv_node_to_blade[nid] >= 0)
			continue;
		paddr = node_start_pfn(nid) << PAGE_SHIFT;
		paddr = uv_soc_phys_ram_to_gpa(paddr);
		pnode = (paddr >> m_val) & pnode_mask;
		blade = boot_pnode_to_blade(pnode);
		uv_node_to_blade[nid] = blade;
	}

	map_gru_high(max_pnode);
	map_mmr_high(max_pnode);
	map_mmioh_high(max_pnode & pnode_io_mask);

	uv_cpu_init();
	uv_scir_register_cpu_notifier();
	uv_register_nmi_notifier();
	proc_mkdir("sgi_uv", NULL);

	/* register Legacy VGA I/O redirection handler */
	pci_register_set_vga_state(uv_set_vga_state);

	/*
	 * For a kdump kernel the reset must be BOOT_ACPI, not BOOT_EFI, as
	 * EFI is not enabled in the kdump kernel.
	 */
	if (is_kdump_kernel())
		reboot_type = BOOT_ACPI;
}