x2apic_uv_x.c 22.4 KB
Newer Older
J
Jack Steiner 已提交
1 2 3 4 5 6 7
/*
 * This file is subject to the terms and conditions of the GNU General Public
 * License.  See the file "COPYING" in the main directory of this archive
 * for more details.
 *
 * SGI UV APIC functions (note: not an Intel compatible APIC)
 *
8
 * Copyright (C) 2007-2010 Silicon Graphics, Inc. All rights reserved.
J
Jack Steiner 已提交
9 10
 */
#include <linux/cpumask.h>
11 12 13 14 15
#include <linux/hardirq.h>
#include <linux/proc_fs.h>
#include <linux/threads.h>
#include <linux/kernel.h>
#include <linux/module.h>
J
Jack Steiner 已提交
16 17 18
#include <linux/string.h>
#include <linux/ctype.h>
#include <linux/sched.h>
19
#include <linux/timer.h>
20
#include <linux/slab.h>
21 22
#include <linux/cpu.h>
#include <linux/init.h>
23
#include <linux/io.h>
24
#include <linux/pci.h>
25
#include <linux/kdebug.h>
26
#include <linux/delay.h>
C
Cliff Wickman 已提交
27
#include <linux/crash_dump.h>
28

J
Jack Steiner 已提交
29 30
#include <asm/uv/uv_mmrs.h>
#include <asm/uv/uv_hub.h>
31 32
#include <asm/current.h>
#include <asm/pgtable.h>
33
#include <asm/uv/bios.h>
34 35 36 37
#include <asm/uv/uv.h>
#include <asm/apic.h>
#include <asm/ipi.h>
#include <asm/smp.h>
38
#include <asm/x86_init.h>
C
Cliff Wickman 已提交
39
#include <asm/emergency-restart.h>
40 41 42 43 44 45 46
#include <asm/nmi.h>

/* BMC sets a bit this MMR non-zero before sending an NMI */
#define UVH_NMI_MMR				UVH_SCRATCH5
#define UVH_NMI_MMR_CLEAR			(UVH_NMI_MMR + 8)
#define UV_NMI_PENDING_MASK			(1UL << 63)
DEFINE_PER_CPU(unsigned long, cpu_last_nmi_count);
J
Jack Steiner 已提交
47

48 49
DEFINE_PER_CPU(int, x2apic_extra_bits);

50 51
#define PR_DEVEL(fmt, args...)	pr_devel("%s: " fmt, __func__, args)

52
static enum uv_system_type uv_system_type;
53
static u64 gru_start_paddr, gru_end_paddr;
54
static union uvh_apicid uvh_apicid;
55 56
int uv_min_hub_revision_id;
EXPORT_SYMBOL_GPL(uv_min_hub_revision_id);
57 58
unsigned int uv_apicid_hibits;
EXPORT_SYMBOL_GPL(uv_apicid_hibits);
59
static DEFINE_SPINLOCK(uv_nmi_lock);
60

61 62 63 64 65 66 67 68 69 70
static unsigned long __init uv_early_read_mmr(unsigned long addr)
{
	unsigned long val, *mmr;

	mmr = early_ioremap(UV_LOCAL_MMR_BASE | addr, sizeof(*mmr));
	val = *mmr;
	early_iounmap(mmr, sizeof(*mmr));
	return val;
}

71
static inline bool is_GRU_range(u64 start, u64 end)
72
{
73
	return start >= gru_start_paddr && end <= gru_end_paddr;
74 75
}

76
static bool uv_is_untracked_pat_range(u64 start, u64 end)
77 78 79
{
	return is_ISA_range(start, end) || is_GRU_range(start, end);
}
80

81
static int __init early_get_pnodeid(void)
82 83
{
	union uvh_node_id_u node_id;
84 85
	union uvh_rh_gam_config_mmr_u  m_n_config;
	int pnode;
86 87

	/* Currently, all blades have same revision number */
88
	node_id.v = uv_early_read_mmr(UVH_NODE_ID);
89
	m_n_config.v = uv_early_read_mmr(UVH_RH_GAM_CONFIG_MMR);
90 91
	uv_min_hub_revision_id = node_id.s.revision;

92 93
	pnode = (node_id.s.node_id >> 1) & ((1 << m_n_config.s.n_skt) - 1);
	return pnode;
94 95
}

96
static void __init early_get_apic_pnode_shift(void)
97
{
98
	uvh_apicid.v = uv_early_read_mmr(UVH_APICID);
99 100 101 102 103 104 105
	if (!uvh_apicid.v)
		/*
		 * Old bios, use default value
		 */
		uvh_apicid.s.pnode_shift = UV_APIC_PNODE_SHIFT;
}

106 107 108 109 110 111 112 113 114
/*
 * Add an extra bit as dictated by bios to the destination apicid of
 * interrupts potentially passing through the UV HUB.  This prevents
 * a deadlock between interrupts and IO port operations.
 */
static void __init uv_set_apicid_hibit(void)
{
	union uvh_lb_target_physical_apic_id_mask_u apicid_mask;

115
	apicid_mask.v = uv_early_read_mmr(UVH_LB_TARGET_PHYSICAL_APIC_ID_MASK);
116 117 118
	uv_apicid_hibits = apicid_mask.s.bit_enables & UV_APICID_HIBIT_MASK;
}

119
static int __init uv_acpi_madt_oem_check(char *oem_id, char *oem_table_id)
120
{
121
	int pnodeid;
122

123
	if (!strcmp(oem_id, "SGI")) {
124
		pnodeid = early_get_pnodeid();
125
		early_get_apic_pnode_shift();
126
		x86_platform.is_untracked_pat_range =  uv_is_untracked_pat_range;
127
		x86_platform.nmi_init = uv_nmi_init;
128 129 130 131 132
		if (!strcmp(oem_table_id, "UVL"))
			uv_system_type = UV_LEGACY_APIC;
		else if (!strcmp(oem_table_id, "UVX"))
			uv_system_type = UV_X2APIC;
		else if (!strcmp(oem_table_id, "UVH")) {
T
Tejun Heo 已提交
133
			__this_cpu_write(x2apic_extra_bits,
134
				pnodeid << uvh_apicid.s.pnode_shift);
135
			uv_system_type = UV_NON_UNIQUE_APIC;
136
			uv_set_apicid_hibit();
137 138 139 140 141 142 143 144 145 146 147 148 149 150 151
			return 1;
		}
	}
	return 0;
}

enum uv_system_type get_uv_system_type(void)
{
	return uv_system_type;
}

int is_uv_system(void)
{
	return uv_system_type != UV_NONE;
}
152
EXPORT_SYMBOL_GPL(is_uv_system);
153

J
Jack Steiner 已提交
154 155 156 157 158 159 160 161 162 163 164 165 166 167 168
DEFINE_PER_CPU(struct uv_hub_info_s, __uv_hub_info);
EXPORT_PER_CPU_SYMBOL_GPL(__uv_hub_info);

struct uv_blade_info *uv_blade_info;
EXPORT_SYMBOL_GPL(uv_blade_info);

short *uv_node_to_blade;
EXPORT_SYMBOL_GPL(uv_node_to_blade);

short *uv_cpu_to_blade;
EXPORT_SYMBOL_GPL(uv_cpu_to_blade);

short uv_possible_blades;
EXPORT_SYMBOL_GPL(uv_possible_blades);

169 170 171
unsigned long sn_rtc_cycles_per_second;
EXPORT_SYMBOL(sn_rtc_cycles_per_second);

172
static const struct cpumask *uv_target_cpus(void)
J
Jack Steiner 已提交
173
{
174
	return cpu_online_mask;
J
Jack Steiner 已提交
175 176
}

177
static void uv_vector_allocation_domain(int cpu, struct cpumask *retmask)
J
Jack Steiner 已提交
178
{
179 180
	cpumask_clear(retmask);
	cpumask_set_cpu(cpu, retmask);
J
Jack Steiner 已提交
181 182
}

183
static int __cpuinit uv_wakeup_secondary(int phys_apicid, unsigned long start_rip)
J
Jack Steiner 已提交
184
{
185
#ifdef CONFIG_SMP
J
Jack Steiner 已提交
186
	unsigned long val;
187
	int pnode;
J
Jack Steiner 已提交
188

189
	pnode = uv_apicid_to_pnode(phys_apicid);
190
	phys_apicid |= uv_apicid_hibits;
J
Jack Steiner 已提交
191 192
	val = (1UL << UVH_IPI_INT_SEND_SHFT) |
	    (phys_apicid << UVH_IPI_INT_APIC_ID_SHFT) |
193
	    ((start_rip << UVH_IPI_INT_VECTOR_SHFT) >> 12) |
J
Jack Steiner 已提交
194
	    APIC_DM_INIT;
195
	uv_write_global_mmr64(pnode, UVH_IPI_INT, val);
J
Jack Steiner 已提交
196 197 198 199
	mdelay(10);

	val = (1UL << UVH_IPI_INT_SEND_SHFT) |
	    (phys_apicid << UVH_IPI_INT_APIC_ID_SHFT) |
200
	    ((start_rip << UVH_IPI_INT_VECTOR_SHFT) >> 12) |
J
Jack Steiner 已提交
201
	    APIC_DM_STARTUP;
202
	uv_write_global_mmr64(pnode, UVH_IPI_INT, val);
203 204

	atomic_set(&init_deasserted, 1);
205
#endif
J
Jack Steiner 已提交
206 207 208 209 210
	return 0;
}

static void uv_send_IPI_one(int cpu, int vector)
{
211
	unsigned long apicid;
212
	int pnode;
J
Jack Steiner 已提交
213

214
	apicid = per_cpu(x86_cpu_to_apicid, cpu);
215
	pnode = uv_apicid_to_pnode(apicid);
216
	uv_hub_send_ipi(pnode, apicid, vector);
J
Jack Steiner 已提交
217 218
}

219
static void uv_send_IPI_mask(const struct cpumask *mask, int vector)
J
Jack Steiner 已提交
220 221 222
{
	unsigned int cpu;

223
	for_each_cpu(cpu, mask)
224 225 226
		uv_send_IPI_one(cpu, vector);
}

227
static void uv_send_IPI_mask_allbutself(const struct cpumask *mask, int vector)
228 229
{
	unsigned int this_cpu = smp_processor_id();
230
	unsigned int cpu;
231

232
	for_each_cpu(cpu, mask) {
233
		if (cpu != this_cpu)
J
Jack Steiner 已提交
234
			uv_send_IPI_one(cpu, vector);
235
	}
J
Jack Steiner 已提交
236 237 238 239
}

static void uv_send_IPI_allbutself(int vector)
{
240
	unsigned int this_cpu = smp_processor_id();
241
	unsigned int cpu;
J
Jack Steiner 已提交
242

243
	for_each_online_cpu(cpu) {
244 245
		if (cpu != this_cpu)
			uv_send_IPI_one(cpu, vector);
246
	}
J
Jack Steiner 已提交
247 248 249 250
}

static void uv_send_IPI_all(int vector)
{
251
	uv_send_IPI_mask(cpu_online_mask, vector);
J
Jack Steiner 已提交
252 253 254 255 256 257 258
}

static int uv_apic_id_registered(void)
{
	return 1;
}

259
static void uv_init_apic_ldr(void)
260 261 262
{
}

263
static unsigned int uv_cpu_mask_to_apicid(const struct cpumask *cpumask)
J
Jack Steiner 已提交
264 265 266 267 268
{
	/*
	 * We're using fixed IRQ delivery, can only return one phys APIC ID.
	 * May as well be the first.
	 */
269 270
	int cpu = cpumask_first(cpumask);

271
	if ((unsigned)cpu < nr_cpu_ids)
272
		return per_cpu(x86_cpu_to_apicid, cpu) | uv_apicid_hibits;
J
Jack Steiner 已提交
273 274 275 276
	else
		return BAD_APICID;
}

277 278 279
static unsigned int
uv_cpu_mask_to_apicid_and(const struct cpumask *cpumask,
			  const struct cpumask *andmask)
M
Mike Travis 已提交
280 281 282 283 284 285 286
{
	int cpu;

	/*
	 * We're using fixed IRQ delivery, can only return one phys APIC ID.
	 * May as well be the first.
	 */
287
	for_each_cpu_and(cpu, cpumask, andmask) {
288 289
		if (cpumask_test_cpu(cpu, cpu_online_mask))
			break;
290
	}
291
	return per_cpu(x86_cpu_to_apicid, cpu) | uv_apicid_hibits;
M
Mike Travis 已提交
292 293
}

294
static unsigned int x2apic_get_apic_id(unsigned long x)
295 296 297 298
{
	unsigned int id;

	WARN_ON(preemptible() && num_online_cpus() > 1);
T
Tejun Heo 已提交
299
	id = x | __this_cpu_read(x2apic_extra_bits);
300 301 302 303

	return id;
}

304
static unsigned long set_apic_id(unsigned int id)
Y
Yinghai Lu 已提交
305 306 307 308 309 310 311 312 313 314 315
{
	unsigned long x;

	/* maskout x2apic_extra_bits ? */
	x = id;
	return x;
}

static unsigned int uv_read_apic_id(void)
{

316
	return x2apic_get_apic_id(apic_read(APIC_ID));
Y
Yinghai Lu 已提交
317 318
}

I
Ingo Molnar 已提交
319
static int uv_phys_pkg_id(int initial_apicid, int index_msb)
J
Jack Steiner 已提交
320
{
321
	return uv_read_apic_id() >> index_msb;
J
Jack Steiner 已提交
322 323 324 325 326 327 328
}

static void uv_send_IPI_self(int vector)
{
	apic_write(APIC_SELF_IPI, vector);
}

329
struct apic __refdata apic_x2apic_uv_x = {
I
Ingo Molnar 已提交
330 331 332 333 334 335

	.name				= "UV large system",
	.probe				= NULL,
	.acpi_madt_oem_check		= uv_acpi_madt_oem_check,
	.apic_id_registered		= uv_apic_id_registered,

336
	.irq_delivery_mode		= dest_Fixed,
J
Jack Steiner 已提交
337
	.irq_dest_mode			= 0, /* physical */
I
Ingo Molnar 已提交
338 339

	.target_cpus			= uv_target_cpus,
340
	.disable_esr			= 0,
341
	.dest_logical			= APIC_DEST_LOGICAL,
I
Ingo Molnar 已提交
342 343 344 345 346 347 348 349 350
	.check_apicid_used		= NULL,
	.check_apicid_present		= NULL,

	.vector_allocation_domain	= uv_vector_allocation_domain,
	.init_apic_ldr			= uv_init_apic_ldr,

	.ioapic_phys_id_map		= NULL,
	.setup_apic_routing		= NULL,
	.multi_timer_check		= NULL,
351
	.cpu_present_to_apicid		= default_cpu_present_to_apicid,
I
Ingo Molnar 已提交
352 353
	.apicid_to_cpu_present		= NULL,
	.setup_portio_remap		= NULL,
354
	.check_phys_apicid_present	= default_check_phys_apicid_present,
I
Ingo Molnar 已提交
355
	.enable_apic_mode		= NULL,
I
Ingo Molnar 已提交
356
	.phys_pkg_id			= uv_phys_pkg_id,
I
Ingo Molnar 已提交
357 358
	.mps_oem_check			= NULL,

359
	.get_apic_id			= x2apic_get_apic_id,
I
Ingo Molnar 已提交
360 361 362 363 364 365 366 367 368 369 370 371
	.set_apic_id			= set_apic_id,
	.apic_id_mask			= 0xFFFFFFFFu,

	.cpu_mask_to_apicid		= uv_cpu_mask_to_apicid,
	.cpu_mask_to_apicid_and		= uv_cpu_mask_to_apicid_and,

	.send_IPI_mask			= uv_send_IPI_mask,
	.send_IPI_mask_allbutself	= uv_send_IPI_mask_allbutself,
	.send_IPI_allbutself		= uv_send_IPI_allbutself,
	.send_IPI_all			= uv_send_IPI_all,
	.send_IPI_self			= uv_send_IPI_self,

372
	.wakeup_secondary_cpu		= uv_wakeup_secondary,
373 374
	.trampoline_phys_low		= DEFAULT_TRAMPOLINE_PHYS_LOW,
	.trampoline_phys_high		= DEFAULT_TRAMPOLINE_PHYS_HIGH,
I
Ingo Molnar 已提交
375 376 377
	.wait_for_init_deassert		= NULL,
	.smp_callin_clear_local_apic	= NULL,
	.inquire_remote_apic		= NULL,
Y
Yinghai Lu 已提交
378 379 380 381 382 383 384

	.read				= native_apic_msr_read,
	.write				= native_apic_msr_write,
	.icr_read			= native_x2apic_icr_read,
	.icr_write			= native_x2apic_icr_write,
	.wait_icr_idle			= native_x2apic_wait_icr_idle,
	.safe_wait_icr_idle		= native_safe_x2apic_wait_icr_idle,
J
Jack Steiner 已提交
385 386
};

387
static __cpuinit void set_x2apic_extra_bits(int pnode)
J
Jack Steiner 已提交
388
{
389
	__this_cpu_write(x2apic_extra_bits, pnode << uvh_apicid.s.pnode_shift);
J
Jack Steiner 已提交
390 391 392 393 394
}

/*
 * Called on boot cpu.
 */
395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412
static __init int boot_pnode_to_blade(int pnode)
{
	int blade;

	for (blade = 0; blade < uv_num_possible_blades(); blade++)
		if (pnode == uv_blade_info[blade].pnode)
			return blade;
	BUG();
}

struct redir_addr {
	unsigned long redirect;
	unsigned long alias;
};

#define DEST_SHIFT UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_0_MMR_DEST_BASE_SHFT

static __initdata struct redir_addr redir_addrs[] = {
413 414 415
	{UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_0_MMR, UVH_RH_GAM_ALIAS210_OVERLAY_CONFIG_0_MMR},
	{UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_1_MMR, UVH_RH_GAM_ALIAS210_OVERLAY_CONFIG_1_MMR},
	{UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_2_MMR, UVH_RH_GAM_ALIAS210_OVERLAY_CONFIG_2_MMR},
416 417 418 419
};

static __init void get_lowmem_redirect(unsigned long *base, unsigned long *size)
{
420
	union uvh_rh_gam_alias210_overlay_config_2_mmr_u alias;
421 422 423 424 425
	union uvh_rh_gam_alias210_redirect_config_2_mmr_u redirect;
	int i;

	for (i = 0; i < ARRAY_SIZE(redir_addrs); i++) {
		alias.v = uv_read_local_mmr(redir_addrs[i].alias);
426
		if (alias.s.enable && alias.s.base == 0) {
427 428 429 430 431 432
			*size = (1UL << alias.s.m_alias);
			redirect.v = uv_read_local_mmr(redir_addrs[i].redirect);
			*base = (unsigned long)redirect.s.dest_base << DEST_SHIFT;
			return;
		}
	}
433
	*base = *size = 0;
434 435
}

436 437
enum map_type {map_wb, map_uc};

438 439
static __init void map_high(char *id, unsigned long base, int pshift,
			int bshift, int max_pnode, enum map_type map_type)
440 441 442
{
	unsigned long bytes, paddr;

443 444
	paddr = base << pshift;
	bytes = (1UL << bshift) * (max_pnode + 1);
445
	printk(KERN_INFO "UV: Map %s_HI 0x%lx - 0x%lx\n", id, paddr,
446
						paddr + bytes);
447 448 449 450 451 452 453 454 455 456 457 458
	if (map_type == map_uc)
		init_extra_mapping_uc(paddr, bytes);
	else
		init_extra_mapping_wb(paddr, bytes);

}
static __init void map_gru_high(int max_pnode)
{
	union uvh_rh_gam_gru_overlay_config_mmr_u gru;
	int shift = UVH_RH_GAM_GRU_OVERLAY_CONFIG_MMR_BASE_SHFT;

	gru.v = uv_read_local_mmr(UVH_RH_GAM_GRU_OVERLAY_CONFIG_MMR);
459
	if (gru.s.enable) {
460
		map_high("GRU", gru.s.base, shift, shift, max_pnode, map_wb);
461 462 463 464
		gru_start_paddr = ((u64)gru.s.base << shift);
		gru_end_paddr = gru_start_paddr + (1UL << shift) * (max_pnode + 1);

	}
465 466
}

467 468 469 470 471 472 473
static __init void map_mmr_high(int max_pnode)
{
	union uvh_rh_gam_mmr_overlay_config_mmr_u mmr;
	int shift = UVH_RH_GAM_MMR_OVERLAY_CONFIG_MMR_BASE_SHFT;

	mmr.v = uv_read_local_mmr(UVH_RH_GAM_MMR_OVERLAY_CONFIG_MMR);
	if (mmr.s.enable)
474
		map_high("MMR", mmr.s.base, shift, shift, max_pnode, map_uc);
475 476
}

477 478 479 480 481 482 483
static __init void map_mmioh_high(int max_pnode)
{
	union uvh_rh_gam_mmioh_overlay_config_mmr_u mmioh;
	int shift = UVH_RH_GAM_MMIOH_OVERLAY_CONFIG_MMR_BASE_SHFT;

	mmioh.v = uv_read_local_mmr(UVH_RH_GAM_MMIOH_OVERLAY_CONFIG_MMR);
	if (mmioh.s.enable)
484 485
		map_high("MMIOH", mmioh.s.base, shift, mmioh.s.m_io,
			max_pnode, map_uc);
486 487
}

J
Jack Steiner 已提交
488 489 490 491 492 493
static __init void map_low_mmrs(void)
{
	init_extra_mapping_uc(UV_GLOBAL_MMR32_BASE, UV_GLOBAL_MMR32_SIZE);
	init_extra_mapping_uc(UV_LOCAL_MMR_BASE, UV_LOCAL_MMR_SIZE);
}

494 495
static __init void uv_rtc_init(void)
{
R
Russ Anderson 已提交
496 497
	long status;
	u64 ticks_per_sec;
498

R
Russ Anderson 已提交
499 500 501
	status = uv_bios_freq_base(BIOS_FREQ_BASE_REALTIME_CLOCK,
					&ticks_per_sec);
	if (status != BIOS_STATUS_SUCCESS || ticks_per_sec < 100000) {
502 503 504 505 506 507 508 509 510
		printk(KERN_WARNING
			"unable to determine platform RTC clock frequency, "
			"guessing.\n");
		/* BIOS gives wrong value for clock freq. so guess */
		sn_rtc_cycles_per_second = 1000000000000UL / 30000UL;
	} else
		sn_rtc_cycles_per_second = ticks_per_sec;
}

511 512 513 514 515 516 517 518 519 520 521
/*
 * percpu heartbeat timer
 */
static void uv_heartbeat(unsigned long ignored)
{
	struct timer_list *timer = &uv_hub_info->scir.timer;
	unsigned char bits = uv_hub_info->scir.state;

	/* flip heartbeat bit */
	bits ^= SCIR_CPU_HEARTBEAT;

522 523
	/* is this cpu idle? */
	if (idle_cpu(raw_smp_processor_id()))
524 525 526 527 528 529 530 531
		bits &= ~SCIR_CPU_ACTIVITY;
	else
		bits |= SCIR_CPU_ACTIVITY;

	/* update system controller interface reg */
	uv_set_scir_bits(bits);

	/* enable next timer period */
532
	mod_timer_pinned(timer, jiffies + SCIR_CPU_HB_INTERVAL);
533 534 535 536
}

static void __cpuinit uv_heartbeat_enable(int cpu)
{
537
	while (!uv_cpu_hub_info(cpu)->scir.enabled) {
538 539 540 541 542 543 544 545
		struct timer_list *timer = &uv_cpu_hub_info(cpu)->scir.timer;

		uv_set_cpu_scir_bits(cpu, SCIR_CPU_HEARTBEAT|SCIR_CPU_ACTIVITY);
		setup_timer(timer, uv_heartbeat, cpu);
		timer->expires = jiffies + SCIR_CPU_HB_INTERVAL;
		add_timer_on(timer, cpu);
		uv_cpu_hub_info(cpu)->scir.enabled = 1;

546 547 548
		/* also ensure that boot cpu is enabled */
		cpu = 0;
	}
549 550
}

551
#ifdef CONFIG_HOTPLUG_CPU
552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606
static void __cpuinit uv_heartbeat_disable(int cpu)
{
	if (uv_cpu_hub_info(cpu)->scir.enabled) {
		uv_cpu_hub_info(cpu)->scir.enabled = 0;
		del_timer(&uv_cpu_hub_info(cpu)->scir.timer);
	}
	uv_set_cpu_scir_bits(cpu, 0xff);
}

/*
 * cpu hotplug notifier
 */
static __cpuinit int uv_scir_cpu_notify(struct notifier_block *self,
				       unsigned long action, void *hcpu)
{
	long cpu = (long)hcpu;

	switch (action) {
	case CPU_ONLINE:
		uv_heartbeat_enable(cpu);
		break;
	case CPU_DOWN_PREPARE:
		uv_heartbeat_disable(cpu);
		break;
	default:
		break;
	}
	return NOTIFY_OK;
}

static __init void uv_scir_register_cpu_notifier(void)
{
	hotcpu_notifier(uv_scir_cpu_notify, 0);
}

#else /* !CONFIG_HOTPLUG_CPU */

static __init void uv_scir_register_cpu_notifier(void)
{
}

static __init int uv_init_heartbeat(void)
{
	int cpu;

	if (is_uv_system())
		for_each_online_cpu(cpu)
			uv_heartbeat_enable(cpu);
	return 0;
}

late_initcall(uv_init_heartbeat);

#endif /* !CONFIG_HOTPLUG_CPU */

607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630
/* Direct Legacy VGA I/O traffic to designated IOH */
int uv_set_vga_state(struct pci_dev *pdev, bool decode,
		      unsigned int command_bits, bool change_bridge)
{
	int domain, bus, rc;

	PR_DEVEL("devfn %x decode %d cmd %x chg_brdg %d\n",
			pdev->devfn, decode, command_bits, change_bridge);

	if (!change_bridge)
		return 0;

	if ((command_bits & PCI_COMMAND_IO) == 0)
		return 0;

	domain = pci_domain_nr(pdev->bus);
	bus = pdev->bus->number;

	rc = uv_bios_set_legacy_vga_target(decode, domain, bus);
	PR_DEVEL("vga decode %d %x:%x, rc: %d\n", decode, domain, bus, rc);

	return rc;
}

631 632
/*
 * Called on each cpu to initialize the per_cpu UV data area.
633
 * FIXME: hotplug not supported yet
634 635 636 637 638 639 640 641 642 643 644 645 646
 */
void __cpuinit uv_cpu_init(void)
{
	/* CPU 0 initilization will be done via uv_system_init. */
	if (!uv_blade_info)
		return;

	uv_blade_info[uv_numa_blade_id()].nr_online_cpus++;

	if (get_uv_system_type() == UV_NON_UNIQUE_APIC)
		set_x2apic_extra_bits(uv_hub_info->pnode);
}

647 648 649 650 651
/*
 * When NMI is received, print a stack trace.
 */
int uv_handle_nmi(struct notifier_block *self, unsigned long reason, void *data)
{
652 653 654
	unsigned long real_uv_nmi;
	int bid;

655
	if (reason != DIE_NMIUNKNOWN)
656
		return NOTIFY_OK;
657 658 659 660

	if (in_crash_kexec)
		/* do nothing if entering the crash kernel */
		return NOTIFY_OK;
661

662
	/*
663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688
	 * Each blade has an MMR that indicates when an NMI has been sent
	 * to cpus on the blade. If an NMI is detected, atomically
	 * clear the MMR and update a per-blade NMI count used to
	 * cause each cpu on the blade to notice a new NMI.
	 */
	bid = uv_numa_blade_id();
	real_uv_nmi = (uv_read_local_mmr(UVH_NMI_MMR) & UV_NMI_PENDING_MASK);

	if (unlikely(real_uv_nmi)) {
		spin_lock(&uv_blade_info[bid].nmi_lock);
		real_uv_nmi = (uv_read_local_mmr(UVH_NMI_MMR) & UV_NMI_PENDING_MASK);
		if (real_uv_nmi) {
			uv_blade_info[bid].nmi_count++;
			uv_write_local_mmr(UVH_NMI_MMR_CLEAR, UV_NMI_PENDING_MASK);
		}
		spin_unlock(&uv_blade_info[bid].nmi_lock);
	}

	if (likely(__get_cpu_var(cpu_last_nmi_count) == uv_blade_info[bid].nmi_count))
		return NOTIFY_DONE;

	__get_cpu_var(cpu_last_nmi_count) = uv_blade_info[bid].nmi_count;

	/*
	 * Use a lock so only one cpu prints at a time.
	 * This prevents intermixed output.
689 690
	 */
	spin_lock(&uv_nmi_lock);
691
	pr_info("UV NMI stack dump cpu %u:\n", smp_processor_id());
692 693 694 695 696 697 698
	dump_stack();
	spin_unlock(&uv_nmi_lock);

	return NOTIFY_STOP;
}

static struct notifier_block uv_dump_stack_nmi_nb = {
699 700
	.notifier_call	= uv_handle_nmi,
	.priority = NMI_LOCAL_LOW_PRIOR - 1,
701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719
};

void uv_register_nmi_notifier(void)
{
	if (register_die_notifier(&uv_dump_stack_nmi_nb))
		printk(KERN_WARNING "UV NMI handler failed to register\n");
}

void uv_nmi_init(void)
{
	unsigned int value;

	/*
	 * Unmask NMI on all cpus
	 */
	value = apic_read(APIC_LVT1) | APIC_DM_NMI;
	value &= ~APIC_LVT_MASKED;
	apic_write(APIC_LVT1, value);
}
720 721

void __init uv_system_init(void)
J
Jack Steiner 已提交
722
{
723
	union uvh_rh_gam_config_mmr_u  m_n_config;
724
	union uvh_rh_gam_mmioh_overlay_config_mmr_u mmioh;
725 726
	union uvh_node_id_u node_id;
	unsigned long gnode_upper, lowmem_redir_base, lowmem_redir_size;
727
	int bytes, nid, cpu, lcpu, pnode, blade, i, j, m_val, n_val, n_io;
728
	int gnode_extra, max_pnode = 0;
729
	unsigned long mmr_base, present, paddr;
730
	unsigned short pnode_mask, pnode_io_mask;
J
Jack Steiner 已提交
731

J
Jack Steiner 已提交
732 733
	map_low_mmrs();

734
	m_n_config.v = uv_read_local_mmr(UVH_RH_GAM_CONFIG_MMR );
735 736
	m_val = m_n_config.s.m_skt;
	n_val = m_n_config.s.n_skt;
737 738
	mmioh.v = uv_read_local_mmr(UVH_RH_GAM_MMIOH_OVERLAY_CONFIG_MMR);
	n_io = mmioh.s.n_io;
J
Jack Steiner 已提交
739 740 741
	mmr_base =
	    uv_read_local_mmr(UVH_RH_GAM_MMR_OVERLAY_CONFIG_MMR) &
	    ~UV_MMR_ENABLE;
742
	pnode_mask = (1 << n_val) - 1;
743 744
	pnode_io_mask = (1 << n_io) - 1;

745 746 747
	node_id.v = uv_read_local_mmr(UVH_NODE_ID);
	gnode_extra = (node_id.s.node_id & ~((1 << n_val) - 1)) >> 1;
	gnode_upper = ((unsigned long)gnode_extra  << m_val);
748 749
	printk(KERN_INFO "UV: N %d, M %d, N_IO: %d, gnode_upper 0x%lx, gnode_extra 0x%x, pnode_mask 0x%x, pnode_io_mask 0x%x\n",
			n_val, m_val, n_io, gnode_upper, gnode_extra, pnode_mask, pnode_io_mask);
750

J
Jack Steiner 已提交
751 752
	printk(KERN_DEBUG "UV: global MMR base 0x%lx\n", mmr_base);

753 754 755
	for(i = 0; i < UVH_NODE_PRESENT_TABLE_DEPTH; i++)
		uv_possible_blades +=
		  hweight64(uv_read_local_mmr( UVH_NODE_PRESENT_TABLE + i * 8));
J
Jack Steiner 已提交
756 757 758
	printk(KERN_DEBUG "UV: Found %d blades\n", uv_num_possible_blades());

	bytes = sizeof(struct uv_blade_info) * uv_num_possible_blades();
759
	uv_blade_info = kzalloc(bytes, GFP_KERNEL);
760
	BUG_ON(!uv_blade_info);
761

762 763
	for (blade = 0; blade < uv_num_possible_blades(); blade++)
		uv_blade_info[blade].memory_nid = -1;
J
Jack Steiner 已提交
764

765 766
	get_lowmem_redirect(&lowmem_redir_base, &lowmem_redir_size);

J
Jack Steiner 已提交
767
	bytes = sizeof(uv_node_to_blade[0]) * num_possible_nodes();
768
	uv_node_to_blade = kmalloc(bytes, GFP_KERNEL);
769
	BUG_ON(!uv_node_to_blade);
J
Jack Steiner 已提交
770 771 772
	memset(uv_node_to_blade, 255, bytes);

	bytes = sizeof(uv_cpu_to_blade[0]) * num_possible_cpus();
773
	uv_cpu_to_blade = kmalloc(bytes, GFP_KERNEL);
774
	BUG_ON(!uv_cpu_to_blade);
J
Jack Steiner 已提交
775 776
	memset(uv_cpu_to_blade, 255, bytes);

777 778 779 780 781 782
	blade = 0;
	for (i = 0; i < UVH_NODE_PRESENT_TABLE_DEPTH; i++) {
		present = uv_read_local_mmr(UVH_NODE_PRESENT_TABLE + i * 8);
		for (j = 0; j < 64; j++) {
			if (!test_bit(j, &present))
				continue;
783
			pnode = (i * 64 + j) & pnode_mask;
784
			uv_blade_info[blade].pnode = pnode;
785
			uv_blade_info[blade].nr_possible_cpus = 0;
J
Jack Steiner 已提交
786
			uv_blade_info[blade].nr_online_cpus = 0;
787
			spin_lock_init(&uv_blade_info[blade].nmi_lock);
788
			max_pnode = max(pnode, max_pnode);
789
			blade++;
J
Jack Steiner 已提交
790
		}
791
	}
J
Jack Steiner 已提交
792

793
	uv_bios_init();
794 795
	uv_bios_get_sn_info(0, &uv_type, &sn_partition_id, &sn_coherency_id,
			    &sn_region_size, &system_serial_number);
796 797
	uv_rtc_init();

798
	for_each_present_cpu(cpu) {
799 800
		int apicid = per_cpu(x86_cpu_to_apicid, cpu);

801
		nid = cpu_to_node(cpu);
802 803 804
		/*
		 * apic_pnode_shift must be set before calling uv_apicid_to_pnode();
		 */
805
		uv_cpu_hub_info(cpu)->pnode_mask = pnode_mask;
806
		uv_cpu_hub_info(cpu)->apic_pnode_shift = uvh_apicid.s.pnode_shift;
807
		pnode = uv_apicid_to_pnode(apicid);
808 809 810 811
		blade = boot_pnode_to_blade(pnode);
		lcpu = uv_blade_info[blade].nr_possible_cpus;
		uv_blade_info[blade].nr_possible_cpus++;

812 813 814
		/* Any node on the blade, else will contain -1. */
		uv_blade_info[blade].memory_nid = nid;

815
		uv_cpu_hub_info(cpu)->lowmem_remap_base = lowmem_redir_base;
816
		uv_cpu_hub_info(cpu)->lowmem_remap_top = lowmem_redir_size;
817
		uv_cpu_hub_info(cpu)->m_val = m_val;
818
		uv_cpu_hub_info(cpu)->n_val = n_val;
J
Jack Steiner 已提交
819 820
		uv_cpu_hub_info(cpu)->numa_blade_id = blade;
		uv_cpu_hub_info(cpu)->blade_processor_id = lcpu;
821
		uv_cpu_hub_info(cpu)->pnode = pnode;
822
		uv_cpu_hub_info(cpu)->gpa_mask = (1UL << (m_val + n_val)) - 1;
823
		uv_cpu_hub_info(cpu)->gnode_upper = gnode_upper;
824
		uv_cpu_hub_info(cpu)->gnode_extra = gnode_extra;
J
Jack Steiner 已提交
825
		uv_cpu_hub_info(cpu)->global_mmr_base = mmr_base;
826
		uv_cpu_hub_info(cpu)->coherency_domain_number = sn_coherency_id;
827
		uv_cpu_hub_info(cpu)->scir.offset = uv_scir_offset(apicid);
J
Jack Steiner 已提交
828 829 830
		uv_node_to_blade[nid] = blade;
		uv_cpu_to_blade[cpu] = blade;
	}
831

832 833 834 835 836
	/* Add blade/pnode info for nodes without cpus */
	for_each_online_node(nid) {
		if (uv_node_to_blade[nid] >= 0)
			continue;
		paddr = node_start_pfn(nid) << PAGE_SHIFT;
837
		paddr = uv_soc_phys_ram_to_gpa(paddr);
838 839 840 841 842
		pnode = (paddr >> m_val) & pnode_mask;
		blade = boot_pnode_to_blade(pnode);
		uv_node_to_blade[nid] = blade;
	}

843
	map_gru_high(max_pnode);
844
	map_mmr_high(max_pnode);
845
	map_mmioh_high(max_pnode & pnode_io_mask);
J
Jack Steiner 已提交
846

847
	uv_cpu_init();
848
	uv_scir_register_cpu_notifier();
849
	uv_register_nmi_notifier();
850
	proc_mkdir("sgi_uv", NULL);
851 852 853

	/* register Legacy VGA I/O redirection handler */
	pci_register_set_vga_state(uv_set_vga_state);
C
Cliff Wickman 已提交
854 855 856 857 858 859 860

	/*
	 * For a kdump kernel the reset must be BOOT_ACPI, not BOOT_EFI, as
	 * EFI is not enabled in the kdump kernel.
	 */
	if (is_kdump_kernel())
		reboot_type = BOOT_ACPI;
J
Jack Steiner 已提交
861
}