/*
 * This file is subject to the terms and conditions of the GNU General Public
 * License.  See the file "COPYING" in the main directory of this archive
 * for more details.
 *
 * SGI UV APIC functions (note: not an Intel compatible APIC)
 *
 * Copyright (C) 2007-2010 Silicon Graphics, Inc. All rights reserved.
 */
#include <linux/cpumask.h>
11 12 13 14 15
#include <linux/hardirq.h>
#include <linux/proc_fs.h>
#include <linux/threads.h>
#include <linux/kernel.h>
#include <linux/module.h>
J
Jack Steiner 已提交
16 17 18
#include <linux/string.h>
#include <linux/ctype.h>
#include <linux/sched.h>
19
#include <linux/timer.h>
20
#include <linux/slab.h>
21 22
#include <linux/cpu.h>
#include <linux/init.h>
23
#include <linux/io.h>
24
#include <linux/pci.h>
25
#include <linux/kdebug.h>
26
#include <linux/delay.h>
C
Cliff Wickman 已提交
27
#include <linux/crash_dump.h>
28

J
Jack Steiner 已提交
29 30
#include <asm/uv/uv_mmrs.h>
#include <asm/uv/uv_hub.h>
31 32
#include <asm/current.h>
#include <asm/pgtable.h>
33
#include <asm/uv/bios.h>
34 35 36 37
#include <asm/uv/uv.h>
#include <asm/apic.h>
#include <asm/ipi.h>
#include <asm/smp.h>
38
#include <asm/x86_init.h>
C
Cliff Wickman 已提交
39
#include <asm/emergency-restart.h>
40 41 42 43 44 45 46
#include <asm/nmi.h>

/*
 * The BMC sets a bit in this MMR (making it non-zero) before sending an NMI.
 * uv_handle_nmi() tests UV_NMI_PENDING_MASK in UVH_NMI_MMR and acknowledges
 * the NMI by writing that mask to UVH_NMI_MMR_CLEAR.
 */
#define UVH_NMI_MMR				UVH_SCRATCH5
#define UVH_NMI_MMR_CLEAR			(UVH_NMI_MMR + 8)
#define UV_NMI_PENDING_MASK			(1UL << 63)
/* Per-cpu copy of the blade nmi_count last seen by uv_handle_nmi(). */
DEFINE_PER_CPU(unsigned long, cpu_last_nmi_count);
J
Jack Steiner 已提交
47

48 49
/*
 * Per-cpu bits OR'ed into the value passed to x2apic_get_apic_id().
 * Written as (pnode << uvh_apicid.s.pnode_shift).
 */
DEFINE_PER_CPU(int, x2apic_extra_bits);

50 51
/*
 * pr_devel() wrapper that prefixes the message with the calling function's
 * name.  "##args" drops the preceding comma when no variadic arguments are
 * supplied, so PR_DEVEL("text\n") also expands to a valid call.
 */
#define PR_DEVEL(fmt, args...)	pr_devel("%s: " fmt, __func__, ##args)

52
static enum uv_system_type uv_system_type;
53
static u64 gru_start_paddr, gru_end_paddr;
54
static union uvh_apicid uvh_apicid;
55 56
int uv_min_hub_revision_id;
EXPORT_SYMBOL_GPL(uv_min_hub_revision_id);
57 58
unsigned int uv_apicid_hibits;
EXPORT_SYMBOL_GPL(uv_apicid_hibits);
59
static DEFINE_SPINLOCK(uv_nmi_lock);
60

61 62
static struct apic apic_x2apic_uv_x;

63 64 65 66 67 68 69 70 71 72
/*
 * Read one local UV MMR during early boot.
 *
 * @addr is OR'ed with UV_LOCAL_MMR_BASE, the resulting address is mapped
 * with early_ioremap() just long enough to read one unsigned long, and the
 * mapping is released again before returning the value.
 */
static unsigned long __init uv_early_read_mmr(unsigned long addr)
{
	unsigned long *mapped, value;

	mapped = early_ioremap(UV_LOCAL_MMR_BASE | addr, sizeof(*mapped));
	value = *mapped;
	early_iounmap(mapped, sizeof(*mapped));

	return value;
}

73
/*
 * Return true when [start, end] lies entirely inside the GRU range
 * [gru_start_paddr, gru_end_paddr] recorded by map_gru_high().
 */
static inline bool is_GRU_range(u64 start, u64 end)
{
	return start >= gru_start_paddr && end <= gru_end_paddr;
}

78
/*
 * x86_platform.is_untracked_pat_range hook for UV: a range is reported as
 * untracked when it is an ISA range or falls inside the GRU range.
 */
static bool uv_is_untracked_pat_range(u64 start, u64 end)
{
	return is_ISA_range(start, end) || is_GRU_range(start, end);
}
82

83
/*
 * Early-boot probe of the local hub.
 *
 * Reads UVH_NODE_ID and UVH_RH_GAM_CONFIG_MMR, records the hub revision in
 * uv_min_hub_revision_id and uv_hub_info->hub_revision (offset by
 * UV2_HUB_REVISION_BASE - 1 for either UV2 part number), and returns the
 * pnode: node_id shifted right by one and masked to n_skt bits.
 */
static int __init early_get_pnodeid(void)
{
	union uvh_node_id_u node_id;
	union uvh_rh_gam_config_mmr_u  m_n_config;
	int pnode;

	/* Currently, all blades have same revision number */
	node_id.v = uv_early_read_mmr(UVH_NODE_ID);
	m_n_config.v = uv_early_read_mmr(UVH_RH_GAM_CONFIG_MMR);
	uv_min_hub_revision_id = node_id.s.revision;

	if (node_id.s.part_number == UV2_HUB_PART_NUMBER)
		uv_min_hub_revision_id += UV2_HUB_REVISION_BASE - 1;
	if (node_id.s.part_number == UV2_HUB_PART_NUMBER_X)
		uv_min_hub_revision_id += UV2_HUB_REVISION_BASE - 1;

	uv_hub_info->hub_revision = uv_min_hub_revision_id;
	pnode = (node_id.s.node_id >> 1) & ((1 << m_n_config.s.n_skt) - 1);
	return pnode;
}

104
/*
 * Load the UVH_APICID MMR into uvh_apicid.  A value of zero is treated as
 * an old BIOS that did not program the register, in which case the default
 * UV_APIC_PNODE_SHIFT is used for pnode_shift.
 */
static void __init early_get_apic_pnode_shift(void)
{
	uvh_apicid.v = uv_early_read_mmr(UVH_APICID);
	if (!uvh_apicid.v) {
		/*
		 * Old bios, use default value
		 */
		uvh_apicid.s.pnode_shift = UV_APIC_PNODE_SHIFT;
	}
}

114 115 116 117 118 119 120
/*
 * Add an extra bit as dictated by bios to the destination apicid of
 * interrupts potentially passing through the UV HUB.  This prevents
 * a deadlock between interrupts and IO port operations.
 *
 * Only UV1 hubs are handled: the enable bits of
 * UV1H_LB_TARGET_PHYSICAL_APIC_ID_MASK, masked with UV_APICID_HIBIT_MASK,
 * are stored in uv_apicid_hibits.  On other hubs the variable is left
 * unchanged.
 */
static void __init uv_set_apicid_hibit(void)
{
	union uv1h_lb_target_physical_apic_id_mask_u apicid_mask;

	if (is_uv1_hub()) {
		apicid_mask.v =
			uv_early_read_mmr(UV1H_LB_TARGET_PHYSICAL_APIC_ID_MASK);
		uv_apicid_hibits =
			apicid_mask.s1.bit_enables & UV_APICID_HIBIT_MASK;
	}
}

131
/*
 * MADT OEM check for the UV APIC driver.
 *
 * An oem_id of "SGI" selects UV1 and "SGI2" selects UV2.  For either, the
 * hub revision, pnode and APIC pnode shift are probed and the UV platform
 * hooks (untracked PAT range, NMI init) are installed.  oem_table_id then
 * selects the system type:
 *   "UVL" -> UV_LEGACY_APIC
 *   "UVX" -> UV_X2APIC
 *   "UVH" -> UV_NON_UNIQUE_APIC (also seeds this cpu's x2apic_extra_bits and
 *            the APIC ID high bits)
 *
 * Returns 1 only in the "UVH" case; every other combination returns 0.
 */
static int __init uv_acpi_madt_oem_check(char *oem_id, char *oem_table_id)
{
	int pnodeid, is_uv1, is_uv2;

	is_uv1 = !strcmp(oem_id, "SGI");
	is_uv2 = !strcmp(oem_id, "SGI2");
	if (is_uv1 || is_uv2) {
		uv_hub_info->hub_revision =
			is_uv1 ? UV1_HUB_REVISION_BASE : UV2_HUB_REVISION_BASE;
		pnodeid = early_get_pnodeid();
		early_get_apic_pnode_shift();
		x86_platform.is_untracked_pat_range =  uv_is_untracked_pat_range;
		x86_platform.nmi_init = uv_nmi_init;
		if (!strcmp(oem_table_id, "UVL"))
			uv_system_type = UV_LEGACY_APIC;
		else if (!strcmp(oem_table_id, "UVX"))
			uv_system_type = UV_X2APIC;
		else if (!strcmp(oem_table_id, "UVH")) {
			__this_cpu_write(x2apic_extra_bits,
				pnodeid << uvh_apicid.s.pnode_shift);
			uv_system_type = UV_NON_UNIQUE_APIC;
			uv_set_apicid_hibit();
			return 1;
		}
	}
	return 0;
}

/* Return the UV system type recorded by uv_acpi_madt_oem_check(). */
enum uv_system_type get_uv_system_type(void)
{
	return uv_system_type;
}

/* Return non-zero when a UV system type other than UV_NONE was detected. */
int is_uv_system(void)
{
	return uv_system_type != UV_NONE;
}
EXPORT_SYMBOL_GPL(is_uv_system);
169

J
Jack Steiner 已提交
170 171 172 173 174 175 176 177 178 179 180 181 182 183 184
/* Per-cpu hub description; filled in for each present cpu by uv_system_init(). */
DEFINE_PER_CPU(struct uv_hub_info_s, __uv_hub_info);
EXPORT_PER_CPU_SYMBOL_GPL(__uv_hub_info);

/* Array with one entry per possible blade; allocated in uv_system_init(). */
struct uv_blade_info *uv_blade_info;
EXPORT_SYMBOL_GPL(uv_blade_info);

/* NUMA node id -> blade index; entries start out as -1 (all bytes 0xff). */
short *uv_node_to_blade;
EXPORT_SYMBOL_GPL(uv_node_to_blade);

/* cpu number -> blade index; entries start out as -1 (all bytes 0xff). */
short *uv_cpu_to_blade;
EXPORT_SYMBOL_GPL(uv_cpu_to_blade);

/* Number of bits set in the node-present table, summed in uv_system_init(). */
short uv_possible_blades;
EXPORT_SYMBOL_GPL(uv_possible_blades);

/* RTC frequency established by uv_rtc_init(). */
unsigned long sn_rtc_cycles_per_second;
EXPORT_SYMBOL(sn_rtc_cycles_per_second);

188
static const struct cpumask *uv_target_cpus(void)
J
Jack Steiner 已提交
189
{
190
	return cpu_online_mask;
J
Jack Steiner 已提交
191 192
}

193
/*
 * apic->vector_allocation_domain hook: the domain for @cpu is that cpu
 * alone, so @retmask is cleared and only @cpu's bit is set.
 */
static void uv_vector_allocation_domain(int cpu, struct cpumask *retmask)
{
	cpumask_clear(retmask);
	cpumask_set_cpu(cpu, retmask);
}

199
/*
 * Wake a secondary cpu by writing an INIT and then a STARTUP request to the
 * UVH_IPI_INT MMR of the pnode that owns @phys_apicid.
 *
 * @phys_apicid: physical APIC ID of the cpu to start
 * @start_rip:   start address; the vector field is
 *               (start_rip << UVH_IPI_INT_VECTOR_SHFT) >> 12
 *
 * Without CONFIG_SMP this is a no-op.  Always returns 0.
 */
static int __cpuinit uv_wakeup_secondary(int phys_apicid, unsigned long start_rip)
{
#ifdef CONFIG_SMP
	unsigned long apicid, val;
	int pnode;

	pnode = uv_apicid_to_pnode(phys_apicid);

	/*
	 * Widen to unsigned long before shifting: with the high bits OR'ed
	 * in, shifting the signed int could overflow and sign-extend into
	 * the upper part of the 64-bit MMR value.
	 */
	apicid = (unsigned int)phys_apicid | uv_apicid_hibits;

	/* Fields shared by both requests; only the delivery mode differs. */
	val = (1UL << UVH_IPI_INT_SEND_SHFT) |
	    (apicid << UVH_IPI_INT_APIC_ID_SHFT) |
	    ((start_rip << UVH_IPI_INT_VECTOR_SHFT) >> 12);

	uv_write_global_mmr64(pnode, UVH_IPI_INT, val | APIC_DM_INIT);
	uv_write_global_mmr64(pnode, UVH_IPI_INT, val | APIC_DM_STARTUP);

	atomic_set(&init_deasserted, 1);
#endif
	return 0;
}

static void uv_send_IPI_one(int cpu, int vector)
{
226
	unsigned long apicid;
227
	int pnode;
J
Jack Steiner 已提交
228

229
	apicid = per_cpu(x86_cpu_to_apicid, cpu);
230
	pnode = uv_apicid_to_pnode(apicid);
231
	uv_hub_send_ipi(pnode, apicid, vector);
J
Jack Steiner 已提交
232 233
}

234
static void uv_send_IPI_mask(const struct cpumask *mask, int vector)
J
Jack Steiner 已提交
235 236 237
{
	unsigned int cpu;

238
	for_each_cpu(cpu, mask)
239 240 241
		uv_send_IPI_one(cpu, vector);
}

242
static void uv_send_IPI_mask_allbutself(const struct cpumask *mask, int vector)
243 244
{
	unsigned int this_cpu = smp_processor_id();
245
	unsigned int cpu;
246

247
	for_each_cpu(cpu, mask) {
248
		if (cpu != this_cpu)
J
Jack Steiner 已提交
249
			uv_send_IPI_one(cpu, vector);
250
	}
J
Jack Steiner 已提交
251 252 253 254
}

static void uv_send_IPI_allbutself(int vector)
{
255
	unsigned int this_cpu = smp_processor_id();
256
	unsigned int cpu;
J
Jack Steiner 已提交
257

258
	for_each_online_cpu(cpu) {
259 260
		if (cpu != this_cpu)
			uv_send_IPI_one(cpu, vector);
261
	}
J
Jack Steiner 已提交
262 263 264 265
}

static void uv_send_IPI_all(int vector)
{
266
	uv_send_IPI_mask(cpu_online_mask, vector);
J
Jack Steiner 已提交
267 268
}

269 270 271 272 273
/* apic->apic_id_valid hook: every APIC ID is accepted; @apicid is unused. */
static int uv_apic_id_valid(int apicid)
{
	(void)apicid;

	return 1;
}

J
Jack Steiner 已提交
274 275 276 277 278
/* apic->apic_id_registered hook: unconditionally reports success (1). */
static int uv_apic_id_registered(void)
{
	return 1;
}

279
/* apic->init_apic_ldr hook: intentionally empty, nothing is programmed. */
static void uv_init_apic_ldr(void)
{
}

283
static unsigned int uv_cpu_mask_to_apicid(const struct cpumask *cpumask)
J
Jack Steiner 已提交
284 285 286 287 288
{
	/*
	 * We're using fixed IRQ delivery, can only return one phys APIC ID.
	 * May as well be the first.
	 */
289 290
	int cpu = cpumask_first(cpumask);

291
	if ((unsigned)cpu < nr_cpu_ids)
292
		return per_cpu(x86_cpu_to_apicid, cpu) | uv_apicid_hibits;
J
Jack Steiner 已提交
293 294 295 296
	else
		return BAD_APICID;
}

297 298 299
static unsigned int
uv_cpu_mask_to_apicid_and(const struct cpumask *cpumask,
			  const struct cpumask *andmask)
M
Mike Travis 已提交
300 301 302 303 304 305 306
{
	int cpu;

	/*
	 * We're using fixed IRQ delivery, can only return one phys APIC ID.
	 * May as well be the first.
	 */
307
	for_each_cpu_and(cpu, cpumask, andmask) {
308 309
		if (cpumask_test_cpu(cpu, cpu_online_mask))
			break;
310
	}
311
	return per_cpu(x86_cpu_to_apicid, cpu) | uv_apicid_hibits;
M
Mike Travis 已提交
312 313
}

314
static unsigned int x2apic_get_apic_id(unsigned long x)
315 316 317 318
{
	unsigned int id;

	WARN_ON(preemptible() && num_online_cpus() > 1);
T
Tejun Heo 已提交
319
	id = x | __this_cpu_read(x2apic_extra_bits);
320 321 322 323

	return id;
}

324
/*
 * apic->set_apic_id hook: returns @id unchanged, widened to unsigned long.
 * The extra bits added by x2apic_get_apic_id() are not masked out here.
 */
static unsigned long set_apic_id(unsigned int id)
{
	unsigned long x;

	/* maskout x2apic_extra_bits ? */
	x = id;
	return x;
}

static unsigned int uv_read_apic_id(void)
{

336
	return x2apic_get_apic_id(apic_read(APIC_ID));
Y
Yinghai Lu 已提交
337 338
}

I
Ingo Molnar 已提交
339
/*
 * apic->phys_pkg_id hook: the package id is the current cpu's APIC ID (as
 * returned by uv_read_apic_id()) shifted right by @index_msb.
 * @initial_apicid is not used.
 */
static int uv_phys_pkg_id(int initial_apicid, int index_msb)
{
	return uv_read_apic_id() >> index_msb;
}

/* Send @vector to the calling cpu by writing it to the APIC_SELF_IPI register. */
static void uv_send_IPI_self(int vector)
{
	apic_write(APIC_SELF_IPI, vector);
}

349 350 351 352 353
/*
 * apic->probe hook: returns 1 when the active driver ("apic") is already
 * this UV driver, and 0 otherwise.
 */
static int uv_probe(void)
{
	if (apic == &apic_x2apic_uv_x)
		return 1;

	return 0;
}

354
/*
 * APIC driver description for SGI UV systems.  Hooks that UV does not
 * implement are left NULL; register access goes through the native
 * MSR-based x2apic accessors.
 */
static struct apic __refdata apic_x2apic_uv_x = {

	.name				= "UV large system",
	.probe				= uv_probe,
	.acpi_madt_oem_check		= uv_acpi_madt_oem_check,
	.apic_id_valid			= uv_apic_id_valid,
	.apic_id_registered		= uv_apic_id_registered,

	.irq_delivery_mode		= dest_Fixed,
	.irq_dest_mode			= 0, /* physical */

	.target_cpus			= uv_target_cpus,
	.disable_esr			= 0,
	.dest_logical			= APIC_DEST_LOGICAL,
	.check_apicid_used		= NULL,
	.check_apicid_present		= NULL,

	.vector_allocation_domain	= uv_vector_allocation_domain,
	.init_apic_ldr			= uv_init_apic_ldr,

	.ioapic_phys_id_map		= NULL,
	.setup_apic_routing		= NULL,
	.multi_timer_check		= NULL,
	.cpu_present_to_apicid		= default_cpu_present_to_apicid,
	.apicid_to_cpu_present		= NULL,
	.setup_portio_remap		= NULL,
	.check_phys_apicid_present	= default_check_phys_apicid_present,
	.enable_apic_mode		= NULL,
	.phys_pkg_id			= uv_phys_pkg_id,
	.mps_oem_check			= NULL,

	.get_apic_id			= x2apic_get_apic_id,
	.set_apic_id			= set_apic_id,
	.apic_id_mask			= 0xFFFFFFFFu,

	.cpu_mask_to_apicid		= uv_cpu_mask_to_apicid,
	.cpu_mask_to_apicid_and		= uv_cpu_mask_to_apicid_and,

	.send_IPI_mask			= uv_send_IPI_mask,
	.send_IPI_mask_allbutself	= uv_send_IPI_mask_allbutself,
	.send_IPI_allbutself		= uv_send_IPI_allbutself,
	.send_IPI_all			= uv_send_IPI_all,
	.send_IPI_self			= uv_send_IPI_self,

	.wakeup_secondary_cpu		= uv_wakeup_secondary,
	.trampoline_phys_low		= DEFAULT_TRAMPOLINE_PHYS_LOW,
	.trampoline_phys_high		= DEFAULT_TRAMPOLINE_PHYS_HIGH,
	.wait_for_init_deassert		= NULL,
	.smp_callin_clear_local_apic	= NULL,
	.inquire_remote_apic		= NULL,

	.read				= native_apic_msr_read,
	.write				= native_apic_msr_write,
	.eoi_write			= native_apic_msr_eoi_write,
	.icr_read			= native_x2apic_icr_read,
	.icr_write			= native_x2apic_icr_write,
	.wait_icr_idle			= native_x2apic_wait_icr_idle,
	.safe_wait_icr_idle		= native_safe_x2apic_wait_icr_idle,
};

414
static __cpuinit void set_x2apic_extra_bits(int pnode)
J
Jack Steiner 已提交
415
{
416
	__this_cpu_write(x2apic_extra_bits, pnode << uvh_apicid.s.pnode_shift);
J
Jack Steiner 已提交
417 418 419 420 421
}

/*
 * Called on boot cpu.
 */
422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439
/*
 * Linear search of uv_blade_info[] for the entry whose pnode equals @pnode.
 * Returns the blade index; hits BUG() when no blade matches.
 */
static __init int boot_pnode_to_blade(int pnode)
{
	int idx = 0;

	while (idx < uv_num_possible_blades()) {
		if (uv_blade_info[idx].pnode == pnode)
			return idx;
		idx++;
	}
	BUG();
}

struct redir_addr {
	unsigned long redirect;
	unsigned long alias;
};

#define DEST_SHIFT UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_0_MMR_DEST_BASE_SHFT

static __initdata struct redir_addr redir_addrs[] = {
440 441 442
	{UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_0_MMR, UVH_RH_GAM_ALIAS210_OVERLAY_CONFIG_0_MMR},
	{UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_1_MMR, UVH_RH_GAM_ALIAS210_OVERLAY_CONFIG_1_MMR},
	{UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_2_MMR, UVH_RH_GAM_ALIAS210_OVERLAY_CONFIG_2_MMR},
443 444 445 446
};

static __init void get_lowmem_redirect(unsigned long *base, unsigned long *size)
{
447
	union uvh_rh_gam_alias210_overlay_config_2_mmr_u alias;
448 449 450 451 452
	union uvh_rh_gam_alias210_redirect_config_2_mmr_u redirect;
	int i;

	for (i = 0; i < ARRAY_SIZE(redir_addrs); i++) {
		alias.v = uv_read_local_mmr(redir_addrs[i].alias);
453
		if (alias.s.enable && alias.s.base == 0) {
454 455 456 457 458 459
			*size = (1UL << alias.s.m_alias);
			redirect.v = uv_read_local_mmr(redir_addrs[i].redirect);
			*base = (unsigned long)redirect.s.dest_base << DEST_SHIFT;
			return;
		}
	}
460
	*base = *size = 0;
461 462
}

463 464
/*
 * Mapping flavor for map_high(): map_uc selects init_extra_mapping_uc(),
 * anything else (map_wb) selects init_extra_mapping_wb().
 */
enum map_type {map_wb, map_uc};

465 466
static __init void map_high(char *id, unsigned long base, int pshift,
			int bshift, int max_pnode, enum map_type map_type)
467 468 469
{
	unsigned long bytes, paddr;

470 471
	paddr = base << pshift;
	bytes = (1UL << bshift) * (max_pnode + 1);
472
	printk(KERN_INFO "UV: Map %s_HI 0x%lx - 0x%lx\n", id, paddr,
473
						paddr + bytes);
474 475 476 477 478 479 480 481 482 483 484 485
	if (map_type == map_uc)
		init_extra_mapping_uc(paddr, bytes);
	else
		init_extra_mapping_wb(paddr, bytes);

}
static __init void map_gru_high(int max_pnode)
{
	union uvh_rh_gam_gru_overlay_config_mmr_u gru;
	int shift = UVH_RH_GAM_GRU_OVERLAY_CONFIG_MMR_BASE_SHFT;

	gru.v = uv_read_local_mmr(UVH_RH_GAM_GRU_OVERLAY_CONFIG_MMR);
486
	if (gru.s.enable) {
487
		map_high("GRU", gru.s.base, shift, shift, max_pnode, map_wb);
488 489 490 491
		gru_start_paddr = ((u64)gru.s.base << shift);
		gru_end_paddr = gru_start_paddr + (1UL << shift) * (max_pnode + 1);

	}
492 493
}

494 495 496 497 498 499 500
static __init void map_mmr_high(int max_pnode)
{
	union uvh_rh_gam_mmr_overlay_config_mmr_u mmr;
	int shift = UVH_RH_GAM_MMR_OVERLAY_CONFIG_MMR_BASE_SHFT;

	mmr.v = uv_read_local_mmr(UVH_RH_GAM_MMR_OVERLAY_CONFIG_MMR);
	if (mmr.s.enable)
501
		map_high("MMR", mmr.s.base, shift, shift, max_pnode, map_uc);
502 503
}

504 505 506
static __init void map_mmioh_high(int max_pnode)
{
	union uvh_rh_gam_mmioh_overlay_config_mmr_u mmioh;
507
	int shift;
508 509

	mmioh.v = uv_read_local_mmr(UVH_RH_GAM_MMIOH_OVERLAY_CONFIG_MMR);
510 511 512 513 514 515 516 517
	if (is_uv1_hub() && mmioh.s1.enable) {
		shift = UV1H_RH_GAM_MMIOH_OVERLAY_CONFIG_MMR_BASE_SHFT;
		map_high("MMIOH", mmioh.s1.base, shift, mmioh.s1.m_io,
			max_pnode, map_uc);
	}
	if (is_uv2_hub() && mmioh.s2.enable) {
		shift = UV2H_RH_GAM_MMIOH_OVERLAY_CONFIG_MMR_BASE_SHFT;
		map_high("MMIOH", mmioh.s2.base, shift, mmioh.s2.m_io,
518
			max_pnode, map_uc);
519
	}
520 521
}

J
Jack Steiner 已提交
522 523 524 525 526 527
/*
 * Create uncached extra mappings for the 32-bit global MMR range and the
 * local MMR range.
 */
static __init void map_low_mmrs(void)
{
	init_extra_mapping_uc(UV_GLOBAL_MMR32_BASE, UV_GLOBAL_MMR32_SIZE);
	init_extra_mapping_uc(UV_LOCAL_MMR_BASE, UV_LOCAL_MMR_SIZE);
}

528 529
static __init void uv_rtc_init(void)
{
R
Russ Anderson 已提交
530 531
	long status;
	u64 ticks_per_sec;
532

R
Russ Anderson 已提交
533 534 535
	status = uv_bios_freq_base(BIOS_FREQ_BASE_REALTIME_CLOCK,
					&ticks_per_sec);
	if (status != BIOS_STATUS_SUCCESS || ticks_per_sec < 100000) {
536 537 538 539 540 541 542 543 544
		printk(KERN_WARNING
			"unable to determine platform RTC clock frequency, "
			"guessing.\n");
		/* BIOS gives wrong value for clock freq. so guess */
		sn_rtc_cycles_per_second = 1000000000000UL / 30000UL;
	} else
		sn_rtc_cycles_per_second = ticks_per_sec;
}

545 546 547 548 549 550 551 552 553 554 555
/*
 * percpu heartbeat timer
 */
static void uv_heartbeat(unsigned long ignored)
{
	struct timer_list *timer = &uv_hub_info->scir.timer;
	unsigned char bits = uv_hub_info->scir.state;

	/* flip heartbeat bit */
	bits ^= SCIR_CPU_HEARTBEAT;

556 557
	/* is this cpu idle? */
	if (idle_cpu(raw_smp_processor_id()))
558 559 560 561 562 563 564 565
		bits &= ~SCIR_CPU_ACTIVITY;
	else
		bits |= SCIR_CPU_ACTIVITY;

	/* update system controller interface reg */
	uv_set_scir_bits(bits);

	/* enable next timer period */
566
	mod_timer_pinned(timer, jiffies + SCIR_CPU_HB_INTERVAL);
567 568 569 570
}

/*
 * Start the heartbeat timer on @cpu if it is not already running.
 *
 * The loop body runs for @cpu and then switches to cpu 0, so the boot cpu's
 * heartbeat is started as well the first time any cpu is enabled.  The loop
 * ends as soon as the cpu under consideration is already enabled.
 */
static void __cpuinit uv_heartbeat_enable(int cpu)
{
	while (!uv_cpu_hub_info(cpu)->scir.enabled) {
		struct timer_list *timer = &uv_cpu_hub_info(cpu)->scir.timer;

		uv_set_cpu_scir_bits(cpu, SCIR_CPU_HEARTBEAT|SCIR_CPU_ACTIVITY);
		setup_timer(timer, uv_heartbeat, cpu);
		timer->expires = jiffies + SCIR_CPU_HB_INTERVAL;
		add_timer_on(timer, cpu);
		uv_cpu_hub_info(cpu)->scir.enabled = 1;

		/* also ensure that boot cpu is enabled */
		cpu = 0;
	}
}

585
#ifdef CONFIG_HOTPLUG_CPU
586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640
/*
 * Stop the heartbeat on @cpu: if its timer was enabled, mark it disabled
 * and delete the timer.  The cpu's SCIR bits are set to 0xff in all cases.
 */
static void __cpuinit uv_heartbeat_disable(int cpu)
{
	struct uv_hub_info_s *hub = uv_cpu_hub_info(cpu);

	if (hub->scir.enabled) {
		hub->scir.enabled = 0;
		del_timer(&hub->scir.timer);
	}

	uv_set_cpu_scir_bits(cpu, 0xff);
}

/*
 * cpu hotplug notifier
 *
 * Starts the heartbeat when a cpu comes online and stops it when a cpu is
 * about to go down.  All other actions are ignored.  Always returns
 * NOTIFY_OK.
 */
static __cpuinit int uv_scir_cpu_notify(struct notifier_block *self,
				       unsigned long action, void *hcpu)
{
	long target = (long)hcpu;

	if (action == CPU_ONLINE)
		uv_heartbeat_enable(target);
	else if (action == CPU_DOWN_PREPARE)
		uv_heartbeat_disable(target);

	return NOTIFY_OK;
}

/* Hotplug build: hook uv_scir_cpu_notify() into cpu hotplug notifications. */
static __init void uv_scir_register_cpu_notifier(void)
{
	hotcpu_notifier(uv_scir_cpu_notify, 0);
}

#else /* !CONFIG_HOTPLUG_CPU */

/*
 * Non-hotplug build: there is no notifier to register.  Heartbeats are
 * started by the uv_init_heartbeat() late initcall instead.
 */
static __init void uv_scir_register_cpu_notifier(void)
{
}

/*
 * Late initcall (non-hotplug build only): on a UV system, start the
 * heartbeat on every online cpu.  Always returns 0.
 */
static __init int uv_init_heartbeat(void)
{
	int cpu;

	if (!is_uv_system())
		return 0;

	for_each_online_cpu(cpu)
		uv_heartbeat_enable(cpu);

	return 0;
}

late_initcall(uv_init_heartbeat);

#endif /* !CONFIG_HOTPLUG_CPU */

641 642
/*
 * Direct Legacy VGA I/O traffic to designated IOH
 *
 * Returns 0 without calling the BIOS unless @flags contains
 * PCI_VGA_STATE_CHANGE_BRIDGE and @command_bits contains PCI_COMMAND_IO.
 * Otherwise asks the BIOS to set the legacy VGA target to the domain/bus of
 * @pdev and returns the BIOS call's result.
 */
int uv_set_vga_state(struct pci_dev *pdev, bool decode,
		      unsigned int command_bits, u32 flags)
{
	int domain, bus, rc;

	PR_DEVEL("devfn %x decode %d cmd %x flags %d\n",
			pdev->devfn, decode, command_bits, flags);

	if (!(flags & PCI_VGA_STATE_CHANGE_BRIDGE))
		return 0;

	if ((command_bits & PCI_COMMAND_IO) == 0)
		return 0;

	domain = pci_domain_nr(pdev->bus);
	bus = pdev->bus->number;

	rc = uv_bios_set_legacy_vga_target(decode, domain, bus);
	PR_DEVEL("vga decode %d %x:%x, rc: %d\n", decode, domain, bus, rc);

	return rc;
}

665 666
/*
 * Called on each cpu to initialize the per_cpu UV data area.
 * FIXME: hotplug not supported yet
 *
 * Does nothing until uv_blade_info has been allocated.  Afterwards it
 * counts the calling cpu as online on its blade and, on
 * UV_NON_UNIQUE_APIC systems, sets the cpu's x2apic_extra_bits from its
 * pnode.
 */
void __cpuinit uv_cpu_init(void)
{
	/* CPU 0 initialization will be done via uv_system_init. */
	if (!uv_blade_info)
		return;

	uv_blade_info[uv_numa_blade_id()].nr_online_cpus++;

	if (get_uv_system_type() == UV_NON_UNIQUE_APIC)
		set_x2apic_extra_bits(uv_hub_info->pnode);
}

681 682 683
/*
 * When NMI is received, print a stack trace.
 */
684
int uv_handle_nmi(unsigned int reason, struct pt_regs *regs)
685
{
686 687 688
	unsigned long real_uv_nmi;
	int bid;

689
	/*
690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708
	 * Each blade has an MMR that indicates when an NMI has been sent
	 * to cpus on the blade. If an NMI is detected, atomically
	 * clear the MMR and update a per-blade NMI count used to
	 * cause each cpu on the blade to notice a new NMI.
	 */
	bid = uv_numa_blade_id();
	real_uv_nmi = (uv_read_local_mmr(UVH_NMI_MMR) & UV_NMI_PENDING_MASK);

	if (unlikely(real_uv_nmi)) {
		spin_lock(&uv_blade_info[bid].nmi_lock);
		real_uv_nmi = (uv_read_local_mmr(UVH_NMI_MMR) & UV_NMI_PENDING_MASK);
		if (real_uv_nmi) {
			uv_blade_info[bid].nmi_count++;
			uv_write_local_mmr(UVH_NMI_MMR_CLEAR, UV_NMI_PENDING_MASK);
		}
		spin_unlock(&uv_blade_info[bid].nmi_lock);
	}

	if (likely(__get_cpu_var(cpu_last_nmi_count) == uv_blade_info[bid].nmi_count))
709
		return NMI_DONE;
710 711 712 713 714 715

	__get_cpu_var(cpu_last_nmi_count) = uv_blade_info[bid].nmi_count;

	/*
	 * Use a lock so only one cpu prints at a time.
	 * This prevents intermixed output.
716 717
	 */
	spin_lock(&uv_nmi_lock);
718
	pr_info("UV NMI stack dump cpu %u:\n", smp_processor_id());
719 720 721
	dump_stack();
	spin_unlock(&uv_nmi_lock);

722
	return NMI_HANDLED;
723 724 725 726
}

void uv_register_nmi_notifier(void)
{
727
	if (register_nmi_handler(NMI_UNKNOWN, uv_handle_nmi, 0, "uv"))
728 729 730 731 732 733 734 735 736 737 738 739 740 741
		printk(KERN_WARNING "UV NMI handler failed to register\n");
}

/*
 * Installed as x86_platform.nmi_init: program the calling cpu's LVT1 entry
 * for NMI delivery and clear its mask bit.
 */
void uv_nmi_init(void)
{
	unsigned int lvt1 = apic_read(APIC_LVT1);

	/*
	 * Unmask NMI on all cpus
	 */
	lvt1 |= APIC_DM_NMI;
	lvt1 &= ~APIC_LVT_MASKED;
	apic_write(APIC_LVT1, lvt1);
}
742 743

/*
 * One-time UV platform setup, run on the boot cpu.
 *
 * In order:
 *  - maps the low MMR ranges and reads the hub configuration (M/N values,
 *    MMIOH N_IO, global MMR base, node id);
 *  - counts the blades in the node-present table and allocates
 *    uv_blade_info, uv_node_to_blade and uv_cpu_to_blade (allocation
 *    failure is fatal via BUG_ON);
 *  - fills in one uv_blade_info entry per present node;
 *  - initializes the UV BIOS interface and the RTC frequency;
 *  - fills in the per-cpu hub info for every present cpu and the
 *    node/cpu -> blade tables, then covers online nodes without cpus;
 *  - maps the GRU, MMR and MMIOH high ranges;
 *  - registers the heartbeat notifier, NMI handler, /proc/sgi_uv and the
 *    legacy VGA redirection hook, and selects ACPI reboot for kdump kernels.
 */
void __init uv_system_init(void)
{
	union uvh_rh_gam_config_mmr_u  m_n_config;
	union uvh_rh_gam_mmioh_overlay_config_mmr_u mmioh;
	union uvh_node_id_u node_id;
	unsigned long gnode_upper, lowmem_redir_base, lowmem_redir_size;
	int bytes, nid, cpu, lcpu, pnode, blade, i, j, m_val, n_val, n_io;
	int gnode_extra, max_pnode = 0;
	unsigned long mmr_base, present, paddr;
	unsigned short pnode_mask, pnode_io_mask;

	printk(KERN_INFO "UV: Found %s hub\n", is_uv1_hub() ? "UV1" : "UV2");
	map_low_mmrs();

	m_n_config.v = uv_read_local_mmr(UVH_RH_GAM_CONFIG_MMR);
	m_val = m_n_config.s.m_skt;
	n_val = m_n_config.s.n_skt;
	mmioh.v = uv_read_local_mmr(UVH_RH_GAM_MMIOH_OVERLAY_CONFIG_MMR);
	n_io = is_uv1_hub() ? mmioh.s1.n_io : mmioh.s2.n_io;
	mmr_base =
	    uv_read_local_mmr(UVH_RH_GAM_MMR_OVERLAY_CONFIG_MMR) &
	    ~UV_MMR_ENABLE;
	pnode_mask = (1 << n_val) - 1;
	pnode_io_mask = (1 << n_io) - 1;

	node_id.v = uv_read_local_mmr(UVH_NODE_ID);
	gnode_extra = (node_id.s.node_id & ~((1 << n_val) - 1)) >> 1;
	gnode_upper = ((unsigned long)gnode_extra << m_val);
	printk(KERN_INFO "UV: N %d, M %d, N_IO: %d, gnode_upper 0x%lx, gnode_extra 0x%x, pnode_mask 0x%x, pnode_io_mask 0x%x\n",
			n_val, m_val, n_io, gnode_upper, gnode_extra, pnode_mask, pnode_io_mask);

	printk(KERN_DEBUG "UV: global MMR base 0x%lx\n", mmr_base);

	/* Each set bit in the node-present table is one possible blade. */
	for (i = 0; i < UVH_NODE_PRESENT_TABLE_DEPTH; i++)
		uv_possible_blades +=
		  hweight64(uv_read_local_mmr(UVH_NODE_PRESENT_TABLE + i * 8));

	/* uv_num_possible_blades() is really the hub count */
	printk(KERN_INFO "UV: Found %d blades, %d hubs\n",
			is_uv1_hub() ? uv_num_possible_blades() :
			(uv_num_possible_blades() + 1) / 2,
			uv_num_possible_blades());

	bytes = sizeof(struct uv_blade_info) * uv_num_possible_blades();
	uv_blade_info = kzalloc(bytes, GFP_KERNEL);
	BUG_ON(!uv_blade_info);

	for (blade = 0; blade < uv_num_possible_blades(); blade++)
		uv_blade_info[blade].memory_nid = -1;

	get_lowmem_redirect(&lowmem_redir_base, &lowmem_redir_size);

	/* Both lookup tables start out as all 0xff bytes, i.e. -1 per entry. */
	bytes = sizeof(uv_node_to_blade[0]) * num_possible_nodes();
	uv_node_to_blade = kmalloc(bytes, GFP_KERNEL);
	BUG_ON(!uv_node_to_blade);
	memset(uv_node_to_blade, 255, bytes);

	bytes = sizeof(uv_cpu_to_blade[0]) * num_possible_cpus();
	uv_cpu_to_blade = kmalloc(bytes, GFP_KERNEL);
	BUG_ON(!uv_cpu_to_blade);
	memset(uv_cpu_to_blade, 255, bytes);

	/* Assign blade indexes in node-present-table order. */
	blade = 0;
	for (i = 0; i < UVH_NODE_PRESENT_TABLE_DEPTH; i++) {
		present = uv_read_local_mmr(UVH_NODE_PRESENT_TABLE + i * 8);
		for (j = 0; j < 64; j++) {
			if (!test_bit(j, &present))
				continue;
			pnode = (i * 64 + j) & pnode_mask;
			uv_blade_info[blade].pnode = pnode;
			uv_blade_info[blade].nr_possible_cpus = 0;
			uv_blade_info[blade].nr_online_cpus = 0;
			spin_lock_init(&uv_blade_info[blade].nmi_lock);
			max_pnode = max(pnode, max_pnode);
			blade++;
		}
	}

	uv_bios_init();
	uv_bios_get_sn_info(0, &uv_type, &sn_partition_id, &sn_coherency_id,
			    &sn_region_size, &system_serial_number);
	uv_rtc_init();

	for_each_present_cpu(cpu) {
		int apicid = per_cpu(x86_cpu_to_apicid, cpu);

		nid = cpu_to_node(cpu);
		/*
		 * apic_pnode_shift must be set before calling uv_apicid_to_pnode();
		 */
		uv_cpu_hub_info(cpu)->pnode_mask = pnode_mask;
		uv_cpu_hub_info(cpu)->apic_pnode_shift = uvh_apicid.s.pnode_shift;
		uv_cpu_hub_info(cpu)->hub_revision = uv_hub_info->hub_revision;

		uv_cpu_hub_info(cpu)->m_shift = 64 - m_val;
		uv_cpu_hub_info(cpu)->n_lshift = is_uv2_1_hub() ?
				(m_val == 40 ? 40 : 39) : m_val;

		pnode = uv_apicid_to_pnode(apicid);
		blade = boot_pnode_to_blade(pnode);
		lcpu = uv_blade_info[blade].nr_possible_cpus;
		uv_blade_info[blade].nr_possible_cpus++;

		/* Any node on the blade, else will contain -1. */
		uv_blade_info[blade].memory_nid = nid;

		uv_cpu_hub_info(cpu)->lowmem_remap_base = lowmem_redir_base;
		uv_cpu_hub_info(cpu)->lowmem_remap_top = lowmem_redir_size;
		uv_cpu_hub_info(cpu)->m_val = m_val;
		uv_cpu_hub_info(cpu)->n_val = n_val;
		uv_cpu_hub_info(cpu)->numa_blade_id = blade;
		uv_cpu_hub_info(cpu)->blade_processor_id = lcpu;
		uv_cpu_hub_info(cpu)->pnode = pnode;
		uv_cpu_hub_info(cpu)->gpa_mask = (1UL << (m_val + n_val)) - 1;
		uv_cpu_hub_info(cpu)->gnode_upper = gnode_upper;
		uv_cpu_hub_info(cpu)->gnode_extra = gnode_extra;
		uv_cpu_hub_info(cpu)->global_mmr_base = mmr_base;
		uv_cpu_hub_info(cpu)->coherency_domain_number = sn_coherency_id;
		uv_cpu_hub_info(cpu)->scir.offset = uv_scir_offset(apicid);
		uv_node_to_blade[nid] = blade;
		uv_cpu_to_blade[cpu] = blade;
	}

	/* Add blade/pnode info for nodes without cpus */
	for_each_online_node(nid) {
		if (uv_node_to_blade[nid] >= 0)
			continue;
		paddr = node_start_pfn(nid) << PAGE_SHIFT;
		pnode = uv_gpa_to_pnode(uv_soc_phys_ram_to_gpa(paddr));
		blade = boot_pnode_to_blade(pnode);
		uv_node_to_blade[nid] = blade;
	}

	map_gru_high(max_pnode);
	map_mmr_high(max_pnode);
	map_mmioh_high(max_pnode & pnode_io_mask);

	uv_cpu_init();
	uv_scir_register_cpu_notifier();
	uv_register_nmi_notifier();
	proc_mkdir("sgi_uv", NULL);

	/* register Legacy VGA I/O redirection handler */
	pci_register_set_vga_state(uv_set_vga_state);

	/*
	 * For a kdump kernel the reset must be BOOT_ACPI, not BOOT_EFI, as
	 * EFI is not enabled in the kdump kernel.
	 */
	if (is_kdump_kernel())
		reboot_type = BOOT_ACPI;
}
895 896

/* Hand the UV APIC description to apic_driver() (presumably registers it for probing — confirm against asm/apic.h). */
apic_driver(apic_x2apic_uv_x);