x2apic_uv_x.c 22.5 KB
Newer Older
J
Jack Steiner 已提交
1 2 3 4 5 6 7
/*
 * This file is subject to the terms and conditions of the GNU General Public
 * License.  See the file "COPYING" in the main directory of this archive
 * for more details.
 *
 * SGI UV APIC functions (note: not an Intel compatible APIC)
 *
8
 * Copyright (C) 2007-2010 Silicon Graphics, Inc. All rights reserved.
J
Jack Steiner 已提交
9 10
 */
#include <linux/cpumask.h>
11 12 13 14 15
#include <linux/hardirq.h>
#include <linux/proc_fs.h>
#include <linux/threads.h>
#include <linux/kernel.h>
#include <linux/module.h>
J
Jack Steiner 已提交
16 17 18
#include <linux/string.h>
#include <linux/ctype.h>
#include <linux/sched.h>
19
#include <linux/timer.h>
20
#include <linux/slab.h>
21 22
#include <linux/cpu.h>
#include <linux/init.h>
23
#include <linux/io.h>
24
#include <linux/pci.h>
25
#include <linux/kdebug.h>
26
#include <linux/delay.h>
C
Cliff Wickman 已提交
27
#include <linux/crash_dump.h>
28

J
Jack Steiner 已提交
29 30
#include <asm/uv/uv_mmrs.h>
#include <asm/uv/uv_hub.h>
31 32
#include <asm/current.h>
#include <asm/pgtable.h>
33
#include <asm/uv/bios.h>
34 35 36 37
#include <asm/uv/uv.h>
#include <asm/apic.h>
#include <asm/ipi.h>
#include <asm/smp.h>
38
#include <asm/x86_init.h>
C
Cliff Wickman 已提交
39
#include <asm/emergency-restart.h>
40 41 42 43 44 45 46
#include <asm/nmi.h>

/* BMC sets a bit this MMR non-zero before sending an NMI */
#define UVH_NMI_MMR				UVH_SCRATCH5
#define UVH_NMI_MMR_CLEAR			(UVH_NMI_MMR + 8)
#define UV_NMI_PENDING_MASK			(1UL << 63)
DEFINE_PER_CPU(unsigned long, cpu_last_nmi_count);
J
Jack Steiner 已提交
47

48 49
DEFINE_PER_CPU(int, x2apic_extra_bits);

50 51
#define PR_DEVEL(fmt, args...)	pr_devel("%s: " fmt, __func__, args)

52
static enum uv_system_type uv_system_type;
53
static u64 gru_start_paddr, gru_end_paddr;
54
static union uvh_apicid uvh_apicid;
55 56
int uv_min_hub_revision_id;
EXPORT_SYMBOL_GPL(uv_min_hub_revision_id);
57 58
unsigned int uv_apicid_hibits;
EXPORT_SYMBOL_GPL(uv_apicid_hibits);
59
static DEFINE_SPINLOCK(uv_nmi_lock);
60

61 62
static struct apic apic_x2apic_uv_x;

63 64 65 66 67 68 69 70 71 72
static unsigned long __init uv_early_read_mmr(unsigned long addr)
{
	unsigned long val, *mmr;

	mmr = early_ioremap(UV_LOCAL_MMR_BASE | addr, sizeof(*mmr));
	val = *mmr;
	early_iounmap(mmr, sizeof(*mmr));
	return val;
}

73
static inline bool is_GRU_range(u64 start, u64 end)
74
{
75
	return start >= gru_start_paddr && end <= gru_end_paddr;
76 77
}

78
static bool uv_is_untracked_pat_range(u64 start, u64 end)
79 80 81
{
	return is_ISA_range(start, end) || is_GRU_range(start, end);
}
82

83
static int __init early_get_pnodeid(void)
84 85
{
	union uvh_node_id_u node_id;
86 87
	union uvh_rh_gam_config_mmr_u  m_n_config;
	int pnode;
88 89

	/* Currently, all blades have same revision number */
90
	node_id.v = uv_early_read_mmr(UVH_NODE_ID);
91
	m_n_config.v = uv_early_read_mmr(UVH_RH_GAM_CONFIG_MMR);
92 93
	uv_min_hub_revision_id = node_id.s.revision;

94 95
	pnode = (node_id.s.node_id >> 1) & ((1 << m_n_config.s.n_skt) - 1);
	return pnode;
96 97
}

98
static void __init early_get_apic_pnode_shift(void)
99
{
100
	uvh_apicid.v = uv_early_read_mmr(UVH_APICID);
101 102 103 104 105 106 107
	if (!uvh_apicid.v)
		/*
		 * Old bios, use default value
		 */
		uvh_apicid.s.pnode_shift = UV_APIC_PNODE_SHIFT;
}

108 109 110 111 112 113 114 115 116
/*
 * Add an extra bit as dictated by bios to the destination apicid of
 * interrupts potentially passing through the UV HUB.  This prevents
 * a deadlock between interrupts and IO port operations.
 */
static void __init uv_set_apicid_hibit(void)
{
	union uvh_lb_target_physical_apic_id_mask_u apicid_mask;

117
	apicid_mask.v = uv_early_read_mmr(UVH_LB_TARGET_PHYSICAL_APIC_ID_MASK);
118 119 120
	uv_apicid_hibits = apicid_mask.s.bit_enables & UV_APICID_HIBIT_MASK;
}

121
static int __init uv_acpi_madt_oem_check(char *oem_id, char *oem_table_id)
122
{
123
	int pnodeid;
124

125
	if (!strcmp(oem_id, "SGI")) {
126
		pnodeid = early_get_pnodeid();
127
		early_get_apic_pnode_shift();
128
		x86_platform.is_untracked_pat_range =  uv_is_untracked_pat_range;
129
		x86_platform.nmi_init = uv_nmi_init;
130 131 132 133 134
		if (!strcmp(oem_table_id, "UVL"))
			uv_system_type = UV_LEGACY_APIC;
		else if (!strcmp(oem_table_id, "UVX"))
			uv_system_type = UV_X2APIC;
		else if (!strcmp(oem_table_id, "UVH")) {
T
Tejun Heo 已提交
135
			__this_cpu_write(x2apic_extra_bits,
136
				pnodeid << uvh_apicid.s.pnode_shift);
137
			uv_system_type = UV_NON_UNIQUE_APIC;
138
			uv_set_apicid_hibit();
139 140 141 142 143 144 145 146 147 148 149 150 151 152 153
			return 1;
		}
	}
	return 0;
}

enum uv_system_type get_uv_system_type(void)
{
	return uv_system_type;
}

int is_uv_system(void)
{
	return uv_system_type != UV_NONE;
}
154
EXPORT_SYMBOL_GPL(is_uv_system);
155

J
Jack Steiner 已提交
156 157 158 159 160 161 162 163 164 165 166 167 168 169 170
DEFINE_PER_CPU(struct uv_hub_info_s, __uv_hub_info);
EXPORT_PER_CPU_SYMBOL_GPL(__uv_hub_info);

struct uv_blade_info *uv_blade_info;
EXPORT_SYMBOL_GPL(uv_blade_info);

short *uv_node_to_blade;
EXPORT_SYMBOL_GPL(uv_node_to_blade);

short *uv_cpu_to_blade;
EXPORT_SYMBOL_GPL(uv_cpu_to_blade);

short uv_possible_blades;
EXPORT_SYMBOL_GPL(uv_possible_blades);

171 172 173
unsigned long sn_rtc_cycles_per_second;
EXPORT_SYMBOL(sn_rtc_cycles_per_second);

174
static const struct cpumask *uv_target_cpus(void)
J
Jack Steiner 已提交
175
{
176
	return cpu_online_mask;
J
Jack Steiner 已提交
177 178
}

179
static void uv_vector_allocation_domain(int cpu, struct cpumask *retmask)
J
Jack Steiner 已提交
180
{
181 182
	cpumask_clear(retmask);
	cpumask_set_cpu(cpu, retmask);
J
Jack Steiner 已提交
183 184
}

185
static int __cpuinit uv_wakeup_secondary(int phys_apicid, unsigned long start_rip)
J
Jack Steiner 已提交
186
{
187
#ifdef CONFIG_SMP
J
Jack Steiner 已提交
188
	unsigned long val;
189
	int pnode;
J
Jack Steiner 已提交
190

191
	pnode = uv_apicid_to_pnode(phys_apicid);
192
	phys_apicid |= uv_apicid_hibits;
J
Jack Steiner 已提交
193 194
	val = (1UL << UVH_IPI_INT_SEND_SHFT) |
	    (phys_apicid << UVH_IPI_INT_APIC_ID_SHFT) |
195
	    ((start_rip << UVH_IPI_INT_VECTOR_SHFT) >> 12) |
J
Jack Steiner 已提交
196
	    APIC_DM_INIT;
197
	uv_write_global_mmr64(pnode, UVH_IPI_INT, val);
J
Jack Steiner 已提交
198 199 200 201
	mdelay(10);

	val = (1UL << UVH_IPI_INT_SEND_SHFT) |
	    (phys_apicid << UVH_IPI_INT_APIC_ID_SHFT) |
202
	    ((start_rip << UVH_IPI_INT_VECTOR_SHFT) >> 12) |
J
Jack Steiner 已提交
203
	    APIC_DM_STARTUP;
204
	uv_write_global_mmr64(pnode, UVH_IPI_INT, val);
205 206

	atomic_set(&init_deasserted, 1);
207
#endif
J
Jack Steiner 已提交
208 209 210 211 212
	return 0;
}

static void uv_send_IPI_one(int cpu, int vector)
{
213
	unsigned long apicid;
214
	int pnode;
J
Jack Steiner 已提交
215

216
	apicid = per_cpu(x86_cpu_to_apicid, cpu);
217
	pnode = uv_apicid_to_pnode(apicid);
218
	uv_hub_send_ipi(pnode, apicid, vector);
J
Jack Steiner 已提交
219 220
}

221
static void uv_send_IPI_mask(const struct cpumask *mask, int vector)
J
Jack Steiner 已提交
222 223 224
{
	unsigned int cpu;

225
	for_each_cpu(cpu, mask)
226 227 228
		uv_send_IPI_one(cpu, vector);
}

229
static void uv_send_IPI_mask_allbutself(const struct cpumask *mask, int vector)
230 231
{
	unsigned int this_cpu = smp_processor_id();
232
	unsigned int cpu;
233

234
	for_each_cpu(cpu, mask) {
235
		if (cpu != this_cpu)
J
Jack Steiner 已提交
236
			uv_send_IPI_one(cpu, vector);
237
	}
J
Jack Steiner 已提交
238 239 240 241
}

static void uv_send_IPI_allbutself(int vector)
{
242
	unsigned int this_cpu = smp_processor_id();
243
	unsigned int cpu;
J
Jack Steiner 已提交
244

245
	for_each_online_cpu(cpu) {
246 247
		if (cpu != this_cpu)
			uv_send_IPI_one(cpu, vector);
248
	}
J
Jack Steiner 已提交
249 250 251 252
}

static void uv_send_IPI_all(int vector)
{
253
	uv_send_IPI_mask(cpu_online_mask, vector);
J
Jack Steiner 已提交
254 255 256 257 258 259 260
}

static int uv_apic_id_registered(void)
{
	return 1;
}

261
static void uv_init_apic_ldr(void)
262 263 264
{
}

265
static unsigned int uv_cpu_mask_to_apicid(const struct cpumask *cpumask)
J
Jack Steiner 已提交
266 267 268 269 270
{
	/*
	 * We're using fixed IRQ delivery, can only return one phys APIC ID.
	 * May as well be the first.
	 */
271 272
	int cpu = cpumask_first(cpumask);

273
	if ((unsigned)cpu < nr_cpu_ids)
274
		return per_cpu(x86_cpu_to_apicid, cpu) | uv_apicid_hibits;
J
Jack Steiner 已提交
275 276 277 278
	else
		return BAD_APICID;
}

279 280 281
static unsigned int
uv_cpu_mask_to_apicid_and(const struct cpumask *cpumask,
			  const struct cpumask *andmask)
M
Mike Travis 已提交
282 283 284 285 286 287 288
{
	int cpu;

	/*
	 * We're using fixed IRQ delivery, can only return one phys APIC ID.
	 * May as well be the first.
	 */
289
	for_each_cpu_and(cpu, cpumask, andmask) {
290 291
		if (cpumask_test_cpu(cpu, cpu_online_mask))
			break;
292
	}
293
	return per_cpu(x86_cpu_to_apicid, cpu) | uv_apicid_hibits;
M
Mike Travis 已提交
294 295
}

296
static unsigned int x2apic_get_apic_id(unsigned long x)
297 298 299 300
{
	unsigned int id;

	WARN_ON(preemptible() && num_online_cpus() > 1);
T
Tejun Heo 已提交
301
	id = x | __this_cpu_read(x2apic_extra_bits);
302 303 304 305

	return id;
}

306
static unsigned long set_apic_id(unsigned int id)
Y
Yinghai Lu 已提交
307 308 309 310 311 312 313 314 315 316 317
{
	unsigned long x;

	/* maskout x2apic_extra_bits ? */
	x = id;
	return x;
}

static unsigned int uv_read_apic_id(void)
{

318
	return x2apic_get_apic_id(apic_read(APIC_ID));
Y
Yinghai Lu 已提交
319 320
}

I
Ingo Molnar 已提交
321
static int uv_phys_pkg_id(int initial_apicid, int index_msb)
J
Jack Steiner 已提交
322
{
323
	return uv_read_apic_id() >> index_msb;
J
Jack Steiner 已提交
324 325 326 327 328 329 330
}

static void uv_send_IPI_self(int vector)
{
	apic_write(APIC_SELF_IPI, vector);
}

331 332 333 334 335
static int uv_probe(void)
{
	return apic == &apic_x2apic_uv_x;
}

336
static struct apic __refdata apic_x2apic_uv_x = {
I
Ingo Molnar 已提交
337 338

	.name				= "UV large system",
339
	.probe				= uv_probe,
I
Ingo Molnar 已提交
340 341 342
	.acpi_madt_oem_check		= uv_acpi_madt_oem_check,
	.apic_id_registered		= uv_apic_id_registered,

343
	.irq_delivery_mode		= dest_Fixed,
J
Jack Steiner 已提交
344
	.irq_dest_mode			= 0, /* physical */
I
Ingo Molnar 已提交
345 346

	.target_cpus			= uv_target_cpus,
347
	.disable_esr			= 0,
348
	.dest_logical			= APIC_DEST_LOGICAL,
I
Ingo Molnar 已提交
349 350 351 352 353 354 355 356 357
	.check_apicid_used		= NULL,
	.check_apicid_present		= NULL,

	.vector_allocation_domain	= uv_vector_allocation_domain,
	.init_apic_ldr			= uv_init_apic_ldr,

	.ioapic_phys_id_map		= NULL,
	.setup_apic_routing		= NULL,
	.multi_timer_check		= NULL,
358
	.cpu_present_to_apicid		= default_cpu_present_to_apicid,
I
Ingo Molnar 已提交
359 360
	.apicid_to_cpu_present		= NULL,
	.setup_portio_remap		= NULL,
361
	.check_phys_apicid_present	= default_check_phys_apicid_present,
I
Ingo Molnar 已提交
362
	.enable_apic_mode		= NULL,
I
Ingo Molnar 已提交
363
	.phys_pkg_id			= uv_phys_pkg_id,
I
Ingo Molnar 已提交
364 365
	.mps_oem_check			= NULL,

366
	.get_apic_id			= x2apic_get_apic_id,
I
Ingo Molnar 已提交
367 368 369 370 371 372 373 374 375 376 377 378
	.set_apic_id			= set_apic_id,
	.apic_id_mask			= 0xFFFFFFFFu,

	.cpu_mask_to_apicid		= uv_cpu_mask_to_apicid,
	.cpu_mask_to_apicid_and		= uv_cpu_mask_to_apicid_and,

	.send_IPI_mask			= uv_send_IPI_mask,
	.send_IPI_mask_allbutself	= uv_send_IPI_mask_allbutself,
	.send_IPI_allbutself		= uv_send_IPI_allbutself,
	.send_IPI_all			= uv_send_IPI_all,
	.send_IPI_self			= uv_send_IPI_self,

379
	.wakeup_secondary_cpu		= uv_wakeup_secondary,
380 381
	.trampoline_phys_low		= DEFAULT_TRAMPOLINE_PHYS_LOW,
	.trampoline_phys_high		= DEFAULT_TRAMPOLINE_PHYS_HIGH,
I
Ingo Molnar 已提交
382 383 384
	.wait_for_init_deassert		= NULL,
	.smp_callin_clear_local_apic	= NULL,
	.inquire_remote_apic		= NULL,
Y
Yinghai Lu 已提交
385 386 387 388 389 390 391

	.read				= native_apic_msr_read,
	.write				= native_apic_msr_write,
	.icr_read			= native_x2apic_icr_read,
	.icr_write			= native_x2apic_icr_write,
	.wait_icr_idle			= native_x2apic_wait_icr_idle,
	.safe_wait_icr_idle		= native_safe_x2apic_wait_icr_idle,
J
Jack Steiner 已提交
392 393
};

394
static __cpuinit void set_x2apic_extra_bits(int pnode)
J
Jack Steiner 已提交
395
{
396
	__this_cpu_write(x2apic_extra_bits, pnode << uvh_apicid.s.pnode_shift);
J
Jack Steiner 已提交
397 398 399 400 401
}

/*
 * Called on boot cpu.
 */
402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419
static __init int boot_pnode_to_blade(int pnode)
{
	int blade;

	for (blade = 0; blade < uv_num_possible_blades(); blade++)
		if (pnode == uv_blade_info[blade].pnode)
			return blade;
	BUG();
}

struct redir_addr {
	unsigned long redirect;
	unsigned long alias;
};

#define DEST_SHIFT UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_0_MMR_DEST_BASE_SHFT

static __initdata struct redir_addr redir_addrs[] = {
420 421 422
	{UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_0_MMR, UVH_RH_GAM_ALIAS210_OVERLAY_CONFIG_0_MMR},
	{UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_1_MMR, UVH_RH_GAM_ALIAS210_OVERLAY_CONFIG_1_MMR},
	{UVH_RH_GAM_ALIAS210_REDIRECT_CONFIG_2_MMR, UVH_RH_GAM_ALIAS210_OVERLAY_CONFIG_2_MMR},
423 424 425 426
};

static __init void get_lowmem_redirect(unsigned long *base, unsigned long *size)
{
427
	union uvh_rh_gam_alias210_overlay_config_2_mmr_u alias;
428 429 430 431 432
	union uvh_rh_gam_alias210_redirect_config_2_mmr_u redirect;
	int i;

	for (i = 0; i < ARRAY_SIZE(redir_addrs); i++) {
		alias.v = uv_read_local_mmr(redir_addrs[i].alias);
433
		if (alias.s.enable && alias.s.base == 0) {
434 435 436 437 438 439
			*size = (1UL << alias.s.m_alias);
			redirect.v = uv_read_local_mmr(redir_addrs[i].redirect);
			*base = (unsigned long)redirect.s.dest_base << DEST_SHIFT;
			return;
		}
	}
440
	*base = *size = 0;
441 442
}

443 444
enum map_type {map_wb, map_uc};

445 446
static __init void map_high(char *id, unsigned long base, int pshift,
			int bshift, int max_pnode, enum map_type map_type)
447 448 449
{
	unsigned long bytes, paddr;

450 451
	paddr = base << pshift;
	bytes = (1UL << bshift) * (max_pnode + 1);
452
	printk(KERN_INFO "UV: Map %s_HI 0x%lx - 0x%lx\n", id, paddr,
453
						paddr + bytes);
454 455 456 457 458 459 460 461 462 463 464 465
	if (map_type == map_uc)
		init_extra_mapping_uc(paddr, bytes);
	else
		init_extra_mapping_wb(paddr, bytes);

}
static __init void map_gru_high(int max_pnode)
{
	union uvh_rh_gam_gru_overlay_config_mmr_u gru;
	int shift = UVH_RH_GAM_GRU_OVERLAY_CONFIG_MMR_BASE_SHFT;

	gru.v = uv_read_local_mmr(UVH_RH_GAM_GRU_OVERLAY_CONFIG_MMR);
466
	if (gru.s.enable) {
467
		map_high("GRU", gru.s.base, shift, shift, max_pnode, map_wb);
468 469 470 471
		gru_start_paddr = ((u64)gru.s.base << shift);
		gru_end_paddr = gru_start_paddr + (1UL << shift) * (max_pnode + 1);

	}
472 473
}

474 475 476 477 478 479 480
static __init void map_mmr_high(int max_pnode)
{
	union uvh_rh_gam_mmr_overlay_config_mmr_u mmr;
	int shift = UVH_RH_GAM_MMR_OVERLAY_CONFIG_MMR_BASE_SHFT;

	mmr.v = uv_read_local_mmr(UVH_RH_GAM_MMR_OVERLAY_CONFIG_MMR);
	if (mmr.s.enable)
481
		map_high("MMR", mmr.s.base, shift, shift, max_pnode, map_uc);
482 483
}

484 485 486 487 488 489 490
static __init void map_mmioh_high(int max_pnode)
{
	union uvh_rh_gam_mmioh_overlay_config_mmr_u mmioh;
	int shift = UVH_RH_GAM_MMIOH_OVERLAY_CONFIG_MMR_BASE_SHFT;

	mmioh.v = uv_read_local_mmr(UVH_RH_GAM_MMIOH_OVERLAY_CONFIG_MMR);
	if (mmioh.s.enable)
491 492
		map_high("MMIOH", mmioh.s.base, shift, mmioh.s.m_io,
			max_pnode, map_uc);
493 494
}

J
Jack Steiner 已提交
495 496 497 498 499 500
static __init void map_low_mmrs(void)
{
	init_extra_mapping_uc(UV_GLOBAL_MMR32_BASE, UV_GLOBAL_MMR32_SIZE);
	init_extra_mapping_uc(UV_LOCAL_MMR_BASE, UV_LOCAL_MMR_SIZE);
}

501 502
static __init void uv_rtc_init(void)
{
R
Russ Anderson 已提交
503 504
	long status;
	u64 ticks_per_sec;
505

R
Russ Anderson 已提交
506 507 508
	status = uv_bios_freq_base(BIOS_FREQ_BASE_REALTIME_CLOCK,
					&ticks_per_sec);
	if (status != BIOS_STATUS_SUCCESS || ticks_per_sec < 100000) {
509 510 511 512 513 514 515 516 517
		printk(KERN_WARNING
			"unable to determine platform RTC clock frequency, "
			"guessing.\n");
		/* BIOS gives wrong value for clock freq. so guess */
		sn_rtc_cycles_per_second = 1000000000000UL / 30000UL;
	} else
		sn_rtc_cycles_per_second = ticks_per_sec;
}

518 519 520 521 522 523 524 525 526 527 528
/*
 * percpu heartbeat timer
 */
static void uv_heartbeat(unsigned long ignored)
{
	struct timer_list *timer = &uv_hub_info->scir.timer;
	unsigned char bits = uv_hub_info->scir.state;

	/* flip heartbeat bit */
	bits ^= SCIR_CPU_HEARTBEAT;

529 530
	/* is this cpu idle? */
	if (idle_cpu(raw_smp_processor_id()))
531 532 533 534 535 536 537 538
		bits &= ~SCIR_CPU_ACTIVITY;
	else
		bits |= SCIR_CPU_ACTIVITY;

	/* update system controller interface reg */
	uv_set_scir_bits(bits);

	/* enable next timer period */
539
	mod_timer_pinned(timer, jiffies + SCIR_CPU_HB_INTERVAL);
540 541 542 543
}

static void __cpuinit uv_heartbeat_enable(int cpu)
{
544
	while (!uv_cpu_hub_info(cpu)->scir.enabled) {
545 546 547 548 549 550 551 552
		struct timer_list *timer = &uv_cpu_hub_info(cpu)->scir.timer;

		uv_set_cpu_scir_bits(cpu, SCIR_CPU_HEARTBEAT|SCIR_CPU_ACTIVITY);
		setup_timer(timer, uv_heartbeat, cpu);
		timer->expires = jiffies + SCIR_CPU_HB_INTERVAL;
		add_timer_on(timer, cpu);
		uv_cpu_hub_info(cpu)->scir.enabled = 1;

553 554 555
		/* also ensure that boot cpu is enabled */
		cpu = 0;
	}
556 557
}

558
#ifdef CONFIG_HOTPLUG_CPU
559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613
static void __cpuinit uv_heartbeat_disable(int cpu)
{
	if (uv_cpu_hub_info(cpu)->scir.enabled) {
		uv_cpu_hub_info(cpu)->scir.enabled = 0;
		del_timer(&uv_cpu_hub_info(cpu)->scir.timer);
	}
	uv_set_cpu_scir_bits(cpu, 0xff);
}

/*
 * cpu hotplug notifier
 */
static __cpuinit int uv_scir_cpu_notify(struct notifier_block *self,
				       unsigned long action, void *hcpu)
{
	long cpu = (long)hcpu;

	switch (action) {
	case CPU_ONLINE:
		uv_heartbeat_enable(cpu);
		break;
	case CPU_DOWN_PREPARE:
		uv_heartbeat_disable(cpu);
		break;
	default:
		break;
	}
	return NOTIFY_OK;
}

static __init void uv_scir_register_cpu_notifier(void)
{
	hotcpu_notifier(uv_scir_cpu_notify, 0);
}

#else /* !CONFIG_HOTPLUG_CPU */

static __init void uv_scir_register_cpu_notifier(void)
{
}

static __init int uv_init_heartbeat(void)
{
	int cpu;

	if (is_uv_system())
		for_each_online_cpu(cpu)
			uv_heartbeat_enable(cpu);
	return 0;
}

late_initcall(uv_init_heartbeat);

#endif /* !CONFIG_HOTPLUG_CPU */

614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637
/* Direct Legacy VGA I/O traffic to designated IOH */
int uv_set_vga_state(struct pci_dev *pdev, bool decode,
		      unsigned int command_bits, bool change_bridge)
{
	int domain, bus, rc;

	PR_DEVEL("devfn %x decode %d cmd %x chg_brdg %d\n",
			pdev->devfn, decode, command_bits, change_bridge);

	if (!change_bridge)
		return 0;

	if ((command_bits & PCI_COMMAND_IO) == 0)
		return 0;

	domain = pci_domain_nr(pdev->bus);
	bus = pdev->bus->number;

	rc = uv_bios_set_legacy_vga_target(decode, domain, bus);
	PR_DEVEL("vga decode %d %x:%x, rc: %d\n", decode, domain, bus, rc);

	return rc;
}

638 639
/*
 * Called on each cpu to initialize the per_cpu UV data area.
640
 * FIXME: hotplug not supported yet
641 642 643 644 645 646 647 648 649 650 651 652 653
 */
void __cpuinit uv_cpu_init(void)
{
	/* CPU 0 initilization will be done via uv_system_init. */
	if (!uv_blade_info)
		return;

	uv_blade_info[uv_numa_blade_id()].nr_online_cpus++;

	if (get_uv_system_type() == UV_NON_UNIQUE_APIC)
		set_x2apic_extra_bits(uv_hub_info->pnode);
}

654 655 656 657 658
/*
 * When NMI is received, print a stack trace.
 */
int uv_handle_nmi(struct notifier_block *self, unsigned long reason, void *data)
{
659 660 661
	unsigned long real_uv_nmi;
	int bid;

662
	if (reason != DIE_NMIUNKNOWN)
663
		return NOTIFY_OK;
664 665 666 667

	if (in_crash_kexec)
		/* do nothing if entering the crash kernel */
		return NOTIFY_OK;
668

669
	/*
670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695
	 * Each blade has an MMR that indicates when an NMI has been sent
	 * to cpus on the blade. If an NMI is detected, atomically
	 * clear the MMR and update a per-blade NMI count used to
	 * cause each cpu on the blade to notice a new NMI.
	 */
	bid = uv_numa_blade_id();
	real_uv_nmi = (uv_read_local_mmr(UVH_NMI_MMR) & UV_NMI_PENDING_MASK);

	if (unlikely(real_uv_nmi)) {
		spin_lock(&uv_blade_info[bid].nmi_lock);
		real_uv_nmi = (uv_read_local_mmr(UVH_NMI_MMR) & UV_NMI_PENDING_MASK);
		if (real_uv_nmi) {
			uv_blade_info[bid].nmi_count++;
			uv_write_local_mmr(UVH_NMI_MMR_CLEAR, UV_NMI_PENDING_MASK);
		}
		spin_unlock(&uv_blade_info[bid].nmi_lock);
	}

	if (likely(__get_cpu_var(cpu_last_nmi_count) == uv_blade_info[bid].nmi_count))
		return NOTIFY_DONE;

	__get_cpu_var(cpu_last_nmi_count) = uv_blade_info[bid].nmi_count;

	/*
	 * Use a lock so only one cpu prints at a time.
	 * This prevents intermixed output.
696 697
	 */
	spin_lock(&uv_nmi_lock);
698
	pr_info("UV NMI stack dump cpu %u:\n", smp_processor_id());
699 700 701 702 703 704 705
	dump_stack();
	spin_unlock(&uv_nmi_lock);

	return NOTIFY_STOP;
}

static struct notifier_block uv_dump_stack_nmi_nb = {
706 707
	.notifier_call	= uv_handle_nmi,
	.priority = NMI_LOCAL_LOW_PRIOR - 1,
708 709 710 711 712 713 714 715 716 717 718 719 720 721 722 723 724 725 726
};

void uv_register_nmi_notifier(void)
{
	if (register_die_notifier(&uv_dump_stack_nmi_nb))
		printk(KERN_WARNING "UV NMI handler failed to register\n");
}

void uv_nmi_init(void)
{
	unsigned int value;

	/*
	 * Unmask NMI on all cpus
	 */
	value = apic_read(APIC_LVT1) | APIC_DM_NMI;
	value &= ~APIC_LVT_MASKED;
	apic_write(APIC_LVT1, value);
}
727 728

void __init uv_system_init(void)
J
Jack Steiner 已提交
729
{
730
	union uvh_rh_gam_config_mmr_u  m_n_config;
731
	union uvh_rh_gam_mmioh_overlay_config_mmr_u mmioh;
732 733
	union uvh_node_id_u node_id;
	unsigned long gnode_upper, lowmem_redir_base, lowmem_redir_size;
734
	int bytes, nid, cpu, lcpu, pnode, blade, i, j, m_val, n_val, n_io;
735
	int gnode_extra, max_pnode = 0;
736
	unsigned long mmr_base, present, paddr;
737
	unsigned short pnode_mask, pnode_io_mask;
J
Jack Steiner 已提交
738

J
Jack Steiner 已提交
739 740
	map_low_mmrs();

741
	m_n_config.v = uv_read_local_mmr(UVH_RH_GAM_CONFIG_MMR );
742 743
	m_val = m_n_config.s.m_skt;
	n_val = m_n_config.s.n_skt;
744 745
	mmioh.v = uv_read_local_mmr(UVH_RH_GAM_MMIOH_OVERLAY_CONFIG_MMR);
	n_io = mmioh.s.n_io;
J
Jack Steiner 已提交
746 747 748
	mmr_base =
	    uv_read_local_mmr(UVH_RH_GAM_MMR_OVERLAY_CONFIG_MMR) &
	    ~UV_MMR_ENABLE;
749
	pnode_mask = (1 << n_val) - 1;
750 751
	pnode_io_mask = (1 << n_io) - 1;

752 753 754
	node_id.v = uv_read_local_mmr(UVH_NODE_ID);
	gnode_extra = (node_id.s.node_id & ~((1 << n_val) - 1)) >> 1;
	gnode_upper = ((unsigned long)gnode_extra  << m_val);
755 756
	printk(KERN_INFO "UV: N %d, M %d, N_IO: %d, gnode_upper 0x%lx, gnode_extra 0x%x, pnode_mask 0x%x, pnode_io_mask 0x%x\n",
			n_val, m_val, n_io, gnode_upper, gnode_extra, pnode_mask, pnode_io_mask);
757

J
Jack Steiner 已提交
758 759
	printk(KERN_DEBUG "UV: global MMR base 0x%lx\n", mmr_base);

760 761 762
	for(i = 0; i < UVH_NODE_PRESENT_TABLE_DEPTH; i++)
		uv_possible_blades +=
		  hweight64(uv_read_local_mmr( UVH_NODE_PRESENT_TABLE + i * 8));
J
Jack Steiner 已提交
763 764 765
	printk(KERN_DEBUG "UV: Found %d blades\n", uv_num_possible_blades());

	bytes = sizeof(struct uv_blade_info) * uv_num_possible_blades();
766
	uv_blade_info = kzalloc(bytes, GFP_KERNEL);
767
	BUG_ON(!uv_blade_info);
768

769 770
	for (blade = 0; blade < uv_num_possible_blades(); blade++)
		uv_blade_info[blade].memory_nid = -1;
J
Jack Steiner 已提交
771

772 773
	get_lowmem_redirect(&lowmem_redir_base, &lowmem_redir_size);

J
Jack Steiner 已提交
774
	bytes = sizeof(uv_node_to_blade[0]) * num_possible_nodes();
775
	uv_node_to_blade = kmalloc(bytes, GFP_KERNEL);
776
	BUG_ON(!uv_node_to_blade);
J
Jack Steiner 已提交
777 778 779
	memset(uv_node_to_blade, 255, bytes);

	bytes = sizeof(uv_cpu_to_blade[0]) * num_possible_cpus();
780
	uv_cpu_to_blade = kmalloc(bytes, GFP_KERNEL);
781
	BUG_ON(!uv_cpu_to_blade);
J
Jack Steiner 已提交
782 783
	memset(uv_cpu_to_blade, 255, bytes);

784 785 786 787 788 789
	blade = 0;
	for (i = 0; i < UVH_NODE_PRESENT_TABLE_DEPTH; i++) {
		present = uv_read_local_mmr(UVH_NODE_PRESENT_TABLE + i * 8);
		for (j = 0; j < 64; j++) {
			if (!test_bit(j, &present))
				continue;
790
			pnode = (i * 64 + j) & pnode_mask;
791
			uv_blade_info[blade].pnode = pnode;
792
			uv_blade_info[blade].nr_possible_cpus = 0;
J
Jack Steiner 已提交
793
			uv_blade_info[blade].nr_online_cpus = 0;
794
			spin_lock_init(&uv_blade_info[blade].nmi_lock);
795
			max_pnode = max(pnode, max_pnode);
796
			blade++;
J
Jack Steiner 已提交
797
		}
798
	}
J
Jack Steiner 已提交
799

800
	uv_bios_init();
801 802
	uv_bios_get_sn_info(0, &uv_type, &sn_partition_id, &sn_coherency_id,
			    &sn_region_size, &system_serial_number);
803 804
	uv_rtc_init();

805
	for_each_present_cpu(cpu) {
806 807
		int apicid = per_cpu(x86_cpu_to_apicid, cpu);

808
		nid = cpu_to_node(cpu);
809 810 811
		/*
		 * apic_pnode_shift must be set before calling uv_apicid_to_pnode();
		 */
812
		uv_cpu_hub_info(cpu)->pnode_mask = pnode_mask;
813
		uv_cpu_hub_info(cpu)->apic_pnode_shift = uvh_apicid.s.pnode_shift;
814
		pnode = uv_apicid_to_pnode(apicid);
815 816 817 818
		blade = boot_pnode_to_blade(pnode);
		lcpu = uv_blade_info[blade].nr_possible_cpus;
		uv_blade_info[blade].nr_possible_cpus++;

819 820 821
		/* Any node on the blade, else will contain -1. */
		uv_blade_info[blade].memory_nid = nid;

822
		uv_cpu_hub_info(cpu)->lowmem_remap_base = lowmem_redir_base;
823
		uv_cpu_hub_info(cpu)->lowmem_remap_top = lowmem_redir_size;
824
		uv_cpu_hub_info(cpu)->m_val = m_val;
825
		uv_cpu_hub_info(cpu)->n_val = n_val;
J
Jack Steiner 已提交
826 827
		uv_cpu_hub_info(cpu)->numa_blade_id = blade;
		uv_cpu_hub_info(cpu)->blade_processor_id = lcpu;
828
		uv_cpu_hub_info(cpu)->pnode = pnode;
829
		uv_cpu_hub_info(cpu)->gpa_mask = (1UL << (m_val + n_val)) - 1;
830
		uv_cpu_hub_info(cpu)->gnode_upper = gnode_upper;
831
		uv_cpu_hub_info(cpu)->gnode_extra = gnode_extra;
J
Jack Steiner 已提交
832
		uv_cpu_hub_info(cpu)->global_mmr_base = mmr_base;
833
		uv_cpu_hub_info(cpu)->coherency_domain_number = sn_coherency_id;
834
		uv_cpu_hub_info(cpu)->scir.offset = uv_scir_offset(apicid);
J
Jack Steiner 已提交
835 836 837
		uv_node_to_blade[nid] = blade;
		uv_cpu_to_blade[cpu] = blade;
	}
838

839 840 841 842 843
	/* Add blade/pnode info for nodes without cpus */
	for_each_online_node(nid) {
		if (uv_node_to_blade[nid] >= 0)
			continue;
		paddr = node_start_pfn(nid) << PAGE_SHIFT;
844
		paddr = uv_soc_phys_ram_to_gpa(paddr);
845 846 847 848 849
		pnode = (paddr >> m_val) & pnode_mask;
		blade = boot_pnode_to_blade(pnode);
		uv_node_to_blade[nid] = blade;
	}

850
	map_gru_high(max_pnode);
851
	map_mmr_high(max_pnode);
852
	map_mmioh_high(max_pnode & pnode_io_mask);
J
Jack Steiner 已提交
853

854
	uv_cpu_init();
855
	uv_scir_register_cpu_notifier();
856
	uv_register_nmi_notifier();
857
	proc_mkdir("sgi_uv", NULL);
858 859 860

	/* register Legacy VGA I/O redirection handler */
	pci_register_set_vga_state(uv_set_vga_state);
C
Cliff Wickman 已提交
861 862 863 864 865 866 867

	/*
	 * For a kdump kernel the reset must be BOOT_ACPI, not BOOT_EFI, as
	 * EFI is not enabled in the kdump kernel.
	 */
	if (is_kdump_kernel())
		reboot_type = BOOT_ACPI;
J
Jack Steiner 已提交
868
}
869 870

apic_driver(apic_x2apic_uv_x);