mce_amd.c 16.1 KB
Newer Older
1
#include <linux/module.h>
2 3
#include <linux/slab.h>

B
Borislav Petkov 已提交
4
#include "mce_amd.h"
D
Doug Thompson 已提交
5

6 7
static struct amd_decoder_ops *fam_ops;

8
static u8 xec_mask	 = 0xf;
9 10
static u8 nb_err_cpumask = 0xf;

11
static bool report_gart_errors;
12
static void (*nb_bus_decoder)(int node_id, struct mce *m);
13 14 15 16 17 18 19

void amd_report_gart_errors(bool v)
{
	report_gart_errors = v;
}
EXPORT_SYMBOL_GPL(amd_report_gart_errors);

20
void amd_register_ecc_decoder(void (*f)(int, struct mce *))
21 22 23 24 25
{
	nb_bus_decoder = f;
}
EXPORT_SYMBOL_GPL(amd_register_ecc_decoder);

26
void amd_unregister_ecc_decoder(void (*f)(int, struct mce *))
27 28 29 30 31 32 33 34 35
{
	if (nb_bus_decoder) {
		WARN_ON(nb_bus_decoder != f);

		nb_bus_decoder = NULL;
	}
}
EXPORT_SYMBOL_GPL(amd_unregister_ecc_decoder);

D
Doug Thompson 已提交
36 37 38 39
/*
 * string representation for the different MCA reported error types, see F3x48
 * or MSR0000_0411.
 */
B
Borislav Petkov 已提交
40 41

/* transaction type */
42
const char * const tt_msgs[] = { "INSN", "DATA", "GEN", "RESV" };
43
EXPORT_SYMBOL_GPL(tt_msgs);
D
Doug Thompson 已提交
44

B
Borislav Petkov 已提交
45
/* cache level */
46
const char * const ll_msgs[] = { "RESV", "L1", "L2", "L3/GEN" };
47
EXPORT_SYMBOL_GPL(ll_msgs);
D
Doug Thompson 已提交
48

B
Borislav Petkov 已提交
49
/* memory transaction type */
50
const char * const rrrr_msgs[] = {
B
Borislav Petkov 已提交
51
       "GEN", "RD", "WR", "DRD", "DWR", "IRD", "PRF", "EV", "SNP"
D
Doug Thompson 已提交
52
};
53
EXPORT_SYMBOL_GPL(rrrr_msgs);
D
Doug Thompson 已提交
54

B
Borislav Petkov 已提交
55
/* participating processor */
56
const char * const pp_msgs[] = { "SRC", "RES", "OBS", "GEN" };
57
EXPORT_SYMBOL_GPL(pp_msgs);
D
Doug Thompson 已提交
58

B
Borislav Petkov 已提交
59
/* request timeout */
60
const char * const to_msgs[] = { "no timeout", "timed out" };
61
EXPORT_SYMBOL_GPL(to_msgs);
D
Doug Thompson 已提交
62

B
Borislav Petkov 已提交
63
/* memory or i/o */
64
const char * const ii_msgs[] = { "MEM", "RESV", "IO", "GEN" };
65
EXPORT_SYMBOL_GPL(ii_msgs);
D
Doug Thompson 已提交
66

67
static const char * const f15h_mc1_mce_desc[] = {
68 69 70 71 72 73 74 75 76 77 78 79
	"UC during a demand linefill from L2",
	"Parity error during data load from IC",
	"Parity error for IC valid bit",
	"Main tag parity error",
	"Parity error in prediction queue",
	"PFB data/address parity error",
	"Parity error in the branch status reg",
	"PFB promotion address error",
	"Tag error during probe/victimization",
	"Parity error for IC probe tag valid bit",
	"PFB non-cacheable bit parity error",
	"PFB valid bit parity error",			/* xec = 0xd */
80
	"Microcode Patch Buffer",			/* xec = 010 */
81 82 83 84 85 86
	"uop queue",
	"insn buffer",
	"predecode buffer",
	"fetch address FIFO"
};

87
static const char * const f15h_mc2_mce_desc[] = {
88 89 90 91 92 93 94 95
	"Fill ECC error on data fills",			/* xec = 0x4 */
	"Fill parity error on insn fills",
	"Prefetcher request FIFO parity error",
	"PRQ address parity error",
	"PRQ data parity error",
	"WCC Tag ECC error",
	"WCC Data ECC error",
	"WCB Data parity error",
96
	"VB Data ECC or parity error",
97 98 99 100 101 102 103
	"L2 Tag ECC error",				/* xec = 0x10 */
	"Hard L2 Tag ECC error",
	"Multiple hits on L2 tag",
	"XAB parity error",
	"PRB address parity error"
};

104
static const char * const mc4_mce_desc[] = {
105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125
	"DRAM ECC error detected on the NB",
	"CRC error detected on HT link",
	"Link-defined sync error packets detected on HT link",
	"HT Master abort",
	"HT Target abort",
	"Invalid GART PTE entry during GART table walk",
	"Unsupported atomic RMW received from an IO link",
	"Watchdog timeout due to lack of progress",
	"DRAM ECC error detected on the NB",
	"SVM DMA Exclusion Vector error",
	"HT data error detected on link",
	"Protocol error (link, L3, probe filter)",
	"NB internal arrays parity error",
	"DRAM addr/ctl signals parity error",
	"IO link transmission error",
	"L3 data cache ECC error",			/* xec = 0x1c */
	"L3 cache tag error",
	"L3 LRU parity bits error",
	"ECC Error in the Probe Filter directory"
};

126
static const char * const mc5_mce_desc[] = {
127 128 129 130 131 132 133 134 135 136 137 138
	"CPU Watchdog timer expire",
	"Wakeup array dest tag",
	"AG payload array",
	"EX payload array",
	"IDRF array",
	"Retire dispatch queue",
	"Mapper checkpoint array",
	"Physical register file EX0 port",
	"Physical register file EX1 port",
	"Physical register file AG0 port",
	"Physical register file AG1 port",
	"Flag register file",
139
	"DE error occurred"
140 141
};

142
static bool f12h_mc0_mce(u16 ec, u8 xec)
143
{
144
	bool ret = false;
145

146
	if (MEM_ERROR(ec)) {
147
		u8 ll = LL(ec);
148
		ret = true;
149

150 151 152
		if (ll == LL_L2)
			pr_cont("during L1 linefill from L2.\n");
		else if (ll == LL_L1)
153
			pr_cont("Data/Tag %s error.\n", R4_MSG(ec));
154 155 156 157 158
		else
			ret = false;
	}
	return ret;
}
159

160
static bool f10h_mc0_mce(u16 ec, u8 xec)
161
{
162
	if (R4(ec) == R4_GEN && LL(ec) == LL_L1) {
163 164 165
		pr_cont("during data scrub.\n");
		return true;
	}
166
	return f12h_mc0_mce(ec, xec);
167 168
}

169
static bool k8_mc0_mce(u16 ec, u8 xec)
170 171 172 173 174
{
	if (BUS_ERROR(ec)) {
		pr_cont("during system linefill.\n");
		return true;
	}
175

176
	return f10h_mc0_mce(ec, xec);
177 178
}

179
static bool f14h_mc0_mce(u16 ec, u8 xec)
180
{
181
	u8 r4	 = R4(ec);
182 183 184 185
	bool ret = true;

	if (MEM_ERROR(ec)) {

186
		if (TT(ec) != TT_DATA || LL(ec) != LL_L1)
187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205
			return false;

		switch (r4) {
		case R4_DRD:
		case R4_DWR:
			pr_cont("Data/Tag parity error due to %s.\n",
				(r4 == R4_DRD ? "load/hw prf" : "store"));
			break;
		case R4_EVICT:
			pr_cont("Copyback parity error on a tag miss.\n");
			break;
		case R4_SNOOP:
			pr_cont("Tag parity error during snoop.\n");
			break;
		default:
			ret = false;
		}
	} else if (BUS_ERROR(ec)) {

206
		if ((II(ec) != II_MEM && II(ec) != II_IO) || LL(ec) != LL_LG)
207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230
			return false;

		pr_cont("System read data error on a ");

		switch (r4) {
		case R4_RD:
			pr_cont("TLB reload.\n");
			break;
		case R4_DWR:
			pr_cont("store.\n");
			break;
		case R4_DRD:
			pr_cont("load.\n");
			break;
		default:
			ret = false;
		}
	} else {
		ret = false;
	}

	return ret;
}

231
static bool f15h_mc0_mce(u16 ec, u8 xec)
232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268
{
	bool ret = true;

	if (MEM_ERROR(ec)) {

		switch (xec) {
		case 0x0:
			pr_cont("Data Array access error.\n");
			break;

		case 0x1:
			pr_cont("UC error during a linefill from L2/NB.\n");
			break;

		case 0x2:
		case 0x11:
			pr_cont("STQ access error.\n");
			break;

		case 0x3:
			pr_cont("SCB access error.\n");
			break;

		case 0x10:
			pr_cont("Tag error.\n");
			break;

		case 0x12:
			pr_cont("LDQ access error.\n");
			break;

		default:
			ret = false;
		}
	} else if (BUS_ERROR(ec)) {

		if (!xec)
269
			pr_cont("System Read Data Error.\n");
270
		else
271
			pr_cont(" Internal error condition type %d.\n", xec);
272 273 274 275 276 277
	} else
		ret = false;

	return ret;
}

278
static void decode_mc0_mce(struct mce *m)
279
{
280 281
	u16 ec = EC(m->status);
	u8 xec = XEC(m->status, xec_mask);
282

283
	pr_emerg(HW_ERR "MC0 Error: ");
284 285 286

	/* TLB error signatures are the same across families */
	if (TLB_ERROR(ec)) {
287
		if (TT(ec) == TT_DATA) {
288
			pr_cont("%s TLB %s.\n", LL_MSG(ec),
289 290
				((xec == 2) ? "locked miss"
					    : (xec ? "multimatch" : "parity")));
291 292
			return;
		}
293
	} else if (fam_ops->mc0_mce(ec, xec))
294 295
		;
	else
296
		pr_emerg(HW_ERR "Corrupted MC0 MCE info?\n");
297 298
}

299
static bool k8_mc1_mce(u16 ec, u8 xec)
300
{
301
	u8 ll	 = LL(ec);
302
	bool ret = true;
303

304 305
	if (!MEM_ERROR(ec))
		return false;
306

307 308 309
	if (ll == 0x2)
		pr_cont("during a linefill from L2.\n");
	else if (ll == 0x1) {
310
		switch (R4(ec)) {
311 312 313
		case R4_IRD:
			pr_cont("Parity error during data load.\n");
			break;
314

315 316 317 318 319 320 321 322 323 324 325 326
		case R4_EVICT:
			pr_cont("Copyback Parity/Victim error.\n");
			break;

		case R4_SNOOP:
			pr_cont("Tag Snoop error.\n");
			break;

		default:
			ret = false;
			break;
		}
327
	} else
328
		ret = false;
329

330 331 332
	return ret;
}

333
static bool f14h_mc1_mce(u16 ec, u8 xec)
334
{
335
	u8 r4    = R4(ec);
336
	bool ret = true;
337

338
	if (MEM_ERROR(ec)) {
339
		if (TT(ec) != 0 || LL(ec) != 1)
340 341 342 343 344 345 346 347 348 349 350 351
			ret = false;

		if (r4 == R4_IRD)
			pr_cont("Data/tag array parity error for a tag hit.\n");
		else if (r4 == R4_SNOOP)
			pr_cont("Tag error during snoop/victimization.\n");
		else
			ret = false;
	}
	return ret;
}

352
static bool f15h_mc1_mce(u16 ec, u8 xec)
353 354 355 356 357 358 359 360
{
	bool ret = true;

	if (!MEM_ERROR(ec))
		return false;

	switch (xec) {
	case 0x0 ... 0xa:
361
		pr_cont("%s.\n", f15h_mc1_mce_desc[xec]);
362 363 364
		break;

	case 0xd:
365
		pr_cont("%s.\n", f15h_mc1_mce_desc[xec-2]);
366 367
		break;

368
	case 0x10:
369
		pr_cont("%s.\n", f15h_mc1_mce_desc[xec-4]);
370 371 372
		break;

	case 0x11 ... 0x14:
373
		pr_cont("Decoder %s parity error.\n", f15h_mc1_mce_desc[xec-4]);
374 375 376 377 378 379 380 381
		break;

	default:
		ret = false;
	}
	return ret;
}

382
static void decode_mc1_mce(struct mce *m)
383
{
384 385
	u16 ec = EC(m->status);
	u8 xec = XEC(m->status, xec_mask);
386

387
	pr_emerg(HW_ERR "MC1 Error: ");
388 389 390 391 392

	if (TLB_ERROR(ec))
		pr_cont("%s TLB %s.\n", LL_MSG(ec),
			(xec ? "multimatch" : "parity error"));
	else if (BUS_ERROR(ec)) {
393
		bool k8 = (boot_cpu_data.x86 == 0xf && (m->status & BIT_64(58)));
394 395

		pr_cont("during %s.\n", (k8 ? "system linefill" : "NB data read"));
396
	} else if (fam_ops->mc1_mce(ec, xec))
397 398
		;
	else
399
		pr_emerg(HW_ERR "Corrupted MC1 MCE info?\n");
400 401
}

402
static void decode_mc2_mce(struct mce *m)
403
{
404 405
	u16 ec = EC(m->status);
	u8 xec = XEC(m->status, xec_mask);
406

407
	pr_emerg(HW_ERR "MC2 Error");
408 409 410 411 412 413

	if (xec == 0x1)
		pr_cont(" in the write data buffers.\n");
	else if (xec == 0x3)
		pr_cont(" in the victim data buffers.\n");
	else if (xec == 0x2 && MEM_ERROR(ec))
414
		pr_cont(": %s error in the L2 cache tags.\n", R4_MSG(ec));
415 416 417 418 419 420
	else if (xec == 0x0) {
		if (TLB_ERROR(ec))
			pr_cont(": %s error in a Page Descriptor Cache or "
				"Guest TLB.\n", TT_MSG(ec));
		else if (BUS_ERROR(ec))
			pr_cont(": %s/ECC error in data read from NB: %s.\n",
421
				R4_MSG(ec), PP_MSG(ec));
422
		else if (MEM_ERROR(ec)) {
423
			u8 r4 = R4(ec);
424

425
			if (r4 >= 0x7)
426
				pr_cont(": %s error during data copyback.\n",
427 428
					R4_MSG(ec));
			else if (r4 <= 0x1)
429
				pr_cont(": %s parity/ECC error during data "
430
					"access from L2.\n", R4_MSG(ec));
431
			else
432
				goto wrong_mc2_mce;
433
		} else
434
			goto wrong_mc2_mce;
435
	} else
436
		goto wrong_mc2_mce;
437 438 439

	return;

440 441
 wrong_mc2_mce:
	pr_emerg(HW_ERR "Corrupted MC2 MCE info?\n");
442 443
}

444
static void decode_f15_mc2_mce(struct mce *m)
445
{
446 447
	u16 ec = EC(m->status);
	u8 xec = XEC(m->status, xec_mask);
448

449
	pr_emerg(HW_ERR "MC2 Error: ");
450 451 452 453 454 455 456

	if (TLB_ERROR(ec)) {
		if (xec == 0x0)
			pr_cont("Data parity TLB read error.\n");
		else if (xec == 0x1)
			pr_cont("Poison data provided for TLB fill.\n");
		else
457
			goto wrong_f15_mc2_mce;
458 459
	} else if (BUS_ERROR(ec)) {
		if (xec > 2)
460
			goto wrong_f15_mc2_mce;
461 462 463 464 465

		pr_cont("Error during attempted NB data read.\n");
	} else if (MEM_ERROR(ec)) {
		switch (xec) {
		case 0x4 ... 0xc:
466
			pr_cont("%s.\n", f15h_mc2_mce_desc[xec - 0x4]);
467 468 469
			break;

		case 0x10 ... 0x14:
470
			pr_cont("%s.\n", f15h_mc2_mce_desc[xec - 0x7]);
471 472 473
			break;

		default:
474
			goto wrong_f15_mc2_mce;
475 476 477 478 479
		}
	}

	return;

480 481
 wrong_f15_mc2_mce:
	pr_emerg(HW_ERR "Corrupted MC2 MCE info?\n");
482 483
}

484
static void decode_mc3_mce(struct mce *m)
485
{
486 487
	u16 ec = EC(m->status);
	u8 xec = XEC(m->status, xec_mask);
488

489
	if (boot_cpu_data.x86 >= 0x14) {
490
		pr_emerg("You shouldn't be seeing MC3 MCE on this cpu family,"
491 492 493
			 " please report on LKML.\n");
		return;
	}
494

495
	pr_emerg(HW_ERR "MC3 Error");
496 497

	if (xec == 0x0) {
498
		u8 r4 = R4(ec);
499

500
		if (!BUS_ERROR(ec) || (r4 != R4_DRD && r4 != R4_DWR))
501
			goto wrong_mc3_mce;
502

503
		pr_cont(" during %s.\n", R4_MSG(ec));
504
	} else
505
		goto wrong_mc3_mce;
506

507 508
	return;

509 510
 wrong_mc3_mce:
	pr_emerg(HW_ERR "Corrupted MC3 MCE info?\n");
511 512
}

513
static void decode_mc4_mce(struct mce *m)
514
{
515 516 517 518 519
	struct cpuinfo_x86 *c = &boot_cpu_data;
	int node_id = amd_get_nb_id(m->extcpu);
	u16 ec = EC(m->status);
	u8 xec = XEC(m->status, 0x1f);
	u8 offset = 0;
520

521
	pr_emerg(HW_ERR "MC4 Error (node %d): ", node_id);
522

523 524
	switch (xec) {
	case 0x0 ... 0xe:
525

526 527 528 529
		/* special handling for DRAM ECCs */
		if (xec == 0x0 || xec == 0x8) {
			/* no ECCs on F11h */
			if (c->x86 == 0x11)
530
				goto wrong_mc4_mce;
531

532
			pr_cont("%s.\n", mc4_mce_desc[xec]);
533

534 535 536 537
			if (nb_bus_decoder)
				nb_bus_decoder(node_id, m);
			return;
		}
538 539 540 541 542 543 544 545
		break;

	case 0xf:
		if (TLB_ERROR(ec))
			pr_cont("GART Table Walk data error.\n");
		else if (BUS_ERROR(ec))
			pr_cont("DMA Exclusion Vector Table Walk error.\n");
		else
546
			goto wrong_mc4_mce;
547
		return;
548

549 550 551 552
	case 0x19:
		if (boot_cpu_data.x86 == 0x15)
			pr_cont("Compute Unit Data Error.\n");
		else
553
			goto wrong_mc4_mce;
554
		return;
555

556
	case 0x1c ... 0x1f:
557
		offset = 13;
558 559 560
		break;

	default:
561
		goto wrong_mc4_mce;
562
	}
563

564
	pr_cont("%s.\n", mc4_mce_desc[xec - offset]);
565 566
	return;

567 568
 wrong_mc4_mce:
	pr_emerg(HW_ERR "Corrupted MC4 MCE info?\n");
569 570
}

571
static void decode_mc5_mce(struct mce *m)
B
Borislav Petkov 已提交
572
{
573
	struct cpuinfo_x86 *c = &boot_cpu_data;
574
	u8 xec = XEC(m->status, xec_mask);
575 576

	if (c->x86 == 0xf || c->x86 == 0x11)
577
		goto wrong_mc5_mce;
B
Borislav Petkov 已提交
578

579
	pr_emerg(HW_ERR "MC5 Error: ");
580 581

	if (xec == 0x0 || xec == 0xc)
582
		pr_cont("%s.\n", mc5_mce_desc[xec]);
583
	else if (xec < 0xd)
584
		pr_cont("%s parity error.\n", mc5_mce_desc[xec]);
585
	else
586
		goto wrong_mc5_mce;
587 588

	return;
B
Borislav Petkov 已提交
589

590 591
 wrong_mc5_mce:
	pr_emerg(HW_ERR "Corrupted MC5 MCE info?\n");
B
Borislav Petkov 已提交
592 593
}

594
static void decode_mc6_mce(struct mce *m)
595
{
596
	u8 xec = XEC(m->status, xec_mask);
597

598
	pr_emerg(HW_ERR "MC6 Error: ");
599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621

	switch (xec) {
	case 0x1:
		pr_cont("Free List");
		break;

	case 0x2:
		pr_cont("Physical Register File");
		break;

	case 0x3:
		pr_cont("Retire Queue");
		break;

	case 0x4:
		pr_cont("Scheduler table");
		break;

	case 0x5:
		pr_cont("Status Register File");
		break;

	default:
622
		goto wrong_mc6_mce;
623 624 625 626 627 628 629
		break;
	}

	pr_cont(" parity error.\n");

	return;

630 631
 wrong_mc6_mce:
	pr_emerg(HW_ERR "Corrupted MC6 MCE info?\n");
632 633
}

B
Borislav Petkov 已提交
634
static inline void amd_decode_err_code(u16 ec)
635
{
636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651

	pr_emerg(HW_ERR "cache level: %s", LL_MSG(ec));

	if (BUS_ERROR(ec))
		pr_cont(", mem/io: %s", II_MSG(ec));
	else
		pr_cont(", tx: %s", TT_MSG(ec));

	if (MEM_ERROR(ec) || BUS_ERROR(ec)) {
		pr_cont(", mem-tx: %s", R4_MSG(ec));

		if (BUS_ERROR(ec))
			pr_cont(", part-proc: %s (%s)", PP_MSG(ec), TO_MSG(ec));
	}

	pr_cont("\n");
652 653
}

654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669
/*
 * Filter out unwanted MCE signatures here.
 */
static bool amd_filter_mce(struct mce *m)
{
	u8 xec = (m->status >> 16) & 0x1f;

	/*
	 * NB GART TLB error reporting is disabled by default.
	 */
	if (m->bank == 4 && xec == 0x5 && !report_gart_errors)
		return true;

	return false;
}

B
Borislav Petkov 已提交
670
int amd_decode_mce(struct notifier_block *nb, unsigned long val, void *data)
671
{
672
	struct mce *m = (struct mce *)data;
673
	struct cpuinfo_x86 *c = &boot_cpu_data;
674
	int ecc;
675

676 677 678
	if (amd_filter_mce(m))
		return NOTIFY_STOP;

679
	pr_emerg(HW_ERR "CPU:%d\tMC%d_STATUS[%s|%s|%s|%s|%s",
680
		m->extcpu, m->bank,
681 682 683 684 685
		((m->status & MCI_STATUS_OVER)	? "Over"  : "-"),
		((m->status & MCI_STATUS_UC)	? "UE"	  : "CE"),
		((m->status & MCI_STATUS_MISCV)	? "MiscV" : "-"),
		((m->status & MCI_STATUS_PCC)	? "PCC"	  : "-"),
		((m->status & MCI_STATUS_ADDRV)	? "AddrV" : "-"));
686

687 688
	if (c->x86 == 0x15)
		pr_cont("|%s|%s",
689 690
			((m->status & BIT_64(44)) ? "Deferred" : "-"),
			((m->status & BIT_64(43)) ? "Poison"   : "-"));
691

692
	/* do the two bits[14:13] together */
693
	ecc = (m->status >> 45) & 0x3;
694
	if (ecc)
695 696 697
		pr_cont("|%sECC", ((ecc == 2) ? "C" : "U"));

	pr_cont("]: 0x%016llx\n", m->status);
698

699 700
	if (m->status & MCI_STATUS_ADDRV)
		pr_emerg(HW_ERR "\tMC%d_ADDR: 0x%016llx\n", m->bank, m->addr);
701

702 703
	switch (m->bank) {
	case 0:
704
		decode_mc0_mce(m);
705
		break;
706

707
	case 1:
708
		decode_mc1_mce(m);
709 710
		break;

711
	case 2:
712
		if (c->x86 == 0x15)
713
			decode_f15_mc2_mce(m);
714
		else
715
			decode_mc2_mce(m);
716 717
		break;

718
	case 3:
719
		decode_mc3_mce(m);
720 721
		break;

722
	case 4:
723
		decode_mc4_mce(m);
724 725
		break;

B
Borislav Petkov 已提交
726
	case 5:
727
		decode_mc5_mce(m);
B
Borislav Petkov 已提交
728 729
		break;

730
	case 6:
731
		decode_mc6_mce(m);
732 733
		break;

734 735
	default:
		break;
736
	}
737 738

	amd_decode_err_code(m->status & 0xffff);
739 740

	return NOTIFY_STOP;
741
}
B
Borislav Petkov 已提交
742
EXPORT_SYMBOL_GPL(amd_decode_mce);
743

744 745 746 747
static struct notifier_block amd_mce_dec_nb = {
	.notifier_call	= amd_decode_mce,
};

748 749
static int __init mce_amd_init(void)
{
750 751 752
	struct cpuinfo_x86 *c = &boot_cpu_data;

	if (c->x86_vendor != X86_VENDOR_AMD)
753 754
		return 0;

755
	if (c->x86 < 0xf || c->x86 > 0x15)
756 757
		return 0;

758 759 760 761
	fam_ops = kzalloc(sizeof(struct amd_decoder_ops), GFP_KERNEL);
	if (!fam_ops)
		return -ENOMEM;

762
	switch (c->x86) {
763
	case 0xf:
764 765
		fam_ops->mc0_mce = k8_mc0_mce;
		fam_ops->mc1_mce = k8_mc1_mce;
766 767 768
		break;

	case 0x10:
769 770
		fam_ops->mc0_mce = f10h_mc0_mce;
		fam_ops->mc1_mce = k8_mc1_mce;
771 772
		break;

773
	case 0x11:
774 775
		fam_ops->mc0_mce = k8_mc0_mce;
		fam_ops->mc1_mce = k8_mc1_mce;
776 777
		break;

778
	case 0x12:
779 780
		fam_ops->mc0_mce = f12h_mc0_mce;
		fam_ops->mc1_mce = k8_mc1_mce;
781 782
		break;

783
	case 0x14:
784
		nb_err_cpumask  = 0x3;
785 786
		fam_ops->mc0_mce = f14h_mc0_mce;
		fam_ops->mc1_mce = f14h_mc1_mce;
787 788
		break;

789 790
	case 0x15:
		xec_mask = 0x1f;
791 792
		fam_ops->mc0_mce = f15h_mc0_mce;
		fam_ops->mc1_mce = f15h_mc1_mce;
793 794
		break;

795
	default:
796
		printk(KERN_WARNING "Huh? What family is it: 0x%x?!\n", c->x86);
797 798 799 800
		kfree(fam_ops);
		return -EINVAL;
	}

801 802
	pr_info("MCE: In-kernel MCE decoding enabled.\n");

803
	mce_register_decode_chain(&amd_mce_dec_nb);
804 805 806 807

	return 0;
}
early_initcall(mce_amd_init);
808 809 810 811

#ifdef MODULE
static void __exit mce_amd_exit(void)
{
812
	mce_unregister_decode_chain(&amd_mce_dec_nb);
813
	kfree(fam_ops);
814 815 816 817 818 819 820
}

MODULE_DESCRIPTION("AMD MCE decoder");
MODULE_ALIAS("edac-mce-amd");
MODULE_LICENSE("GPL");
module_exit(mce_amd_exit);
#endif