mce_amd.c 16.6 KB
Newer Older
1
#include <linux/module.h>
2 3
#include <linux/slab.h>

B
Borislav Petkov 已提交
4
#include "mce_amd.h"
D
Doug Thompson 已提交
5

6 7
static struct amd_decoder_ops *fam_ops;

8
static u8 xec_mask	 = 0xf;
9 10
static u8 nb_err_cpumask = 0xf;

11
static bool report_gart_errors;
12
static void (*nb_bus_decoder)(int node_id, struct mce *m);
13 14 15 16 17 18 19

void amd_report_gart_errors(bool v)
{
	report_gart_errors = v;
}
EXPORT_SYMBOL_GPL(amd_report_gart_errors);

20
void amd_register_ecc_decoder(void (*f)(int, struct mce *))
21 22 23 24 25
{
	nb_bus_decoder = f;
}
EXPORT_SYMBOL_GPL(amd_register_ecc_decoder);

26
void amd_unregister_ecc_decoder(void (*f)(int, struct mce *))
27 28 29 30 31 32 33 34 35
{
	if (nb_bus_decoder) {
		WARN_ON(nb_bus_decoder != f);

		nb_bus_decoder = NULL;
	}
}
EXPORT_SYMBOL_GPL(amd_unregister_ecc_decoder);

D
Doug Thompson 已提交
36 37 38 39
/*
 * string representation for the different MCA reported error types, see F3x48
 * or MSR0000_0411.
 */
B
Borislav Petkov 已提交
40 41

/* transaction type */
42
const char * const tt_msgs[] = { "INSN", "DATA", "GEN", "RESV" };
43
EXPORT_SYMBOL_GPL(tt_msgs);
D
Doug Thompson 已提交
44

B
Borislav Petkov 已提交
45
/* cache level */
46
const char * const ll_msgs[] = { "RESV", "L1", "L2", "L3/GEN" };
47
EXPORT_SYMBOL_GPL(ll_msgs);
D
Doug Thompson 已提交
48

B
Borislav Petkov 已提交
49
/* memory transaction type */
50
const char * const rrrr_msgs[] = {
B
Borislav Petkov 已提交
51
       "GEN", "RD", "WR", "DRD", "DWR", "IRD", "PRF", "EV", "SNP"
D
Doug Thompson 已提交
52
};
53
EXPORT_SYMBOL_GPL(rrrr_msgs);
D
Doug Thompson 已提交
54

B
Borislav Petkov 已提交
55
/* participating processor */
56
const char * const pp_msgs[] = { "SRC", "RES", "OBS", "GEN" };
57
EXPORT_SYMBOL_GPL(pp_msgs);
D
Doug Thompson 已提交
58

B
Borislav Petkov 已提交
59
/* request timeout */
60
const char * const to_msgs[] = { "no timeout", "timed out" };
61
EXPORT_SYMBOL_GPL(to_msgs);
D
Doug Thompson 已提交
62

B
Borislav Petkov 已提交
63
/* memory or i/o */
64
const char * const ii_msgs[] = { "MEM", "RESV", "IO", "GEN" };
65
EXPORT_SYMBOL_GPL(ii_msgs);
D
Doug Thompson 已提交
66

67
static const char * const f15h_mc1_mce_desc[] = {
68 69 70 71 72 73 74 75 76 77 78 79
	"UC during a demand linefill from L2",
	"Parity error during data load from IC",
	"Parity error for IC valid bit",
	"Main tag parity error",
	"Parity error in prediction queue",
	"PFB data/address parity error",
	"Parity error in the branch status reg",
	"PFB promotion address error",
	"Tag error during probe/victimization",
	"Parity error for IC probe tag valid bit",
	"PFB non-cacheable bit parity error",
	"PFB valid bit parity error",			/* xec = 0xd */
80
	"Microcode Patch Buffer",			/* xec = 010 */
81 82 83 84 85 86
	"uop queue",
	"insn buffer",
	"predecode buffer",
	"fetch address FIFO"
};

87
static const char * const f15h_mc2_mce_desc[] = {
88 89 90 91 92 93 94 95
	"Fill ECC error on data fills",			/* xec = 0x4 */
	"Fill parity error on insn fills",
	"Prefetcher request FIFO parity error",
	"PRQ address parity error",
	"PRQ data parity error",
	"WCC Tag ECC error",
	"WCC Data ECC error",
	"WCB Data parity error",
96
	"VB Data ECC or parity error",
97 98 99 100 101 102 103
	"L2 Tag ECC error",				/* xec = 0x10 */
	"Hard L2 Tag ECC error",
	"Multiple hits on L2 tag",
	"XAB parity error",
	"PRB address parity error"
};

104
static const char * const mc4_mce_desc[] = {
105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125
	"DRAM ECC error detected on the NB",
	"CRC error detected on HT link",
	"Link-defined sync error packets detected on HT link",
	"HT Master abort",
	"HT Target abort",
	"Invalid GART PTE entry during GART table walk",
	"Unsupported atomic RMW received from an IO link",
	"Watchdog timeout due to lack of progress",
	"DRAM ECC error detected on the NB",
	"SVM DMA Exclusion Vector error",
	"HT data error detected on link",
	"Protocol error (link, L3, probe filter)",
	"NB internal arrays parity error",
	"DRAM addr/ctl signals parity error",
	"IO link transmission error",
	"L3 data cache ECC error",			/* xec = 0x1c */
	"L3 cache tag error",
	"L3 LRU parity bits error",
	"ECC Error in the Probe Filter directory"
};

126
static const char * const mc5_mce_desc[] = {
127 128 129 130 131 132 133 134 135 136 137 138
	"CPU Watchdog timer expire",
	"Wakeup array dest tag",
	"AG payload array",
	"EX payload array",
	"IDRF array",
	"Retire dispatch queue",
	"Mapper checkpoint array",
	"Physical register file EX0 port",
	"Physical register file EX1 port",
	"Physical register file AG0 port",
	"Physical register file AG1 port",
	"Flag register file",
139
	"DE error occurred"
140 141
};

142
static bool f12h_mc0_mce(u16 ec, u8 xec)
143
{
144
	bool ret = false;
145

146
	if (MEM_ERROR(ec)) {
147
		u8 ll = LL(ec);
148
		ret = true;
149

150 151 152
		if (ll == LL_L2)
			pr_cont("during L1 linefill from L2.\n");
		else if (ll == LL_L1)
153
			pr_cont("Data/Tag %s error.\n", R4_MSG(ec));
154 155 156 157 158
		else
			ret = false;
	}
	return ret;
}
159

160
static bool f10h_mc0_mce(u16 ec, u8 xec)
161
{
162
	if (R4(ec) == R4_GEN && LL(ec) == LL_L1) {
163 164 165
		pr_cont("during data scrub.\n");
		return true;
	}
166
	return f12h_mc0_mce(ec, xec);
167 168
}

169
static bool k8_mc0_mce(u16 ec, u8 xec)
170 171 172 173 174
{
	if (BUS_ERROR(ec)) {
		pr_cont("during system linefill.\n");
		return true;
	}
175

176
	return f10h_mc0_mce(ec, xec);
177 178
}

179
static bool f14h_mc0_mce(u16 ec, u8 xec)
180
{
181
	u8 r4	 = R4(ec);
182 183 184 185
	bool ret = true;

	if (MEM_ERROR(ec)) {

186
		if (TT(ec) != TT_DATA || LL(ec) != LL_L1)
187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205
			return false;

		switch (r4) {
		case R4_DRD:
		case R4_DWR:
			pr_cont("Data/Tag parity error due to %s.\n",
				(r4 == R4_DRD ? "load/hw prf" : "store"));
			break;
		case R4_EVICT:
			pr_cont("Copyback parity error on a tag miss.\n");
			break;
		case R4_SNOOP:
			pr_cont("Tag parity error during snoop.\n");
			break;
		default:
			ret = false;
		}
	} else if (BUS_ERROR(ec)) {

206
		if ((II(ec) != II_MEM && II(ec) != II_IO) || LL(ec) != LL_LG)
207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230
			return false;

		pr_cont("System read data error on a ");

		switch (r4) {
		case R4_RD:
			pr_cont("TLB reload.\n");
			break;
		case R4_DWR:
			pr_cont("store.\n");
			break;
		case R4_DRD:
			pr_cont("load.\n");
			break;
		default:
			ret = false;
		}
	} else {
		ret = false;
	}

	return ret;
}

231
static bool f15h_mc0_mce(u16 ec, u8 xec)
232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268
{
	bool ret = true;

	if (MEM_ERROR(ec)) {

		switch (xec) {
		case 0x0:
			pr_cont("Data Array access error.\n");
			break;

		case 0x1:
			pr_cont("UC error during a linefill from L2/NB.\n");
			break;

		case 0x2:
		case 0x11:
			pr_cont("STQ access error.\n");
			break;

		case 0x3:
			pr_cont("SCB access error.\n");
			break;

		case 0x10:
			pr_cont("Tag error.\n");
			break;

		case 0x12:
			pr_cont("LDQ access error.\n");
			break;

		default:
			ret = false;
		}
	} else if (BUS_ERROR(ec)) {

		if (!xec)
269
			pr_cont("System Read Data Error.\n");
270
		else
271
			pr_cont(" Internal error condition type %d.\n", xec);
272 273 274 275 276 277
	} else
		ret = false;

	return ret;
}

278
static void decode_mc0_mce(struct mce *m)
279
{
280 281
	u16 ec = EC(m->status);
	u8 xec = XEC(m->status, xec_mask);
282

283
	pr_emerg(HW_ERR "MC0 Error: ");
284 285 286

	/* TLB error signatures are the same across families */
	if (TLB_ERROR(ec)) {
287
		if (TT(ec) == TT_DATA) {
288
			pr_cont("%s TLB %s.\n", LL_MSG(ec),
289 290
				((xec == 2) ? "locked miss"
					    : (xec ? "multimatch" : "parity")));
291 292
			return;
		}
293
	} else if (fam_ops->mc0_mce(ec, xec))
294 295
		;
	else
296
		pr_emerg(HW_ERR "Corrupted MC0 MCE info?\n");
297 298
}

299
static bool k8_mc1_mce(u16 ec, u8 xec)
300
{
301
	u8 ll	 = LL(ec);
302
	bool ret = true;
303

304 305
	if (!MEM_ERROR(ec))
		return false;
306

307 308 309
	if (ll == 0x2)
		pr_cont("during a linefill from L2.\n");
	else if (ll == 0x1) {
310
		switch (R4(ec)) {
311 312 313
		case R4_IRD:
			pr_cont("Parity error during data load.\n");
			break;
314

315 316 317 318 319 320 321 322 323 324 325 326
		case R4_EVICT:
			pr_cont("Copyback Parity/Victim error.\n");
			break;

		case R4_SNOOP:
			pr_cont("Tag Snoop error.\n");
			break;

		default:
			ret = false;
			break;
		}
327
	} else
328
		ret = false;
329

330 331 332
	return ret;
}

333
static bool f14h_mc1_mce(u16 ec, u8 xec)
334
{
335
	u8 r4    = R4(ec);
336
	bool ret = true;
337

338
	if (MEM_ERROR(ec)) {
339
		if (TT(ec) != 0 || LL(ec) != 1)
340 341 342 343 344 345 346 347 348 349 350 351
			ret = false;

		if (r4 == R4_IRD)
			pr_cont("Data/tag array parity error for a tag hit.\n");
		else if (r4 == R4_SNOOP)
			pr_cont("Tag error during snoop/victimization.\n");
		else
			ret = false;
	}
	return ret;
}

352
static bool f15h_mc1_mce(u16 ec, u8 xec)
353 354 355 356 357 358 359 360
{
	bool ret = true;

	if (!MEM_ERROR(ec))
		return false;

	switch (xec) {
	case 0x0 ... 0xa:
361
		pr_cont("%s.\n", f15h_mc1_mce_desc[xec]);
362 363 364
		break;

	case 0xd:
365
		pr_cont("%s.\n", f15h_mc1_mce_desc[xec-2]);
366 367
		break;

368
	case 0x10:
369
		pr_cont("%s.\n", f15h_mc1_mce_desc[xec-4]);
370 371 372
		break;

	case 0x11 ... 0x14:
373
		pr_cont("Decoder %s parity error.\n", f15h_mc1_mce_desc[xec-4]);
374 375 376 377 378 379 380 381
		break;

	default:
		ret = false;
	}
	return ret;
}

382
static void decode_mc1_mce(struct mce *m)
383
{
384 385
	u16 ec = EC(m->status);
	u8 xec = XEC(m->status, xec_mask);
386

387
	pr_emerg(HW_ERR "MC1 Error: ");
388 389 390 391 392

	if (TLB_ERROR(ec))
		pr_cont("%s TLB %s.\n", LL_MSG(ec),
			(xec ? "multimatch" : "parity error"));
	else if (BUS_ERROR(ec)) {
393
		bool k8 = (boot_cpu_data.x86 == 0xf && (m->status & BIT_64(58)));
394 395

		pr_cont("during %s.\n", (k8 ? "system linefill" : "NB data read"));
396
	} else if (fam_ops->mc1_mce(ec, xec))
397 398
		;
	else
399
		pr_emerg(HW_ERR "Corrupted MC1 MCE info?\n");
400 401
}

402
static bool k8_mc2_mce(u16 ec, u8 xec)
403
{
404
	bool ret = true;
405 406 407 408 409 410

	if (xec == 0x1)
		pr_cont(" in the write data buffers.\n");
	else if (xec == 0x3)
		pr_cont(" in the victim data buffers.\n");
	else if (xec == 0x2 && MEM_ERROR(ec))
411
		pr_cont(": %s error in the L2 cache tags.\n", R4_MSG(ec));
412 413 414 415 416 417
	else if (xec == 0x0) {
		if (TLB_ERROR(ec))
			pr_cont(": %s error in a Page Descriptor Cache or "
				"Guest TLB.\n", TT_MSG(ec));
		else if (BUS_ERROR(ec))
			pr_cont(": %s/ECC error in data read from NB: %s.\n",
418
				R4_MSG(ec), PP_MSG(ec));
419
		else if (MEM_ERROR(ec)) {
420
			u8 r4 = R4(ec);
421

422
			if (r4 >= 0x7)
423
				pr_cont(": %s error during data copyback.\n",
424 425
					R4_MSG(ec));
			else if (r4 <= 0x1)
426
				pr_cont(": %s parity/ECC error during data "
427
					"access from L2.\n", R4_MSG(ec));
428
			else
429
				ret = false;
430
		} else
431
			ret = false;
432
	} else
433
		ret = false;
434

435
	return ret;
436 437
}

438
static bool f15h_mc2_mce(u16 ec, u8 xec)
439
{
440
	bool ret = true;
441 442 443 444 445 446 447

	if (TLB_ERROR(ec)) {
		if (xec == 0x0)
			pr_cont("Data parity TLB read error.\n");
		else if (xec == 0x1)
			pr_cont("Poison data provided for TLB fill.\n");
		else
448
			ret = false;
449 450
	} else if (BUS_ERROR(ec)) {
		if (xec > 2)
451
			ret = false;
452 453 454 455 456

		pr_cont("Error during attempted NB data read.\n");
	} else if (MEM_ERROR(ec)) {
		switch (xec) {
		case 0x4 ... 0xc:
457
			pr_cont("%s.\n", f15h_mc2_mce_desc[xec - 0x4]);
458 459 460
			break;

		case 0x10 ... 0x14:
461
			pr_cont("%s.\n", f15h_mc2_mce_desc[xec - 0x7]);
462 463 464
			break;

		default:
465
			ret = false;
466 467 468
		}
	}

469 470 471 472 473 474 475
	return ret;
}

static void decode_mc2_mce(struct mce *m)
{
	u16 ec = EC(m->status);
	u8 xec = XEC(m->status, xec_mask);
476

477 478 479 480
	pr_emerg(HW_ERR "MC2 Error: ");

	if (!fam_ops->mc2_mce(ec, xec))
		pr_cont(HW_ERR "Corrupted MC2 MCE info?\n");
481 482
}

483
static void decode_mc3_mce(struct mce *m)
484
{
485 486
	u16 ec = EC(m->status);
	u8 xec = XEC(m->status, xec_mask);
487

488
	if (boot_cpu_data.x86 >= 0x14) {
489
		pr_emerg("You shouldn't be seeing MC3 MCE on this cpu family,"
490 491 492
			 " please report on LKML.\n");
		return;
	}
493

494
	pr_emerg(HW_ERR "MC3 Error");
495 496

	if (xec == 0x0) {
497
		u8 r4 = R4(ec);
498

499
		if (!BUS_ERROR(ec) || (r4 != R4_DRD && r4 != R4_DWR))
500
			goto wrong_mc3_mce;
501

502
		pr_cont(" during %s.\n", R4_MSG(ec));
503
	} else
504
		goto wrong_mc3_mce;
505

506 507
	return;

508 509
 wrong_mc3_mce:
	pr_emerg(HW_ERR "Corrupted MC3 MCE info?\n");
510 511
}

512
static void decode_mc4_mce(struct mce *m)
513
{
514 515 516 517 518
	struct cpuinfo_x86 *c = &boot_cpu_data;
	int node_id = amd_get_nb_id(m->extcpu);
	u16 ec = EC(m->status);
	u8 xec = XEC(m->status, 0x1f);
	u8 offset = 0;
519

520
	pr_emerg(HW_ERR "MC4 Error (node %d): ", node_id);
521

522 523
	switch (xec) {
	case 0x0 ... 0xe:
524

525 526 527 528
		/* special handling for DRAM ECCs */
		if (xec == 0x0 || xec == 0x8) {
			/* no ECCs on F11h */
			if (c->x86 == 0x11)
529
				goto wrong_mc4_mce;
530

531
			pr_cont("%s.\n", mc4_mce_desc[xec]);
532

533 534 535 536
			if (nb_bus_decoder)
				nb_bus_decoder(node_id, m);
			return;
		}
537 538 539 540 541 542 543 544
		break;

	case 0xf:
		if (TLB_ERROR(ec))
			pr_cont("GART Table Walk data error.\n");
		else if (BUS_ERROR(ec))
			pr_cont("DMA Exclusion Vector Table Walk error.\n");
		else
545
			goto wrong_mc4_mce;
546
		return;
547

548 549 550 551
	case 0x19:
		if (boot_cpu_data.x86 == 0x15)
			pr_cont("Compute Unit Data Error.\n");
		else
552
			goto wrong_mc4_mce;
553
		return;
554

555
	case 0x1c ... 0x1f:
556
		offset = 13;
557 558 559
		break;

	default:
560
		goto wrong_mc4_mce;
561
	}
562

563
	pr_cont("%s.\n", mc4_mce_desc[xec - offset]);
564 565
	return;

566 567
 wrong_mc4_mce:
	pr_emerg(HW_ERR "Corrupted MC4 MCE info?\n");
568 569
}

570
static void decode_mc5_mce(struct mce *m)
B
Borislav Petkov 已提交
571
{
572
	struct cpuinfo_x86 *c = &boot_cpu_data;
573
	u8 xec = XEC(m->status, xec_mask);
574 575

	if (c->x86 == 0xf || c->x86 == 0x11)
576
		goto wrong_mc5_mce;
B
Borislav Petkov 已提交
577

578
	pr_emerg(HW_ERR "MC5 Error: ");
579 580

	if (xec == 0x0 || xec == 0xc)
581
		pr_cont("%s.\n", mc5_mce_desc[xec]);
582
	else if (xec < 0xd)
583
		pr_cont("%s parity error.\n", mc5_mce_desc[xec]);
584
	else
585
		goto wrong_mc5_mce;
586 587

	return;
B
Borislav Petkov 已提交
588

589 590
 wrong_mc5_mce:
	pr_emerg(HW_ERR "Corrupted MC5 MCE info?\n");
B
Borislav Petkov 已提交
591 592
}

593
static void decode_mc6_mce(struct mce *m)
594
{
595
	u8 xec = XEC(m->status, xec_mask);
596

597
	pr_emerg(HW_ERR "MC6 Error: ");
598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620

	switch (xec) {
	case 0x1:
		pr_cont("Free List");
		break;

	case 0x2:
		pr_cont("Physical Register File");
		break;

	case 0x3:
		pr_cont("Retire Queue");
		break;

	case 0x4:
		pr_cont("Scheduler table");
		break;

	case 0x5:
		pr_cont("Status Register File");
		break;

	default:
621
		goto wrong_mc6_mce;
622 623 624 625 626 627 628
		break;
	}

	pr_cont(" parity error.\n");

	return;

629 630
 wrong_mc6_mce:
	pr_emerg(HW_ERR "Corrupted MC6 MCE info?\n");
631 632
}

B
Borislav Petkov 已提交
633
static inline void amd_decode_err_code(u16 ec)
634
{
635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650

	pr_emerg(HW_ERR "cache level: %s", LL_MSG(ec));

	if (BUS_ERROR(ec))
		pr_cont(", mem/io: %s", II_MSG(ec));
	else
		pr_cont(", tx: %s", TT_MSG(ec));

	if (MEM_ERROR(ec) || BUS_ERROR(ec)) {
		pr_cont(", mem-tx: %s", R4_MSG(ec));

		if (BUS_ERROR(ec))
			pr_cont(", part-proc: %s (%s)", PP_MSG(ec), TO_MSG(ec));
	}

	pr_cont("\n");
651 652
}

653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668
/*
 * Filter out unwanted MCE signatures here.
 */
static bool amd_filter_mce(struct mce *m)
{
	u8 xec = (m->status >> 16) & 0x1f;

	/*
	 * NB GART TLB error reporting is disabled by default.
	 */
	if (m->bank == 4 && xec == 0x5 && !report_gart_errors)
		return true;

	return false;
}

B
Borislav Petkov 已提交
669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684
static const char *decode_error_status(struct mce *m)
{
	if (m->status & MCI_STATUS_UC) {
		if (m->status & MCI_STATUS_PCC)
			return "System Fatal error.";
		if (m->mcgstatus & MCG_STATUS_RIPV)
			return "Uncorrected, software restartable error.";
		return "Uncorrected, software containable error.";
	}

	if (m->status & MCI_STATUS_DEFERRED)
		return "Deferred error.";

	return "Corrected error, no action required.";
}

B
Borislav Petkov 已提交
685
int amd_decode_mce(struct notifier_block *nb, unsigned long val, void *data)
686
{
687
	struct mce *m = (struct mce *)data;
688
	struct cpuinfo_x86 *c = &cpu_data(m->extcpu);
689
	int ecc;
690

691 692 693
	if (amd_filter_mce(m))
		return NOTIFY_STOP;

694 695
	switch (m->bank) {
	case 0:
696
		decode_mc0_mce(m);
697
		break;
698

699
	case 1:
700
		decode_mc1_mce(m);
701 702
		break;

703
	case 2:
704
		decode_mc2_mce(m);
705 706
		break;

707
	case 3:
708
		decode_mc3_mce(m);
709 710
		break;

711
	case 4:
712
		decode_mc4_mce(m);
713 714
		break;

B
Borislav Petkov 已提交
715
	case 5:
716
		decode_mc5_mce(m);
B
Borislav Petkov 已提交
717 718
		break;

719
	case 6:
720
		decode_mc6_mce(m);
721 722
		break;

723 724
	default:
		break;
725
	}
726

B
Borislav Petkov 已提交
727 728
	pr_emerg(HW_ERR "Error Status: %s\n", decode_error_status(m));

729 730 731 732 733 734 735 736 737 738 739 740
	pr_emerg(HW_ERR "CPU:%d (%x:%x:%x) MC%d_STATUS[%s|%s|%s|%s|%s",
		m->extcpu,
		c->x86, c->x86_model, c->x86_mask,
		m->bank,
		((m->status & MCI_STATUS_OVER)	? "Over"  : "-"),
		((m->status & MCI_STATUS_UC)	? "UE"	  : "CE"),
		((m->status & MCI_STATUS_MISCV)	? "MiscV" : "-"),
		((m->status & MCI_STATUS_PCC)	? "PCC"	  : "-"),
		((m->status & MCI_STATUS_ADDRV)	? "AddrV" : "-"));

	if (c->x86 == 0x15)
		pr_cont("|%s|%s",
B
Borislav Petkov 已提交
741 742
			((m->status & MCI_STATUS_DEFERRED) ? "Deferred" : "-"),
			((m->status & MCI_STATUS_POISON)   ? "Poison"   : "-"));
743 744 745 746 747 748 749 750 751 752 753

	/* do the two bits[14:13] together */
	ecc = (m->status >> 45) & 0x3;
	if (ecc)
		pr_cont("|%sECC", ((ecc == 2) ? "C" : "U"));

	pr_cont("]: 0x%016llx\n", m->status);

	if (m->status & MCI_STATUS_ADDRV)
		pr_emerg(HW_ERR "MC%d_ADDR: 0x%016llx\n", m->bank, m->addr);

754
	amd_decode_err_code(m->status & 0xffff);
755 756

	return NOTIFY_STOP;
757
}
B
Borislav Petkov 已提交
758
EXPORT_SYMBOL_GPL(amd_decode_mce);
759

760 761 762 763
static struct notifier_block amd_mce_dec_nb = {
	.notifier_call	= amd_decode_mce,
};

764 765
static int __init mce_amd_init(void)
{
766 767 768
	struct cpuinfo_x86 *c = &boot_cpu_data;

	if (c->x86_vendor != X86_VENDOR_AMD)
769 770
		return 0;

771
	if (c->x86 < 0xf || c->x86 > 0x15)
772 773
		return 0;

774 775 776 777
	fam_ops = kzalloc(sizeof(struct amd_decoder_ops), GFP_KERNEL);
	if (!fam_ops)
		return -ENOMEM;

778
	switch (c->x86) {
779
	case 0xf:
780 781
		fam_ops->mc0_mce = k8_mc0_mce;
		fam_ops->mc1_mce = k8_mc1_mce;
782
		fam_ops->mc2_mce = k8_mc2_mce;
783 784 785
		break;

	case 0x10:
786 787
		fam_ops->mc0_mce = f10h_mc0_mce;
		fam_ops->mc1_mce = k8_mc1_mce;
788
		fam_ops->mc2_mce = k8_mc2_mce;
789 790
		break;

791
	case 0x11:
792 793
		fam_ops->mc0_mce = k8_mc0_mce;
		fam_ops->mc1_mce = k8_mc1_mce;
794
		fam_ops->mc2_mce = k8_mc2_mce;
795 796
		break;

797
	case 0x12:
798 799
		fam_ops->mc0_mce = f12h_mc0_mce;
		fam_ops->mc1_mce = k8_mc1_mce;
800
		fam_ops->mc2_mce = k8_mc2_mce;
801 802
		break;

803
	case 0x14:
804
		nb_err_cpumask  = 0x3;
805 806
		fam_ops->mc0_mce = f14h_mc0_mce;
		fam_ops->mc1_mce = f14h_mc1_mce;
807
		fam_ops->mc2_mce = k8_mc2_mce;
808 809
		break;

810 811
	case 0x15:
		xec_mask = 0x1f;
812 813
		fam_ops->mc0_mce = f15h_mc0_mce;
		fam_ops->mc1_mce = f15h_mc1_mce;
814
		fam_ops->mc2_mce = f15h_mc2_mce;
815 816
		break;

817
	default:
818
		printk(KERN_WARNING "Huh? What family is it: 0x%x?!\n", c->x86);
819 820 821 822
		kfree(fam_ops);
		return -EINVAL;
	}

823 824
	pr_info("MCE: In-kernel MCE decoding enabled.\n");

825
	mce_register_decode_chain(&amd_mce_dec_nb);
826 827 828 829

	return 0;
}
early_initcall(mce_amd_init);
830 831 832 833

#ifdef MODULE
static void __exit mce_amd_exit(void)
{
834
	mce_unregister_decode_chain(&amd_mce_dec_nb);
835
	kfree(fam_ops);
836 837 838 839 840 841 842
}

MODULE_DESCRIPTION("AMD MCE decoder");
MODULE_ALIAS("edac-mce-amd");
MODULE_LICENSE("GPL");
module_exit(mce_amd_exit);
#endif