e752x_edac.c 39.7 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/*
 * Intel e752x Memory Controller kernel module
 * (C) 2004 Linux Networx (http://lnxi.com)
 * This file may be distributed under the terms of the
 * GNU General Public License.
 *
 * See "enum e752x_chips" below for supported chipsets
 *
 * Written by Tom Zimmerman
 *
 * Contributors:
 * 	Thayne Harbaugh at realmsys.com (?)
 * 	Wang Zhenyu at intel.com
 * 	Dave Jiang at mvista.com
 *
A
Alan Cox 已提交
16
 * $Id: edac_e752x.c,v 1.5.2.11 2005/10/05 00:43:44 dsp_llnl Exp $
17 18 19 20 21 22 23
 *
 */

#include <linux/module.h>
#include <linux/init.h>
#include <linux/pci.h>
#include <linux/pci_ids.h>
D
Dave Jiang 已提交
24
#include <linux/edac.h>
25
#include "edac_core.h"
26

M
Michal Marek 已提交
27
#define E752X_REVISION	" Ver: 2.0.2"
28
#define EDAC_MOD_STR	"e752x_edac"
29

30
static int report_non_memory_errors;
M
mark gross 已提交
31
static int force_function_unhide;
32
static int sysbus_parity = -1;
M
mark gross 已提交
33

34 35
static struct edac_pci_ctl_info *e752x_pci;

D
Dave Peterson 已提交
36
#define e752x_printk(level, fmt, arg...) \
D
Dave Peterson 已提交
37
	edac_printk(level, "e752x", fmt, ##arg)
D
Dave Peterson 已提交
38 39

#define e752x_mc_printk(mci, level, fmt, arg...) \
D
Dave Peterson 已提交
40
	edac_mc_chipset_printk(mci, level, "e752x", fmt, ##arg)
D
Dave Peterson 已提交
41

42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65
#ifndef PCI_DEVICE_ID_INTEL_7520_0
#define PCI_DEVICE_ID_INTEL_7520_0      0x3590
#endif				/* PCI_DEVICE_ID_INTEL_7520_0      */

#ifndef PCI_DEVICE_ID_INTEL_7520_1_ERR
#define PCI_DEVICE_ID_INTEL_7520_1_ERR  0x3591
#endif				/* PCI_DEVICE_ID_INTEL_7520_1_ERR  */

#ifndef PCI_DEVICE_ID_INTEL_7525_0
#define PCI_DEVICE_ID_INTEL_7525_0      0x359E
#endif				/* PCI_DEVICE_ID_INTEL_7525_0      */

#ifndef PCI_DEVICE_ID_INTEL_7525_1_ERR
#define PCI_DEVICE_ID_INTEL_7525_1_ERR  0x3593
#endif				/* PCI_DEVICE_ID_INTEL_7525_1_ERR  */

#ifndef PCI_DEVICE_ID_INTEL_7320_0
#define PCI_DEVICE_ID_INTEL_7320_0	0x3592
#endif				/* PCI_DEVICE_ID_INTEL_7320_0 */

#ifndef PCI_DEVICE_ID_INTEL_7320_1_ERR
#define PCI_DEVICE_ID_INTEL_7320_1_ERR	0x3593
#endif				/* PCI_DEVICE_ID_INTEL_7320_1_ERR */

66 67 68 69 70 71 72 73
#ifndef PCI_DEVICE_ID_INTEL_3100_0
#define PCI_DEVICE_ID_INTEL_3100_0	0x35B0
#endif				/* PCI_DEVICE_ID_INTEL_3100_0 */

#ifndef PCI_DEVICE_ID_INTEL_3100_1_ERR
#define PCI_DEVICE_ID_INTEL_3100_1_ERR	0x35B1
#endif				/* PCI_DEVICE_ID_INTEL_3100_1_ERR */

74 75 76
#define E752X_NR_CSROWS		8	/* number of csrows */

/* E752X register addresses - device 0 function 0 */
77 78 79 80 81 82 83 84
#define E752X_MCHSCRB		0x52	/* Memory Scrub register (16b) */
					/*
					 * 6:5     Scrub Completion Count
					 * 3:2     Scrub Rate (i3100 only)
					 *      01=fast 10=normal
					 * 1:0     Scrub Mode enable
					 *      00=off 10=on
					 */
85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127
#define E752X_DRB		0x60	/* DRAM row boundary register (8b) */
#define E752X_DRA		0x70	/* DRAM row attribute register (8b) */
					/*
					 * 31:30   Device width row 7
					 *      01=x8 10=x4 11=x8 DDR2
					 * 27:26   Device width row 6
					 * 23:22   Device width row 5
					 * 19:20   Device width row 4
					 * 15:14   Device width row 3
					 * 11:10   Device width row 2
					 *  7:6    Device width row 1
					 *  3:2    Device width row 0
					 */
#define E752X_DRC		0x7C	/* DRAM controller mode reg (32b) */
					/* FIXME:IS THIS RIGHT? */
					/*
					 * 22    Number channels 0=1,1=2
					 * 19:18 DRB Granularity 32/64MB
					 */
#define E752X_DRM		0x80	/* Dimm mapping register */
#define E752X_DDRCSR		0x9A	/* DDR control and status reg (16b) */
					/*
					 * 14:12 1 single A, 2 single B, 3 dual
					 */
#define E752X_TOLM		0xC4	/* DRAM top of low memory reg (16b) */
#define E752X_REMAPBASE		0xC6	/* DRAM remap base address reg (16b) */
#define E752X_REMAPLIMIT	0xC8	/* DRAM remap limit address reg (16b) */
#define E752X_REMAPOFFSET	0xCA	/* DRAM remap limit offset reg (16b) */

/* E752X register addresses - device 0 function 1 */
#define E752X_FERR_GLOBAL	0x40	/* Global first error register (32b) */
#define E752X_NERR_GLOBAL	0x44	/* Global next error register (32b) */
#define E752X_HI_FERR		0x50	/* Hub interface first error reg (8b) */
#define E752X_HI_NERR		0x52	/* Hub interface next error reg (8b) */
#define E752X_HI_ERRMASK	0x54	/* Hub interface error mask reg (8b) */
#define E752X_HI_SMICMD		0x5A	/* Hub interface SMI command reg (8b) */
#define E752X_SYSBUS_FERR	0x60	/* System buss first error reg (16b) */
#define E752X_SYSBUS_NERR	0x62	/* System buss next error reg (16b) */
#define E752X_SYSBUS_ERRMASK	0x64	/* System buss error mask reg (16b) */
#define E752X_SYSBUS_SMICMD	0x6A	/* System buss SMI command reg (16b) */
#define E752X_BUF_FERR		0x70	/* Memory buffer first error reg (8b) */
#define E752X_BUF_NERR		0x72	/* Memory buffer next error reg (8b) */
#define E752X_BUF_ERRMASK	0x74	/* Memory buffer error mask reg (8b) */
128
#define E752X_BUF_SMICMD	0x7A	/* Memory buffer SMI cmd reg (8b) */
129 130 131 132 133 134 135 136 137
#define E752X_DRAM_FERR		0x80	/* DRAM first error register (16b) */
#define E752X_DRAM_NERR		0x82	/* DRAM next error register (16b) */
#define E752X_DRAM_ERRMASK	0x84	/* DRAM error mask register (8b) */
#define E752X_DRAM_SMICMD	0x8A	/* DRAM SMI command register (8b) */
#define E752X_DRAM_RETR_ADD	0xAC	/* DRAM Retry address register (32b) */
#define E752X_DRAM_SEC1_ADD	0xA0	/* DRAM first correctable memory */
					/*     error address register (32b) */
					/*
					 * 31    Reserved
138
					 * 30:2  CE address (64 byte block 34:6
139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157
					 * 1     Reserved
					 * 0     HiLoCS
					 */
#define E752X_DRAM_SEC2_ADD	0xC8	/* DRAM first correctable memory */
					/*     error address register (32b) */
					/*
					 * 31    Reserved
					 * 30:2  CE address (64 byte block 34:6)
					 * 1     Reserved
					 * 0     HiLoCS
					 */
#define E752X_DRAM_DED_ADD	0xA4	/* DRAM first uncorrectable memory */
					/*     error address register (32b) */
					/*
					 * 31    Reserved
					 * 30:2  CE address (64 byte block 34:6)
					 * 1     Reserved
					 * 0     HiLoCS
					 */
158
#define E752X_DRAM_SCRB_ADD	0xA8	/* DRAM 1st uncorrectable scrub mem */
159 160 161
					/*     error address register (32b) */
					/*
					 * 31    Reserved
162
					 * 30:2  CE address (64 byte block 34:6
163 164 165 166 167 168 169 170 171
					 * 1     Reserved
					 * 0     HiLoCS
					 */
#define E752X_DRAM_SEC1_SYNDROME 0xC4	/* DRAM first correctable memory */
					/*     error syndrome register (16b) */
#define E752X_DRAM_SEC2_SYNDROME 0xC6	/* DRAM second correctable memory */
					/*     error syndrome register (16b) */
#define E752X_DEVPRES1		0xF4	/* Device Present 1 register (8b) */

172 173 174 175 176 177
/* 3100 IMCH specific register addresses - device 0 function 1 */
#define I3100_NSI_FERR		0x48	/* NSI first error reg (32b) */
#define I3100_NSI_NERR		0x4C	/* NSI next error reg (32b) */
#define I3100_NSI_SMICMD	0x54	/* NSI SMI command register (32b) */
#define I3100_NSI_EMASK		0x90	/* NSI error mask register (32b) */

178 179 180 181 182 183 184 185
/* ICH5R register addresses - device 30 function 0 */
#define ICH5R_PCI_STAT		0x06	/* PCI status register (16b) */
#define ICH5R_PCI_2ND_STAT	0x1E	/* PCI status secondary reg (16b) */
#define ICH5R_PCI_BRIDGE_CTL	0x3E	/* PCI bridge control register (16b) */

enum e752x_chips {
	E7520 = 0,
	E7525 = 1,
186 187
	E7320 = 2,
	I3100 = 3
188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204
};

struct e752x_pvt {
	struct pci_dev *bridge_ck;
	struct pci_dev *dev_d0f0;
	struct pci_dev *dev_d0f1;
	u32 tolm;
	u32 remapbase;
	u32 remaplimit;
	int mc_symmetric;
	u8 map[8];
	int map_type;
	const struct e752x_dev_info *dev_info;
};

struct e752x_dev_info {
	u16 err_dev;
D
Dave Peterson 已提交
205
	u16 ctl_dev;
206 207 208 209 210 211
	const char *ctl_name;
};

struct e752x_error_info {
	u32 ferr_global;
	u32 nerr_global;
212 213 214 215
	u32 nsi_ferr;	/* 3100 only */
	u32 nsi_nerr;	/* 3100 only */
	u8 hi_ferr;	/* all but 3100 */
	u8 hi_nerr;	/* all but 3100 */
216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232
	u16 sysbus_ferr;
	u16 sysbus_nerr;
	u8 buf_ferr;
	u8 buf_nerr;
	u16 dram_ferr;
	u16 dram_nerr;
	u32 dram_sec1_add;
	u32 dram_sec2_add;
	u16 dram_sec1_syndrome;
	u16 dram_sec2_syndrome;
	u32 dram_ded_add;
	u32 dram_scrb_add;
	u32 dram_retr_add;
};

static const struct e752x_dev_info e752x_devs[] = {
	[E7520] = {
233 234 235
		.err_dev = PCI_DEVICE_ID_INTEL_7520_1_ERR,
		.ctl_dev = PCI_DEVICE_ID_INTEL_7520_0,
		.ctl_name = "E7520"},
236
	[E7525] = {
237 238 239
		.err_dev = PCI_DEVICE_ID_INTEL_7525_1_ERR,
		.ctl_dev = PCI_DEVICE_ID_INTEL_7525_0,
		.ctl_name = "E7525"},
240
	[E7320] = {
241 242 243
		.err_dev = PCI_DEVICE_ID_INTEL_7320_1_ERR,
		.ctl_dev = PCI_DEVICE_ID_INTEL_7320_0,
		.ctl_name = "E7320"},
244 245 246 247
	[I3100] = {
		.err_dev = PCI_DEVICE_ID_INTEL_3100_1_ERR,
		.ctl_dev = PCI_DEVICE_ID_INTEL_3100_0,
		.ctl_name = "3100"},
248 249
};

250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284
/* Valid scrub rates for the e752x/3100 hardware memory scrubber. We
 * map the scrubbing bandwidth to a hardware register value. The 'set'
 * operation finds the 'matching or higher value'.  Note that scrubbing
 * on the e752x can only be enabled/disabled.  The 3100 supports
 * a normal and fast mode.
 */

#define SDRATE_EOT 0xFFFFFFFF

struct scrubrate {
	u32 bandwidth;	/* bandwidth consumed by scrubbing in bytes/sec */
	u16 scrubval;	/* register value for scrub rate */
};

/* Rate below assumes same performance as i3100 using PC3200 DDR2 in
 * normal mode.  e752x bridges don't support choosing normal or fast mode,
 * so the scrubbing bandwidth value isn't all that important - scrubbing is
 * either on or off.
 */
static const struct scrubrate scrubrates_e752x[] = {
	{0,		0x00},	/* Scrubbing Off */
	{500000,	0x02},	/* Scrubbing On */
	{SDRATE_EOT,	0x00}	/* End of Table */
};

/* Fast mode: 2 GByte PC3200 DDR2 scrubbed in 33s = 63161283 bytes/s
 * Normal mode: 125 (32000 / 256) times slower than fast mode.
 */
static const struct scrubrate scrubrates_i3100[] = {
	{0,		0x00},	/* Scrubbing Off */
	{500000,	0x0a},	/* Normal mode - 32k clocks */
	{62500000,	0x06},	/* Fast mode - 256 clocks */
	{SDRATE_EOT,	0x00}	/* End of Table */
};

285
static unsigned long ctl_page_to_phys(struct mem_ctl_info *mci,
286
				unsigned long page)
287 288
{
	u32 remap;
D
Dave Jiang 已提交
289
	struct e752x_pvt *pvt = (struct e752x_pvt *)mci->pvt_info;
290

D
Dave Peterson 已提交
291
	debugf3("%s()\n", __func__);
292 293 294

	if (page < pvt->tolm)
		return page;
D
Dave Peterson 已提交
295

296 297
	if ((page >= 0x100000) && (page < pvt->remapbase))
		return page;
D
Dave Peterson 已提交
298

299
	remap = (page - pvt->tolm) + pvt->remapbase;
D
Dave Peterson 已提交
300

301 302
	if (remap < pvt->remaplimit)
		return remap;
D
Dave Peterson 已提交
303

D
Dave Peterson 已提交
304
	e752x_printk(KERN_ERR, "Invalid page %lx - out of range\n", page);
305 306 307 308
	return pvt->tolm - 1;
}

static void do_process_ce(struct mem_ctl_info *mci, u16 error_one,
309
			u32 sec1_add, u16 sec1_syndrome)
310 311 312 313 314
{
	u32 page;
	int row;
	int channel;
	int i;
D
Dave Jiang 已提交
315
	struct e752x_pvt *pvt = (struct e752x_pvt *)mci->pvt_info;
316

D
Dave Peterson 已提交
317
	debugf3("%s()\n", __func__);
318 319 320 321 322 323 324 325

	/* convert the addr to 4k page */
	page = sec1_add >> (PAGE_SHIFT - 4);

	/* FIXME - check for -1 */
	if (pvt->mc_symmetric) {
		/* chip select are bits 14 & 13 */
		row = ((page >> 1) & 3);
D
Dave Peterson 已提交
326
		e752x_printk(KERN_WARNING,
327 328 329 330
			"Test row %d Table %d %d %d %d %d %d %d %d\n", row,
			pvt->map[0], pvt->map[1], pvt->map[2], pvt->map[3],
			pvt->map[4], pvt->map[5], pvt->map[6],
			pvt->map[7]);
331 332 333 334 335 336

		/* test for channel remapping */
		for (i = 0; i < 8; i++) {
			if (pvt->map[i] == row)
				break;
		}
D
Dave Peterson 已提交
337

D
Dave Peterson 已提交
338
		e752x_printk(KERN_WARNING, "Test computed row %d\n", i);
D
Dave Peterson 已提交
339

340 341 342
		if (i < 8)
			row = i;
		else
D
Dave Peterson 已提交
343
			e752x_mc_printk(mci, KERN_WARNING,
D
Dave Jiang 已提交
344 345
					"row %d not found in remap table\n",
					row);
346 347
	} else
		row = edac_mc_find_csrow_by_page(mci, page);
D
Dave Peterson 已提交
348

349 350 351
	/* 0 = channel A, 1 = channel B */
	channel = !(error_one & 1);

M
Mike Chan 已提交
352 353
	/* e752x mc reads 34:6 of the DRAM linear address */
	edac_mc_handle_ce(mci, page, offset_in_page(sec1_add << 4),
354
			sec1_syndrome, row, channel, "e752x CE");
355 356 357
}

static inline void process_ce(struct mem_ctl_info *mci, u16 error_one,
358 359
			u32 sec1_add, u16 sec1_syndrome, int *error_found,
			int handle_error)
360 361 362 363 364 365 366
{
	*error_found = 1;

	if (handle_error)
		do_process_ce(mci, error_one, sec1_add, sec1_syndrome);
}

D
Dave Peterson 已提交
367
static void do_process_ue(struct mem_ctl_info *mci, u16 error_one,
368
			u32 ded_add, u32 scrb_add)
369 370 371
{
	u32 error_2b, block_page;
	int row;
D
Dave Jiang 已提交
372
	struct e752x_pvt *pvt = (struct e752x_pvt *)mci->pvt_info;
373

D
Dave Peterson 已提交
374
	debugf3("%s()\n", __func__);
375 376 377

	if (error_one & 0x0202) {
		error_2b = ded_add;
D
Dave Peterson 已提交
378

379 380
		/* convert to 4k address */
		block_page = error_2b >> (PAGE_SHIFT - 4);
D
Dave Peterson 已提交
381

382
		row = pvt->mc_symmetric ?
383 384 385
		/* chip select are bits 14 & 13 */
			((block_page >> 1) & 3) :
			edac_mc_find_csrow_by_page(mci, block_page);
D
Dave Peterson 已提交
386

M
Mike Chan 已提交
387 388
		/* e752x mc reads 34:6 of the DRAM linear address */
		edac_mc_handle_ue(mci, block_page,
389 390
				offset_in_page(error_2b << 4),
				row, "e752x UE from Read");
391 392 393
	}
	if (error_one & 0x0404) {
		error_2b = scrb_add;
D
Dave Peterson 已提交
394

395 396
		/* convert to 4k address */
		block_page = error_2b >> (PAGE_SHIFT - 4);
D
Dave Peterson 已提交
397

398
		row = pvt->mc_symmetric ?
399 400 401
		/* chip select are bits 14 & 13 */
			((block_page >> 1) & 3) :
			edac_mc_find_csrow_by_page(mci, block_page);
D
Dave Peterson 已提交
402

M
Mike Chan 已提交
403 404
		/* e752x mc reads 34:6 of the DRAM linear address */
		edac_mc_handle_ue(mci, block_page,
405 406
				offset_in_page(error_2b << 4),
				row, "e752x UE from Scruber");
407 408 409 410
	}
}

static inline void process_ue(struct mem_ctl_info *mci, u16 error_one,
411 412
			u32 ded_add, u32 scrb_add, int *error_found,
			int handle_error)
413 414 415 416 417 418 419 420
{
	*error_found = 1;

	if (handle_error)
		do_process_ue(mci, error_one, ded_add, scrb_add);
}

static inline void process_ue_no_info_wr(struct mem_ctl_info *mci,
D
Dave Jiang 已提交
421
					 int *error_found, int handle_error)
422 423 424 425 426 427
{
	*error_found = 1;

	if (!handle_error)
		return;

D
Dave Peterson 已提交
428
	debugf3("%s()\n", __func__);
429 430 431 432
	edac_mc_handle_ue_no_info(mci, "e752x UE log memory write");
}

static void do_process_ded_retry(struct mem_ctl_info *mci, u16 error,
D
Dave Jiang 已提交
433
				 u32 retry_add)
434 435 436
{
	u32 error_1b, page;
	int row;
D
Dave Jiang 已提交
437
	struct e752x_pvt *pvt = (struct e752x_pvt *)mci->pvt_info;
438 439

	error_1b = retry_add;
440 441 442 443
	page = error_1b >> (PAGE_SHIFT - 4);  /* convert the addr to 4k page */

	/* chip select are bits 14 & 13 */
	row = pvt->mc_symmetric ? ((page >> 1) & 3) :
444
		edac_mc_find_csrow_by_page(mci, page);
445

D
Dave Peterson 已提交
446
	e752x_mc_printk(mci, KERN_WARNING,
D
Dave Jiang 已提交
447 448
			"CE page 0x%lx, row %d : Memory read retry\n",
			(long unsigned int)page, row);
449 450 451
}

static inline void process_ded_retry(struct mem_ctl_info *mci, u16 error,
452 453
				u32 retry_add, int *error_found,
				int handle_error)
454 455 456 457 458 459 460 461
{
	*error_found = 1;

	if (handle_error)
		do_process_ded_retry(mci, error, retry_add);
}

static inline void process_threshold_ce(struct mem_ctl_info *mci, u16 error,
D
Dave Jiang 已提交
462
					int *error_found, int handle_error)
463 464 465 466
{
	*error_found = 1;

	if (handle_error)
D
Dave Peterson 已提交
467
		e752x_mc_printk(mci, KERN_WARNING, "Memory threshold CE\n");
468 469
}

A
Alan Cox 已提交
470
static char *global_message[11] = {
471 472 473 474 475 476 477 478 479 480 481
	"PCI Express C1",
	"PCI Express C",
	"PCI Express B1",
	"PCI Express B",
	"PCI Express A1",
	"PCI Express A",
	"DMA Controller",
	"HUB or NS Interface",
	"System Bus",
	"DRAM Controller",  /* 9th entry */
	"Internal Buffer"
482 483
};

484 485
#define DRAM_ENTRY	9

A
Alan Cox 已提交
486
static char *fatal_message[2] = { "Non-Fatal ", "Fatal " };
487 488 489 490 491 492

static void do_global_error(int fatal, u32 errors)
{
	int i;

	for (i = 0; i < 11; i++) {
493 494 495 496 497 498 499 500 501 502
		if (errors & (1 << i)) {
			/* If the error is from DRAM Controller OR
			 * we are to report ALL errors, then
			 * report the error
			 */
			if ((i == DRAM_ENTRY) || report_non_memory_errors)
				e752x_printk(KERN_WARNING, "%sError %s\n",
					fatal_message[fatal],
					global_message[i]);
		}
503 504 505 506
	}
}

static inline void global_error(int fatal, u32 errors, int *error_found,
D
Dave Jiang 已提交
507
				int handle_error)
508 509 510 511 512 513 514
{
	*error_found = 1;

	if (handle_error)
		do_global_error(fatal, errors);
}

A
Alan Cox 已提交
515
static char *hub_message[7] = {
516 517 518 519 520 521 522 523 524 525 526 527
	"HI Address or Command Parity", "HI Illegal Access",
	"HI Internal Parity", "Out of Range Access",
	"HI Data Parity", "Enhanced Config Access",
	"Hub Interface Target Abort"
};

static void do_hub_error(int fatal, u8 errors)
{
	int i;

	for (i = 0; i < 7; i++) {
		if (errors & (1 << i))
D
Dave Peterson 已提交
528
			e752x_printk(KERN_WARNING, "%sError %s\n",
529
				fatal_message[fatal], hub_message[i]);
530 531 532 533
	}
}

static inline void hub_error(int fatal, u8 errors, int *error_found,
534
			int handle_error)
535 536 537 538 539 540 541
{
	*error_found = 1;

	if (handle_error)
		do_hub_error(fatal, errors);
}

542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598
#define NSI_FATAL_MASK		0x0c080081
#define NSI_NON_FATAL_MASK	0x23a0ba64
#define NSI_ERR_MASK		(NSI_FATAL_MASK | NSI_NON_FATAL_MASK)

static char *nsi_message[30] = {
	"NSI Link Down",	/* NSI_FERR/NSI_NERR bit 0, fatal error */
	"",						/* reserved */
	"NSI Parity Error",				/* bit 2, non-fatal */
	"",						/* reserved */
	"",						/* reserved */
	"Correctable Error Message",			/* bit 5, non-fatal */
	"Non-Fatal Error Message",			/* bit 6, non-fatal */
	"Fatal Error Message",				/* bit 7, fatal */
	"",						/* reserved */
	"Receiver Error",				/* bit 9, non-fatal */
	"",						/* reserved */
	"Bad TLP",					/* bit 11, non-fatal */
	"Bad DLLP",					/* bit 12, non-fatal */
	"REPLAY_NUM Rollover",				/* bit 13, non-fatal */
	"",						/* reserved */
	"Replay Timer Timeout",				/* bit 15, non-fatal */
	"",						/* reserved */
	"",						/* reserved */
	"",						/* reserved */
	"Data Link Protocol Error",			/* bit 19, fatal */
	"",						/* reserved */
	"Poisoned TLP",					/* bit 21, non-fatal */
	"",						/* reserved */
	"Completion Timeout",				/* bit 23, non-fatal */
	"Completer Abort",				/* bit 24, non-fatal */
	"Unexpected Completion",			/* bit 25, non-fatal */
	"Receiver Overflow",				/* bit 26, fatal */
	"Malformed TLP",				/* bit 27, fatal */
	"",						/* reserved */
	"Unsupported Request"				/* bit 29, non-fatal */
};

static void do_nsi_error(int fatal, u32 errors)
{
	int i;

	for (i = 0; i < 30; i++) {
		if (errors & (1 << i))
			printk(KERN_WARNING "%sError %s\n",
			       fatal_message[fatal], nsi_message[i]);
	}
}

static inline void nsi_error(int fatal, u32 errors, int *error_found,
		int handle_error)
{
	*error_found = 1;

	if (handle_error)
		do_nsi_error(fatal, errors);
}

A
Alan Cox 已提交
599
static char *membuf_message[4] = {
600 601 602 603 604 605 606 607 608 609 610 611
	"Internal PMWB to DRAM parity",
	"Internal PMWB to System Bus Parity",
	"Internal System Bus or IO to PMWB Parity",
	"Internal DRAM to PMWB Parity"
};

static void do_membuf_error(u8 errors)
{
	int i;

	for (i = 0; i < 4; i++) {
		if (errors & (1 << i))
D
Dave Peterson 已提交
612
			e752x_printk(KERN_WARNING, "Non-Fatal Error %s\n",
613
				membuf_message[i]);
614 615 616 617 618 619 620 621 622 623 624
	}
}

static inline void membuf_error(u8 errors, int *error_found, int handle_error)
{
	*error_found = 1;

	if (handle_error)
		do_membuf_error(errors);
}

625
static char *sysbus_message[10] = {
626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642
	"Addr or Request Parity",
	"Data Strobe Glitch",
	"Addr Strobe Glitch",
	"Data Parity",
	"Addr Above TOM",
	"Non DRAM Lock Error",
	"MCERR", "BINIT",
	"Memory Parity",
	"IO Subsystem Parity"
};

static void do_sysbus_error(int fatal, u32 errors)
{
	int i;

	for (i = 0; i < 10; i++) {
		if (errors & (1 << i))
D
Dave Peterson 已提交
643
			e752x_printk(KERN_WARNING, "%sError System Bus %s\n",
644
				fatal_message[fatal], sysbus_message[i]);
645 646 647 648
	}
}

static inline void sysbus_error(int fatal, u32 errors, int *error_found,
D
Dave Jiang 已提交
649
				int handle_error)
650 651 652 653 654 655 656
{
	*error_found = 1;

	if (handle_error)
		do_sysbus_error(fatal, errors);
}

D
Dave Peterson 已提交
657
static void e752x_check_hub_interface(struct e752x_error_info *info,
658
				int *error_found, int handle_error)
659 660 661 662
{
	u8 stat8;

	//pci_read_config_byte(dev,E752X_HI_FERR,&stat8);
D
Dave Peterson 已提交
663

664
	stat8 = info->hi_ferr;
D
Dave Peterson 已提交
665

D
Dave Jiang 已提交
666
	if (stat8 & 0x7f) {	/* Error, so process */
667
		stat8 &= 0x7f;
D
Dave Peterson 已提交
668

D
Dave Jiang 已提交
669
		if (stat8 & 0x2b)
670
			hub_error(1, stat8 & 0x2b, error_found, handle_error);
D
Dave Peterson 已提交
671

D
Dave Jiang 已提交
672
		if (stat8 & 0x54)
673 674 675
			hub_error(0, stat8 & 0x54, error_found, handle_error);
	}
	//pci_read_config_byte(dev,E752X_HI_NERR,&stat8);
D
Dave Peterson 已提交
676

677
	stat8 = info->hi_nerr;
D
Dave Peterson 已提交
678

D
Dave Jiang 已提交
679
	if (stat8 & 0x7f) {	/* Error, so process */
680
		stat8 &= 0x7f;
D
Dave Peterson 已提交
681

682 683
		if (stat8 & 0x2b)
			hub_error(1, stat8 & 0x2b, error_found, handle_error);
D
Dave Peterson 已提交
684

D
Dave Jiang 已提交
685
		if (stat8 & 0x54)
686 687 688 689
			hub_error(0, stat8 & 0x54, error_found, handle_error);
	}
}

690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714
static void e752x_check_ns_interface(struct e752x_error_info *info,
				int *error_found, int handle_error)
{
	u32 stat32;

	stat32 = info->nsi_ferr;
	if (stat32 & NSI_ERR_MASK) { /* Error, so process */
		if (stat32 & NSI_FATAL_MASK)	/* check for fatal errors */
			nsi_error(1, stat32 & NSI_FATAL_MASK, error_found,
				  handle_error);
		if (stat32 & NSI_NON_FATAL_MASK) /* check for non-fatal ones */
			nsi_error(0, stat32 & NSI_NON_FATAL_MASK, error_found,
				  handle_error);
	}
	stat32 = info->nsi_nerr;
	if (stat32 & NSI_ERR_MASK) {
		if (stat32 & NSI_FATAL_MASK)
			nsi_error(1, stat32 & NSI_FATAL_MASK, error_found,
				  handle_error);
		if (stat32 & NSI_NON_FATAL_MASK)
			nsi_error(0, stat32 & NSI_NON_FATAL_MASK, error_found,
				  handle_error);
	}
}

D
Dave Peterson 已提交
715
static void e752x_check_sysbus(struct e752x_error_info *info,
716
			int *error_found, int handle_error)
717 718 719 720 721 722 723
{
	u32 stat32, error32;

	//pci_read_config_dword(dev,E752X_SYSBUS_FERR,&stat32);
	stat32 = info->sysbus_ferr + (info->sysbus_nerr << 16);

	if (stat32 == 0)
D
Dave Jiang 已提交
724
		return;		/* no errors */
725 726 727

	error32 = (stat32 >> 16) & 0x3ff;
	stat32 = stat32 & 0x3ff;
D
Dave Peterson 已提交
728

D
Dave Jiang 已提交
729
	if (stat32 & 0x087)
730
		sysbus_error(1, stat32 & 0x087, error_found, handle_error);
D
Dave Peterson 已提交
731

D
Dave Jiang 已提交
732
	if (stat32 & 0x378)
733
		sysbus_error(0, stat32 & 0x378, error_found, handle_error);
D
Dave Peterson 已提交
734

D
Dave Jiang 已提交
735
	if (error32 & 0x087)
736
		sysbus_error(1, error32 & 0x087, error_found, handle_error);
D
Dave Peterson 已提交
737

D
Dave Jiang 已提交
738
	if (error32 & 0x378)
739
		sysbus_error(0, error32 & 0x378, error_found, handle_error);
740 741
}

D
Dave Jiang 已提交
742
static void e752x_check_membuf(struct e752x_error_info *info,
743
			int *error_found, int handle_error)
744 745 746 747
{
	u8 stat8;

	stat8 = info->buf_ferr;
D
Dave Peterson 已提交
748

D
Dave Jiang 已提交
749
	if (stat8 & 0x0f) {	/* Error, so process */
750 751 752
		stat8 &= 0x0f;
		membuf_error(stat8, error_found, handle_error);
	}
D
Dave Peterson 已提交
753

754
	stat8 = info->buf_nerr;
D
Dave Peterson 已提交
755

D
Dave Jiang 已提交
756
	if (stat8 & 0x0f) {	/* Error, so process */
757 758 759 760 761
		stat8 &= 0x0f;
		membuf_error(stat8, error_found, handle_error);
	}
}

D
Dave Jiang 已提交
762
static void e752x_check_dram(struct mem_ctl_info *mci,
763 764
			struct e752x_error_info *info, int *error_found,
			int handle_error)
765 766 767 768 769 770 771
{
	u16 error_one, error_next;

	error_one = info->dram_ferr;
	error_next = info->dram_nerr;

	/* decode and report errors */
D
Dave Jiang 已提交
772
	if (error_one & 0x0101)	/* check first error correctable */
773
		process_ce(mci, error_one, info->dram_sec1_add,
774
			info->dram_sec1_syndrome, error_found, handle_error);
775

D
Dave Jiang 已提交
776
	if (error_next & 0x0101)	/* check next error correctable */
777
		process_ce(mci, error_next, info->dram_sec2_add,
778
			info->dram_sec2_syndrome, error_found, handle_error);
779

D
Dave Jiang 已提交
780
	if (error_one & 0x4040)
781 782
		process_ue_no_info_wr(mci, error_found, handle_error);

D
Dave Jiang 已提交
783
	if (error_next & 0x4040)
784 785
		process_ue_no_info_wr(mci, error_found, handle_error);

D
Dave Jiang 已提交
786
	if (error_one & 0x2020)
787
		process_ded_retry(mci, error_one, info->dram_retr_add,
788
				error_found, handle_error);
789

D
Dave Jiang 已提交
790
	if (error_next & 0x2020)
791
		process_ded_retry(mci, error_next, info->dram_retr_add,
792
				error_found, handle_error);
793

D
Dave Jiang 已提交
794 795
	if (error_one & 0x0808)
		process_threshold_ce(mci, error_one, error_found, handle_error);
796

D
Dave Jiang 已提交
797
	if (error_next & 0x0808)
798
		process_threshold_ce(mci, error_next, error_found,
799
				handle_error);
800

D
Dave Jiang 已提交
801
	if (error_one & 0x0606)
802
		process_ue(mci, error_one, info->dram_ded_add,
803
			info->dram_scrb_add, error_found, handle_error);
804

D
Dave Jiang 已提交
805
	if (error_next & 0x0606)
806
		process_ue(mci, error_next, info->dram_ded_add,
807
			info->dram_scrb_add, error_found, handle_error);
808 809
}

D
Dave Jiang 已提交
810 811
static void e752x_get_error_info(struct mem_ctl_info *mci,
				 struct e752x_error_info *info)
812 813 814 815 816
{
	struct pci_dev *dev;
	struct e752x_pvt *pvt;

	memset(info, 0, sizeof(*info));
D
Dave Jiang 已提交
817
	pvt = (struct e752x_pvt *)mci->pvt_info;
818 819 820 821
	dev = pvt->dev_d0f1;
	pci_read_config_dword(dev, E752X_FERR_GLOBAL, &info->ferr_global);

	if (info->ferr_global) {
822 823 824 825 826 827 828 829 830
		if (pvt->dev_info->err_dev == PCI_DEVICE_ID_INTEL_3100_1_ERR) {
			pci_read_config_dword(dev, I3100_NSI_FERR,
					     &info->nsi_ferr);
			info->hi_ferr = 0;
		} else {
			pci_read_config_byte(dev, E752X_HI_FERR,
					     &info->hi_ferr);
			info->nsi_ferr = 0;
		}
831
		pci_read_config_word(dev, E752X_SYSBUS_FERR,
832
				&info->sysbus_ferr);
833
		pci_read_config_byte(dev, E752X_BUF_FERR, &info->buf_ferr);
D
Dave Jiang 已提交
834
		pci_read_config_word(dev, E752X_DRAM_FERR, &info->dram_ferr);
835
		pci_read_config_dword(dev, E752X_DRAM_SEC1_ADD,
836
				&info->dram_sec1_add);
837
		pci_read_config_word(dev, E752X_DRAM_SEC1_SYNDROME,
838
				&info->dram_sec1_syndrome);
839
		pci_read_config_dword(dev, E752X_DRAM_DED_ADD,
840
				&info->dram_ded_add);
841
		pci_read_config_dword(dev, E752X_DRAM_SCRB_ADD,
842
				&info->dram_scrb_add);
843
		pci_read_config_dword(dev, E752X_DRAM_RETR_ADD,
844
				&info->dram_retr_add);
845

846
		/* ignore the reserved bits just in case */
847 848
		if (info->hi_ferr & 0x7f)
			pci_write_config_byte(dev, E752X_HI_FERR,
849
					info->hi_ferr);
850

851 852 853 854
		if (info->nsi_ferr & NSI_ERR_MASK)
			pci_write_config_dword(dev, I3100_NSI_FERR,
					info->nsi_ferr);

855 856
		if (info->sysbus_ferr)
			pci_write_config_word(dev, E752X_SYSBUS_FERR,
857
					info->sysbus_ferr);
858 859 860

		if (info->buf_ferr & 0x0f)
			pci_write_config_byte(dev, E752X_BUF_FERR,
861
					info->buf_ferr);
862 863 864

		if (info->dram_ferr)
			pci_write_bits16(pvt->bridge_ck, E752X_DRAM_FERR,
D
Dave Jiang 已提交
865
					 info->dram_ferr, info->dram_ferr);
866 867

		pci_write_config_dword(dev, E752X_FERR_GLOBAL,
868
				info->ferr_global);
869 870 871 872 873
	}

	pci_read_config_dword(dev, E752X_NERR_GLOBAL, &info->nerr_global);

	if (info->nerr_global) {
874 875 876 877 878 879 880 881 882
		if (pvt->dev_info->err_dev == PCI_DEVICE_ID_INTEL_3100_1_ERR) {
			pci_read_config_dword(dev, I3100_NSI_NERR,
					     &info->nsi_nerr);
			info->hi_nerr = 0;
		} else {
			pci_read_config_byte(dev, E752X_HI_NERR,
					     &info->hi_nerr);
			info->nsi_nerr = 0;
		}
883
		pci_read_config_word(dev, E752X_SYSBUS_NERR,
884
				&info->sysbus_nerr);
885
		pci_read_config_byte(dev, E752X_BUF_NERR, &info->buf_nerr);
D
Dave Jiang 已提交
886
		pci_read_config_word(dev, E752X_DRAM_NERR, &info->dram_nerr);
887
		pci_read_config_dword(dev, E752X_DRAM_SEC2_ADD,
888
				&info->dram_sec2_add);
889
		pci_read_config_word(dev, E752X_DRAM_SEC2_SYNDROME,
890
				&info->dram_sec2_syndrome);
891 892 893

		if (info->hi_nerr & 0x7f)
			pci_write_config_byte(dev, E752X_HI_NERR,
894
					info->hi_nerr);
895

896 897 898 899
		if (info->nsi_nerr & NSI_ERR_MASK)
			pci_write_config_dword(dev, I3100_NSI_NERR,
					info->nsi_nerr);

900 901
		if (info->sysbus_nerr)
			pci_write_config_word(dev, E752X_SYSBUS_NERR,
902
					info->sysbus_nerr);
903 904 905

		if (info->buf_nerr & 0x0f)
			pci_write_config_byte(dev, E752X_BUF_NERR,
906
					info->buf_nerr);
907 908 909

		if (info->dram_nerr)
			pci_write_bits16(pvt->bridge_ck, E752X_DRAM_NERR,
D
Dave Jiang 已提交
910
					 info->dram_nerr, info->dram_nerr);
911 912

		pci_write_config_dword(dev, E752X_NERR_GLOBAL,
913
				info->nerr_global);
914 915 916
	}
}

D
Dave Jiang 已提交
917
static int e752x_process_error_info(struct mem_ctl_info *mci,
918 919
				struct e752x_error_info *info,
				int handle_errors)
920 921 922 923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938 939 940 941 942 943
{
	u32 error32, stat32;
	int error_found;

	error_found = 0;
	error32 = (info->ferr_global >> 18) & 0x3ff;
	stat32 = (info->ferr_global >> 4) & 0x7ff;

	if (error32)
		global_error(1, error32, &error_found, handle_errors);

	if (stat32)
		global_error(0, stat32, &error_found, handle_errors);

	error32 = (info->nerr_global >> 18) & 0x3ff;
	stat32 = (info->nerr_global >> 4) & 0x7ff;

	if (error32)
		global_error(1, error32, &error_found, handle_errors);

	if (stat32)
		global_error(0, stat32, &error_found, handle_errors);

	e752x_check_hub_interface(info, &error_found, handle_errors);
944
	e752x_check_ns_interface(info, &error_found, handle_errors);
945 946 947 948 949 950 951 952 953
	e752x_check_sysbus(info, &error_found, handle_errors);
	e752x_check_membuf(info, &error_found, handle_errors);
	e752x_check_dram(mci, info, &error_found, handle_errors);
	return error_found;
}

static void e752x_check(struct mem_ctl_info *mci)
{
	struct e752x_error_info info;
D
Dave Peterson 已提交
954

D
Dave Peterson 已提交
955
	debugf3("%s()\n", __func__);
956 957 958 959
	e752x_get_error_info(mci, &info);
	e752x_process_error_info(mci, &info, 1);
}

960
/* Program byte/sec bandwidth scrub rate to hardware */
961
static int set_sdram_scrub_rate(struct mem_ctl_info *mci, u32 new_bw)
962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977
{
	const struct scrubrate *scrubrates;
	struct e752x_pvt *pvt = (struct e752x_pvt *) mci->pvt_info;
	struct pci_dev *pdev = pvt->dev_d0f0;
	int i;

	if (pvt->dev_info->ctl_dev == PCI_DEVICE_ID_INTEL_3100_0)
		scrubrates = scrubrates_i3100;
	else
		scrubrates = scrubrates_e752x;

	/* Translate the desired scrub rate to a e752x/3100 register value.
	 * Search for the bandwidth that is equal or greater than the
	 * desired rate and program the cooresponding register value.
	 */
	for (i = 0; scrubrates[i].bandwidth != SDRATE_EOT; i++)
978
		if (scrubrates[i].bandwidth >= new_bw)
979 980 981 982 983 984 985
			break;

	if (scrubrates[i].bandwidth == SDRATE_EOT)
		return -1;

	pci_write_config_word(pdev, E752X_MCHSCRB, scrubrates[i].scrubval);

986
	return scrubrates[i].bandwidth;
987 988 989
}

/* Convert current scrub rate value into byte/sec bandwidth */
990
static int get_sdram_scrub_rate(struct mem_ctl_info *mci)
991 992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015
{
	const struct scrubrate *scrubrates;
	struct e752x_pvt *pvt = (struct e752x_pvt *) mci->pvt_info;
	struct pci_dev *pdev = pvt->dev_d0f0;
	u16 scrubval;
	int i;

	if (pvt->dev_info->ctl_dev == PCI_DEVICE_ID_INTEL_3100_0)
		scrubrates = scrubrates_i3100;
	else
		scrubrates = scrubrates_e752x;

	/* Find the bandwidth matching the memory scrubber configuration */
	pci_read_config_word(pdev, E752X_MCHSCRB, &scrubval);
	scrubval = scrubval & 0x0f;

	for (i = 0; scrubrates[i].bandwidth != SDRATE_EOT; i++)
		if (scrubrates[i].scrubval == scrubval)
			break;

	if (scrubrates[i].bandwidth == SDRATE_EOT) {
		e752x_printk(KERN_WARNING,
			"Invalid sdram scrub control value: 0x%x\n", scrubval);
		return -1;
	}
1016
	return scrubrates[i].bandwidth;
1017 1018 1019

}

1020 1021 1022 1023 1024 1025
/* Return 1 if dual channel mode is active.  Else return 0. */
static inline int dual_channel_active(u16 ddrcsr)
{
	return (((ddrcsr >> 12) & 3) == 3);
}

1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037
/* Remap csrow index numbers if map_type is "reverse"
 */
static inline int remap_csrow_index(struct mem_ctl_info *mci, int index)
{
	struct e752x_pvt *pvt = mci->pvt_info;

	if (!pvt->map_type)
		return (7 - index);

	return (index);
}

1038
static void e752x_init_csrows(struct mem_ctl_info *mci, struct pci_dev *pdev,
1039
			u16 ddrcsr)
1040 1041 1042 1043
{
	struct csrow_info *csrow;
	unsigned long last_cumul_size;
	int index, mem_dev, drc_chan;
D
Dave Jiang 已提交
1044 1045
	int drc_drbg;		/* DRB granularity 0=64mb, 1=128mb */
	int drc_ddim;		/* DRAM Data Integrity Mode 0=none, 2=edac */
1046 1047 1048
	u8 value;
	u32 dra, drc, cumul_size;

1049
	dra = 0;
D
Dave Jiang 已提交
1050
	for (index = 0; index < 4; index++) {
1051
		u8 dra_reg;
D
Dave Jiang 已提交
1052
		pci_read_config_byte(pdev, E752X_DRA + index, &dra_reg);
1053 1054
		dra |= dra_reg << (index * 8);
	}
1055 1056
	pci_read_config_dword(pdev, E752X_DRC, &drc);
	drc_chan = dual_channel_active(ddrcsr);
D
Dave Jiang 已提交
1057
	drc_drbg = drc_chan + 1;	/* 128 in dual mode, 64 in single */
1058 1059 1060 1061 1062 1063 1064 1065 1066 1067
	drc_ddim = (drc >> 20) & 0x3;

	/* The dram row boundary (DRB) reg values are boundary address for
	 * each DRAM row with a granularity of 64 or 128MB (single/dual
	 * channel operation).  DRB regs are cumulative; therefore DRB7 will
	 * contain the total memory contained in all eight rows.
	 */
	for (last_cumul_size = index = 0; index < mci->nr_csrows; index++) {
		/* mem_dev 0=x8, 1=x4 */
		mem_dev = (dra >> (index * 4 + 2)) & 0x3;
1068
		csrow = &mci->csrows[remap_csrow_index(mci, index)];
1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 1102 1103 1104

		mem_dev = (mem_dev == 2);
		pci_read_config_byte(pdev, E752X_DRB + index, &value);
		/* convert a 128 or 64 MiB DRB to a page size. */
		cumul_size = value << (25 + drc_drbg - PAGE_SHIFT);
		debugf3("%s(): (%d) cumul_size 0x%x\n", __func__, index,
			cumul_size);
		if (cumul_size == last_cumul_size)
			continue;	/* not populated */

		csrow->first_page = last_cumul_size;
		csrow->last_page = cumul_size - 1;
		csrow->nr_pages = cumul_size - last_cumul_size;
		last_cumul_size = cumul_size;
		csrow->grain = 1 << 12;	/* 4KiB - resolution of CELOG */
		csrow->mtype = MEM_RDDR;	/* only one type supported */
		csrow->dtype = mem_dev ? DEV_X4 : DEV_X8;

		/*
		 * if single channel or x8 devices then SECDED
		 * if dual channel and x4 then S4ECD4ED
		 */
		if (drc_ddim) {
			if (drc_chan && mem_dev) {
				csrow->edac_mode = EDAC_S4ECD4ED;
				mci->edac_cap |= EDAC_FLAG_S4ECD4ED;
			} else {
				csrow->edac_mode = EDAC_SECDED;
				mci->edac_cap |= EDAC_FLAG_SECDED;
			}
		} else
			csrow->edac_mode = EDAC_NONE;
	}
}

static void e752x_init_mem_map_table(struct pci_dev *pdev,
1105
				struct e752x_pvt *pvt)
1106 1107
{
	int index;
1108
	u8 value, last, row;
1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119

	last = 0;
	row = 0;

	for (index = 0; index < 8; index += 2) {
		pci_read_config_byte(pdev, E752X_DRB + index, &value);
		/* test if there is a dimm in this slot */
		if (value == last) {
			/* no dimm in the slot, so flag it as empty */
			pvt->map[index] = 0xff;
			pvt->map[index + 1] = 0xff;
D
Dave Jiang 已提交
1120
		} else {	/* there is a dimm in the slot */
1121 1122 1123 1124 1125 1126 1127
			pvt->map[index] = row;
			row++;
			last = value;
			/* test the next value to see if the dimm is double
			 * sided
			 */
			pci_read_config_byte(pdev, E752X_DRB + index + 1,
1128 1129 1130 1131 1132
					&value);

			/* the dimm is single sided, so flag as empty */
			/* this is a double sided dimm to save the next row #*/
			pvt->map[index + 1] = (value == last) ? 0xff :	row;
1133 1134 1135 1136 1137 1138 1139 1140
			row++;
			last = value;
		}
	}
}

/* Return 0 on success or 1 on failure. */
static int e752x_get_devs(struct pci_dev *pdev, int dev_idx,
1141
			struct e752x_pvt *pvt)
1142 1143 1144 1145
{
	struct pci_dev *dev;

	pvt->bridge_ck = pci_get_device(PCI_VENDOR_ID_INTEL,
1146
				pvt->dev_info->err_dev, pvt->bridge_ck);
1147 1148 1149 1150 1151 1152 1153

	if (pvt->bridge_ck == NULL)
		pvt->bridge_ck = pci_scan_single_device(pdev->bus,
							PCI_DEVFN(0, 1));

	if (pvt->bridge_ck == NULL) {
		e752x_printk(KERN_ERR, "error reporting device not found:"
1154 1155
			"vendor %x device 0x%x (broken BIOS?)\n",
			PCI_VENDOR_ID_INTEL, e752x_devs[dev_idx].err_dev);
1156 1157 1158
		return 1;
	}

1159 1160 1161
	dev = pci_get_device(PCI_VENDOR_ID_INTEL,
				e752x_devs[dev_idx].ctl_dev,
				NULL);
1162 1163 1164 1165 1166 1167 1168 1169 1170

	if (dev == NULL)
		goto fail;

	pvt->dev_d0f0 = dev;
	pvt->dev_d0f1 = pci_dev_get(pvt->bridge_ck);

	return 0;

1171
fail:
1172 1173 1174 1175
	pci_dev_put(pvt->bridge_ck);
	return 1;
}

1176 1177
/* Setup system bus parity mask register.
 * Sysbus parity supported on:
K
Konstantin Olifer 已提交
1178
 * e7320/e7520/e7525 + Xeon
1179 1180 1181 1182 1183 1184 1185
 */
static void e752x_init_sysbus_parity_mask(struct e752x_pvt *pvt)
{
	char *cpu_id = cpu_data(0).x86_model_id;
	struct pci_dev *dev = pvt->dev_d0f1;
	int enable = 1;

1186
	/* Allow module parameter override, else see if CPU supports parity */
1187 1188
	if (sysbus_parity != -1) {
		enable = sysbus_parity;
K
Konstantin Olifer 已提交
1189
	} else if (cpu_id[0] && !strstr(cpu_id, "Xeon")) {
1190 1191 1192 1193 1194 1195 1196 1197 1198 1199 1200
		e752x_printk(KERN_INFO, "System Bus Parity not "
			     "supported by CPU, disabling\n");
		enable = 0;
	}

	if (enable)
		pci_write_config_word(dev, E752X_SYSBUS_ERRMASK, 0x0000);
	else
		pci_write_config_word(dev, E752X_SYSBUS_ERRMASK, 0x0309);
}

1201 1202 1203 1204 1205 1206
static void e752x_init_error_reporting_regs(struct e752x_pvt *pvt)
{
	struct pci_dev *dev;

	dev = pvt->dev_d0f1;
	/* Turn off error disable & SMI in case the BIOS turned it on */
1207 1208 1209 1210 1211 1212 1213
	if (pvt->dev_info->err_dev == PCI_DEVICE_ID_INTEL_3100_1_ERR) {
		pci_write_config_dword(dev, I3100_NSI_EMASK, 0);
		pci_write_config_dword(dev, I3100_NSI_SMICMD, 0);
	} else {
		pci_write_config_byte(dev, E752X_HI_ERRMASK, 0x00);
		pci_write_config_byte(dev, E752X_HI_SMICMD, 0x00);
	}
1214 1215 1216

	e752x_init_sysbus_parity_mask(pvt);

1217 1218 1219 1220 1221 1222 1223 1224 1225
	pci_write_config_word(dev, E752X_SYSBUS_SMICMD, 0x00);
	pci_write_config_byte(dev, E752X_BUF_ERRMASK, 0x00);
	pci_write_config_byte(dev, E752X_BUF_SMICMD, 0x00);
	pci_write_config_byte(dev, E752X_DRAM_ERRMASK, 0x00);
	pci_write_config_byte(dev, E752X_DRAM_SMICMD, 0x00);
}

static int e752x_probe1(struct pci_dev *pdev, int dev_idx)
{
D
Dave Peterson 已提交
1226
	u16 pci_data;
1227
	u8 stat8;
1228 1229
	struct mem_ctl_info *mci;
	struct e752x_pvt *pvt;
1230
	u16 ddrcsr;
D
Dave Jiang 已提交
1231
	int drc_chan;		/* Number of channels 0=1chan,1=2chan */
1232
	struct e752x_error_info discard;
1233

D
Dave Peterson 已提交
1234
	debugf0("%s(): mci\n", __func__);
1235 1236
	debugf0("Starting Probe1\n");

M
mark gross 已提交
1237 1238 1239 1240
	/* check to see if device 0 function 1 is enabled; if it isn't, we
	 * assume the BIOS has reserved it for a reason and is expecting
	 * exclusive access, we take care not to violate that assumption and
	 * fail the probe. */
1241
	pci_read_config_byte(pdev, E752X_DEVPRES1, &stat8);
M
mark gross 已提交
1242 1243
	if (!force_function_unhide && !(stat8 & (1 << 5))) {
		printk(KERN_INFO "Contact your BIOS vendor to see if the "
1244
			"E752x error registers can be safely un-hidden\n");
1245
		return -ENODEV;
M
mark gross 已提交
1246
	}
1247 1248 1249 1250 1251 1252
	stat8 |= (1 << 5);
	pci_write_config_byte(pdev, E752X_DEVPRES1, stat8);

	pci_read_config_word(pdev, E752X_DDRCSR, &ddrcsr);
	/* FIXME: should check >>12 or 0xf, true for all? */
	/* Dual channel = 1, Single channel = 0 */
1253
	drc_chan = dual_channel_active(ddrcsr);
1254

1255
	mci = edac_mc_alloc(sizeof(*pvt), E752X_NR_CSROWS, drc_chan + 1, 0);
1256 1257

	if (mci == NULL) {
1258
		return -ENOMEM;
1259 1260
	}

D
Dave Peterson 已提交
1261
	debugf3("%s(): init mci\n", __func__);
1262
	mci->mtype_cap = MEM_FLAG_RDDR;
1263 1264 1265
	/* 3100 IMCH supports SECDEC only */
	mci->edac_ctl_cap = (dev_idx == I3100) ? EDAC_FLAG_SECDED :
		(EDAC_FLAG_NONE | EDAC_FLAG_SECDED | EDAC_FLAG_S4ECD4ED);
1266
	/* FIXME - what if different memory types are in different csrows? */
D
Dave Peterson 已提交
1267
	mci->mod_name = EDAC_MOD_STR;
1268 1269
	mci->mod_ver = E752X_REVISION;
	mci->dev = &pdev->dev;
1270

D
Dave Peterson 已提交
1271
	debugf3("%s(): init pvt\n", __func__);
D
Dave Jiang 已提交
1272
	pvt = (struct e752x_pvt *)mci->pvt_info;
1273
	pvt->dev_info = &e752x_devs[dev_idx];
1274
	pvt->mc_symmetric = ((ddrcsr & 0x10) != 0);
D
Dave Peterson 已提交
1275

1276 1277 1278
	if (e752x_get_devs(pdev, dev_idx, pvt)) {
		edac_mc_free(mci);
		return -ENODEV;
1279 1280
	}

D
Dave Peterson 已提交
1281
	debugf3("%s(): more mci init\n", __func__);
1282
	mci->ctl_name = pvt->dev_info->ctl_name;
1283
	mci->dev_name = pci_name(pdev);
1284 1285
	mci->edac_check = e752x_check;
	mci->ctl_page_to_phys = ctl_page_to_phys;
1286 1287
	mci->set_sdram_scrub_rate = set_sdram_scrub_rate;
	mci->get_sdram_scrub_rate = get_sdram_scrub_rate;
1288

1289 1290 1291 1292
	/* set the map type.  1 = normal, 0 = reversed
	 * Must be set before e752x_init_csrows in case csrow mapping
	 * is reversed.
	 */
1293
	pci_read_config_byte(pdev, E752X_DRM, &stat8);
1294 1295
	pvt->map_type = ((stat8 & 0x0f) > ((stat8 >> 4) & 0x0f));

1296 1297 1298
	e752x_init_csrows(mci, pdev, ddrcsr);
	e752x_init_mem_map_table(pdev, pvt);

1299 1300 1301 1302
	if (dev_idx == I3100)
		mci->edac_cap = EDAC_FLAG_SECDED; /* the only mode supported */
	else
		mci->edac_cap |= EDAC_FLAG_NONE;
D
Dave Peterson 已提交
1303
	debugf3("%s(): tolm, remapbase, remaplimit\n", __func__);
D
Dave Peterson 已提交
1304

1305
	/* load the top of low memory, remap base, and remap limit vars */
1306
	pci_read_config_word(pdev, E752X_TOLM, &pci_data);
1307
	pvt->tolm = ((u32) pci_data) << 4;
1308
	pci_read_config_word(pdev, E752X_REMAPBASE, &pci_data);
1309
	pvt->remapbase = ((u32) pci_data) << 14;
1310
	pci_read_config_word(pdev, E752X_REMAPLIMIT, &pci_data);
1311
	pvt->remaplimit = ((u32) pci_data) << 14;
D
Dave Peterson 已提交
1312
	e752x_printk(KERN_INFO,
1313 1314
			"tolm = %x, remapbase = %x, remaplimit = %x\n",
			pvt->tolm, pvt->remapbase, pvt->remaplimit);
1315

1316 1317 1318
	/* Here we assume that we will never see multiple instances of this
	 * type of memory controller.  The ID is therefore hardcoded to 0.
	 */
1319
	if (edac_mc_add_mc(mci)) {
D
Dave Peterson 已提交
1320
		debugf3("%s(): failed edac_mc_add_mc()\n", __func__);
1321 1322 1323
		goto fail;
	}

1324
	e752x_init_error_reporting_regs(pvt);
D
Dave Jiang 已提交
1325
	e752x_get_error_info(mci, &discard);	/* clear other MCH errors */
1326

1327 1328 1329 1330
	/* allocating generic PCI control info */
	e752x_pci = edac_pci_create_generic_ctl(&pdev->dev, EDAC_MOD_STR);
	if (!e752x_pci) {
		printk(KERN_WARNING
1331
			"%s(): Unable to create PCI control\n", __func__);
1332
		printk(KERN_WARNING
1333 1334
			"%s(): PCI error report via EDAC not setup\n",
			__func__);
1335 1336
	}

1337
	/* get this far and it's successful */
D
Dave Peterson 已提交
1338
	debugf3("%s(): success\n", __func__);
1339 1340
	return 0;

1341
fail:
1342 1343 1344 1345
	pci_dev_put(pvt->dev_d0f0);
	pci_dev_put(pvt->dev_d0f1);
	pci_dev_put(pvt->bridge_ck);
	edac_mc_free(mci);
D
Dave Peterson 已提交
1346

1347
	return -ENODEV;
1348 1349 1350 1351
}

/* returns count (>= 0), or negative on error */
static int __devinit e752x_init_one(struct pci_dev *pdev,
1352
				const struct pci_device_id *ent)
1353
{
D
Dave Peterson 已提交
1354
	debugf0("%s()\n", __func__);
1355 1356

	/* wake up and enable device */
D
Dave Jiang 已提交
1357
	if (pci_enable_device(pdev) < 0)
1358
		return -EIO;
D
Dave Peterson 已提交
1359

1360 1361 1362 1363 1364 1365 1366 1367
	return e752x_probe1(pdev, ent->driver_data);
}

static void __devexit e752x_remove_one(struct pci_dev *pdev)
{
	struct mem_ctl_info *mci;
	struct e752x_pvt *pvt;

D
Dave Peterson 已提交
1368
	debugf0("%s()\n", __func__);
1369

1370 1371 1372
	if (e752x_pci)
		edac_pci_release_generic_ctl(e752x_pci);

1373
	if ((mci = edac_mc_del_mc(&pdev->dev)) == NULL)
1374 1375
		return;

D
Dave Jiang 已提交
1376
	pvt = (struct e752x_pvt *)mci->pvt_info;
1377 1378 1379 1380 1381 1382 1383
	pci_dev_put(pvt->dev_d0f0);
	pci_dev_put(pvt->dev_d0f1);
	pci_dev_put(pvt->bridge_ck);
	edac_mc_free(mci);
}

static const struct pci_device_id e752x_pci_tbl[] __devinitdata = {
D
Dave Peterson 已提交
1384
	{
D
Dave Jiang 已提交
1385 1386
	 PCI_VEND_DEV(INTEL, 7520_0), PCI_ANY_ID, PCI_ANY_ID, 0, 0,
	 E7520},
D
Dave Peterson 已提交
1387
	{
D
Dave Jiang 已提交
1388 1389
	 PCI_VEND_DEV(INTEL, 7525_0), PCI_ANY_ID, PCI_ANY_ID, 0, 0,
	 E7525},
D
Dave Peterson 已提交
1390
	{
D
Dave Jiang 已提交
1391 1392
	 PCI_VEND_DEV(INTEL, 7320_0), PCI_ANY_ID, PCI_ANY_ID, 0, 0,
	 E7320},
1393 1394 1395
	{
	 PCI_VEND_DEV(INTEL, 3100_0), PCI_ANY_ID, PCI_ANY_ID, 0, 0,
	 I3100},
D
Dave Peterson 已提交
1396
	{
D
Dave Jiang 已提交
1397 1398
	 0,
	 }			/* 0 terminated list. */
1399 1400 1401 1402 1403
};

MODULE_DEVICE_TABLE(pci, e752x_pci_tbl);

static struct pci_driver e752x_driver = {
D
Dave Peterson 已提交
1404
	.name = EDAC_MOD_STR,
1405 1406 1407
	.probe = e752x_init_one,
	.remove = __devexit_p(e752x_remove_one),
	.id_table = e752x_pci_tbl,
1408 1409
};

A
Alan Cox 已提交
1410
static int __init e752x_init(void)
1411 1412 1413
{
	int pci_rc;

D
Dave Peterson 已提交
1414
	debugf3("%s()\n", __func__);
1415 1416 1417 1418

       /* Ensure that the OPSTATE is set correctly for POLL or NMI */
       opstate_init();

1419 1420 1421 1422 1423 1424
	pci_rc = pci_register_driver(&e752x_driver);
	return (pci_rc < 0) ? pci_rc : 0;
}

static void __exit e752x_exit(void)
{
D
Dave Peterson 已提交
1425
	debugf3("%s()\n", __func__);
1426 1427 1428 1429 1430 1431 1432 1433
	pci_unregister_driver(&e752x_driver);
}

module_init(e752x_init);
module_exit(e752x_exit);

MODULE_LICENSE("GPL");
MODULE_AUTHOR("Linux Networx (http://lnxi.com) Tom Zimmerman\n");
1434
MODULE_DESCRIPTION("MC support for Intel e752x/3100 memory controllers");
M
mark gross 已提交
1435 1436 1437

module_param(force_function_unhide, int, 0444);
MODULE_PARM_DESC(force_function_unhide, "if BIOS sets Dev0:Fun1 up as hidden:"
1438 1439
		 " 1=force unhide and hope BIOS doesn't fight driver for "
		"Dev0:Fun1 access");
1440

D
Dave Jiang 已提交
1441 1442
module_param(edac_op_state, int, 0444);
MODULE_PARM_DESC(edac_op_state, "EDAC Error Reporting state: 0=Poll,1=NMI");
1443 1444 1445 1446

module_param(sysbus_parity, int, 0444);
MODULE_PARM_DESC(sysbus_parity, "0=disable system bus parity checking,"
		" 1=enable system bus parity checking, default=auto-detect");
1447 1448 1449
module_param(report_non_memory_errors, int, 0644);
MODULE_PARM_DESC(report_non_memory_errors, "0=disable non-memory error "
		"reporting, 1=enable non-memory error reporting");