e752x_edac.c 41.2 KB
Newer Older
1 2 3 4 5 6
/*
 * Intel e752x Memory Controller kernel module
 * (C) 2004 Linux Networx (http://lnxi.com)
 * This file may be distributed under the terms of the
 * GNU General Public License.
 *
7
 * Implement support for the e7520, E7525, e7320 and i3100 memory controllers.
8
 *
9
 * Datasheets:
10
 *	http://www.intel.in/content/www/in/en/chipsets/e7525-memory-controller-hub-datasheet.html
11
 *	ftp://download.intel.com/design/intarch/datashts/31345803.pdf
12
 *
13 14 15 16 17 18 19 20 21 22 23 24 25
 * Written by Tom Zimmerman
 *
 * Contributors:
 * 	Thayne Harbaugh at realmsys.com (?)
 * 	Wang Zhenyu at intel.com
 * 	Dave Jiang at mvista.com
 *
 */

#include <linux/module.h>
#include <linux/init.h>
#include <linux/pci.h>
#include <linux/pci_ids.h>
D
Dave Jiang 已提交
26
#include <linux/edac.h>
27
#include "edac_core.h"
28

M
Michal Marek 已提交
29
#define E752X_REVISION	" Ver: 2.0.2"
30
#define EDAC_MOD_STR	"e752x_edac"
31

32
static int report_non_memory_errors;
M
mark gross 已提交
33
static int force_function_unhide;
34
static int sysbus_parity = -1;
M
mark gross 已提交
35

36 37
static struct edac_pci_ctl_info *e752x_pci;

D
Dave Peterson 已提交
38
#define e752x_printk(level, fmt, arg...) \
D
Dave Peterson 已提交
39
	edac_printk(level, "e752x", fmt, ##arg)
D
Dave Peterson 已提交
40 41

#define e752x_mc_printk(mci, level, fmt, arg...) \
D
Dave Peterson 已提交
42
	edac_mc_chipset_printk(mci, level, "e752x", fmt, ##arg)
D
Dave Peterson 已提交
43

44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67
#ifndef PCI_DEVICE_ID_INTEL_7520_0
#define PCI_DEVICE_ID_INTEL_7520_0      0x3590
#endif				/* PCI_DEVICE_ID_INTEL_7520_0      */

#ifndef PCI_DEVICE_ID_INTEL_7520_1_ERR
#define PCI_DEVICE_ID_INTEL_7520_1_ERR  0x3591
#endif				/* PCI_DEVICE_ID_INTEL_7520_1_ERR  */

#ifndef PCI_DEVICE_ID_INTEL_7525_0
#define PCI_DEVICE_ID_INTEL_7525_0      0x359E
#endif				/* PCI_DEVICE_ID_INTEL_7525_0      */

#ifndef PCI_DEVICE_ID_INTEL_7525_1_ERR
#define PCI_DEVICE_ID_INTEL_7525_1_ERR  0x3593
#endif				/* PCI_DEVICE_ID_INTEL_7525_1_ERR  */

#ifndef PCI_DEVICE_ID_INTEL_7320_0
#define PCI_DEVICE_ID_INTEL_7320_0	0x3592
#endif				/* PCI_DEVICE_ID_INTEL_7320_0 */

#ifndef PCI_DEVICE_ID_INTEL_7320_1_ERR
#define PCI_DEVICE_ID_INTEL_7320_1_ERR	0x3593
#endif				/* PCI_DEVICE_ID_INTEL_7320_1_ERR */

68 69 70 71 72 73 74 75
#ifndef PCI_DEVICE_ID_INTEL_3100_0
#define PCI_DEVICE_ID_INTEL_3100_0	0x35B0
#endif				/* PCI_DEVICE_ID_INTEL_3100_0 */

#ifndef PCI_DEVICE_ID_INTEL_3100_1_ERR
#define PCI_DEVICE_ID_INTEL_3100_1_ERR	0x35B1
#endif				/* PCI_DEVICE_ID_INTEL_3100_1_ERR */

76 77 78
#define E752X_NR_CSROWS		8	/* number of csrows */

/* E752X register addresses - device 0 function 0 */
79 80 81 82 83 84 85 86
#define E752X_MCHSCRB		0x52	/* Memory Scrub register (16b) */
					/*
					 * 6:5     Scrub Completion Count
					 * 3:2     Scrub Rate (i3100 only)
					 *      01=fast 10=normal
					 * 1:0     Scrub Mode enable
					 *      00=off 10=on
					 */
87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129
#define E752X_DRB		0x60	/* DRAM row boundary register (8b) */
#define E752X_DRA		0x70	/* DRAM row attribute register (8b) */
					/*
					 * 31:30   Device width row 7
					 *      01=x8 10=x4 11=x8 DDR2
					 * 27:26   Device width row 6
					 * 23:22   Device width row 5
					 * 19:20   Device width row 4
					 * 15:14   Device width row 3
					 * 11:10   Device width row 2
					 *  7:6    Device width row 1
					 *  3:2    Device width row 0
					 */
#define E752X_DRC		0x7C	/* DRAM controller mode reg (32b) */
					/* FIXME:IS THIS RIGHT? */
					/*
					 * 22    Number channels 0=1,1=2
					 * 19:18 DRB Granularity 32/64MB
					 */
#define E752X_DRM		0x80	/* Dimm mapping register */
#define E752X_DDRCSR		0x9A	/* DDR control and status reg (16b) */
					/*
					 * 14:12 1 single A, 2 single B, 3 dual
					 */
#define E752X_TOLM		0xC4	/* DRAM top of low memory reg (16b) */
#define E752X_REMAPBASE		0xC6	/* DRAM remap base address reg (16b) */
#define E752X_REMAPLIMIT	0xC8	/* DRAM remap limit address reg (16b) */
#define E752X_REMAPOFFSET	0xCA	/* DRAM remap limit offset reg (16b) */

/* E752X register addresses - device 0 function 1 */
#define E752X_FERR_GLOBAL	0x40	/* Global first error register (32b) */
#define E752X_NERR_GLOBAL	0x44	/* Global next error register (32b) */
#define E752X_HI_FERR		0x50	/* Hub interface first error reg (8b) */
#define E752X_HI_NERR		0x52	/* Hub interface next error reg (8b) */
#define E752X_HI_ERRMASK	0x54	/* Hub interface error mask reg (8b) */
#define E752X_HI_SMICMD		0x5A	/* Hub interface SMI command reg (8b) */
#define E752X_SYSBUS_FERR	0x60	/* System buss first error reg (16b) */
#define E752X_SYSBUS_NERR	0x62	/* System buss next error reg (16b) */
#define E752X_SYSBUS_ERRMASK	0x64	/* System buss error mask reg (16b) */
#define E752X_SYSBUS_SMICMD	0x6A	/* System buss SMI command reg (16b) */
#define E752X_BUF_FERR		0x70	/* Memory buffer first error reg (8b) */
#define E752X_BUF_NERR		0x72	/* Memory buffer next error reg (8b) */
#define E752X_BUF_ERRMASK	0x74	/* Memory buffer error mask reg (8b) */
130
#define E752X_BUF_SMICMD	0x7A	/* Memory buffer SMI cmd reg (8b) */
131 132 133 134 135 136 137 138 139
#define E752X_DRAM_FERR		0x80	/* DRAM first error register (16b) */
#define E752X_DRAM_NERR		0x82	/* DRAM next error register (16b) */
#define E752X_DRAM_ERRMASK	0x84	/* DRAM error mask register (8b) */
#define E752X_DRAM_SMICMD	0x8A	/* DRAM SMI command register (8b) */
#define E752X_DRAM_RETR_ADD	0xAC	/* DRAM Retry address register (32b) */
#define E752X_DRAM_SEC1_ADD	0xA0	/* DRAM first correctable memory */
					/*     error address register (32b) */
					/*
					 * 31    Reserved
140
					 * 30:2  CE address (64 byte block 34:6
141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159
					 * 1     Reserved
					 * 0     HiLoCS
					 */
#define E752X_DRAM_SEC2_ADD	0xC8	/* DRAM first correctable memory */
					/*     error address register (32b) */
					/*
					 * 31    Reserved
					 * 30:2  CE address (64 byte block 34:6)
					 * 1     Reserved
					 * 0     HiLoCS
					 */
#define E752X_DRAM_DED_ADD	0xA4	/* DRAM first uncorrectable memory */
					/*     error address register (32b) */
					/*
					 * 31    Reserved
					 * 30:2  CE address (64 byte block 34:6)
					 * 1     Reserved
					 * 0     HiLoCS
					 */
160
#define E752X_DRAM_SCRB_ADD	0xA8	/* DRAM 1st uncorrectable scrub mem */
161 162 163
					/*     error address register (32b) */
					/*
					 * 31    Reserved
164
					 * 30:2  CE address (64 byte block 34:6
165 166 167 168 169 170 171 172 173
					 * 1     Reserved
					 * 0     HiLoCS
					 */
#define E752X_DRAM_SEC1_SYNDROME 0xC4	/* DRAM first correctable memory */
					/*     error syndrome register (16b) */
#define E752X_DRAM_SEC2_SYNDROME 0xC6	/* DRAM second correctable memory */
					/*     error syndrome register (16b) */
#define E752X_DEVPRES1		0xF4	/* Device Present 1 register (8b) */

174 175 176 177 178 179
/* 3100 IMCH specific register addresses - device 0 function 1 */
#define I3100_NSI_FERR		0x48	/* NSI first error reg (32b) */
#define I3100_NSI_NERR		0x4C	/* NSI next error reg (32b) */
#define I3100_NSI_SMICMD	0x54	/* NSI SMI command register (32b) */
#define I3100_NSI_EMASK		0x90	/* NSI error mask register (32b) */

180 181 182 183 184 185 186 187
/* ICH5R register addresses - device 30 function 0 */
#define ICH5R_PCI_STAT		0x06	/* PCI status register (16b) */
#define ICH5R_PCI_2ND_STAT	0x1E	/* PCI status secondary reg (16b) */
#define ICH5R_PCI_BRIDGE_CTL	0x3E	/* PCI bridge control register (16b) */

enum e752x_chips {
	E7520 = 0,
	E7525 = 1,
188 189
	E7320 = 2,
	I3100 = 3
190 191
};

192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210
/*
 * Those chips Support single-rank and dual-rank memories only.
 *
 * On e752x chips, the odd rows are present only on dual-rank memories.
 * Dividing the rank by two will provide the dimm#
 *
 * i3100 MC has a different mapping: it supports only 4 ranks.
 *
 * The mapping is (from 1 to n):
 *	slot	   single-ranked	double-ranked
 *	dimm #1 -> rank #4		NA
 *	dimm #2 -> rank #3		NA
 *	dimm #3 -> rank #2		Ranks 2 and 3
 *	dimm #4 -> rank $1		Ranks 1 and 4
 *
 * FIXME: The current mapping for i3100 considers that it supports up to 8
 *	  ranks/chanel, but datasheet says that the MC supports only 4 ranks.
 */

211 212 213 214 215 216 217 218 219 220 221 222 223 224 225
struct e752x_pvt {
	struct pci_dev *bridge_ck;
	struct pci_dev *dev_d0f0;
	struct pci_dev *dev_d0f1;
	u32 tolm;
	u32 remapbase;
	u32 remaplimit;
	int mc_symmetric;
	u8 map[8];
	int map_type;
	const struct e752x_dev_info *dev_info;
};

struct e752x_dev_info {
	u16 err_dev;
D
Dave Peterson 已提交
226
	u16 ctl_dev;
227 228 229 230 231 232
	const char *ctl_name;
};

struct e752x_error_info {
	u32 ferr_global;
	u32 nerr_global;
233 234 235 236
	u32 nsi_ferr;	/* 3100 only */
	u32 nsi_nerr;	/* 3100 only */
	u8 hi_ferr;	/* all but 3100 */
	u8 hi_nerr;	/* all but 3100 */
237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253
	u16 sysbus_ferr;
	u16 sysbus_nerr;
	u8 buf_ferr;
	u8 buf_nerr;
	u16 dram_ferr;
	u16 dram_nerr;
	u32 dram_sec1_add;
	u32 dram_sec2_add;
	u16 dram_sec1_syndrome;
	u16 dram_sec2_syndrome;
	u32 dram_ded_add;
	u32 dram_scrb_add;
	u32 dram_retr_add;
};

static const struct e752x_dev_info e752x_devs[] = {
	[E7520] = {
254 255 256
		.err_dev = PCI_DEVICE_ID_INTEL_7520_1_ERR,
		.ctl_dev = PCI_DEVICE_ID_INTEL_7520_0,
		.ctl_name = "E7520"},
257
	[E7525] = {
258 259 260
		.err_dev = PCI_DEVICE_ID_INTEL_7525_1_ERR,
		.ctl_dev = PCI_DEVICE_ID_INTEL_7525_0,
		.ctl_name = "E7525"},
261
	[E7320] = {
262 263 264
		.err_dev = PCI_DEVICE_ID_INTEL_7320_1_ERR,
		.ctl_dev = PCI_DEVICE_ID_INTEL_7320_0,
		.ctl_name = "E7320"},
265 266 267 268
	[I3100] = {
		.err_dev = PCI_DEVICE_ID_INTEL_3100_1_ERR,
		.ctl_dev = PCI_DEVICE_ID_INTEL_3100_0,
		.ctl_name = "3100"},
269 270
};

271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305
/* Valid scrub rates for the e752x/3100 hardware memory scrubber. We
 * map the scrubbing bandwidth to a hardware register value. The 'set'
 * operation finds the 'matching or higher value'.  Note that scrubbing
 * on the e752x can only be enabled/disabled.  The 3100 supports
 * a normal and fast mode.
 */

#define SDRATE_EOT 0xFFFFFFFF

struct scrubrate {
	u32 bandwidth;	/* bandwidth consumed by scrubbing in bytes/sec */
	u16 scrubval;	/* register value for scrub rate */
};

/* Rate below assumes same performance as i3100 using PC3200 DDR2 in
 * normal mode.  e752x bridges don't support choosing normal or fast mode,
 * so the scrubbing bandwidth value isn't all that important - scrubbing is
 * either on or off.
 */
static const struct scrubrate scrubrates_e752x[] = {
	{0,		0x00},	/* Scrubbing Off */
	{500000,	0x02},	/* Scrubbing On */
	{SDRATE_EOT,	0x00}	/* End of Table */
};

/* Fast mode: 2 GByte PC3200 DDR2 scrubbed in 33s = 63161283 bytes/s
 * Normal mode: 125 (32000 / 256) times slower than fast mode.
 */
static const struct scrubrate scrubrates_i3100[] = {
	{0,		0x00},	/* Scrubbing Off */
	{500000,	0x0a},	/* Normal mode - 32k clocks */
	{62500000,	0x06},	/* Fast mode - 256 clocks */
	{SDRATE_EOT,	0x00}	/* End of Table */
};

306
static unsigned long ctl_page_to_phys(struct mem_ctl_info *mci,
307
				unsigned long page)
308 309
{
	u32 remap;
D
Dave Jiang 已提交
310
	struct e752x_pvt *pvt = (struct e752x_pvt *)mci->pvt_info;
311

D
Dave Peterson 已提交
312
	debugf3("%s()\n", __func__);
313 314 315

	if (page < pvt->tolm)
		return page;
D
Dave Peterson 已提交
316

317 318
	if ((page >= 0x100000) && (page < pvt->remapbase))
		return page;
D
Dave Peterson 已提交
319

320
	remap = (page - pvt->tolm) + pvt->remapbase;
D
Dave Peterson 已提交
321

322 323
	if (remap < pvt->remaplimit)
		return remap;
D
Dave Peterson 已提交
324

D
Dave Peterson 已提交
325
	e752x_printk(KERN_ERR, "Invalid page %lx - out of range\n", page);
326 327 328 329
	return pvt->tolm - 1;
}

static void do_process_ce(struct mem_ctl_info *mci, u16 error_one,
330
			u32 sec1_add, u16 sec1_syndrome)
331 332 333 334 335
{
	u32 page;
	int row;
	int channel;
	int i;
D
Dave Jiang 已提交
336
	struct e752x_pvt *pvt = (struct e752x_pvt *)mci->pvt_info;
337

D
Dave Peterson 已提交
338
	debugf3("%s()\n", __func__);
339 340 341 342 343 344 345 346

	/* convert the addr to 4k page */
	page = sec1_add >> (PAGE_SHIFT - 4);

	/* FIXME - check for -1 */
	if (pvt->mc_symmetric) {
		/* chip select are bits 14 & 13 */
		row = ((page >> 1) & 3);
D
Dave Peterson 已提交
347
		e752x_printk(KERN_WARNING,
348 349 350 351
			"Test row %d Table %d %d %d %d %d %d %d %d\n", row,
			pvt->map[0], pvt->map[1], pvt->map[2], pvt->map[3],
			pvt->map[4], pvt->map[5], pvt->map[6],
			pvt->map[7]);
352 353 354 355 356 357

		/* test for channel remapping */
		for (i = 0; i < 8; i++) {
			if (pvt->map[i] == row)
				break;
		}
D
Dave Peterson 已提交
358

D
Dave Peterson 已提交
359
		e752x_printk(KERN_WARNING, "Test computed row %d\n", i);
D
Dave Peterson 已提交
360

361 362 363
		if (i < 8)
			row = i;
		else
D
Dave Peterson 已提交
364
			e752x_mc_printk(mci, KERN_WARNING,
D
Dave Jiang 已提交
365 366
					"row %d not found in remap table\n",
					row);
367 368
	} else
		row = edac_mc_find_csrow_by_page(mci, page);
D
Dave Peterson 已提交
369

370 371 372
	/* 0 = channel A, 1 = channel B */
	channel = !(error_one & 1);

M
Mike Chan 已提交
373
	/* e752x mc reads 34:6 of the DRAM linear address */
374 375 376 377
	edac_mc_handle_error(HW_EVENT_ERR_CORRECTED, mci,
			     page, offset_in_page(sec1_add << 4), sec1_syndrome,
			     row, channel, -1,
			     "e752x CE", "", NULL);
378 379 380
}

static inline void process_ce(struct mem_ctl_info *mci, u16 error_one,
381 382
			u32 sec1_add, u16 sec1_syndrome, int *error_found,
			int handle_error)
383 384 385 386 387 388 389
{
	*error_found = 1;

	if (handle_error)
		do_process_ce(mci, error_one, sec1_add, sec1_syndrome);
}

D
Dave Peterson 已提交
390
static void do_process_ue(struct mem_ctl_info *mci, u16 error_one,
391
			u32 ded_add, u32 scrb_add)
392 393 394
{
	u32 error_2b, block_page;
	int row;
D
Dave Jiang 已提交
395
	struct e752x_pvt *pvt = (struct e752x_pvt *)mci->pvt_info;
396

D
Dave Peterson 已提交
397
	debugf3("%s()\n", __func__);
398 399 400

	if (error_one & 0x0202) {
		error_2b = ded_add;
D
Dave Peterson 已提交
401

402 403
		/* convert to 4k address */
		block_page = error_2b >> (PAGE_SHIFT - 4);
D
Dave Peterson 已提交
404

405
		row = pvt->mc_symmetric ?
406 407 408
		/* chip select are bits 14 & 13 */
			((block_page >> 1) & 3) :
			edac_mc_find_csrow_by_page(mci, block_page);
D
Dave Peterson 已提交
409

M
Mike Chan 已提交
410
		/* e752x mc reads 34:6 of the DRAM linear address */
411 412 413 414 415 416
		edac_mc_handle_error(HW_EVENT_ERR_UNCORRECTED, mci,
					block_page,
					offset_in_page(error_2b << 4), 0,
					 row, -1, -1,
					"e752x UE from Read", "", NULL);

417 418 419
	}
	if (error_one & 0x0404) {
		error_2b = scrb_add;
D
Dave Peterson 已提交
420

421 422
		/* convert to 4k address */
		block_page = error_2b >> (PAGE_SHIFT - 4);
D
Dave Peterson 已提交
423

424
		row = pvt->mc_symmetric ?
425 426 427
		/* chip select are bits 14 & 13 */
			((block_page >> 1) & 3) :
			edac_mc_find_csrow_by_page(mci, block_page);
D
Dave Peterson 已提交
428

M
Mike Chan 已提交
429
		/* e752x mc reads 34:6 of the DRAM linear address */
430 431 432 433 434
		edac_mc_handle_error(HW_EVENT_ERR_UNCORRECTED, mci,
					block_page,
					offset_in_page(error_2b << 4), 0,
					row, -1, -1,
					"e752x UE from Scruber", "", NULL);
435 436 437 438
	}
}

static inline void process_ue(struct mem_ctl_info *mci, u16 error_one,
439 440
			u32 ded_add, u32 scrb_add, int *error_found,
			int handle_error)
441 442 443 444 445 446 447 448
{
	*error_found = 1;

	if (handle_error)
		do_process_ue(mci, error_one, ded_add, scrb_add);
}

static inline void process_ue_no_info_wr(struct mem_ctl_info *mci,
D
Dave Jiang 已提交
449
					 int *error_found, int handle_error)
450 451 452 453 454 455
{
	*error_found = 1;

	if (!handle_error)
		return;

D
Dave Peterson 已提交
456
	debugf3("%s()\n", __func__);
457 458 459
	edac_mc_handle_error(HW_EVENT_ERR_UNCORRECTED, mci, 0, 0, 0,
			     -1, -1, -1,
			     "e752x UE log memory write", "", NULL);
460 461 462
}

static void do_process_ded_retry(struct mem_ctl_info *mci, u16 error,
D
Dave Jiang 已提交
463
				 u32 retry_add)
464 465 466
{
	u32 error_1b, page;
	int row;
D
Dave Jiang 已提交
467
	struct e752x_pvt *pvt = (struct e752x_pvt *)mci->pvt_info;
468 469

	error_1b = retry_add;
470 471 472 473
	page = error_1b >> (PAGE_SHIFT - 4);  /* convert the addr to 4k page */

	/* chip select are bits 14 & 13 */
	row = pvt->mc_symmetric ? ((page >> 1) & 3) :
474
		edac_mc_find_csrow_by_page(mci, page);
475

D
Dave Peterson 已提交
476
	e752x_mc_printk(mci, KERN_WARNING,
D
Dave Jiang 已提交
477 478
			"CE page 0x%lx, row %d : Memory read retry\n",
			(long unsigned int)page, row);
479 480 481
}

static inline void process_ded_retry(struct mem_ctl_info *mci, u16 error,
482 483
				u32 retry_add, int *error_found,
				int handle_error)
484 485 486 487 488 489 490 491
{
	*error_found = 1;

	if (handle_error)
		do_process_ded_retry(mci, error, retry_add);
}

static inline void process_threshold_ce(struct mem_ctl_info *mci, u16 error,
D
Dave Jiang 已提交
492
					int *error_found, int handle_error)
493 494 495 496
{
	*error_found = 1;

	if (handle_error)
D
Dave Peterson 已提交
497
		e752x_mc_printk(mci, KERN_WARNING, "Memory threshold CE\n");
498 499
}

A
Alan Cox 已提交
500
static char *global_message[11] = {
501 502 503 504 505 506 507 508 509 510 511
	"PCI Express C1",
	"PCI Express C",
	"PCI Express B1",
	"PCI Express B",
	"PCI Express A1",
	"PCI Express A",
	"DMA Controller",
	"HUB or NS Interface",
	"System Bus",
	"DRAM Controller",  /* 9th entry */
	"Internal Buffer"
512 513
};

514 515
#define DRAM_ENTRY	9

A
Alan Cox 已提交
516
static char *fatal_message[2] = { "Non-Fatal ", "Fatal " };
517 518 519 520 521 522

static void do_global_error(int fatal, u32 errors)
{
	int i;

	for (i = 0; i < 11; i++) {
523 524 525 526 527 528 529 530 531 532
		if (errors & (1 << i)) {
			/* If the error is from DRAM Controller OR
			 * we are to report ALL errors, then
			 * report the error
			 */
			if ((i == DRAM_ENTRY) || report_non_memory_errors)
				e752x_printk(KERN_WARNING, "%sError %s\n",
					fatal_message[fatal],
					global_message[i]);
		}
533 534 535 536
	}
}

static inline void global_error(int fatal, u32 errors, int *error_found,
D
Dave Jiang 已提交
537
				int handle_error)
538 539 540 541 542 543 544
{
	*error_found = 1;

	if (handle_error)
		do_global_error(fatal, errors);
}

A
Alan Cox 已提交
545
static char *hub_message[7] = {
546 547 548 549 550 551 552 553 554 555 556 557
	"HI Address or Command Parity", "HI Illegal Access",
	"HI Internal Parity", "Out of Range Access",
	"HI Data Parity", "Enhanced Config Access",
	"Hub Interface Target Abort"
};

static void do_hub_error(int fatal, u8 errors)
{
	int i;

	for (i = 0; i < 7; i++) {
		if (errors & (1 << i))
D
Dave Peterson 已提交
558
			e752x_printk(KERN_WARNING, "%sError %s\n",
559
				fatal_message[fatal], hub_message[i]);
560 561 562 563
	}
}

static inline void hub_error(int fatal, u8 errors, int *error_found,
564
			int handle_error)
565 566 567 568 569 570 571
{
	*error_found = 1;

	if (handle_error)
		do_hub_error(fatal, errors);
}

572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628
#define NSI_FATAL_MASK		0x0c080081
#define NSI_NON_FATAL_MASK	0x23a0ba64
#define NSI_ERR_MASK		(NSI_FATAL_MASK | NSI_NON_FATAL_MASK)

static char *nsi_message[30] = {
	"NSI Link Down",	/* NSI_FERR/NSI_NERR bit 0, fatal error */
	"",						/* reserved */
	"NSI Parity Error",				/* bit 2, non-fatal */
	"",						/* reserved */
	"",						/* reserved */
	"Correctable Error Message",			/* bit 5, non-fatal */
	"Non-Fatal Error Message",			/* bit 6, non-fatal */
	"Fatal Error Message",				/* bit 7, fatal */
	"",						/* reserved */
	"Receiver Error",				/* bit 9, non-fatal */
	"",						/* reserved */
	"Bad TLP",					/* bit 11, non-fatal */
	"Bad DLLP",					/* bit 12, non-fatal */
	"REPLAY_NUM Rollover",				/* bit 13, non-fatal */
	"",						/* reserved */
	"Replay Timer Timeout",				/* bit 15, non-fatal */
	"",						/* reserved */
	"",						/* reserved */
	"",						/* reserved */
	"Data Link Protocol Error",			/* bit 19, fatal */
	"",						/* reserved */
	"Poisoned TLP",					/* bit 21, non-fatal */
	"",						/* reserved */
	"Completion Timeout",				/* bit 23, non-fatal */
	"Completer Abort",				/* bit 24, non-fatal */
	"Unexpected Completion",			/* bit 25, non-fatal */
	"Receiver Overflow",				/* bit 26, fatal */
	"Malformed TLP",				/* bit 27, fatal */
	"",						/* reserved */
	"Unsupported Request"				/* bit 29, non-fatal */
};

static void do_nsi_error(int fatal, u32 errors)
{
	int i;

	for (i = 0; i < 30; i++) {
		if (errors & (1 << i))
			printk(KERN_WARNING "%sError %s\n",
			       fatal_message[fatal], nsi_message[i]);
	}
}

static inline void nsi_error(int fatal, u32 errors, int *error_found,
		int handle_error)
{
	*error_found = 1;

	if (handle_error)
		do_nsi_error(fatal, errors);
}

A
Alan Cox 已提交
629
static char *membuf_message[4] = {
630 631 632 633 634 635 636 637 638 639 640 641
	"Internal PMWB to DRAM parity",
	"Internal PMWB to System Bus Parity",
	"Internal System Bus or IO to PMWB Parity",
	"Internal DRAM to PMWB Parity"
};

static void do_membuf_error(u8 errors)
{
	int i;

	for (i = 0; i < 4; i++) {
		if (errors & (1 << i))
D
Dave Peterson 已提交
642
			e752x_printk(KERN_WARNING, "Non-Fatal Error %s\n",
643
				membuf_message[i]);
644 645 646 647 648 649 650 651 652 653 654
	}
}

static inline void membuf_error(u8 errors, int *error_found, int handle_error)
{
	*error_found = 1;

	if (handle_error)
		do_membuf_error(errors);
}

655
static char *sysbus_message[10] = {
656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672
	"Addr or Request Parity",
	"Data Strobe Glitch",
	"Addr Strobe Glitch",
	"Data Parity",
	"Addr Above TOM",
	"Non DRAM Lock Error",
	"MCERR", "BINIT",
	"Memory Parity",
	"IO Subsystem Parity"
};

static void do_sysbus_error(int fatal, u32 errors)
{
	int i;

	for (i = 0; i < 10; i++) {
		if (errors & (1 << i))
D
Dave Peterson 已提交
673
			e752x_printk(KERN_WARNING, "%sError System Bus %s\n",
674
				fatal_message[fatal], sysbus_message[i]);
675 676 677 678
	}
}

static inline void sysbus_error(int fatal, u32 errors, int *error_found,
D
Dave Jiang 已提交
679
				int handle_error)
680 681 682 683 684 685 686
{
	*error_found = 1;

	if (handle_error)
		do_sysbus_error(fatal, errors);
}

D
Dave Peterson 已提交
687
static void e752x_check_hub_interface(struct e752x_error_info *info,
688
				int *error_found, int handle_error)
689 690 691 692
{
	u8 stat8;

	//pci_read_config_byte(dev,E752X_HI_FERR,&stat8);
D
Dave Peterson 已提交
693

694
	stat8 = info->hi_ferr;
D
Dave Peterson 已提交
695

D
Dave Jiang 已提交
696
	if (stat8 & 0x7f) {	/* Error, so process */
697
		stat8 &= 0x7f;
D
Dave Peterson 已提交
698

D
Dave Jiang 已提交
699
		if (stat8 & 0x2b)
700
			hub_error(1, stat8 & 0x2b, error_found, handle_error);
D
Dave Peterson 已提交
701

D
Dave Jiang 已提交
702
		if (stat8 & 0x54)
703 704 705
			hub_error(0, stat8 & 0x54, error_found, handle_error);
	}
	//pci_read_config_byte(dev,E752X_HI_NERR,&stat8);
D
Dave Peterson 已提交
706

707
	stat8 = info->hi_nerr;
D
Dave Peterson 已提交
708

D
Dave Jiang 已提交
709
	if (stat8 & 0x7f) {	/* Error, so process */
710
		stat8 &= 0x7f;
D
Dave Peterson 已提交
711

712 713
		if (stat8 & 0x2b)
			hub_error(1, stat8 & 0x2b, error_found, handle_error);
D
Dave Peterson 已提交
714

D
Dave Jiang 已提交
715
		if (stat8 & 0x54)
716 717 718 719
			hub_error(0, stat8 & 0x54, error_found, handle_error);
	}
}

720 721 722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743 744
static void e752x_check_ns_interface(struct e752x_error_info *info,
				int *error_found, int handle_error)
{
	u32 stat32;

	stat32 = info->nsi_ferr;
	if (stat32 & NSI_ERR_MASK) { /* Error, so process */
		if (stat32 & NSI_FATAL_MASK)	/* check for fatal errors */
			nsi_error(1, stat32 & NSI_FATAL_MASK, error_found,
				  handle_error);
		if (stat32 & NSI_NON_FATAL_MASK) /* check for non-fatal ones */
			nsi_error(0, stat32 & NSI_NON_FATAL_MASK, error_found,
				  handle_error);
	}
	stat32 = info->nsi_nerr;
	if (stat32 & NSI_ERR_MASK) {
		if (stat32 & NSI_FATAL_MASK)
			nsi_error(1, stat32 & NSI_FATAL_MASK, error_found,
				  handle_error);
		if (stat32 & NSI_NON_FATAL_MASK)
			nsi_error(0, stat32 & NSI_NON_FATAL_MASK, error_found,
				  handle_error);
	}
}

D
Dave Peterson 已提交
745
static void e752x_check_sysbus(struct e752x_error_info *info,
746
			int *error_found, int handle_error)
747 748 749 750 751 752 753
{
	u32 stat32, error32;

	//pci_read_config_dword(dev,E752X_SYSBUS_FERR,&stat32);
	stat32 = info->sysbus_ferr + (info->sysbus_nerr << 16);

	if (stat32 == 0)
D
Dave Jiang 已提交
754
		return;		/* no errors */
755 756 757

	error32 = (stat32 >> 16) & 0x3ff;
	stat32 = stat32 & 0x3ff;
D
Dave Peterson 已提交
758

D
Dave Jiang 已提交
759
	if (stat32 & 0x087)
760
		sysbus_error(1, stat32 & 0x087, error_found, handle_error);
D
Dave Peterson 已提交
761

D
Dave Jiang 已提交
762
	if (stat32 & 0x378)
763
		sysbus_error(0, stat32 & 0x378, error_found, handle_error);
D
Dave Peterson 已提交
764

D
Dave Jiang 已提交
765
	if (error32 & 0x087)
766
		sysbus_error(1, error32 & 0x087, error_found, handle_error);
D
Dave Peterson 已提交
767

D
Dave Jiang 已提交
768
	if (error32 & 0x378)
769
		sysbus_error(0, error32 & 0x378, error_found, handle_error);
770 771
}

D
Dave Jiang 已提交
772
static void e752x_check_membuf(struct e752x_error_info *info,
773
			int *error_found, int handle_error)
774 775 776 777
{
	u8 stat8;

	stat8 = info->buf_ferr;
D
Dave Peterson 已提交
778

D
Dave Jiang 已提交
779
	if (stat8 & 0x0f) {	/* Error, so process */
780 781 782
		stat8 &= 0x0f;
		membuf_error(stat8, error_found, handle_error);
	}
D
Dave Peterson 已提交
783

784
	stat8 = info->buf_nerr;
D
Dave Peterson 已提交
785

D
Dave Jiang 已提交
786
	if (stat8 & 0x0f) {	/* Error, so process */
787 788 789 790 791
		stat8 &= 0x0f;
		membuf_error(stat8, error_found, handle_error);
	}
}

D
Dave Jiang 已提交
792
static void e752x_check_dram(struct mem_ctl_info *mci,
793 794
			struct e752x_error_info *info, int *error_found,
			int handle_error)
795 796 797 798 799 800 801
{
	u16 error_one, error_next;

	error_one = info->dram_ferr;
	error_next = info->dram_nerr;

	/* decode and report errors */
D
Dave Jiang 已提交
802
	if (error_one & 0x0101)	/* check first error correctable */
803
		process_ce(mci, error_one, info->dram_sec1_add,
804
			info->dram_sec1_syndrome, error_found, handle_error);
805

D
Dave Jiang 已提交
806
	if (error_next & 0x0101)	/* check next error correctable */
807
		process_ce(mci, error_next, info->dram_sec2_add,
808
			info->dram_sec2_syndrome, error_found, handle_error);
809

D
Dave Jiang 已提交
810
	if (error_one & 0x4040)
811 812
		process_ue_no_info_wr(mci, error_found, handle_error);

D
Dave Jiang 已提交
813
	if (error_next & 0x4040)
814 815
		process_ue_no_info_wr(mci, error_found, handle_error);

D
Dave Jiang 已提交
816
	if (error_one & 0x2020)
817
		process_ded_retry(mci, error_one, info->dram_retr_add,
818
				error_found, handle_error);
819

D
Dave Jiang 已提交
820
	if (error_next & 0x2020)
821
		process_ded_retry(mci, error_next, info->dram_retr_add,
822
				error_found, handle_error);
823

D
Dave Jiang 已提交
824 825
	if (error_one & 0x0808)
		process_threshold_ce(mci, error_one, error_found, handle_error);
826

D
Dave Jiang 已提交
827
	if (error_next & 0x0808)
828
		process_threshold_ce(mci, error_next, error_found,
829
				handle_error);
830

D
Dave Jiang 已提交
831
	if (error_one & 0x0606)
832
		process_ue(mci, error_one, info->dram_ded_add,
833
			info->dram_scrb_add, error_found, handle_error);
834

D
Dave Jiang 已提交
835
	if (error_next & 0x0606)
836
		process_ue(mci, error_next, info->dram_ded_add,
837
			info->dram_scrb_add, error_found, handle_error);
838 839
}

D
Dave Jiang 已提交
840 841
static void e752x_get_error_info(struct mem_ctl_info *mci,
				 struct e752x_error_info *info)
842 843 844 845 846
{
	struct pci_dev *dev;
	struct e752x_pvt *pvt;

	memset(info, 0, sizeof(*info));
D
Dave Jiang 已提交
847
	pvt = (struct e752x_pvt *)mci->pvt_info;
848 849 850 851
	dev = pvt->dev_d0f1;
	pci_read_config_dword(dev, E752X_FERR_GLOBAL, &info->ferr_global);

	if (info->ferr_global) {
852 853 854 855 856 857 858 859 860
		if (pvt->dev_info->err_dev == PCI_DEVICE_ID_INTEL_3100_1_ERR) {
			pci_read_config_dword(dev, I3100_NSI_FERR,
					     &info->nsi_ferr);
			info->hi_ferr = 0;
		} else {
			pci_read_config_byte(dev, E752X_HI_FERR,
					     &info->hi_ferr);
			info->nsi_ferr = 0;
		}
861
		pci_read_config_word(dev, E752X_SYSBUS_FERR,
862
				&info->sysbus_ferr);
863
		pci_read_config_byte(dev, E752X_BUF_FERR, &info->buf_ferr);
D
Dave Jiang 已提交
864
		pci_read_config_word(dev, E752X_DRAM_FERR, &info->dram_ferr);
865
		pci_read_config_dword(dev, E752X_DRAM_SEC1_ADD,
866
				&info->dram_sec1_add);
867
		pci_read_config_word(dev, E752X_DRAM_SEC1_SYNDROME,
868
				&info->dram_sec1_syndrome);
869
		pci_read_config_dword(dev, E752X_DRAM_DED_ADD,
870
				&info->dram_ded_add);
871
		pci_read_config_dword(dev, E752X_DRAM_SCRB_ADD,
872
				&info->dram_scrb_add);
873
		pci_read_config_dword(dev, E752X_DRAM_RETR_ADD,
874
				&info->dram_retr_add);
875

876
		/* ignore the reserved bits just in case */
877 878
		if (info->hi_ferr & 0x7f)
			pci_write_config_byte(dev, E752X_HI_FERR,
879
					info->hi_ferr);
880

881 882 883 884
		if (info->nsi_ferr & NSI_ERR_MASK)
			pci_write_config_dword(dev, I3100_NSI_FERR,
					info->nsi_ferr);

885 886
		if (info->sysbus_ferr)
			pci_write_config_word(dev, E752X_SYSBUS_FERR,
887
					info->sysbus_ferr);
888 889 890

		if (info->buf_ferr & 0x0f)
			pci_write_config_byte(dev, E752X_BUF_FERR,
891
					info->buf_ferr);
892 893 894

		if (info->dram_ferr)
			pci_write_bits16(pvt->bridge_ck, E752X_DRAM_FERR,
D
Dave Jiang 已提交
895
					 info->dram_ferr, info->dram_ferr);
896 897

		pci_write_config_dword(dev, E752X_FERR_GLOBAL,
898
				info->ferr_global);
899 900 901 902 903
	}

	pci_read_config_dword(dev, E752X_NERR_GLOBAL, &info->nerr_global);

	if (info->nerr_global) {
904 905 906 907 908 909 910 911 912
		if (pvt->dev_info->err_dev == PCI_DEVICE_ID_INTEL_3100_1_ERR) {
			pci_read_config_dword(dev, I3100_NSI_NERR,
					     &info->nsi_nerr);
			info->hi_nerr = 0;
		} else {
			pci_read_config_byte(dev, E752X_HI_NERR,
					     &info->hi_nerr);
			info->nsi_nerr = 0;
		}
913
		pci_read_config_word(dev, E752X_SYSBUS_NERR,
914
				&info->sysbus_nerr);
915
		pci_read_config_byte(dev, E752X_BUF_NERR, &info->buf_nerr);
D
Dave Jiang 已提交
916
		pci_read_config_word(dev, E752X_DRAM_NERR, &info->dram_nerr);
917
		pci_read_config_dword(dev, E752X_DRAM_SEC2_ADD,
918
				&info->dram_sec2_add);
919
		pci_read_config_word(dev, E752X_DRAM_SEC2_SYNDROME,
920
				&info->dram_sec2_syndrome);
921 922 923

		if (info->hi_nerr & 0x7f)
			pci_write_config_byte(dev, E752X_HI_NERR,
924
					info->hi_nerr);
925

926 927 928 929
		if (info->nsi_nerr & NSI_ERR_MASK)
			pci_write_config_dword(dev, I3100_NSI_NERR,
					info->nsi_nerr);

930 931
		if (info->sysbus_nerr)
			pci_write_config_word(dev, E752X_SYSBUS_NERR,
932
					info->sysbus_nerr);
933 934 935

		if (info->buf_nerr & 0x0f)
			pci_write_config_byte(dev, E752X_BUF_NERR,
936
					info->buf_nerr);
937 938 939

		if (info->dram_nerr)
			pci_write_bits16(pvt->bridge_ck, E752X_DRAM_NERR,
D
Dave Jiang 已提交
940
					 info->dram_nerr, info->dram_nerr);
941 942

		pci_write_config_dword(dev, E752X_NERR_GLOBAL,
943
				info->nerr_global);
944 945 946
	}
}

D
Dave Jiang 已提交
947
static int e752x_process_error_info(struct mem_ctl_info *mci,
948 949
				struct e752x_error_info *info,
				int handle_errors)
950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973
{
	u32 error32, stat32;
	int error_found;

	error_found = 0;
	error32 = (info->ferr_global >> 18) & 0x3ff;
	stat32 = (info->ferr_global >> 4) & 0x7ff;

	if (error32)
		global_error(1, error32, &error_found, handle_errors);

	if (stat32)
		global_error(0, stat32, &error_found, handle_errors);

	error32 = (info->nerr_global >> 18) & 0x3ff;
	stat32 = (info->nerr_global >> 4) & 0x7ff;

	if (error32)
		global_error(1, error32, &error_found, handle_errors);

	if (stat32)
		global_error(0, stat32, &error_found, handle_errors);

	e752x_check_hub_interface(info, &error_found, handle_errors);
974
	e752x_check_ns_interface(info, &error_found, handle_errors);
975 976 977 978 979 980 981 982 983
	e752x_check_sysbus(info, &error_found, handle_errors);
	e752x_check_membuf(info, &error_found, handle_errors);
	e752x_check_dram(mci, info, &error_found, handle_errors);
	return error_found;
}

static void e752x_check(struct mem_ctl_info *mci)
{
	struct e752x_error_info info;
D
Dave Peterson 已提交
984

D
Dave Peterson 已提交
985
	debugf3("%s()\n", __func__);
986 987 988 989
	e752x_get_error_info(mci, &info);
	e752x_process_error_info(mci, &info, 1);
}

990
/* Program byte/sec bandwidth scrub rate to hardware */
991
static int set_sdram_scrub_rate(struct mem_ctl_info *mci, u32 new_bw)
992 993 994 995 996 997 998 999 1000 1001 1002 1003 1004 1005 1006 1007
{
	const struct scrubrate *scrubrates;
	struct e752x_pvt *pvt = (struct e752x_pvt *) mci->pvt_info;
	struct pci_dev *pdev = pvt->dev_d0f0;
	int i;

	if (pvt->dev_info->ctl_dev == PCI_DEVICE_ID_INTEL_3100_0)
		scrubrates = scrubrates_i3100;
	else
		scrubrates = scrubrates_e752x;

	/* Translate the desired scrub rate to a e752x/3100 register value.
	 * Search for the bandwidth that is equal or greater than the
	 * desired rate and program the cooresponding register value.
	 */
	for (i = 0; scrubrates[i].bandwidth != SDRATE_EOT; i++)
1008
		if (scrubrates[i].bandwidth >= new_bw)
1009 1010 1011 1012 1013 1014 1015
			break;

	if (scrubrates[i].bandwidth == SDRATE_EOT)
		return -1;

	pci_write_config_word(pdev, E752X_MCHSCRB, scrubrates[i].scrubval);

1016
	return scrubrates[i].bandwidth;
1017 1018 1019
}

/* Convert current scrub rate value into byte/sec bandwidth */
1020
static int get_sdram_scrub_rate(struct mem_ctl_info *mci)
1021 1022 1023 1024 1025 1026 1027 1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043 1044 1045
{
	const struct scrubrate *scrubrates;
	struct e752x_pvt *pvt = (struct e752x_pvt *) mci->pvt_info;
	struct pci_dev *pdev = pvt->dev_d0f0;
	u16 scrubval;
	int i;

	if (pvt->dev_info->ctl_dev == PCI_DEVICE_ID_INTEL_3100_0)
		scrubrates = scrubrates_i3100;
	else
		scrubrates = scrubrates_e752x;

	/* Find the bandwidth matching the memory scrubber configuration */
	pci_read_config_word(pdev, E752X_MCHSCRB, &scrubval);
	scrubval = scrubval & 0x0f;

	for (i = 0; scrubrates[i].bandwidth != SDRATE_EOT; i++)
		if (scrubrates[i].scrubval == scrubval)
			break;

	if (scrubrates[i].bandwidth == SDRATE_EOT) {
		e752x_printk(KERN_WARNING,
			"Invalid sdram scrub control value: 0x%x\n", scrubval);
		return -1;
	}
1046
	return scrubrates[i].bandwidth;
1047 1048 1049

}

1050 1051 1052 1053 1054 1055
/* Return 1 if dual channel mode is active.  Else return 0. */
static inline int dual_channel_active(u16 ddrcsr)
{
	return (((ddrcsr >> 12) & 3) == 3);
}

1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066 1067
/* Remap csrow index numbers if map_type is "reverse"
 */
static inline int remap_csrow_index(struct mem_ctl_info *mci, int index)
{
	struct e752x_pvt *pvt = mci->pvt_info;

	if (!pvt->map_type)
		return (7 - index);

	return (index);
}

1068
static void e752x_init_csrows(struct mem_ctl_info *mci, struct pci_dev *pdev,
1069
			u16 ddrcsr)
1070 1071
{
	struct csrow_info *csrow;
1072
	enum edac_type edac_mode;
1073 1074
	unsigned long last_cumul_size;
	int index, mem_dev, drc_chan;
D
Dave Jiang 已提交
1075 1076
	int drc_drbg;		/* DRB granularity 0=64mb, 1=128mb */
	int drc_ddim;		/* DRAM Data Integrity Mode 0=none, 2=edac */
1077
	u8 value;
1078
	u32 dra, drc, cumul_size, i, nr_pages;
1079

1080
	dra = 0;
D
Dave Jiang 已提交
1081
	for (index = 0; index < 4; index++) {
1082
		u8 dra_reg;
D
Dave Jiang 已提交
1083
		pci_read_config_byte(pdev, E752X_DRA + index, &dra_reg);
1084 1085
		dra |= dra_reg << (index * 8);
	}
1086
	pci_read_config_dword(pdev, E752X_DRC, &drc);
1087
	drc_chan = dual_channel_active(ddrcsr) ? 1 : 0;
D
Dave Jiang 已提交
1088
	drc_drbg = drc_chan + 1;	/* 128 in dual mode, 64 in single */
1089 1090 1091 1092 1093 1094 1095 1096 1097 1098
	drc_ddim = (drc >> 20) & 0x3;

	/* The dram row boundary (DRB) reg values are boundary address for
	 * each DRAM row with a granularity of 64 or 128MB (single/dual
	 * channel operation).  DRB regs are cumulative; therefore DRB7 will
	 * contain the total memory contained in all eight rows.
	 */
	for (last_cumul_size = index = 0; index < mci->nr_csrows; index++) {
		/* mem_dev 0=x8, 1=x4 */
		mem_dev = (dra >> (index * 4 + 2)) & 0x3;
1099
		csrow = &mci->csrows[remap_csrow_index(mci, index)];
1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111

		mem_dev = (mem_dev == 2);
		pci_read_config_byte(pdev, E752X_DRB + index, &value);
		/* convert a 128 or 64 MiB DRB to a page size. */
		cumul_size = value << (25 + drc_drbg - PAGE_SHIFT);
		debugf3("%s(): (%d) cumul_size 0x%x\n", __func__, index,
			cumul_size);
		if (cumul_size == last_cumul_size)
			continue;	/* not populated */

		csrow->first_page = last_cumul_size;
		csrow->last_page = cumul_size - 1;
1112
		nr_pages = cumul_size - last_cumul_size;
1113
		last_cumul_size = cumul_size;
1114

1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128
		/*
		* if single channel or x8 devices then SECDED
		* if dual channel and x4 then S4ECD4ED
		*/
		if (drc_ddim) {
			if (drc_chan && mem_dev) {
				edac_mode = EDAC_S4ECD4ED;
				mci->edac_cap |= EDAC_FLAG_S4ECD4ED;
			} else {
				edac_mode = EDAC_SECDED;
				mci->edac_cap |= EDAC_FLAG_SECDED;
			}
		} else
			edac_mode = EDAC_NONE;
1129
		for (i = 0; i < csrow->nr_channels; i++) {
1130
			struct dimm_info *dimm = csrow->channels[i].dimm;
1131

1132 1133
			debugf3("Initializing rank at (%i,%i)\n", index, i);
			dimm->nr_pages = nr_pages / csrow->nr_channels;
1134 1135 1136
			dimm->grain = 1 << 12;	/* 4KiB - resolution of CELOG */
			dimm->mtype = MEM_RDDR;	/* only one type supported */
			dimm->dtype = mem_dev ? DEV_X4 : DEV_X8;
1137
			dimm->edac_mode = edac_mode;
1138
		}
1139 1140 1141 1142
	}
}

static void e752x_init_mem_map_table(struct pci_dev *pdev,
1143
				struct e752x_pvt *pvt)
1144 1145
{
	int index;
1146
	u8 value, last, row;
1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157

	last = 0;
	row = 0;

	for (index = 0; index < 8; index += 2) {
		pci_read_config_byte(pdev, E752X_DRB + index, &value);
		/* test if there is a dimm in this slot */
		if (value == last) {
			/* no dimm in the slot, so flag it as empty */
			pvt->map[index] = 0xff;
			pvt->map[index + 1] = 0xff;
D
Dave Jiang 已提交
1158
		} else {	/* there is a dimm in the slot */
1159 1160 1161 1162 1163 1164 1165
			pvt->map[index] = row;
			row++;
			last = value;
			/* test the next value to see if the dimm is double
			 * sided
			 */
			pci_read_config_byte(pdev, E752X_DRB + index + 1,
1166 1167 1168 1169 1170
					&value);

			/* the dimm is single sided, so flag as empty */
			/* this is a double sided dimm to save the next row #*/
			pvt->map[index + 1] = (value == last) ? 0xff :	row;
1171 1172 1173 1174 1175 1176 1177 1178
			row++;
			last = value;
		}
	}
}

/* Return 0 on success or 1 on failure. */
static int e752x_get_devs(struct pci_dev *pdev, int dev_idx,
1179
			struct e752x_pvt *pvt)
1180 1181 1182 1183
{
	struct pci_dev *dev;

	pvt->bridge_ck = pci_get_device(PCI_VENDOR_ID_INTEL,
1184
				pvt->dev_info->err_dev, pvt->bridge_ck);
1185 1186 1187 1188 1189 1190 1191

	if (pvt->bridge_ck == NULL)
		pvt->bridge_ck = pci_scan_single_device(pdev->bus,
							PCI_DEVFN(0, 1));

	if (pvt->bridge_ck == NULL) {
		e752x_printk(KERN_ERR, "error reporting device not found:"
1192 1193
			"vendor %x device 0x%x (broken BIOS?)\n",
			PCI_VENDOR_ID_INTEL, e752x_devs[dev_idx].err_dev);
1194 1195 1196
		return 1;
	}

1197 1198 1199
	dev = pci_get_device(PCI_VENDOR_ID_INTEL,
				e752x_devs[dev_idx].ctl_dev,
				NULL);
1200 1201 1202 1203 1204 1205 1206 1207 1208

	if (dev == NULL)
		goto fail;

	pvt->dev_d0f0 = dev;
	pvt->dev_d0f1 = pci_dev_get(pvt->bridge_ck);

	return 0;

1209
fail:
1210 1211 1212 1213
	pci_dev_put(pvt->bridge_ck);
	return 1;
}

1214 1215
/* Setup system bus parity mask register.
 * Sysbus parity supported on:
K
Konstantin Olifer 已提交
1216
 * e7320/e7520/e7525 + Xeon
1217 1218 1219 1220 1221 1222 1223
 */
static void e752x_init_sysbus_parity_mask(struct e752x_pvt *pvt)
{
	char *cpu_id = cpu_data(0).x86_model_id;
	struct pci_dev *dev = pvt->dev_d0f1;
	int enable = 1;

1224
	/* Allow module parameter override, else see if CPU supports parity */
1225 1226
	if (sysbus_parity != -1) {
		enable = sysbus_parity;
K
Konstantin Olifer 已提交
1227
	} else if (cpu_id[0] && !strstr(cpu_id, "Xeon")) {
1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238
		e752x_printk(KERN_INFO, "System Bus Parity not "
			     "supported by CPU, disabling\n");
		enable = 0;
	}

	if (enable)
		pci_write_config_word(dev, E752X_SYSBUS_ERRMASK, 0x0000);
	else
		pci_write_config_word(dev, E752X_SYSBUS_ERRMASK, 0x0309);
}

1239 1240 1241 1242 1243 1244
static void e752x_init_error_reporting_regs(struct e752x_pvt *pvt)
{
	struct pci_dev *dev;

	dev = pvt->dev_d0f1;
	/* Turn off error disable & SMI in case the BIOS turned it on */
1245 1246 1247 1248 1249 1250 1251
	if (pvt->dev_info->err_dev == PCI_DEVICE_ID_INTEL_3100_1_ERR) {
		pci_write_config_dword(dev, I3100_NSI_EMASK, 0);
		pci_write_config_dword(dev, I3100_NSI_SMICMD, 0);
	} else {
		pci_write_config_byte(dev, E752X_HI_ERRMASK, 0x00);
		pci_write_config_byte(dev, E752X_HI_SMICMD, 0x00);
	}
1252 1253 1254

	e752x_init_sysbus_parity_mask(pvt);

1255 1256 1257 1258 1259 1260 1261 1262 1263
	pci_write_config_word(dev, E752X_SYSBUS_SMICMD, 0x00);
	pci_write_config_byte(dev, E752X_BUF_ERRMASK, 0x00);
	pci_write_config_byte(dev, E752X_BUF_SMICMD, 0x00);
	pci_write_config_byte(dev, E752X_DRAM_ERRMASK, 0x00);
	pci_write_config_byte(dev, E752X_DRAM_SMICMD, 0x00);
}

static int e752x_probe1(struct pci_dev *pdev, int dev_idx)
{
D
Dave Peterson 已提交
1264
	u16 pci_data;
1265
	u8 stat8;
1266
	struct mem_ctl_info *mci;
1267
	struct edac_mc_layer layers[2];
1268
	struct e752x_pvt *pvt;
1269
	u16 ddrcsr;
D
Dave Jiang 已提交
1270
	int drc_chan;		/* Number of channels 0=1chan,1=2chan */
1271
	struct e752x_error_info discard;
1272

D
Dave Peterson 已提交
1273
	debugf0("%s(): mci\n", __func__);
1274 1275
	debugf0("Starting Probe1\n");

M
mark gross 已提交
1276 1277 1278 1279
	/* check to see if device 0 function 1 is enabled; if it isn't, we
	 * assume the BIOS has reserved it for a reason and is expecting
	 * exclusive access, we take care not to violate that assumption and
	 * fail the probe. */
1280
	pci_read_config_byte(pdev, E752X_DEVPRES1, &stat8);
M
mark gross 已提交
1281 1282
	if (!force_function_unhide && !(stat8 & (1 << 5))) {
		printk(KERN_INFO "Contact your BIOS vendor to see if the "
1283
			"E752x error registers can be safely un-hidden\n");
1284
		return -ENODEV;
M
mark gross 已提交
1285
	}
1286 1287 1288 1289 1290 1291
	stat8 |= (1 << 5);
	pci_write_config_byte(pdev, E752X_DEVPRES1, stat8);

	pci_read_config_word(pdev, E752X_DDRCSR, &ddrcsr);
	/* FIXME: should check >>12 or 0xf, true for all? */
	/* Dual channel = 1, Single channel = 0 */
1292
	drc_chan = dual_channel_active(ddrcsr);
1293

1294 1295 1296 1297 1298 1299
	layers[0].type = EDAC_MC_LAYER_CHIP_SELECT;
	layers[0].size = E752X_NR_CSROWS;
	layers[0].is_virt_csrow = true;
	layers[1].type = EDAC_MC_LAYER_CHANNEL;
	layers[1].size = drc_chan + 1;
	layers[1].is_virt_csrow = false;
1300
	mci = edac_mc_alloc(0, ARRAY_SIZE(layers), layers, sizeof(*pvt));
1301
	if (mci == NULL)
1302
		return -ENOMEM;
1303

D
Dave Peterson 已提交
1304
	debugf3("%s(): init mci\n", __func__);
1305
	mci->mtype_cap = MEM_FLAG_RDDR;
1306 1307 1308
	/* 3100 IMCH supports SECDEC only */
	mci->edac_ctl_cap = (dev_idx == I3100) ? EDAC_FLAG_SECDED :
		(EDAC_FLAG_NONE | EDAC_FLAG_SECDED | EDAC_FLAG_S4ECD4ED);
1309
	/* FIXME - what if different memory types are in different csrows? */
D
Dave Peterson 已提交
1310
	mci->mod_name = EDAC_MOD_STR;
1311
	mci->mod_ver = E752X_REVISION;
1312
	mci->pdev = &pdev->dev;
1313

D
Dave Peterson 已提交
1314
	debugf3("%s(): init pvt\n", __func__);
D
Dave Jiang 已提交
1315
	pvt = (struct e752x_pvt *)mci->pvt_info;
1316
	pvt->dev_info = &e752x_devs[dev_idx];
1317
	pvt->mc_symmetric = ((ddrcsr & 0x10) != 0);
D
Dave Peterson 已提交
1318

1319 1320 1321
	if (e752x_get_devs(pdev, dev_idx, pvt)) {
		edac_mc_free(mci);
		return -ENODEV;
1322 1323
	}

D
Dave Peterson 已提交
1324
	debugf3("%s(): more mci init\n", __func__);
1325
	mci->ctl_name = pvt->dev_info->ctl_name;
1326
	mci->dev_name = pci_name(pdev);
1327 1328
	mci->edac_check = e752x_check;
	mci->ctl_page_to_phys = ctl_page_to_phys;
1329 1330
	mci->set_sdram_scrub_rate = set_sdram_scrub_rate;
	mci->get_sdram_scrub_rate = get_sdram_scrub_rate;
1331

1332 1333 1334 1335
	/* set the map type.  1 = normal, 0 = reversed
	 * Must be set before e752x_init_csrows in case csrow mapping
	 * is reversed.
	 */
1336
	pci_read_config_byte(pdev, E752X_DRM, &stat8);
1337 1338
	pvt->map_type = ((stat8 & 0x0f) > ((stat8 >> 4) & 0x0f));

1339 1340 1341
	e752x_init_csrows(mci, pdev, ddrcsr);
	e752x_init_mem_map_table(pdev, pvt);

1342 1343 1344 1345
	if (dev_idx == I3100)
		mci->edac_cap = EDAC_FLAG_SECDED; /* the only mode supported */
	else
		mci->edac_cap |= EDAC_FLAG_NONE;
D
Dave Peterson 已提交
1346
	debugf3("%s(): tolm, remapbase, remaplimit\n", __func__);
D
Dave Peterson 已提交
1347

1348
	/* load the top of low memory, remap base, and remap limit vars */
1349
	pci_read_config_word(pdev, E752X_TOLM, &pci_data);
1350
	pvt->tolm = ((u32) pci_data) << 4;
1351
	pci_read_config_word(pdev, E752X_REMAPBASE, &pci_data);
1352
	pvt->remapbase = ((u32) pci_data) << 14;
1353
	pci_read_config_word(pdev, E752X_REMAPLIMIT, &pci_data);
1354
	pvt->remaplimit = ((u32) pci_data) << 14;
D
Dave Peterson 已提交
1355
	e752x_printk(KERN_INFO,
1356 1357
			"tolm = %x, remapbase = %x, remaplimit = %x\n",
			pvt->tolm, pvt->remapbase, pvt->remaplimit);
1358

1359 1360 1361
	/* Here we assume that we will never see multiple instances of this
	 * type of memory controller.  The ID is therefore hardcoded to 0.
	 */
1362
	if (edac_mc_add_mc(mci)) {
D
Dave Peterson 已提交
1363
		debugf3("%s(): failed edac_mc_add_mc()\n", __func__);
1364 1365 1366
		goto fail;
	}

1367
	e752x_init_error_reporting_regs(pvt);
D
Dave Jiang 已提交
1368
	e752x_get_error_info(mci, &discard);	/* clear other MCH errors */
1369

1370 1371 1372 1373
	/* allocating generic PCI control info */
	e752x_pci = edac_pci_create_generic_ctl(&pdev->dev, EDAC_MOD_STR);
	if (!e752x_pci) {
		printk(KERN_WARNING
1374
			"%s(): Unable to create PCI control\n", __func__);
1375
		printk(KERN_WARNING
1376 1377
			"%s(): PCI error report via EDAC not setup\n",
			__func__);
1378 1379
	}

1380
	/* get this far and it's successful */
D
Dave Peterson 已提交
1381
	debugf3("%s(): success\n", __func__);
1382 1383
	return 0;

1384
fail:
1385 1386 1387 1388
	pci_dev_put(pvt->dev_d0f0);
	pci_dev_put(pvt->dev_d0f1);
	pci_dev_put(pvt->bridge_ck);
	edac_mc_free(mci);
D
Dave Peterson 已提交
1389

1390
	return -ENODEV;
1391 1392 1393 1394
}

/* returns count (>= 0), or negative on error */
static int __devinit e752x_init_one(struct pci_dev *pdev,
1395
				const struct pci_device_id *ent)
1396
{
D
Dave Peterson 已提交
1397
	debugf0("%s()\n", __func__);
1398 1399

	/* wake up and enable device */
D
Dave Jiang 已提交
1400
	if (pci_enable_device(pdev) < 0)
1401
		return -EIO;
D
Dave Peterson 已提交
1402

1403 1404 1405 1406 1407 1408 1409 1410
	return e752x_probe1(pdev, ent->driver_data);
}

static void __devexit e752x_remove_one(struct pci_dev *pdev)
{
	struct mem_ctl_info *mci;
	struct e752x_pvt *pvt;

D
Dave Peterson 已提交
1411
	debugf0("%s()\n", __func__);
1412

1413 1414 1415
	if (e752x_pci)
		edac_pci_release_generic_ctl(e752x_pci);

1416
	if ((mci = edac_mc_del_mc(&pdev->dev)) == NULL)
1417 1418
		return;

D
Dave Jiang 已提交
1419
	pvt = (struct e752x_pvt *)mci->pvt_info;
1420 1421 1422 1423 1424 1425
	pci_dev_put(pvt->dev_d0f0);
	pci_dev_put(pvt->dev_d0f1);
	pci_dev_put(pvt->bridge_ck);
	edac_mc_free(mci);
}

1426
static DEFINE_PCI_DEVICE_TABLE(e752x_pci_tbl) = {
D
Dave Peterson 已提交
1427
	{
D
Dave Jiang 已提交
1428 1429
	 PCI_VEND_DEV(INTEL, 7520_0), PCI_ANY_ID, PCI_ANY_ID, 0, 0,
	 E7520},
D
Dave Peterson 已提交
1430
	{
D
Dave Jiang 已提交
1431 1432
	 PCI_VEND_DEV(INTEL, 7525_0), PCI_ANY_ID, PCI_ANY_ID, 0, 0,
	 E7525},
D
Dave Peterson 已提交
1433
	{
D
Dave Jiang 已提交
1434 1435
	 PCI_VEND_DEV(INTEL, 7320_0), PCI_ANY_ID, PCI_ANY_ID, 0, 0,
	 E7320},
1436 1437 1438
	{
	 PCI_VEND_DEV(INTEL, 3100_0), PCI_ANY_ID, PCI_ANY_ID, 0, 0,
	 I3100},
D
Dave Peterson 已提交
1439
	{
D
Dave Jiang 已提交
1440 1441
	 0,
	 }			/* 0 terminated list. */
1442 1443 1444 1445 1446
};

MODULE_DEVICE_TABLE(pci, e752x_pci_tbl);

static struct pci_driver e752x_driver = {
D
Dave Peterson 已提交
1447
	.name = EDAC_MOD_STR,
1448 1449 1450
	.probe = e752x_init_one,
	.remove = __devexit_p(e752x_remove_one),
	.id_table = e752x_pci_tbl,
1451 1452
};

A
Alan Cox 已提交
1453
static int __init e752x_init(void)
1454 1455 1456
{
	int pci_rc;

D
Dave Peterson 已提交
1457
	debugf3("%s()\n", __func__);
1458 1459 1460 1461

       /* Ensure that the OPSTATE is set correctly for POLL or NMI */
       opstate_init();

1462 1463 1464 1465 1466 1467
	pci_rc = pci_register_driver(&e752x_driver);
	return (pci_rc < 0) ? pci_rc : 0;
}

static void __exit e752x_exit(void)
{
D
Dave Peterson 已提交
1468
	debugf3("%s()\n", __func__);
1469 1470 1471 1472 1473 1474 1475 1476
	pci_unregister_driver(&e752x_driver);
}

module_init(e752x_init);
module_exit(e752x_exit);

MODULE_LICENSE("GPL");
MODULE_AUTHOR("Linux Networx (http://lnxi.com) Tom Zimmerman\n");
1477
MODULE_DESCRIPTION("MC support for Intel e752x/3100 memory controllers");
M
mark gross 已提交
1478 1479 1480

module_param(force_function_unhide, int, 0444);
MODULE_PARM_DESC(force_function_unhide, "if BIOS sets Dev0:Fun1 up as hidden:"
1481 1482
		 " 1=force unhide and hope BIOS doesn't fight driver for "
		"Dev0:Fun1 access");
1483

D
Dave Jiang 已提交
1484 1485
module_param(edac_op_state, int, 0444);
MODULE_PARM_DESC(edac_op_state, "EDAC Error Reporting state: 0=Poll,1=NMI");
1486 1487 1488 1489

module_param(sysbus_parity, int, 0444);
MODULE_PARM_DESC(sysbus_parity, "0=disable system bus parity checking,"
		" 1=enable system bus parity checking, default=auto-detect");
1490 1491 1492
module_param(report_non_memory_errors, int, 0644);
MODULE_PARM_DESC(report_non_memory_errors, "0=disable non-memory error "
		"reporting, 1=enable non-memory error reporting");