/*
 * (C) 2005, 2006 Linux Networx (http://lnxi.com)
 * This file may be distributed under the terms of the
 * GNU General Public License.
 *
 * Written by Doug Thompson <norsk5@xmission.com>
 *
 */
#include <linux/module.h>
#include <linux/sysdev.h>
#include <linux/ctype.h>

13
#include "edac_core.h"
14 15
#include "edac_module.h"

/* Turn off this whole feature if PCI is not configured */
17
#ifdef CONFIG_PCI
18 19 20

#define EDAC_PCI_SYMLINK	"device"

D
Doug Thompson 已提交
21 22 23 24
/* data variables exported via sysfs */
static int check_pci_errors;		/* default NO check PCI parity */
static int edac_pci_panic_on_pe;	/* default NO panic on PCI Parity */
static int edac_pci_log_pe = 1;		/* log PCI parity errors */
D
Dave Jiang 已提交
25
static int edac_pci_log_npe = 1;	/* log PCI non-parity error errors */
D
Doug Thompson 已提交
26 27
static int edac_pci_poll_msec = 1000;	/* one second workq period */

28
static atomic_t pci_parity_count = ATOMIC_INIT(0);
29
static atomic_t pci_nonparity_count = ATOMIC_INIT(0);
30

D
Doug Thompson 已提交
31
static struct kobject edac_pci_top_main_kobj;
32 33
static atomic_t edac_pci_sysfs_refcount = ATOMIC_INIT(0);

D
Doug Thompson 已提交
34
/* getter functions for the data variables */
D
Dave Jiang 已提交
35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59
int edac_pci_get_check_errors(void)
{
	return check_pci_errors;
}

/* Returns the current value of the 'edac_pci_log_pe' control */
int edac_pci_get_log_pe(void)
{
	const int log_pe = edac_pci_log_pe;

	return log_pe;
}

/* Returns the current value of the 'edac_pci_log_npe' control */
int edac_pci_get_log_npe(void)
{
	const int log_npe = edac_pci_log_npe;

	return log_npe;
}

/* Returns the current value of the 'edac_pci_panic_on_pe' control */
int edac_pci_get_panic_on_pe(void)
{
	const int panic_on_pe = edac_pci_panic_on_pe;

	return panic_on_pe;
}

/* Returns the current value of 'edac_pci_poll_msec' (milliseconds) */
int edac_pci_get_poll_msec(void)
{
	const int poll_msec = edac_pci_poll_msec;

	return poll_msec;
}

60 61 62
/**************************** EDAC PCI sysfs instance *******************/
static ssize_t instance_pe_count_show(struct edac_pci_ctl_info *pci, char *data)
{
63
	return sprintf(data, "%u\n", atomic_read(&pci->counters.pe_count));
64 65 66
}

static ssize_t instance_npe_count_show(struct edac_pci_ctl_info *pci,
67
				char *data)
68
{
69
	return sprintf(data, "%u\n", atomic_read(&pci->counters.npe_count));
70 71 72 73 74 75 76 77 78 79
}

/* Map an embedded 'kobj' member back to its containing edac_pci_ctl_info */
#define to_instance(k) container_of(k, struct edac_pci_ctl_info, kobj)
/* Map an embedded 'attr' member back to its containing instance_attribute */
#define to_instance_attr(a) container_of(a, struct instance_attribute, attr)

/* DEVICE instance kobject release() function */
static void edac_pci_instance_release(struct kobject *kobj)
{
	struct edac_pci_ctl_info *pci;

D
Doug Thompson 已提交
80
	debugf0("%s()\n", __func__);
81

D
Doug Thompson 已提交
82
	/* Form pointer to containing struct, the pci control struct */
83
	pci = to_instance(kobj);
D
Doug Thompson 已提交
84 85 86 87 88

	/* decrement reference count on top main kobj */
	kobject_put(&edac_pci_top_main_kobj);

	kfree(pci);	/* Free the control struct */
89 90 91 92
}

/* instance specific attribute structure */
struct instance_attribute {
93
	struct attribute attr;
D
Doug Thompson 已提交
94 95
	ssize_t(*show) (struct edac_pci_ctl_info *, char *);
	ssize_t(*store) (struct edac_pci_ctl_info *, const char *, size_t);
96 97 98 99
};

/* Function to 'show' fields from the edac_pci 'instance' structure */
static ssize_t edac_pci_instance_show(struct kobject *kobj,
100
				struct attribute *attr, char *buffer)
101
{
102 103
	struct edac_pci_ctl_info *pci = to_instance(kobj);
	struct instance_attribute *instance_attr = to_instance_attr(attr);
104

105 106 107
	if (instance_attr->show)
		return instance_attr->show(pci, buffer);
	return -EIO;
108 109 110 111
}

/*
 * Function to 'store' fields into the edac_pci 'instance' structure
 *
 *	Recovers the edac_pci_ctl_info and instance_attribute from the
 *	generic kobject/attribute pointers and forwards to the attribute's
 *	'store' handler.  Returns -EIO if the attribute has no such handler.
 */
static ssize_t edac_pci_instance_store(struct kobject *kobj,
				struct attribute *attr,
				const char *buffer, size_t count)
{
	struct edac_pci_ctl_info *pci = to_instance(kobj);
	struct instance_attribute *instance_attr = to_instance_attr(attr);

	if (!instance_attr->store)
		return -EIO;

	return instance_attr->store(pci, buffer, count);
}

D
Doug Thompson 已提交
123
/* fs_ops table */
124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144
static struct sysfs_ops pci_instance_ops = {
	.show = edac_pci_instance_show,
	.store = edac_pci_instance_store
};

/*
 * Define a static struct instance_attribute called attr_instance_<_name>.
 * The attribute's file name is the stringified _name; _mode, _show and
 * _store fill the mode and the two handler pointers.
 */
#define INSTANCE_ATTR(_name, _mode, _show, _store)	\
static struct instance_attribute attr_instance_##_name = {	\
	.attr	= {.name = __stringify(_name), .mode = _mode },	\
	.show	= _show,					\
	.store	= _store,					\
};

/* per-instance error counters: mode S_IRUGO, no store handler */
INSTANCE_ATTR(pe_count, S_IRUGO, instance_pe_count_show, NULL);
INSTANCE_ATTR(npe_count, S_IRUGO, instance_npe_count_show, NULL);

/* pci instance attributes (NULL terminated list) */
static struct instance_attribute *pci_instance_attr[] = {
	&attr_instance_pe_count,
	&attr_instance_npe_count,
	NULL
};
145

D
Doug Thompson 已提交
146
/* the ktype for a pci instance */
147 148 149 150 151 152
static struct kobj_type ktype_pci_instance = {
	.release = edac_pci_instance_release,
	.sysfs_ops = &pci_instance_ops,
	.default_attrs = (struct attribute **)pci_instance_attr,
};

D
Doug Thompson 已提交
153 154 155 156 157
/*
 * edac_pci_create_instance_kobj
 *
 *	construct one EDAC PCI instance's kobject for use
 */
158 159
static int edac_pci_create_instance_kobj(struct edac_pci_ctl_info *pci, int idx)
{
D
Doug Thompson 已提交
160
	struct kobject *main_kobj;
161 162
	int err;

D
Doug Thompson 已提交
163 164 165 166 167 168 169 170 171 172 173 174 175
	debugf0("%s()\n", __func__);

	/* First bump the ref count on the top main kobj, which will
	 * track the number of PCI instances we have, and thus nest
	 * properly on keeping the module loaded
	 */
	main_kobj = kobject_get(&edac_pci_top_main_kobj);
	if (!main_kobj) {
		err = -ENODEV;
		goto error_out;
	}

	/* And now register this new kobject under the main kobj */
176 177
	err = kobject_init_and_add(&pci->kobj, &ktype_pci_instance,
				   &edac_pci_top_main_kobj, "pci%d", idx);
178 179
	if (err != 0) {
		debugf2("%s() failed to register instance pci%d\n",
180
			__func__, idx);
D
Doug Thompson 已提交
181 182
		kobject_put(&edac_pci_top_main_kobj);
		goto error_out;
183 184
	}

185
	kobject_uevent(&pci->kobj, KOBJ_ADD);
186 187 188
	debugf1("%s() Register instance 'pci%d' kobject\n", __func__, idx);

	return 0;
D
Doug Thompson 已提交
189 190 191 192

	/* Error unwind statck */
error_out:
	return err;
193 194
}

D
Doug Thompson 已提交
195 196 197 198 199 200
/*
 * edac_pci_unregister_sysfs_instance_kobj
 *
 *	unregister the kobj for the EDAC PCI instance
 */
void edac_pci_unregister_sysfs_instance_kobj(struct edac_pci_ctl_info *pci)
201
{
D
Doug Thompson 已提交
202 203 204 205 206 207
	debugf0("%s()\n", __func__);

	/* Unregister the instance kobject and allow its release
	 * function release the main reference count and then
	 * kfree the memory
	 */
208 209 210 211 212 213
	kobject_unregister(&pci->kobj);
}

/***************************** EDAC PCI sysfs root **********************/
/* Map an embedded 'kobj' member back to its containing edac_pci_ctl_info */
#define to_edacpci(k) container_of(k, struct edac_pci_ctl_info, kobj)
/* NOTE(review): refers to 'struct edac_pci_attr', which is not defined in
 * the visible part of this file; neither macro is used in the visible code
 */
#define to_edacpci_attr(a) container_of(a, struct edac_pci_attr, attr)
214

D
Doug Thompson 已提交
215
/* simple show/store functions for attributes */

/*
 * Format the int that 'ptr' points to into 'buffer' as "%d\n".
 * Returns the value returned by sprintf().
 */
static ssize_t edac_pci_int_show(void *ptr, char *buffer)
{
	int *value = ptr;

	return sprintf(buffer, "%d\n", *value);
}

/*
 * Parse an unsigned number from 'buffer' (base chosen by simple_strtoul
 * with base 0) and store it in the int that 'ptr' points to.
 *
 * Input that does not start with a digit leaves the value untouched.
 * 'count' is returned in either case.
 */
static ssize_t edac_pci_int_store(void *ptr, const char *buffer, size_t count)
{
	int *value = ptr;

	if (isdigit(*buffer))
		*value = simple_strtoul(buffer, NULL, 0);

	return count;
}

struct edac_pci_dev_attribute {
	struct attribute attr;
	void *value;
235 236
	 ssize_t(*show) (void *, char *);
	 ssize_t(*store) (void *, const char *, size_t);
237 238 239 240
};

/* Set of show/store abstract level functions for PCI Parity object */
static ssize_t edac_pci_dev_show(struct kobject *kobj, struct attribute *attr,
241
				 char *buffer)
242 243
{
	struct edac_pci_dev_attribute *edac_pci_dev;
244
	edac_pci_dev = (struct edac_pci_dev_attribute *)attr;
245 246 247 248 249 250 251

	if (edac_pci_dev->show)
		return edac_pci_dev->show(edac_pci_dev->value, buffer);
	return -EIO;
}

/*
 * Forward a sysfs write to the attribute's 'store' handler, passing the
 * attribute's 'value' pointer.  Returns -EIO if there is no handler.
 */
static ssize_t edac_pci_dev_store(struct kobject *kobj,
				struct attribute *attr, const char *buffer,
				size_t count)
{
	struct edac_pci_dev_attribute *edac_pci_dev;

	/* 'attr' is the first member of edac_pci_dev_attribute */
	edac_pci_dev = (struct edac_pci_dev_attribute *)attr;

	/* Test the handler that is actually called: attributes such as the
	 * counters have a 'show' handler but a NULL 'store'
	 */
	if (edac_pci_dev->store)
		return edac_pci_dev->store(edac_pci_dev->value, buffer, count);
	return -EIO;
}

static struct sysfs_ops edac_pci_sysfs_ops = {
264 265
	.show = edac_pci_dev_show,
	.store = edac_pci_dev_store
266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284
};

/*
 * Define a static struct edac_pci_dev_attribute called
 * edac_pci_attr_<_name>.  The file name is the stringified _name and
 * 'value' points at the variable of that same name.
 */
#define EDAC_PCI_ATTR(_name,_mode,_show,_store)			\
static struct edac_pci_dev_attribute edac_pci_attr_##_name = {		\
	.attr = {.name = __stringify(_name), .mode = _mode },	\
	.value  = &_name,					\
	.show   = _show,					\
	.store  = _store,					\
};

/*
 * Same as EDAC_PCI_ATTR, except that 'value' is set to the explicit
 * _data argument instead of the address of a variable named _name.
 * Not used in the visible part of this file.
 */
#define EDAC_PCI_STRING_ATTR(_name,_data,_mode,_show,_store)	\
static struct edac_pci_dev_attribute edac_pci_attr_##_name = {		\
	.attr = {.name = __stringify(_name), .mode = _mode },	\
	.value  = _data,					\
	.show   = _show,					\
	.store  = _store,					\
};

/* PCI Parity control files */
285
EDAC_PCI_ATTR(check_pci_errors, S_IRUGO | S_IWUSR, edac_pci_int_show,
286
	edac_pci_int_store);
287
EDAC_PCI_ATTR(edac_pci_log_pe, S_IRUGO | S_IWUSR, edac_pci_int_show,
288
	edac_pci_int_store);
289
EDAC_PCI_ATTR(edac_pci_log_npe, S_IRUGO | S_IWUSR, edac_pci_int_show,
290
	edac_pci_int_store);
291
EDAC_PCI_ATTR(edac_pci_panic_on_pe, S_IRUGO | S_IWUSR, edac_pci_int_show,
292
	edac_pci_int_store);
293
EDAC_PCI_ATTR(pci_parity_count, S_IRUGO, edac_pci_int_show, NULL);
294
EDAC_PCI_ATTR(pci_nonparity_count, S_IRUGO, edac_pci_int_show, NULL);
295 296 297

/* Base Attributes of the memory ECC object */
static struct edac_pci_dev_attribute *edac_pci_attr[] = {
298
	&edac_pci_attr_check_pci_errors,
D
Dave Jiang 已提交
299 300 301
	&edac_pci_attr_edac_pci_log_pe,
	&edac_pci_attr_edac_pci_log_npe,
	&edac_pci_attr_edac_pci_panic_on_pe,
302
	&edac_pci_attr_pci_parity_count,
303
	&edac_pci_attr_pci_nonparity_count,
304 305 306
	NULL,
};

D
Doug Thompson 已提交
307 308 309 310 311 312 313 314 315 316
/*
 * edac_pci_release_main_kobj
 *
 *	This release function is called when the reference count to the
 *	passed kobj goes to zero.
 *
 *	This kobj is the 'main' kobject that EDAC PCI instances
 *	link to, and thus provide for proper nesting counts
 */
static void edac_pci_release_main_kobj(struct kobject *kobj)
317
{
318

D
Doug Thompson 已提交
319
	debugf0("%s() here to module_put(THIS_MODULE)\n", __func__);
320

D
Doug Thompson 已提交
321 322 323 324
	/* last reference to top EDAC PCI kobject has been removed,
	 * NOW release our ref count on the core module
	 */
	module_put(THIS_MODULE);
325 326
}

D
Doug Thompson 已提交
327 328 329
/* ktype struct for the EDAC PCI main kobj */
static struct kobj_type ktype_edac_pci_main_kobj = {
	.release = edac_pci_release_main_kobj,
330
	.sysfs_ops = &edac_pci_sysfs_ops,
331
	.default_attrs = (struct attribute **)edac_pci_attr,
332 333 334
};

/**
D
Doug Thompson 已提交
335
 * edac_pci_main_kobj_setup()
336 337 338 339
 *
 *	setup the sysfs for EDAC PCI attributes
 *	assumes edac_class has already been initialized
 */
D
Doug Thompson 已提交
340
int edac_pci_main_kobj_setup(void)
341 342 343 344
{
	int err;
	struct sysdev_class *edac_class;

D
Doug Thompson 已提交
345 346 347 348 349
	debugf0("%s()\n", __func__);

	/* check and count if we have already created the main kobject */
	if (atomic_inc_return(&edac_pci_sysfs_refcount) != 1)
		return 0;
350

D
Doug Thompson 已提交
351 352 353
	/* First time, so create the main kobject and its
	 * controls and atributes
	 */
354
	edac_class = edac_get_edac_class();
355 356
	if (edac_class == NULL) {
		debugf1("%s() no edac_class\n", __func__);
D
Doug Thompson 已提交
357 358
		err = -ENODEV;
		goto decrement_count_fail;
359
	}
360

D
Doug Thompson 已提交
361 362 363 364 365 366 367 368 369
	/* Bump the reference count on this module to ensure the
	 * modules isn't unloaded until we deconstruct the top
	 * level main kobj for EDAC PCI
	 */
	if (!try_module_get(THIS_MODULE)) {
		debugf1("%s() try_module_get() failed\n", __func__);
		err = -ENODEV;
		goto decrement_count_fail;
	}
370

371
	/* Instanstiate the pci object */
372 373
	err = kobject_init_and_add(&edac_pci_top_main_kobj, &ktype_edac_pci_main_kobj,
				   &edac_class->kset.kobj, "pci");
374 375
	if (err) {
		debugf1("Failed to register '.../edac/pci'\n");
376
		goto kobject_init_and_add_fail;
377 378
	}

D
Doug Thompson 已提交
379 380 381 382
	/* At this point, to 'release' the top level kobject
	 * for EDAC PCI, then edac_pci_main_kobj_teardown()
	 * must be used, for resources to be cleaned up properly
	 */
383
	kobject_uevent(&edac_pci_top_main_kobj, KOBJ_ADD);
384 385 386
	debugf1("Registered '.../edac/pci' kobject\n");

	return 0;
D
Doug Thompson 已提交
387 388

	/* Error unwind statck */
389
kobject_init_and_add_fail:
D
Doug Thompson 已提交
390 391 392 393 394 395 396
	module_put(THIS_MODULE);

decrement_count_fail:
	/* if are on this error exit, nothing to tear down */
	atomic_dec(&edac_pci_sysfs_refcount);

	return err;
397 398 399
}

/*
D
Doug Thompson 已提交
400
 * edac_pci_main_kobj_teardown()
401
 *
D
Doug Thompson 已提交
402 403
 *	if no longer linked (needed) remove the top level EDAC PCI
 *	kobject with its controls and attributes
404
 */
D
Doug Thompson 已提交
405
static void edac_pci_main_kobj_teardown(void)
406 407
{
	debugf0("%s()\n", __func__);
D
Doug Thompson 已提交
408 409 410 411 412 413 414 415 416 417

	/* Decrement the count and only if no more controller instances
	 * are connected perform the unregisteration of the top level
	 * main kobj
	 */
	if (atomic_dec_return(&edac_pci_sysfs_refcount) == 0) {
		debugf0("%s() called kobject_unregister on main kobj\n",
			__func__);
		kobject_unregister(&edac_pci_top_main_kobj);
	}
418 419
}

D
Doug Thompson 已提交
420 421 422 423 424 425
/*
 *
 * edac_pci_create_sysfs
 *
 *	Create the controls/attributes for the specified EDAC PCI device
 */
426 427 428 429 430
int edac_pci_create_sysfs(struct edac_pci_ctl_info *pci)
{
	int err;
	struct kobject *edac_kobj = &pci->kobj;

D
Doug Thompson 已提交
431
	debugf0("%s() idx=%d\n", __func__, pci->pci_idx);
432

D
Doug Thompson 已提交
433 434 435 436
	/* create the top main EDAC PCI kobject, IF needed */
	err = edac_pci_main_kobj_setup();
	if (err)
		return err;
437

D
Doug Thompson 已提交
438 439 440 441
	/* Create this instance's kobject under the MAIN kobject */
	err = edac_pci_create_instance_kobj(pci, pci->pci_idx);
	if (err)
		goto unregister_cleanup;
442

443
	err = sysfs_create_link(edac_kobj, &pci->dev->kobj, EDAC_PCI_SYMLINK);
444 445
	if (err) {
		debugf0("%s() sysfs_create_link() returned err= %d\n",
446
			__func__, err);
D
Doug Thompson 已提交
447
		goto symlink_fail;
448 449 450
	}

	return 0;
D
Doug Thompson 已提交
451 452 453 454 455 456 457 458 459

	/* Error unwind stack */
symlink_fail:
	edac_pci_unregister_sysfs_instance_kobj(pci);

unregister_cleanup:
	edac_pci_main_kobj_teardown();

	return err;
460 461
}

D
Doug Thompson 已提交
462 463 464 465 466
/*
 * edac_pci_remove_sysfs
 *
 *	remove the controls and attributes for this EDAC PCI device
 */
467 468
void edac_pci_remove_sysfs(struct edac_pci_ctl_info *pci)
{
D
Doug Thompson 已提交
469
	debugf0("%s() index=%d\n", __func__, pci->pci_idx);
470

D
Doug Thompson 已提交
471
	/* Remove the symlink */
472 473
	sysfs_remove_link(&pci->kobj, EDAC_PCI_SYMLINK);

D
Doug Thompson 已提交
474 475 476 477 478 479 480 481 482
	/* remove this PCI instance's sysfs entries */
	edac_pci_unregister_sysfs_instance_kobj(pci);

	/* Call the main unregister function, which will determine
	 * if this 'pci' is the last instance.
	 * If it is, the main kobject will be unregistered as a result
	 */
	debugf0("%s() calling edac_pci_main_kobj_teardown()\n", __func__);
	edac_pci_main_kobj_teardown();
483 484 485
}

/************************ PCI error handling *************************/
486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508
static u16 get_pci_parity_status(struct pci_dev *dev, int secondary)
{
	int where;
	u16 status;

	where = secondary ? PCI_SEC_STATUS : PCI_STATUS;
	pci_read_config_word(dev, where, &status);

	/* If we get back 0xFFFF then we must suspect that the card has been
	 * pulled but the Linux PCI layer has not yet finished cleaning up.
	 * We don't want to report on such devices
	 */

	if (status == 0xFFFF) {
		u32 sanity;

		pci_read_config_dword(dev, 0, &sanity);

		if (sanity == 0xFFFFFFFF)
			return 0;
	}

	status &= PCI_STATUS_DETECTED_PARITY | PCI_STATUS_SIG_SYSTEM_ERROR |
509
		PCI_STATUS_PARITY;
510 511 512 513 514 515 516 517 518 519 520 521 522 523

	if (status)
		/* reset only the bits we are interested in */
		pci_write_config_word(dev, where, status);

	return status;
}


/*
 * Clear any PCI parity errors logged by this device.
 *
 * The status values returned by get_pci_parity_status() are ignored;
 * the calls are made only for their register-resetting side effect.
 */
static void edac_pci_dev_parity_clear(struct pci_dev *dev)
{
	u8 header_type;

	debugf0("%s()\n", __func__);

	get_pci_parity_status(dev, 0);

	/* read the device TYPE, looking for bridges */
	pci_read_config_byte(dev, PCI_HEADER_TYPE, &header_type);

	/* bridges also have a secondary status register to clear */
	if ((header_type & 0x7F) == PCI_HEADER_TYPE_BRIDGE)
		get_pci_parity_status(dev, 1);
}

/*
 *  PCI Parity polling
 *
D
Doug Thompson 已提交
538 539 540
 *	Fucntion to retrieve the current parity status
 *	and decode it
 *
541 542 543
 */
static void edac_pci_dev_parity_test(struct pci_dev *dev)
{
D
Doug Thompson 已提交
544
	unsigned long flags;
545
	u16 status;
546
	u8 header_type;
547

D
Doug Thompson 已提交
548 549 550 551
	/* stop any interrupts until we can acquire the status */
	local_irq_save(flags);

	/* read the STATUS register on this device */
552 553
	status = get_pci_parity_status(dev, 0);

D
Doug Thompson 已提交
554 555 556 557 558 559
	/* read the device TYPE, looking for bridges */
	pci_read_config_byte(dev, PCI_HEADER_TYPE, &header_type);

	local_irq_restore(flags);

	debugf4("PCI STATUS= 0x%04x %s\n", status, dev->dev.bus_id);
560 561 562

	/* check the status reg for errors */
	if (status) {
563
		if (status & (PCI_STATUS_SIG_SYSTEM_ERROR)) {
564
			edac_printk(KERN_CRIT, EDAC_PCI,
565 566
				"Signaled System Error on %s\n",
				pci_name(dev));
567 568
			atomic_inc(&pci_nonparity_count);
		}
569 570 571

		if (status & (PCI_STATUS_PARITY)) {
			edac_printk(KERN_CRIT, EDAC_PCI,
572 573
				"Master Data Parity Error on %s\n",
				pci_name(dev));
574 575 576 577 578 579

			atomic_inc(&pci_parity_count);
		}

		if (status & (PCI_STATUS_DETECTED_PARITY)) {
			edac_printk(KERN_CRIT, EDAC_PCI,
580 581
				"Detected Parity Error on %s\n",
				pci_name(dev));
582 583 584 585 586 587

			atomic_inc(&pci_parity_count);
		}
	}


D
Doug Thompson 已提交
588
	debugf4("PCI HEADER TYPE= 0x%02x %s\n", header_type, dev->dev.bus_id);
589 590 591 592 593

	if ((header_type & 0x7F) == PCI_HEADER_TYPE_BRIDGE) {
		/* On bridges, need to examine secondary status register  */
		status = get_pci_parity_status(dev, 1);

D
Doug Thompson 已提交
594
		debugf4("PCI SEC_STATUS= 0x%04x %s\n", status, dev->dev.bus_id);
595 596 597

		/* check the secondary status reg for errors */
		if (status) {
598
			if (status & (PCI_STATUS_SIG_SYSTEM_ERROR)) {
599
				edac_printk(KERN_CRIT, EDAC_PCI, "Bridge "
600 601
					"Signaled System Error on %s\n",
					pci_name(dev));
602 603
				atomic_inc(&pci_nonparity_count);
			}
604 605 606

			if (status & (PCI_STATUS_PARITY)) {
				edac_printk(KERN_CRIT, EDAC_PCI, "Bridge "
607 608
					"Master Data Parity Error on "
					"%s\n", pci_name(dev));
609 610 611 612 613 614

				atomic_inc(&pci_parity_count);
			}

			if (status & (PCI_STATUS_DETECTED_PARITY)) {
				edac_printk(KERN_CRIT, EDAC_PCI, "Bridge "
615 616
					"Detected Parity Error on %s\n",
					pci_name(dev));
617 618 619 620 621 622 623

				atomic_inc(&pci_parity_count);
			}
		}
	}
}

D
Doug Thompson 已提交
624 625 626
/* reduce some complexity in definition of the iterator:
 * type of the per-device callback taken by edac_pci_dev_parity_iterator()
 */
typedef void (*pci_parity_check_fn_t) (struct pci_dev *dev);

627 628
/*
 * pci_dev parity list iterator
 *	Scan the PCI device list for one pass, looking for SERRORs
 *	Master Parity ERRORS or Parity ERRORs on primary or secondary devices
 *
 *	'fn' is called once for every device returned by pci_get_device().
 */
static inline void edac_pci_dev_parity_iterator(pci_parity_check_fn_t fn)
{
	struct pci_dev *dev = NULL;

	/* request for kernel access to the next PCI device, if any,
	 * and while we are looking at it have its reference count
	 * bumped until we are done with it
	 */
	while ((dev = pci_get_device(PCI_ANY_ID, PCI_ANY_ID, dev)) != NULL) {
		fn(dev);
	}
}

/*
 * edac_pci_do_parity_check
 *
 *	performs the actual PCI parity check operation
 */
void edac_pci_do_parity_check(void)
{
	int before_count;

	debugf3("%s()\n", __func__);

D
Doug Thompson 已提交
656
	/* if policy has PCI check off, leave now */
657
	if (!check_pci_errors)
658 659 660 661 662
		return;

	before_count = atomic_read(&pci_parity_count);

	/* scan all PCI devices looking for a Parity Error on devices and
D
Doug Thompson 已提交
663 664 665
	 * bridges.
	 * The iterator calls pci_get_device() which might sleep, thus
	 * we cannot disable interrupts in this scan.
666 667 668 669
	 */
	edac_pci_dev_parity_iterator(edac_pci_dev_parity_test);

	/* Only if operator has selected panic on PCI Error */
D
Dave Jiang 已提交
670
	if (edac_pci_get_panic_on_pe()) {
671 672 673 674 675 676
		/* If the count is different 'after' from 'before' */
		if (before_count != atomic_read(&pci_parity_count))
			panic("EDAC: PCI Parity Error");
	}
}

D
Doug Thompson 已提交
677 678 679 680 681 682
/*
 * edac_pci_clear_parity_errors
 *
 *	function to perform an iteration over the PCI devices
 *	and clearn their current status
 */
683 684 685 686 687 688 689
void edac_pci_clear_parity_errors(void)
{
	/* Clear any PCI bus parity errors that devices initially have logged
	 * in their registers.
	 */
	edac_pci_dev_parity_iterator(edac_pci_dev_parity_clear);
}
D
Doug Thompson 已提交
690 691 692 693 694 695

/*
 * edac_pci_handle_pe
 *
 *	Called to handle a PARITY ERROR event
 */
696 697 698 699 700 701
void edac_pci_handle_pe(struct edac_pci_ctl_info *pci, const char *msg)
{

	/* global PE counter incremented by edac_pci_do_parity_check() */
	atomic_inc(&pci->counters.pe_count);

D
Dave Jiang 已提交
702
	if (edac_pci_get_log_pe())
703 704 705 706 707 708 709 710 711 712 713
		edac_pci_printk(pci, KERN_WARNING,
				"Parity Error ctl: %s %d: %s\n",
				pci->ctl_name, pci->pci_idx, msg);

	/*
	 * poke all PCI devices and see which one is the troublemaker
	 * panic() is called if set
	 */
	edac_pci_do_parity_check();
}
EXPORT_SYMBOL_GPL(edac_pci_handle_pe);
714

D
Doug Thompson 已提交
715 716 717 718 719 720

/*
 * edac_pci_handle_npe
 *
 *	Called to handle a NON-PARITY ERROR event
 */
721 722 723 724 725 726
void edac_pci_handle_npe(struct edac_pci_ctl_info *pci, const char *msg)
{

	/* global NPE counter incremented by edac_pci_do_parity_check() */
	atomic_inc(&pci->counters.npe_count);

D
Dave Jiang 已提交
727
	if (edac_pci_get_log_npe())
728 729 730 731 732 733 734 735 736 737 738
		edac_pci_printk(pci, KERN_WARNING,
				"Non-Parity Error ctl: %s %d: %s\n",
				pci->ctl_name, pci->pci_idx, msg);

	/*
	 * poke all PCI devices and see which one is the troublemaker
	 * panic() is called if set
	 */
	edac_pci_do_parity_check();
}
EXPORT_SYMBOL_GPL(edac_pci_handle_npe);
739 740 741 742

/*
 * Define the PCI parameter to the module
 */
743
module_param(check_pci_errors, int, 0644);
D
Dave Jiang 已提交
744
MODULE_PARM_DESC(check_pci_errors,
745
		 "Check for PCI bus parity errors: 0=off 1=on");
D
Dave Jiang 已提交
746 747
module_param(edac_pci_panic_on_pe, int, 0644);
MODULE_PARM_DESC(edac_pci_panic_on_pe,
748
		 "Panic on PCI Bus Parity error: 0=off 1=on");
749

750
#endif				/* CONFIG_PCI */