362 lines
8.9 KiB
C
362 lines
8.9 KiB
C
|
/* edac_mc kernel module
|
||
|
* (C) 2005, 2006 Linux Networx (http://lnxi.com)
|
||
|
* This file may be distributed under the terms of the
|
||
|
* GNU General Public License.
|
||
|
*
|
||
|
* Written Doug Thompson <norsk5@xmission.com>
|
||
|
*
|
||
|
*/
|
||
|
#include <linux/module.h>
|
||
|
#include <linux/sysdev.h>
|
||
|
#include <linux/ctype.h>
|
||
|
|
||
|
#include "edac_mc.h"
|
||
|
#include "edac_module.h"
|
||
|
|
||
|
|
||
|
#ifdef CONFIG_PCI
|
||
|
static int check_pci_parity = 0; /* default YES check PCI parity */
|
||
|
static int panic_on_pci_parity; /* default no panic on PCI Parity */
|
||
|
static atomic_t pci_parity_count = ATOMIC_INIT(0);
|
||
|
|
||
|
static struct kobject edac_pci_kobj; /* /sys/devices/system/edac/pci */
|
||
|
static struct completion edac_pci_kobj_complete;
|
||
|
|
||
|
|
||
|
static ssize_t edac_pci_int_show(void *ptr, char *buffer)
|
||
|
{
|
||
|
int *value = ptr;
|
||
|
return sprintf(buffer,"%d\n",*value);
|
||
|
}
|
||
|
|
||
|
static ssize_t edac_pci_int_store(void *ptr, const char *buffer, size_t count)
|
||
|
{
|
||
|
int *value = ptr;
|
||
|
|
||
|
if (isdigit(*buffer))
|
||
|
*value = simple_strtoul(buffer,NULL,0);
|
||
|
|
||
|
return count;
|
||
|
}
|
||
|
|
||
|
struct edac_pci_dev_attribute {
|
||
|
struct attribute attr;
|
||
|
void *value;
|
||
|
ssize_t (*show)(void *,char *);
|
||
|
ssize_t (*store)(void *, const char *,size_t);
|
||
|
};
|
||
|
|
||
|
/* Set of show/store abstract level functions for PCI Parity object */
|
||
|
static ssize_t edac_pci_dev_show(struct kobject *kobj, struct attribute *attr,
|
||
|
char *buffer)
|
||
|
{
|
||
|
struct edac_pci_dev_attribute *edac_pci_dev;
|
||
|
edac_pci_dev= (struct edac_pci_dev_attribute*)attr;
|
||
|
|
||
|
if (edac_pci_dev->show)
|
||
|
return edac_pci_dev->show(edac_pci_dev->value, buffer);
|
||
|
return -EIO;
|
||
|
}
|
||
|
|
||
|
static ssize_t edac_pci_dev_store(struct kobject *kobj,
|
||
|
struct attribute *attr, const char *buffer, size_t count)
|
||
|
{
|
||
|
struct edac_pci_dev_attribute *edac_pci_dev;
|
||
|
edac_pci_dev= (struct edac_pci_dev_attribute*)attr;
|
||
|
|
||
|
if (edac_pci_dev->show)
|
||
|
return edac_pci_dev->store(edac_pci_dev->value, buffer, count);
|
||
|
return -EIO;
|
||
|
}
|
||
|
|
||
|
static struct sysfs_ops edac_pci_sysfs_ops = {
|
||
|
.show = edac_pci_dev_show,
|
||
|
.store = edac_pci_dev_store
|
||
|
};
|
||
|
|
||
|
#define EDAC_PCI_ATTR(_name,_mode,_show,_store) \
|
||
|
static struct edac_pci_dev_attribute edac_pci_attr_##_name = { \
|
||
|
.attr = {.name = __stringify(_name), .mode = _mode }, \
|
||
|
.value = &_name, \
|
||
|
.show = _show, \
|
||
|
.store = _store, \
|
||
|
};
|
||
|
|
||
|
#define EDAC_PCI_STRING_ATTR(_name,_data,_mode,_show,_store) \
|
||
|
static struct edac_pci_dev_attribute edac_pci_attr_##_name = { \
|
||
|
.attr = {.name = __stringify(_name), .mode = _mode }, \
|
||
|
.value = _data, \
|
||
|
.show = _show, \
|
||
|
.store = _store, \
|
||
|
};
|
||
|
|
||
|
/* PCI Parity control files */
|
||
|
EDAC_PCI_ATTR(check_pci_parity, S_IRUGO|S_IWUSR, edac_pci_int_show,
|
||
|
edac_pci_int_store);
|
||
|
EDAC_PCI_ATTR(panic_on_pci_parity, S_IRUGO|S_IWUSR, edac_pci_int_show,
|
||
|
edac_pci_int_store);
|
||
|
EDAC_PCI_ATTR(pci_parity_count, S_IRUGO, edac_pci_int_show, NULL);
|
||
|
|
||
|
/* Base Attributes of the memory ECC object */
|
||
|
static struct edac_pci_dev_attribute *edac_pci_attr[] = {
|
||
|
&edac_pci_attr_check_pci_parity,
|
||
|
&edac_pci_attr_panic_on_pci_parity,
|
||
|
&edac_pci_attr_pci_parity_count,
|
||
|
NULL,
|
||
|
};
|
||
|
|
||
|
/* No memory to release */
|
||
|
static void edac_pci_release(struct kobject *kobj)
|
||
|
{
|
||
|
debugf1("%s()\n", __func__);
|
||
|
complete(&edac_pci_kobj_complete);
|
||
|
}
|
||
|
|
||
|
static struct kobj_type ktype_edac_pci = {
|
||
|
.release = edac_pci_release,
|
||
|
.sysfs_ops = &edac_pci_sysfs_ops,
|
||
|
.default_attrs = (struct attribute **) edac_pci_attr,
|
||
|
};
|
||
|
|
||
|
/**
|
||
|
* edac_sysfs_pci_setup()
|
||
|
*
|
||
|
* setup the sysfs for EDAC PCI attributes
|
||
|
* assumes edac_class has already been initialized
|
||
|
*/
|
||
|
int edac_sysfs_pci_setup(void)
|
||
|
{
|
||
|
int err;
|
||
|
struct sysdev_class *edac_class;
|
||
|
|
||
|
debugf1("%s()\n", __func__);
|
||
|
|
||
|
edac_class = edac_get_edac_class();
|
||
|
|
||
|
memset(&edac_pci_kobj, 0, sizeof(edac_pci_kobj));
|
||
|
edac_pci_kobj.parent = &edac_class->kset.kobj;
|
||
|
edac_pci_kobj.ktype = &ktype_edac_pci;
|
||
|
err = kobject_set_name(&edac_pci_kobj, "pci");
|
||
|
|
||
|
if (!err) {
|
||
|
/* Instanstiate the pci object */
|
||
|
/* FIXME: maybe new sysdev_create_subdir() */
|
||
|
err = kobject_register(&edac_pci_kobj);
|
||
|
|
||
|
if (err)
|
||
|
debugf1("Failed to register '.../edac/pci'\n");
|
||
|
else
|
||
|
debugf1("Registered '.../edac/pci' kobject\n");
|
||
|
}
|
||
|
|
||
|
return err;
|
||
|
}
|
||
|
|
||
|
/*
|
||
|
* edac_sysfs_pci_teardown
|
||
|
*
|
||
|
* perform the sysfs teardown for the PCI attributes
|
||
|
*/
|
||
|
void edac_sysfs_pci_teardown(void)
|
||
|
{
|
||
|
debugf0("%s()\n", __func__);
|
||
|
init_completion(&edac_pci_kobj_complete);
|
||
|
kobject_unregister(&edac_pci_kobj);
|
||
|
wait_for_completion(&edac_pci_kobj_complete);
|
||
|
}
|
||
|
|
||
|
|
||
|
static u16 get_pci_parity_status(struct pci_dev *dev, int secondary)
|
||
|
{
|
||
|
int where;
|
||
|
u16 status;
|
||
|
|
||
|
where = secondary ? PCI_SEC_STATUS : PCI_STATUS;
|
||
|
pci_read_config_word(dev, where, &status);
|
||
|
|
||
|
/* If we get back 0xFFFF then we must suspect that the card has been
|
||
|
* pulled but the Linux PCI layer has not yet finished cleaning up.
|
||
|
* We don't want to report on such devices
|
||
|
*/
|
||
|
|
||
|
if (status == 0xFFFF) {
|
||
|
u32 sanity;
|
||
|
|
||
|
pci_read_config_dword(dev, 0, &sanity);
|
||
|
|
||
|
if (sanity == 0xFFFFFFFF)
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
status &= PCI_STATUS_DETECTED_PARITY | PCI_STATUS_SIG_SYSTEM_ERROR |
|
||
|
PCI_STATUS_PARITY;
|
||
|
|
||
|
if (status)
|
||
|
/* reset only the bits we are interested in */
|
||
|
pci_write_config_word(dev, where, status);
|
||
|
|
||
|
return status;
|
||
|
}
|
||
|
|
||
|
typedef void (*pci_parity_check_fn_t) (struct pci_dev *dev);
|
||
|
|
||
|
/* Clear any PCI parity errors logged by this device. */
|
||
|
static void edac_pci_dev_parity_clear(struct pci_dev *dev)
|
||
|
{
|
||
|
u8 header_type;
|
||
|
|
||
|
get_pci_parity_status(dev, 0);
|
||
|
|
||
|
/* read the device TYPE, looking for bridges */
|
||
|
pci_read_config_byte(dev, PCI_HEADER_TYPE, &header_type);
|
||
|
|
||
|
if ((header_type & 0x7F) == PCI_HEADER_TYPE_BRIDGE)
|
||
|
get_pci_parity_status(dev, 1);
|
||
|
}
|
||
|
|
||
|
/*
|
||
|
* PCI Parity polling
|
||
|
*
|
||
|
*/
|
||
|
static void edac_pci_dev_parity_test(struct pci_dev *dev)
|
||
|
{
|
||
|
u16 status;
|
||
|
u8 header_type;
|
||
|
|
||
|
/* read the STATUS register on this device
|
||
|
*/
|
||
|
status = get_pci_parity_status(dev, 0);
|
||
|
|
||
|
debugf2("PCI STATUS= 0x%04x %s\n", status, dev->dev.bus_id );
|
||
|
|
||
|
/* check the status reg for errors */
|
||
|
if (status) {
|
||
|
if (status & (PCI_STATUS_SIG_SYSTEM_ERROR))
|
||
|
edac_printk(KERN_CRIT, EDAC_PCI,
|
||
|
"Signaled System Error on %s\n",
|
||
|
pci_name(dev));
|
||
|
|
||
|
if (status & (PCI_STATUS_PARITY)) {
|
||
|
edac_printk(KERN_CRIT, EDAC_PCI,
|
||
|
"Master Data Parity Error on %s\n",
|
||
|
pci_name(dev));
|
||
|
|
||
|
atomic_inc(&pci_parity_count);
|
||
|
}
|
||
|
|
||
|
if (status & (PCI_STATUS_DETECTED_PARITY)) {
|
||
|
edac_printk(KERN_CRIT, EDAC_PCI,
|
||
|
"Detected Parity Error on %s\n",
|
||
|
pci_name(dev));
|
||
|
|
||
|
atomic_inc(&pci_parity_count);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/* read the device TYPE, looking for bridges */
|
||
|
pci_read_config_byte(dev, PCI_HEADER_TYPE, &header_type);
|
||
|
|
||
|
debugf2("PCI HEADER TYPE= 0x%02x %s\n", header_type, dev->dev.bus_id );
|
||
|
|
||
|
if ((header_type & 0x7F) == PCI_HEADER_TYPE_BRIDGE) {
|
||
|
/* On bridges, need to examine secondary status register */
|
||
|
status = get_pci_parity_status(dev, 1);
|
||
|
|
||
|
debugf2("PCI SEC_STATUS= 0x%04x %s\n",
|
||
|
status, dev->dev.bus_id );
|
||
|
|
||
|
/* check the secondary status reg for errors */
|
||
|
if (status) {
|
||
|
if (status & (PCI_STATUS_SIG_SYSTEM_ERROR))
|
||
|
edac_printk(KERN_CRIT, EDAC_PCI, "Bridge "
|
||
|
"Signaled System Error on %s\n",
|
||
|
pci_name(dev));
|
||
|
|
||
|
if (status & (PCI_STATUS_PARITY)) {
|
||
|
edac_printk(KERN_CRIT, EDAC_PCI, "Bridge "
|
||
|
"Master Data Parity Error on "
|
||
|
"%s\n", pci_name(dev));
|
||
|
|
||
|
atomic_inc(&pci_parity_count);
|
||
|
}
|
||
|
|
||
|
if (status & (PCI_STATUS_DETECTED_PARITY)) {
|
||
|
edac_printk(KERN_CRIT, EDAC_PCI, "Bridge "
|
||
|
"Detected Parity Error on %s\n",
|
||
|
pci_name(dev));
|
||
|
|
||
|
atomic_inc(&pci_parity_count);
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/*
|
||
|
* pci_dev parity list iterator
|
||
|
* Scan the PCI device list for one iteration, looking for SERRORs
|
||
|
* Master Parity ERRORS or Parity ERRORs on primary or secondary devices
|
||
|
*/
|
||
|
static inline void edac_pci_dev_parity_iterator(pci_parity_check_fn_t fn)
|
||
|
{
|
||
|
struct pci_dev *dev = NULL;
|
||
|
|
||
|
/* request for kernel access to the next PCI device, if any,
|
||
|
* and while we are looking at it have its reference count
|
||
|
* bumped until we are done with it
|
||
|
*/
|
||
|
while((dev = pci_get_device(PCI_ANY_ID, PCI_ANY_ID, dev)) != NULL) {
|
||
|
fn(dev);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/*
|
||
|
* edac_pci_do_parity_check
|
||
|
*
|
||
|
* performs the actual PCI parity check operation
|
||
|
*/
|
||
|
void edac_pci_do_parity_check(void)
|
||
|
{
|
||
|
unsigned long flags;
|
||
|
int before_count;
|
||
|
|
||
|
debugf3("%s()\n", __func__);
|
||
|
|
||
|
if (!check_pci_parity)
|
||
|
return;
|
||
|
|
||
|
before_count = atomic_read(&pci_parity_count);
|
||
|
|
||
|
/* scan all PCI devices looking for a Parity Error on devices and
|
||
|
* bridges
|
||
|
*/
|
||
|
local_irq_save(flags);
|
||
|
edac_pci_dev_parity_iterator(edac_pci_dev_parity_test);
|
||
|
local_irq_restore(flags);
|
||
|
|
||
|
/* Only if operator has selected panic on PCI Error */
|
||
|
if (panic_on_pci_parity) {
|
||
|
/* If the count is different 'after' from 'before' */
|
||
|
if (before_count != atomic_read(&pci_parity_count))
|
||
|
panic("EDAC: PCI Parity Error");
|
||
|
}
|
||
|
}
|
||
|
|
||
|
void edac_pci_clear_parity_errors(void)
|
||
|
{
|
||
|
/* Clear any PCI bus parity errors that devices initially have logged
|
||
|
* in their registers.
|
||
|
*/
|
||
|
edac_pci_dev_parity_iterator(edac_pci_dev_parity_clear);
|
||
|
}
|
||
|
|
||
|
|
||
|
/*
|
||
|
* Define the PCI parameter to the module
|
||
|
*/
|
||
|
module_param(check_pci_parity, int, 0644);
|
||
|
MODULE_PARM_DESC(check_pci_parity, "Check for PCI bus parity errors: 0=off 1=on");
|
||
|
module_param(panic_on_pci_parity, int, 0644);
|
||
|
MODULE_PARM_DESC(panic_on_pci_parity, "Panic on PCI Bus Parity error: 0=off 1=on");
|
||
|
|
||
|
#endif /* CONFIG_PCI */
|