2005-04-16 16:20:36 -06:00
|
|
|
/*
|
|
|
|
* Non Fatal Machine Check Exception Reporting
|
|
|
|
*
|
2008-10-20 11:31:45 -06:00
|
|
|
* (C) Copyright 2002 Dave Jones. <davej@redhat.com>
|
2005-04-16 16:20:36 -06:00
|
|
|
*
|
|
|
|
* This file contains routines to check for non-fatal MCEs every 15s
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <linux/init.h>
|
|
|
|
#include <linux/types.h>
|
|
|
|
#include <linux/kernel.h>
|
|
|
|
#include <linux/jiffies.h>
|
|
|
|
#include <linux/workqueue.h>
|
|
|
|
#include <linux/interrupt.h>
|
|
|
|
#include <linux/smp.h>
|
|
|
|
#include <linux/module.h>
|
|
|
|
|
2008-02-22 15:10:49 -07:00
|
|
|
#include <asm/processor.h>
|
2005-04-16 16:20:36 -06:00
|
|
|
#include <asm/system.h>
|
|
|
|
#include <asm/msr.h>
|
|
|
|
|
|
|
|
#include "mce.h"
|
|
|
|
|
|
|
|
/*
 * Index of the first machine-check bank that mce_checkregs() polls.
 * Set once by init_nonfatal_mce_checker() before polling is scheduled.
 */
static int firstbank;

/*
 * Polling interval in jiffies.  The expansion is parenthesised so the
 * macro behaves as a single operand in any surrounding expression
 * (e.g. "x / MCE_RATE" must not expand to "x / 15 * HZ").
 */
#define MCE_RATE (15 * HZ) /* timer rate is 15s */
|
|
|
|
|
2008-02-22 15:10:49 -07:00
|
|
|
static void mce_checkregs(void *info)
|
2005-04-16 16:20:36 -06:00
|
|
|
{
|
|
|
|
u32 low, high;
|
|
|
|
int i;
|
|
|
|
|
2008-02-22 15:10:49 -07:00
|
|
|
for (i = firstbank; i < nr_mce_banks; i++) {
|
|
|
|
rdmsr(MSR_IA32_MC0_STATUS+i*4, low, high);
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
if (high & (1<<31)) {
|
|
|
|
printk(KERN_INFO "MCE: The hardware reports a non "
|
|
|
|
"fatal, correctable incident occurred on "
|
|
|
|
"CPU %d.\n",
|
|
|
|
smp_processor_id());
|
2008-02-22 15:10:49 -07:00
|
|
|
printk(KERN_INFO "Bank %d: %08x%08x\n", i, high, low);
|
2005-04-16 16:20:36 -06:00
|
|
|
|
2008-02-22 15:10:49 -07:00
|
|
|
/*
|
|
|
|
* Scrub the error so we don't pick it up in MCE_RATE
|
|
|
|
* seconds time.
|
|
|
|
*/
|
|
|
|
wrmsr(MSR_IA32_MC0_STATUS+i*4, 0UL, 0UL);
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
/* Serialize */
|
|
|
|
wmb();
|
|
|
|
add_taint(TAINT_MACHINE_CHECK);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2006-11-22 07:57:56 -07:00
|
|
|
static void mce_work_fn(struct work_struct *work);
|
|
|
|
static DECLARE_DELAYED_WORK(mce_work, mce_work_fn);
|
2005-04-16 16:20:36 -06:00
|
|
|
|
2006-11-22 07:57:56 -07:00
|
|
|
static void mce_work_fn(struct work_struct *work)
|
2008-02-22 15:10:49 -07:00
|
|
|
{
|
2008-05-09 01:39:44 -06:00
|
|
|
on_each_cpu(mce_checkregs, NULL, 1);
|
2007-07-21 09:10:44 -06:00
|
|
|
schedule_delayed_work(&mce_work, round_jiffies_relative(MCE_RATE));
|
2008-02-22 15:10:49 -07:00
|
|
|
}
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
static int __init init_nonfatal_mce_checker(void)
|
|
|
|
{
|
|
|
|
struct cpuinfo_x86 *c = &boot_cpu_data;
|
|
|
|
|
|
|
|
/* Check for MCE support */
|
|
|
|
if (!cpu_has(c, X86_FEATURE_MCE))
|
|
|
|
return -ENODEV;
|
|
|
|
|
|
|
|
/* Check for PPro style MCA */
|
|
|
|
if (!cpu_has(c, X86_FEATURE_MCA))
|
|
|
|
return -ENODEV;
|
|
|
|
|
|
|
|
/* Some Athlons misbehave when we frob bank 0 */
|
|
|
|
if (boot_cpu_data.x86_vendor == X86_VENDOR_AMD &&
|
|
|
|
boot_cpu_data.x86 == 6)
|
|
|
|
firstbank = 1;
|
|
|
|
else
|
|
|
|
firstbank = 0;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Check for non-fatal errors every MCE_RATE s
|
|
|
|
*/
|
2007-07-21 09:10:44 -06:00
|
|
|
schedule_delayed_work(&mce_work, round_jiffies_relative(MCE_RATE));
|
2005-04-16 16:20:36 -06:00
|
|
|
printk(KERN_INFO "Machine check exception polling timer started.\n");
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
module_init(init_nonfatal_mce_checker);
|
|
|
|
|
|
|
|
MODULE_LICENSE("GPL");
|