|
@@ -85,6 +85,18 @@ static DECLARE_WAIT_QUEUE_HEAD(mce_wait);
|
|
static DEFINE_PER_CPU(struct mce, mces_seen);
|
|
static DEFINE_PER_CPU(struct mce, mces_seen);
|
|
static int cpu_missing;
|
|
static int cpu_missing;
|
|
|
|
|
|
|
|
+static void default_decode_mce(struct mce *m)
|
|
|
|
+{
|
|
|
|
+ pr_emerg("No human readable MCE decoding support on this CPU type.\n");
|
|
|
|
+ pr_emerg("Run the message through 'mcelog --ascii' to decode.\n");
|
|
|
|
+}
|
|
|
|
+
|
|
|
|
+/*
|
|
|
|
+ * CPU/chipset specific EDAC code can register a callback here to print
|
|
|
|
+ * MCE errors in a human-readable form:
|
|
|
|
+ */
|
|
|
|
+void (*x86_mce_decode_callback)(struct mce *m) = default_decode_mce;
|
|
|
|
+EXPORT_SYMBOL(x86_mce_decode_callback);
|
|
|
|
|
|
/* MCA banks polled by the period polling timer for corrected events */
|
|
/* MCA banks polled by the period polling timer for corrected events */
|
|
DEFINE_PER_CPU(mce_banks_t, mce_poll_banks) = {
|
|
DEFINE_PER_CPU(mce_banks_t, mce_poll_banks) = {
|
|
@@ -165,46 +177,46 @@ void mce_log(struct mce *mce)
|
|
set_bit(0, &mce_need_notify);
|
|
set_bit(0, &mce_need_notify);
|
|
}
|
|
}
|
|
|
|
|
|
-void __weak decode_mce(struct mce *m)
|
|
|
|
-{
|
|
|
|
- return;
|
|
|
|
-}
|
|
|
|
-
|
|
|
|
static void print_mce(struct mce *m)
|
|
static void print_mce(struct mce *m)
|
|
{
|
|
{
|
|
- printk(KERN_EMERG
|
|
|
|
- "CPU %d: Machine Check Exception: %16Lx Bank %d: %016Lx\n",
|
|
|
|
|
|
+ pr_emerg("CPU %d: Machine Check Exception: %16Lx Bank %d: %016Lx\n",
|
|
m->extcpu, m->mcgstatus, m->bank, m->status);
|
|
m->extcpu, m->mcgstatus, m->bank, m->status);
|
|
|
|
+
|
|
if (m->ip) {
|
|
if (m->ip) {
|
|
- printk(KERN_EMERG "RIP%s %02x:<%016Lx> ",
|
|
|
|
- !(m->mcgstatus & MCG_STATUS_EIPV) ? " !INEXACT!" : "",
|
|
|
|
- m->cs, m->ip);
|
|
|
|
|
|
+ pr_emerg("RIP%s %02x:<%016Lx> ",
|
|
|
|
+ !(m->mcgstatus & MCG_STATUS_EIPV) ? " !INEXACT!" : "",
|
|
|
|
+ m->cs, m->ip);
|
|
|
|
+
|
|
if (m->cs == __KERNEL_CS)
|
|
if (m->cs == __KERNEL_CS)
|
|
print_symbol("{%s}", m->ip);
|
|
print_symbol("{%s}", m->ip);
|
|
- printk(KERN_CONT "\n");
|
|
|
|
|
|
+ pr_cont("\n");
|
|
}
|
|
}
|
|
- printk(KERN_EMERG "TSC %llx ", m->tsc);
|
|
|
|
|
|
+
|
|
|
|
+ pr_emerg("TSC %llx ", m->tsc);
|
|
if (m->addr)
|
|
if (m->addr)
|
|
- printk(KERN_CONT "ADDR %llx ", m->addr);
|
|
|
|
|
|
+ pr_cont("ADDR %llx ", m->addr);
|
|
if (m->misc)
|
|
if (m->misc)
|
|
- printk(KERN_CONT "MISC %llx ", m->misc);
|
|
|
|
- printk(KERN_CONT "\n");
|
|
|
|
- printk(KERN_EMERG "PROCESSOR %u:%x TIME %llu SOCKET %u APIC %x\n",
|
|
|
|
- m->cpuvendor, m->cpuid, m->time, m->socketid,
|
|
|
|
- m->apicid);
|
|
|
|
|
|
+ pr_cont("MISC %llx ", m->misc);
|
|
|
|
+
|
|
|
|
+ pr_cont("\n");
|
|
|
|
+ pr_emerg("PROCESSOR %u:%x TIME %llu SOCKET %u APIC %x\n",
|
|
|
|
+ m->cpuvendor, m->cpuid, m->time, m->socketid, m->apicid);
|
|
|
|
|
|
- decode_mce(m);
|
|
|
|
|
|
+ /*
|
|
|
|
+ * Print out human-readable details about the MCE error,
|
|
|
|
+ * (if the CPU has an implementation for that):
|
|
|
|
+ */
|
|
|
|
+ x86_mce_decode_callback(m);
|
|
}
|
|
}
|
|
|
|
|
|
static void print_mce_head(void)
|
|
static void print_mce_head(void)
|
|
{
|
|
{
|
|
- printk(KERN_EMERG "\nHARDWARE ERROR\n");
|
|
|
|
|
|
+ pr_emerg("\nHARDWARE ERROR\n");
|
|
}
|
|
}
|
|
|
|
|
|
static void print_mce_tail(void)
|
|
static void print_mce_tail(void)
|
|
{
|
|
{
|
|
- printk(KERN_EMERG "This is not a software problem!\n"
|
|
|
|
- "Run through mcelog --ascii to decode and contact your hardware vendor\n");
|
|
|
|
|
|
+ pr_emerg("This is not a software problem!\n");
|
|
}
|
|
}
|
|
|
|
|
|
#define PANIC_TIMEOUT 5 /* 5 seconds */
|
|
#define PANIC_TIMEOUT 5 /* 5 seconds */
|
|
@@ -218,6 +230,7 @@ static atomic_t mce_fake_paniced;
|
|
static void wait_for_panic(void)
|
|
static void wait_for_panic(void)
|
|
{
|
|
{
|
|
long timeout = PANIC_TIMEOUT*USEC_PER_SEC;
|
|
long timeout = PANIC_TIMEOUT*USEC_PER_SEC;
|
|
|
|
+
|
|
preempt_disable();
|
|
preempt_disable();
|
|
local_irq_enable();
|
|
local_irq_enable();
|
|
while (timeout-- > 0)
|
|
while (timeout-- > 0)
|
|
@@ -285,6 +298,7 @@ static void mce_panic(char *msg, struct mce *final, char *exp)
|
|
static int msr_to_offset(u32 msr)
|
|
static int msr_to_offset(u32 msr)
|
|
{
|
|
{
|
|
unsigned bank = __get_cpu_var(injectm.bank);
|
|
unsigned bank = __get_cpu_var(injectm.bank);
|
|
|
|
+
|
|
if (msr == rip_msr)
|
|
if (msr == rip_msr)
|
|
return offsetof(struct mce, ip);
|
|
return offsetof(struct mce, ip);
|
|
if (msr == MSR_IA32_MCx_STATUS(bank))
|
|
if (msr == MSR_IA32_MCx_STATUS(bank))
|