aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author: Hidetoshi Seto <seto.hidetoshi@jp.fujitsu.com> 2009-08-26 03:20:36 -0400
committer: Ingo Molnar <mingo@elte.hu> 2009-08-26 14:21:11 -0400
commit: 680b6cfd3cee30a7d997d49430fb73af84523853 (patch)
tree: b1ba1c3acb3611fc84aaaa5d5216a64db3b6a06e
parent: bf783f9f7d33576815bc89f9f1856a7309ea2f17 (diff)
x86, mce: CE in last bank prevents panic by unknown MCE
If the MCE handler is called but none of the mces_seen entries holds a machine check event that could have signaled the MCE (i.e. an event with severity higher than MCE_KEEP_SEVERITY), a panic with "Machine check from unknown source" is taken, since the MCE is assumed to have been signaled by an external agent or the like.

Usually mces_seen never points to an MCE_KEEP_SEVERITY event such as a CE (corrected error). But it can happen, because the initial value of mces_seen is accidentally modified by mce_no_way_out(): if mce_no_way_out() runs through all banks and the last bank has a CE, mces_seen points to that CE and the "panic by unknown" is not taken.

This patch fixes this undesired behavior and clarifies the logic.

Signed-off-by: Hidetoshi Seto <seto.hidetoshi@jp.fujitsu.com>
Cc: H. Peter Anvin <hpa@zytor.com>
Cc: Andi Kleen <ak@linux.intel.com>
Cc: Jin Dongming <jin.dongming@np.css.fujitsu.com>
LKML-Reference: <4A94E244.3020301@jp.fujitsu.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Reported-by: Jin Dongming <jin.dongming@np.css.fujitsu.com>
-rw-r--r-- arch/x86/kernel/cpu/mcheck/mce.c | 8
1 file changed, 4 insertions, 4 deletions
diff --git a/arch/x86/kernel/cpu/mcheck/mce.c b/arch/x86/kernel/cpu/mcheck/mce.c
index 54bd1b2fb4c0..325559d1aa58 100644
--- a/arch/x86/kernel/cpu/mcheck/mce.c
+++ b/arch/x86/kernel/cpu/mcheck/mce.c
@@ -612,7 +612,7 @@ out:
612 * This way we prevent any potential data corruption in a unrecoverable case 612 * This way we prevent any potential data corruption in a unrecoverable case
613 * and also makes sure always all CPU's errors are examined. 613 * and also makes sure always all CPU's errors are examined.
614 * 614 *
615 * Also this detects the case of an machine check event coming from outer 615 * Also this detects the case of a machine check event coming from outer
616 * space (not detected by any CPUs) In this case some external agent wants 616 * space (not detected by any CPUs) In this case some external agent wants
617 * us to shut down, so panic too. 617 * us to shut down, so panic too.
618 * 618 *
@@ -665,7 +665,7 @@ static void mce_reign(void)
665 * No machine check event found. Must be some external 665 * No machine check event found. Must be some external
666 * source or one CPU is hung. Panic. 666 * source or one CPU is hung. Panic.
667 */ 667 */
668 if (!m && tolerant < 3) 668 if (global_worst <= MCE_KEEP_SEVERITY && tolerant < 3)
669 mce_panic("Machine check from unknown source", NULL, NULL); 669 mce_panic("Machine check from unknown source", NULL, NULL);
670 670
671 /* 671 /*
@@ -889,11 +889,11 @@ void do_machine_check(struct pt_regs *regs, long error_code)
889 mce_setup(&m); 889 mce_setup(&m);
890 890
891 m.mcgstatus = mce_rdmsrl(MSR_IA32_MCG_STATUS); 891 m.mcgstatus = mce_rdmsrl(MSR_IA32_MCG_STATUS);
892 no_way_out = mce_no_way_out(&m, &msg);
893
894 final = &__get_cpu_var(mces_seen); 892 final = &__get_cpu_var(mces_seen);
895 *final = m; 893 *final = m;
896 894
895 no_way_out = mce_no_way_out(&m, &msg);
896
897 barrier(); 897 barrier();
898 898
899 /* 899 /*