diff options
author | Hidetoshi Seto <seto.hidetoshi@jp.fujitsu.com> | 2009-08-26 03:20:36 -0400 |
---|---|---|
committer | Ingo Molnar <mingo@elte.hu> | 2009-08-26 14:21:11 -0400 |
commit | 680b6cfd3cee30a7d997d49430fb73af84523853 (patch) | |
tree | b1ba1c3acb3611fc84aaaa5d5216a64db3b6a06e | |
parent | bf783f9f7d33576815bc89f9f1856a7309ea2f17 (diff) |
x86, mce: CE in last bank prevents panic by unknown MCE
If the MCE handler is called but none of the mces_seen entries holds a
machine check event that could have signaled the MCE (i.e. an event with
severity higher than MCE_KEEP_SEVERITY), a panic with "Machine check from
unknown source" is taken, since the MCE is assumed to have been signaled
by an external agent or a similar source.
Usually mces_seen never points to an MCE_KEEP_SEVERITY event such as a
CE. But it can happen, because the initial value of mces_seen is
accidentally modified by mce_no_way_out(): if mce_no_way_out() runs
through all banks and the last bank has a CE, mces_seen ends up pointing
to that CE and the "Machine check from unknown source" panic is not
taken.
This patch fixes this undesired behavior, and clarifies the logic.
Signed-off-by: Hidetoshi Seto <seto.hidetoshi@jp.fujitsu.com>
Cc: H. Peter Anvin <hpa@zytor.com>
Cc: Andi Kleen <ak@linux.intel.com>
Cc: Jin Dongming <jin.dongming@np.css.fujitsu.com>
LKML-Reference: <4A94E244.3020301@jp.fujitsu.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Reported-by: Jin Dongming <jin.dongming@np.css.fujitsu.com>
-rw-r--r-- | arch/x86/kernel/cpu/mcheck/mce.c | 8 |
1 files changed, 4 insertions, 4 deletions
diff --git a/arch/x86/kernel/cpu/mcheck/mce.c b/arch/x86/kernel/cpu/mcheck/mce.c index 54bd1b2fb4c0..325559d1aa58 100644 --- a/arch/x86/kernel/cpu/mcheck/mce.c +++ b/arch/x86/kernel/cpu/mcheck/mce.c | |||
@@ -612,7 +612,7 @@ out: | |||
612 | * This way we prevent any potential data corruption in a unrecoverable case | 612 | * This way we prevent any potential data corruption in a unrecoverable case |
613 | * and also makes sure always all CPU's errors are examined. | 613 | * and also makes sure always all CPU's errors are examined. |
614 | * | 614 | * |
615 | * Also this detects the case of an machine check event coming from outer | 615 | * Also this detects the case of a machine check event coming from outer |
616 | * space (not detected by any CPUs) In this case some external agent wants | 616 | * space (not detected by any CPUs) In this case some external agent wants |
617 | * us to shut down, so panic too. | 617 | * us to shut down, so panic too. |
618 | * | 618 | * |
@@ -665,7 +665,7 @@ static void mce_reign(void) | |||
665 | * No machine check event found. Must be some external | 665 | * No machine check event found. Must be some external |
666 | * source or one CPU is hung. Panic. | 666 | * source or one CPU is hung. Panic. |
667 | */ | 667 | */ |
668 | if (!m && tolerant < 3) | 668 | if (global_worst <= MCE_KEEP_SEVERITY && tolerant < 3) |
669 | mce_panic("Machine check from unknown source", NULL, NULL); | 669 | mce_panic("Machine check from unknown source", NULL, NULL); |
670 | 670 | ||
671 | /* | 671 | /* |
@@ -889,11 +889,11 @@ void do_machine_check(struct pt_regs *regs, long error_code) | |||
889 | mce_setup(&m); | 889 | mce_setup(&m); |
890 | 890 | ||
891 | m.mcgstatus = mce_rdmsrl(MSR_IA32_MCG_STATUS); | 891 | m.mcgstatus = mce_rdmsrl(MSR_IA32_MCG_STATUS); |
892 | no_way_out = mce_no_way_out(&m, &msg); | ||
893 | |||
894 | final = &__get_cpu_var(mces_seen); | 892 | final = &__get_cpu_var(mces_seen); |
895 | *final = m; | 893 | *final = m; |
896 | 894 | ||
895 | no_way_out = mce_no_way_out(&m, &msg); | ||
896 | |||
897 | barrier(); | 897 | barrier(); |
898 | 898 | ||
899 | /* | 899 | /* |