On Fam10h and later, bank 4 MCEs are reported only to the node base
core (NBC). Modify the do_inject() code path so that, for bank 4, the
MCx_STATUS and MCx_ADDR MSRs are written on the NBC of the target CPU.

Refer to D18F3x44[NbMcaToMstCpuEn] in the BKDGs for Fam10h and later
for details on why MC4 errors are reported only to the NBC MSRs.

Signed-off-by: Aravind Gopalakrishnan <aravind.gopalakrish...@amd.com>
---
 drivers/edac/mce_amd_inj.c | 21 +++++++++++++++++----
 1 file changed, 17 insertions(+), 4 deletions(-)

diff --git a/drivers/edac/mce_amd_inj.c b/drivers/edac/mce_amd_inj.c
index 0bd91a8..d4aa14f 100644
--- a/drivers/edac/mce_amd_inj.c
+++ b/drivers/edac/mce_amd_inj.c
@@ -126,6 +126,7 @@ static void do_inject(void)
 {
        u64 mcg_status = 0;
        unsigned int cpu = i_mce.extcpu;
+       int saved_cpu = -1;
        u8 b = i_mce.bank;
 
        if (!(i_mce.inject_flags & MCJ_EXCEPTION)) {
@@ -143,22 +144,34 @@ static void do_inject(void)
        if (!(i_mce.status & MCI_STATUS_PCC))
                mcg_status |= MCG_STATUS_RIPV;
 
-       toggle_hw_mce_inject(cpu, true);
-
        wrmsr_on_cpu(cpu, MSR_IA32_MCG_STATUS,
                     (u32)mcg_status, (u32)(mcg_status >> 32));
 
+       /*
+        * for Fam10h+, if bank = 4, then we should write to NBC MSR
+        * for multi-node processors else to core 0 for single node processors
+        */
+       if (boot_cpu_data.x86 >= 0x10 && b == 4) {
+               saved_cpu = cpu;
+               cpu = amd_get_nbc_for_cpu(cpu);
+       }
+
+       toggle_hw_mce_inject(cpu, true);
+
        wrmsr_on_cpu(cpu, MSR_IA32_MCx_STATUS(b),
                     (u32)i_mce.status, (u32)(i_mce.status >> 32));
 
        wrmsr_on_cpu(cpu, MSR_IA32_MCx_ADDR(b),
                     (u32)i_mce.addr, (u32)(i_mce.addr >> 32));
 
+       toggle_hw_mce_inject(cpu, false);
+
+       if (saved_cpu != -1)
+               cpu = saved_cpu;
+
        wrmsr_on_cpu(cpu, MSR_IA32_MCx_MISC(b),
                     (u32)i_mce.misc, (u32)(i_mce.misc >> 32));
 
-       toggle_hw_mce_inject(cpu, false);
-
        smp_call_function_single(cpu, trigger_mce, NULL, 0);
 
 err:
-- 
2.0.2

--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html
Please read the FAQ at  http://www.tux.org/lkml/

Reply via email to