x86/mce: Enable additional error logging on certain Intel CPUs
authorTony Luck <tony.luck@intel.com>
Fri, 30 Oct 2020 19:04:00 +0000 (12:04 -0700)
committerBorislav Petkov <bp@suse.de>
Mon, 2 Nov 2020 10:15:59 +0000 (11:15 +0100)
The Xeon versions of Sandy Bridge, Ivy Bridge and Haswell support an
optional additional error logging mode which is enabled by an MSR.

Previously, this mode was enabled from the mcelog(8) tool via /dev/cpu,
but userspace should not be poking at MSRs. So move the enabling into
the kernel.

 [ bp: Correct the explanation why this is done. ]

Suggested-by: Boris Petkov <bp@alien8.de>
Signed-off-by: Tony Luck <tony.luck@intel.com>
Signed-off-by: Borislav Petkov <bp@suse.de>
Link: https://lkml.kernel.org/r/20201030190807.GA13884@agluck-desk2.amr.corp.intel.com
arch/x86/include/asm/msr-index.h
arch/x86/kernel/cpu/mce/intel.c

index 972a34d935059aa49d01db8f20c3e598fffb22ac..b2dd2648c0e23ba22e60b23d550f72e7abeeb377 100644 (file)
 #define MSR_IA32_MCG_CAP               0x00000179
 #define MSR_IA32_MCG_STATUS            0x0000017a
 #define MSR_IA32_MCG_CTL               0x0000017b
+#define MSR_ERROR_CONTROL              0x0000017f
 #define MSR_IA32_MCG_EXT_CTL           0x000004d0
 
 #define MSR_OFFCORE_RSP_0              0x000001a6
index abe9fe0fb8517ce9b1af73740684708a83f07829..b47883e364b40115e7711429ae3e7e8479caebdb 100644 (file)
@@ -509,12 +509,32 @@ static void intel_ppin_init(struct cpuinfo_x86 *c)
        }
 }
 
+/*
+ * Enable additional error logs from the integrated
+ * memory controller on processors that support this.
+ */
+static void intel_imc_init(struct cpuinfo_x86 *c)
+{
+       u64 error_control;
+
+       switch (c->x86_model) {
+       case INTEL_FAM6_SANDYBRIDGE_X:
+       case INTEL_FAM6_IVYBRIDGE_X:
+       case INTEL_FAM6_HASWELL_X:
+               rdmsrl(MSR_ERROR_CONTROL, error_control);
+               error_control |= 2;
+               wrmsrl(MSR_ERROR_CONTROL, error_control);
+               break;
+       }
+}
+
 void mce_intel_feature_init(struct cpuinfo_x86 *c)
 {
        intel_init_thermal(c);
        intel_init_cmci();
        intel_init_lmce();
        intel_ppin_init(c);
+       intel_imc_init(c);
 }
 
 void mce_intel_feature_clear(struct cpuinfo_x86 *c)