x86/barrier: Do not serialize MSR accesses on AMD

author Borislav Petkov (AMD) <bp@alien8.de>

Fri, 27 Oct 2023 12:24:16 +0000 (14:24 +0200)

committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Sat, 14 Dec 2024 18:50:42 +0000 (19:50 +0100)
author Borislav Petkov (AMD) <bp@alien8.de>
Fri, 27 Oct 2023 12:24:16 +0000 (14:24 +0200)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Sat, 14 Dec 2024 18:50:42 +0000 (19:50 +0100)
diff --git a/arch/x86/include/asm/barrier.h b/arch/x86/include/asm/barrier.h

index 3ba772a69cc8baf5ab6b0065527d353c3ac04bd0..dab2db15a8c471c8038edbdff1b54b55c75b0182 100644 (file)
--- a/arch/x86/include/asm/barrier.h
+++ b/arch/x86/include/asm/barrier.h
@@ -81,22 +81,4 @@ do {                                                                 \
  
  #include <asm-generic/barrier.h>
  
-/*
- * Make previous memory operations globally visible before
- * a WRMSR.
- *
- * MFENCE makes writes visible, but only affects load/store
- * instructions.  WRMSR is unfortunately not a load/store
- * instruction and is unaffected by MFENCE.  The LFENCE ensures
- * that the WRMSR is not reordered.
- *
- * Most WRMSRs are full serializing instructions themselves and
- * do not require this barrier.  This is only required for the
- * IA32_TSC_DEADLINE and X2APIC MSRs.
- */
-static inline void weak_wrmsr_fence(void)
-{
-       asm volatile("mfence; lfence" : : : "memory");
-}
-
  #endif /* _ASM_X86_BARRIER_H */
diff --git a/arch/x86/include/asm/cpufeatures.h b/arch/x86/include/asm/cpufeatures.h

index 3c0f7e3324788deac2f9038c4806347ddd9c798b..4faa47cc1a5c3cac0a4c917f5c6dea53dd40fcbf 100644 (file)
--- a/arch/x86/include/asm/cpufeatures.h
+++ b/arch/x86/include/asm/cpufeatures.h
@@ -309,6 +309,7 @@
  #define X86_FEATURE_SRSO               (11*32+24) /* "" AMD BTB untrain RETs */
  #define X86_FEATURE_SRSO_ALIAS         (11*32+25) /* "" AMD BTB untrain RETs through aliasing */
  #define X86_FEATURE_IBPB_ON_VMEXIT     (11*32+26) /* "" Issue an IBPB only on VMEXIT */
+#define X86_FEATURE_APIC_MSRS_FENCE    (11*32+27) /* "" IA32_TSC_DEADLINE and X2APIC MSRs need fencing */
  
  /* Intel-defined CPU features, CPUID level 0x00000007:1 (EAX), word 12 */
  #define X86_FEATURE_AVX_VNNI           (12*32+ 4) /* AVX VNNI instructions */
diff --git a/arch/x86/include/asm/processor.h b/arch/x86/include/asm/processor.h

index 0702e0c5dbb8d27ec4e4c86c03e7c48bd6d0def4..b7186deb8262bb772564762b588005bd451c9c9b 100644 (file)
--- a/arch/x86/include/asm/processor.h
+++ b/arch/x86/include/asm/processor.h
@@ -860,4 +860,22 @@ enum mds_mitigations {
  
  extern bool gds_ucode_mitigated(void);
  
+/*
+ * Make previous memory operations globally visible before
+ * a WRMSR.
+ *
+ * MFENCE makes writes visible, but only affects load/store
+ * instructions.  WRMSR is not a load/store instruction and is
+ * unaffected by MFENCE.  The LFENCE ensures that the WRMSR is
+ * not reordered.  Most WRMSRs are fully serializing themselves;
+ * only the IA32_TSC_DEADLINE and X2APIC MSRs need this barrier.
+ *
+ * The fence is patched out via alternatives on CPUs that do not
+ * set X86_FEATURE_APIC_MSRS_FENCE (cleared for AMD and Hygon).
+ */
+static inline void weak_wrmsr_fence(void)
+{
+       alternative("mfence; lfence", "", ALT_NOT(X86_FEATURE_APIC_MSRS_FENCE));
+}
+
  #endif /* _ASM_X86_PROCESSOR_H */
diff --git a/arch/x86/kernel/cpu/amd.c b/arch/x86/kernel/cpu/amd.c

index 9fb890574f36bbee91f3c1bb90d67de320872051..ce5b27db65e10f34d02df4a7d61102e5059d5c55 100644 (file)
--- a/arch/x86/kernel/cpu/amd.c
+++ b/arch/x86/kernel/cpu/amd.c
@@ -1158,6 +1158,9 @@ static void init_amd(struct cpuinfo_x86 *c)
         if (!cpu_has(c, X86_FEATURE_HYPERVISOR) &&
              cpu_has_amd_erratum(c, amd_erratum_1485))
                 msr_set_bit(MSR_ZEN4_BP_CFG, MSR_ZEN4_BP_CFG_SHARED_BTB_FIX_BIT);
+
+       /* AMD CPUs don't need fencing before x2APIC/TSC_DEADLINE MSR writes. */
+       clear_cpu_cap(c, X86_FEATURE_APIC_MSRS_FENCE);
  }
  
  #ifdef CONFIG_X86_32
diff --git a/arch/x86/kernel/cpu/common.c b/arch/x86/kernel/cpu/common.c

index f0cc4c616ceb34e1a6bcecb6c6bb4a3573eb97bd..93b5cd12b9d4c5eba6d47b74b39729e981df5cca 100644 (file)
--- a/arch/x86/kernel/cpu/common.c
+++ b/arch/x86/kernel/cpu/common.c
@@ -1733,6 +1733,13 @@ static void identify_cpu(struct cpuinfo_x86 *c)
         c->apicid = apic->phys_pkg_id(c->initial_apicid, 0);
  #endif
  
+
+       /*
+        * Set default APIC and TSC_DEADLINE MSR fencing flag. AMD and
+        * Hygon will clear it in ->c_init() below.
+        */
+       set_cpu_cap(c, X86_FEATURE_APIC_MSRS_FENCE);
+
         /*
          * Vendor-specific initialization.  In this section we
          * canonicalize the feature flags, meaning if there are
diff --git a/arch/x86/kernel/cpu/hygon.c b/arch/x86/kernel/cpu/hygon.c

index 9e8380bd4fb9fd89c56b457af80e9710b02f37a3..8a80d5343f3a12025b6a5d6a058383f31f2e8d15 100644 (file)
--- a/arch/x86/kernel/cpu/hygon.c
+++ b/arch/x86/kernel/cpu/hygon.c
@@ -347,6 +347,9 @@ static void init_hygon(struct cpuinfo_x86 *c)
                 set_cpu_bug(c, X86_BUG_SYSRET_SS_ATTRS);
  
         check_null_seg_clears_base(c);
+
+       /* Hygon CPUs don't need fencing before x2APIC/TSC_DEADLINE MSR writes. */
+       clear_cpu_cap(c, X86_FEATURE_APIC_MSRS_FENCE);
  }
  
  static void cpu_detect_tlb_hygon(struct cpuinfo_x86 *c)
author	Borislav Petkov (AMD) <bp@alien8.de>
	Fri, 27 Oct 2023 12:24:16 +0000 (14:24 +0200)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Sat, 14 Dec 2024 18:50:42 +0000 (19:50 +0100)
arch/x86/include/asm/barrier.h		patch \| blob \| blame \| history
arch/x86/include/asm/cpufeatures.h		patch \| blob \| blame \| history
arch/x86/include/asm/processor.h		patch \| blob \| blame \| history
arch/x86/kernel/cpu/amd.c		patch \| blob \| blame \| history
arch/x86/kernel/cpu/common.c		patch \| blob \| blame \| history
arch/x86/kernel/cpu/hygon.c		patch \| blob \| blame \| history