x86/barrier: Do not serialize MSR accesses on AMD

author Borislav Petkov (AMD) <bp@alien8.de>

Fri, 27 Oct 2023 12:24:16 +0000 (14:24 +0200)

committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Sat, 14 Dec 2024 18:47:43 +0000 (19:47 +0100)
author Borislav Petkov (AMD) <bp@alien8.de>
Fri, 27 Oct 2023 12:24:16 +0000 (14:24 +0200)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Sat, 14 Dec 2024 18:47:43 +0000 (19:47 +0100)
diff --git a/arch/x86/include/asm/barrier.h b/arch/x86/include/asm/barrier.h

index 4819d5e5a3353d7db2fa314f9665a6cd07db741a..7f828fe497978e3132a2c6d87786d02029719fd2 100644 (file)
--- a/arch/x86/include/asm/barrier.h
+++ b/arch/x86/include/asm/barrier.h
@@ -84,22 +84,4 @@ do {                                                                 \
  
  #include <asm-generic/barrier.h>
  
-/*
- * Make previous memory operations globally visible before
- * a WRMSR.
- *
- * MFENCE makes writes visible, but only affects load/store
- * instructions.  WRMSR is unfortunately not a load/store
- * instruction and is unaffected by MFENCE.  The LFENCE ensures
- * that the WRMSR is not reordered.
- *
- * Most WRMSRs are full serializing instructions themselves and
- * do not require this barrier.  This is only required for the
- * IA32_TSC_DEADLINE and X2APIC MSRs.
- */
-static inline void weak_wrmsr_fence(void)
-{
-       asm volatile("mfence; lfence" : : : "memory");
-}
-
  #endif /* _ASM_X86_BARRIER_H */
diff --git a/arch/x86/include/asm/cpufeatures.h b/arch/x86/include/asm/cpufeatures.h

index 23f563493e810bce4986bdd534902d3bc4699535..f3365ec973763bbfe94c335ee9811f93272b0c80 100644 (file)
--- a/arch/x86/include/asm/cpufeatures.h
+++ b/arch/x86/include/asm/cpufeatures.h
@@ -305,6 +305,7 @@
  #define X86_FEATURE_SRSO               (11*32+24) /* "" AMD BTB untrain RETs */
  #define X86_FEATURE_SRSO_ALIAS         (11*32+25) /* "" AMD BTB untrain RETs through aliasing */
  #define X86_FEATURE_IBPB_ON_VMEXIT     (11*32+26) /* "" Issue an IBPB only on VMEXIT */
+#define X86_FEATURE_APIC_MSRS_FENCE    (11*32+27) /* "" IA32_TSC_DEADLINE and X2APIC MSRs need fencing */
  
  /* Intel-defined CPU features, CPUID level 0x00000007:1 (EAX), word 12 */
  #define X86_FEATURE_AVX512_BF16                (12*32+ 5) /* AVX512 BFLOAT16 instructions */
diff --git a/arch/x86/include/asm/processor.h b/arch/x86/include/asm/processor.h

index c682a14299e0ed5de8a9f9de3f53fbeacf0d7236..5defef9f286e143ca47e3e8ed367e07a7d1d0621 100644 (file)
--- a/arch/x86/include/asm/processor.h
+++ b/arch/x86/include/asm/processor.h
@@ -858,4 +858,22 @@ enum mds_mitigations {
  
  extern bool gds_ucode_mitigated(void);
  
+/*
+ * Make previous memory operations globally visible before a WRMSR.
+ *
+ * MFENCE makes writes visible, but only affects load/store
+ * instructions.  WRMSR is unfortunately not a load/store
+ * instruction and is unaffected by MFENCE.  The LFENCE ensures
+ * that the WRMSR is not reordered.
+ *
+ * Most WRMSRs are fully serializing instructions themselves and
+ * do not require this barrier.  It is only required for the
+ * IA32_TSC_DEADLINE and X2APIC MSRs, and only on CPUs which have
+ * X86_FEATURE_APIC_MSRS_FENCE set; elsewhere it is patched out.
+ */
+static inline void weak_wrmsr_fence(void)
+{
+       alternative("mfence; lfence", "", ALT_NOT(X86_FEATURE_APIC_MSRS_FENCE));
+}
+
  #endif /* _ASM_X86_PROCESSOR_H */
diff --git a/arch/x86/kernel/cpu/amd.c b/arch/x86/kernel/cpu/amd.c

index 3b02cb8b0533859954b21244da0a413d65ee7340..c10f7dcaa7b7c715f9fdc4d069a860a054d41c59 100644 (file)
--- a/arch/x86/kernel/cpu/amd.c
+++ b/arch/x86/kernel/cpu/amd.c
@@ -1186,6 +1186,9 @@ static void init_amd(struct cpuinfo_x86 *c)
         if (!cpu_has(c, X86_FEATURE_HYPERVISOR) &&
              cpu_has_amd_erratum(c, amd_erratum_1485))
                 msr_set_bit(MSR_ZEN4_BP_CFG, MSR_ZEN4_BP_CFG_SHARED_BTB_FIX_BIT);
+
+       /* AMD CPUs don't need fencing before x2APIC/TSC_DEADLINE MSR writes. */
+       clear_cpu_cap(c, X86_FEATURE_APIC_MSRS_FENCE);
  }
  
  #ifdef CONFIG_X86_32
diff --git a/arch/x86/kernel/cpu/common.c b/arch/x86/kernel/cpu/common.c

index bdcf1e9375ee2a160c70a6d62c44773dfcb7e7c6..6d86585f6d24ef4fe9ecbfa4873ade4131d2aa8f 100644 (file)
--- a/arch/x86/kernel/cpu/common.c
+++ b/arch/x86/kernel/cpu/common.c
@@ -1716,6 +1716,13 @@ static void identify_cpu(struct cpuinfo_x86 *c)
         c->apicid = apic->phys_pkg_id(c->initial_apicid, 0);
  #endif
  
+
+       /*
+        * Set default APIC and TSC_DEADLINE MSR fencing flag. AMD and
+        * Hygon will clear it in ->c_init() below.
+        */
+       set_cpu_cap(c, X86_FEATURE_APIC_MSRS_FENCE);
+
         /*
          * Vendor-specific initialization.  In this section we
          * canonicalize the feature flags, meaning if there are
diff --git a/arch/x86/kernel/cpu/hygon.c b/arch/x86/kernel/cpu/hygon.c

index 3f5c00b15e2c102d5253732b774cfa1aa8f783d5..b49f662f68718ba163e2eca4e7477e69cf435da4 100644 (file)
--- a/arch/x86/kernel/cpu/hygon.c
+++ b/arch/x86/kernel/cpu/hygon.c
@@ -363,6 +363,9 @@ static void init_hygon(struct cpuinfo_x86 *c)
                 set_cpu_bug(c, X86_BUG_SYSRET_SS_ATTRS);
  
         check_null_seg_clears_base(c);
+
+       /* Hygon CPUs don't need fencing before x2APIC/TSC_DEADLINE MSR writes. */
+       clear_cpu_cap(c, X86_FEATURE_APIC_MSRS_FENCE);
  }
  
  static void cpu_detect_tlb_hygon(struct cpuinfo_x86 *c)
author	Borislav Petkov (AMD) <bp@alien8.de>
	Fri, 27 Oct 2023 12:24:16 +0000 (14:24 +0200)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Sat, 14 Dec 2024 18:47:43 +0000 (19:47 +0100)
arch/x86/include/asm/barrier.h		patch \| blob \| blame \| history
arch/x86/include/asm/cpufeatures.h		patch \| blob \| blame \| history
arch/x86/include/asm/processor.h		patch \| blob \| blame \| history
arch/x86/kernel/cpu/amd.c		patch \| blob \| blame \| history
arch/x86/kernel/cpu/common.c		patch \| blob \| blame \| history
arch/x86/kernel/cpu/hygon.c		patch \| blob \| blame \| history