git.ipfire.org Git - thirdparty/kernel/stable-queue.git/commitdiff
4.12-stable patches
author Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Mon, 18 Sep 2017 06:53:22 +0000 (08:53 +0200)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Mon, 18 Sep 2017 06:53:22 +0000 (08:53 +0200)
added patches:
x86-fsgsbase-64-fully-initialize-fs-and-gs-state-in-start_thread_common.patch
x86-fsgsbase-64-report-fsbase-and-gsbase-correctly-in-core-dumps.patch
x86-switch_to-64-rewrite-fs-gs-switching-yet-again-to-fix-amd-cpus.patch

queue-4.12/series
queue-4.12/x86-fsgsbase-64-fully-initialize-fs-and-gs-state-in-start_thread_common.patch [new file with mode: 0644]
queue-4.12/x86-fsgsbase-64-report-fsbase-and-gsbase-correctly-in-core-dumps.patch [new file with mode: 0644]
queue-4.12/x86-switch_to-64-rewrite-fs-gs-switching-yet-again-to-fix-amd-cpus.patch [new file with mode: 0644]

diff --git a/queue-4.12/series b/queue-4.12/series
index 5264d8690e47512784bda1d9b56373e4fea24a15..070a9ed9aab663a960f0e1aa82724841832ca74d 100644
--- a/queue-4.12/series
+++ b/queue-4.12/series
@@ -43,3 +43,6 @@ ipv6-fix-typo-in-fib6_net_exit.patch
 sctp-fix-missing-wake-ups-in-some-situations.patch
 f2fs-let-fill_super-handle-roll-forward-errors.patch
 f2fs-check-hot_data-for-roll-forward-recovery.patch
+x86-fsgsbase-64-fully-initialize-fs-and-gs-state-in-start_thread_common.patch
+x86-fsgsbase-64-report-fsbase-and-gsbase-correctly-in-core-dumps.patch
+x86-switch_to-64-rewrite-fs-gs-switching-yet-again-to-fix-amd-cpus.patch
diff --git a/queue-4.12/x86-fsgsbase-64-fully-initialize-fs-and-gs-state-in-start_thread_common.patch b/queue-4.12/x86-fsgsbase-64-fully-initialize-fs-and-gs-state-in-start_thread_common.patch
new file mode 100644
index 0000000..0493522
--- /dev/null
+++ b/queue-4.12/x86-fsgsbase-64-fully-initialize-fs-and-gs-state-in-start_thread_common.patch
@@ -0,0 +1,58 @@
+From 767d035d838f4fd6b5a5bbd7a3f6d293b7f65a49 Mon Sep 17 00:00:00 2001
+From: Andy Lutomirski <luto@kernel.org>
+Date: Tue, 1 Aug 2017 07:11:34 -0700
+Subject: x86/fsgsbase/64: Fully initialize FS and GS state in start_thread_common
+
+From: Andy Lutomirski <luto@kernel.org>
+
+commit 767d035d838f4fd6b5a5bbd7a3f6d293b7f65a49 upstream.
+
+execve used to leak FSBASE and GSBASE on AMD CPUs.  Fix it.
+
+The security impact of this bug is small but not quite zero -- it
+could weaken ASLR when a privileged task execs a less privileged
+program, but only if the program changed bitness across the exec, or the
+child binary was highly unusual or actively malicious.  A child
+program that was compromised after the exec would not have access to
+the leaked base.
+
+Signed-off-by: Andy Lutomirski <luto@kernel.org>
+Cc: Borislav Petkov <bp@alien8.de>
+Cc: Borislav Petkov <bpetkov@suse.de>
+Cc: Brian Gerst <brgerst@gmail.com>
+Cc: Chang Seok <chang.seok.bae@intel.com>
+Cc: Denys Vlasenko <dvlasenk@redhat.com>
+Cc: H. Peter Anvin <hpa@zytor.com>
+Cc: Josh Poimboeuf <jpoimboe@redhat.com>
+Cc: Linus Torvalds <torvalds@linux-foundation.org>
+Cc: Peter Zijlstra <peterz@infradead.org>
+Cc: Thomas Gleixner <tglx@linutronix.de>
+Signed-off-by: Ingo Molnar <mingo@kernel.org>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ arch/x86/kernel/process_64.c |    9 +++++++++
+ 1 file changed, 9 insertions(+)
+
+--- a/arch/x86/kernel/process_64.c
++++ b/arch/x86/kernel/process_64.c
+@@ -229,10 +229,19 @@ start_thread_common(struct pt_regs *regs
+                   unsigned long new_sp,
+                   unsigned int _cs, unsigned int _ss, unsigned int _ds)
+ {
++      WARN_ON_ONCE(regs != current_pt_regs());
++
++      if (static_cpu_has(X86_BUG_NULL_SEG)) {
++              /* Loading zero below won't clear the base. */
++              loadsegment(fs, __USER_DS);
++              load_gs_index(__USER_DS);
++      }
++
+       loadsegment(fs, 0);
+       loadsegment(es, _ds);
+       loadsegment(ds, _ds);
+       load_gs_index(0);
++
+       regs->ip                = new_ip;
+       regs->sp                = new_sp;
+       regs->cs                = _cs;
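
The hunk above resets exactly the state that user programs manage through arch_prctl(2). For orientation only (not part of the queued patch), the sketch below exercises that interface from user space: it plants a GS base and reads it back through the kernel's bookkeeping. The probe value is arbitrary, the error handling is deliberately minimal, and GS is used rather than FS so the program's own TLS is left alone.

/*
 * Illustrative sketch: set and query the user GS base via arch_prctl(2).
 * The raw syscall is used rather than relying on a libc wrapper; the
 * constants come from <asm/prctl.h>.
 */
#include <stdio.h>
#include <unistd.h>
#include <sys/syscall.h>
#include <asm/prctl.h>		/* ARCH_SET_GS, ARCH_GET_GS */

int main(void)
{
	unsigned long probe = 0xdeadbeef000UL;	/* arbitrary user-space address-sized value */
	unsigned long got = 0;

	if (syscall(SYS_arch_prctl, ARCH_SET_GS, probe) != 0) {
		perror("arch_prctl(ARCH_SET_GS)");
		return 1;
	}
	if (syscall(SYS_arch_prctl, ARCH_GET_GS, &got) != 0) {
		perror("arch_prctl(ARCH_GET_GS)");
		return 1;
	}
	printf("GSBASE set to %#lx, kernel reports %#lx\n", probe, got);

	/*
	 * Before this fix, on an X86_BUG_NULL_SEG (AMD) CPU, the hardware GS
	 * base planted here could survive an execve() into a child program,
	 * which is the leak start_thread_common() now closes.
	 */
	return 0;
}
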
diff --git a/queue-4.12/x86-fsgsbase-64-report-fsbase-and-gsbase-correctly-in-core-dumps.patch b/queue-4.12/x86-fsgsbase-64-report-fsbase-and-gsbase-correctly-in-core-dumps.patch
new file mode 100644
index 0000000..95e32d8
--- /dev/null
+++ b/queue-4.12/x86-fsgsbase-64-report-fsbase-and-gsbase-correctly-in-core-dumps.patch
@@ -0,0 +1,56 @@
+From 9584d98bed7a7a904d0702ad06bbcc94703cb5b4 Mon Sep 17 00:00:00 2001
+From: Andy Lutomirski <luto@kernel.org>
+Date: Tue, 1 Aug 2017 07:11:35 -0700
+Subject: x86/fsgsbase/64: Report FSBASE and GSBASE correctly in core dumps
+
+From: Andy Lutomirski <luto@kernel.org>
+
+commit 9584d98bed7a7a904d0702ad06bbcc94703cb5b4 upstream.
+
+In ELF_COPY_CORE_REGS, we're copying from the current task, so
+accessing thread.fsbase and thread.gsbase makes no sense.  Just read
+the values from the CPU registers.
+
+In practice, the old code would have been correct most of the time
+simply because thread.fsbase and thread.gsbase usually matched the
+CPU registers.
+
+Signed-off-by: Andy Lutomirski <luto@kernel.org>
+Cc: Borislav Petkov <bp@alien8.de>
+Cc: Borislav Petkov <bpetkov@suse.de>
+Cc: Brian Gerst <brgerst@gmail.com>
+Cc: Chang Seok <chang.seok.bae@intel.com>
+Cc: Denys Vlasenko <dvlasenk@redhat.com>
+Cc: H. Peter Anvin <hpa@zytor.com>
+Cc: Josh Poimboeuf <jpoimboe@redhat.com>
+Cc: Linus Torvalds <torvalds@linux-foundation.org>
+Cc: Peter Zijlstra <peterz@infradead.org>
+Cc: Thomas Gleixner <tglx@linutronix.de>
+Signed-off-by: Ingo Molnar <mingo@kernel.org>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ arch/x86/include/asm/elf.h |    5 +++--
+ 1 file changed, 3 insertions(+), 2 deletions(-)
+
+--- a/arch/x86/include/asm/elf.h
++++ b/arch/x86/include/asm/elf.h
+@@ -204,6 +204,7 @@ void set_personality_ia32(bool);
+ #define ELF_CORE_COPY_REGS(pr_reg, regs)                      \
+ do {                                                          \
++      unsigned long base;                                     \
+       unsigned v;                                             \
+       (pr_reg)[0] = (regs)->r15;                              \
+       (pr_reg)[1] = (regs)->r14;                              \
+@@ -226,8 +227,8 @@ do {                                                               \
+       (pr_reg)[18] = (regs)->flags;                           \
+       (pr_reg)[19] = (regs)->sp;                              \
+       (pr_reg)[20] = (regs)->ss;                              \
+-      (pr_reg)[21] = current->thread.fsbase;                  \
+-      (pr_reg)[22] = current->thread.gsbase;                  \
++      rdmsrl(MSR_FS_BASE, base); (pr_reg)[21] = base;         \
++      rdmsrl(MSR_KERNEL_GS_BASE, base); (pr_reg)[22] = base;  \
+       asm("movl %%ds,%0" : "=r" (v)); (pr_reg)[23] = v;       \
+       asm("movl %%es,%0" : "=r" (v)); (pr_reg)[24] = v;       \
+       asm("movl %%fs,%0" : "=r" (v)); (pr_reg)[25] = v;       \
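
The two rdmsrl() lines above fill pr_reg[21] and pr_reg[22], which surface in a core dump's NT_PRSTATUS note as the fs_base and gs_base fields of struct user_regs_struct. For orientation only (not part of the queued patch), the sketch below reads the same two fields from a live tracee with ptrace(); /bin/true is a placeholder target and error handling is deliberately thin.

/*
 * Illustrative sketch: dump fs_base/gs_base of a freshly exec'd child.
 * These are the same slots ELF_CORE_COPY_REGS fills for a core dump.
 */
#include <stdio.h>
#include <unistd.h>
#include <sys/ptrace.h>
#include <sys/types.h>
#include <sys/user.h>
#include <sys/wait.h>

int main(void)
{
	pid_t pid = fork();

	if (pid == 0) {
		ptrace(PTRACE_TRACEME, 0, NULL, NULL);
		execl("/bin/true", "true", (char *)NULL);	/* placeholder target */
		_exit(127);
	}

	waitpid(pid, NULL, 0);			/* child stops at the execve trap */

	struct user_regs_struct regs;
	if (ptrace(PTRACE_GETREGS, pid, NULL, &regs) == 0)
		printf("fs_base=%#llx gs_base=%#llx\n",
		       (unsigned long long)regs.fs_base,
		       (unsigned long long)regs.gs_base);

	ptrace(PTRACE_DETACH, pid, NULL, NULL);
	waitpid(pid, NULL, 0);			/* reap the child */
	return 0;
}
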
diff --git a/queue-4.12/x86-switch_to-64-rewrite-fs-gs-switching-yet-again-to-fix-amd-cpus.patch b/queue-4.12/x86-switch_to-64-rewrite-fs-gs-switching-yet-again-to-fix-amd-cpus.patch
new file mode 100644
index 0000000..1d9bb93
--- /dev/null
+++ b/queue-4.12/x86-switch_to-64-rewrite-fs-gs-switching-yet-again-to-fix-amd-cpus.patch
@@ -0,0 +1,297 @@
+From e137a4d8f4dd2e277e355495b6b2cb241a8693c3 Mon Sep 17 00:00:00 2001
+From: Andy Lutomirski <luto@kernel.org>
+Date: Tue, 1 Aug 2017 07:11:37 -0700
+Subject: x86/switch_to/64: Rewrite FS/GS switching yet again to fix AMD CPUs
+
+From: Andy Lutomirski <luto@kernel.org>
+
+commit e137a4d8f4dd2e277e355495b6b2cb241a8693c3 upstream.
+
+Switching FS and GS is a mess, and the current code is still subtly
+wrong: it assumes that "Loading a nonzero value into FS sets the
+index and base", which is false on AMD CPUs if the value being
+loaded is 1, 2, or 3.
+
+(The current code came from commit 3e2b68d752c9 ("x86/asm,
+sched/x86: Rewrite the FS and GS context switch code"), which made
+it better but didn't fully fix it.)
+
+Rewrite it to be much simpler and more obviously correct.  This
+should fix it fully on AMD CPUs and shouldn't adversely affect
+performance.
+
+Signed-off-by: Andy Lutomirski <luto@kernel.org>
+Cc: Borislav Petkov <bp@alien8.de>
+Cc: Borislav Petkov <bpetkov@suse.de>
+Cc: Brian Gerst <brgerst@gmail.com>
+Cc: Chang Seok <chang.seok.bae@intel.com>
+Cc: Denys Vlasenko <dvlasenk@redhat.com>
+Cc: H. Peter Anvin <hpa@zytor.com>
+Cc: Josh Poimboeuf <jpoimboe@redhat.com>
+Cc: Linus Torvalds <torvalds@linux-foundation.org>
+Cc: Peter Zijlstra <peterz@infradead.org>
+Cc: Thomas Gleixner <tglx@linutronix.de>
+Signed-off-by: Ingo Molnar <mingo@kernel.org>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ arch/x86/kernel/process_64.c |  227 +++++++++++++++++++++++--------------------
+ 1 file changed, 122 insertions(+), 105 deletions(-)
+
+--- a/arch/x86/kernel/process_64.c
++++ b/arch/x86/kernel/process_64.c
+@@ -149,6 +149,123 @@ void release_thread(struct task_struct *
+       }
+ }
++enum which_selector {
++      FS,
++      GS
++};
++
++/*
++ * Saves the FS or GS base for an outgoing thread if FSGSBASE extensions are
++ * not available.  The goal is to be reasonably fast on non-FSGSBASE systems.
++ * It's forcibly inlined because it'll generate better code and this function
++ * is hot.
++ */
++static __always_inline void save_base_legacy(struct task_struct *prev_p,
++                                           unsigned short selector,
++                                           enum which_selector which)
++{
++      if (likely(selector == 0)) {
++              /*
++               * On Intel (without X86_BUG_NULL_SEG), the segment base could
++               * be the pre-existing saved base or it could be zero.  On AMD
++               * (with X86_BUG_NULL_SEG), the segment base could be almost
++               * anything.
++               *
++               * This branch is very hot (it's hit twice on almost every
++               * context switch between 64-bit programs), and avoiding
++               * the RDMSR helps a lot, so we just assume that whatever
++               * value is already saved is correct.  This matches historical
++               * Linux behavior, so it won't break existing applications.
++               *
++               * To avoid leaking state, on non-X86_BUG_NULL_SEG CPUs, if we
++               * report that the base is zero, it needs to actually be zero:
++               * see the corresponding logic in load_seg_legacy.
++               */
++      } else {
++              /*
++               * If the selector is 1, 2, or 3, then the base is zero on
++               * !X86_BUG_NULL_SEG CPUs and could be anything on
++               * X86_BUG_NULL_SEG CPUs.  In the latter case, Linux
++               * has never attempted to preserve the base across context
++               * switches.
++               *
++               * If selector > 3, then it refers to a real segment, and
++               * saving the base isn't necessary.
++               */
++              if (which == FS)
++                      prev_p->thread.fsbase = 0;
++              else
++                      prev_p->thread.gsbase = 0;
++      }
++}
++
++static __always_inline void save_fsgs(struct task_struct *task)
++{
++      savesegment(fs, task->thread.fsindex);
++      savesegment(gs, task->thread.gsindex);
++      save_base_legacy(task, task->thread.fsindex, FS);
++      save_base_legacy(task, task->thread.gsindex, GS);
++}
++
++static __always_inline void loadseg(enum which_selector which,
++                                  unsigned short sel)
++{
++      if (which == FS)
++              loadsegment(fs, sel);
++      else
++              load_gs_index(sel);
++}
++
++static __always_inline void load_seg_legacy(unsigned short prev_index,
++                                          unsigned long prev_base,
++                                          unsigned short next_index,
++                                          unsigned long next_base,
++                                          enum which_selector which)
++{
++      if (likely(next_index <= 3)) {
++              /*
++               * The next task is using 64-bit TLS, is not using this
++               * segment at all, or is having fun with arcane CPU features.
++               */
++              if (next_base == 0) {
++                      /*
++                       * Nasty case: on AMD CPUs, we need to forcibly zero
++                       * the base.
++                       */
++                      if (static_cpu_has_bug(X86_BUG_NULL_SEG)) {
++                              loadseg(which, __USER_DS);
++                              loadseg(which, next_index);
++                      } else {
++                              /*
++                               * We could try to exhaustively detect cases
++                               * under which we can skip the segment load,
++                               * but there's really only one case that matters
++                               * for performance: if both the previous and
++                               * next states are fully zeroed, we can skip
++                               * the load.
++                               *
++                               * (This assumes that prev_base == 0 has no
++                               * false positives.  This is the case on
++                               * Intel-style CPUs.)
++                               */
++                              if (likely(prev_index | next_index | prev_base))
++                                      loadseg(which, next_index);
++                      }
++              } else {
++                      if (prev_index != next_index)
++                              loadseg(which, next_index);
++                      wrmsrl(which == FS ? MSR_FS_BASE : MSR_KERNEL_GS_BASE,
++                             next_base);
++              }
++      } else {
++              /*
++               * The next task is using a real segment.  Loading the selector
++               * is sufficient.
++               */
++              loadseg(which, next_index);
++      }
++}
++
+ int copy_thread_tls(unsigned long clone_flags, unsigned long sp,
+               unsigned long arg, struct task_struct *p, unsigned long tls)
+ {
+@@ -286,7 +403,6 @@ __switch_to(struct task_struct *prev_p,
+       struct fpu *next_fpu = &next->fpu;
+       int cpu = smp_processor_id();
+       struct tss_struct *tss = &per_cpu(cpu_tss, cpu);
+-      unsigned prev_fsindex, prev_gsindex;
+       switch_fpu_prepare(prev_fpu, cpu);
+@@ -295,8 +411,7 @@ __switch_to(struct task_struct *prev_p,
+        *
+        * (e.g. xen_load_tls())
+        */
+-      savesegment(fs, prev_fsindex);
+-      savesegment(gs, prev_gsindex);
++      save_fsgs(prev_p);
+       /*
+        * Load TLS before restoring any segments so that segment loads
+@@ -335,108 +450,10 @@ __switch_to(struct task_struct *prev_p,
+       if (unlikely(next->ds | prev->ds))
+               loadsegment(ds, next->ds);
+-      /*
+-       * Switch FS and GS.
+-       *
+-       * These are even more complicated than DS and ES: they have
+-       * 64-bit bases are that controlled by arch_prctl.  The bases
+-       * don't necessarily match the selectors, as user code can do
+-       * any number of things to cause them to be inconsistent.
+-       *
+-       * We don't promise to preserve the bases if the selectors are
+-       * nonzero.  We also don't promise to preserve the base if the
+-       * selector is zero and the base doesn't match whatever was
+-       * most recently passed to ARCH_SET_FS/GS.  (If/when the
+-       * FSGSBASE instructions are enabled, we'll need to offer
+-       * stronger guarantees.)
+-       *
+-       * As an invariant,
+-       * (fsbase != 0 && fsindex != 0) || (gsbase != 0 && gsindex != 0) is
+-       * impossible.
+-       */
+-      if (next->fsindex) {
+-              /* Loading a nonzero value into FS sets the index and base. */
+-              loadsegment(fs, next->fsindex);
+-      } else {
+-              if (next->fsbase) {
+-                      /* Next index is zero but next base is nonzero. */
+-                      if (prev_fsindex)
+-                              loadsegment(fs, 0);
+-                      wrmsrl(MSR_FS_BASE, next->fsbase);
+-              } else {
+-                      /* Next base and index are both zero. */
+-                      if (static_cpu_has_bug(X86_BUG_NULL_SEG)) {
+-                              /*
+-                               * We don't know the previous base and can't
+-                               * find out without RDMSR.  Forcibly clear it.
+-                               */
+-                              loadsegment(fs, __USER_DS);
+-                              loadsegment(fs, 0);
+-                      } else {
+-                              /*
+-                               * If the previous index is zero and ARCH_SET_FS
+-                               * didn't change the base, then the base is
+-                               * also zero and we don't need to do anything.
+-                               */
+-                              if (prev->fsbase || prev_fsindex)
+-                                      loadsegment(fs, 0);
+-                      }
+-              }
+-      }
+-      /*
+-       * Save the old state and preserve the invariant.
+-       * NB: if prev_fsindex == 0, then we can't reliably learn the base
+-       * without RDMSR because Intel user code can zero it without telling
+-       * us and AMD user code can program any 32-bit value without telling
+-       * us.
+-       */
+-      if (prev_fsindex)
+-              prev->fsbase = 0;
+-      prev->fsindex = prev_fsindex;
+-
+-      if (next->gsindex) {
+-              /* Loading a nonzero value into GS sets the index and base. */
+-              load_gs_index(next->gsindex);
+-      } else {
+-              if (next->gsbase) {
+-                      /* Next index is zero but next base is nonzero. */
+-                      if (prev_gsindex)
+-                              load_gs_index(0);
+-                      wrmsrl(MSR_KERNEL_GS_BASE, next->gsbase);
+-              } else {
+-                      /* Next base and index are both zero. */
+-                      if (static_cpu_has_bug(X86_BUG_NULL_SEG)) {
+-                              /*
+-                               * We don't know the previous base and can't
+-                               * find out without RDMSR.  Forcibly clear it.
+-                               *
+-                               * This contains a pointless SWAPGS pair.
+-                               * Fixing it would involve an explicit check
+-                               * for Xen or a new pvop.
+-                               */
+-                              load_gs_index(__USER_DS);
+-                              load_gs_index(0);
+-                      } else {
+-                              /*
+-                               * If the previous index is zero and ARCH_SET_GS
+-                               * didn't change the base, then the base is
+-                               * also zero and we don't need to do anything.
+-                               */
+-                              if (prev->gsbase || prev_gsindex)
+-                                      load_gs_index(0);
+-                      }
+-              }
+-      }
+-      /*
+-       * Save the old state and preserve the invariant.
+-       * NB: if prev_gsindex == 0, then we can't reliably learn the base
+-       * without RDMSR because Intel user code can zero it without telling
+-       * us and AMD user code can program any 32-bit value without telling
+-       * us.
+-       */
+-      if (prev_gsindex)
+-              prev->gsbase = 0;
+-      prev->gsindex = prev_gsindex;
++      load_seg_legacy(prev->fsindex, prev->fsbase,
++                      next->fsindex, next->fsbase, FS);
++      load_seg_legacy(prev->gsindex, prev->gsbase,
++                      next->gsindex, next->gsbase, GS);
+       switch_fpu_finish(next_fpu, cpu);
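
The comment block removed above documented the very assumption the commit message calls out: that loading a nonzero selector always sets the base. For background only (not part of the queued patch), the difference between Intel-style CPUs and X86_BUG_NULL_SEG CPUs is observable from user space on hardware and kernels that expose the FSGSBASE instructions (which the 4.12 kernels patched here do not enable). The sketch below is illustrative, uses GS rather than FS so TLS is untouched, and assumes a toolchain that accepts -mfsgsbase.

/*
 * Illustrative sketch: plant a GS base, load a null selector (value 3 =
 * index 0, RPL 3), and see whether the base survives.  Requires a CPU with
 * FSGSBASE and a kernel that sets CR4.FSGSBASE (v5.9+); otherwise the
 * rdgsbase/wrgsbase intrinsics raise SIGILL.  Build with: gcc -mfsgsbase
 */
#include <stdio.h>
#include <immintrin.h>

int main(void)
{
	unsigned int null_sel = 3;		/* a null selector with RPL 3 */

	_writegsbase_u64(0x123456000ULL);	/* recognizable, arbitrary base */
	asm volatile("movl %0, %%gs" : : "r" (null_sel));

	/*
	 * On CPUs without X86_BUG_NULL_SEG (Intel-style), the null-selector
	 * load zeroes the GS base and this prints 0.  On CPUs with the bug
	 * (AMD-style), the planted base survives -- the case the new
	 * save_base_legacy()/load_seg_legacy() helpers have to handle.
	 */
	printf("GS base after loading selector 3: %#llx\n",
	       (unsigned long long)_readgsbase_u64());
	return 0;
}
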