]> git.ipfire.org Git - thirdparty/kernel/stable-queue.git/commitdiff
4.9-stable patches
authorGreg Kroah-Hartman <gregkh@linuxfoundation.org>
Thu, 4 Mar 2021 13:50:51 +0000 (14:50 +0100)
committerGreg Kroah-Hartman <gregkh@linuxfoundation.org>
Thu, 4 Mar 2021 13:50:51 +0000 (14:50 +0100)
added patches:
arm-kprobes-allow-to-handle-reentered-kprobe-on-single-stepping.patch
arm64-avoid-redundant-type-conversions-in-xchg-and-cmpxchg.patch
arm64-cmpxchg-use-k-instead-of-l-for-ll-sc-immediate-constraint.patch
arm64-remove-redundant-mov-from-ll-sc-cmpxchg.patch
arm64-use-correct-ll-sc-atomic-constraints.patch
hugetlb-fix-update_and_free_page-contig-page-struct-assumption.patch
net-usb-qmi_wwan-support-zte-p685m-modem.patch
printk-fix-deadlock-when-kernel-panic.patch
scripts-set-proper-openssl-include-dir-also-for-sign-file.patch
scripts-use-pkg-config-to-locate-libcrypto.patch

queue-4.9/arm-kprobes-allow-to-handle-reentered-kprobe-on-single-stepping.patch [new file with mode: 0644]
queue-4.9/arm64-avoid-redundant-type-conversions-in-xchg-and-cmpxchg.patch [new file with mode: 0644]
queue-4.9/arm64-cmpxchg-use-k-instead-of-l-for-ll-sc-immediate-constraint.patch [new file with mode: 0644]
queue-4.9/arm64-remove-redundant-mov-from-ll-sc-cmpxchg.patch [new file with mode: 0644]
queue-4.9/arm64-use-correct-ll-sc-atomic-constraints.patch [new file with mode: 0644]
queue-4.9/hugetlb-fix-update_and_free_page-contig-page-struct-assumption.patch [new file with mode: 0644]
queue-4.9/net-usb-qmi_wwan-support-zte-p685m-modem.patch [new file with mode: 0644]
queue-4.9/printk-fix-deadlock-when-kernel-panic.patch [new file with mode: 0644]
queue-4.9/scripts-set-proper-openssl-include-dir-also-for-sign-file.patch [new file with mode: 0644]
queue-4.9/scripts-use-pkg-config-to-locate-libcrypto.patch [new file with mode: 0644]
queue-4.9/series

diff --git a/queue-4.9/arm-kprobes-allow-to-handle-reentered-kprobe-on-single-stepping.patch b/queue-4.9/arm-kprobes-allow-to-handle-reentered-kprobe-on-single-stepping.patch
new file mode 100644 (file)
index 0000000..8469941
--- /dev/null
@@ -0,0 +1,55 @@
+From f3fbd7ec62dec1528fb8044034e2885f2b257941 Mon Sep 17 00:00:00 2001
+From: Masami Hiramatsu <mhiramat@kernel.org>
+Date: Tue, 14 Feb 2017 00:03:38 +0900
+Subject: arm: kprobes: Allow to handle reentered kprobe on single-stepping
+
+From: Masami Hiramatsu <mhiramat@kernel.org>
+
+commit f3fbd7ec62dec1528fb8044034e2885f2b257941 upstream.
+
+This is arm port of commit 6a5022a56ac3 ("kprobes/x86: Allow to
+handle reentered kprobe on single-stepping")
+
+Since the FIQ handlers can interrupt in the single stepping
+(or preparing the single stepping, do_debug etc.), we should
+consider a kprobe is hit in the NMI handler. Even in that
+case, the kprobe is allowed to be reentered as same as the
+kprobes hit in kprobe handlers
+(KPROBE_HIT_ACTIVE or KPROBE_HIT_SSDONE).
+
+The real issue will happen when a kprobe hit while another
+reentered kprobe is processing (KPROBE_REENTER), because
+we already consumed a saved-area for the previous kprobe.
+
+Signed-off-by: Masami Hiramatsu <mhiramat@kernel.org>
+Signed-off-by: Jon Medhurst <tixy@linaro.org>
+Fixes: 24ba613c9d6c ("ARM kprobes: core code")
+Cc: stable@vger.kernel.org #v2.6.25~v4.11
+Signed-off-by: huangshaobo <huangshaobo6@huawei.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ arch/arm/probes/kprobes/core.c |    6 ++++++
+ 1 file changed, 6 insertions(+)
+
+--- a/arch/arm/probes/kprobes/core.c
++++ b/arch/arm/probes/kprobes/core.c
+@@ -270,6 +270,7 @@ void __kprobes kprobe_handler(struct pt_
+                       switch (kcb->kprobe_status) {
+                       case KPROBE_HIT_ACTIVE:
+                       case KPROBE_HIT_SSDONE:
++                      case KPROBE_HIT_SS:
+                               /* A pre- or post-handler probe got us here. */
+                               kprobes_inc_nmissed_count(p);
+                               save_previous_kprobe(kcb);
+@@ -278,6 +279,11 @@ void __kprobes kprobe_handler(struct pt_
+                               singlestep(p, regs, kcb);
+                               restore_previous_kprobe(kcb);
+                               break;
++                      case KPROBE_REENTER:
++                              /* A nested probe was hit in FIQ, it is a BUG */
++                              pr_warn("Unrecoverable kprobe detected at %p.\n",
++                                      p->addr);
++                              /* fall through */
+                       default:
+                               /* impossible cases */
+                               BUG();
diff --git a/queue-4.9/arm64-avoid-redundant-type-conversions-in-xchg-and-cmpxchg.patch b/queue-4.9/arm64-avoid-redundant-type-conversions-in-xchg-and-cmpxchg.patch
new file mode 100644 (file)
index 0000000..fa4333f
--- /dev/null
@@ -0,0 +1,348 @@
+From foo@baz Thu Mar  4 02:49:26 PM CET 2021
+From: Will Deacon <will.deacon@arm.com>
+Date: Thu, 13 Sep 2018 13:30:45 +0100
+Subject: arm64: Avoid redundant type conversions in xchg() and cmpxchg()
+
+From: Will Deacon <will.deacon@arm.com>
+
+commit 5ef3fe4cecdf82fdd71ce78988403963d01444d4 upstream.
+
+Our atomic instructions (either LSE atomics of LDXR/STXR sequences)
+natively support byte, half-word, word and double-word memory accesses
+so there is no need to mask the data register prior to being stored.
+
+Signed-off-by: Will Deacon <will.deacon@arm.com>
+Signed-off-by: Ben Hutchings <ben@decadent.org.uk>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ arch/arm64/include/asm/atomic_ll_sc.h |   53 +++++++--------
+ arch/arm64/include/asm/atomic_lse.h   |   46 ++++++-------
+ arch/arm64/include/asm/cmpxchg.h      |  116 +++++++++++++++++-----------------
+ 3 files changed, 108 insertions(+), 107 deletions(-)
+
+--- a/arch/arm64/include/asm/atomic_ll_sc.h
++++ b/arch/arm64/include/asm/atomic_ll_sc.h
+@@ -248,48 +248,49 @@ __LL_SC_PREFIX(atomic64_dec_if_positive(
+ }
+ __LL_SC_EXPORT(atomic64_dec_if_positive);
+-#define __CMPXCHG_CASE(w, sz, name, mb, acq, rel, cl)                 \
+-__LL_SC_INLINE unsigned long                                          \
+-__LL_SC_PREFIX(__cmpxchg_case_##name(volatile void *ptr,              \
+-                                   unsigned long old,                 \
+-                                   unsigned long new))                \
++#define __CMPXCHG_CASE(w, sfx, name, sz, mb, acq, rel, cl)            \
++__LL_SC_INLINE u##sz                                                  \
++__LL_SC_PREFIX(__cmpxchg_case_##name##sz(volatile void *ptr,          \
++                                       unsigned long old,             \
++                                       u##sz new))                    \
+ {                                                                     \
+-      unsigned long tmp, oldval;                                      \
++      unsigned long tmp;                                              \
++      u##sz oldval;                                                   \
+                                                                       \
+       asm volatile(                                                   \
+       "       prfm    pstl1strm, %[v]\n"                              \
+-      "1:     ld" #acq "xr" #sz "\t%" #w "[oldval], %[v]\n"           \
++      "1:     ld" #acq "xr" #sfx "\t%" #w "[oldval], %[v]\n"          \
+       "       eor     %" #w "[tmp], %" #w "[oldval], %" #w "[old]\n"  \
+       "       cbnz    %" #w "[tmp], 2f\n"                             \
+-      "       st" #rel "xr" #sz "\t%w[tmp], %" #w "[new], %[v]\n"     \
++      "       st" #rel "xr" #sfx "\t%w[tmp], %" #w "[new], %[v]\n"    \
+       "       cbnz    %w[tmp], 1b\n"                                  \
+       "       " #mb "\n"                                              \
+       "2:"                                                            \
+       : [tmp] "=&r" (tmp), [oldval] "=&r" (oldval),                   \
+-        [v] "+Q" (*(unsigned long *)ptr)                              \
++        [v] "+Q" (*(u##sz *)ptr)                                      \
+       : [old] "Lr" (old), [new] "r" (new)                             \
+       : cl);                                                          \
+                                                                       \
+       return oldval;                                                  \
+ }                                                                     \
+-__LL_SC_EXPORT(__cmpxchg_case_##name);
++__LL_SC_EXPORT(__cmpxchg_case_##name##sz);
+-__CMPXCHG_CASE(w, b,     1,        ,  ,  ,         )
+-__CMPXCHG_CASE(w, h,     2,        ,  ,  ,         )
+-__CMPXCHG_CASE(w,  ,     4,        ,  ,  ,         )
+-__CMPXCHG_CASE( ,  ,     8,        ,  ,  ,         )
+-__CMPXCHG_CASE(w, b, acq_1,        , a,  , "memory")
+-__CMPXCHG_CASE(w, h, acq_2,        , a,  , "memory")
+-__CMPXCHG_CASE(w,  , acq_4,        , a,  , "memory")
+-__CMPXCHG_CASE( ,  , acq_8,        , a,  , "memory")
+-__CMPXCHG_CASE(w, b, rel_1,        ,  , l, "memory")
+-__CMPXCHG_CASE(w, h, rel_2,        ,  , l, "memory")
+-__CMPXCHG_CASE(w,  , rel_4,        ,  , l, "memory")
+-__CMPXCHG_CASE( ,  , rel_8,        ,  , l, "memory")
+-__CMPXCHG_CASE(w, b,  mb_1, dmb ish,  , l, "memory")
+-__CMPXCHG_CASE(w, h,  mb_2, dmb ish,  , l, "memory")
+-__CMPXCHG_CASE(w,  ,  mb_4, dmb ish,  , l, "memory")
+-__CMPXCHG_CASE( ,  ,  mb_8, dmb ish,  , l, "memory")
++__CMPXCHG_CASE(w, b,     ,  8,        ,  ,  ,         )
++__CMPXCHG_CASE(w, h,     , 16,        ,  ,  ,         )
++__CMPXCHG_CASE(w,  ,     , 32,        ,  ,  ,         )
++__CMPXCHG_CASE( ,  ,     , 64,        ,  ,  ,         )
++__CMPXCHG_CASE(w, b, acq_,  8,        , a,  , "memory")
++__CMPXCHG_CASE(w, h, acq_, 16,        , a,  , "memory")
++__CMPXCHG_CASE(w,  , acq_, 32,        , a,  , "memory")
++__CMPXCHG_CASE( ,  , acq_, 64,        , a,  , "memory")
++__CMPXCHG_CASE(w, b, rel_,  8,        ,  , l, "memory")
++__CMPXCHG_CASE(w, h, rel_, 16,        ,  , l, "memory")
++__CMPXCHG_CASE(w,  , rel_, 32,        ,  , l, "memory")
++__CMPXCHG_CASE( ,  , rel_, 64,        ,  , l, "memory")
++__CMPXCHG_CASE(w, b,  mb_,  8, dmb ish,  , l, "memory")
++__CMPXCHG_CASE(w, h,  mb_, 16, dmb ish,  , l, "memory")
++__CMPXCHG_CASE(w,  ,  mb_, 32, dmb ish,  , l, "memory")
++__CMPXCHG_CASE( ,  ,  mb_, 64, dmb ish,  , l, "memory")
+ #undef __CMPXCHG_CASE
+--- a/arch/arm64/include/asm/atomic_lse.h
++++ b/arch/arm64/include/asm/atomic_lse.h
+@@ -446,22 +446,22 @@ static inline long atomic64_dec_if_posit
+ #define __LL_SC_CMPXCHG(op)   __LL_SC_CALL(__cmpxchg_case_##op)
+-#define __CMPXCHG_CASE(w, sz, name, mb, cl...)                                \
+-static inline unsigned long __cmpxchg_case_##name(volatile void *ptr, \
+-                                                unsigned long old,    \
+-                                                unsigned long new)    \
++#define __CMPXCHG_CASE(w, sfx, name, sz, mb, cl...)                   \
++static inline u##sz __cmpxchg_case_##name##sz(volatile void *ptr,     \
++                                            unsigned long old,        \
++                                            u##sz new)                \
+ {                                                                     \
+       register unsigned long x0 asm ("x0") = (unsigned long)ptr;      \
+       register unsigned long x1 asm ("x1") = old;                     \
+-      register unsigned long x2 asm ("x2") = new;                     \
++      register u##sz x2 asm ("x2") = new;                             \
+                                                                       \
+       asm volatile(ARM64_LSE_ATOMIC_INSN(                             \
+       /* LL/SC */                                                     \
+-      __LL_SC_CMPXCHG(name)                                           \
++      __LL_SC_CMPXCHG(name##sz)                                       \
+       __nops(2),                                                      \
+       /* LSE atomics */                                               \
+       "       mov     " #w "30, %" #w "[old]\n"                       \
+-      "       cas" #mb #sz "\t" #w "30, %" #w "[new], %[v]\n"         \
++      "       cas" #mb #sfx "\t" #w "30, %" #w "[new], %[v]\n"        \
+       "       mov     %" #w "[ret], " #w "30")                        \
+       : [ret] "+r" (x0), [v] "+Q" (*(unsigned long *)ptr)             \
+       : [old] "r" (x1), [new] "r" (x2)                                \
+@@ -470,22 +470,22 @@ static inline unsigned long __cmpxchg_ca
+       return x0;                                                      \
+ }
+-__CMPXCHG_CASE(w, b,     1,   )
+-__CMPXCHG_CASE(w, h,     2,   )
+-__CMPXCHG_CASE(w,  ,     4,   )
+-__CMPXCHG_CASE(x,  ,     8,   )
+-__CMPXCHG_CASE(w, b, acq_1,  a, "memory")
+-__CMPXCHG_CASE(w, h, acq_2,  a, "memory")
+-__CMPXCHG_CASE(w,  , acq_4,  a, "memory")
+-__CMPXCHG_CASE(x,  , acq_8,  a, "memory")
+-__CMPXCHG_CASE(w, b, rel_1,  l, "memory")
+-__CMPXCHG_CASE(w, h, rel_2,  l, "memory")
+-__CMPXCHG_CASE(w,  , rel_4,  l, "memory")
+-__CMPXCHG_CASE(x,  , rel_8,  l, "memory")
+-__CMPXCHG_CASE(w, b,  mb_1, al, "memory")
+-__CMPXCHG_CASE(w, h,  mb_2, al, "memory")
+-__CMPXCHG_CASE(w,  ,  mb_4, al, "memory")
+-__CMPXCHG_CASE(x,  ,  mb_8, al, "memory")
++__CMPXCHG_CASE(w, b,     ,  8,   )
++__CMPXCHG_CASE(w, h,     , 16,   )
++__CMPXCHG_CASE(w,  ,     , 32,   )
++__CMPXCHG_CASE(x,  ,     , 64,   )
++__CMPXCHG_CASE(w, b, acq_,  8,  a, "memory")
++__CMPXCHG_CASE(w, h, acq_, 16,  a, "memory")
++__CMPXCHG_CASE(w,  , acq_, 32,  a, "memory")
++__CMPXCHG_CASE(x,  , acq_, 64,  a, "memory")
++__CMPXCHG_CASE(w, b, rel_,  8,  l, "memory")
++__CMPXCHG_CASE(w, h, rel_, 16,  l, "memory")
++__CMPXCHG_CASE(w,  , rel_, 32,  l, "memory")
++__CMPXCHG_CASE(x,  , rel_, 64,  l, "memory")
++__CMPXCHG_CASE(w, b,  mb_,  8, al, "memory")
++__CMPXCHG_CASE(w, h,  mb_, 16, al, "memory")
++__CMPXCHG_CASE(w,  ,  mb_, 32, al, "memory")
++__CMPXCHG_CASE(x,  ,  mb_, 64, al, "memory")
+ #undef __LL_SC_CMPXCHG
+ #undef __CMPXCHG_CASE
+--- a/arch/arm64/include/asm/cmpxchg.h
++++ b/arch/arm64/include/asm/cmpxchg.h
+@@ -29,46 +29,46 @@
+  * barrier case is generated as release+dmb for the former and
+  * acquire+release for the latter.
+  */
+-#define __XCHG_CASE(w, sz, name, mb, nop_lse, acq, acq_lse, rel, cl)  \
+-static inline unsigned long __xchg_case_##name(unsigned long x,               \
+-                                             volatile void *ptr)      \
+-{                                                                     \
+-      unsigned long ret, tmp;                                         \
+-                                                                      \
+-      asm volatile(ARM64_LSE_ATOMIC_INSN(                             \
+-      /* LL/SC */                                                     \
+-      "       prfm    pstl1strm, %2\n"                                \
+-      "1:     ld" #acq "xr" #sz "\t%" #w "0, %2\n"                    \
+-      "       st" #rel "xr" #sz "\t%w1, %" #w "3, %2\n"               \
+-      "       cbnz    %w1, 1b\n"                                      \
+-      "       " #mb,                                                  \
+-      /* LSE atomics */                                               \
+-      "       swp" #acq_lse #rel #sz "\t%" #w "3, %" #w "0, %2\n"     \
+-              __nops(3)                                               \
+-      "       " #nop_lse)                                             \
+-      : "=&r" (ret), "=&r" (tmp), "+Q" (*(unsigned long *)ptr)        \
+-      : "r" (x)                                                       \
+-      : cl);                                                          \
+-                                                                      \
+-      return ret;                                                     \
++#define __XCHG_CASE(w, sfx, name, sz, mb, nop_lse, acq, acq_lse, rel, cl)     \
++static inline u##sz __xchg_case_##name##sz(u##sz x, volatile void *ptr)               \
++{                                                                             \
++      u##sz ret;                                                              \
++      unsigned long tmp;                                                      \
++                                                                              \
++      asm volatile(ARM64_LSE_ATOMIC_INSN(                                     \
++      /* LL/SC */                                                             \
++      "       prfm    pstl1strm, %2\n"                                        \
++      "1:     ld" #acq "xr" #sfx "\t%" #w "0, %2\n"                           \
++      "       st" #rel "xr" #sfx "\t%w1, %" #w "3, %2\n"                      \
++      "       cbnz    %w1, 1b\n"                                              \
++      "       " #mb,                                                          \
++      /* LSE atomics */                                                       \
++      "       swp" #acq_lse #rel #sfx "\t%" #w "3, %" #w "0, %2\n"            \
++              __nops(3)                                                       \
++      "       " #nop_lse)                                                     \
++      : "=&r" (ret), "=&r" (tmp), "+Q" (*(u##sz *)ptr)                        \
++      : "r" (x)                                                               \
++      : cl);                                                                  \
++                                                                              \
++      return ret;                                                             \
+ }
+-__XCHG_CASE(w, b,     1,        ,    ,  ,  ,  ,         )
+-__XCHG_CASE(w, h,     2,        ,    ,  ,  ,  ,         )
+-__XCHG_CASE(w,  ,     4,        ,    ,  ,  ,  ,         )
+-__XCHG_CASE( ,  ,     8,        ,    ,  ,  ,  ,         )
+-__XCHG_CASE(w, b, acq_1,        ,    , a, a,  , "memory")
+-__XCHG_CASE(w, h, acq_2,        ,    , a, a,  , "memory")
+-__XCHG_CASE(w,  , acq_4,        ,    , a, a,  , "memory")
+-__XCHG_CASE( ,  , acq_8,        ,    , a, a,  , "memory")
+-__XCHG_CASE(w, b, rel_1,        ,    ,  ,  , l, "memory")
+-__XCHG_CASE(w, h, rel_2,        ,    ,  ,  , l, "memory")
+-__XCHG_CASE(w,  , rel_4,        ,    ,  ,  , l, "memory")
+-__XCHG_CASE( ,  , rel_8,        ,    ,  ,  , l, "memory")
+-__XCHG_CASE(w, b,  mb_1, dmb ish, nop,  , a, l, "memory")
+-__XCHG_CASE(w, h,  mb_2, dmb ish, nop,  , a, l, "memory")
+-__XCHG_CASE(w,  ,  mb_4, dmb ish, nop,  , a, l, "memory")
+-__XCHG_CASE( ,  ,  mb_8, dmb ish, nop,  , a, l, "memory")
++__XCHG_CASE(w, b,     ,  8,        ,    ,  ,  ,  ,         )
++__XCHG_CASE(w, h,     , 16,        ,    ,  ,  ,  ,         )
++__XCHG_CASE(w,  ,     , 32,        ,    ,  ,  ,  ,         )
++__XCHG_CASE( ,  ,     , 64,        ,    ,  ,  ,  ,         )
++__XCHG_CASE(w, b, acq_,  8,        ,    , a, a,  , "memory")
++__XCHG_CASE(w, h, acq_, 16,        ,    , a, a,  , "memory")
++__XCHG_CASE(w,  , acq_, 32,        ,    , a, a,  , "memory")
++__XCHG_CASE( ,  , acq_, 64,        ,    , a, a,  , "memory")
++__XCHG_CASE(w, b, rel_,  8,        ,    ,  ,  , l, "memory")
++__XCHG_CASE(w, h, rel_, 16,        ,    ,  ,  , l, "memory")
++__XCHG_CASE(w,  , rel_, 32,        ,    ,  ,  , l, "memory")
++__XCHG_CASE( ,  , rel_, 64,        ,    ,  ,  , l, "memory")
++__XCHG_CASE(w, b,  mb_,  8, dmb ish, nop,  , a, l, "memory")
++__XCHG_CASE(w, h,  mb_, 16, dmb ish, nop,  , a, l, "memory")
++__XCHG_CASE(w,  ,  mb_, 32, dmb ish, nop,  , a, l, "memory")
++__XCHG_CASE( ,  ,  mb_, 64, dmb ish, nop,  , a, l, "memory")
+ #undef __XCHG_CASE
+@@ -79,13 +79,13 @@ static __always_inline  unsigned long __
+ {                                                                     \
+       switch (size) {                                                 \
+       case 1:                                                         \
+-              return __xchg_case##sfx##_1(x, ptr);                    \
++              return __xchg_case##sfx##_8(x, ptr);                    \
+       case 2:                                                         \
+-              return __xchg_case##sfx##_2(x, ptr);                    \
++              return __xchg_case##sfx##_16(x, ptr);                   \
+       case 4:                                                         \
+-              return __xchg_case##sfx##_4(x, ptr);                    \
++              return __xchg_case##sfx##_32(x, ptr);                   \
+       case 8:                                                         \
+-              return __xchg_case##sfx##_8(x, ptr);                    \
++              return __xchg_case##sfx##_64(x, ptr);                   \
+       default:                                                        \
+               BUILD_BUG();                                            \
+       }                                                               \
+@@ -122,13 +122,13 @@ static __always_inline unsigned long __c
+ {                                                                     \
+       switch (size) {                                                 \
+       case 1:                                                         \
+-              return __cmpxchg_case##sfx##_1(ptr, (u8)old, new);      \
++              return __cmpxchg_case##sfx##_8(ptr, (u8)old, new);      \
+       case 2:                                                         \
+-              return __cmpxchg_case##sfx##_2(ptr, (u16)old, new);     \
++              return __cmpxchg_case##sfx##_16(ptr, (u16)old, new);    \
+       case 4:                                                         \
+-              return __cmpxchg_case##sfx##_4(ptr, old, new);          \
++              return __cmpxchg_case##sfx##_32(ptr, old, new);         \
+       case 8:                                                         \
+-              return __cmpxchg_case##sfx##_8(ptr, old, new);          \
++              return __cmpxchg_case##sfx##_64(ptr, old, new);         \
+       default:                                                        \
+               BUILD_BUG();                                            \
+       }                                                               \
+@@ -222,16 +222,16 @@ __CMPXCHG_GEN(_mb)
+       __ret;                                                          \
+ })
+-#define __CMPWAIT_CASE(w, sz, name)                                   \
+-static inline void __cmpwait_case_##name(volatile void *ptr,          \
+-                                       unsigned long val)             \
++#define __CMPWAIT_CASE(w, sfx, sz)                                    \
++static inline void __cmpwait_case_##sz(volatile void *ptr,            \
++                                     unsigned long val)               \
+ {                                                                     \
+       unsigned long tmp;                                              \
+                                                                       \
+       asm volatile(                                                   \
+       "       sevl\n"                                                 \
+       "       wfe\n"                                                  \
+-      "       ldxr" #sz "\t%" #w "[tmp], %[v]\n"                      \
++      "       ldxr" #sfx "\t%" #w "[tmp], %[v]\n"                     \
+       "       eor     %" #w "[tmp], %" #w "[tmp], %" #w "[val]\n"     \
+       "       cbnz    %" #w "[tmp], 1f\n"                             \
+       "       wfe\n"                                                  \
+@@ -240,10 +240,10 @@ static inline void __cmpwait_case_##name
+       : [val] "r" (val));                                             \
+ }
+-__CMPWAIT_CASE(w, b, 1);
+-__CMPWAIT_CASE(w, h, 2);
+-__CMPWAIT_CASE(w,  , 4);
+-__CMPWAIT_CASE( ,  , 8);
++__CMPWAIT_CASE(w, b, 8);
++__CMPWAIT_CASE(w, h, 16);
++__CMPWAIT_CASE(w,  , 32);
++__CMPWAIT_CASE( ,  , 64);
+ #undef __CMPWAIT_CASE
+@@ -254,13 +254,13 @@ static __always_inline void __cmpwait##s
+ {                                                                     \
+       switch (size) {                                                 \
+       case 1:                                                         \
+-              return __cmpwait_case##sfx##_1(ptr, (u8)val);           \
++              return __cmpwait_case##sfx##_8(ptr, (u8)val);           \
+       case 2:                                                         \
+-              return __cmpwait_case##sfx##_2(ptr, (u16)val);          \
++              return __cmpwait_case##sfx##_16(ptr, (u16)val);         \
+       case 4:                                                         \
+-              return __cmpwait_case##sfx##_4(ptr, val);               \
++              return __cmpwait_case##sfx##_32(ptr, val);              \
+       case 8:                                                         \
+-              return __cmpwait_case##sfx##_8(ptr, val);               \
++              return __cmpwait_case##sfx##_64(ptr, val);              \
+       default:                                                        \
+               BUILD_BUG();                                            \
+       }                                                               \
diff --git a/queue-4.9/arm64-cmpxchg-use-k-instead-of-l-for-ll-sc-immediate-constraint.patch b/queue-4.9/arm64-cmpxchg-use-k-instead-of-l-for-ll-sc-immediate-constraint.patch
new file mode 100644 (file)
index 0000000..22ccc0c
--- /dev/null
@@ -0,0 +1,39 @@
+From foo@baz Thu Mar  4 02:49:26 PM CET 2021
+From: Will Deacon <will.deacon@arm.com>
+Date: Tue, 18 Sep 2018 09:39:55 +0100
+Subject: arm64: cmpxchg: Use "K" instead of "L" for ll/sc immediate constraint
+
+From: Will Deacon <will.deacon@arm.com>
+
+commit 4230509978f2921182da4e9197964dccdbe463c3 upstream.
+
+The "L" AArch64 machine constraint, which we use for the "old" value in
+an LL/SC cmpxchg(), generates an immediate that is suitable for a 64-bit
+logical instruction. However, for cmpxchg() operations on types smaller
+than 64 bits, this constraint can result in an invalid instruction which
+is correctly rejected by GAS, such as EOR W1, W1, #0xffffffff.
+
+Whilst we could special-case the constraint based on the cmpxchg size,
+it's far easier to change the constraint to "K" and put up with using
+a register for large 64-bit immediates. For out-of-line LL/SC atomics,
+this is all moot anyway.
+
+Reported-by: Robin Murphy <robin.murphy@arm.com>
+Signed-off-by: Will Deacon <will.deacon@arm.com>
+Signed-off-by: Ben Hutchings <ben@decadent.org.uk>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ arch/arm64/include/asm/atomic_ll_sc.h |    2 +-
+ 1 file changed, 1 insertion(+), 1 deletion(-)
+
+--- a/arch/arm64/include/asm/atomic_ll_sc.h
++++ b/arch/arm64/include/asm/atomic_ll_sc.h
+@@ -268,7 +268,7 @@ __LL_SC_PREFIX(__cmpxchg_case_##name##sz
+       "2:"                                                            \
+       : [tmp] "=&r" (tmp), [oldval] "=&r" (oldval),                   \
+         [v] "+Q" (*(u##sz *)ptr)                                      \
+-      : [old] "Lr" (old), [new] "r" (new)                             \
++      : [old] "Kr" (old), [new] "r" (new)                             \
+       : cl);                                                          \
+                                                                       \
+       return oldval;                                                  \
diff --git a/queue-4.9/arm64-remove-redundant-mov-from-ll-sc-cmpxchg.patch b/queue-4.9/arm64-remove-redundant-mov-from-ll-sc-cmpxchg.patch
new file mode 100644 (file)
index 0000000..8cb0f8f
--- /dev/null
@@ -0,0 +1,42 @@
+From foo@baz Thu Mar  4 02:49:26 PM CET 2021
+From: Robin Murphy <robin.murphy@arm.com>
+Date: Fri, 12 May 2017 13:48:41 +0100
+Subject: arm64: Remove redundant mov from LL/SC cmpxchg
+
+From: Robin Murphy <robin.murphy@arm.com>
+
+commit 8df728e1ae614f592961e51f65d3e3212ede5a75 upstream.
+
+The cmpxchg implementation introduced by commit c342f78217e8 ("arm64:
+cmpxchg: patch in lse instructions when supported by the CPU") performs
+an apparently redundant register move of [old] to [oldval] in the
+success case - it always uses the same register width as [oldval] was
+originally loaded with, and is only executed when [old] and [oldval] are
+known to be equal anyway.
+
+The only effect it seemingly does have is to take up a surprising amount
+of space in the kernel text, as removing it reveals:
+
+   text           data     bss     dec     hex filename
+12426658       1348614 4499749 18275021        116dacd vmlinux.o.new
+12429238       1348614 4499749 18277601        116e4e1 vmlinux.o.old
+
+Reviewed-by: Will Deacon <will.deacon@arm.com>
+Signed-off-by: Robin Murphy <robin.murphy@arm.com>
+Signed-off-by: Catalin Marinas <catalin.marinas@arm.com>
+Signed-off-by: Ben Hutchings <ben@decadent.org.uk>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ arch/arm64/include/asm/atomic_ll_sc.h |    1 -
+ 1 file changed, 1 deletion(-)
+
+--- a/arch/arm64/include/asm/atomic_ll_sc.h
++++ b/arch/arm64/include/asm/atomic_ll_sc.h
+@@ -264,7 +264,6 @@ __LL_SC_PREFIX(__cmpxchg_case_##name(vol
+       "       st" #rel "xr" #sz "\t%w[tmp], %" #w "[new], %[v]\n"     \
+       "       cbnz    %w[tmp], 1b\n"                                  \
+       "       " #mb "\n"                                              \
+-      "       mov     %" #w "[oldval], %" #w "[old]\n"                \
+       "2:"                                                            \
+       : [tmp] "=&r" (tmp), [oldval] "=&r" (oldval),                   \
+         [v] "+Q" (*(unsigned long *)ptr)                              \
diff --git a/queue-4.9/arm64-use-correct-ll-sc-atomic-constraints.patch b/queue-4.9/arm64-use-correct-ll-sc-atomic-constraints.patch
new file mode 100644 (file)
index 0000000..5b17e62
--- /dev/null
@@ -0,0 +1,253 @@
+From foo@baz Thu Mar  4 02:49:26 PM CET 2021
+From: Andrew Murray <andrew.murray@arm.com>
+Date: Wed, 28 Aug 2019 18:50:06 +0100
+Subject: arm64: Use correct ll/sc atomic constraints
+
+From: Andrew Murray <andrew.murray@arm.com>
+
+commit 580fa1b874711d633f9b145b7777b0e83ebf3787 upstream.
+
+The A64 ISA accepts distinct (but overlapping) ranges of immediates for:
+
+ * add arithmetic instructions ('I' machine constraint)
+ * sub arithmetic instructions ('J' machine constraint)
+ * 32-bit logical instructions ('K' machine constraint)
+ * 64-bit logical instructions ('L' machine constraint)
+
+... but we currently use the 'I' constraint for many atomic operations
+using sub or logical instructions, which is not always valid.
+
+When CONFIG_ARM64_LSE_ATOMICS is not set, this allows invalid immediates
+to be passed to instructions, potentially resulting in a build failure.
+When CONFIG_ARM64_LSE_ATOMICS is selected the out-of-line ll/sc atomics
+always use a register as they have no visibility of the value passed by
+the caller.
+
+This patch adds a constraint parameter to the ATOMIC_xx and
+__CMPXCHG_CASE macros so that we can pass appropriate constraints for
+each case, with uses updated accordingly.
+
+Unfortunately prior to GCC 8.1.0 the 'K' constraint erroneously accepted
+'4294967295', so we must instead force the use of a register.
+
+Signed-off-by: Andrew Murray <andrew.murray@arm.com>
+Signed-off-by: Will Deacon <will@kernel.org>
+[bwh: Backported to 4.9: adjust context]
+Signed-off-by: Ben Hutchings <ben@decadent.org.uk>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ arch/arm64/include/asm/atomic_ll_sc.h |   89 +++++++++++++++++-----------------
+ 1 file changed, 47 insertions(+), 42 deletions(-)
+
+--- a/arch/arm64/include/asm/atomic_ll_sc.h
++++ b/arch/arm64/include/asm/atomic_ll_sc.h
+@@ -37,7 +37,7 @@
+  * (the optimize attribute silently ignores these options).
+  */
+-#define ATOMIC_OP(op, asm_op)                                         \
++#define ATOMIC_OP(op, asm_op, constraint)                             \
+ __LL_SC_INLINE void                                                   \
+ __LL_SC_PREFIX(atomic_##op(int i, atomic_t *v))                               \
+ {                                                                     \
+@@ -51,11 +51,11 @@ __LL_SC_PREFIX(atomic_##op(int i, atomic
+ "     stxr    %w1, %w0, %2\n"                                         \
+ "     cbnz    %w1, 1b"                                                \
+       : "=&r" (result), "=&r" (tmp), "+Q" (v->counter)                \
+-      : "Ir" (i));                                                    \
++      : #constraint "r" (i));                                         \
+ }                                                                     \
+ __LL_SC_EXPORT(atomic_##op);
+-#define ATOMIC_OP_RETURN(name, mb, acq, rel, cl, op, asm_op)          \
++#define ATOMIC_OP_RETURN(name, mb, acq, rel, cl, op, asm_op, constraint)\
+ __LL_SC_INLINE int                                                    \
+ __LL_SC_PREFIX(atomic_##op##_return##name(int i, atomic_t *v))                \
+ {                                                                     \
+@@ -70,14 +70,14 @@ __LL_SC_PREFIX(atomic_##op##_return##nam
+ "     cbnz    %w1, 1b\n"                                              \
+ "     " #mb                                                           \
+       : "=&r" (result), "=&r" (tmp), "+Q" (v->counter)                \
+-      : "Ir" (i)                                                      \
++      : #constraint "r" (i)                                           \
+       : cl);                                                          \
+                                                                       \
+       return result;                                                  \
+ }                                                                     \
+ __LL_SC_EXPORT(atomic_##op##_return##name);
+-#define ATOMIC_FETCH_OP(name, mb, acq, rel, cl, op, asm_op)           \
++#define ATOMIC_FETCH_OP(name, mb, acq, rel, cl, op, asm_op, constraint)       \
+ __LL_SC_INLINE int                                                    \
+ __LL_SC_PREFIX(atomic_fetch_##op##name(int i, atomic_t *v))           \
+ {                                                                     \
+@@ -92,7 +92,7 @@ __LL_SC_PREFIX(atomic_fetch_##op##name(i
+ "     cbnz    %w2, 1b\n"                                              \
+ "     " #mb                                                           \
+       : "=&r" (result), "=&r" (val), "=&r" (tmp), "+Q" (v->counter)   \
+-      : "Ir" (i)                                                      \
++      : #constraint "r" (i)                                           \
+       : cl);                                                          \
+                                                                       \
+       return result;                                                  \
+@@ -110,8 +110,8 @@ __LL_SC_EXPORT(atomic_fetch_##op##name);
+       ATOMIC_FETCH_OP (_acquire,        , a,  , "memory", __VA_ARGS__)\
+       ATOMIC_FETCH_OP (_release,        ,  , l, "memory", __VA_ARGS__)
+-ATOMIC_OPS(add, add)
+-ATOMIC_OPS(sub, sub)
++ATOMIC_OPS(add, add, I)
++ATOMIC_OPS(sub, sub, J)
+ #undef ATOMIC_OPS
+ #define ATOMIC_OPS(...)                                                       \
+@@ -121,17 +121,17 @@ ATOMIC_OPS(sub, sub)
+       ATOMIC_FETCH_OP (_acquire,        , a,  , "memory", __VA_ARGS__)\
+       ATOMIC_FETCH_OP (_release,        ,  , l, "memory", __VA_ARGS__)
+-ATOMIC_OPS(and, and)
+-ATOMIC_OPS(andnot, bic)
+-ATOMIC_OPS(or, orr)
+-ATOMIC_OPS(xor, eor)
++ATOMIC_OPS(and, and, )
++ATOMIC_OPS(andnot, bic, )
++ATOMIC_OPS(or, orr, )
++ATOMIC_OPS(xor, eor, )
+ #undef ATOMIC_OPS
+ #undef ATOMIC_FETCH_OP
+ #undef ATOMIC_OP_RETURN
+ #undef ATOMIC_OP
+-#define ATOMIC64_OP(op, asm_op)                                               \
++#define ATOMIC64_OP(op, asm_op, constraint)                           \
+ __LL_SC_INLINE void                                                   \
+ __LL_SC_PREFIX(atomic64_##op(long i, atomic64_t *v))                  \
+ {                                                                     \
+@@ -145,11 +145,11 @@ __LL_SC_PREFIX(atomic64_##op(long i, ato
+ "     stxr    %w1, %0, %2\n"                                          \
+ "     cbnz    %w1, 1b"                                                \
+       : "=&r" (result), "=&r" (tmp), "+Q" (v->counter)                \
+-      : "Ir" (i));                                                    \
++      : #constraint "r" (i));                                         \
+ }                                                                     \
+ __LL_SC_EXPORT(atomic64_##op);
+-#define ATOMIC64_OP_RETURN(name, mb, acq, rel, cl, op, asm_op)                \
++#define ATOMIC64_OP_RETURN(name, mb, acq, rel, cl, op, asm_op, constraint)\
+ __LL_SC_INLINE long                                                   \
+ __LL_SC_PREFIX(atomic64_##op##_return##name(long i, atomic64_t *v))   \
+ {                                                                     \
+@@ -164,14 +164,14 @@ __LL_SC_PREFIX(atomic64_##op##_return##n
+ "     cbnz    %w1, 1b\n"                                              \
+ "     " #mb                                                           \
+       : "=&r" (result), "=&r" (tmp), "+Q" (v->counter)                \
+-      : "Ir" (i)                                                      \
++      : #constraint "r" (i)                                           \
+       : cl);                                                          \
+                                                                       \
+       return result;                                                  \
+ }                                                                     \
+ __LL_SC_EXPORT(atomic64_##op##_return##name);
+-#define ATOMIC64_FETCH_OP(name, mb, acq, rel, cl, op, asm_op)         \
++#define ATOMIC64_FETCH_OP(name, mb, acq, rel, cl, op, asm_op, constraint)\
+ __LL_SC_INLINE long                                                   \
+ __LL_SC_PREFIX(atomic64_fetch_##op##name(long i, atomic64_t *v))      \
+ {                                                                     \
+@@ -186,7 +186,7 @@ __LL_SC_PREFIX(atomic64_fetch_##op##name
+ "     cbnz    %w2, 1b\n"                                              \
+ "     " #mb                                                           \
+       : "=&r" (result), "=&r" (val), "=&r" (tmp), "+Q" (v->counter)   \
+-      : "Ir" (i)                                                      \
++      : #constraint "r" (i)                                           \
+       : cl);                                                          \
+                                                                       \
+       return result;                                                  \
+@@ -204,8 +204,8 @@ __LL_SC_EXPORT(atomic64_fetch_##op##name
+       ATOMIC64_FETCH_OP (_acquire,, a,  , "memory", __VA_ARGS__)      \
+       ATOMIC64_FETCH_OP (_release,,  , l, "memory", __VA_ARGS__)
+-ATOMIC64_OPS(add, add)
+-ATOMIC64_OPS(sub, sub)
++ATOMIC64_OPS(add, add, I)
++ATOMIC64_OPS(sub, sub, J)
+ #undef ATOMIC64_OPS
+ #define ATOMIC64_OPS(...)                                             \
+@@ -215,10 +215,10 @@ ATOMIC64_OPS(sub, sub)
+       ATOMIC64_FETCH_OP (_acquire,, a,  , "memory", __VA_ARGS__)      \
+       ATOMIC64_FETCH_OP (_release,,  , l, "memory", __VA_ARGS__)
+-ATOMIC64_OPS(and, and)
+-ATOMIC64_OPS(andnot, bic)
+-ATOMIC64_OPS(or, orr)
+-ATOMIC64_OPS(xor, eor)
++ATOMIC64_OPS(and, and, L)
++ATOMIC64_OPS(andnot, bic, )
++ATOMIC64_OPS(or, orr, L)
++ATOMIC64_OPS(xor, eor, L)
+ #undef ATOMIC64_OPS
+ #undef ATOMIC64_FETCH_OP
+@@ -248,7 +248,7 @@ __LL_SC_PREFIX(atomic64_dec_if_positive(
+ }
+ __LL_SC_EXPORT(atomic64_dec_if_positive);
+-#define __CMPXCHG_CASE(w, sfx, name, sz, mb, acq, rel, cl)            \
++#define __CMPXCHG_CASE(w, sfx, name, sz, mb, acq, rel, cl, constraint)        \
+ __LL_SC_INLINE u##sz                                                  \
+ __LL_SC_PREFIX(__cmpxchg_case_##name##sz(volatile void *ptr,          \
+                                        unsigned long old,             \
+@@ -268,29 +268,34 @@ __LL_SC_PREFIX(__cmpxchg_case_##name##sz
+       "2:"                                                            \
+       : [tmp] "=&r" (tmp), [oldval] "=&r" (oldval),                   \
+         [v] "+Q" (*(u##sz *)ptr)                                      \
+-      : [old] "Kr" (old), [new] "r" (new)                             \
++      : [old] #constraint "r" (old), [new] "r" (new)                  \
+       : cl);                                                          \
+                                                                       \
+       return oldval;                                                  \
+ }                                                                     \
+ __LL_SC_EXPORT(__cmpxchg_case_##name##sz);
+-__CMPXCHG_CASE(w, b,     ,  8,        ,  ,  ,         )
+-__CMPXCHG_CASE(w, h,     , 16,        ,  ,  ,         )
+-__CMPXCHG_CASE(w,  ,     , 32,        ,  ,  ,         )
+-__CMPXCHG_CASE( ,  ,     , 64,        ,  ,  ,         )
+-__CMPXCHG_CASE(w, b, acq_,  8,        , a,  , "memory")
+-__CMPXCHG_CASE(w, h, acq_, 16,        , a,  , "memory")
+-__CMPXCHG_CASE(w,  , acq_, 32,        , a,  , "memory")
+-__CMPXCHG_CASE( ,  , acq_, 64,        , a,  , "memory")
+-__CMPXCHG_CASE(w, b, rel_,  8,        ,  , l, "memory")
+-__CMPXCHG_CASE(w, h, rel_, 16,        ,  , l, "memory")
+-__CMPXCHG_CASE(w,  , rel_, 32,        ,  , l, "memory")
+-__CMPXCHG_CASE( ,  , rel_, 64,        ,  , l, "memory")
+-__CMPXCHG_CASE(w, b,  mb_,  8, dmb ish,  , l, "memory")
+-__CMPXCHG_CASE(w, h,  mb_, 16, dmb ish,  , l, "memory")
+-__CMPXCHG_CASE(w,  ,  mb_, 32, dmb ish,  , l, "memory")
+-__CMPXCHG_CASE( ,  ,  mb_, 64, dmb ish,  , l, "memory")
++/*
++ * Earlier versions of GCC (no later than 8.1.0) appear to incorrectly
++ * handle the 'K' constraint for the value 4294967295 - thus we use no
++ * constraint for 32 bit operations.
++ */
++__CMPXCHG_CASE(w, b,     ,  8,        ,  ,  ,         , )
++__CMPXCHG_CASE(w, h,     , 16,        ,  ,  ,         , )
++__CMPXCHG_CASE(w,  ,     , 32,        ,  ,  ,         , )
++__CMPXCHG_CASE( ,  ,     , 64,        ,  ,  ,         , L)
++__CMPXCHG_CASE(w, b, acq_,  8,        , a,  , "memory", )
++__CMPXCHG_CASE(w, h, acq_, 16,        , a,  , "memory", )
++__CMPXCHG_CASE(w,  , acq_, 32,        , a,  , "memory", )
++__CMPXCHG_CASE( ,  , acq_, 64,        , a,  , "memory", L)
++__CMPXCHG_CASE(w, b, rel_,  8,        ,  , l, "memory", )
++__CMPXCHG_CASE(w, h, rel_, 16,        ,  , l, "memory", )
++__CMPXCHG_CASE(w,  , rel_, 32,        ,  , l, "memory", )
++__CMPXCHG_CASE( ,  , rel_, 64,        ,  , l, "memory", L)
++__CMPXCHG_CASE(w, b,  mb_,  8, dmb ish,  , l, "memory", )
++__CMPXCHG_CASE(w, h,  mb_, 16, dmb ish,  , l, "memory", )
++__CMPXCHG_CASE(w,  ,  mb_, 32, dmb ish,  , l, "memory", )
++__CMPXCHG_CASE( ,  ,  mb_, 64, dmb ish,  , l, "memory", L)
+ #undef __CMPXCHG_CASE
diff --git a/queue-4.9/hugetlb-fix-update_and_free_page-contig-page-struct-assumption.patch b/queue-4.9/hugetlb-fix-update_and_free_page-contig-page-struct-assumption.patch
new file mode 100644 (file)
index 0000000..eeb3b68
--- /dev/null
@@ -0,0 +1,69 @@
+From dbfee5aee7e54f83d96ceb8e3e80717fac62ad63 Mon Sep 17 00:00:00 2001
+From: Mike Kravetz <mike.kravetz@oracle.com>
+Date: Wed, 24 Feb 2021 12:07:50 -0800
+Subject: hugetlb: fix update_and_free_page contig page struct assumption
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+From: Mike Kravetz <mike.kravetz@oracle.com>
+
+commit dbfee5aee7e54f83d96ceb8e3e80717fac62ad63 upstream.
+
+page structs are not guaranteed to be contiguous for gigantic pages.  The
+routine update_and_free_page can encounter a gigantic page, yet it assumes
+page structs are contiguous when setting page flags in subpages.
+
+If update_and_free_page encounters non-contiguous page structs, we can see
+“BUG: Bad page state in process …” errors.
+
+Non-contiguous page structs are generally not an issue.  However, they can
+exist with a specific kernel configuration and hotplug operations.  For
+example: Configure the kernel with CONFIG_SPARSEMEM and
+!CONFIG_SPARSEMEM_VMEMMAP.  Then, hotplug add memory for the area where
+the gigantic page will be allocated.  Zi Yan outlined steps to reproduce
+here [1].
+
+[1] https://lore.kernel.org/linux-mm/16F7C58B-4D79-41C5-9B64-A1A1628F4AF2@nvidia.com/
+
+Link: https://lkml.kernel.org/r/20210217184926.33567-1-mike.kravetz@oracle.com
+Fixes: 944d9fec8d7a ("hugetlb: add support for gigantic page allocation at runtime")
+Signed-off-by: Zi Yan <ziy@nvidia.com>
+Signed-off-by: Mike Kravetz <mike.kravetz@oracle.com>
+Cc: Zi Yan <ziy@nvidia.com>
+Cc: Davidlohr Bueso <dbueso@suse.de>
+Cc: "Kirill A . Shutemov" <kirill.shutemov@linux.intel.com>
+Cc: Andrea Arcangeli <aarcange@redhat.com>
+Cc: Matthew Wilcox <willy@infradead.org>
+Cc: Oscar Salvador <osalvador@suse.de>
+Cc: Joao Martins <joao.m.martins@oracle.com>
+Cc: <stable@vger.kernel.org>
+Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
+Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+Signed-off-by: Mike Kravetz <mike.kravetz@oracle.com>
+---
+ mm/hugetlb.c |    6 ++++--
+ 1 file changed, 4 insertions(+), 2 deletions(-)
+
+--- a/mm/hugetlb.c
++++ b/mm/hugetlb.c
+@@ -1185,14 +1185,16 @@ static inline int alloc_fresh_gigantic_p
+ static void update_and_free_page(struct hstate *h, struct page *page)
+ {
+       int i;
++      struct page *subpage = page;
+       if (hstate_is_gigantic(h) && !gigantic_page_supported())
+               return;
+       h->nr_huge_pages--;
+       h->nr_huge_pages_node[page_to_nid(page)]--;
+-      for (i = 0; i < pages_per_huge_page(h); i++) {
+-              page[i].flags &= ~(1 << PG_locked | 1 << PG_error |
++      for (i = 0; i < pages_per_huge_page(h);
++           i++, subpage = mem_map_next(subpage, page, i)) {
++              subpage->flags &= ~(1 << PG_locked | 1 << PG_error |
+                               1 << PG_referenced | 1 << PG_dirty |
+                               1 << PG_active | 1 << PG_private |
+                               1 << PG_writeback);
diff --git a/queue-4.9/net-usb-qmi_wwan-support-zte-p685m-modem.patch b/queue-4.9/net-usb-qmi_wwan-support-zte-p685m-modem.patch
new file mode 100644 (file)
index 0000000..ae4f80f
--- /dev/null
@@ -0,0 +1,65 @@
+From 88eee9b7b42e69fb622ddb3ff6f37e8e4347f5b2 Mon Sep 17 00:00:00 2001
+From: Lech Perczak <lech.perczak@gmail.com>
+Date: Tue, 23 Feb 2021 19:34:56 +0100
+Subject: net: usb: qmi_wwan: support ZTE P685M modem
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+From: Lech Perczak <lech.perczak@gmail.com>
+
+commit 88eee9b7b42e69fb622ddb3ff6f37e8e4347f5b2 upstream.
+
+Now that interface 3 in "option" driver is no longer mapped, add device
+ID matching it to qmi_wwan.
+
+The modem is used inside ZTE MF283+ router and carriers identify it as
+such.
+Interface mapping is:
+0: QCDM, 1: AT (PCUI), 2: AT (Modem), 3: QMI, 4: ADB
+
+T:  Bus=02 Lev=02 Prnt=02 Port=05 Cnt=01 Dev#=  3 Spd=480  MxCh= 0
+D:  Ver= 2.01 Cls=00(>ifc ) Sub=00 Prot=00 MxPS=64 #Cfgs=  1
+P:  Vendor=19d2 ProdID=1275 Rev=f0.00
+S:  Manufacturer=ZTE,Incorporated
+S:  Product=ZTE Technologies MSM
+S:  SerialNumber=P685M510ZTED0000CP&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&0
+C:* #Ifs= 5 Cfg#= 1 Atr=a0 MxPwr=500mA
+I:* If#= 0 Alt= 0 #EPs= 2 Cls=ff(vend.) Sub=ff Prot=ff Driver=option
+E:  Ad=81(I) Atr=02(Bulk) MxPS= 512 Ivl=0ms
+E:  Ad=01(O) Atr=02(Bulk) MxPS= 512 Ivl=0ms
+I:* If#= 1 Alt= 0 #EPs= 3 Cls=ff(vend.) Sub=00 Prot=00 Driver=option
+E:  Ad=83(I) Atr=03(Int.) MxPS=  10 Ivl=32ms
+E:  Ad=82(I) Atr=02(Bulk) MxPS= 512 Ivl=0ms
+E:  Ad=02(O) Atr=02(Bulk) MxPS= 512 Ivl=0ms
+I:* If#= 2 Alt= 0 #EPs= 3 Cls=ff(vend.) Sub=00 Prot=00 Driver=option
+E:  Ad=85(I) Atr=03(Int.) MxPS=  10 Ivl=32ms
+E:  Ad=84(I) Atr=02(Bulk) MxPS= 512 Ivl=0ms
+E:  Ad=03(O) Atr=02(Bulk) MxPS= 512 Ivl=0ms
+I:* If#= 3 Alt= 0 #EPs= 3 Cls=ff(vend.) Sub=ff Prot=ff Driver=qmi_wwan
+E:  Ad=87(I) Atr=03(Int.) MxPS=   8 Ivl=32ms
+E:  Ad=86(I) Atr=02(Bulk) MxPS= 512 Ivl=0ms
+E:  Ad=04(O) Atr=02(Bulk) MxPS= 512 Ivl=0ms
+I:* If#= 4 Alt= 0 #EPs= 2 Cls=ff(vend.) Sub=42 Prot=01 Driver=(none)
+E:  Ad=88(I) Atr=02(Bulk) MxPS= 512 Ivl=0ms
+E:  Ad=05(O) Atr=02(Bulk) MxPS= 512 Ivl=0ms
+
+Acked-by: Bjørn Mork <bjorn@mork.no>
+Signed-off-by: Lech Perczak <lech.perczak@gmail.com>
+Link: https://lore.kernel.org/r/20210223183456.6377-1-lech.perczak@gmail.com
+Signed-off-by: Jakub Kicinski <kuba@kernel.org>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ drivers/net/usb/qmi_wwan.c |    1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/drivers/net/usb/qmi_wwan.c
++++ b/drivers/net/usb/qmi_wwan.c
+@@ -881,6 +881,7 @@ static const struct usb_device_id produc
+       {QMI_FIXED_INTF(0x19d2, 0x1255, 4)},
+       {QMI_FIXED_INTF(0x19d2, 0x1256, 4)},
+       {QMI_FIXED_INTF(0x19d2, 0x1270, 5)},    /* ZTE MF667 */
++      {QMI_FIXED_INTF(0x19d2, 0x1275, 3)},    /* ZTE P685M */
+       {QMI_FIXED_INTF(0x19d2, 0x1401, 2)},
+       {QMI_FIXED_INTF(0x19d2, 0x1402, 2)},    /* ZTE MF60 */
+       {QMI_FIXED_INTF(0x19d2, 0x1424, 2)},
diff --git a/queue-4.9/printk-fix-deadlock-when-kernel-panic.patch b/queue-4.9/printk-fix-deadlock-when-kernel-panic.patch
new file mode 100644 (file)
index 0000000..c5a8ad5
--- /dev/null
@@ -0,0 +1,110 @@
+From 8a8109f303e25a27f92c1d8edd67d7cbbc60a4eb Mon Sep 17 00:00:00 2001
+From: Muchun Song <songmuchun@bytedance.com>
+Date: Wed, 10 Feb 2021 11:48:23 +0800
+Subject: printk: fix deadlock when kernel panic
+
+From: Muchun Song <songmuchun@bytedance.com>
+
+commit 8a8109f303e25a27f92c1d8edd67d7cbbc60a4eb upstream.
+
+printk_safe_flush_on_panic() caused the following deadlock on our
+server:
+
+CPU0:                                         CPU1:
+panic                                         rcu_dump_cpu_stacks
+  kdump_nmi_shootdown_cpus                      nmi_trigger_cpumask_backtrace
+    register_nmi_handler(crash_nmi_callback)      printk_safe_flush
+                                                    __printk_safe_flush
+                                                      raw_spin_lock_irqsave(&read_lock)
+    // send NMI to other processors
+    apic_send_IPI_allbutself(NMI_VECTOR)
+                                                        // NMI interrupt, dead loop
+                                                        crash_nmi_callback
+  printk_safe_flush_on_panic
+    printk_safe_flush
+      __printk_safe_flush
+        // deadlock
+        raw_spin_lock_irqsave(&read_lock)
+
+DEADLOCK: read_lock is taken on CPU1 and will never get released.
+
+It happens when panic() stops a CPU by NMI while it has been in
+the middle of printk_safe_flush().
+
+Handle the lock the same way as logbuf_lock. The printk_safe buffers
+are flushed only when both locks can be safely taken. It can avoid
+the deadlock _in this particular case_ at expense of losing contents
+of printk_safe buffers.
+
+Note: It would actually be safe to re-init the locks when all CPUs were
+      stopped by NMI. But it would require passing this information
+      from arch-specific code. It is not worth the complexity.
+      Especially because logbuf_lock and printk_safe buffers have been
+      obsoleted by the lockless ring buffer.
+
+Fixes: cf9b1106c81c ("printk/nmi: flush NMI messages on the system panic")
+Signed-off-by: Muchun Song <songmuchun@bytedance.com>
+Reviewed-by: Petr Mladek <pmladek@suse.com>
+Cc: <stable@vger.kernel.org>
+Acked-by: Sergey Senozhatsky <sergey.senozhatsky@gmail.com>
+Signed-off-by: Petr Mladek <pmladek@suse.com>
+Link: https://lore.kernel.org/r/20210210034823.64867-1-songmuchun@bytedance.com
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ kernel/printk/nmi.c |   16 ++++++++++++----
+ 1 file changed, 12 insertions(+), 4 deletions(-)
+
+--- a/kernel/printk/nmi.c
++++ b/kernel/printk/nmi.c
+@@ -52,6 +52,8 @@ struct nmi_seq_buf {
+ };
+ static DEFINE_PER_CPU(struct nmi_seq_buf, nmi_print_seq);
++static DEFINE_RAW_SPINLOCK(nmi_read_lock);
++
+ /*
+  * Safe printk() for NMI context. It uses a per-CPU buffer to
+  * store the message. NMIs are not nested, so there is always only
+@@ -134,8 +136,6 @@ static void printk_nmi_flush_seq_line(st
+  */
+ static void __printk_nmi_flush(struct irq_work *work)
+ {
+-      static raw_spinlock_t read_lock =
+-              __RAW_SPIN_LOCK_INITIALIZER(read_lock);
+       struct nmi_seq_buf *s = container_of(work, struct nmi_seq_buf, work);
+       unsigned long flags;
+       size_t len, size;
+@@ -148,7 +148,7 @@ static void __printk_nmi_flush(struct ir
+        * different CPUs. This is especially important when printing
+        * a backtrace.
+        */
+-      raw_spin_lock_irqsave(&read_lock, flags);
++      raw_spin_lock_irqsave(&nmi_read_lock, flags);
+       i = 0;
+ more:
+@@ -197,7 +197,7 @@ more:
+               goto more;
+ out:
+-      raw_spin_unlock_irqrestore(&read_lock, flags);
++      raw_spin_unlock_irqrestore(&nmi_read_lock, flags);
+ }
+ /**
+@@ -239,6 +239,14 @@ void printk_nmi_flush_on_panic(void)
+               raw_spin_lock_init(&logbuf_lock);
+       }
++      if (in_nmi() && raw_spin_is_locked(&nmi_read_lock)) {
++              if (num_online_cpus() > 1)
++                      return;
++
++              debug_locks_off();
++              raw_spin_lock_init(&nmi_read_lock);
++      }
++
+       printk_nmi_flush();
+ }
diff --git a/queue-4.9/scripts-set-proper-openssl-include-dir-also-for-sign-file.patch b/queue-4.9/scripts-set-proper-openssl-include-dir-also-for-sign-file.patch
new file mode 100644 (file)
index 0000000..5ca12bf
--- /dev/null
@@ -0,0 +1,29 @@
+From foo@baz Thu Mar  4 02:32:00 PM CET 2021
+From: Rolf Eike Beer <eb@emlix.com>
+Date: Thu, 04 Mar 2021 08:26:28 +0100
+Subject: scripts: set proper OpenSSL include dir also for sign-file
+To: stable@vger.kernel.org
+Message-ID: <1859038.itBudK23F7@devpool47>
+
+From: Rolf Eike Beer <eb@emlix.com>
+
+commit fe968c41ac4f4ec9ffe3c4cf16b72285f5e9674f upstream.
+
+Fixes: 2cea4a7a1885 ("scripts: use pkg-config to locate libcrypto")
+Signed-off-by: Rolf Eike Beer <eb@emlix.com>
+Signed-off-by: Masahiro Yamada <masahiroy@kernel.org>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ scripts/Makefile |    1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/scripts/Makefile
++++ b/scripts/Makefile
+@@ -26,6 +26,7 @@ hostprogs-$(CONFIG_SYSTEM_EXTRA_CERTIFIC
+ HOSTCFLAGS_sortextable.o = -I$(srctree)/tools/include
+ HOSTCFLAGS_asn1_compiler.o = -I$(srctree)/include
++HOSTCFLAGS_sign-file.o = $(CRYPTO_CFLAGS)
+ HOSTLOADLIBES_sign-file = $(CRYPTO_LIBS)
+ HOSTCFLAGS_extract-cert.o = $(CRYPTO_CFLAGS)
+ HOSTLOADLIBES_extract-cert = $(CRYPTO_LIBS)
diff --git a/queue-4.9/scripts-use-pkg-config-to-locate-libcrypto.patch b/queue-4.9/scripts-use-pkg-config-to-locate-libcrypto.patch
new file mode 100644 (file)
index 0000000..c19e5db
--- /dev/null
@@ -0,0 +1,45 @@
+From foo@baz Thu Mar  4 02:32:00 PM CET 2021
+From: Rolf Eike Beer <eb@emlix.com>
+Date: Thu, 04 Mar 2021 08:25:01 +0100
+Subject: scripts: use pkg-config to locate libcrypto
+To: stable@vger.kernel.org
+Message-ID: <1776617.4qmgp806CG@devpool47>
+
+From: Rolf Eike Beer <eb@emlix.com>
+
+commit 2cea4a7a1885bd0c765089afc14f7ff0eb77864e upstream.
+
+Otherwise build fails if the headers are not in the default location. While at
+it also ask pkg-config for the libs, with fallback to the existing value.
+
+Signed-off-by: Rolf Eike Beer <eb@emlix.com>
+Signed-off-by: Masahiro Yamada <masahiroy@kernel.org>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ scripts/Makefile |    8 ++++++--
+ 1 file changed, 6 insertions(+), 2 deletions(-)
+
+--- a/scripts/Makefile
++++ b/scripts/Makefile
+@@ -11,6 +11,9 @@
+ HOST_EXTRACFLAGS += -I$(srctree)/tools/include
++CRYPTO_LIBS = $(shell pkg-config --libs libcrypto 2> /dev/null || echo -lcrypto)
++CRYPTO_CFLAGS = $(shell pkg-config --cflags libcrypto 2> /dev/null)
++
+ hostprogs-$(CONFIG_KALLSYMS)     += kallsyms
+ hostprogs-$(CONFIG_LOGO)         += pnmtologo
+ hostprogs-$(CONFIG_VT)           += conmakehash
+@@ -23,8 +26,9 @@ hostprogs-$(CONFIG_SYSTEM_EXTRA_CERTIFIC
+ HOSTCFLAGS_sortextable.o = -I$(srctree)/tools/include
+ HOSTCFLAGS_asn1_compiler.o = -I$(srctree)/include
+-HOSTLOADLIBES_sign-file = -lcrypto
+-HOSTLOADLIBES_extract-cert = -lcrypto
++HOSTLOADLIBES_sign-file = $(CRYPTO_LIBS)
++HOSTCFLAGS_extract-cert.o = $(CRYPTO_CFLAGS)
++HOSTLOADLIBES_extract-cert = $(CRYPTO_LIBS)
+ always                := $(hostprogs-y) $(hostprogs-m)
index d684987a8c8d976d52d762cd4e0f5fea825cf2b0..aefecce5f3da4952e43d4b30244ba2480bc0e18d 100644 (file)
@@ -5,3 +5,13 @@ futex-futex_unlock_pi-determinism.patch
 futex-fix-pi_state-owner-serialization.patch
 futex-fix-more-put_pi_state-vs.-exit_pi_state_list-races.patch
 futex-don-t-enable-irqs-unconditionally-in-put_pi_state.patch
+net-usb-qmi_wwan-support-zte-p685m-modem.patch
+arm-kprobes-allow-to-handle-reentered-kprobe-on-single-stepping.patch
+scripts-use-pkg-config-to-locate-libcrypto.patch
+scripts-set-proper-openssl-include-dir-also-for-sign-file.patch
+hugetlb-fix-update_and_free_page-contig-page-struct-assumption.patch
+printk-fix-deadlock-when-kernel-panic.patch
+arm64-remove-redundant-mov-from-ll-sc-cmpxchg.patch
+arm64-avoid-redundant-type-conversions-in-xchg-and-cmpxchg.patch
+arm64-cmpxchg-use-k-instead-of-l-for-ll-sc-immediate-constraint.patch
+arm64-use-correct-ll-sc-atomic-constraints.patch