3.7-stable patches

author Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Wed, 23 Jan 2013 18:00:59 +0000 (10:00 -0800)

committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Wed, 23 Jan 2013 18:00:59 +0000 (10:00 -0800)
author Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Wed, 23 Jan 2013 18:00:59 +0000 (10:00 -0800)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Wed, 23 Jan 2013 18:00:59 +0000 (10:00 -0800)
diff --git a/queue-3.7/ptrace-ensure-arch_ptrace-ptrace_request-can-never-race-with-sigkill.patch b/queue-3.7/ptrace-ensure-arch_ptrace-ptrace_request-can-never-race-with-sigkill.patch

new file mode 100644 (file)

index 0000000..9cdeea6
--- /dev/null
+++ b/queue-3.7/ptrace-ensure-arch_ptrace-ptrace_request-can-never-race-with-sigkill.patch
@@ -0,0 +1,187 @@
+From 9899d11f654474d2d54ea52ceaa2a1f4db3abd68 Mon Sep 17 00:00:00 2001
+From: Oleg Nesterov <oleg@redhat.com>
+Date: Mon, 21 Jan 2013 20:48:00 +0100
+Subject: ptrace: ensure arch_ptrace/ptrace_request can never race with SIGKILL
+
+From: Oleg Nesterov <oleg@redhat.com>
+
+commit 9899d11f654474d2d54ea52ceaa2a1f4db3abd68 upstream.
+
+putreg() assumes that the tracee is not running and pt_regs_access() can
+safely play with its stack.  However a killed tracee can return from
+ptrace_stop() to the low-level asm code and do RESTORE_REST, this means
+that debugger can actually read/modify the kernel stack until the tracee
+does SAVE_REST again.
+
+set_task_blockstep() can race with SIGKILL too and in some sense this
+race is even worse, the very fact the tracee can be woken up breaks the
+logic.
+
+As Linus suggested we can clear TASK_WAKEKILL around the arch_ptrace()
+call, this ensures that nobody can ever wakeup the tracee while the
+debugger looks at it.  Not only this fixes the mentioned problems, we
+can do some cleanups/simplifications in arch_ptrace() paths.
+
+Probably ptrace_unfreeze_traced() needs more callers, for example it
+makes sense to make the tracee killable for oom-killer before
+access_process_vm().
+
+While at it, add the comment into may_ptrace_stop() to explain why
+ptrace_stop() still can't rely on SIGKILL and signal_pending_state().
+
+Reported-by: Salman Qazi <sqazi@google.com>
+Reported-by: Suleiman Souhlal <suleiman@google.com>
+Suggested-by: Linus Torvalds <torvalds@linux-foundation.org>
+Signed-off-by: Oleg Nesterov <oleg@redhat.com>
+Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ arch/x86/kernel/step.c |    9 +++---
+ kernel/ptrace.c        |   64 +++++++++++++++++++++++++++++++++++++++++--------
+ kernel/signal.c        |    5 +++
+ 3 files changed, 64 insertions(+), 14 deletions(-)
+
+--- a/arch/x86/kernel/step.c
++++ b/arch/x86/kernel/step.c
+@@ -165,10 +165,11 @@ void set_task_blockstep(struct task_stru
+        * Ensure irq/preemption can't change debugctl in between.
+        * Note also that both TIF_BLOCKSTEP and debugctl should
+        * be changed atomically wrt preemption.
+-       * FIXME: this means that set/clear TIF_BLOCKSTEP is simply
+-       * wrong if task != current, SIGKILL can wakeup the stopped
+-       * tracee and set/clear can play with the running task, this
+-       * can confuse the next __switch_to_xtra().
++       *
++       * NOTE: this means that set/clear TIF_BLOCKSTEP is only safe if
++       * task is current or it can't be running, otherwise we can race
++       * with __switch_to_xtra(). We rely on ptrace_freeze_traced() but
++       * PTRACE_KILL is not safe.
+        */
+       local_irq_disable();
+       debugctl = get_debugctlmsr();
+--- a/kernel/ptrace.c
++++ b/kernel/ptrace.c
+@@ -122,6 +122,40 @@ void __ptrace_unlink(struct task_struct
+       spin_unlock(&child->sighand->siglock);
+ }
+ 
++/* Ensure that nothing can wake it up, even SIGKILL */
++static bool ptrace_freeze_traced(struct task_struct *task)
++{
++      bool ret = false;
++
++      /* Lockless, nobody but us can set this flag */
++      if (task->jobctl & JOBCTL_LISTENING)
++              return ret;
++
++      spin_lock_irq(&task->sighand->siglock);
++      if (task_is_traced(task) && !__fatal_signal_pending(task)) {
++              task->state = __TASK_TRACED;
++              ret = true;
++      }
++      spin_unlock_irq(&task->sighand->siglock);
++
++      return ret;
++}
++
++static void ptrace_unfreeze_traced(struct task_struct *task)
++{
++      if (task->state != __TASK_TRACED)
++              return;
++
++      WARN_ON(!task->ptrace || task->parent != current);
++
++      spin_lock_irq(&task->sighand->siglock);
++      if (__fatal_signal_pending(task))
++              wake_up_state(task, __TASK_TRACED);
++      else
++              task->state = TASK_TRACED;
++      spin_unlock_irq(&task->sighand->siglock);
++}
++
+ /**
+  * ptrace_check_attach - check whether ptracee is ready for ptrace operation
+  * @child: ptracee to check for
+@@ -151,24 +185,29 @@ int ptrace_check_attach(struct task_stru
+        * be changed by us so it's not changing right after this.
+        */
+       read_lock(&tasklist_lock);
+-      if ((child->ptrace & PT_PTRACED) && child->parent == current) {
++      if (child->ptrace && child->parent == current) {
++              WARN_ON(child->state == __TASK_TRACED);
+               /*
+                * child->sighand can't be NULL, release_task()
+                * does ptrace_unlink() before __exit_signal().
+                */
+-              spin_lock_irq(&child->sighand->siglock);
+-              WARN_ON_ONCE(task_is_stopped(child));
+-              if (ignore_state || (task_is_traced(child) &&
+-                                   !(child->jobctl & JOBCTL_LISTENING)))
++              if (ignore_state || ptrace_freeze_traced(child))
+                       ret = 0;
+-              spin_unlock_irq(&child->sighand->siglock);
+       }
+       read_unlock(&tasklist_lock);
+ 
+-      if (!ret && !ignore_state)
+-              ret = wait_task_inactive(child, TASK_TRACED) ? 0 : -ESRCH;
++      if (!ret && !ignore_state) {
++              if (!wait_task_inactive(child, __TASK_TRACED)) {
++                      /*
++                       * This can only happen if may_ptrace_stop() fails and
++                       * ptrace_stop() changes ->state back to TASK_RUNNING,
++                       * so we should not worry about leaking __TASK_TRACED.
++                       */
++                      WARN_ON(child->state == __TASK_TRACED);
++                      ret = -ESRCH;
++              }
++      }
+ 
+-      /* All systems go.. */
+       return ret;
+ }
+ 
+@@ -891,6 +930,8 @@ SYSCALL_DEFINE4(ptrace, long, request, l
+               goto out_put_task_struct;
+ 
+       ret = arch_ptrace(child, request, addr, data);
++      if (ret || request != PTRACE_DETACH)
++              ptrace_unfreeze_traced(child);
+ 
+  out_put_task_struct:
+       put_task_struct(child);
+@@ -1030,8 +1071,11 @@ asmlinkage long compat_sys_ptrace(compat
+ 
+       ret = ptrace_check_attach(child, request == PTRACE_KILL ||
+                                 request == PTRACE_INTERRUPT);
+-      if (!ret)
++      if (!ret) {
+               ret = compat_arch_ptrace(child, request, addr, data);
++              if (ret || request != PTRACE_DETACH)
++                      ptrace_unfreeze_traced(child);
++      }
+ 
+  out_put_task_struct:
+       put_task_struct(child);
+--- a/kernel/signal.c
++++ b/kernel/signal.c
+@@ -1792,6 +1792,10 @@ static inline int may_ptrace_stop(void)
+        * If SIGKILL was already sent before the caller unlocked
+        * ->siglock we must see ->core_state != NULL. Otherwise it
+        * is safe to enter schedule().
++       *
++       * This is almost outdated, a task with the pending SIGKILL can't
++       * block in TASK_TRACED. But PTRACE_EVENT_EXIT can be reported
++       * after SIGKILL was already dequeued.
+        */
+       if (unlikely(current->mm->core_state) &&
+           unlikely(current->mm == current->parent->mm))
+@@ -1917,6 +1921,7 @@ static void ptrace_stop(int exit_code, i
+               if (gstop_done)
+                       do_notify_parent_cldstop(current, false, why);
+ 
++              /* tasklist protects us from ptrace_freeze_traced() */
+               __set_current_state(TASK_RUNNING);
+               if (clear_code)
+                       current->exit_code = 0;
diff --git a/queue-3.7/ptrace-introduce-signal_wake_up_state-and-ptrace_signal_wake_up.patch b/queue-3.7/ptrace-introduce-signal_wake_up_state-and-ptrace_signal_wake_up.patch

new file mode 100644 (file)

index 0000000..87c9998
--- /dev/null
+++ b/queue-3.7/ptrace-introduce-signal_wake_up_state-and-ptrace_signal_wake_up.patch
@@ -0,0 +1,128 @@
+From 910ffdb18a6408e14febbb6e4b6840fd2c928c82 Mon Sep 17 00:00:00 2001
+From: Oleg Nesterov <oleg@redhat.com>
+Date: Mon, 21 Jan 2013 20:47:41 +0100
+Subject: ptrace: introduce signal_wake_up_state() and ptrace_signal_wake_up()
+
+From: Oleg Nesterov <oleg@redhat.com>
+
+commit 910ffdb18a6408e14febbb6e4b6840fd2c928c82 upstream.
+
+Cleanup and preparation for the next change.
+
+signal_wake_up(resume => true) is overused. None of ptrace/jctl callers
+actually want to wakeup a TASK_WAKEKILL task, but they can't specify the
+necessary mask.
+
+Turn signal_wake_up() into signal_wake_up_state(state), reintroduce
+signal_wake_up() as a trivial helper, and add ptrace_signal_wake_up()
+which adds __TASK_TRACED.
+
+This way ptrace_signal_wake_up() can work "inside" ptrace_request()
+even if the tracee doesn't have the TASK_WAKEKILL bit set.
+
+Signed-off-by: Oleg Nesterov <oleg@redhat.com>
+Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ include/linux/sched.h |   11 ++++++++++-
+ kernel/ptrace.c       |    8 ++++----
+ kernel/signal.c       |   14 ++++----------
+ 3 files changed, 18 insertions(+), 15 deletions(-)
+
+--- a/include/linux/sched.h
++++ b/include/linux/sched.h
+@@ -2654,7 +2654,16 @@ static inline void thread_group_cputime_
+ extern void recalc_sigpending_and_wake(struct task_struct *t);
+ extern void recalc_sigpending(void);
+ 
+-extern void signal_wake_up(struct task_struct *t, int resume_stopped);
++extern void signal_wake_up_state(struct task_struct *t, unsigned int state);
++
++static inline void signal_wake_up(struct task_struct *t, bool resume)
++{
++      signal_wake_up_state(t, resume ? TASK_WAKEKILL : 0);
++}
++static inline void ptrace_signal_wake_up(struct task_struct *t, bool resume)
++{
++      signal_wake_up_state(t, resume ? __TASK_TRACED : 0);
++}
+ 
+ /*
+  * Wrappers for p->thread_info->cpu access. No-op on UP.
+--- a/kernel/ptrace.c
++++ b/kernel/ptrace.c
+@@ -117,7 +117,7 @@ void __ptrace_unlink(struct task_struct
+        * TASK_KILLABLE sleeps.
+        */
+       if (child->jobctl & JOBCTL_STOP_PENDING || task_is_traced(child))
+-              signal_wake_up(child, task_is_traced(child));
++              ptrace_signal_wake_up(child, true);
+ 
+       spin_unlock(&child->sighand->siglock);
+ }
+@@ -311,7 +311,7 @@ static int ptrace_attach(struct task_str
+        */
+       if (task_is_stopped(task) &&
+           task_set_jobctl_pending(task, JOBCTL_TRAP_STOP | JOBCTL_TRAPPING))
+-              signal_wake_up(task, 1);
++              signal_wake_up_state(task, __TASK_STOPPED);
+ 
+       spin_unlock(&task->sighand->siglock);
+ 
+@@ -728,7 +728,7 @@ int ptrace_request(struct task_struct *c
+                * tracee into STOP.
+                */
+               if (likely(task_set_jobctl_pending(child, JOBCTL_TRAP_STOP)))
+-                      signal_wake_up(child, child->jobctl & JOBCTL_LISTENING);
++                      ptrace_signal_wake_up(child, child->jobctl & JOBCTL_LISTENING);
+ 
+               unlock_task_sighand(child, &flags);
+               ret = 0;
+@@ -754,7 +754,7 @@ int ptrace_request(struct task_struct *c
+                        * start of this trap and now.  Trigger re-trap.
+                        */
+                       if (child->jobctl & JOBCTL_TRAP_NOTIFY)
+-                              signal_wake_up(child, true);
++                              ptrace_signal_wake_up(child, true);
+                       ret = 0;
+               }
+               unlock_task_sighand(child, &flags);
+--- a/kernel/signal.c
++++ b/kernel/signal.c
+@@ -679,23 +679,17 @@ int dequeue_signal(struct task_struct *t
+  * No need to set need_resched since signal event passing
+  * goes through ->blocked
+  */
+-void signal_wake_up(struct task_struct *t, int resume)
++void signal_wake_up_state(struct task_struct *t, unsigned int state)
+ {
+-      unsigned int mask;
+-
+       set_tsk_thread_flag(t, TIF_SIGPENDING);
+-
+       /*
+-       * For SIGKILL, we want to wake it up in the stopped/traced/killable
++       * TASK_WAKEKILL also means wake it up in the stopped/traced/killable
+        * case. We don't check t->state here because there is a race with it
+        * executing another processor and just now entering stopped state.
+        * By using wake_up_state, we ensure the process will wake up and
+        * handle its death signal.
+        */
+-      mask = TASK_INTERRUPTIBLE;
+-      if (resume)
+-              mask |= TASK_WAKEKILL;
+-      if (!wake_up_state(t, mask))
++      if (!wake_up_state(t, state | TASK_INTERRUPTIBLE))
+               kick_process(t);
+ }
+ 
+@@ -843,7 +837,7 @@ static void ptrace_trap_notify(struct ta
+       assert_spin_locked(&t->sighand->siglock);
+ 
+       task_set_jobctl_pending(t, JOBCTL_TRAP_NOTIFY);
+-      signal_wake_up(t, t->jobctl & JOBCTL_LISTENING);
++      ptrace_signal_wake_up(t, t->jobctl & JOBCTL_LISTENING);
+ }
+ 
+ /*
diff --git a/queue-3.7/series b/queue-3.7/series

index 68f491804c76dc702d047d6ff4e2e0c605842aff..fe1bed43869f932e33056efea88017c8fe051d61 100644 (file)
--- a/queue-3.7/series
+++ b/queue-3.7/series
@@ -10,3 +10,6 @@ virtio-blk-don-t-free-ida-when-disk-is-in-use.patch
  async-fix-__lowest_in_progress.patch
  vfio-pci-fix-buffer-overfill.patch
  perf-x86-revert-20b279-require-exclude_guest-to-use-pebs-kernel-side.patch
+ptrace-introduce-signal_wake_up_state-and-ptrace_signal_wake_up.patch
+ptrace-ensure-arch_ptrace-ptrace_request-can-never-race-with-sigkill.patch
+wake_up_process-should-be-never-used-to-wakeup-a-task_stopped-traced-task.patch
diff --git a/queue-3.7/wake_up_process-should-be-never-used-to-wakeup-a-task_stopped-traced-task.patch b/queue-3.7/wake_up_process-should-be-never-used-to-wakeup-a-task_stopped-traced-task.patch

new file mode 100644 (file)

index 0000000..b07ad2b
--- /dev/null
+++ b/queue-3.7/wake_up_process-should-be-never-used-to-wakeup-a-task_stopped-traced-task.patch
@@ -0,0 +1,34 @@
+From 9067ac85d533651b98c2ff903182a20cbb361fcb Mon Sep 17 00:00:00 2001
+From: Oleg Nesterov <oleg@redhat.com>
+Date: Mon, 21 Jan 2013 20:48:17 +0100
+Subject: wake_up_process() should be never used to wakeup a TASK_STOPPED/TRACED task
+
+From: Oleg Nesterov <oleg@redhat.com>
+
+commit 9067ac85d533651b98c2ff903182a20cbb361fcb upstream.
+
+wake_up_process() should never wakeup a TASK_STOPPED/TRACED task.
+Change it to use TASK_NORMAL and add the WARN_ON().
+
+TASK_ALL has no other users, probably can be killed.
+
+Signed-off-by: Oleg Nesterov <oleg@redhat.com>
+Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ kernel/sched/core.c |    3 ++-
+ 1 file changed, 2 insertions(+), 1 deletion(-)
+
+--- a/kernel/sched/core.c
++++ b/kernel/sched/core.c
+@@ -1497,7 +1497,8 @@ out:
+  */
+ int wake_up_process(struct task_struct *p)
+ {
+-      return try_to_wake_up(p, TASK_ALL, 0);
++      WARN_ON(task_is_stopped_or_traced(p));
++      return try_to_wake_up(p, TASK_NORMAL, 0);
+ }
+ EXPORT_SYMBOL(wake_up_process);
+
author	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Wed, 23 Jan 2013 18:00:59 +0000 (10:00 -0800)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Wed, 23 Jan 2013 18:00:59 +0000 (10:00 -0800)
queue-3.7/ptrace-ensure-arch_ptrace-ptrace_request-can-never-race-with-sigkill.patch	[new file with mode: 0644]	patch \| blob
queue-3.7/ptrace-introduce-signal_wake_up_state-and-ptrace_signal_wake_up.patch	[new file with mode: 0644]	patch \| blob
queue-3.7/series		patch \| blob \| blame \| history
queue-3.7/wake_up_process-should-be-never-used-to-wakeup-a-task_stopped-traced-task.patch	[new file with mode: 0644]	patch \| blob