--- /dev/null
+From stable-bounces@linux.kernel.org Tue Jun 5 10:44:15 2007
+From: "Michael Chan" <mchan@broadcom.com>
+To: stable@kernel.org
+Date: Tue, 05 Jun 2007 11:33:20 -0700
+Message-ID: <1181068400.4832.3.camel@dell>
+Subject: BNX2: Fix netdev watchdog on 5708.
+
+There's a bug in the driver that initializes only half of the context
+memory on the 5708. Surprisingly, this works most of the time, except
+for occasional netdev watchdogs when sending a lot of 64-byte
+packets. The fix adds the missing code to initialize the 2nd half of
+the context memory.
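+
+For illustration, a minimal standalone C sketch of the page walk the fix
+introduces. The constants are assumptions chosen to match the "half of
+the context memory" symptom (two physical pages per context), and
+ctx_wr() is a hypothetical stand-in for the driver's CTX_WR() register
+write; the real code is in bnx2_init_context() in the diff below:
+
+	#include <stdio.h>
+
+	#define PHY_CTX_SHIFT	6			/* assumed: 64-byte pages */
+	#define PHY_CTX_SIZE	(1 << PHY_CTX_SHIFT)
+	#define CTX_SIZE	(2 * PHY_CTX_SIZE)	/* assumed: 2 pages/context */
+
+	/* stand-in for the driver's CTX_WR(bp, ...) register write */
+	static void ctx_wr(unsigned int page, unsigned int off, unsigned int val)
+	{
+		printf("ctx page 0x%x off 0x%02x <- 0x%x\n", page, off, val);
+	}
+
+	int main(void)
+	{
+		unsigned int vcid_addr = 0, i, offset;
+
+		/*
+		 * The old code zeroed only page 0.  The fix walks every
+		 * physical page backing the context; base + (i << PHY_CTX_SHIFT)
+		 * is equivalent to the patch's vcid_addr += (i << PHY_CTX_SHIFT)
+		 * for the two-page case.
+		 */
+		for (i = 0; i < (CTX_SIZE / PHY_CTX_SIZE); i++) {
+			unsigned int page = vcid_addr + (i << PHY_CTX_SHIFT);
+
+			for (offset = 0; offset < PHY_CTX_SIZE; offset += 4)
+				ctx_wr(page, offset, 0);
+		}
+		return 0;
+	}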
+
+Update version to 1.5.8.2.
+
+Signed-off-by: Michael Chan <mchan@broadcom.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Chris Wright <chrisw@sous-sol.org>
+
+---
+ drivers/net/bnx2.c | 25 +++++++++++++++----------
+ 1 file changed, 15 insertions(+), 10 deletions(-)
+
+--- linux-2.6.21.5.orig/drivers/net/bnx2.c
++++ linux-2.6.21.5/drivers/net/bnx2.c
+@@ -54,8 +54,8 @@
+
+ #define DRV_MODULE_NAME "bnx2"
+ #define PFX DRV_MODULE_NAME ": "
+-#define DRV_MODULE_VERSION "1.5.8.1"
+-#define DRV_MODULE_RELDATE "May 7, 2007"
++#define DRV_MODULE_VERSION "1.5.8.2"
++#define DRV_MODULE_RELDATE "June 5, 2007"
+
+ #define RUN_AT(x) (jiffies + (x))
+
+@@ -1550,6 +1550,7 @@ bnx2_init_context(struct bnx2 *bp)
+ vcid = 96;
+ while (vcid) {
+ u32 vcid_addr, pcid_addr, offset;
++ int i;
+
+ vcid--;
+
+@@ -1570,16 +1571,20 @@ bnx2_init_context(struct bnx2 *bp)
+ pcid_addr = vcid_addr;
+ }
+
+- REG_WR(bp, BNX2_CTX_VIRT_ADDR, 0x00);
+- REG_WR(bp, BNX2_CTX_PAGE_TBL, pcid_addr);
++ for (i = 0; i < (CTX_SIZE / PHY_CTX_SIZE); i++) {
++ vcid_addr += (i << PHY_CTX_SHIFT);
++ pcid_addr += (i << PHY_CTX_SHIFT);
++
++ REG_WR(bp, BNX2_CTX_VIRT_ADDR, 0x00);
++ REG_WR(bp, BNX2_CTX_PAGE_TBL, pcid_addr);
++
++ /* Zero out the context. */
++ for (offset = 0; offset < PHY_CTX_SIZE; offset += 4)
++ CTX_WR(bp, 0x00, offset, 0);
+
+- /* Zero out the context. */
+- for (offset = 0; offset < PHY_CTX_SIZE; offset += 4) {
+- CTX_WR(bp, 0x00, offset, 0);
++ REG_WR(bp, BNX2_CTX_VIRT_ADDR, vcid_addr);
++ REG_WR(bp, BNX2_CTX_PAGE_TBL, pcid_addr);
+ }
+-
+- REG_WR(bp, BNX2_CTX_VIRT_ADDR, vcid_addr);
+- REG_WR(bp, BNX2_CTX_PAGE_TBL, pcid_addr);
+ }
+ }
+
--- /dev/null
+From stable-bounces@linux.kernel.org Fri Jun 8 03:16:17 2007
+Message-Id: <20070608101735.114323310@inhelltoy.tec.linutronix.de>
+Date: Fri, 08 Jun 2007 10:29:30 -0000
+From: Thomas Gleixner <tglx@linutronix.de>
+To: stable@kernel.org
+Cc: kuznet@ms2.inr.ac.ru, mingo@elte.hu, linux-kernel@vger.kernel.org
+Subject: pi-futex: Fix exit races and locking problems
+
+
+From: Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
+
+1. New entries can be added to tsk->pi_state_list after the task has
+   completed exit_pi_state_list(). The result is memory leakage and
+   deadlocks.
+
+2. handle_mm_fault() is called under a spinlock. The result is obvious.
+
+3. An unexpected -ESRCH results in a self-inflicted deadlock inside
+   glibc: sometimes futex_lock_pi() returns -ESRCH when it is not
+   expected, and glibc enters a for(;;) sleep() loop to simulate the
+   deadlock. This problem is quite obvious and I think the patch is
+   right, though it looks like each "if" in futex_lock_pi() got some
+   stupid special case "else if". :-)
+
+4. Sometimes futex_lock_pi() returns -EDEADLK when nobody has the lock
+   (sketched below). The reason is also obvious (see the comment in the
+   patch), but the correct fix is far beyond my comprehension.
+   I guess someone already saw this; the chunk:
+
+       if (rt_mutex_trylock(&q.pi_state->pi_mutex))
+               ret = 0;
+
+   is obviously aimed at the same problem, but it does not work, because
+   the rtmutex is really taken at this point: wake_futex_pi() of the
+   previous owner reassigned it to us. My fix works, but it looks very
+   stupid. I would think about removing the shift of ownership in
+   wake_futex_pi() and doing all the work in the context of the process
+   taking the lock.
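+
+A compressed timeline of problem 4, reconstructed from the description
+above (a sketch, not kernel code; T1/T2 are hypothetical tasks):
+
+	/* T1 (owner)                  T2 (waiter)
+	 * -----------------------     -------------------------------
+	 * holds the rtmutex           futex_lock_pi()
+	 *                               blocks on the rtmutex
+	 * futex_unlock_pi()
+	 *   wake_futex_pi()
+	 *     reassigns rtmutex
+	 *     ownership to T2
+	 *                             wakes up with an error code
+	 *                             (e.g. -EDEADLK), but it already
+	 *                             *is* the owner, so the
+	 *                             rt_mutex_trylock() fixup above
+	 *                             fails and the error leaks out
+	 */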
+
+From: Thomas Gleixner <tglx@linutronix.de>
+
+Fix 1) Avoid the tasklist lock variant of the exit race fix by adding
+       an additional state transition to the exit code (sketched below).
+
+       This also fixes the issue where a task with recursive segfaults
+       is not able to release the futexes.
+
+Fix 2) Clean up the lookup_pi_state() failure path and finally solve
+       the -ESRCH problem.
+
+Fix 3) Solve the fixup_pi_state_owner() problem, which needs to do the
+       fixup in the lock protected section, by using the in_atomic
+       userspace access functions.
+
+       This also removes the ugly lock drop / unqueue inside of
+       fixup_pi_state().
+
+Fix 4) Fix a stale lock in the error path of futex_wake_pi().
+
+Added some error checks for verification.
+
+The -EDEADLK problem is solved by the rtmutex fixups.
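+
+The heart of Fix 1 is a two-flag handshake between the exit path and
+the futex attach path. A condensed sketch, paraphrasing the
+kernel/exit.c and kernel/futex.c hunks below (not compilable on its
+own, and no new logic):
+
+	/* exit side (do_exit): */
+	spin_lock_irq(&tsk->pi_lock);
+	tsk->flags |= PF_EXITING;	/* attach attempts now refused */
+	spin_unlock_irq(&tsk->pi_lock);
+	/* ... pi state cleanup (exit_pi_state_list()) runs ... */
+	tsk->flags |= PF_EXITPIDONE;	/* cleanup is complete */
+
+	/* attach side (lookup_pi_state): */
+	spin_lock_irq(&p->pi_lock);
+	if (unlikely(p->flags & PF_EXITING)) {
+		/* -ESRCH once the cleanup has run, -EAGAIN
+		 * (caller retries) while it is still in flight */
+		int ret = (p->flags & PF_EXITPIDONE) ? -ESRCH : -EAGAIN;
+
+		spin_unlock_irq(&p->pi_lock);
+		return ret;
+	}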
+
+Cc: Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
+Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
+Acked-by: Ingo Molnar <mingo@elte.hu>
+Signed-off-by: Chris Wright <chrisw@sous-sol.org>
+
+---
+ include/linux/sched.h | 1
+ kernel/exit.c | 22 +++++
+ kernel/futex.c | 191 +++++++++++++++++++++++++++++++++-----------------
+ 3 files changed, 150 insertions(+), 64 deletions(-)
+
+--- linux-2.6.21.5.orig/kernel/futex.c
++++ linux-2.6.21.5/kernel/futex.c
+@@ -396,10 +396,6 @@ static struct task_struct * futex_find_g
+ p = NULL;
+ goto out_unlock;
+ }
+- if (p->exit_state != 0) {
+- p = NULL;
+- goto out_unlock;
+- }
+ get_task_struct(p);
+ out_unlock:
+ rcu_read_unlock();
+@@ -467,7 +463,7 @@ lookup_pi_state(u32 uval, struct futex_h
+ struct futex_q *this, *next;
+ struct list_head *head;
+ struct task_struct *p;
+- pid_t pid;
++ pid_t pid = uval & FUTEX_TID_MASK;
+
+ head = &hb->chain;
+
+@@ -485,6 +481,8 @@ lookup_pi_state(u32 uval, struct futex_h
+ return -EINVAL;
+
+ WARN_ON(!atomic_read(&pi_state->refcount));
++ WARN_ON(pid && pi_state->owner &&
++ pi_state->owner->pid != pid);
+
+ atomic_inc(&pi_state->refcount);
+ me->pi_state = pi_state;
+@@ -495,15 +493,33 @@ lookup_pi_state(u32 uval, struct futex_h
+
+ /*
+ * We are the first waiter - try to look up the real owner and attach
+- * the new pi_state to it, but bail out when the owner died bit is set
+- * and TID = 0:
++ * the new pi_state to it, but bail out when TID = 0
+ */
+- pid = uval & FUTEX_TID_MASK;
+- if (!pid && (uval & FUTEX_OWNER_DIED))
++ if (!pid)
+ return -ESRCH;
+ p = futex_find_get_task(pid);
+- if (!p)
+- return -ESRCH;
++ if (IS_ERR(p))
++ return PTR_ERR(p);
++
++ /*
++ * We need to look at the task state flags to figure out,
++ * whether the task is exiting. To protect against the do_exit
++ * change of the task flags, we do this protected by
++ * p->pi_lock:
++ */
++ spin_lock_irq(&p->pi_lock);
++ if (unlikely(p->flags & PF_EXITING)) {
++ /*
++ * The task is on the way out. When PF_EXITPIDONE is
++ * set, we know that the task has finished the
++ * cleanup:
++ */
++ int ret = (p->flags & PF_EXITPIDONE) ? -ESRCH : -EAGAIN;
++
++ spin_unlock_irq(&p->pi_lock);
++ put_task_struct(p);
++ return ret;
++ }
+
+ pi_state = alloc_pi_state();
+
+@@ -516,7 +532,6 @@ lookup_pi_state(u32 uval, struct futex_h
+ /* Store the key for possible exit cleanups: */
+ pi_state->key = me->key;
+
+- spin_lock_irq(&p->pi_lock);
+ WARN_ON(!list_empty(&pi_state->list));
+ list_add(&pi_state->list, &p->pi_state_list);
+ pi_state->owner = p;
+@@ -583,15 +598,22 @@ static int wake_futex_pi(u32 __user *uad
+ * preserve the owner died bit.)
+ */
+ if (!(uval & FUTEX_OWNER_DIED)) {
++ int ret = 0;
++
+ newval = FUTEX_WAITERS | new_owner->pid;
+
+ pagefault_disable();
+ curval = futex_atomic_cmpxchg_inatomic(uaddr, uval, newval);
+ pagefault_enable();
++
+ if (curval == -EFAULT)
+- return -EFAULT;
++ ret = -EFAULT;
+ if (curval != uval)
+- return -EINVAL;
++ ret = -EINVAL;
++ if (ret) {
++ spin_unlock(&pi_state->pi_mutex.wait_lock);
++ return ret;
++ }
+ }
+
+ spin_lock_irq(&pi_state->owner->pi_lock);
+@@ -1149,6 +1171,7 @@ static int futex_lock_pi(u32 __user *uad
+ if (unlikely(ret != 0))
+ goto out_release_sem;
+
++ retry_unlocked:
+ hb = queue_lock(&q, -1, NULL);
+
+ retry_locked:
+@@ -1200,34 +1223,58 @@ static int futex_lock_pi(u32 __user *uad
+ ret = lookup_pi_state(uval, hb, &q);
+
+ if (unlikely(ret)) {
+- /*
+- * There were no waiters and the owner task lookup
+- * failed. When the OWNER_DIED bit is set, then we
+- * know that this is a robust futex and we actually
+- * take the lock. This is safe as we are protected by
+- * the hash bucket lock. We also set the waiters bit
+- * unconditionally here, to simplify glibc handling of
+- * multiple tasks racing to acquire the lock and
+- * cleanup the problems which were left by the dead
+- * owner.
+- */
+- if (curval & FUTEX_OWNER_DIED) {
+- uval = newval;
+- newval = current->pid |
+- FUTEX_OWNER_DIED | FUTEX_WAITERS;
++ switch (ret) {
+
+- pagefault_disable();
+- curval = futex_atomic_cmpxchg_inatomic(uaddr,
+- uval, newval);
+- pagefault_enable();
++ case -EAGAIN:
++ /*
++ * Task is exiting and we just wait for the
++ * exit to complete.
++ */
++ queue_unlock(&q, hb);
++ up_read(&curr->mm->mmap_sem);
++ cond_resched();
++ goto retry;
+
+- if (unlikely(curval == -EFAULT))
++ case -ESRCH:
++ /*
++ * No owner found for this futex. Check if the
++ * OWNER_DIED bit is set to figure out whether
++ * this is a robust futex or not.
++ */
++ if (get_futex_value_locked(&curval, uaddr))
+ goto uaddr_faulted;
+- if (unlikely(curval != uval))
+- goto retry_locked;
+- ret = 0;
++
++ /*
++ * There were no waiters and the owner task lookup
++ * failed. When the OWNER_DIED bit is set, then we
++ * know that this is a robust futex and we actually
++ * take the lock. This is safe as we are protected by
++ * the hash bucket lock. We also set the waiters bit
++ * unconditionally here, to simplify glibc handling of
++ * multiple tasks racing to acquire the lock and
++ * cleanup the problems which were left by the dead
++ * owner.
++ */
++ if (curval & FUTEX_OWNER_DIED) {
++ uval = newval;
++ newval = current->pid |
++ FUTEX_OWNER_DIED | FUTEX_WAITERS;
++
++ pagefault_disable();
++ curval = futex_atomic_cmpxchg_inatomic(uaddr,
++ uval,
++ newval);
++ pagefault_enable();
++
++ if (unlikely(curval == -EFAULT))
++ goto uaddr_faulted;
++ if (unlikely(curval != uval))
++ goto retry_locked;
++ ret = 0;
++ }
++ default:
++ goto out_unlock_release_sem;
+ }
+- goto out_unlock_release_sem;
+ }
+
+ /*
+@@ -1279,39 +1326,52 @@ static int futex_lock_pi(u32 __user *uad
+ list_add(&q.pi_state->list, &current->pi_state_list);
+ spin_unlock_irq(¤t->pi_lock);
+
+- /* Unqueue and drop the lock */
+- unqueue_me_pi(&q, hb);
+- up_read(&curr->mm->mmap_sem);
+ /*
+ * We own it, so we have to replace the pending owner
+- * TID. This must be atomic as we have preserve the
++ * TID. This must be atomic as we have to preserve the
+ * owner died bit here.
+ */
+- ret = get_user(uval, uaddr);
++ ret = get_futex_value_locked(&uval, uaddr);
+ while (!ret) {
+ newval = (uval & FUTEX_OWNER_DIED) | newtid;
++
++ pagefault_disable();
+ curval = futex_atomic_cmpxchg_inatomic(uaddr,
+ uval, newval);
++ pagefault_enable();
++
+ if (curval == -EFAULT)
+ ret = -EFAULT;
+ if (curval == uval)
+ break;
+ uval = curval;
+ }
+- } else {
++ } else if (ret) {
+ /*
+ * Catch the rare case, where the lock was released
+ * when we were on the way back before we locked
+ * the hash bucket.
+ */
+- if (ret && q.pi_state->owner == curr) {
+- if (rt_mutex_trylock(&q.pi_state->pi_mutex))
+- ret = 0;
++ if (q.pi_state->owner == curr &&
++ rt_mutex_trylock(&q.pi_state->pi_mutex)) {
++ ret = 0;
++ } else {
++ /*
++ * Paranoia check. If we did not take the lock
++ * in the trylock above, then we should not be
++ * the owner of the rtmutex, neither the real
++ * nor the pending one:
++ */
++ if (rt_mutex_owner(&q.pi_state->pi_mutex) == curr)
++ printk(KERN_ERR "futex_lock_pi: ret = %d "
++ "pi-mutex: %p pi-state %p\n", ret,
++ q.pi_state->pi_mutex.owner,
++ q.pi_state->owner);
+ }
+- /* Unqueue and drop the lock */
+- unqueue_me_pi(&q, hb);
+- up_read(&curr->mm->mmap_sem);
+ }
++ /* Unqueue and drop the lock */
++ unqueue_me_pi(&q, hb);
++ up_read(&curr->mm->mmap_sem);
+
+ if (!detect && ret == -EDEADLK && 0)
+ force_sig(SIGKILL, current);
+@@ -1331,16 +1391,18 @@ static int futex_lock_pi(u32 __user *uad
+ * non-atomically. Therefore, if get_user below is not
+ * enough, we need to handle the fault ourselves, while
+ * still holding the mmap_sem.
++ *
++ * ... and hb->lock. :-) --ANK
+ */
++ queue_unlock(&q, hb);
++
+ if (attempt++) {
+- if (futex_handle_fault((unsigned long)uaddr, attempt)) {
+- ret = -EFAULT;
+- goto out_unlock_release_sem;
+- }
+- goto retry_locked;
++ ret = futex_handle_fault((unsigned long)uaddr, attempt);
++ if (ret)
++ goto out_release_sem;
++ goto retry_unlocked;
+ }
+
+- queue_unlock(&q, hb);
+ up_read(&curr->mm->mmap_sem);
+
+ ret = get_user(uval, uaddr);
+@@ -1382,9 +1444,9 @@ retry:
+ goto out;
+
+ hb = hash_futex(&key);
++retry_unlocked:
+ spin_lock(&hb->lock);
+
+-retry_locked:
+ /*
+ * To avoid races, try to do the TID -> 0 atomic transition
+ * again. If it succeeds then we can return without waking
+@@ -1446,16 +1508,17 @@ pi_faulted:
+ * non-atomically. Therefore, if get_user below is not
+ * enough, we need to handle the fault ourselves, while
+ * still holding the mmap_sem.
++ *
++ * ... and hb->lock. :-) --ANK
+ */
++ spin_unlock(&hb->lock);
++
+ if (attempt++) {
+- if (futex_handle_fault((unsigned long)uaddr, attempt)) {
+- ret = -EFAULT;
+- goto out_unlock;
+- }
+- goto retry_locked;
++ ret = futex_handle_fault((unsigned long)uaddr, attempt);
++ if (ret)
++ goto out;
++ goto retry_unlocked;
+ }
+-
+- spin_unlock(&hb->lock);
+ up_read(&current->mm->mmap_sem);
+
+ ret = get_user(uval, uaddr);
+--- linux-2.6.21.5.orig/include/linux/sched.h
++++ linux-2.6.21.5/include/linux/sched.h
+@@ -1138,6 +1138,7 @@ static inline void put_task_struct(struc
+ /* Not implemented yet, only for 486*/
+ #define PF_STARTING 0x00000002 /* being created */
+ #define PF_EXITING 0x00000004 /* getting shut down */
++#define PF_EXITPIDONE 0x00000008 /* pi exit done on shut down */
+ #define PF_FORKNOEXEC 0x00000040 /* forked but didn't exec */
+ #define PF_SUPERPRIV 0x00000100 /* used super-user privileges */
+ #define PF_DUMPCORE 0x00000200 /* dumped core */
+--- linux-2.6.21.5.orig/kernel/exit.c
++++ linux-2.6.21.5/kernel/exit.c
+@@ -884,13 +884,29 @@ fastcall NORET_TYPE void do_exit(long co
+ if (unlikely(tsk->flags & PF_EXITING)) {
+ printk(KERN_ALERT
+ "Fixing recursive fault but reboot is needed!\n");
++ /*
++ * We can do this unlocked here. The futex code uses
++ * this flag just to verify whether the pi state
++ * cleanup has been done or not. In the worst case it
++ * loops once more. We pretend that the cleanup was
++ * done as there is no way to return. Either the
++ * OWNER_DIED bit is set by now or we push the blocked
++ * task into the wait-forever nirvana as well.
++ */
++ tsk->flags |= PF_EXITPIDONE;
+ if (tsk->io_context)
+ exit_io_context();
+ set_current_state(TASK_UNINTERRUPTIBLE);
+ schedule();
+ }
+
++ /*
++ * tsk->flags are checked in the futex code to protect against
++ * an exiting task cleaning up the robust pi futexes.
++ */
++ spin_lock_irq(&tsk->pi_lock);
+ tsk->flags |= PF_EXITING;
++ spin_unlock_irq(&tsk->pi_lock);
+
+ if (unlikely(in_atomic()))
+ printk(KERN_INFO "note: %s[%d] exited with preempt_count %d\n",
+@@ -957,6 +973,12 @@ fastcall NORET_TYPE void do_exit(long co
+ * Make sure we are holding no locks:
+ */
+ debug_check_no_locks_held(tsk);
++ /*
++ * We can do this unlocked here. The futex code uses this flag
++ * just to verify whether the pi state cleanup has been done
++ * or not. In the worst case it loops once more.
++ */
++ tsk->flags |= PF_EXITPIDONE;
+
+ if (tsk->io_context)
+ exit_io_context();