libitm: Fix seq-cst MOs/fences in rwlock.

author torvald <torvald@138bc75d-0d04-0410-961f-82ee72b054a4>

Wed, 13 Jan 2016 21:39:50 +0000 (21:39 +0000)

committer torvald <torvald@138bc75d-0d04-0410-961f-82ee72b054a4>

Wed, 13 Jan 2016 21:39:50 +0000 (21:39 +0000)
author torvald <torvald@138bc75d-0d04-0410-961f-82ee72b054a4>
Wed, 13 Jan 2016 21:39:50 +0000 (21:39 +0000)
committer torvald <torvald@138bc75d-0d04-0410-961f-82ee72b054a4>
Wed, 13 Jan 2016 21:39:50 +0000 (21:39 +0000)
diff --git a/libitm/ChangeLog b/libitm/ChangeLog

index 7f7225a9b55678c5df8e9fb25cd7e218ebc88988..adcbf1d4f571d9c6c4fa9e634179ae546d3faa2f 100644 (file)
--- a/libitm/ChangeLog
+++ b/libitm/ChangeLog
@@ -1,3 +1,9 @@
+2016-01-13  Torvald Riegel  <triegel@redhat.com>
+
+       * beginend.cc (gtm_thread::trycommit): Fix seq_cst fences.
+       * config/linux/rwlock.cc (gtm_rwlock::write_lock_generic): Likewise.
+       (gtm_rwlock::write_unlock): Likewise.
+
  2016-01-13  Richard Henderson  <rth@redhat.com>
  
         * Makefile.am (libitm_la_SOURCES) [ARCH_AARCH64]: Add vect128.cc
diff --git a/libitm/beginend.cc b/libitm/beginend.cc

index 85fb4f13ed5b787fdda9627d5cd505b817795c80..00d28f4efb64d96f37d7be23b0bd897a0ab5cc61 100644 (file)
--- a/libitm/beginend.cc
+++ b/libitm/beginend.cc
@@ -619,8 +619,10 @@ GTM::gtm_thread::trycommit ()
            // acquisitions).  This ensures that if we read prior to other
            // reader transactions setting their shared_state to 0, then those
            // readers will observe our updates.  We can reuse the seq_cst fence
-          // in serial_lock.read_unlock() however, so we don't need another
-          // one here.
+          // in serial_lock.read_unlock() if we performed that; if not, we
+         // issue the fence.
+         if (do_read_unlock)
+           atomic_thread_fence (memory_order_seq_cst);
           // TODO Don't just spin but also block using cond vars / futexes
           // here. Should probably be integrated with the serial lock code.
           for (gtm_thread *it = gtm_thread::list_of_threads; it != 0;
diff --git a/libitm/config/linux/rwlock.cc b/libitm/config/linux/rwlock.cc

index 381a553171eb55811267a00aa1aee678b2de955b..b8d31ea7277e269dc9e0576424d6b3b7f58f61e6 100644 (file)
--- a/libitm/config/linux/rwlock.cc
+++ b/libitm/config/linux/rwlock.cc
@@ -122,9 +122,10 @@ gtm_rwlock::read_lock (gtm_thread *tx)
  bool
  gtm_rwlock::write_lock_generic (gtm_thread *tx)
  {
-  // Try to acquire the write lock.
+  // Try to acquire the write lock.  Relaxed MO is fine because of the
+  // additional fence below.
    int w = 0;
-  if (unlikely (!writers.compare_exchange_strong (w, 1)))
+  if (unlikely (!writers.compare_exchange_strong (w, 1, memory_order_relaxed)))
      {
        // If this is an upgrade, we must not wait for other writers or
        // upgrades.
@@ -135,18 +136,20 @@ gtm_rwlock::write_lock_generic (gtm_thread *tx)
        // switch to contended mode.  We need seq_cst memory order to make the
        // Dekker-style synchronization work.
        if (w != 2)
-       w = writers.exchange (2);
+       w = writers.exchange (2, memory_order_relaxed);
        while (w != 0)
         {
           futex_wait(&writers, 2);
-         w = writers.exchange (2);
+         w = writers.exchange (2, memory_order_relaxed);
         }
      }
+  // This fence is both required for the Dekker-like synchronization we do
+  // here and is the acquire MO required to make us synchronize-with prior
+  // writers.
+  atomic_thread_fence (memory_order_seq_cst);
  
    // We have acquired the writer side of the R/W lock. Now wait for any
    // readers that might still be active.
-  // We don't need an extra barrier here because the CAS and the xchg
-  // operations have full barrier semantics already.
    // TODO In the worst case, this requires one wait/wake pair for each
    // active reader. Reduce this!
    for (gtm_thread *it = gtm_thread::list_of_threads; it != 0;
@@ -259,28 +262,24 @@ gtm_rwlock::read_unlock (gtm_thread *tx)
  void
  gtm_rwlock::write_unlock ()
  {
-  // This needs to have seq_cst memory order.
-  if (writers.fetch_sub (1) == 2)
+  // Release MO so that we synchronize with subsequent writers.
+  if (writers.exchange (0, memory_order_release) == 2)
      {
-      // There might be waiting writers, so wake them.
-      writers.store (0, memory_order_relaxed);
-      if (futex_wake(&writers, 1) == 0)
-       {
-         // If we did not wake any waiting writers, we might indeed be the
-         // last writer (this can happen because write_lock_generic()
-         // exchanges 0 or 1 to 2 and thus might go to contended mode even if
-         // no other thread holds the write lock currently). Therefore, we
-         // have to wake up readers here as well.  Execute a barrier after
-         // the previous relaxed reset of writers (Dekker-style), and fall
-         // through to the normal reader wake-up code.
-         atomic_thread_fence (memory_order_seq_cst);
-       }
-      else
+      // There might be waiting writers, so wake them.  If we woke any thread,
+      // we assume it to indeed be a writer; waiting writers will never give
+      // up, so we can assume that they will take care of anything else such
+      // as waking readers.
+      if (futex_wake(&writers, 1) > 0)
         return;
+      // If we did not wake any waiting writers, we might indeed be the last
+      // writer (this can happen because write_lock_generic() exchanges 0 or 1
+      // to 2 and thus might go to contended mode even if no other thread
+      // holds the write lock currently). Therefore, we have to fall through
+      // to the normal reader wake-up code.
      }
+  // This fence is required because we do Dekker-like synchronization here.
+  atomic_thread_fence (memory_order_seq_cst);
    // No waiting writers, so wake up all waiting readers.
-  // Because the fetch_and_sub is a full barrier already, we don't need
-  // another barrier here (as in read_unlock()).
    if (readers.load (memory_order_relaxed) > 0)
      {
        // No additional barrier needed here.  The previous load must be in
author	torvald <torvald@138bc75d-0d04-0410-961f-82ee72b054a4>
	Wed, 13 Jan 2016 21:39:50 +0000 (21:39 +0000)
committer	torvald <torvald@138bc75d-0d04-0410-961f-82ee72b054a4>
	Wed, 13 Jan 2016 21:39:50 +0000 (21:39 +0000)
libitm/ChangeLog		patch \| blob \| blame \| history
libitm/beginend.cc		patch \| blob \| blame \| history
libitm/config/linux/rwlock.cc		patch \| blob \| blame \| history