Avoiding RCU synchronization deadlock when locking in critical section

author Maria Matejka <mq@ucw.cz>

Thu, 16 May 2024 08:22:19 +0000 (10:22 +0200)

committer Maria Matejka <mq@ucw.cz>

Wed, 22 May 2024 09:34:34 +0000 (11:34 +0200)
author Maria Matejka <mq@ucw.cz>
Thu, 16 May 2024 08:22:19 +0000 (10:22 +0200)
committer Maria Matejka <mq@ucw.cz>
Wed, 22 May 2024 09:34:34 +0000 (11:34 +0200)
diff --git a/lib/lockfree.h b/lib/lockfree.h

index 833b8366116215603467aa8fcdc426a1bd7c35f1..15b45010334f430624586934a2b4e1b5c0314dee 100644 (file)
--- a/lib/lockfree.h
+++ b/lib/lockfree.h
@@ -93,10 +93,6 @@ static inline void lfuc_unlock_immediately(struct lfuc *c, event_list *el, event
    u64 pending = (uc >> LFUC_PU_SHIFT) + 1;
    uc &= LFUC_IN_PROGRESS - 1;
  
-  /* We per-use the RCU critical section indicator to make the prune event wait
-   * until we finish here in the rare case we get preempted. */
-  rcu_read_lock();
-
    /* Obviously, there can't be more pending unlocks than the usecount itself */
    if (uc == pending)
      /* If we're the last unlocker (every owner is already unlocking), schedule
@@ -109,10 +105,6 @@ static inline void lfuc_unlock_immediately(struct lfuc *c, event_list *el, event
     * usecount, possibly allowing the pruning routine to free this structure */
    uc = atomic_fetch_sub_explicit(&c->uc, LFUC_IN_PROGRESS + 1, memory_order_acq_rel);
  
-  /* ... and to reduce the load a bit, the pruning routine will better wait for
-   * RCU synchronization instead of a busy loop. */
-  rcu_read_unlock();
-
  //  return uc - LFUC_IN_PROGRESS - 1;
  }
  
@@ -172,7 +164,7 @@ lfuc_finished(struct lfuc *c)
    u64 uc;
    /* Wait until all unlockers finish */
    while ((uc = atomic_load_explicit(&c->uc, memory_order_acquire)) >> LFUC_PU_SHIFT)
-    synchronize_rcu();
+    birdloop_yield();
  
    /* All of them are now done and if the usecount is now zero, then we're
     * the last place to reference the object and we can call it finished. */
diff --git a/lib/locking.h b/lib/locking.h

index 56ed2651dd515c0e74cf57ec4ceb09b795211332..7a59d470957a7149cb740e5cdc877955a792c518 100644 (file)
--- a/lib/locking.h
+++ b/lib/locking.h
@@ -43,8 +43,9 @@ extern _Thread_local struct domain_generic **last_locked;
  #define DOMAIN(type) struct domain__##type
  #define DOMAIN_ORDER(type)  OFFSETOF(struct lock_order, type)
  
-#define DOMAIN_NEW(type)  (DOMAIN(type)) { .type = domain_new(DOMAIN_ORDER(type)) }
-struct domain_generic *domain_new(uint order);
+#define DOMAIN_NEW(type)  (DOMAIN(type)) { .type = domain_new(DOMAIN_ORDER(type), 1) }
+#define DOMAIN_NEW_RCU_SYNC(type)  (DOMAIN(type)) { .type = domain_new(DOMAIN_ORDER(type), 0) }
+struct domain_generic *domain_new(uint order, _Bool allow_rcu);
  
  #define DOMAIN_FREE(type, d)   domain_free((d).type)
  void domain_free(struct domain_generic *);
diff --git a/lib/rcu.c b/lib/rcu.c

index 3491b1eca170c8e9107f96cc24027ea5660048e7..cfec36e62de276976bc452baca3448b2d63563d0 100644 (file)
--- a/lib/rcu.c
+++ b/lib/rcu.c
@@ -18,6 +18,7 @@
  
  _Atomic uint rcu_gp_ctl = RCU_NEST_CNT;
  _Thread_local struct rcu_thread *this_rcu_thread = NULL;
+_Thread_local uint rcu_blocked;
  
  static list rcu_thread_list;
  
@@ -45,6 +46,9 @@ update_counter_and_wait(void)
  void
  synchronize_rcu(void)
  {
+  if (!rcu_blocked && last_locked)
+    bug("Forbidden to synchronize RCU unless an appropriate lock is taken");
+
    LOCK_DOMAIN(resource, rcu_domain);
    update_counter_and_wait();
    update_counter_and_wait();
diff --git a/lib/rcu.h b/lib/rcu.h

index 30eacc5ba04256eb13b113cbcfecade3c5a121dd..632c6b189126ebafe6e296b395bac050b2fad924 100644 (file)
--- a/lib/rcu.h
+++ b/lib/rcu.h
@@ -27,6 +27,7 @@ struct rcu_thread {
  };
  
  extern _Thread_local struct rcu_thread *this_rcu_thread;
+extern _Thread_local uint rcu_blocked;
  
  static inline void rcu_read_lock(void)
  {
@@ -43,6 +44,11 @@ static inline void rcu_read_unlock(void)
    atomic_fetch_sub(&this_rcu_thread->ctl, RCU_NEST_CNT);
  }
  
+static inline _Bool rcu_read_active(void)
+{
+  return !!(atomic_load_explicit(&this_rcu_thread->ctl, memory_order_acquire) & RCU_NEST_MASK);
+}
+
  void synchronize_rcu(void);
  
  /* Registering and unregistering a birdloop. To be called from birdloop implementation */
diff --git a/nest/route.h b/nest/route.h

index 41c6aee3e06b004e6423e8c9fcb0e5e9aa258b2a..e44a791867f3db13b142e80832192a7d6e8f7349 100644 (file)
--- a/nest/route.h
+++ b/nest/route.h
@@ -188,21 +188,17 @@ static inline void rt_cork_acquire(void)
  static inline void rt_cork_release(void)
  {
    if (atomic_fetch_sub_explicit(&rt_cork.active, 1, memory_order_acq_rel) == 1)
-  {
-    synchronize_rcu();
      ev_send(&global_work_list, &rt_cork.run);
-  }
  }
  
-static inline int rt_cork_check(event *e)
+static inline _Bool rt_cork_check(event *e)
  {
-  rcu_read_lock();
-
    int corked = (atomic_load_explicit(&rt_cork.active, memory_order_acquire) > 0);
    if (corked)
      ev_send(&rt_cork.queue, e);
  
-  rcu_read_unlock();
+  if (atomic_load_explicit(&rt_cork.active, memory_order_acquire) == 0)
+    ev_send(&global_work_list, &rt_cork.run);
  
    return corked;
  }
diff --git a/nest/rt-attr.c b/nest/rt-attr.c

index b8fb508ebc2c044e5b46f8baf8f4c3405d46a499..ff895bcaf8c5f7d38bef3dd2855df36905cf0e31 100644 (file)
--- a/nest/rt-attr.c
+++ b/nest/rt-attr.c
@@ -1811,7 +1811,7 @@ ea_show_list(struct cli *c, ea_list *eal)
  void
  rta_init(void)
  {
-  attrs_domain = DOMAIN_NEW(attrs);
+  attrs_domain = DOMAIN_NEW_RCU_SYNC(attrs);
  
    RTA_LOCK;
    rta_pool = rp_new(&root_pool, attrs_domain.attrs, "Attributes");
diff --git a/nest/rt-table.c b/nest/rt-table.c

index de5a755d1b56a91196109e2ea877d7f574ca34d8..bd93e71b92f7db4eaad92509e16045daab11d656 100644 (file)
--- a/nest/rt-table.c
+++ b/nest/rt-table.c
@@ -814,7 +814,8 @@ rt_notify_basic(struct channel *c, const net_addr *net, rte *new, const rte *old
  void
  channel_rpe_mark_seen(struct channel *c, struct rt_pending_export *rpe)
  {
-  channel_trace(c, D_ROUTES, "Marking seen %p (%lu)", rpe, rpe->seq);
+  if (rpe->seq)
+    channel_trace(c, D_ROUTES, "Marking seen %p (%lu)", rpe, rpe->seq);
  
    ASSERT_DIE(c->out_req.hook);
    rpe_mark_seen(c->out_req.hook, rpe);
@@ -2788,7 +2789,7 @@ rt_setup(pool *pp, struct rtable_config *cf)
    pool *sp = birdloop_pool(loop);
  
    /* Create the table domain and pool */
-  DOMAIN(rtable) dom = DOMAIN_NEW(rtable);
+  DOMAIN(rtable) dom = DOMAIN_NEW_RCU_SYNC(rtable);
    LOCK_DOMAIN(rtable, dom);
  
    pool *p = rp_newf(sp, dom.rtable, "Routing table data %s", cf->name);
@@ -3088,7 +3089,7 @@ rt_prune_table(void *_tab)
  static void
  rt_cork_release_hook(void *data UNUSED)
  {
-  do synchronize_rcu();
+  do birdloop_yield();
    while (
        !atomic_load_explicit(&rt_cork.active, memory_order_acquire) &&
        ev_run_list(&rt_cork.queue)
@@ -4436,7 +4437,7 @@ hc_notify_export_one(struct rt_export_request *req, const net_addr *net, struct
           && !ev_active(tab->hcu_event))
        {
         if (req->trace_routes & D_EVENTS)
-         log(L_TRACE "%s requesting HCU");
+         log(L_TRACE "%s requesting HCU", req->name);
  
         ev_send_loop(tab->loop, tab->hcu_event);
        }
diff --git a/sysdep/unix/domain.c b/sysdep/unix/domain.c

index c04e91eab609d20ebd54b2bc26d872822510b99c..a176d7fcc1a9b140bee607827f806d72033b42da 100644 (file)
--- a/sysdep/unix/domain.c
+++ b/sysdep/unix/domain.c
@@ -43,24 +43,29 @@ _Thread_local struct domain_generic **last_locked = NULL;
  struct domain_generic {
    pthread_mutex_t mutex;
    uint order;
+  _Bool forbidden_when_reading_rcu;
    struct domain_generic **prev;
    struct lock_order *locked_by;
    const char *name;
    pool *pool;
  };
  
-#define DOMAIN_INIT(_order) { .mutex = PTHREAD_MUTEX_INITIALIZER, .order = _order }
+#define DOMAIN_INIT(_order, _allow_rcu) { \
+  .mutex = PTHREAD_MUTEX_INITIALIZER, \
+  .order = _order, \
+  .forbidden_when_reading_rcu = !_allow_rcu, \
+}
  
-static struct domain_generic the_bird_domain_gen = DOMAIN_INIT(OFFSETOF(struct lock_order, the_bird));
+static struct domain_generic the_bird_domain_gen = DOMAIN_INIT(OFFSETOF(struct lock_order, the_bird), 1);
  
  DOMAIN(the_bird) the_bird_domain = { .the_bird = &the_bird_domain_gen };
  
  struct domain_generic *
-domain_new(uint order)
+domain_new(uint order, _Bool allow_rcu)
  {
    ASSERT_DIE(order < sizeof(struct lock_order));
    struct domain_generic *dg = xmalloc(sizeof(struct domain_generic));
-  *dg = (struct domain_generic) DOMAIN_INIT(order);
+  *dg = (struct domain_generic) DOMAIN_INIT(order, allow_rcu);
    return dg;
  }
  
@@ -96,6 +101,12 @@ void do_lock(struct domain_generic *dg, struct domain_generic **lsp)
    memcpy(&stack_copy, &locking_stack, sizeof(stack_copy));
    struct domain_generic **lll = last_locked;
  
+  if (dg->forbidden_when_reading_rcu)
+    if (rcu_read_active())
+      bug("Locking of this lock forbidden while RCU reader is active");
+    else
+      rcu_blocked++;
+
    if ((char *) lsp - (char *) &locking_stack != dg->order)
      bug("Trying to lock on bad position: order=%u, lsp=%p, base=%p", dg->order, lsp, &locking_stack);
  
@@ -132,4 +143,7 @@ void do_unlock(struct domain_generic *dg, struct domain_generic **lsp)
    *lsp = NULL;
    dg->prev = NULL;
    pthread_mutex_unlock(&dg->mutex);
+
+  if (dg->forbidden_when_reading_rcu)
+    ASSERT_DIE(rcu_blocked--);
  }
diff --git a/sysdep/unix/io-loop.c b/sysdep/unix/io-loop.c

index 5934c12905234a8008a841f9ddc2e3301c36986b..76865a85af3ce50afc381f119739967c6624d826 100644 (file)
--- a/sysdep/unix/io-loop.c
+++ b/sysdep/unix/io-loop.c
@@ -1513,7 +1513,7 @@ birdloop_run_timer(timer *tm)
  static struct birdloop *
  birdloop_vnew_internal(pool *pp, uint order, struct birdloop_pickup_group *group, const char *name, va_list args)
  {
-  struct domain_generic *dg = domain_new(order);
+  struct domain_generic *dg = domain_new(order, 1);
    DG_LOCK(dg);
  
    pool *p = rp_vnewf(pp, dg, name, args);
author	Maria Matejka <mq@ucw.cz>
	Thu, 16 May 2024 08:22:19 +0000 (10:22 +0200)
committer	Maria Matejka <mq@ucw.cz>
	Wed, 22 May 2024 09:34:34 +0000 (11:34 +0200)
lib/lockfree.h		patch \| blob \| blame \| history
lib/locking.h		patch \| blob \| blame \| history
lib/rcu.c		patch \| blob \| blame \| history
lib/rcu.h		patch \| blob \| blame \| history
nest/route.h		patch \| blob \| blame \| history
nest/rt-attr.c		patch \| blob \| blame \| history
nest/rt-table.c		patch \| blob \| blame \| history
sysdep/unix/domain.c		patch \| blob \| blame \| history
sysdep/unix/io-loop.c		patch \| blob \| blame \| history