workqueue: Allow cancel_work_sync() and disable_work() from atomic contexts on BH work items

author Tejun Heo <tj@kernel.org>

Mon, 25 Mar 2024 17:21:03 +0000 (07:21 -1000)

committer Tejun Heo <tj@kernel.org>

Mon, 25 Mar 2024 17:21:03 +0000 (07:21 -1000)
author Tejun Heo <tj@kernel.org>
Mon, 25 Mar 2024 17:21:03 +0000 (07:21 -1000)
committer Tejun Heo <tj@kernel.org>
Mon, 25 Mar 2024 17:21:03 +0000 (07:21 -1000)
diff --git a/kernel/workqueue.c b/kernel/workqueue.c

index baf7495338bc59f4636e87300661f96ed7463899..c0cc8b209d5cfe9b06b55de82e72338161b7df75 100644 (file)
--- a/kernel/workqueue.c
+++ b/kernel/workqueue.c
@@ -4105,8 +4105,6 @@ static bool start_flush_work(struct work_struct *work, struct wq_barrier *barr,
         struct pool_workqueue *pwq;
         struct workqueue_struct *wq;
  
-       might_sleep();
-
         rcu_read_lock();
         pool = get_work_pool(work);
         if (!pool) {
@@ -4158,6 +4156,7 @@ already_gone:
  static bool __flush_work(struct work_struct *work, bool from_cancel)
  {
         struct wq_barrier barr;
+       unsigned long data;
  
         if (WARN_ON(!wq_online))
                 return false;
@@ -4165,13 +4164,41 @@ static bool __flush_work(struct work_struct *work, bool from_cancel)
         if (WARN_ON(!work->func))
                 return false;
  
-       if (start_flush_work(work, &barr, from_cancel)) {
-               wait_for_completion(&barr.done);
-               destroy_work_on_stack(&barr.work);
-               return true;
-       } else {
+       if (!start_flush_work(work, &barr, from_cancel))
                 return false;
+
+       /*
+        * start_flush_work() returned %true. If @from_cancel is set, we know
+        * that @work must have been executing during start_flush_work() and
+        * can't currently be queued. Its data must contain OFFQ bits. If @work
+        * was queued on a BH workqueue, we also know that it was running in the
+        * BH context and thus can be busy-waited.
+        */
+       data = *work_data_bits(work);
+       if (from_cancel &&
+           !WARN_ON_ONCE(data & WORK_STRUCT_PWQ) && (data & WORK_OFFQ_BH)) {
+               /*
+                * On RT, repeatedly flip BH off and on to prevent a live lock
+                * when %current has preempted softirq processing or is keeping
+                * ksoftirqd from running. If the BH work item runs on a different
+                * CPU then this has no effect other than doing the BH
+                * disable/enable dance for nothing. This is copied from
+                * kernel/softirq.c::tasklet_unlock_spin_wait().
+                */
+               while (!try_wait_for_completion(&barr.done)) {
+                       if (IS_ENABLED(CONFIG_PREEMPT_RT)) {
+                               local_bh_disable();
+                               local_bh_enable();
+                       } else {
+                               cpu_relax();
+                       }
+               }
+       } else {
+               wait_for_completion(&barr.done);
         }
+
+       destroy_work_on_stack(&barr.work);
+       return true;
  }
  
  /**
@@ -4187,6 +4214,7 @@ static bool __flush_work(struct work_struct *work, bool from_cancel)
   */
  bool flush_work(struct work_struct *work)
  {
+       might_sleep();
         return __flush_work(work, false);
  }
  EXPORT_SYMBOL_GPL(flush_work);
@@ -4276,6 +4304,11 @@ static bool __cancel_work_sync(struct work_struct *work, u32 cflags)
  
         ret = __cancel_work(work, cflags | WORK_CANCEL_DISABLE);
  
+       if (*work_data_bits(work) & WORK_OFFQ_BH)
+               WARN_ON_ONCE(in_hardirq());
+       else
+               might_sleep();
+
         /*
          * Skip __flush_work() during early boot when we know that @work isn't
          * executing. This allows canceling during early boot.
@@ -4302,19 +4335,19 @@ EXPORT_SYMBOL(cancel_work);
   * cancel_work_sync - cancel a work and wait for it to finish
   * @work: the work to cancel
   *
- * Cancel @work and wait for its execution to finish.  This function
- * can be used even if the work re-queues itself or migrates to
- * another workqueue.  On return from this function, @work is
- * guaranteed to be not pending or executing on any CPU.
+ * Cancel @work and wait for its execution to finish. This function can be used
+ * even if the work re-queues itself or migrates to another workqueue. On return
+ * from this function, @work is guaranteed to be not pending or executing on any
+ * CPU as long as there aren't racing enqueues.
   *
- * cancel_work_sync(&delayed_work->work) must not be used for
- * delayed_work's.  Use cancel_delayed_work_sync() instead.
+ * cancel_work_sync(&delayed_work->work) must not be used for delayed_work's.
+ * Use cancel_delayed_work_sync() instead.
   *
- * The caller must ensure that the workqueue on which @work was last
- * queued can't be destroyed before this function returns.
+ * Must be called from a sleepable context if @work was last queued on a non-BH
+ * workqueue. Can also be called from non-hardirq atomic contexts including BH
+ * if @work was last queued on a BH workqueue.
   *
- * Return:
- * %true if @work was pending, %false otherwise.
+ * Returns %true if @work was pending, %false otherwise.
   */
  bool cancel_work_sync(struct work_struct *work)
  {
@@ -4384,8 +4417,11 @@ EXPORT_SYMBOL_GPL(disable_work);
   * Similar to disable_work() but also wait for @work to finish if currently
   * executing.
   *
- * Must be called from a sleepable context. Returns %true if @work was pending,
- * %false otherwise.
+ * Must be called from a sleepable context if @work was last queued on a non-BH
+ * workqueue. Can also be called from non-hardirq atomic contexts including BH
+ * if @work was last queued on a BH workqueue.
+ *
+ * Returns %true if @work was pending, %false otherwise.
   */
  bool disable_work_sync(struct work_struct *work)
  {
author	Tejun Heo <tj@kernel.org>
	Mon, 25 Mar 2024 17:21:03 +0000 (07:21 -1000)
committer	Tejun Heo <tj@kernel.org>
	Mon, 25 Mar 2024 17:21:03 +0000 (07:21 -1000)