drm/xe/vf: Wakeup in GuC backend on VF post migration recovery
author    Matthew Brost <matthew.brost@intel.com>    Wed, 8 Oct 2025 21:45:15 +0000 (14:45 -0700)
committer Matthew Brost <matthew.brost@intel.com>    Thu, 9 Oct 2025 10:22:39 +0000 (03:22 -0700)
If VF post-migration recovery is in progress, the recovery flow will
rebuild all GuC submission state. In this case, exit all waiters to
ensure that submission queue scheduling can also be paused. Avoid taking
any adverse actions after aborting the wait.

As part of waking up the GuC backend, suspend_wait can now return
-EAGAIN, indicating that the wait should be retried. If the caller is
running in a work item, that work item needs to be requeued to avoid a
deadlock caused by the work item blocking the VF migration recovery
work item.
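
For reference, the caller-side contract can be summarized by the sketch
below (illustrative only: struct suspend_work, backend_suspend_wait()
and retry_wq are hypothetical stand-ins for the exec queue, the
q->ops->suspend_wait() op and the preempt fence workqueue; the real
handling is the xe_preempt_fence.c hunk at the end of this patch):

#include <linux/container_of.h>
#include <linux/errno.h>
#include <linux/printk.h>
#include <linux/workqueue.h>

struct suspend_work {
	struct work_struct work;
	struct workqueue_struct *retry_wq;	/* hypothetical driver wq */
};

/* Stand-in for q->ops->suspend_wait(); on a VF it may return -EAGAIN. */
static int backend_suspend_wait(struct suspend_work *sw)
{
	return 0;
}

static void suspend_work_func(struct work_struct *w)
{
	struct suspend_work *sw = container_of(w, struct suspend_work, work);
	int err = backend_suspend_wait(sw);

	/*
	 * -EAGAIN means VF post-migration recovery woke the wait: do not
	 * block here, requeue this work item so it cannot deadlock against
	 * the VF migration recovery work item.
	 */
	if (err == -EAGAIN) {
		queue_work(sw->retry_wq, &sw->work);
		return;
	}

	if (err)
		pr_warn("suspend wait failed: %d\n", err);
}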

v3:
 - Don't block in the preempt fence work queue as this can interfere with VF
   post-migration work queue scheduling, leading to a deadlock (Testing)
 - Use xe_gt_recovery_inprogress (Michal)
v5:
 - Use static function for vf_recovery (Michal)
 - Add helper to wake CT waiters (Michal)
 - Move some code to following patch (Michal)
 - Adjust commit message to explain suspend_wait returning -EAGAIN (Michal)
 - Add kernel doc to suspend_wait around returning -EAGAIN
v7:
 - Add comment on why a shared wait queue is needed on VFs (Michal)
 - Guard against suspend_wait signaling early on resfix done (Tomasz)
v8:
 - Fix kernel doc (CI)

Signed-off-by: Matthew Brost <matthew.brost@intel.com>
Reviewed-by: Michal Wajdeczko <michal.wajdeczko@intel.com>
Link: https://lore.kernel.org/r/20251008214532.3442967-18-matthew.brost@intel.com
drivers/gpu/drm/xe/xe_exec_queue_types.h
drivers/gpu/drm/xe/xe_gt_sriov_vf.c
drivers/gpu/drm/xe/xe_guc_ct.h
drivers/gpu/drm/xe/xe_guc_submit.c
drivers/gpu/drm/xe/xe_preempt_fence.c

diff --git a/drivers/gpu/drm/xe/xe_exec_queue_types.h b/drivers/gpu/drm/xe/xe_exec_queue_types.h
index 27b76cf9da8958e2bb883233aa4a8daf57923cf6..282505fa13774eddefed854eaa825a575c15ea3e 100644
--- a/drivers/gpu/drm/xe/xe_exec_queue_types.h
+++ b/drivers/gpu/drm/xe/xe_exec_queue_types.h
@@ -207,6 +207,9 @@ struct xe_exec_queue_ops {
         * call after suspend. In dma-fencing path thus must return within a
         * reasonable amount of time. -ETIME return shall indicate an error
         * waiting for suspend resulting in associated VM getting killed.
+        * -EAGAIN return indicates the wait should be tried again; if the
+        * wait is within a work item, the work item should be requeued as a
+        * deadlock avoidance mechanism.
         */
        int (*suspend_wait)(struct xe_exec_queue *q);
        /**
diff --git a/drivers/gpu/drm/xe/xe_gt_sriov_vf.c b/drivers/gpu/drm/xe/xe_gt_sriov_vf.c
index 96c93a64d754f803ab29a1ac4d083fdcad3c9591..b851285b8756c10f1ac63574084622dac9e8fea8 100644
--- a/drivers/gpu/drm/xe/xe_gt_sriov_vf.c
+++ b/drivers/gpu/drm/xe/xe_gt_sriov_vf.c
@@ -23,6 +23,7 @@
 #include "xe_gt_sriov_vf.h"
 #include "xe_gt_sriov_vf_types.h"
 #include "xe_guc.h"
+#include "xe_guc_ct.h"
 #include "xe_guc_hxg_helpers.h"
 #include "xe_guc_relay.h"
 #include "xe_guc_submit.h"
@@ -729,6 +730,9 @@ static void vf_start_migration_recovery(struct xe_gt *gt)
            !gt->sriov.vf.migration.recovery_teardown) {
                gt->sriov.vf.migration.recovery_queued = true;
                WRITE_ONCE(gt->sriov.vf.migration.recovery_inprogress, true);
+               smp_wmb();      /* Ensure above write visible before wake */
+
+               xe_guc_ct_wake_waiters(&gt->uc.guc.ct);
 
                started = queue_work(gt->ordered_wq, &gt->sriov.vf.migration.worker);
                xe_gt_sriov_info(gt, "VF migration recovery %s\n", started ?
diff --git a/drivers/gpu/drm/xe/xe_guc_ct.h b/drivers/gpu/drm/xe/xe_guc_ct.h
index d6c81325a76c97bd0eaf7c6f7735ac7e53fdbb9a..ae49364f6f2878fb864f09143ed776e5678db265 100644
--- a/drivers/gpu/drm/xe/xe_guc_ct.h
+++ b/drivers/gpu/drm/xe/xe_guc_ct.h
@@ -72,4 +72,13 @@ xe_guc_ct_send_block_no_fail(struct xe_guc_ct *ct, const u32 *action, u32 len)
 
 long xe_guc_ct_queue_proc_time_jiffies(struct xe_guc_ct *ct);
 
+/**
+ * xe_guc_ct_wake_waiters() - GuC CT wake up waiters
+ * @ct: GuC CT object
+ */
+static inline void xe_guc_ct_wake_waiters(struct xe_guc_ct *ct)
+{
+       wake_up_all(&ct->wq);
+}
+
 #endif
diff --git a/drivers/gpu/drm/xe/xe_guc_submit.c b/drivers/gpu/drm/xe/xe_guc_submit.c
index 59371b7cc8a4722427bae8837e83e9595b75caea..7f0ea35f4f0a073cf98c1542efadcc9d5dfb8e63 100644
--- a/drivers/gpu/drm/xe/xe_guc_submit.c
+++ b/drivers/gpu/drm/xe/xe_guc_submit.c
@@ -27,7 +27,6 @@
 #include "xe_gt.h"
 #include "xe_gt_clock.h"
 #include "xe_gt_printk.h"
-#include "xe_gt_sriov_vf.h"
 #include "xe_guc.h"
 #include "xe_guc_capture.h"
 #include "xe_guc_ct.h"
@@ -702,6 +701,11 @@ static u32 wq_space_until_wrap(struct xe_exec_queue *q)
        return (WQ_SIZE - q->guc->wqi_tail);
 }
 
+static bool vf_recovery(struct xe_guc *guc)
+{
+       return xe_gt_recovery_pending(guc_to_gt(guc));
+}
+
 static int wq_wait_for_space(struct xe_exec_queue *q, u32 wqi_size)
 {
        struct xe_guc *guc = exec_queue_to_guc(q);
@@ -711,7 +715,7 @@ static int wq_wait_for_space(struct xe_exec_queue *q, u32 wqi_size)
 
 #define AVAILABLE_SPACE \
        CIRC_SPACE(q->guc->wqi_tail, q->guc->wqi_head, WQ_SIZE)
-       if (wqi_size > AVAILABLE_SPACE) {
+       if (wqi_size > AVAILABLE_SPACE && !vf_recovery(guc)) {
 try_again:
                q->guc->wqi_head = parallel_read(xe, map, wq_desc.head);
                if (wqi_size > AVAILABLE_SPACE) {
@@ -910,9 +914,10 @@ static void disable_scheduling_deregister(struct xe_guc *guc,
        ret = wait_event_timeout(guc->ct.wq,
                                 (!exec_queue_pending_enable(q) &&
                                  !exec_queue_pending_disable(q)) ||
-                                        xe_guc_read_stopped(guc),
+                                        xe_guc_read_stopped(guc) ||
+                                        vf_recovery(guc),
                                 HZ * 5);
-       if (!ret) {
+       if (!ret && !vf_recovery(guc)) {
                struct xe_gpu_scheduler *sched = &q->guc->sched;
 
                xe_gt_warn(q->gt, "Pending enable/disable failed to respond\n");
@@ -1015,6 +1020,10 @@ static void xe_guc_exec_queue_lr_cleanup(struct work_struct *w)
        bool wedged = false;
 
        xe_gt_assert(guc_to_gt(guc), xe_exec_queue_is_lr(q));
+
+       if (vf_recovery(guc))
+               return;
+
        trace_xe_exec_queue_lr_cleanup(q);
 
        if (!exec_queue_killed(q))
@@ -1047,7 +1056,11 @@ static void xe_guc_exec_queue_lr_cleanup(struct work_struct *w)
                 */
                ret = wait_event_timeout(guc->ct.wq,
                                         !exec_queue_pending_disable(q) ||
-                                        xe_guc_read_stopped(guc), HZ * 5);
+                                        xe_guc_read_stopped(guc) ||
+                                        vf_recovery(guc), HZ * 5);
+               if (vf_recovery(guc))
+                       return;
+
                if (!ret) {
                        xe_gt_warn(q->gt, "Schedule disable failed to respond, guc_id=%d\n",
                                   q->guc->id);
@@ -1137,8 +1150,9 @@ static void enable_scheduling(struct xe_exec_queue *q)
 
        ret = wait_event_timeout(guc->ct.wq,
                                 !exec_queue_pending_enable(q) ||
-                                xe_guc_read_stopped(guc), HZ * 5);
-       if (!ret || xe_guc_read_stopped(guc)) {
+                                xe_guc_read_stopped(guc) ||
+                                vf_recovery(guc), HZ * 5);
+       if ((!ret && !vf_recovery(guc)) || xe_guc_read_stopped(guc)) {
                xe_gt_warn(guc_to_gt(guc), "Schedule enable failed to respond");
                set_exec_queue_banned(q);
                xe_gt_reset_async(q->gt);
@@ -1209,7 +1223,8 @@ guc_exec_queue_timedout_job(struct drm_sched_job *drm_job)
         * list so job can be freed and kick scheduler ensuring free job is not
         * lost.
         */
-       if (test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, &job->fence->flags))
+       if (test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, &job->fence->flags) ||
+           vf_recovery(guc))
                return DRM_GPU_SCHED_STAT_NO_HANG;
 
        /* Kill the run_job entry point */
@@ -1261,7 +1276,10 @@ guc_exec_queue_timedout_job(struct drm_sched_job *drm_job)
                        ret = wait_event_timeout(guc->ct.wq,
                                                 (!exec_queue_pending_enable(q) &&
                                                  !exec_queue_pending_disable(q)) ||
-                                                xe_guc_read_stopped(guc), HZ * 5);
+                                                xe_guc_read_stopped(guc) ||
+                                                vf_recovery(guc), HZ * 5);
+                       if (vf_recovery(guc))
+                               goto handle_vf_resume;
                        if (!ret || xe_guc_read_stopped(guc))
                                goto trigger_reset;
 
@@ -1286,7 +1304,10 @@ guc_exec_queue_timedout_job(struct drm_sched_job *drm_job)
                smp_rmb();
                ret = wait_event_timeout(guc->ct.wq,
                                         !exec_queue_pending_disable(q) ||
-                                        xe_guc_read_stopped(guc), HZ * 5);
+                                        xe_guc_read_stopped(guc) ||
+                                        vf_recovery(guc), HZ * 5);
+               if (vf_recovery(guc))
+                       goto handle_vf_resume;
                if (!ret || xe_guc_read_stopped(guc)) {
 trigger_reset:
                        if (!ret)
@@ -1391,6 +1412,7 @@ rearm:
         * some thought, do this in a follow up.
         */
        xe_sched_submission_start(sched);
+handle_vf_resume:
        return DRM_GPU_SCHED_STAT_NO_HANG;
 }
 
@@ -1487,11 +1509,24 @@ static void __guc_exec_queue_process_msg_set_sched_props(struct xe_sched_msg *ms
 
 static void __suspend_fence_signal(struct xe_exec_queue *q)
 {
+       struct xe_guc *guc = exec_queue_to_guc(q);
+       struct xe_device *xe = guc_to_xe(guc);
+
        if (!q->guc->suspend_pending)
                return;
 
        WRITE_ONCE(q->guc->suspend_pending, false);
-       wake_up(&q->guc->suspend_wait);
+
+       /*
+        * We use a GuC shared wait queue for VFs because the VF resfix start
+        * interrupt must be able to wake all instances of suspend_wait. This
+        * prevents the VF migration worker from being starved during
+        * scheduling.
+        */
+       if (IS_SRIOV_VF(xe))
+               wake_up_all(&guc->ct.wq);
+       else
+               wake_up(&q->guc->suspend_wait);
 }
 
 static void suspend_fence_signal(struct xe_exec_queue *q)
@@ -1512,8 +1547,9 @@ static void __guc_exec_queue_process_msg_suspend(struct xe_sched_msg *msg)
 
        if (guc_exec_queue_allowed_to_change_state(q) && !exec_queue_suspended(q) &&
            exec_queue_enabled(q)) {
-               wait_event(guc->ct.wq, (q->guc->resume_time != RESUME_PENDING ||
-                          xe_guc_read_stopped(guc)) && !exec_queue_pending_disable(q));
+               wait_event(guc->ct.wq, vf_recovery(guc) ||
+                          ((q->guc->resume_time != RESUME_PENDING ||
+                          xe_guc_read_stopped(guc)) && !exec_queue_pending_disable(q)));
 
                if (!xe_guc_read_stopped(guc)) {
                        s64 since_resume_ms =
@@ -1640,7 +1676,7 @@ static int guc_exec_queue_init(struct xe_exec_queue *q)
 
        q->entity = &ge->entity;
 
-       if (xe_guc_read_stopped(guc))
+       if (xe_guc_read_stopped(guc) || vf_recovery(guc))
                xe_sched_stop(sched);
 
        mutex_unlock(&guc->submission_state.lock);
@@ -1786,6 +1822,7 @@ static int guc_exec_queue_suspend(struct xe_exec_queue *q)
 static int guc_exec_queue_suspend_wait(struct xe_exec_queue *q)
 {
        struct xe_guc *guc = exec_queue_to_guc(q);
+       struct xe_device *xe = guc_to_xe(guc);
        int ret;
 
        /*
@@ -1793,11 +1830,21 @@ static int guc_exec_queue_suspend_wait(struct xe_exec_queue *q)
         * suspend_pending upon kill but to be paranoid but races in which
         * suspend_pending is set after kill also check kill here.
         */
-       ret = wait_event_interruptible_timeout(q->guc->suspend_wait,
-                                              !READ_ONCE(q->guc->suspend_pending) ||
-                                              exec_queue_killed(q) ||
-                                              xe_guc_read_stopped(guc),
-                                              HZ * 5);
+#define WAIT_COND \
+       (!READ_ONCE(q->guc->suspend_pending) || exec_queue_killed(q) || \
+        xe_guc_read_stopped(guc))
+
+retry:
+       if (IS_SRIOV_VF(xe))
+               ret = wait_event_interruptible_timeout(guc->ct.wq, WAIT_COND ||
+                                                      vf_recovery(guc),
+                                                      HZ * 5);
+       else
+               ret = wait_event_interruptible_timeout(q->guc->suspend_wait,
+                                                      WAIT_COND, HZ * 5);
+
+       if (vf_recovery(guc) && !xe_device_wedged((guc_to_xe(guc))))
+               return -EAGAIN;
 
        if (!ret) {
                xe_gt_warn(guc_to_gt(guc),
@@ -1805,8 +1852,13 @@ static int guc_exec_queue_suspend_wait(struct xe_exec_queue *q)
                           q->guc->id);
                /* XXX: Trigger GT reset? */
                return -ETIME;
+       } else if (IS_SRIOV_VF(xe) && !WAIT_COND) {
+               /* Corner case on RESFIX DONE where vf_recovery() changes */
+               goto retry;
        }
 
+#undef WAIT_COND
+
        return ret < 0 ? ret : 0;
 }
 
@@ -1905,8 +1957,7 @@ int xe_guc_submit_reset_prepare(struct xe_guc *guc)
 {
        int ret;
 
-       if (xe_gt_WARN_ON(guc_to_gt(guc),
-                         xe_gt_sriov_vf_recovery_pending(guc_to_gt(guc))))
+       if (xe_gt_WARN_ON(guc_to_gt(guc), vf_recovery(guc)))
                return 0;
 
        if (!guc->submission_state.initialized)
diff --git a/drivers/gpu/drm/xe/xe_preempt_fence.c b/drivers/gpu/drm/xe/xe_preempt_fence.c
index 83fbeea5aa201a597cf9703834f78c4aab95d2ae..7f587ca3947def251f3815be93f5713ee739847d 100644
--- a/drivers/gpu/drm/xe/xe_preempt_fence.c
+++ b/drivers/gpu/drm/xe/xe_preempt_fence.c
@@ -8,6 +8,8 @@
 #include <linux/slab.h>
 
 #include "xe_exec_queue.h"
+#include "xe_gt_printk.h"
+#include "xe_guc_exec_queue_types.h"
 #include "xe_vm.h"
 
 static void preempt_fence_work_func(struct work_struct *w)
@@ -22,6 +24,15 @@ static void preempt_fence_work_func(struct work_struct *w)
        } else if (!q->ops->reset_status(q)) {
                int err = q->ops->suspend_wait(q);
 
+               if (err == -EAGAIN) {
+                       xe_gt_dbg(q->gt, "PREEMPT FENCE RETRY guc_id=%d",
+                                 q->guc->id);
+                       queue_work(q->vm->xe->preempt_fence_wq,
+                                  &pfence->preempt_work);
+                       dma_fence_end_signalling(cookie);
+                       return;
+               }
+
                if (err)
                        dma_fence_set_error(&pfence->base, err);
        } else {