]> git.ipfire.org Git - thirdparty/kernel/stable.git/commitdiff
drm/xe/guc_submit: add missing locking in wedged_fini
authorMatthew Auld <matthew.auld@intel.com>
Tue, 24 Sep 2024 15:09:48 +0000 (16:09 +0100)
committerGreg Kroah-Hartman <gregkh@linuxfoundation.org>
Thu, 10 Oct 2024 10:03:04 +0000 (12:03 +0200)
[ Upstream commit 790533e44bfc7af929842fccd9674c9f424d4627 ]

Any non-wedged queue can have a zero refcount here and can be running
concurrently with an async queue destroy, therefore dereferencing the
queue ptr to check wedge status after the lookup can trigger UAF if
queue is not wedged.  Fix this by keeping the submission_state lock held
around the check to postpone the free and make the check safe, before
dropping again around the put() to avoid the deadlock.

Fixes: 8ed9aaae39f3 ("drm/xe: Force wedged state and block GT reset upon any GPU hang")
Signed-off-by: Matthew Auld <matthew.auld@intel.com>
Cc: Matthew Brost <matthew.brost@intel.com>
Reviewed-by: Matthew Brost <matthew.brost@intel.com>
Link: https://patchwork.freedesktop.org/patch/msgid/20240924150947.118433-2-matthew.auld@intel.com
(cherry picked from commit d28af0b6b9580b9f90c265a7da0315b0ad20bbfd)
Signed-off-by: Lucas De Marchi <lucas.demarchi@intel.com>
Signed-off-by: Sasha Levin <sashal@kernel.org>
drivers/gpu/drm/xe/xe_guc_submit.c

index 59b36c7998c243582e775ff911b6ab106668b6d9..3d91734980110f7b419b56f7410d813c2a4377c2 100644 (file)
@@ -290,9 +290,15 @@ static void guc_submit_wedged_fini(void *arg)
        struct xe_exec_queue *q;
        unsigned long index;
 
-       xa_for_each(&guc->submission_state.exec_queue_lookup, index, q)
-               if (exec_queue_wedged(q))
+       mutex_lock(&guc->submission_state.lock);
+       xa_for_each(&guc->submission_state.exec_queue_lookup, index, q) {
+               if (exec_queue_wedged(q)) {
+                       mutex_unlock(&guc->submission_state.lock);
                        xe_exec_queue_put(q);
+                       mutex_lock(&guc->submission_state.lock);
+               }
+       }
+       mutex_unlock(&guc->submission_state.lock);
 }
 
 static const struct xe_exec_queue_ops guc_exec_queue_ops;