git.ipfire.org Git - thirdparty/linux.git/commitdiff
drm/amdkfd: Fix race in GWS queue scheduling
author Jay Cornwall <jay.cornwall@amd.com>
Wed, 11 Jun 2025 14:52:14 +0000 (09:52 -0500)
committer Alex Deucher <alexander.deucher@amd.com>
Wed, 18 Jun 2025 17:17:32 +0000 (13:17 -0400)
q->gws is not updated atomically with qpd->mapped_gws_queue. If a
runlist is created between pqm_set_gws and update_queue it will
contain a queue which uses GWS in a process with no GWS allocated.
This will result in a scheduler hang.

Use q->properties.is_gws which is changed while holding the DQM lock.

Signed-off-by: Jay Cornwall <jay.cornwall@amd.com>
Reviewed-by: Harish Kasiviswanathan <Harish.Kasiviswanathan@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
(cherry picked from commit b98370220eb3110e82248e3354e16a489a492cfb)
Cc: stable@vger.kernel.org
drivers/gpu/drm/amd/amdkfd/kfd_packet_manager_v9.c

index 8fa6489b6f5d9fb4311177141869fa9fc66eb136..505036968a7759c752c1d81e840b539e884708ec 100644 (file)
@@ -240,7 +240,7 @@ static int pm_map_queues_v9(struct packet_manager *pm, uint32_t *buffer,
 
        packet->bitfields2.engine_sel =
                engine_sel__mes_map_queues__compute_vi;
-       packet->bitfields2.gws_control_queue = q->gws ? 1 : 0;
+       packet->bitfields2.gws_control_queue = q->properties.is_gws ? 1 : 0;
        packet->bitfields2.extended_engine_sel =
                extended_engine_sel__mes_map_queues__legacy_engine_sel;
        packet->bitfields2.queue_type =