git.ipfire.org Git - thirdparty/linux.git/commitdiff
drm/amdkfd: Don't clear PT after process killed
author Philip Yang <Philip.Yang@amd.com>
Fri, 31 Oct 2025 14:50:02 +0000 (10:50 -0400)
committer Alex Deucher <alexander.deucher@amd.com>
Tue, 4 Nov 2025 18:40:42 +0000 (13:40 -0500)
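If the process is killed, the VM entity is stopped. Submitting a PT update
job will then trigger the error message "*ERROR* Trying to push to a killed
entity", and the job will not execute. So when unmapping a BO, return early
if the VM is not ready instead of clearing the freed page tables.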

Suggested-by: Christian König <christian.koenig@amd.com>
Signed-off-by: Philip Yang <Philip.Yang@amd.com>
Reviewed-by: Christian König <christian.koenig@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
(cherry picked from commit 10c382ec6c6d1e11975a11962bec21cba6360391)
Cc: stable@vger.kernel.org
drivers/gpu/drm/amd/amdgpu/amdgpu_amdkfd_gpuvm.c

index a2ca9acf8c4ea8eefd50d91ec88e046bc5cbdf29..923f0fa7350cf877635835dcc7101f7841376a05 100644 (file)
@@ -1267,6 +1267,10 @@ static int unmap_bo_from_gpuvm(struct kgd_mem *mem,
 
        (void)amdgpu_vm_bo_unmap(adev, bo_va, entry->va);
 
+       /* VM entity stopped if process killed, don't clear freed pt bo */
+       if (!amdgpu_vm_ready(vm))
+               return 0;
+
        (void)amdgpu_vm_clear_freed(adev, vm, &bo_va->last_pt_update);
 
        (void)amdgpu_sync_fence(sync, bo_va->last_pt_update, GFP_KERNEL);