git.ipfire.org Git - thirdparty/kernel/linux.git/commitdiff
drm/amdkfd: Don't clear PT after process killed
author Philip Yang <Philip.Yang@amd.com>
Fri, 31 Oct 2025 14:50:02 +0000 (10:50 -0400)
committer Alex Deucher <alexander.deucher@amd.com>
Tue, 4 Nov 2025 16:53:22 +0000 (11:53 -0500)
If the process is killed, the VM entity is stopped. Submitting a PT update
job then triggers the error message "*ERROR* Trying to push to a killed
entity", and the job will not execute.

Suggested-by: Christian König <christian.koenig@amd.com>
Signed-off-by: Philip Yang <Philip.Yang@amd.com>
Reviewed-by: Christian König <christian.koenig@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
drivers/gpu/drm/amd/amdgpu/amdgpu_amdkfd_gpuvm.c

index 96ccd5ade03154da55e1cef8adb6f2311ef66d7e..b1c24c8fa6862330920de902e903807ecfefabe7 100644 (file)
@@ -1274,6 +1274,10 @@ static int unmap_bo_from_gpuvm(struct kgd_mem *mem,
 
        (void)amdgpu_vm_bo_unmap(adev, bo_va, entry->va);
 
+       /* VM entity stopped if process killed, don't clear freed pt bo */
+       if (!amdgpu_vm_ready(vm))
+               return 0;
+
        (void)amdgpu_vm_clear_freed(adev, vm, &bo_va->last_pt_update);
 
        (void)amdgpu_sync_fence(sync, bo_va->last_pt_update, GFP_KERNEL);