drm/amdgpu: Fix error handling in slot reset

author Lijo Lazar <lijo.lazar@amd.com>
Tue, 24 Feb 2026 04:48:51 +0000 (10:18 +0530)
committer Alex Deucher <alexander.deucher@amd.com>
Wed, 25 Feb 2026 21:56:33 +0000 (16:56 -0500)

diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c
index 0acddcb047300087bfb7053f74605a971022a3c8..d5bf62bb4602ac97b1f901465457ab9bab64890b 100644
--- a/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c
+++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_device.c
@@ -7043,6 +7043,15 @@ pci_ers_result_t amdgpu_pci_slot_reset(struct pci_dev *pdev)
         dev_info(adev->dev, "PCI error: slot reset callback!!\n");
  
         memset(&reset_context, 0, sizeof(reset_context));
+       INIT_LIST_HEAD(&device_list);
+       hive = amdgpu_get_xgmi_hive(adev);
+       if (hive) {
+               mutex_lock(&hive->hive_lock);
+               list_for_each_entry(tmp_adev, &hive->device_list, gmc.xgmi.head)
+                       list_add_tail(&tmp_adev->reset_list, &device_list);
+       } else {
+               list_add_tail(&adev->reset_list, &device_list);
+       }
  
         if (adev->pcie_reset_ctx.swus)
                 link_dev = adev->pcie_reset_ctx.swus;
@@ -7083,19 +7092,13 @@ pci_ers_result_t amdgpu_pci_slot_reset(struct pci_dev *pdev)
         reset_context.reset_req_dev = adev;
         set_bit(AMDGPU_NEED_FULL_RESET, &reset_context.flags);
         set_bit(AMDGPU_SKIP_COREDUMP, &reset_context.flags);
-       INIT_LIST_HEAD(&device_list);
  
-       hive = amdgpu_get_xgmi_hive(adev);
         if (hive) {
-               mutex_lock(&hive->hive_lock);
                 reset_context.hive = hive;
-               list_for_each_entry(tmp_adev, &hive->device_list, gmc.xgmi.head) {
+               list_for_each_entry(tmp_adev, &hive->device_list, gmc.xgmi.head)
                         tmp_adev->pcie_reset_ctx.in_link_reset = true;
-                       list_add_tail(&tmp_adev->reset_list, &device_list);
-               }
         } else {
                 set_bit(AMDGPU_SKIP_HW_RESET, &reset_context.flags);
-               list_add_tail(&adev->reset_list, &device_list);
         }
  
         r = amdgpu_device_asic_reset(adev, &device_list, &reset_context);
author	Lijo Lazar <lijo.lazar@amd.com>
	Tue, 24 Feb 2026 04:48:51 +0000 (10:18 +0530)
committer	Alex Deucher <alexander.deucher@amd.com>
	Wed, 25 Feb 2026 21:56:33 +0000 (16:56 -0500)