]> git.ipfire.org Git - thirdparty/kernel/linux.git/commitdiff
drm/amdgpu/gfx12: Implement the GFX12 KCQ pipe reset
authorPrike Liang <Prike.Liang@amd.com>
Fri, 21 Feb 2025 12:34:32 +0000 (20:34 +0800)
committerAlex Deucher <alexander.deucher@amd.com>
Fri, 11 Apr 2025 20:56:07 +0000 (16:56 -0400)
Implement the GFX12 KCQ pipe reset, and disable the GFX12
kernel compute queue until the CPFW fully supports it.

Signed-off-by: Prike Liang <Prike.Liang@amd.com>
Acked-by: Alex Deucher <alexander.deucher@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
drivers/gpu/drm/amd/amdgpu/gfx_v12_0.c

index 3d87e445270e4025a41e9fd9b5fc2eda51a7b216..2474006b1a3407c1d23c5566dd91c1cc25a9dbd7 100644 (file)
@@ -5316,6 +5316,89 @@ static int gfx_v12_0_reset_kgq(struct amdgpu_ring *ring, unsigned int vmid)
        return amdgpu_ring_test_ring(ring);
 }
 
+static int gfx_v12_0_reset_compute_pipe(struct amdgpu_ring *ring)
+{
+       struct amdgpu_device *adev = ring->adev;
+       uint32_t reset_pipe = 0, clean_pipe = 0;
+       int r = 0;
+
+       if (!gfx_v12_pipe_reset_support(adev))
+               return -EOPNOTSUPP;
+
+       gfx_v12_0_set_safe_mode(adev, 0);
+       mutex_lock(&adev->srbm_mutex);
+       soc24_grbm_select(adev, ring->me, ring->pipe, ring->queue, 0);
+
+       reset_pipe = RREG32_SOC15(GC, 0, regCP_MEC_RS64_CNTL);
+       clean_pipe = reset_pipe;
+
+       if (adev->gfx.rs64_enable) {
+               switch (ring->pipe) {
+               case 0:
+                       reset_pipe = REG_SET_FIELD(reset_pipe, CP_MEC_RS64_CNTL,
+                                                  MEC_PIPE0_RESET, 1);
+                       clean_pipe = REG_SET_FIELD(clean_pipe, CP_MEC_RS64_CNTL,
+                                                  MEC_PIPE0_RESET, 0);
+                       break;
+               case 1:
+                       reset_pipe = REG_SET_FIELD(reset_pipe, CP_MEC_RS64_CNTL,
+                                                  MEC_PIPE1_RESET, 1);
+                       clean_pipe = REG_SET_FIELD(clean_pipe, CP_MEC_RS64_CNTL,
+                                                  MEC_PIPE1_RESET, 0);
+                       break;
+               case 2:
+                       reset_pipe = REG_SET_FIELD(reset_pipe, CP_MEC_RS64_CNTL,
+                                                  MEC_PIPE2_RESET, 1);
+                       clean_pipe = REG_SET_FIELD(clean_pipe, CP_MEC_RS64_CNTL,
+                                                  MEC_PIPE2_RESET, 0);
+                       break;
+               case 3:
+                       reset_pipe = REG_SET_FIELD(reset_pipe, CP_MEC_RS64_CNTL,
+                                                  MEC_PIPE3_RESET, 1);
+                       clean_pipe = REG_SET_FIELD(clean_pipe, CP_MEC_RS64_CNTL,
+                                                  MEC_PIPE3_RESET, 0);
+                       break;
+               default:
+                       break;
+               }
+               WREG32_SOC15(GC, 0, regCP_MEC_RS64_CNTL, reset_pipe);
+               WREG32_SOC15(GC, 0, regCP_MEC_RS64_CNTL, clean_pipe);
+               r = (RREG32_SOC15(GC, 0, regCP_MEC_RS64_INSTR_PNTR) << 2) -
+                               RS64_FW_UC_START_ADDR_LO;
+       } else {
+               switch (ring->pipe) {
+               case 0:
+                       reset_pipe = REG_SET_FIELD(reset_pipe, CP_MEC_CNTL,
+                                                          MEC_ME1_PIPE0_RESET, 1);
+                       clean_pipe = REG_SET_FIELD(clean_pipe, CP_MEC_CNTL,
+                                                          MEC_ME1_PIPE0_RESET, 0);
+                       break;
+               case 1:
+                       reset_pipe = REG_SET_FIELD(reset_pipe, CP_MEC_CNTL,
+                                                          MEC_ME1_PIPE1_RESET, 1);
+                       clean_pipe = REG_SET_FIELD(clean_pipe, CP_MEC_CNTL,
+                                                          MEC_ME1_PIPE1_RESET, 0);
+                       break;
+               default:
+               break;
+               }
+               WREG32_SOC15(GC, 0, regCP_MEC_CNTL, reset_pipe);
+               WREG32_SOC15(GC, 0, regCP_MEC_CNTL, clean_pipe);
+               /* Doesn't find the F32 MEC instruction pointer register, and suppose
+                * the driver won't run into the F32 mode.
+                */
+       }
+
+       soc24_grbm_select(adev, 0, 0, 0, 0);
+       mutex_unlock(&adev->srbm_mutex);
+       gfx_v12_0_unset_safe_mode(adev, 0);
+
+       dev_info(adev->dev, "The ring %s pipe resets: %s\n", ring->name,
+                       r == 0 ? "successfully" : "failed");
+       /* Need the ring test to verify the pipe reset result.*/
+       return 0;
+}
+
 static int gfx_v12_0_reset_kcq(struct amdgpu_ring *ring, unsigned int vmid)
 {
        struct amdgpu_device *adev = ring->adev;
@@ -5326,8 +5409,10 @@ static int gfx_v12_0_reset_kcq(struct amdgpu_ring *ring, unsigned int vmid)
 
        r = amdgpu_mes_reset_legacy_queue(ring->adev, ring, vmid, true);
        if (r) {
-               dev_err(adev->dev, "reset via MMIO failed %d\n", r);
-               return r;
+               dev_warn(adev->dev, "fail(%d) to reset kcq  and try pipe reset\n", r);
+               r = gfx_v12_0_reset_compute_pipe(ring);
+               if (r)
+                       return r;
        }
 
        r = gfx_v12_0_kcq_init_queue(ring, true);