git.ipfire.org Git - thirdparty/kernel/linux.git/commitdiff
drm/amdkfd: mark GFX12 system and peer GPU memory mappings as MTYPE_NC
author: Sreekant Somasekharan <sreekant.somasekharan@amd.com>
Tue, 26 Mar 2024 20:19:28 +0000 (16:19 -0400)
committer: Alex Deucher <alexander.deucher@amd.com>
Thu, 2 May 2024 20:18:13 +0000 (16:18 -0400)
Due to a HW bug, the system memory mappings and peer GPU mappings
on GFX12 need to be marked as MTYPE_NC.

Cc: Joe Greathouse <joseph.greathouse@amd.com>
Cc: David Belanger <david.belanger@amd.com>
Signed-off-by: Rajneesh Bhardwaj <rajneesh.bhardwaj@amd.com>
Signed-off-by: Sreekant Somasekharan <sreekant.somasekharan@amd.com>
Reviewed-by: Harish Kasiviswanathan <Harish.Kasiviswanathan@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
drivers/gpu/drm/amd/amdgpu/gmc_v12_0.c
drivers/gpu/drm/amd/amdkfd/kfd_svm.c

index c24f5bd3e09cee73bb83f5d8609808c492ba615f..3e6676fdc1875456564051b0de70ad463aec3d1c 100644 (file)
@@ -497,6 +497,10 @@ static void gmc_v12_0_get_vm_pte(struct amdgpu_device *adev,
                                 uint64_t *flags)
 {
        struct amdgpu_bo *bo = mapping->bo_va->base.bo;
+       struct amdgpu_device *bo_adev = amdgpu_ttm_adev(bo->tbo.bdev);
+       bool coherent = bo->flags & AMDGPU_GEM_CREATE_COHERENT;
+       bool is_system = bo->tbo.resource->mem_type == TTM_PL_SYSTEM;
+
 
        *flags &= ~AMDGPU_PTE_EXECUTABLE;
        *flags |= mapping->flags & AMDGPU_PTE_EXECUTABLE;
@@ -515,6 +519,11 @@ static void gmc_v12_0_get_vm_pte(struct amdgpu_device *adev,
                               AMDGPU_GEM_CREATE_UNCACHED))
                *flags = (*flags & ~AMDGPU_PTE_MTYPE_GFX12_MASK) |
                         AMDGPU_PTE_MTYPE_GFX12(MTYPE_UC);
+
+       /* WA for HW bug */
+       if ((bo && is_system) || ((bo_adev != adev) && coherent))
+               *flags |= AMDGPU_PTE_MTYPE_GFX12(MTYPE_NC);
+
 }
 
 static unsigned gmc_v12_0_get_vbios_fb_size(struct amdgpu_device *adev)
index 7bb3d76505689f27aaa6d42376d339d9bc1170d6..91175b1bd9ac0cffc83ca1ba9413765f86772ff0 100644 (file)
@@ -1249,6 +1249,15 @@ svm_range_get_pte_flags(struct kfd_node *node,
                        mapping_flags |= AMDGPU_VM_MTYPE_UC;
                }
                break;
+       case IP_VERSION(12, 0, 0):
+               if (domain == SVM_RANGE_VRAM_DOMAIN) {
+                       if (bo_node != node)
+                               mapping_flags |= AMDGPU_VM_MTYPE_NC;
+               } else {
+                       mapping_flags |= coherent ?
+                               AMDGPU_VM_MTYPE_UC : AMDGPU_VM_MTYPE_NC;
+               }
+               break;
        default:
                mapping_flags |= coherent ?
                        AMDGPU_VM_MTYPE_UC : AMDGPU_VM_MTYPE_NC;