drm/xe/svm: Add svm ranges migration policy on atomic access

author Himal Prasad Ghimiray <himal.prasad.ghimiray@intel.com>

Thu, 21 Aug 2025 17:30:53 +0000 (23:00 +0530)

committer Himal Prasad Ghimiray <himal.prasad.ghimiray@intel.com>

Tue, 26 Aug 2025 05:55:36 +0000 (11:25 +0530)
author Himal Prasad Ghimiray <himal.prasad.ghimiray@intel.com>
Thu, 21 Aug 2025 17:30:53 +0000 (23:00 +0530)
committer Himal Prasad Ghimiray <himal.prasad.ghimiray@intel.com>
Tue, 26 Aug 2025 05:55:36 +0000 (11:25 +0530)
diff --git a/drivers/gpu/drm/xe/xe_pt.c b/drivers/gpu/drm/xe/xe_pt.c

index bf50a821853e61cac3944153d8cffb13de7427d1..c0a70c80dff9a8de6bd34305acdab18966673971 100644 (file)
--- a/drivers/gpu/drm/xe/xe_pt.c
+++ b/drivers/gpu/drm/xe/xe_pt.c
@@ -640,28 +640,31 @@ static const struct xe_pt_walk_ops xe_pt_stage_bind_ops = {
   *    - In all other cases device atomics will be disabled with AE=0 until an application
   *      request differently using a ioctl like madvise.
   */
-static bool xe_atomic_for_vram(struct xe_vm *vm)
+static bool xe_atomic_for_vram(struct xe_vm *vm, struct xe_vma *vma)
  {
+       if (vma->attr.atomic_access == DRM_XE_ATOMIC_CPU)
+               return false;
+
         return true;
  }
  
-static bool xe_atomic_for_system(struct xe_vm *vm, struct xe_bo *bo)
+static bool xe_atomic_for_system(struct xe_vm *vm, struct xe_vma *vma)
  {
         struct xe_device *xe = vm->xe;
+       struct xe_bo *bo = xe_vma_bo(vma);
  
-       if (!xe->info.has_device_atomics_on_smem)
+       if (!xe->info.has_device_atomics_on_smem ||
+           vma->attr.atomic_access == DRM_XE_ATOMIC_CPU)
                 return false;
  
+       if (vma->attr.atomic_access == DRM_XE_ATOMIC_DEVICE)
+               return true;
+
         /*
          * If a SMEM+LMEM allocation is backed by SMEM, a device
          * atomics will cause a gpu page fault and which then
          * gets migrated to LMEM, bind such allocations with
          * device atomics enabled.
-        *
-        * TODO: Revisit this. Perhaps add something like a
-        * fault_on_atomics_in_system UAPI flag.
-        * Note that this also prohibits GPU atomics in LR mode for
-        * userptr and system memory on DGFX.
          */
         return (!IS_DGFX(xe) || (!xe_vm_in_lr_mode(vm) ||
                                  (bo && xe_bo_has_single_placement(bo))));
@@ -744,8 +747,8 @@ xe_pt_stage_bind(struct xe_tile *tile, struct xe_vma *vma,
                 goto walk_pt;
  
         if (vma->gpuva.flags & XE_VMA_ATOMIC_PTE_BIT) {
-               xe_walk.default_vram_pte = xe_atomic_for_vram(vm) ? XE_USM_PPGTT_PTE_AE : 0;
-               xe_walk.default_system_pte = xe_atomic_for_system(vm, bo) ?
+               xe_walk.default_vram_pte = xe_atomic_for_vram(vm, vma) ? XE_USM_PPGTT_PTE_AE : 0;
+               xe_walk.default_system_pte = xe_atomic_for_system(vm, vma) ?
                         XE_USM_PPGTT_PTE_AE : 0;
         }
  
diff --git a/drivers/gpu/drm/xe/xe_svm.c b/drivers/gpu/drm/xe/xe_svm.c

index c2306000f15e1820d7aa028dea1b16f862abf5d6..c660ccb21945acd6367c6729c0371e626e68b9a7 100644 (file)
--- a/drivers/gpu/drm/xe/xe_svm.c
+++ b/drivers/gpu/drm/xe/xe_svm.c
@@ -789,22 +789,9 @@ bool xe_svm_range_needs_migrate_to_vram(struct xe_svm_range *range, struct xe_vm
         return true;
  }
  
-/**
- * xe_svm_handle_pagefault() - SVM handle page fault
- * @vm: The VM.
- * @vma: The CPU address mirror VMA.
- * @gt: The gt upon the fault occurred.
- * @fault_addr: The GPU fault address.
- * @atomic: The fault atomic access bit.
- *
- * Create GPU bindings for a SVM page fault. Optionally migrate to device
- * memory.
- *
- * Return: 0 on success, negative error code on error.
- */
-int xe_svm_handle_pagefault(struct xe_vm *vm, struct xe_vma *vma,
-                           struct xe_gt *gt, u64 fault_addr,
-                           bool atomic)
+static int __xe_svm_handle_pagefault(struct xe_vm *vm, struct xe_vma *vma,
+                                    struct xe_gt *gt, u64 fault_addr,
+                                    bool need_vram)
  {
         struct drm_gpusvm_ctx ctx = {
                 .read_only = xe_vma_read_only(vma),
@@ -812,9 +799,8 @@ int xe_svm_handle_pagefault(struct xe_vm *vm, struct xe_vma *vma,
                         IS_ENABLED(CONFIG_DRM_XE_PAGEMAP),
                 .check_pages_threshold = IS_DGFX(vm->xe) &&
                         IS_ENABLED(CONFIG_DRM_XE_PAGEMAP) ? SZ_64K : 0,
-               .devmem_only = atomic && IS_DGFX(vm->xe) &&
-                       IS_ENABLED(CONFIG_DRM_XE_PAGEMAP),
-               .timeslice_ms = atomic && IS_DGFX(vm->xe) &&
+               .devmem_only = need_vram && IS_ENABLED(CONFIG_DRM_XE_PAGEMAP),
+               .timeslice_ms = need_vram && IS_DGFX(vm->xe) &&
                         IS_ENABLED(CONFIG_DRM_XE_PAGEMAP) ?
                         vm->xe->atomic_svm_timeslice_ms : 0,
         };
@@ -917,6 +903,32 @@ err_out:
         return err;
  }
  
+/**
+ * xe_svm_handle_pagefault() - SVM handle page fault
+ * @vm: The VM.
+ * @vma: The CPU address mirror VMA.
+ * @gt: The gt upon the fault occurred.
+ * @fault_addr: The GPU fault address.
+ * @atomic: The fault atomic access bit.
+ *
+ * Create GPU bindings for a SVM page fault. Optionally migrate to device
+ * memory.
+ *
+ * Return: 0 on success, negative error code on error.
+ */
+int xe_svm_handle_pagefault(struct xe_vm *vm, struct xe_vma *vma,
+                           struct xe_gt *gt, u64 fault_addr,
+                           bool atomic)
+{
+       int need_vram;
+
+       need_vram = xe_vma_need_vram_for_atomic(vm->xe, vma, atomic);
+       if (need_vram < 0)
+               return need_vram;
+
+       return __xe_svm_handle_pagefault(vm, vma, gt, fault_addr, need_vram ? true : false);
+}
+
  /**
   * xe_svm_has_mapping() - SVM has mappings
   * @vm: The VM.
diff --git a/drivers/gpu/drm/xe/xe_vm.c b/drivers/gpu/drm/xe/xe_vm.c

index 9fef01400c74ca78432a9b1c6b1d268c1c4f5675..7bbf12742606060fab4f2f62be8e4e02990ab362 100644 (file)
--- a/drivers/gpu/drm/xe/xe_vm.c
+++ b/drivers/gpu/drm/xe/xe_vm.c
@@ -4212,6 +4212,45 @@ void xe_vm_snapshot_free(struct xe_vm_snapshot *snap)
         kvfree(snap);
  }
  
+/**
+ * xe_vma_need_vram_for_atomic - Check if VMA needs VRAM migration for atomic operations
+ * @xe: Pointer to the XE device structure
+ * @vma: Pointer to the virtual memory area (VMA) structure
+ * @is_atomic: In pagefault path and atomic operation
+ *
+ * This function determines whether the given VMA needs to be migrated to
+ * VRAM in order to do atomic GPU operation.
+ *
+ * Return:
+ *   1        - Migration to VRAM is required
+ *   0        - Migration is not required
+ *   -EACCES  - Invalid access for atomic memory attr
+ *
+ */
+int xe_vma_need_vram_for_atomic(struct xe_device *xe, struct xe_vma *vma, bool is_atomic)
+{
+       if (!IS_DGFX(xe) || !is_atomic)
+               return 0;
+
+       /*
+        * NOTE: The checks implemented here are platform-specific. For
+        * instance, on a device supporting CXL atomics, these would ideally
+        * work universally without additional handling.
+        */
+       switch (vma->attr.atomic_access) {
+       case DRM_XE_ATOMIC_DEVICE:
+               return !xe->info.has_device_atomics_on_smem;
+
+       case DRM_XE_ATOMIC_CPU:
+               return -EACCES;
+
+       case DRM_XE_ATOMIC_UNDEFINED:
+       case DRM_XE_ATOMIC_GLOBAL:
+       default:
+               return 1;
+       }
+}
+
  /**
   * xe_vm_alloc_madvise_vma - Allocate VMA's with madvise ops
   * @vm: Pointer to the xe_vm structure
diff --git a/drivers/gpu/drm/xe/xe_vm.h b/drivers/gpu/drm/xe/xe_vm.h

index ccc549e39cfc835402f87f7c8f410388449a5e0e..dbb1bf3caf2deeaf85499a3ea0225ff429b738c6 100644 (file)
--- a/drivers/gpu/drm/xe/xe_vm.h
+++ b/drivers/gpu/drm/xe/xe_vm.h
@@ -171,6 +171,8 @@ static inline bool xe_vma_is_userptr(struct xe_vma *vma)
  
  struct xe_vma *xe_vm_find_vma_by_addr(struct xe_vm *vm, u64 page_addr);
  
+int xe_vma_need_vram_for_atomic(struct xe_device *xe, struct xe_vma *vma, bool is_atomic);
+
  int xe_vm_alloc_madvise_vma(struct xe_vm *vm, uint64_t addr, uint64_t size);
  
  /**
diff --git a/drivers/gpu/drm/xe/xe_vm_madvise.c b/drivers/gpu/drm/xe/xe_vm_madvise.c

index b861c3349b0afefa4615b3f4bddfbe99df03d1b3..95258bb6a8eef252946ff8e6f30e3600a95369cb 100644 (file)
--- a/drivers/gpu/drm/xe/xe_vm_madvise.c
+++ b/drivers/gpu/drm/xe/xe_vm_madvise.c
@@ -85,7 +85,20 @@ static void madvise_atomic(struct xe_device *xe, struct xe_vm *vm,
                            struct xe_vma **vmas, int num_vmas,
                            struct drm_xe_madvise *op)
  {
-       /* Implementation pending */
+       int i;
+
+       xe_assert(vm->xe, op->type == DRM_XE_MEM_RANGE_ATTR_ATOMIC);
+       xe_assert(vm->xe, op->atomic.val <= DRM_XE_ATOMIC_CPU);
+
+       for (i = 0; i < num_vmas; i++) {
+               if ((xe_vma_is_userptr(vmas[i]) &&
+                    !(op->atomic.val == DRM_XE_ATOMIC_DEVICE &&
+                      xe->info.has_device_atomics_on_smem)))
+                       continue;
+
+               vmas[i]->attr.atomic_access = op->atomic.val;
+       /*TODO: handle bo backed vmas */
+       }
  }
  
  static void madvise_pat_index(struct xe_device *xe, struct xe_vm *vm,
author	Himal Prasad Ghimiray <himal.prasad.ghimiray@intel.com>
	Thu, 21 Aug 2025 17:30:53 +0000 (23:00 +0530)
committer	Himal Prasad Ghimiray <himal.prasad.ghimiray@intel.com>
	Tue, 26 Aug 2025 05:55:36 +0000 (11:25 +0530)
drivers/gpu/drm/xe/xe_pt.c		patch \| blob \| blame \| history
drivers/gpu/drm/xe/xe_svm.c		patch \| blob \| blame \| history
drivers/gpu/drm/xe/xe_vm.c		patch \| blob \| blame \| history
drivers/gpu/drm/xe/xe_vm.h		patch \| blob \| blame \| history
drivers/gpu/drm/xe/xe_vm_madvise.c		patch \| blob \| blame \| history