#include <linux/mm.h>
+#include "xe_tlb_inval.h"
#include "xe_trace_bo.h"
static void xe_userptr_assert_in_notifier(struct xe_vm *vm)
&ctx);
}
-static void xe_vma_userptr_do_inval(struct xe_vm *vm, struct xe_userptr_vma *uvma,
- bool is_deferred)
+static struct mmu_interval_notifier_finish *
+xe_vma_userptr_do_inval(struct xe_vm *vm, struct xe_userptr_vma *uvma, bool is_deferred)
{
struct xe_userptr *userptr = &uvma->userptr;
struct xe_vma *vma = &uvma->vma;
long err;
xe_userptr_assert_in_notifier(vm);
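+ /*
+ * When called for the deferred leg (is_deferred), @finish must already
+ * be marked in use and no TLB invalidation may be pending yet.
+ */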
+ if (is_deferred)
+ xe_assert(vm->xe, userptr->finish_inuse && !userptr->tlb_inval_submitted);
err = dma_resv_wait_timeout(xe_vm_resv(vm),
DMA_RESV_USAGE_BOOKKEEP,
XE_WARN_ON(err <= 0);
if (xe_vm_in_fault_mode(vm) && userptr->initial_bind) {
+ if (!userptr->finish_inuse) {
+ /*
+ * Defer the TLB wait to an extra pass so the caller
+ * can pipeline TLB flushes across GPUs before waiting
+ * on any of them.
+ */
+ xe_assert(vm->xe, !userptr->tlb_inval_submitted);
+ userptr->finish_inuse = true;
+ userptr->tlb_inval_submitted = true;
+ err = xe_vm_invalidate_vma_submit(vma, &userptr->inval_batch);
+ XE_WARN_ON(err);
+ return &userptr->finish;
+ }
err = xe_vm_invalidate_vma(vma);
XE_WARN_ON(err);
}
userptr->finish_inuse = false;
drm_gpusvm_unmap_pages(&vm->svm.gpusvm, &uvma->userptr.pages,
xe_vma_size(vma) >> PAGE_SHIFT, &ctx);
+ return NULL;
+}
+
+static void
+xe_vma_userptr_complete_tlb_inval(struct xe_vm *vm, struct xe_userptr_vma *uvma)
+{
+ struct xe_userptr *userptr = &uvma->userptr;
+ struct xe_vma *vma = &uvma->vma;
+ struct drm_gpusvm_ctx ctx = {
+ .in_notifier = true,
+ .read_only = xe_vma_read_only(vma),
+ };
+
+ xe_userptr_assert_in_notifier(vm);
+ xe_assert(vm->xe, userptr->finish_inuse);
+ xe_assert(vm->xe, userptr->tlb_inval_submitted);
+
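+ /* Wait for the TLB invalidation submitted in an earlier pass. */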
+ xe_tlb_inval_batch_wait(&userptr->inval_batch);
+ userptr->tlb_inval_submitted = false;
+ userptr->finish_inuse = false;
+ drm_gpusvm_unmap_pages(&vm->svm.gpusvm, &uvma->userptr.pages,
+ xe_vma_size(vma) >> PAGE_SHIFT, &ctx);
}
static struct mmu_interval_notifier_finish *
* If it's already in use, or all fences are already signaled,
* proceed directly to invalidation without deferring.
*/
- if (signaled || userptr->finish_inuse) {
- xe_vma_userptr_do_inval(vm, uvma, false);
- return NULL;
- }
+ if (signaled || userptr->finish_inuse)
+ return xe_vma_userptr_do_inval(vm, uvma, false);
+ /* Defer: the notifier core will call invalidate_finish once done. */
userptr->finish_inuse = true;
return &userptr->finish;
xe_vma_start(vma), xe_vma_size(vma));
down_write(&vm->svm.gpusvm.notifier_lock);
- xe_vma_userptr_do_inval(vm, uvma, true);
+ /*
+ * If pass1 already submitted a TLB invalidation (deferring only the
+ * wait), wait for it to complete and unmap the pages. Otherwise the
+ * fences have now signaled: invalidate the TLB and unmap.
+ */
+ if (uvma->userptr.tlb_inval_submitted)
+ xe_vma_userptr_complete_tlb_inval(vm, uvma);
+ else
+ xe_vma_userptr_do_inval(vm, uvma, true);
up_write(&vm->svm.gpusvm.notifier_lock);
trace_xe_vma_userptr_invalidate_complete(vma);
}
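+ /*
+ * Here pass1 and any deferred work run back to back: if pass1 defers,
+ * perform the invalidation now and wait for any submitted TLB flush.
+ */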
finish = xe_vma_userptr_invalidate_pass1(vm, uvma);
if (finish)
- xe_vma_userptr_do_inval(vm, uvma, true);
+ finish = xe_vma_userptr_do_inval(vm, uvma, true);
+ if (finish)
+ xe_vma_userptr_complete_tlb_inval(vm, uvma);
}
#endif
#include <drm/drm_gpusvm.h>
+#include "xe_tlb_inval_types.h"
+
struct xe_vm;
struct xe_vma;
struct xe_userptr_vma;
* alternatively by the same lock in read mode *and* the vm resv held.
*/
struct mmu_interval_notifier_finish finish;
+ /**
+ * @inval_batch: TLB invalidation batch for deferred completion.
+ * Stores an in-flight TLB invalidation submitted during a two-pass
+ * notifier invalidation so the wait can be deferred to a later pass,
+ * allowing TLB invalidations to be submitted to multiple GPUs before
+ * any of them are waited on.
+ * Protected using the same locking as @finish.
+ */
+ struct xe_tlb_inval_batch inval_batch;
/**
* @finish_inuse: Whether @finish is currently in use by an in-progress
* two-pass invalidation.
* Protected using the same locking as @finish.
*/
bool finish_inuse;
+ /**
+ * @tlb_inval_submitted: Whether a TLB invalidation has been submitted
+ * via @inval_batch and is pending completion. When set, the next pass
+ * must call xe_tlb_inval_batch_wait() before reusing @inval_batch.
+ * Protected using the same locking as @finish.
+ */
+ bool tlb_inval_submitted;
/**
* @initial_bind: user pointer has been bound at least once.
* write: vm->svm.gpusvm.notifier_lock in read mode and vm->resv held.
}
/**
- * xe_vm_invalidate_vma - invalidate GPU mappings for VMA without a lock
+ * xe_vm_invalidate_vma_submit - Submit a job to invalidate GPU mappings for
+ * a VMA.
* @vma: VMA to invalidate
+ * @batch: TLB invalidation batch to populate; caller must later call
+ * xe_tlb_inval_batch_wait() on it to wait for completion
*
* Walks a list of page tables leaves which it memset the entries owned by this
- * VMA to zero, invalidates the TLBs, and block until TLBs invalidation is
- * complete.
+ * VMA to zero and invalidates the TLBs, but does not block waiting for the
+ * TLB flush to complete; instead it populates @batch, which can be waited on
+ * using xe_tlb_inval_batch_wait().
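+ *
+ * Illustrative usage (a minimal sketch; this mirrors what the
+ * xe_vm_invalidate_vma() wrapper does):
+ *
+ *   struct xe_tlb_inval_batch batch;
+ *   int err;
+ *
+ *   err = xe_vm_invalidate_vma_submit(vma, &batch);
+ *   if (!err)
+ *     xe_tlb_inval_batch_wait(&batch);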
*
* Returns 0 for success, negative error code otherwise.
*/
-int xe_vm_invalidate_vma(struct xe_vma *vma)
+int xe_vm_invalidate_vma_submit(struct xe_vma *vma, struct xe_tlb_inval_batch *batch)
{
struct xe_device *xe = xe_vma_vm(vma)->xe;
struct xe_vm *vm = xe_vma_vm(vma);
- struct xe_tlb_inval_batch batch;
struct xe_tile *tile;
u8 tile_mask = 0;
int ret = 0;
ret = xe_tlb_inval_range_tilemask_submit(xe, xe_vma_vm(vma)->usm.asid,
xe_vma_start(vma), xe_vma_end(vma),
- tile_mask, &batch);
+ tile_mask, batch);
/* WRITE_ONCE pairs with READ_ONCE in xe_vm_has_valid_gpu_mapping() */
WRITE_ONCE(vma->tile_invalidated, vma->tile_mask);
- if (!ret)
- xe_tlb_inval_batch_wait(&batch);
+ return ret;
+}
+
+/**
+ * xe_vm_invalidate_vma - invalidate GPU mappings for VMA without a lock
+ * @vma: VMA to invalidate
+ *
+ * Walks a list of page table leaves, zeroing the entries owned by this VMA,
+ * invalidates the TLBs, and blocks until the TLB invalidation is complete.
+ *
+ * Returns 0 for success, negative error code otherwise.
+ */
+int xe_vm_invalidate_vma(struct xe_vma *vma)
+{
+ struct xe_tlb_inval_batch batch;
+ int ret;
+
+ ret = xe_vm_invalidate_vma_submit(vma, &batch);
+ if (ret)
+ return ret;
+
+ xe_tlb_inval_batch_wait(&batch);
return ret;
}