if (r)
return r;
- r = amdgpu_sync_vm_fence(&p->job->sync, fpriv->prt_va->last_pt_update);
+ r = amdgpu_sync_fence(&p->job->sync, fpriv->prt_va->last_pt_update);
if (r)
return r;
if (r)
return r;
- r = amdgpu_sync_vm_fence(&p->job->sync, bo_va->last_pt_update);
+ r = amdgpu_sync_fence(&p->job->sync, bo_va->last_pt_update);
if (r)
return r;
}
if (r)
return r;
- r = amdgpu_sync_vm_fence(&p->job->sync, bo_va->last_pt_update);
+ r = amdgpu_sync_fence(&p->job->sync, bo_va->last_pt_update);
if (r)
return r;
}
if (r)
return r;
- r = amdgpu_sync_vm_fence(&p->job->sync, vm->last_update);
+ r = amdgpu_sync_fence(&p->job->sync, vm->last_update);
if (r)
return r;
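The hunks above drop the dedicated amdgpu_sync_vm_fence() path: page-table update fences are now added to the job with the plain amdgpu_sync_fence() call, and whether a VM TLB flush is needed is decided from the per-VM tlb_seq counter introduced further down instead of the sync object's last_vm_update sequence number. Below is a stand-alone userspace C sketch of that pattern, not driver code; the names vm_ctx, vm_id, on_update_done and submit_job are invented for illustration. A monotonically increasing per-VM counter is bumped when a page-table update completes, and a submitter compares its remembered value against the counter to decide whether it must flush.

#include <stdatomic.h>
#include <stdbool.h>
#include <stdint.h>
#include <stdio.h>

/* Userspace analogue of the per-VM TLB flush sequence. */
struct vm_ctx {
	atomic_uint_fast64_t tlb_seq;	/* bumped whenever PTEs were freed or changed */
};

struct vm_id {
	uint64_t flushed_updates;	/* tlb_seq value at the last flush */
};

/* Called from the "update fence signaled" path, like amdgpu_vm_tlb_seq_cb(). */
static void on_update_done(struct vm_ctx *vm)
{
	atomic_fetch_add(&vm->tlb_seq, 1);
}

/* Called at submission time, like the VMID grabbing code above. */
static bool submit_job(struct vm_ctx *vm, struct vm_id *id)
{
	uint64_t updates = atomic_load(&vm->tlb_seq);
	bool needs_flush = id->flushed_updates < updates;

	if (needs_flush)
		id->flushed_updates = updates;
	return needs_flush;
}

int main(void)
{
	struct vm_ctx vm = { .tlb_seq = 0 };
	struct vm_id id = { .flushed_updates = 0 };

	printf("flush? %d\n", submit_job(&vm, &id));	/* 0: nothing changed */
	on_update_done(&vm);				/* a mapping was torn down */
	printf("flush? %d\n", submit_job(&vm, &id));	/* 1: TLB flush required */
	printf("flush? %d\n", submit_job(&vm, &id));	/* 0: already flushed */
	return 0;
}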
unsigned vmhub = ring->funcs->vmhub;
uint64_t fence_context = adev->fence_context + ring->idx;
bool needs_flush = vm->use_cpu_for_update;
- uint64_t updates = sync->last_vm_update;
+ uint64_t updates = amdgpu_vm_tlb_seq(vm);
int r;
*id = vm->reserved_vmid[vmhub];
unsigned vmhub = ring->funcs->vmhub;
struct amdgpu_vmid_mgr *id_mgr = &adev->vm_manager.id_mgr[vmhub];
uint64_t fence_context = adev->fence_context + ring->idx;
- uint64_t updates = sync->last_vm_update;
+ uint64_t updates = amdgpu_vm_tlb_seq(vm);
int r;
job->vm_needs_flush = vm->use_cpu_for_update;
if (r)
goto error;
- id->flushed_updates = sync->last_vm_update;
+ id->flushed_updates = amdgpu_vm_tlb_seq(vm);
job->vm_needs_flush = true;
}
void amdgpu_sync_create(struct amdgpu_sync *sync)
{
hash_init(sync->fences);
- sync->last_vm_update = 0;
}
/**
return 0;
}
-/**
- * amdgpu_sync_vm_fence - remember to sync to this VM fence
- *
- * @sync: sync object to add fence to
- * @fence: the VM fence to add
- *
- * Add the fence to the sync object and remember it as VM update.
- */
-int amdgpu_sync_vm_fence(struct amdgpu_sync *sync, struct dma_fence *fence)
-{
- if (!fence)
- return 0;
-
- sync->last_vm_update = max(sync->last_vm_update, fence->seqno);
- return amdgpu_sync_fence(sync, fence);
-}
-
/* Determine based on the owner and mode if we should sync to a fence or not */
static bool amdgpu_sync_test_fence(struct amdgpu_device *adev,
enum amdgpu_sync_mode mode,
}
}
- clone->last_vm_update = source->last_vm_update;
-
return 0;
}
*/
struct amdgpu_sync {
DECLARE_HASHTABLE(fences, 4);
- uint64_t last_vm_update;
};
void amdgpu_sync_create(struct amdgpu_sync *sync);
int amdgpu_sync_fence(struct amdgpu_sync *sync, struct dma_fence *f);
-int amdgpu_sync_vm_fence(struct amdgpu_sync *sync, struct dma_fence *fence);
int amdgpu_sync_resv(struct amdgpu_device *adev, struct amdgpu_sync *sync,
struct dma_resv *resv, enum amdgpu_sync_mode mode,
void *owner);
struct dma_fence_cb cb;
};
+/**
+ * struct amdgpu_vm_tlb_seq_cb - Helper to increment the TLB flush sequence
+ */
+struct amdgpu_vm_tlb_seq_cb {
+ /**
+ * @vm: pointer to the amdgpu_vm structure to set the fence sequence on
+ */
+ struct amdgpu_vm *vm;
+
+ /**
+ * @cb: callback
+ */
+ struct dma_fence_cb cb;
+};
+
/**
* amdgpu_vm_set_pasid - manage pasid and vm ptr mapping
*
return r;
}
+/**
+ * amdgpu_vm_tlb_seq_cb - make sure to increment tlb sequence
+ * @fence: unused
+ * @cb: the callback structure
+ *
+ * Increments the tlb sequence to make sure that future CS execute a VM flush.
+ */
+static void amdgpu_vm_tlb_seq_cb(struct dma_fence *fence,
+ struct dma_fence_cb *cb)
+{
+ struct amdgpu_vm_tlb_seq_cb *tlb_cb;
+
+ tlb_cb = container_of(cb, typeof(*tlb_cb), cb);
+ atomic64_inc(&tlb_cb->vm->tlb_seq);
+ kfree(tlb_cb);
+}
+
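The callback recovers its enclosing amdgpu_vm_tlb_seq_cb from the embedded dma_fence_cb with container_of() and frees it afterwards, which is why the structure carries the vm back-pointer next to the callback member. A minimal, self-contained illustration of that embed-and-recover pattern follows; it uses the plain offsetof-based definition of container_of (without the type checking the kernel macro adds), and the names fence_cb, seq_cb and seq_done are invented for the sketch.

#include <stddef.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>

#define container_of(ptr, type, member) \
	((type *)((char *)(ptr) - offsetof(type, member)))

struct fence_cb {			/* stand-in for struct dma_fence_cb */
	void (*func)(struct fence_cb *cb);
};

struct seq_cb {				/* stand-in for struct amdgpu_vm_tlb_seq_cb */
	uint64_t *seq;			/* back-pointer, like tlb_cb->vm */
	struct fence_cb cb;		/* embedded callback member */
};

/* Only the embedded member is handed to the callback, as in the driver. */
static void seq_done(struct fence_cb *cb)
{
	struct seq_cb *sc = container_of(cb, struct seq_cb, cb);

	(*sc->seq)++;
	free(sc);
}

int main(void)
{
	uint64_t seq = 0;
	struct seq_cb *sc = malloc(sizeof(*sc));

	if (!sc)
		return 1;
	sc->seq = &seq;
	sc->cb.func = seq_done;
	sc->cb.func(&sc->cb);		/* "fence signaled": seq is now 1 */
	printf("seq = %llu\n", (unsigned long long)seq);
	return 0;
}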
/**
* amdgpu_vm_bo_update_mapping - update a mapping in the vm page table
*
bool *table_freed)
{
struct amdgpu_vm_update_params params;
+ struct amdgpu_vm_tlb_seq_cb *tlb_cb;
struct amdgpu_res_cursor cursor;
enum amdgpu_sync_mode sync_mode;
int r, idx;
if (!drm_dev_enter(adev_to_drm(adev), &idx))
return -ENODEV;
+ tlb_cb = kmalloc(sizeof(*tlb_cb), GFP_KERNEL);
+ if (!tlb_cb) {
+ r = -ENOMEM;
+ goto error_unlock;
+ }
+
memset(&params, 0, sizeof(params));
params.adev = adev;
params.vm = vm;
amdgpu_vm_eviction_lock(vm);
if (vm->evicting) {
r = -EBUSY;
- goto error_unlock;
+ goto error_free;
}
if (!unlocked && !dma_fence_is_signaled(vm->last_unlocked)) {
r = vm->update_funcs->prepare(&params, resv, sync_mode);
if (r)
- goto error_unlock;
+ goto error_free;
amdgpu_res_first(pages_addr ? NULL : res, offset,
(last - start + 1) * AMDGPU_GPU_PAGE_SIZE, &cursor);
tmp = start + num_entries;
r = amdgpu_vm_ptes_update(&params, start, tmp, addr, flags);
if (r)
- goto error_unlock;
+ goto error_free;
amdgpu_res_next(&cursor, num_entries * AMDGPU_GPU_PAGE_SIZE);
start = tmp;
r = vm->update_funcs->commit(&params, fence);
+ if (!unlocked && (!(flags & AMDGPU_PTE_VALID) || params.table_freed)) {
+ tlb_cb->vm = vm;
+ if (!fence || !*fence ||
+ dma_fence_add_callback(*fence, &tlb_cb->cb,
+ amdgpu_vm_tlb_seq_cb))
+ amdgpu_vm_tlb_seq_cb(NULL, &tlb_cb->cb);
+ tlb_cb = NULL;
+ }
+
if (table_freed)
*table_freed = *table_freed || params.table_freed;
+error_free:
+ kfree(tlb_cb);
+
error_unlock:
amdgpu_vm_eviction_unlock(vm);
drm_dev_exit(idx);
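Worth noting in the hunk above: once dma_fence_add_callback() (or the direct invocation fallback) has consumed tlb_cb, the local pointer is set to NULL, so the shared error_free label can call kfree() unconditionally, since kfree(NULL) is a no-op. A small userspace sketch of the same goto-cleanup idiom follows; free(NULL) is likewise defined to do nothing, and consume and do_update are placeholder names.

#include <stdbool.h>
#include <stdlib.h>

/* Stand-in for handing the allocation to a fence callback. */
static void consume(void *obj)
{
	free(obj);			/* new owner releases it */
}

static int do_update(bool fail_early, bool handoff)
{
	int r = 0;
	char *cb = malloc(64);		/* like the tlb_cb allocation */

	if (!cb)
		return -1;

	if (fail_early) {
		r = -1;
		goto error_free;	/* cb is still ours, freed below */
	}

	if (handoff) {
		consume(cb);		/* ownership transferred */
		cb = NULL;		/* make the common cleanup harmless */
	}

error_free:
	free(cb);			/* free(NULL) is a no-op */
	return r;
}

int main(void)
{
	do_update(true, false);
	do_update(false, true);
	do_update(false, false);
	return 0;
}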
struct drm_sched_entity immediate;
struct drm_sched_entity delayed;
+ /* Sequence number which is incremented whenever a TLB flush is required */
+ atomic64_t tlb_seq;
+
/* Last unlocked submission to the scheduler entities */
struct dma_fence *last_unlocked;
void amdgpu_debugfs_vm_bo_info(struct amdgpu_vm *vm, struct seq_file *m);
#endif
+/**
+ * amdgpu_vm_tlb_seq - return tlb flush sequence number
+ * @vm: the amdgpu_vm structure to query
+ *
+ * Returns the tlb flush sequence number which indicates that the VM TLBs need
+ * to be invalidated whenever the sequence number changes.
+ */
+static inline uint64_t amdgpu_vm_tlb_seq(struct amdgpu_vm *vm)
+{
+ return atomic64_read(&vm->tlb_seq);
+}
+
#endif