[PATCH v5 6/11] drm/amdkfd: Add unmap from GPU SMI event
Felix Kuehling
felix.kuehling at amd.com
Thu Jun 30 14:39:02 UTC 2022
Am 2022-06-28 um 10:50 schrieb Philip Yang:
> Add an SMI event that is reported when an SVM range is unmapped from GPUs:
> either when the range is unmapped from the CPU, or, with XNACK on, from the
> MMU notifier when the range is evicted or migrated.
>
> Signed-off-by: Philip Yang <Philip.Yang at amd.com>
Reviewed-by: Felix Kuehling <Felix.Kuehling at amd.com>
> ---
> drivers/gpu/drm/amd/amdkfd/kfd_smi_events.c | 9 ++++++++
> drivers/gpu/drm/amd/amdkfd/kfd_smi_events.h | 3 +++
> drivers/gpu/drm/amd/amdkfd/kfd_svm.c | 25 +++++++++++++++------
> 3 files changed, 30 insertions(+), 7 deletions(-)
>
> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_smi_events.c b/drivers/gpu/drm/amd/amdkfd/kfd_smi_events.c
> index 3917c38204d0..e5896b7a16dd 100644
> --- a/drivers/gpu/drm/amd/amdkfd/kfd_smi_events.c
> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_smi_events.c
> @@ -318,6 +318,15 @@ void kfd_smi_event_queue_restore_rescheduled(struct mm_struct *mm)
> kfd_unref_process(p);
> }
>
> +void kfd_smi_event_unmap_from_gpu(struct kfd_dev *dev, pid_t pid,
> + unsigned long address, unsigned long last,
> + uint32_t trigger)
> +{
> + kfd_smi_event_add(pid, dev, KFD_SMI_EVENT_UNMAP_FROM_GPU,
> + "%lld -%d @%lx(%lx) %x %d\n", ktime_get_boottime_ns(),
> + pid, address, last - address + 1, dev->id, trigger);
> +}
> +
> int kfd_smi_event_open(struct kfd_dev *dev, uint32_t *fd)
> {
> struct kfd_smi_client *client;
> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_smi_events.h b/drivers/gpu/drm/amd/amdkfd/kfd_smi_events.h
> index b23292637239..76fe4e0ec2d2 100644
> --- a/drivers/gpu/drm/amd/amdkfd/kfd_smi_events.h
> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_smi_events.h
> @@ -46,4 +46,7 @@ void kfd_smi_event_queue_eviction(struct kfd_dev *dev, pid_t pid,
> uint32_t trigger);
> void kfd_smi_event_queue_restore(struct kfd_dev *dev, pid_t pid);
> void kfd_smi_event_queue_restore_rescheduled(struct mm_struct *mm);
> +void kfd_smi_event_unmap_from_gpu(struct kfd_dev *dev, pid_t pid,
> + unsigned long address, unsigned long last,
> + uint32_t trigger);
> #endif
> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_svm.c b/drivers/gpu/drm/amd/amdkfd/kfd_svm.c
> index ddc1e4651919..bf888ae84c92 100644
> --- a/drivers/gpu/drm/amd/amdkfd/kfd_svm.c
> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_svm.c
> @@ -1200,7 +1200,7 @@ svm_range_unmap_from_gpu(struct amdgpu_device *adev, struct amdgpu_vm *vm,
>
> static int
> svm_range_unmap_from_gpus(struct svm_range *prange, unsigned long start,
> - unsigned long last)
> + unsigned long last, uint32_t trigger)
> {
> DECLARE_BITMAP(bitmap, MAX_GPU_INSTANCE);
> struct kfd_process_device *pdd;
> @@ -1232,6 +1232,9 @@ svm_range_unmap_from_gpus(struct svm_range *prange, unsigned long start,
> return -EINVAL;
> }
>
> + kfd_smi_event_unmap_from_gpu(pdd->dev, p->lead_thread->pid,
> + start, last, trigger);
> +
> r = svm_range_unmap_from_gpu(pdd->dev->adev,
> drm_priv_to_vm(pdd->drm_priv),
> start, last, &fence);
> @@ -1759,7 +1762,8 @@ static void svm_range_restore_work(struct work_struct *work)
> */
> static int
> svm_range_evict(struct svm_range *prange, struct mm_struct *mm,
> - unsigned long start, unsigned long last)
> + unsigned long start, unsigned long last,
> + enum mmu_notifier_event event)
> {
> struct svm_range_list *svms = prange->svms;
> struct svm_range *pchild;
> @@ -1804,6 +1808,12 @@ svm_range_evict(struct svm_range *prange, struct mm_struct *mm,
> msecs_to_jiffies(AMDGPU_SVM_RANGE_RESTORE_DELAY_MS));
> } else {
> unsigned long s, l;
> + uint32_t trigger;
> +
> + if (event == MMU_NOTIFY_MIGRATE)
> + trigger = KFD_SVM_UNMAP_TRIGGER_MMU_NOTIFY_MIGRATE;
> + else
> + trigger = KFD_SVM_UNMAP_TRIGGER_MMU_NOTIFY;
>
> pr_debug("invalidate unmap svms 0x%p [0x%lx 0x%lx] from GPUs\n",
> prange->svms, start, last);
> @@ -1812,13 +1822,13 @@ svm_range_evict(struct svm_range *prange, struct mm_struct *mm,
> s = max(start, pchild->start);
> l = min(last, pchild->last);
> if (l >= s)
> - svm_range_unmap_from_gpus(pchild, s, l);
> + svm_range_unmap_from_gpus(pchild, s, l, trigger);
> mutex_unlock(&pchild->lock);
> }
> s = max(start, prange->start);
> l = min(last, prange->last);
> if (l >= s)
> - svm_range_unmap_from_gpus(prange, s, l);
> + svm_range_unmap_from_gpus(prange, s, l, trigger);
> }
>
> return r;
> @@ -2232,6 +2242,7 @@ static void
> svm_range_unmap_from_cpu(struct mm_struct *mm, struct svm_range *prange,
> unsigned long start, unsigned long last)
> {
> + uint32_t trigger = KFD_SVM_UNMAP_TRIGGER_UNMAP_FROM_CPU;
> struct svm_range_list *svms;
> struct svm_range *pchild;
> struct kfd_process *p;
> @@ -2259,14 +2270,14 @@ svm_range_unmap_from_cpu(struct mm_struct *mm, struct svm_range *prange,
> s = max(start, pchild->start);
> l = min(last, pchild->last);
> if (l >= s)
> - svm_range_unmap_from_gpus(pchild, s, l);
> + svm_range_unmap_from_gpus(pchild, s, l, trigger);
> svm_range_unmap_split(mm, prange, pchild, start, last);
> mutex_unlock(&pchild->lock);
> }
> s = max(start, prange->start);
> l = min(last, prange->last);
> if (l >= s)
> - svm_range_unmap_from_gpus(prange, s, l);
> + svm_range_unmap_from_gpus(prange, s, l, trigger);
> svm_range_unmap_split(mm, prange, prange, start, last);
>
> if (unmap_parent)
> @@ -2333,7 +2344,7 @@ svm_range_cpu_invalidate_pagetables(struct mmu_interval_notifier *mni,
> svm_range_unmap_from_cpu(mni->mm, prange, start, last);
> break;
> default:
> - svm_range_evict(prange, mni->mm, start, last);
> + svm_range_evict(prange, mni->mm, start, last, range->event);
> break;
> }
>
More information about the amd-gfx
mailing list