[PATCH v2 5/7] drm/xe: Move vma rebinding to the drm_exec locking loop
Matthew Brost
matthew.brost at intel.com
Fri Mar 22 18:30:54 UTC 2024
On Fri, Mar 22, 2024 at 10:02:11AM +0100, Thomas Hellström wrote:
> Rebinding might allocate page-table bos, causing evictions.
> To support blocking locking during these evictions,
> perform the rebinding in the drm_exec locking loop.
>
> v2:
> - Remove a leftover call to xe_vm_rebind() (Matt Brost)
> - Add a helper function xe_vm_validate_rebind() (Matt Brost)
>
> Fixes: 24f947d58fe5 ("drm/xe: Use DRM GPUVM helpers for external- and evicted objects")
> Signed-off-by: Thomas Hellström <thomas.hellstrom at linux.intel.com>
> ---
> drivers/gpu/drm/xe/xe_exec.c | 24 ++--------------
> drivers/gpu/drm/xe/xe_vm.c | 55 +++++++++++++++++++++++++++---------
> drivers/gpu/drm/xe/xe_vm.h | 3 ++
> 3 files changed, 47 insertions(+), 35 deletions(-)
>
> diff --git a/drivers/gpu/drm/xe/xe_exec.c b/drivers/gpu/drm/xe/xe_exec.c
> index 397a49b731f1..f442ef495235 100644
> --- a/drivers/gpu/drm/xe/xe_exec.c
> +++ b/drivers/gpu/drm/xe/xe_exec.c
> @@ -96,21 +96,9 @@
>
> static int xe_exec_fn(struct drm_gpuvm_exec *vm_exec)
> {
> - struct drm_gem_object *obj;
> - unsigned long index;
> - int ret;
> -
> - ret = drm_gpuvm_validate(vm_exec->vm, &vm_exec->exec);
> - if (ret)
> - return ret;
> -
> - drm_exec_for_each_locked_object(&vm_exec->exec, index, obj) {
> - ret = dma_resv_reserve_fences(obj->resv, 1);
> - if (ret)
> - return ret;
> - }
> + struct xe_vm *vm = container_of(vm_exec->vm, struct xe_vm, gpuvm);
>
> - return 0;
Same comment as previous patch, maybe reorder these two / squash if you
think that is required + have a comment here.
> + return xe_vm_validate_rebind(vm, &vm_exec->exec, 1);
> }
>
> int xe_exec_ioctl(struct drm_device *dev, void *data, struct drm_file *file)
> @@ -264,14 +252,6 @@ int xe_exec_ioctl(struct drm_device *dev, void *data, struct drm_file *file)
> goto err_exec;
> }
>
> - /*
> - * Rebind any invalidated userptr or evicted BOs in the VM, non-compute
> - * VM mode only.
> - */
> - err = xe_vm_rebind(vm, false);
> - if (err)
> - goto err_put_job;
> -
> /* Wait behind rebinds */
> if (!xe_vm_in_lr_mode(vm)) {
> err = drm_sched_job_add_resv_dependencies(&job->drm,
> diff --git a/drivers/gpu/drm/xe/xe_vm.c b/drivers/gpu/drm/xe/xe_vm.c
> index 6aefd6602310..b1d0df178a2d 100644
> --- a/drivers/gpu/drm/xe/xe_vm.c
> +++ b/drivers/gpu/drm/xe/xe_vm.c
> @@ -482,11 +482,50 @@ static int xe_gpuvm_validate(struct drm_gpuvm_bo *vm_bo, struct drm_exec *exec)
> return 0;
> }
>
> -static int xe_preempt_work_begin(struct drm_exec *exec, struct xe_vm *vm,
> - bool *done)
> +/**
> + * xe_vm_validate_rebind() - Validate buffer objects and rebind vmas
> + * @vm: The vm for which we are rebinding.
> + * @exec: The struct drm_exec with the locked GEM objects.
> + * @num_fences: The number of fences to reserve for the operation, not
> + * including rebinds and validations.
> + *
> + * Validates all evicted gem objects and rebinds their vmas. Note that
> + * rebindings may cause evictions and hence the validation-rebind
> + * sequence is rerun until there are no more objects to validate.
> + *
> + * Return: 0 on success, negative error code on error. In particular,
> + * may return -EINTR or -ERESTARTSYS if interrupted, and -EDEADLK if
> + * the drm_exec transaction needs to be restarted.
> + */
> +int xe_vm_validate_rebind(struct xe_vm *vm, struct drm_exec *exec,
> + unsigned int num_fences)
> {
> struct drm_gem_object *obj;
> unsigned long index;
> + int ret;
> +
> + do {
> + ret = drm_gpuvm_validate(&vm->gpuvm, exec);
> + if (ret)
> + return ret;
> +
> + ret = xe_vm_rebind(vm, false);
> + if (ret)
> + return ret;
> + } while (!list_empty(&vm->gpuvm.evict.list));
> +
> + drm_exec_for_each_locked_object(exec, index, obj) {
> + ret = dma_resv_reserve_fences(obj->resv, num_fences);
> + if (ret)
> + return ret;
> + }
> +
> + return 0;
> +}
> +
> +static int xe_preempt_work_begin(struct drm_exec *exec, struct xe_vm *vm,
> + bool *done)
> +{
> int err;
>
> err = drm_gpuvm_prepare_vm(&vm->gpuvm, exec, 0);
> @@ -512,17 +551,7 @@ static int xe_preempt_work_begin(struct drm_exec *exec, struct xe_vm *vm,
> if (err)
> return err;
>
> - err = drm_gpuvm_validate(&vm->gpuvm, exec);
> - if (err)
> - return err;
> -
> - drm_exec_for_each_locked_object(exec, index, obj) {
> - err = dma_resv_reserve_fences(obj->resv, vm->preempt.num_exec_queues);
> - if (err)
> - return err;
> - }
> -
> - return 0;
Same goes here wrt a comment, it wouldn't hurt to have one.
With that:
Reviewed-by: Matthew Brost <matthew.brost at intel.com>
> + return xe_vm_validate_rebind(vm, exec, vm->preempt.num_exec_queues);
> }
>
> static void preempt_rebind_work_func(struct work_struct *w)
> diff --git a/drivers/gpu/drm/xe/xe_vm.h b/drivers/gpu/drm/xe/xe_vm.h
> index 20009d8b4702..306cd0934a19 100644
> --- a/drivers/gpu/drm/xe/xe_vm.h
> +++ b/drivers/gpu/drm/xe/xe_vm.h
> @@ -244,6 +244,9 @@ int xe_analyze_vm(struct drm_printer *p, struct xe_vm *vm, int gt_id);
>
> int xe_vm_lock_vma(struct drm_exec *exec, struct xe_vma *vma);
>
> +int xe_vm_validate_rebind(struct xe_vm *vm, struct drm_exec *exec,
> + unsigned int num_fences);
> +
> /**
> * xe_vm_resv() - Return's the vm's reservation object
> * @vm: The vm
> --
> 2.44.0
>
More information about the Intel-xe
mailing list