[PATCH] drm/xe: Convert USM lock to rwsem
Matthew Auld
matthew.auld at intel.com
Wed Sep 18 07:56:26 UTC 2024
On 18/09/2024 06:44, Matthew Brost wrote:
> Remove contention from GPU fault path for ASID->VM lookup.
>
> Signed-off-by: Matthew Brost <matthew.brost at intel.com>
> ---
> drivers/gpu/drm/xe/xe_device.c | 4 +---
> drivers/gpu/drm/xe/xe_device_types.h | 2 +-
> drivers/gpu/drm/xe/xe_gt_pagefault.c | 8 ++++----
> drivers/gpu/drm/xe/xe_vm.c | 8 ++++----
> 4 files changed, 10 insertions(+), 12 deletions(-)
>
> diff --git a/drivers/gpu/drm/xe/xe_device.c b/drivers/gpu/drm/xe/xe_device.c
> index 4d3c794f134c..38eade07a004 100644
> --- a/drivers/gpu/drm/xe/xe_device.c
> +++ b/drivers/gpu/drm/xe/xe_device.c
> @@ -335,9 +335,7 @@ struct xe_device *xe_device_create(struct pci_dev *pdev,
>
> init_waitqueue_head(&xe->ufence_wq);
>
> - err = drmm_mutex_init(&xe->drm, &xe->usm.lock);
> - if (err)
> - goto err;
> + init_rwsem(&xe->usm.lock);
>
> xa_init_flags(&xe->usm.asid_to_vm, XA_FLAGS_ALLOC);
>
> diff --git a/drivers/gpu/drm/xe/xe_device_types.h b/drivers/gpu/drm/xe/xe_device_types.h
> index c92df0a2423f..4507a5756a05 100644
> --- a/drivers/gpu/drm/xe/xe_device_types.h
> +++ b/drivers/gpu/drm/xe/xe_device_types.h
> @@ -395,7 +395,7 @@ struct xe_device {
> /** @usm.next_asid: next ASID, used to cyclical alloc asids */
> u32 next_asid;
> /** @usm.lock: protects UM state */
> - struct mutex lock;
> + struct rw_semaphore lock;
> } usm;
>
> /** @pinned: pinned BO state */
> diff --git a/drivers/gpu/drm/xe/xe_gt_pagefault.c b/drivers/gpu/drm/xe/xe_gt_pagefault.c
> index 00af059a8971..5c3af2bb5402 100644
> --- a/drivers/gpu/drm/xe/xe_gt_pagefault.c
> +++ b/drivers/gpu/drm/xe/xe_gt_pagefault.c
> @@ -198,13 +198,13 @@ static int handle_pagefault(struct xe_gt *gt, struct pagefault *pf)
> return -EFAULT;
>
> /* ASID to VM */
> - mutex_lock(&xe->usm.lock);
> + down_read(&xe->usm.lock);
> vm = xa_load(&xe->usm.asid_to_vm, pf->asid);
> if (vm && xe_vm_in_fault_mode(vm))
> xe_vm_get(vm);
> else
> vm = NULL;
> - mutex_unlock(&xe->usm.lock);
> + up_read(&xe->usm.lock);
> if (!vm)
> return -EINVAL;
>
> @@ -549,11 +549,11 @@ static int handle_acc(struct xe_gt *gt, struct acc *acc)
> return -EINVAL;
>
> /* ASID to VM */
> - mutex_lock(&xe->usm.lock);
> + down_read(&xe->usm.lock);
> vm = xa_load(&xe->usm.asid_to_vm, acc->asid);
> if (vm)
> xe_vm_get(vm);
> - mutex_unlock(&xe->usm.lock);
> + up_read(&xe->usm.lock);
> if (!vm || !xe_vm_in_fault_mode(vm))
> return -EINVAL;
Looks like we potentially leak the vm here: if the lookup succeeds but the
VM is not in fault mode, we return -EINVAL without dropping the reference
taken under the lock by xe_vm_get(). Could maybe make this the same as
above, i.e. do the xe_vm_in_fault_mode() check inside the locked section?
Maybe even a small helper shared by both fault paths.
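Something along these lines, say (completely untested, and the
asid_to_vm() name is just for illustration):

static struct xe_vm *asid_to_vm(struct xe_device *xe, u32 asid)
{
	struct xe_vm *vm;

	/* Read side is enough; the fault path only looks up the VM. */
	down_read(&xe->usm.lock);
	vm = xa_load(&xe->usm.asid_to_vm, asid);
	if (vm && xe_vm_in_fault_mode(vm))
		xe_vm_get(vm);	/* caller drops this via xe_vm_put() */
	else
		vm = ERR_PTR(-EINVAL);
	up_read(&xe->usm.lock);

	return vm;
}

Both handle_pagefault() and handle_acc() could then just do
vm = asid_to_vm(xe, asid); and bail out on IS_ERR(vm), which also keeps
the fault-mode check under the lock.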
Anyway,
Reviewed-by: Matthew Auld <matthew.auld at intel.com>
>
> diff --git a/drivers/gpu/drm/xe/xe_vm.c b/drivers/gpu/drm/xe/xe_vm.c
> index 7acd5fc9d032..a3d7cb7cfd22 100644
> --- a/drivers/gpu/drm/xe/xe_vm.c
> +++ b/drivers/gpu/drm/xe/xe_vm.c
> @@ -1613,7 +1613,7 @@ void xe_vm_close_and_put(struct xe_vm *vm)
>
> up_write(&vm->lock);
>
> - mutex_lock(&xe->usm.lock);
> + down_write(&xe->usm.lock);
> if (vm->usm.asid) {
> void *lookup;
>
> @@ -1623,7 +1623,7 @@ void xe_vm_close_and_put(struct xe_vm *vm)
> lookup = xa_erase(&xe->usm.asid_to_vm, vm->usm.asid);
> xe_assert(xe, lookup == vm);
> }
> - mutex_unlock(&xe->usm.lock);
> + up_write(&xe->usm.lock);
>
> for_each_tile(tile, xe, id)
> xe_range_fence_tree_fini(&vm->rftree[id]);
> @@ -1772,11 +1772,11 @@ int xe_vm_create_ioctl(struct drm_device *dev, void *data,
> goto err_close_and_put;
>
> if (xe->info.has_asid) {
> - mutex_lock(&xe->usm.lock);
> + down_write(&xe->usm.lock);
> err = xa_alloc_cyclic(&xe->usm.asid_to_vm, &asid, vm,
> XA_LIMIT(1, XE_MAX_ASID - 1),
> &xe->usm.next_asid, GFP_KERNEL);
> - mutex_unlock(&xe->usm.lock);
> + up_write(&xe->usm.lock);
> if (err < 0)
> goto err_free_id;
>