[Intel-gfx] [RFC PATCH] drm/ttm: Allow the driver to resolve a WW transaction rollback
Thomas Hellström
thomas.hellstrom at linux.intel.com
Thu May 25 12:59:19 UTC 2023
On Fri, 2023-05-05 at 16:17 +0200, Thomas Hellström wrote:
> Allow drivers to resolve a WW transaction rollback. This allows for
> 1) Putting a lower-priority transaction to sleep allowing another to
> succeed instead both fighting using trylocks.
> 2) Letting the driver know whether a received -ENOMEM is the result
> of
> competition with another WW transaction, which can be resolved using
> rollback and retry or a real -ENOMEM which should be propagated back
> to user-space as a failure.
>
> Signed-off-by: Thomas Hellström <thomas.hellstrom at linux.intel.com>
Christian, Any objections?
/Thomas
> ---
> drivers/gpu/drm/ttm/ttm_bo.c | 17 +++++++++++++++--
> include/drm/ttm/ttm_bo.h | 2 ++
> 2 files changed, 17 insertions(+), 2 deletions(-)
>
> diff --git a/drivers/gpu/drm/ttm/ttm_bo.c
> b/drivers/gpu/drm/ttm/ttm_bo.c
> index bd5dae4d1624..c3ccbea2be3e 100644
> --- a/drivers/gpu/drm/ttm/ttm_bo.c
> +++ b/drivers/gpu/drm/ttm/ttm_bo.c
> @@ -561,6 +561,10 @@ static int ttm_mem_evict_wait_busy(struct
> ttm_buffer_object *busy_bo,
> if (!busy_bo || !ticket)
> return -EBUSY;
>
> + /* We want to resolve contention before trying to lock again.
> */
> + if (ctx->propagate_edeadlk && ctx->contended_bo)
> + return -EDEADLK;
> +
> if (ctx->interruptible)
> r = dma_resv_lock_interruptible(busy_bo->base.resv,
> ticket);
> @@ -575,7 +579,15 @@ static int ttm_mem_evict_wait_busy(struct
> ttm_buffer_object *busy_bo,
> if (!r)
> dma_resv_unlock(busy_bo->base.resv);
>
> - return r == -EDEADLK ? -EBUSY : r;
> + if (r == -EDEADLK) {
> + if (ctx->propagate_edeadlk) {
> + ttm_bo_get(busy_bo);
> + ctx->contended_bo = busy_bo;
> + }
> + r = -EBUSY;
> + }
> +
> + return r;
> }
>
> int ttm_mem_evict_first(struct ttm_device *bdev,
> @@ -816,7 +828,7 @@ int ttm_bo_mem_space(struct ttm_buffer_object
> *bo,
> goto error;
> }
>
> - ret = -ENOMEM;
> + ret = (ctx->propagate_edeadlk && ctx->contended_bo) ? -
> EDEADLK : -ENOMEM;
> if (!type_found) {
> pr_err(TTM_PFX "No compatible memory type found\n");
> ret = -EINVAL;
> @@ -913,6 +925,7 @@ int ttm_bo_validate(struct ttm_buffer_object *bo,
> if (ret)
> return ret;
> }
> +
> return 0;
> }
> EXPORT_SYMBOL(ttm_bo_validate);
> diff --git a/include/drm/ttm/ttm_bo.h b/include/drm/ttm/ttm_bo.h
> index 8b113c384236..d8e35a794ce5 100644
> --- a/include/drm/ttm/ttm_bo.h
> +++ b/include/drm/ttm/ttm_bo.h
> @@ -181,8 +181,10 @@ struct ttm_operation_ctx {
> bool gfp_retry_mayfail;
> bool allow_res_evict;
> bool force_alloc;
> + bool propagate_edeadlk;
> struct dma_resv *resv;
> uint64_t bytes_moved;
> + struct ttm_buffer_object *contended_bo;
> };
>
> /**
More information about the Intel-gfx
mailing list