[PATCH v2] drm/amdgpu: Protect the validate list with a mutex

Christian König christian.koenig at amd.com
Thu Jun 23 06:31:20 UTC 2022


The mutex must be added to the bo_list structure, not the parser structure.

The parser is only a temporary structure we allocate for the current thread.

Regards,
Christian.

Am 23.06.22 um 06:39 schrieb Luben Tuikov:
> Protect the parser's validate list with a mutex in order to avoid buffer
> object corruption as recorded in the link below.
>
> Cc: Christian König <christian.koenig at amd.com>
> Cc: Alex Deucher <Alexander.Deucher at amd.com>
> Cc: Andrey Grodzovsky <Andrey.Grodzovsky at amd.com>
> Cc: Vitaly Prosyak <Vitaly.Prosyak at amd.com>
> Link: https://gitlab.freedesktop.org/drm/amd/-/issues/2048
> Signed-off-by: Luben Tuikov <luben.tuikov at amd.com>
> ---
>   drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c | 30 ++++++++++++++++++++------
>   drivers/gpu/drm/amd/amdgpu/amdgpu_cs.h |  4 ++++
>   2 files changed, 28 insertions(+), 6 deletions(-)
>
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c b/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c
> index 36ac1f1d11e6b4..0be0bf17c05420 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.c
> @@ -498,6 +498,7 @@ static int amdgpu_cs_parser_bos(struct amdgpu_cs_parser *p,
>   	struct amdgpu_bo *oa;
>   	int r;
>   
> +	mutex_init(&p->mutex_validated);
>   	INIT_LIST_HEAD(&p->validated);
>   
>   	/* p->bo_list could already be assigned if AMDGPU_CHUNK_ID_BO_HANDLES is present */
> @@ -521,13 +522,15 @@ static int amdgpu_cs_parser_bos(struct amdgpu_cs_parser *p,
>   	amdgpu_bo_list_for_each_entry(e, p->bo_list)
>   		e->tv.num_shared = 2;
>   
> -	amdgpu_bo_list_get_list(p->bo_list, &p->validated);
> -
>   	INIT_LIST_HEAD(&duplicates);
> +
> +	mutex_lock(&p->mutex_validated);
> +	amdgpu_bo_list_get_list(p->bo_list, &p->validated);
>   	amdgpu_vm_get_pd_bo(&fpriv->vm, &p->validated, &p->vm_pd);
>   
>   	if (p->uf_entry.tv.bo && !ttm_to_amdgpu_bo(p->uf_entry.tv.bo)->parent)
>   		list_add(&p->uf_entry.tv.head, &p->validated);
> +	mutex_unlock(&p->mutex_validated);
>   
>   	/* Get userptr backing pages. If pages are updated after registered
>   	 * in amdgpu_gem_userptr_ioctl(), amdgpu_cs_list_validate() will do
> @@ -563,8 +566,11 @@ static int amdgpu_cs_parser_bos(struct amdgpu_cs_parser *p,
>   		e->user_invalidated = userpage_invalidated;
>   	}
>   
> +	mutex_lock(&p->mutex_validated);
>   	r = ttm_eu_reserve_buffers(&p->ticket, &p->validated, true,
>   				   &duplicates);
> +	mutex_unlock(&p->mutex_validated);
> +
>   	if (unlikely(r != 0)) {
>   		if (r != -ERESTARTSYS)
>   			DRM_ERROR("ttm_eu_reserve_buffers failed.\n");
> @@ -607,11 +613,15 @@ static int amdgpu_cs_parser_bos(struct amdgpu_cs_parser *p,
>   		goto error_validate;
>   	}
>   
> +	mutex_lock(&p->mutex_validated);
>   	r = amdgpu_cs_list_validate(p, &duplicates);
> -	if (r)
> +	if (r) {
> +		mutex_unlock(&p->mutex_validated);
>   		goto error_validate;
> +	}
>   
>   	r = amdgpu_cs_list_validate(p, &p->validated);
> +	mutex_unlock(&p->mutex_validated);
>   	if (r)
>   		goto error_validate;
>   
> @@ -648,7 +658,9 @@ static int amdgpu_cs_parser_bos(struct amdgpu_cs_parser *p,
>   			dma_fence_chain_free(e->chain);
>   			e->chain = NULL;
>   		}
> +		mutex_lock(&p->mutex_validated);
>   		ttm_eu_backoff_reservation(&p->ticket, &p->validated);
> +		mutex_unlock(&p->mutex_validated);
>   	}
>   
>   out_free_user_pages:
> @@ -670,8 +682,9 @@ static int amdgpu_cs_sync_rings(struct amdgpu_cs_parser *p)
>   {
>   	struct amdgpu_fpriv *fpriv = p->filp->driver_priv;
>   	struct amdgpu_bo_list_entry *e;
> -	int r;
> +	int r = 0;
>   
> +	mutex_lock(&p->mutex_validated);
>   	list_for_each_entry(e, &p->validated, tv.head) {
>   		struct amdgpu_bo *bo = ttm_to_amdgpu_bo(e->tv.bo);
>   		struct dma_resv *resv = bo->tbo.base.resv;
> @@ -682,9 +695,10 @@ static int amdgpu_cs_sync_rings(struct amdgpu_cs_parser *p)
>   		r = amdgpu_sync_resv(p->adev, &p->job->sync, resv, sync_mode,
>   				     &fpriv->vm);
>   		if (r)
> -			return r;
> +			break;
>   	}
> -	return 0;
> +	mutex_unlock(&p->mutex_validated);
> +	return r;
>   }
>   
>   /**
> @@ -709,8 +723,10 @@ static void amdgpu_cs_parser_fini(struct amdgpu_cs_parser *parser, int error,
>   			e->chain = NULL;
>   		}
>   
> +		mutex_lock(&parser->mutex_validated);
>   		ttm_eu_backoff_reservation(&parser->ticket,
>   					   &parser->validated);
> +		mutex_unlock(&parser->mutex_validated);
>   	}
>   
>   	for (i = 0; i < parser->num_post_deps; i++) {
> @@ -1307,7 +1323,9 @@ static int amdgpu_cs_submit(struct amdgpu_cs_parser *p,
>   		e->chain = NULL;
>   	}
>   
> +	mutex_lock(&p->mutex_validated);
>   	ttm_eu_fence_buffer_objects(&p->ticket, &p->validated, p->fence);
> +	mutex_unlock(&p->mutex_validated);
>   	mutex_unlock(&p->adev->notifier_lock);
>   
>   	return 0;
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.h b/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.h
> index 30ecc4917f811d..284d1c03d65d0b 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.h
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_cs.h
> @@ -59,6 +59,10 @@ struct amdgpu_cs_parser {
>   	struct amdgpu_bo_list		*bo_list;
>   	struct amdgpu_mn		*mn;
>   	struct amdgpu_bo_list_entry	vm_pd;
> +
> +	/* Protect access to list "valided" below.
> +	 */
> +	struct mutex                    mutex_validated;
>   	struct list_head		validated;
>   	struct dma_fence		*fence;
>   	uint64_t			bytes_moved_threshold;
>
> base-commit: ab7e60938be74e21c723223e7eb96cac7b441e5e



More information about the amd-gfx mailing list