[PATCH 1/4] Revert "drm/amdkfd: Fix sdma queue allocate race condition"
Yang, Philip
Philip.Yang at amd.com
Sat Jun 15 01:50:27 UTC 2019
I just realized that the previous patch has an issue. The new patch is simple and
looks good to me.
This series is Reviewed-by: Philip.Yang <philip.yang at amd.com>
On 2019-06-14 9:27 p.m., Zeng, Oak wrote:
> This reverts commit 0a7c7281bdaae8cf63d77be26a4b46128114bdec.
> This fix is not correct. allocate_mqd can't be moved before
> allocate_sdma_queue, as it depends on q->properties.sdma_id,
> which is set later.
>
> Change-Id: If4934afebda8cf37dfcde9b50ce53643d526584d
> Signed-off-by: Oak Zeng <Oak.Zeng at amd.com>
> ---
> .../gpu/drm/amd/amdkfd/kfd_device_queue_manager.c | 26 ++++++++++++----------
> 1 file changed, 14 insertions(+), 12 deletions(-)
>
> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.c b/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.c
> index 250798b..d566c26 100644
> --- a/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.c
> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.c
> @@ -1133,27 +1133,23 @@ static int create_queue_cpsch(struct device_queue_manager *dqm, struct queue *q,
> if (dqm->total_queue_count >= max_num_of_queues_per_device) {
> pr_warn("Can't create new usermode queue because %d queues were already created\n",
> dqm->total_queue_count);
> - return -EPERM;
> + retval = -EPERM;
> + goto out;
> }
>
> - mqd_mgr = dqm->mqd_mgrs[get_mqd_type_from_queue_type(
> - q->properties.type)];
> - q->mqd_mem_obj = mqd_mgr->allocate_mqd(mqd_mgr->dev, &q->properties);
> - if (!q->mqd_mem_obj)
> - return -ENOMEM;
> -
> - dqm_lock(dqm);
> if (q->properties.type == KFD_QUEUE_TYPE_SDMA ||
> q->properties.type == KFD_QUEUE_TYPE_SDMA_XGMI) {
> retval = allocate_sdma_queue(dqm, q);
> if (retval)
> - goto out_unlock;
> + goto out;
> }
>
> retval = allocate_doorbell(qpd, q);
> if (retval)
> goto out_deallocate_sdma_queue;
>
> + mqd_mgr = dqm->mqd_mgrs[get_mqd_type_from_queue_type(
> + q->properties.type)];
> /*
> * Eviction state logic: mark all queues as evicted, even ones
> * not currently active. Restoring inactive queues later only
> @@ -1165,8 +1161,14 @@ static int create_queue_cpsch(struct device_queue_manager *dqm, struct queue *q,
> dqm->asic_ops.init_sdma_vm(dqm, q, qpd);
> q->properties.tba_addr = qpd->tba_addr;
> q->properties.tma_addr = qpd->tma_addr;
> + q->mqd_mem_obj = mqd_mgr->allocate_mqd(mqd_mgr->dev, &q->properties);
> + if (!q->mqd_mem_obj) {
> + retval = -ENOMEM;
> + goto out_deallocate_doorbell;
> + }
> mqd_mgr->init_mqd(mqd_mgr, &q->mqd, q->mqd_mem_obj,
> &q->gart_mqd_addr, &q->properties);
> + dqm_lock(dqm);
>
> list_add(&q->list, &qpd->queues_list);
> qpd->queue_count++;
> @@ -1192,13 +1194,13 @@ static int create_queue_cpsch(struct device_queue_manager *dqm, struct queue *q,
> dqm_unlock(dqm);
> return retval;
>
> +out_deallocate_doorbell:
> + deallocate_doorbell(qpd, q);
> out_deallocate_sdma_queue:
> if (q->properties.type == KFD_QUEUE_TYPE_SDMA ||
> q->properties.type == KFD_QUEUE_TYPE_SDMA_XGMI)
> deallocate_sdma_queue(dqm, q);
> -out_unlock:
> - dqm_unlock(dqm);
> - mqd_mgr->free_mqd(mqd_mgr, q->mqd, q->mqd_mem_obj);
> +out:
> return retval;
> }
>
>
More information about the amd-gfx
mailing list