[PATCH 4/6] drm/amdkfd: Record vmid pasid mapping in the driver
Zhao, Yong
Yong.Zhao at amd.com
Thu Sep 26 19:01:17 UTC 2019
I agree.
Yong
On 2019-09-26 2:54 p.m., Kuehling, Felix wrote:
> On 2019-09-26 2:38 p.m., Zhao, Yong wrote:
>> This makes possible the vmid pasid mapping query through software.
>>
>> Change-Id: Ib539aae277a227cc39f6469ae23c46c4d289b87b
>> Signed-off-by: Yong Zhao <Yong.Zhao at amd.com>
>> ---
>> .../drm/amd/amdkfd/kfd_device_queue_manager.c | 34 +++++++++++++------
>> .../drm/amd/amdkfd/kfd_device_queue_manager.h | 3 +-
>> 2 files changed, 26 insertions(+), 11 deletions(-)
>>
>> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.c b/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.c
>> index e7f0a32e0e44..d006adefef55 100644
>> --- a/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.c
>> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.c
>> @@ -224,20 +224,30 @@ static int allocate_vmid(struct device_queue_manager *dqm,
>> struct qcm_process_device *qpd,
>> struct queue *q)
>> {
>> - int bit, allocated_vmid;
>> + int idx = -1, allocated_vmid, i;
>>
>> - if (dqm->vmid_bitmap == 0)
>> + for (i = 0; i < dqm->dev->vm_info.vmid_num_kfd; i++) {
>> + if (!dqm->vmid_pasid[i]) {
>> + idx = i;
>> + break;
>> + }
>> + }
>> +
>> + if (idx < 0) {
>> + pr_err("no more vmid to allocate\n");
>> return -ENOMEM;
>> + }
>> +
>> + dqm->vmid_pasid[idx] = q->process->pasid;
>>
>> - bit = ffs(dqm->vmid_bitmap) - 1;
>> - dqm->vmid_bitmap &= ~(1 << bit);
>> + allocated_vmid = idx + dqm->dev->vm_info.first_vmid_kfd;
>> + pr_debug("vmid allocated: %d\n", allocated_vmid);
>> +
>> + set_pasid_vmid_mapping(dqm, q->process->pasid, allocated_vmid);
>>
>> - allocated_vmid = bit + dqm->dev->vm_info.first_vmid_kfd;
>> - pr_debug("vmid allocation %d\n", allocated_vmid);
>> qpd->vmid = allocated_vmid;
>> q->properties.vmid = allocated_vmid;
>>
>> - set_pasid_vmid_mapping(dqm, q->process->pasid, q->properties.vmid);
>> program_sh_mem_settings(dqm, qpd);
>>
>> /* qpd->page_table_base is set earlier when register_process()
>> @@ -278,7 +288,7 @@ static void deallocate_vmid(struct device_queue_manager *dqm,
>> struct qcm_process_device *qpd,
>> struct queue *q)
>> {
>> - int bit = qpd->vmid - dqm->dev->vm_info.first_vmid_kfd;
>> + int idx;
>>
>> /* On GFX v7, CP doesn't flush TC at dequeue */
>> if (q->device->device_info->asic_family == CHIP_HAWAII)
>> @@ -290,7 +300,9 @@ static void deallocate_vmid(struct device_queue_manager *dqm,
>> /* Release the vmid mapping */
>> set_pasid_vmid_mapping(dqm, 0, qpd->vmid);
>>
>> - dqm->vmid_bitmap |= (1 << bit);
>> + idx = qpd->vmid - dqm->dev->vm_info.first_vmid_kfd;
>> + dqm->vmid_pasid[idx] = 0;
>> +
>> qpd->vmid = 0;
>> q->properties.vmid = 0;
>> }
>> @@ -1017,7 +1029,8 @@ static int initialize_nocpsch(struct device_queue_manager *dqm)
>> dqm->allocated_queues[pipe] |= 1 << queue;
>> }
>>
>> - dqm->vmid_bitmap = (1 << dqm->dev->vm_info.vmid_num_kfd) - 1;
>> + dqm->vmid_pasid = kcalloc(dqm->dev->vm_info.vmid_num_kfd,
>> + sizeof(uint16_t), GFP_KERNEL);
> If you allocate this dynamically, you need to check the return value.
> But see below ...
>
>
>> dqm->sdma_bitmap = ~0ULL >> (64 - get_num_sdma_queues(dqm));
>> dqm->xgmi_sdma_bitmap = ~0ULL >> (64 - get_num_xgmi_sdma_queues(dqm));
>>
>> @@ -1030,6 +1043,7 @@ static void uninitialize(struct device_queue_manager *dqm)
>>
>> WARN_ON(dqm->queue_count > 0 || dqm->processes_count > 0);
>>
>> + kfree(dqm->vmid_pasid);
>> kfree(dqm->allocated_queues);
>> for (i = 0 ; i < KFD_MQD_TYPE_MAX ; i++)
>> kfree(dqm->mqd_mgrs[i]);
>> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.h b/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.h
>> index eed8f950b663..67b5e5fadd95 100644
>> --- a/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.h
>> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.h
>> @@ -188,7 +188,8 @@ struct device_queue_manager {
>> unsigned int *allocated_queues;
>> uint64_t sdma_bitmap;
>> uint64_t xgmi_sdma_bitmap;
>> - unsigned int vmid_bitmap;
>> + /* the pasid mapping for each kfd vmid */
>> + uint16_t *vmid_pasid;
> This could be a fixed-size array since the number of user mode VMIDs is
> limited to 15 by the HW. The size of the pointer alone is enough to
> store 4 PASIDs. Add overhead of kmalloc and you don't really save
> anything by allocating this dynamically. It only adds indirection,
> complexity (error handling) and the risk of memory leaks.
>
> Regards,
> Felix
>
>
>> uint64_t pipelines_addr;
>> struct kfd_mem_obj *pipeline_mem;
>> uint64_t fence_gpu_addr;
More information about the amd-gfx
mailing list