[PATCH 4/6] drm/amdkfd: Record vmid pasid mapping in the driver

Zhao, Yong Yong.Zhao at amd.com
Thu Sep 26 19:01:17 UTC 2019


I agree.

Yong

On 2019-09-26 2:54 p.m., Kuehling, Felix wrote:
> On 2019-09-26 2:38 p.m., Zhao, Yong wrote:
>> This makes possible the vmid pasid mapping query through software.
>>
>> Change-Id: Ib539aae277a227cc39f6469ae23c46c4d289b87b
>> Signed-off-by: Yong Zhao <Yong.Zhao at amd.com>
>> ---
>>    .../drm/amd/amdkfd/kfd_device_queue_manager.c | 34 +++++++++++++------
>>    .../drm/amd/amdkfd/kfd_device_queue_manager.h |  3 +-
>>    2 files changed, 26 insertions(+), 11 deletions(-)
>>
>> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.c b/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.c
>> index e7f0a32e0e44..d006adefef55 100644
>> --- a/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.c
>> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.c
>> @@ -224,20 +224,30 @@ static int allocate_vmid(struct device_queue_manager *dqm,
>>    			struct qcm_process_device *qpd,
>>    			struct queue *q)
>>    {
>> -	int bit, allocated_vmid;
>> +	int idx = -1, allocated_vmid, i;
>>    
>> -	if (dqm->vmid_bitmap == 0)
>> +	for (i = 0; i < dqm->dev->vm_info.vmid_num_kfd; i++) {
>> +		if (!dqm->vmid_pasid[i]) {
>> +			idx = i;
>> +			break;
>> +		}
>> +	}
>> +
>> +	if (idx < 0) {
>> +		pr_err("no more vmid to allocate\n");
>>    		return -ENOMEM;
>> +	}
>> +
>> +	dqm->vmid_pasid[idx] = q->process->pasid;
>>    
>> -	bit = ffs(dqm->vmid_bitmap) - 1;
>> -	dqm->vmid_bitmap &= ~(1 << bit);
>> +	allocated_vmid = idx + dqm->dev->vm_info.first_vmid_kfd;
>> +	pr_debug("vmid allocated: %d\n", allocated_vmid);
>> +
>> +	set_pasid_vmid_mapping(dqm, q->process->pasid, allocated_vmid);
>>    
>> -	allocated_vmid = bit + dqm->dev->vm_info.first_vmid_kfd;
>> -	pr_debug("vmid allocation %d\n", allocated_vmid);
>>    	qpd->vmid = allocated_vmid;
>>    	q->properties.vmid = allocated_vmid;
>>    
>> -	set_pasid_vmid_mapping(dqm, q->process->pasid, q->properties.vmid);
>>    	program_sh_mem_settings(dqm, qpd);
>>    
>>    	/* qpd->page_table_base is set earlier when register_process()
>> @@ -278,7 +288,7 @@ static void deallocate_vmid(struct device_queue_manager *dqm,
>>    				struct qcm_process_device *qpd,
>>    				struct queue *q)
>>    {
>> -	int bit = qpd->vmid - dqm->dev->vm_info.first_vmid_kfd;
>> +	int idx;
>>    
>>    	/* On GFX v7, CP doesn't flush TC at dequeue */
>>    	if (q->device->device_info->asic_family == CHIP_HAWAII)
>> @@ -290,7 +300,9 @@ static void deallocate_vmid(struct device_queue_manager *dqm,
>>    	/* Release the vmid mapping */
>>    	set_pasid_vmid_mapping(dqm, 0, qpd->vmid);
>>    
>> -	dqm->vmid_bitmap |= (1 << bit);
>> +	idx = qpd->vmid - dqm->dev->vm_info.first_vmid_kfd;
>> +	dqm->vmid_pasid[idx] = 0;
>> +
>>    	qpd->vmid = 0;
>>    	q->properties.vmid = 0;
>>    }
>> @@ -1017,7 +1029,8 @@ static int initialize_nocpsch(struct device_queue_manager *dqm)
>>    				dqm->allocated_queues[pipe] |= 1 << queue;
>>    	}
>>    
>> -	dqm->vmid_bitmap = (1 << dqm->dev->vm_info.vmid_num_kfd) - 1;
>> +	dqm->vmid_pasid = kcalloc(dqm->dev->vm_info.vmid_num_kfd,
>> +			sizeof(uint16_t), GFP_KERNEL);
> If you allocate this dynamically, you need to check the return value.
> But see below ...
>
>
>>    	dqm->sdma_bitmap = ~0ULL >> (64 - get_num_sdma_queues(dqm));
>>    	dqm->xgmi_sdma_bitmap = ~0ULL >> (64 - get_num_xgmi_sdma_queues(dqm));
>>    
>> @@ -1030,6 +1043,7 @@ static void uninitialize(struct device_queue_manager *dqm)
>>    
>>    	WARN_ON(dqm->queue_count > 0 || dqm->processes_count > 0);
>>    
>> +	kfree(dqm->vmid_pasid);
>>    	kfree(dqm->allocated_queues);
>>    	for (i = 0 ; i < KFD_MQD_TYPE_MAX ; i++)
>>    		kfree(dqm->mqd_mgrs[i]);
>> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.h b/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.h
>> index eed8f950b663..67b5e5fadd95 100644
>> --- a/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.h
>> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_device_queue_manager.h
>> @@ -188,7 +188,8 @@ struct device_queue_manager {
>>    	unsigned int		*allocated_queues;
>>    	uint64_t		sdma_bitmap;
>>    	uint64_t		xgmi_sdma_bitmap;
>> -	unsigned int		vmid_bitmap;
>> +	/* the pasid mapping for each kfd vmid */
>> +	uint16_t		*vmid_pasid;
> This could be a fixed-size array since the number of user mode VMIDs is
> limited to 15 by the HW. The size of the pointer alone is enough to
> store 4 PASIDs. Add overhead of kmalloc and you don't really save
> anything by allocating this dynamically. It only adds indirection,
> complexity (error handling) and the risk of memory leaks.
>
> Regards,
>     Felix
>
>
>>    	uint64_t		pipelines_addr;
>>    	struct kfd_mem_obj	*pipeline_mem;
>>    	uint64_t		fence_gpu_addr;


More information about the amd-gfx mailing list