[PATCH] drm/amdkfd: correct the SVM DMA device unmap direction

Christian König christian.koenig at amd.com
Wed Nov 6 12:24:14 UTC 2024


Am 05.11.24 um 17:34 schrieb Felix Kuehling:
> On 2024-11-05 06:04, Christian König wrote:
>> Am 05.11.24 um 03:33 schrieb Prike Liang:
>>> The SVM DMA device unmap direction should be same as
>>> the DMA map process.
>>
>> At least of hand that looks like it's only papering over a major 
>> problem.
>>
>> Why are DMA ranges for SVM mapped with a direction in the first 
>> place? That is usually not something we should do.
>
> These are DMA mappings of system memory pages. I guess we're creating 
> DMA mappings only for the access required for the migration, which is 
> not bidirectional. I see we do something similar for userptr mappings 
> depending on whether the GPU mapping is read-only or read-write. Is 
> that wrong for userptrs as well?

I think so, yes. The DMA directions are there to make explicit CPU cache 
management and bounce buffers possible.

Since we shouldn't need or even want either for a cache coherent PCIe 
device we should probably always use BIDIRECTIONAL.

Regards,
Christian.

>
> Regards,
>   Felix
>
>
>>
>> Regards,
>> Christian.
>>
>>>
>>> Signed-off-by: Prike Liang <Prike.Liang at amd.com>
>>> ---
>>>   drivers/gpu/drm/amd/amdkfd/kfd_migrate.c | 4 ++--
>>>   drivers/gpu/drm/amd/amdkfd/kfd_svm.c     | 6 +++---
>>>   drivers/gpu/drm/amd/amdkfd/kfd_svm.h     | 3 ++-
>>>   3 files changed, 7 insertions(+), 6 deletions(-)
>>>
>>> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_migrate.c 
>>> b/drivers/gpu/drm/amd/amdkfd/kfd_migrate.c
>>> index eacfeb32f35d..9d83bb9dd004 100644
>>> --- a/drivers/gpu/drm/amd/amdkfd/kfd_migrate.c
>>> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_migrate.c
>>> @@ -445,7 +445,7 @@ svm_migrate_vma_to_vram(struct kfd_node *node, 
>>> struct svm_range *prange,
>>>       pr_debug("successful/cpages/npages 0x%lx/0x%lx/0x%lx\n",
>>>                mpages, cpages, migrate.npages);
>>>   -    svm_range_dma_unmap_dev(adev->dev, scratch, 0, npages);
>>> +    svm_range_dma_unmap_dev(adev->dev, scratch, 0, npages, 
>>> DMA_TO_DEVICE);
>>>     out_free:
>>>       kvfree(buf);
>>> @@ -750,7 +750,7 @@ svm_migrate_vma_to_ram(struct kfd_node *node, 
>>> struct svm_range *prange,
>>>       svm_migrate_copy_done(adev, mfence);
>>>       migrate_vma_finalize(&migrate);
>>>   -    svm_range_dma_unmap_dev(adev->dev, scratch, 0, npages);
>>> +    svm_range_dma_unmap_dev(adev->dev, scratch, 0, npages, 
>>> DMA_FROM_DEVICE);
>>>     out_free:
>>>       kvfree(buf);
>>> diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_svm.c 
>>> b/drivers/gpu/drm/amd/amdkfd/kfd_svm.c
>>> index 3e2911895c74..c21485fe6cbb 100644
>>> --- a/drivers/gpu/drm/amd/amdkfd/kfd_svm.c
>>> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_svm.c
>>> @@ -233,9 +233,9 @@ svm_range_dma_map(struct svm_range *prange, 
>>> unsigned long *bitmap,
>>>   }
>>>     void svm_range_dma_unmap_dev(struct device *dev, dma_addr_t 
>>> *dma_addr,
>>> -             unsigned long offset, unsigned long npages)
>>> +             unsigned long offset, unsigned long npages,
>>> +                enum dma_data_direction dir)
>>>   {
>>> -    enum dma_data_direction dir = DMA_BIDIRECTIONAL;
>>>       int i;
>>>         if (!dma_addr)
>>> @@ -272,7 +272,7 @@ void svm_range_dma_unmap(struct svm_range *prange)
>>>           }
>>>           dev = &pdd->dev->adev->pdev->dev;
>>>   -        svm_range_dma_unmap_dev(dev, dma_addr, 0, prange->npages);
>>> +        svm_range_dma_unmap_dev(dev, dma_addr, 0, prange->npages, 
>>> DMA_BIDIRECTIONAL);
>>>       }
>>>   }
>>>   diff --git a/drivers/gpu/drm/amd/amdkfd/kfd_svm.h 
>>> b/drivers/gpu/drm/amd/amdkfd/kfd_svm.h
>>> index bddd24f04669..5370d68bc5b2 100644
>>> --- a/drivers/gpu/drm/amd/amdkfd/kfd_svm.h
>>> +++ b/drivers/gpu/drm/amd/amdkfd/kfd_svm.h
>>> @@ -182,7 +182,8 @@ void svm_range_add_list_work(struct 
>>> svm_range_list *svms,
>>>                    enum svm_work_list_ops op);
>>>   void schedule_deferred_list_work(struct svm_range_list *svms);
>>>   void svm_range_dma_unmap_dev(struct device *dev, dma_addr_t 
>>> *dma_addr,
>>> -             unsigned long offset, unsigned long npages);
>>> +             unsigned long offset, unsigned long npages,
>>> +             enum dma_data_direction dir);
>>>   void svm_range_dma_unmap(struct svm_range *prange);
>>>   int svm_range_get_info(struct kfd_process *p, uint32_t 
>>> *num_svm_ranges,
>>>                  uint64_t *svm_priv_data_size);
>>



More information about the amd-gfx mailing list