[PATCH 3/6] drm/ttm: Support partial buffer mappings for ttm_bo_vmap()

Thomas Zimmermann tzimmermann at suse.de
Mon Jun 17 13:00:22 UTC 2024


Hi

Am 14.06.24 um 16:33 schrieb Christian König:
> Am 14.06.24 um 15:21 schrieb Thomas Zimmermann:
>> Add offset and size parameters to ttm_bo_vmap() to allow for partial
>> mappings of a buffer object. This brings the functionality on par with
>> ttm_bo_kmap().
>
> Well the long term plan was to remove this functionality from 
> ttm_bo_kmap() and nuke that function sooner or later.
>
> What exactly is the use case for partial mappings?

I don't have a use case; except for streamlining the DRM internals.

For the drivers, xe uses partial mappings in 
i915_gem_object_read_from_page(). But struct iosys_map to map the whole 
buffer and do memcpys within the range. See patch 6 for that. I think it 
could do without partial mappings. Vmwgfx uses a local mappings at [1], 
but as the nearby comment says, this could be a TTM helper. Or maybe TTM 
could provide a dedicated ttm_bo_kmap_local_page() for temporary 
mappings like this one. There's also [2], which looks like a candidate 
for a possible ttm_bo_kmap_local_page(). And in vmwgfx, there's the 
memcpy at [3], which could be replaced with ttm_bo_vmap() plus iosys_map 
helpers. I think that's it. Best regards Thomas [1] 
https://elixir.bootlin.com/linux/v6.9/source/drivers/gpu/drm/vmwgfx/vmwgfx_cotable.c#L457 
[2] 
https://elixir.bootlin.com/linux/v6.9/source/drivers/gpu/drm/vmwgfx/vmwgfx_drv.c#L418 
[3] 
https://elixir.bootlin.com/linux/v6.9/source/drivers/gpu/drm/vmwgfx/vmwgfx_kms.c#L430 

>
> Regards,
> Christian.
>
>>
>> Callers pass the byte offset and size within the buffer object and
>> receive a page-aligned mapping of the buffer object's memory for the
>> specified area.
>>
>> Also update all callers of ttm_bo_vmap() for the new parameters. As
>> before, existing callers map the buffer object's complete memory.
>>
>> Signed-off-by: Thomas Zimmermann <tzimmermann at suse.de>
>> ---
>>   drivers/gpu/drm/drm_gem_ttm_helper.c  |  2 +-
>>   drivers/gpu/drm/drm_gem_vram_helper.c |  2 +-
>>   drivers/gpu/drm/loongson/lsdc_gem.c   |  2 +-
>>   drivers/gpu/drm/qxl/qxl_object.c      |  2 +-
>>   drivers/gpu/drm/ttm/ttm_bo_util.c     | 21 +++++++++++++++------
>>   drivers/gpu/drm/xe/xe_lrc.c           |  2 +-
>>   drivers/gpu/drm/xe/xe_vm.c            |  2 +-
>>   include/drm/ttm/ttm_bo.h              |  4 +++-
>>   8 files changed, 24 insertions(+), 13 deletions(-)
>>
>> diff --git a/drivers/gpu/drm/drm_gem_ttm_helper.c 
>> b/drivers/gpu/drm/drm_gem_ttm_helper.c
>> index 3734aa2d1c5b5..f26b7c9077a68 100644
>> --- a/drivers/gpu/drm/drm_gem_ttm_helper.c
>> +++ b/drivers/gpu/drm/drm_gem_ttm_helper.c
>> @@ -67,7 +67,7 @@ int drm_gem_ttm_vmap(struct drm_gem_object *gem,
>>   {
>>       struct ttm_buffer_object *bo = drm_gem_ttm_of_gem(gem);
>>   -    return ttm_bo_vmap(bo, map);
>> +    return ttm_bo_vmap(bo, 0, gem->size, map);
>>   }
>>   EXPORT_SYMBOL(drm_gem_ttm_vmap);
>>   diff --git a/drivers/gpu/drm/drm_gem_vram_helper.c 
>> b/drivers/gpu/drm/drm_gem_vram_helper.c
>> index 6027584406af6..1670f9a459a9d 100644
>> --- a/drivers/gpu/drm/drm_gem_vram_helper.c
>> +++ b/drivers/gpu/drm/drm_gem_vram_helper.c
>> @@ -398,7 +398,7 @@ int drm_gem_vram_vmap(struct drm_gem_vram_object 
>> *gbo, struct iosys_map *map)
>>        * no mapping present.
>>        */
>>       if (iosys_map_is_null(&gbo->map)) {
>> -        ret = ttm_bo_vmap(&gbo->bo, &gbo->map);
>> +        ret = ttm_bo_vmap(&gbo->bo, 0, gbo->bo.base.size, &gbo->map);
>>           if (ret)
>>               return ret;
>>       }
>> diff --git a/drivers/gpu/drm/loongson/lsdc_gem.c 
>> b/drivers/gpu/drm/loongson/lsdc_gem.c
>> index a720d8f532093..f709960c781b9 100644
>> --- a/drivers/gpu/drm/loongson/lsdc_gem.c
>> +++ b/drivers/gpu/drm/loongson/lsdc_gem.c
>> @@ -77,7 +77,7 @@ static int lsdc_gem_object_vmap(struct 
>> drm_gem_object *obj, struct iosys_map *ma
>>           return ret;
>>       }
>>   -    ret = ttm_bo_vmap(tbo, &lbo->map);
>> +    ret = ttm_bo_vmap(tbo, 0, tbo->base.size, &lbo->map);
>>       if (ret) {
>>           drm_err(obj->dev, "ttm bo vmap failed\n");
>>           lsdc_bo_unpin(lbo);
>> diff --git a/drivers/gpu/drm/qxl/qxl_object.c 
>> b/drivers/gpu/drm/qxl/qxl_object.c
>> index 5893e27a7ae50..9f06d5e26a32c 100644
>> --- a/drivers/gpu/drm/qxl/qxl_object.c
>> +++ b/drivers/gpu/drm/qxl/qxl_object.c
>> @@ -164,7 +164,7 @@ int qxl_bo_vmap_locked(struct qxl_bo *bo, struct 
>> iosys_map *map)
>>           goto out;
>>       }
>>   -    r = ttm_bo_vmap(&bo->tbo, &bo->map);
>> +    r = ttm_bo_vmap(&bo->tbo, 0, bo->tbo.base.size, &bo->map);
>>       if (r) {
>>           qxl_bo_unpin_locked(bo);
>>           return r;
>> diff --git a/drivers/gpu/drm/ttm/ttm_bo_util.c 
>> b/drivers/gpu/drm/ttm/ttm_bo_util.c
>> index a9df0deff2deb..31f9772f05dac 100644
>> --- a/drivers/gpu/drm/ttm/ttm_bo_util.c
>> +++ b/drivers/gpu/drm/ttm/ttm_bo_util.c
>> @@ -457,17 +457,23 @@ EXPORT_SYMBOL(ttm_bo_kunmap);
>>    * ttm_bo_vmap
>>    *
>>    * @bo: The buffer object.
>> + * @offset: Byte offset into the buffer.
>> + * @size: Number of bytes to map.
>>    * @map: pointer to a struct iosys_map representing the map.
>>    *
>>    * Sets up a kernel virtual mapping, using ioremap or vmap to the
>>    * data in the buffer object. The parameter @map returns the virtual
>>    * address as struct iosys_map. Unmap the buffer with ttm_bo_vunmap().
>> + * The address stored in @map will be aligned to the next lower page
>> + * boundaries.
>>    *
>>    * Returns
>>    * -ENOMEM: Out of memory.
>>    * -EINVAL: Invalid range.
>>    */
>> -int ttm_bo_vmap(struct ttm_buffer_object *bo, struct iosys_map *map)
>> +int ttm_bo_vmap(struct ttm_buffer_object *bo,
>> +        unsigned long offset, unsigned long size,
>> +        struct iosys_map *map)
>>   {
>>       struct ttm_resource *mem = bo->resource;
>>       int ret;
>> @@ -483,18 +489,18 @@ int ttm_bo_vmap(struct ttm_buffer_object *bo, 
>> struct iosys_map *map)
>>           u16 alloc_flags;
>>             if (mem->bus.addr) {
>> -            vaddr_iomem = (void __iomem *)mem->bus.addr;
>> +            vaddr_iomem = (u8 __iomem *)mem->bus.addr + offset;
>>               alloc_flags = ttm_bo_map_premapped;
>>           } else if (mem->bus.caching == ttm_write_combined) {
>> -            vaddr_iomem = ioremap_wc(mem->bus.offset, bo->base.size);
>> +            vaddr_iomem = ioremap_wc(mem->bus.offset + offset, size);
>>               alloc_flags = ttm_bo_map_iomap;
>>   #ifdef CONFIG_X86
>>           } else if (mem->bus.caching == ttm_cached) {
>> -            vaddr_iomem = ioremap_cache(mem->bus.offset, 
>> bo->base.size);
>> +            vaddr_iomem = ioremap_cache(mem->bus.offset + offset, 
>> size);
>>               alloc_flags = ttm_bo_map_iomap;
>>   #endif
>>           } else {
>> -            vaddr_iomem = ioremap(mem->bus.offset, bo->base.size);
>> +            vaddr_iomem = ioremap(mem->bus.offset + offset, size);
>>               alloc_flags = ttm_bo_map_iomap;
>>           }
>>   @@ -510,6 +516,9 @@ int ttm_bo_vmap(struct ttm_buffer_object *bo, 
>> struct iosys_map *map)
>>               .no_wait_gpu = false
>>           };
>>           struct ttm_tt *ttm = bo->ttm;
>> +        unsigned long start_page = offset >> PAGE_SHIFT;
>> +        unsigned long aligned_size = size + (offset - (start_page << 
>> PAGE_SHIFT));
>> +        unsigned long num_pages = DIV_ROUND_UP(aligned_size, 
>> PAGE_SIZE);
>>           pgprot_t prot;
>>           void *vaddr;
>>           u16 alloc_flags;
>> @@ -523,7 +532,7 @@ int ttm_bo_vmap(struct ttm_buffer_object *bo, 
>> struct iosys_map *map)
>>            * or to make the buffer object look contiguous.
>>            */
>>           prot = ttm_io_prot(bo, mem, PAGE_KERNEL);
>> -        vaddr = vmap(ttm->pages, ttm->num_pages, 0, prot);
>> +        vaddr = vmap(ttm->pages + start_page, num_pages, 0, prot);
>>           if (!vaddr)
>>               return -ENOMEM;
>>           alloc_flags = ttm_bo_map_vmap;
>> diff --git a/drivers/gpu/drm/xe/xe_lrc.c b/drivers/gpu/drm/xe/xe_lrc.c
>> index c1bb85d2e243f..3a68fe6d592ed 100644
>> --- a/drivers/gpu/drm/xe/xe_lrc.c
>> +++ b/drivers/gpu/drm/xe/xe_lrc.c
>> @@ -1595,7 +1595,7 @@ void xe_lrc_snapshot_capture_delayed(struct 
>> xe_lrc_snapshot *snapshot)
>>           goto put_bo;
>>         xe_bo_lock(bo, false);
>> -    if (!ttm_bo_vmap(&bo->ttm, &src)) {
>> +    if (!ttm_bo_vmap(&bo->ttm, 0, bo->ttm.base.size, &src)) {
>>           xe_map_memcpy_from(xe_bo_device(bo),
>>                      snapshot->lrc_snapshot, &src, snapshot->lrc_offset,
>>                      snapshot->lrc_size);
>> diff --git a/drivers/gpu/drm/xe/xe_vm.c b/drivers/gpu/drm/xe/xe_vm.c
>> index 99bf7412475c0..81306c32f5d09 100644
>> --- a/drivers/gpu/drm/xe/xe_vm.c
>> +++ b/drivers/gpu/drm/xe/xe_vm.c
>> @@ -3485,7 +3485,7 @@ void xe_vm_snapshot_capture_delayed(struct 
>> xe_vm_snapshot *snap)
>>             if (bo) {
>>               xe_bo_lock(bo, false);
>> -            err = ttm_bo_vmap(&bo->ttm, &src);
>> +            err = ttm_bo_vmap(&bo->ttm, 0, bo->ttm.base.size, &src);
>>               if (!err) {
>>                   xe_map_memcpy_from(xe_bo_device(bo),
>>                              snap->snap[i].data,
>> diff --git a/include/drm/ttm/ttm_bo.h b/include/drm/ttm/ttm_bo.h
>> index 6ccf96c91f3ae..c421ffe3563b1 100644
>> --- a/include/drm/ttm/ttm_bo.h
>> +++ b/include/drm/ttm/ttm_bo.h
>> @@ -375,7 +375,9 @@ int ttm_bo_init_validate(struct ttm_device *bdev, 
>> struct ttm_buffer_object *bo,
>>   int ttm_bo_kmap(struct ttm_buffer_object *bo, unsigned long 
>> start_page,
>>           unsigned long num_pages, struct ttm_bo_kmap_obj *map);
>>   void ttm_bo_kunmap(struct ttm_bo_kmap_obj *map);
>> -int ttm_bo_vmap(struct ttm_buffer_object *bo, struct iosys_map *map);
>> +int ttm_bo_vmap(struct ttm_buffer_object *bo,
>> +        unsigned long offset, unsigned long size,
>> +        struct iosys_map *map);
>>   void ttm_bo_vunmap(struct ttm_buffer_object *bo, struct iosys_map 
>> *map);
>>   int ttm_bo_mmap_obj(struct vm_area_struct *vma, struct 
>> ttm_buffer_object *bo);
>>   int ttm_bo_swapout(struct ttm_buffer_object *bo, struct 
>> ttm_operation_ctx *ctx,
>

-- 
--
Thomas Zimmermann
Graphics Driver Developer
SUSE Software Solutions Germany GmbH
Frankenstrasse 146, 90461 Nuernberg, Germany
GF: Ivo Totev, Andrew Myers, Andrew McDonald, Boudien Moerman
HRB 36809 (AG Nuernberg)



More information about the Intel-gfx mailing list