[PATCH v2 3/6] drm/pagemap: DMA map folios when possible
Matthew Brost
matthew.brost at intel.com
Fri Jul 25 21:54:22 UTC 2025
On Fri, Jul 25, 2025 at 05:39:27PM +0200, Francois Dugast wrote:
> If the page is part of a folio, DMA map the whole folio at once instead of
> mapping individual pages one after the other. For example if 2MB folios
> are used instead of 4KB pages, this reduces the number of DMA mappings by
> 512.
>
> The folio order (and consequently, the size) is persisted in the struct
> drm_pagemap_device_addr to be available at the time of unmapping.
>
> v2:
> - Initialize order variable (Matthew Brost)
> - Set proto and dir for completeness (Matthew Brost)
> - Do not populate drm_pagemap_addr, document it (Matthew Brost)
> - Add and use macro NR_PAGES(order) (Matthew Brost)
>
> Signed-off-by: Francois Dugast <francois.dugast at intel.com>
> Cc: Matthew Brost <matthew.brost at intel.com>
Reviewed-by: Matthew Brost <matthew.brost at intel.com>
> ---
> drivers/gpu/drm/drm_pagemap.c | 25 ++++++++++++++++++-------
> include/drm/drm_pagemap.h | 10 ++++++++--
> 2 files changed, 26 insertions(+), 9 deletions(-)
>
> diff --git a/drivers/gpu/drm/drm_pagemap.c b/drivers/gpu/drm/drm_pagemap.c
> index de320aeed812..b6f5d3a8e445 100644
> --- a/drivers/gpu/drm/drm_pagemap.c
> +++ b/drivers/gpu/drm/drm_pagemap.c
> @@ -222,22 +222,30 @@ static int drm_pagemap_migrate_map_pages(struct device *dev,
> {
> unsigned long i;
>
> - for (i = 0; i < npages; ++i) {
> + for (i = 0; i < npages;) {
> struct page *page = migrate_pfn_to_page(migrate_pfn[i]);
> dma_addr_t dma_addr;
> + struct folio *folio;
> + unsigned int order = 0;
>
> if (!page)
> - continue;
> + goto next;
>
> if (WARN_ON_ONCE(is_zone_device_page(page)))
> return -EFAULT;
>
> - dma_addr = dma_map_page(dev, page, 0, PAGE_SIZE, dir);
> + folio = page_folio(page);
> + order = folio_order(folio);
> +
> + dma_addr = dma_map_page(dev, page, 0, page_size(page), dir);
> if (dma_mapping_error(dev, dma_addr))
> return -EFAULT;
>
> pagemap_addr[i] = drm_pagemap_addr_encode(
> - dma_addr, DRM_INTERCONNECT_SYSTEM, 0, dir);
> + dma_addr, DRM_INTERCONNECT_SYSTEM, order, dir);
> +
> +next:
> + i += NR_PAGES(order);
> }
>
> return 0;
> @@ -261,11 +269,14 @@ static void drm_pagemap_migrate_unmap_pages(struct device *dev,
> {
> unsigned long i;
>
> - for (i = 0; i < npages; ++i) {
> + for (i = 0; i < npages;) {
> if (!pagemap_addr[i].addr || dma_mapping_error(dev, pagemap_addr[i].addr))
> - continue;
> + goto next;
> +
> + dma_unmap_page(dev, pagemap_addr[i].addr, PAGE_SIZE << pagemap_addr[i].order, dir);
>
> - dma_unmap_page(dev, pagemap_addr[i].addr, PAGE_SIZE, dir);
> +next:
> + i += NR_PAGES(pagemap_addr[i].order);
> }
> }
>
> diff --git a/include/drm/drm_pagemap.h b/include/drm/drm_pagemap.h
> index 1d5919a99139..ef18d98dbc7e 100644
> --- a/include/drm/drm_pagemap.h
> +++ b/include/drm/drm_pagemap.h
> @@ -6,6 +6,8 @@
> #include <linux/hmm.h>
> #include <linux/types.h>
>
> +#define NR_PAGES(order) (1U << order)
> +
> struct drm_pagemap;
> struct drm_pagemap_zdd;
> struct device;
> @@ -173,7 +175,9 @@ struct drm_pagemap_devmem_ops {
> * @pagemap_addr: Pointer to array of DMA information (source)
> * @npages: Number of pages to copy
> *
> - * Copy pages to device memory.
> + * Copy pages to device memory. If the order of a @pagemap_addr entry
> + * is greater than 0, the entry is populated but subsequent entries
> + * within the range of that order are not populated.
> *
> * Return: 0 on success, a negative error code on failure.
> */
> @@ -187,7 +191,9 @@ struct drm_pagemap_devmem_ops {
> * @pagemap_addr: Pointer to array of DMA information (destination)
> * @npages: Number of pages to copy
> *
> - * Copy pages to system RAM.
> + * Copy pages to system RAM. If the order of a @pagemap_addr entry
> + * is greater than 0, the entry is populated but subsequent entries
> + * within the range of that order are not populated.
> *
> * Return: 0 on success, a negative error code on failure.
> */
> --
> 2.43.0
>
More information about the Intel-xe
mailing list