[PATCH v2 4/6] drm/pagemap: Allocate folios when possible
Matthew Brost
matthew.brost at intel.com
Fri Jul 25 21:43:48 UTC 2025
On Fri, Jul 25, 2025 at 05:39:28PM +0200, Francois Dugast wrote:
> If the order is greater than zero, allocate a folio when populating the
> RAM PFNs instead of allocating individual pages one after the other. For
> example if 2MB folios are used instead of 4KB pages, this reduces the
> number of calls to the allocation API by 512.
>
> v2:
> - Use page order instead of extra argument (Matthew Brost)
> - Allocate with folio_alloc() (Matthew Brost)
> - Loop for mpages and free_pages based on order (Matthew Brost)
>
> Signed-off-by: Francois Dugast <francois.dugast at intel.com>
> Cc: Matthew Brost <matthew.brost at intel.com>
> ---
> drivers/gpu/drm/drm_pagemap.c | 38 ++++++++++++++++++++++++++---------
> 1 file changed, 28 insertions(+), 10 deletions(-)
>
> diff --git a/drivers/gpu/drm/drm_pagemap.c b/drivers/gpu/drm/drm_pagemap.c
> index b6f5d3a8e445..38753ce2bca7 100644
> --- a/drivers/gpu/drm/drm_pagemap.c
> +++ b/drivers/gpu/drm/drm_pagemap.c
> @@ -458,54 +458,72 @@ static int drm_pagemap_migrate_populate_ram_pfn(struct vm_area_struct *vas,
> {
> unsigned long i;
>
> - for (i = 0; i < npages; ++i, addr += PAGE_SIZE) {
> + for (i = 0; i < npages;) {
> struct page *page, *src_page;
> + unsigned int order;
> + struct folio *folio;
>
> if (!(src_mpfn[i] & MIGRATE_PFN_MIGRATE))
> - continue;
> + goto next;
>
> src_page = migrate_pfn_to_page(src_mpfn[i]);
> if (!src_page)
> - continue;
> + goto next;
>
> if (fault_page) {
> if (src_page->zone_device_data !=
> fault_page->zone_device_data)
> - continue;
> + goto next;
> }
>
> + order = folio_order(page_folio(src_page));
> +
> + /* TODO: Support fallback to single pages if THP allocation fails */
> if (vas)
> - page = alloc_page_vma(GFP_HIGHUSER, vas, addr);
> + folio = vma_alloc_folio(GFP_HIGHUSER, order, vas, addr);
> else
> - page = alloc_page(GFP_HIGHUSER);
> + folio = folio_alloc(GFP_HIGHUSER, order);
I haven't checked, but I assume that when order == 0, vma_alloc_folio() is
equivalent to alloc_page_vma()? The same goes for folio_alloc() and
alloc_page(). If so, then this looks good.
>
> - if (!page)
> + if (!folio)
> goto free_pages;
>
> + page = folio_page(folio, 0);
> mpfn[i] = migrate_pfn(page_to_pfn(page));
> +
> +next:
> + addr += page_size(page);
> + i += NR_PAGES(order);
> }
>
> - for (i = 0; i < npages; ++i) {
> + for (i = 0; i < npages;) {
> struct page *page = migrate_pfn_to_page(mpfn[i]);
> + unsigned int order;
This needs an initializer, since order is read on the 'next' path before it
is otherwise assigned:
unsigned int order = 0;
>
> if (!page)
> continue;
s/continue/goto next/ (the for statement no longer increments i, so a bare
continue would never advance the loop)
>
> WARN_ON_ONCE(!trylock_page(page));
> - ++*mpages;
> +
> + order = folio_order(page_folio(page));
next:
> + *mpages += NR_PAGES(order);
> + i += NR_PAGES(order);
> }
>
> return 0;
>
> free_pages:
> - for (i = 0; i < npages; ++i) {
> + for (i = 0; i < npages;) {
The same logic changes apply to this loop as to the one above.
Matt
> struct page *page = migrate_pfn_to_page(mpfn[i]);
> + unsigned int order;
>
> if (!page)
> continue;
>
> put_page(page);
> mpfn[i] = 0;
> +
> + order = folio_order(page_folio(page));
> + i += NR_PAGES(order);
> }
> return -ENOMEM;
> }
> --
> 2.43.0
>
More information about the Intel-xe
mailing list