[PATCH v7 3/3] drm/buddy: Add defragmentation support

Matthew Auld matthew.auld at intel.com
Mon Mar 4 12:36:36 UTC 2024


On 04/03/2024 12:22, Paneer Selvam, Arunpravin wrote:
> Hi Matthew,
> 
> On 2/22/2024 12:12 AM, Matthew Auld wrote:
>> On 21/02/2024 12:18, Arunpravin Paneer Selvam wrote:
>>> Add a function to support defragmentation.
>>>
>>> v1:
>>>    - Defragment the memory beginning from min_order
>>>      till the required memory space is available.
>>>
>>> v2(Matthew):
>>>    - add amdgpu user for defragmentation
>>>    - add a warning if the two blocks are incompatible on
>>>      defragmentation
>>>    - call full defragmentation in the fini() function
>>>    - place a condition to test if min_order is equal to 0
>>>    - replace the list with safe_reverse() variant as we might
>>>      remove the block from the list.
>>>
>>> Signed-off-by: Arunpravin Paneer Selvam 
>>> <Arunpravin.PaneerSelvam at amd.com>
>>> Suggested-by: Matthew Auld <matthew.auld at intel.com>
>>> ---
>>>   drivers/gpu/drm/amd/amdgpu/amdgpu_vram_mgr.c | 17 +++-
>>>   drivers/gpu/drm/drm_buddy.c                  | 93 +++++++++++++++++---
>>>   include/drm/drm_buddy.h                      |  3 +
>>>   3 files changed, 97 insertions(+), 16 deletions(-)
>>>
>>> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_vram_mgr.c 
>>> b/drivers/gpu/drm/amd/amdgpu/amdgpu_vram_mgr.c
>>> index e494f5bf136a..cff8a526c622 100644
>>> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu_vram_mgr.c
>>> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_vram_mgr.c
>>> @@ -533,8 +533,21 @@ static int amdgpu_vram_mgr_new(struct 
>>> ttm_resource_manager *man,
>>>                          min_block_size,
>>>                          &vres->blocks,
>>>                          vres->flags);
>>> -        if (unlikely(r))
>>> -            goto error_free_blocks;
>>> +        if (unlikely(r)) {
>>> +            if (r == -ENOSPC) {
>>> +                drm_buddy_defrag(mm, min_block_size);
>>> +                r = drm_buddy_alloc_blocks(mm, fpfn,
>>> +                               lpfn,
>>> +                               size,
>>> +                               min_block_size,
>>> +                               &vres->blocks,
>>> +                               vres->flags);
>>> +                if (unlikely(r))
>>> +                    goto error_free_blocks;
>>> +            } else {
>>> +                goto error_free_blocks;
>>> +            }
>>> +        }
>>>             if (size > remaining_size)
>>>               remaining_size = 0;
>>> diff --git a/drivers/gpu/drm/drm_buddy.c b/drivers/gpu/drm/drm_buddy.c
>>> index 18e004fa39d3..56bd1560fbcd 100644
>>> --- a/drivers/gpu/drm/drm_buddy.c
>>> +++ b/drivers/gpu/drm/drm_buddy.c
>>> @@ -203,6 +203,8 @@ void drm_buddy_fini(struct drm_buddy *mm)
>>>           drm_block_free(mm, mm->roots[i]);
>>>       }
>>>   +    drm_buddy_defrag(mm, mm->chunk_size << mm->max_order);
>>
>> I think this needs to be called higher up, otherwise we blow up with 
>> the WARN, plus we just freed the root(s). There is also the case with 
>> non-power-of-two VRAM size, in which case you get multiple roots and 
>> max_order is just the largest root and not entire address space. I 
>> guess do this in the loop above and use the root order instead?
>>
>> Also this should be done as part of the first patch and then in this 
>> patch it is just a case of exporting it. Every commit should ideally 
>> be functional by itself.
> You mean we move the above change in drm_buddy_fini function and 
> drm_buddy_defrag function as part of first patch.
> And just we add export function and add amdgpu user in this patch. Is my 
> understanding correct?

Yeah, I think that makes sense.

> 
> Thanks,
> Arun.
>>
>>> +
>>>       WARN_ON(mm->avail != mm->size);
>>>         kfree(mm->roots);
>>> @@ -276,25 +278,39 @@ drm_get_buddy(struct drm_buddy_block *block)
>>>   }
>>>   EXPORT_SYMBOL(drm_get_buddy);
>>>   -static void __drm_buddy_free(struct drm_buddy *mm,
>>> -                 struct drm_buddy_block *block)
>>> +static unsigned int __drm_buddy_free(struct drm_buddy *mm,
>>> +                     struct drm_buddy_block *block,
>>> +                     bool defrag)
>>>   {
>>> +    unsigned int order, block_order;
>>>       struct drm_buddy_block *parent;
>>>   +    block_order = drm_buddy_block_order(block);
>>> +
>>>       while ((parent = block->parent)) {
>>> -        struct drm_buddy_block *buddy;
>>> +        struct drm_buddy_block *buddy = NULL;
>>>             buddy = __get_buddy(block);
>>>             if (!drm_buddy_block_is_free(buddy))
>>>               break;
>>>   -        if (drm_buddy_block_is_clear(block) !=
>>> -            drm_buddy_block_is_clear(buddy))
>>> -            break;
>>> +        if (!defrag) {
>>> +            /*
>>> +             * Check the block and its buddy clear state and exit
>>> +             * the loop if they both have the dissimilar state.
>>> +             */
>>> +            if (drm_buddy_block_is_clear(block) !=
>>> +                drm_buddy_block_is_clear(buddy))
>>> +                break;
>>>   -        if (drm_buddy_block_is_clear(block))
>>> -            mark_cleared(parent);
>>> +            if (drm_buddy_block_is_clear(block))
>>> +                mark_cleared(parent);
>>> +        }
>>> +
>>> +        WARN_ON(defrag &&
>>> +            (drm_buddy_block_is_clear(block) ==
>>> +             drm_buddy_block_is_clear(buddy)));
>>>             list_del(&buddy->link);
>>>   @@ -304,8 +320,57 @@ static void __drm_buddy_free(struct drm_buddy 
>>> *mm,
>>>           block = parent;
>>>       }
>>>   -    mark_free(mm, block);
>>> +    order = drm_buddy_block_order(block);
>>> +    if (block_order != order)
>>> +        mark_free(mm, block);
>>> +
>>> +    return order;
>>> +}
>>> +
>>> +/**
>>> + * drm_buddy_defrag - Defragmentation routine
>>> + *
>>> + * @mm: DRM buddy manager
>>> + * @min_block_size: minimum size in bytes to begin
>>> + * the defragmentation process
>>> + *
>>> + * Driver calls the defragmentation function when the
>>> + * requested memory allocation returns -ENOSPC.
>>> + */
>>> +void drm_buddy_defrag(struct drm_buddy *mm,
>>> +              unsigned int min_block_size)
>>
>> u64 min_block_size. Most cards have 4G+ of VRAM :)
>>
>>> +{
>>> +    struct drm_buddy_block *block, *tmp;
>>> +    unsigned int order, min_order;
>>> +    struct list_head *list;
>>> +    unsigned long pages;
>>> +    int i;
>>> +
>>> +    pages = min_block_size >> ilog2(mm->chunk_size);
>>> +    min_order = fls(pages) - 1;
>>
>> I think min_block_size should be power-of-two, no?
>>
>>> +
>>> +    if (!min_order)
>>> +        return;
>>> +
>>> +    if (min_order > mm->max_order)
>>> +        return;
>>> +
>>> +    for (i = min_order - 1; i >= 0; i--) {
>>> +        list = &mm->free_list[i];
>>> +        if (list_empty(list))
>>> +            continue;
>>> +
>>> +        list_for_each_entry_safe_reverse(block, tmp, list, link) {
>>> +            if (!block->parent)
>>> +                continue;
>>> +
>>> +            order = __drm_buddy_free(mm, block, 1);
>>
>> s/1/true/
>>
>>> +            if (order >= min_order)
>>> +                return;
>>> +        }
>>> +    }
>>>   }
>>> +EXPORT_SYMBOL(drm_buddy_defrag);
>>>     /**
>>>    * drm_buddy_free_block - free a block
>>> @@ -321,7 +386,7 @@ void drm_buddy_free_block(struct drm_buddy *mm,
>>>       if (drm_buddy_block_is_clear(block))
>>>           mm->clear_avail += drm_buddy_block_size(mm, block);
>>>   -    __drm_buddy_free(mm, block);
>>> +    __drm_buddy_free(mm, block, 0);
>>>   }
>>>   EXPORT_SYMBOL(drm_buddy_free_block);
>>>   @@ -468,7 +533,7 @@ __alloc_range_bias(struct drm_buddy *mm,
>>>       if (buddy &&
>>>           (drm_buddy_block_is_free(block) &&
>>>            drm_buddy_block_is_free(buddy)))
>>> -        __drm_buddy_free(mm, block);
>>> +        __drm_buddy_free(mm, block, 0);
>>>       return ERR_PTR(err);
>>>   }
>>>   @@ -586,7 +651,7 @@ alloc_from_freelist(struct drm_buddy *mm,
>>>     err_undo:
>>>       if (tmp != order)
>>> -        __drm_buddy_free(mm, block);
>>> +        __drm_buddy_free(mm, block, 0);
>>>       return ERR_PTR(err);
>>>   }
>>>   @@ -666,7 +731,7 @@ static int __alloc_range(struct drm_buddy *mm,
>>>       if (buddy &&
>>>           (drm_buddy_block_is_free(block) &&
>>>            drm_buddy_block_is_free(buddy)))
>>> -        __drm_buddy_free(mm, block);
>>> +        __drm_buddy_free(mm, block, 0);
>>>     err_free:
>>>       if (err == -ENOSPC && total_allocated_on_err) {
>>> @@ -828,7 +893,7 @@ EXPORT_SYMBOL(drm_buddy_block_trim);
>>>    * @mm: DRM buddy manager to allocate from
>>>    * @start: start of the allowed range for this block
>>>    * @end: end of the allowed range for this block
>>> - * @size: size of the allocation
>>> + * @size: size of the allocation in bytes
>>>    * @min_block_size: alignment of the allocation
>>>    * @blocks: output list head to add allocated blocks
>>>    * @flags: DRM_BUDDY_*_ALLOCATION flags
>>> diff --git a/include/drm/drm_buddy.h b/include/drm/drm_buddy.h
>>> index 352a6364e26a..68a874846e78 100644
>>> --- a/include/drm/drm_buddy.h
>>> +++ b/include/drm/drm_buddy.h
>>> @@ -167,6 +167,9 @@ void drm_buddy_free_list(struct drm_buddy *mm,
>>>                struct list_head *objects,
>>>                unsigned int flags);
>>>   +void drm_buddy_defrag(struct drm_buddy *mm,
>>> +              unsigned int min_order);
>>> +
>>>   void drm_buddy_print(struct drm_buddy *mm, struct drm_printer *p);
>>>   void drm_buddy_block_print(struct drm_buddy *mm,
>>>                  struct drm_buddy_block *block,
> 


More information about the Intel-gfx mailing list