[Intel-gfx] [PATCH 1/5] drm/i915: Add ability for tracking buffer objects per client

Tvrtko Ursulin tvrtko.ursulin at linux.intel.com
Tue Jul 11 09:39:53 UTC 2023


On 11/07/2023 08:48, Iddamsetty, Aravind wrote:
> On 10-07-2023 18:50, Tvrtko Ursulin wrote:
>>
>> On 10/07/2023 11:44, Iddamsetty, Aravind wrote:
>>> On 07-07-2023 18:32, Tvrtko Ursulin wrote:
>>>> From: Tvrtko Ursulin <tvrtko.ursulin at intel.com>
>>>>
>>>> In order to show per client memory usage lets add some infrastructure
>>>> which enables tracking buffer objects owned by clients.
>>>>
>>>> We add a per client list protected by a new per client lock and to
>>>> support
>>>> delayed destruction (post client exit) we make tracked objects hold
>>>> references to the owning client.
>>>>
>>>> Also, object memory region teardown is moved to the existing RCU free
>>>> callback to allow safe dereference from the fdinfo RCU read section.
>>>>
>>>> Signed-off-by: Tvrtko Ursulin <tvrtko.ursulin at intel.com>
>>>> ---
>>>>    drivers/gpu/drm/i915/gem/i915_gem_object.c    | 13 +++++--
>>>>    .../gpu/drm/i915/gem/i915_gem_object_types.h  | 12 +++++++
>>>>    drivers/gpu/drm/i915/i915_drm_client.c        | 36 +++++++++++++++++++
>>>>    drivers/gpu/drm/i915/i915_drm_client.h        | 32 +++++++++++++++++
>>>>    4 files changed, 90 insertions(+), 3 deletions(-)
>>>>
>>>> diff --git a/drivers/gpu/drm/i915/gem/i915_gem_object.c
>>>> b/drivers/gpu/drm/i915/gem/i915_gem_object.c
>>>> index 97ac6fb37958..3dc4fbb67d2b 100644
>>>> --- a/drivers/gpu/drm/i915/gem/i915_gem_object.c
>>>> +++ b/drivers/gpu/drm/i915/gem/i915_gem_object.c
>>>> @@ -105,6 +105,10 @@ void i915_gem_object_init(struct
>>>> drm_i915_gem_object *obj,
>>>>          INIT_LIST_HEAD(&obj->mm.link);
>>>>    +#ifdef CONFIG_PROC_FS
>>>> +    INIT_LIST_HEAD(&obj->client_link);
>>>> +#endif
>>>> +
>>>>        INIT_LIST_HEAD(&obj->lut_list);
>>>>        spin_lock_init(&obj->lut_lock);
>>>>    @@ -292,6 +296,10 @@ void __i915_gem_free_object_rcu(struct
>>>> rcu_head *head)
>>>>            container_of(head, typeof(*obj), rcu);
>>>>        struct drm_i915_private *i915 = to_i915(obj->base.dev);
>>>>    +    /* We need to keep this alive for RCU read access from fdinfo. */
>>>> +    if (obj->mm.n_placements > 1)
>>>> +        kfree(obj->mm.placements);
>>>> +
>>>>        i915_gem_object_free(obj);
>>>>          GEM_BUG_ON(!atomic_read(&i915->mm.free_count));
>>>> @@ -388,9 +396,6 @@ void __i915_gem_free_object(struct
>>>> drm_i915_gem_object *obj)
>>>>        if (obj->ops->release)
>>>>            obj->ops->release(obj);
>>>>    -    if (obj->mm.n_placements > 1)
>>>> -        kfree(obj->mm.placements);
>>>> -
>>>>        if (obj->shares_resv_from)
>>>>            i915_vm_resv_put(obj->shares_resv_from);
>>>>    @@ -441,6 +446,8 @@ static void i915_gem_free_object(struct
>>>> drm_gem_object *gem_obj)
>>>>          GEM_BUG_ON(i915_gem_object_is_framebuffer(obj));
>>>>    +    i915_drm_client_remove_object(obj);
>>>> +
>>>>        /*
>>>>         * Before we free the object, make sure any pure RCU-only
>>>>         * read-side critical sections are complete, e.g.
>>>> diff --git a/drivers/gpu/drm/i915/gem/i915_gem_object_types.h
>>>> b/drivers/gpu/drm/i915/gem/i915_gem_object_types.h
>>>> index e72c57716bee..8de2b91b3edf 100644
>>>> --- a/drivers/gpu/drm/i915/gem/i915_gem_object_types.h
>>>> +++ b/drivers/gpu/drm/i915/gem/i915_gem_object_types.h
>>>> @@ -300,6 +300,18 @@ struct drm_i915_gem_object {
>>>>         */
>>>>        struct i915_address_space *shares_resv_from;
>>>>    +#ifdef CONFIG_PROC_FS
>>>> +    /**
>>>> +     * @client: @i915_drm_client which created the object
>>>> +     */
>>>> +    struct i915_drm_client *client;
>>>> +
>>>> +    /**
>>>> +     * @client_link: Link into @i915_drm_client.objects_list
>>>> +     */
>>>> +    struct list_head client_link;
>>>> +#endif
>>>> +
>>>>        union {
>>>>            struct rcu_head rcu;
>>>>            struct llist_node freed;
>>>> diff --git a/drivers/gpu/drm/i915/i915_drm_client.c
>>>> b/drivers/gpu/drm/i915/i915_drm_client.c
>>>> index 2a44b3876cb5..2e5e69edc0f9 100644
>>>> --- a/drivers/gpu/drm/i915/i915_drm_client.c
>>>> +++ b/drivers/gpu/drm/i915/i915_drm_client.c
>>>> @@ -28,6 +28,10 @@ struct i915_drm_client *i915_drm_client_alloc(void)
>>>>        kref_init(&client->kref);
>>>>        spin_lock_init(&client->ctx_lock);
>>>>        INIT_LIST_HEAD(&client->ctx_list);
>>>> +#ifdef CONFIG_PROC_FS
>>>> +    spin_lock_init(&client->objects_lock);
>>>> +    INIT_LIST_HEAD(&client->objects_list);
>>>> +#endif
>>>>          return client;
>>>>    }
>>>> @@ -108,4 +112,36 @@ void i915_drm_client_fdinfo(struct drm_printer
>>>> *p, struct drm_file *file)
>>>>        for (i = 0; i < ARRAY_SIZE(uabi_class_names); i++)
>>>>            show_client_class(p, i915, file_priv->client, i);
>>>>    }
>>>> +
>>>> +void i915_drm_client_add_object(struct i915_drm_client *client,
>>>> +                struct drm_i915_gem_object *obj)
>>>> +{
>>>> +    unsigned long flags;
>>>> +
>>>> +    GEM_WARN_ON(obj->client);
>>>> +    GEM_WARN_ON(!list_empty(&obj->client_link));
>>>> +
>>>> +    spin_lock_irqsave(&client->objects_lock, flags);
>>>> +    obj->client = i915_drm_client_get(client);
>>>> +    list_add_tail_rcu(&obj->client_link, &client->objects_list);
>>>> +    spin_unlock_irqrestore(&client->objects_lock, flags);
>>>> +}
>>>
>>> would it be nice to mention that we use this client infra only to track
>>> internal objects. While the user created through file->object_idr added
>>> during handle creation time.
>>
>> In this series it is indeed only used for that.
>>
>> But it would be nicer to use it to track everything, so fdinfo readers
>> would not be hitting the idr lock, which would avoid injecting latency
>> to real DRM clients.
>>
>> The only fly in the ointment IMO is that I needed that drm core helper
>> to be able to track dmabuf imports. Possibly something for flink too,
>> did not look into that yet.
> 
> wouldn't dmabuf be tracked via object_idr as a new handle is created for it.

Yes it is/would. I was talking about hypothetically not using object_idr 
and instead tracking everything via the mechanism introduced in this 
patch, which would allow for lockless fdinfo reads for everything. If 
you remember I had that approach in an earlier version but it needed a 
patch to drm code to split the prime helpers (or so) and also did not 
cover the question on how to handle flink.

Regards,

Tvrtko

> 
> Thanks,
> Aravind.
>>
>> In the light of all that I can mention in the cover letter next time
>> round. It is a bit stale anyway (the cover letter).
>>
>> Regards,
>>
>> Tvrtko
>>
>>>> +bool i915_drm_client_remove_object(struct drm_i915_gem_object *obj)
>>>> +{
>>>> +    struct i915_drm_client *client = fetch_and_zero(&obj->client);
>>>> +    unsigned long flags;
>>>> +
>>>> +    /* Object may not be associated with a client. */
>>>> +    if (!client)
>>>> +        return false;
>>>> +
>>>> +    spin_lock_irqsave(&client->objects_lock, flags);
>>>> +    list_del_rcu(&obj->client_link);
>>>> +    spin_unlock_irqrestore(&client->objects_lock, flags);
>>>> +
>>>> +    i915_drm_client_put(client);
>>>> +
>>>> +    return true;
>>>> +}
>>>>    #endif
>>>> diff --git a/drivers/gpu/drm/i915/i915_drm_client.h
>>>> b/drivers/gpu/drm/i915/i915_drm_client.h
>>>> index 67816c912bca..5f58fdf7dcb8 100644
>>>> --- a/drivers/gpu/drm/i915/i915_drm_client.h
>>>> +++ b/drivers/gpu/drm/i915/i915_drm_client.h
>>>> @@ -12,6 +12,9 @@
>>>>      #include <uapi/drm/i915_drm.h>
>>>>    +#include "i915_file_private.h"
>>>> +#include "gem/i915_gem_object_types.h"
>>>> +
>>>>    #define I915_LAST_UABI_ENGINE_CLASS I915_ENGINE_CLASS_COMPUTE
>>>>      struct drm_file;
>>>> @@ -25,6 +28,20 @@ struct i915_drm_client {
>>>>        spinlock_t ctx_lock; /* For add/remove from ctx_list. */
>>>>        struct list_head ctx_list; /* List of contexts belonging to
>>>> client. */
>>>>    +#ifdef CONFIG_PROC_FS
>>>> +    /**
>>>> +     * @objects_lock: lock protecting @objects_list
>>>> +     */
>>>> +    spinlock_t objects_lock;
>>>> +
>>>> +    /**
>>>> +     * @objects_list: list of objects created by this client
>>>> +     *
>>>> +     * Protected by @objects_lock.
>>>> +     */
>>>> +    struct list_head objects_list;
>>>> +#endif
>>>> +
>>>>        /**
>>>>         * @past_runtime: Accumulation of pphwsp runtimes from closed
>>>> contexts.
>>>>         */
>>>> @@ -49,4 +66,19 @@ struct i915_drm_client *i915_drm_client_alloc(void);
>>>>      void i915_drm_client_fdinfo(struct drm_printer *p, struct
>>>> drm_file *file);
>>>>    +#ifdef CONFIG_PROC_FS
>>>> +void i915_drm_client_add_object(struct i915_drm_client *client,
>>>> +                struct drm_i915_gem_object *obj);
>>>> +bool i915_drm_client_remove_object(struct drm_i915_gem_object *obj);
>>>> +#else
>>>> +static inline void i915_drm_client_add_object(struct i915_drm_client
>>>> *client,
>>>> +                          struct drm_i915_gem_object *obj)
>>>> +{
>>>> +}
>>>> +
>>>> +static inline bool i915_drm_client_remove_object(struct
>>>> drm_i915_gem_object *obj)
>>>> +{
>>>> +}
>>>> +#endif
>>>> +
>>>>    #endif /* !__I915_DRM_CLIENT_H__ */


More information about the Intel-gfx mailing list