[Intel-gfx] [PATCH 04/10] drm/i915: move intel_context slab to direct module init/exit

Jason Ekstrand jason at jlekstrand.net
Mon Jul 26 18:17:27 UTC 2021


On Mon, Jul 26, 2021 at 11:31 AM Tvrtko Ursulin
<tvrtko.ursulin at linux.intel.com> wrote:
>
>
> On 26/07/2021 17:20, Jason Ekstrand wrote:
> > On Mon, Jul 26, 2021 at 11:08 AM Tvrtko Ursulin
> > <tvrtko.ursulin at linux.intel.com> wrote:
> >> On 26/07/2021 16:42, Jason Ekstrand wrote:
> >>> On Mon, Jul 26, 2021 at 10:30 AM Jason Ekstrand <jason at jlekstrand.net> wrote:
> >>>>
> >>>> On Mon, Jul 26, 2021 at 3:35 AM Tvrtko Ursulin
> >>>> <tvrtko.ursulin at linux.intel.com> wrote:
> >>>>>
> >>>>>
> >>>>> On 23/07/2021 20:29, Daniel Vetter wrote:
> >>>>>> With the global kmem_cache shrink infrastructure gone there's nothing
> >>>>>> special and we can convert them over.
> >>>>>>
> >>>>>> I'm doing this split up into each patch because there's quite a bit of
> >>>>>> noise with removing the static global.slab_ce to just a
> >>>>>> slab_ce.
> >>>>>>
> >>>>>> Cc: Jason Ekstrand <jason at jlekstrand.net>
> >>>>>> Signed-off-by: Daniel Vetter <daniel.vetter at intel.com>
> >>>>>> ---
> >>>>>>     drivers/gpu/drm/i915/gt/intel_context.c | 25 ++++++++-----------------
> >>>>>>     drivers/gpu/drm/i915/gt/intel_context.h |  3 +++
> >>>>>>     drivers/gpu/drm/i915/i915_globals.c     |  2 --
> >>>>>>     drivers/gpu/drm/i915/i915_globals.h     |  1 -
> >>>>>>     drivers/gpu/drm/i915/i915_pci.c         |  2 ++
> >>>>>>     5 files changed, 13 insertions(+), 20 deletions(-)
> >>>>>>
> >>>>>> diff --git a/drivers/gpu/drm/i915/gt/intel_context.c b/drivers/gpu/drm/i915/gt/intel_context.c
> >>>>>> index baa05fddd690..283382549a6f 100644
> >>>>>> --- a/drivers/gpu/drm/i915/gt/intel_context.c
> >>>>>> +++ b/drivers/gpu/drm/i915/gt/intel_context.c
> >>>>>> @@ -7,7 +7,6 @@
> >>>>>>     #include "gem/i915_gem_pm.h"
> >>>>>>
> >>>>>>     #include "i915_drv.h"
> >>>>>> -#include "i915_globals.h"
> >>>>>>     #include "i915_trace.h"
> >>>>>>
> >>>>>>     #include "intel_context.h"
> >>>>>> @@ -15,14 +14,11 @@
> >>>>>>     #include "intel_engine_pm.h"
> >>>>>>     #include "intel_ring.h"
> >>>>>>
> >>>>>> -static struct i915_global_context {
> >>>>>> -     struct i915_global base;
> >>>>>> -     struct kmem_cache *slab_ce;
> >>>>>> -} global;
> >>>>>> +struct kmem_cache *slab_ce;
> >>>>
> >>>> Static?  With that,
> >>>>
> >>>> Reviewed-by: Jason Ekstrand <jason at jlekstrand.net>
> >>>>
> >>>>>>
> >>>>>>     static struct intel_context *intel_context_alloc(void)
> >>>>>>     {
> >>>>>> -     return kmem_cache_zalloc(global.slab_ce, GFP_KERNEL);
> >>>>>> +     return kmem_cache_zalloc(slab_ce, GFP_KERNEL);
> >>>>>>     }
> >>>>>>
> >>>>>>     static void rcu_context_free(struct rcu_head *rcu)
> >>>>>> @@ -30,7 +26,7 @@ static void rcu_context_free(struct rcu_head *rcu)
> >>>>>>         struct intel_context *ce = container_of(rcu, typeof(*ce), rcu);
> >>>>>>
> >>>>>>         trace_intel_context_free(ce);
> >>>>>> -     kmem_cache_free(global.slab_ce, ce);
> >>>>>> +     kmem_cache_free(slab_ce, ce);
> >>>>>>     }
> >>>>>>
> >>>>>>     void intel_context_free(struct intel_context *ce)
> >>>>>> @@ -410,22 +406,17 @@ void intel_context_fini(struct intel_context *ce)
> >>>>>>         i915_active_fini(&ce->active);
> >>>>>>     }
> >>>>>>
> >>>>>> -static void i915_global_context_exit(void)
> >>>>>> +void i915_context_module_exit(void)
> >>>>>>     {
> >>>>>> -     kmem_cache_destroy(global.slab_ce);
> >>>>>> +     kmem_cache_destroy(slab_ce);
> >>>>>>     }
> >>>>>>
> >>>>>> -static struct i915_global_context global = { {
> >>>>>> -     .exit = i915_global_context_exit,
> >>>>>> -} };
> >>>>>> -
> >>>>>> -int __init i915_global_context_init(void)
> >>>>>> +int __init i915_context_module_init(void)
> >>>>>>     {
> >>>>>> -     global.slab_ce = KMEM_CACHE(intel_context, SLAB_HWCACHE_ALIGN);
> >>>>>> -     if (!global.slab_ce)
> >>>>>> +     slab_ce = KMEM_CACHE(intel_context, SLAB_HWCACHE_ALIGN);
> >>>>>> +     if (!slab_ce)
> >>>>>>                 return -ENOMEM;
> >>>>>>
> >>>>>> -     i915_global_register(&global.base);
> >>>>>>         return 0;
> >>>>>>     }
> >>>>>>
> >>>>>> diff --git a/drivers/gpu/drm/i915/gt/intel_context.h b/drivers/gpu/drm/i915/gt/intel_context.h
> >>>>>> index 974ef85320c2..a0ca82e3c40d 100644
> >>>>>> --- a/drivers/gpu/drm/i915/gt/intel_context.h
> >>>>>> +++ b/drivers/gpu/drm/i915/gt/intel_context.h
> >>>>>> @@ -30,6 +30,9 @@ void intel_context_init(struct intel_context *ce,
> >>>>>>                         struct intel_engine_cs *engine);
> >>>>>>     void intel_context_fini(struct intel_context *ce);
> >>>>>>
> >>>>>> +void i915_context_module_exit(void);
> >>>>>> +int i915_context_module_init(void);
> >>>>>> +
> >>>>>>     struct intel_context *
> >>>>>>     intel_context_create(struct intel_engine_cs *engine);
> >>>>>>
> >>>>>> diff --git a/drivers/gpu/drm/i915/i915_globals.c b/drivers/gpu/drm/i915/i915_globals.c
> >>>>>> index 3de7cf22ec76..d36eb7dc40aa 100644
> >>>>>> --- a/drivers/gpu/drm/i915/i915_globals.c
> >>>>>> +++ b/drivers/gpu/drm/i915/i915_globals.c
> >>>>>> @@ -7,7 +7,6 @@
> >>>>>>     #include <linux/slab.h>
> >>>>>>     #include <linux/workqueue.h>
> >>>>>>
> >>>>>> -#include "gem/i915_gem_context.h"
> >>>>>>     #include "gem/i915_gem_object.h"
> >>>>>>     #include "i915_globals.h"
> >>>>>>     #include "i915_request.h"
> >>>>>> @@ -32,7 +31,6 @@ static void __i915_globals_cleanup(void)
> >>>>>>     }
> >>>>>>
> >>>>>>     static __initconst int (* const initfn[])(void) = {
> >>>>>> -     i915_global_context_init,
> >>>>>>         i915_global_gem_context_init,
> >>>>>>         i915_global_objects_init,
> >>>>>>         i915_global_request_init,
> >>>>>> diff --git a/drivers/gpu/drm/i915/i915_globals.h b/drivers/gpu/drm/i915/i915_globals.h
> >>>>>> index d80901ba75e3..60daa738a188 100644
> >>>>>> --- a/drivers/gpu/drm/i915/i915_globals.h
> >>>>>> +++ b/drivers/gpu/drm/i915/i915_globals.h
> >>>>>> @@ -23,7 +23,6 @@ int i915_globals_init(void);
> >>>>>>     void i915_globals_exit(void);
> >>>>>>
> >>>>>>     /* constructors */
> >>>>>> -int i915_global_context_init(void);
> >>>>>>     int i915_global_gem_context_init(void);
> >>>>>>     int i915_global_objects_init(void);
> >>>>>>     int i915_global_request_init(void);
> >>>>>> diff --git a/drivers/gpu/drm/i915/i915_pci.c b/drivers/gpu/drm/i915/i915_pci.c
> >>>>>> index f9527269e30a..266618157775 100644
> >>>>>> --- a/drivers/gpu/drm/i915/i915_pci.c
> >>>>>> +++ b/drivers/gpu/drm/i915/i915_pci.c
> >>>>>> @@ -33,6 +33,7 @@
> >>>>>>     #include "i915_active.h"
> >>>>>>     #include "i915_buddy.h"
> >>>>>>     #include "i915_drv.h"
> >>>>>> +#include "gem/i915_gem_context.h"
> >>>>>
> >>>>> It's a bit ugly to go to a design where i915_pci.c has to include so
> >>>>> many random parts of i915. IMO for a complex driver like i915,
> >>>>> compartmentalizing so much knowledge about the internals was better
> >>>>> inside the globals layer.
> >>>>
> >>>> I agree that i915_pci feels like the wrong place to put this but I
> >>>> don't think that's so much because globals don't belong in i915_pci
> >>>> but because i915_init/exit don't belong there.  Maybe, once this is
> >>>> all said and done (or at the start of the series), we should move
> >>>> i915_init/exit to i915_drv.c?  Of course, there's a bunch of PCI
> >>>> probing stuff in i915_drv.c so..... yeah.... our organization is
> >>>> pretty busted.
> >>>
> >>> To put a finer point on this, the new "design" is really to have a
> >>> single flat list instead of two, one nested inside the other.  There's
> >>> nothing wrong with that at all.  The fact that all this stuff now
> >>> lives in i915_pci.c is ugly.  But, as I said, that's kind-of an
> >>> accident of history because that's where i915_init() and i915_exit()
> >>> currently live.  We should just move the lot to i915_drv.c.
> >>
> >> Hmm.. on one hand it does sounds better to move to i915_drv.c, but is it
> >> just because all these new include directive are so visibly out of place
> >> in i915_pci.c?
> >>
> >> Perhaps we need i915_module.c and then i915_globals is a completely fine
> >> concept. Desired IMO even since we have to avoid globals in general
> >> (multi-gpu) so it sticks out nicely that all that is allowed to be
> >> global has a special place.
> >>
> >> And i915_drv.c can remain being about a driver instance as bound to one GPU.
> >
> > Is i915_drv.c about a single instance bound to a single GPU?  If so,
>
> Yep, all functions there either take drm_dev, pdev or dev_priv as
> argument, or return/initialize dev_priv.
>
> > then, yeah, maybe not the right place.  Maybe a i915_module.c would be
> > better.  It's all different shades of shed paint.
>
> Hm not really just different shades IMO. Because I argue the patch
> series as is is a retrograde step in the above discussed respect.
>
> I think i915_globals is cleaner code organisation. Because even if we
> add i915_module.c, then that can be made initialize globals and register
> with pci in cleanly separated steps without the need to include many
> driver internals.

Ok, so maybe I'm missing something in what you're saying.  I was under
the impression that your primary concern was separating PCI setup from
per-device from per-module stuff.  If so, moving it all to an
i915_module.c fixes that.

Are you arguing that a flat list of module init steps is bad?  And
that having globals be its own sub-list is good?  If so, then I have
to disagree.  I don't think splitting the calling of misc "set up my
slabs" functions from the final "register with PCI" at the end gains
us anything.  What it does do is give more files to search through,
more layers to think about when understanding the code, and more
infrastructure to maintain.

If, on the other hand, we had a globals infrastructure that actually
gained us something in terms of code simplicity, I might be able to
get behind that.  For instance, I could imagine something like this:

I915_DECL_SLAB(foo);

   /* Someone allocates something */
   kmem_cache_alloc(foo.slab);

where we somehow automagically declare the slab, initialize it on
module load, and tear it down on module exit.  That would add real
value.  As is, all i915_globals.c adds is extra layers.

--Jason


> I see r-b are accumulating but I hope reasonable objections will be
> considered.
>
> Regards,
>
> Tvrtko
>
> >
> > --Jason
> >
> >> That feels like the best of both worlds to me.
> >>
> >> Regards,
> >>
> >> Tvrtko
> >>
> >>>
> >>>> --Jason
> >>>>
> >>>>> Maybe add a cover letter to explain the perceived pros and cons and
> >>>>> thinking in general?
> >>>>>
> >>>>> Regards,
> >>>>>
> >>>>> Tvrtko
> >>>>>
> >>>>>>     #include "i915_perf.h"
> >>>>>>     #include "i915_globals.h"
> >>>>>>     #include "i915_selftest.h"
> >>>>>> @@ -1297,6 +1298,7 @@ static const struct {
> >>>>>>         { i915_check_nomodeset, NULL },
> >>>>>>         { i915_active_module_init, i915_active_module_exit },
> >>>>>>         { i915_buddy_module_init, i915_buddy_module_exit },
> >>>>>> +     { i915_context_module_init, i915_context_module_exit },
> >>>>>>         { i915_globals_init, i915_globals_exit },
> >>>>>>         { i915_mock_selftests, NULL },
> >>>>>>         { i915_pmu_init, i915_pmu_exit },
> >>>>>>
> >>>>> _______________________________________________
> >>>>> Intel-gfx mailing list
> >>>>> Intel-gfx at lists.freedesktop.org
> >>>>> https://lists.freedesktop.org/mailman/listinfo/intel-gfx


More information about the Intel-gfx mailing list