[Intel-gfx] [PATCH 1/2] drm/i915/pmu: Add a name to the execlists stats

Matthew Brost matthew.brost at intel.com
Wed Oct 27 18:56:26 UTC 2021


On Tue, Oct 26, 2021 at 05:48:20PM -0700, Umesh Nerlige Ramappa wrote:
> In preparation for GuC pmu stats, add a name to the execlists stats
> structure so that it can be differentiated from the GuC stats.
> 
> Signed-off-by: Umesh Nerlige Ramappa <umesh.nerlige.ramappa at intel.com>
> ---
>  drivers/gpu/drm/i915/gt/intel_engine_cs.c    | 14 +++---
>  drivers/gpu/drm/i915/gt/intel_engine_stats.h | 33 +++++++------
>  drivers/gpu/drm/i915/gt/intel_engine_types.h | 52 +++++++++++---------
>  3 files changed, 53 insertions(+), 46 deletions(-)
> 
> diff --git a/drivers/gpu/drm/i915/gt/intel_engine_cs.c b/drivers/gpu/drm/i915/gt/intel_engine_cs.c
> index ff6753ccb129..2de396e34d83 100644
> --- a/drivers/gpu/drm/i915/gt/intel_engine_cs.c
> +++ b/drivers/gpu/drm/i915/gt/intel_engine_cs.c
> @@ -363,7 +363,7 @@ static int intel_engine_setup(struct intel_gt *gt, enum intel_engine_id id,
>  		DRIVER_CAPS(i915)->has_logical_contexts = true;
>  
>  	ewma__engine_latency_init(&engine->latency);
> -	seqcount_init(&engine->stats.lock);
> +	seqcount_init(&engine->stats.execlists.lock);
>  
>  	ATOMIC_INIT_NOTIFIER_HEAD(&engine->context_status_notifier);
>  
> @@ -1918,15 +1918,16 @@ void intel_engine_dump(struct intel_engine_cs *engine,
>  static ktime_t __intel_engine_get_busy_time(struct intel_engine_cs *engine,
>  					    ktime_t *now)
>  {
> -	ktime_t total = engine->stats.total;
> +	struct intel_engine_execlists_stats *stats = &engine->stats.execlists;
> +	ktime_t total = stats->total;
>  
>  	/*
>  	 * If the engine is executing something at the moment
>  	 * add it to the total.
>  	 */
>  	*now = ktime_get();
> -	if (READ_ONCE(engine->stats.active))
> -		total = ktime_add(total, ktime_sub(*now, engine->stats.start));
> +	if (READ_ONCE(stats->active))
> +		total = ktime_add(total, ktime_sub(*now, stats->start));
>  
>  	return total;
>  }
> @@ -1940,13 +1941,14 @@ static ktime_t __intel_engine_get_busy_time(struct intel_engine_cs *engine,
>   */
>  ktime_t intel_engine_get_busy_time(struct intel_engine_cs *engine, ktime_t *now)
>  {
> +	struct intel_engine_execlists_stats *stats = &engine->stats.execlists;
>  	unsigned int seq;
>  	ktime_t total;
>  
>  	do {
> -		seq = read_seqcount_begin(&engine->stats.lock);
> +		seq = read_seqcount_begin(&stats->lock);
>  		total = __intel_engine_get_busy_time(engine, now);
> -	} while (read_seqcount_retry(&engine->stats.lock, seq));
> +	} while (read_seqcount_retry(&stats->lock, seq));
>  
>  	return total;
>  }
> diff --git a/drivers/gpu/drm/i915/gt/intel_engine_stats.h b/drivers/gpu/drm/i915/gt/intel_engine_stats.h
> index 24fbdd94351a..8e762d683e50 100644
> --- a/drivers/gpu/drm/i915/gt/intel_engine_stats.h
> +++ b/drivers/gpu/drm/i915/gt/intel_engine_stats.h
> @@ -15,45 +15,46 @@
>  
>  static inline void intel_engine_context_in(struct intel_engine_cs *engine)
>  {
> +	struct intel_engine_execlists_stats *stats = &engine->stats.execlists;
>  	unsigned long flags;
>  
> -	if (engine->stats.active) {
> -		engine->stats.active++;
> +	if (stats->active) {
> +		stats->active++;
>  		return;
>  	}
>  
>  	/* The writer is serialised; but the pmu reader may be from hardirq */
>  	local_irq_save(flags);
> -	write_seqcount_begin(&engine->stats.lock);
> +	write_seqcount_begin(&stats->lock);
>  
> -	engine->stats.start = ktime_get();
> -	engine->stats.active++;
> +	stats->start = ktime_get();
> +	stats->active++;
>  
> -	write_seqcount_end(&engine->stats.lock);
> +	write_seqcount_end(&stats->lock);
>  	local_irq_restore(flags);
>  
> -	GEM_BUG_ON(!engine->stats.active);
> +	GEM_BUG_ON(!stats->active);
>  }
>  
>  static inline void intel_engine_context_out(struct intel_engine_cs *engine)
>  {
> +	struct intel_engine_execlists_stats *stats = &engine->stats.execlists;
>  	unsigned long flags;
>  
> -	GEM_BUG_ON(!engine->stats.active);
> -	if (engine->stats.active > 1) {
> -		engine->stats.active--;
> +	GEM_BUG_ON(!stats->active);
> +	if (stats->active > 1) {
> +		stats->active--;
>  		return;
>  	}
>  
>  	local_irq_save(flags);
> -	write_seqcount_begin(&engine->stats.lock);
> +	write_seqcount_begin(&stats->lock);
>  
> -	engine->stats.active--;
> -	engine->stats.total =
> -		ktime_add(engine->stats.total,
> -			  ktime_sub(ktime_get(), engine->stats.start));
> +	stats->active--;
> +	stats->total = ktime_add(stats->total,
> +				 ktime_sub(ktime_get(), stats->start));
>  
> -	write_seqcount_end(&engine->stats.lock);
> +	write_seqcount_end(&stats->lock);
>  	local_irq_restore(flags);
>  }
>  
> diff --git a/drivers/gpu/drm/i915/gt/intel_engine_types.h b/drivers/gpu/drm/i915/gt/intel_engine_types.h
> index e0f773585c29..24fa7fb0e7de 100644
> --- a/drivers/gpu/drm/i915/gt/intel_engine_types.h
> +++ b/drivers/gpu/drm/i915/gt/intel_engine_types.h
> @@ -257,6 +257,33 @@ struct intel_engine_execlists {
>  
>  #define INTEL_ENGINE_CS_MAX_NAME 8
>  
> +struct intel_engine_execlists_stats {
> +	/**
> +	 * @active: Number of contexts currently scheduled in.
> +	 */
> +	unsigned int active;
> +
> +	/**
> +	 * @lock: Lock protecting the below fields.
> +	 */
> +	seqcount_t lock;
> +
> +	/**
> +	 * @total: Total time this engine was busy.
> +	 *
> +	 * Accumulated time not counting the most recent block in cases where
> +	 * engine is currently busy (active > 0).
> +	 */
> +	ktime_t total;
> +
> +	/**
> +	 * @start: Timestamp of the last idle to active transition.
> +	 *
> +	 * Idle is defined as active == 0, active is active > 0.
> +	 */
> +	ktime_t start;
> +};
> +
>  struct intel_engine_cs {
>  	struct drm_i915_private *i915;
>  	struct intel_gt *gt;
> @@ -488,30 +515,7 @@ struct intel_engine_cs {
>  	u32 (*get_cmd_length_mask)(u32 cmd_header);
>  
>  	struct {
> -		/**
> -		 * @active: Number of contexts currently scheduled in.
> -		 */
> -		unsigned int active;
> -
> -		/**
> -		 * @lock: Lock protecting the below fields.
> -		 */
> -		seqcount_t lock;
> -
> -		/**
> -		 * @total: Total time this engine was busy.
> -		 *
> -		 * Accumulated time not counting the most recent block in cases
> -		 * where engine is currently busy (active > 0).
> -		 */
> -		ktime_t total;
> -
> -		/**
> -		 * @start: Timestamp of the last idle to active transition.
> -		 *
> -		 * Idle is defined as active == 0, active is active > 0.
> -		 */
> -		ktime_t start;
> +		struct intel_engine_execlists_stats execlists;

I'd probably just define this sub-structure inline rather defining it
above. e.g.

struct {
	struct {
		fields...
	} execlists;
} stats;

Then the follow up patch:

union {
	struct {
		fields...
	} execlists;
	struct {
		fields...
	} guc;
} stats;

Or if there is common fields:

struct {
	common fields...
	struct {
		fields...
	} execlists;
	struct {
		fields...
	} guc;
} stats;

That being said, if you prefer to leave it as is, that's fine too.

With that:
Reviewed-by: Matthew Brost <matthew.brost at intel.com>

>  
>  		/**
>  		 * @rps: Utilisation at last RPS sampling.
> -- 
> 2.20.1
> 


More information about the Intel-gfx mailing list