[PATCH 6/8] drm/i915/xehp: Define context scheduling attributes in lrc descriptor
Tvrtko Ursulin
tvrtko.ursulin at linux.intel.com
Wed Sep 8 14:01:08 UTC 2021
On 07/09/2021 18:19, Matt Roper wrote:
> In Dual Context mode the EUs are shared between render and compute
> command streamers. The hardware provides a field in the lrc descriptor
> to indicate the prioritization of the thread dispatch associated to the
> corresponding context.
>
> The context priority is set to 'low' at creation time and relies on the
> existing context priority to set it to low/normal/high.
>
> HSDES: 1604462009
> Bspec: 46145, 46260
> Original-patch-by: Michel Thierry
> Cc: Tvrtko Ursulin <tvrtko.ursulin at linux.intel.com>
> Signed-off-by: Aravind Iddamsetty <aravind.iddamsetty at intel.com>
> Signed-off-by: Prasad Nallani <prasad.nallani at intel.com>
> Signed-off-by: Matt Roper <matthew.d.roper at intel.com>
> ---
> drivers/gpu/drm/i915/gt/intel_engine_cs.c | 4 +++-
> drivers/gpu/drm/i915/gt/intel_engine_types.h | 1 +
> drivers/gpu/drm/i915/gt/intel_execlists_submission.c | 6 +++++-
> drivers/gpu/drm/i915/gt/intel_lrc.h | 10 ++++++++++
> drivers/gpu/drm/i915/i915_reg.h | 4 ++++
> 5 files changed, 23 insertions(+), 2 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/gt/intel_engine_cs.c b/drivers/gpu/drm/i915/gt/intel_engine_cs.c
> index b346b946602d..2f719f0ecac3 100644
> --- a/drivers/gpu/drm/i915/gt/intel_engine_cs.c
> +++ b/drivers/gpu/drm/i915/gt/intel_engine_cs.c
> @@ -382,8 +382,10 @@ static int intel_engine_setup(struct intel_gt *gt, enum intel_engine_id id)
> engine->props.preempt_timeout_ms = 0;
>
> /* features common between engines sharing EUs */
> - if (engine->class == RENDER_CLASS || engine->class == COMPUTE_CLASS)
> + if (engine->class == RENDER_CLASS || engine->class == COMPUTE_CLASS) {
> engine->flags |= I915_ENGINE_HAS_RCS_REG_STATE;
> + engine->flags |= I915_ENGINE_HAS_EU_PRIORITY;
> + }
>
> engine->defaults = engine->props; /* never to change again */
>
> diff --git a/drivers/gpu/drm/i915/gt/intel_engine_types.h b/drivers/gpu/drm/i915/gt/intel_engine_types.h
> index 30a0c69c36c8..00bf0296b28a 100644
> --- a/drivers/gpu/drm/i915/gt/intel_engine_types.h
> +++ b/drivers/gpu/drm/i915/gt/intel_engine_types.h
> @@ -455,6 +455,7 @@ struct intel_engine_cs {
> #define I915_ENGINE_REQUIRES_CMD_PARSER BIT(7)
> #define I915_ENGINE_WANT_FORCED_PREEMPTION BIT(8)
> #define I915_ENGINE_HAS_RCS_REG_STATE BIT(9)
> +#define I915_ENGINE_HAS_EU_PRIORITY BIT(10)
> unsigned int flags;
>
> /*
> diff --git a/drivers/gpu/drm/i915/gt/intel_execlists_submission.c b/drivers/gpu/drm/i915/gt/intel_execlists_submission.c
> index 4c600c46414d..2b36ec7f3a04 100644
> --- a/drivers/gpu/drm/i915/gt/intel_execlists_submission.c
> +++ b/drivers/gpu/drm/i915/gt/intel_execlists_submission.c
> @@ -662,9 +662,13 @@ static inline void execlists_schedule_out(struct i915_request *rq)
> static u64 execlists_update_context(struct i915_request *rq)
> {
> struct intel_context *ce = rq->context;
> - u64 desc = ce->lrc.desc;
> + u64 desc;
> u32 tail, prev;
>
> + desc = ce->lrc.desc;
> + if (rq->engine->flags & I915_ENGINE_HAS_EU_PRIORITY)
> + desc |= lrc_desc_priority(rq_prio(rq));
> +
> /*
> * WaIdleLiteRestore:bdw,skl
> *
> diff --git a/drivers/gpu/drm/i915/gt/intel_lrc.h b/drivers/gpu/drm/i915/gt/intel_lrc.h
> index 7f697845c4cf..d3f2096b3d51 100644
> --- a/drivers/gpu/drm/i915/gt/intel_lrc.h
> +++ b/drivers/gpu/drm/i915/gt/intel_lrc.h
> @@ -79,4 +79,14 @@ static inline u32 lrc_get_runtime(const struct intel_context *ce)
> return READ_ONCE(ce->lrc_reg_state[CTX_TIMESTAMP]);
> }
>
> +static inline u32 lrc_desc_priority(int prio)
> +{
> + if (prio > I915_PRIORITY_NORMAL)
> + return GEN12_CTX_PRIORITY_HIGH;
> + else if (prio < I915_PRIORITY_NORMAL)
> + return GEN12_CTX_PRIORITY_LOW;
> + else
> + return GEN12_CTX_PRIORITY_NORMAL;
> +}
> +
> #endif /* __INTEL_LRC_H__ */
> diff --git a/drivers/gpu/drm/i915/i915_reg.h b/drivers/gpu/drm/i915/i915_reg.h
> index 0bb185ce9529..5b68c02c35af 100644
> --- a/drivers/gpu/drm/i915/i915_reg.h
> +++ b/drivers/gpu/drm/i915/i915_reg.h
> @@ -4212,6 +4212,10 @@ enum {
> #define GEN8_CTX_L3LLC_COHERENT (1 << 5)
> #define GEN8_CTX_PRIVILEGE (1 << 8)
> #define GEN8_CTX_ADDRESSING_MODE_SHIFT 3
> +#define GEN12_CTX_PRIORITY_MASK REG_GENMASK(10, 9)
> +#define GEN12_CTX_PRIORITY_HIGH REG_FIELD_PREP(GEN12_CTX_PRIORITY_MASK, 2)
> +#define GEN12_CTX_PRIORITY_NORMAL REG_FIELD_PREP(GEN12_CTX_PRIORITY_MASK, 1)
> +#define GEN12_CTX_PRIORITY_LOW REG_FIELD_PREP(GEN12_CTX_PRIORITY_MASK, 0)
>
> #define GEN8_CTX_ID_SHIFT 32
> #define GEN8_CTX_ID_WIDTH 21
>
Haven't checked bspec to check the bitfield but the mechanics look good.
Reviewed-by: Tvrtko Ursulin <tvrtko.ursulin at intel.com>
Regards,
Tvrtko
More information about the dri-devel
mailing list