[Intel-xe] [PATCH 03/15] drm/xe/xe2: Add MCR register steering for primary GT

Balasubramani Vivekanandan balasubramani.vivekanandan at intel.com
Fri Aug 18 06:11:33 UTC 2023


On 17.08.2023 07:47, Lucas De Marchi wrote:
> On Wed, Aug 16, 2023 at 03:27:54PM -0700, Matt Atwood wrote:
> > On Fri, Aug 11, 2023 at 09:06:06AM -0700, Lucas De Marchi wrote:
> > > From: Matt Roper <matthew.d.roper at intel.com>
> > > 
> > > Xe2 uses the same steering control register and steering semaphore
> > > register as MTL.  As with recent platforms, group/instance 0,0 is
> > > sufficient to target a non-terminated instance for most classes of MCR
> > > registers; the only types of ranges that need to consider platform
> > > fusing to find a non-terminated instance are SLICE/DSS ranges and a new
> > > SQIDI_PSMI type of range.
> > > 
> > > Note that the range of valid bits in XE2_NODE_ENABLE_MASK may be reduced
> > > for some Xe2 SKUs.  However the lowest bits are always valid and only
> > > the lowest instance is obtained via __ffs(), so there's no need to
> > > complicate the masking with extra platform/subplatform checks.
> > > 
> > > Also note that Wa_14017387313 suggests skipping MCR lock acquisition
> > > around GAM and GAMWKR registers to prevent MCR register accesses in an
> > > interrupt handler from deadlocking when the steering semaphore is
> > > already held outside the interrupt context.  At this time Xe never
> > > issues MCR accesses from within an interrupt handler so the workaround
> > > is not currently needed.
> > > 
> > > Bspec: 71185
> > > Signed-off-by: Matt Roper <matthew.d.roper at intel.com>
> > > Signed-off-by: Lucas De Marchi <lucas.demarchi at intel.com>
> > > ---
> > >  drivers/gpu/drm/xe/regs/xe_gt_regs.h |  1 +
> > >  drivers/gpu/drm/xe/xe_gt_mcr.c       | 50 +++++++++++++++++++++++++++-
> > >  drivers/gpu/drm/xe/xe_gt_types.h     |  1 +
> > >  3 files changed, 51 insertions(+), 1 deletion(-)
> > > 
> > > diff --git a/drivers/gpu/drm/xe/regs/xe_gt_regs.h b/drivers/gpu/drm/xe/regs/xe_gt_regs.h
> > > index ad7ae6a28caca..5bc6c7fa4759f 100644
> > > --- a/drivers/gpu/drm/xe/regs/xe_gt_regs.h
> > > +++ b/drivers/gpu/drm/xe/regs/xe_gt_regs.h
> > > @@ -145,6 +145,7 @@
> > >  #define   EN_32B_ACCESS				REG_BIT(30)
> > > 
> > >  #define	MIRROR_FUSE3				XE_REG(0x9118)
> > > +#define   XE2_NODE_ENABLE_MASK			REG_GENMASK(31, 16)
> > >  #define   L3BANK_PAIR_COUNT			4
> > >  #define   L3BANK_MASK				REG_GENMASK(3, 0)
> > >  /* on Xe_HP the same fuses indicates mslices instead of L3 banks */
> > > diff --git a/drivers/gpu/drm/xe/xe_gt_mcr.c b/drivers/gpu/drm/xe/xe_gt_mcr.c
> > > index 9eb7a6a1348d6..ef9f4044ca1fd 100644
> > > --- a/drivers/gpu/drm/xe/xe_gt_mcr.c
> > > +++ b/drivers/gpu/drm/xe/xe_gt_mcr.c
> > > @@ -181,6 +181,39 @@ static const struct xe_mmio_range dg2_implicit_steering_table[] = {
> > >  	{},
> > >  };
> > > 
> > > +static const struct xe_mmio_range xe2lpg_dss_steering_table[] = {
> > > +	{ 0x005200, 0x0052FF },         /* SLICE */
> > > +	{ 0x005500, 0x007FFF },         /* SLICE */
> > > +	{ 0x008140, 0x00815F },         /* SLICE (0x8140-0x814F), DSS (0x8150-0x815F) */
> > > +	{ 0x0094D0, 0x00955F },         /* SLICE (0x94D0-0x951F), DSS (0x9520-0x955F) */
> > > +	{ 0x009680, 0x0096FF },         /* DSS */
> > > +	{ 0x00D800, 0x00D87F },         /* SLICE */
> > > +	{ 0x00DC00, 0x00DCFF },         /* SLICE */
> > > +	{ 0x00DE80, 0x00E8FF },         /* DSS (0xE000-0xE0FF reserved) */
> > > +	{ 0x00E980, 0x00E9FF },         /* SLICE */
> > > +	{ 0x013000, 0x0133FF },         /* DSS (0x13000-0x131FF), SLICE (0x13200-0x133FF) */
> > > +	{},
> > > +};
> > > +
> > > +static const struct xe_mmio_range xe2lpg_sqidi_psmi_steering_table[] = {
> > > +	{ 0x000B00, 0x000BFF },
> > > +	{ 0x001000, 0x001FFF },
> > > +	{},
> > > +};
> > > +
> > > +static const struct xe_mmio_range xe2lpg_instance0_steering_table[] = {
> > > +	{ 0x004000, 0x004AFF },         /* GAM, rsvd, GAMWKR */
> > 						^(4200->43FF reserved)
> 
> This is intended so we have simpler ranges to look up on every MCR
> register access. Intention is to keep the table as small as possible
> without causing issues.
> 
> If it's reserved, there shouldn't be any access going on and we can
> coalesce the range with the next ranges. Explicitly leaving out the
> rsvd range would benefit debugging as it would automatically create a
> warning when accessing such a register, but I'm not sure it's worth it.
> Matt Roper, any thoughts?
> 
> > > +	{ 0x008700, 0x0087FF },         /* SQIDI, MEMPIPE */
> > 8700->87FF is SQIDI only, to include MEMPIPE entry extend to 887F.
> 
> ack
> 
> > > +	{ 0x00B000, 0x00B3FF },         /* NODE, L3BANK */
> > > +	{ 0x00C800, 0x00CFFF },         /* GAM */
> > > +	{ 0x00D880, 0x00D8FF },         /* NODE */
> > > +	{ 0x00DD00, 0x00DDFF },         /* MEMPIPE */
> > > +	{ 0x00E900, 0x00E97F },         /* MEMPIPE */
> > > +	{ 0x00EF00, 0x00F4FF },         /* GAM, GAMWKR */
> > GAM starts at F000, EF00->EFFF is reserved.
> 
> same reason as above, we don't care about the reserved "holes"

I guess the above range was calculated without using the project filter in
the Bspec. After applying the filter for LunarLake, the range turns out
to be

 { 0x00F000, 0x00FFFF },         /* GAM, GAMWKR */

Regards,
Bala

> 
> thanks
> Lucas De Marchi
> 
> > > +	{ 0x013400, 0x0135FF },         /* MEMPIPE */
> > > +	{},
> > > +};
> > > +
> > >  static void init_steering_l3bank(struct xe_gt *gt)
> > >  {
> > >  	if (GRAPHICS_VERx100(gt_to_xe(gt)) >= 1270) {
> > > @@ -265,6 +298,16 @@ static void init_steering_oaddrm(struct xe_gt *gt)
> > >  	gt->steering[DSS].instance_target = 0;		/* unused */
> > >  }
> > > 
> > > +static void init_steering_sqidi_psmi(struct xe_gt *gt)
> > > +{
> > > +	u32 mask = REG_FIELD_GET(XE2_NODE_ENABLE_MASK,
> > > +				 xe_mmio_read32(gt, MIRROR_FUSE3));
> > > +	u32 select = __ffs(mask);
> > > +
> > > +	gt->steering[SQIDI_PSMI].group_target = select >> 1;
> > > +	gt->steering[SQIDI_PSMI].instance_target = select & 0x1;
> > > +}
> > > +
> > >  static void init_steering_inst0(struct xe_gt *gt)
> > >  {
> > >  	gt->steering[DSS].group_target = 0;		/* unused */
> > > @@ -280,6 +323,7 @@ static const struct {
> > >  	[LNCF] =	{ "LNCF",	NULL }, /* initialized by mslice init */
> > >  	[DSS] =		{ "DSS",	init_steering_dss },
> > >  	[OADDRM] =	{ "OADDRM",	init_steering_oaddrm },
> > > +	[SQIDI_PSMI] =  { "SQIDI_PSMI", init_steering_sqidi_psmi },
> > >  	[INSTANCE0] =	{ "INSTANCE 0",	init_steering_inst0 },
> > >  	[IMPLICIT_STEERING] = { "IMPLICIT", NULL },
> > >  };
> > > @@ -298,7 +342,11 @@ void xe_gt_mcr_init(struct xe_gt *gt)
> > > 
> > >  		gt->steering[OADDRM].ranges = xelpmp_oaddrm_steering_table;
> > >  	} else {
> > > -		if (GRAPHICS_VERx100(xe) >= 1270) {
> > > +		if (GRAPHICS_VER(xe) >= 20) {
> > > +			gt->steering[DSS].ranges = xe2lpg_dss_steering_table;
> > > +			gt->steering[SQIDI_PSMI].ranges = xe2lpg_sqidi_psmi_steering_table;
> > > +			gt->steering[INSTANCE0].ranges = xe2lpg_instance0_steering_table;
> > > +		} else if (GRAPHICS_VERx100(xe) >= 1270) {
> > >  			gt->steering[INSTANCE0].ranges = xelpg_instance0_steering_table;
> > >  			gt->steering[L3BANK].ranges = xelpg_l3bank_steering_table;
> > >  			gt->steering[DSS].ranges = xelpg_dss_steering_table;
> > > diff --git a/drivers/gpu/drm/xe/xe_gt_types.h b/drivers/gpu/drm/xe/xe_gt_types.h
> > > index 48fd698ff62aa..d4310be3e1e7c 100644
> > > --- a/drivers/gpu/drm/xe/xe_gt_types.h
> > > +++ b/drivers/gpu/drm/xe/xe_gt_types.h
> > > @@ -55,6 +55,7 @@ enum xe_steering_type {
> > >  	LNCF,
> > >  	DSS,
> > >  	OADDRM,
> > > +	SQIDI_PSMI,
> > > 
> > >  	/*
> > >  	 * On some platforms there are multiple types of MCR registers that
> > > --
> > > 2.40.1
> > > 


More information about the Intel-xe mailing list