[Intel-gfx] [PATCH] drm/i915/gt: Add general DSS steering iterator to intel_gt_mcr
Matt Atwood
matthew.s.atwood at intel.com
Fri Jul 8 16:23:03 UTC 2022
On Fri, Jul 01, 2022 at 04:20:06PM -0700, Matt Roper wrote:
> Although all DSS belong to a single pool on Xe_HP platforms (i.e.,
> they're not organized into slices from a topology point of view), we do
> still need to pass 'group' and 'instance' targets when steering register
> accesses to a specific instance of a per-DSS multicast register. The
> rules for how to determine group and instance IDs (which previously used
> legacy terms "slice" and "subslice") varies by platform. Some platforms
> determine steering by gslice membership, some platforms by cslice
> membership, and future platforms may have other rules.
>
> Since looping over each DSS and performing steered unicast register
> accesses is a relatively common pattern, let's add a dedicated iteration
> macro to handle this (and replace the platform-specific "instdone" loop
> we were using previously. This will avoid the calling code needing to
> figure out the details about how to obtain steering IDs for a specific
> DSS.
>
> Most of the places where we use this new loop are in the GPU errorstate
> code at the moment, but we do have some additional features coming in
> the future that will also need to loop over each DSS and steer some
> register accesses accordingly.
>
Reviewed-by: Matt Atwood <matthew.s.atwood at intel.com>
> Signed-off-by: Matt Roper <matthew.d.roper at intel.com>
> ---
> drivers/gpu/drm/i915/gt/intel_engine_cs.c | 34 ++++++-------------
> drivers/gpu/drm/i915/gt/intel_engine_types.h | 22 ------------
> drivers/gpu/drm/i915/gt/intel_gt_mcr.c | 25 ++++++++++++++
> drivers/gpu/drm/i915/gt/intel_gt_mcr.h | 24 +++++++++++++
> .../gpu/drm/i915/gt/uc/intel_guc_capture.c | 13 ++++---
> drivers/gpu/drm/i915/i915_gpu_error.c | 32 ++++++-----------
> 6 files changed, 75 insertions(+), 75 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/gt/intel_engine_cs.c b/drivers/gpu/drm/i915/gt/intel_engine_cs.c
> index 283870c65991..37fa813af766 100644
> --- a/drivers/gpu/drm/i915/gt/intel_engine_cs.c
> +++ b/drivers/gpu/drm/i915/gt/intel_engine_cs.c
> @@ -1517,7 +1517,6 @@ void intel_engine_get_instdone(const struct intel_engine_cs *engine,
> struct intel_instdone *instdone)
> {
> struct drm_i915_private *i915 = engine->i915;
> - const struct sseu_dev_info *sseu = &engine->gt->info.sseu;
> struct intel_uncore *uncore = engine->uncore;
> u32 mmio_base = engine->mmio_base;
> int slice;
> @@ -1542,32 +1541,19 @@ void intel_engine_get_instdone(const struct intel_engine_cs *engine,
> intel_uncore_read(uncore, GEN12_SC_INSTDONE_EXTRA2);
> }
>
> - if (GRAPHICS_VER_FULL(i915) >= IP_VER(12, 50)) {
> - for_each_instdone_gslice_dss_xehp(i915, sseu, iter, slice, subslice) {
> - instdone->sampler[slice][subslice] =
> - intel_gt_mcr_read(engine->gt,
> - GEN7_SAMPLER_INSTDONE,
> - slice, subslice);
> - instdone->row[slice][subslice] =
> - intel_gt_mcr_read(engine->gt,
> - GEN7_ROW_INSTDONE,
> - slice, subslice);
> - }
> - } else {
> - for_each_instdone_slice_subslice(i915, sseu, slice, subslice) {
> - instdone->sampler[slice][subslice] =
> - intel_gt_mcr_read(engine->gt,
> - GEN7_SAMPLER_INSTDONE,
> - slice, subslice);
> - instdone->row[slice][subslice] =
> - intel_gt_mcr_read(engine->gt,
> - GEN7_ROW_INSTDONE,
> - slice, subslice);
> - }
> + for_each_ss_steering(iter, engine->gt, slice, subslice) {
> + instdone->sampler[slice][subslice] =
> + intel_gt_mcr_read(engine->gt,
> + GEN7_SAMPLER_INSTDONE,
> + slice, subslice);
> + instdone->row[slice][subslice] =
> + intel_gt_mcr_read(engine->gt,
> + GEN7_ROW_INSTDONE,
> + slice, subslice);
> }
>
> if (GRAPHICS_VER_FULL(i915) >= IP_VER(12, 55)) {
> - for_each_instdone_gslice_dss_xehp(i915, sseu, iter, slice, subslice)
> + for_each_ss_steering(iter, engine->gt, slice, subslice)
> instdone->geom_svg[slice][subslice] =
> intel_gt_mcr_read(engine->gt,
> XEHPG_INSTDONE_GEOM_SVG,
> diff --git a/drivers/gpu/drm/i915/gt/intel_engine_types.h b/drivers/gpu/drm/i915/gt/intel_engine_types.h
> index 2286f96f5f87..633a7e5dba3b 100644
> --- a/drivers/gpu/drm/i915/gt/intel_engine_types.h
> +++ b/drivers/gpu/drm/i915/gt/intel_engine_types.h
> @@ -647,26 +647,4 @@ intel_engine_uses_wa_hold_ccs_switchout(struct intel_engine_cs *engine)
> return engine->flags & I915_ENGINE_USES_WA_HOLD_CCS_SWITCHOUT;
> }
>
> -#define instdone_has_slice(dev_priv___, sseu___, slice___) \
> - ((GRAPHICS_VER(dev_priv___) == 7 ? 1 : ((sseu___)->slice_mask)) & BIT(slice___))
> -
> -#define instdone_has_subslice(dev_priv__, sseu__, slice__, subslice__) \
> - (GRAPHICS_VER(dev_priv__) == 7 ? (1 & BIT(subslice__)) : \
> - intel_sseu_has_subslice(sseu__, 0, subslice__))
> -
> -#define for_each_instdone_slice_subslice(dev_priv_, sseu_, slice_, subslice_) \
> - for ((slice_) = 0, (subslice_) = 0; (slice_) < I915_MAX_SLICES; \
> - (subslice_) = ((subslice_) + 1) % I915_MAX_SUBSLICES, \
> - (slice_) += ((subslice_) == 0)) \
> - for_each_if((instdone_has_slice(dev_priv_, sseu_, slice_)) && \
> - (instdone_has_subslice(dev_priv_, sseu_, slice_, \
> - subslice_)))
> -
> -#define for_each_instdone_gslice_dss_xehp(dev_priv_, sseu_, iter_, gslice_, dss_) \
> - for ((iter_) = 0, (gslice_) = 0, (dss_) = 0; \
> - (iter_) < GEN_SS_MASK_SIZE; \
> - (iter_)++, (gslice_) = (iter_) / GEN_DSS_PER_GSLICE, \
> - (dss_) = (iter_) % GEN_DSS_PER_GSLICE) \
> - for_each_if(intel_sseu_has_subslice((sseu_), 0, (iter_)))
> -
> #endif /* __INTEL_ENGINE_TYPES_H__ */
> diff --git a/drivers/gpu/drm/i915/gt/intel_gt_mcr.c b/drivers/gpu/drm/i915/gt/intel_gt_mcr.c
> index 777025d5bd66..f8c64ab9d3ca 100644
> --- a/drivers/gpu/drm/i915/gt/intel_gt_mcr.c
> +++ b/drivers/gpu/drm/i915/gt/intel_gt_mcr.c
> @@ -495,3 +495,28 @@ void intel_gt_mcr_report_steering(struct drm_printer *p, struct intel_gt *gt,
> }
> }
>
> +/**
> + * intel_gt_mcr_get_ss_steering - returns the group/instance steering for a SS
> + * @gt: GT structure
> + * @dss: DSS ID to obtain steering for
> + * @group: pointer to storage for steering group ID
> + * @instance: pointer to storage for steering instance ID
> + *
> + * Returns the steering IDs (via the @group and @instance parameters) that
> + * correspond to a specific subslice/DSS ID.
> + */
> +void intel_gt_mcr_get_ss_steering(struct intel_gt *gt, unsigned int dss,
> + unsigned int *group, unsigned int *instance)
> +{
> + if (IS_PONTEVECCHIO(gt->i915)) {
> + *group = dss / GEN_DSS_PER_CSLICE;
> + *instance = dss % GEN_DSS_PER_CSLICE;
> + } else if (GRAPHICS_VER_FULL(gt->i915) >= IP_VER(12, 50)) {
> + *group = dss / GEN_DSS_PER_GSLICE;
> + *instance = dss % GEN_DSS_PER_GSLICE;
> + } else {
> + *group = dss / GEN_MAX_HSW_SLICES;
> + *instance = dss % GEN_MAX_SS_PER_HSW_SLICE;
> + return;
> + }
> +}
> diff --git a/drivers/gpu/drm/i915/gt/intel_gt_mcr.h b/drivers/gpu/drm/i915/gt/intel_gt_mcr.h
> index 506b0cbc8db3..77a8b11c287d 100644
> --- a/drivers/gpu/drm/i915/gt/intel_gt_mcr.h
> +++ b/drivers/gpu/drm/i915/gt/intel_gt_mcr.h
> @@ -31,4 +31,28 @@ void intel_gt_mcr_get_nonterminated_steering(struct intel_gt *gt,
> void intel_gt_mcr_report_steering(struct drm_printer *p, struct intel_gt *gt,
> bool dump_table);
>
> +void intel_gt_mcr_get_ss_steering(struct intel_gt *gt, unsigned int dss,
> + unsigned int *group, unsigned int *instance);
> +
> +/*
> + * Helper for for_each_ss_steering loop. On pre-Xe_HP platforms, subslice
> + * presence is determined by using the group/instance as direct lookups in the
> + * slice/subslice topology. On Xe_HP and beyond, the steering is unrelated to
> + * the topology, so we lookup the DSS ID directly in "slice 0."
> + */
> +#define _HAS_SS(ss_, gt_, group_, instance_) ( \
> + GRAPHICS_VER_FULL(gt_->i915) >= IP_VER(12, 50) ? \
> + intel_sseu_has_subslice(&(gt_)->info.sseu, 0, ss_) : \
> + intel_sseu_has_subslice(&(gt_)->info.sseu, group_, instance_))
> +
> +/*
> + * Loop over each subslice/DSS and determine the group and instance IDs that
> + * should be used to steer MCR accesses toward this DSS.
> + */
> +#define for_each_ss_steering(ss_, gt_, group_, instance_) \
> + for (ss_ = 0, intel_gt_mcr_get_ss_steering(gt_, 0, &group_, &instance_); \
> + ss_ < I915_MAX_SS_FUSE_BITS; \
> + ss_++, intel_gt_mcr_get_ss_steering(gt_, ss_, &group_, &instance_)) \
> + for_each_if(_HAS_SS(ss_, gt_, group_, instance_))
> +
> #endif /* __INTEL_GT_MCR__ */
> diff --git a/drivers/gpu/drm/i915/gt/uc/intel_guc_capture.c b/drivers/gpu/drm/i915/gt/uc/intel_guc_capture.c
> index 97a32e610c30..4e47d0a308f1 100644
> --- a/drivers/gpu/drm/i915/gt/uc/intel_guc_capture.c
> +++ b/drivers/gpu/drm/i915/gt/uc/intel_guc_capture.c
> @@ -9,6 +9,7 @@
>
> #include "gt/intel_engine_regs.h"
> #include "gt/intel_gt.h"
> +#include "gt/intel_gt_mcr.h"
> #include "gt/intel_gt_regs.h"
> #include "gt/intel_lrc.h"
> #include "guc_capture_fwif.h"
> @@ -281,8 +282,7 @@ guc_capture_alloc_steered_lists_xe_lpd(struct intel_guc *guc,
> const struct __guc_mmio_reg_descr_group *lists)
> {
> struct intel_gt *gt = guc_to_gt(guc);
> - struct drm_i915_private *i915 = guc_to_gt(guc)->i915;
> - int slice, subslice, i, num_steer_regs, num_tot_regs = 0;
> + int slice, subslice, iter, i, num_steer_regs, num_tot_regs = 0;
> const struct __guc_mmio_reg_descr_group *list;
> struct __guc_mmio_reg_descr_group *extlists;
> struct __guc_mmio_reg_descr *extarray;
> @@ -298,7 +298,7 @@ guc_capture_alloc_steered_lists_xe_lpd(struct intel_guc *guc,
> num_steer_regs = ARRAY_SIZE(xe_extregs);
>
> sseu = >->info.sseu;
> - for_each_instdone_slice_subslice(i915, sseu, slice, subslice)
> + for_each_ss_steering(iter, gt, slice, subslice)
> num_tot_regs += num_steer_regs;
>
> if (!num_tot_regs)
> @@ -315,7 +315,7 @@ guc_capture_alloc_steered_lists_xe_lpd(struct intel_guc *guc,
> }
>
> extarray = extlists[0].extlist;
> - for_each_instdone_slice_subslice(i915, sseu, slice, subslice) {
> + for_each_ss_steering(iter, gt, slice, subslice) {
> for (i = 0; i < num_steer_regs; ++i) {
> __fill_ext_reg(extarray, &xe_extregs[i], slice, subslice);
> ++extarray;
> @@ -359,9 +359,8 @@ guc_capture_alloc_steered_lists_xe_hpg(struct intel_guc *guc,
> num_steer_regs += ARRAY_SIZE(xehpg_extregs);
>
> sseu = >->info.sseu;
> - for_each_instdone_gslice_dss_xehp(i915, sseu, iter, slice, subslice) {
> + for_each_ss_steering(iter, gt, slice, subslice)
> num_tot_regs += num_steer_regs;
> - }
>
> if (!num_tot_regs)
> return;
> @@ -377,7 +376,7 @@ guc_capture_alloc_steered_lists_xe_hpg(struct intel_guc *guc,
> }
>
> extarray = extlists[0].extlist;
> - for_each_instdone_gslice_dss_xehp(i915, sseu, iter, slice, subslice) {
> + for_each_ss_steering(iter, gt, slice, subslice) {
> for (i = 0; i < ARRAY_SIZE(xe_extregs); ++i) {
> __fill_ext_reg(extarray, &xe_extregs[i], slice, subslice);
> ++extarray;
> diff --git a/drivers/gpu/drm/i915/i915_gpu_error.c b/drivers/gpu/drm/i915/i915_gpu_error.c
> index 52ea13fee015..32e92651ef7c 100644
> --- a/drivers/gpu/drm/i915/i915_gpu_error.c
> +++ b/drivers/gpu/drm/i915/i915_gpu_error.c
> @@ -46,6 +46,7 @@
> #include "gem/i915_gem_lmem.h"
> #include "gt/intel_engine_regs.h"
> #include "gt/intel_gt.h"
> +#include "gt/intel_gt_mcr.h"
> #include "gt/intel_gt_pm.h"
> #include "gt/intel_gt_regs.h"
> #include "gt/uc/intel_guc_capture.h"
> @@ -436,7 +437,6 @@ static void err_compression_marker(struct drm_i915_error_state_buf *m)
> static void error_print_instdone(struct drm_i915_error_state_buf *m,
> const struct intel_engine_coredump *ee)
> {
> - const struct sseu_dev_info *sseu = &ee->engine->gt->info.sseu;
> int slice;
> int subslice;
> int iter;
> @@ -453,33 +453,21 @@ static void error_print_instdone(struct drm_i915_error_state_buf *m,
> if (GRAPHICS_VER(m->i915) <= 6)
> return;
>
> - if (GRAPHICS_VER_FULL(m->i915) >= IP_VER(12, 50)) {
> - for_each_instdone_gslice_dss_xehp(m->i915, sseu, iter, slice, subslice)
> - err_printf(m, " SAMPLER_INSTDONE[%d][%d]: 0x%08x\n",
> - slice, subslice,
> - ee->instdone.sampler[slice][subslice]);
> + for_each_ss_steering(iter, ee->engine->gt, slice, subslice)
> + err_printf(m, " SAMPLER_INSTDONE[%d][%d]: 0x%08x\n",
> + slice, subslice,
> + ee->instdone.sampler[slice][subslice]);
>
> - for_each_instdone_gslice_dss_xehp(m->i915, sseu, iter, slice, subslice)
> - err_printf(m, " ROW_INSTDONE[%d][%d]: 0x%08x\n",
> - slice, subslice,
> - ee->instdone.row[slice][subslice]);
> - } else {
> - for_each_instdone_slice_subslice(m->i915, sseu, slice, subslice)
> - err_printf(m, " SAMPLER_INSTDONE[%d][%d]: 0x%08x\n",
> - slice, subslice,
> - ee->instdone.sampler[slice][subslice]);
> -
> - for_each_instdone_slice_subslice(m->i915, sseu, slice, subslice)
> - err_printf(m, " ROW_INSTDONE[%d][%d]: 0x%08x\n",
> - slice, subslice,
> - ee->instdone.row[slice][subslice]);
> - }
> + for_each_ss_steering(iter, ee->engine->gt, slice, subslice)
> + err_printf(m, " ROW_INSTDONE[%d][%d]: 0x%08x\n",
> + slice, subslice,
> + ee->instdone.row[slice][subslice]);
>
> if (GRAPHICS_VER(m->i915) < 12)
> return;
>
> if (GRAPHICS_VER_FULL(m->i915) >= IP_VER(12, 55)) {
> - for_each_instdone_gslice_dss_xehp(m->i915, sseu, iter, slice, subslice)
> + for_each_ss_steering(iter, ee->engine->gt, slice, subslice)
> err_printf(m, " GEOM_SVGUNIT_INSTDONE[%d][%d]: 0x%08x\n",
> slice, subslice,
> ee->instdone.geom_svg[slice][subslice]);
> --
> 2.36.1
>
More information about the Intel-gfx
mailing list