[Intel-gfx] [PATCH v2 3/6] drm/i915: Make shadow tables range-based
Yokoyama, Caz
caz.yokoyama at intel.com
Thu Jul 29 21:55:17 UTC 2021
On Thu, 2021-07-29 at 08:21 -0700, Matt Roper wrote:
> Rather than defining our shadow tables as a list of individual
> registers, provide them as a list of register ranges; we'll have some
> ranges of multiple registers being added soon (and we already have a
> couple adjacent registers that we can squash into a single range
> now).
>
> This change also defines the table with hex literal values rather
> than
> symbolic register names; since that's how the tables are defined in
> the
> bspec, this change will make it easier to review the tables overall.
>
> v2:
> - Force signed comparison on range overlap sanity check
>
> Signed-off-by: Matt Roper <matthew.d.roper at intel.com>
> ---
> drivers/gpu/drm/i915/gt/intel_workarounds.c | 13 +-
> drivers/gpu/drm/i915/intel_uncore.c | 160 +++++++++-------
> --
> drivers/gpu/drm/i915/intel_uncore.h | 6 +
> drivers/gpu/drm/i915/selftests/intel_uncore.c | 32 ++--
> 4 files changed, 108 insertions(+), 103 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/gt/intel_workarounds.c
> b/drivers/gpu/drm/i915/gt/intel_workarounds.c
> index 9173df59821a..7558414bafb2 100644
> --- a/drivers/gpu/drm/i915/gt/intel_workarounds.c
> +++ b/drivers/gpu/drm/i915/gt/intel_workarounds.c
> @@ -1963,12 +1963,7 @@ void intel_engine_apply_workarounds(struct
> intel_engine_cs *engine)
> wa_list_apply(engine->gt, &engine->wa_list);
> }
>
> -struct mcr_range {
> - u32 start;
> - u32 end;
> -};
> -
> -static const struct mcr_range mcr_ranges_gen8[] = {
> +static const struct i915_range mcr_ranges_gen8[] = {
> { .start = 0x5500, .end = 0x55ff },
> { .start = 0x7000, .end = 0x7fff },
> { .start = 0x9400, .end = 0x97ff },
> @@ -1977,7 +1972,7 @@ static const struct mcr_range mcr_ranges_gen8[]
> = {
> {},
> };
>
> -static const struct mcr_range mcr_ranges_gen12[] = {
> +static const struct i915_range mcr_ranges_gen12[] = {
> { .start = 0x8150, .end = 0x815f },
> { .start = 0x9520, .end = 0x955f },
> { .start = 0xb100, .end = 0xb3ff },
> @@ -1986,7 +1981,7 @@ static const struct mcr_range
> mcr_ranges_gen12[] = {
> {},
> };
>
> -static const struct mcr_range mcr_ranges_xehp[] = {
> +static const struct i915_range mcr_ranges_xehp[] = {
> { .start = 0x4000, .end = 0x4aff },
> { .start = 0x5200, .end = 0x52ff },
> { .start = 0x5400, .end = 0x7fff },
> @@ -2004,7 +1999,7 @@ static const struct mcr_range mcr_ranges_xehp[]
> = {
>
> static bool mcr_range(struct drm_i915_private *i915, u32 offset)
> {
> - const struct mcr_range *mcr_ranges;
> + const struct i915_range *mcr_ranges;
> int i;
>
> if (GRAPHICS_VER_FULL(i915) >= IP_VER(12, 50))
> diff --git a/drivers/gpu/drm/i915/intel_uncore.c
> b/drivers/gpu/drm/i915/intel_uncore.c
> index ea910f7ee635..2cfbc16f7dee 100644
> --- a/drivers/gpu/drm/i915/intel_uncore.c
> +++ b/drivers/gpu/drm/i915/intel_uncore.c
> @@ -946,101 +946,95 @@ static const struct intel_forcewake_range
> __vlv_fw_ranges[] = {
> find_fw_domain(uncore, offset)
>
> /* *Must* be sorted by offset! See intel_shadow_table_check(). */
> -static const i915_reg_t gen8_shadowed_regs[] = {
> - RING_TAIL(RENDER_RING_BASE), /* 0x2000 (base) */
> - GEN6_RPNSWREQ, /* 0xA008 *
> - GEN6_RC_VIDEO_FREQ, /* 0xA00C */
> - RING_TAIL(GEN6_BSD_RING_BASE), /* 0x12000 (base) */
> - RING_TAIL(VEBOX_RING_BASE), /* 0x1a000 (base) */
> - RING_TAIL(BLT_RING_BASE), /* 0x22000 (base) */
> +static const struct i915_range gen8_shadowed_regs[] = {
> + { .start = 0x2030, .end = 0x2030 },
> + { .start = 0xA008, .end = 0xA00C },
> + { .start = 0x12030, .end = 0x12030 },
> + { .start = 0x1a030, .end = 0x1a030 },
> + { .start = 0x22030, .end = 0x22030 },
You are replacing macro defined values by literal values. These macro
defined values are no longer used in this patch, but used in other
places such as intel_rps.c:gen6_rps_set(). What plan do you have about
the same address is defined in 2 ways, i.e. macro and literal value?
-caz
> /* TODO: Other registers are not yet used */
> };
>
> -static const i915_reg_t gen11_shadowed_regs[] = {
> - RING_TAIL(RENDER_RING_BASE), /* 0x2000
> (base) */
> - RING_EXECLIST_CONTROL(RENDER_RING_BASE), /* 0x2550 */
> - GEN6_RPNSWREQ, /* 0xA008 */
> - GEN6_RC_VIDEO_FREQ, /* 0xA00C */
> - RING_TAIL(BLT_RING_BASE), /* 0x22000 (base) */
> - RING_EXECLIST_CONTROL(BLT_RING_BASE), /* 0x22550 */
> - RING_TAIL(GEN11_BSD_RING_BASE), /* 0x1C0000
> (base) */
> - RING_EXECLIST_CONTROL(GEN11_BSD_RING_BASE), /* 0x1C0550
> */
> - RING_TAIL(GEN11_BSD2_RING_BASE), /* 0x1C4000 (base) */
> - RING_EXECLIST_CONTROL(GEN11_BSD2_RING_BASE), /* 0x1C4550
> */
> - RING_TAIL(GEN11_VEBOX_RING_BASE), /* 0x1C8000 (base) */
> - RING_EXECLIST_CONTROL(GEN11_VEBOX_RING_BASE), /* 0x1C8550
> */
> - RING_TAIL(GEN11_BSD3_RING_BASE), /* 0x1D0000 (base) */
> - RING_EXECLIST_CONTROL(GEN11_BSD3_RING_BASE), /* 0x1D0550
> */
> - RING_TAIL(GEN11_BSD4_RING_BASE), /* 0x1D4000 (base) */
> - RING_EXECLIST_CONTROL(GEN11_BSD4_RING_BASE), /* 0x1D4550
> */
> - RING_TAIL(GEN11_VEBOX2_RING_BASE), /* 0x1D8000
> (base) */
> - RING_EXECLIST_CONTROL(GEN11_VEBOX2_RING_BASE), /* 0x1D8550
> */
> +static const struct i915_range gen11_shadowed_regs[] = {
> + { .start = 0x2030, .end = 0x2030 },
> + { .start = 0x2550, .end = 0x2550 },
> + { .start = 0xA008, .end = 0xA00C },
> + { .start = 0x22030, .end = 0x22030 },
> + { .start = 0x22550, .end = 0x22550 },
> + { .start = 0x1C0030, .end = 0x1C0030 },
> + { .start = 0x1C0550, .end = 0x1C0550 },
> + { .start = 0x1C4030, .end = 0x1C4030 },
> + { .start = 0x1C4550, .end = 0x1C4550 },
> + { .start = 0x1C8030, .end = 0x1C8030 },
> + { .start = 0x1C8550, .end = 0x1C8550 },
> + { .start = 0x1D0030, .end = 0x1D0030 },
> + { .start = 0x1D0550, .end = 0x1D0550 },
> + { .start = 0x1D4030, .end = 0x1D4030 },
> + { .start = 0x1D4550, .end = 0x1D4550 },
> + { .start = 0x1D8030, .end = 0x1D8030 },
> + { .start = 0x1D8550, .end = 0x1D8550 },
> /* TODO: Other registers are not yet used */
> };
>
> -static const i915_reg_t gen12_shadowed_regs[] = {
> - RING_TAIL(RENDER_RING_BASE), /* 0x2000
> (base) */
> - RING_EXECLIST_CONTROL(RENDER_RING_BASE), /* 0x2550 */
> - GEN6_RPNSWREQ, /* 0xA008 */
> - GEN6_RC_VIDEO_FREQ, /* 0xA00C */
> - RING_TAIL(BLT_RING_BASE), /* 0x22000 (base) */
> - RING_EXECLIST_CONTROL(BLT_RING_BASE), /* 0x22550 */
> - RING_TAIL(GEN11_BSD_RING_BASE), /* 0x1C0000
> (base) */
> - RING_EXECLIST_CONTROL(GEN11_BSD_RING_BASE), /* 0x1C0550
> */
> - RING_TAIL(GEN11_BSD2_RING_BASE), /* 0x1C4000 (base) */
> - RING_EXECLIST_CONTROL(GEN11_BSD2_RING_BASE), /* 0x1C4550
> */
> - RING_TAIL(GEN11_VEBOX_RING_BASE), /* 0x1C8000 (base) */
> - RING_EXECLIST_CONTROL(GEN11_VEBOX_RING_BASE), /* 0x1C8550
> */
> - RING_TAIL(GEN11_BSD3_RING_BASE), /* 0x1D0000 (base) */
> - RING_EXECLIST_CONTROL(GEN11_BSD3_RING_BASE), /* 0x1D0550
> */
> - RING_TAIL(GEN11_BSD4_RING_BASE), /* 0x1D4000 (base) */
> - RING_EXECLIST_CONTROL(GEN11_BSD4_RING_BASE), /* 0x1D4550
> */
> - RING_TAIL(GEN11_VEBOX2_RING_BASE), /* 0x1D8000
> (base) */
> - RING_EXECLIST_CONTROL(GEN11_VEBOX2_RING_BASE), /* 0x1D8550
> */
> +static const struct i915_range gen12_shadowed_regs[] = {
> + { .start = 0x2030, .end = 0x2030 },
> + { .start = 0x2550, .end = 0x2550 },
> + { .start = 0xA008, .end = 0xA00C },
> + { .start = 0x22030, .end = 0x22030 },
> + { .start = 0x22550, .end = 0x22550 },
> + { .start = 0x1C0030, .end = 0x1C0030 },
> + { .start = 0x1C0550, .end = 0x1C0550 },
> + { .start = 0x1C4030, .end = 0x1C4030 },
> + { .start = 0x1C4550, .end = 0x1C4550 },
> + { .start = 0x1C8030, .end = 0x1C8030 },
> + { .start = 0x1C8550, .end = 0x1C8550 },
> + { .start = 0x1D0030, .end = 0x1D0030 },
> + { .start = 0x1D0550, .end = 0x1D0550 },
> + { .start = 0x1D4030, .end = 0x1D4030 },
> + { .start = 0x1D4550, .end = 0x1D4550 },
> + { .start = 0x1D8030, .end = 0x1D8030 },
> + { .start = 0x1D8550, .end = 0x1D8550 },
> /* TODO: Other registers are not yet used */
> };
>
> -static const i915_reg_t xehp_shadowed_regs[] = {
> - RING_TAIL(RENDER_RING_BASE), /* 0x2000
> (base) */
> - RING_EXECLIST_CONTROL(RENDER_RING_BASE), /* 0x2550 */
> - GEN6_RPNSWREQ, /* 0xA008 */
> - GEN6_RC_VIDEO_FREQ, /* 0xA00C */
> - RING_TAIL(BLT_RING_BASE), /* 0x22000 (base) */
> - RING_EXECLIST_CONTROL(BLT_RING_BASE), /* 0x22550 */
> - RING_TAIL(GEN11_BSD_RING_BASE), /* 0x1C0000
> (base) */
> - RING_EXECLIST_CONTROL(GEN11_BSD_RING_BASE), /* 0x1C0550
> */
> - RING_TAIL(GEN11_BSD2_RING_BASE), /* 0x1C4000 (base) */
> - RING_EXECLIST_CONTROL(GEN11_BSD2_RING_BASE), /* 0x1C4550
> */
> - RING_TAIL(GEN11_VEBOX_RING_BASE), /* 0x1C8000 (base) */
> - RING_EXECLIST_CONTROL(GEN11_VEBOX_RING_BASE), /* 0x1C8550
> */
> - RING_TAIL(GEN11_BSD3_RING_BASE), /* 0x1D0000 (base) */
> - RING_EXECLIST_CONTROL(GEN11_BSD3_RING_BASE), /* 0x1D0550
> */
> - RING_TAIL(GEN11_BSD4_RING_BASE), /* 0x1D4000 (base) */
> - RING_EXECLIST_CONTROL(GEN11_BSD4_RING_BASE), /* 0x1D4550
> */
> - RING_TAIL(GEN11_VEBOX2_RING_BASE), /* 0x1D8000
> (base) */
> - RING_EXECLIST_CONTROL(GEN11_VEBOX2_RING_BASE), /* 0x1D8550
> */
> - RING_TAIL(XEHP_BSD5_RING_BASE), /* 0x1E0000
> (base) */
> - RING_EXECLIST_CONTROL(XEHP_BSD5_RING_BASE), /* 0x1E0550
> */
> - RING_TAIL(XEHP_BSD6_RING_BASE), /* 0x1E4000
> (base) */
> - RING_EXECLIST_CONTROL(XEHP_BSD6_RING_BASE), /* 0x1E4550
> */
> - RING_TAIL(XEHP_VEBOX3_RING_BASE), /* 0x1E8000 (base) */
> - RING_EXECLIST_CONTROL(XEHP_VEBOX3_RING_BASE), /* 0x1E8550
> */
> - RING_TAIL(XEHP_BSD7_RING_BASE), /* 0x1F0000
> (base) */
> - RING_EXECLIST_CONTROL(XEHP_BSD7_RING_BASE), /* 0x1F0550
> */
> - RING_TAIL(XEHP_BSD8_RING_BASE), /* 0x1F4000
> (base) */
> - RING_EXECLIST_CONTROL(XEHP_BSD8_RING_BASE), /* 0x1F4550
> */
> - RING_TAIL(XEHP_VEBOX4_RING_BASE), /* 0x1F8000 (base) */
> - RING_EXECLIST_CONTROL(XEHP_VEBOX4_RING_BASE), /* 0x1F8550
> */
> +static const struct i915_range xehp_shadowed_regs[] = {
> + { .start = 0x2000, .end = 0x2030 },
> + { .start = 0x2550, .end = 0x2550 },
> + { .start = 0xA008, .end = 0xA00C },
> + { .start = 0x22030, .end = 0x22030 },
> + { .start = 0x22550, .end = 0x22550 },
> + { .start = 0x1C0030, .end = 0x1C0030 },
> + { .start = 0x1C0550, .end = 0x1C0550 },
> + { .start = 0x1C4030, .end = 0x1C4030 },
> + { .start = 0x1C4550, .end = 0x1C4550 },
> + { .start = 0x1C8030, .end = 0x1C8030 },
> + { .start = 0x1C8550, .end = 0x1C8550 },
> + { .start = 0x1D0030, .end = 0x1D0030 },
> + { .start = 0x1D0550, .end = 0x1D0550 },
> + { .start = 0x1D4030, .end = 0x1D4030 },
> + { .start = 0x1D4550, .end = 0x1D4550 },
> + { .start = 0x1D8030, .end = 0x1D8030 },
> + { .start = 0x1D8550, .end = 0x1D8550 },
> + { .start = 0x1E0030, .end = 0x1E0030 },
> + { .start = 0x1E0550, .end = 0x1E0550 },
> + { .start = 0x1E4030, .end = 0x1E4030 },
> + { .start = 0x1E4550, .end = 0x1E4550 },
> + { .start = 0x1E8030, .end = 0x1E8030 },
> + { .start = 0x1E8550, .end = 0x1E8550 },
> + { .start = 0x1F0030, .end = 0x1F0030 },
> + { .start = 0x1F0550, .end = 0x1F0550 },
> + { .start = 0x1F4030, .end = 0x1F4030 },
> + { .start = 0x1F4550, .end = 0x1F4550 },
> + { .start = 0x1F8030, .end = 0x1F8030 },
> + { .start = 0x1F8550, .end = 0x1F8550 },
> /* TODO: Other registers are not yet used */
> };
>
> -static int mmio_reg_cmp(u32 key, const i915_reg_t *reg)
> +static int mmio_range_cmp(u32 key, const struct i915_range *range)
> {
> - u32 offset = i915_mmio_reg_offset(*reg);
> -
> - if (key < offset)
> + if (key < range->start)
> return -1;
> - else if (key > offset)
> + else if (key > range->end)
> return 1;
> else
> return 0;
> @@ -1049,9 +1043,9 @@ static int mmio_reg_cmp(u32 key, const
> i915_reg_t *reg)
> #define __is_X_shadowed(x) \
> static bool is_##x##_shadowed(u32 offset) \
> { \
> - const i915_reg_t *regs = x##_shadowed_regs; \
> + const struct i915_range *regs = x##_shadowed_regs; \
> return BSEARCH(offset, regs, ARRAY_SIZE(x##_shadowed_regs), \
> - mmio_reg_cmp); \
> + mmio_range_cmp); \
> }
>
> __is_X_shadowed(gen8)
> diff --git a/drivers/gpu/drm/i915/intel_uncore.h
> b/drivers/gpu/drm/i915/intel_uncore.h
> index 3c0b0a8b5250..531665b08039 100644
> --- a/drivers/gpu/drm/i915/intel_uncore.h
> +++ b/drivers/gpu/drm/i915/intel_uncore.h
> @@ -119,6 +119,12 @@ struct intel_forcewake_range {
> enum forcewake_domains domains;
> };
>
> +/* Other register ranges (e.g., shadow tables, MCR tables, etc.) */
> +struct i915_range {
> + u32 start;
> + u32 end;
> +};
> +
> struct intel_uncore {
> void __iomem *regs;
>
> diff --git a/drivers/gpu/drm/i915/selftests/intel_uncore.c
> b/drivers/gpu/drm/i915/selftests/intel_uncore.c
> index 720b60853f8b..d6a9c11afa23 100644
> --- a/drivers/gpu/drm/i915/selftests/intel_uncore.c
> +++ b/drivers/gpu/drm/i915/selftests/intel_uncore.c
> @@ -62,30 +62,40 @@ static int intel_fw_table_check(const struct
> intel_forcewake_range *ranges,
> static int intel_shadow_table_check(void)
> {
> struct {
> - const i915_reg_t *regs;
> + const struct i915_range *regs;
> unsigned int size;
> - } reg_lists[] = {
> + } range_lists[] = {
> { gen8_shadowed_regs, ARRAY_SIZE(gen8_shadowed_regs) },
> { gen11_shadowed_regs, ARRAY_SIZE(gen11_shadowed_regs)
> },
> { gen12_shadowed_regs, ARRAY_SIZE(gen12_shadowed_regs)
> },
> { xehp_shadowed_regs, ARRAY_SIZE(xehp_shadowed_regs) },
> };
> - const i915_reg_t *reg;
> + const struct i915_range *range;
> unsigned int i, j;
> s32 prev;
>
> - for (j = 0; j < ARRAY_SIZE(reg_lists); ++j) {
> - reg = reg_lists[j].regs;
> - for (i = 0, prev = -1; i < reg_lists[j].size; i++,
> reg++) {
> - u32 offset = i915_mmio_reg_offset(*reg);
> + for (j = 0; j < ARRAY_SIZE(range_lists); ++j) {
> + range = range_lists[j].regs;
> + for (i = 0, prev = -1; i < range_lists[j].size; i++,
> range++) {
> + if (range->end < range->start) {
> + pr_err("%s: range[%d]:(%06x-%06x) has
> end before start\n",
> + __func__, i, range->start,
> range->end);
> + return -EINVAL;
> + }
> +
> + if (prev >= (s32)range->start) {
> + pr_err("%s: range[%d]:(%06x-%06x) is
> before end of previous (%06x)\n",
> + __func__, i, range->start,
> range->end, prev);
> + return -EINVAL;
> + }
>
> - if (prev >= (s32)offset) {
> - pr_err("%s: entry[%d]:(%x) is before
> previous (%x)\n",
> - __func__, i, offset, prev);
> + if (range->start % 4) {
> + pr_err("%s: range[%d]:(%06x-%06x) has
> non-dword-aligned start\n",
> + __func__, i, range->start,
> range->end);
> return -EINVAL;
> }
>
> - prev = offset;
> + prev = range->end;
> }
> }
>
More information about the Intel-gfx
mailing list