[Intel-gfx] [PATCH v1 2/2] drm/i915:gen9: Add disable gather at set shader w/a
Siluvery, Arun
arun.siluvery at linux.intel.com
Tue Aug 4 02:29:41 PDT 2015
On 04/08/2015 00:21, Ben Widawsky wrote:
> On Mon, Aug 03, 2015 at 08:24:57PM +0100, Arun Siluvery wrote:
>> This WA is implemented in init_context as well as WA batch init.
>> There are also some dependent bits need to be set in other registers
>> for this to be complete.
>>
>> Cc: Ben Widawsky <benjamin.widawsky at intel.com>
>> Cc: Joonas Lahtinen <joonas.lahtinen at linux.intel.com>
>> Signed-off-by: Arun Siluvery <arun.siluvery at linux.intel.com>
>> ---
>> drivers/gpu/drm/i915/i915_reg.h | 3 +++
>> drivers/gpu/drm/i915/intel_lrc.c | 8 ++++++++
>> drivers/gpu/drm/i915/intel_ringbuffer.c | 16 ++++++++++++++++
>> 3 files changed, 27 insertions(+)
>>
>> diff --git a/drivers/gpu/drm/i915/i915_reg.h b/drivers/gpu/drm/i915/i915_reg.h
>> index 8991cd5..24b8bb9 100644
>> --- a/drivers/gpu/drm/i915/i915_reg.h
>> +++ b/drivers/gpu/drm/i915/i915_reg.h
>> @@ -1720,7 +1720,9 @@ enum skl_disp_power_wells {
>> #define MEM_DISPLAY_A_TRICKLE_FEED_DISABLE (1<<2) /* 830/845 only */
>> #define MEM_DISPLAY_TRICKLE_FEED_DISABLE (1<<2) /* 85x only */
>> #define FW_BLC 0x020d8
>> +#define GEN9_DISABLE_GATHER_AT_SET_SHADER (1<<7)
>> #define FW_BLC2 0x020dc
>> +#define GEN9_RS_CHICKEN_DISABLE_GATHER_AT_SHADER (1<<2)
>
> Neither of these belong here. BLC is for backlight. Create a new define if we
> don't have one.
>
> #define RS_CHICKEN 0x20dc
I thought of reusing existing define but created a new one as you suggested.
>
>> #define FW_BLC_SELF 0x020e0 /* 915+ only */
>> #define FW_BLC_SELF_EN_MASK (1<<31)
>> #define FW_BLC_SELF_FIFO_MASK (1<<16) /* 945 only */
>> @@ -5836,6 +5838,7 @@ enum skl_disp_power_wells {
>> # define GEN7_CSC1_RHWO_OPT_DISABLE_IN_RCC ((1<<10) | (1<<26))
>> # define GEN9_RHWO_OPTIMIZATION_DISABLE (1<<14)
>> #define COMMON_SLICE_CHICKEN2 0x7014
>> +#define GEN9_DISABLE_GATHER_SET_SHADER_SLICE (1<<12)
>> # define GEN8_CSC2_SBE_VUE_CACHE_CONSERVATIVE (1<<0)
>>
>> #define HIZ_CHICKEN 0x7018
>> diff --git a/drivers/gpu/drm/i915/intel_lrc.c b/drivers/gpu/drm/i915/intel_lrc.c
>> index 9faad82..d3a03f3 100644
>> --- a/drivers/gpu/drm/i915/intel_lrc.c
>> +++ b/drivers/gpu/drm/i915/intel_lrc.c
>> @@ -1292,6 +1292,14 @@ static int gen9_init_perctx_bb(struct intel_engine_cs *ring,
>> struct drm_device *dev = ring->dev;
>> uint32_t index = wa_ctx_start(wa_ctx, *offset, CACHELINE_DWORDS);
>>
>> + /* WA to reset "disable gather at set shader slice" bit */
>> + if (IS_SKYLAKE(dev)) {
>> + wa_ctx_emit(batch, index, MI_LOAD_REGISTER_IMM(1));
>> + wa_ctx_emit(batch, index, COMMON_SLICE_CHICKEN2);
>> + wa_ctx_emit(batch, index,
>> + _MASKED_BIT_DISABLE(GEN9_DISABLE_GATHER_SET_SHADER_SLICE));
>> + }
>> +
>
> Shouldn't this be for BXT as well? Also, why bother with the revid check below
> and not here?
spec says only SKL+
>
>> /* WaSetDisablePixMaskCammingAndRhwoInCommonSliceChicken:skl,bxt */
>> if ((IS_SKYLAKE(dev) && (INTEL_REVID(dev) <= SKL_REVID_B0)) ||
>> (IS_BROXTON(dev) && (INTEL_REVID(dev) == BXT_REVID_A0))) {
>> diff --git a/drivers/gpu/drm/i915/intel_ringbuffer.c b/drivers/gpu/drm/i915/intel_ringbuffer.c
>> index dcd1b8f..4fc4b5e 100644
>> --- a/drivers/gpu/drm/i915/intel_ringbuffer.c
>> +++ b/drivers/gpu/drm/i915/intel_ringbuffer.c
>> @@ -985,6 +985,15 @@ static int gen9_init_workarounds(struct intel_engine_cs *ring)
>> tmp |= HDC_FORCE_CSR_NON_COHERENT_OVR_DISABLE;
>> WA_SET_BIT_MASKED(HDC_CHICKEN0, tmp);
>>
>> + /* WA to gather at set shader - skl,bxt
>> + * These are dependent bits need to be set for the WA.
>> + */
>> + if (IS_SKYLAKE(dev) && (INTEL_REVID(dev) > SKL_REVID_D0) ||
>> + (IS_BROXTON(dev) && INTEL_REVID(dev) > BXT_REVID_A0)) {
>> + WA_SET_BIT_MASKED(FW_BLC, GEN9_DISABLE_GATHER_AT_SET_SHADER);
>> + WA_SET_BIT_MASKED(FW_BLC2, GEN9_RS_CHICKEN_DISABLE_GATHER_AT_SHADER);
>> + }
>> +
>> return 0;
>> }
>>
>> @@ -1068,6 +1077,13 @@ static int skl_init_workarounds(struct intel_engine_cs *ring)
>> HDC_FENCE_DEST_SLM_DISABLE |
>> HDC_BARRIER_PERFORMANCE_DISABLE);
>>
>> + /* WA to Disable gather at set shader - skl
>> + * This bit needs to be reset in Per ctx WA batch and it is also
>> + * dependent on other bits in different register, all of them need
>> + * be set for the WA to be complete.
>> + */
>> + WA_SET_BIT_MASKED(COMMON_SLICE_CHICKEN2, GEN9_DISABLE_GATHER_SET_SHADER_SLICE);
>> +
>> return skl_tune_iz_hashing(ring);
>> }
>>
>
> I wouldn't set both 20dc, and 20d8, I am not sure what implication it has.
> Instead, set or read bit 15 of 0x20e0 and then just set one. To me, it seems
> like the best way to do this is to set 1<<15 of 0x20e0, and then use bit 2 of
> 0x20dc for the workaround. We don't need per context controls of something we
> have to disable always anyway.
>
changed it to use 0x20e0
regards
Arun
More information about the Intel-gfx
mailing list