[Intel-gfx] [PATCH] drm/i915/gt: Rearrange snb workarounds

Mika Kuoppala mika.kuoppala at linux.intel.com
Thu Dec 10 10:36:07 UTC 2020


Chris Wilson <chris at chris-wilson.co.uk> writes:

> Some rcs0 workarounds were being incorrectly applied to the GT, and so
> we failed to restore the expected register settings after a reset.
>
> Signed-off-by: Chris Wilson <chris at chris-wilson.co.uk>
> ---
>  drivers/gpu/drm/i915/gt/intel_workarounds.c | 67 ++++++++++-----------
>  1 file changed, 33 insertions(+), 34 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/gt/intel_workarounds.c b/drivers/gpu/drm/i915/gt/intel_workarounds.c
> index b5339a36d256..50cfe82f18a9 100644
> --- a/drivers/gpu/drm/i915/gt/intel_workarounds.c
> +++ b/drivers/gpu/drm/i915/gt/intel_workarounds.c
> @@ -823,40 +823,6 @@ ilk_gt_workarounds_init(struct drm_i915_private *i915, struct i915_wa_list *wal)
>  static void
>  snb_gt_workarounds_init(struct drm_i915_private *i915, struct i915_wa_list *wal)
>  {
> -	/* WaDisableHiZPlanesWhenMSAAEnabled:snb */
> -	wa_masked_en(wal,
> -		     _3D_CHICKEN,
> -		     _3D_CHICKEN_HIZ_PLANE_DISABLE_MSAA_4X_SNB);
> -
> -	/* WaDisable_RenderCache_OperationalFlush:snb */
> -	wa_masked_dis(wal, CACHE_MODE_0, RC_OP_FLUSH_ENABLE);
> -
> -	/*
> -	 * BSpec recommends 8x4 when MSAA is used,
> -	 * however in practice 16x4 seems fastest.
> -	 *
> -	 * Note that PS/WM thread counts depend on the WIZ hashing
> -	 * disable bit, which we don't touch here, but it's good
> -	 * to keep in mind (see 3DSTATE_PS and 3DSTATE_WM).
> -	 */
> -	wa_add(wal,
> -	       GEN6_GT_MODE, 0,
> -	       _MASKED_FIELD(GEN6_WIZ_HASHING_MASK, GEN6_WIZ_HASHING_16x4),
> -	       GEN6_WIZ_HASHING_16x4);
> -
> -	wa_masked_dis(wal, CACHE_MODE_0, CM0_STC_EVICT_DISABLE_LRA_SNB);

Where did this go?
-Mika

> -
> -	wa_masked_en(wal,
> -		     _3D_CHICKEN3,
> -		     /* WaStripsFansDisableFastClipPerformanceFix:snb */
> -		     _3D_CHICKEN3_SF_DISABLE_FASTCLIP_CULL |
> -		     /*
> -		      * Bspec says:
> -		      * "This bit must be set if 3DSTATE_CLIP clip mode is set
> -		      * to normal and 3DSTATE_SF number of SF output attributes
> -		      * is more than 16."
> -		      */
> -		   _3D_CHICKEN3_SF_DISABLE_PIPELINED_ATTR_FETCH);
>  }
>  
>  static void
> @@ -2008,6 +1974,39 @@ rcs_engine_wa_init(struct intel_engine_cs *engine, struct i915_wa_list *wal)
>  			     GFX_MODE,
>  			     GFX_TLB_INVALIDATE_EXPLICIT);
>  
> +		/* WaDisableHiZPlanesWhenMSAAEnabled:snb */
> +		wa_masked_en(wal,
> +			     _3D_CHICKEN,
> +			     _3D_CHICKEN_HIZ_PLANE_DISABLE_MSAA_4X_SNB);
> +
> +		wa_masked_en(wal,
> +			     _3D_CHICKEN3,
> +			     /* WaStripsFansDisableFastClipPerformanceFix:snb */
> +			     _3D_CHICKEN3_SF_DISABLE_FASTCLIP_CULL |
> +			     /*
> +			      * Bspec says:
> +			      * "This bit must be set if 3DSTATE_CLIP clip mode is set
> +			      * to normal and 3DSTATE_SF number of SF output attributes
> +			      * is more than 16."
> +			      */
> +			     _3D_CHICKEN3_SF_DISABLE_PIPELINED_ATTR_FETCH);
> +
> +		/*
> +		 * BSpec recommends 8x4 when MSAA is used,
> +		 * however in practice 16x4 seems fastest.
> +		 *
> +		 * Note that PS/WM thread counts depend on the WIZ hashing
> +		 * disable bit, which we don't touch here, but it's good
> +		 * to keep in mind (see 3DSTATE_PS and 3DSTATE_WM).
> +		 */
> +		wa_add(wal,
> +		       GEN6_GT_MODE, 0,
> +		       _MASKED_FIELD(GEN6_WIZ_HASHING_MASK, GEN6_WIZ_HASHING_16x4),
> +		       GEN6_WIZ_HASHING_16x4);
> +
> +		/* WaDisable_RenderCache_OperationalFlush:snb */
> +		wa_masked_dis(wal, CACHE_MODE_0, RC_OP_FLUSH_ENABLE);
> +
>  		/*
>  		 * From the Sandybridge PRM, volume 1 part 3, page 24:
>  		 * "If this bit is set, STCunit will have LRA as replacement
> -- 
> 2.20.1
>
> _______________________________________________
> Intel-gfx mailing list
> Intel-gfx at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/intel-gfx


More information about the Intel-gfx mailing list