[Intel-gfx] [PATCH 5/8] drm/i915/selftests: Add tests for GT and engine workaround verification
Chris Wilson
chris at chris-wilson.co.uk
Fri Nov 30 11:43:21 UTC 2018
Quoting Tvrtko Ursulin (2018-11-30 11:31:58)
> From: Tvrtko Ursulin <tvrtko.ursulin at intel.com>
>
> Two simple selftests which test that both GT and engine workarounds are
> not lost after either a full GPU reset, or after the per-engine ones.
>
> (Including checks that one engine reset is not affecting workarounds not
> belonging to itself.)
>
> Signed-off-by: Tvrtko Ursulin <tvrtko.ursulin at intel.com>
> ---
> drivers/gpu/drm/i915/intel_workarounds.c | 21 +++--
> drivers/gpu/drm/i915/intel_workarounds.h | 4 +-
> .../drm/i915/selftests/intel_workarounds.c | 90 +++++++++++++++++++
> 3 files changed, 105 insertions(+), 10 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/intel_workarounds.c b/drivers/gpu/drm/i915/intel_workarounds.c
> index 2d17d8a36a57..a21a21855e6a 100644
> --- a/drivers/gpu/drm/i915/intel_workarounds.c
> +++ b/drivers/gpu/drm/i915/intel_workarounds.c
> @@ -990,7 +990,7 @@ wa_fail(const struct i915_wa *wa, u32 cur, const char *name, const char *from)
> cur, cur & wa->mask, wa->val, wa->mask);
> }
>
> -static void
> +static bool
> wa_verify_bits(const struct i915_wa *wa, u32 cur, const char *name,
> const char *from)
> {
> @@ -1001,30 +1001,35 @@ wa_verify_bits(const struct i915_wa *wa, u32 cur, const char *name,
> while (bits) {
> if ((bits & 1) && ((cur_ & 1) != (val_ & 1))) {
> wa_fail(wa, cur, name, from);
> - break;
> + return false;
> }
>
> bits >>= 1;
> cur_ >>= 1;
> val_ >>= 1;
> }
> +
> + return true;
> }
>
> -static void wa_list_verify(struct drm_i915_private *dev_priv,
> +static bool wa_list_verify(struct drm_i915_private *dev_priv,
> const struct i915_wa_list *wal,
> const char *from)
> {
> struct i915_wa *wa;
> unsigned int i;
> + bool res = true;
>
> for (i = 0, wa = wal->list; i < wal->count; i++, wa++)
> - wa_verify_bits(wa, I915_READ(wa->reg), wal->name, from);
> + res &= wa_verify_bits(wa, I915_READ(wa->reg), wal->name, from);
> +
> + return res;
> }
>
> -void intel_gt_workarounds_verify(struct drm_i915_private *dev_priv,
> +bool intel_gt_workarounds_verify(struct drm_i915_private *dev_priv,
> const char *from)
> {
> - wa_list_verify(dev_priv, &dev_priv->gt_wa_list, from);
> + return wa_list_verify(dev_priv, &dev_priv->gt_wa_list, from);
> }
>
> struct whitelist {
> @@ -1313,10 +1318,10 @@ void intel_engine_workarounds_apply(struct intel_engine_cs *engine)
> wa_list_apply(engine->i915, &engine->wa_list);
> }
>
> -void intel_engine_workarounds_verify(struct intel_engine_cs *engine,
> +bool intel_engine_workarounds_verify(struct intel_engine_cs *engine,
> const char *from)
> {
> - wa_list_verify(engine->i915, &engine->wa_list, from);
> + return wa_list_verify(engine->i915, &engine->wa_list, from);
> }
>
> #if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
> diff --git a/drivers/gpu/drm/i915/intel_workarounds.h b/drivers/gpu/drm/i915/intel_workarounds.h
> index f72cfda32d68..8f664d8b9e08 100644
> --- a/drivers/gpu/drm/i915/intel_workarounds.h
> +++ b/drivers/gpu/drm/i915/intel_workarounds.h
> @@ -33,14 +33,14 @@ int intel_ctx_workarounds_emit(struct i915_request *rq);
>
> void intel_gt_workarounds_init(struct drm_i915_private *dev_priv);
> void intel_gt_workarounds_apply(struct drm_i915_private *dev_priv);
> -void intel_gt_workarounds_verify(struct drm_i915_private *dev_priv,
> +bool intel_gt_workarounds_verify(struct drm_i915_private *dev_priv,
> const char *from);
>
> void intel_whitelist_workarounds_apply(struct intel_engine_cs *engine);
>
> void intel_engine_workarounds_init(struct intel_engine_cs *engine);
> void intel_engine_workarounds_apply(struct intel_engine_cs *engine);
> -void intel_engine_workarounds_verify(struct intel_engine_cs *engine,
> +bool intel_engine_workarounds_verify(struct intel_engine_cs *engine,
> const char *from);
>
> #endif
> diff --git a/drivers/gpu/drm/i915/selftests/intel_workarounds.c b/drivers/gpu/drm/i915/selftests/intel_workarounds.c
> index 80396b3592f5..c009eb2af7fc 100644
> --- a/drivers/gpu/drm/i915/selftests/intel_workarounds.c
> +++ b/drivers/gpu/drm/i915/selftests/intel_workarounds.c
> @@ -327,10 +327,100 @@ static int live_reset_whitelist(void *arg)
> return err;
> }
>
> +static bool verify_gt_engine_wa(struct drm_i915_private *i915, const char *str)
> +{
> + struct intel_engine_cs *engine;
> + enum intel_engine_id id;
> + bool ok = true;
> +
> + ok &= intel_gt_workarounds_verify(i915, str);
> +
> + for_each_engine(engine, i915, id)
> + ok &= intel_engine_workarounds_verify(engine, str);
Ok, ok.
> +
> + return ok;
> +}
> +
> +static int
> +live_gpu_reset_gt_engine_workarounds(void *arg)
> +{
> + struct drm_i915_private *i915 = arg;
> + struct i915_gpu_error *error = &i915->gpu_error;
> + bool ok;
> +
> + if (!intel_has_gpu_reset(i915))
> + return 0;
> +
> + pr_info("Verifying after GPU reset...\n");
> +
> + set_bit(I915_RESET_BACKOFF, &error->flags);
> + set_bit(I915_RESET_HANDOFF, &error->flags);
> +
> + ok = verify_gt_engine_wa(i915, "before reset");
> + if (!ok)
> + goto out;
> +
> + intel_runtime_pm_get(i915);
Move RESET_HANDOFF here to avoid any repetition of earlier problems we
had with the reset being applied too early.
> + i915_reset(i915, ~0, "live_workarounds");
> + intel_runtime_pm_put(i915);
> +
> + ok = verify_gt_engine_wa(i915, "after reset");
> +
> +out:
> + clear_bit(I915_RESET_BACKOFF, &error->flags);
> +
> + return ok ? 0 : -ESRCH;
> +}
> +
> +static int
> +live_engine_reset_gt_engine_workarounds(void *arg)
> +{
> + struct drm_i915_private *i915 = arg;
> + struct i915_gpu_error *error = &i915->gpu_error;
> + struct intel_engine_cs *engine;
> + enum intel_engine_id id;
> + bool ok;
> +
> + if (!intel_has_reset_engine(i915))
> + return 0;
May be easier to take global_reset_lock/unlock from
selftests/intel_hanghceck.
> +
> + for_each_engine(engine, i915, id) {
> + pr_info("Verifying after %s reset...\n", engine->name);
> +
> + set_bit(I915_RESET_BACKOFF, &error->flags);
> + set_bit(I915_RESET_ENGINE + engine->id, &error->flags);
> +
> + ok = verify_gt_engine_wa(i915, "before reset");
> + if (!ok)
> + goto out;
> +
> + intel_runtime_pm_get(i915);
> + i915_reset_engine(engine, "live_workarounds");
> + intel_runtime_pm_put(i915);
Once idle, and once with a spinner?
More information about the Intel-gfx
mailing list