[Intel-gfx] [PATCH 1/2] drm/i915/execlists: Peek at the next submission for error interrupts
Mika Kuoppala
mika.kuoppala at linux.intel.com
Thu Apr 2 20:16:52 UTC 2020
Chris Wilson <chris at chris-wilson.co.uk> writes:
> If we receive the error interrupt before the CS interrupt, we may find
> ourselves without an active request to reset, skipping the GPU reset.
> All because the attempt to reset was too early.
>
With the tracing, we will see the the out of sync situations
so
Reviewed-by: Mika Kuoppala <mika.kuoppala at linux.intel.com>
> Signed-off-by: Chris Wilson <chris at chris-wilson.co.uk>
> ---
> drivers/gpu/drm/i915/gt/intel_lrc.c | 41 ++++++++++++++++++++++++++++-
> 1 file changed, 40 insertions(+), 1 deletion(-)
>
> diff --git a/drivers/gpu/drm/i915/gt/intel_lrc.c b/drivers/gpu/drm/i915/gt/intel_lrc.c
> index 3479cda37fdc..f028114714cd 100644
> --- a/drivers/gpu/drm/i915/gt/intel_lrc.c
> +++ b/drivers/gpu/drm/i915/gt/intel_lrc.c
> @@ -2804,6 +2804,45 @@ static struct execlists_capture *capture_regs(struct intel_engine_cs *engine)
> return NULL;
> }
>
> +static struct i915_request *
> +active_context(struct intel_engine_cs *engine, u32 ccid)
> +{
> + const struct intel_engine_execlists * const el = &engine->execlists;
> + struct i915_request * const *port, *rq;
> +
> + /*
> + * Use the most recent result from process_csb(), but just in case
> + * we trigger an error (via interrupt) before the first CS event has
> + * been written, peek at the next submission.
> + */
> +
> + for (port = el->active; (rq = *port); port++) {
> + if (upper_32_bits(rq->context->lrc_desc) == ccid) {
> + ENGINE_TRACE(engine,
> + "ccid found at active:%zd\n",
> + port - el->active);
> + return rq;
> + }
> + }
> +
> + for (port = el->pending; (rq = *port); port++) {
> + if (upper_32_bits(rq->context->lrc_desc) == ccid) {
> + ENGINE_TRACE(engine,
> + "ccid found at pending:%zd\n",
> + port - el->pending);
> + return rq;
> + }
> + }
> +
> + ENGINE_TRACE(engine, "ccid:%x not found\n", ccid);
> + return NULL;
> +}
> +
> +static u32 active_ccid(struct intel_engine_cs *engine)
> +{
> + return ENGINE_READ_FW(engine, RING_EXECLIST_STATUS_HI);
> +}
> +
> static bool execlists_capture(struct intel_engine_cs *engine)
> {
> struct execlists_capture *cap;
> @@ -2821,7 +2860,7 @@ static bool execlists_capture(struct intel_engine_cs *engine)
> return true;
>
> spin_lock_irq(&engine->active.lock);
> - cap->rq = execlists_active(&engine->execlists);
> + cap->rq = active_context(engine, active_ccid(engine));
> if (cap->rq) {
> cap->rq = active_request(cap->rq->context->timeline, cap->rq);
> cap->rq = i915_request_get_rcu(cap->rq);
> --
> 2.20.1
>
> _______________________________________________
> Intel-gfx mailing list
> Intel-gfx at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/intel-gfx
More information about the Intel-gfx
mailing list