[Intel-gfx] [PATCH] drm/i915: collect more per ring error state
Chris Wilson
chris at chris-wilson.co.uk
Sun Oct 30 19:46:22 CET 2011
On Sun, 30 Oct 2011 18:39:03 +0000, Chris Wilson <chris at chris-wilson.co.uk> wrote:
> On Tue, 11 Oct 2011 21:20:21 +0200, Daniel Vetter <daniel.vetter at ffwll.ch> wrote:
> > Based on a patch by Ben Widawsky, but with different colors
> > for the bikeshed.
> >
> > In contrast to Ben's patch this one doesn't add the fault regs.
> > Afaics they're for the optional page fault support which
> > - we're not enabling
> > - and which seems to be unsupported by the hw team. Recent bspec
> > lacks tons of information about this that the public docs released
> > half a year back still contain.
> >
> > Also dump ring HEAD/TAIL registers - I've recently seen a few
> > error_state where just guessing these is not good enough.
> >
> > v2: Also dump INSTPM for every ring.
> >
> > v3: Fix a few really silly goof-ups spotted by Chris Wilson.
> >
> > Signed-off-by: Daniel Vetter <daniel.vetter at ffwll.ch>
>
> This is independent of the "hangcheck robustification" (which I feel is
> false advertising ;-) and adds some mildly useful debug information.
> The patch itself is fine and worthy of a reviewed-by, there is just one
> nearby bug that may as well be squashed in with this cleanup...
>
> > ---
> > drivers/gpu/drm/i915/i915_debugfs.c | 16 ++++++++++------
> > drivers/gpu/drm/i915/i915_drv.h | 7 +++++--
> > drivers/gpu/drm/i915/i915_irq.c | 9 +++++++--
> > drivers/gpu/drm/i915/i915_reg.h | 3 +++
> > 4 files changed, 25 insertions(+), 10 deletions(-)
> >
> > diff --git a/drivers/gpu/drm/i915/i915_debugfs.c b/drivers/gpu/drm/i915/i915_debugfs.c
> > index d618f78..5f5eb5b 100644
> > --- a/drivers/gpu/drm/i915/i915_debugfs.c
> > +++ b/drivers/gpu/drm/i915/i915_debugfs.c
> > @@ -734,17 +734,21 @@ static void i915_ring_error_state(struct seq_file *m,
> > unsigned ring)
> > {
> > seq_printf(m, "%s command stream:\n", ring_str(ring));
> > + seq_printf(m, " HEAD: 0x%08x\n", error->head[ring]);
> > + seq_printf(m, " TAIL: 0x%08x\n", error->tail[ring]);
> > seq_printf(m, " ACTHD: 0x%08x\n", error->acthd[ring]);
> > seq_printf(m, " IPEIR: 0x%08x\n", error->ipeir[ring]);
> > seq_printf(m, " IPEHR: 0x%08x\n", error->ipehr[ring]);
> > seq_printf(m, " INSTDONE: 0x%08x\n", error->instdone[ring]);
> > - if (ring == RCS) {
> > - if (INTEL_INFO(dev)->gen >= 4) {
> > - seq_printf(m, " INSTDONE1: 0x%08x\n", error->instdone1);
> > - seq_printf(m, " INSTPS: 0x%08x\n", error->instps);
> > - }
> > - seq_printf(m, " INSTPM: 0x%08x\n", error->instpm);
> > + if (ring == RCS && INTEL_INFO(dev)->gen >= 4) {
> > + seq_printf(m, " INSTDONE1: 0x%08x\n", error->instdone1);
> > + seq_printf(m, " BBADDR: 0x%08llx\n", error->bbaddr);
> > }
> > + if (INTEL_INFO(dev)->gen >= 4)
> > + seq_printf(m, " INSTPS: 0x%08x\n", error->instps[ring]);
> > + seq_printf(m, " INSTPM: 0x%08x\n", error->instpm[ring]);
> > + if (INTEL_INFO(dev)->gen >= 6)
> > + seq_printf(m, " FADDR: 0x%08x\n", error->faddr[ring]);
> > seq_printf(m, " seqno: 0x%08x\n", error->seqno[ring]);
> > }
> >
> > diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h
> > index 5f3ff9d..3701369 100644
> > --- a/drivers/gpu/drm/i915/i915_drv.h
> > +++ b/drivers/gpu/drm/i915/i915_drv.h
> > @@ -149,16 +149,19 @@ struct drm_i915_error_state {
> > u32 eir;
> > u32 pgtbl_er;
> > u32 pipestat[I915_MAX_PIPES];
> > + u32 tail[I915_NUM_RINGS];
> > + u32 head[I915_NUM_RINGS];
> > u32 ipeir[I915_NUM_RINGS];
> > u32 ipehr[I915_NUM_RINGS];
> > u32 instdone[I915_NUM_RINGS];
> > u32 acthd[I915_NUM_RINGS];
> > u32 error; /* gen6+ */
> > - u32 instpm;
> > - u32 instps;
> > + u32 instpm[I915_NUM_RINGS];
> > + u32 instps[I915_NUM_RINGS];
> > u32 instdone1;
> > u32 seqno[I915_NUM_RINGS];
> > u64 bbaddr;
> > + u32 faddr[I915_NUM_RINGS];
> > u64 fence[16];
> > struct timeval time;
> > struct drm_i915_error_object {
> > diff --git a/drivers/gpu/drm/i915/i915_irq.c b/drivers/gpu/drm/i915/i915_irq.c
> > index 79aba7f..ea1721f 100644
> > --- a/drivers/gpu/drm/i915/i915_irq.c
> > +++ b/drivers/gpu/drm/i915/i915_irq.c
> > @@ -878,12 +878,15 @@ static void i915_record_ring_state(struct drm_device *dev,
> > {
> > struct drm_i915_private *dev_priv = dev->dev_private;
> >
> > + if (INTEL_INFO(dev)->gen >= 6)
> > + error->faddr[ring->id] = I915_READ(RING_DMA_FADD(ring->mmio_base));
> > +
> > if (INTEL_INFO(dev)->gen >= 4) {
> > error->ipeir[ring->id] = I915_READ(RING_IPEIR(ring->mmio_base));
> > error->ipehr[ring->id] = I915_READ(RING_IPEHR(ring->mmio_base));
> > error->instdone[ring->id] = I915_READ(RING_INSTDONE(ring->mmio_base));
> > + error->instps[ring->id] = I915_READ(RING_INSTPS(ring->mmio_base));
> > if (ring->id == RCS) {
> > - error->instps = I915_READ(INSTPS);
> > error->instdone1 = I915_READ(INSTDONE1);
> > error->bbaddr = I915_READ64(BB_ADDR);
> > }
> > @@ -894,8 +897,11 @@ static void i915_record_ring_state(struct drm_device *dev,
> > error->bbaddr = 0;
> > }
> >
> > + error->instpm[ring->id] = I915_READ(RING_INSTPM(ring->mmio_base));
> > error->seqno[ring->id] = dev_priv->ring->get_seqno(ring);
> Whilst you are here, you may as well fix this ^.
Daniel pointed out that I already reviewed a patch to fix this, so I
hereby review this patch to add the extra debug information!
Reviewed-by: Chris Wilson <chris at chris-wilson.co.uk>
-Chris
--
Chris Wilson, Intel Open Source Technology Centre
More information about the Intel-gfx
mailing list