[Intel-gfx] [intel-gfx][PATCH 2/2] drm/i915: Add a new ring buffer on Sandybridge
Xiang, Haihao
haihao.xiang at intel.com
Thu Sep 2 10:59:20 CEST 2010
On Thu, 2010-09-02 at 15:16 +0800, Chris Wilson wrote:
> Comments inline.
Thanks for your comments.
>
> On Thu, 2 Sep 2010 21:46:54 +0800, "Xiang, Haihao" <haihao.xiang at intel.com> wrote:
> > This ring buffer is used for video decoding/encoding on Sandybridge.
> >
> > Signed-off-by: Xiang, Haihao <haihao.xiang at intel.com>
> > ---
> > drivers/gpu/drm/i915/i915_drv.h | 2 +-
> > drivers/gpu/drm/i915/i915_gem.c | 6 ++-
> > drivers/gpu/drm/i915/i915_irq.c | 15 +++--
> > drivers/gpu/drm/i915/i915_reg.h | 22 +++++-
> > drivers/gpu/drm/i915/intel_ringbuffer.c | 121 +++++++++++++++++++++++++++++++
> > drivers/gpu/drm/i915/intel_ringbuffer.h | 1 +
> > 6 files changed, 158 insertions(+), 9 deletions(-)
> >
> > diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h
> > index 047cd7c..22d098b 100644
> > --- a/drivers/gpu/drm/i915/i915_drv.h
> > +++ b/drivers/gpu/drm/i915/i915_drv.h
> > @@ -1203,7 +1203,7 @@ extern void intel_overlay_print_error_state(struct seq_file *m, struct intel_ove
> > (dev)->pci_device == 0x2A42 || \
> > (dev)->pci_device == 0x2E42)
> >
> > -#define HAS_BSD(dev) (IS_IRONLAKE(dev) || IS_G4X(dev))
> > +#define HAS_BSD(dev) (IS_IRONLAKE(dev) || IS_G4X(dev) || IS_GEN6(dev))
>
> Convert HAS_BSD(dev) to INTEL_INFO(dev)->has_bsd_ring and update
> capabilities accordingly.
I will fix it.
>
> > #define I915_NEED_GFX_HWS(dev) (INTEL_INFO(dev)->need_gfx_hws)
> >
> > /* With the 945 and later, Y tiling got adjusted so that it was 32 128-byte
> > diff --git a/drivers/gpu/drm/i915/i915_gem.c b/drivers/gpu/drm/i915/i915_gem.c
> > index 8ccb55a..d2c825a 100644
> > --- a/drivers/gpu/drm/i915/i915_gem.c
> > +++ b/drivers/gpu/drm/i915/i915_gem.c
> > @@ -4504,7 +4504,11 @@ i915_gem_init_ringbuffer(struct drm_device *dev)
> > goto cleanup_pipe_control;
> >
> > if (HAS_BSD(dev)) {
> > - dev_priv->bsd_ring = bsd_ring;
> > + if (IS_GEN6(dev))
> > + dev_priv->bsd_ring = gen6_bsd_ring;
> > + else
> > + dev_priv->bsd_ring = bsd_ring;
> > +
>
> Lets stop exporting these struct initialisers before we end up with one
> per generation per ring. Introduce intel_init_render_ring_buffer() and
> intel_init_bsd_ring_buffer() and similarly tidy up the HWS page
> initialisation.
I will fix it.
>
> > ret = intel_init_ring_buffer(dev, &dev_priv->bsd_ring);
> > if (ret)
> > goto cleanup_render_ring;
> > diff --git a/drivers/gpu/drm/i915/i915_irq.c b/drivers/gpu/drm/i915/i915_irq.c
> > index 16861b8..82e708c 100644
> > --- a/drivers/gpu/drm/i915/i915_irq.c
> > +++ b/drivers/gpu/drm/i915/i915_irq.c
> > @@ -312,6 +312,10 @@ irqreturn_t ironlake_irq_handler(struct drm_device *dev)
> > u32 de_iir, gt_iir, de_ier, pch_iir;
> > struct drm_i915_master_private *master_priv;
> > struct intel_ring_buffer *render_ring = &dev_priv->render_ring;
> > + u32 bsd_usr_interrupt = GT_BSD_USER_INTERRUPT;
> > +
> > + if (IS_GEN6(dev))
> > + bsd_usr_interrupt = GT_GEN6_BSD_USER_INTERRUPT;
> >
> > /* disable master interrupt before clearing iir */
> > de_ier = I915_READ(DEIER);
> > @@ -342,10 +346,9 @@ irqreturn_t ironlake_irq_handler(struct drm_device *dev)
> > dev_priv->hangcheck_count = 0;
> > mod_timer(&dev_priv->hangcheck_timer, jiffies + DRM_I915_HANGCHECK_PERIOD);
> > }
> > - if (gt_iir & GT_BSD_USER_INTERRUPT)
> > + if (gt_iir & bsd_usr_interrupt)
> > DRM_WAKEUP(&dev_priv->bsd_ring.irq_queue);
> >
> > -
> > if (de_iir & DE_GSE)
> > ironlake_opregion_gse_intr(dev);
> >
> > @@ -1381,17 +1384,19 @@ static int ironlake_irq_postinstall(struct drm_device *dev)
> > I915_WRITE(DEIER, dev_priv->de_irq_enable_reg);
> > (void) I915_READ(DEIER);
> >
> > - /* Gen6 only needs render pipe_control now */
> > if (IS_GEN6(dev))
> > - render_mask = GT_PIPE_NOTIFY;
> > + render_mask = GT_PIPE_NOTIFY | GT_GEN6_BSD_USER_INTERRUPT;
> >
> > dev_priv->gt_irq_mask_reg = ~render_mask;
> > dev_priv->gt_irq_enable_reg = render_mask;
> >
> > I915_WRITE(GTIIR, I915_READ(GTIIR));
> > I915_WRITE(GTIMR, dev_priv->gt_irq_mask_reg);
> > - if (IS_GEN6(dev))
> > + if (IS_GEN6(dev)) {
> > I915_WRITE(GEN6_RENDER_IMR, ~GEN6_RENDER_PIPE_CONTROL_NOTIFY_INTERRUPT);
> > + I915_WRITE(GEN6_BSD_IMR, ~GEN6_BSD_IMR_USER_INTERRUPT);
> > + }
> > +
> > I915_WRITE(GTIER, dev_priv->gt_irq_enable_reg);
> > (void) I915_READ(GTIER);
> >
> > diff --git a/drivers/gpu/drm/i915/i915_reg.h b/drivers/gpu/drm/i915/i915_reg.h
> > index 67e3ec1..9d57ecc 100644
> > --- a/drivers/gpu/drm/i915/i915_reg.h
> > +++ b/drivers/gpu/drm/i915/i915_reg.h
> > @@ -192,11 +192,11 @@
> > #define MI_STORE_DWORD_INDEX MI_INSTR(0x21, 1)
> > #define MI_STORE_DWORD_INDEX_SHIFT 2
> > #define MI_LOAD_REGISTER_IMM MI_INSTR(0x22, 1)
> > +#define MI_FLUSH_DW MI_INSTR(0x26, 2) /* for GEN6 */
>
> Random new abbreviation. Use MI_FLUSH_DWORD for consistency.
MI_FLUSH_DW is a MI command and used by the document.
>
> > #define MI_BATCH_BUFFER MI_INSTR(0x30, 1)
> > #define MI_BATCH_NON_SECURE (1)
> > #define MI_BATCH_NON_SECURE_I965 (1<<8)
> > #define MI_BATCH_BUFFER_START MI_INSTR(0x31, 0)
> > -
> > /*
> > * 3D instructions used by the kernel
> > */
> > @@ -476,6 +476,24 @@
> > #define BSD_HWS_PGA 0x04080
> >
> > /*
> > + * video command stream instruction and interrupt control register defines
> > + * for GEN6
> > + */
> > +#define GEN6_BSD_RING_TAIL 0x12030
> > +#define GEN6_BSD_RING_HEAD 0x12034
> > +#define GEN6_BSD_RING_START 0x12038
> > +#define GEN6_BSD_RING_CTL 0x1203c
> > +#define GEN6_BSD_RING_ACTHD 0x12074
> > +#define GEN6_BSD_HWS_PGA 0x14080
> > +
> > +#define GEN6_BSD_SLEEP_PSMI_CONTROL 0x12050
> > +#define GEN6_BSD_SLEEP_PSMI_CONTROL_IDLE_INDICATOR (1 << 3)
> > +
> > +#define GEN6_BSD_IMR 0x120a8
> > +#define GEN6_BSD_IMR_USER_INTERRUPT (1 << 12)
> > +#define GEN6_BSD_RNCID 0x12198
> > +
> > +/*
> > * Framebuffer compression (915+ only)
> > */
> >
> > @@ -2507,7 +2525,7 @@
> > #define GT_SYNC_STATUS (1 << 2)
> > #define GT_USER_INTERRUPT (1 << 0)
> > #define GT_BSD_USER_INTERRUPT (1 << 5)
> > -
> > +#define GT_GEN6_BSD_USER_INTERRUPT (1 << 12)
> >
> > #define GTISR 0x44010
> > #define GTIMR 0x44014
> > diff --git a/drivers/gpu/drm/i915/intel_ringbuffer.c b/drivers/gpu/drm/i915/intel_ringbuffer.c
> > index dda2751..4c0f8c4 100644
> > --- a/drivers/gpu/drm/i915/intel_ringbuffer.c
> > +++ b/drivers/gpu/drm/i915/intel_ringbuffer.c
> > @@ -32,6 +32,7 @@
> > #include "i915_drv.h"
> > #include "i915_drm.h"
> > #include "i915_trace.h"
> > +#include "intel_drv.h"
> >
> > static u32 i915_gem_get_seqno(struct drm_device *dev)
> > {
> > @@ -874,3 +875,123 @@ struct intel_ring_buffer bsd_ring = {
> > .status_page = {NULL, 0, NULL},
> > .map = {0,}
> > };
> > +
> > +static void gen6_bsd_setup_status_page(struct drm_device *dev,
> > + struct intel_ring_buffer *ring)
> > +{
> > + drm_i915_private_t *dev_priv = dev->dev_private;
> > + I915_WRITE(GEN6_BSD_HWS_PGA, ring->status_page.gfx_addr);
> > + I915_READ(GEN6_BSD_HWS_PGA);
> > +}
> > +
> > +static inline unsigned int gen6_bsd_ring_get_head(struct drm_device *dev,
> > + struct intel_ring_buffer *ring)
> > +{
> > + drm_i915_private_t *dev_priv = dev->dev_private;
> > + return I915_READ(GEN6_BSD_RING_HEAD) & HEAD_ADDR;
> > +}
> > +
> > +static inline unsigned int gen6_bsd_ring_get_tail(struct drm_device *dev,
> > + struct intel_ring_buffer *ring)
> > +{
> > + drm_i915_private_t *dev_priv = dev->dev_private;
> > + return I915_READ(GEN6_BSD_RING_TAIL) & TAIL_ADDR;
> > +}
> > +
> > +static inline void gen6_bsd_ring_set_tail(struct drm_device *dev,
> > + u32 value)
> > +{
> > + drm_i915_private_t *dev_priv = dev->dev_private;
> > +
> > + /* Every tail move must follow the sequence below */
> > + I915_WRITE(GEN6_BSD_SLEEP_PSMI_CONTROL, 0x00010001);
>
> Magic number. (1 << 16) | (1 << 0) would be better just to distinguish
> between the mask and enable bits (guess). Actually naming the bits for
> that register would be preferable.
I will use some macros instead.
>
> > + I915_WRITE(GEN6_BSD_RNCID, 0x00000000);
> > +
> > + if (wait_for((I915_READ(GEN6_BSD_SLEEP_PSMI_CONTROL) &
> > + GEN6_BSD_SLEEP_PSMI_CONTROL_IDLE_INDICATOR) == 0,
> > + 50, 0))
> > + DRM_ERROR("timed out waiting for IDLE Indicator\n");
> > +
> > + I915_WRITE(GEN6_BSD_RING_TAIL, value);
> > + I915_WRITE(GEN6_BSD_SLEEP_PSMI_CONTROL, 0x00010000);
>
> Do you need to clear the IDLE_INDICATOR here as well?
IDLE_INDICATOR is a read-only field.
>
> > +}
> > +
> > +static inline unsigned int gen6_bsd_ring_get_active_head(struct drm_device *dev,
> > + struct intel_ring_buffer *ring)
> > +{
> > + drm_i915_private_t *dev_priv = dev->dev_private;
> > + return I915_READ(GEN6_BSD_RING_ACTHD);
> > +}
> > +
> > +static inline void gen6_bsd_ring_advance_ring(struct drm_device *dev,
> > + struct intel_ring_buffer *ring)
> > +{
> > + gen6_bsd_ring_set_tail(dev, ring->tail);
> > +}
> > +
> > +static void gen6_bsd_ring_flush(struct drm_device *dev,
> > + struct intel_ring_buffer *ring,
> > + u32 invalidate_domains,
> > + u32 flush_domains)
> > +{
> > + intel_ring_begin(dev, ring, 4);
> > + intel_ring_emit(dev, ring, MI_FLUSH_DW);
> > + intel_ring_emit(dev, ring, 0);
> > + intel_ring_emit(dev, ring, 0);
> > + intel_ring_emit(dev, ring, 0);
> > + intel_ring_advance(dev, ring);
> > +}
> > +
> > +static int
> > +gen6_bsd_ring_dispatch_gem_execbuffer(struct drm_device *dev,
> > + struct intel_ring_buffer *ring,
> > + struct drm_i915_gem_execbuffer2 *exec,
> > + struct drm_clip_rect *cliprects,
> > + uint64_t exec_offset)
> > +{
> > + uint32_t exec_start;
> > + exec_start = (uint32_t) exec_offset + exec->batch_start_offset;
> > + intel_ring_begin(dev, ring, 2);
> > + intel_ring_emit(dev, ring, MI_BATCH_BUFFER_START | MI_BATCH_NON_SECURE_I965); /* bit0-7 is the length on GEN6+ */
> > + intel_ring_emit(dev, ring, exec_start);
> > + intel_ring_advance(dev, ring);
> > + return 0;
> > +}
> > +
> > +/* ring buffer for Video Codec for Gen6+ */
> > +struct intel_ring_buffer gen6_bsd_ring = {
> > + .name = "gen6 bsd ring",
> > + .regs = {
> > + .ctl = GEN6_BSD_RING_CTL,
> > + .head = GEN6_BSD_RING_HEAD,
> > + .tail = GEN6_BSD_RING_TAIL,
> > + .start = GEN6_BSD_RING_START
> > + },
> > + .ring_flag = I915_EXEC_BSD,
> > + .size = 32 * PAGE_SIZE,
> > + .alignment = PAGE_SIZE,
> > + .virtual_start = NULL,
> > + .dev = NULL,
> > + .gem_object = NULL,
> > + .head = 0,
> > + .tail = 0,
> > + .space = 0,
> > + .user_irq_refcount = 0,
> > + .irq_gem_seqno = 0,
> > + .waiting_gem_seqno = 0,
> > + .setup_status_page = gen6_bsd_setup_status_page,
> > + .init = init_bsd_ring,
> > + .get_head = gen6_bsd_ring_get_head,
> > + .get_tail = gen6_bsd_ring_get_tail,
> > + .set_tail = gen6_bsd_ring_set_tail,
> > + .get_active_head = gen6_bsd_ring_get_active_head,
> > + .advance_ring = gen6_bsd_ring_advance_ring,
> > + .flush = gen6_bsd_ring_flush,
> > + .add_request = bsd_ring_add_request,
> > + .get_gem_seqno = bsd_ring_get_gem_seqno,
> > + .user_irq_get = bsd_ring_get_user_irq,
> > + .user_irq_put = bsd_ring_put_user_irq,
> > + .dispatch_gem_execbuffer = gen6_bsd_ring_dispatch_gem_execbuffer,
> > + .status_page = {NULL, 0, NULL},
> > + .map = {0,}
> > +};
> > diff --git a/drivers/gpu/drm/i915/intel_ringbuffer.h b/drivers/gpu/drm/i915/intel_ringbuffer.h
> > index 8245261..9d38c33 100644
> > --- a/drivers/gpu/drm/i915/intel_ringbuffer.h
> > +++ b/drivers/gpu/drm/i915/intel_ringbuffer.h
> > @@ -129,5 +129,6 @@ u32 intel_ring_get_seqno(struct drm_device *dev,
> >
> > extern struct intel_ring_buffer render_ring;
> > extern struct intel_ring_buffer bsd_ring;
> > +extern struct intel_ring_buffer gen6_bsd_ring;
> >
> > #endif /* _INTEL_RINGBUFFER_H_ */
> > --
> > 1.7.0.4
> >
> > _______________________________________________
> > Intel-gfx mailing list
> > Intel-gfx at lists.freedesktop.org
> > http://lists.freedesktop.org/mailman/listinfo/intel-gfx
> >
>
More information about the Intel-gfx
mailing list