[Intel-gfx] [PATCH v2 2/4] drm/i915: Ironlake mobile GPU with VT-d fix

Daniel Vetter daniel at ffwll.ch
Sun Sep 25 11:40:14 CEST 2011


On Sat, Sep 24, 2011 at 03:23:05PM -0700, Ben Widawsky wrote:
> Under certain circumstances, an IOTLB flush never completes and the hardware
> just locks up.  The fix is meant to idle the GPU both before and after
> any unmap occurs.
> 
> This patch also disables the warning which is meant to detect mismatches
> between when we think the command parse and arbiter should be idle, and
> when it actually is.
> 
> Cc: Dave Airlie <airlied at redhat.com>
> Cc: David Woodhouse <dwmw2 at infradead.org>
> Cc: Keith Packard <keithp at keithp.com>
> Cc: Chris Wilson <chris at chris-wilson.co.uk>
> Signed-off-by: Ben Widawsky <ben at bwidawsk.net>

A few nitpicks below ...

> ---
>  drivers/char/agp/intel-gtt.c        |   16 ++++++++++++++
>  drivers/gpu/drm/i915/i915_gem.c     |   32 +++++++++++++++++++---------
>  drivers/gpu/drm/i915/i915_gem_gtt.c |   39 +++++++++++++++++++++++++++++++++++
>  include/drm/intel-gtt.h             |    2 +
>  4 files changed, 79 insertions(+), 10 deletions(-)
> 
> diff --git a/drivers/char/agp/intel-gtt.c b/drivers/char/agp/intel-gtt.c
> index 8515101..47ca42f 100644
> --- a/drivers/char/agp/intel-gtt.c
> +++ b/drivers/char/agp/intel-gtt.c
> @@ -923,6 +923,9 @@ static int intel_fake_agp_insert_entries(struct agp_memory *mem,
>  {
>  	int ret = -EINVAL;
>  
> +	if (intel_private.base.do_idle_maps)
> +		return -ENODEV;

This reminds me to kick out intel-agp support for ilk+. Upstream never
ever supported ums without gem on these, and that's the only reason we
have this agp compat code still lying around.

> +
>  	if (intel_private.clear_fake_agp) {
>  		int start = intel_private.base.stolen_size / PAGE_SIZE;
>  		int end = intel_private.base.gtt_mappable_entries;
> @@ -985,6 +988,9 @@ static int intel_fake_agp_remove_entries(struct agp_memory *mem,
>  	if (mem->page_count == 0)
>  		return 0;
>  
> +	if (intel_private.base.do_idle_maps)
> +		return -ENODEV;
> +
>  	intel_gtt_clear_range(pg_start, mem->page_count);
>  
>  	if (intel_private.base.needs_dmar) {
> @@ -1180,8 +1186,12 @@ static void gen6_cleanup(void)
>  static int i9xx_setup(void)
>  {
>  	u32 reg_addr;
> +	u16 gmch_ctrl;
> +	const unsigned short gpu_devid = intel_private.pcidev->device;
>  
>  	pci_read_config_dword(intel_private.pcidev, I915_MMADDR, &reg_addr);
> +	pci_read_config_word(intel_private.bridge_dev,
> +			     I830_GMCH_CTRL, &gmch_ctrl);
>  
>  	reg_addr &= 0xfff80000;
>  
> @@ -1211,6 +1221,12 @@ static int i9xx_setup(void)
>  		intel_private.gtt_bus_addr = reg_addr + gtt_offset;
>  	}
>  
> +	if ((gpu_devid == PCI_DEVICE_ID_INTEL_IRONLAKE_M_HB ||
> +	     gpu_devid == PCI_DEVICE_ID_INTEL_IRONLAKE_M_IG) &&
> +	     (gmch_ctrl & G4x_GMCH_SIZE_VT_EN) &&
> +	     intel_private.base.needs_dmar)
> +		intel_private.base.do_idle_maps = 1;

Can you extract that horrible condition into e.g.
NEEDS_ILK_IOMMU_WORKAROUND or something like that? I think future me will
go wtf on this without the context ...

> +
>  	intel_i9xx_setup_flush();
>  
>  	return 0;
> diff --git a/drivers/gpu/drm/i915/i915_gem.c b/drivers/gpu/drm/i915/i915_gem.c
> index 61ce1b7..d369e48 100644
> --- a/drivers/gpu/drm/i915/i915_gem.c
> +++ b/drivers/gpu/drm/i915/i915_gem.c
> @@ -2268,27 +2268,39 @@ static int i915_ring_idle(struct intel_ring_buffer *ring)
>  	return i915_wait_request(ring, i915_gem_next_request_seqno(ring));
>  }
>  
> +static int
> +flush_rings(drm_i915_private_t *dev_priv)
> +{
> +	int i, ret;
> +
> +	/* Flush everything onto the inactive list. */
> +	for (i = 0; i < I915_NUM_RINGS; i++) {
> +		ret = i915_ring_idle(&dev_priv->ring[i]);
> +		if (ret)
> +			return ret;
> +	}
> +
> +	return 0;
> +}
> +
>  int
>  i915_gpu_idle(struct drm_device *dev)
>  {
>  	drm_i915_private_t *dev_priv = dev->dev_private;
>  	bool lists_empty;
> -	int ret, i;
>  
>  	lists_empty = (list_empty(&dev_priv->mm.flushing_list) &&
>  		       list_empty(&dev_priv->mm.active_list));
>  	if (lists_empty) {
> -		WARN_ON(!(I915_READ(MI_MODE) & MI_RINGS_IDLE));
> -		return 0;
> -
> -	/* Flush everything onto the inactive list. */
> -	for (i = 0; i < I915_NUM_RINGS; i++) {
> -		ret = i915_ring_idle(&dev_priv->ring[i]);
> -		if (ret)
> -			return ret;
> +		/* If we require idle maps, enforce the ring is idle */
> +		bool ring_idle = (I915_READ(MI_MODE) & MI_RINGS_IDLE) != 0;
> +		if (!ring_idle && dev_priv->mm.gtt->do_idle_maps)
> +			return flush_rings(dev_priv);
> +		else
> +			return 0;

Can you extract this hack into its own patch? This way
- the actual work-around would stand out more clearly
- we put more emphasive on the fact that we seem to lose track of things.

>  	}
>  
> -	return 0;
> +	return flush_rings(dev_priv);
>  }
>  
>  static int sandybridge_write_fence_reg(struct drm_i915_gem_object *obj,
> diff --git a/drivers/gpu/drm/i915/i915_gem_gtt.c b/drivers/gpu/drm/i915/i915_gem_gtt.c
> index 7a709cd..0c6226b 100644
> --- a/drivers/gpu/drm/i915/i915_gem_gtt.c
> +++ b/drivers/gpu/drm/i915/i915_gem_gtt.c
> @@ -49,10 +49,39 @@ static unsigned int cache_level_to_agp_type(struct drm_device *dev,
>  	}
>  }
>  
> +static bool do_idling(struct drm_i915_private *dev_priv)
> +{
> +	bool ret = dev_priv->mm.interruptible;
> +
> +	if (dev_priv->mm.gtt->do_idle_maps) {
> +		dev_priv->mm.interruptible = false;
> +		if (i915_gpu_idle(dev_priv->dev))
> +			DRM_ERROR("couldn't idle GPU %d\n", ret);
> +	}

I don't like the uninterruptible sleep in core gem - this is only for
modesetting where backtracking is just not really feasible. I've quickly
checked the code and I haven't seen any problems in handing back the
-ERESTARTSYS to gem_object_unbind.

> +
> +	return ret;
> +}
> +
> +static void undo_idling(struct drm_i915_private *dev_priv, bool idle)
> +{
> +	int ret;
> +	if (!dev_priv->mm.gtt->do_idle_maps)
> +		return;
> +
> +	/*NB: since GTT mappings don't actually touch the GPU, this is not
> +	 * strictly necessary.
> +	 */
> +	ret = i915_gpu_idle(dev_priv->dev);
> +	if (ret)
> +		DRM_ERROR("couldn't idle GPU %d\n", ret);
> +	dev_priv->mm.interruptible = idle;
> +}
> +
>  void i915_gem_restore_gtt_mappings(struct drm_device *dev)
>  {
>  	struct drm_i915_private *dev_priv = dev->dev_private;
>  	struct drm_i915_gem_object *obj;
> +	bool idle;

Patch-dirt? 2 more below ...

>  
>  	/* First fill our portion of the GTT with scratch pages */
>  	intel_gtt_clear_range(dev_priv->mm.gtt_start / PAGE_SIZE,
> @@ -71,6 +100,7 @@ int i915_gem_gtt_bind_object(struct drm_i915_gem_object *obj)
>  	struct drm_device *dev = obj->base.dev;
>  	struct drm_i915_private *dev_priv = dev->dev_private;
>  	unsigned int agp_type = cache_level_to_agp_type(dev, obj->cache_level);
> +	bool idle;
>  	int ret;
>  
>  	if (dev_priv->mm.gtt->needs_dmar) {
> @@ -100,6 +130,7 @@ void i915_gem_gtt_rebind_object(struct drm_i915_gem_object *obj,
>  	struct drm_device *dev = obj->base.dev;
>  	struct drm_i915_private *dev_priv = dev->dev_private;
>  	unsigned int agp_type = cache_level_to_agp_type(dev, cache_level);
> +	bool idle;
>  
>  	if (dev_priv->mm.gtt->needs_dmar) {
>  		BUG_ON(!obj->sg_list);
> @@ -117,6 +148,12 @@ void i915_gem_gtt_rebind_object(struct drm_i915_gem_object *obj,
>  
>  void i915_gem_gtt_unbind_object(struct drm_i915_gem_object *obj)
>  {
> +	struct drm_device *dev = obj->base.dev;
> +	struct drm_i915_private *dev_priv = dev->dev_private;
> +	bool idle;
> +
> +	idle = do_idling(dev_priv);
> +
>  	intel_gtt_clear_range(obj->gtt_space->start >> PAGE_SHIFT,
>  			      obj->base.size >> PAGE_SHIFT);
>  
> @@ -124,4 +161,6 @@ void i915_gem_gtt_unbind_object(struct drm_i915_gem_object *obj)
>  		intel_gtt_unmap_memory(obj->sg_list, obj->num_sg);
>  		obj->sg_list = NULL;
>  	}
> +
> +	undo_idling(dev_priv, idle);
>  }
> diff --git a/include/drm/intel-gtt.h b/include/drm/intel-gtt.h
> index 9e343c0..b174620 100644
> --- a/include/drm/intel-gtt.h
> +++ b/include/drm/intel-gtt.h
> @@ -13,6 +13,8 @@ const struct intel_gtt {
>  	unsigned int gtt_mappable_entries;
>  	/* Whether i915 needs to use the dmar apis or not. */
>  	unsigned int needs_dmar : 1;
> +	/* Whether we idle the gpu before mapping/unmapping */
> +	unsigned int do_idle_maps : 1;
>  } *intel_gtt_get(void);
>  
>  void intel_gtt_chipset_flush(void);
> -- 
> 1.7.6.3
> 
> _______________________________________________
> Intel-gfx mailing list
> Intel-gfx at lists.freedesktop.org
> http://lists.freedesktop.org/mailman/listinfo/intel-gfx

-- 
Daniel Vetter
Mail: daniel at ffwll.ch
Mobile: +41 (0)79 365 57 48



More information about the Intel-gfx mailing list