[Intel-gfx] [PATCH] drm/i915: Revoke fenced GTT mmapings across GPU reset
Tvrtko Ursulin
tvrtko.ursulin at linux.intel.com
Wed Jan 4 15:47:50 UTC 2017
On 04/01/2017 15:45, Chris Wilson wrote:
> On Wed, Jan 04, 2017 at 03:36:16PM +0000, Tvrtko Ursulin wrote:
>>
>> On 04/01/2017 14:51, Chris Wilson wrote:
>>> During the fence registers are clobbered by a GPU reset. Hence if
>>
>> During the reset I suppose, although it would sound still a bit
>> redundant. So maybe "Since GPU reset clobbers the fence registers,
>> if there is concurrent..."
>
> I was just going to leave it as "The fence registers are clobbered by
> a GPU reset. If..."
Fine by me.
>>> there is concurrent user access to a fenced region via a GTT mmaping,
>>> the access will not be fenced during the reset (until we restore the
>>> fences afterwards). In order to prevent invalid access during the reset,
>>> before we clobber the fences we must invalidate the GTT mmapings. Access
>>> to the mmap will then be forced to fault the page, and in handling the
>>> fault, i915_gem_fault() will take the struct_mutex and wait upon the
>>> reset to complete.
>>>
>>> Bugzilla: https://bugs.freedesktop.org/show_bug.cgi?id=99274
>>> Signed-off-by: Chris Wilson <chris at chris-wilson.co.uk>
>>> ---
>>> drivers/gpu/drm/i915/i915_drv.c | 3 ++-
>>> drivers/gpu/drm/i915/i915_drv.h | 4 +++-
>>> drivers/gpu/drm/i915/i915_gem.c | 7 ++++++-
>>> drivers/gpu/drm/i915/i915_gem_fence_reg.c | 24 ++++++++++++++++++++++++
>>> 4 files changed, 35 insertions(+), 3 deletions(-)
>>>
>>> diff --git a/drivers/gpu/drm/i915/i915_drv.c b/drivers/gpu/drm/i915/i915_drv.c
>>> index 72e29fcb1638..39463fcab593 100644
>>> --- a/drivers/gpu/drm/i915/i915_drv.c
>>> +++ b/drivers/gpu/drm/i915/i915_drv.c
>>> @@ -1780,6 +1780,7 @@ void i915_reset(struct drm_i915_private *dev_priv)
>>> error->reset_count++;
>>>
>>> pr_notice("drm/i915: Resetting chip after gpu hang\n");
>>> + i915_gem_reset_prepare(dev_priv);
>>>
>>> disable_engines_irq(dev_priv);
>>> ret = intel_gpu_reset(dev_priv, ALL_ENGINES);
>>> @@ -1793,7 +1794,7 @@ void i915_reset(struct drm_i915_private *dev_priv)
>>> goto error;
>>> }
>>>
>>> - i915_gem_reset(dev_priv);
>>> + i915_gem_reset_finish(dev_priv);
>>> intel_overlay_reset(dev_priv);
>>>
>>> /* Ok, now get things going again... */
>>> diff --git a/drivers/gpu/drm/i915/i915_drv.h b/drivers/gpu/drm/i915/i915_drv.h
>>> index c035b6576efa..f16986cfa127 100644
>>> --- a/drivers/gpu/drm/i915/i915_drv.h
>>> +++ b/drivers/gpu/drm/i915/i915_drv.h
>>> @@ -3355,7 +3355,8 @@ static inline u32 i915_reset_count(struct i915_gpu_error *error)
>>> return READ_ONCE(error->reset_count);
>>> }
>>>
>>> -void i915_gem_reset(struct drm_i915_private *dev_priv);
>>> +void i915_gem_reset_prepare(struct drm_i915_private *dev_priv);
>>> +void i915_gem_reset_finish(struct drm_i915_private *dev_priv);
>>> void i915_gem_set_wedged(struct drm_i915_private *dev_priv);
>>>
>>> void i915_gem_clflush_init(struct drm_i915_private *i915);
>>> @@ -3426,6 +3427,7 @@ i915_vm_to_ppgtt(struct i915_address_space *vm)
>>> int __must_check i915_vma_get_fence(struct i915_vma *vma);
>>> int __must_check i915_vma_put_fence(struct i915_vma *vma);
>>>
>>> +void i915_gem_revoke_fences(struct drm_i915_private *dev_priv);
>>> void i915_gem_restore_fences(struct drm_i915_private *dev_priv);
>>>
>>> void i915_gem_detect_bit_6_swizzle(struct drm_i915_private *dev_priv);
>>> diff --git a/drivers/gpu/drm/i915/i915_gem.c b/drivers/gpu/drm/i915/i915_gem.c
>>> index 73987014a7bd..019ea7cb13b5 100644
>>> --- a/drivers/gpu/drm/i915/i915_gem.c
>>> +++ b/drivers/gpu/drm/i915/i915_gem.c
>>> @@ -2715,6 +2715,11 @@ static void reset_request(struct drm_i915_gem_request *request)
>>> memset(vaddr + head, 0, request->postfix - head);
>>> }
>>>
>>> +void i915_gem_reset_prepare(struct drm_i915_private *dev_priv)
>>> +{
>>> + i915_gem_revoke_fences(dev_priv);
>>> +}
>>> +
>>> static void i915_gem_reset_engine(struct intel_engine_cs *engine)
>>> {
>>> struct drm_i915_gem_request *request;
>>> @@ -2780,7 +2785,7 @@ static void i915_gem_reset_engine(struct intel_engine_cs *engine)
>>> spin_unlock_irqrestore(&engine->timeline->lock, flags);
>>> }
>>>
>>> -void i915_gem_reset(struct drm_i915_private *dev_priv)
>>> +void i915_gem_reset_finish(struct drm_i915_private *dev_priv)
>>> {
>>> struct intel_engine_cs *engine;
>>> enum intel_engine_id id;
>>> diff --git a/drivers/gpu/drm/i915/i915_gem_fence_reg.c b/drivers/gpu/drm/i915/i915_gem_fence_reg.c
>>> index 67835d7b39c7..447abb1105ab 100644
>>> --- a/drivers/gpu/drm/i915/i915_gem_fence_reg.c
>>> +++ b/drivers/gpu/drm/i915/i915_gem_fence_reg.c
>>> @@ -358,6 +358,30 @@ i915_vma_get_fence(struct i915_vma *vma)
>>> }
>>>
>>> /**
>>> + * i915_gem_revoke_fences - revoke fence state
>>> + * @dev_priv: i915 device private
>>> + *
>>> + * Clears the hw fence state and removes all GTT mmappings via the fence. This
>>
>> The function doesn't clear the hw fence state - reset does that, no?
>
> The first version did, then realised all that was required was zapping
> the mmap.
Explains that then. :)
Regards,
Tvrtko
More information about the Intel-gfx
mailing list