[Intel-gfx] [PATCH 05/23] drm/i915: Remove locking from i915_gem_object_prepare_read/write

Tvrtko Ursulin tvrtko.ursulin at linux.intel.com
Fri Jul 3 13:43:43 UTC 2020


On 03/07/2020 13:22, Maarten Lankhorst wrote:
> Execbuffer submission will perform its own WW locking, so we cannot
> rely on the implicit lock taken inside
> i915_gem_object_prepare_read/write there.
> 
> This also makes it clear that the GVT code will get a lockdep splat when
> multiple batchbuffer shadows need to be performed in the same instance;
> fix that up as well.
> 
> Signed-off-by: Maarten Lankhorst <maarten.lankhorst at linux.intel.com>

You have my r-b for this one from the previous round.

Regards,

Tvrtko

> ---
>   drivers/gpu/drm/i915/gem/i915_gem_domain.c    | 20 ++++++-------------
>   .../gpu/drm/i915/gem/i915_gem_execbuffer.c    | 13 ++++++++++--
>   drivers/gpu/drm/i915/gem/i915_gem_object.h    |  1 -
>   .../gpu/drm/i915/gem/selftests/huge_pages.c   |  5 ++++-
>   .../i915/gem/selftests/i915_gem_coherency.c   | 14 +++++++++----
>   .../drm/i915/gem/selftests/i915_gem_context.c | 12 ++++++++---
>   drivers/gpu/drm/i915/gvt/cmd_parser.c         |  1 +
>   drivers/gpu/drm/i915/i915_gem.c               | 20 +++++++++++++++++--
>   8 files changed, 59 insertions(+), 27 deletions(-)
> 
> diff --git a/drivers/gpu/drm/i915/gem/i915_gem_domain.c b/drivers/gpu/drm/i915/gem/i915_gem_domain.c
> index c0acfc97fae3..8ebceebd11b0 100644
> --- a/drivers/gpu/drm/i915/gem/i915_gem_domain.c
> +++ b/drivers/gpu/drm/i915/gem/i915_gem_domain.c
> @@ -576,19 +576,17 @@ int i915_gem_object_prepare_read(struct drm_i915_gem_object *obj,
>   	if (!i915_gem_object_has_struct_page(obj))
>   		return -ENODEV;
>   
> -	ret = i915_gem_object_lock_interruptible(obj, NULL);
> -	if (ret)
> -		return ret;
> +	assert_object_held(obj);
>   
>   	ret = i915_gem_object_wait(obj,
>   				   I915_WAIT_INTERRUPTIBLE,
>   				   MAX_SCHEDULE_TIMEOUT);
>   	if (ret)
> -		goto err_unlock;
> +		return ret;
>   
>   	ret = i915_gem_object_pin_pages(obj);
>   	if (ret)
> -		goto err_unlock;
> +		return ret;
>   
>   	if (obj->cache_coherent & I915_BO_CACHE_COHERENT_FOR_READ ||
>   	    !static_cpu_has(X86_FEATURE_CLFLUSH)) {
> @@ -616,8 +614,6 @@ int i915_gem_object_prepare_read(struct drm_i915_gem_object *obj,
>   
>   err_unpin:
>   	i915_gem_object_unpin_pages(obj);
> -err_unlock:
> -	i915_gem_object_unlock(obj);
>   	return ret;
>   }
>   
> @@ -630,20 +626,18 @@ int i915_gem_object_prepare_write(struct drm_i915_gem_object *obj,
>   	if (!i915_gem_object_has_struct_page(obj))
>   		return -ENODEV;
>   
> -	ret = i915_gem_object_lock_interruptible(obj, NULL);
> -	if (ret)
> -		return ret;
> +	assert_object_held(obj);
>   
>   	ret = i915_gem_object_wait(obj,
>   				   I915_WAIT_INTERRUPTIBLE |
>   				   I915_WAIT_ALL,
>   				   MAX_SCHEDULE_TIMEOUT);
>   	if (ret)
> -		goto err_unlock;
> +		return ret;
>   
>   	ret = i915_gem_object_pin_pages(obj);
>   	if (ret)
> -		goto err_unlock;
> +		return ret;
>   
>   	if (obj->cache_coherent & I915_BO_CACHE_COHERENT_FOR_WRITE ||
>   	    !static_cpu_has(X86_FEATURE_CLFLUSH)) {
> @@ -680,7 +674,5 @@ int i915_gem_object_prepare_write(struct drm_i915_gem_object *obj,
>   
>   err_unpin:
>   	i915_gem_object_unpin_pages(obj);
> -err_unlock:
> -	i915_gem_object_unlock(obj);
>   	return ret;
>   }
> diff --git a/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c b/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c
> index 370c1cbc4d3b..c2a4e499233b 100644
> --- a/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c
> +++ b/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c
> @@ -996,11 +996,14 @@ static void reloc_cache_reset(struct reloc_cache *cache)
>   
>   	vaddr = unmask_page(cache->vaddr);
>   	if (cache->vaddr & KMAP) {
> +		struct drm_i915_gem_object *obj =
> +			(struct drm_i915_gem_object *)cache->node.mm;
>   		if (cache->vaddr & CLFLUSH_AFTER)
>   			mb();
>   
>   		kunmap_atomic(vaddr);
> -		i915_gem_object_finish_access((struct drm_i915_gem_object *)cache->node.mm);
> +		i915_gem_object_finish_access(obj);
> +		i915_gem_object_unlock(obj);
>   	} else {
>   		struct i915_ggtt *ggtt = cache_to_ggtt(cache);
>   
> @@ -1035,10 +1038,16 @@ static void *reloc_kmap(struct drm_i915_gem_object *obj,
>   		unsigned int flushes;
>   		int err;
>   
> -		err = i915_gem_object_prepare_write(obj, &flushes);
> +		err = i915_gem_object_lock_interruptible(obj, NULL);
>   		if (err)
>   			return ERR_PTR(err);
>   
> +		err = i915_gem_object_prepare_write(obj, &flushes);
> +		if (err) {
> +			i915_gem_object_unlock(obj);
> +			return ERR_PTR(err);
> +		}
> +
>   		BUILD_BUG_ON(KMAP & CLFLUSH_FLAGS);
>   		BUILD_BUG_ON((KMAP | CLFLUSH_FLAGS) & PAGE_MASK);
>   
> diff --git a/drivers/gpu/drm/i915/gem/i915_gem_object.h b/drivers/gpu/drm/i915/gem/i915_gem_object.h
> index 5103067269b0..11b8e2735071 100644
> --- a/drivers/gpu/drm/i915/gem/i915_gem_object.h
> +++ b/drivers/gpu/drm/i915/gem/i915_gem_object.h
> @@ -434,7 +434,6 @@ static inline void
>   i915_gem_object_finish_access(struct drm_i915_gem_object *obj)
>   {
>   	i915_gem_object_unpin_pages(obj);
> -	i915_gem_object_unlock(obj);
>   }
>   
>   static inline struct intel_engine_cs *
> diff --git a/drivers/gpu/drm/i915/gem/selftests/huge_pages.c b/drivers/gpu/drm/i915/gem/selftests/huge_pages.c
> index eb2011ccb92b..fff11327a8da 100644
> --- a/drivers/gpu/drm/i915/gem/selftests/huge_pages.c
> +++ b/drivers/gpu/drm/i915/gem/selftests/huge_pages.c
> @@ -964,9 +964,10 @@ __cpu_check_shmem(struct drm_i915_gem_object *obj, u32 dword, u32 val)
>   	unsigned long n;
>   	int err;
>   
> +	i915_gem_object_lock(obj, NULL);
>   	err = i915_gem_object_prepare_read(obj, &needs_flush);
>   	if (err)
> -		return err;
> +		goto err_unlock;
>   
>   	for (n = 0; n < obj->base.size >> PAGE_SHIFT; ++n) {
>   		u32 *ptr = kmap_atomic(i915_gem_object_get_page(obj, n));
> @@ -986,6 +987,8 @@ __cpu_check_shmem(struct drm_i915_gem_object *obj, u32 dword, u32 val)
>   	}
>   
>   	i915_gem_object_finish_access(obj);
> +err_unlock:
> +	i915_gem_object_unlock(obj);
>   
>   	return err;
>   }
> diff --git a/drivers/gpu/drm/i915/gem/selftests/i915_gem_coherency.c b/drivers/gpu/drm/i915/gem/selftests/i915_gem_coherency.c
> index 1de2959b153c..dcdfc396f2f8 100644
> --- a/drivers/gpu/drm/i915/gem/selftests/i915_gem_coherency.c
> +++ b/drivers/gpu/drm/i915/gem/selftests/i915_gem_coherency.c
> @@ -27,9 +27,10 @@ static int cpu_set(struct context *ctx, unsigned long offset, u32 v)
>   	u32 *cpu;
>   	int err;
>   
> +	i915_gem_object_lock(ctx->obj, NULL);
>   	err = i915_gem_object_prepare_write(ctx->obj, &needs_clflush);
>   	if (err)
> -		return err;
> +		goto out;
>   
>   	page = i915_gem_object_get_page(ctx->obj, offset >> PAGE_SHIFT);
>   	map = kmap_atomic(page);
> @@ -46,7 +47,9 @@ static int cpu_set(struct context *ctx, unsigned long offset, u32 v)
>   	kunmap_atomic(map);
>   	i915_gem_object_finish_access(ctx->obj);
>   
> -	return 0;
> +out:
> +	i915_gem_object_unlock(ctx->obj);
> +	return err;
>   }
>   
>   static int cpu_get(struct context *ctx, unsigned long offset, u32 *v)
> @@ -57,9 +60,10 @@ static int cpu_get(struct context *ctx, unsigned long offset, u32 *v)
>   	u32 *cpu;
>   	int err;
>   
> +	i915_gem_object_lock(ctx->obj, NULL);
>   	err = i915_gem_object_prepare_read(ctx->obj, &needs_clflush);
>   	if (err)
> -		return err;
> +		goto out;
>   
>   	page = i915_gem_object_get_page(ctx->obj, offset >> PAGE_SHIFT);
>   	map = kmap_atomic(page);
> @@ -73,7 +77,9 @@ static int cpu_get(struct context *ctx, unsigned long offset, u32 *v)
>   	kunmap_atomic(map);
>   	i915_gem_object_finish_access(ctx->obj);
>   
> -	return 0;
> +out:
> +	i915_gem_object_unlock(ctx->obj);
> +	return err;
>   }
>   
>   static int gtt_set(struct context *ctx, unsigned long offset, u32 v)
> diff --git a/drivers/gpu/drm/i915/gem/selftests/i915_gem_context.c b/drivers/gpu/drm/i915/gem/selftests/i915_gem_context.c
> index 438c15ef2184..76671f587b9d 100644
> --- a/drivers/gpu/drm/i915/gem/selftests/i915_gem_context.c
> +++ b/drivers/gpu/drm/i915/gem/selftests/i915_gem_context.c
> @@ -461,9 +461,10 @@ static int cpu_fill(struct drm_i915_gem_object *obj, u32 value)
>   	unsigned int n, m, need_flush;
>   	int err;
>   
> +	i915_gem_object_lock(obj, NULL);
>   	err = i915_gem_object_prepare_write(obj, &need_flush);
>   	if (err)
> -		return err;
> +		goto out;
>   
>   	for (n = 0; n < real_page_count(obj); n++) {
>   		u32 *map;
> @@ -479,7 +480,9 @@ static int cpu_fill(struct drm_i915_gem_object *obj, u32 value)
>   	i915_gem_object_finish_access(obj);
>   	obj->read_domains = I915_GEM_DOMAIN_GTT | I915_GEM_DOMAIN_CPU;
>   	obj->write_domain = 0;
> -	return 0;
> +out:
> +	i915_gem_object_unlock(obj);
> +	return err;
>   }
>   
>   static noinline int cpu_check(struct drm_i915_gem_object *obj,
> @@ -488,9 +491,10 @@ static noinline int cpu_check(struct drm_i915_gem_object *obj,
>   	unsigned int n, m, needs_flush;
>   	int err;
>   
> +	i915_gem_object_lock(obj, NULL);
>   	err = i915_gem_object_prepare_read(obj, &needs_flush);
>   	if (err)
> -		return err;
> +		goto out_unlock;
>   
>   	for (n = 0; n < real_page_count(obj); n++) {
>   		u32 *map;
> @@ -527,6 +531,8 @@ static noinline int cpu_check(struct drm_i915_gem_object *obj,
>   	}
>   
>   	i915_gem_object_finish_access(obj);
> +out_unlock:
> +	i915_gem_object_unlock(obj);
>   	return err;
>   }
>   
> diff --git a/drivers/gpu/drm/i915/gvt/cmd_parser.c b/drivers/gpu/drm/i915/gvt/cmd_parser.c
> index 943c8d232703..d0a599b51bfe 100644
> --- a/drivers/gpu/drm/i915/gvt/cmd_parser.c
> +++ b/drivers/gpu/drm/i915/gvt/cmd_parser.c
> @@ -1923,6 +1923,7 @@ static int perform_bb_shadow(struct parser_exec_state *s)
>   	if (ret)
>   		goto err_unmap;
>   
> +	i915_gem_object_unlock(bb->obj);
>   	INIT_LIST_HEAD(&bb->list);
>   	list_add(&bb->list, &s->workload->shadow_bb);
>   
> diff --git a/drivers/gpu/drm/i915/i915_gem.c b/drivers/gpu/drm/i915/i915_gem.c
> index 1e06752835e5..33f6f88c8b08 100644
> --- a/drivers/gpu/drm/i915/i915_gem.c
> +++ b/drivers/gpu/drm/i915/i915_gem.c
> @@ -335,12 +335,20 @@ i915_gem_shmem_pread(struct drm_i915_gem_object *obj,
>   	u64 remain;
>   	int ret;
>   
> -	ret = i915_gem_object_prepare_read(obj, &needs_clflush);
> +	ret = i915_gem_object_lock_interruptible(obj, NULL);
>   	if (ret)
>   		return ret;
>   
> +	ret = i915_gem_object_prepare_read(obj, &needs_clflush);
> +	if (ret) {
> +		i915_gem_object_unlock(obj);
> +		return ret;
> +	}
> +
>   	fence = i915_gem_object_lock_fence(obj);
>   	i915_gem_object_finish_access(obj);
> +	i915_gem_object_unlock(obj);
> +
>   	if (!fence)
>   		return -ENOMEM;
>   
> @@ -734,12 +742,20 @@ i915_gem_shmem_pwrite(struct drm_i915_gem_object *obj,
>   	u64 remain;
>   	int ret;
>   
> -	ret = i915_gem_object_prepare_write(obj, &needs_clflush);
> +	ret = i915_gem_object_lock_interruptible(obj, NULL);
>   	if (ret)
>   		return ret;
>   
> +	ret = i915_gem_object_prepare_write(obj, &needs_clflush);
> +	if (ret) {
> +		i915_gem_object_unlock(obj);
> +		return ret;
> +	}
> +
>   	fence = i915_gem_object_lock_fence(obj);
>   	i915_gem_object_finish_access(obj);
> +	i915_gem_object_unlock(obj);
> +
>   	if (!fence)
>   		return -ENOMEM;
>   
> 


More information about the Intel-gfx mailing list