[Intel-gfx] [PATCH 06/23] drm/i915: Parse command buffer earlier in eb_relocate(slow)
Tvrtko Ursulin
tvrtko.ursulin at linux.intel.com
Fri Jul 3 13:49:08 UTC 2020
On 03/07/2020 13:22, Maarten Lankhorst wrote:
> We want to introduce backoff logic, but we need to lock the
> pool object as well for command parsing. Because of this, we
> will need backoff logic for the engine pool obj too. Move the
> batch validation up slightly into eb_lookup_vmas, and move the
> actual command parsing into a separate function which can be
> called from both the execbuf relocation fast and slow paths.
On this one I also had some feedback in the previous round which you
may have missed.
Regards,
Tvrtko
> Signed-off-by: Maarten Lankhorst <maarten.lankhorst at linux.intel.com>
> ---
> .../gpu/drm/i915/gem/i915_gem_execbuffer.c | 68 ++++++++++---------
> 1 file changed, 37 insertions(+), 31 deletions(-)
>
> diff --git a/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c b/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c
> index c2a4e499233b..64b75f71a6bb 100644
> --- a/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c
> +++ b/drivers/gpu/drm/i915/gem/i915_gem_execbuffer.c
> @@ -290,6 +290,8 @@ struct i915_execbuffer {
> struct eb_vma_array *array;
> };
>
> +static int eb_parse(struct i915_execbuffer *eb);
> +
> static inline bool eb_use_cmdparser(const struct i915_execbuffer *eb)
> {
> return intel_engine_requires_cmd_parser(eb->engine) ||
> @@ -866,6 +868,7 @@ static struct i915_vma *eb_lookup_vma(struct i915_execbuffer *eb, u32 handle)
>
> static int eb_lookup_vmas(struct i915_execbuffer *eb)
> {
> + struct drm_i915_private *i915 = eb->i915;
> unsigned int batch = eb_batch_index(eb);
> unsigned int i;
> int err = 0;
> @@ -879,18 +882,37 @@ static int eb_lookup_vmas(struct i915_execbuffer *eb)
> vma = eb_lookup_vma(eb, eb->exec[i].handle);
> if (IS_ERR(vma)) {
> err = PTR_ERR(vma);
> - break;
> + goto err;
> }
>
> err = eb_validate_vma(eb, &eb->exec[i], vma);
> if (unlikely(err)) {
> i915_vma_put(vma);
> - break;
> + goto err;
> }
>
> eb_add_vma(eb, i, batch, vma);
> }
>
> + if (unlikely(eb->batch->flags & EXEC_OBJECT_WRITE)) {
> + drm_dbg(&i915->drm,
> + "Attempting to use self-modifying batch buffer\n");
> + return -EINVAL;
> + }
> +
> + if (range_overflows_t(u64,
> + eb->batch_start_offset, eb->batch_len,
> + eb->batch->vma->size)) {
> + drm_dbg(&i915->drm, "Attempting to use out-of-bounds batch\n");
> + return -EINVAL;
> + }
> +
> + if (eb->batch_len == 0)
> + eb->batch_len = eb->batch->vma->size - eb->batch_start_offset;
> +
> + return 0;
> +
> +err:
> eb->vma[i].vma = NULL;
> return err;
> }
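
For context, range_overflows_t() (a helper from i915_utils.h) is what makes
this bounds check safe against u64 wraparound: a naive "start + size > max"
comparison can wrap and wrongly accept an out-of-bounds batch. A minimal
userspace sketch of the same check; the function name and the demo program
are illustrative only, modelled on the kernel's range_overflows() logic:

#include <stdint.h>
#include <stdbool.h>
#include <stdio.h>

/*
 * Overflow-safe bounds check, modelled on the kernel's
 * range_overflows() helper: accept only start < max and
 * start + size <= max, evaluated so nothing can wrap.
 * The "size > max" test keeps "max - size" from underflowing.
 */
static bool range_out_of_bounds(uint64_t start, uint64_t size, uint64_t max)
{
	return start >= max || size > max || start > max - size;
}

int main(void)
{
	/* In bounds: batch at 0x1000, 0x100 bytes, 0x2000-byte object. */
	printf("%d\n", range_out_of_bounds(0x1000, 0x100, 0x2000)); /* 0 */

	/*
	 * A naive "start + size > max" wraps here (0x1000 + UINT64_MAX
	 * == 0xfff mod 2^64) and would wrongly accept the range.
	 */
	printf("%d\n", range_out_of_bounds(0x1000, UINT64_MAX, 0x2000)); /* 1 */

	return 0;
}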
> @@ -1802,7 +1824,7 @@ static int eb_prefault_relocations(const struct i915_execbuffer *eb)
> return 0;
> }
>
> -static noinline int eb_relocate_slow(struct i915_execbuffer *eb)
> +static noinline int eb_relocate_parse_slow(struct i915_execbuffer *eb)
> {
> bool have_copy = false;
> struct eb_vma *ev;
> @@ -1868,6 +1890,11 @@ static noinline int eb_relocate_slow(struct i915_execbuffer *eb)
> if (err)
> goto err;
>
> + /* As a last step, parse the command buffer */
> + err = eb_parse(eb);
> + if (err)
> + goto err;
> +
> /*
> * Leave the user relocations as are, this is the painfully slow path,
> * and we want to avoid the complication of dropping the lock whilst
> @@ -1900,7 +1927,7 @@ static noinline int eb_relocate_slow(struct i915_execbuffer *eb)
> return err;
> }
>
> -static int eb_relocate(struct i915_execbuffer *eb)
> +static int eb_relocate_parse(struct i915_execbuffer *eb)
> {
> int err;
>
> @@ -1925,10 +1952,10 @@ static int eb_relocate(struct i915_execbuffer *eb)
> }
>
> if (err)
> - return eb_relocate_slow(eb);
> + return eb_relocate_parse_slow(eb);
> }
>
> - return 0;
> + return eb_parse(eb);
> }
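
To make the new structure concrete: eb_parse() now runs as the final step
of both paths, either directly at the end of eb_relocate_parse() on the
fast path, or inside eb_relocate_parse_slow() after the copied relocations
have been applied. A toy userspace model of that control flow follows; all
names and the -EAGAIN trigger are illustrative, not the i915 code:

#include <stdio.h>
#include <errno.h>

/* Toy model of the restructured execbuf flow: command parsing is
 * the final step of both the fast and the slow relocation path. */

static int parse_cmdbuf(void)
{
	puts("parse command buffer");
	return 0;
}

static int relocate_fast(int fault)
{
	if (fault)
		return -EAGAIN; /* e.g. user pages not resident */
	puts("fast relocations applied");
	return 0;
}

static int relocate_parse_slow(void)
{
	puts("slow path: prefault, copy and apply relocations");
	return parse_cmdbuf(); /* parse as the last step */
}

static int relocate_parse(int fault)
{
	int err = relocate_fast(fault);

	if (err == -EAGAIN)
		return relocate_parse_slow();
	if (err)
		return err;

	return parse_cmdbuf(); /* fast path ends with the parse too */
}

int main(void)
{
	relocate_parse(0); /* fast path */
	relocate_parse(1); /* forced fallback to the slow path */
	return 0;
}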
>
> static int eb_move_to_gpu(struct i915_execbuffer *eb)
> @@ -2866,7 +2893,7 @@ i915_gem_do_execbuffer(struct drm_device *dev,
> if (unlikely(err))
> goto err_context;
>
> - err = eb_relocate(&eb);
> + err = eb_relocate_parse(&eb);
> if (err) {
> /*
> * If the user expects the execobject.offset and
> @@ -2879,33 +2906,10 @@ i915_gem_do_execbuffer(struct drm_device *dev,
> goto err_vma;
> }
>
> - if (unlikely(eb.batch->flags & EXEC_OBJECT_WRITE)) {
> - drm_dbg(&i915->drm,
> - "Attempting to use self-modifying batch buffer\n");
> - err = -EINVAL;
> - goto err_vma;
> - }
> -
> - if (range_overflows_t(u64,
> - eb.batch_start_offset, eb.batch_len,
> - eb.batch->vma->size)) {
> - drm_dbg(&i915->drm, "Attempting to use out-of-bounds batch\n");
> - err = -EINVAL;
> - goto err_vma;
> - }
> -
> - if (eb.batch_len == 0)
> - eb.batch_len = eb.batch->vma->size - eb.batch_start_offset;
> -
> - err = eb_parse(&eb);
> - if (err)
> - goto err_vma;
> -
> /*
> * snb/ivb/vlv conflate the "batch in ppgtt" bit with the "non-secure
> * batch" bit. Hence we need to pin secure batches into the global gtt.
> * hsw should have this fixed, but bdw mucks it up again. */
> - batch = eb.batch->vma;
> if (eb.batch_flags & I915_DISPATCH_SECURE) {
> struct i915_vma *vma;
>
> @@ -2919,13 +2923,15 @@ i915_gem_do_execbuffer(struct drm_device *dev,
> * fitting due to fragmentation.
> * So this is actually safe.
> */
> - vma = i915_gem_object_ggtt_pin(batch->obj, NULL, 0, 0, 0);
> + vma = i915_gem_object_ggtt_pin(eb.batch->vma->obj, NULL, 0, 0, 0);
> if (IS_ERR(vma)) {
> err = PTR_ERR(vma);
> goto err_parse;
> }
>
> batch = vma;
> + } else {
> + batch = eb.batch->vma;
> }
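
Side note for readers following along: i915_gem_object_ggtt_pin() reports
failure through the kernel's ERR_PTR convention rather than a NULL return,
which is why the IS_ERR()/PTR_ERR() pair appears above. A simplified
userspace model of that idiom (not the actual kernel headers; pin_object()
is a made-up stand-in):

#include <stdio.h>
#include <stdbool.h>
#include <errno.h>

#define MAX_ERRNO 4095

/* Simplified model of the kernel's ERR_PTR convention: the top
 * MAX_ERRNO addresses never hold real objects, so a small negative
 * errno can travel through a pointer return value. */
static inline void *ERR_PTR(long error) { return (void *)error; }
static inline long PTR_ERR(const void *ptr) { return (long)ptr; }
static inline bool IS_ERR(const void *ptr)
{
	return (unsigned long)ptr >= (unsigned long)-MAX_ERRNO;
}

/* Stand-in for a pin helper that can fail; illustrative only. */
static void *pin_object(bool fail)
{
	static int object;

	return fail ? ERR_PTR(-ENOSPC) : (void *)&object;
}

int main(void)
{
	void *vma = pin_object(true);

	if (IS_ERR(vma))
		printf("pin failed: %ld\n", PTR_ERR(vma)); /* -28 */

	return 0;
}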
>
> /* All GPU relocation batches must be submitted prior to the user rq */
>