[Intel-gfx] [CI 2/2] drm/i915/selftets: Check random hang recovery
Mika Kuoppala
mika.kuoppala at linux.intel.com
Fri Apr 24 23:12:06 UTC 2020
Chris Wilson <chris at chris-wilson.co.uk> writes:
> Userspace is untrusted and allowed to submit anything to the GPU for
> execution, including random garbage. Our recovery should do the right
> thing.
>
Typo in the subject: s/selftets/selftests/
> Signed-off-by: Chris Wilson <chris at chris-wilson.co.uk>
> Cc: Mika Kuoppala <mika.kuoppala at linux.intel.com>
> ---
> .../drm/i915/gem/selftests/i915_gem_context.c | 157 ++++++++++++++++++
> 1 file changed, 157 insertions(+)
>
> diff --git a/drivers/gpu/drm/i915/gem/selftests/i915_gem_context.c b/drivers/gpu/drm/i915/gem/selftests/i915_gem_context.c
> index c5c3433174dc..4cda46cfbe2a 100644
> --- a/drivers/gpu/drm/i915/gem/selftests/i915_gem_context.c
> +++ b/drivers/gpu/drm/i915/gem/selftests/i915_gem_context.c
> @@ -2305,6 +2305,162 @@ static int igt_reg_isolation(void *arg)
> return err;
> }
>
> +static struct i915_request *
> +exec_obj(struct i915_gem_context *ctx,
> + struct intel_engine_cs *engine,
> + struct drm_i915_gem_object *obj)
> +{
> + struct intel_context *ce;
> + struct i915_request *rq;
> + struct i915_vma *vma;
> + int err;
> +
> + ce = i915_gem_context_get_engine(ctx, engine->legacy_idx);
> + if (IS_ERR(ce))
> + return ERR_CAST(ce);
> +
> + vma = i915_vma_instance(obj, ce->vm, NULL);
> + if (IS_ERR(vma)) {
> + err = PTR_ERR(vma);
> + goto err_ce;
> + }
> +
> + err = i915_vma_pin(vma, 0, 0, PIN_USER);
> + if (err)
> + goto err_ce;
> +
> + rq = intel_context_create_request(ce);
> + if (IS_ERR(rq))
> + goto err_unpin;
> +
> + if (engine->emit_init_breadcrumb) {
> + err = engine->emit_init_breadcrumb(rq);
> + if (err)
> + goto err_rq;
> + }
> +
> + i915_vma_lock(vma);
> + err = i915_request_await_object(rq, vma->obj, false);
> + if (err == 0)
> + err = i915_vma_move_to_active(vma, rq, 0);
> + i915_vma_unlock(vma);
> + if (err)
> + goto err_rq;
> +
> + err = engine->emit_bb_start(rq, vma->node.start, vma->node.size, 0);
> +
> +err_rq:
> + if (!err)
> + i915_request_get(rq);
> + else
> + i915_request_set_error_once(rq, err);
> + i915_request_add(rq);
> +
> +err_unpin:
> + i915_vma_unpin(vma);
> +err_ce:
> + intel_context_put(ce);
> + return err ? ERR_PTR(err) : rq;
> +}
> +
> +static int randomise_object(struct drm_i915_gem_object *obj,
> + struct rnd_state *prng)
> +{
> + unsigned long i;
> + u32 *cs;
> +
> + cs = i915_gem_object_pin_map(obj, I915_MAP_WC);
> + if (IS_ERR(cs))
> + return PTR_ERR(cs);
> +
> + for (i = 0; i < obj->base.size / sizeof(*cs); i++)
> + cs[i] = prandom_u32_state(prng);
> +
> + i915_gem_object_flush_map(obj);
> + i915_gem_object_unpin_map(obj);
> +
> + return 0;
> +}
> +
> +static bool skip_garbage(const struct intel_engine_cs *engine)
> +{
> + if (IS_GEN(engine->i915, 6))
> + return true;
> +
> + return false;
> +}
> +
> +static int igt_ctx_garbage(void *arg)
> +{
> + struct drm_i915_private *i915 = arg;
> + struct drm_i915_gem_object *obj;
> + struct intel_engine_cs *engine;
> + struct i915_gem_context *ctx;
> + I915_RND_STATE(prng);
> + struct file *file;
> + int err;
> +
> + /*
> + * Imagine if userspace went crazy and submitted a batch of nothing
> + * but random junk. The GPU may hang and we may be forced to kill
> + * the context; but the driver will go on!
> + */
> +
> + file = mock_file(i915);
> + if (IS_ERR(file))
> + return PTR_ERR(file);
> +
> + ctx = live_context(i915, file);
> + if (IS_ERR(ctx)) {
> + err = PTR_ERR(ctx);
> + goto out_file;
> + }
> +
> + obj = i915_gem_object_create_internal(i915, 4096);
> + if (IS_ERR(obj)) {
> + err = PTR_ERR(obj);
> + goto out_file;
> + }
> +
> + err = randomise_object(obj, &prng);
> + if (err)
> + goto out_obj;
> +
> + i915_gem_context_clear_bannable(ctx);
> + for_each_uabi_engine(engine, i915) {
> + struct i915_request *rq;
> +
> + if (!IS_ENABLED(CONFIG_DRM_I915_SELFTEST_BROKEN) &&
> + skip_garbage(engine))
> + continue;
> +
> + rq = exec_obj(ctx, engine, obj);
> + if (IS_ERR(rq)) {
> + err = PTR_ERR(rq);
> + break;
> + }
> +
> + if (i915_request_wait(rq,
> + I915_WAIT_INTERRUPTIBLE,
> + HZ / 2) < 0) {
> + intel_gt_handle_error(engine->gt,
> + engine->mask, 0,
> + NULL);
> + }
> +
> + i915_request_put(rq);
> + }
> +
> + if (igt_flush_test(i915))
> + err = -EIO;
> +
> +out_obj:
> + i915_gem_object_put(obj);
> +out_file:
> + fput(file);
> + return err;
> +}
> +
> static bool skip_unused_engines(struct intel_context *ce, void *data)
> {
> return !ce->state;
> @@ -2441,6 +2597,7 @@ int i915_gem_context_live_selftests(struct drm_i915_private *i915)
> SUBTEST(igt_shared_ctx_exec),
> SUBTEST(igt_vm_isolation),
> SUBTEST(igt_reg_isolation),
> + SUBTEST(igt_ctx_garbage),
Should this be named igt_exec_garbage?
Acked-by: Mika Kuoppala <mika.kuoppala at linux.intel.com>
> };
>
> if (intel_gt_is_wedged(&i915->gt))
> --
> 2.20.1
>
> _______________________________________________
> Intel-gfx mailing list
> Intel-gfx at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/intel-gfx
More information about the Intel-gfx mailing list