[Intel-gfx] [PATCH i-g-t 7/8] lib/igt_gt: Allow per engine reset testing
Matthew Brost
matthew.brost at intel.com
Wed Nov 3 00:47:40 UTC 2021
On Thu, Oct 21, 2021 at 04:40:43PM -0700, John.C.Harrison at Intel.com wrote:
> From: John Harrison <John.C.Harrison at Intel.com>
>
> With GuC submission, engine resets are handled entirely within GuC
> rather than within i915. Traditionally, IGT has disallowed engine
> based resets because they don't send the uevent which IGT uses to
> check for unexpected resets. However, it is important to be able to
> test all reset mechanisms that can be used, so allow engine based
> resets to be enabled.
>
> Signed-off-by: John Harrison <John.C.Harrison at Intel.com>
Reviewed-by: Matthew Brost <matthew.brost at intel.com>
> ---
> lib/igt_gt.c | 44 +++++++++++++++++++++++++++++---------------
> lib/igt_gt.h | 1 +
> 2 files changed, 30 insertions(+), 15 deletions(-)
>
> diff --git a/lib/igt_gt.c b/lib/igt_gt.c
> index a0ba04cc1..7c7df95ee 100644
> --- a/lib/igt_gt.c
> +++ b/lib/igt_gt.c
> @@ -56,23 +56,28 @@
> * engines.
> */
>
> +static int reset_query_once = -1;
> +
> static bool has_gpu_reset(int fd)
> {
> - static int once = -1;
> - if (once < 0) {
> - struct drm_i915_getparam gp;
> - int val = 0;
> -
> - memset(&gp, 0, sizeof(gp));
> - gp.param = 35; /* HAS_GPU_RESET */
> - gp.value = &val;
> -
> - if (ioctl(fd, DRM_IOCTL_I915_GETPARAM, &gp))
> - once = intel_gen(intel_get_drm_devid(fd)) >= 5;
> - else
> - once = val > 0;
> + if (reset_query_once < 0) {
> + reset_query_once = gem_gpu_reset_type(fd);
> +
> + /* Very old kernels did not support the query */
> + if (reset_query_once == -1)
> + reset_query_once =
> + (intel_gen(intel_get_drm_devid(fd)) >= 5) ? 1 : 0;
> }
> - return once;
> +
> + return reset_query_once > 0;
> +}
> +
> +static bool has_engine_reset(int fd)
> +{
> + if (reset_query_once < 0)
> + has_gpu_reset(fd);
> +
> + return reset_query_once > 1;
> }
>
> static void eat_error_state(int dev)
> @@ -176,7 +181,11 @@ igt_hang_t igt_allow_hang(int fd, unsigned ctx, unsigned flags)
> igt_skip("hang injection disabled by user [IGT_HANG=0]\n");
> gem_context_require_bannable(fd);
>
> - allow_reset = 1;
> + if (flags & HANG_WANT_ENGINE_RESET)
> + allow_reset = 2;
> + else
> + allow_reset = 1;
> +
> if ((flags & HANG_ALLOW_CAPTURE) == 0) {
> param.param = I915_CONTEXT_PARAM_NO_ERROR_CAPTURE;
> param.value = 1;
> @@ -187,11 +196,16 @@ igt_hang_t igt_allow_hang(int fd, unsigned ctx, unsigned flags)
> __gem_context_set_param(fd, &param);
> allow_reset = INT_MAX; /* any reset method */
> }
> +
> igt_require(igt_params_set(fd, "reset", "%d", allow_reset));
> + reset_query_once = -1; /* Re-query after changing param */
>
> if (!igt_check_boolean_env_var("IGT_HANG_WITHOUT_RESET", false))
> igt_require(has_gpu_reset(fd));
>
> + if (flags & HANG_WANT_ENGINE_RESET)
> + igt_require(has_engine_reset(fd));
> +
> ban = context_get_ban(fd, ctx);
> if ((flags & HANG_ALLOW_BAN) == 0)
> context_set_ban(fd, ctx, 0);
> diff --git a/lib/igt_gt.h b/lib/igt_gt.h
> index ceb044b86..c5059817b 100644
> --- a/lib/igt_gt.h
> +++ b/lib/igt_gt.h
> @@ -51,6 +51,7 @@ igt_hang_t igt_hang_ctx_with_ahnd(int fd, uint64_t ahnd, uint32_t ctx, int ring,
>
> #define HANG_ALLOW_BAN 1
> #define HANG_ALLOW_CAPTURE 2
> +#define HANG_WANT_ENGINE_RESET 4
>
> igt_hang_t igt_hang_ring(int fd, int ring);
> igt_hang_t igt_hang_ring_with_ahnd(int fd, int ring, uint64_t ahnd);
> --
> 2.25.1
>
More information about the Intel-gfx
mailing list