[igt-dev] [PATCH i-g-t] test/perf_pmu: Dump drpc on C6 failure
Riana Tauro
riana.tauro at intel.com
Wed Aug 2 09:36:03 UTC 2023
Hi Anshuman
On 8/1/2023 6:55 PM, Anshuman Gupta wrote:
> Dump the drpc debugfs file on RC6/MC6 failure; its contents will be
> useful for debugging any C6 failure.
>
> Co-developed-by: Badal Nilawar <badal.nilawar at intel.com>
> Signed-off-by: Anshuman Gupta <anshuman.gupta at intel.com>
> ---
> tests/i915/perf_pmu.c | 61 +++++++++++++++++++++++++++++--------------
> 1 file changed, 42 insertions(+), 19 deletions(-)
>
> diff --git a/tests/i915/perf_pmu.c b/tests/i915/perf_pmu.c
> index 58f4a82a2..bcd6db799 100644
> --- a/tests/i915/perf_pmu.c
> +++ b/tests/i915/perf_pmu.c
> @@ -256,6 +256,18 @@ IGT_TEST_DESCRIPTION("Test the i915 pmu perf interface");
> const double tolerance = 0.05f;
> const unsigned long batch_duration_ns = 500e6;
>
> +char *drpc;
> +const char *no_debug_data = "\0";
> +
> +static char *get_drpc(int i915, int gt_id)
> +{
> + int gt_dir;
> +
> + gt_dir = igt_debugfs_gt_dir(i915, gt_id);
> + igt_assert(gt_dir != -1);
> + return igt_sysfs_get(gt_dir, "drpc");
> +}
> +
> static int open_pmu(int i915, uint64_t config)
> {
> int fd;
> @@ -336,17 +348,19 @@ static uint64_t pmu_read_multi(int fd, unsigned int num, uint64_t *val)
> return buf[1];
> }
>
> -#define __assert_within_epsilon(x, ref, tol_up, tol_down) \
> +#define __assert_within_epsilon(x, ref, tol_up, tol_down, debug_data) \
> igt_assert_f((double)(x) <= (1.0 + (tol_up)) * (double)(ref) && \
> (double)(x) >= (1.0 - (tol_down)) * (double)(ref), \
> - "'%s' != '%s' (%f not within +%.1f%%/-%.1f%% tolerance of %f)\n",\
> + "'%s' != '%s' (%f not within +%.1f%%/-%.1f%% tolerance of %f)\n%s\n",\
> #x, #ref, (double)(x), \
> (tol_up) * 100.0, (tol_down) * 100.0, \
> - (double)(ref))
> + (double)(ref), debug_data)
>
> #define assert_within_epsilon(x, ref, tolerance) \
> - __assert_within_epsilon(x, ref, tolerance, tolerance)
> + __assert_within_epsilon(x, ref, tolerance, tolerance, "\0")
>
> +#define assert_within_epsilon_dump(x, ref, tolerance, debug_data) \
> + __assert_within_epsilon(x, ref, tolerance, tolerance, debug_data)
Could this be named assert_within_epsilon_debug instead of assert_within_epsilon_dump?
> /*
> * Helper for cases where we assert on time spent sleeping (directly or
> * indirectly), so make it more robust by ensuring the system sleep time
> @@ -1822,7 +1836,7 @@ test_frequency(int gem_fd, unsigned int gt)
> * On thermally throttled devices we cannot be sure maximum frequency
> * can be reached so use larger tolerance downards.
> */
> - __assert_within_epsilon(max[0], max_freq, tolerance, 0.15f);
> + __assert_within_epsilon(max[0], max_freq, tolerance, 0.15f, no_debug_data);
> }
>
> static void
> @@ -1967,7 +1981,8 @@ test_rc6(int gem_fd, unsigned int gt, unsigned int num_gt, unsigned int flags)
> }
> }
>
> - igt_require(wait_for_rc6(fd[0], 1, pmus, test_idx));
> + igt_require_f(wait_for_rc6(fd[0], 1, pmus, test_idx),
> + "failed to enter rc6/mc6 \n%s\n", drpc = get_drpc(gem_fd, test_idx));
test_idx is assigned from pmus in this function, so it is safer to pass gt to get_drpc() here.
Thanks
Riana
>
> /* While idle check full RC6. */
> ts[0] = pmu_read_multi(fd[0], pmus, prev);
> @@ -1977,9 +1992,11 @@ test_rc6(int gem_fd, unsigned int gt, unsigned int num_gt, unsigned int flags)
> for (gt_ = 0; gt_ < pmus; gt_++) {
> igt_debug("gt%u: idle rc6=%"PRIu64", slept=%lu, perf=%"PRIu64"\n",
> gt_, idle[gt_] - prev[gt_], slept, ts[1] - ts[0]);
> - assert_within_epsilon(idle[gt_] - prev[gt_],
> - ts[1] - ts[0],
> - tolerance);
> + drpc = get_drpc(gem_fd, gt_);
> + assert_within_epsilon_dump(idle[gt_] - prev[gt_],
> + ts[1] - ts[0],
> + tolerance, drpc);
> + free(drpc);
> }
>
> if (flags & TEST_S3) {
> @@ -2005,7 +2022,8 @@ test_rc6(int gem_fd, unsigned int gt, unsigned int num_gt, unsigned int flags)
> }
> }
>
> - igt_assert(wait_for_rc6(fd[0], 5, pmus, test_idx));
> + igt_require_f(wait_for_rc6(fd[0], 5, pmus, test_idx),
> + "failed to enter rc6/mc6 \n%s\n", drpc = get_drpc(gem_fd, test_idx));
>
> ts[0] = pmu_read_multi(fd[0], pmus, prev);
> slept = measured_usleep(duration_ns / 1000);
> @@ -2014,9 +2032,11 @@ test_rc6(int gem_fd, unsigned int gt, unsigned int num_gt, unsigned int flags)
> for (gt_ = 0; gt_ < pmus; gt_++) {
> igt_debug("gt%u: idle rc6=%"PRIu64", slept=%lu, perf=%"PRIu64"\n",
> gt_, idle[gt_] - prev[gt_], slept, ts[1] - ts[0]);
> - assert_within_epsilon(idle[gt_] - prev[gt_],
> - ts[1] - ts[0],
> - tolerance);
> + drpc = get_drpc(gem_fd, gt_);
> + assert_within_epsilon_dump(idle[gt_] - prev[gt_],
> + ts[1] - ts[0],
> + tolerance, drpc);
> + free(drpc);
> }
>
> /* Wake up device and check no RC6. */
> @@ -2048,14 +2068,16 @@ test_rc6(int gem_fd, unsigned int gt, unsigned int num_gt, unsigned int flags)
> for (gt_ = 0; gt_ < pmus; gt_++) {
> igt_debug("gt%u: busy rc6=%"PRIu64", slept=%lu, perf=%"PRIu64"\n",
> gt_, busy[gt_] - prev[gt_], slept, ts[1] - ts[0]);
> + drpc = get_drpc(gem_fd, gt_);
> if (gt_ == test_idx || (flags & TEST_ALL))
> - assert_within_epsilon(busy[gt_] - prev[gt_],
> - 0.0,
> - tolerance);
> + assert_within_epsilon_dump(busy[gt_] - prev[gt_],
> + 0.0,
> + tolerance, drpc);
> else
> - assert_within_epsilon(busy[gt_] - prev[gt_],
> - ts[1] - ts[0],
> - tolerance);
> + assert_within_epsilon_dump(busy[gt_] - prev[gt_],
> + ts[1] - ts[0],
> + tolerance, drpc);
> + free(drpc);
> }
> }
>
> @@ -2720,6 +2742,7 @@ igt_main
> igt_fixture {
> intel_ctx_destroy(fd, ctx);
> drm_close_driver(fd);
> + free(drpc);
> }
>
> igt_subtest("module-unload") {
More information about the igt-dev
mailing list