[igt-dev] [PATCH i-g-t 1/2] i915/gem_exec_latency: Normalize results into ns
Antonio Argenziano
antonio.argenziano at intel.com
Tue Jan 29 17:55:45 UTC 2019
On 29/01/19 01:55, Chris Wilson wrote:
> Present the latency results in nanoseconds not RCS cycles.
>
> Signed-off-by: Chris Wilson <chris at chris-wilson.co.uk>
> ---
> tests/i915/gem_exec_latency.c | 38 +++++++++++++++++++++++++++++++----
> 1 file changed, 34 insertions(+), 4 deletions(-)
>
> diff --git a/tests/i915/gem_exec_latency.c b/tests/i915/gem_exec_latency.c
> index de16322a6..ea44adc14 100644
> --- a/tests/i915/gem_exec_latency.c
> +++ b/tests/i915/gem_exec_latency.c
> @@ -59,6 +59,7 @@
> #define PREEMPT 0x2
>
> static unsigned int ring_size;
> +static double rcs_clock;
>
> static void
> poll_ring(int fd, unsigned ring, const char *name)
> @@ -207,7 +208,7 @@ static void latency_on_ring(int fd,
> igt_cork_unplug(&c);
>
> gem_set_domain(fd, obj[1].handle, I915_GEM_DOMAIN_GTT, 0);
> - gpu_latency = (results[repeats-1] - results[0]) / (double)(repeats-1);
> + gpu_latency = (results[repeats-1] - results[1]) / (double)(repeats-2);
How come you don't like the value at 0? Maybe adding a comment would
make it clearer.
>
> gem_set_domain(fd, obj[2].handle,
> I915_GEM_DOMAIN_GTT, I915_GEM_DOMAIN_GTT);
> @@ -238,10 +239,11 @@ static void latency_on_ring(int fd,
> igt_assert(offset == obj[2].offset);
>
> gem_set_domain(fd, obj[1].handle, I915_GEM_DOMAIN_GTT, 0);
> - igt_info("%s: dispatch latency: %.2f, execution latency: %.2f (target %.2f)\n",
> + igt_info("%s: dispatch latency: %.1fns, execution latency: %.1fns (target %.1fns)\n",
> name,
> - (end - start) / (double)repeats,
> - gpu_latency, (results[repeats - 1] - results[0]) / (double)(repeats - 1));
> + (end - start) / (double)repeats * rcs_clock,
> + gpu_latency * rcs_clock,
> + (results[repeats - 1] - results[0]) / (double)(repeats - 1) * rcs_clock);
>
> munmap(map, 64*1024);
> munmap(results, 4096);
> @@ -620,6 +622,30 @@ rthog_latency_on_ring(int fd, unsigned int engine, const char *name, unsigned in
> munmap(results, MMAP_SZ);
> }
>
> +static double clockrate(void)
> +{
> + volatile uint32_t *reg;
> + uint32_t r_start, r_end;
> + struct timespec tv;
> + uint64_t t_start, t_end;
> + uint64_t elapsed;
> +
> + reg = (volatile uint32_t *)((volatile char *)igt_global_mmio + RCS_TIMESTAMP);
> +
> + t_start = igt_nsec_elapsed(&tv);
> + r_start = *reg;
> + elapsed = igt_nsec_elapsed(&tv) - t_start;
> +
> + usleep(1000);
> +
> + t_end = igt_nsec_elapsed(&tv);
> + r_end = *reg;
> + elapsed += igt_nsec_elapsed(&tv) - t_end;
> +
> + elapsed = (t_end - t_start) + elapsed / 2;
> + return (r_end - r_start) * 1e9 / elapsed;
> +}
> +
> igt_main
> {
> const struct intel_execution_engine *e;
> @@ -640,6 +666,10 @@ igt_main
> ring_size = 1024;
>
> intel_register_access_init(intel_get_pci_device(), false, device);
> + rcs_clock = clockrate();
> + igt_info("RCS timestamp clock: %.3fKHz, %.1fns\n",
> + rcs_clock / 1e3, 1e9 / rcs_clock);
> + rcs_clock = 1e9 / rcs_clock;
> }
>
> igt_subtest("all-rtidle-submit")
>
More information about the igt-dev
mailing list