[PATCH i-g-t 2/3] tests/intel/xe_pmu: Add PMU test to validate engine activity stats

Umesh Nerlige Ramappa umesh.nerlige.ramappa at intel.com
Fri Feb 14 19:01:18 UTC 2025


On Fri, Feb 14, 2025 at 10:55:38AM -0800, Umesh Nerlige Ramappa wrote:
>On Wed, Feb 12, 2025 at 03:28:28PM +0530, Riana Tauro wrote:
>>Add a test to validate engine activity by reading PMU counters
>>(engine-active-ticks, engine-total-ticks) when running
>>workload on every engine
>>
>>Signed-off-by: Riana Tauro <riana.tauro at intel.com>
>>---
>>tests/intel/xe_pmu.c | 147 +++++++++++++++++++++++++++++++++++++++++++
>>tests/meson.build    |   1 +
>>2 files changed, 148 insertions(+)
>>create mode 100644 tests/intel/xe_pmu.c
>>
>>diff --git a/tests/intel/xe_pmu.c b/tests/intel/xe_pmu.c
>>new file mode 100644
>>index 000000000..cbb825755
>>--- /dev/null
>>+++ b/tests/intel/xe_pmu.c
>>@@ -0,0 +1,147 @@
>>+// SPDX-License-Identifier: MIT
>>+/*
>>+ * Copyright © 2025 Intel Corporation
>>+ */
>>+
>>+/**
>>+ * TEST: Test Xe PMU(Performance Monitoring Unit) functionality
>>+ * Category: Metrics
>>+ * Functionality: Power/Perf
>>+ * Mega feature: Performance Monitoring Unit
>>+ * Sub-category: Telemetry
>>+ * Test category: Functional tests
>>+ */
>>+
>>+#include "igt.h"
>>+#include "igt_perf.h"
>>+
>>+#include "xe/xe_ioctl.h"
>>+#include "xe/xe_spin.h"
>>+
>>+#define SLEEP_DURATION 2 /* in seconds */
>>+const double tolerance = 0.1;
>>+
>>+#define assert_within_epsilon(x, ref, tolerance) \
>>+	igt_assert_f((double)(x) <= (1.0 + (tolerance)) * (double)(ref) && \
>>+		     (double)(x) >= (1.0 - (tolerance)) * (double)(ref), \
>>+		     "'%s' != '%s' (%f not within +%.1f%%/-%.1f%% tolerance of %f)\n",\
>>+		     #x, #ref, (double)(x), \
>>+		     (tolerance) * 100.0, (tolerance) * 100.0, \
>>+		     (double)(ref))
>>+
>>+static int open_group(int xe, uint64_t config, int group)
>>+{
>>+	int fd;
>>+
>>+	fd = igt_perf_open_group(xe_perf_type_id(xe), config, group);
>>+	igt_skip_on(fd < 0 && errno == ENODEV);
>>+	igt_assert(fd >= 0);
>>+
>>+	return fd;
>>+}
>>+
>>+static uint64_t pmu_read_multi(int fd, unsigned int num, uint64_t *val)
>>+{
>>+	uint64_t buf[2 + num];
>>+	unsigned int i;
>>+
>>+	igt_assert_eq(read(fd, buf, sizeof(buf)), sizeof(buf));
>>+
>>+	for (i = 0; i < num; i++)
>>+		val[i] = buf[2 + i];
>>+
>>+	return buf[1];
>>+}
>>+
>>+static uint64_t get_event_config(int xe, unsigned int gt, struct drm_xe_engine_class_instance *eci,
>>+				 const char *event)
>>+{
>>+	int ret;
>>+	char xe_device[100];
>>+	uint64_t pmu_config;
>>+	u32 start, end;
>
>end is unused; I'm not sure whether the c6 patches use it. If it is unused,
>then I recommend just dropping it from the helper as well and s/start/shift/.
>
>>+
>>+	xe_perf_device(xe, xe_device, sizeof(xe_device));
>>+	ret = perf_event_config(xe_device, event, &pmu_config);
>>+	igt_assert(ret >= 0);
>
>Well, I commented on Vinay's patch asking to assert within the helper, so
>that these checks can be removed here. If that happens, then please drop
>the return value checks here. If not, then checks are needed below as well,
>at (1) and (2).
>
>>+	ret = perf_event_format(xe_device, "gt", &start, &end);
>>+	igt_assert(ret >= 0);
>>+	pmu_config |= (uint64_t)gt << start;
>>+
>>+	if (eci) {
>>+		ret = perf_event_format(xe_device, "engine_class", &start, &end);
>(1)
>>+		pmu_config |= (uint64_t)eci->engine_class << start;
>>+		ret = perf_event_format(xe_device, "engine_instance", &start, &end);
>(2)
>>+		pmu_config |= (uint64_t)eci->engine_instance << start;
>>+	}
>>+
>>+	return pmu_config;
>>+}

Also, s/busy/active/ in the variable names below (e.g. busy_ticks).

>
>Thanks,
>Umesh
>>+
>>+/**
>>+ * SUBTEST: engine-activity
>>+ * Description: Test to validate engine activity stats by running a workload and
>>+ *              reading the active ticks and total ticks PMU counters
>>+ */
>>+static void engine_activity(int fd, struct drm_xe_engine_class_instance *eci)
>>+{
>>+	uint64_t config, busy_ticks, total_ticks, before[2], after[2];
>>+	struct xe_cork *cork = NULL;
>>+	uint32_t vm;
>>+	int pmu_fd[2];
>>+
>>+	config = get_event_config(fd, eci->gt_id, eci, "engine-active-ticks");
>>+	pmu_fd[0] = open_group(fd, config, -1);
>>+
>>+	config = get_event_config(fd, eci->gt_id, eci, "engine-total-ticks");
>>+	pmu_fd[1] = open_group(fd, config, pmu_fd[0]);
>>+
>>+	vm = xe_vm_create(fd, 0, 0);
>>+	cork = xe_cork_create_opts(fd, eci, vm, 1, 1);
>>+	xe_cork_sync_start(fd, cork);
>>+
>>+	pmu_read_multi(pmu_fd[0], 2, before);
>>+	usleep(SLEEP_DURATION * USEC_PER_SEC);
>>+	pmu_read_multi(pmu_fd[0], 2, after);
>>+
>>+	xe_cork_sync_end(fd, cork);
>>+
>>+	busy_ticks = after[0] - before[0];
>>+	total_ticks = after[1] - before[1];
>>+
>>+	igt_debug("Engine active ticks:  after %ld, before %ld delta %ld\n", after[0], before[0],
>>+		  busy_ticks);
>>+	igt_debug("Total ticks: after %ld, before %ld delta %ld\n", after[1], before[1],
>>+		  total_ticks);
>>+
>>+	if (cork)
>>+		xe_cork_destroy(fd, cork);
>>+
>>+	xe_vm_destroy(fd, vm);
>>+
>>+	close(pmu_fd[0]);
>>+	close(pmu_fd[1]);
>>+
>>+	assert_within_epsilon(busy_ticks, total_ticks, tolerance);
>>+}
>>+
>>+igt_main
>>+{
>>+	int fd;
>>+	struct drm_xe_engine_class_instance *hwe;
>>+
>>+	igt_fixture {
>>+		fd = drm_open_driver(DRIVER_XE);
>>+	}
>>+
>>+	igt_describe("Validate engine activity with workload running by reading pmu counters");
>>+	igt_subtest_with_dynamic("engine-activity")
>>+		xe_for_each_engine(fd, hwe)
>>+			igt_dynamic_f("engine-%s%d", xe_engine_class_string(hwe->engine_class),
>>+				      hwe->engine_instance)
>>+				engine_activity(fd, hwe);
>>+
>>+	igt_fixture {
>>+		close(fd);
>>+	}
>>+}
>>diff --git a/tests/meson.build b/tests/meson.build
>>index 33dffad31..d20f50766 100644
>>--- a/tests/meson.build
>>+++ b/tests/meson.build
>>@@ -309,6 +309,7 @@ intel_xe_progs = [
>>	'xe_pat',
>>	'xe_peer2peer',
>>	'xe_pm',
>>+	'xe_pmu',
>>	'xe_pm_residency',
>>	'xe_prime_self_import',
>>	'xe_query',
>>-- 
>>2.47.1
>>


More information about the igt-dev mailing list