[PATCH i-g-t 5/5] tools/intel_display_bandwidth: Tool for measuring display memory bandwidth utilization

Ville Syrjala ville.syrjala at linux.intel.com
Mon Sep 16 20:18:41 UTC 2024


From: Ville Syrjälä <ville.syrjala at linux.intel.com>

Introduce a small tool for measing the display enging
memory bandwidth utilization. Generally this is available
on SNB+, except on TGL/derivatives where the relevant
registers weren't updated to cope with the new ABOX layout
in the hardware.

Quite handy for confirming that FBC/CCS/etc. are doing their
job.

Not 100% sure about the required scaling factor because
bspec claims it's only needed for MTL, but my ADL definitely
needs it already.

Signed-off-by: Ville Syrjälä <ville.syrjala at linux.intel.com>
---
 lib/intel_reg.h                 |   5 +
 tools/intel_display_bandwidth.c | 171 ++++++++++++++++++++++++++++++++
 tools/meson.build               |   1 +
 3 files changed, 177 insertions(+)
 create mode 100644 tools/intel_display_bandwidth.c

diff --git a/lib/intel_reg.h b/lib/intel_reg.h
index 26833c66f8e7..5e049d8b14d6 100644
--- a/lib/intel_reg.h
+++ b/lib/intel_reg.h
@@ -1413,6 +1413,11 @@ SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 #define PCH_3DRAMCGDIS0		0x46028
 #define SOUTH_DSPCLK_GATE_D	0xc2020
 
+#define DE_POWER1	0x42400
+#define DE_POWER2	0x42404
+#define DE_POWER2_ABOX0	0x42404
+#define DE_POWER2_ABOX1	0x42408
+
 #define CPU_eDP_A		0x64000
 #define PCH_DP_B		0xe4100
 #define PCH_DP_C		0xe4200
diff --git a/tools/intel_display_bandwidth.c b/tools/intel_display_bandwidth.c
new file mode 100644
index 000000000000..c7be3c390d08
--- /dev/null
+++ b/tools/intel_display_bandwidth.c
@@ -0,0 +1,171 @@
+// SPDX-License-Identifier: MIT
+/*
+ * Copyright © 2024 Intel Corporation
+ */
+
+#include <getopt.h>
+#include <inttypes.h>
+#include <stdbool.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <unistd.h>
+
+#include "intel_io.h"
+#include "intel_chipset.h"
+#include "intel_reg.h"
+
+static bool has_de_power2(uint32_t devid)
+{
+	/*
+	 * TGL has DE_POWER2 but it measures the low priority traffic
+	 * on ABOX, not not actual display traffic on ABOX0/ABOX1.
+	 */
+	if (intel_display_ver(devid) == 12)
+		return false;
+
+	return intel_display_ver(devid) >= 6 &&
+		!IS_VALLEYVIEW(devid) && !IS_CHERRYVIEW(devid);
+}
+
+static bool has_de_power2_abox0_abox1(uint32_t devid)
+{
+	/*
+	 * Despite having ABOX0/ABOX1 TGL lacks the
+	 * accompanying DE_POWER2_ABOX* registers.
+	 */
+	return intel_display_ver(devid) >= 13;
+}
+
+static int de_power2_scale(uint32_t devid)
+{
+	/*
+	 * FIXME should perhaps use something like
+	 * is_intel_dgfx() but that one wants to open the device :(
+	 */
+	switch (intel_display_ver(devid)) {
+	case 13:
+		return IS_DG2(devid) ? 1 : 2;
+	case 14:
+		return IS_BATTLEMAGE(devid) ? 1 : 2;
+	default:
+		return 1;
+	}
+}
+
+static int de_power2_unit(uint32_t devid)
+{
+	return 64 * de_power2_scale(devid);
+}
+
+static float bandwidth(uint32_t devid, int duration,
+		       uint32_t pre, uint32_t post)
+{
+	return (float)(post - pre) * de_power2_unit(devid) / (duration << 20);
+}
+
+static void measure_de_power2_abox0_abox1(uint32_t devid, unsigned int sleep_duration)
+{
+	uint32_t pre_abox0, post_abox0;
+	uint32_t pre_abox1, post_abox1;
+
+	pre_abox0 = INREG(DE_POWER2_ABOX0);
+	pre_abox1 = INREG(DE_POWER2_ABOX1);
+
+	if (sleep_duration) {
+		sleep(sleep_duration);
+
+		post_abox0 = INREG(DE_POWER2_ABOX0);
+		post_abox1 = INREG(DE_POWER2_ABOX1);
+
+		printf("DE_POWER2_ABOX0: 0x%08x->0x%08x\n",
+		       pre_abox0, post_abox0);
+		printf("DE_POWER2_ABOX1: 0x%08x->0x%08x\n",
+		       pre_abox1, post_abox1);
+
+		printf("ABOX0 bandwidth: %.2f MiB/s\n",
+		       bandwidth(devid, sleep_duration,
+				 pre_abox0, post_abox0));
+		printf("ABOX1 bandwidth: %.2f MiB/s\n",
+		       bandwidth(devid, sleep_duration,
+				 pre_abox1, post_abox1));
+		printf("Total bandwidth: %.2f MiB/s\n",
+		       bandwidth(devid, sleep_duration,
+				 pre_abox0 + pre_abox1, post_abox0 + post_abox1));
+	} else {
+		printf("DE_POWER2_ABOX0: 0x%08x\n", pre_abox0);
+		printf("DE_POWER2_ABOX1: 0x%08x\n", pre_abox1);
+	}
+}
+
+static void measure_de_power2(uint32_t devid, unsigned int sleep_duration)
+{
+	uint32_t pre, post;
+
+	pre = INREG(DE_POWER2);
+
+	if (sleep_duration) {
+		sleep(sleep_duration);
+
+		post = INREG(DE_POWER2);
+
+		printf("DE_POWER2: 0x%08x->0x%08x\n", pre, post);
+
+		printf("Total bandwidth: %.2f MiB/s\n",
+		       bandwidth(devid, sleep_duration, pre, post));
+	} else {
+		printf("DE_POWER2: 0x%08x\n", pre);
+	}
+}
+
+static void __attribute__((noreturn)) usage(const char *name)
+{
+	fprintf(stderr, "Usage: %s [options]\n"
+		" -s,--sleep <seconds>\n",
+		name);
+	exit(1);
+}
+
+int main(int argc, char *argv[])
+{
+	struct intel_mmio_data mmio_data;
+	unsigned int sleep_duration = 0;
+	uint32_t devid;
+
+	for (;;) {
+		static const struct option long_options[] = {
+			{ .name = "sleep", .has_arg = required_argument, },
+			{}
+		};
+
+		int opt = getopt_long(argc, argv, "s:", long_options, NULL);
+		if (opt == -1)
+			break;
+
+		switch (opt) {
+		case 's':
+			sleep_duration = atoi(optarg);
+			break;
+		default:
+			usage(argv[0]);
+			break;
+		}
+	}
+
+	devid = intel_get_pci_device()->device_id;
+
+	if (!has_de_power2(devid)) {
+		fprintf(stderr, "Display bandwidth counter not available\n");
+		return 2;
+	}
+
+	intel_register_access_init(&mmio_data, intel_get_pci_device(), 0, -1);
+
+	if (has_de_power2_abox0_abox1(devid))
+		measure_de_power2_abox0_abox1(devid, sleep_duration);
+	else
+		measure_de_power2(devid, sleep_duration);
+
+	intel_register_access_fini(&mmio_data);
+
+	return 0;
+}
diff --git a/tools/meson.build b/tools/meson.build
index 48c9a4b5089e..4e9100ddb2b7 100644
--- a/tools/meson.build
+++ b/tools/meson.build
@@ -16,6 +16,7 @@ tools_progs = [
 	'intel_audio_dump',
 	'intel_backlight',
 	'intel_bios_dumper',
+	'intel_display_bandwidth',
 	'intel_display_crc',
 	'intel_display_poller',
 	'intel_dump_decode',
-- 
2.44.2



More information about the igt-dev mailing list