[Intel-gfx] [igt-dev] [PATCH i-g-t 9/9] tools/intel_gpu_top: Add ability to show memory region breakdown
Kamil Konieczny
kamil.konieczny at linux.intel.com
Fri Nov 3 19:04:12 UTC 2023
Hi Tvrtko,
On 2023-10-12 at 09:15:47 +0100, Tvrtko Ursulin wrote:
> From: Tvrtko Ursulin <tvrtko.ursulin at intel.com>
>
> Similar as we can toggle between aggregated engines and clients, add the
> capability to toggle between aggregated and per memory region stats.
>
> It starts in aggregated mode by default and interactive command 'm' and
> command line switch '-m' can be used to toggle that.
>
> Both only affect the interactive view, while JSON output always contains
> separate memory regions.
>
> Signed-off-by: Tvrtko Ursulin <tvrtko.ursulin at intel.com>
Reviewed-by: Kamil Konieczny <kamil.konieczny at linux.intel.com>
> ---
> man/intel_gpu_top.rst | 4 ++++
> tools/intel_gpu_top.c | 55 ++++++++++++++++++++++++++++++++++---------
> 2 files changed, 48 insertions(+), 11 deletions(-)
>
> diff --git a/man/intel_gpu_top.rst b/man/intel_gpu_top.rst
> index 9499f87f1b4d..44a54a5f219d 100644
> --- a/man/intel_gpu_top.rst
> +++ b/man/intel_gpu_top.rst
> @@ -55,6 +55,9 @@ OPTIONS
> -p
> Default to showing physical engines instead of aggregated classes.
>
> +-m
> + Default to showing all memory regions separately.
> +
> RUNTIME CONTROL
> ===============
>
> @@ -68,6 +71,7 @@ Supported keys:
> | 's' Toggle between sort modes (runtime, total runtime, pid, client id).
> | 'i' Toggle display of clients which used no GPU time.
> | 'H' Toggle between per PID aggregation and individual clients.
> +| 'm' Toggle between aggregated memory regions and full breakdown.
>
> DEVICE SELECTION
> ================
> diff --git a/tools/intel_gpu_top.c b/tools/intel_gpu_top.c
> index 2c09895c79dd..046ead15a122 100644
> --- a/tools/intel_gpu_top.c
> +++ b/tools/intel_gpu_top.c
> @@ -138,6 +138,7 @@ struct intel_clients {
>
> static struct termios termios_orig;
> static bool class_view;
> +static bool aggregate_regions;
>
> /* Maps i915 fdinfo names to indices */
> static const char *memory_region_map[] = {
> @@ -1050,6 +1051,7 @@ usage(const char *appname)
> "\t[-L] List all cards.\n"
> "\t[-d <device>] Device filter, please check manual page for more details.\n"
> "\t[-p] Default to showing physical engines instead of classes.\n"
> + "\t[-m] Default to showing all memory regions.\n"
> "\n",
> appname, DEFAULT_PERIOD_MS);
> igt_device_print_filter_types();
> @@ -2032,6 +2034,7 @@ print_clients_header(struct igt_drm_clients *clients, int lines,
>
> if (output_mode == INTERACTIVE) {
> int len, num_active = 0;
> + unsigned int i;
>
> if (lines++ >= con_h)
> return lines;
> @@ -2042,11 +2045,17 @@ print_clients_header(struct igt_drm_clients *clients, int lines,
> if (lines++ >= con_h || len >= con_w)
> return lines;
>
> - if (iclients->regions)
> - len += printf(" MEM RSS ");
> + if (iclients->regions) {
> + if (aggregate_regions) {
> + len += printf(" MEM RSS ");
> + } else {
> + len += printf(" RAM RSS ");
> + if (iclients->regions->num_regions > 1)
> + len += printf(" VRAM VRSS ");
> + }
> + }
>
> if (iclients->classes.num_engines) {
> - unsigned int i;
> int width;
>
> for (i = 0; i <= iclients->classes.max_engine_id; i++) {
> @@ -2120,15 +2129,26 @@ print_client(struct igt_drm_client *c, struct engines *engines, double t, int li
> len = printf("%*s ", clients->max_pid_len, c->pid_str);
>
> if (iclients->regions) {
> - uint64_t sz;
> + if (aggregate_regions) {
> + uint64_t sz;
>
> - for (sz = 0, i = 0; i <= c->regions->max_region_id; i++)
> - sz += c->memory[i].total;
> - len += print_size(sz);
> + for (sz = 0, i = 0;
> + i <= c->regions->max_region_id; i++)
> + sz += c->memory[i].total;
> + len += print_size(sz);
>
> - for (sz = 0, i = 0; i <= c->regions->max_region_id; i++)
> - sz += c->memory[i].resident;
> - len += print_size(sz);
> + for (sz = 0, i = 0;
> + i <= c->regions->max_region_id; i++)
> + sz += c->memory[i].resident;
> + len += print_size(sz);
> + } else {
> + len += print_size(c->memory[0].total);
> + len += print_size(c->memory[0].resident);
> + if (c->regions->num_regions > 1) {
> + len += print_size(c->memory[1].total);
> + len += print_size(c->memory[1].resident);
> + }
> + }
> }
>
> for (i = 0; i <= iclients->classes.max_engine_id; i++) {
> @@ -2405,6 +2425,13 @@ static void process_normal_stdin(void)
> else
> header_msg = "Showing individual clients.";
> break;
> + case 'm':
> + aggregate_regions ^= true;
> + if (aggregate_regions)
> + header_msg = "Aggregating memory regions.";
> + else
> + header_msg = "Showing memory regions.";
> + break;
> };
> }
> }
> @@ -2453,6 +2480,7 @@ static void show_help_screen(void)
> " 's' Toggle between sort modes (runtime, total runtime, pid, client id).\n"
> " 'i' Toggle display of clients which used no GPU time.\n"
> " 'H' Toggle between per PID aggregation and individual clients.\n"
> +" 'm' Toggle between aggregated memory regions and full breakdown.\n"
> "\n"
> " 'h' or 'q' Exit interactive help.\n"
> "\n");
> @@ -2580,6 +2608,7 @@ int main(int argc, char **argv)
> {
> unsigned int period_us = DEFAULT_PERIOD_MS * 1000;
> bool physical_engines = false;
> + bool separate_regions = false;
> struct intel_clients iclients;
> int con_w = -1, con_h = -1;
> char *output_path = NULL;
> @@ -2592,7 +2621,7 @@ int main(int argc, char **argv)
> struct timespec ts;
>
> /* Parse options */
> - while ((ch = getopt(argc, argv, "o:s:d:pcJLlh")) != -1) {
> + while ((ch = getopt(argc, argv, "o:s:d:mpcJLlh")) != -1) {
> switch (ch) {
> case 'o':
> output_path = optarg;
> @@ -2606,6 +2635,9 @@ int main(int argc, char **argv)
> case 'p':
> physical_engines = true;
> break;
> + case 'm':
> + separate_regions = true;
> + break;
> case 'c':
> output_mode = CSV;
> break;
> @@ -2649,6 +2681,7 @@ int main(int argc, char **argv)
> fprintf(stderr, "Failed to install signal handler!\n");
>
> class_view = !physical_engines;
> + aggregate_regions = !separate_regions;
>
> switch (output_mode) {
> case INTERACTIVE:
> --
> 2.39.2
>
More information about the Intel-gfx
mailing list