[PATCH umr] Add initial SDMA ring decoding support

Tom St Denis tom.stdenis at amd.com
Tue Dec 5 17:03:53 UTC 2017


Tested on a Polaris10 running testdma with mesa.   Based on packet
descriptions found in tonga_sdma_pkt_open.h found in the kernel tree.

Like the other ring decoder also supports: follow_ib, bits, and use_colour.

Signed-off-by: Tom St Denis <tom.stdenis at amd.com>
---
 src/app/ring_read.c   |   5 +
 src/lib/dump_ib.c     |   1 +
 src/lib/ring_decode.c | 543 +++++++++++++++++++++++++++++++++++++++++++++++++-
 src/umr.h             |  20 ++
 4 files changed, 566 insertions(+), 3 deletions(-)

diff --git a/src/app/ring_read.c b/src/app/ring_read.c
index 424e44288f8c..f7fd3e58cae8 100644
--- a/src/app/ring_read.c
+++ b/src/app/ring_read.c
@@ -57,6 +57,9 @@ void umr_read_ring(struct umr_asic *asic, char *ringpath)
 	    !memcmp(ringname, "comp", 4)) {
 		enable_decoder = 1;
 		decoder.pm = 4;
+	} else if (!memcmp(ringname, "sdma", 4)) {
+		enable_decoder = 1;
+		decoder.pm = 3;
 	} else {
 		enable_decoder = 0;
 	}
@@ -105,6 +108,7 @@ void umr_read_ring(struct umr_asic *asic, char *ringpath)
 			end *= 4;
 			use_decoder = 1;
 			decoder.pm4.cur_opcode = 0xFFFFFFFF;
+			decoder.sdma.cur_opcode = 0xFFFFFFFF;
 		}
 	}
 	end %= ringsize;
@@ -125,6 +129,7 @@ void umr_read_ring(struct umr_asic *asic, char *ringpath)
 		if (enable_decoder && start == rptr && start != wptr) {
 			use_decoder = 1;
 			decoder.pm4.cur_opcode = 0xFFFFFFFF;
+			decoder.sdma.cur_opcode = 0xFFFFFFFF;
 		}
 		printf(" %c%c%c ",
 			(start == rptr) ? 'r' : '.',
diff --git a/src/lib/dump_ib.c b/src/lib/dump_ib.c
index 859da4f5203a..c313b87572d6 100644
--- a/src/lib/dump_ib.c
+++ b/src/lib/dump_ib.c
@@ -51,6 +51,7 @@ void umr_dump_ib(struct umr_asic *asic, struct umr_ring_decoder *decoder)
 	if (data && !umr_read_vram(asic, decoder->next_ib_info.vmid, decoder->next_ib_info.ib_addr, decoder->next_ib_info.size, data)) {
 	// dump IB
 		decoder->pm4.cur_opcode = 0xFFFFFFFF;
+		decoder->sdma.cur_opcode = 0xFFFFFFFF;
 		for (x = 0; x < decoder->next_ib_info.size/4; x++) {
 			decoder->next_ib_info.addr = x;
 			printf("IB[%s%5u%s] = %s0x%08lx%s ... ",
diff --git a/src/lib/ring_decode.c b/src/lib/ring_decode.c
index c904df0e281c..3fb6367ad142 100644
--- a/src/lib/ring_decode.c
+++ b/src/lib/ring_decode.c
@@ -340,7 +340,7 @@ static char *vgt_event_decode(unsigned tag)
 
 #define BITS(x, a, b) (unsigned long)((x >> (a)) & ((1ULL << ((b)-(a)))-1))
 
-static void add_ib(struct umr_ring_decoder *decoder)
+static void add_ib_pm4(struct umr_ring_decoder *decoder)
 {
 	struct umr_ring_decoder *pdecoder;
 
@@ -365,6 +365,31 @@ static void add_ib(struct umr_ring_decoder *decoder)
 	memset(&decoder->pm4.next_ib_state, 0, sizeof(decoder->pm4.next_ib_state));
 }
 
+static void add_ib_pm3(struct umr_ring_decoder *decoder)
+{
+	struct umr_ring_decoder *pdecoder;
+
+	pdecoder = decoder;
+	while (pdecoder->next_ib)
+		pdecoder = pdecoder->next_ib;
+
+	pdecoder->next_ib = calloc(1, sizeof(*(pdecoder->next_ib)));
+	pdecoder = pdecoder->next_ib;
+	pdecoder->pm = 3;
+	pdecoder->next_ib_info.ib_addr = ((uint64_t)decoder->sdma.next_ib_state.ib_addr_hi << 32) |
+					 decoder->sdma.next_ib_state.ib_addr_lo;
+	pdecoder->next_ib_info.size    = decoder->sdma.next_ib_state.ib_size;
+	pdecoder->next_ib_info.vmid    = decoder->sdma.next_ib_state.ib_vmid;
+	pdecoder->next_ib_info.vm_base_addr = ~0ULL; // not used yet.
+
+
+	pdecoder->src.ib_addr = decoder->next_ib_info.ib_addr;
+	pdecoder->src.vmid    = decoder->next_ib_info.vmid;
+	pdecoder->src.addr    = decoder->next_ib_info.addr;
+
+	memset(&decoder->sdma.next_ib_state, 0, sizeof(decoder->sdma.next_ib_state));
+}
+
 static char *umr_reg_name(struct umr_asic *asic, uint64_t addr)
 {
 	struct umr_reg *reg;
@@ -486,7 +511,7 @@ static void print_decode_pm4_pkt3(struct umr_asic *asic, struct umr_ring_decoder
 				case 2: printf("IB_SIZE:%s%lu%s, VMID: %s%lu%s", BLUE, BITS(ib, 0, 20), RST, BLUE, BITS(ib, 24, 32), RST);
 					decoder->pm4.next_ib_state.ib_size = BITS(ib, 0, 20) * 4;
 					decoder->pm4.next_ib_state.ib_vmid = BITS(ib, 24, 32);
-					add_ib(decoder);
+					add_ib_pm4(decoder);
 					break;
 				default: printf("Invalid word for opcode 0x%02lx", (unsigned long)decoder->pm4.cur_opcode);
 			}
@@ -834,7 +859,7 @@ static void print_decode_pm4(struct umr_asic *asic, struct umr_ring_decoder *dec
 
 			if (decoder->pm4.next_ib_state.tally == 15) {
 				decoder->pm4.next_ib_state.tally = 0;
-				add_ib(decoder);
+				add_ib_pm4(decoder);
 			}
 
 			decoder->pm4.next_write_mem.addr_lo++;
@@ -849,11 +874,523 @@ static void print_decode_pm4(struct umr_asic *asic, struct umr_ring_decoder *dec
 	}
 }
 
+static const char *sdma_opcodes[] = {
+	"NOP", // 0
+	"COPY", // 1
+	"WRITE", // 2
+	"",
+	"INDIRECT_BUFFER", // 4
+	"FENCE", //5
+	"TRAP", //6
+	"SEM", //7
+	"POLL_REGMEM", //8
+	"COND_EXE", //9
+	"ATOMIC", //10
+	"CONST_FILL", //11
+	"GEN_PTEPDE", //12
+	"TIMESTAMP", //13
+	"SRBM WRITE", //14
+	"PRE EXE",//15
+};
+
+static void parse_next_sdma_pkt(struct umr_asic *asic, struct umr_ring_decoder *decoder, uint32_t ib)
+{
+	if (decoder->sdma.n_words == 1)
+		printf("\\---+ ");
+	else
+		printf("|---+ ");
+
+	printf("WORD [%s%u%s]: ", BLUE, (unsigned)decoder->sdma.cur_word, RST);
+	switch (decoder->sdma.cur_opcode) {
+		case 1: // COPY
+			switch (decoder->sdma.cur_sub_opcode) {
+				case 0: // LINEAR
+					switch (decoder->sdma.header_dw & (1UL << 27)) {
+						case 0: // not broadcast
+							switch (decoder->sdma.cur_word) {
+								case 1: printf("COPY_COUNT: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+									break;
+								case 2: printf("DST_SW: %s%u%s, DST_HA: %s%u%s, SRC_SW: %s%u%s, SRC_HA: %s%u%s",
+										BLUE, ((unsigned)(ib >> 16) & 3), RST,
+										BLUE, ((unsigned)(ib >> 22) & 1), RST,
+										BLUE, ((unsigned)(ib >> 24) & 3), RST,
+										BLUE, ((unsigned)(ib >> 30) & 1), RST);
+									break;
+								case 3: printf("SRC_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+									break;
+								case 4: printf("SRC_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+									break;
+								case 5: printf("DST_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+									break;
+								case 6: printf("DST_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+									break;
+							}
+							break;
+						default: // broadcast
+							break;
+					}
+					break;
+				case 1: // TILED
+					break;
+				case 3: // SOA
+					break;
+				case 4: // LINEAR_SUB_WINDOW
+					switch (decoder->sdma.cur_word) {
+						case 1: printf("SRC_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 2: printf("SRC_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 3: printf("SRC_X: %s%u%s, SRC_Y: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x3FFF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 4: printf("SRC_Z: %s%u%s, SRC_PITCH: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x7FF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 5: printf("SRC_SLICE_PITCH: %s%u%s", BLUE, ib & 0xFFFFFFF, RST);
+							break;
+						case 6: printf("DST_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 7: printf("DST_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 8: printf("DST_X: %s%u%s, DST_Y: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x3FFF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 9: printf("DST_Z: %s%u%s, DST_PITCH: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x7FF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 10: printf("DST_SLICE_PITCH: %s%u%s", BLUE, ib & 0xFFFFFFF, RST);
+							break;
+						case 11: printf("RECT_X: %s%u%s, RECT_Y: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x3FFF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 12: printf("RECT_Z: %s%u%s, DST_SW: %s%u%s, DST_HA: %s%u%s, SRC_SW: %s%u%s, SRC_HA: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x3FFF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 22) & 0x1), RST,
+								BLUE, ((unsigned)(ib >> 24) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 30) & 0x1), RST);
+							break;
+					}
+					break;
+				case 5: // TILED_SUB_WINDOW (TODO bitfields)
+					switch (decoder->sdma.cur_word) {
+						case 1: printf("TILED_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 2: printf("TILED_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 3: printf("TILED_X: %s%u%s, TILED_Y: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x3FFF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 4: printf("TILED_Z: %s%u%s, TILED_PITCH: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x7FF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 5: printf("PITCH_IN_TILE: %s%u%s", BLUE, ib & 0xFFFFFFF, RST);
+							break;
+						case 6: printf("ELEMENT_SIZE: %s%u%s, ARRAY_MODE: %s%u%s, MIT_MODE: %s%u%s, TILESPLIT_SIZE: %s%u%s, BANK_W: %s%u%s, BANK_H: %s%u%s, NUM_BANK: %s%u%s, MAT_ASPT: %s%u%s, PIPE_CONFIG: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x7), RST,
+								BLUE, ((unsigned)(ib >> 3) & 0xF), RST,
+								BLUE, ((unsigned)(ib >> 8) & 0x7), RST,
+								BLUE, ((unsigned)(ib >> 11) & 0x7), RST,
+								BLUE, ((unsigned)(ib >> 15) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 18) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 21) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 24) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 26) & 0x1F), RST);
+							break;
+						case 7: printf("LINEAR_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 8: printf("LINEAR_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 9: printf("LINEAR_X: %s%u%s, LINEAR_Y: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x3FFF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 10: printf("LINEAR_Z: %s%u%s, LINEAR_PITCH: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x7FF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 11: printf("LINEAR_SLICE_PITCH: %s%u%s", BLUE, ib & 0xFFFFFFF, RST);
+							break;
+						case 12: printf("RECT_X: %s%u%s, RECT_Y: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x3FFF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 13: printf("RECT_Z: %s%u%s, LINEAR_SW: %s%u%s, TILE_SW: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x7FF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 24) & 0x3), RST);
+							break;
+					}
+					break;
+				case 6: // T2T_SUB_WINDOW
+					switch (decoder->sdma.cur_word) {
+						case 1: printf("SRC_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 2: printf("SRC_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 3: printf("SRC_X: %s%u%s, SRC_Y: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x3FFF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 4: printf("SRC_Z: %s%u%s, SRC_PITCH: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x7FF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 5: printf("SRC_SLICE_PITCH: %s%u%s", BLUE, ib & 0xFFFFFFF, RST);
+							break;
+						case 6: printf("SRC_ELEMENT_SIZE: %s%u%s, SRC_ARRAY_MODE: %s%u%s, SRC_MIT_MODE: %s%u%s, SRC_TILESPLIT_SIZE: %s%u%s, SRC_BANK_W: %s%u%s, SRC_BANK_H: %s%u%s, NUM_BANKS: %s%u%s, MAT_ASPT: %s%u%s, PIPE_CONFIG: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x7), RST,
+								BLUE, ((unsigned)(ib >> 3) & 0xF), RST,
+								BLUE, ((unsigned)(ib >> 8) & 0x7), RST,
+								BLUE, ((unsigned)(ib >> 11) & 0x7), RST,
+								BLUE, ((unsigned)(ib >> 15) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 18) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 21) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 24) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 26) & 0x1F), RST);
+							break;
+						case 7: printf("DST_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 8: printf("DST_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 9: printf("DW9: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+							break;
+						case 10: printf("DST_Z: %s%u%s, DST_PITCH: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x7FF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 11: printf("DST_SLICE_PITCH: %s%u%s", BLUE, ib & 0xFFFFFFF, RST);
+							break;
+						case 12: printf("ARRAY_MODE: %s%u%s, MIT_MODE: %s%u%s, TILESPLIT_SIZE: %s%u%s, BANK_W: %s%u%s, BANK_H: %s%u%s, NUM_BANK: %s%u%s, MAT_ASPT: %s%u%s, PIPE_CONFIG: %s%u%s",
+								BLUE, ((unsigned)(ib >> 3) & 0xF), RST,
+								BLUE, ((unsigned)(ib >> 8) & 0x7), RST,
+								BLUE, ((unsigned)(ib >> 11) & 0x7), RST,
+								BLUE, ((unsigned)(ib >> 15) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 18) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 21) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 24) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 26) & 0x1F), RST);
+							break;
+						case 13: printf("RECT_X: %s%u%s, RECT_Y: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x3FFF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3FFF), RST);
+							break;
+						case 14: printf("RECT_Z: %s%u%s, DST_SW: %s%u%s, SRC_SW: %s%u%s",
+								BLUE, ((unsigned)(ib >> 0) & 0x7FF), RST,
+								BLUE, ((unsigned)(ib >> 16) & 0x3), RST,
+								BLUE, ((unsigned)(ib >> 24) & 0x3), RST);
+							break;
+					}
+					break;
+			}
+			break;
+		case 2: // WRITE
+			switch (decoder->sdma.cur_sub_opcode) {
+				case 0: // LINEAR
+					switch (decoder->sdma.cur_word) {
+						case 1: printf("DST_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 2: printf("DST_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 3: printf("COUNT: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+							decoder->sdma.n_words += ib - 1;
+							break;
+						default: printf("DATA: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+							break;
+					}
+					break;
+
+				case 1: // TILED (TODO bit decodings...)
+					switch (decoder->sdma.cur_word) {
+						case 1: printf("DST_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 2: printf("DST_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+							break;
+						case 3: printf("DW3: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+							break;
+						case 4: printf("DW4: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+							break;
+						case 5: printf("DW5: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+							break;
+						case 6: printf("DW6: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+							break;
+						case 7: printf("DW7: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+							break;
+					}
+					break;
+			}
+			break;
+		case 4: // INDIRECT
+			switch (decoder->sdma.cur_word) {
+				case 1: printf("IB_BASE_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					decoder->sdma.next_ib_state.ib_addr_lo = ib;
+					break;
+				case 2: printf("IB_BASE_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					decoder->sdma.next_ib_state.ib_addr_hi = ib;
+					break;
+				case 3: printf("IB_BASE_SIZE: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+					decoder->sdma.next_ib_state.ib_size = ib * 4; // number of bytesq
+					break;
+				case 4: printf("IB_CSA_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					decoder->sdma.next_ib_state.csa_addr_lo = ib;
+					break;
+				case 5: printf("IB_CSA_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					decoder->sdma.next_ib_state.csa_addr_hi = ib;
+					add_ib_pm3(decoder);
+					break;
+			}
+			break;
+		case 5: // FENCE
+			switch (decoder->sdma.cur_word) {
+				case 1: printf("FENCE_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					break;
+				case 2: printf("FENCE_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					break;
+				case 3: printf("FENCE_DATA: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+					break;
+			}
+			break;
+		case 6: // TRAP
+			switch (decoder->sdma.cur_word) {
+				case 1: printf("TRAP_INT_CONTEXT: %s0x%08lx%s", YELLOW, (unsigned long)ib & 0xFFFFFFF, RST);
+					break;
+			}
+			break;
+		case 8: // POLL_REGMEM
+			switch (decoder->sdma.cur_word) {
+				case 1: printf("POLL_REGMEM_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					if (!(decoder->sdma.header_dw & (1UL << 31))) printf("(%s)", umr_reg_name(asic, ib));
+					break;
+				case 2: printf("POLL_REGMEM_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					if (!(decoder->sdma.header_dw & (1UL << 31))) printf("(%s)", umr_reg_name(asic, ib));
+					break;
+				case 3: printf("POLL_REGMEM_ADDR_VALUE: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+					break;
+				case 4: printf("POLL_REGMEM_ADDR_MASK: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+					break;
+				case 5: printf("POLL_REGMEM_ADDR_DW5: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+					break;
+			}
+			break;
+		case 11: // CONST_FILL
+			switch (decoder->sdma.cur_word) {
+				case 1: printf("CONST_FILL_DST_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					break;
+				case 2: printf("CONST_FILL_DST_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					break;
+				case 3: printf("CONST_FILL_DATA: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+					break;
+				case 4: printf("CONST_FILL_BYTE_COUNT: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+					break;
+			}
+			break;
+		case 12: // GEN_PTEPDE
+			switch (decoder->sdma.cur_word) {
+				case 1: printf("GEN_PTEPDE_PE_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					break;
+				case 2: printf("GEN_PTEPDE_PE_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					break;
+				case 3: printf("GEN_PTEPDE_FLAGS_LO: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+					break;
+				case 4: printf("GEN_PTEPDE_FLAGS_HI: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+					break;
+				case 5: printf("GEN_PTEPDE_ADDR_LO: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					break;
+				case 6: printf("GEN_PTEPDE_ADDR_HI: %s0x%08lx%s", YELLOW, (unsigned long)ib, RST);
+					break;
+				case 7: printf("GEN_PTEPDE_INC_SIZE: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+					break;
+				case 8: printf("GEN_PTEPDE_DW8: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+					break;
+				case 9: printf("GEN_PTEPDE_COUNT: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+					break;
+			}
+			break;
+		case 14: // SRBM_WRITE
+			switch (decoder->sdma.cur_word) {
+				case 1: printf("SRBM_WRITE_ADDR: %s0x%08lx%s(%s)",
+						YELLOW, (unsigned long)ib & 0xFFFF, RST, umr_reg_name(asic, ib & 0xFFFF));
+					decoder->sdma.next_write_mem = ib;
+					break;
+				case 2: printf("SRBM_WRITE_DATA: %s0x%08lx%s", BLUE, (unsigned long)ib, RST);
+					print_bits(asic, decoder->sdma.next_write_mem, ib, 1);
+					break;
+			}
+			break;
+	}
+
+	decoder->sdma.cur_word++;
+}
+
+static void print_decode_sdma(struct umr_asic *asic, struct umr_ring_decoder *decoder, uint32_t ib)
+{
+	static const char *poll_regmem_funcs[] = { "always", "<", "<=", "==", "!=", ">=", ">", "N/A" };
+	switch (decoder->sdma.cur_opcode) {
+		case 0xFFFFFFFF: // initial decode
+			decoder->sdma.cur_opcode = ib & 0xFF;
+			decoder->sdma.cur_sub_opcode = (ib >> 8) & 0xFF;
+			decoder->sdma.cur_word = 1;
+			decoder->sdma.header_dw = ib;
+
+			// sanity check
+			if (decoder->sdma.cur_opcode > 15) {
+				// invalid
+				decoder->sdma.cur_opcode = 0xFFFFFFFF;
+				break;
+			}
+
+			printf("OPCODE: [%s%s%s], SUB-OPCODE: [%s%u%s]",
+				CYAN, sdma_opcodes[decoder->sdma.cur_opcode], RST,
+				BLUE, (unsigned)decoder->sdma.cur_sub_opcode, RST);
+
+			// handle decoding "extra information" from header word
+			switch (decoder->sdma.cur_opcode) {
+				case 0: // NOP
+					decoder->sdma.n_words = 1;
+					break;
+				case 1:  // COPY
+					switch (decoder->sdma.cur_sub_opcode) {
+						case 0: // LINEAR
+							printf(", %sLINEAR", CYAN);
+							decoder->sdma.n_words = 7;
+
+							// BROADCAST
+							if (ib & (1UL << 27)) {
+								decoder->sdma.n_words += 2;
+								printf("_BROADCAST");
+							}
+							printf("_COPY%s", RST);
+							break;
+						case 1: // TILED
+							printf(", %sTILED_COPY%s", CYAN, RST);
+							decoder->sdma.n_words = 12;
+							break;
+						case 3: // STRUCTURE/SOA
+							printf(", %sSTRUCTURE_COPY%s", CYAN, RST);
+							decoder->sdma.n_words = 8;
+							break;
+						case 4: // LINEAR_SUB_WINDOW
+							printf(", %sLINEAR_SUB_WINDOW_COPY%s", CYAN, RST);
+							decoder->sdma.n_words = 13;
+							break;
+						case 5: // TILED_SUB_WINDOW
+							printf(", %sTILED_SUB_WINDOW_COPY%s, DETILE: %s%u%s", CYAN, RST, BLUE, (unsigned)(ib >> 31), RST);
+							decoder->sdma.n_words = 14;
+							break;
+						case 6: // T2T_SUB_WIND
+							printf(", %sT2T_SUB_WINDOW_COPY%s", CYAN, RST);
+							decoder->sdma.n_words = 15;
+							break;
+					}
+					break;
+				case 2:  // WRITE
+					switch (decoder->sdma.cur_sub_opcode) {
+						case 0: // LINEAR
+							printf(", %sLINEAR_WRITE%s", CYAN, RST);
+							decoder->sdma.n_words = 5;
+							break;
+						case 1: // TILED
+							printf(", %sTILED_WRITE%s", CYAN, RST);
+							decoder->sdma.n_words = 10;
+							break;
+					}
+					break;
+				case 4: // INDIRECT
+					decoder->sdma.next_ib_state.ib_vmid = (ib >> 16) & 0xF;
+					printf(", VMID: %s%u%s", BLUE, decoder->sdma.next_ib_state.ib_vmid, RST);
+					decoder->sdma.n_words = 6;
+					break;
+				case 5: // FENCE
+					decoder->sdma.n_words = 4;
+					break;
+				case 6: // TRAP
+					decoder->sdma.n_words = 2;
+					break;
+					break;
+				case 7: // SEM
+					printf(", WRITE_ONE: %s%u%s, SIGNAL: %s%u%s, MAILBOX: %s%u%s",
+						BLUE, (unsigned)((ib >> 29) & 1), RST,
+						BLUE, (unsigned)((ib >> 30) & 1), RST,
+						BLUE, (unsigned)((ib >> 31) & 1), RST);
+					decoder->sdma.n_words = 3;
+					break;
+				case 8: // POLL_REGMEM
+					printf(", HDP_FLUSH: %s%u%s, FUNCTION: %s%u%s (%s%s%s), MEM_POLL: %s%u%s",
+						BLUE, (unsigned)((ib >> 26) & 1), RST,
+						BLUE, (unsigned)((ib >> 28) & 7), RST,
+						CYAN, poll_regmem_funcs[((ib >> 28) & 7)], RST,
+						BLUE, (unsigned)((ib >> 31) & 1), RST);
+					decoder->sdma.n_words = 6;
+					break;
+				case 9: // COND_EXE
+					decoder->sdma.n_words = 5;
+					break;
+				case 10: // ATOMIC
+					printf(", LOOP: %s%u%s, OP: %s%u%s",
+						BLUE, (unsigned)((ib >> 16) & 1), RST,
+						BLUE, (unsigned)((ib >> 25) & 0x7F), RST);
+					decoder->sdma.n_words = 8;
+					break;
+				case 11: // CONST_FILL
+					printf(", FILL_SIZE: %s%u%s", BLUE, (unsigned)(ib >> 30), RST);
+					decoder->sdma.n_words = 5;
+					break;
+				case 12: // GEN_PTEPDE
+					decoder->sdma.n_words = 10;
+					break;
+				case 13: // TIMESTAMP
+					switch (decoder->sdma.cur_sub_opcode) {
+						case 0:
+							printf(", %sTIMESTAMP_SET%s", CYAN, RST);
+							decoder->sdma.n_words = 3;
+							break;
+						case 1:
+							printf(", %sTIMESTAMP_GET%s", CYAN, RST);
+							decoder->sdma.n_words = 3;
+							break;
+						case 2:
+							printf(", %sTIMESTAMP_GET_GLOBAL%s", CYAN, RST);
+							decoder->sdma.n_words = 3;
+							break;
+					}
+					break;
+				case 14: // SRBM_WRITE
+					printf(", BYTE ENABLE: %s0x%x%s", BLUE, (unsigned)(ib >> 28), RST);
+					decoder->sdma.n_words = 3;
+					break;
+				case 15: // PRE_EXE
+					printf(", DEV_SEL: %s%u%s",
+						BLUE, (unsigned)((ib >> 16) & 0xFF), RST);
+					decoder->sdma.n_words = 2;
+					break;
+				default:
+					break; // nothing to print
+			}
+			break;
+		default:
+			parse_next_sdma_pkt(asic, decoder, ib);
+			break;
+	}
+	if (!--(decoder->sdma.n_words) ) {
+		decoder->sdma.cur_opcode = 0xFFFFFFFF;
+	}
+}
+
 void umr_print_decode(struct umr_asic *asic, struct umr_ring_decoder *decoder, uint32_t ib)
 {
 	switch (decoder->pm) {
 		case 4:
 			print_decode_pm4(asic, decoder, ib);
 			break;
+		case 3:
+			print_decode_sdma(asic, decoder, ib);
+			break;
 	}
 }
diff --git a/src/umr.h b/src/umr.h
index c0821f2d2c03..f92b9c9591aa 100644
--- a/src/umr.h
+++ b/src/umr.h
@@ -382,6 +382,26 @@ struct umr_ring_decoder {
 		} next_write_mem;
 	} pm4;
 
+	struct {
+		uint32_t
+			cur_opcode,
+			cur_sub_opcode,
+			n_words,
+			cur_word,
+			header_dw,
+			next_write_mem;
+
+		struct {
+			uint32_t
+				ib_addr_lo,
+				ib_addr_hi,
+				csa_addr_lo,
+				csa_addr_hi,
+				ib_size,
+				ib_vmid;
+		} next_ib_state;
+	} sdma;
+
 	struct umr_ring_decoder *next_ib;
 
 	// only used by tail end of ring_read ...
-- 
2.12.0



More information about the amd-gfx mailing list