[Mesa-dev] [PATCH 04/10] radeon/vcn: implement jpeg decode functions

boyuan.zhang at amd.com boyuan.zhang at amd.com
Thu Aug 2 19:44:44 UTC 2018


From: Boyuan Zhang <boyuan.zhang at amd.com>

Signed-off-by: Boyuan Zhang <boyuan.zhang at amd.com>
---
 src/gallium/drivers/radeon/radeon_vcn_jpeg.c | 286 ++++++++++++++++++++++++++-
 1 file changed, 281 insertions(+), 5 deletions(-)

diff --git a/src/gallium/drivers/radeon/radeon_vcn_jpeg.c b/src/gallium/drivers/radeon/radeon_vcn_jpeg.c
index c078131..72dff57 100644
--- a/src/gallium/drivers/radeon/radeon_vcn_jpeg.c
+++ b/src/gallium/drivers/radeon/radeon_vcn_jpeg.c
@@ -63,12 +63,195 @@ struct radeon_jpeg_decoder {
 	unsigned			dt_chroma_top_offset;
 };
 
+static void radeon_jpeg_destroy_associated_data(void *data)
+{
+	/* NOOP: the data is an integer carried in the pointer value (intptr), so nothing is freed */
+}
+
+/* Fill in bsd_size and the target surface offsets/pitches; returns the buffer of resources[0]. */
+static struct pb_buffer *radeon_jpeg_get_decode_param(struct radeon_jpeg_decoder *dec,
+					struct pipe_video_buffer *target,
+					struct pipe_picture_desc *picture)
+{
+	struct vl_video_buffer *vbuf = (struct vl_video_buffer *)target;
+	struct r600_texture *y_tex = (struct r600_texture *)vbuf->resources[0];
+	struct r600_texture *uv_tex = (struct r600_texture *)vbuf->resources[1];
+
+	dec->bsd_size = align(dec->bs_size, 128);
+	dec->dt_luma_top_offset = y_tex->surface.u.gfx9.surf_offset;
+	/* NOTE(review): any other buffer format leaves dt_pitch at its previous value */
+	if (target->buffer_format == PIPE_FORMAT_NV12) {
+		dec->dt_chroma_top_offset = uv_tex->surface.u.gfx9.surf_offset;
+		dec->dt_pitch = y_tex->surface.u.gfx9.surf_pitch * y_tex->surface.blk_w;
+	} else if (target->buffer_format == PIPE_FORMAT_YUYV) {
+		dec->dt_pitch = y_tex->surface.u.gfx9.surf_pitch;
+	}
+	dec->dt_uv_pitch = dec->dt_pitch / 2;
+	return y_tex->resource.buf;
+}
+
+/* Write the JPEG header segments (SOI, DQT, DHT, optional DRI, SOF0, SOS) built
+ * from pic at dec->bs_ptr, then advance dec->bs_ptr and dec->bs_size past them.
+ * 16-bit fields are stored bytewise, high byte first: no misaligned or host-order stores. */
+static void get_mjpeg_slice_header(struct radeon_jpeg_decoder *dec, struct pipe_mjpeg_picture_desc *pic)
+{
+	int size = 0, len_pos, seg_len, i;
+	uint8_t *buf = dec->bs_ptr;
+
+	/* SOI */
+	buf[size++] = 0xff;
+	buf[size++] = 0xd8;
+
+	/* DQT */
+	buf[size++] = 0xff;
+	buf[size++] = 0xdb;
+
+	/* skip the two length bytes; they are filled in once the segment is complete */
+	len_pos = size;
+	size += 2;
+
+	for (i = 0; i < 4; ++i) {
+		if (pic->quantization_table.load_quantiser_table[i] == 0)
+			continue;
+
+		buf[size++] = i;
+		memcpy((buf + size), &pic->quantization_table.quantiser_table[i], 64);
+		size += 64;
+	}
+
+	/* the segment length covers the length field itself but not the marker */
+	seg_len = size - len_pos;
+	buf[len_pos] = (seg_len >> 8) & 0xff;
+	buf[len_pos + 1] = seg_len & 0xff;
+
+	/* DHT */
+	buf[size++] = 0xff;
+	buf[size++] = 0xc4;
+
+	len_pos = size;
+	size += 2;
+
+	/* NOTE(review): always 12 DC and 162 AC values are copied, whatever the code counts say */
+	for (i = 0; i < 2; ++i) {
+		if (pic->huffman_table.load_huffman_table[i] == 0)
+			continue;
+
+		buf[size++] = 0x00 | i;
+		memcpy((buf + size), &pic->huffman_table.table[i].num_dc_codes, 16);
+		size += 16;
+		memcpy((buf + size), &pic->huffman_table.table[i].dc_values, 12);
+		size += 12;
+	}
+
+	for (i = 0; i < 2; ++i) {
+		if (pic->huffman_table.load_huffman_table[i] == 0)
+			continue;
+
+		buf[size++] = 0x10 | i;
+		memcpy((buf + size), &pic->huffman_table.table[i].num_ac_codes, 16);
+		size += 16;
+		memcpy((buf + size), &pic->huffman_table.table[i].ac_values, 162);
+		size += 162;
+	}
+
+	seg_len = size - len_pos;
+	buf[len_pos] = (seg_len >> 8) & 0xff;
+	buf[len_pos + 1] = seg_len & 0xff;
+
+	/* DRI */
+	if (pic->slice_parameter.restart_interval) {
+		buf[size++] = 0xff;
+		buf[size++] = 0xdd;
+		buf[size++] = 0x00;
+		buf[size++] = 0x04;
+		buf[size++] = (pic->slice_parameter.restart_interval >> 8) & 0xff;
+		buf[size++] = pic->slice_parameter.restart_interval & 0xff;
+	}
+
+	/* SOF */
+	buf[size++] = 0xff;
+	buf[size++] = 0xc0;
+
+	len_pos = size;
+	size += 2;
+
+	/* sample precision: 8 bits, followed by height and width */
+	buf[size++] = 0x08;
+
+	buf[size++] = (pic->picture_parameter.picture_height >> 8) & 0xff;
+	buf[size++] = pic->picture_parameter.picture_height & 0xff;
+	buf[size++] = (pic->picture_parameter.picture_width >> 8) & 0xff;
+	buf[size++] = pic->picture_parameter.picture_width & 0xff;
+	buf[size++] = pic->picture_parameter.num_components;
+
+	for (i = 0; i < pic->picture_parameter.num_components; ++i) {
+		buf[size++] = pic->picture_parameter.components[i].component_id;
+		buf[size++] = pic->picture_parameter.components[i].h_sampling_factor << 4 |
+					  pic->picture_parameter.components[i].v_sampling_factor;
+		buf[size++] = pic->picture_parameter.components[i].quantiser_table_selector;
+	}
+
+	seg_len = size - len_pos;
+	buf[len_pos] = (seg_len >> 8) & 0xff;
+	buf[len_pos + 1] = seg_len & 0xff;
+
+	/* SOS */
+	buf[size++] = 0xff;
+	buf[size++] = 0xda;
+
+	len_pos = size;
+	size += 2;
+
+	buf[size++] = pic->slice_parameter.num_components;
+
+	for (i = 0; i < pic->slice_parameter.num_components; ++i) {
+		buf[size++] = pic->slice_parameter.components[i].component_selector;
+		buf[size++] = pic->slice_parameter.components[i].dc_table_selector << 4 |
+					  pic->slice_parameter.components[i].ac_table_selector;
+	}
+
+	/* spectral selection 0..63, no successive approximation */
+	buf[size++] = 0x00;
+	buf[size++] = 0x3f;
+	buf[size++] = 0x00;
+
+	seg_len = size - len_pos;
+	buf[len_pos] = (seg_len >> 8) & 0xff;
+	buf[len_pos + 1] = seg_len & 0xff;
+
+	dec->bs_ptr += size;
+	dec->bs_size += size;
+}
+
 /* flush IB to the hardware */
 static int flush(struct radeon_jpeg_decoder *dec, unsigned flags)
 {
 	return dec->ws->cs_flush(dec->cs, flags, NULL);
 }
 
+/* add a new set register command to the IB (stub in this patch: nothing is emitted yet) */
+static void set_reg_jpeg(struct radeon_jpeg_decoder *dec, unsigned reg,
+					unsigned cond, unsigned type, uint32_t val)
+{
+	/* TODO: not implemented yet; all arguments are currently ignored */
+}
+
+/* send a bitstream buffer command (stub in this patch: nothing is emitted yet) */
+static void send_cmd_bitstream(struct radeon_jpeg_decoder *dec,
+		     struct pb_buffer* buf, uint32_t off,
+		     enum radeon_bo_usage usage, enum radeon_bo_domain domain)
+{
+	/* TODO: not implemented yet; all arguments are currently ignored */
+}
+
+/* send a target buffer command (stub in this patch: nothing is emitted yet) */
+static void send_cmd_target(struct radeon_jpeg_decoder *dec,
+		     struct pb_buffer* buf, uint32_t off,
+		     enum radeon_bo_usage usage, enum radeon_bo_domain domain)
+{
+	/* TODO: not implemented yet; all arguments are currently ignored */
+}
+
 /* cycle to the next set of buffers */
 static void next_buffer(struct radeon_jpeg_decoder *dec)
 {
@@ -81,7 +264,20 @@ static void next_buffer(struct radeon_jpeg_decoder *dec)
  */
 static void radeon_jpeg_destroy(struct pipe_video_codec *decoder)
 {
-	/* TODO */
+	struct radeon_jpeg_decoder *jpeg = (struct radeon_jpeg_decoder *)decoder;
+	unsigned buf_idx;
+
+	assert(decoder);
+
+	/* flush the IB one last time, then tear down the command stream */
+	flush(jpeg, 0);
+	jpeg->ws->cs_destroy(jpeg->cs);
+
+	/* release every bitstream buffer before the decoder object itself */
+	for (buf_idx = 0; buf_idx < NUM_BUFFERS; ++buf_idx)
+		si_vid_destroy_buffer(&jpeg->bs_buffers[buf_idx]);
+
+	FREE(jpeg);
 }
 
 /**
@@ -91,7 +287,19 @@ static void radeon_jpeg_begin_frame(struct pipe_video_codec *decoder,
 			     struct pipe_video_buffer *target,
 			     struct pipe_picture_desc *picture)
 {
-	/* TODO */
+	struct radeon_jpeg_decoder *jpeg = (struct radeon_jpeg_decoder *)decoder;
+	uintptr_t frame_id;
+
+	assert(decoder);
+
+	/* attach the new frame number to the target, carried in the pointer value */
+	frame_id = ++jpeg->frame_number;
+	vl_video_buffer_set_associated_data(target, decoder, (void *)frame_id,
+					    &radeon_jpeg_destroy_associated_data);
+	/* start with an empty bitstream and map the current bitstream buffer for writing */
+	jpeg->bs_size = 0;
+	jpeg->bs_ptr = jpeg->ws->buffer_map(jpeg->bs_buffers[jpeg->cur_buffer].res->buf,
+					    jpeg->cs, PIPE_TRANSFER_WRITE);
 }
 
 /**
@@ -103,7 +311,8 @@ static void radeon_jpeg_decode_macroblock(struct pipe_video_codec *decoder,
 				   const struct pipe_macroblock *macroblocks,
 				   unsigned num_macroblocks)
 {
-	/* TODO */
+	/* macroblock-level decoding is not supported (yet); the assert fires unless NDEBUG is set */
+	assert(0);
 }
 
 /**
@@ -116,7 +325,51 @@ static void radeon_jpeg_decode_bitstream(struct pipe_video_codec *decoder,
 				  const void * const *buffers,
 				  const unsigned *sizes)
 {
-	/* TODO */
+	struct radeon_jpeg_decoder *dec = (struct radeon_jpeg_decoder*)decoder;
+	enum pipe_video_format format = u_reduce_video_profile(picture->profile);
+	unsigned i;
+
+	assert(decoder);
+	/* bs_ptr is NULL when no bitstream buffer is mapped (mapping or resizing failed) */
+	if (!dec->bs_ptr)
+		return;
+	/* for JPEG, first emit the header segments rebuilt from the picture description */
+	if (format == PIPE_VIDEO_FORMAT_JPEG)
+		get_mjpeg_slice_header(dec, (struct pipe_mjpeg_picture_desc*)picture);
+
+	for (i = 0; i < num_buffers; ++i) {
+		struct rvid_buffer *buf = &dec->bs_buffers[dec->cur_buffer];
+		unsigned new_size = dec->bs_size + sizes[i];
+
+		if (format == PIPE_VIDEO_FORMAT_JPEG)
+			new_size += 2; /* save for EOI */
+
+		if (new_size > buf->res->buf->size) {
+			/* the mapping ends here: clear bs_ptr so a failed resize leaves no stale pointer */
+			dec->ws->buffer_unmap(buf->res->buf);
+			dec->bs_ptr = NULL;
+			if (!si_vid_resize_buffer(dec->screen, dec->cs, buf, new_size)) {
+				RVID_ERR("Can't resize bitstream buffer!");
+				return;
+			}
+			dec->bs_ptr = dec->ws->buffer_map(buf->res->buf, dec->cs,
+							  PIPE_TRANSFER_WRITE);
+			if (!dec->bs_ptr)
+				return;
+			dec->bs_ptr += dec->bs_size; /* skip the bs_size bytes accounted for so far */
+		}
+
+		memcpy(dec->bs_ptr, buffers[i], sizes[i]);
+		dec->bs_size += sizes[i];
+		dec->bs_ptr += sizes[i];
+	}
+
+	if (format == PIPE_VIDEO_FORMAT_JPEG) {
+		((uint8_t *)dec->bs_ptr)[0] = 0xff;	/* EOI */
+		((uint8_t *)dec->bs_ptr)[1] = 0xd9;
+		dec->bs_size += 2;
+		dec->bs_ptr += 2;
+	}
 }
 
 /**
@@ -126,7 +379,30 @@ static void radeon_jpeg_end_frame(struct pipe_video_codec *decoder,
 			   struct pipe_video_buffer *target,
 			   struct pipe_picture_desc *picture)
 {
-	/* TODO */
+	struct radeon_jpeg_decoder *jpeg = (struct radeon_jpeg_decoder *)decoder;
+	struct rvid_buffer *bitstream;
+	struct pb_buffer *target_bo;
+
+	assert(decoder);
+	/* without a mapped bitstream buffer there is nothing to submit */
+	if (!jpeg->bs_ptr)
+		return;
+
+	/* zero the tail up to the next 128 byte boundary, then unmap the buffer */
+	bitstream = &jpeg->bs_buffers[jpeg->cur_buffer];
+	memset(jpeg->bs_ptr, 0, align(jpeg->bs_size, 128) - jpeg->bs_size);
+	jpeg->ws->buffer_unmap(bitstream->res->buf);
+
+	/* compute the decode parameters and send the bitstream and target buffer commands */
+	target_bo = radeon_jpeg_get_decode_param(jpeg, target, picture);
+	send_cmd_bitstream(jpeg, bitstream->res->buf,
+		 0, RADEON_USAGE_READ, RADEON_DOMAIN_GTT);
+	send_cmd_target(jpeg, target_bo, 0,
+		 RADEON_USAGE_WRITE, RADEON_DOMAIN_VRAM);
+
+	/* flush the IB asynchronously, then cycle to the next set of buffers */
+	flush(jpeg, PIPE_FLUSH_ASYNC);
+	next_buffer(jpeg);
 }
 
 /**
-- 
2.7.4



More information about the mesa-dev mailing list