[Libva] [PATCH V1][libva-intel-driver] add the support of 8-aligned size setting for hevc encoding

peng.chen peng.c.chen at intel.com
Fri Apr 15 08:04:38 UTC 2016


Signed-off-by: peng.chen <peng.c.chen at intel.com>
---
 src/gen9_mfc_hevc.c | 68 +++++++++++++++++++++++++++++++++++++++++++++++++----
 1 file changed, 64 insertions(+), 4 deletions(-)

diff --git a/src/gen9_mfc_hevc.c b/src/gen9_mfc_hevc.c
index fd976f0..b7acc00 100644
--- a/src/gen9_mfc_hevc.c
+++ b/src/gen9_mfc_hevc.c
@@ -1687,6 +1687,8 @@ gen9_hcpe_hevc_pipeline_slice_programing(VADriverContextP ctx,
     int cu_index = 0;
     int inter_rdo, intra_rdo;
     int qp;
+    int drop_cu_row_in_last_mb = 0;
+    int drop_cu_column_in_last_mb = 0;
 
     if (log2_ctb_size == 5) num_cu_record = 16;
     else if (log2_ctb_size == 4) num_cu_record = 4;
@@ -1751,10 +1753,29 @@ gen9_hcpe_hevc_pipeline_slice_programing(VADriverContextP ctx,
         int last_ctb = (i_ctb == (pSliceParameter->slice_segment_address + pSliceParameter->num_ctu_in_slice - 1));
         int ctb_height_in_mb_internal = ctb_width_in_mb;
         int ctb_width_in_mb_internal = ctb_width_in_mb;
+        int max_cu_num_in_mb = 4;
+
         ctb_x = i_ctb % width_in_ctb;
         ctb_y = i_ctb / width_in_ctb;
-        if(ctb_y == (height_in_ctb - 1) && row_pad_flag)  ctb_height_in_mb_internal = 1;
-        if(ctb_x == (width_in_ctb - 1) && col_pad_flag)  ctb_width_in_mb_internal = 1;
+
+        drop_cu_row_in_last_mb = 0;
+        drop_cu_column_in_last_mb = 0;
+
+        if(ctb_y == (height_in_ctb - 1) && row_pad_flag)
+        {
+            ctb_height_in_mb_internal = (pSequenceParameter->pic_height_in_luma_samples - (ctb_y * ctb_size) + 15)/16;
+
+            if(log2_cu_size == 3)
+                drop_cu_row_in_last_mb = (16 - (pSequenceParameter->pic_height_in_luma_samples % 16))>>log2_cu_size;
+        }
+
+        if(ctb_x == (width_in_ctb - 1) && col_pad_flag)
+        {
+            ctb_width_in_mb_internal = (pSequenceParameter->pic_width_in_luma_samples - (ctb_x * ctb_size) + 15) / 16;
+
+            if(log2_cu_size == 3)
+                drop_cu_column_in_last_mb = (16 - (pSequenceParameter->pic_width_in_luma_samples % 16))>>log2_cu_size;
+        }
 
         mb_x = 0;
         mb_y = 0;
@@ -1769,6 +1790,13 @@ gen9_hcpe_hevc_pipeline_slice_programing(VADriverContextP ctx,
             mb_addr = macroblock_address + mb_y * width_in_mbs ;
             for (mb_x = 0; mb_x < ctb_width_in_mb_internal; mb_x++)
             {
+                max_cu_num_in_mb = 4;
+                if(drop_cu_row_in_last_mb && (mb_y == ctb_height_in_mb_internal - 1))
+                    max_cu_num_in_mb /= 2;
+
+                if(drop_cu_column_in_last_mb && (mb_x == ctb_width_in_mb_internal - 1))
+                    max_cu_num_in_mb /= 2;
+
                 /* get the mb info from the vme out */
                 msg = (unsigned int *)(msg_ptr + mb_addr * vme_context->vme_output.size_block);
 
@@ -1779,7 +1807,23 @@ gen9_hcpe_hevc_pipeline_slice_programing(VADriverContextP ctx,
                 if (is_intra || intra_rdo < inter_rdo) {
                     /* fill intra cu */
                     tmp_mb_mode = (msg[0] & AVC_INTRA_MODE_MASK) >> 4;
-                    if (tmp_mb_mode == AVC_INTRA_16X16) {
+                    if(max_cu_num_in_mb < 4){
+                        if(tmp_mb_mode == AVC_INTRA_16X16)
+                        {
+                            msg[0] = (msg[0] & !AVC_INTRA_MODE_MASK) | (AVC_INTRA_8X8<<4);
+                            tmp_mb_mode = AVC_INTRA_8X8;
+                        }
+
+                        gen9_hcpe_hevc_fill_indirect_cu_intra(ctx, encode_state, encoder_context, qp, msg, ctb_x, ctb_y, mb_x, mb_y, ctb_width_in_mb, width_in_ctb, num_cu_record, slice_type,cu_index++,0);
+                        if(--max_cu_num_in_mb > 0)
+                            gen9_hcpe_hevc_fill_indirect_cu_intra(ctx, encode_state, encoder_context, qp, msg, ctb_x, ctb_y, mb_x, mb_y, ctb_width_in_mb, width_in_ctb, num_cu_record, slice_type,cu_index++,2);
+
+                        if(ctb_width_in_mb == 2)
+                            split_coding_unit_flag |= 0x1 << (mb_x + mb_y * ctb_width_in_mb + 16);
+                        else if(ctb_width_in_mb == 1)
+                            split_coding_unit_flag |= 0x1 << 20;
+                    } 
+                    else if(tmp_mb_mode == AVC_INTRA_16X16) {
                         gen9_hcpe_hevc_fill_indirect_cu_intra(ctx, encode_state, encoder_context, qp, msg, ctb_x, ctb_y, mb_x, mb_y, ctb_width_in_mb, width_in_ctb, num_cu_record, slice_type,cu_index++,0);
                     } else { // for 4x4 to use 8x8 replace
                         gen9_hcpe_hevc_fill_indirect_cu_intra(ctx, encode_state, encoder_context, qp, msg, ctb_x, ctb_y, mb_x, mb_y, ctb_width_in_mb, width_in_ctb, num_cu_record, slice_type,cu_index++,0);
@@ -1795,7 +1839,23 @@ gen9_hcpe_hevc_pipeline_slice_programing(VADriverContextP ctx,
                     msg += AVC_INTER_MSG_OFFSET;
                     /* fill inter cu */
                     tmp_mb_mode = msg[0] & AVC_INTER_MODE_MASK;
-                    if (tmp_mb_mode == AVC_INTER_8X8){
+                    if(max_cu_num_in_mb < 4)
+                    {
+                        if(tmp_mb_mode != AVC_INTER_8X8)
+                        {
+                            msg[0] = (msg[0] & !AVC_INTER_MODE_MASK) | AVC_INTER_8X8;
+                            tmp_mb_mode = AVC_INTER_8X8;
+                        }
+                        gen9_hcpe_hevc_fill_indirect_cu_inter(ctx, encode_state, encoder_context, qp, msg, ctb_x, ctb_y, mb_x, mb_y, ctb_width_in_mb, width_in_ctb, num_cu_record, slice_type,cu_index++,0);
+                        if(--max_cu_num_in_mb > 0)
+                            gen9_hcpe_hevc_fill_indirect_cu_inter(ctx, encode_state, encoder_context, qp, msg, ctb_x, ctb_y, mb_x, mb_y, ctb_width_in_mb, width_in_ctb, num_cu_record, slice_type,cu_index++,1);
+
+                        if(ctb_width_in_mb == 2)
+                            split_coding_unit_flag |= 0x1 << (mb_x + mb_y * ctb_width_in_mb + 16);
+                        else if(ctb_width_in_mb == 1)
+                            split_coding_unit_flag |= 0x1 << 20;
+                    }
+                    else if (tmp_mb_mode == AVC_INTER_8X8){
                         gen9_hcpe_hevc_fill_indirect_cu_inter(ctx, encode_state, encoder_context, qp, msg, ctb_x, ctb_y, mb_x, mb_y, ctb_width_in_mb, width_in_ctb, num_cu_record, slice_type,cu_index++,0);
                         gen9_hcpe_hevc_fill_indirect_cu_inter(ctx, encode_state, encoder_context, qp, msg, ctb_x, ctb_y, mb_x, mb_y, ctb_width_in_mb, width_in_ctb, num_cu_record, slice_type,cu_index++,1);
                         gen9_hcpe_hevc_fill_indirect_cu_inter(ctx, encode_state, encoder_context, qp, msg, ctb_x, ctb_y, mb_x, mb_y, ctb_width_in_mb, width_in_ctb, num_cu_record, slice_type,cu_index++,2);
-- 
1.9.1



More information about the Libva mailing list