[PATCH] tests/amdgpu: add vce motion vector tests support

Tue Apr 3 19:48:04 UTC 2018

On 2018-04-03 03:14 PM, Leo Liu wrote:
>
>
> On 04/03/2018 03:02 PM, James Zhu wrote:
>> Signed-off-by: James Zhu <James.Zhu at amd.com>
>> ---
>>   tests/amdgpu/Makefile.am    |   1 +
>>   tests/amdgpu/amdgpu_test.c  |  11 +
>>   tests/amdgpu/amdgpu_test.h  |  20 ++
>>   tests/amdgpu/vce_ib.h       |  21 +-
>>   tests/amdgpu/vce_mv_tests.c | 537 
>> ++++++++++++++++++++++++++++++++++++++++++++
>>   5 files changed, 588 insertions(+), 2 deletions(-)
>>   create mode 100644 tests/amdgpu/vce_mv_tests.c
>>
>> diff --git a/tests/amdgpu/Makefile.am b/tests/amdgpu/Makefile.am
>> index e79c1bd..8e5e4c1 100644
>> --- a/tests/amdgpu/Makefile.am
>> +++ b/tests/amdgpu/Makefile.am
>> @@ -26,6 +26,7 @@ amdgpu_test_SOURCES = \
>>       cs_tests.c \
>>       decode_messages.h \
>>       vce_tests.c \
>> +    vce_mv_tests.c \
>>       vce_ib.h \
>>       frame.h \
>>       uvd_enc_tests.c \
>> diff --git a/tests/amdgpu/amdgpu_test.c b/tests/amdgpu/amdgpu_test.c
>> index 96fcd68..08fe94b 100644
>> --- a/tests/amdgpu/amdgpu_test.c
>> +++ b/tests/amdgpu/amdgpu_test.c
>> @@ -52,6 +52,7 @@
>>   #define BO_TESTS_STR "BO Tests"
>>   #define CS_TESTS_STR "CS Tests"
>>   #define VCE_TESTS_STR "VCE Tests"
>> +#define VCE_MV_TESTS_STR "VCE MV Tests"
>>   #define VCN_TESTS_STR "VCN Tests"
>>   #define UVD_ENC_TESTS_STR "UVD ENC Tests"
>>   #define DEADLOCK_TESTS_STR "Deadlock Tests"
>> @@ -93,6 +94,12 @@ static CU_SuiteInfo suites[] = {
>>           .pTests = vce_tests,
>>       },
>>       {
>> +        .pName = VCE_MV_TESTS_STR,
>> +        .pInitFunc = suite_vce_mv_tests_init,
>> +        .pCleanupFunc = suite_vce_mv_tests_clean,
>> +        .pTests = vce_mv_tests,
>> +    },
>> +    {
>>           .pName = VCN_TESTS_STR,
>>           .pInitFunc = suite_vcn_tests_init,
>>           .pCleanupFunc = suite_vcn_tests_clean,
>> @@ -150,6 +157,10 @@ static Suites_Active_Status suites_active_stat[] 
>> = {
>>               .pActive = suite_vce_tests_enable,
>>           },
>>           {
>> +            .pName = VCE_MV_TESTS_STR,
>> +            .pActive = suite_vce_mv_tests_enable,
>> +        },
>> +        {
>>               .pName = VCN_TESTS_STR,
>>               .pActive = suite_vcn_tests_enable,
>>           },
>> diff --git a/tests/amdgpu/amdgpu_test.h b/tests/amdgpu/amdgpu_test.h
>> index 6287573..bf6e7d8 100644
>> --- a/tests/amdgpu/amdgpu_test.h
>> +++ b/tests/amdgpu/amdgpu_test.h
>> @@ -115,6 +115,26 @@ CU_BOOL suite_vce_tests_enable(void);
>>   extern CU_TestInfo vce_tests[];
>>     /**
>> + * Initialize vce test suite
>> + */
>> +int suite_vce_mv_tests_init();
>> +
>> +/**
>> + * Deinitialize vce test suite
>> + */
>> +int suite_vce_mv_tests_clean();
>> +
>> +/**
>> + * Decide if the suite is enabled by default or not.
>> + */
>> +CU_BOOL suite_vce_mv_tests_enable(void);
>> +
>> +/**
>> + * Tests in vce test suite
>> + */
>> +extern CU_TestInfo vce_mv_tests[];
>> +
>> +/**
>>   + * Initialize vcn test suite
>>   + */
>>   int suite_vcn_tests_init();
>> diff --git a/tests/amdgpu/vce_ib.h b/tests/amdgpu/vce_ib.h
>> index 80ab179..cbdcc71 100644
>> --- a/tests/amdgpu/vce_ib.h
>> +++ b/tests/amdgpu/vce_ib.h
>> @@ -41,7 +41,7 @@ static uint32_t vce_taskinfo[8] = {
>>       0x00000000,
>>   };
>>   -static const uint32_t vce_create[] = {
>> +static uint32_t vce_create[] = {
>>       0x00000030,
>>       0x01000001,
>>       0x00000000,
>> @@ -144,7 +144,7 @@ static const uint32_t vce_rdo[] = {
>>       0x00000000,
>>   };
>>   -static const uint32_t vce_pic_ctrl[] = {
>> +static uint32_t vce_pic_ctrl[] = {
>>       0x00000074,
>>       0x04000002,
>>       0x00000000,
>> @@ -315,4 +315,21 @@ static const uint32_t vce_destroy[] = {
>>       0x00000008,
>>       0x02000001,
>>   };
>> +
>> +static const uint32_t vce_mv_buffer[] = {
>> +    0x00000038,
>> +    0x0500000d,
>> +    0x00000000,
>> +    0x00000000,
>> +    0x00000000,
>> +    0x00000000,
>> +    0x00000000,
>> +    0x00000000,
>> +    0x00000000,
>> +    0x00000000,
>> +    0x00000000,
>> +    0x00000000,
>> +    0x00000000,
>> +    0x00000000,
>> +};
>>   #endif /*_vce_ib_h*/
>> diff --git a/tests/amdgpu/vce_mv_tests.c b/tests/amdgpu/vce_mv_tests.c
>> new file mode 100644
>> index 0000000..89affb6
>> --- /dev/null
>> +++ b/tests/amdgpu/vce_mv_tests.c
>> @@ -0,0 +1,537 @@
>> +/*
>> + * Copyright 2018 Advanced Micro Devices, Inc.
>> + *
>> + * Permission is hereby granted, free of charge, to any person 
>> obtaining a
>> + * copy of this software and associated documentation files (the 
>> "Software"),
>> + * to deal in the Software without restriction, including without 
>> limitation
>> + * the rights to use, copy, modify, merge, publish, distribute, 
>> sublicense,
>> + * and/or sell copies of the Software, and to permit persons to whom 
>> the
>> + * Software is furnished to do so, subject to the following conditions:
>> + *
>> + * The above copyright notice and this permission notice shall be 
>> included in
>> + * all copies or substantial portions of the Software.
>> + *
>> + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 
>> EXPRESS OR
>> + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 
>> MERCHANTABILITY,
>> + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO 
>> EVENT SHALL
>> + * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, 
>> DAMAGES OR
>> + * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR 
>> OTHERWISE,
>> + * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE 
>> USE OR
>> + * OTHER DEALINGS IN THE SOFTWARE.
>> + *
>> +*/
>> +
>> +#include <stdio.h>
>> +#include <inttypes.h>
>> +
>> +#include "CUnit/Basic.h"
>> +
>> +#include "util_math.h"
>> +
>> +#include "amdgpu_test.h"
>> +#include "amdgpu_drm.h"
>> +#include "amdgpu_internal.h"
>> +
>> +#include "vce_ib.h"
>> +#include "frame.h"
>> +
>> +#define IB_SIZE        4096
>> +#define MAX_RESOURCES    16
>> +#define FW_53_0_03 ((53 << 24) | (0 << 16) | (03 << 8))
>> +
>> +struct amdgpu_vce_bo {
>> +    amdgpu_bo_handle handle;
>> +    amdgpu_va_handle va_handle;
>> +    uint64_t addr;
>> +    uint64_t size;
>> +    uint8_t *ptr;
>> +};
>> +
>> +struct amdgpu_vce_encode {
>> +    unsigned width;
>> +    unsigned height;
>> +    struct amdgpu_vce_bo vbuf;
>> +    struct amdgpu_vce_bo bs;
>> +    struct amdgpu_vce_bo fb;
>> +    struct amdgpu_vce_bo mvrefbuf;
>> +    struct amdgpu_vce_bo mvb;
>> +    struct amdgpu_vce_bo cpb;
>> +    unsigned mvbuf_size;
>> +    unsigned ib_len;
>> +};
>> +
>> +static amdgpu_device_handle device_handle;
>> +static uint32_t major_version;
>> +static uint32_t minor_version;
>> +static uint32_t family_id;
>> +static uint32_t chip_rev;
>> +static uint32_t chip_id;
>> +static uint32_t ids_flags;
>> +
>> +static amdgpu_context_handle context_handle;
>> +static amdgpu_bo_handle ib_handle;
>> +static amdgpu_va_handle ib_va_handle;
>> +static uint64_t ib_mc_address;
>> +static uint32_t *ib_cpu;
>> +
>> +static struct amdgpu_vce_encode enc;
>> +static amdgpu_bo_handle resources[MAX_RESOURCES];
>> +static unsigned num_resources;
>> +
>> +static void amdgpu_cs_vce_create(void);
>> +static void amdgpu_cs_vce_encode_mv(void);
>> +static void amdgpu_cs_vce_destroy(void);
>> +
>> +CU_TestInfo vce_mv_tests[] = {
>> +    { "VCE create",  amdgpu_cs_vce_create },
>> +    { "VCE mvdump",  amdgpu_cs_vce_encode_mv },
>> +    { "VCE destroy",  amdgpu_cs_vce_destroy },
> Why does it need to have a separated file, and many duplicated stuff 
> from vce_tests.c ?
>
> Regards,
> Leo
>
If we put them together. add one test set: { "VCE MV", 
amdgpu_cs_vce_mv_encode } in current vce test, this test must be execute 
no matter the asic support or not.
No way to bypass. If we always return success if the asic doesn't 
support, it looks weird. If you don't matter this, I can combine them 
together.

Best Regards!
James zhu

>
>> +    CU_TEST_INFO_NULL,
>> +};
>> +
>> +CU_BOOL suite_vce_mv_tests_enable(void)
>> +{
>> +    uint32_t version, feature;
>> +
>> +    if (amdgpu_device_initialize(drm_amdgpu[0], &major_version,
>> +                         &minor_version, &device_handle))
>> +        return CU_FALSE;
>> +
>> +    family_id = device_handle->info.family_id;
>> +    chip_rev = device_handle->info.chip_rev;
>> +    chip_id = device_handle->info.chip_external_rev;
>> +    ids_flags = device_handle->info.ids_flags;
>> +
>> +    amdgpu_query_firmware_version(device_handle, AMDGPU_INFO_FW_VCE, 0,
>> +                      0, &version, &feature);
>> +
>> +    if (amdgpu_device_deinitialize(device_handle))
>> +        return CU_FALSE;
>> +
>> +    if (family_id >= AMDGPU_FAMILY_RV || family_id == 
>> AMDGPU_FAMILY_SI) {
>> +        printf("\n\nThe ASIC family NOT support VCE MV, suite 
>> disabled\n");
>> +        return CU_FALSE;
>> +    }
>> +
>> +    if (!(chip_id == (chip_rev + 0x14) || /* TONGA */
>> +            chip_id == (chip_rev + 0x3C) || /* FIJI */
>> +            chip_id == (chip_rev + 0x50) || /* Polaris 10*/
>> +            chip_id == (chip_rev + 0x5A) || /* Polaris 11*/
>> +            chip_id == (chip_rev + 0x64) || /* Polaris 12*/
>> +            (family_id > AMDGPU_FAMILY_VI && !ids_flags))) /* dGPU > 
>> Polaris */{
>> +        printf("\n\nThe ASIC NOT support VCE MV, suite disabled\n");
>> +        return CU_FALSE;
>> +    }
>> +
>> +    if (FW_53_0_03 >= version){
>> +        printf("\n\nThe ASIC FW version NOT support VCE MV, suite 
>> disabled\n");
>> +        return CU_FALSE;
>> +    }
>> +    return CU_TRUE;
>> +}
>> +
>> +int suite_vce_mv_tests_init(void)
>> +{
>> +    int r;
>> +
>> +    r = amdgpu_device_initialize(drm_amdgpu[0], &major_version,
>> +                     &minor_version, &device_handle);
>> +    if (r) {
>> +        if ((r == -EACCES) && (errno == EACCES))
>> +            printf("\n\nError:%s. "
>> +                "Hint:Try to run this test program as root.",
>> +                strerror(errno));
>> +
>> +        return CUE_SINIT_FAILED;
>> +    }
>> +
>> +    family_id = device_handle->info.family_id;
>> +
>> +    r = amdgpu_cs_ctx_create(device_handle, &context_handle);
>> +    if (r)
>> +        return CUE_SINIT_FAILED;
>> +
>> +    r = amdgpu_bo_alloc_and_map(device_handle, IB_SIZE, 4096,
>> +                    AMDGPU_GEM_DOMAIN_GTT, 0,
>> +                    &ib_handle, (void**)&ib_cpu,
>> +                    &ib_mc_address, &ib_va_handle);
>> +    if (r)
>> +        return CUE_SINIT_FAILED;
>> +
>> +    memset(&enc, 0, sizeof(struct amdgpu_vce_encode));
>> +
>> +    return CUE_SUCCESS;
>> +}
>> +
>> +int suite_vce_mv_tests_clean(void)
>> +{
>> +    int r;
>> +
>> +    r = amdgpu_bo_unmap_and_free(ib_handle, ib_va_handle,
>> +                     ib_mc_address, IB_SIZE);
>> +    if (r)
>> +        return CUE_SCLEAN_FAILED;
>> +
>> +    r = amdgpu_cs_ctx_free(context_handle);
>> +    if (r)
>> +        return CUE_SCLEAN_FAILED;
>> +
>> +    r = amdgpu_device_deinitialize(device_handle);
>> +    if (r)
>> +        return CUE_SCLEAN_FAILED;
>> +
>> +    return CUE_SUCCESS;
>> +}
>> +
>> +static int submit(unsigned ndw, unsigned ip)
>> +{
>> +    struct amdgpu_cs_request ibs_request = {0};
>> +    struct amdgpu_cs_ib_info ib_info = {0};
>> +    struct amdgpu_cs_fence fence_status = {0};
>> +    uint32_t expired;
>> +    int r;
>> +
>> +    ib_info.ib_mc_address = ib_mc_address;
>> +    ib_info.size = ndw;
>> +
>> +    ibs_request.ip_type = ip;
>> +
>> +    r = amdgpu_bo_list_create(device_handle, num_resources, resources,
>> +                  NULL, &ibs_request.resources);
>> +    if (r)
>> +        return r;
>> +
>> +    ibs_request.number_of_ibs = 1;
>> +    ibs_request.ibs = &ib_info;
>> +    ibs_request.fence_info.handle = NULL;
>> +
>> +    r = amdgpu_cs_submit(context_handle, 0, &ibs_request, 1);
>> +    if (r)
>> +        return r;
>> +
>> +    r = amdgpu_bo_list_destroy(ibs_request.resources);
>> +    if (r)
>> +        return r;
>> +
>> +    fence_status.context = context_handle;
>> +    fence_status.ip_type = ip;
>> +    fence_status.fence = ibs_request.seq_no;
>> +
>> +    r = amdgpu_cs_query_fence_status(&fence_status,
>> +                     AMDGPU_TIMEOUT_INFINITE,
>> +                     0, &expired);
>> +    if (r)
>> +        return r;
>> +
>> +    return 0;
>> +}
>> +
>> +static void alloc_resource(struct amdgpu_vce_bo *vce_bo, unsigned 
>> size, unsigned domain)
>> +{
>> +    struct amdgpu_bo_alloc_request req = {0};
>> +    amdgpu_bo_handle buf_handle;
>> +    amdgpu_va_handle va_handle;
>> +    uint64_t va = 0;
>> +    int r;
>> +
>> +    req.alloc_size = ALIGN(size, 4096);
>> +    req.preferred_heap = domain;
>> +    r = amdgpu_bo_alloc(device_handle, &req, &buf_handle);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +    r = amdgpu_va_range_alloc(device_handle,
>> +                  amdgpu_gpu_va_range_general,
>> +                  req.alloc_size, 1, 0, &va,
>> +                  &va_handle, 0);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +    r = amdgpu_bo_va_op(buf_handle, 0, req.alloc_size, va, 0,
>> +                AMDGPU_VA_OP_MAP);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +    vce_bo->addr = va;
>> +    vce_bo->handle = buf_handle;
>> +    vce_bo->size = req.alloc_size;
>> +    vce_bo->va_handle = va_handle;
>> +    r = amdgpu_bo_cpu_map(vce_bo->handle, (void **)&vce_bo->ptr);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +    memset(vce_bo->ptr, 0, size);
>> +    r = amdgpu_bo_cpu_unmap(vce_bo->handle);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +}
>> +
>> +static void free_resource(struct amdgpu_vce_bo *vce_bo)
>> +{
>> +    int r;
>> +
>> +    r = amdgpu_bo_va_op(vce_bo->handle, 0, vce_bo->size,
>> +                vce_bo->addr, 0, AMDGPU_VA_OP_UNMAP);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +
>> +    r = amdgpu_va_range_free(vce_bo->va_handle);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +
>> +    r = amdgpu_bo_free(vce_bo->handle);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +    memset(vce_bo, 0, sizeof(*vce_bo));
>> +}
>> +
>> +static void amdgpu_cs_vce_create(void)
>> +{
>> +    unsigned align = (family_id >= AMDGPU_FAMILY_AI) ? 256 : 16;
>> +    int len, r;
>> +
>> +    vce_create[11] = 0x01000000;   /* disableTwoInstance */
>> +    vce_pic_ctrl[27] = 0x00000001; /* encSliceMode */
>> +
>> +    enc.width = vce_create[6];
>> +    enc.height = vce_create[7];
>> +
>> +    num_resources  = 0;
>> +    alloc_resource(&enc.fb, 4096, AMDGPU_GEM_DOMAIN_GTT);
>> +    resources[num_resources++] = enc.fb.handle;
>> +    resources[num_resources++] = ib_handle;
>> +
>> +    len = 0;
>> +    memcpy(ib_cpu, vce_session, sizeof(vce_session));
>> +    len += sizeof(vce_session) / 4;
>> +    memcpy((ib_cpu + len), vce_taskinfo, sizeof(vce_taskinfo));
>> +    len += sizeof(vce_taskinfo) / 4;
>> +    memcpy((ib_cpu + len), vce_create, sizeof(vce_create));
>> +    ib_cpu[len + 8] = ALIGN(enc.width, align);
>> +    ib_cpu[len + 9] = ALIGN(enc.width, align);
>> +    len += sizeof(vce_create) / 4;
>> +    memcpy((ib_cpu + len), vce_feedback, sizeof(vce_feedback));
>> +    ib_cpu[len + 2] = enc.fb.addr >> 32;
>> +    ib_cpu[len + 3] = enc.fb.addr;
>> +    len += sizeof(vce_feedback) / 4;
>> +
>> +    r = submit(len, AMDGPU_HW_IP_VCE);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +
>> +    free_resource(&enc.fb);
>> +}
>> +
>> +static void amdgpu_cs_vce_config(void)
>> +{
>> +    int len = 0, r;
>> +
>> +    memcpy((ib_cpu + len), vce_session, sizeof(vce_session));
>> +    len += sizeof(vce_session) / 4;
>> +    memcpy((ib_cpu + len), vce_taskinfo, sizeof(vce_taskinfo));
>> +    ib_cpu[len + 3] = 2;
>> +    ib_cpu[len + 6] = 0xffffffff;
>> +    len += sizeof(vce_taskinfo) / 4;
>> +    memcpy((ib_cpu + len), vce_rate_ctrl, sizeof(vce_rate_ctrl));
>> +    len += sizeof(vce_rate_ctrl) / 4;
>> +    memcpy((ib_cpu + len), vce_config_ext, sizeof(vce_config_ext));
>> +    len += sizeof(vce_config_ext) / 4;
>> +    memcpy((ib_cpu + len), vce_motion_est, sizeof(vce_motion_est));
>> +    len += sizeof(vce_motion_est) / 4;
>> +    memcpy((ib_cpu + len), vce_rdo, sizeof(vce_rdo));
>> +    len += sizeof(vce_rdo) / 4;
>> +    memcpy((ib_cpu + len), vce_pic_ctrl, sizeof(vce_pic_ctrl));
>> +    len += sizeof(vce_pic_ctrl) / 4;
>> +
>> +    r = submit(len, AMDGPU_HW_IP_VCE);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +}
>> +
>> +static  void amdgpu_cs_vce_mv(struct amdgpu_vce_encode *enc)
>> +{
>> +    uint64_t luma_offset, chroma_offset;
>> +    uint64_t mv_ref_luma_offset;
>> +    unsigned align = (family_id >= AMDGPU_FAMILY_AI) ? 256 : 16;
>> +    unsigned luma_size = ALIGN(enc->width, align) * 
>> ALIGN(enc->height, 16);
>> +    int len = 0, i, r;
>> +
>> +    luma_offset = enc->vbuf.addr;
>> +    chroma_offset = luma_offset + luma_size;
>> +    mv_ref_luma_offset = enc->mvrefbuf.addr;
>> +
>> +    memcpy((ib_cpu + len), vce_session, sizeof(vce_session));
>> +    len += sizeof(vce_session) / 4;
>> +    memcpy((ib_cpu + len), vce_taskinfo, sizeof(vce_taskinfo));
>> +    len += sizeof(vce_taskinfo) / 4;
>> +    memcpy((ib_cpu + len), vce_bs_buffer, sizeof(vce_bs_buffer));
>> +    ib_cpu[len + 2] = enc->bs.addr >> 32;
>> +    ib_cpu[len + 3] = enc->bs.addr;
>> +    len += sizeof(vce_bs_buffer) / 4;
>> +    memcpy((ib_cpu + len), vce_context_buffer, 
>> sizeof(vce_context_buffer));
>> +    ib_cpu[len + 2] = enc->cpb.addr >> 32;
>> +    ib_cpu[len + 3] = enc->cpb.addr;
>> +    len += sizeof(vce_context_buffer) / 4;
>> +    memcpy((ib_cpu + len), vce_aux_buffer, sizeof(vce_aux_buffer));
>> +    for (i = 0; i <  8; ++i)
>> +        ib_cpu[len + 2 + i] = luma_size * 1.5 * (i + 2);
>> +    for (i = 0; i <  8; ++i)
>> +        ib_cpu[len + 10 + i] = luma_size * 1.5;
>> +    len += sizeof(vce_aux_buffer) / 4;
>> +    memcpy((ib_cpu + len), vce_feedback, sizeof(vce_feedback));
>> +    ib_cpu[len + 2] = enc->fb.addr >> 32;
>> +    ib_cpu[len + 3] = enc->fb.addr;
>> +    len += sizeof(vce_feedback) / 4;
>> +    memcpy((ib_cpu + len), vce_mv_buffer, sizeof(vce_mv_buffer));
>> +    ib_cpu[len + 2] = mv_ref_luma_offset >> 32;
>> +    ib_cpu[len + 3] = mv_ref_luma_offset;
>> +    ib_cpu[len + 4] = ALIGN(enc->width, align);
>> +    ib_cpu[len + 5] = ALIGN(enc->width, align);
>> +    ib_cpu[len + 6] = luma_size;
>> +    ib_cpu[len + 7] = enc->mvb.addr >> 32;
>> +    ib_cpu[len + 8] = enc->mvb.addr;
>> +    len += sizeof(vce_mv_buffer) / 4;
>> +    memcpy((ib_cpu + len), vce_encode, sizeof(vce_encode));
>> +    ib_cpu[len + 2] = 0;
>> +    ib_cpu[len + 3] = 0;
>> +    ib_cpu[len + 4] = 0x154000;
>> +    ib_cpu[len + 9] = luma_offset >> 32;
>> +    ib_cpu[len + 10] = luma_offset;
>> +    ib_cpu[len + 11] = chroma_offset >> 32;
>> +    ib_cpu[len + 12] = chroma_offset;
>> +    ib_cpu[len + 13] = ALIGN(enc->height, 16);;
>> +    ib_cpu[len + 14] = ALIGN(enc->width, align);
>> +    ib_cpu[len + 15] = ALIGN(enc->width, align);
>> +    /* 
>> encDisableMBOffloading-encDisableTwoPipeMode-encInputPicArrayMode-encInputPicAddrMode 
>> */
>> +    ib_cpu[len + 16] = 0x01010000;
>> +    ib_cpu[len + 18] = 0; /* encPicType */
>> +    ib_cpu[len + 19] = 0; /* encIdrFlag */
>> +    ib_cpu[len + 20] = 0; /* encIdrPicId */
>> +    ib_cpu[len + 21] = 0; /* encMGSKeyPic */
>> +    ib_cpu[len + 22] = 0; /* encReferenceFlag */
>> +    ib_cpu[len + 23] = 0; /* encTemporalLayerIndex */
>> +    ib_cpu[len + 55] = 0; /* pictureStructure */
>> +    ib_cpu[len + 56] = 0; /* encPicType -ref[0] */
>> +    ib_cpu[len + 61] = 0; /* pictureStructure */
>> +    ib_cpu[len + 62] = 0; /* encPicType -ref[1] */
>> +    ib_cpu[len + 67] = 0; /* pictureStructure */
>> +    ib_cpu[len + 68] = 0; /* encPicType -ref1 */
>> +    ib_cpu[len + 81] = 1; /* frameNumber */
>> +    ib_cpu[len + 82] = 2; /* pictureOrderCount */
>> +    ib_cpu[len + 83] = 0xffffffff; /* numIPicRemainInRCGOP */
>> +    ib_cpu[len + 84] = 0xffffffff; /* numPPicRemainInRCGOP */
>> +    ib_cpu[len + 85] = 0xffffffff; /* numBPicRemainInRCGOP */
>> +    ib_cpu[len + 86] = 0xffffffff; /* numIRPicRemainInRCGOP */
>> +    ib_cpu[len + 87] = 0; /* remainedIntraRefreshPictures */
>> +    len += sizeof(vce_encode) / 4;
>> +
>> +    enc->ib_len = len;
>> +    r = submit(len, AMDGPU_HW_IP_VCE);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +}
>> +
>> +static void check_mv_result(struct amdgpu_vce_encode *enc)
>> +{
>> +    uint64_t sum;
>> +    uint32_t s = 140790;
>> +    uint32_t *ptr, size;
>> +    int i, j, r;
>> +
>> +    r = amdgpu_bo_cpu_map(enc->fb.handle, (void **)&enc->fb.ptr);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +    ptr = (uint32_t *)enc->fb.ptr;
>> +    r = amdgpu_bo_cpu_unmap(enc->fb.handle);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +    r = amdgpu_bo_cpu_map(enc->mvb.handle, (void **)&enc->mvb.ptr);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +    for (j = 0, sum = 0; j < enc->mvbuf_size; ++j)
>> +        sum += enc->mvb.ptr[j];
>> +    CU_ASSERT_EQUAL(sum, s);
>> +    r = amdgpu_bo_cpu_unmap(enc->mvb.handle);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +}
>> +
>> +static void amdgpu_cs_vce_encode_mv(void)
>> +{
>> +    uint32_t vbuf_size, bs_size = 0x154000, cpb_size;
>> +    unsigned align = (family_id >= AMDGPU_FAMILY_AI) ? 256 : 16;
>> +    int i, r;
>> +
>> +    vbuf_size = ALIGN(enc.width, align) * ALIGN(enc.height, 16) * 1.5;
>> +    enc.mvbuf_size = ALIGN(enc.width, 16) * ALIGN(enc.height, 16) / 8;
>> +    cpb_size = vbuf_size * 10;
>> +    num_resources = 0;
>> +    alloc_resource(&enc.fb, 4096, AMDGPU_GEM_DOMAIN_GTT);
>> +    resources[num_resources++] = enc.fb.handle;
>> +    alloc_resource(&enc.bs, bs_size, AMDGPU_GEM_DOMAIN_GTT);
>> +    resources[num_resources++] = enc.bs.handle;
>> +    alloc_resource(&enc.mvb, enc.mvbuf_size, AMDGPU_GEM_DOMAIN_GTT);
>> +    resources[num_resources++] = enc.mvb.handle;
>> +    alloc_resource(&enc.vbuf, vbuf_size, AMDGPU_GEM_DOMAIN_VRAM);
>> +    resources[num_resources++] = enc.vbuf.handle;
>> +    alloc_resource(&enc.mvrefbuf, vbuf_size, AMDGPU_GEM_DOMAIN_VRAM);
>> +    resources[num_resources++] = enc.mvrefbuf.handle;
>> +    alloc_resource(&enc.cpb, cpb_size, AMDGPU_GEM_DOMAIN_VRAM);
>> +    resources[num_resources++] = enc.cpb.handle;
>> +    resources[num_resources++] = ib_handle;
>> +
>> +    r = amdgpu_bo_cpu_map(enc.vbuf.handle, (void **)&enc.vbuf.ptr);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +
>> +    memset(enc.vbuf.ptr, 0, vbuf_size);
>> +    for (i = 0; i < enc.height; ++i) {
>> +        memcpy(enc.vbuf.ptr, (frame + i * enc.width), enc.width);
>> +        enc.vbuf.ptr += ALIGN(enc.width, align);
>> +    }
>> +    for (i = 0; i < enc.height / 2; ++i) {
>> +        memcpy(enc.vbuf.ptr, ((frame + enc.height * enc.width) + i * 
>> enc.width), enc.width);
>> +        enc.vbuf.ptr += ALIGN(enc.width, align);
>> +    }
>> +
>> +    r = amdgpu_bo_cpu_unmap(enc.vbuf.handle);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +
>> +    r = amdgpu_bo_cpu_map(enc.mvrefbuf.handle, (void 
>> **)&enc.mvrefbuf.ptr);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +
>> +    memset(enc.mvrefbuf.ptr, 0, vbuf_size);
>> +    for (i = 0; i < enc.height; ++i) {
>> +        memcpy(enc.mvrefbuf.ptr, (frame + (enc.height - i -1) * 
>> enc.width), enc.width);
>> +        enc.mvrefbuf.ptr += ALIGN(enc.width, align);
>> +    }
>> +    for (i = 0; i < enc.height / 2; ++i) {
>> +        memcpy(enc.mvrefbuf.ptr,
>> +        ((frame + enc.height * enc.width) + (enc.height / 2 - i -1) 
>> * enc.width), enc.width);
>> +        enc.mvrefbuf.ptr += ALIGN(enc.width, align);
>> +    }
>> +
>> +    r = amdgpu_bo_cpu_unmap(enc.mvrefbuf.handle);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +
>> +    amdgpu_cs_vce_config();
>> +
>> +    vce_taskinfo[3] = 3;
>> +    amdgpu_cs_vce_mv(&enc);
>> +    check_mv_result(&enc);
>> +
>> +    free_resource(&enc.fb);
>> +    free_resource(&enc.bs);
>> +    free_resource(&enc.vbuf);
>> +    free_resource(&enc.cpb);
>> +    free_resource(&enc.mvrefbuf);
>> +    free_resource(&enc.mvb);
>> +}
>> +
>> +static void amdgpu_cs_vce_destroy(void)
>> +{
>> +    int len, r;
>> +
>> +    num_resources  = 0;
>> +    alloc_resource(&enc.fb, 4096, AMDGPU_GEM_DOMAIN_GTT);
>> +    resources[num_resources++] = enc.fb.handle;
>> +    resources[num_resources++] = ib_handle;
>> +
>> +    len = 0;
>> +    memcpy(ib_cpu, vce_session, sizeof(vce_session));
>> +    len += sizeof(vce_session) / 4;
>> +    memcpy((ib_cpu + len), vce_taskinfo, sizeof(vce_taskinfo));
>> +    ib_cpu[len + 3] = 1;
>> +    len += sizeof(vce_taskinfo) / 4;
>> +    memcpy((ib_cpu + len), vce_feedback, sizeof(vce_feedback));
>> +    ib_cpu[len + 2] = enc.fb.addr >> 32;
>> +    ib_cpu[len + 3] = enc.fb.addr;
>> +    len += sizeof(vce_feedback) / 4;
>> +    memcpy((ib_cpu + len), vce_destroy, sizeof(vce_destroy));
>> +    len += sizeof(vce_destroy) / 4;
>> +
>> +    r = submit(len, AMDGPU_HW_IP_VCE);
>> +    CU_ASSERT_EQUAL(r, 0);
>> +
>> +    free_resource(&enc.fb);
>> +}
>