[PATCH 2/3] drm/amdgpu/vcn3: replace ip based software ring decode with common vcn software ring decode
Christian König
ckoenig.leichtzumerken at gmail.com
Wed May 4 13:50:29 UTC 2022
Am 04.05.22 um 15:23 schrieb James Zhu:
> Replace ip based software ring decode with common vcn software ring decode.
>
> Signed-off-by: James Zhu <James.Zhu at amd.com>
> ---
> drivers/gpu/drm/amd/amdgpu/vcn_v3_0.c | 82 ++++-----------------------
> drivers/gpu/drm/amd/amdgpu/vcn_v3_0.h | 12 ----
> 2 files changed, 11 insertions(+), 83 deletions(-)
>
> diff --git a/drivers/gpu/drm/amd/amdgpu/vcn_v3_0.c b/drivers/gpu/drm/amd/amdgpu/vcn_v3_0.c
> index c7280ca5e836..f761c569fcc6 100644
> --- a/drivers/gpu/drm/amd/amdgpu/vcn_v3_0.c
> +++ b/drivers/gpu/drm/amd/amdgpu/vcn_v3_0.c
> @@ -30,6 +30,7 @@
> #include "soc15d.h"
> #include "vcn_v2_0.h"
> #include "mmsch_v3_0.h"
> +#include "vcn_sw_ring.h"
>
> #include "vcn/vcn_3_0_0_offset.h"
> #include "vcn/vcn_3_0_0_sh_mask.h"
> @@ -1731,67 +1732,6 @@ static void vcn_v3_0_dec_ring_set_wptr(struct amdgpu_ring *ring)
> }
> }
>
> -void vcn_v3_0_dec_sw_ring_emit_fence(struct amdgpu_ring *ring, u64 addr,
> - u64 seq, uint32_t flags)
> -{
> - WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
> -
> - amdgpu_ring_write(ring, VCN_DEC_SW_CMD_FENCE);
> - amdgpu_ring_write(ring, addr);
> - amdgpu_ring_write(ring, upper_32_bits(addr));
> - amdgpu_ring_write(ring, seq);
> - amdgpu_ring_write(ring, VCN_DEC_SW_CMD_TRAP);
> -}
> -
> -void vcn_v3_0_dec_sw_ring_insert_end(struct amdgpu_ring *ring)
> -{
> - amdgpu_ring_write(ring, VCN_DEC_SW_CMD_END);
> -}
> -
> -void vcn_v3_0_dec_sw_ring_emit_ib(struct amdgpu_ring *ring, struct amdgpu_job *job,
> - struct amdgpu_ib *ib, uint32_t flags)
> -{
> - uint32_t vmid = AMDGPU_JOB_GET_VMID(job);
> -
> - amdgpu_ring_write(ring, VCN_DEC_SW_CMD_IB);
> - amdgpu_ring_write(ring, vmid);
> - amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
> - amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
> - amdgpu_ring_write(ring, ib->length_dw);
> -}
> -
> -void vcn_v3_0_dec_sw_ring_emit_reg_wait(struct amdgpu_ring *ring, uint32_t reg,
> - uint32_t val, uint32_t mask)
> -{
> - amdgpu_ring_write(ring, VCN_DEC_SW_CMD_REG_WAIT);
> - amdgpu_ring_write(ring, reg << 2);
> - amdgpu_ring_write(ring, mask);
> - amdgpu_ring_write(ring, val);
> -}
> -
> -void vcn_v3_0_dec_sw_ring_emit_vm_flush(struct amdgpu_ring *ring,
> - uint32_t vmid, uint64_t pd_addr)
> -{
> - struct amdgpu_vmhub *hub = &ring->adev->vmhub[ring->funcs->vmhub];
> - uint32_t data0, data1, mask;
> -
> - pd_addr = amdgpu_gmc_emit_flush_gpu_tlb(ring, vmid, pd_addr);
> -
> - /* wait for register write */
> - data0 = hub->ctx0_ptb_addr_lo32 + vmid * hub->ctx_addr_distance;
> - data1 = lower_32_bits(pd_addr);
> - mask = 0xffffffff;
> - vcn_v3_0_dec_sw_ring_emit_reg_wait(ring, data0, data1, mask);
> -}
> -
> -void vcn_v3_0_dec_sw_ring_emit_wreg(struct amdgpu_ring *ring, uint32_t reg,
> - uint32_t val)
> -{
> - amdgpu_ring_write(ring, VCN_DEC_SW_CMD_REG_WRITE);
> - amdgpu_ring_write(ring, reg << 2);
> - amdgpu_ring_write(ring, val);
> -}
> -
> static const struct amdgpu_ring_funcs vcn_v3_0_dec_sw_ring_vm_funcs = {
> .type = AMDGPU_RING_TYPE_VCN_DEC,
> .align_mask = 0x3f,
> @@ -1804,22 +1744,22 @@ static const struct amdgpu_ring_funcs vcn_v3_0_dec_sw_ring_vm_funcs = {
> .emit_frame_size =
> SOC15_FLUSH_GPU_TLB_NUM_WREG * 3 +
> SOC15_FLUSH_GPU_TLB_NUM_REG_WAIT * 4 +
> - 4 + /* vcn_v3_0_dec_sw_ring_emit_vm_flush */
> - 5 + 5 + /* vcn_v3_0_dec_sw_ring_emit_fdec_swe x2 vm fdec_swe */
> - 1, /* vcn_v3_0_dec_sw_ring_insert_end */
> - .emit_ib_size = 5, /* vcn_v3_0_dec_sw_ring_emit_ib */
> - .emit_ib = vcn_v3_0_dec_sw_ring_emit_ib,
> - .emit_fence = vcn_v3_0_dec_sw_ring_emit_fence,
> - .emit_vm_flush = vcn_v3_0_dec_sw_ring_emit_vm_flush,
> + 4 + /* vcn_dec_sw_ring_emit_vm_flush */
> + 5 + 5 + /* vcn_dec_sw_ring_emit_fdec_swe x2 vm fdec_swe */
> + 1, /* vcn_dec_sw_ring_insert_end */
Maybe add that calculation as define to vcn_sw_ring.h.
Apart from that looks really good to me.
Regards,
Christian.
> + .emit_ib_size = 5, /* vcn_dec_sw_ring_emit_ib */
> + .emit_ib = vcn_dec_sw_ring_emit_ib,
> + .emit_fence = vcn_dec_sw_ring_emit_fence,
> + .emit_vm_flush = vcn_dec_sw_ring_emit_vm_flush,
> .test_ring = amdgpu_vcn_dec_sw_ring_test_ring,
> .test_ib = NULL,//amdgpu_vcn_dec_sw_ring_test_ib,
> .insert_nop = amdgpu_ring_insert_nop,
> - .insert_end = vcn_v3_0_dec_sw_ring_insert_end,
> + .insert_end = vcn_dec_sw_ring_insert_end,
> .pad_ib = amdgpu_ring_generic_pad_ib,
> .begin_use = amdgpu_vcn_ring_begin_use,
> .end_use = amdgpu_vcn_ring_end_use,
> - .emit_wreg = vcn_v3_0_dec_sw_ring_emit_wreg,
> - .emit_reg_wait = vcn_v3_0_dec_sw_ring_emit_reg_wait,
> + .emit_wreg = vcn_dec_sw_ring_emit_wreg,
> + .emit_reg_wait = vcn_dec_sw_ring_emit_reg_wait,
> .emit_reg_write_reg_wait = amdgpu_ring_emit_reg_write_reg_wait_helper,
> };
>
> diff --git a/drivers/gpu/drm/amd/amdgpu/vcn_v3_0.h b/drivers/gpu/drm/amd/amdgpu/vcn_v3_0.h
> index 7a6655d3b79d..31683582d778 100644
> --- a/drivers/gpu/drm/amd/amdgpu/vcn_v3_0.h
> +++ b/drivers/gpu/drm/amd/amdgpu/vcn_v3_0.h
> @@ -26,16 +26,4 @@
>
> extern const struct amdgpu_ip_block_version vcn_v3_0_ip_block;
>
> -void vcn_v3_0_dec_sw_ring_emit_fence(struct amdgpu_ring *ring, u64 addr,
> - u64 seq, uint32_t flags);
> -void vcn_v3_0_dec_sw_ring_insert_end(struct amdgpu_ring *ring);
> -void vcn_v3_0_dec_sw_ring_emit_ib(struct amdgpu_ring *ring, struct amdgpu_job *job,
> - struct amdgpu_ib *ib, uint32_t flags);
> -void vcn_v3_0_dec_sw_ring_emit_reg_wait(struct amdgpu_ring *ring, uint32_t reg,
> - uint32_t val, uint32_t mask);
> -void vcn_v3_0_dec_sw_ring_emit_vm_flush(struct amdgpu_ring *ring,
> - uint32_t vmid, uint64_t pd_addr);
> -void vcn_v3_0_dec_sw_ring_emit_wreg(struct amdgpu_ring *ring, uint32_t reg,
> - uint32_t val);
> -
> #endif /* __VCN_V3_0_H__ */
More information about the amd-gfx
mailing list