[PATCH 9/9] drm/amdgpu: enable userqueue secure semaphore for GFX 12

Alex Deucher alexdeucher at gmail.com
Thu Nov 21 20:22:37 UTC 2024


On Thu, Nov 21, 2024 at 8:33 AM Shashank Sharma <shashank.sharma at amd.com> wrote:
>
> From: Arunpravin Paneer Selvam <Arunpravin.PaneerSelvam at amd.com>
>
> - Add a field in struct amdgpu_mqd_prop for userqueue
>   secure sem fence address since now we have a generic
>   file for mes_userqueue.c
> - Add secure sem fence address mqd support to gfx12 into
>   their corresponding init functions.
> - Enable secure semaphore IRQ handling
>
> Signed-off-by: Arunpravin Paneer Selvam <Arunpravin.PaneerSelvam at amd.com>
> Signed-off-by: Somalapuram Amaranath <Amaranath.Somalapuram at amd.com>
> Signed-off-by: Shashank Sharma <shashank.sharma at amd.com>
> ---
>  drivers/gpu/drm/amd/amdgpu/amdgpu.h        |  1 +
>  drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c     |  2 ++
>  drivers/gpu/drm/amd/amdgpu/gfx_v12_0.c     | 27 +++++++++++-----------
>  drivers/gpu/drm/amd/amdgpu/mes_userqueue.c | 11 +--------
>  drivers/gpu/drm/amd/include/v12_structs.h  |  4 ++--
>  5 files changed, 20 insertions(+), 25 deletions(-)
>
> diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu.h b/drivers/gpu/drm/amd/amdgpu/amdgpu.h
> index 2c889cc2a59e..9c4df966fa8a 100644
> --- a/drivers/gpu/drm/amd/amdgpu/amdgpu.h
> +++ b/drivers/gpu/drm/amd/amdgpu/amdgpu.h
> @@ -829,6 +829,7 @@ struct amdgpu_mqd_prop {
>         uint64_t shadow_addr;
>         uint64_t gds_bkup_addr;
>         uint64_t csa_addr;
> +       uint64_t fenceaddress;

I'd prefer fence_address here for readability.  With that and the
other comments on the earlier patches addressed, the series is:
Reviewed-by: Alex Deucher <alexander.deucher at amd.com>


>  };
>
>  struct amdgpu_mqd {
> diff --git a/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c b/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c
> index 0e5732795891..fc2e82eb0d64 100644
> --- a/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c
> +++ b/drivers/gpu/drm/amd/amdgpu/gfx_v11_0.c
> @@ -4058,6 +4058,8 @@ static int gfx_v11_0_gfx_mqd_init(struct amdgpu_device *adev, void *m,
>         mqd->gds_bkup_base_hi = upper_32_bits(prop->gds_bkup_addr);
>         mqd->fw_work_area_base_lo = prop->csa_addr & 0xFFFFFFFC;
>         mqd->fw_work_area_base_hi = upper_32_bits(prop->csa_addr);
> +       mqd->fenceaddress_lo = lower_32_bits(prop->fenceaddress);
> +       mqd->fenceaddress_hi = upper_32_bits(prop->fenceaddress);
>
>         return 0;
>  }
> diff --git a/drivers/gpu/drm/amd/amdgpu/gfx_v12_0.c b/drivers/gpu/drm/amd/amdgpu/gfx_v12_0.c
> index b151a75cf88c..ff74f7d389e9 100644
> --- a/drivers/gpu/drm/amd/amdgpu/gfx_v12_0.c
> +++ b/drivers/gpu/drm/amd/amdgpu/gfx_v12_0.c
> @@ -47,6 +47,7 @@
>  #include "nbif_v6_3_1.h"
>  #include "mes_v12_0.h"
>  #include "mes_userqueue.h"
> +#include "amdgpu_userq_fence.h"
>
>  #define GFX12_NUM_GFX_RINGS    1
>  #define GFX12_MEC_HPD_SIZE     2048
> @@ -2972,6 +2973,8 @@ static int gfx_v12_0_gfx_mqd_init(struct amdgpu_device *adev, void *m,
>         mqd->shadow_base_hi = upper_32_bits(prop->shadow_addr);
>         mqd->fw_work_area_base_lo = prop->csa_addr & 0xFFFFFFFC;
>         mqd->fw_work_area_base_hi = upper_32_bits(prop->csa_addr);
> +       mqd->fenceaddress_lo = lower_32_bits(prop->fenceaddress);
> +       mqd->fenceaddress_hi = upper_32_bits(prop->fenceaddress);
>
>         return 0;
>  }
> @@ -4817,25 +4820,23 @@ static int gfx_v12_0_eop_irq(struct amdgpu_device *adev,
>                              struct amdgpu_irq_src *source,
>                              struct amdgpu_iv_entry *entry)
>  {
> -       int i;
> +       u32 doorbell_offset = entry->src_data[0];
>         u8 me_id, pipe_id, queue_id;
>         struct amdgpu_ring *ring;
> -       uint32_t mes_queue_id = entry->src_data[0];
> +       int i;
>
>         DRM_DEBUG("IH: CP EOP\n");
>
> -       if (adev->enable_mes && (mes_queue_id & AMDGPU_FENCE_MES_QUEUE_FLAG)) {
> -               struct amdgpu_mes_queue *queue;
> +       if (adev->enable_mes && doorbell_offset) {
> +               struct amdgpu_userq_fence_driver *fence_drv = NULL;
> +               struct xarray *xa = &adev->userq_xa;
> +               unsigned long flags;
>
> -               mes_queue_id &= AMDGPU_FENCE_MES_QUEUE_ID_MASK;
> -
> -               spin_lock(&adev->mes.queue_id_lock);
> -               queue = idr_find(&adev->mes.queue_id_idr, mes_queue_id);
> -               if (queue) {
> -                       DRM_DEBUG("process mes queue id = %d\n", mes_queue_id);
> -                       amdgpu_fence_process(queue->ring);
> -               }
> -               spin_unlock(&adev->mes.queue_id_lock);
> +               xa_lock_irqsave(xa, flags);
> +               fence_drv = xa_load(xa, doorbell_offset);
> +               if (fence_drv)
> +                       amdgpu_userq_fence_driver_process(fence_drv);
> +               xa_unlock_irqrestore(xa, flags);
>         } else {
>                 me_id = (entry->ring_id & 0x0c) >> 2;
>                 pipe_id = (entry->ring_id & 0x03) >> 0;
> diff --git a/drivers/gpu/drm/amd/amdgpu/mes_userqueue.c b/drivers/gpu/drm/amd/amdgpu/mes_userqueue.c
> index fe50c85fb2ff..93eb26f072df 100644
> --- a/drivers/gpu/drm/amd/amdgpu/mes_userqueue.c
> +++ b/drivers/gpu/drm/amd/amdgpu/mes_userqueue.c
> @@ -183,14 +183,6 @@ static int mes_userq_create_ctx_space(struct amdgpu_userq_mgr *uq_mgr,
>         return 0;
>  }
>
> -static void mes_userq_set_fence_space(struct amdgpu_usermode_queue *queue)
> -{
> -       struct v11_gfx_mqd *mqd = queue->mqd.cpu_ptr;
> -
> -       mqd->fenceaddress_lo = lower_32_bits(queue->fence_drv->gpu_addr);
> -       mqd->fenceaddress_hi = upper_32_bits(queue->fence_drv->gpu_addr);
> -}
> -
>  static int mes_userq_mqd_create(struct amdgpu_userq_mgr *uq_mgr,
>                                 struct drm_amdgpu_userq_in *args_in,
>                                 struct amdgpu_usermode_queue *queue)
> @@ -229,6 +221,7 @@ static int mes_userq_mqd_create(struct amdgpu_userq_mgr *uq_mgr,
>         userq_props->mqd_gpu_addr = queue->mqd.gpu_addr;
>         userq_props->use_doorbell = true;
>         userq_props->doorbell_index = queue->doorbell_index;
> +       userq_props->fenceaddress = queue->fence_drv->gpu_addr;
>
>         if (queue->queue_type == AMDGPU_HW_IP_COMPUTE) {
>                 struct drm_amdgpu_userq_mqd_compute_gfx11 *compute_mqd;
> @@ -305,8 +298,6 @@ static int mes_userq_mqd_create(struct amdgpu_userq_mgr *uq_mgr,
>                 goto free_mqd;
>         }
>
> -       mes_userq_set_fence_space(queue);
> -
>         /* FW expects WPTR BOs to be mapped into GART */
>         r = mes_userq_create_wptr_mapping(uq_mgr, queue, userq_props->wptr_gpu_addr);
>         if (r) {
> diff --git a/drivers/gpu/drm/amd/include/v12_structs.h b/drivers/gpu/drm/amd/include/v12_structs.h
> index 5eabab611b02..bbb6ebdc6238 100644
> --- a/drivers/gpu/drm/amd/include/v12_structs.h
> +++ b/drivers/gpu/drm/amd/include/v12_structs.h
> @@ -535,8 +535,8 @@ struct v12_gfx_mqd {
>      uint32_t reserved_507; // offset: 507  (0x1FB)
>      uint32_t reserved_508; // offset: 508  (0x1FC)
>      uint32_t reserved_509; // offset: 509  (0x1FD)
> -    uint32_t reserved_510; // offset: 510  (0x1FE)
> -    uint32_t reserved_511; // offset: 511  (0x1FF)
> +    uint32_t fenceaddress_lo; // offset: 510  (0x1FE)
> +    uint32_t fenceaddress_hi; // offset: 511  (0x1FF)
>  };
>
>  struct v12_sdma_mqd {
> --
> 2.46.2
>


More information about the amd-gfx mailing list