[PATCH v3 1/9] drm/amdgpu: UAPI for user queue management
Shashank Sharma
shashank.sharma at amd.com
Thu Mar 30 06:13:11 UTC 2023
On 29/03/2023 21:46, Alex Deucher wrote:
> On Wed, Mar 29, 2023 at 3:21 PM Shashank Sharma <shashank.sharma at amd.com> wrote:
>> Hey Alex,
>>
>> On 29/03/2023 19:57, Alex Deucher wrote:
>>> On Wed, Mar 29, 2023 at 12:05 PM Shashank Sharma
>>> <shashank.sharma at amd.com> wrote:
>>>> From: Alex Deucher <alexander.deucher at amd.com>
>>>>
>>>> This patch introduces a new UAPI/IOCTL for usermode graphics
>>>> queue. The userspace app will fill this structure and request
>>>> the graphics driver to add a graphics work queue for it. The
>>>> output of this UAPI is a queue id.
>>>>
>>>> This UAPI maps the queue into the GPU, so the graphics app can start
>>>> submitting work to the queue as soon as the call returns.
>>>>
>>>> V2: Addressed review comments from Alex and Christian
>>>> - Make the doorbell offset's comment clearer
>>>> - Change the output parameter name to queue_id
>>>> V3: Integration with doorbell manager
>>>>
>>>> Cc: Alex Deucher <alexander.deucher at amd.com>
>>>> Cc: Christian Koenig <christian.koenig at amd.com>
>>>> Signed-off-by: Alex Deucher <alexander.deucher at amd.com>
>>>> Signed-off-by: Shashank Sharma <shashank.sharma at amd.com>
>>>> ---
>>>> include/uapi/drm/amdgpu_drm.h | 55 +++++++++++++++++++++++++++++++++++
>>>> 1 file changed, 55 insertions(+)
>>>>
>>>> diff --git a/include/uapi/drm/amdgpu_drm.h b/include/uapi/drm/amdgpu_drm.h
>>>> index cc5d551abda5..e4943099b9d2 100644
>>>> --- a/include/uapi/drm/amdgpu_drm.h
>>>> +++ b/include/uapi/drm/amdgpu_drm.h
>>>> @@ -54,6 +54,7 @@ extern "C" {
>>>> #define DRM_AMDGPU_VM 0x13
>>>> #define DRM_AMDGPU_FENCE_TO_HANDLE 0x14
>>>> #define DRM_AMDGPU_SCHED 0x15
>>>> +#define DRM_AMDGPU_USERQ 0x16
>>>>
>>>> #define DRM_IOCTL_AMDGPU_GEM_CREATE DRM_IOWR(DRM_COMMAND_BASE + DRM_AMDGPU_GEM_CREATE, union drm_amdgpu_gem_create)
>>>> #define DRM_IOCTL_AMDGPU_GEM_MMAP DRM_IOWR(DRM_COMMAND_BASE + DRM_AMDGPU_GEM_MMAP, union drm_amdgpu_gem_mmap)
>>>> @@ -71,6 +72,7 @@ extern "C" {
>>>> #define DRM_IOCTL_AMDGPU_VM DRM_IOWR(DRM_COMMAND_BASE + DRM_AMDGPU_VM, union drm_amdgpu_vm)
>>>> #define DRM_IOCTL_AMDGPU_FENCE_TO_HANDLE DRM_IOWR(DRM_COMMAND_BASE + DRM_AMDGPU_FENCE_TO_HANDLE, union drm_amdgpu_fence_to_handle)
>>>> #define DRM_IOCTL_AMDGPU_SCHED DRM_IOW(DRM_COMMAND_BASE + DRM_AMDGPU_SCHED, union drm_amdgpu_sched)
>>>> +#define DRM_IOCTL_AMDGPU_USERQ DRM_IOW(DRM_COMMAND_BASE + DRM_AMDGPU_USERQ, union drm_amdgpu_userq)
>>>>
>>>> /**
>>>> * DOC: memory domains
>>>> @@ -307,6 +309,59 @@ union drm_amdgpu_ctx {
>>>> union drm_amdgpu_ctx_out out;
>>>> };
>>>>
>>>> +/* user queue IOCTL */
>>>> +#define AMDGPU_USERQ_OP_CREATE 1
>>>> +#define AMDGPU_USERQ_OP_FREE 2
>>>> +
>>>> +#define AMDGPU_USERQ_MQD_FLAGS_SECURE (1 << 0)
>>>> +#define AMDGPU_USERQ_MQD_FLAGS_AQL (1 << 1)
>>>> +
>>>> +struct drm_amdgpu_userq_mqd {
>>>> + /** Flags: AMDGPU_USERQ_MQD_FLAGS_* */
>>>> + __u32 flags;
>>>> + /** IP type: AMDGPU_HW_IP_* */
>>>> + __u32 ip_type;
>>>> + /** GEM object handle */
>>>> + __u32 doorbell_handle;
>>>> + /** Doorbell's offset in the doorbell bo */
>>>> + __u32 doorbell_offset;
>>>> + /** GPU virtual address of the queue */
>>>> + __u64 queue_va;
>>>> + /** Size of the queue in bytes */
>>>> + __u64 queue_size;
>>>> + /** GPU virtual address of the rptr */
>>>> + __u64 rptr_va;
>>>> + /** GPU virtual address of the wptr */
>>>> + __u64 wptr_va;
>>>> + /** GPU virtual address of the shadow context space */
>>>> + __u64 shadow_va;
>>>> +};
>>> We may want to make the MQD engine specific. E.g., shadow is gfx
>>> specific. We also probably need the csa and gds buffers for gfx as
>>> well. Other engines may have their own additional buffer
>>> requirements.
>>>
>>> Alex
>> Sure, we can call it drm_amdgpu_userq_mqd_gfx to clarify that this MQD
>> is specific to the GFX engine.
> We can make it a union and then add additional entries for SDMA,
> compute, and VCN. We should also move the IP type into struct
> drm_amdgpu_userq_in so we know how to interpret the union.
I was thinking of doing exactly this :), it would be a small change.
Please have a look at the rest of the series as well, considering this done.
- Shashank
> Or make it
> a u64 and handle it similarly to the chunks interface in
> drm_amdgpu_cs_chunk.
> Alex
>
>> - Shashank
>>
>>>
>>>> +
>>>> +struct drm_amdgpu_userq_in {
>>>> + /** AMDGPU_USERQ_OP_* */
>>>> + __u32 op;
>>>> + /** Flags */
>>>> + __u32 flags;
>>>> + /** Queue handle to associate the queue free call with,
>>>> + * unused for queue create calls */
>>>> + __u32 queue_id;
>>>> + __u32 pad;
>>>> + /** Queue descriptor */
>>>> + struct drm_amdgpu_userq_mqd mqd;
>>>> +};
>>>> +
>>>> +struct drm_amdgpu_userq_out {
>>>> + /** Queue handle */
>>>> + __u32 queue_id;
>>>> + /** Flags */
>>>> + __u32 flags;
>>>> +};
>>>> +
>>>> +union drm_amdgpu_userq {
>>>> + struct drm_amdgpu_userq_in in;
>>>> + struct drm_amdgpu_userq_out out;
>>>> +};
>>>> +
>>>> /* vm ioctl */
>>>> #define AMDGPU_VM_OP_RESERVE_VMID 1
>>>> #define AMDGPU_VM_OP_UNRESERVE_VMID 2
>>>> --
>>>> 2.40.0
>>>>
More information about the amd-gfx
mailing list