[PATCH v2 07/12] drm/xe/pxp: Add support for PXP-using queues

Daniele Ceraolo Spurio daniele.ceraolospurio at intel.com
Thu Nov 7 23:57:11 UTC 2024




On 10/8/2024 4:55 PM, John Harrison wrote:
> On 8/16/2024 12:00, Daniele Ceraolo Spurio wrote:
>> Userspace is required to mark a queue as using PXP to guarantee that the
>> PXP instructions will work. When a PXP queue is created, the driver will
>> do the following:
>> - Start the default PXP session if it is not already running;
>> - set the relevant bits in the context control register;
>> - assign an rpm ref to the queue to keep for its lifetime (this is
>>    required because PXP HWDRM sessions are killed by the HW suspend 
>> flow).
>>
>> When a PXP invalidation occurs, all the PXP queue will be killed.
> "all the PXP queue" -> should be 'queues' or should not say 'all'?
>
>> On submission of a valid PXP queue, the driver will validate all
>> encrypted objects mapped to the VM to ensure they were encrypted with
>> the current key.
>>
>> Signed-off-by: Daniele Ceraolo Spurio <daniele.ceraolospurio at intel.com>
>> ---
>>   drivers/gpu/drm/xe/regs/xe_engine_regs.h |   1 +
>>   drivers/gpu/drm/xe/xe_exec_queue.c       |  58 ++++-
>>   drivers/gpu/drm/xe/xe_exec_queue.h       |   5 +
>>   drivers/gpu/drm/xe/xe_exec_queue_types.h |   8 +
>>   drivers/gpu/drm/xe/xe_hw_engine.c        |   2 +-
>>   drivers/gpu/drm/xe/xe_lrc.c              |  16 +-
>>   drivers/gpu/drm/xe/xe_lrc.h              |   4 +-
>>   drivers/gpu/drm/xe/xe_pxp.c              | 295 ++++++++++++++++++++++-
>>   drivers/gpu/drm/xe/xe_pxp.h              |   7 +
>>   drivers/gpu/drm/xe/xe_pxp_submit.c       |   4 +-
>>   drivers/gpu/drm/xe/xe_pxp_types.h        |  26 ++
>>   include/uapi/drm/xe_drm.h                |  40 ++-
>>   12 files changed, 450 insertions(+), 16 deletions(-)
>>
>> diff --git a/drivers/gpu/drm/xe/regs/xe_engine_regs.h 
>> b/drivers/gpu/drm/xe/regs/xe_engine_regs.h
>> index 81b71903675e..3692e887f503 100644
>> --- a/drivers/gpu/drm/xe/regs/xe_engine_regs.h
>> +++ b/drivers/gpu/drm/xe/regs/xe_engine_regs.h
>> @@ -130,6 +130,7 @@
>>   #define RING_EXECLIST_STATUS_HI(base)        XE_REG((base) + 0x234 
>> + 4)
>>     #define RING_CONTEXT_CONTROL(base)        XE_REG((base) + 0x244, 
>> XE_REG_OPTION_MASKED)
>> +#define      CTX_CTRL_PXP_ENABLE            REG_BIT(10)
>>   #define      CTX_CTRL_OAC_CONTEXT_ENABLE        REG_BIT(8)
>>   #define      CTX_CTRL_RUN_ALONE            REG_BIT(7)
>>   #define      CTX_CTRL_INDIRECT_RING_STATE_ENABLE    REG_BIT(4)
>> diff --git a/drivers/gpu/drm/xe/xe_exec_queue.c 
>> b/drivers/gpu/drm/xe/xe_exec_queue.c
>> index e98e8794eddf..504ba4aa2357 100644
>> --- a/drivers/gpu/drm/xe/xe_exec_queue.c
>> +++ b/drivers/gpu/drm/xe/xe_exec_queue.c
>> @@ -22,6 +22,8 @@
>>   #include "xe_ring_ops_types.h"
>>   #include "xe_trace.h"
>>   #include "xe_vm.h"
>> +#include "xe_pxp.h"
>> +#include "xe_pxp_types.h"
>>     enum xe_exec_queue_sched_prop {
>>       XE_EXEC_QUEUE_JOB_TIMEOUT = 0,
>> @@ -35,6 +37,8 @@ static int exec_queue_user_extensions(struct 
>> xe_device *xe, struct xe_exec_queue
>>     static void __xe_exec_queue_free(struct xe_exec_queue *q)
>>   {
>> +    if (xe_exec_queue_uses_pxp(q))
>> +        xe_pxp_exec_queue_remove(gt_to_xe(q->gt)->pxp, q);
>>       if (q->vm)
>>           xe_vm_put(q->vm);
>>   @@ -73,6 +77,7 @@ static struct xe_exec_queue 
>> *__xe_exec_queue_alloc(struct xe_device *xe,
>>       q->ops = gt->exec_queue_ops;
>>       INIT_LIST_HEAD(&q->lr.link);
>>       INIT_LIST_HEAD(&q->multi_gt_link);
>> +    INIT_LIST_HEAD(&q->pxp.link);
>>         q->sched_props.timeslice_us = 
>> hwe->eclass->sched_props.timeslice_us;
>>       q->sched_props.preempt_timeout_us =
>> @@ -107,6 +112,21 @@ static int __xe_exec_queue_init(struct 
>> xe_exec_queue *q)
>>   {
>>       struct xe_vm *vm = q->vm;
>>       int i, err;
>> +    u32 flags = 0;
>> +
>> +    /*
>> +     * PXP workloads executing on RCS or CCS must run in isolation 
>> (i.e. no
>> +     * other workload can use the EUs at the same time). On MTL this 
>> is done
>> +     * by setting the RUNALONE bit in the LRC, while starting on Xe2 
>> there
>> +     * is a dedicated bit for it.
>> +     */
>> +    if (xe_exec_queue_uses_pxp(q) &&
>> +        (q->class == XE_ENGINE_CLASS_RENDER || q->class == 
>> XE_ENGINE_CLASS_COMPUTE)) {
>> +        if (GRAPHICS_VER(gt_to_xe(q->gt)) >= 20)
>> +            flags |= XE_LRC_CREATE_PXP;
>> +        else
>> +            flags |= XE_LRC_CREATE_RUNALONE;
>> +    }
>>         if (vm) {
>>           err = xe_vm_lock(vm, true);
>> @@ -115,7 +135,7 @@ static int __xe_exec_queue_init(struct 
>> xe_exec_queue *q)
>>       }
>>         for (i = 0; i < q->width; ++i) {
>> -        q->lrc[i] = xe_lrc_create(q->hwe, q->vm, SZ_16K);
>> +        q->lrc[i] = xe_lrc_create(q->hwe, q->vm, SZ_16K, flags);
>>           if (IS_ERR(q->lrc[i])) {
>>               err = PTR_ERR(q->lrc[i]);
>>               goto err_unlock;
>> @@ -160,6 +180,17 @@ struct xe_exec_queue 
>> *xe_exec_queue_create(struct xe_device *xe, struct xe_vm *v
>>       if (err)
>>           goto err_post_alloc;
>>   +    /*
>> +     * we can only add the queue to the PXP list after the init is 
>> complete,
>> +     * because the PXP termination can call exec_queue_kill and that 
>> will
>> +     * go bad if the queue is only half-initialized.
>> +     */
> Not following how this comment relates to this code block. The comment 
> implies there should be a wait of some kind.

We set the PXP type for the queue as part of the extension handling in 
__xe_exec_queue_alloc. This comment was supposed to indicate that we 
can't add the queue to the list back there because the init is not 
complete yet, so we do it here instead. I'll add the explanation about 
the extension handling to the comment.

>
>> +    if (xe_exec_queue_uses_pxp(q)) {
>> +        err = xe_pxp_exec_queue_add(xe->pxp, q);
>> +        if (err)
>> +            goto err_post_alloc;
>> +    }
>> +
>>       return q;
>>     err_post_alloc:
>> @@ -197,6 +228,9 @@ void xe_exec_queue_destroy(struct kref *ref)
>>       struct xe_exec_queue *q = container_of(ref, struct 
>> xe_exec_queue, refcount);
>>       struct xe_exec_queue *eq, *next;
>>   +    if (xe_exec_queue_uses_pxp(q))
>> +        xe_pxp_exec_queue_remove(gt_to_xe(q->gt)->pxp, q);
>> +
>>       xe_exec_queue_last_fence_put_unlocked(q);
>>       if (!(q->flags & EXEC_QUEUE_FLAG_BIND_ENGINE_CHILD)) {
>>           list_for_each_entry_safe(eq, next, &q->multi_gt_list,
>> @@ -343,6 +377,24 @@ static int exec_queue_set_timeslice(struct 
>> xe_device *xe, struct xe_exec_queue *
>>       return 0;
>>   }
>>   +static int
>> +exec_queue_set_pxp_type(struct xe_device *xe, struct xe_exec_queue 
>> *q, u64 value)
>> +{
>> +    BUILD_BUG_ON(DRM_XE_PXP_TYPE_NONE != 0);
> Why a build bug for something that is a simple 'enum { X=0 }'? It's 
> not like there is some complex macro calculation that could be broken 
> by some seemingly unrelated change.

This was more to make sure that the default value for the extension was 
0. Given that this is UAPI and therefore can't change anyway, I'll drop 
the BUG_ON

>
>> +
>> +    if (value == DRM_XE_PXP_TYPE_NONE)
>> +        return 0;
> This doesn't need to shut any existing PXP down? Is it not possible to 
> dynamically change the type?

No, this can only be set at queue creation time

>
>> +
>> +    if (!xe_pxp_is_enabled(xe->pxp))
>> +        return -ENODEV;
>> +
>> +    /* we only support HWDRM sessions right now */
>> +    if (XE_IOCTL_DBG(xe, value != DRM_XE_PXP_TYPE_HWDRM))
>> +        return -EINVAL;
>> +
>> +    return xe_pxp_exec_queue_set_type(xe->pxp, q, 
>> DRM_XE_PXP_TYPE_HWDRM);
>> +}
>> +
>>   typedef int (*xe_exec_queue_set_property_fn)(struct xe_device *xe,
>>                            struct xe_exec_queue *q,
>>                            u64 value);
>> @@ -350,6 +402,7 @@ typedef int 
>> (*xe_exec_queue_set_property_fn)(struct xe_device *xe,
>>   static const xe_exec_queue_set_property_fn 
>> exec_queue_set_property_funcs[] = {
>>       [DRM_XE_EXEC_QUEUE_SET_PROPERTY_PRIORITY] = 
>> exec_queue_set_priority,
>>       [DRM_XE_EXEC_QUEUE_SET_PROPERTY_TIMESLICE] = 
>> exec_queue_set_timeslice,
>> +    [DRM_XE_EXEC_QUEUE_SET_PROPERTY_PXP_TYPE] = 
>> exec_queue_set_pxp_type,
>>   };
>>     static int exec_queue_user_ext_set_property(struct xe_device *xe,
>> @@ -369,7 +422,8 @@ static int 
>> exec_queue_user_ext_set_property(struct xe_device *xe,
>>                ARRAY_SIZE(exec_queue_set_property_funcs)) ||
>>           XE_IOCTL_DBG(xe, ext.pad) ||
>>           XE_IOCTL_DBG(xe, ext.property != 
>> DRM_XE_EXEC_QUEUE_SET_PROPERTY_PRIORITY &&
>> -             ext.property != DRM_XE_EXEC_QUEUE_SET_PROPERTY_TIMESLICE))
>> +             ext.property != 
>> DRM_XE_EXEC_QUEUE_SET_PROPERTY_TIMESLICE &&
>> +             ext.property != DRM_XE_EXEC_QUEUE_SET_PROPERTY_PXP_TYPE))
>>           return -EINVAL;
>>         idx = array_index_nospec(ext.property, 
>> ARRAY_SIZE(exec_queue_set_property_funcs));
>> diff --git a/drivers/gpu/drm/xe/xe_exec_queue.h 
>> b/drivers/gpu/drm/xe/xe_exec_queue.h
>> index ded77b0f3b90..7fa97719667a 100644
>> --- a/drivers/gpu/drm/xe/xe_exec_queue.h
>> +++ b/drivers/gpu/drm/xe/xe_exec_queue.h
>> @@ -53,6 +53,11 @@ static inline bool 
>> xe_exec_queue_is_parallel(struct xe_exec_queue *q)
>>       return q->width > 1;
>>   }
>>   +static inline bool xe_exec_queue_uses_pxp(struct xe_exec_queue *q)
>> +{
>> +    return q->pxp.type;
>> +}
>> +
>>   bool xe_exec_queue_is_lr(struct xe_exec_queue *q);
>>     bool xe_exec_queue_ring_full(struct xe_exec_queue *q);
>> diff --git a/drivers/gpu/drm/xe/xe_exec_queue_types.h 
>> b/drivers/gpu/drm/xe/xe_exec_queue_types.h
>> index 1408b02eea53..28b56217f1df 100644
>> --- a/drivers/gpu/drm/xe/xe_exec_queue_types.h
>> +++ b/drivers/gpu/drm/xe/xe_exec_queue_types.h
>> @@ -130,6 +130,14 @@ struct xe_exec_queue {
>>           spinlock_t lock;
>>       } lr;
>>   +    /** @pxp: PXP info tracking */
>> +    struct {
>> +        /** @pxp.type: PXP session type used by this queue */
>> +        u8 type;
>> +        /** @pxp.link: link into the list of PXP exec queues */
>> +        struct list_head link;
>> +    } pxp;
>> +
>>       /** @ops: submission backend exec queue operations */
>>       const struct xe_exec_queue_ops *ops;
>>   diff --git a/drivers/gpu/drm/xe/xe_hw_engine.c 
>> b/drivers/gpu/drm/xe/xe_hw_engine.c
>> index e195022ca836..469932e7d7a6 100644
>> --- a/drivers/gpu/drm/xe/xe_hw_engine.c
>> +++ b/drivers/gpu/drm/xe/xe_hw_engine.c
>> @@ -557,7 +557,7 @@ static int hw_engine_init(struct xe_gt *gt, 
>> struct xe_hw_engine *hwe,
>>           goto err_name;
>>       }
>>   -    hwe->kernel_lrc = xe_lrc_create(hwe, NULL, SZ_16K);
>> +    hwe->kernel_lrc = xe_lrc_create(hwe, NULL, SZ_16K, 0);
>>       if (IS_ERR(hwe->kernel_lrc)) {
>>           err = PTR_ERR(hwe->kernel_lrc);
>>           goto err_hwsp;
>> diff --git a/drivers/gpu/drm/xe/xe_lrc.c b/drivers/gpu/drm/xe/xe_lrc.c
>> index 974a9cd8c379..4f3e676db646 100644
>> --- a/drivers/gpu/drm/xe/xe_lrc.c
>> +++ b/drivers/gpu/drm/xe/xe_lrc.c
>> @@ -893,7 +893,7 @@ static void xe_lrc_finish(struct xe_lrc *lrc)
>>   #define PVC_CTX_ACC_CTR_THOLD    (0x2a + 1)
>>     static int xe_lrc_init(struct xe_lrc *lrc, struct xe_hw_engine *hwe,
>> -               struct xe_vm *vm, u32 ring_size)
>> +               struct xe_vm *vm, u32 ring_size, u32 init_flags)
>>   {
>>       struct xe_gt *gt = hwe->gt;
>>       struct xe_tile *tile = gt_to_tile(gt);
>> @@ -981,6 +981,16 @@ static int xe_lrc_init(struct xe_lrc *lrc, 
>> struct xe_hw_engine *hwe,
>>                        RING_CTL_SIZE(lrc->ring.size) | RING_VALID);
>>       }
>>   +    if (init_flags & XE_LRC_CREATE_RUNALONE)
>> +        xe_lrc_write_ctx_reg(lrc, CTX_CONTEXT_CONTROL,
>> +                     xe_lrc_read_ctx_reg(lrc, CTX_CONTEXT_CONTROL) |
>> +                     _MASKED_BIT_ENABLE(CTX_CTRL_RUN_ALONE));
>> +
>> +    if (init_flags & XE_LRC_CREATE_PXP)
>> +        xe_lrc_write_ctx_reg(lrc, CTX_CONTEXT_CONTROL,
>> +                     xe_lrc_read_ctx_reg(lrc, CTX_CONTEXT_CONTROL) |
>> +                     _MASKED_BIT_ENABLE(CTX_CTRL_PXP_ENABLE));
>> +
>>       xe_lrc_write_ctx_reg(lrc, CTX_TIMESTAMP, 0);
>>         if (xe->info.has_asid && vm)
>> @@ -1029,7 +1039,7 @@ static int xe_lrc_init(struct xe_lrc *lrc, 
>> struct xe_hw_engine *hwe,
>>    * upon failure.
>>    */
>>   struct xe_lrc *xe_lrc_create(struct xe_hw_engine *hwe, struct xe_vm 
>> *vm,
>> -                 u32 ring_size)
>> +                 u32 ring_size, u32 flags)
>>   {
>>       struct xe_lrc *lrc;
>>       int err;
>> @@ -1038,7 +1048,7 @@ struct xe_lrc *xe_lrc_create(struct 
>> xe_hw_engine *hwe, struct xe_vm *vm,
>>       if (!lrc)
>>           return ERR_PTR(-ENOMEM);
>>   -    err = xe_lrc_init(lrc, hwe, vm, ring_size);
>> +    err = xe_lrc_init(lrc, hwe, vm, ring_size, flags);
>>       if (err) {
>>           kfree(lrc);
>>           return ERR_PTR(err);
>> diff --git a/drivers/gpu/drm/xe/xe_lrc.h b/drivers/gpu/drm/xe/xe_lrc.h
>> index d411c3fbcbc6..cc8091bba2a0 100644
>> --- a/drivers/gpu/drm/xe/xe_lrc.h
>> +++ b/drivers/gpu/drm/xe/xe_lrc.h
>> @@ -23,8 +23,10 @@ struct xe_vm;
>>   #define LRC_PPHWSP_FLUSH_INVAL_SCRATCH_ADDR (0x34 * 4)
>>   #define LRC_PPHWSP_PXP_INVAL_SCRATCH_ADDR (0x40 * 4)
>>   +#define XE_LRC_CREATE_RUNALONE 0x1
>> +#define XE_LRC_CREATE_PXP 0x2
>>   struct xe_lrc *xe_lrc_create(struct xe_hw_engine *hwe, struct xe_vm 
>> *vm,
>> -                 u32 ring_size);
>> +                 u32 ring_size, u32 flags);
>>   void xe_lrc_destroy(struct kref *ref);
>>     /**
>> diff --git a/drivers/gpu/drm/xe/xe_pxp.c b/drivers/gpu/drm/xe/xe_pxp.c
>> index 382eb0cb0018..acdc25c8e8a1 100644
>> --- a/drivers/gpu/drm/xe/xe_pxp.c
>> +++ b/drivers/gpu/drm/xe/xe_pxp.c
>> @@ -6,11 +6,17 @@
>>   #include "xe_pxp.h"
>>     #include <drm/drm_managed.h>
>> +#include <drm/xe_drm.h>
>>     #include "xe_device_types.h"
>> +#include "xe_exec_queue.h"
>> +#include "xe_exec_queue_types.h"
>>   #include "xe_force_wake.h"
>> +#include "xe_guc_submit.h"
>> +#include "xe_gsc_proxy.h"
>>   #include "xe_gt.h"
>>   #include "xe_gt_types.h"
>> +#include "xe_huc.h"
>>   #include "xe_mmio.h"
>>   #include "xe_pm.h"
>>   #include "xe_pxp_submit.h"
>> @@ -27,18 +33,45 @@
>>    * integrated parts.
>>    */
>>   -#define ARB_SESSION 0xF /* TODO: move to UAPI */
>> +#define ARB_SESSION DRM_XE_PXP_HWDRM_DEFAULT_SESSION /* shorter 
>> define */
> Is this really worthwhile?

The define is used enough times in this file that IMO it's worth having a 
shorter version for readability

>
>>     bool xe_pxp_is_supported(const struct xe_device *xe)
>>   {
>>       return xe->info.has_pxp && IS_ENABLED(CONFIG_INTEL_MEI_GSC_PROXY);
>>   }
>>   -static bool pxp_is_enabled(const struct xe_pxp *pxp)
>> +bool xe_pxp_is_enabled(const struct xe_pxp *pxp)
>>   {
>>       return pxp;
>>   }
>>   +static bool pxp_prerequisites_done(const struct xe_pxp *pxp)
>> +{
>> +    bool ready;
>> +
>> +    XE_WARN_ON(xe_force_wake_get(gt_to_fw(pxp->gt), XE_FW_GSC));
> Again, why warn on this fw and then proceed anyway when others 
> silently return an error code to the layer above?

In this case it's because I wanted to have this function return a bool, 
so I can't escalate the error. In the unlikely case that this fails, the 
caller will consider PXP not ready, which will be escalated out. If 
forcewake doesn't work the GT is non-functional anyway, so reporting PXP 
as not ready is not going to make things worse.

>
>> +
>> +    /* PXP requires both HuC authentication via GSC and GSC proxy 
>> initialized */
>> +    ready = xe_huc_is_authenticated(&pxp->gt->uc.huc, 
>> XE_HUC_AUTH_VIA_GSC) &&
>> +        xe_gsc_proxy_init_done(&pxp->gt->uc.gsc);
>> +
>> +    xe_force_wake_put(gt_to_fw(pxp->gt), XE_FW_GSC);
>> +
>> +    return ready;
>> +}
>> +
>> +static bool pxp_session_is_in_play(struct xe_pxp *pxp, u32 id)
>> +{
>> +    struct xe_gt *gt = pxp->gt;
>> +    u32 sip = 0;
>> +
>> +    XE_WARN_ON(xe_force_wake_get(gt_to_fw(gt), XE_FW_GT));
> Same as above.

Same reasoning, just that we'll report that PXP failed to start if this 
fails, which again is not going to make things worse if the GT is broken.

>
>> +    sip = xe_mmio_read32(gt, KCR_SIP);
>> +    xe_force_wake_put(gt_to_fw(gt), XE_FW_GT);
>> +
>> +    return sip & BIT(id);
>> +}
>> +
>>   static int pxp_wait_for_session_state(struct xe_pxp *pxp, u32 id, 
>> bool in_play)
>>   {
>>       struct xe_gt *gt = pxp->gt;
>> @@ -56,12 +89,30 @@ static int pxp_wait_for_session_state(struct 
>> xe_pxp *pxp, u32 id, bool in_play)
>>       return ret;
>>   }
>>   +static void pxp_invalidate_queues(struct xe_pxp *pxp);
>> +
>>   static void pxp_terminate(struct xe_pxp *pxp)
>>   {
>>       int ret = 0;
>>       struct xe_device *xe = pxp->xe;
>>       struct xe_gt *gt = pxp->gt;
> Should add a "lockdep_assert_held(pxp->mutex)" here?

I'll add it in

>
>>   +    pxp_invalidate_queues(pxp);
>> +
>> +    /*
>> +     * If we have a termination already in progress, we need to wait 
>> for
>> +     * it to complete before queueing another one. We update the state
>> +     * to signal that another termination is required and leave it 
>> to the
>> +     * pxp_start() call to take care of it.
>> +     */
>> +    if (!completion_done(&pxp->termination)) {
>> +        pxp->status = XE_PXP_NEEDS_TERMINATION;
>> +        return;
>> +    }
>> +
>> +    reinit_completion(&pxp->termination);
>> +    pxp->status = XE_PXP_TERMINATION_IN_PROGRESS;
>> +
>>       drm_dbg(&xe->drm, "Terminating PXP\n");
>>         /* terminate the hw session */
>> @@ -82,13 +133,32 @@ static void pxp_terminate(struct xe_pxp *pxp)
>>       ret = xe_pxp_submit_session_invalidation(&pxp->gsc_res, 
>> ARB_SESSION);
>>     out:
>> -    if (ret)
>> +    if (ret) {
>>           drm_err(&xe->drm, "PXP termination failed: %pe\n", 
>> ERR_PTR(ret));
>> +        pxp->status = XE_PXP_ERROR;
>> +        complete_all(&pxp->termination);
>> +    }
>>   }
>>     static void pxp_terminate_complete(struct xe_pxp *pxp)
>>   {
>> -    /* TODO mark the session as ready to start */
>> +    /*
>> +     * We expect PXP to be in one of 2 states when we get here:
>> +     * - XE_PXP_TERMINATION_IN_PROGRESS: a single termination event was
>> +     * requested and it is now completing, so we're ready to start.
>> +     * - XE_PXP_NEEDS_TERMINATION: a second termination was 
>> requested while
>> +     * the first one was still being processed; we don't update the 
>> state
>> +     * in this case so the pxp_start code will automatically issue that
>> +     * second termination.
>> +     */
>> +    if (pxp->status == XE_PXP_TERMINATION_IN_PROGRESS)
>> +        pxp->status = XE_PXP_READY_TO_START;
>> +    else if (pxp->status != XE_PXP_NEEDS_TERMINATION)
>> +        drm_err(&pxp->xe->drm,
>> +            "PXP termination complete while status was %u\n",
>> +            pxp->status);
>> +
>> +    complete_all(&pxp->termination);
>>   }
>>     static void pxp_irq_work(struct work_struct *work)
>> @@ -112,6 +182,8 @@ static void pxp_irq_work(struct work_struct *work)
>>       if ((events & PXP_TERMINATION_REQUEST) && 
>> !xe_pm_runtime_get_if_active(xe))
>>           return;
>>   +    mutex_lock(&pxp->mutex);
>> +
>>       if (events & PXP_TERMINATION_REQUEST) {
>>           events &= ~PXP_TERMINATION_COMPLETE;
>>           pxp_terminate(pxp);
>> @@ -120,6 +192,8 @@ static void pxp_irq_work(struct work_struct *work)
>>       if (events & PXP_TERMINATION_COMPLETE)
>>           pxp_terminate_complete(pxp);
>>   +    mutex_unlock(&pxp->mutex);
>> +
>>       if (events & PXP_TERMINATION_REQUEST)
>>           xe_pm_runtime_put(xe);
>>   }
>> @@ -133,7 +207,7 @@ void xe_pxp_irq_handler(struct xe_device *xe, u16 
>> iir)
>>   {
>>       struct xe_pxp *pxp = xe->pxp;
>>   -    if (!pxp_is_enabled(pxp)) {
>> +    if (!xe_pxp_is_enabled(pxp)) {
>>           drm_err(&xe->drm, "PXP irq 0x%x received with PXP 
>> disabled!\n", iir);
>>           return;
>>       }
>> @@ -230,10 +304,22 @@ int xe_pxp_init(struct xe_device *xe)
>>       if (!pxp)
>>           return -ENOMEM;
>>   +    INIT_LIST_HEAD(&pxp->queues.list);
>> +    spin_lock_init(&pxp->queues.lock);
>>       INIT_WORK(&pxp->irq.work, pxp_irq_work);
>>       pxp->xe = xe;
>>       pxp->gt = gt;
>>   +    /*
>> +     * we'll use the completion to check if there is a termination 
>> pending,
>> +     * so we start it as completed and we reinit it when a termination
>> +     * is triggered.
>> +     */
>> +    init_completion(&pxp->termination);
>> +    complete_all(&pxp->termination);
>> +
>> +    mutex_init(&pxp->mutex);
>> +
>>       pxp->irq.wq = alloc_ordered_workqueue("pxp-wq", 0);
>>       if (!pxp->irq.wq)
>>           return -ENOMEM;
>> @@ -256,3 +342,202 @@ int xe_pxp_init(struct xe_device *xe)
>>       destroy_workqueue(pxp->irq.wq);
>>       return err;
>>   }
>> +
>> +static int __pxp_start_arb_session(struct xe_pxp *pxp)
>> +{
>> +    int ret;
>> +
>> +    if (pxp_session_is_in_play(pxp, ARB_SESSION))
>> +        return -EEXIST;
>> +
>> +    ret = xe_pxp_submit_session_init(&pxp->gsc_res, ARB_SESSION);
>> +    if (ret) {
>> +        drm_err(&pxp->xe->drm, "Failed to init PXP arb session\n");
>> +        goto out;
>> +    }
>> +
>> +    ret = pxp_wait_for_session_state(pxp, ARB_SESSION, true);
>> +    if (ret) {
>> +        drm_err(&pxp->xe->drm, "PXP ARB session failed to go in 
>> play\n");
>> +        goto out;
>> +    }
>> +
>> +    drm_dbg(&pxp->xe->drm, "PXP ARB session is active\n");
>> +
>> +out:
>> +    if (!ret)
>> +        pxp->status = XE_PXP_ACTIVE;
>> +    else
>> +        pxp->status = XE_PXP_ERROR;
>> +
>> +    return ret;
>> +}
>> +
>> +/**
>> + * xe_pxp_exec_queue_set_type - Mark a queue as using PXP
>> + * @pxp: the xe->pxp pointer (it will be NULL if PXP is disabled)
>> + * @q: the queue to mark as using PXP
>> + * @type: the type of PXP session this queue will use
>> + *
>> + * Returns 0 if the selected PXP type is supported, -ENODEV otherwise.
>> + */
>> +int xe_pxp_exec_queue_set_type(struct xe_pxp *pxp, struct 
>> xe_exec_queue *q, u8 type)
>> +{
>> +    if (!xe_pxp_is_enabled(pxp))
>> +        return -ENODEV;
>> +
>> +    /* we only support HWDRM sessions right now */
>> +    xe_assert(pxp->xe, type == DRM_XE_PXP_TYPE_HWDRM);
>> +
>> +    q->pxp.type = type;
>> +
>> +    return 0;
>> +}
>> +
>> +/**
>> + * xe_pxp_exec_queue_add - add a queue to the PXP list
>> + * @pxp: the xe->pxp pointer (it will be NULL if PXP is disabled)
>> + * @q: the queue to add to the list
>> + *
>> + * If PXP is enabled and the prerequisites are done, start the PXP ARB
>> + * session (if not already running) and add the queue to the PXP 
>> list. Note
>> + * that the queue must have previously been marked as using PXP with
>> + * xe_pxp_exec_queue_set_type.
>> + *
>> + * Returns 0 if the PXP ARB session is running and the queue is in 
>> the list,
>> + * -ENODEV if PXP is disabled, -EBUSY if the PXP prerequisites are 
>> not done,
>> + * other errno value if something goes wrong during the session start.
>> + */
>> +#define PXP_TERMINATION_TIMEOUT_MS 500
>> +int xe_pxp_exec_queue_add(struct xe_pxp *pxp, struct xe_exec_queue *q)
>> +{
>> +    int ret = 0;
>> +
>> +    if (!xe_pxp_is_enabled(pxp))
>> +        return -ENODEV;
>> +
>> +    /* we only support HWDRM sessions right now */
>> +    xe_assert(pxp->xe, q->pxp.type == DRM_XE_PXP_TYPE_HWDRM);
>> +
>> +    /*
>> +     * Runtime suspend kills PXP, so we need to turn it off while we 
>> have
>> +     * active queues that use PXP
>> +     */
>> +    xe_pm_runtime_get(pxp->xe);
>> +
>> +    if (!pxp_prerequisites_done(pxp)) {
>> +        ret = -EBUSY;
> Wouldn't EAGAIN be more appropriate? The pre-reqs here are the GSC 
> firmware load which is guaranteed to in progress or done (or dead?), 
> in which case it is just a matter or re-trying until the firmware init 
> completes?

Userspace tends to retry immediately when we return -EAGAIN. This wait 
can take several hundred ms and I didn't want userspace to just keep 
retrying in a tight loop for that long, so I used a different error 
code. This was also discussed on the mesa review here:

https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/30723#note_2622269

>
>> +        goto out;
>> +    }
>> +
>> +wait_for_termination:
>> +    /*
>> +     * if there is a termination in progress, wait for it.
>> +     * We need to wait outside the lock because the completion is 
>> done from
>> +     * within the lock
>> +     */
>> +    if (!wait_for_completion_timeout(&pxp->termination,
>> + msecs_to_jiffies(PXP_TERMINATION_TIMEOUT_MS)))
>> +        return -ETIMEDOUT;
>> +
>> +    mutex_lock(&pxp->mutex);
>> +
>> +    /*
>> +     * check if a new termination was issued between the above check 
>> and
>> +     * grabbing the mutex
>> +     */
>> +    if (!completion_done(&pxp->termination)) {
>> +        mutex_unlock(&pxp->mutex);
>> +        goto wait_for_termination;
>> +    }
>> +
>> +    /* If PXP is not already active, turn it on */
>> +    switch (pxp->status) {
>> +    case XE_PXP_ERROR:
>> +        ret = -EIO;
>> +        break;
>> +    case XE_PXP_ACTIVE:
>> +        break;
>> +    case XE_PXP_READY_TO_START:
>> +        ret = __pxp_start_arb_session(pxp);
>> +        break;
>> +    case XE_PXP_NEEDS_TERMINATION:
>> +        pxp_terminate(pxp);
>> +        mutex_unlock(&pxp->mutex);
>> +        goto wait_for_termination;
>> +    default:
>> +        drm_err(&pxp->xe->drm, "unexpected state during PXP start: 
>> %u", pxp->status);
>> +        ret = -EIO;
>> +        break;
>> +    }
>> +
>> +    /* If everything went ok, add the queue to the list */
>> +    if (!ret) {
>> +        spin_lock_irq(&pxp->queues.lock);
>> +        list_add_tail(&q->pxp.link, &pxp->queues.list);
>> +        spin_unlock_irq(&pxp->queues.lock);
>> +    }
>> +
>> +    mutex_unlock(&pxp->mutex);
>> +
>> +out:
>> +    /*
>> +     * in the successful case the PM ref is released from
>> +     * xe_pxp_exec_queue_remove
>> +     */
>> +    if (ret)
>> +        xe_pm_runtime_put(pxp->xe);
> Does the runtime PM get/put need to be mutex protected as well? Is it 
> possible for two xe_pxp_exec_queue_add() calls to be running 
> concurrently?

It is possible to have two xe_pxp_exec_queue_add running concurrently, 
but that shouldn't matter with the pm_put. Am I not seeing a race?

>
>> +
>> +    return ret;
>> +}
>> +
>> +/**
>> + * xe_pxp_exec_queue_remove - remove a queue from the PXP list
>> + * @pxp: the xe->pxp pointer (it will be NULL if PXP is disabled)
>> + * @q: the queue to remove from the list
>> + *
>> + * If PXP is enabled and the exec_queue is in the list, the queue 
>> will be
>> + * removed from the list and its PM reference will be released. It 
>> is safe to
>> + * call this function multiple times for the same queue.
>> + */
>> +void xe_pxp_exec_queue_remove(struct xe_pxp *pxp, struct 
>> xe_exec_queue *q)
>> +{
>> +    bool need_pm_put = false;
>> +
>> +    if (!xe_pxp_is_enabled(pxp))
>> +        return;
>> +
>> +    spin_lock_irq(&pxp->queues.lock);
>> +
>> +    if (!list_empty(&q->pxp.link)) {
>> +        list_del_init(&q->pxp.link);
>> +        need_pm_put = true;
>> +    }
>> +
>> +    q->pxp.type = DRM_XE_PXP_TYPE_NONE;
>> +
>> +    spin_unlock_irq(&pxp->queues.lock);
>> +
>> +    if (need_pm_put)
>> +        xe_pm_runtime_put(pxp->xe);
>> +}
>> +
>> +static void pxp_invalidate_queues(struct xe_pxp *pxp)
>> +{
>> +    struct xe_exec_queue *tmp, *q;
>> +
>> +    spin_lock_irq(&pxp->queues.lock);
>> +
>> +    list_for_each_entry(tmp, &pxp->queues.list, pxp.link) {
> Double space.
>
>> +        q = xe_exec_queue_get_unless_zero(tmp);
>> +
>> +        if (!q)
>> +            continue;
>> +
>> +        xe_exec_queue_kill(q);
>> +        xe_exec_queue_put(q);
>> +    }
> This doesn't need to empty the list out as well?

It's not strictly necessary, because it is ok to kill a queue multiple 
times. Given the PM handling required as part of removing a queue from 
the list and the fact that it needs to happen outside the lock (see 
xe_pxp_exec_queue_remove), my thought was that it'd be easier to just 
not do it here and leave it to when the queue is cleaned up.

>
>> +
>> +    spin_unlock_irq(&pxp->queues.lock);
>> +}
>> +
>> diff --git a/drivers/gpu/drm/xe/xe_pxp.h b/drivers/gpu/drm/xe/xe_pxp.h
>> index 81bafe2714ff..2e0ab186072a 100644
>> --- a/drivers/gpu/drm/xe/xe_pxp.h
>> +++ b/drivers/gpu/drm/xe/xe_pxp.h
>> @@ -9,10 +9,17 @@
>>   #include <linux/types.h>
>>     struct xe_device;
>> +struct xe_exec_queue;
>> +struct xe_pxp;
>>     bool xe_pxp_is_supported(const struct xe_device *xe);
>> +bool xe_pxp_is_enabled(const struct xe_pxp *pxp);
>>     int xe_pxp_init(struct xe_device *xe);
>>   void xe_pxp_irq_handler(struct xe_device *xe, u16 iir);
>>   +int xe_pxp_exec_queue_set_type(struct xe_pxp *pxp, struct 
>> xe_exec_queue *q, u8 type);
>> +int xe_pxp_exec_queue_add(struct xe_pxp *pxp, struct xe_exec_queue *q);
>> +void xe_pxp_exec_queue_remove(struct xe_pxp *pxp, struct 
>> xe_exec_queue *q);
>> +
>>   #endif /* __XE_PXP_H__ */
>> diff --git a/drivers/gpu/drm/xe/xe_pxp_submit.c 
>> b/drivers/gpu/drm/xe/xe_pxp_submit.c
>> index c9258c861556..becffa6dfd4c 100644
>> --- a/drivers/gpu/drm/xe/xe_pxp_submit.c
>> +++ b/drivers/gpu/drm/xe/xe_pxp_submit.c
>> @@ -26,8 +26,6 @@
>>   #include "instructions/xe_mi_commands.h"
>>   #include "regs/xe_gt_regs.h"
>>   -#define ARB_SESSION 0xF /* TODO: move to UAPI */
>> -
>>   /*
>>    * The VCS is used for kernel-owned GGTT submissions to issue key 
>> termination.
>>    * Terminations are serialized, so we only need a single queue and 
>> a single
>> @@ -495,7 +493,7 @@ int xe_pxp_submit_session_init(struct 
>> xe_pxp_gsc_client_resources *gsc_res, u32
>>                      FIELD_PREP(PXP43_INIT_SESSION_APPTYPE, 0));
>>       msg_in.header.buffer_len = sizeof(msg_in) - sizeof(msg_in.header);
>>   -    if (id == ARB_SESSION)
>> +    if (id == DRM_XE_PXP_HWDRM_DEFAULT_SESSION)
> Would have been clearer to just use the correct name from the start.

You mean define DRM_XE_PXP_HWDRM_DEFAULT_SESSION locally in the earlier 
patch, and then moving it to the uapi without a rename?

>
>>           msg_in.protection_mode = PXP43_INIT_SESSION_PROTECTION_ARB;
>>         ret = gsccs_send_message(gsc_res, &msg_in, sizeof(msg_in),
>> diff --git a/drivers/gpu/drm/xe/xe_pxp_types.h 
>> b/drivers/gpu/drm/xe/xe_pxp_types.h
>> index d5cf8faed7be..eb6a0183320a 100644
>> --- a/drivers/gpu/drm/xe/xe_pxp_types.h
>> +++ b/drivers/gpu/drm/xe/xe_pxp_types.h
>> @@ -6,7 +6,10 @@
>>   #ifndef __XE_PXP_TYPES_H__
>>   #define __XE_PXP_TYPES_H__
>>   +#include <linux/completion.h>
>>   #include <linux/iosys-map.h>
>> +#include <linux/mutex.h>
>> +#include <linux/spinlock.h>
>>   #include <linux/types.h>
>>   #include <linux/workqueue.h>
>>   @@ -16,6 +19,14 @@ struct xe_device;
>>   struct xe_gt;
>>   struct xe_vm;
>>   +enum xe_pxp_status {
>> +    XE_PXP_ERROR = -1,
>> +    XE_PXP_NEEDS_TERMINATION = 0, /* starting status */
>> +    XE_PXP_TERMINATION_IN_PROGRESS,
>> +    XE_PXP_READY_TO_START,
>> +    XE_PXP_ACTIVE
>> +};
>> +
>>   /**
>>    * struct xe_pxp_gsc_client_resources - resources for GSC 
>> submission by a PXP
>>    * client. The GSC FW supports multiple GSC client active at the 
>> same time.
>> @@ -82,6 +93,21 @@ struct xe_pxp {
>>   #define PXP_TERMINATION_REQUEST  BIT(0)
>>   #define PXP_TERMINATION_COMPLETE BIT(1)
>>       } irq;
>> +
>> +    /** @mutex: protects the pxp status and the queue list */
>> +    struct mutex mutex;
>> +    /** @status: the current pxp status */
>> +    enum xe_pxp_status status;
>> +    /** @termination: completion struct that tracks terminations */
>> +    struct completion termination;
>> +
>> +    /** @queues: management of exec_queues that use PXP */
>> +    struct {
>> +        /** @queues.lock: spinlock protecting the queue management */
>> +        spinlock_t lock;
>> +        /** @queues.list: list of exec_queues that use PXP */
>> +        struct list_head list;
>> +    } queues;
>>   };
>>     #endif /* __XE_PXP_TYPES_H__ */
>> diff --git a/include/uapi/drm/xe_drm.h b/include/uapi/drm/xe_drm.h
>> index b6fbe4988f2e..5f4d08123672 100644
>> --- a/include/uapi/drm/xe_drm.h
>> +++ b/include/uapi/drm/xe_drm.h
>> @@ -1085,6 +1085,24 @@ struct drm_xe_vm_bind {
>>   /**
>>    * struct drm_xe_exec_queue_create - Input of 
>> &DRM_IOCTL_XE_EXEC_QUEUE_CREATE
>>    *
>> + * This ioctl supports setting the following properties via the
>> + * %DRM_XE_EXEC_QUEUE_EXTENSION_SET_PROPERTY extension, which uses the
>> + * generic @drm_xe_ext_set_property struct:
>> + *
>> + *  - %DRM_XE_EXEC_QUEUE_SET_PROPERTY_PRIORITY - set the queue 
>> priority.
>> + *    CAP_SYS_NICE is required to set a value above normal.
>> + *  - %DRM_XE_EXEC_QUEUE_SET_PROPERTY_TIMESLICE - set the queue 
>> timeslice
>> + *    duration.
> Units would be helpful.

I have no idea what they are. I only added this documentation because it 
seemed unclean to only add the part about PXP.

>
>> + *  - %DRM_XE_EXEC_QUEUE_SET_PROPERTY_PXP_TYPE - set the type of PXP 
>> session
>> + *    this queue will be used with. Valid values are listed in enum
>> + *    drm_xe_pxp_session_type. %DRM_XE_PXP_TYPE_NONE is the default 
>> behavior, so
>> + *    there is no need to explicitly set that. When a queue of type
>> + *    %DRM_XE_PXP_TYPE_HWDRM is created, the PXP default HWDRM session
>> + *    (%XE_PXP_HWDRM_DEFAULT_SESSION) will be started, if isn't 
>> already running.
>> + *    Given that going into a power-saving state kills PXP HWDRM 
>> sessions,
>> + *    runtime PM will be blocked while queues of this type are alive.
>> + *    All PXP queues will be killed if a PXP invalidation event occurs.
> Seems odd to say 'values are listed in ...' and then go on to describe 
> each type and provide extra information about them. Seems like the 
> extra details should be part of the enum documentation instead of here?

This is documentation specific to how this ioctl handles those values, 
so it belongs here. The 'values are listed in ...' sentence was about 
being future proof, in case we update the enum in the future and don't 
need to add any extra explanation here.

Daniele

>
> John.
>
>> + *
>>    * The example below shows how to use @drm_xe_exec_queue_create to 
>> create
>>    * a simple exec_queue (no parallel submission) of class
>>    * &DRM_XE_ENGINE_CLASS_RENDER.
>> @@ -1108,7 +1126,7 @@ struct drm_xe_exec_queue_create {
>>   #define DRM_XE_EXEC_QUEUE_EXTENSION_SET_PROPERTY        0
>>   #define   DRM_XE_EXEC_QUEUE_SET_PROPERTY_PRIORITY        0
>>   #define   DRM_XE_EXEC_QUEUE_SET_PROPERTY_TIMESLICE        1
>> -
>> +#define   DRM_XE_EXEC_QUEUE_SET_PROPERTY_PXP_TYPE        2
>>       /** @extensions: Pointer to the first extension struct, if any */
>>       __u64 extensions;
>>   @@ -1694,6 +1712,26 @@ struct drm_xe_oa_stream_info {
>>       __u64 reserved[3];
>>   };
>>   +/**
>> + * enum drm_xe_pxp_session_type - Supported PXP session types.
>> + *
>> + * We currently only support HWDRM sessions, which are used for 
>> protected
>> + * content that ends up being displayed, but the HW supports 
>> multiple types, so
>> + * we might extend support in the future.
>> + */
>> +enum drm_xe_pxp_session_type {
>> +    /** @DRM_XE_PXP_TYPE_NONE: PXP not used */
>> +    DRM_XE_PXP_TYPE_NONE = 0,
>> +    /**
>> +     * @DRM_XE_PXP_TYPE_HWDRM: HWDRM sessions are used for content 
>> that ends
>> +     * up on the display.
>> +     */
>> +    DRM_XE_PXP_TYPE_HWDRM = 1,
>> +};
>> +
>> +/* ID of the protected content session managed by Xe when PXP is 
>> active */
>> +#define DRM_XE_PXP_HWDRM_DEFAULT_SESSION 0xf
>> +
>>   #if defined(__cplusplus)
>>   }
>>   #endif



More information about the Intel-xe mailing list