[PATCH 3/7] drm/xe/oa: Add input fence dependencies
Dixit, Ashutosh
ashutosh.dixit at intel.com
Wed Sep 18 19:56:08 UTC 2024
On Wed, 18 Sep 2024 04:59:59 -0700, Souza, Jose wrote:
>
Hi Jose,
> On Fri, 2024-08-30 at 15:16 -0700, Ashutosh Dixit wrote:
> > Add input fence dependencies which will make OA configuration wait till
> > these dependencies are met (till input fences signal).
> >
> > v2: Change add_deps arg to xe_oa_submit_bb from bool to enum (Matt Brost)
> >
> > Reviewed-by: Jonathan Cavitt <jonathan.cavitt at intel.com>
> > Signed-off-by: Ashutosh Dixit <ashutosh.dixit at intel.com>
> > ---
> > drivers/gpu/drm/xe/xe_oa.c | 25 +++++++++++++++++++++----
> > 1 file changed, 21 insertions(+), 4 deletions(-)
> >
> > diff --git a/drivers/gpu/drm/xe/xe_oa.c b/drivers/gpu/drm/xe/xe_oa.c
> > index 8ada74da3da19..b4b68019d35b7 100644
> > --- a/drivers/gpu/drm/xe/xe_oa.c
> > +++ b/drivers/gpu/drm/xe/xe_oa.c
> > @@ -42,6 +42,11 @@
> > #define DEFAULT_POLL_PERIOD_NS (NSEC_PER_SEC / DEFAULT_POLL_FREQUENCY_HZ)
> > #define XE_OA_UNIT_INVALID U32_MAX
> >
> > +enum xe_oa_submit_deps {
> > + XE_OA_SUBMIT_NO_DEPS,
> > + XE_OA_SUBMIT_ADD_DEPS,
> > +};
> > +
> > struct xe_oa_reg {
> > struct xe_reg addr;
> > u32 value;
> > @@ -568,7 +573,8 @@ static __poll_t xe_oa_poll(struct file *file, poll_table *wait)
> > return ret;
> > }
> >
> > -static struct dma_fence *xe_oa_submit_bb(struct xe_oa_stream *stream, struct xe_bb *bb)
> > +static struct dma_fence *xe_oa_submit_bb(struct xe_oa_stream *stream, enum xe_oa_submit_deps deps,
> > + struct xe_bb *bb)
> > {
> > struct xe_sched_job *job;
> > struct dma_fence *fence;
> > @@ -581,11 +587,22 @@ static struct dma_fence *xe_oa_submit_bb(struct xe_oa_stream *stream, struct xe_
> > goto exit;
> > }
> >
> > + if (deps == XE_OA_SUBMIT_ADD_DEPS) {
> > + for (int i = 0; i < stream->num_syncs && !err; i++)
> > + err = xe_sync_entry_add_deps(&stream->syncs[i], job);
>
> err needs to be initialized to 0; otherwise it could take the error path
> below when there are no syncs set.
Somehow I missed this because I never saw the drm_dbg print below. Anyway,
I have added the initialization, though the change is in Patch 1 of the
series, since the initialization was originally there and was removed by Patch 1.
Thanks for catching this,
Ashutosh
>
> > + if (err) {
> > + drm_dbg(&stream->oa->xe->drm, "xe_sync_entry_add_deps err %d\n", err);
> > + goto err_put_job;
> > + }
> > + }
> > +
> > xe_sched_job_arm(job);
> > fence = dma_fence_get(&job->drm.s_fence->finished);
> > xe_sched_job_push(job);
> >
> > return fence;
> > +err_put_job:
> > + xe_sched_job_put(job);
> > exit:
> > return ERR_PTR(err);
> > }
> > @@ -663,7 +680,7 @@ static int xe_oa_modify_ctx_image(struct xe_oa_stream *stream, struct xe_lrc *lr
> >
> > xe_oa_store_flex(stream, lrc, bb, flex, count);
> >
> > - fence = xe_oa_submit_bb(stream, bb);
> > + fence = xe_oa_submit_bb(stream, XE_OA_SUBMIT_NO_DEPS, bb);
> > if (IS_ERR(fence)) {
> > err = PTR_ERR(fence);
> > goto free_bb;
> > @@ -692,7 +709,7 @@ static int xe_oa_load_with_lri(struct xe_oa_stream *stream, struct xe_oa_reg *re
> >
> > write_cs_mi_lri(bb, reg_lri, 1);
> >
> > - fence = xe_oa_submit_bb(stream, bb);
> > + fence = xe_oa_submit_bb(stream, XE_OA_SUBMIT_NO_DEPS, bb);
> > if (IS_ERR(fence)) {
> > err = PTR_ERR(fence);
> > goto free_bb;
> > @@ -943,7 +960,7 @@ static int xe_oa_emit_oa_config(struct xe_oa_stream *stream, struct xe_oa_config
> > goto exit;
> > }
> >
> > - fence = xe_oa_submit_bb(stream, oa_bo->bb);
> > + fence = xe_oa_submit_bb(stream, XE_OA_SUBMIT_ADD_DEPS, oa_bo->bb);
> > if (IS_ERR(fence)) {
> > err = PTR_ERR(fence);
> > goto exit;
>
More information about the Intel-xe
mailing list