[Intel-gfx] [PATCH v3 3/3] drm/i915/display: Program PSR2 selective fetch registers
Mun, Gwan-gyeong
gwan-gyeong.mun at intel.com
Thu Sep 24 13:27:17 UTC 2020
On Wed, 2020-09-23 at 10:09 -0700, Souza, Jose wrote:
> On Wed, 2020-09-23 at 10:10 -0700, José Roberto de Souza wrote:
> > On Wed, 2020-09-23 at 14:02 +0100, Mun, Gwan-gyeong wrote:
> > > On Thu, 2020-09-17 at 18:02 -0700, José Roberto de Souza wrote:
> > > > Another step towards PSR2 selective fetch, here programming
> > > > plane
> > > > selective fetch registers and MAN_TRK_CTL enabling selective
> > > > fetch
> > > > but
> > > > for now it is fetching the whole area of the planes.
> > > > The damaged area calculation will come as next and final step.
> > > >
> > > > v2:
> > > > - removed warn on when no plane is visible in state
> > > > - removed calculations using plane damaged area in
> > > > intel_psr2_program_plane_sel_fetch()
> > > >
> > > > v3:
> > > > - do not shift 16 positions the plane dst coordinates, only src
> > > > is
> > > > shifted
> > > >
> > > > BSpec: 55229
> > > > Cc: Gwan-gyeong Mun <
> > > > gwan-gyeong.mun at intel.com
> > > >
> > > >
> > > > Cc: Ville Syrjälä <
> > > > ville.syrjala at linux.intel.com
> > > >
> > > >
> > > > Signed-off-by: José Roberto de Souza <
> > > > jose.souza at intel.com
> > > >
> > > >
> > > > ---
> > > > drivers/gpu/drm/i915/display/intel_display.c | 10 +-
> > > > drivers/gpu/drm/i915/display/intel_psr.c | 120
> > > > ++++++++++++++++++-
> > > > drivers/gpu/drm/i915/display/intel_psr.h | 10 +-
> > > > drivers/gpu/drm/i915/display/intel_sprite.c | 3 +
> > > > 4 files changed, 134 insertions(+), 9 deletions(-)
> > > >
> > > > diff --git a/drivers/gpu/drm/i915/display/intel_display.c
> > > > b/drivers/gpu/drm/i915/display/intel_display.c
> > > > index 5a9d933e425a..96bc515497c1 100644
> > > > --- a/drivers/gpu/drm/i915/display/intel_display.c
> > > > +++ b/drivers/gpu/drm/i915/display/intel_display.c
> > > > @@ -11812,6 +11812,9 @@ static void i9xx_update_cursor(struct
> > > > intel_plane *plane,
> > > > if (INTEL_GEN(dev_priv) >= 9)
> > > > skl_write_cursor_wm(plane, crtc_state);
> > > >
> > > > + if (!needs_modeset(crtc_state))
> > > > + intel_psr2_program_plane_sel_fetch(plane,
> > > > crtc_state,
> > > > plane_state, 0);
> > > > +
> > > > if (plane->cursor.base != base ||
> > > > plane->cursor.size != fbc_ctl ||
> > > > plane->cursor.cntl != cntl) {
> > > > @@ -12823,8 +12826,11 @@ static int
> > > > intel_crtc_atomic_check(struct
> > > > intel_atomic_state *state,
> > > >
> > > > }
> > > >
> > > > - if (!mode_changed)
> > > > - intel_psr2_sel_fetch_update(state, crtc);
> > > > + if (!mode_changed) {
> > > > + ret = intel_psr2_sel_fetch_update(state, crtc);
> > > > + if (ret)
> > > > + return ret;
> > > > + }
> > > >
> > > > return 0;
> > > > }
> > > > diff --git a/drivers/gpu/drm/i915/display/intel_psr.c
> > > > b/drivers/gpu/drm/i915/display/intel_psr.c
> > > > index 02f74b0ddec1..deb0523f9f29 100644
> > > > --- a/drivers/gpu/drm/i915/display/intel_psr.c
> > > > +++ b/drivers/gpu/drm/i915/display/intel_psr.c
> > > > @@ -1166,6 +1166,41 @@ static void
> > > > psr_force_hw_tracking_exit(struct
> > > > drm_i915_private *dev_priv)
> > > > intel_psr_exit(dev_priv);
> > > > }
> > > >
> > > > +void intel_psr2_program_plane_sel_fetch(struct intel_plane
> > > > *plane,
> > > > + const struct
> > > > intel_crtc_state
> > > > *crtc_state,
> > > > + const struct
> > > > intel_plane_state
> > > > *plane_state,
> > > > + int color_plane)
> > > > +{
> > > > + struct drm_i915_private *dev_priv = to_i915(plane-
> > > > >base.dev);
> > > > + enum pipe pipe = plane->pipe;
> > > > + u32 val;
> > > > +
> > > > + if (!crtc_state->enable_psr2_sel_fetch)
> > > > + return;
> > > > +
> > > > + /*
> > > > + * skl_plane_ctl_crtc()/i9xx_cursor_ctl_crtc() return 0
> > > > for
> > > > gen11+, so
> > > > + * plane_state->ctl is the right value
> > > > + */
> > > > + val = plane_state ? plane_state->ctl : 0;
> > >
> > > IMHO, skl_plane_ctl() might set other ctl bits, so it would be
> > > better to
> > > have a separate ctl bit value for "selective fetch ctl".
> >
> > As I said, all the other bits are spares, so they can be set without
> > issues, but okay, I will do a "plane_state->ctl & PLANE_SEL_FETCH_CTL_ENABLE".
>
> Please take a look at the answer to your other comment below; with
> the change above can I have your rv-b?
The purpose and bit layout of Register_SEL_FETCH_PLANE_CTL are
different from those of Register_PLANE_CTL.
Also, the spare bits of Register_SEL_FETCH_PLANE_CTL might be used for
other purposes.
(And we currently don't know the side effects of setting the spare bits of
Register_SEL_FETCH_PLANE_CTL.)
Therefore I recommend a "Read and Modify" of SEL_FETCH_PLANE_CTL.
>
> > > > + intel_de_write_fw(dev_priv, PLANE_SEL_FETCH_CTL(pipe,
> > > > plane-
> > > > > id), val);
> > > >
> > > > + if (!val || plane->id == PLANE_CURSOR)
> > > > + return;
> > > > +
> > > > + val = plane_state->uapi.dst.y1 << 16 | plane_state-
> > > > > uapi.dst.x1;
> > > >
> > > > + intel_de_write_fw(dev_priv, PLANE_SEL_FETCH_POS(pipe,
> > > > plane-
> > > > > id), val);
> > > >
> > > > +
> > > > + val = plane_state->color_plane[color_plane].y << 16;
> > > > + val |= plane_state->color_plane[color_plane].x;
> > > > + intel_de_write_fw(dev_priv,
> > > > PLANE_SEL_FETCH_OFFSET(pipe, plane-
> > > > > id),
> > > >
> > > > + val);
> > > > +
> > > > + /* Sizes are 0 based */
> > > > + val = ((drm_rect_height(&plane_state->uapi.src) >> 16)
> > > > - 1) <<
> > > > 16;
> > > > + val |= (drm_rect_width(&plane_state->uapi.src) >> 16) -
> > > > 1;
> > > > + intel_de_write_fw(dev_priv, PLANE_SEL_FETCH_SIZE(pipe,
> > > > plane-
> > > > > id), val);
> > > >
> > > > +}
> > > > +
> > > > void intel_psr2_program_trans_man_trk_ctl(const struct
> > > > intel_crtc_state *crtc_state)
> > > > {
> > > > struct intel_crtc *crtc = to_intel_crtc(crtc_state-
> > > > >uapi.crtc);
> > > > @@ -1180,16 +1215,91 @@ void
> > > > intel_psr2_program_trans_man_trk_ctl(const struct
> > > > intel_crtc_state
> > > > *crtc_st
> > > > crtc_state->psr2_man_track_ctl);
> > > > }
> > > >
> > > > -void intel_psr2_sel_fetch_update(struct intel_atomic_state
> > > > *state,
> > > > - struct intel_crtc *crtc)
> > > > +static void psr2_man_trk_ctl_calc(struct intel_crtc_state
> > > > *crtc_state,
> > > > + struct drm_rect *clip, bool
> > > > full_update)
> > > > +{
> > > > + u32 val = PSR2_MAN_TRK_CTL_ENABLE;
> > > > +
> > > > + if (full_update) {
> > > > + val |= PSR2_MAN_TRK_CTL_SF_SINGLE_FULL_FRAME;
> > > > + goto exit;
> > > > + }
> > > > +
> > > > + if (clip->y1 == -1)
> > > > + goto exit;
> > > > +
> > > > + val |= PSR2_MAN_TRK_CTL_SF_PARTIAL_FRAME_UPDATE;
> > > > + val |= PSR2_MAN_TRK_CTL_SU_REGION_START_ADDR(clip->y1 /
> > > > 4 + 1);
> > >
> > > I think the start address block would be like this too.
> > > PSR2_MAN_TRK_CTL_SU_REGION_START_ADDR(DIV_ROUND_UP(clip->y1 ,
> > > 4));
> >
> > This would not match for numbers that divide by 4.
> > y pos 0 = region 1
> > y pos 1 = region 1
> > y pos 4 = region 2
> >
Yes, you are right.
> >
> > > > + val |=
> > > > PSR2_MAN_TRK_CTL_SU_REGION_END_ADDR(DIV_ROUND_UP(clip-
> > > > > y2, 4) + 1);
> > > >
> > > > +exit:
> > > > + crtc_state->psr2_man_track_ctl = val;
> > > > +}
> > > > +
> > > > +static void clip_area_update(struct drm_rect
> > > > *overlap_damage_area,
> > > > + struct drm_rect *damage_area)
> > > > +{
> > > > + if (overlap_damage_area->y1 == -1) {
> > > > + overlap_damage_area->y1 = damage_area->y1;
> > > > + overlap_damage_area->y2 = damage_area->y2;
> > > > + return;
> > > > + }
> > > > +
> > > > + if (damage_area->y1 < overlap_damage_area->y1)
> > > > + overlap_damage_area->y1 = damage_area->y1;
> > > > +
> > > > + if (damage_area->y2 > overlap_damage_area->y2)
> > > > + overlap_damage_area->y2 = damage_area->y2;
> > > > +}
> > > > +
> > > > +int intel_psr2_sel_fetch_update(struct intel_atomic_state
> > > > *state,
> > > > + struct intel_crtc *crtc)
> > > > {
> > > > struct intel_crtc_state *crtc_state =
> > > > intel_atomic_get_new_crtc_state(state, crtc);
> > > > + struct intel_plane_state *new_plane_state,
> > > > *old_plane_state;
> > > > + struct drm_rect pipe_clip = { .y1 = -1 };
> > > > + struct intel_plane *plane;
> > > > + bool full_update = false;
> > > > + int i, ret;
> > > >
> > > > if (!crtc_state->enable_psr2_sel_fetch)
> > > > - return;
> > > > + return 0;
> > > > +
> > > > + ret = drm_atomic_add_affected_planes(&state->base,
> > > > &crtc-
> > > > > base);
> > > >
> > > > + if (ret)
> > > > + return ret;
> > > > +
> > > > + for_each_oldnew_intel_plane_in_state(state, plane,
> > > > old_plane_state,
> > > > + new_plane_state,
> > > > i) {
> > > > + struct drm_rect temp;
> > > > +
> > > > + if (new_plane_state->uapi.crtc != crtc_state-
> > > > > uapi.crtc)
> > > >
> > > > + continue;
> > > >
> > > > - crtc_state->psr2_man_track_ctl =
> > > > PSR2_MAN_TRK_CTL_ENABLE |
> > > > - PSR2_MAN_TRK_CTL_SF_SI
> > > > NGLE_FUL
> > > > L_FRAME;
> > > > + /*
> > > > + * TODO: Not clear how to handle planes with
> > > > negative
> > > > position,
> > > > + * also planes are not updated if they have a
> > > > negative
> > > > X
> > > > + * position so for now doing a full update in
> > > > this
> > > > cases
> > > > + */
> > > > + if (new_plane_state->uapi.dst.y1 < 0 ||
> > > > + new_plane_state->uapi.dst.x1 < 0) {
> > > > + full_update = true;
> > > > + break;
> > > > + }
> > > > +
> > > > + if (!new_plane_state->uapi.visible)
> > > > + continue;
> > > > +
> > > > + /*
> > > > + * For now doing a selective fetch in the whole
> > > > plane
> > > > area,
> > > > + * optimizations will come in the future.
> > > > + */
> > > > + temp.y1 = new_plane_state->uapi.dst.y1;
> > > > + temp.y2 = new_plane_state->uapi.dst.y2;
> > > > + clip_area_update(&pipe_clip, &temp);
> > > > + }
> > > > +
> > > > + psr2_man_trk_ctl_calc(crtc_state, &pipe_clip,
> > > > full_update);
> > > > + return 0;
> > > > }
> > > >
> > > > /**
> > > > diff --git a/drivers/gpu/drm/i915/display/intel_psr.h
> > > > b/drivers/gpu/drm/i915/display/intel_psr.h
> > > > index 6a83c8e682e6..3eca9dcec3c0 100644
> > > > --- a/drivers/gpu/drm/i915/display/intel_psr.h
> > > > +++ b/drivers/gpu/drm/i915/display/intel_psr.h
> > > > @@ -15,6 +15,8 @@ struct intel_crtc_state;
> > > > struct intel_dp;
> > > > struct intel_crtc;
> > > > struct intel_atomic_state;
> > > > +struct intel_plane_state;
> > > > +struct intel_plane;
> > > >
> > > > #define CAN_PSR(dev_priv) (HAS_PSR(dev_priv) && dev_priv-
> > > > > psr.sink_support)
> > > >
> > > > void intel_psr_init_dpcd(struct intel_dp *intel_dp);
> > > > @@ -45,8 +47,12 @@ void intel_psr_atomic_check(struct
> > > > drm_connector
> > > > *connector,
> > > > struct drm_connector_state
> > > > *old_state,
> > > > struct drm_connector_state
> > > > *new_state);
> > > > void intel_psr_set_force_mode_changed(struct intel_dp
> > > > *intel_dp);
> > > > -void intel_psr2_sel_fetch_update(struct intel_atomic_state
> > > > *state,
> > > > - struct intel_crtc *crtc);
> > > > +int intel_psr2_sel_fetch_update(struct intel_atomic_state
> > > > *state,
> > > > + struct intel_crtc *crtc);
> > > > void intel_psr2_program_trans_man_trk_ctl(const struct
> > > > intel_crtc_state *crtc_state);
> > > > +void intel_psr2_program_plane_sel_fetch(struct intel_plane
> > > > *plane,
> > > > + const struct
> > > > intel_crtc_state
> > > > *crtc_state,
> > > > + const struct
> > > > intel_plane_state
> > > > *plane_state,
> > > > + int color_plane);
> > > >
> > > > #endif /* __INTEL_PSR_H__ */
> > > > diff --git a/drivers/gpu/drm/i915/display/intel_sprite.c
> > > > b/drivers/gpu/drm/i915/display/intel_sprite.c
> > > > index 63040cb0d4e1..f12425b90607 100644
> > > > --- a/drivers/gpu/drm/i915/display/intel_sprite.c
> > > > +++ b/drivers/gpu/drm/i915/display/intel_sprite.c
> > > > @@ -690,6 +690,9 @@ skl_program_plane(struct intel_plane
> > > > *plane,
> > > > intel_de_write_fw(dev_priv,
> > > > PLANE_AUX_OFFSET(pipe,
> > > > plane_id),
> > > > (plane_state-
> > > > >color_plane[1].y << 16)
> > > > > plane_state->color_plane[1].x);
> > > >
> > > >
> > > > + if (!drm_atomic_crtc_needs_modeset(&crtc_state->uapi))
> > > > + intel_psr2_program_plane_sel_fetch(plane,
> > > > crtc_state,
> > > > plane_state, color_plane);
> > > > +
> > > > /*
> > > > * The control register self-arms if the plane was
> > > > previously
> > > > * disabled. Try to make the plane enable atomic by
> > > > writing
More information about the Intel-gfx
mailing list