[Mesa-dev] [PATCHv2 1/6] r600g: make all scissor states use single atom

Marek Olšák maraeo at gmail.com
Thu Sep 3 09:07:45 PDT 2015


Pushed the series. Thanks.

Marek

On Thu, Sep 3, 2015 at 12:54 AM, Grazvydas Ignotas <notasas at gmail.com> wrote:
> As suggested by Marek Olšák, we can use single atom to track all scissor
> states. This will allow to simplify dirty atom handling later.
> ---
> v2: rebased, moved dirty_mask set out of the loop
>
>  src/gallium/drivers/r600/evergreen_state.c   | 36 ++++++++++++++--------
>  src/gallium/drivers/r600/r600_blit.c         |  2 +-
>  src/gallium/drivers/r600/r600_hw_context.c   |  4 ++-
>  src/gallium/drivers/r600/r600_pipe.h         |  8 ++---
>  src/gallium/drivers/r600/r600_state.c        | 46 +++++++++++++++++-----------
>  src/gallium/drivers/r600/r600_state_common.c |  6 ++--
>  6 files changed, 62 insertions(+), 40 deletions(-)
>
> diff --git a/src/gallium/drivers/r600/evergreen_state.c b/src/gallium/drivers/r600/evergreen_state.c
> index 0d4b598..3a7f583 100644
> --- a/src/gallium/drivers/r600/evergreen_state.c
> +++ b/src/gallium/drivers/r600/evergreen_state.c
> @@ -892,27 +892,38 @@ static void evergreen_set_scissor_states(struct pipe_context *ctx,
>                                         const struct pipe_scissor_state *state)
>  {
>         struct r600_context *rctx = (struct r600_context *)ctx;
> +       struct r600_scissor_state *rstate = &rctx->scissor;
>         int i;
>
> -       for (i = start_slot; i < start_slot + num_scissors; i++) {
> -               rctx->scissor[i].scissor = state[i - start_slot];
> -               r600_mark_atom_dirty(rctx, &rctx->scissor[i].atom);
> -       }
> +       for (i = start_slot; i < start_slot + num_scissors; i++)
> +               rstate->scissor[i] = state[i - start_slot];
> +       rstate->dirty_mask |= ((1 << num_scissors) - 1) << start_slot;
> +       rstate->atom.num_dw = util_bitcount(rstate->dirty_mask) * 4;
> +       r600_mark_atom_dirty(rctx, &rstate->atom);
>  }
>
>  static void evergreen_emit_scissor_state(struct r600_context *rctx, struct r600_atom *atom)
>  {
>         struct radeon_winsys_cs *cs = rctx->b.rings.gfx.cs;
> -       struct r600_scissor_state *rstate = (struct r600_scissor_state *)atom;
> -       struct pipe_scissor_state *state = &rstate->scissor;
> -       unsigned offset = rstate->idx * 4 * 2;
> +       struct r600_scissor_state *rstate = &rctx->scissor;
> +       struct pipe_scissor_state *state;
> +       uint32_t dirty_mask;
> +       unsigned i, offset;
>         uint32_t tl, br;
>
> -       evergreen_get_scissor_rect(rctx, state->minx, state->miny, state->maxx, state->maxy, &tl, &br);
> +       dirty_mask = rstate->dirty_mask;
> +       while (dirty_mask != 0) {
> +               i = u_bit_scan(&dirty_mask);
> +               state = &rstate->scissor[i];
> +               evergreen_get_scissor_rect(rctx, state->minx, state->miny, state->maxx, state->maxy, &tl, &br);
>
> -       radeon_set_context_reg_seq(cs, R_028250_PA_SC_VPORT_SCISSOR_0_TL + offset, 2);
> -       radeon_emit(cs, tl);
> -       radeon_emit(cs, br);
> +               offset = i * 4 * 2;
> +               radeon_set_context_reg_seq(cs, R_028250_PA_SC_VPORT_SCISSOR_0_TL + offset, 2);
> +               radeon_emit(cs, tl);
> +               radeon_emit(cs, br);
> +       }
> +       rstate->dirty_mask = 0;
> +       rstate->atom.num_dw = 0;
>  }
>
>  /**
> @@ -3491,11 +3502,10 @@ void evergreen_init_state_functions(struct r600_context *rctx)
>         r600_init_atom(rctx, &rctx->dsa_state.atom, id++, r600_emit_cso_state, 0);
>         r600_init_atom(rctx, &rctx->poly_offset_state.atom, id++, evergreen_emit_polygon_offset, 6);
>         r600_init_atom(rctx, &rctx->rasterizer_state.atom, id++, r600_emit_cso_state, 0);
> +       r600_init_atom(rctx, &rctx->scissor.atom, id++, evergreen_emit_scissor_state, 0);
>         for (i = 0; i < R600_MAX_VIEWPORTS; i++) {
>                 r600_init_atom(rctx, &rctx->viewport[i].atom, id++, r600_emit_viewport_state, 8);
> -               r600_init_atom(rctx, &rctx->scissor[i].atom, id++, evergreen_emit_scissor_state, 4);
>                 rctx->viewport[i].idx = i;
> -               rctx->scissor[i].idx = i;
>         }
>         r600_init_atom(rctx, &rctx->stencil_ref.atom, id++, r600_emit_stencil_ref, 4);
>         r600_init_atom(rctx, &rctx->vertex_fetch_shader.atom, id++, evergreen_emit_vertex_fetch_shader, 5);
> diff --git a/src/gallium/drivers/r600/r600_blit.c b/src/gallium/drivers/r600/r600_blit.c
> index 08b2f64..8774cb5 100644
> --- a/src/gallium/drivers/r600/r600_blit.c
> +++ b/src/gallium/drivers/r600/r600_blit.c
> @@ -66,7 +66,7 @@ static void r600_blitter_begin(struct pipe_context *ctx, enum r600_blitter_op op
>
>         if (op & R600_SAVE_FRAGMENT_STATE) {
>                 util_blitter_save_viewport(rctx->blitter, &rctx->viewport[0].state);
> -               util_blitter_save_scissor(rctx->blitter, &rctx->scissor[0].scissor);
> +               util_blitter_save_scissor(rctx->blitter, &rctx->scissor.scissor[0]);
>                 util_blitter_save_fragment_shader(rctx->blitter, rctx->ps_shader);
>                 util_blitter_save_blend(rctx->blitter, rctx->blend_state.cso);
>                 util_blitter_save_depth_stencil_alpha(rctx->blitter, rctx->dsa_state.cso);
> diff --git a/src/gallium/drivers/r600/r600_hw_context.c b/src/gallium/drivers/r600/r600_hw_context.c
> index 2fe29e9..c540325 100644
> --- a/src/gallium/drivers/r600/r600_hw_context.c
> +++ b/src/gallium/drivers/r600/r600_hw_context.c
> @@ -308,8 +308,10 @@ void r600_begin_new_cs(struct r600_context *ctx)
>         r600_mark_atom_dirty(ctx, &ctx->poly_offset_state.atom);
>         r600_mark_atom_dirty(ctx, &ctx->vgt_state.atom);
>         r600_mark_atom_dirty(ctx, &ctx->sample_mask.atom);
> +       ctx->scissor.dirty_mask = (1 << R600_MAX_VIEWPORTS) - 1;
> +       ctx->scissor.atom.num_dw = R600_MAX_VIEWPORTS * 4;
> +       r600_mark_atom_dirty(ctx, &ctx->scissor.atom);
>         for (i = 0; i < R600_MAX_VIEWPORTS; i++) {
> -               r600_mark_atom_dirty(ctx, &ctx->scissor[i].atom);
>                 r600_mark_atom_dirty(ctx, &ctx->viewport[i].atom);
>         }
>         if (ctx->b.chip_class < EVERGREEN) {
> diff --git a/src/gallium/drivers/r600/r600_pipe.h b/src/gallium/drivers/r600/r600_pipe.h
> index 8d5fd99..e09bee1 100644
> --- a/src/gallium/drivers/r600/r600_pipe.h
> +++ b/src/gallium/drivers/r600/r600_pipe.h
> @@ -38,7 +38,7 @@
>
>  #include "tgsi/tgsi_scan.h"
>
> -#define R600_NUM_ATOMS 75
> +#define R600_NUM_ATOMS 60
>
>  #define R600_MAX_VIEWPORTS 16
>
> @@ -393,9 +393,9 @@ struct r600_cso_state
>  struct r600_scissor_state
>  {
>         struct r600_atom                atom;
> -       struct pipe_scissor_state       scissor;
> +       struct pipe_scissor_state       scissor[R600_MAX_VIEWPORTS];
> +       uint32_t                        dirty_mask;
>         bool                            enable; /* r6xx only */
> -       int idx;
>  };
>
>  struct r600_fetch_shader {
> @@ -458,7 +458,7 @@ struct r600_context {
>         struct r600_poly_offset_state   poly_offset_state;
>         struct r600_cso_state           rasterizer_state;
>         struct r600_sample_mask         sample_mask;
> -       struct r600_scissor_state       scissor[R600_MAX_VIEWPORTS];
> +       struct r600_scissor_state       scissor;
>         struct r600_seamless_cube_map   seamless_cube_map;
>         struct r600_config_state        config_state;
>         struct r600_stencil_ref_state   stencil_ref;
> diff --git a/src/gallium/drivers/r600/r600_state.c b/src/gallium/drivers/r600/r600_state.c
> index f2d24a3..64a22e6 100644
> --- a/src/gallium/drivers/r600/r600_state.c
> +++ b/src/gallium/drivers/r600/r600_state.c
> @@ -769,21 +769,32 @@ static void r600_set_polygon_stipple(struct pipe_context *ctx,
>  static void r600_emit_scissor_state(struct r600_context *rctx, struct r600_atom *atom)
>  {
>         struct radeon_winsys_cs *cs = rctx->b.rings.gfx.cs;
> -       struct r600_scissor_state *rstate = (struct r600_scissor_state *)atom;
> -       struct pipe_scissor_state *state = &rstate->scissor;
> -       unsigned offset = rstate->idx * 4 * 2;
> +       struct r600_scissor_state *rstate = &rctx->scissor;
> +       struct pipe_scissor_state *state;
> +       uint32_t dirty_mask;
> +       unsigned i, offset;
>
> -       if (rctx->b.chip_class != R600 || rctx->scissor[0].enable) {
> -               radeon_set_context_reg_seq(cs, R_028250_PA_SC_VPORT_SCISSOR_0_TL + offset, 2);
> -               radeon_emit(cs, S_028240_TL_X(state->minx) | S_028240_TL_Y(state->miny) |
> -                                    S_028240_WINDOW_OFFSET_DISABLE(1));
> -               radeon_emit(cs, S_028244_BR_X(state->maxx) | S_028244_BR_Y(state->maxy));
> -       } else {
> +       if (rctx->b.chip_class == R600 && !rctx->scissor.enable) {
>                 radeon_set_context_reg_seq(cs, R_028250_PA_SC_VPORT_SCISSOR_0_TL, 2);
>                 radeon_emit(cs, S_028240_TL_X(0) | S_028240_TL_Y(0) |
>                                      S_028240_WINDOW_OFFSET_DISABLE(1));
>                 radeon_emit(cs, S_028244_BR_X(8192) | S_028244_BR_Y(8192));
> +               return;
> +       }
> +
> +       dirty_mask = rstate->dirty_mask;
> +       while (dirty_mask != 0)
> +       {
> +               i = u_bit_scan(&dirty_mask);
> +               offset = i * 4 * 2;
> +               state = &rstate->scissor[i];
> +               radeon_set_context_reg_seq(cs, R_028250_PA_SC_VPORT_SCISSOR_0_TL + offset, 2);
> +               radeon_emit(cs, S_028240_TL_X(state->minx) | S_028240_TL_Y(state->miny) |
> +                                    S_028240_WINDOW_OFFSET_DISABLE(1));
> +               radeon_emit(cs, S_028244_BR_X(state->maxx) | S_028244_BR_Y(state->maxy));
>         }
> +       rstate->dirty_mask = 0;
> +       rstate->atom.num_dw = 0;
>  }
>
>  static void r600_set_scissor_states(struct pipe_context *ctx,
> @@ -792,18 +803,18 @@ static void r600_set_scissor_states(struct pipe_context *ctx,
>                                      const struct pipe_scissor_state *state)
>  {
>         struct r600_context *rctx = (struct r600_context *)ctx;
> +       struct r600_scissor_state *rstate = &rctx->scissor;
>         int i;
>
> -       for (i = start_slot ; i < start_slot + num_scissors; i++) {
> -               rctx->scissor[i].scissor = state[i - start_slot];
> -       }
> +       for (i = start_slot ; i < start_slot + num_scissors; i++)
> +               rstate->scissor[i] = state[i - start_slot];
> +       rstate->dirty_mask |= ((1 << num_scissors) - 1) << start_slot;
> +       rstate->atom.num_dw = util_bitcount(rstate->dirty_mask) * 4;
>
> -       if (rctx->b.chip_class == R600 && !rctx->scissor[0].enable)
> +       if (rctx->b.chip_class == R600 && !rstate->enable)
>                 return;
>
> -       for (i = start_slot ; i < start_slot + num_scissors; i++) {
> -               r600_mark_atom_dirty(rctx, &rctx->scissor[i].atom);
> -       }
> +       r600_mark_atom_dirty(rctx, &rstate->atom);
>  }
>
>  static struct r600_resource *r600_buffer_create_helper(struct r600_screen *rscreen,
> @@ -3065,10 +3076,9 @@ void r600_init_state_functions(struct r600_context *rctx)
>         r600_init_atom(rctx, &rctx->dsa_state.atom, id++, r600_emit_cso_state, 0);
>         r600_init_atom(rctx, &rctx->poly_offset_state.atom, id++, r600_emit_polygon_offset, 6);
>         r600_init_atom(rctx, &rctx->rasterizer_state.atom, id++, r600_emit_cso_state, 0);
> +       r600_init_atom(rctx, &rctx->scissor.atom, id++, r600_emit_scissor_state, 0);
>         for (i = 0;i < R600_MAX_VIEWPORTS; i++) {
> -               r600_init_atom(rctx, &rctx->scissor[i].atom, id++, r600_emit_scissor_state, 4);
>                 r600_init_atom(rctx, &rctx->viewport[i].atom, id++, r600_emit_viewport_state, 8);
> -               rctx->scissor[i].idx = i;
>                 rctx->viewport[i].idx = i;
>         }
>         r600_init_atom(rctx, &rctx->config_state.atom, id++, r600_emit_config_state, 3);
> diff --git a/src/gallium/drivers/r600/r600_state_common.c b/src/gallium/drivers/r600/r600_state_common.c
> index 24ed74b..d2b6ebe 100644
> --- a/src/gallium/drivers/r600/r600_state_common.c
> +++ b/src/gallium/drivers/r600/r600_state_common.c
> @@ -372,9 +372,9 @@ static void r600_bind_rs_state(struct pipe_context *ctx, void *state)
>
>         /* Workaround for a missing scissor enable on r600. */
>         if (rctx->b.chip_class == R600 &&
> -           rs->scissor_enable != rctx->scissor[0].enable) {
> -               rctx->scissor[0].enable = rs->scissor_enable;
> -               r600_mark_atom_dirty(rctx, &rctx->scissor[0].atom);
> +           rs->scissor_enable != rctx->scissor.enable) {
> +               rctx->scissor.enable = rs->scissor_enable;
> +               r600_mark_atom_dirty(rctx, &rctx->scissor.atom);
>         }
>
>         /* Re-emit PA_SC_LINE_STIPPLE. */
> --
> 1.9.1
>
> _______________________________________________
> mesa-dev mailing list
> mesa-dev at lists.freedesktop.org
> http://lists.freedesktop.org/mailman/listinfo/mesa-dev


More information about the mesa-dev mailing list