[Mesa-dev] [PATCH] gallium: allow setting of the internal stream output offset
Roland Scheidegger
sroland at vmware.com
Fri Mar 7 13:32:28 PST 2014
Reviewed-by: Roland Scheidegger <sroland at vmware.com>
Am 07.03.2014 04:09, schrieb Zack Rusin:
> (This version includes comments from Roland.)
>
> D3D10 allows setting of the internal offset of a buffer, which is
> in general only incremented via actual stream output writes. By
> allowing setting of the internal offset draw_auto is capable
> of rendering from buffers which have not been actually streamed
> out to. Our interface didn't allow. This change functionally
> shouldn't make any difference to OpenGL where instead of an
> append_bitmask you just get a real array where -1 means append
> (like in D3D) and 0 means do not append.
>
> Signed-off-by: Zack Rusin <zackr at vmware.com>
> ---
> src/gallium/auxiliary/cso_cache/cso_context.c | 13 ++++++++-----
> src/gallium/auxiliary/cso_cache/cso_context.h | 2 +-
> src/gallium/auxiliary/draw/draw_context.h | 3 +--
> src/gallium/auxiliary/draw/draw_pt.c | 8 +++++---
> src/gallium/auxiliary/draw/draw_pt_so_emit.c | 3 +--
> src/gallium/auxiliary/hud/hud_context.c | 2 +-
> src/gallium/auxiliary/postprocess/pp_run.c | 2 +-
> src/gallium/auxiliary/util/u_blit.c | 2 +-
> src/gallium/auxiliary/util/u_blitter.c | 13 +++++++++----
> src/gallium/auxiliary/util/u_gen_mipmap.c | 2 +-
> src/gallium/docs/source/context.rst | 9 +++++----
> src/gallium/drivers/galahad/glhd_context.c | 4 ++--
> src/gallium/drivers/ilo/ilo_state.c | 8 ++++++--
> src/gallium/drivers/llvmpipe/lp_state_so.c | 12 ++++++------
> src/gallium/drivers/noop/noop_state.c | 2 +-
> src/gallium/drivers/nouveau/nv50/nv50_state.c | 7 ++++---
> src/gallium/drivers/nouveau/nvc0/nvc0_state.c | 7 ++++---
> src/gallium/drivers/radeon/r600_pipe_common.h | 2 +-
> src/gallium/drivers/radeon/r600_streamout.c | 5 ++++-
> src/gallium/drivers/radeonsi/si_descriptors.c | 4 ++--
> src/gallium/drivers/softpipe/sp_state_so.c | 2 +-
> src/gallium/drivers/trace/tr_context.c | 6 +++---
> src/gallium/include/pipe/p_context.h | 2 +-
> src/gallium/tools/trace/dump_state.py | 4 ++--
> src/mesa/state_tracker/st_cb_bitmap.c | 2 +-
> src/mesa/state_tracker/st_cb_clear.c | 2 +-
> src/mesa/state_tracker/st_cb_drawpixels.c | 2 +-
> src/mesa/state_tracker/st_cb_drawtex.c | 2 +-
> src/mesa/state_tracker/st_cb_xformfb.c | 20 +++++++++++++-------
> 29 files changed, 88 insertions(+), 64 deletions(-)
>
> diff --git a/src/gallium/auxiliary/cso_cache/cso_context.c b/src/gallium/auxiliary/cso_cache/cso_context.c
> index 2dcf01d..9146684 100644
> --- a/src/gallium/auxiliary/cso_cache/cso_context.c
> +++ b/src/gallium/auxiliary/cso_cache/cso_context.c
> @@ -332,7 +332,7 @@ void cso_release_all( struct cso_context *ctx )
> ctx->pipe->bind_vertex_elements_state( ctx->pipe, NULL );
>
> if (ctx->pipe->set_stream_output_targets)
> - ctx->pipe->set_stream_output_targets(ctx->pipe, 0, NULL, 0);
> + ctx->pipe->set_stream_output_targets(ctx->pipe, 0, NULL, NULL);
> }
>
> /* free fragment sampler views */
> @@ -1241,7 +1241,7 @@ void
> cso_set_stream_outputs(struct cso_context *ctx,
> unsigned num_targets,
> struct pipe_stream_output_target **targets,
> - unsigned append_bitmask)
> + const unsigned *offsets)
> {
> struct pipe_context *pipe = ctx->pipe;
> uint i;
> @@ -1266,7 +1266,7 @@ cso_set_stream_outputs(struct cso_context *ctx,
> }
>
> pipe->set_stream_output_targets(pipe, num_targets, targets,
> - append_bitmask);
> + offsets);
> ctx->nr_so_targets = num_targets;
> }
>
> @@ -1292,6 +1292,7 @@ cso_restore_stream_outputs(struct cso_context *ctx)
> {
> struct pipe_context *pipe = ctx->pipe;
> uint i;
> + unsigned offset[PIPE_MAX_SO_BUFFERS];
>
> if (!ctx->has_streamout) {
> return;
> @@ -1302,19 +1303,21 @@ cso_restore_stream_outputs(struct cso_context *ctx)
> return;
> }
>
> + assert(ctx->nr_so_targets_saved <= PIPE_MAX_SO_BUFFERS);
> for (i = 0; i < ctx->nr_so_targets_saved; i++) {
> pipe_so_target_reference(&ctx->so_targets[i], NULL);
> /* move the reference from one pointer to another */
> ctx->so_targets[i] = ctx->so_targets_saved[i];
> ctx->so_targets_saved[i] = NULL;
> + /* -1 means append */
> + offset[i] = (unsigned)-1;
> }
> for (; i < ctx->nr_so_targets; i++) {
> pipe_so_target_reference(&ctx->so_targets[i], NULL);
> }
>
> - /* ~0 means append */
> pipe->set_stream_output_targets(pipe, ctx->nr_so_targets_saved,
> - ctx->so_targets, ~0);
> + ctx->so_targets, offset);
>
> ctx->nr_so_targets = ctx->nr_so_targets_saved;
> ctx->nr_so_targets_saved = 0;
> diff --git a/src/gallium/auxiliary/cso_cache/cso_context.h b/src/gallium/auxiliary/cso_cache/cso_context.h
> index 822e2df..1aa9998 100644
> --- a/src/gallium/auxiliary/cso_cache/cso_context.h
> +++ b/src/gallium/auxiliary/cso_cache/cso_context.h
> @@ -115,7 +115,7 @@ unsigned cso_get_aux_vertex_buffer_slot(struct cso_context *ctx);
> void cso_set_stream_outputs(struct cso_context *ctx,
> unsigned num_targets,
> struct pipe_stream_output_target **targets,
> - unsigned append_bitmask);
> + const unsigned *offsets);
> void cso_save_stream_outputs(struct cso_context *ctx);
> void cso_restore_stream_outputs(struct cso_context *ctx);
>
> diff --git a/src/gallium/auxiliary/draw/draw_context.h b/src/gallium/auxiliary/draw/draw_context.h
> index c9f933c..f114f50 100644
> --- a/src/gallium/auxiliary/draw/draw_context.h
> +++ b/src/gallium/auxiliary/draw/draw_context.h
> @@ -53,14 +53,13 @@ struct tgsi_sampler;
> * structure to contain driver internal information
> * for stream out support. mapping stores the pointer
> * to the buffer contents, and internal offset stores
> - * stores an internal counter to how much of the stream
> + * an internal counter to how much of the stream
> * out buffer is used (in bytes).
> */
> struct draw_so_target {
> struct pipe_stream_output_target target;
> void *mapping;
> int internal_offset;
> - int emitted_vertices;
> };
>
> struct draw_context *draw_create( struct pipe_context *pipe );
> diff --git a/src/gallium/auxiliary/draw/draw_pt.c b/src/gallium/auxiliary/draw/draw_pt.c
> index e2ff7f9..3236e52 100644
> --- a/src/gallium/auxiliary/draw/draw_pt.c
> +++ b/src/gallium/auxiliary/draw/draw_pt.c
> @@ -431,14 +431,16 @@ draw_pt_arrays_restart(struct draw_context *draw,
> */
> static void
> resolve_draw_info(const struct pipe_draw_info *raw_info,
> - struct pipe_draw_info *info)
> + struct pipe_draw_info *info,
> + struct pipe_vertex_buffer *vertex_buffer)
> {
> memcpy(info, raw_info, sizeof(struct pipe_draw_info));
>
> if (raw_info->count_from_stream_output) {
> struct draw_so_target *target =
> (struct draw_so_target *)info->count_from_stream_output;
> - info->count = target->emitted_vertices;
> + assert(vertex_buffer != NULL);
> + info->count = target->internal_offset / vertex_buffer->stride;
>
> /* Stream output draw can not be indexed */
> debug_assert(!info->indexed);
> @@ -467,7 +469,7 @@ draw_vbo(struct draw_context *draw,
> */
> util_fpstate_set_denorms_to_zero(fpstate);
>
> - resolve_draw_info(info, &resolved_info);
> + resolve_draw_info(info, &resolved_info, &(draw->pt.vertex_buffer[0]));
> info = &resolved_info;
>
> assert(info->instance_count > 0);
> diff --git a/src/gallium/auxiliary/draw/draw_pt_so_emit.c b/src/gallium/auxiliary/draw/draw_pt_so_emit.c
> index 7cef17c..bd49d0a 100644
> --- a/src/gallium/auxiliary/draw/draw_pt_so_emit.c
> +++ b/src/gallium/auxiliary/draw/draw_pt_so_emit.c
> @@ -194,7 +194,7 @@ static void so_emit_prim(struct pt_so_emit *so,
> {
> int j;
> debug_printf("VERT[%d], offset = %d, slot[%d] sc = %d, num_c = %d, idx = %d = [",
> - i + draw->so.targets[ob]->emitted_vertices,
> + i,
> draw->so.targets[ob]->internal_offset,
> slot, start_comp, num_comps, idx);
> for (j = 0; j < num_comps; ++j) {
> @@ -209,7 +209,6 @@ static void so_emit_prim(struct pt_so_emit *so,
> struct draw_so_target *target = draw->so.targets[ob];
> if (target && buffer_written[ob]) {
> target->internal_offset += state->stride[ob] * sizeof(float);
> - target->emitted_vertices += 1;
> }
> }
> }
> diff --git a/src/gallium/auxiliary/hud/hud_context.c b/src/gallium/auxiliary/hud/hud_context.c
> index 465013c..ccf020b 100644
> --- a/src/gallium/auxiliary/hud/hud_context.c
> +++ b/src/gallium/auxiliary/hud/hud_context.c
> @@ -454,7 +454,7 @@ hud_draw(struct hud_context *hud, struct pipe_resource *tex)
> cso_set_depth_stencil_alpha(cso, &hud->dsa);
> cso_set_rasterizer(cso, &hud->rasterizer);
> cso_set_viewport(cso, &viewport);
> - cso_set_stream_outputs(cso, 0, NULL, 0);
> + cso_set_stream_outputs(cso, 0, NULL, NULL);
> cso_set_geometry_shader_handle(cso, NULL);
> cso_set_vertex_shader_handle(cso, hud->vs);
> cso_set_vertex_elements(cso, 2, hud->velems);
> diff --git a/src/gallium/auxiliary/postprocess/pp_run.c b/src/gallium/auxiliary/postprocess/pp_run.c
> index a4dc75d..7d9330c 100644
> --- a/src/gallium/auxiliary/postprocess/pp_run.c
> +++ b/src/gallium/auxiliary/postprocess/pp_run.c
> @@ -136,7 +136,7 @@ pp_run(struct pp_queue_t *ppq, struct pipe_resource *in,
>
> /* set default state */
> cso_set_sample_mask(cso, ~0);
> - cso_set_stream_outputs(cso, 0, NULL, 0);
> + cso_set_stream_outputs(cso, 0, NULL, NULL);
> cso_set_geometry_shader_handle(cso, NULL);
> cso_set_render_condition(cso, NULL, FALSE, 0);
>
> diff --git a/src/gallium/auxiliary/util/u_blit.c b/src/gallium/auxiliary/util/u_blit.c
> index dd33eb0..4b25b93 100644
> --- a/src/gallium/auxiliary/util/u_blit.c
> +++ b/src/gallium/auxiliary/util/u_blit.c
> @@ -537,7 +537,7 @@ util_blit_pixels_tex(struct blit_state *ctx,
> cso_set_sample_mask(ctx->cso, ~0);
> cso_set_rasterizer(ctx->cso, &ctx->rasterizer);
> cso_set_vertex_elements(ctx->cso, 2, ctx->velem);
> - cso_set_stream_outputs(ctx->cso, 0, NULL, 0);
> + cso_set_stream_outputs(ctx->cso, 0, NULL, NULL);
>
> /* sampler */
> ctx->sampler.normalized_coords = normalized;
> diff --git a/src/gallium/auxiliary/util/u_blitter.c b/src/gallium/auxiliary/util/u_blitter.c
> index 66b511e..1e7f374 100644
> --- a/src/gallium/auxiliary/util/u_blitter.c
> +++ b/src/gallium/auxiliary/util/u_blitter.c
> @@ -472,9 +472,12 @@ static void blitter_restore_vertex_states(struct blitter_context_priv *ctx)
>
> /* Stream outputs. */
> if (ctx->has_stream_out) {
> + unsigned offsets[PIPE_MAX_SO_BUFFERS];
> + for (i = 0; i < ctx->base.saved_num_so_targets; i++)
> + offsets[i] = (unsigned)-1;
> pipe->set_stream_output_targets(pipe,
> ctx->base.saved_num_so_targets,
> - ctx->base.saved_so_targets, ~0);
> + ctx->base.saved_so_targets, offsets);
>
> for (i = 0; i < ctx->base.saved_num_so_targets; i++)
> pipe_so_target_reference(&ctx->base.saved_so_targets[i], NULL);
> @@ -1013,7 +1016,7 @@ static void blitter_set_common_draw_rect_state(struct blitter_context_priv *ctx,
> if (ctx->has_geometry_shader)
> pipe->bind_gs_state(pipe, NULL);
> if (ctx->has_stream_out)
> - pipe->set_stream_output_targets(pipe, 0, NULL, 0);
> + pipe->set_stream_output_targets(pipe, 0, NULL, NULL);
> }
>
> static void blitter_draw(struct blitter_context_priv *ctx,
> @@ -1806,6 +1809,7 @@ void util_blitter_copy_buffer(struct blitter_context *blitter,
> struct pipe_context *pipe = ctx->base.pipe;
> struct pipe_vertex_buffer vb;
> struct pipe_stream_output_target *so_target;
> + unsigned offsets[PIPE_MAX_SO_BUFFERS] = {0};
>
> if (srcx >= src->width0 ||
> dstx >= dst->width0) {
> @@ -1847,7 +1851,7 @@ void util_blitter_copy_buffer(struct blitter_context *blitter,
> pipe->bind_rasterizer_state(pipe, ctx->rs_discard_state);
>
> so_target = pipe->create_stream_output_target(pipe, dst, dstx, size);
> - pipe->set_stream_output_targets(pipe, 1, &so_target, 0);
> + pipe->set_stream_output_targets(pipe, 1, &so_target, offsets);
>
> util_draw_arrays(pipe, PIPE_PRIM_POINTS, 0, size / 4);
>
> @@ -1867,6 +1871,7 @@ void util_blitter_clear_buffer(struct blitter_context *blitter,
> struct pipe_context *pipe = ctx->base.pipe;
> struct pipe_vertex_buffer vb = {0};
> struct pipe_stream_output_target *so_target;
> + unsigned offsets[PIPE_MAX_SO_BUFFERS] = {0};
>
> assert(num_channels >= 1);
> assert(num_channels <= 4);
> @@ -1906,7 +1911,7 @@ void util_blitter_clear_buffer(struct blitter_context *blitter,
> pipe->bind_rasterizer_state(pipe, ctx->rs_discard_state);
>
> so_target = pipe->create_stream_output_target(pipe, dst, offset, size);
> - pipe->set_stream_output_targets(pipe, 1, &so_target, 0);
> + pipe->set_stream_output_targets(pipe, 1, &so_target, offsets);
>
> util_draw_arrays(pipe, PIPE_PRIM_POINTS, 0, size / 4);
>
> diff --git a/src/gallium/auxiliary/util/u_gen_mipmap.c b/src/gallium/auxiliary/util/u_gen_mipmap.c
> index d3401a6..dad3ad2 100644
> --- a/src/gallium/auxiliary/util/u_gen_mipmap.c
> +++ b/src/gallium/auxiliary/util/u_gen_mipmap.c
> @@ -1578,7 +1578,7 @@ util_gen_mipmap(struct gen_mipmap_state *ctx,
> cso_set_rasterizer(ctx->cso, &ctx->rasterizer);
> cso_set_sample_mask(ctx->cso, ~0);
> cso_set_vertex_elements(ctx->cso, 2, ctx->velem);
> - cso_set_stream_outputs(ctx->cso, 0, NULL, 0);
> + cso_set_stream_outputs(ctx->cso, 0, NULL, NULL);
> cso_set_render_condition(ctx->cso, NULL, FALSE, 0);
>
> set_fragment_shader(ctx, type, is_depth);
> diff --git a/src/gallium/docs/source/context.rst b/src/gallium/docs/source/context.rst
> index 64df0ac..8e14522 100644
> --- a/src/gallium/docs/source/context.rst
> +++ b/src/gallium/docs/source/context.rst
> @@ -182,10 +182,11 @@ discussed above.
> use pipe_so_target_reference instead.
>
> * ``set_stream_output_targets`` binds stream output targets. The parameter
> - append_bitmask is a bitmask, where the i-th bit specifies whether new
> - primitives should be appended to the i-th buffer (writing starts at
> - the internal offset), or whether writing should start at the beginning
> - (the internal offset is effectively set to 0).
> + offset is an array which specifies the internal offset of the buffer. The
> + internal offset is, besides writing, used for reading the data during the
> + draw_auto stage, i.e. it specifies how much data there is in the buffer
> + for the purposes of the draw_auto stage. -1 means the buffer should
> + be appended to, and everything else sets the internal offset.
>
> NOTE: The currently-bound vertex or geometry shader must be compiled with
> the properly-filled-in structure pipe_stream_output_info describing which
> diff --git a/src/gallium/drivers/galahad/glhd_context.c b/src/gallium/drivers/galahad/glhd_context.c
> index fa743bd..2e61e59 100644
> --- a/src/gallium/drivers/galahad/glhd_context.c
> +++ b/src/gallium/drivers/galahad/glhd_context.c
> @@ -613,12 +613,12 @@ static INLINE void
> galahad_context_set_stream_output_targets(struct pipe_context *_pipe,
> unsigned num_targets,
> struct pipe_stream_output_target **tgs,
> - unsigned append_bitmask)
> + const unsigned *offsets)
> {
> struct galahad_context *glhd_pipe = galahad_context(_pipe);
> struct pipe_context *pipe = glhd_pipe->pipe;
>
> - pipe->set_stream_output_targets(pipe, num_targets, tgs, append_bitmask);
> + pipe->set_stream_output_targets(pipe, num_targets, tgs, offsets);
> }
>
> static void
> diff --git a/src/gallium/drivers/ilo/ilo_state.c b/src/gallium/drivers/ilo/ilo_state.c
> index 43dc347..1b97eaa 100644
> --- a/src/gallium/drivers/ilo/ilo_state.c
> +++ b/src/gallium/drivers/ilo/ilo_state.c
> @@ -856,10 +856,11 @@ static void
> ilo_set_stream_output_targets(struct pipe_context *pipe,
> unsigned num_targets,
> struct pipe_stream_output_target **targets,
> - unsigned append_bitmask)
> + const unsigned *offset)
> {
> struct ilo_context *ilo = ilo_context(pipe);
> unsigned i;
> + unsigned append_bitmask = 0;
>
> if (!targets)
> num_targets = 0;
> @@ -868,8 +869,11 @@ ilo_set_stream_output_targets(struct pipe_context *pipe,
> if (!ilo->so.count && !num_targets)
> return;
>
> - for (i = 0; i < num_targets; i++)
> + for (i = 0; i < num_targets; i++) {
> pipe_so_target_reference(&ilo->so.states[i], targets[i]);
> + if (offset[i] == (unsigned)-1)
> + append_bitmask |= 1 << i;
> + }
>
> for (; i < ilo->so.count; i++)
> pipe_so_target_reference(&ilo->so.states[i], NULL);
> diff --git a/src/gallium/drivers/llvmpipe/lp_state_so.c b/src/gallium/drivers/llvmpipe/lp_state_so.c
> index fa58f79..2af04cd 100644
> --- a/src/gallium/drivers/llvmpipe/lp_state_so.c
> +++ b/src/gallium/drivers/llvmpipe/lp_state_so.c
> @@ -64,17 +64,17 @@ static void
> llvmpipe_set_so_targets(struct pipe_context *pipe,
> unsigned num_targets,
> struct pipe_stream_output_target **targets,
> - unsigned append_bitmask)
> + const unsigned *offsets)
> {
> struct llvmpipe_context *llvmpipe = llvmpipe_context(pipe);
> int i;
> for (i = 0; i < num_targets; i++) {
> + const boolean append = (offsets[i] == (unsigned)-1);
> pipe_so_target_reference((struct pipe_stream_output_target **)&llvmpipe->so_targets[i], targets[i]);
> - /* if we're not appending then lets reset the internal
> - data of our so target */
> - if (!(append_bitmask & (1 << i)) && llvmpipe->so_targets[i]) {
> - llvmpipe->so_targets[i]->internal_offset = 0;
> - llvmpipe->so_targets[i]->emitted_vertices = 0;
> + /* If we're not appending then lets set the internal
> + offset to what was requested */
> + if (!append && llvmpipe->so_targets[i]) {
> + llvmpipe->so_targets[i]->internal_offset = offsets[i];
> }
> }
>
> diff --git a/src/gallium/drivers/noop/noop_state.c b/src/gallium/drivers/noop/noop_state.c
> index 9c62c27..5cb37b6 100644
> --- a/src/gallium/drivers/noop/noop_state.c
> +++ b/src/gallium/drivers/noop/noop_state.c
> @@ -274,7 +274,7 @@ static void noop_stream_output_target_destroy(struct pipe_context *ctx,
> static void noop_set_stream_output_targets(struct pipe_context *ctx,
> unsigned num_targets,
> struct pipe_stream_output_target **targets,
> - unsigned append_bitmask)
> + const unsigned *offsets)
> {
> }
>
> diff --git a/src/gallium/drivers/nouveau/nv50/nv50_state.c b/src/gallium/drivers/nouveau/nv50/nv50_state.c
> index 288ba46..065e10c 100644
> --- a/src/gallium/drivers/nouveau/nv50/nv50_state.c
> +++ b/src/gallium/drivers/nouveau/nv50/nv50_state.c
> @@ -1051,7 +1051,7 @@ static void
> nv50_set_stream_output_targets(struct pipe_context *pipe,
> unsigned num_targets,
> struct pipe_stream_output_target **targets,
> - unsigned append_mask)
> + const unsigned *offsets)
> {
> struct nv50_context *nv50 = nv50_context(pipe);
> unsigned i;
> @@ -1062,7 +1062,8 @@ nv50_set_stream_output_targets(struct pipe_context *pipe,
>
> for (i = 0; i < num_targets; ++i) {
> const boolean changed = nv50->so_target[i] != targets[i];
> - if (!changed && (append_mask & (1 << i)))
> + const boolean append = (offsets[i] == (unsigned)-1);
> + if (!changed && append)
> continue;
> nv50->so_targets_dirty |= 1 << i;
>
> @@ -1071,7 +1072,7 @@ nv50_set_stream_output_targets(struct pipe_context *pipe,
> serialize = FALSE;
> }
>
> - if (targets[i] && !(append_mask & (1 << i)))
> + if (targets[i] && !append)
> nv50_so_target(targets[i])->clean = TRUE;
>
> pipe_so_target_reference(&nv50->so_target[i], targets[i]);
> diff --git a/src/gallium/drivers/nouveau/nvc0/nvc0_state.c b/src/gallium/drivers/nouveau/nvc0/nvc0_state.c
> index 0213a8e..8fcff01 100644
> --- a/src/gallium/drivers/nouveau/nvc0/nvc0_state.c
> +++ b/src/gallium/drivers/nouveau/nvc0/nvc0_state.c
> @@ -1027,7 +1027,7 @@ static void
> nvc0_set_transform_feedback_targets(struct pipe_context *pipe,
> unsigned num_targets,
> struct pipe_stream_output_target **targets,
> - unsigned append_mask)
> + unsigned *offsets)
> {
> struct nvc0_context *nvc0 = nvc0_context(pipe);
> unsigned i;
> @@ -1036,14 +1036,15 @@ nvc0_set_transform_feedback_targets(struct pipe_context *pipe,
> assert(num_targets <= 4);
>
> for (i = 0; i < num_targets; ++i) {
> - if (nvc0->tfbbuf[i] == targets[i] && (append_mask & (1 << i)))
> + boolean append = (offsets[i] == ((unsigned)-1));
> + if (nvc0->tfbbuf[i] == targets[i] && append)
> continue;
> nvc0->tfbbuf_dirty |= 1 << i;
>
> if (nvc0->tfbbuf[i] && nvc0->tfbbuf[i] != targets[i])
> nvc0_so_target_save_offset(pipe, nvc0->tfbbuf[i], i, &serialize);
>
> - if (targets[i] && !(append_mask & (1 << i)))
> + if (targets[i] && !append)
> nvc0_so_target(targets[i])->clean = TRUE;
>
> pipe_so_target_reference(&nvc0->tfbbuf[i], targets[i]);
> diff --git a/src/gallium/drivers/radeon/r600_pipe_common.h b/src/gallium/drivers/radeon/r600_pipe_common.h
> index cf5aa08..b0000a0 100644
> --- a/src/gallium/drivers/radeon/r600_pipe_common.h
> +++ b/src/gallium/drivers/radeon/r600_pipe_common.h
> @@ -397,7 +397,7 @@ void r600_streamout_buffers_dirty(struct r600_common_context *rctx);
> void r600_set_streamout_targets(struct pipe_context *ctx,
> unsigned num_targets,
> struct pipe_stream_output_target **targets,
> - unsigned append_bitmask);
> + unsigned *offset);
> void r600_emit_streamout_end(struct r600_common_context *rctx);
> void r600_streamout_init(struct r600_common_context *rctx);
>
> diff --git a/src/gallium/drivers/radeon/r600_streamout.c b/src/gallium/drivers/radeon/r600_streamout.c
> index adc11e0..b6cf858 100644
> --- a/src/gallium/drivers/radeon/r600_streamout.c
> +++ b/src/gallium/drivers/radeon/r600_streamout.c
> @@ -108,10 +108,11 @@ void r600_streamout_buffers_dirty(struct r600_common_context *rctx)
> void r600_set_streamout_targets(struct pipe_context *ctx,
> unsigned num_targets,
> struct pipe_stream_output_target **targets,
> - unsigned append_bitmask)
> + const unsigned *offsets)
> {
> struct r600_common_context *rctx = (struct r600_common_context *)ctx;
> unsigned i;
> + unsigned append_bitmask = 0;
>
> /* Stop streamout. */
> if (rctx->streamout.num_targets && rctx->streamout.begin_emitted) {
> @@ -122,6 +123,8 @@ void r600_set_streamout_targets(struct pipe_context *ctx,
> for (i = 0; i < num_targets; i++) {
> pipe_so_target_reference((struct pipe_stream_output_target**)&rctx->streamout.targets[i], targets[i]);
> r600_context_add_resource_size(ctx, targets[i]->buffer);
> + if (offsets[i] == ((unsigned)-1))
> + append_bitmask |= 1 << i;
> }
> for (; i < rctx->streamout.num_targets; i++) {
> pipe_so_target_reference((struct pipe_stream_output_target**)&rctx->streamout.targets[i], NULL);
> diff --git a/src/gallium/drivers/radeonsi/si_descriptors.c b/src/gallium/drivers/radeonsi/si_descriptors.c
> index 9b10d01..4925bef 100644
> --- a/src/gallium/drivers/radeonsi/si_descriptors.c
> +++ b/src/gallium/drivers/radeonsi/si_descriptors.c
> @@ -605,7 +605,7 @@ void si_set_ring_buffer(struct pipe_context *ctx, uint shader, uint slot,
> static void si_set_streamout_targets(struct pipe_context *ctx,
> unsigned num_targets,
> struct pipe_stream_output_target **targets,
> - unsigned append_bitmask)
> + const unsigned *offsets)
> {
> struct si_context *sctx = (struct si_context *)ctx;
> struct si_buffer_resources *buffers = &sctx->rw_buffers[PIPE_SHADER_VERTEX];
> @@ -618,7 +618,7 @@ static void si_set_streamout_targets(struct pipe_context *ctx,
> */
>
> /* Set the VGT regs. */
> - r600_set_streamout_targets(ctx, num_targets, targets, append_bitmask);
> + r600_set_streamout_targets(ctx, num_targets, targets, offsets);
>
> /* Set the shader resources.*/
> for (i = 0; i < num_targets; i++) {
> diff --git a/src/gallium/drivers/softpipe/sp_state_so.c b/src/gallium/drivers/softpipe/sp_state_so.c
> index f456237..3878e4a 100644
> --- a/src/gallium/drivers/softpipe/sp_state_so.c
> +++ b/src/gallium/drivers/softpipe/sp_state_so.c
> @@ -63,7 +63,7 @@ static void
> softpipe_set_so_targets(struct pipe_context *pipe,
> unsigned num_targets,
> struct pipe_stream_output_target **targets,
> - unsigned append_bitmask)
> + const unsigned *offsets)
> {
> struct softpipe_context *softpipe = softpipe_context(pipe);
> unsigned i;
> diff --git a/src/gallium/drivers/trace/tr_context.c b/src/gallium/drivers/trace/tr_context.c
> index c10e010..3e99598 100644
> --- a/src/gallium/drivers/trace/tr_context.c
> +++ b/src/gallium/drivers/trace/tr_context.c
> @@ -1080,7 +1080,7 @@ static INLINE void
> trace_context_set_stream_output_targets(struct pipe_context *_pipe,
> unsigned num_targets,
> struct pipe_stream_output_target **tgs,
> - unsigned append_bitmask)
> + const unsigned *offsets)
> {
> struct trace_context *tr_ctx = trace_context(_pipe);
> struct pipe_context *pipe = tr_ctx->pipe;
> @@ -1090,9 +1090,9 @@ trace_context_set_stream_output_targets(struct pipe_context *_pipe,
> trace_dump_arg(ptr, pipe);
> trace_dump_arg(uint, num_targets);
> trace_dump_arg_array(ptr, tgs, num_targets);
> - trace_dump_arg(uint, append_bitmask);
> + trace_dump_arg_array(uint, offsets, num_targets);
>
> - pipe->set_stream_output_targets(pipe, num_targets, tgs, append_bitmask);
> + pipe->set_stream_output_targets(pipe, num_targets, tgs, offsets);
>
> trace_dump_call_end();
> }
> diff --git a/src/gallium/include/pipe/p_context.h b/src/gallium/include/pipe/p_context.h
> index 0702729..fe3045a 100644
> --- a/src/gallium/include/pipe/p_context.h
> +++ b/src/gallium/include/pipe/p_context.h
> @@ -260,7 +260,7 @@ struct pipe_context {
> void (*set_stream_output_targets)(struct pipe_context *,
> unsigned num_targets,
> struct pipe_stream_output_target **targets,
> - unsigned append_bitmask);
> + const unsigned *offsets);
>
> /*@}*/
>
> diff --git a/src/gallium/tools/trace/dump_state.py b/src/gallium/tools/trace/dump_state.py
> index bde00ec..8bb29e7 100755
> --- a/src/gallium/tools/trace/dump_state.py
> +++ b/src/gallium/tools/trace/dump_state.py
> @@ -536,9 +536,9 @@ class Context(Dispatcher):
> self._state.render_condition_condition = condition
> self._state.render_condition_mode = mode
>
> - def set_stream_output_targets(self, num_targets, tgs, append_bitmask):
> + def set_stream_output_targets(self, num_targets, tgs, offsets):
> self._state.so_targets = tgs
> - self._state.so_append_bitmask = append_bitmask
> + self._state.offsets = offsets
>
> def draw_vbo(self, info):
> self._draw_no += 1
> diff --git a/src/mesa/state_tracker/st_cb_bitmap.c b/src/mesa/state_tracker/st_cb_bitmap.c
> index 874ff77..e3ba5a8 100644
> --- a/src/mesa/state_tracker/st_cb_bitmap.c
> +++ b/src/mesa/state_tracker/st_cb_bitmap.c
> @@ -513,7 +513,7 @@ draw_bitmap_quad(struct gl_context *ctx, GLint x, GLint y, GLfloat z,
> }
>
> cso_set_vertex_elements(cso, 3, st->velems_util_draw);
> - cso_set_stream_outputs(st->cso_context, 0, NULL, 0);
> + cso_set_stream_outputs(st->cso_context, 0, NULL, NULL);
>
> /* convert Z from [0,1] to [-1,-1] to match viewport Z scale/bias */
> z = z * 2.0f - 1.0f;
> diff --git a/src/mesa/state_tracker/st_cb_clear.c b/src/mesa/state_tracker/st_cb_clear.c
> index 97cc5a2..fcd7e13 100644
> --- a/src/mesa/state_tracker/st_cb_clear.c
> +++ b/src/mesa/state_tracker/st_cb_clear.c
> @@ -307,7 +307,7 @@ clear_with_quad(struct gl_context *ctx, unsigned clear_buffers)
> }
>
> cso_set_vertex_elements(st->cso_context, 2, st->velems_util_draw);
> - cso_set_stream_outputs(st->cso_context, 0, NULL, 0);
> + cso_set_stream_outputs(st->cso_context, 0, NULL, NULL);
> cso_set_sample_mask(st->cso_context, ~0);
> cso_set_rasterizer(st->cso_context, &st->clear.raster);
>
> diff --git a/src/mesa/state_tracker/st_cb_drawpixels.c b/src/mesa/state_tracker/st_cb_drawpixels.c
> index 90f34e3..2b36361 100644
> --- a/src/mesa/state_tracker/st_cb_drawpixels.c
> +++ b/src/mesa/state_tracker/st_cb_drawpixels.c
> @@ -788,7 +788,7 @@ draw_textured_quad(struct gl_context *ctx, GLint x, GLint y, GLfloat z,
> }
>
> cso_set_vertex_elements(cso, 3, st->velems_util_draw);
> - cso_set_stream_outputs(st->cso_context, 0, NULL, 0);
> + cso_set_stream_outputs(st->cso_context, 0, NULL, NULL);
>
> /* texture state: */
> cso_set_sampler_views(cso, PIPE_SHADER_FRAGMENT, num_sampler_view, sv);
> diff --git a/src/mesa/state_tracker/st_cb_drawtex.c b/src/mesa/state_tracker/st_cb_drawtex.c
> index 047cf47..b0a44fd 100644
> --- a/src/mesa/state_tracker/st_cb_drawtex.c
> +++ b/src/mesa/state_tracker/st_cb_drawtex.c
> @@ -244,7 +244,7 @@ st_DrawTex(struct gl_context *ctx, GLfloat x, GLfloat y, GLfloat z,
> velements[i].src_format = PIPE_FORMAT_R32G32B32A32_FLOAT;
> }
> cso_set_vertex_elements(cso, numAttribs, velements);
> - cso_set_stream_outputs(st->cso_context, 0, NULL, 0);
> + cso_set_stream_outputs(st->cso_context, 0, NULL, NULL);
>
> /* viewport state: viewport matching window dims */
> {
> diff --git a/src/mesa/state_tracker/st_cb_xformfb.c b/src/mesa/state_tracker/st_cb_xformfb.c
> index e824fe9..8f75eda 100644
> --- a/src/mesa/state_tracker/st_cb_xformfb.c
> +++ b/src/mesa/state_tracker/st_cb_xformfb.c
> @@ -113,6 +113,7 @@ st_begin_transform_feedback(struct gl_context *ctx, GLenum mode,
> struct st_transform_feedback_object *sobj =
> st_transform_feedback_object(obj);
> unsigned i, max_num_targets;
> + unsigned offsets[PIPE_MAX_SO_BUFFERS] = {0};
>
> max_num_targets = MIN2(Elements(sobj->base.Buffers),
> Elements(sobj->targets));
> @@ -145,8 +146,8 @@ st_begin_transform_feedback(struct gl_context *ctx, GLenum mode,
> }
>
> /* Start writing at the beginning of each target. */
> - cso_set_stream_outputs(st->cso_context, sobj->num_targets, sobj->targets,
> - 0);
> + cso_set_stream_outputs(st->cso_context, sobj->num_targets,
> + sobj->targets, offsets);
> }
>
>
> @@ -155,7 +156,7 @@ st_pause_transform_feedback(struct gl_context *ctx,
> struct gl_transform_feedback_object *obj)
> {
> struct st_context *st = st_context(ctx);
> - cso_set_stream_outputs(st->cso_context, 0, NULL, 0);
> + cso_set_stream_outputs(st->cso_context, 0, NULL, NULL);
> }
>
>
> @@ -165,10 +166,15 @@ st_resume_transform_feedback(struct gl_context *ctx,
> {
> struct st_context *st = st_context(ctx);
> struct st_transform_feedback_object *sobj =
> - st_transform_feedback_object(obj);
> + st_transform_feedback_object(obj);
> + unsigned offsets[PIPE_MAX_SO_BUFFERS];
> + unsigned i;
> +
> + for (i = 0; i < PIPE_MAX_SO_BUFFERS; i++)
> + offsets[i] = (unsigned)-1;
>
> - cso_set_stream_outputs(st->cso_context, sobj->num_targets, sobj->targets,
> - ~0);
> + cso_set_stream_outputs(st->cso_context, sobj->num_targets,
> + sobj->targets, offsets);
> }
>
>
> @@ -198,7 +204,7 @@ st_end_transform_feedback(struct gl_context *ctx,
> struct st_transform_feedback_object *sobj =
> st_transform_feedback_object(obj);
>
> - cso_set_stream_outputs(st->cso_context, 0, NULL, 0);
> + cso_set_stream_outputs(st->cso_context, 0, NULL, NULL);
>
> pipe_so_target_reference(&sobj->draw_count,
> st_transform_feedback_get_draw_target(obj));
>
More information about the mesa-dev
mailing list