[Nouveau] [PATCH] nvc0: keep track of cb bindings per buffer, use for upload settings
Ilia Mirkin
imirkin at alum.mit.edu
Wed Sep 9 10:47:59 PDT 2015
On Wed, Sep 9, 2015 at 3:17 AM, Ilia Mirkin <imirkin at alum.mit.edu> wrote:
> CB updates to bound buffers need to go through the CB_DATA endpoints,
> otherwise the shader may not notice that the updates happened.
> Furthermore, these updates have to go in to the same address as the
> bound buffer, otherwise, again, the shader may not notice updates.
>
> So we keep track of all the places where a constbuf is bound, and
> iterate over all of them when updating data. If a binding is found that
> encompasses the region to be updated, then we use the settings of that
> binding for the upload. Otherwise we upload as a regular data update.
>
> This fixes piglit 'arb_uniform_buffer_object-rendering offset' as well
> as blurriness in Witcher2.
>
> Bugzilla: https://bugs.freedesktop.org/show_bug.cgi?id=91890
> Signed-off-by: Ilia Mirkin <imirkin at alum.mit.edu>
> Cc: "11.0" <mesa-stable at lists.freedesktop.org>
> ---
> src/gallium/drivers/nouveau/nouveau_buffer.c | 4 +-
> src/gallium/drivers/nouveau/nouveau_buffer.h | 2 +
> src/gallium/drivers/nouveau/nouveau_context.h | 5 ++-
> src/gallium/drivers/nouveau/nvc0/nvc0_context.h | 8 ++--
> src/gallium/drivers/nouveau/nvc0/nvc0_state.c | 2 +
> .../drivers/nouveau/nvc0/nvc0_state_validate.c | 3 +-
> src/gallium/drivers/nouveau/nvc0/nvc0_transfer.c | 46 ++++++++++++++++++++--
> 7 files changed, 58 insertions(+), 12 deletions(-)
>
> diff --git a/src/gallium/drivers/nouveau/nouveau_buffer.c b/src/gallium/drivers/nouveau/nouveau_buffer.c
> index 912b778..4937dae 100644
> --- a/src/gallium/drivers/nouveau/nouveau_buffer.c
> +++ b/src/gallium/drivers/nouveau/nouveau_buffer.c
> @@ -206,8 +206,8 @@ nouveau_transfer_write(struct nouveau_context *nv, struct nouveau_transfer *tx,
> nv->copy_data(nv, buf->bo, buf->offset + base, buf->domain,
> tx->bo, tx->offset + offset, NOUVEAU_BO_GART, size);
> else
> - if ((buf->base.bind & PIPE_BIND_CONSTANT_BUFFER) && nv->push_cb && can_cb)
> - nv->push_cb(nv, buf->bo, buf->domain, buf->offset, buf->base.width0,
> + if (nv->push_cb && can_cb)
> + nv->push_cb(nv, buf,
> base, size / 4, (const uint32_t *)data);
> else
> nv->push_data(nv, buf->bo, buf->offset + base, buf->domain, size, data);
> diff --git a/src/gallium/drivers/nouveau/nouveau_buffer.h b/src/gallium/drivers/nouveau/nouveau_buffer.h
> index 7e6a6cc..d45bf7a 100644
> --- a/src/gallium/drivers/nouveau/nouveau_buffer.h
> +++ b/src/gallium/drivers/nouveau/nouveau_buffer.h
> @@ -41,6 +41,8 @@ struct nv04_resource {
> uint8_t status;
> uint8_t domain;
>
> + uint16_t cb_bindings[6]; /* per-shader per-slot bindings */
> +
> struct nouveau_fence *fence;
> struct nouveau_fence *fence_wr;
>
> diff --git a/src/gallium/drivers/nouveau/nouveau_context.h b/src/gallium/drivers/nouveau/nouveau_context.h
> index 24deb7e..decb271 100644
> --- a/src/gallium/drivers/nouveau/nouveau_context.h
> +++ b/src/gallium/drivers/nouveau/nouveau_context.h
> @@ -6,6 +6,8 @@
>
> #define NOUVEAU_MAX_SCRATCH_BUFS 4
>
> +struct nv04_resource;
> +
> struct nouveau_context {
> struct pipe_context pipe;
> struct nouveau_screen *screen;
> @@ -23,8 +25,7 @@ struct nouveau_context {
> unsigned, const void *);
> /* base, size refer to the whole constant buffer */
> void (*push_cb)(struct nouveau_context *,
> - struct nouveau_bo *, unsigned domain,
> - unsigned base, unsigned size,
> + struct nv04_resource *,
> unsigned offset, unsigned words, const uint32_t *);
>
> /* @return: @ref reduced by nr of references found in context */
> diff --git a/src/gallium/drivers/nouveau/nvc0/nvc0_context.h b/src/gallium/drivers/nouveau/nvc0/nvc0_context.h
> index 6ed79cf..30bee3a 100644
> --- a/src/gallium/drivers/nouveau/nvc0/nvc0_context.h
> +++ b/src/gallium/drivers/nouveau/nvc0/nvc0_context.h
> @@ -299,10 +299,10 @@ nve4_p2mf_push_linear(struct nouveau_context *nv,
> struct nouveau_bo *dst, unsigned offset, unsigned domain,
> unsigned size, const void *data);
> void
> -nvc0_cb_push(struct nouveau_context *,
> - struct nouveau_bo *bo, unsigned domain,
> - unsigned base, unsigned size,
> - unsigned offset, unsigned words, const uint32_t *data);
> +nvc0_cb_bo_push(struct nouveau_context *,
> + struct nouveau_bo *bo, unsigned domain,
> + unsigned base, unsigned size,
> + unsigned offset, unsigned words, const uint32_t *data);
>
> /* nvc0_vbo.c */
> void nvc0_draw_vbo(struct pipe_context *, const struct pipe_draw_info *);
> diff --git a/src/gallium/drivers/nouveau/nvc0/nvc0_state.c b/src/gallium/drivers/nouveau/nvc0/nvc0_state.c
> index ee29912..c5bfd03 100644
> --- a/src/gallium/drivers/nouveau/nvc0/nvc0_state.c
> +++ b/src/gallium/drivers/nouveau/nvc0/nvc0_state.c
> @@ -831,6 +831,8 @@ nvc0_set_constant_buffer(struct pipe_context *pipe, uint shader, uint index,
> }
> nvc0->constbuf_dirty[s] |= 1 << i;
>
> + if (nvc0->constbuf[s][i].u.buf)
> + nv04_resource(nvc0->constbuf[s][i].u.buf)->cb_bindings[s] &= ~(1 << i);
> pipe_resource_reference(&nvc0->constbuf[s][i].u.buf, res);
>
> nvc0->constbuf[s][i].user = (cb && cb->user_buffer) ? true : false;
> diff --git a/src/gallium/drivers/nouveau/nvc0/nvc0_state_validate.c b/src/gallium/drivers/nouveau/nvc0/nvc0_state_validate.c
> index 47bd66d..aec0609 100644
> --- a/src/gallium/drivers/nouveau/nvc0/nvc0_state_validate.c
> +++ b/src/gallium/drivers/nouveau/nvc0/nvc0_state_validate.c
> @@ -440,7 +440,7 @@ nvc0_constbufs_validate(struct nvc0_context *nvc0)
> BEGIN_NVC0(push, NVC0_3D(CB_BIND(s)), 1);
> PUSH_DATA (push, (0 << 4) | 1);
> }
> - nvc0_cb_push(&nvc0->base, bo, NV_VRAM_DOMAIN(&nvc0->screen->base),
> + nvc0_cb_bo_push(&nvc0->base, bo, NV_VRAM_DOMAIN(&nvc0->screen->base),
> base, nvc0->state.uniform_buffer_bound[s],
> 0, (size + 3) / 4,
> nvc0->constbuf[s][0].u.data);
> @@ -458,6 +458,7 @@ nvc0_constbufs_validate(struct nvc0_context *nvc0)
> BCTX_REFN(nvc0->bufctx_3d, CB(s, i), res, RD);
>
> nvc0->cb_dirty = 1; /* Force cache flush for UBO. */
> + res->cb_bindings[s] |= 1 << i;
> } else {
> BEGIN_NVC0(push, NVC0_3D(CB_BIND(s)), 1);
> PUSH_DATA (push, (i << 4) | 0);
> diff --git a/src/gallium/drivers/nouveau/nvc0/nvc0_transfer.c b/src/gallium/drivers/nouveau/nvc0/nvc0_transfer.c
> index 7cc5b4b..ff2ad19 100644
> --- a/src/gallium/drivers/nouveau/nvc0/nvc0_transfer.c
> +++ b/src/gallium/drivers/nouveau/nvc0/nvc0_transfer.c
> @@ -506,12 +506,49 @@ nvc0_miptree_transfer_unmap(struct pipe_context *pctx,
> }
>
> /* This happens rather often with DTD9/st. */
> -void
> +static void
> nvc0_cb_push(struct nouveau_context *nv,
> - struct nouveau_bo *bo, unsigned domain,
> - unsigned base, unsigned size,
> + struct nv04_resource *res,
> unsigned offset, unsigned words, const uint32_t *data)
> {
> + struct nvc0_context *nvc0 = nvc0_context(&nv->pipe);
> + struct nvc0_constbuf *cb = NULL;
> + int s;
> +
> + /* Go through all the constbuf binding points of this buffer and try to
> + * find one which contains the region to be updated.
> + */
> + for (s = 0; s < 6 && !cb; s++) {
> + uint16_t bindings = res->cb_bindings[s];
> + while (bindings) {
> + int i = ffs(i) - 1;
joi tells me that this works considerably better as ffs(bindings) - 1.
Will do a piglit run on my GK208, see if Heaven still works, and then
push. (That's right... cower in the extensiveness of my QA process...)
> + uint32_t cb_offset = nvc0->constbuf[s][i].offset;
> +
> + bindings &= ~(1 << i);
> + if (cb_offset <= offset &&
> + cb_offset + nvc0->constbuf[s][i].size >= offset + words * 4) {
> + cb = &nvc0->constbuf[s][i];
> + break;
> + }
> + }
> + }
> +
> + if (cb) {
> + nvc0_cb_bo_push(nv, res->bo, res->domain,
> + res->offset + cb->offset, cb->size,
> + offset - cb->offset, words, data);
> + } else {
> + nv->push_data(nv, res->bo, res->offset + offset, res->domain,
> + words * 4, data);
> + }
> +}
> +
> +void
> +nvc0_cb_bo_push(struct nouveau_context *nv,
> + struct nouveau_bo *bo, unsigned domain,
> + unsigned base, unsigned size,
> + unsigned offset, unsigned words, const uint32_t *data)
> +{
> struct nouveau_pushbuf *push = nv->pushbuf;
>
> NOUVEAU_DRV_STAT(nv->screen, constbuf_upload_count, 1);
> @@ -520,6 +557,9 @@ nvc0_cb_push(struct nouveau_context *nv,
> assert(!(offset & 3));
> size = align(size, 0x100);
>
> + assert(offset < size);
> + assert(offset + words * 4 <= size);
> +
> BEGIN_NVC0(push, NVC0_3D(CB_SIZE), 3);
> PUSH_DATA (push, size);
> PUSH_DATAh(push, bo->offset + base);
> --
> 2.4.6
>
More information about the Nouveau
mailing list