[Mesa-dev] [PATCH 04/11] st/mesa: Use Array._DrawVAO in st_atom_array.c.
Marek Olšák
maraeo at gmail.com
Mon Nov 26 20:42:16 UTC 2018
I have this issue on radeonsi as well, but the bad commit is:
commit f1998e15ffccf260552bf559abe1a733a8ce990e
Author: Erik Faye-Lund <erik.faye-lund at collabora.com>
Date: Wed Nov 21 20:09:46 2018 +0100
mesa/main: remove ARB suffix from glGetnTexImage
This function has been core since OpenGL 4.3, so naming the
implementation and reporting erros using an ARB-suffix can be
confusing.
Signed-off-by: Erik Faye-Lund <erik.faye-lund at collabora.com>
Reviewed-by: Juan A. Suarez <jasuarez at igalia.com>
Reverting the commit fixes supertuxkart.
Marek
On Mon, Nov 26, 2018 at 1:40 PM Erik Faye-Lund <erik.faye-lund at collabora.com>
wrote:
> On Mon, 2018-05-07 at 08:14 +0200, Mathias.Froehlich at gmx.net wrote:
> > From: Mathias Fröhlich <mathias.froehlich at web.de>
> >
> > Finally make use of the binding information in the VAO when
> > setting up arrays for draw.
> >
> > v2: Emit less relocations also for interleaved userspace arrays.
> >
> > Signed-off-by: Mathias Fröhlich <Mathias.Froehlich at web.de>
>
> I know this is *very* late notice, but this commit broke Super Tux Kart
> on VirGL. Both the player-models as as well as the level data renders
> with gibberish vertex positions since this commit.
>
> The fix that Rob Clark did on top does not fix the problem (and
> shouldn't have; VirGL doesn't use NIR).
>
> > ---
> > src/mesa/state_tracker/st_atom_array.c | 432 ++++++++---------------
> > ----------
> > 1 file changed, 107 insertions(+), 325 deletions(-)
> >
> > diff --git a/src/mesa/state_tracker/st_atom_array.c
> > b/src/mesa/state_tracker/st_atom_array.c
> > index 2fd67e8d84..6b39b4186d 100644
> > --- a/src/mesa/state_tracker/st_atom_array.c
> > +++ b/src/mesa/state_tracker/st_atom_array.c
> > @@ -48,6 +48,7 @@
> > #include "main/bufferobj.h"
> > #include "main/glformats.h"
> > #include "main/varray.h"
> > +#include "main/arrayobj.h"
> >
> > /* vertex_formats[gltype - GL_BYTE][integer*2 + normalized][size -
> > 1] */
> > static const uint16_t vertex_formats[][4][4] = {
> > @@ -306,79 +307,6 @@ st_pipe_vertex_format(const struct
> > gl_array_attributes *attrib)
> > return vertex_formats[type - GL_BYTE][index][size-1];
> > }
> >
> > -static const struct gl_vertex_array *
> > -get_client_array(const struct gl_vertex_array *arrays,
> > - unsigned mesaAttr)
> > -{
> > - /* st_program uses 0xffffffff to denote a double placeholder
> > attribute */
> > - if (mesaAttr == ST_DOUBLE_ATTRIB_PLACEHOLDER)
> > - return NULL;
> > - return &arrays[mesaAttr];
> > -}
> > -
> > -/**
> > - * Examine the active arrays to determine if we have interleaved
> > - * vertex arrays all living in one VBO, or all living in user space.
> > - */
> > -static GLboolean
> > -is_interleaved_arrays(const struct st_vertex_program *vp,
> > - const struct gl_vertex_array *arrays,
> > - unsigned num_inputs)
> > -{
> > - GLuint attr;
> > - const struct gl_buffer_object *firstBufObj = NULL;
> > - GLint firstStride = -1;
> > - const GLubyte *firstPtr = NULL;
> > - GLboolean userSpaceBuffer = GL_FALSE;
> > -
> > - for (attr = 0; attr < num_inputs; attr++) {
> > - const struct gl_vertex_array *array;
> > - const struct gl_vertex_buffer_binding *binding;
> > - const struct gl_array_attributes *attrib;
> > - const GLubyte *ptr;
> > - const struct gl_buffer_object *bufObj;
> > - GLsizei stride;
> > -
> > - array = get_client_array(arrays, vp->index_to_input[attr]);
> > - if (!array)
> > - continue;
> > -
> > - binding = array->BufferBinding;
> > - attrib = array->VertexAttrib;
> > - stride = binding->Stride; /* in bytes */
> > - ptr = _mesa_vertex_attrib_address(attrib, binding);
> > -
> > - /* To keep things simple, don't allow interleaved zero-stride
> > attribs. */
> > - if (stride == 0)
> > - return false;
> > -
> > - bufObj = binding->BufferObj;
> > - if (attr == 0) {
> > - /* save info about the first array */
> > - firstStride = stride;
> > - firstPtr = ptr;
> > - firstBufObj = bufObj;
> > - userSpaceBuffer = !_mesa_is_bufferobj(bufObj);
> > - }
> > - else {
> > - /* check if other arrays interleave with the first, in same
> > buffer */
> > - if (stride != firstStride)
> > - return GL_FALSE; /* strides don't match */
> > -
> > - if (bufObj != firstBufObj)
> > - return GL_FALSE; /* arrays in different VBOs */
> > -
> > - if (llabs(ptr - firstPtr) > firstStride)
> > - return GL_FALSE; /* arrays start too far apart */
> > -
> > - if ((!_mesa_is_bufferobj(bufObj)) != userSpaceBuffer)
> > - return GL_FALSE; /* mix of VBO and user-space arrays */
> > - }
> > - }
> > -
> > - return GL_TRUE;
> > -}
> > -
> > static void init_velement(struct pipe_vertex_element *velement,
> > int src_offset, int format,
> > int instance_divisor, int vbo_index)
> > @@ -392,13 +320,14 @@ static void init_velement(struct
> > pipe_vertex_element *velement,
> >
> > static void init_velement_lowered(const struct st_vertex_program
> > *vp,
> > struct pipe_vertex_element
> > *velements,
> > - int src_offset, int format,
> > - int instance_divisor, int
> > vbo_index,
> > - int nr_components, GLboolean
> > doubles,
> > - GLuint *attr_idx)
> > + const struct gl_array_attributes
> > *attrib,
> > + int src_offset, int
> > instance_divisor,
> > + int vbo_index, int idx)
> > {
> > - int idx = *attr_idx;
> > - if (doubles) {
> > + const unsigned format = st_pipe_vertex_format(attrib);
> > + const GLubyte nr_components = attrib->Size;
> > +
> > + if (attrib->Doubles) {
> > int lower_format;
> >
> > if (nr_components < 2)
> > @@ -427,15 +356,11 @@ static void init_velement_lowered(const struct
> > st_vertex_program *vp,
> > init_velement(&velements[idx], src_offset,
> > PIPE_FORMAT_R32G32_UINT,
> > instance_divisor, vbo_index);
> > }
> > -
> > - idx++;
> > }
> > } else {
> > init_velement(&velements[idx], src_offset,
> > format, instance_divisor, vbo_index);
> > - idx++;
> > }
> > - *attr_idx = idx;
> > }
> >
> > static void
> > @@ -457,274 +382,131 @@ set_vertex_attribs(struct st_context *st,
> > cso_set_vertex_elements(cso, num_velements, velements);
> > }
> >
> > -/**
> > - * Set up for drawing interleaved arrays that all live in one VBO
> > - * or all live in user space.
> > - * \param vbuffer returns vertex buffer info
> > - * \param velements returns vertex element info
> > - */
> > -static void
> > -setup_interleaved_attribs(struct st_context *st,
> > - const struct st_vertex_program *vp,
> > - const struct gl_vertex_array *arrays,
> > - unsigned num_inputs)
> > -{
> > - struct pipe_vertex_buffer vbuffer;
> > - struct pipe_vertex_element velements[PIPE_MAX_ATTRIBS] = {{0}};
> > - GLuint attr;
> > - const GLubyte *low_addr = NULL;
> > - GLboolean usingVBO; /* all arrays in a VBO? */
> > - struct gl_buffer_object *bufobj;
> > - GLsizei stride;
> > -
> > - /* Find the lowest address of the arrays we're drawing,
> > - * Init bufobj and stride.
> > - */
> > - if (num_inputs) {
> > - const struct gl_vertex_array *array;
> > - const struct gl_vertex_buffer_binding *binding;
> > - const struct gl_array_attributes *attrib;
> > -
> > - array = get_client_array(arrays, vp->index_to_input[0]);
> > - assert(array);
> > -
> > - binding = array->BufferBinding;
> > - attrib = array->VertexAttrib;
> > -
> > - /* Since we're doing interleaved arrays, we know there'll be
> > at most
> > - * one buffer object and the stride will be the same for all
> > arrays.
> > - * Grab them now.
> > - */
> > - bufobj = binding->BufferObj;
> > - stride = binding->Stride;
> > -
> > - low_addr = _mesa_vertex_attrib_address(attrib, binding);
> > -
> > - for (attr = 1; attr < num_inputs; attr++) {
> > - const GLubyte *start;
> > - array = get_client_array(arrays, vp->index_to_input[attr]);
> > - if (!array)
> > - continue;
> > - binding = array->BufferBinding;
> > - attrib = array->VertexAttrib;
> > - start = _mesa_vertex_attrib_address(attrib, binding);
> > - low_addr = MIN2(low_addr, start);
> > - }
> > - }
> > - else {
> > - /* not sure we'll ever have zero inputs, but play it safe */
> > - bufobj = NULL;
> > - stride = 0;
> > - low_addr = 0;
> > - }
> > -
> > - /* are the arrays in user space? */
> > - usingVBO = _mesa_is_bufferobj(bufobj);
> > -
> > - for (attr = 0; attr < num_inputs;) {
> > - const struct gl_vertex_array *array;
> > - const struct gl_vertex_buffer_binding *binding;
> > - const struct gl_array_attributes *attrib;
> > - const GLubyte *ptr;
> > - unsigned src_offset;
> > - unsigned src_format;
> > -
> > - array = get_client_array(arrays, vp->index_to_input[attr]);
> > - assert(array);
> > -
> > - binding = array->BufferBinding;
> > - attrib = array->VertexAttrib;
> > - ptr = _mesa_vertex_attrib_address(attrib, binding);
> > -
> > - src_offset = (unsigned) (ptr - low_addr);
> > -
> > - src_format = st_pipe_vertex_format(attrib);
> > -
> > - init_velement_lowered(vp, velements, src_offset, src_format,
> > - binding->InstanceDivisor, 0,
> > - attrib->Size, attrib->Doubles, &attr);
> > - }
> > -
> > - /*
> > - * Return the vbuffer info and setup user-space attrib info, if
> > needed.
> > - */
> > - if (num_inputs == 0) {
> > - /* just defensive coding here */
> > - vbuffer.buffer.resource = NULL;
> > - vbuffer.is_user_buffer = false;
> > - vbuffer.buffer_offset = 0;
> > - vbuffer.stride = 0;
> > - }
> > - else if (usingVBO) {
> > - /* all interleaved arrays in a VBO */
> > - struct st_buffer_object *stobj = st_buffer_object(bufobj);
> > -
> > - if (!stobj || !stobj->buffer) {
> > - st->vertex_array_out_of_memory = true;
> > - return; /* out-of-memory error probably */
> > - }
> > -
> > - vbuffer.buffer.resource = stobj->buffer;
> > - vbuffer.is_user_buffer = false;
> > - vbuffer.buffer_offset = pointer_to_offset(low_addr);
> > - vbuffer.stride = stride;
> > - }
> > - else {
> > - /* all interleaved arrays in user memory */
> > - vbuffer.buffer.user = low_addr;
> > - vbuffer.is_user_buffer = !!low_addr; /* if NULL, then unbind
> > */
> > - vbuffer.buffer_offset = 0;
> > - vbuffer.stride = stride;
> > -
> > - if (low_addr)
> > - st->draw_needs_minmax_index = true;
> > - }
> > -
> > - set_vertex_attribs(st, &vbuffer, num_inputs ? 1 : 0,
> > - velements, num_inputs);
> > -}
> > -
> > -/**
> > - * Set up a separate pipe_vertex_buffer and pipe_vertex_element for
> > each
> > - * vertex attribute.
> > - * \param vbuffer returns vertex buffer info
> > - * \param velements returns vertex element info
> > - */
> > -static void
> > -setup_non_interleaved_attribs(struct st_context *st,
> > - const struct st_vertex_program *vp,
> > - const struct gl_vertex_array *arrays,
> > - unsigned num_inputs)
> > +void st_update_array(struct st_context *st)
> > {
> > struct gl_context *ctx = st->ctx;
> > + /* vertex program validation must be done before this */
> > + const struct st_vertex_program *vp = st->vp;
> > + /* _NEW_PROGRAM, ST_NEW_VS_STATE */
> > + const GLbitfield inputs_read = st->vp_variant->vert_attrib_mask;
> > + const struct gl_vertex_array_object *vao = ctx->Array._DrawVAO;
> > + const ubyte *input_to_index = vp->input_to_index;
> > +
> > struct pipe_vertex_buffer vbuffer[PIPE_MAX_ATTRIBS];
> > - struct pipe_vertex_element velements[PIPE_MAX_ATTRIBS] = {{0}};
> > + struct pipe_vertex_element velements[PIPE_MAX_ATTRIBS];
> > unsigned num_vbuffers = 0;
> > - unsigned unref_buffers = 0;
> > - GLuint attr;
> > -
> > - for (attr = 0; attr < num_inputs;) {
> > - const unsigned mesaAttr = vp->index_to_input[attr];
> > - const struct gl_vertex_array *array;
> > - const struct gl_vertex_buffer_binding *binding;
> > - const struct gl_array_attributes *attrib;
> > - struct gl_buffer_object *bufobj;
> > - GLsizei stride;
> > - unsigned src_format;
> > - unsigned bufidx;
> > -
> > - array = get_client_array(arrays, mesaAttr);
> > - assert(array);
> > -
> > - bufidx = num_vbuffers++;
> > -
> > - binding = array->BufferBinding;
> > - attrib = array->VertexAttrib;
> > - stride = binding->Stride;
> > - bufobj = binding->BufferObj;
> > -
> > - if (_mesa_is_bufferobj(bufobj)) {
> > - /* Attribute data is in a VBO.
> > - * Recall that for VBOs, the gl_vertex_array->Ptr field is
> > - * really an offset from the start of the VBO, not a
> > pointer.
> > - */
> > - struct st_buffer_object *stobj = st_buffer_object(bufobj);
> >
> > + st->vertex_array_out_of_memory = FALSE;
> > + st->draw_needs_minmax_index = false;
> > +
> > + /* _NEW_PROGRAM */
> > + /* ST_NEW_VERTEX_ARRAYS alias ctx->DriverFlags.NewArray */
> > + /* Process attribute array data. */
> > + GLbitfield mask = inputs_read & _mesa_draw_array_bits(ctx);
> > + while (mask) {
> > + /* The attribute index to start pulling a binding */
> > + const gl_vert_attrib i = ffs(mask) - 1;
> > + const struct gl_vertex_buffer_binding *const binding
> > + = _mesa_draw_buffer_binding(vao, i);
> > + const unsigned bufidx = num_vbuffers++;
> > +
> > + if (_mesa_is_bufferobj(binding->BufferObj)) {
> > + struct st_buffer_object *stobj = st_buffer_object(binding-
> > >BufferObj);
> > if (!stobj || !stobj->buffer) {
> > st->vertex_array_out_of_memory = true;
> > return; /* out-of-memory error probably */
> > }
> >
> > + /* Set the binding */
> > vbuffer[bufidx].buffer.resource = stobj->buffer;
> > vbuffer[bufidx].is_user_buffer = false;
> > - vbuffer[bufidx].buffer_offset =
> > - binding->Offset + attrib->RelativeOffset;
> > + vbuffer[bufidx].buffer_offset =
> > _mesa_draw_binding_offset(binding);
> > + } else {
> > + /* Set the binding */
> > + const void *ptr = (const void
> > *)_mesa_draw_binding_offset(binding);
> > + vbuffer[bufidx].buffer.user = ptr;
> > + vbuffer[bufidx].is_user_buffer = true;
> > + vbuffer[bufidx].buffer_offset = 0;
> > +
> > + if (!binding->InstanceDivisor)
> > + st->draw_needs_minmax_index = true;
> > }
> > - else {
> > - if (stride == 0) {
> > - unsigned size = attrib->_ElementSize;
> > - /* This is optimal for GPU cache line usage if the
> > upload size
> > - * is <= cache line size.
> > - */
> > - unsigned alignment = util_next_power_of_two(size);
> > -
> > - assert(attrib->Ptr);
> > - vbuffer[bufidx].buffer.user = attrib->Ptr;
> > - void *ptr = attrib->Ptr ? (void*)attrib->Ptr :
> > - (void*)ctx-
> > >Current.Attrib[mesaAttr];
> > -
> > - vbuffer[bufidx].is_user_buffer = false;
> > - vbuffer[bufidx].buffer.resource = NULL;
> > -
> > - /* Use const_uploader for zero-stride vertex attributes,
> > because
> > - * it may use a better memory placement than
> > stream_uploader.
> > - * The reason is that zero-stride attributes can be
> > fetched many
> > - * times (thousands of times), so a better placement is
> > going to
> > - * perform better.
> > - *
> > - * Upload the maximum possible size, which is 4x
> > GLdouble = 32.
> > - */
> > - u_upload_data(st->can_bind_const_buffer_as_vertex ?
> > - st->pipe->const_uploader :
> > - st->pipe->stream_uploader,
> > - 0, size, alignment, ptr,
> > - &vbuffer[bufidx].buffer_offset,
> > - &vbuffer[bufidx].buffer.resource);
> > - unref_buffers |= 1u << bufidx;
> > - } else {
> > - assert(attrib->Ptr);
> > - vbuffer[bufidx].buffer.user = attrib->Ptr;
> > - vbuffer[bufidx].is_user_buffer = true;
> > - vbuffer[bufidx].buffer_offset = 0;
> > -
> > - if (!binding->InstanceDivisor)
> > - st->draw_needs_minmax_index = true;
> > - }
> > + vbuffer[bufidx].stride = binding->Stride; /* in bytes */
> > +
> > + const GLbitfield boundmask =
> > _mesa_draw_bound_attrib_bits(binding);
> > + GLbitfield attrmask = mask & boundmask;
> > + /* Mark the those attributes as processed */
> > + mask &= ~boundmask;
> > + /* We can assume that we have array for the binding */
> > + assert(attrmask);
> > + /* Walk attributes belonging to the binding */
> > + while (attrmask) {
> > + const gl_vert_attrib attr = u_bit_scan(&attrmask);
> > + const struct gl_array_attributes *const attrib
> > + = _mesa_draw_array_attrib(vao, attr);
> > + const GLuint off =
> > _mesa_draw_attributes_relative_offset(attrib);
> > + init_velement_lowered(vp, velements, attrib, off,
> > + binding->InstanceDivisor, bufidx,
> > + input_to_index[attr]);
> > }
> > + }
> >
> > - /* common-case setup */
> > - vbuffer[bufidx].stride = stride; /* in bytes */
> > + const unsigned first_current_vbuffer = num_vbuffers;
> > + /* _NEW_PROGRAM | _NEW_CURRENT_ATTRIB */
> > + /* Process values that should have better been uniforms in the
> > application */
> > + GLbitfield curmask = inputs_read & _mesa_draw_current_bits(ctx);
> > + if (curmask) {
> > + /* For each attribute, upload the maximum possible size. */
> > + GLubyte data[VERT_ATTRIB_MAX*sizeof(GLdouble)*4];
> > + GLubyte *cursor = data;
> > + const unsigned bufidx = num_vbuffers++;
> > + unsigned max_alignment = 1;
> > +
> > + while (curmask) {
> > + const gl_vert_attrib attr = u_bit_scan(&curmask);
> > + const struct gl_array_attributes *const attrib
> > + = _mesa_draw_current_attrib(ctx, attr);
> > + const unsigned size = attrib->_ElementSize;
> > + const unsigned alignment = util_next_power_of_two(size);
> > + max_alignment = MAX2(max_alignment, alignment);
> > + memcpy(cursor, attrib->Ptr, size);
> > + if (alignment != size)
> > + memset(cursor + size, 0, alignment - size);
> > +
> > + init_velement_lowered(vp, velements, attrib, cursor - data,
> > 0,
> > + bufidx, input_to_index[attr]);
> > +
> > + cursor += alignment;
> > + }
> >
> > - src_format = st_pipe_vertex_format(attrib);
> > + vbuffer[bufidx].is_user_buffer = false;
> > + vbuffer[bufidx].buffer.resource = NULL;
> > + /* vbuffer[bufidx].buffer_offset is set below */
> > + vbuffer[bufidx].stride = 0;
> >
> > - init_velement_lowered(vp, velements, 0, src_format,
> > - binding->InstanceDivisor, bufidx,
> > - attrib->Size, attrib->Doubles, &attr);
> > + /* Use const_uploader for zero-stride vertex attributes,
> > because
> > + * it may use a better memory placement than stream_uploader.
> > + * The reason is that zero-stride attributes can be fetched
> > many
> > + * times (thousands of times), so a better placement is going
> > to
> > + * perform better.
> > + */
> > + u_upload_data(st->can_bind_const_buffer_as_vertex ?
> > + st->pipe->const_uploader :
> > + st->pipe->stream_uploader,
> > + 0, cursor - data, max_alignment, data,
> > + &vbuffer[bufidx].buffer_offset,
> > + &vbuffer[bufidx].buffer.resource);
> > }
> >
> > if (!ctx->Const.AllowMappedBuffersDuringExecution) {
> > u_upload_unmap(st->pipe->stream_uploader);
> > }
> >
> > + const unsigned num_inputs = st->vp_variant->num_inputs;
> > set_vertex_attribs(st, vbuffer, num_vbuffers, velements,
> > num_inputs);
> >
> > /* Unreference uploaded zero-stride vertex buffers. */
> > - while (unref_buffers) {
> > - unsigned i = u_bit_scan(&unref_buffers);
> > + for (unsigned i = first_current_vbuffer; i < num_vbuffers; ++i) {
> > pipe_resource_reference(&vbuffer[i].buffer.resource, NULL);
> > }
> > }
> > -
> > -void st_update_array(struct st_context *st)
> > -{
> > - struct gl_context *ctx = st->ctx;
> > - const struct gl_vertex_array *arrays = ctx->Array._DrawArrays;
> > - const struct st_vertex_program *vp;
> > - unsigned num_inputs;
> > -
> > - st->vertex_array_out_of_memory = FALSE;
> > - st->draw_needs_minmax_index = false;
> > -
> > - /* No drawing has been done yet, so do nothing. */
> > - if (!arrays)
> > - return;
> > -
> > - /* vertex program validation must be done before this */
> > - vp = st->vp;
> > - num_inputs = st->vp_variant->num_inputs;
> > -
> > - if (is_interleaved_arrays(vp, arrays, num_inputs))
> > - setup_interleaved_attribs(st, vp, arrays, num_inputs);
> > - else
> > - setup_non_interleaved_attribs(st, vp, arrays, num_inputs);
> > -}
>
> _______________________________________________
> mesa-dev mailing list
> mesa-dev at lists.freedesktop.org
> https://lists.freedesktop.org/mailman/listinfo/mesa-dev
>
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <https://lists.freedesktop.org/archives/mesa-dev/attachments/20181126/2d9a8bd6/attachment-0001.html>
More information about the mesa-dev
mailing list