[Mesa-dev] [PATCH v3] anv: handle failures when growing reloc lists
Iago Toral
itoral at igalia.com
Thu Mar 16 07:56:30 UTC 2017
On Wed, 2017-03-15 at 16:56 +0200, Pohjolainen, Topi wrote:
> On Wed, Mar 15, 2017 at 01:03:37PM +0100, Iago Toral Quiroga wrote:
> >
> > Growing the reloc list happens through calling anv_reloc_list_add()
> > or
> > anv_reloc_list_append(). Make sure that we call these through
> > helpers
> > that check the result and set the batch error status if needed.
> >
> > v2:
> > - Handling the crashes is not good enough, we need to keep track
> > of
> > the error, for that, keep track of the errors in the batch
> > instead (Jason).
> > - Make reloc list growth go through helpers so we can have a
> > central
> > place where we can do error tracking (Jason).
> >
> > v3:
> > - Callers that need the offset returned by anv_reloc_list_add()
> > can
> > compute it themselves since it is extracted from the inputs to
> > the
> > function, so change the function to return a VkResult, make
> > anv_batch_emit_reloc() also return a VkResult and let their
> > callers
> > do the error management (Topi)
> > ---
> > src/intel/vulkan/anv_batch_chain.c | 40 +++++++++++++++++++++++++-
> > ------------
> > src/intel/vulkan/anv_private.h | 17 ++++++++++++----
> > src/intel/vulkan/genX_blorp_exec.c | 20 +++++++++++++++----
> > src/intel/vulkan/genX_cmd_buffer.c | 27 +++++++++++++------------
> > 4 files changed, 71 insertions(+), 33 deletions(-)
> >
> > diff --git a/src/intel/vulkan/anv_batch_chain.c
> > b/src/intel/vulkan/anv_batch_chain.c
> > index c6fdfe5..95df0c9 100644
> > --- a/src/intel/vulkan/anv_batch_chain.c
> > +++ b/src/intel/vulkan/anv_batch_chain.c
> > @@ -140,7 +140,7 @@ anv_reloc_list_grow(struct anv_reloc_list
> > *list,
> > return VK_SUCCESS;
> > }
> >
> > -uint64_t
> > +VkResult
> > anv_reloc_list_add(struct anv_reloc_list *list,
> > const VkAllocationCallbacks *alloc,
> > uint32_t offset, struct anv_bo *target_bo,
> > uint32_t delta)
> > @@ -151,8 +151,9 @@ anv_reloc_list_add(struct anv_reloc_list *list,
> > const uint32_t domain =
> > target_bo->is_winsys_bo ? I915_GEM_DOMAIN_RENDER : 0;
> >
> > - anv_reloc_list_grow(list, alloc, 1);
> > - /* TODO: Handle failure */
> > + VkResult result = anv_reloc_list_grow(list, alloc, 1);
> > + if (result != VK_SUCCESS)
> > + return result;
> >
> > /* XXX: Can we use I915_EXEC_HANDLE_LUT? */
> > index = list->num_relocs++;
> > @@ -166,16 +167,17 @@ anv_reloc_list_add(struct anv_reloc_list
> > *list,
> > entry->write_domain = domain;
> > VG(VALGRIND_CHECK_MEM_IS_DEFINED(entry, sizeof(*entry)));
> >
> > - return target_bo->offset + delta;
> > + return VK_SUCCESS;
> > }
> >
> > -static void
> > +static VkResult
> > anv_reloc_list_append(struct anv_reloc_list *list,
> > const VkAllocationCallbacks *alloc,
> > struct anv_reloc_list *other, uint32_t
> > offset)
> > {
> > - anv_reloc_list_grow(list, alloc, other->num_relocs);
> > - /* TODO: Handle failure */
> > + VkResult result = anv_reloc_list_grow(list, alloc, other-
> > >num_relocs);
> > + if (result != VK_SUCCESS)
> > + return result;
> >
> > memcpy(&list->relocs[list->num_relocs], &other->relocs[0],
> > other->num_relocs * sizeof(other->relocs[0]));
> > @@ -186,6 +188,7 @@ anv_reloc_list_append(struct anv_reloc_list
> > *list,
> > list->relocs[i + list->num_relocs].offset += offset;
> >
> > list->num_relocs += other->num_relocs;
> > + return VK_SUCCESS;
> > }
> >
> > /*--------------------------------------------------------------
> > ---------*
> > @@ -211,12 +214,19 @@ anv_batch_emit_dwords(struct anv_batch
> > *batch, int num_dwords)
> > return p;
> > }
> >
> > -uint64_t
> > +VkResult
> > anv_batch_emit_reloc(struct anv_batch *batch,
> > - void *location, struct anv_bo *bo, uint32_t
> > delta)
> > + void *location, struct anv_bo *bo, uint32_t
> > delta,
> > + uint64_t *offset)
> > {
> > - return anv_reloc_list_add(batch->relocs, batch->alloc,
> > - location - batch->start, bo, delta);
> > + VkResult result = anv_reloc_list_add(batch->relocs, batch-
> > >alloc,
> > + location - batch->start,
> > bo, delta);
> > + if (result != VK_SUCCESS)
> > + return result;
> I'm really sorry for the endless churn, but it looks to me that only
> anv_reloc_list_add() needs to report the error. I for some reason
> thought the
> callers of anv_batch_emit_reloc() need to take individual steps upon
> failure.
> All they really do is set the error state which we can do already
> here as
> you had in the original.
>
> So here just:
>
> if (result != VK_SUCCESS) {
> anv_batch_set_error(batch, result);
> return 0;
> }
>
> return bo->offset + delta;
>
> And leave _anv_combine_address() and blorp_emit_reloc() as they were.
> Now that
> you have written it out it becomes clearer to me.
Sure, no worries.
> >
> > +
> > + *offset = bo->offset + delta;
> > +
> > + return VK_SUCCESS;
> > }
> >
> > void
> > @@ -240,8 +250,12 @@ anv_batch_emit_batch(struct anv_batch *batch,
> > struct anv_batch *other)
> > memcpy(batch->next, other->start, size);
> >
> > offset = batch->next - batch->start;
> > - anv_reloc_list_append(batch->relocs, batch->alloc,
> > - other->relocs, offset);
> > + VkResult result = anv_reloc_list_append(batch->relocs, batch-
> > >alloc,
> > + other->relocs, offset);
> > + if (result != VK_SUCCESS) {
> > + anv_batch_set_error(batch, result);
> > + return;
> > + }
> >
> > batch->next += size;
> > }
> > diff --git a/src/intel/vulkan/anv_private.h
> > b/src/intel/vulkan/anv_private.h
> > index 87538de..081bfb6 100644
> > --- a/src/intel/vulkan/anv_private.h
> > +++ b/src/intel/vulkan/anv_private.h
> > @@ -673,7 +673,7 @@ VkResult anv_reloc_list_init(struct
> > anv_reloc_list *list,
> > void anv_reloc_list_finish(struct anv_reloc_list *list,
> > const VkAllocationCallbacks *alloc);
> >
> > -uint64_t anv_reloc_list_add(struct anv_reloc_list *list,
> > +VkResult anv_reloc_list_add(struct anv_reloc_list *list,
> > const VkAllocationCallbacks *alloc,
> > uint32_t offset, struct anv_bo
> > *target_bo,
> > uint32_t delta);
> > @@ -717,8 +717,9 @@ struct anv_batch {
> >
> > void *anv_batch_emit_dwords(struct anv_batch *batch, int
> > num_dwords);
> > void anv_batch_emit_batch(struct anv_batch *batch, struct
> > anv_batch *other);
> > -uint64_t anv_batch_emit_reloc(struct anv_batch *batch,
> > - void *location, struct anv_bo *bo,
> > uint32_t offset);
> > +VkResult anv_batch_emit_reloc(struct anv_batch *batch,
> > + void *location, struct anv_bo *bo,
> > + uint32_t delta, uint64_t *offset);
> > VkResult anv_device_submit_simple_batch(struct anv_device *device,
> > struct anv_batch *batch);
> >
> > @@ -751,7 +752,15 @@ _anv_combine_address(struct anv_batch *batch,
> > void *location,
> > } else {
> > assert(batch->start <= location && location < batch->end);
> >
> > - return anv_batch_emit_reloc(batch, location, address.bo,
> > address.offset + delta);
> > + uint64_t offset;
> > + VkResult result = anv_batch_emit_reloc(batch, location,
> > address.bo,
> > + address.offset +
> > delta, &offset);
> > + if (result != VK_SUCCESS) {
> > + anv_batch_set_error(batch, result);
> > + return 0;
> > + }
> > +
> > + return offset;
> > }
> > }
> >
> > diff --git a/src/intel/vulkan/genX_blorp_exec.c
> > b/src/intel/vulkan/genX_blorp_exec.c
> > index 7084735..f775ce8 100644
> > --- a/src/intel/vulkan/genX_blorp_exec.c
> > +++ b/src/intel/vulkan/genX_blorp_exec.c
> > @@ -48,8 +48,17 @@ blorp_emit_reloc(struct blorp_batch *batch,
> > struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> > assert(cmd_buffer->batch.start <= location &&
> > location < cmd_buffer->batch.end);
> > - return anv_batch_emit_reloc(&cmd_buffer->batch, location,
> > - address.buffer, address.offset +
> > delta);
> > +
> > + uint64_t offset;
> > + VkResult result =
> > + anv_batch_emit_reloc(&cmd_buffer->batch, location,
> > + address.buffer, address.offset + delta,
> > &offset);
> > + if (result != VK_SUCCESS) {
> > + anv_batch_set_error(&cmd_buffer->batch, result);
> > + return 0;
> > + }
> > +
> > + return offset;
> > }
> >
> > static void
> > @@ -57,8 +66,11 @@ blorp_surface_reloc(struct blorp_batch *batch,
> > uint32_t ss_offset,
> > struct blorp_address address, uint32_t delta)
> > {
> > struct anv_cmd_buffer *cmd_buffer = batch->driver_batch;
> > - anv_reloc_list_add(&cmd_buffer->surface_relocs, &cmd_buffer-
> > >pool->alloc,
> > - ss_offset, address.buffer, address.offset +
> > delta);
> > + VkResult result =
> > + anv_reloc_list_add(&cmd_buffer->surface_relocs, &cmd_buffer-
> > >pool->alloc,
> > + ss_offset, address.buffer, address.offset
> > + delta);
> > + if (result != VK_SUCCESS)
> > + anv_batch_set_error(&cmd_buffer->batch, result);
> > }
> >
> > static void *
> > diff --git a/src/intel/vulkan/genX_cmd_buffer.c
> > b/src/intel/vulkan/genX_cmd_buffer.c
> > index e3faa17..6a759f4 100644
> > --- a/src/intel/vulkan/genX_cmd_buffer.c
> > +++ b/src/intel/vulkan/genX_cmd_buffer.c
> > @@ -155,12 +155,19 @@
> > genX(cmd_buffer_emit_state_base_address)(struct anv_cmd_buffer
> > *cmd_buffer)
> > static void
> > add_surface_state_reloc(struct anv_cmd_buffer *cmd_buffer,
> > struct anv_state state,
> > + bool is_aux,
> > struct anv_bo *bo, uint32_t offset)
> > {
> > const struct isl_device *isl_dev = &cmd_buffer->device-
> > >isl_dev;
> >
> > - anv_reloc_list_add(&cmd_buffer->surface_relocs, &cmd_buffer-
> > >pool->alloc,
> > - state.offset + isl_dev->ss.addr_offset, bo,
> > offset);
> > + uint32_t total_offset = state.offset +
> > + (is_aux ? isl_dev->ss.aux_addr_offset : isl_dev-
> > >ss.addr_offset);
> > +
> > + VkResult result =
> > + anv_reloc_list_add(&cmd_buffer->surface_relocs, &cmd_buffer-
> > >pool->alloc,
> > + total_offset, bo, offset);
> > + if (result != VK_SUCCESS)
> > + anv_batch_set_error(&cmd_buffer->batch, result);
> > }
> >
> > static void
> > @@ -171,9 +178,7 @@ add_image_view_relocs(struct anv_cmd_buffer
> > *cmd_buffer,
> > {
> > const struct isl_device *isl_dev = &cmd_buffer->device-
> > >isl_dev;
> >
> > - anv_reloc_list_add(&cmd_buffer->surface_relocs, &cmd_buffer-
> > >pool->alloc,
> > - state.offset + isl_dev->ss.addr_offset,
> > - iview->bo, iview->offset);
> > + add_surface_state_reloc(cmd_buffer, state, false, iview->bo,
> > iview->offset);
> I also think we could avoid changes to add_surface_state_reloc()
> altogether
> if we handled the special case of aux below. So here just:
I made this change because Jason suggested that we have helpers to call
anv_reloc_list_add() so we can centralize error management a bit in
those helpers, and in this case add_surface_state_reloc() looked like
the natural place for it. That said, I don't think there is a
strong reason to do it. However:
> VkResult result = anv_reloc_list_add(
> &cmd_buffer->surface_relocs,
> &cmd_buffer->pool->alloc,
> state.offset + isl_dev->ss.addr_offset,
> iview->bo, iview->offset);
> if (result != VK_SUCCESS) {
> anv_batch_set_error(&cmd_buffer->batch, result);
> return;
> }
I think we want to do error management in add_surface_state_reloc()
because it is called from various other places and it calls
anv_reloc_list_add(), which can fail. Given that, the call to
anv_reloc_list_add() here is exactly a normal surface reloc, so I think
it makes sense to call add_surface_state_reloc() directly instead of
replicating it almost exactly here.
> >
> >
> > if (aux_usage != ISL_AUX_USAGE_NONE) {
> > uint32_t aux_offset = iview->offset + iview->image-
> > >aux_surface.offset;
> > @@ -186,9 +191,7 @@ add_image_view_relocs(struct anv_cmd_buffer
> > *cmd_buffer,
> > uint32_t *aux_addr_dw = state.map + isl_dev-
> > >ss.aux_addr_offset;
> > aux_offset += *aux_addr_dw & 0xfff;
> >
> > - anv_reloc_list_add(&cmd_buffer->surface_relocs, &cmd_buffer-
> > >pool->alloc,
> > - state.offset + isl_dev-
> > >ss.aux_addr_offset,
> > - iview->bo, aux_offset);
> And here:
>
> if (anv_reloc_list_add(&cmd_buffer->surface_relocs,
> &cmd_buffer->pool->alloc,
> state.offset + isl_dev-
> >ss.aux_addr_offset,
> iview->bo, aux_offset) != VK_SUCCESS)
> anv_batch_set_error(&cmd_buffer->batch, result);
Yes, we can do this. We would remove the "is_aux" parameter from
add_surface_state_reloc(), which was maybe a bit forced, and since this
is the only place where we needed it, I don't think it is a big deal to
handle it separately.
Does this sound reasonable?
> >
> > + add_surface_state_reloc(cmd_buffer, state, true, iview->bo,
> > aux_offset);
> > }
> > }
> >
> > @@ -1120,7 +1123,7 @@ emit_binding_table(struct anv_cmd_buffer
> > *cmd_buffer,
> > format, bo_offset, 12, 1);
> >
> > bt_map[0] = surface_state.offset + state_offset;
> > - add_surface_state_reloc(cmd_buffer, surface_state, bo,
> > bo_offset);
> > + add_surface_state_reloc(cmd_buffer, surface_state, false,
> > bo, bo_offset);
> > }
> >
> > if (map->surface_count == 0)
> > @@ -1221,7 +1224,7 @@ emit_binding_table(struct anv_cmd_buffer
> > *cmd_buffer,
> > case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
> > surface_state = desc->buffer_view->surface_state;
> > assert(surface_state.alloc_size);
> > - add_surface_state_reloc(cmd_buffer, surface_state,
> > + add_surface_state_reloc(cmd_buffer, surface_state, false,
> > desc->buffer_view->bo,
> > desc->buffer_view->offset);
> > break;
> > @@ -1248,7 +1251,7 @@ emit_binding_table(struct anv_cmd_buffer
> > *cmd_buffer,
> >
> > anv_fill_buffer_surface_state(cmd_buffer->device,
> > surface_state,
> > format, offset, range, 1);
> > - add_surface_state_reloc(cmd_buffer, surface_state,
> > + add_surface_state_reloc(cmd_buffer, surface_state, false,
> > desc->buffer->bo,
> > desc->buffer->offset + offset);
> > break;
> > @@ -1259,7 +1262,7 @@ emit_binding_table(struct anv_cmd_buffer
> > *cmd_buffer,
> > ? desc->buffer_view->writeonly_storage_surface_state
> > : desc->buffer_view->storage_surface_state;
> > assert(surface_state.alloc_size);
> > - add_surface_state_reloc(cmd_buffer, surface_state,
> > + add_surface_state_reloc(cmd_buffer, surface_state, false,
> > desc->buffer_view->bo,
> > desc->buffer_view->offset);
> >
More information about the mesa-dev
mailing list