[Mesa-dev] [PATCH 06/25] anv: Rework the way render target surfaces are allocated
Nanley Chery
nanleychery at gmail.com
Wed Nov 9 01:00:24 UTC 2016
On Tue, Nov 08, 2016 at 04:24:48PM -0800, Jason Ekstrand wrote:
> On Tue, Nov 8, 2016 at 3:13 PM, Nanley Chery <nanleychery at gmail.com> wrote:
>
> > On Sat, Oct 22, 2016 at 10:50:37AM -0700, Jason Ekstrand wrote:
> > > This commit moves the allocation and filling out of surface state from
> > > CreateImageView time to BeginRenderPass time. Instead of allocating the
> > > render target surface state as part of the image view, we allocate it in
> > > the command buffer state at the same time that we set up clears. For
> > > secondary command buffers, we allocate memory for the surface states in
> > > BeginCommandBuffer but don't fill them out; instead, we use our new
> > > SOL-based memcpy function to copy the surface states from the primary
> > > command buffer. This allows us to handle secondary command buffers
> > without
> > > the user specifying the framebuffer ahead-of-time.
> > > ---
> > > src/intel/vulkan/anv_cmd_buffer.c | 56 ----------
> > > src/intel/vulkan/anv_image.c | 22 ----
> > > src/intel/vulkan/anv_private.h | 24 ++++-
> > > src/intel/vulkan/genX_cmd_buffer.c | 204 +++++++++++++++++++++++++++++-
> > -------
> > > 4 files changed, 180 insertions(+), 126 deletions(-)
> > >
> > > diff --git a/src/intel/vulkan/anv_cmd_buffer.c
> > b/src/intel/vulkan/anv_cmd_buffer.c
> > > index a652f9a..372030c 100644
> > > --- a/src/intel/vulkan/anv_cmd_buffer.c
> > > +++ b/src/intel/vulkan/anv_cmd_buffer.c
> > > @@ -144,62 +144,6 @@ anv_cmd_state_reset(struct anv_cmd_buffer
> > *cmd_buffer)
> > > state->gen7.index_buffer = NULL;
> > > }
> > >
> > > -/**
> > > - * Setup anv_cmd_state::attachments for vkCmdBeginRenderPass.
> > > - */
> > > -void
> > > -anv_cmd_state_setup_attachments(struct anv_cmd_buffer *cmd_buffer,
> > > - const VkRenderPassBeginInfo *info)
> > > -{
> > > - struct anv_cmd_state *state = &cmd_buffer->state;
> > > - ANV_FROM_HANDLE(anv_render_pass, pass, info->renderPass);
> > > -
> > > - vk_free(&cmd_buffer->pool->alloc, state->attachments);
> > > -
> > > - if (pass->attachment_count == 0) {
> > > - state->attachments = NULL;
> > > - return;
> > > - }
> > > -
> > > - state->attachments = vk_alloc(&cmd_buffer->pool->alloc,
> > > - pass->attachment_count *
> > > - sizeof(state->attachments[0]),
> > > - 8, VK_SYSTEM_ALLOCATION_SCOPE_
> > OBJECT);
> > > - if (state->attachments == NULL) {
> > > - /* FIXME: Propagate VK_ERROR_OUT_OF_HOST_MEMORY to
> > vkEndCommandBuffer */
> > > - abort();
> > > - }
> > > -
> > > - for (uint32_t i = 0; i < pass->attachment_count; ++i) {
> > > - struct anv_render_pass_attachment *att = &pass->attachments[i];
> > > - VkImageAspectFlags att_aspects = vk_format_aspects(att->format);
> > > - VkImageAspectFlags clear_aspects = 0;
> > > -
> > > - if (att_aspects == VK_IMAGE_ASPECT_COLOR_BIT) {
> > > - /* color attachment */
> > > - if (att->load_op == VK_ATTACHMENT_LOAD_OP_CLEAR) {
> > > - clear_aspects |= VK_IMAGE_ASPECT_COLOR_BIT;
> > > - }
> > > - } else {
> > > - /* depthstencil attachment */
> > > - if ((att_aspects & VK_IMAGE_ASPECT_DEPTH_BIT) &&
> > > - att->load_op == VK_ATTACHMENT_LOAD_OP_CLEAR) {
> > > - clear_aspects |= VK_IMAGE_ASPECT_DEPTH_BIT;
> > > - }
> > > - if ((att_aspects & VK_IMAGE_ASPECT_STENCIL_BIT) &&
> > > - att->stencil_load_op == VK_ATTACHMENT_LOAD_OP_CLEAR) {
> > > - clear_aspects |= VK_IMAGE_ASPECT_STENCIL_BIT;
> > > - }
> > > - }
> > > -
> > > - state->attachments[i].pending_clear_aspects = clear_aspects;
> > > - if (clear_aspects) {
> > > - assert(info->clearValueCount > i);
> > > - state->attachments[i].clear_value = info->pClearValues[i];
> > > - }
> > > - }
> > > -}
> > > -
> > > VkResult
> > > anv_cmd_buffer_ensure_push_constants_size(struct anv_cmd_buffer
> > *cmd_buffer,
> > > gl_shader_stage stage,
> > uint32_t size)
> > > diff --git a/src/intel/vulkan/anv_image.c b/src/intel/vulkan/anv_image.c
> > > index b7c2e99..b014985 100644
> > > --- a/src/intel/vulkan/anv_image.c
> > > +++ b/src/intel/vulkan/anv_image.c
> > > @@ -504,23 +504,6 @@ anv_CreateImageView(VkDevice _device,
> > > iview->sampler_surface_state.alloc_size = 0;
> > > }
> > >
> > > - if (image->usage & VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT) {
> > > - iview->color_rt_surface_state = alloc_surface_state(device);
> > > -
> > > - struct isl_view view = iview->isl;
> > > - view.usage |= ISL_SURF_USAGE_RENDER_TARGET_BIT;
> > > - isl_surf_fill_state(&device->isl_dev,
> > > - iview->color_rt_surface_state.map,
> > > - .surf = &surface->isl,
> > > - .view = &view,
> > > - .mocs = device->default_mocs);
> > > -
> > > - if (!device->info.has_llc)
> > > - anv_state_clflush(iview->color_rt_surface_state);
> > > - } else {
> > > - iview->color_rt_surface_state.alloc_size = 0;
> > > - }
> > > -
> > > /* NOTE: This one needs to go last since it may stomp
> > isl_view.format */
> > > if (image->usage & VK_IMAGE_USAGE_STORAGE_BIT) {
> > > iview->storage_surface_state = alloc_surface_state(device);
> > > @@ -565,11 +548,6 @@ anv_DestroyImageView(VkDevice _device, VkImageView
> > _iview,
> > > ANV_FROM_HANDLE(anv_device, device, _device);
> > > ANV_FROM_HANDLE(anv_image_view, iview, _iview);
> > >
> > > - if (iview->color_rt_surface_state.alloc_size > 0) {
> > > - anv_state_pool_free(&device->surface_state_pool,
> > > - iview->color_rt_surface_state);
> > > - }
> > > -
> > > if (iview->sampler_surface_state.alloc_size > 0) {
> > > anv_state_pool_free(&device->surface_state_pool,
> > > iview->sampler_surface_state);
> > > diff --git a/src/intel/vulkan/anv_private.h b/src/intel/vulkan/anv_
> > private.h
> > > index a6611f1..2a98ea1 100644
> > > --- a/src/intel/vulkan/anv_private.h
> > > +++ b/src/intel/vulkan/anv_private.h
> > > @@ -1059,6 +1059,8 @@ void anv_dynamic_state_copy(struct
> > anv_dynamic_state *dest,
> > > * The clear value is valid only if there exists a pending clear.
> > > */
> > > struct anv_attachment_state {
> > > + struct anv_state color_rt_state;
> > > +
> > > VkImageAspectFlags pending_clear_aspects;
> > > VkClearValue clear_value;
> > > };
> > > @@ -1099,6 +1101,19 @@ struct anv_cmd_state {
> > > */
> > > struct anv_attachment_state * attachments;
> > >
> > > + /**
> > > + * Surface states for color render targets. These are stored in a
> > single
> > > + * flat array. For depth-stencil attachments, the surface state is
> > simply
> > > + * left blank.
> > > + */
> > > + struct anv_state render_pass_states;
> > > +
> > > + /**
> > > + * A null surface state of the right size to match the framebuffer.
> > This
> > > + * is one of the states in render_pass_states.
> > > + */
> > > + struct anv_state null_surface_state;
> > > +
> > > struct {
> > > struct anv_buffer * index_buffer;
> > > uint32_t index_type; /**<
> > 3DSTATE_INDEX_BUFFER.IndexFormat */
> > > @@ -1237,8 +1252,10 @@ void gen8_cmd_buffer_emit_depth_viewport(struct
> > anv_cmd_buffer *cmd_buffer,
> > > bool depth_clamp_enable);
> > > void gen7_cmd_buffer_emit_scissor(struct anv_cmd_buffer *cmd_buffer);
> > >
> > > -void anv_cmd_state_setup_attachments(struct anv_cmd_buffer *cmd_buffer,
> > > - const VkRenderPassBeginInfo *info);
> > > +void anv_cmd_buffer_setup_attachments(struct anv_cmd_buffer
> > *cmd_buffer,
> > > + struct anv_render_pass *pass,
> > > + struct anv_framebuffer
> > *framebuffer,
> > > + const VkClearValue *clear_values);
> > >
> > > struct anv_state
> > > anv_cmd_buffer_push_constants(struct anv_cmd_buffer *cmd_buffer,
> > > @@ -1549,9 +1566,6 @@ struct anv_image_view {
> > > VkFormat vk_format;
> > > VkExtent3D extent; /**< Extent of VkImageViewCreateInfo::baseMipLevel.
> > */
> > >
> > > - /** RENDER_SURFACE_STATE when using image as a color render target.
> > */
> > > - struct anv_state color_rt_surface_state;
> > > -
> > > /** RENDER_SURFACE_STATE when using image as a sampler surface. */
> > > struct anv_state sampler_surface_state;
> > >
> > > diff --git a/src/intel/vulkan/genX_cmd_buffer.c
> > b/src/intel/vulkan/genX_cmd_buffer.c
> > > index 8734389..78b9bcc 100644
> > > --- a/src/intel/vulkan/genX_cmd_buffer.c
> > > +++ b/src/intel/vulkan/genX_cmd_buffer.c
> > > @@ -25,6 +25,7 @@
> > > #include <stdbool.h>
> > >
> > > #include "anv_private.h"
> > > +#include "vk_format_info.h"
> > >
> > > #include "common/gen_l3_config.h"
> > > #include "genxml/gen_macros.h"
> > > @@ -150,6 +151,142 @@ genX(cmd_buffer_emit_state_base_address)(struct
> > anv_cmd_buffer *cmd_buffer)
> > > }
> > > }
> > >
> > > +/**
> > > + * Setup anv_cmd_state::attachments for vkCmdBeginRenderPass.
> > > + */
> > > +static void
> > > +genX(cmd_buffer_setup_attachments)(struct anv_cmd_buffer *cmd_buffer,
> > > + struct anv_render_pass *pass,
> > > + struct anv_framebuffer *framebuffer,
> > > + const VkClearValue *clear_values)
> > > +{
> > > + const struct isl_device *isl_dev = &cmd_buffer->device->isl_dev;
> > > + struct anv_cmd_state *state = &cmd_buffer->state;
> > > +
> > > + vk_free(&cmd_buffer->pool->alloc, state->attachments);
> > > +
> > > + if (pass->attachment_count == 0) {
> > > + state->attachments = NULL;
> > > + return;
> > > + }
> > > +
> > > + state->attachments = vk_alloc(&cmd_buffer->pool->alloc,
> > > + pass->attachment_count *
> > > + sizeof(state->attachments[0]),
> > > + 8, VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
> > > + if (state->attachments == NULL) {
> > > + /* FIXME: Propagate VK_ERROR_OUT_OF_HOST_MEMORY to
> > vkEndCommandBuffer */
> > > + abort();
> > > + }
> > > +
> > > + bool need_null_state = false;
> > > + for (uint32_t s = 0; s < pass->subpass_count; ++s) {
> > > + if (pass->subpasses[s].color_count == 0) {
> > > + need_null_state = true;
> > > + break;
> > > + }
> > > + }
> > > +
> > > + unsigned num_states = need_null_state;
> > > + for (uint32_t i = 0; i < pass->attachment_count; ++i) {
> > > + if (vk_format_is_color(pass->attachments[i].format))
> > > + num_states++;
> > > + }
> > > +
> > > + const uint32_t ss_stride = align_u32(isl_dev->ss.size,
> > isl_dev->ss.align);
> > > + state->render_pass_states =
> > > + anv_state_stream_alloc(&cmd_buffer->surface_state_stream,
> > > + num_states * ss_stride, isl_dev->ss.align);
> > > +
> > > + struct anv_state next_state = state->render_pass_states;
> > > + next_state.alloc_size = isl_dev->ss.size;
> > > +
> > > + if (need_null_state) {
> > > + state->null_surface_state = next_state;
> > > + next_state.offset += ss_stride;
> > > + next_state.map += ss_stride;
> > > + }
> > > +
> > > + for (uint32_t i = 0; i < pass->attachment_count; ++i) {
> > > + if (vk_format_is_color(pass->attachments[i].format)) {
> > > + state->attachments[i].color_rt_state = next_state;
> > > + next_state.offset += ss_stride;
> > > + next_state.map += ss_stride;
> > > + }
> > > + }
> > > + assert(next_state.offset == state->render_pass_states.offset +
> > > + state->render_pass_states.alloc_size);
> > > +
> > > + if (framebuffer) {
> > > + assert(pass->attachment_count == framebuffer->attachment_count);
> > > +
> > > + if (need_null_state) {
> > > + struct GENX(RENDER_SURFACE_STATE) null_ss = {
> > > + .SurfaceType = SURFTYPE_NULL,
> > > + .SurfaceArray = framebuffer->layers > 0,
> > > + .SurfaceFormat = ISL_FORMAT_R8G8B8A8_UNORM,
> > > +#if GEN_GEN >= 8
> > > + .TileMode = YMAJOR,
> > > +#else
> > > + .TiledSurface = true,
> > > +#endif
> > > + .Width = framebuffer->width - 1,
> > > + .Height = framebuffer->height - 1,
> > > + .Depth = framebuffer->layers - 1,
> > > + .RenderTargetViewExtent = framebuffer->layers - 1,
> > > + };
> > > + GENX(RENDER_SURFACE_STATE_pack)(NULL,
> > state->null_surface_state.map,
> > > + &null_ss);
> > > + }
> > > +
> > > + for (uint32_t i = 0; i < pass->attachment_count; ++i) {
> > > + struct anv_render_pass_attachment *att = &pass->attachments[i];
> > > + VkImageAspectFlags att_aspects = vk_format_aspects(att->format)
> > ;
> > > + VkImageAspectFlags clear_aspects = 0;
> > > +
> > > + if (att_aspects == VK_IMAGE_ASPECT_COLOR_BIT) {
> > > + /* color attachment */
> > > + if (att->load_op == VK_ATTACHMENT_LOAD_OP_CLEAR) {
> > > + clear_aspects |= VK_IMAGE_ASPECT_COLOR_BIT;
> > > + }
> > > + } else {
> > > + /* depthstencil attachment */
> > > + if ((att_aspects & VK_IMAGE_ASPECT_DEPTH_BIT) &&
> > > + att->load_op == VK_ATTACHMENT_LOAD_OP_CLEAR) {
> > > + clear_aspects |= VK_IMAGE_ASPECT_DEPTH_BIT;
> > > + }
> > > + if ((att_aspects & VK_IMAGE_ASPECT_STENCIL_BIT) &&
> > > + att->stencil_load_op == VK_ATTACHMENT_LOAD_OP_CLEAR) {
> > > + clear_aspects |= VK_IMAGE_ASPECT_STENCIL_BIT;
> > > + }
> > > + }
> > > +
> > > + state->attachments[i].pending_clear_aspects = clear_aspects;
> > > + if (clear_aspects)
> > > + state->attachments[i].clear_value = clear_values[i];
> > > +
> > > + struct anv_image_view *iview = framebuffer->attachments[i];
> > > + assert(iview->image->vk_format == att->format);
> >
> > This assertion fails when running Dota 2 on your wip/anv-null-fb branch.
> > I don't know if this branch is the most up-to-date version of this
> > series, but it was the easiest way to test it (I couldn't get the mailing
> > list patches to apply with git am). Are you able to reproduce this?
> >
>
> That's odd... I haven't seen that and I have run dota2 with CCS on top of
> this branch but may be not in a debug build. What are the two formats when
> it fails? I suppose it's possible that it's ATTACHMENT_UNUSED or something.
>
(gdb) p iview->image->vk_format
$1 = VK_FORMAT_B8G8R8A8_SRGB
(gdb) p att->format
$2 = VK_FORMAT_B8G8R8A8_UNORM
>
> > - Nanley
> >
> > > +
> > > + if (att_aspects == VK_IMAGE_ASPECT_COLOR_BIT) {
> > > + struct isl_view view = iview->isl;
> > > + view.usage |= ISL_SURF_USAGE_RENDER_TARGET_BIT;
> > > + isl_surf_fill_state(isl_dev,
> > > + state->attachments[i].color_
> > rt_state.map,
> > > + .surf = &iview->image->color_surface.
> > isl,
> > > + .view = &view,
> > > + .mocs = cmd_buffer->device->default_
> > mocs);
> > > +
> > > + anv_cmd_buffer_add_surface_state_reloc(cmd_buffer,
> > > + state->attachments[i].color_rt_state, iview->bo,
> > iview->offset);
> > > + }
> > > + }
> > > +
> > > + if (!cmd_buffer->device->info.has_llc)
> > > + anv_state_clflush(state->render_pass_states);
> > > + }
> > > +}
> > > +
> > > VkResult
> > > genX(BeginCommandBuffer)(
> > > VkCommandBuffer commandBuffer,
> > > @@ -189,6 +326,9 @@ genX(BeginCommandBuffer)(
> > > cmd_buffer->state.subpass =
> > > &cmd_buffer->state.pass->subpasses[pBeginInfo->
> > pInheritanceInfo->subpass];
> > >
> > > + genX(cmd_buffer_setup_attachments)(cmd_buffer,
> > cmd_buffer->state.pass,
> > > + NULL, NULL);
> > > +
> > > cmd_buffer->state.dirty |= ANV_CMD_DIRTY_RENDER_TARGETS;
> > > }
> > >
> > > @@ -232,6 +372,22 @@ genX(CmdExecuteCommands)(
> > >
> > > assert(secondary->level == VK_COMMAND_BUFFER_LEVEL_SECONDARY);
> > >
> > > + if (secondary->usage_flags &
> > > + VK_COMMAND_BUFFER_USAGE_RENDER_PASS_CONTINUE_BIT) {
> > > + /* If we're continuing a render pass from the primary, we need
> > to
> > > + * copy the surface states for the current subpass into the
> > storage
> > > + * we allocated for them in BeginCommandBuffer.
> > > + */
> > > + struct anv_bo *ss_bo = &primary->device->surface_
> > state_block_pool.bo;
> > > + struct anv_state src_state = primary->state.render_pass_
> > states;
> > > + struct anv_state dst_state = secondary->state.render_pass_
> > states;
> > > + assert(src_state.alloc_size == dst_state.alloc_size);
> > > +
> > > + genX(cmd_buffer_gpu_memcpy)(primary, ss_bo, dst_state.offset,
> > > + ss_bo, src_state.offset,
> > > + src_state.alloc_size);
> > > + }
> > > +
> > > anv_cmd_buffer_add_secondary(primary, secondary);
> > > }
> > >
> > > @@ -628,43 +784,11 @@ cmd_buffer_alloc_push_constants(struct
> > anv_cmd_buffer *cmd_buffer)
> > > cmd_buffer->state.push_constants_dirty |=
> > VK_SHADER_STAGE_ALL_GRAPHICS;
> > > }
> > >
> > > -static struct anv_state
> > > -alloc_null_surface_state(struct anv_cmd_buffer *cmd_buffer,
> > > - struct anv_framebuffer *fb)
> > > -{
> > > - struct anv_state state =
> > > - anv_cmd_buffer_alloc_surface_state(cmd_buffer);
> > > -
> > > - struct GENX(RENDER_SURFACE_STATE) null_ss = {
> > > - .SurfaceType = SURFTYPE_NULL,
> > > - .SurfaceArray = fb->layers > 0,
> > > - .SurfaceFormat = ISL_FORMAT_R8G8B8A8_UNORM,
> > > -#if GEN_GEN >= 8
> > > - .TileMode = YMAJOR,
> > > -#else
> > > - .TiledSurface = true,
> > > -#endif
> > > - .Width = fb->width - 1,
> > > - .Height = fb->height - 1,
> > > - .Depth = fb->layers - 1,
> > > - .RenderTargetViewExtent = fb->layers - 1,
> > > - };
> > > -
> > > - GENX(RENDER_SURFACE_STATE_pack)(NULL, state.map, &null_ss);
> > > -
> > > - if (!cmd_buffer->device->info.has_llc)
> > > - anv_state_clflush(state);
> > > -
> > > - return state;
> > > -}
> > > -
> > > -
> > > static VkResult
> > > emit_binding_table(struct anv_cmd_buffer *cmd_buffer,
> > > gl_shader_stage stage,
> > > struct anv_state *bt_state)
> > > {
> > > - struct anv_framebuffer *fb = cmd_buffer->state.framebuffer;
> > > struct anv_subpass *subpass = cmd_buffer->state.subpass;
> > > struct anv_pipeline *pipeline;
> > > uint32_t bias, state_offset;
> > > @@ -743,17 +867,10 @@ emit_binding_table(struct anv_cmd_buffer
> > *cmd_buffer,
> > > assert(stage == MESA_SHADER_FRAGMENT);
> > > assert(binding->binding == 0);
> > > if (binding->index < subpass->color_count) {
> > > - const struct anv_image_view *iview =
> > > - fb->attachments[subpass->color_attachments[binding->
> > index]];
> > > -
> > > - assert(iview->color_rt_surface_state.alloc_size);
> > > - surface_state = iview->color_rt_surface_state;
> > > - anv_cmd_buffer_add_surface_state_reloc(cmd_buffer,
> > surface_state,
> > > - iview->bo,
> > iview->offset);
> > > + const unsigned att = subpass->color_attachments[
> > binding->index];
> > > + surface_state = cmd_buffer->state.attachments[
> > att].color_rt_state;
> > > } else {
> > > - /* Null render target */
> > > - struct anv_framebuffer *fb = cmd_buffer->state.framebuffer;
> > > - surface_state = alloc_null_surface_state(cmd_buffer, fb);
> > > + surface_state = cmd_buffer->state.null_surface_state;
> > > }
> > >
> > > bt_map[bias + s] = surface_state.offset + state_offset;
> > > @@ -1837,7 +1954,8 @@ void genX(CmdBeginRenderPass)(
> > > cmd_buffer->state.framebuffer = framebuffer;
> > > cmd_buffer->state.pass = pass;
> > > cmd_buffer->state.render_area = pRenderPassBegin->renderArea;
> > > - anv_cmd_state_setup_attachments(cmd_buffer, pRenderPassBegin);
> > > + genX(cmd_buffer_setup_attachments)(cmd_buffer, pass, framebuffer,
> > > + pRenderPassBegin->pClearValues);
> > >
> > > genX(flush_pipeline_select_3d)(cmd_buffer);
> > >
> > > --
> > > 2.5.0.400.gff86faf
> > >
> > > _______________________________________________
> > > mesa-dev mailing list
> > > mesa-dev at lists.freedesktop.org
> > > https://lists.freedesktop.org/mailman/listinfo/mesa-dev
> >
More information about the mesa-dev
mailing list