<div dir="ltr">This patch causes a perf drop in the Sascha Willems gears demo.  I'm investigating.<br></div><div class="gmail_extra"><br><div class="gmail_quote">On Mon, Nov 27, 2017 at 7:06 PM, Jason Ekstrand <span dir="ltr">&lt;<a href="mailto:jason@jlekstrand.net" target="_blank">jason@jlekstrand.net</a>&gt;</span> wrote:<br><blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex">---<br>
 src/intel/vulkan/genX_cmd_<wbr>buffer.c | 187 +++++++++++++-----------------<wbr>-------<br>
 1 file changed, 65 insertions(+), 122 deletions(-)<br>
<br>
diff --git a/src/intel/vulkan/genX_cmd_<wbr>buffer.c b/src/intel/vulkan/genX_cmd_<wbr>buffer.c<br>
index 7901b0c..2c4ab38 100644<br>
--- a/src/intel/vulkan/genX_cmd_<wbr>buffer.c<br>
+++ b/src/intel/vulkan/genX_cmd_<wbr>buffer.c<br>
@@ -2982,120 +2982,6 @@ cmd_buffer_emit_depth_stencil(<wbr>struct anv_cmd_buffer *cmd_buffer)<br>
    cmd_buffer->state.hiz_enabled = info.hiz_usage == ISL_AUX_USAGE_HIZ;<br>
 }<br>
<br>
-<br>
-/**<br>
- * @brief Perform any layout transitions required at the beginning and/or end<br>
- *        of the current subpass for depth buffers.<br>
- *<br>
- * TODO: Consider preprocessing the attachment reference array at render pass<br>
- *       create time to determine if no layout transition is needed at the<br>
- *       beginning and/or end of each subpass.<br>
- *<br>
- * @param cmd_buffer The command buffer the transition is happening within.<br>
- * @param subpass_end If true, marks that the transition is happening at the<br>
- *                    end of the subpass.<br>
- */<br>
-static void<br>
-cmd_buffer_subpass_<wbr>transition_layouts(struct anv_cmd_buffer * const cmd_buffer,<br>
-                                      const bool subpass_end)<br>
-{<br>
-   /* We need a non-NULL command buffer. */<br>
-   assert(cmd_buffer);<br>
-<br>
-   const struct anv_cmd_state * const cmd_state = &cmd_buffer->state;<br>
-   const struct anv_subpass * const subpass = cmd_state->subpass;<br>
-<br>
-   /* This function must be called within a subpass. */<br>
-   assert(subpass);<br>
-<br>
-   /* If there are attachment references, the array shouldn't be NULL.<br>
-    */<br>
-   if (subpass->attachment_count > 0)<br>
-      assert(subpass->attachments);<br>
-<br>
-   /* Iterate over the array of attachment references. */<br>
-   for (const VkAttachmentReference *att_ref = subpass->attachments;<br>
-        att_ref < subpass->attachments + subpass->attachment_count; att_ref++) {<br>
-<br>
-      /* If the attachment is unused, we can't perform a layout transition. */<br>
-      if (att_ref->attachment == VK_ATTACHMENT_UNUSED)<br>
-         continue;<br>
-<br>
-      /* This attachment index shouldn't go out of bounds. */<br>
-      assert(att_ref->attachment < cmd_state->pass->attachment_<wbr>count);<br>
-<br>
-      const struct anv_render_pass_attachment * const att_desc =<br>
-         &cmd_state->pass->attachments[<wbr>att_ref->attachment];<br>
-      struct anv_attachment_state * const att_state =<br>
-         &cmd_buffer->state.<wbr>attachments[att_ref-><wbr>attachment];<br>
-<br>
-      /* The attachment should not be used in a subpass after its last. */<br>
-      assert(att_desc->last_subpass_<wbr>idx >= anv_get_subpass_id(cmd_state))<wbr>;<br>
-<br>
-      if (subpass_end && anv_get_subpass_id(cmd_state) <<br>
-          att_desc->last_subpass_idx) {<br>
-         /* We're calling this function on a buffer twice in one subpass and<br>
-          * this is not the last use of the buffer. The layout should not have<br>
-          * changed from the first call and no transition is necessary.<br>
-          */<br>
-         assert(att_state->current_<wbr>layout == att_ref->layout ||<br>
-                att_state->current_layout ==<br>
-                VK_IMAGE_LAYOUT_COLOR_<wbr>ATTACHMENT_OPTIMAL);<br>
-         continue;<br>
-      }<br>
-<br>
-      /* The attachment index must be less than the number of attachments<br>
-       * within the framebuffer.<br>
-       */<br>
-      assert(att_ref->attachment < cmd_state->framebuffer-><wbr>attachment_count);<br>
-<br>
-      const struct anv_image_view * const iview =<br>
-         cmd_state->framebuffer-><wbr>attachments[att_ref-><wbr>attachment];<br>
-      const struct anv_image * const image = iview->image;<br>
-<br>
-      /* Get the appropriate target layout for this attachment. */<br>
-      VkImageLayout target_layout;<br>
-<br>
-      /* A resolve is necessary before use as an input attachment if the clear<br>
-       * color or auxiliary buffer usage isn't supported by the sampler.<br>
-       */<br>
-      const bool input_needs_resolve =<br>
-            (att_state->fast_clear && !att_state->clear_color_is_<wbr>zero_one) ||<br>
-            att_state->input_aux_usage != att_state->aux_usage;<br>
-      if (subpass_end) {<br>
-         target_layout = att_desc->final_layout;<br>
-      } else if (iview->aspect_mask & VK_IMAGE_ASPECT_ANY_COLOR_BIT_<wbr>ANV &&<br>
-                 !input_needs_resolve) {<br>
-         /* Layout transitions before the final only help to enable sampling as<br>
-          * an input attachment. If the input attachment supports sampling<br>
-          * using the auxiliary surface, we can skip such transitions by making<br>
-          * the target layout one that is CCS-aware.<br>
-          */<br>
-         target_layout = VK_IMAGE_LAYOUT_COLOR_<wbr>ATTACHMENT_OPTIMAL;<br>
-      } else {<br>
-         target_layout = att_ref->layout;<br>
-      }<br>
-<br>
-      /* Perform the layout transition. */<br>
-      if (image->aspects & VK_IMAGE_ASPECT_DEPTH_BIT) {<br>
-         transition_depth_buffer(cmd_<wbr>buffer, image,<br>
-                                 att_state->current_layout, target_layout);<br>
-         att_state->aux_usage =<br>
-            anv_layout_to_aux_usage(&cmd_<wbr>buffer->device->info, image,<br>
-                                    VK_IMAGE_ASPECT_DEPTH_BIT, target_layout);<br>
-      } else if (image->aspects & VK_IMAGE_ASPECT_ANY_COLOR_BIT_<wbr>ANV) {<br>
-         assert(image->aspects == VK_IMAGE_ASPECT_COLOR_BIT);<br>
-         transition_color_buffer(cmd_<wbr>buffer, image, VK_IMAGE_ASPECT_COLOR_BIT,<br>
-                                 iview->planes[0].isl.base_<wbr>level, 1,<br>
-                                 iview->planes[0].isl.base_<wbr>array_layer,<br>
-                                 iview->planes[0].isl.array_<wbr>len,<br>
-                                 att_state->current_layout, target_layout);<br>
-      }<br>
-<br>
-      att_state->current_layout = target_layout;<br>
-   }<br>
-}<br>
-<br>
 static void<br>
 cmd_buffer_begin_subpass(<wbr>struct anv_cmd_buffer *cmd_buffer,<br>
                          uint32_t subpass_id)<br>
@@ -3120,11 +3006,6 @@ cmd_buffer_begin_subpass(<wbr>struct anv_cmd_buffer *cmd_buffer,<br>
    cmd_buffer->state.pending_<wbr>pipe_bits |=<br>
       cmd_buffer->state.pass-><wbr>subpass_flushes[subpass_id];<br>
<br>
-   /* Perform transitions to the subpass layout before any writes have<br>
-    * occurred.<br>
-    */<br>
-   cmd_buffer_subpass_transition_<wbr>layouts(cmd_buffer, false);<br>
-<br>
    VkRect2D render_area = cmd_buffer->state.render_area;<br>
    struct anv_framebuffer *fb = cmd_buffer->state.framebuffer;<br>
<br>
@@ -3139,6 +3020,39 @@ cmd_buffer_begin_subpass(<wbr>struct anv_cmd_buffer *cmd_buffer,<br>
       struct anv_image_view *iview = fb->attachments[a];<br>
       const struct anv_image *image = iview->image;<br>
<br>
+      /* A resolve is necessary before use as an input attachment if the clear<br>
+       * color or auxiliary buffer usage isn't supported by the sampler.<br>
+       */<br>
+      const bool input_needs_resolve =<br>
+            (att_state->fast_clear && !att_state->clear_color_is_<wbr>zero_one) ||<br>
+            att_state->input_aux_usage != att_state->aux_usage;<br>
+<br>
+      VkImageLayout target_layout;<br>
+      if (iview->aspect_mask & VK_IMAGE_ASPECT_ANY_COLOR_BIT_<wbr>ANV &&<br>
+          !input_needs_resolve) {<br>
+         /* Layout transitions before the final only help to enable sampling<br>
+          * as an input attachment. If the input attachment supports sampling<br>
+          * using the auxiliary surface, we can skip such transitions by<br>
+          * making the target layout one that is CCS-aware.<br>
+          */<br>
+         target_layout = VK_IMAGE_LAYOUT_COLOR_<wbr>ATTACHMENT_OPTIMAL;<br>
+      } else {<br>
+         target_layout = subpass->attachments[i].<wbr>layout;<br>
+      }<br>
+<br>
+      if (image->aspects & VK_IMAGE_ASPECT_ANY_COLOR_BIT_<wbr>ANV) {<br>
+         assert(image->aspects == VK_IMAGE_ASPECT_COLOR_BIT);<br>
+         transition_color_buffer(cmd_<wbr>buffer, image, VK_IMAGE_ASPECT_COLOR_BIT,<br>
+                                 iview->planes[0].isl.base_<wbr>level, 1,<br>
+                                 iview->planes[0].isl.base_<wbr>array_layer,<br>
+                                 iview->planes[0].isl.array_<wbr>len,<br>
+                                 att_state->current_layout, target_layout);<br>
+      } else if (image->aspects & VK_IMAGE_ASPECT_DEPTH_BIT) {<br>
+         transition_depth_buffer(cmd_<wbr>buffer, image,<br>
+                                 att_state->current_layout, target_layout);<br>
+      }<br>
+      att_state->current_layout = target_layout;<br>
+<br>
       if (att_state->pending_clear_<wbr>aspects & VK_IMAGE_ASPECT_COLOR_BIT) {<br>
          assert(att_state->pending_<wbr>clear_aspects == VK_IMAGE_ASPECT_COLOR_BIT);<br>
<br>
@@ -3251,13 +3165,42 @@ cmd_buffer_begin_subpass(<wbr>struct anv_cmd_buffer *cmd_buffer,<br>
 static void<br>
 cmd_buffer_end_subpass(struct anv_cmd_buffer *cmd_buffer)<br>
 {<br>
+   struct anv_cmd_state *cmd_state = &cmd_buffer->state;<br>
+   struct anv_subpass *subpass = cmd_state->subpass;<br>
    uint32_t subpass_id = anv_get_subpass_id(&cmd_<wbr>buffer->state);<br>
<br>
    anv_cmd_buffer_resolve_<wbr>subpass(cmd_buffer);<br>
<br>
-   /* Perform transitions to the final layout after all writes have occurred.<br>
-    */<br>
-   cmd_buffer_subpass_transition_<wbr>layouts(cmd_buffer, true);<br>
+   struct anv_framebuffer *fb = cmd_buffer->state.framebuffer;<br>
+   for (uint32_t i = 0; i < subpass->attachment_count; ++i) {<br>
+      const uint32_t a = subpass->attachments[i].<wbr>attachment;<br>
+      if (a == VK_ATTACHMENT_UNUSED)<br>
+         continue;<br>
+<br>
+      if (cmd_state->pass->attachments[<wbr>a].last_subpass_idx != subpass_id)<br>
+         continue;<br>
+<br>
+      assert(a < cmd_state->pass->attachment_<wbr>count);<br>
+      struct anv_attachment_state *att_state = &cmd_state->attachments[a];<br>
+      struct anv_image_view *iview = fb->attachments[a];<br>
+      const struct anv_image *image = iview->image;<br>
+<br>
+      /* Transition the image into the final layout for this render pass */<br>
+      VkImageLayout target_layout =<br>
+         cmd_state->pass->attachments[<wbr>a].final_layout;<br>
+<br>
+      if (image->aspects & VK_IMAGE_ASPECT_ANY_COLOR_BIT_<wbr>ANV) {<br>
+         assert(image->aspects == VK_IMAGE_ASPECT_COLOR_BIT);<br>
+         transition_color_buffer(cmd_<wbr>buffer, image, VK_IMAGE_ASPECT_COLOR_BIT,<br>
+                                 iview->planes[0].isl.base_<wbr>level, 1,<br>
+                                 iview->planes[0].isl.base_<wbr>array_layer,<br>
+                                 iview->planes[0].isl.array_<wbr>len,<br>
+                                 att_state->current_layout, target_layout);<br>
+      } else if (image->aspects & VK_IMAGE_ASPECT_DEPTH_BIT) {<br>
+         transition_depth_buffer(cmd_<wbr>buffer, image,<br>
+                                 att_state->current_layout, target_layout);<br>
+      }<br>
+   }<br>
<br>
    /* Accumulate any subpass flushes that need to happen after the subpass.<br>
     * Yes, they do get accumulated twice in the NextSubpass case but since<br>
<span class="HOEnZb"><font color="#888888">--<br>
2.5.0.400.gff86faf<br>
<br>
</font></span></blockquote></div><br></div>