<div dir="ltr"><div class="gmail_extra"><div class="gmail_quote">On Fri, May 26, 2017 at 4:30 PM, Jason Ekstrand <span dir="ltr"><<a href="mailto:jason@jlekstrand.net" target="_blank">jason@jlekstrand.net</a>></span> wrote:<br><blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex">---<br>
 src/mesa/drivers/dri/i965/brw_<wbr>context.c       | 35 +++----------------<br>
 src/mesa/drivers/dri/i965/brw_<wbr>draw.c          |  4 +--<br>
 src/mesa/drivers/dri/i965/<wbr>intel_mipmap_tree.c | 48 +++++++++++++++++++++++++++<br>
 src/mesa/drivers/dri/i965/<wbr>intel_mipmap_tree.h |  9 +++++<br>
 4 files changed, 63 insertions(+), 33 deletions(-)<br>
<br>
diff --git a/src/mesa/drivers/dri/i965/<wbr>brw_context.c b/src/mesa/drivers/dri/i965/<wbr>brw_context.c<br>
index 07ddaf0..48e8b6c 100644<br>
--- a/src/mesa/drivers/dri/i965/<wbr>brw_context.c<br>
+++ b/src/mesa/drivers/dri/i965/<wbr>brw_context.c<br>
@@ -301,38 +301,11 @@ intel_update_state(struct gl_context * ctx, GLuint new_state)<br>
       if (irb == NULL || irb->mt == NULL)<br>
          continue;<br>
<br>
-      struct intel_mipmap_tree *mt = irb->mt;<br>
+      intel_miptree_prepare_render(<wbr>brw, irb->mt, irb->mt_level,<br>
+                                   irb->mt_layer, irb->layer_count,<br>
+                                   ctx->Color.sRGBEnabled);<br>
<br>
-      /* If FRAMEBUFFER_SRGB is used on Gen9+ then we need to resolve any of<br>
-       * the single-sampled color renderbuffers because the CCS buffer isn't<br>
-       * supported for SRGB formats. This only matters if FRAMEBUFFER_SRGB is<br>
-       * enabled because otherwise the surface state will be programmed with<br>
-       * the linear equivalent format anyway.<br>
-       */<br>
-      if (brw->gen >= 9 && ctx->Color.sRGBEnabled && mt->num_samples <= 1 &&<br>
-          _mesa_get_srgb_format_linear(<wbr>mt->format) != mt->format) {<br>
-<br>
-         /* Lossless compression is not supported for SRGB formats, it<br>
-          * should be impossible to get here with such surfaces.<br>
-          */<br>
-         assert(!intel_miptree_is_<wbr>lossless_compressed(brw, mt));<br>
-         intel_miptree_all_slices_<wbr>resolve_color(brw, mt, 0);<br>
-         brw_render_cache_set_check_<wbr>flush(brw, mt->bo);<br>
-      }<br>
-<br>
-      /* For layered rendering non-compressed fast cleared buffers need to be<br>
-       * resolved. Surface state can carry only one fast color clear value<br>
-       * while each layer may have its own fast clear color value. For<br>
-       * compressed buffers color value is available in the color buffer.<br>
-       */<br>
-      if (irb->layer_count > 1 &&<br>
-          !(irb->mt->aux_disable & INTEL_AUX_DISABLE_CCS) &&<br>
-          !intel_miptree_is_lossless_<wbr>compressed(brw, mt)) {<br>
-         assert(brw->gen >= 8);<br>
-<br>
-         intel_miptree_resolve_color(<wbr>brw, mt, irb->mt_level, 1,<br>
-                                     irb->mt_layer, irb->layer_count, 0);<br>
-      }<br>
+      brw_render_cache_set_check_<wbr>flush(brw, irb->mt->bo);<br></blockquote><div><br></div><div>This brw_render_cache_set_check_flush call is unneeded and is actually the cause of most of the performance regressions in this series.  Making it unconditional meant we flushed the render cache on every draw call.  It's a bit surprising that doing so didn't hurt performance more than it did.  The call was originally added to satisfy the requirements about flushing around resolves.  Now that we do that directly in brw_blorp_resolve_color, we don't need it at all, much less unconditionally.  I've removed this line locally.<br></div><div> </div><blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex">
    }<br>
<br>
    _mesa_lock_context_textures(<wbr>ctx);<br>
diff --git a/src/mesa/drivers/dri/i965/<wbr>brw_draw.c b/src/mesa/drivers/dri/i965/<wbr>brw_draw.c<br>
index 3a1bb50..07f1d48 100644<br>
--- a/src/mesa/drivers/dri/i965/<wbr>brw_draw.c<br>
+++ b/src/mesa/drivers/dri/i965/<wbr>brw_draw.c<br>
@@ -400,8 +400,8 @@ brw_postdraw_set_buffers_need_<wbr>resolve(struct brw_context *brw)<br>
          continue;<br>
<br>
       brw_render_cache_set_add_bo(<wbr>brw, irb->mt->bo);<br>
-      intel_miptree_used_for_<wbr>rendering(<br>
-         brw, irb->mt, irb->mt_level, irb->mt_layer, irb->layer_count);<br>
+      intel_miptree_finish_render(<wbr>brw, irb->mt, irb->mt_level,<br>
+                                  irb->mt_layer, irb->layer_count);<br>
    }<br>
 }<br>
<br>
diff --git a/src/mesa/drivers/dri/i965/<wbr>intel_mipmap_tree.c b/src/mesa/drivers/dri/i965/<wbr>intel_mipmap_tree.c<br>
index 8cf2016..1774ed5 100644<br>
--- a/src/mesa/drivers/dri/i965/<wbr>intel_mipmap_tree.c<br>
+++ b/src/mesa/drivers/dri/i965/<wbr>intel_mipmap_tree.c<br>
@@ -2424,6 +2424,54 @@ intel_miptree_prepare_texture(<wbr>struct brw_context *brw,<br>
       *aux_supported_out = aux_supported;<br>
 }<br>
<br>
+void<br>
+intel_miptree_prepare_render(<wbr>struct brw_context *brw,<br>
+                             struct intel_mipmap_tree *mt, uint32_t level,<br>
+                             uint32_t start_layer, uint32_t layer_count,<br>
+                             bool srgb_enabled)<br>
+{<br>
+   /* If FRAMEBUFFER_SRGB is used on Gen9+ then we need to resolve any of<br>
+    * the single-sampled color renderbuffers because the CCS buffer isn't<br>
+    * supported for SRGB formats. This only matters if FRAMEBUFFER_SRGB is<br>
+    * enabled because otherwise the surface state will be programmed with<br>
+    * the linear equivalent format anyway.<br>
+    */<br>
+   if (brw->gen >= 9 && srgb_enabled && mt->num_samples <= 1 &&<br>
+       _mesa_get_srgb_format_linear(<wbr>mt->format) != mt->format) {<br>
+<br>
+      /* Lossless compression is not supported for SRGB formats, it<br>
+       * should be impossible to get here with such surfaces.<br>
+       */<br>
+      assert(!intel_miptree_is_<wbr>lossless_compressed(brw, mt));<br>
+      intel_miptree_prepare_access(<wbr>brw, mt, level, 1, start_layer, layer_count,<br>
+                                   false, false);<br>
+   }<br>
+<br>
+   /* For layered rendering non-compressed fast cleared buffers need to be<br>
+    * resolved. Surface state can carry only one fast color clear value<br>
+    * while each layer may have its own fast clear color value. For<br>
+    * compressed buffers color value is available in the color buffer.<br>
+    */<br>
+   if (layer_count > 1 &&<br>
+       !(mt->aux_disable & INTEL_AUX_DISABLE_CCS) &&<br>
+       !intel_miptree_is_lossless_<wbr>compressed(brw, mt)) {<br>
+      assert(brw->gen >= 8);<br>
+<br>
+      intel_miptree_prepare_access(<wbr>brw, mt, level, 1, start_layer, layer_count,<br>
+                                   false, false);<br>
+   }<br>
+}<br>
+<br>
+void<br>
+intel_miptree_finish_render(<wbr>struct brw_context *brw,<br>
+                            struct intel_mipmap_tree *mt, uint32_t level,<br>
+                            uint32_t start_layer, uint32_t layer_count)<br>
+{<br>
+   assert(_mesa_is_format_color_<wbr>format(mt->format));<br>
+   intel_miptree_finish_write(<wbr>brw, mt, level, start_layer, layer_count,<br>
+                              mt->mcs_buf);<br>
+}<br>
+<br>
 /**<br>
  * Make it possible to share the BO backing the given miptree with another<br>
  * process or another miptree.<br>
diff --git a/src/mesa/drivers/dri/i965/<wbr>intel_mipmap_tree.h b/src/mesa/drivers/dri/i965/<wbr>intel_mipmap_tree.h<br>
index 61ec895..0392935 100644<br>
--- a/src/mesa/drivers/dri/i965/<wbr>intel_mipmap_tree.h<br>
+++ b/src/mesa/drivers/dri/i965/<wbr>intel_mipmap_tree.h<br>
@@ -1015,6 +1015,15 @@ intel_miptree_prepare_texture(<wbr>struct brw_context *brw,<br>
                               struct intel_mipmap_tree *mt,<br>
                               mesa_format view_format,<br>
                               bool *aux_supported_out);<br>
+void<br>
+intel_miptree_prepare_render(<wbr>struct brw_context *brw,<br>
+                             struct intel_mipmap_tree *mt, uint32_t level,<br>
+                             uint32_t start_layer, uint32_t layer_count,<br>
+                             bool srgb_enabled);<br>
+void<br>
+intel_miptree_finish_render(<wbr>struct brw_context *brw,<br>
+                            struct intel_mipmap_tree *mt, uint32_t level,<br>
+                            uint32_t start_layer, uint32_t layer_count);<br>
<br>
 void<br>
 intel_miptree_make_shareable(<wbr>struct brw_context *brw,<br>
<span class="HOEnZb"><font color="#888888">--<br>
2.5.0.400.gff86faf<br>
<br>
</font></span></blockquote></div><br></div></div>