<div dir="ltr"><div class="gmail_extra"><div class="gmail_quote">On Fri, Jun 29, 2018 at 9:56 PM, Timothy Arceri <span dir="ltr"><<a href="mailto:tarceri@itsqueeze.com" target="_blank">tarceri@itsqueeze.com</a>></span> wrote:<br><blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex"><div class="HOEnZb"><div class="h5">On 30/06/18 10:13, Jason Ekstrand wrote:<br>
<blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex">
This pass searches for reasonably large local variables which can be<br>
statically proven to be constant and moves them into shader constant<br>
data.  This is especially useful when large tables are baked into the<br>
shader source code because they can be moved into a UBO by the driver to<br>
reduce register pressure and make indirect access cheaper.<br>
<br>
v2 (Jason Ekstrand):<br>
  - Use a size/align function to ensure we get the right alignments<br>
  - Use the newly added deref offset helpers<br>
---<br>
  src/compiler/Makefile.sources              |   1 +<br>
  src/compiler/nir/meson.build               |   1 +<br>
  src/compiler/nir/nir.h                     |   4 +<br>
  src/compiler/nir/nir_opt_large<wbr>_constants.c | 301 +++++++++++++++++++++<br>
  4 files changed, 307 insertions(+)<br>
  create mode 100644 src/compiler/nir/nir_opt_large<wbr>_constants.c<br>
<br>
diff --git a/src/compiler/Makefile.source<wbr>s b/src/compiler/Makefile.source<wbr>s<br>
index 0fcbc5c5c5b..9e3fbdc2612 100644<br>
--- a/src/compiler/Makefile.source<wbr>s<br>
+++ b/src/compiler/Makefile.source<wbr>s<br>
@@ -276,6 +276,7 @@ NIR_FILES = \<br>
        nir/nir_opt_if.c \<br>
        nir/nir_opt_intrinsics.c \<br>
        nir/nir_opt_loop_unroll.c \<br>
+       nir/nir_opt_large_constants.c \<br>
        nir/nir_opt_move_comparisons.c \<br>
        nir/nir_opt_move_load_ubo.c \<br>
        nir/nir_opt_peephole_select.c \<br>
diff --git a/src/compiler/nir/meson.build b/src/compiler/nir/meson.build<br>
index eb7fb7b121e..28aa8de7014 100644<br>
--- a/src/compiler/nir/meson.build<br>
+++ b/src/compiler/nir/meson.build<br>
@@ -160,6 +160,7 @@ files_libnir = files(<br>
    'nir_opt_global_to_local.c',<br>
    'nir_opt_if.c',<br>
    'nir_opt_intrinsics.c',<br>
+  'nir_opt_large_constants.c',<br>
    'nir_opt_loop_unroll.c',<br>
    'nir_opt_move_comparisons.c',<br>
    'nir_opt_move_load_ubo.c',<br>
diff --git a/src/compiler/nir/nir.h b/src/compiler/nir/nir.h<br>
index cc5f88d6f54..92ab3a699cc 100644<br>
--- a/src/compiler/nir/nir.h<br>
+++ b/src/compiler/nir/nir.h<br>
@@ -2905,6 +2905,10 @@ bool nir_opt_if(nir_shader *shader);<br>
    bool nir_opt_intrinsics(nir_shader *shader);<br>
  +bool nir_opt_large_constants(nir_sh<wbr>ader *shader,<br>
+                             glsl_type_size_align_func size_align,<br>
+                             unsigned threshold);<br>
+<br>
  bool nir_opt_loop_unroll(nir_shader *shader, nir_variable_mode indirect_mask);<br>
    bool nir_opt_move_comparisons(nir_s<wbr>hader *shader);<br>
diff --git a/src/compiler/nir/nir_opt_lar<wbr>ge_constants.c b/src/compiler/nir/nir_opt_lar<wbr>ge_constants.c<br>
new file mode 100644<br>
index 00000000000..027c6e8e5b5<br>
--- /dev/null<br>
+++ b/src/compiler/nir/nir_opt_lar<wbr>ge_constants.c<br>
@@ -0,0 +1,301 @@<br>
+/*<br>
+ * Copyright © 2018 Intel Corporation<br>
+ *<br>
+ * Permission is hereby granted, free of charge, to any person obtaining a<br>
+ * copy of this software and associated documentation files (the "Software"),<br>
+ * to deal in the Software without restriction, including without limitation<br>
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,<br>
+ * and/or sell copies of the Software, and to permit persons to whom the<br>
+ * Software is furnished to do so, subject to the following conditions:<br>
+ *<br>
+ * The above copyright notice and this permission notice (including the next<br>
+ * paragraph) shall be included in all copies or substantial portions of the<br>
+ * Software.<br>
+ *<br>
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR<br>
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,<br>
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL<br>
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER<br>
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING<br>
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS<br>
+ * IN THE SOFTWARE.<br>
+ */<br>
+<br>
+#include "nir.h"<br>
+#include "nir_builder.h"<br>
+#include "nir_deref.h"<br>
+<br>
+struct var_info {<br>
+   bool is_constant;<br>
+   bool found_read;<br>
+};<br>
+<br>
+static nir_ssa_def *<br>
+build_constant_load(nir_build<wbr>er *b, nir_deref_instr *deref,<br>
+                    glsl_type_size_align_func size_align)<br>
+{<br>
+   nir_variable *var = nir_deref_instr_get_variable(d<wbr>eref);<br>
+<br>
+   const unsigned bit_size = glsl_get_bit_size(deref->type)<wbr>;<br>
+   const unsigned num_components = glsl_get_vector_elements(deref<wbr>->type);<br>
+<br>
+   UNUSED unsigned var_size, var_align;<br>
+   size_align(var->type, &var_size, &var_align);<br>
+   assert(var->data.location % var_align == 0);<br>
+<br>
+   nir_intrinsic_instr *load =<br>
+      nir_intrinsic_instr_create(b-><wbr>shader, nir_intrinsic_load_constant);<br>
+   load->num_components = num_components;<br>
+   nir_intrinsic_set_base(load, var->data.location);<br>
+   nir_intrinsic_set_range(load, var_size);<br>
+   load->src[0] = nir_src_for_ssa(nir_build_dere<wbr>f_offset(b, deref, size_align));<br>
+   nir_ssa_dest_init(&load->inst<wbr>r, &load->dest,<br>
+                     num_components, bit_size, NULL);<br>
+   nir_builder_instr_insert(b, &load->instr);<br>
+<br>
+   return &load->dest.ssa;<br>
+}<br>
+<br>
+static void<br>
+handle_constant_store(nir_bui<wbr>lder *b, nir_intrinsic_instr *store,<br>
+                      glsl_type_size_align_func size_align)<br>
+{<br>
+   nir_deref_instr *deref = nir_src_as_deref(store->src[0]<wbr>);<br>
+   assert(!nir_deref_instr_has_i<wbr>ndirect(deref));<br>
+<br>
+   nir_variable *var = nir_deref_instr_get_variable(d<wbr>eref);<br>
+<br>
+   const unsigned bit_size = glsl_get_bit_size(deref->type)<wbr>;<br>
+   const unsigned num_components = glsl_get_vector_elements(deref<wbr>->type);<br>
+<br>
+   char *dst = (char *)b->shader->constant_data +<br>
+               var->data.location +<br>
+               nir_deref_instr_get_const_off<wbr>set(deref, size_align);<br>
+<br>
+   nir_const_value *val = nir_src_as_const_value(store-><wbr>src[1]);<br>
+   switch (bit_size) {<br>
+   case 8:<br>
+      for (unsigned i = 0; i < num_components; i++)<br>
+         ((uint8_t *)dst)[i] = val->u8[i];<br>
+      break;<br>
+<br>
+   case 16:<br>
+      for (unsigned i = 0; i < num_components; i++)<br>
+         ((uint16_t *)dst)[i] = val->u16[i];<br>
+      break;<br>
+<br>
+   case 32:<br>
+      for (unsigned i = 0; i < num_components; i++)<br>
+         ((uint32_t *)dst)[i] = val->u32[i];<br>
+      break;<br>
+<br>
+   case 64:<br>
+      for (unsigned i = 0; i < num_components; i++)<br>
+         ((uint64_t *)dst)[i] = val->u64[i];<br>
+      break;<br>
+<br>
+   default:<br>
+      unreachable("Invalid bit size");<br>
+   }<br>
+}<br>
+<br>
+/** Lower large constant variables to shader constant data<br>
+ *<br>
+ * This pass looks for large (type_size(var->type) > threshold) variables<br>
+ * which are statically constant and moves them into shader constant data.<br>
+ * This is especially useful when large tables are baked into the shader<br>
+ * source code because they can be moved into a UBO by the driver to reduce<br>
+ * register pressure and make indirect access cheaper.<br>
+ */<br>
+bool<br>
+nir_opt_large_constants(nir_s<wbr>hader *shader,<br>
+                        glsl_type_size_align_func size_align,<br>
+                        unsigned threshold)<br>
+{<br>
+   /* Default to a natural alignment if none is provided */<br>
+   if (size_align == NULL)<br>
+      size_align = glsl_get_natural_size_align_by<wbr>tes;<br>
+<br>
+   /* This only works with a single entrypoint */<br>
+   nir_function_impl *impl = nir_shader_get_entrypoint(shad<wbr>er);<br>
+<br>
+   /* This pass can only be run once */<br>
+   assert(shader->constant_data == NULL && shader->constant_data_size == 0);<br>
+<br>
+   /* The index parameter is unused for local variables so we'll use it for<br>
+    * indexing into our array of variable metadata.<br>
+    */<br>
+   unsigned num_locals = 0;<br>
+   nir_foreach_variable(var, &impl->locals)<br>
+      var->data.index = num_locals++;<br>
+<br>
+   struct var_info *var_infos = malloc(num_locals * sizeof(struct var_info));<br>
+   for (unsigned i = 0; i < num_locals; i++) {<br>
+      var_infos[i] = (struct var_info) {<br>
+         .is_constant = true,<br>
+         .found_read = false,<br>
+      };<br>
+   }<br>
+<br>
+   /* First, walk through the shader and figure out what variables we can<br>
+    * lower to the constant blob.<br>
+    */<br>
+   bool first_block = true;<br>
+   nir_foreach_block(block, impl) {<br>
+      nir_foreach_instr(instr, block) {<br>
+         if (instr->type != nir_instr_type_intrinsic)<br>
+            continue;<br>
+<br>
+         nir_intrinsic_instr *intrin = nir_instr_as_intrinsic(instr);<br>
+<br>
+         bool src_is_const = false;<br>
+         nir_deref_instr *src_deref = NULL, *dst_deref = NULL;<br>
+         switch (intrin->intrinsic) {<br>
+         case nir_intrinsic_store_deref:<br>
+            dst_deref = nir_src_as_deref(intrin->src[0<wbr>]);<br>
+            src_is_const = nir_src_as_const_value(intrin-<wbr>>src[1]);<br>
+            break;<br>
+<br>
+         case nir_intrinsic_load_deref:<br>
+            src_deref = nir_src_as_deref(intrin->src[0<wbr>]);<br>
+            break;<br>
+<br>
+         case nir_intrinsic_copy_deref:<br>
</blockquote>
<br></div></div>
Can we add a comment here? Something like:<br>
<br>
/* We always assume the src and therefore the dst are not constants<br>
 * here. Copy and constant propagation passes should have taken<br>
 * care of this in most cases anyway.<br>
 */<br>
<br>
Does that sound correct?<br></blockquote><div><br></div><div>Sounds fine with me.<br></div><div> </div><blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex">
Otherwise this series is:<br>
<br>
Reviewed-by: Timothy Arceri <<a href="mailto:tarceri@itsqueeze.com" target="_blank">tarceri@itsqueeze.com</a>><br></blockquote><div><br></div><div>Thanks!</div><div><br></div><div>--Jason<br></div><div> </div><blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex">
Although I don't know the code in patch 8 very well, so maybe someone else might want to take a look over that.<div class="HOEnZb"><div class="h5"><br>
<br>
<blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex">
+            dst_deref = nir_src_as_deref(intrin->src[0<wbr>]);<br>
+            src_deref = nir_src_as_deref(intrin->src[1<wbr>]);<br>
+            src_is_const = false;<br>
+            break;<br>
+<br>
+         default:<br>
+            continue;<br>
+         }<br>
+<br>
+         if (dst_deref && dst_deref->mode == nir_var_local) {<br>
+            nir_variable *var = nir_deref_instr_get_variable(d<wbr>st_deref);<br>
+            assert(var->data.mode == nir_var_local);<br>
+<br>
+            /* We only consider variables constant if they only have constant<br>
+             * stores, all the stores come before any reads, and all stores<br>
+             * come in the first block.  We also can't handle indirect stores.<br>
+             */<br>
+            struct var_info *info = &var_infos[var->data.index];<br>
+            if (!src_is_const || info->found_read || !first_block ||<br>
+                nir_deref_instr_has_indirect(d<wbr>st_deref))<br>
+               info->is_constant = false;<br>
+         }<br>
+<br>
+         if (src_deref && src_deref->mode == nir_var_local) {<br>
+            nir_variable *var = nir_deref_instr_get_variable(s<wbr>rc_deref);<br>
+            assert(var->data.mode == nir_var_local);<br>
+<br>
+            var_infos[var->data.index].fou<wbr>nd_read = true;<br>
+         }<br>
+      }<br>
+      first_block = false;<br>
+   }<br>
+<br>
+   shader->constant_data_size = 0;<br>
+   nir_foreach_variable(var, &impl->locals) {<br>
+      struct var_info *info = &var_infos[var->data.index];<br>
+      if (!info->is_constant)<br>
+         continue;<br>
+<br>
+      unsigned var_size, var_align;<br>
+      size_align(var->type, &var_size, &var_align);<br>
+      if (var_size <= threshold || !info->found_read) {<br>
+         /* Don't bother lowering small stuff or data that's never read */<br>
+         info->is_constant = false;<br>
+         continue;<br>
+      }<br>
+<br>
+      var->data.location = ALIGN_POT(shader->constant_dat<wbr>a_size, var_align);<br>
+      shader->constant_data_size = var->data.location + var_size;<br>
+   }<br>
+<br>
+   if (shader->constant_data_size == 0) {<br>
+      free(var_infos);<br>
+      return false;<br>
+   }<br>
+<br>
+   shader->constant_data = rzalloc_size(shader, shader->constant_data_size);<br>
+<br>
+   nir_builder b;<br>
+   nir_builder_init(&b, impl);<br>
+<br>
+   nir_foreach_block(block, impl) {<br>
+      nir_foreach_instr_safe(instr, block) {<br>
+         if (instr->type != nir_instr_type_intrinsic)<br>
+            continue;<br>
+<br>
+         nir_intrinsic_instr *intrin = nir_instr_as_intrinsic(instr);<br>
+<br>
+         switch (intrin->intrinsic) {<br>
+         case nir_intrinsic_load_deref: {<br>
+            nir_deref_instr *deref = nir_src_as_deref(intrin->src[0<wbr>]);<br>
+            if (deref->mode != nir_var_local)<br>
+               continue;<br>
+<br>
+            nir_variable *var = nir_deref_instr_get_variable(d<wbr>eref);<br>
+            struct var_info *info = &var_infos[var->data.index];<br>
+            if (info->is_constant) {<br>
+               b.cursor = nir_after_instr(&intrin->instr<wbr>);<br>
+               nir_ssa_def *val = build_constant_load(&b, deref, size_align);<br>
+               nir_ssa_def_rewrite_uses(&int<wbr>rin->dest.ssa,<br>
+                                        nir_src_for_ssa(val));<br>
+               nir_instr_remove(&intrin->ins<wbr>tr);<br>
+               nir_deref_instr_remove_if_unu<wbr>sed(deref);<br>
+            }<br>
+            break;<br>
+         }<br>
+<br>
+         case nir_intrinsic_store_deref: {<br>
+            nir_deref_instr *deref = nir_src_as_deref(intrin->src[0<wbr>]);<br>
+            if (deref->mode != nir_var_local)<br>
+               continue;<br>
+<br>
+            nir_variable *var = nir_deref_instr_get_variable(d<wbr>eref);<br>
+            struct var_info *info = &var_infos[var->data.index];<br>
+            if (info->is_constant) {<br>
+               b.cursor = nir_after_instr(&intrin->instr<wbr>);<br>
+               handle_constant_store(&b, intrin, size_align);<br>
+               nir_instr_remove(&intrin->ins<wbr>tr);<br>
+               nir_deref_instr_remove_if_unu<wbr>sed(deref);<br>
+            }<br>
+            break;<br>
+         }<br>
+<br>
+         case nir_intrinsic_copy_deref: {<br>
+            nir_deref_instr *deref = nir_src_as_deref(intrin->src[1<wbr>]);<br>
+            if (deref->mode != nir_var_local)<br>
+               continue;<br>
+<br>
+            nir_variable *var = nir_deref_instr_get_variable(d<wbr>eref);<br>
+            struct var_info *info = &var_infos[var->data.index];<br>
+            if (info->is_constant) {<br>
+               b.cursor = nir_after_instr(&intrin->instr<wbr>);<br>
+               nir_ssa_def *val = build_constant_load(&b, deref, size_align);<br>
+               nir_store_deref(&b, nir_src_as_deref(intrin->src[0<wbr>]), val, ~0);<br>
+               nir_instr_remove(&intrin->ins<wbr>tr);<br>
+               nir_deref_instr_remove_if_unu<wbr>sed(deref);<br>
+            }<br>
+            break;<br>
+         }<br>
+<br>
+         default:<br>
+            continue;<br>
+         }<br>
+      }<br>
+   }<br>
+<br>
+   /* Clean up the now unused variables */<br>
+   nir_foreach_variable_safe(<wbr>var, &impl->locals) {<br>
+      if (var_infos[var->data.index].is<wbr>_constant)<br>
+         exec_node_remove(&var->node);<br>
+   }<br>
+<br>
+   free(var_infos);<br>
+<br>
+   nir_metadata_preserve(impl, nir_metadata_block_index |<br>
+                               nir_metadata_dominance);<br>
+   return true;<br>
+}<br>
<br>
</blockquote>
</div></div></blockquote></div><br></div></div>