<div dir="ltr">I'd also like to rename or at least note that this is a scalar-only thing for now... otherwise,<div><br></div><div>Reviewed-by: Connor Abbott <<a href="mailto:cwabbott0@gmail.com">cwabbott0@gmail.com</a>></div></div><div class="gmail_extra"><br><div class="gmail_quote">On Tue, Dec 16, 2014 at 1:11 AM, Jason Ekstrand <span dir="ltr"><<a href="mailto:jason@jlekstrand.net" target="_blank">jason@jlekstrand.net</a>></span> wrote:<br><blockquote class="gmail_quote" style="margin:0 0 0 .8ex;border-left:1px #ccc solid;padding-left:1ex">---<br>
 src/glsl/Makefile.sources   |   1 +<br>
 src/glsl/nir/nir.h          |   2 +<br>
 src/glsl/nir/nir_lower_io.c | 388 ++++++++++++++++++++++++++++++++++++++++++++<br>
 3 files changed, 391 insertions(+)<br>
 create mode 100644 src/glsl/nir/nir_lower_io.c<br>
<br>
diff --git a/src/glsl/Makefile.sources b/src/glsl/Makefile.sources<br>
index 6230f49..53c3e98 100644<br>
--- a/src/glsl/Makefile.sources<br>
+++ b/src/glsl/Makefile.sources<br>
@@ -23,6 +23,7 @@ NIR_FILES = \<br>
        $(GLSL_SRCDIR)/nir/nir_live_variables.c \<br>
        $(GLSL_SRCDIR)/nir/nir_lower_atomics.c \<br>
        $(GLSL_SRCDIR)/nir/nir_lower_locals_to_regs.c \<br>
+       $(GLSL_SRCDIR)/nir/nir_lower_io.c \<br>
        $(GLSL_SRCDIR)/nir/nir_lower_samplers.cpp \<br>
        $(GLSL_SRCDIR)/nir/nir_lower_system_values.c \<br>
        $(GLSL_SRCDIR)/nir/nir_lower_variables.c \<br>
diff --git a/src/glsl/nir/nir.h b/src/glsl/nir/nir.h<br>
index 7d7aec7..ec9ce07 100644<br>
--- a/src/glsl/nir/nir.h<br>
+++ b/src/glsl/nir/nir.h<br>
@@ -1360,6 +1360,8 @@ void nir_split_var_copies(nir_shader *shader);<br>
<br>
 void nir_lower_locals_to_regs(nir_shader *shader);<br>
<br>
+void nir_lower_io(nir_shader *shader);<br>
+<br>
 void nir_lower_variables(nir_shader *shader);<br>
<br>
 void nir_lower_variables_scalar(nir_shader *shader, bool lower_globals,<br>
diff --git a/src/glsl/nir/nir_lower_io.c b/src/glsl/nir/nir_lower_io.c<br>
new file mode 100644<br>
index 0000000..a3b8186<br>
--- /dev/null<br>
+++ b/src/glsl/nir/nir_lower_io.c<br>
@@ -0,0 +1,388 @@<br>
+/*<br>
+ * Copyright © 2014 Intel Corporation<br>
+ *<br>
+ * Permission is hereby granted, free of charge, to any person obtaining a<br>
+ * copy of this software and associated documentation files (the "Software"),<br>
+ * to deal in the Software without restriction, including without limitation<br>
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,<br>
+ * and/or sell copies of the Software, and to permit persons to whom the<br>
+ * Software is furnished to do so, subject to the following conditions:<br>
+ *<br>
+ * The above copyright notice and this permission notice (including the next<br>
+ * paragraph) shall be included in all copies or substantial portions of the<br>
+ * Software.<br>
+ *<br>
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR<br>
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,<br>
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL<br>
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER<br>
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING<br>
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS<br>
+ * IN THE SOFTWARE.<br>
+ *<br>
+ * Authors:<br>
+ *    Connor Abbott (<a href="mailto:cwabbott0@gmail.com">cwabbott0@gmail.com</a>)<br>
+ *    Jason Ekstrand (<a href="mailto:jason@jlekstrand.net">jason@jlekstrand.net</a>)<br>
+ *<br>
+ */<br>
+<br>
+/*<br>
+ * This lowering pass converts references to input/output variables with<br>
+ * loads/stores to actual input/output intrinsics.<br>
+ */<br>
+<br>
+#include "nir.h"<br>
+<br>
+struct lower_io_state {<br>
+   void *mem_ctx;<br>
+};<br>
+<br>
+static unsigned<br>
+type_size(const struct glsl_type *type)<br>
+{<br>
+   unsigned int size, i;<br>
+<br>
+   switch (glsl_get_base_type(type)) {<br>
+   case GLSL_TYPE_UINT:<br>
+   case GLSL_TYPE_INT:<br>
+   case GLSL_TYPE_FLOAT:<br>
+   case GLSL_TYPE_BOOL:<br>
+      return glsl_get_components(type);<br>
+   case GLSL_TYPE_ARRAY:<br>
+      return type_size(glsl_get_array_element(type)) * glsl_get_length(type);<br>
+   case GLSL_TYPE_STRUCT:<br>
+      size = 0;<br>
+      for (i = 0; i < glsl_get_length(type); i++) {<br>
+         size += type_size(glsl_get_struct_field(type, i));<br>
+      }<br>
+      return size;<br>
+   case GLSL_TYPE_SAMPLER:<br>
+      return 0;<br>
+   case GLSL_TYPE_ATOMIC_UINT:<br>
+      return 0;<br>
+   case GLSL_TYPE_INTERFACE:<br>
+      return 0;<br>
+   case GLSL_TYPE_IMAGE:<br>
+      return 0;<br>
+   case GLSL_TYPE_VOID:<br>
+   case GLSL_TYPE_ERROR:<br>
+      unreachable("not reached");<br>
+   }<br>
+<br>
+   return 0;<br>
+}<br>
+<br>
+static void<br>
+assign_var_locations(struct hash_table *ht, unsigned *size)<br>
+{<br>
+   unsigned location = 0;<br>
+<br>
+   struct hash_entry *entry;<br>
+   hash_table_foreach(ht, entry) {<br>
+      nir_variable *var = (nir_variable *) entry->data;<br>
+<br>
+      /*<br>
+       * UBO's have their own address spaces, so don't count them towards the<br>
+       * number of global uniforms<br>
+       */<br>
+      if (var->data.mode == nir_var_uniform && var->interface_type != NULL)<br>
+         continue;<br>
+<br>
+      var->data.driver_location = location;<br>
+      location += type_size(var->type);<br>
+   }<br>
+<br>
+   *size = location;<br>
+}<br>
+<br>
+static void<br>
+assign_var_locations_shader(nir_shader *shader)<br>
+{<br>
+   assign_var_locations(shader->inputs, &shader->num_inputs);<br>
+   assign_var_locations(shader->outputs, &shader->num_outputs);<br>
+   assign_var_locations(shader->uniforms, &shader->num_uniforms);<br>
+}<br>
+<br>
+static bool<br>
+deref_has_indirect(nir_deref_var *deref)<br>
+{<br>
+   for (nir_deref *tail = deref->deref.child; tail; tail = tail->child) {<br>
+      if (tail->deref_type == nir_deref_type_array) {<br>
+         nir_deref_array *arr = nir_deref_as_array(tail);<br>
+         if (arr->deref_array_type == nir_deref_array_type_indirect)<br>
+            return true;<br>
+      }<br>
+   }<br>
+<br>
+   return false;<br>
+}<br>
+<br>
+static unsigned<br>
+get_io_offset(nir_deref_var *deref, nir_instr *instr, nir_src *indirect,<br>
+              struct lower_io_state *state)<br>
+{<br>
+   bool found_indirect = false;<br>
+   unsigned base_offset = 0;<br>
+<br>
+   nir_deref *tail = &deref->deref;<br>
+   while (tail->child != NULL) {<br>
+      const struct glsl_type *parent_type = tail->type;<br>
+      tail = tail->child;<br>
+<br>
+      if (tail->deref_type == nir_deref_type_array) {<br>
+         nir_deref_array *deref_array = nir_deref_as_array(tail);<br>
+         unsigned size = type_size(tail->type);<br>
+<br>
+         base_offset += size * deref_array->base_offset;<br>
+<br>
+         if (deref_array->deref_array_type == nir_deref_array_type_indirect) {<br>
+            nir_load_const_instr *load_const =<br>
+               nir_load_const_instr_create(state->mem_ctx);<br>
+            load_const->num_components = 1;<br>
+            load_const->value.u[0] = size;<br>
+            load_const->dest.is_ssa = true;<br>
+            nir_ssa_def_init(&load_const->instr, &load_const->dest.ssa,<br>
+                             1, NULL);<br>
+            nir_instr_insert_before(instr, &load_const->instr);<br>
+<br>
+            nir_alu_instr *mul = nir_alu_instr_create(state->mem_ctx,<br>
+                                                      nir_op_imul);<br>
+            mul->src[0].src.is_ssa = true;<br>
+            mul->src[0].src.ssa = &load_const->dest.ssa;<br>
+            mul->src[1].src = nir_src_copy(deref_array->indirect,<br>
+                                           state->mem_ctx);<br>
+            mul->dest.write_mask = 1;<br>
+            mul->dest.dest.is_ssa = true;<br>
+            nir_ssa_def_init(&mul->instr, &mul->dest.dest.ssa, 1, NULL);<br>
+            nir_instr_insert_before(instr, &mul->instr);<br>
+<br>
+            if (found_indirect) {<br>
+               nir_alu_instr *add = nir_alu_instr_create(state->mem_ctx,<br>
+                                                         nir_op_iadd);<br>
+               add->src[0].src = *indirect;<br>
+               add->src[1].src.is_ssa = true;<br>
+               add->src[1].src.ssa = &mul->dest.dest.ssa;<br>
+               add->dest.write_mask = 1;<br>
+               add->dest.dest.is_ssa = true;<br>
+               nir_ssa_def_init(&add->instr, &add->dest.dest.ssa, 1, NULL);<br>
+               nir_instr_insert_before(instr, &add->instr);<br>
+<br>
+               indirect->is_ssa = true;<br>
+               indirect->ssa = &add->dest.dest.ssa;<br>
+            } else {<br>
+               indirect->is_ssa = true;<br>
+               indirect->ssa = &mul->dest.dest.ssa;<br>
+               found_indirect = true;<br>
+            }<br>
+         }<br>
+      } else if (tail->deref_type == nir_deref_type_struct) {<br>
+         nir_deref_struct *deref_struct = nir_deref_as_struct(tail);<br>
+<br>
+         for (unsigned i = 0; i < deref_struct->index; i++)<br>
+            base_offset += type_size(glsl_get_struct_field(parent_type, i));<br>
+      }<br>
+   }<br>
+<br>
+   return base_offset;<br>
+}<br>
+<br>
+static nir_intrinsic_op<br>
+get_load_op(nir_variable_mode mode, bool indirect, unsigned num_components)<br>
+{<br>
+   if (indirect) {<br>
+      switch (mode) {<br>
+      case nir_var_shader_in:<br>
+         switch (num_components) {<br>
+         case 1: return nir_intrinsic_load_input_vec1_indirect;<br>
+         case 2: return nir_intrinsic_load_input_vec2_indirect;<br>
+         case 3: return nir_intrinsic_load_input_vec3_indirect;<br>
+         case 4: return nir_intrinsic_load_input_vec4_indirect;<br>
+         default: unreachable("Invalid number of components"); break;<br>
+         }<br>
+         break;<br>
+<br>
+      case nir_var_uniform:<br>
+         switch (num_components) {<br>
+         case 1: return nir_intrinsic_load_uniform_vec1_indirect;<br>
+         case 2: return nir_intrinsic_load_uniform_vec2_indirect;<br>
+         case 3: return nir_intrinsic_load_uniform_vec3_indirect;<br>
+         case 4: return nir_intrinsic_load_uniform_vec4_indirect;<br>
+         default: unreachable("Invalid number of components"); break;<br>
+         }<br>
+         break;<br>
+<br>
+      default:<br>
+         unreachable("Invalid input type");<br>
+         break;<br>
+      }<br>
+   } else {<br>
+      switch (mode) {<br>
+      case nir_var_shader_in:<br>
+         switch (num_components) {<br>
+         case 1: return nir_intrinsic_load_input_vec1;<br>
+         case 2: return nir_intrinsic_load_input_vec2;<br>
+         case 3: return nir_intrinsic_load_input_vec3;<br>
+         case 4: return nir_intrinsic_load_input_vec4;<br>
+         default: unreachable("Invalid number of components"); break;<br>
+         }<br>
+         break;<br>
+<br>
+      case nir_var_uniform:<br>
+         switch (num_components) {<br>
+         case 1: return nir_intrinsic_load_uniform_vec1;<br>
+         case 2: return nir_intrinsic_load_uniform_vec2;<br>
+         case 3: return nir_intrinsic_load_uniform_vec3;<br>
+         case 4: return nir_intrinsic_load_uniform_vec4;<br>
+         default: unreachable("Invalid number of components"); break;<br>
+         }<br>
+         break;<br>
+<br>
+      default:<br>
+         unreachable("Invalid input type");<br>
+         break;<br>
+      }<br>
+   }<br>
+<br>
+   return nir_intrinsic_load_input_vec1;<br>
+}<br>
+<br>
+static bool<br>
+nir_lower_io_block(nir_block *block, void *void_state)<br>
+{<br>
+   struct lower_io_state *state = void_state;<br>
+<br>
+   nir_foreach_instr_safe(block, instr) {<br>
+      if (instr->type != nir_instr_type_intrinsic)<br>
+         continue;<br>
+<br>
+      nir_intrinsic_instr *intrin = nir_instr_as_intrinsic(instr);<br>
+<br>
+      switch (intrin->intrinsic) {<br>
+      case nir_intrinsic_load_var_vec1:<br>
+      case nir_intrinsic_load_var_vec2:<br>
+      case nir_intrinsic_load_var_vec3:<br>
+      case nir_intrinsic_load_var_vec4: {<br>
+         nir_variable_mode mode = intrin->variables[0]->var->data.mode;<br>
+         if (mode != nir_var_shader_in && mode != nir_var_uniform)<br>
+            continue;<br>
+<br>
+         bool has_indirect = deref_has_indirect(intrin->variables[0]);<br>
+         unsigned num_components =<br>
+            nir_intrinsic_infos[intrin->intrinsic].dest_components;<br>
+<br>
+         nir_intrinsic_op load_op = get_load_op(mode, has_indirect,<br>
+                                                num_components);<br>
+         nir_intrinsic_instr *load = nir_intrinsic_instr_create(state->mem_ctx,<br>
+                                                                load_op);<br>
+<br>
+         nir_src indirect;<br>
+         unsigned offset = get_io_offset(intrin->variables[0],<br>
+                                         &intrin->instr, &indirect, state);<br>
+         offset += intrin->variables[0]->var->data.driver_location;<br>
+<br>
+         load->const_index[0] = offset;<br>
+         load->const_index[1] = 1;<br>
+<br>
+         if (has_indirect)<br>
+            load->src[0] = indirect;<br>
+<br>
+         if (intrin->dest.is_ssa) {<br>
+            load->dest.is_ssa = true;<br>
+            nir_ssa_def_init(&load->instr, &load->dest.ssa,<br>
+                             num_components, NULL);<br>
+<br>
+            nir_src new_src = {<br>
+               .is_ssa = true,<br>
+               .ssa = &load->dest.ssa,<br>
+            };<br>
+<br>
+            nir_ssa_def_rewrite_uses(&intrin->dest.ssa, new_src,<br>
+                                     state->mem_ctx);<br>
+         } else {<br>
+            load->dest = nir_dest_copy(intrin->dest, state->mem_ctx);<br>
+         }<br>
+<br>
+         nir_instr_insert_before(&intrin->instr, &load->instr);<br>
+         nir_instr_remove(&intrin->instr);<br>
+         break;<br>
+      }<br>
+<br>
+      case nir_intrinsic_store_var_vec1:<br>
+      case nir_intrinsic_store_var_vec2:<br>
+      case nir_intrinsic_store_var_vec3:<br>
+      case nir_intrinsic_store_var_vec4: {<br>
+         if (intrin->variables[0]->var->data.mode != nir_var_shader_out)<br>
+            continue;<br>
+<br>
+         bool has_indirect = deref_has_indirect(intrin->variables[0]);<br>
+         unsigned num_components =<br>
+            nir_intrinsic_infos[intrin->intrinsic].src_components[0];<br>
+<br>
+         nir_intrinsic_op store_op;<br>
+         if (has_indirect) {<br>
+            switch (num_components) {<br>
+            case 1: store_op = nir_intrinsic_store_output_vec1_indirect; break;<br>
+            case 2: store_op = nir_intrinsic_store_output_vec2_indirect; break;<br>
+            case 3: store_op = nir_intrinsic_store_output_vec3_indirect; break;<br>
+            case 4: store_op = nir_intrinsic_store_output_vec4_indirect; break;<br>
+            default: unreachable("Invalid number of components"); break;<br>
+            }<br>
+         } else {<br>
+            switch (num_components) {<br>
+            case 1: store_op = nir_intrinsic_store_output_vec1; break;<br>
+            case 2: store_op = nir_intrinsic_store_output_vec2; break;<br>
+            case 3: store_op = nir_intrinsic_store_output_vec3; break;<br>
+            case 4: store_op = nir_intrinsic_store_output_vec4; break;<br>
+            default: unreachable("Invalid number of components"); break;<br>
+            }<br>
+         }<br>
+<br>
+         nir_intrinsic_instr *store = nir_intrinsic_instr_create(state->mem_ctx,<br>
+                                                                 store_op);<br>
+<br>
+         nir_src indirect;<br>
+         unsigned offset = get_io_offset(intrin->variables[0],<br>
+                                         &intrin->instr, &indirect, state);<br>
+         offset += intrin->variables[0]->var->data.driver_location;<br>
+<br>
+         store->const_index[0] = offset;<br>
+         store->const_index[1] = 1;<br>
+<br>
+         store->src[0] = nir_src_copy(intrin->src[0], state->mem_ctx);<br>
+<br>
+         if (has_indirect)<br>
+            store->src[1] = indirect;<br>
+<br>
+         nir_instr_insert_before(&intrin->instr, &store->instr);<br>
+         nir_instr_remove(&intrin->instr);<br>
+         break;<br>
+      }<br>
+<br>
+      default:<br>
+         break;<br>
+      }<br>
+   }<br>
+<br>
+   return true;<br>
+}<br>
+<br>
+static void<br>
+nir_lower_io_impl(nir_function_impl *impl)<br>
+{<br>
+   struct lower_io_state state;<br>
+<br>
+   state.mem_ctx = ralloc_parent(impl);<br>
+<br>
+   nir_foreach_block(impl, nir_lower_io_block, &state);<br>
+}<br>
+<br>
+void<br>
+nir_lower_io(nir_shader *shader)<br>
+{<br>
+   assign_var_locations_shader(shader);<br>
+<br>
+   nir_foreach_overload(shader, overload) {<br>
+      if (overload->impl)<br>
+         nir_lower_io_impl(overload->impl);<br>
+   }<br>
+}<br>
<span class="HOEnZb"><font color="#888888">--<br>
2.2.0<br>
<br>
_______________________________________________<br>
mesa-dev mailing list<br>
<a href="mailto:mesa-dev@lists.freedesktop.org">mesa-dev@lists.freedesktop.org</a><br>
<a href="http://lists.freedesktop.org/mailman/listinfo/mesa-dev" target="_blank">http://lists.freedesktop.org/mailman/listinfo/mesa-dev</a><br>
</font></span></blockquote></div><br></div>