[Mesa-dev] [PATCH v2 13/18] RFC: nir/vtn: "raw" pointer support

Karol Herbst kherbst at redhat.com
Thu Mar 8 15:25:59 UTC 2018


From: Rob Clark <robdclark at gmail.com>

An attempt to add physical pointer support to vtn.  I'm not totally
happy about the handling of logical pointers vs physical pointers.
So this is really more of an RFS (request for suggestions)

v2: treat vec3 types as vec4 when dereferencing

Signed-off-by: Karol Herbst <kherbst at redhat.com>
---
 src/compiler/spirv/spirv_to_nir.c  |  77 ++++++++++----
 src/compiler/spirv/vtn_private.h   |  19 +++-
 src/compiler/spirv/vtn_variables.c | 208 +++++++++++++++++++++++++++++++++----
 3 files changed, 264 insertions(+), 40 deletions(-)

diff --git a/src/compiler/spirv/spirv_to_nir.c b/src/compiler/spirv/spirv_to_nir.c
index 2e74e634eb..74c7031d47 100644
--- a/src/compiler/spirv/spirv_to_nir.c
+++ b/src/compiler/spirv/spirv_to_nir.c
@@ -573,6 +573,7 @@ vtn_types_compatible(struct vtn_builder *b,
              vtn_types_compatible(b, t1->array_element, t2->array_element);
 
    case vtn_base_type_pointer:
+   case vtn_base_type_raw_pointer:
       return vtn_types_compatible(b, t1->deref, t2->deref);
 
    case vtn_base_type_struct:
@@ -610,6 +611,7 @@ vtn_type_copy(struct vtn_builder *b, struct vtn_type *src)
    case vtn_base_type_matrix:
    case vtn_base_type_array:
    case vtn_base_type_pointer:
+   case vtn_base_type_raw_pointer:
    case vtn_base_type_image:
    case vtn_base_type_sampler:
    case vtn_base_type_sampled_image:
@@ -933,6 +935,14 @@ vtn_type_layout_std430(struct vtn_builder *b, struct vtn_type *type,
       return type;
    }
 
+   case vtn_base_type_raw_pointer: {
+      uint32_t comp_size = b->ptr_size / 8;
+      vtn_assert(comp_size);
+      *size_out = comp_size;
+      *align_out = comp_size;
+      return type;
+   }
+
    case vtn_base_type_vector: {
       uint32_t comp_size = glsl_get_bit_size(type->type) / 8;
       assert(type->length > 0 && type->length <= 4);
@@ -1055,6 +1065,10 @@ vtn_handle_type(struct vtn_builder *b, SpvOp opcode,
       val->type->type = glsl_vector_type(glsl_get_base_type(base->type), elems);
       val->type->length = elems;
       val->type->stride = glsl_get_bit_size(base->type) / 8;
+      /* special case: vec3 is aligned to vec4 */
+      if (elems == 3)
+         elems = 4;
+      val->type->stride *= elems;
       val->type->array_element = base;
       break;
    }
@@ -1160,27 +1174,46 @@ vtn_handle_type(struct vtn_builder *b, SpvOp opcode,
       val->type->storage_class = storage_class;
       val->type->deref = deref_type;
 
-      if (storage_class == SpvStorageClassUniform ||
-          storage_class == SpvStorageClassStorageBuffer) {
-         /* These can actually be stored to nir_variables and used as SSA
-          * values so they need a real glsl_type.
-          */
-         val->type->type = glsl_vector_type(GLSL_TYPE_UINT, 2);
-      }
-
-      if (storage_class == SpvStorageClassWorkgroup &&
-          b->options->lower_workgroup_access_to_offsets) {
+      // XXX handling the "fake" glsl pointers vs "raw" pointers in kernel
+      // is a bit ugly..  need to understand how "pointers" are used in vk
+      // and figure out something better
+      if (storage_class == SpvStorageClassFunction || !b->kernel_mode) {
+         if (storage_class == SpvStorageClassUniform ||
+             storage_class == SpvStorageClassStorageBuffer) {
+            /* These can actually be stored to nir_variables and used as SSA
+             * values so they need a real glsl_type.
+             */
+            val->type->type = glsl_vector_type(GLSL_TYPE_UINT, 2);
+         } else if (storage_class == SpvStorageClassWorkgroup &&
+                    b->options->lower_workgroup_access_to_offsets) {
+            uint32_t size, align;
+            val->type->deref = vtn_type_layout_std430(b, val->type->deref,
+                                                      &size, &align);
+            val->type->length = size;
+            val->type->align = align;
+            /* These can actually be stored to nir_variables and used as SSA
+             * values so they need a real glsl_type.
+             */
+            val->type->type = glsl_uint_type();
+         }
+      } else {
+         vtn_assert(storage_class == SpvStorageClassCrossWorkgroup ||
+                    storage_class == SpvStorageClassInput);
          uint32_t size, align;
+         if (b->ptr_size == 64) {
+            val->type->type = glsl_uint64_t_type();
+         } else {
+            val->type->type = glsl_uint_type();
+         }
+         val->type->base_type = vtn_base_type_raw_pointer;
+         /* pointers can be accessed as array, so set the stride as size: */
          val->type->deref = vtn_type_layout_std430(b, val->type->deref,
                                                    &size, &align);
-         val->type->length = size;
+#define ALIGN(_v, _d) (((_v) + ((_d) - 1)) & ~((_d) - 1))
+         val->type->stride = ALIGN(size, align);
          val->type->align = align;
-         /* These can actually be stored to nir_variables and used as SSA
-          * values so they need a real glsl_type.
-          */
-         val->type->type = glsl_uint_type();
+         break;
       }
-      break;
    }
 
    case SpvOpTypeImage: {
@@ -3375,9 +3408,16 @@ vtn_handle_preamble_instruction(struct vtn_builder *b, SpvOp opcode,
       break;
 
    case SpvOpMemoryModel:
-      vtn_assert(w[1] == SpvAddressingModelLogical);
+      vtn_assert(w[1] == SpvAddressingModelLogical ||
+                 w[1] == SpvAddressingModelPhysical32 ||
+                 w[1] == SpvAddressingModelPhysical64);
       vtn_assert(w[2] == SpvMemoryModelSimple ||
-                 w[2] == SpvMemoryModelGLSL450);
+                 w[2] == SpvMemoryModelGLSL450 ||
+                 w[2] == SpvMemoryModelOpenCL);
+      if (w[1] == SpvAddressingModelPhysical32)
+         b->ptr_size = 32;
+      else if (w[1] == SpvAddressingModelPhysical64)
+         b->ptr_size = 64;
       break;
 
    case SpvOpEntryPoint: {
@@ -3764,6 +3804,7 @@ vtn_handle_body_instruction(struct vtn_builder *b, SpvOp opcode,
          sel_type = glsl_vector_type(GLSL_TYPE_BOOL, res_val->type->length);
          break;
       case vtn_base_type_pointer:
+      case vtn_base_type_raw_pointer:
          /* We need to have actual storage for pointer types */
          vtn_fail_if(res_val->type->type == NULL,
                      "Invalid pointer result type for OpSelect");
diff --git a/src/compiler/spirv/vtn_private.h b/src/compiler/spirv/vtn_private.h
index 6041d45d00..9776274225 100644
--- a/src/compiler/spirv/vtn_private.h
+++ b/src/compiler/spirv/vtn_private.h
@@ -262,7 +262,8 @@ enum vtn_base_type {
    vtn_base_type_matrix,
    vtn_base_type_array,
    vtn_base_type_struct,
-   vtn_base_type_pointer,
+   vtn_base_type_pointer,         /* a logical pointer */
+   vtn_base_type_raw_pointer,     /* a physical pointer */
    vtn_base_type_image,
    vtn_base_type_sampler,
    vtn_base_type_sampled_image,
@@ -406,6 +407,7 @@ enum vtn_variable_mode {
    vtn_variable_mode_image,
    vtn_variable_mode_sampler,
    vtn_variable_mode_workgroup,
+   vtn_variable_mode_cross_workgroup,
    vtn_variable_mode_input,
    vtn_variable_mode_output,
 };
@@ -581,6 +583,13 @@ struct vtn_builder {
 
    bool has_loop_continue;
 
+   /* pointer size is:
+    *   AddressingModelLogical:    0    (default)
+    *   AddressingModelPhysical32: 32
+    *   AddressingModelPhysical64: 64
+    */
+   unsigned ptr_size;
+
    bool kernel_mode;
 };
 
@@ -617,7 +626,8 @@ vtn_push_ssa(struct vtn_builder *b, uint32_t value_id,
              struct vtn_type *type, struct vtn_ssa_value *ssa)
 {
    struct vtn_value *val;
-   if (type->base_type == vtn_base_type_pointer) {
+   if (type->base_type == vtn_base_type_pointer ||
+       type->base_type == vtn_base_type_raw_pointer) {
       val = vtn_push_value(b, value_id, vtn_value_type_pointer);
       val->pointer = vtn_pointer_from_ssa(b, ssa->def, type);
    } else {
@@ -681,6 +691,11 @@ struct vtn_ssa_value *vtn_local_load(struct vtn_builder *b, nir_deref_var *src);
 void vtn_local_store(struct vtn_builder *b, struct vtn_ssa_value *src,
                      nir_deref_var *dest);
 
+struct vtn_ssa_value *vtn_pointer_load(struct vtn_builder *b,
+                                       struct vtn_pointer *ptr);
+void vtn_pointer_store(struct vtn_builder *b, struct vtn_ssa_value *src,
+                       struct vtn_pointer *ptr);
+
 struct vtn_ssa_value *
 vtn_variable_load(struct vtn_builder *b, struct vtn_pointer *src);
 
diff --git a/src/compiler/spirv/vtn_variables.c b/src/compiler/spirv/vtn_variables.c
index f0e876806c..91291c8a62 100644
--- a/src/compiler/spirv/vtn_variables.c
+++ b/src/compiler/spirv/vtn_variables.c
@@ -207,6 +207,12 @@ vtn_ssa_offset_pointer_dereference(struct vtn_builder *b,
             /* You can't have a zero-length OpPtrAccessChain */
             vtn_assert(deref_chain->length >= 1);
             desc_arr_idx = vtn_access_link_as_ssa(b, deref_chain->link[0], 1);
+         } else if (!glsl_type_is_struct(type->type)) {
+            /* if we have something that is ptr to simple type, like an
+             * int ptr, then just treat that like an array of length 1,
+             * we just want to deref the zero'th element:
+             */
+            desc_arr_idx = nir_imm_int(&b->nb, 0);
          } else {
             /* We have a regular non-array SSBO. */
             desc_arr_idx = NULL;
@@ -304,7 +310,9 @@ vtn_ssa_offset_pointer_dereference(struct vtn_builder *b,
       case GLSL_TYPE_FLOAT:
       case GLSL_TYPE_FLOAT16:
       case GLSL_TYPE_DOUBLE:
-      case GLSL_TYPE_BOOL:
+      case GLSL_TYPE_BOOL: {
+         break;
+      }
       case GLSL_TYPE_ARRAY: {
          nir_ssa_def *elem_offset =
             vtn_access_link_as_ssa(b, deref_chain->link[idx], type->stride);
@@ -336,6 +344,80 @@ vtn_ssa_offset_pointer_dereference(struct vtn_builder *b,
    return ptr;
 }
 
+static struct vtn_pointer *
+vtn_ssa_raw_pointer_dereference(struct vtn_builder *b,
+                                struct vtn_pointer *base,
+                                struct vtn_access_chain *deref_chain)
+{
+   nir_ssa_def *offset = nir_imm_int(&b->nb, 0);
+   struct vtn_type *type = base->ptr_type;
+
+
+   vtn_assert(type);
+
+   /* TODO this can probably be refactored out into helper?  Nearly
+    * the same as in vtn_ssa_offset_pointer_dereference() and perhaps
+    * elsewhere..
+    *
+    * Note that the type here in the switch is of what the pointer
+    * points to, ie. if the base type is uint, we are dereferencing
+    * (possibly as an array) a uint* pointer.
+    */
+   for (unsigned idx = 0; idx < deref_chain->length; idx++) {
+      switch (glsl_get_base_type(type->type)) {
+      case GLSL_TYPE_UINT:
+      case GLSL_TYPE_INT:
+      case GLSL_TYPE_UINT16:
+      case GLSL_TYPE_INT16:
+      case GLSL_TYPE_UINT8:
+      case GLSL_TYPE_INT8:
+      case GLSL_TYPE_UINT64:
+      case GLSL_TYPE_INT64:
+      case GLSL_TYPE_FLOAT:
+      case GLSL_TYPE_FLOAT16:
+      case GLSL_TYPE_DOUBLE:
+      case GLSL_TYPE_BOOL:
+      case GLSL_TYPE_ARRAY: {
+         nir_ssa_def *elem_offset =
+            vtn_access_link_as_ssa(b, deref_chain->link[idx], type->stride);
+         offset = nir_iadd(&b->nb, offset, elem_offset);
+         type = type->array_element;
+         break;
+      }
+
+      case GLSL_TYPE_STRUCT: {
+         vtn_assert(deref_chain->link[idx].mode == vtn_access_mode_literal);
+         unsigned member = deref_chain->link[idx].id;
+         nir_ssa_def *mem_offset = nir_imm_int(&b->nb, type->offsets[member]);
+         offset = nir_iadd(&b->nb, offset, mem_offset);
+         type = type->members[member];
+         break;
+      }
+
+      default:
+         vtn_fail("Invalid type for deref");
+      }
+   }
+
+   /* at this point, offset is 32b, but pointer can be either 32b or 64b
+    * depending on memory model:
+    */
+   if (b->ptr_size == 64) {
+      offset = nir_u2u64(&b->nb, offset);
+   }
+
+   /* add pointer address to calculated offset: */
+   if (base->offset)
+      offset = nir_iadd(&b->nb, offset, base->offset);
+
+   struct vtn_pointer *ptr = rzalloc(b, struct vtn_pointer);
+   ptr->mode = base->mode;
+   ptr->type = type;
+   ptr->offset = offset;
+
+   return ptr;
+}
+
 /* Dereference the given base pointer by the access chain */
 static struct vtn_pointer *
 vtn_pointer_dereference(struct vtn_builder *b,
@@ -344,6 +426,8 @@ vtn_pointer_dereference(struct vtn_builder *b,
 {
    if (vtn_pointer_uses_ssa_offset(b, base)) {
       return vtn_ssa_offset_pointer_dereference(b, base, deref_chain);
+   } else if (base->ptr_type->base_type == vtn_base_type_raw_pointer) {
+      return vtn_ssa_raw_pointer_dereference(b, base, deref_chain);
    } else {
       return vtn_access_chain_pointer_dereference(b, base, deref_chain);
    }
@@ -373,7 +457,8 @@ vtn_pointer_for_variable(struct vtn_builder *b,
 
    pointer->mode = var->mode;
    pointer->type = var->type;
-   vtn_assert(ptr_type->base_type == vtn_base_type_pointer);
+   vtn_assert(ptr_type->base_type == vtn_base_type_pointer ||
+              ptr_type->base_type == vtn_base_type_raw_pointer);
    vtn_assert(ptr_type->deref->type == var->type->type);
    pointer->ptr_type = ptr_type;
    pointer->var = var;
@@ -384,6 +469,12 @@ vtn_pointer_for_variable(struct vtn_builder *b,
 nir_deref_var *
 vtn_pointer_to_deref(struct vtn_builder *b, struct vtn_pointer *ptr)
 {
+   /* once you've chased a pointer, you no longer really have a var,
+    * so this case is handled differently
+    */
+   if (!ptr->var)
+      return NULL;
+
    /* Do on-the-fly copy propagation for samplers. */
    if (ptr->var->copy_prop_sampler)
       return vtn_pointer_to_deref(b, ptr->var->copy_prop_sampler);
@@ -598,6 +689,49 @@ vtn_local_store(struct vtn_builder *b, struct vtn_ssa_value *src,
    }
 }
 
+struct vtn_ssa_value *
+vtn_pointer_load(struct vtn_builder *b, struct vtn_pointer *ptr)
+{
+   const struct glsl_type *type = ptr->type->type;
+   struct vtn_ssa_value *val = vtn_create_ssa_value(b, type);
+   nir_intrinsic_op op = nir_intrinsic_load_global;
+
+   vtn_assert(ptr->offset);
+
+   nir_intrinsic_instr *intrin = nir_intrinsic_instr_create(b->shader, op);
+   intrin->num_components = glsl_get_vector_elements(type);
+   intrin->src[0] = nir_src_for_ssa(ptr->offset);
+
+   nir_ssa_dest_init(&intrin->instr, &intrin->dest,
+                     intrin->num_components,
+                     glsl_get_bit_size(type),
+                     NULL);
+   val->def = &intrin->dest.ssa;
+
+   nir_builder_instr_insert(&b->nb, &intrin->instr);
+
+   return val;
+}
+
+void
+vtn_pointer_store(struct vtn_builder *b, struct vtn_ssa_value *src,
+                  struct vtn_pointer *ptr)
+{
+   const struct glsl_type *type = ptr->type->type;
+   nir_intrinsic_op op = nir_intrinsic_store_global;
+
+   vtn_assert(ptr->offset);
+
+   nir_intrinsic_instr *intrin = nir_intrinsic_instr_create(b->shader, op);
+   intrin->num_components = glsl_get_vector_elements(type);
+   intrin->src[0] = nir_src_for_ssa(src->def);
+   intrin->src[1] = nir_src_for_ssa(ptr->offset);
+
+   nir_intrinsic_set_write_mask(intrin, (1 << intrin->num_components) - 1);
+
+   nir_builder_instr_insert(&b->nb, &intrin->instr);
+}
+
 nir_ssa_def *
 vtn_pointer_to_offset(struct vtn_builder *b, struct vtn_pointer *ptr,
                       nir_ssa_def **index_out, unsigned *end_idx_out)
@@ -1004,20 +1138,33 @@ _vtn_variable_load_store(struct vtn_builder *b, bool load,
    case GLSL_TYPE_FLOAT:
    case GLSL_TYPE_FLOAT16:
    case GLSL_TYPE_BOOL:
-   case GLSL_TYPE_DOUBLE:
-      /* At this point, we have a scalar, vector, or matrix so we know that
-       * there cannot be any structure splitting still in the way.  By
-       * stopping at the matrix level rather than the vector level, we
-       * ensure that matrices get loaded in the optimal way even if they
-       * are storred row-major in a UBO.
-       */
-      if (load) {
-         *inout = vtn_local_load(b, vtn_pointer_to_deref(b, ptr));
+   case GLSL_TYPE_DOUBLE: {
+      nir_deref_var *deref_var = vtn_pointer_to_deref(b, ptr);
+
+      if (deref_var) {
+         /* At this point, we have a scalar, vector, or matrix so we know that
+          * there cannot be any structure splitting still in the way.  By
+          * stopping at the matrix level rather than the vector level, we
+          * ensure that matrices get loaded in the optimal way even if they
+          * are storred row-major in a UBO.
+          */
+         if (load) {
+            *inout = vtn_local_load(b, deref_var);
+         } else {
+            vtn_local_store(b, *inout, deref_var);
+         }
       } else {
-         vtn_local_store(b, *inout, vtn_pointer_to_deref(b, ptr));
+         /* If deref'ing a raw pointer, we don't have a variable to go along
+          * with it.  Just directly generate load/store_global intrinsics:
+          */
+         if (load) {
+            *inout = vtn_pointer_load(b, ptr);
+         } else {
+            vtn_pointer_store(b, *inout, ptr);
+         }
       }
       return;
-
+   }
    case GLSL_TYPE_ARRAY:
    case GLSL_TYPE_STRUCT: {
       unsigned elems = glsl_get_length(ptr->type->type);
@@ -1065,7 +1212,8 @@ vtn_variable_store(struct vtn_builder *b, struct vtn_ssa_value *src,
 {
    if (vtn_pointer_is_external_block(b, dest)) {
       vtn_assert(dest->mode == vtn_variable_mode_ssbo ||
-                 dest->mode == vtn_variable_mode_workgroup);
+                 dest->mode == vtn_variable_mode_workgroup ||
+                 dest->mode == vtn_variable_mode_param);
       vtn_block_store(b, src, dest);
    } else {
       _vtn_variable_load_store(b, false, dest, &src);
@@ -1668,6 +1816,10 @@ vtn_storage_class_to_mode(struct vtn_builder *b,
       nir_mode = nir_var_shared;
       break;
    case SpvStorageClassCrossWorkgroup:
+      mode = vtn_variable_mode_cross_workgroup;
+      // TODO do we want a new nir_mode for raw pointers?
+      nir_mode = nir_var_global;
+      break;
    case SpvStorageClassGeneric:
    case SpvStorageClassAtomicCounter:
    default:
@@ -1696,7 +1848,14 @@ vtn_pointer_to_ssa(struct vtn_builder *b, struct vtn_pointer *ptr)
       struct vtn_access_chain chain = {
          .length = 0,
       };
-      ptr = vtn_ssa_offset_pointer_dereference(b, ptr, &chain);
+
+      if (vtn_pointer_uses_ssa_offset(b, ptr)) {
+         ptr = vtn_ssa_offset_pointer_dereference(b, ptr, &chain);
+      } else if (ptr->ptr_type->base_type == vtn_base_type_raw_pointer) {
+         ptr = vtn_ssa_raw_pointer_dereference(b, ptr, &chain);
+      } else {
+         vtn_fail("unhandled");
+      }
    }
 
    vtn_assert(ptr->offset);
@@ -1714,8 +1873,8 @@ struct vtn_pointer *
 vtn_pointer_from_ssa(struct vtn_builder *b, nir_ssa_def *ssa,
                      struct vtn_type *ptr_type)
 {
-   vtn_assert(ssa->num_components <= 2 && ssa->bit_size == 32);
-   vtn_assert(ptr_type->base_type == vtn_base_type_pointer);
+   vtn_assert(ptr_type->base_type == vtn_base_type_pointer ||
+              ptr_type->base_type == vtn_base_type_raw_pointer);
    vtn_assert(ptr_type->deref->base_type != vtn_base_type_pointer);
    /* This pointer type needs to have actual storage */
    vtn_assert(ptr_type->type);
@@ -1723,18 +1882,25 @@ vtn_pointer_from_ssa(struct vtn_builder *b, nir_ssa_def *ssa,
    struct vtn_pointer *ptr = rzalloc(b, struct vtn_pointer);
    ptr->mode = vtn_storage_class_to_mode(b, ptr_type->storage_class,
                                          ptr_type, NULL);
+
+   if (ptr_type->base_type == vtn_base_type_raw_pointer) {
+      vtn_assert(ssa->num_components == 1 && ssa->bit_size == b->ptr_size);
+   } else {
+      vtn_assert(ssa->num_components <= 2 && ssa->bit_size == 32);
+   }
+
    ptr->type = ptr_type->deref;
    ptr->ptr_type = ptr_type;
 
    if (ssa->num_components > 1) {
       vtn_assert(ssa->num_components == 2);
       vtn_assert(ptr->mode == vtn_variable_mode_ubo ||
-                 ptr->mode == vtn_variable_mode_ssbo);
+                 ptr->mode == vtn_variable_mode_ssbo ||
+                 ptr->mode == vtn_variable_mode_global);
       ptr->block_index = nir_channel(&b->nb, ssa, 0);
       ptr->offset = nir_channel(&b->nb, ssa, 1);
    } else {
       vtn_assert(ssa->num_components == 1);
-      vtn_assert(ptr->mode == vtn_variable_mode_workgroup);
       ptr->block_index = NULL;
       ptr->offset = ssa;
    }
@@ -1765,7 +1931,8 @@ vtn_create_variable(struct vtn_builder *b, struct vtn_value *val,
                     struct vtn_type *ptr_type, SpvStorageClass storage_class,
                     nir_constant *initializer)
 {
-   vtn_assert(ptr_type->base_type == vtn_base_type_pointer);
+   vtn_assert(ptr_type->base_type == vtn_base_type_pointer ||
+              ptr_type->base_type == vtn_base_type_raw_pointer);
    struct vtn_type *type = ptr_type->deref;
 
    struct vtn_type *without_array = type;
@@ -1937,6 +2104,7 @@ vtn_create_variable(struct vtn_builder *b, struct vtn_value *val,
    case vtn_variable_mode_ubo:
    case vtn_variable_mode_ssbo:
    case vtn_variable_mode_push_constant:
+   case vtn_variable_mode_cross_workgroup:
       /* These don't need actual variables. */
       break;
    }
-- 
2.14.3



More information about the mesa-dev mailing list