nir: deref only for OpTypePointer

[mesa.git] / src / compiler / spirv / spirv_to_nir.c
diff --git a/src/compiler/spirv/spirv_to_nir.c b/src/compiler/spirv/spirv_to_nir.c

index 1a86312539e69fd44ed8b7d795d955f0f1ada764..ce3e0781afc34a9e6b83aaf38b911e0b0b1ce289 100644 (file)
--- a/src/compiler/spirv/spirv_to_nir.c
+++ b/src/compiler/spirv/spirv_to_nir.c
@@ -32,6 +32,8 @@
  #include "nir/nir_deref.h"
  #include "spirv_info.h"
  
+#include "util/u_math.h"
+
  #include <stdio.h>
  
  void
@@ -395,6 +397,8 @@ vtn_handle_extension(struct vtn_builder *b, SpvOp opcode,
        } else if ((strcmp(ext, "SPV_AMD_shader_trinary_minmax") == 0)
                  && (b->options && b->options->caps.trinary_minmax)) {
           val->ext_handler = vtn_handle_amd_shader_trinary_minmax_instruction;
+      } else if (strcmp(ext, "OpenCL.std") == 0) {
+         val->ext_handler = vtn_handle_opencl_instruction;
        } else {
           vtn_fail("Unsupported extension: %s", ext);
        }
@@ -497,7 +501,8 @@ vtn_handle_decoration(struct vtn_builder *b, SpvOp opcode,
     case SpvOpMemberDecorate:
     case SpvOpDecorateStringGOOGLE:
     case SpvOpMemberDecorateStringGOOGLE:
-   case SpvOpExecutionMode: {
+   case SpvOpExecutionMode:
+   case SpvOpExecutionModeId: {
        struct vtn_value *val = vtn_untyped_value(b, target);
  
        struct vtn_decoration *dec = rzalloc(b, struct vtn_decoration);
@@ -513,6 +518,7 @@ vtn_handle_decoration(struct vtn_builder *b, SpvOp opcode,
                       "Member argument of OpMemberDecorate too large");
           break;
        case SpvOpExecutionMode:
+      case SpvOpExecutionModeId:
           dec->scope = VTN_DEC_EXECUTION_MODE;
           break;
        default:
@@ -815,13 +821,22 @@ struct_member_decoration_cb(struct vtn_builder *b,
        break;
  
     case SpvDecorationCPacked:
+      if (b->shader->info.stage != MESA_SHADER_KERNEL)
+         vtn_warn("Decoration only allowed for CL-style kernels: %s",
+                  spirv_decoration_to_string(dec->decoration));
+      else
+         ctx->type->packed = true;
+      break;
+
     case SpvDecorationSaturatedConversion:
     case SpvDecorationFuncParamAttr:
     case SpvDecorationFPRoundingMode:
     case SpvDecorationFPFastMathMode:
     case SpvDecorationAlignment:
-      vtn_warn("Decoration only allowed for CL-style kernels: %s",
-               spirv_decoration_to_string(dec->decoration));
+      if (b->shader->info.stage != MESA_SHADER_KERNEL) {
+         vtn_warn("Decoration only allowed for CL-style kernels: %s",
+                  spirv_decoration_to_string(dec->decoration));
+      }
        break;
  
     case SpvDecorationHlslSemanticGOOGLE:
@@ -973,6 +988,13 @@ type_decoration_cb(struct vtn_builder *b,
        break;
  
     case SpvDecorationCPacked:
+      if (b->shader->info.stage != MESA_SHADER_KERNEL)
+         vtn_warn("Decoration only allowed for CL-style kernels: %s",
+                  spirv_decoration_to_string(dec->decoration));
+      else
+         type->packed = true;
+      break;
+
     case SpvDecorationSaturatedConversion:
     case SpvDecorationFuncParamAttr:
     case SpvDecorationFPRoundingMode:
@@ -1042,14 +1064,16 @@ vtn_type_layout_std430(struct vtn_builder *b, struct vtn_type *type,
  {
     switch (type->base_type) {
     case vtn_base_type_scalar: {
-      uint32_t comp_size = glsl_get_bit_size(type->type) / 8;
+      uint32_t comp_size = glsl_type_is_boolean(type->type)
+         ? 4 : glsl_get_bit_size(type->type) / 8;
        *size_out = comp_size;
        *align_out = comp_size;
        return type;
     }
  
     case vtn_base_type_vector: {
-      uint32_t comp_size = glsl_get_bit_size(type->type) / 8;
+      uint32_t comp_size = glsl_type_is_boolean(type->type)
+         ? 4 : glsl_get_bit_size(type->type) / 8;
        unsigned align_comps = type->length == 3 ? 4 : type->length;
        *size_out = comp_size * type->length,
        *align_out = comp_size * align_comps;
@@ -1097,10 +1121,18 @@ static void
  vtn_handle_type(struct vtn_builder *b, SpvOp opcode,
                  const uint32_t *w, unsigned count)
  {
-   struct vtn_value *val = vtn_push_value(b, w[1], vtn_value_type_type);
+   struct vtn_value *val = NULL;
  
-   val->type = rzalloc(b, struct vtn_type);
-   val->type->id = w[1];
+   /* In order to properly handle forward declarations, we have to defer
+    * allocation for pointer types.
+    */
+   if (opcode != SpvOpTypePointer && opcode != SpvOpTypeForwardPointer) {
+      val = vtn_push_value(b, w[1], vtn_value_type_type);
+      vtn_fail_if(val->type != NULL,
+                  "Only pointers can have forward declarations");
+      val->type = rzalloc(b, struct vtn_type);
+      val->type->id = w[1];
+   }
  
     switch (opcode) {
     case SpvOpTypeVoid:
@@ -1168,7 +1200,8 @@ vtn_handle_type(struct vtn_builder *b, SpvOp opcode,
        val->type->base_type = vtn_base_type_vector;
        val->type->type = glsl_vector_type(glsl_get_base_type(base->type), elems);
        val->type->length = elems;
-      val->type->stride = glsl_get_bit_size(base->type) / 8;
+      val->type->stride = glsl_type_is_boolean(val->type->type)
+         ? 4 : glsl_get_bit_size(base->type) / 8;
        val->type->array_element = base;
        break;
     }
@@ -1211,7 +1244,8 @@ vtn_handle_type(struct vtn_builder *b, SpvOp opcode,
  
        val->type->base_type = vtn_base_type_array;
        val->type->array_element = array_element;
-      val->type->stride = 0;
+      if (b->shader->info.stage == MESA_SHADER_KERNEL)
+         val->type->stride = glsl_get_cl_size(array_element->type);
  
        vtn_foreach_decoration(b, val, array_stride_decoration_cb, NULL);
        val->type->type = glsl_array_type(array_element->type, val->type->length,
@@ -1225,6 +1259,7 @@ vtn_handle_type(struct vtn_builder *b, SpvOp opcode,
        val->type->length = num_fields;
        val->type->members = ralloc_array(b, struct vtn_type *, num_fields);
        val->type->offsets = ralloc_array(b, unsigned, num_fields);
+      val->type->packed = false;
  
        NIR_VLA(struct glsl_struct_field, fields, count);
        for (unsigned i = 0; i < num_fields; i++) {
@@ -1234,9 +1269,19 @@ vtn_handle_type(struct vtn_builder *b, SpvOp opcode,
              .type = val->type->members[i]->type,
              .name = ralloc_asprintf(b, "field%d", i),
              .location = -1,
+            .offset = -1,
           };
        }
  
+      if (b->shader->info.stage == MESA_SHADER_KERNEL) {
+         unsigned offset = 0;
+         for (unsigned i = 0; i < num_fields; i++) {
+            offset = align(offset, glsl_get_cl_alignment(fields[i].type));
+            fields[i].offset = offset;
+            offset += glsl_get_cl_size(fields[i].type);
+         }
+      }
+
        struct member_decoration_ctx ctx = {
           .num_fields = num_fields,
           .fields = fields,
@@ -1248,7 +1293,7 @@ vtn_handle_type(struct vtn_builder *b, SpvOp opcode,
  
        const char *name = val->name ? val->name : "struct";
  
-      val->type->type = glsl_struct_type(fields, num_fields, name);
+      val->type->type = glsl_struct_type(fields, num_fields, name, false);
        break;
     }
  
@@ -1268,46 +1313,93 @@ vtn_handle_type(struct vtn_builder *b, SpvOp opcode,
        break;
     }
  
-   case SpvOpTypePointer: {
+   case SpvOpTypePointer:
+   case SpvOpTypeForwardPointer: {
+      /* We can't blindly push the value because it might be a forward
+       * declaration.
+       */
+      val = vtn_untyped_value(b, w[1]);
+
        SpvStorageClass storage_class = w[2];
-      struct vtn_type *deref_type =
-         vtn_value(b, w[3], vtn_value_type_type)->type;
  
-      val->type->base_type = vtn_base_type_pointer;
-      val->type->storage_class = storage_class;
-      val->type->deref = deref_type;
+      if (val->value_type == vtn_value_type_invalid) {
+         val->value_type = vtn_value_type_type;
+         val->type = rzalloc(b, struct vtn_type);
+         val->type->id = w[1];
+         val->type->base_type = vtn_base_type_pointer;
+         val->type->storage_class = storage_class;
  
-      vtn_foreach_decoration(b, val, array_stride_decoration_cb, NULL);
+         /* These can actually be stored to nir_variables and used as SSA
+          * values so they need a real glsl_type.
+          */
+         switch (storage_class) {
+         case SpvStorageClassUniform:
+            val->type->type = b->options->ubo_ptr_type;
+            break;
+         case SpvStorageClassStorageBuffer:
+            val->type->type = b->options->ssbo_ptr_type;
+            break;
+         case SpvStorageClassPhysicalStorageBufferEXT:
+            val->type->type = b->options->phys_ssbo_ptr_type;
+            break;
+         case SpvStorageClassPushConstant:
+            val->type->type = b->options->push_const_ptr_type;
+            break;
+         case SpvStorageClassWorkgroup:
+            val->type->type = b->options->shared_ptr_type;
+            break;
+         case SpvStorageClassCrossWorkgroup:
+            val->type->type = b->options->global_ptr_type;
+            break;
+         case SpvStorageClassFunction:
+            if (b->physical_ptrs)
+               val->type->type = b->options->temp_ptr_type;
+            break;
+         default:
+            /* In this case, no variable pointers are allowed so all deref
+             * chains are complete back to the variable and it doesn't matter
+             * what type gets used so we leave it NULL.
+             */
+            break;
+         }
+      } else {
+         vtn_fail_if(val->type->storage_class != storage_class,
+                     "The storage classes of an OpTypePointer and any "
+                     "OpTypeForwardPointers that provide forward "
+                     "declarations of it must match.");
+      }
  
-      /* These can actually be stored to nir_variables and used as SSA
-       * values so they need a real glsl_type.
-       */
-      switch (storage_class) {
-      case SpvStorageClassUniform:
-         val->type->type = b->options->ubo_ptr_type;
-         break;
-      case SpvStorageClassStorageBuffer:
-         val->type->type = b->options->ssbo_ptr_type;
-         break;
-      case SpvStorageClassPushConstant:
-         val->type->type = b->options->push_const_ptr_type;
-         break;
-      case SpvStorageClassWorkgroup:
-         val->type->type = b->options->shared_ptr_type;
-         if (b->options->lower_workgroup_access_to_offsets) {
+      if (opcode == SpvOpTypePointer) {
+         vtn_fail_if(val->type->deref != NULL,
+                     "While OpTypeForwardPointer can be used to provide a "
+                     "forward declaration of a pointer, OpTypePointer can "
+                     "only be used once for a given id.");
+
+         val->type->deref = vtn_value(b, w[3], vtn_value_type_type)->type;
+
+         vtn_foreach_decoration(b, val, array_stride_decoration_cb, NULL);
+
+         if (b->physical_ptrs) {
+            switch (storage_class) {
+            case SpvStorageClassFunction:
+            case SpvStorageClassWorkgroup:
+            case SpvStorageClassCrossWorkgroup:
+               val->type->stride = align(glsl_get_cl_size(val->type->deref->type),
+                                         glsl_get_cl_alignment(val->type->deref->type));
+               break;
+            default:
+               break;
+            }
+         }
+
+         if (storage_class == SpvStorageClassWorkgroup &&
+             b->options->lower_workgroup_access_to_offsets) {
              uint32_t size, align;
              val->type->deref = vtn_type_layout_std430(b, val->type->deref,
                                                        &size, &align);
              val->type->length = size;
              val->type->align = align;
           }
-         break;
-      default:
-         /* In this case, no variable pointers are allowed so all deref chains
-          * are complete back to the variable and it doesn't matter what type
-          * gets used so we leave it NULL.
-          */
-         break;
        }
        break;
     }
@@ -1335,7 +1427,9 @@ vtn_handle_type(struct vtn_builder *b, SpvOp opcode,
           vtn_fail("Invalid SPIR-V image dimensionality");
        }
  
-      bool is_shadow = w[4];
+      /* w[4]: as per Vulkan spec "Validation Rules within a Module",
+       *       The “Depth” operand of OpTypeImage is ignored.
+       */
        bool is_array = w[5];
        bool multisampled = w[6];
        unsigned sampled = w[7];
@@ -1361,10 +1455,9 @@ vtn_handle_type(struct vtn_builder *b, SpvOp opcode,
           glsl_get_base_type(sampled_type->type);
        if (sampled == 1) {
           val->type->sampled = true;
-         val->type->type = glsl_sampler_type(dim, is_shadow, is_array,
+         val->type->type = glsl_sampler_type(dim, false, is_array,
                                               sampled_base_type);
        } else if (sampled == 2) {
-         vtn_assert(!is_shadow);
           val->type->sampled = false;
           val->type->type = glsl_image_type(dim, is_array, sampled_base_type);
        } else {
@@ -1523,10 +1616,7 @@ handle_workgroup_size_decoration_cb(struct vtn_builder *b,
        return;
  
     vtn_assert(val->type->type == glsl_vector_type(GLSL_TYPE_UINT, 3));
-
-   b->shader->info.cs.local_size[0] = val->constant->values[0].u32[0];
-   b->shader->info.cs.local_size[1] = val->constant->values[0].u32[1];
-   b->shader->info.cs.local_size[2] = val->constant->values[0].u32[2];
+   b->workgroup_size_builtin = val;
  }
  
  static void
@@ -2114,6 +2204,7 @@ vtn_handle_texture(struct vtn_builder *b, SpvOp opcode,
     case nir_texop_txl:
     case nir_texop_txd:
     case nir_texop_tg4:
+   case nir_texop_lod:
        /* These operations require a sampler */
        p->src = nir_src_for_ssa(&sampler->dest.ssa);
        p->src_type = nir_tex_src_sampler_deref;
@@ -2122,7 +2213,6 @@ vtn_handle_texture(struct vtn_builder *b, SpvOp opcode,
     case nir_texop_txf:
     case nir_texop_txf_ms:
     case nir_texop_txs:
-   case nir_texop_lod:
     case nir_texop_query_levels:
     case nir_texop_texture_samples:
     case nir_texop_samples_identical:
@@ -3004,12 +3094,7 @@ nir_ssa_def *
  vtn_vector_extract_dynamic(struct vtn_builder *b, nir_ssa_def *src,
                             nir_ssa_def *index)
  {
-   nir_ssa_def *dest = vtn_vector_extract(b, src, 0);
-   for (unsigned i = 1; i < src->num_components; i++)
-      dest = nir_bcsel(&b->nb, nir_ieq_imm(&b->nb, index, i),
-                       vtn_vector_extract(b, src, i), dest);
-
-   return dest;
+   return nir_vector_extract(&b->nb, src, nir_i2i(&b->nb, index, 32));
  }
  
  nir_ssa_def *
@@ -3317,7 +3402,7 @@ vtn_handle_barrier(struct vtn_builder *b, SpvOp opcode,
        switch (opcode) {
        case SpvOpEmitStreamVertex:
        case SpvOpEndStreamPrimitive: {
-         unsigned stream = vtn_constant_value(b, w[1])->values[0].u32[0];
+         unsigned stream = vtn_constant_uint(b, w[1]);
           nir_intrinsic_set_stream_id(intrin, stream);
           break;
        }
@@ -3331,23 +3416,19 @@ vtn_handle_barrier(struct vtn_builder *b, SpvOp opcode,
     }
  
     case SpvOpMemoryBarrier: {
-      SpvScope scope = vtn_constant_value(b, w[1])->values[0].u32[0];
-      SpvMemorySemanticsMask semantics =
-         vtn_constant_value(b, w[2])->values[0].u32[0];
+      SpvScope scope = vtn_constant_uint(b, w[1]);
+      SpvMemorySemanticsMask semantics = vtn_constant_uint(b, w[2]);
        vtn_emit_memory_barrier(b, scope, semantics);
        return;
     }
  
     case SpvOpControlBarrier: {
-      SpvScope execution_scope =
-         vtn_constant_value(b, w[1])->values[0].u32[0];
+      SpvScope execution_scope = vtn_constant_uint(b, w[1]);
        if (execution_scope == SpvScopeWorkgroup)
           vtn_emit_barrier(b, nir_intrinsic_barrier);
  
-      SpvScope memory_scope =
-         vtn_constant_value(b, w[2])->values[0].u32[0];
-      SpvMemorySemanticsMask memory_semantics =
-         vtn_constant_value(b, w[3])->values[0].u32[0];
+      SpvScope memory_scope = vtn_constant_uint(b, w[2]);
+      SpvMemorySemanticsMask memory_semantics = vtn_constant_uint(b, w[3]);
        vtn_emit_memory_barrier(b, memory_scope, memory_semantics);
        break;
     }
@@ -3422,6 +3503,8 @@ stage_for_execution_model(struct vtn_builder *b, SpvExecutionModel model)
        return MESA_SHADER_FRAGMENT;
     case SpvExecutionModelGLCompute:
        return MESA_SHADER_COMPUTE;
+   case SpvExecutionModelKernel:
+      return MESA_SHADER_KERNEL;
     default:
        vtn_fail("Unsupported execution model");
     }
@@ -3519,7 +3602,6 @@ vtn_handle_preamble_instruction(struct vtn_builder *b, SpvOp opcode,
        case SpvCapabilityVector16:
        case SpvCapabilityFloat16Buffer:
        case SpvCapabilityFloat16:
-      case SpvCapabilityInt8:
        case SpvCapabilitySparseResidency:
           vtn_warn("Unsupported SPIR-V capability: %s",
                    spirv_capability_to_string(cap));
@@ -3555,12 +3637,22 @@ vtn_handle_preamble_instruction(struct vtn_builder *b, SpvOp opcode,
           spv_check_supported(int64_atomics, cap);
           break;
  
+      case SpvCapabilityInt8:
+         spv_check_supported(int8, cap);
+         break;
+
        case SpvCapabilityStorageImageMultisample:
           spv_check_supported(storage_image_ms, cap);
           break;
  
        case SpvCapabilityAddresses:
+         spv_check_supported(address, cap);
+         break;
+
        case SpvCapabilityKernel:
+         spv_check_supported(kernel, cap);
+         break;
+
        case SpvCapabilityImageBasic:
        case SpvCapabilityImageReadWrite:
        case SpvCapabilityImageMipmap:
@@ -3670,6 +3762,10 @@ vtn_handle_preamble_instruction(struct vtn_builder *b, SpvOp opcode,
           spv_check_supported(post_depth_coverage, cap);
           break;
  
+      case SpvCapabilityPhysicalStorageBufferAddressesEXT:
+         spv_check_supported(physical_storage_buffer_address, cap);
+         break;
+
        default:
           vtn_fail("Unhandled capability");
        }
@@ -3681,9 +3777,44 @@ vtn_handle_preamble_instruction(struct vtn_builder *b, SpvOp opcode,
        break;
  
     case SpvOpMemoryModel:
-      vtn_assert(w[1] == SpvAddressingModelLogical);
+      switch (w[1]) {
+      case SpvAddressingModelPhysical32:
+         vtn_fail_if(b->shader->info.stage != MESA_SHADER_KERNEL,
+                     "AddressingModelPhysical32 only supported for kernels");
+         b->shader->info.cs.ptr_size = 32;
+         b->physical_ptrs = true;
+         b->options->shared_ptr_type = glsl_uint_type();
+         b->options->global_ptr_type = glsl_uint_type();
+         b->options->temp_ptr_type = glsl_uint_type();
+         break;
+      case SpvAddressingModelPhysical64:
+         vtn_fail_if(b->shader->info.stage != MESA_SHADER_KERNEL,
+                     "AddressingModelPhysical64 only supported for kernels");
+         b->shader->info.cs.ptr_size = 64;
+         b->physical_ptrs = true;
+         b->options->shared_ptr_type = glsl_uint64_t_type();
+         b->options->global_ptr_type = glsl_uint64_t_type();
+         b->options->temp_ptr_type = glsl_uint64_t_type();
+         break;
+      case SpvAddressingModelLogical:
+         vtn_fail_if(b->shader->info.stage >= MESA_SHADER_STAGES,
+                     "AddressingModelLogical only supported for shaders");
+         b->shader->info.cs.ptr_size = 0;
+         b->physical_ptrs = false;
+         break;
+      case SpvAddressingModelPhysicalStorageBuffer64EXT:
+         vtn_fail_if(!b->options ||
+                     !b->options->caps.physical_storage_buffer_address,
+                     "AddressingModelPhysicalStorageBuffer64EXT not supported");
+         break;
+      default:
+         vtn_fail("Unknown addressing model");
+         break;
+      }
+
        vtn_assert(w[2] == SpvMemoryModelSimple ||
-                 w[2] == SpvMemoryModelGLSL450);
+                 w[2] == SpvMemoryModelGLSL450 ||
+                 w[2] == SpvMemoryModelOpenCL);
        break;
  
     case SpvOpEntryPoint:
@@ -3704,6 +3835,7 @@ vtn_handle_preamble_instruction(struct vtn_builder *b, SpvOp opcode,
        break;
  
     case SpvOpExecutionMode:
+   case SpvOpExecutionModeId:
     case SpvOpDecorationGroup:
     case SpvOpDecorate:
     case SpvOpMemberDecorate:
@@ -3730,7 +3862,8 @@ vtn_handle_execution_mode(struct vtn_builder *b, struct vtn_value *entry_point,
     switch(mode->exec_mode) {
     case SpvExecutionModeOriginUpperLeft:
     case SpvExecutionModeOriginLowerLeft:
-      b->origin_upper_left =
+      vtn_assert(b->shader->info.stage == MESA_SHADER_FRAGMENT);
+      b->shader->info.fs.origin_upper_left =
           (mode->exec_mode == SpvExecutionModeOriginUpperLeft);
        break;
  
@@ -3772,7 +3905,15 @@ vtn_handle_execution_mode(struct vtn_builder *b, struct vtn_value *entry_point,
        b->shader->info.cs.local_size[1] = mode->literals[1];
        b->shader->info.cs.local_size[2] = mode->literals[2];
        break;
+
+   case SpvExecutionModeLocalSizeId:
+      b->shader->info.cs.local_size[0] = vtn_constant_uint(b, mode->literals[0]);
+      b->shader->info.cs.local_size[1] = vtn_constant_uint(b, mode->literals[1]);
+      b->shader->info.cs.local_size[2] = vtn_constant_uint(b, mode->literals[2]);
+      break;
+
     case SpvExecutionModeLocalSizeHint:
+   case SpvExecutionModeLocalSizeHintId:
        break; /* Nothing to do with this */
  
     case SpvExecutionModeOutputVertices:
@@ -3845,7 +3986,8 @@ vtn_handle_execution_mode(struct vtn_builder *b, struct vtn_value *entry_point,
        break;
  
     case SpvExecutionModePixelCenterInteger:
-      b->pixel_center_integer = true;
+      vtn_assert(b->shader->info.stage == MESA_SHADER_FRAGMENT);
+      b->shader->info.fs.pixel_center_integer = true;
        break;
  
     case SpvExecutionModeXfb:
@@ -3853,9 +3995,16 @@ vtn_handle_execution_mode(struct vtn_builder *b, struct vtn_value *entry_point,
        break;
  
     case SpvExecutionModeVecTypeHint:
-   case SpvExecutionModeContractionOff:
        break; /* OpenCL */
  
+   case SpvExecutionModeContractionOff:
+      if (b->shader->info.stage != MESA_SHADER_KERNEL)
+         vtn_warn("ExectionMode only allowed for CL-style kernels: %s",
+                  spirv_executionmode_to_string(mode->exec_mode));
+      else
+         b->exact = true;
+      break;
+
     case SpvExecutionModeStencilRefReplacingEXT:
        vtn_assert(b->shader->info.stage == MESA_SHADER_FRAGMENT);
        break;
@@ -3908,6 +4057,7 @@ vtn_handle_variable_or_type_instruction(struct vtn_builder *b, SpvOp opcode,
     case SpvOpTypeStruct:
     case SpvOpTypeOpaque:
     case SpvOpTypePointer:
+   case SpvOpTypeForwardPointer:
     case SpvOpTypeFunction:
     case SpvOpTypeEvent:
     case SpvOpTypeDeviceEvent:
@@ -3974,7 +4124,10 @@ vtn_handle_body_instruction(struct vtn_builder *b, SpvOp opcode,
     case SpvOpAccessChain:
     case SpvOpPtrAccessChain:
     case SpvOpInBoundsAccessChain:
+   case SpvOpInBoundsPtrAccessChain:
     case SpvOpArrayLength:
+   case SpvOpConvertPtrToU:
+   case SpvOpConvertUToPtr:
        vtn_handle_variables(b, opcode, w, count);
        break;
  
@@ -4131,8 +4284,6 @@ vtn_handle_body_instruction(struct vtn_builder *b, SpvOp opcode,
     case SpvOpSConvert:
     case SpvOpFConvert:
     case SpvOpQuantizeToF16:
-   case SpvOpConvertPtrToU:
-   case SpvOpConvertUToPtr:
     case SpvOpPtrCastToGeneric:
     case SpvOpGenericCastToPtr:
     case SpvOpBitcast:
@@ -4290,6 +4441,10 @@ vtn_create_builder(const uint32_t *words, size_t word_count,
  {
     /* Initialize the vtn_builder object */
     struct vtn_builder *b = rzalloc(NULL, struct vtn_builder);
+   struct spirv_to_nir_options *dup_options =
+      ralloc(b, struct spirv_to_nir_options);
+   *dup_options = *options;
+
     b->spirv = words;
     b->spirv_word_count = word_count;
     b->file = NULL;
@@ -4298,7 +4453,7 @@ vtn_create_builder(const uint32_t *words, size_t word_count,
     exec_list_make_empty(&b->functions);
     b->entry_point_stage = stage;
     b->entry_point_name = entry_point_name;
-   b->options = options;
+   b->options = dup_options;
  
     /*
      * Handle the SPIR-V header (first 5 dwords).
@@ -4341,6 +4496,68 @@ vtn_create_builder(const uint32_t *words, size_t word_count,
     return NULL;
  }
  
+static nir_function *
+vtn_emit_kernel_entry_point_wrapper(struct vtn_builder *b,
+                                    nir_function *entry_point)
+{
+   vtn_assert(entry_point == b->entry_point->func->impl->function);
+   vtn_fail_if(!entry_point->name, "entry points are required to have a name");
+   const char *func_name =
+      ralloc_asprintf(b->shader, "__wrapped_%s", entry_point->name);
+
+   /* the loop below creates every shader input, so none may exist yet */
+   vtn_assert(!entry_point->shader->num_inputs);
+   vtn_assert(b->shader->info.stage == MESA_SHADER_KERNEL);
+
+   nir_function *main_entry_point = nir_function_create(b->shader, func_name);
+   main_entry_point->impl = nir_function_impl_create(main_entry_point);
+   nir_builder_init(&b->nb, main_entry_point->impl);
+   b->nb.cursor = nir_after_cf_list(&main_entry_point->impl->body);
+   b->func_param_idx = 0;
+
+   nir_call_instr *call = nir_call_instr_create(b->nb.shader, entry_point);
+
+   for (unsigned i = 0; i < entry_point->num_params; ++i) {
+      struct vtn_type *param_type = b->entry_point->func->type->params[i];
+
+      /* a pointer parameter in the Function storage class is handled as a
+       * by-value argument: the input variable gets the pointee type
+       */
+      bool is_by_val = param_type->base_type == vtn_base_type_pointer &&
+         param_type->storage_class == SpvStorageClassFunction;
+
+      /* one read-only shader_in variable per parameter, at location i */
+      nir_variable *in_var = rzalloc(b->nb.shader, nir_variable);
+      in_var->data.mode = nir_var_shader_in;
+      in_var->data.read_only = true;
+      in_var->data.location = i;
+
+      if (is_by_val)
+         in_var->type = param_type->deref->type;
+      else
+         in_var->type = param_type->type;
+
+      nir_shader_add_variable(b->nb.shader, in_var);
+      b->nb.shader->num_inputs++;
+
+      /* by-value: pass a deref of a local copy; otherwise pass the load */
+      if (is_by_val) {
+         nir_variable *copy_var =
+            nir_local_variable_create(main_entry_point->impl, in_var->type,
+                                      "copy_in");
+         nir_copy_var(&b->nb, copy_var, in_var);
+         call->params[i] =
+            nir_src_for_ssa(&nir_build_deref_var(&b->nb, copy_var)->dest.ssa);
+      } else {
+         call->params[i] = nir_src_for_ssa(nir_load_var(&b->nb, in_var));
+      }
+   }
+
+   nir_builder_instr_insert(&b->nb, &call->instr);
+
+   return main_entry_point;
+}
+
  nir_function *
  spirv_to_nir(const uint32_t *words, size_t word_count,
               struct nir_spirv_specialization *spec, unsigned num_spec,
@@ -4367,6 +4584,8 @@ spirv_to_nir(const uint32_t *words, size_t word_count,
     /* Skip the SPIR-V header, handled at vtn_create_builder */
     words+= 5;
  
+   b->shader = nir_shader_create(b, stage, nir_options, NULL);
+
     /* Handle all the preamble instructions */
     words = vtn_foreach_instruction(b, words, word_end,
                                     vtn_handle_preamble_instruction);
@@ -4377,15 +4596,9 @@ spirv_to_nir(const uint32_t *words, size_t word_count,
        return NULL;
     }
  
-   b->shader = nir_shader_create(b, stage, nir_options, NULL);
-
     /* Set shader info defaults */
     b->shader->info.gs.invocations = 1;
  
-   /* Parse execution modes */
-   vtn_foreach_execution_mode(b, b->entry_point,
-                              vtn_handle_execution_mode, NULL);
-
     b->specializations = spec;
     b->num_specializations = num_spec;
  
@@ -4393,6 +4606,22 @@ spirv_to_nir(const uint32_t *words, size_t word_count,
     words = vtn_foreach_instruction(b, words, word_end,
                                     vtn_handle_variable_or_type_instruction);
  
+   /* Parse execution modes */
+   vtn_foreach_execution_mode(b, b->entry_point,
+                              vtn_handle_execution_mode, NULL);
+
+   if (b->workgroup_size_builtin) {
+      vtn_assert(b->workgroup_size_builtin->type->type ==
+                 glsl_vector_type(GLSL_TYPE_UINT, 3));
+
+      nir_const_value *const_size =
+         &b->workgroup_size_builtin->constant->values[0];
+
+      b->shader->info.cs.local_size[0] = const_size->u32[0];
+      b->shader->info.cs.local_size[1] = const_size->u32[1];
+      b->shader->info.cs.local_size[2] = const_size->u32[2];
+   }
+
     /* Set types on all vtn_values */
     vtn_foreach_instruction(b, words, word_end, vtn_set_instruction_result_type);
  
@@ -4414,20 +4643,39 @@ spirv_to_nir(const uint32_t *words, size_t word_count,
        }
     } while (progress);
  
+   vtn_assert(b->entry_point->value_type == vtn_value_type_function);
+   nir_function *entry_point = b->entry_point->func->impl->function;
+   vtn_assert(entry_point);
+
+   /* post process entry_points with input params */
+   if (entry_point->num_params && b->shader->info.stage == MESA_SHADER_KERNEL)
+      entry_point = vtn_emit_kernel_entry_point_wrapper(b, entry_point);
+
+   entry_point->is_entrypoint = true;
+
+   /* When multiple shader stages exist in the same SPIR-V module, we
+    * generate input and output variables for every stage, in the same
+    * NIR program.  These dead variables can be invalid NIR.  For example,
+    * TCS outputs must be per-vertex arrays (or decorated 'patch'), while
+    * VS output variables wouldn't be.
+    *
+    * To ensure we have valid NIR, we eliminate any dead inputs and outputs
+    * right away.  In order to do so, we must lower any constant initializers
+    * on outputs so nir_remove_dead_variables sees that they're written to.
+    */
+   nir_lower_constant_initializers(b->shader, nir_var_shader_out);
+   nir_remove_dead_variables(b->shader,
+                             nir_var_shader_in | nir_var_shader_out);
+
     /* We sometimes generate bogus derefs that, while never used, give the
      * validator a bit of heartburn.  Run dead code to get rid of them.
      */
     nir_opt_dce(b->shader);
  
-   vtn_assert(b->entry_point->value_type == vtn_value_type_function);
-   nir_function *entry_point = b->entry_point->func->impl->function;
-   vtn_assert(entry_point);
-
     /* Unparent the shader from the vtn_builder before we delete the builder */
     ralloc_steal(NULL, b->shader);
  
     ralloc_free(b);
  
-   entry_point->is_entrypoint = true;
     return entry_point;
  }