case SpvOpDecorate:
case SpvOpMemberDecorate:
+ case SpvOpDecorateStringGOOGLE:
+ case SpvOpMemberDecorateStringGOOGLE:
case SpvOpExecutionMode: {
struct vtn_value *val = vtn_untyped_value(b, target);
struct vtn_decoration *dec = rzalloc(b, struct vtn_decoration);
switch (opcode) {
case SpvOpDecorate:
+ case SpvOpDecorateStringGOOGLE:
dec->scope = VTN_DEC_DECORATION;
break;
case SpvOpMemberDecorate:
+ case SpvOpMemberDecorateStringGOOGLE:
dec->scope = VTN_DEC_STRUCT_MEMBER0 + *(w++);
vtn_fail_if(dec->scope < VTN_DEC_STRUCT_MEMBER0, /* overflow */
"Member argument of OpMemberDecorate too large");
struct vtn_type *type;
};
+/**
+ * Returns true if the given type contains a struct decorated with Block or
+ * BufferBlock.
+ */
+bool
+vtn_type_contains_block(struct vtn_builder *b, struct vtn_type *type)
+{
+ switch (type->base_type) {
+ case vtn_base_type_array:
+ return vtn_type_contains_block(b, type->array_element);
+ case vtn_base_type_struct:
+ if (type->block || type->buffer_block)
+ return true;
+ for (unsigned i = 0; i < type->length; i++) {
+ if (vtn_type_contains_block(b, type->members[i]))
+ return true;
+ }
+ return false;
+ default:
+ return false;
+ }
+}
+
/** Returns true if two types are "compatible", i.e. you can do an OpLoad,
* OpStore, or OpCopyMemory between them without breaking anything.
* Technically, the SPIR-V rules require the exact same type ID but this lets
return type;
}
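+/* Applies an access qualifier to a single struct member, copying the member
+ * type first so the original (possibly shared) vtn_type is left untouched.
+ */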
+static void
+vtn_handle_access_qualifier(struct vtn_builder *b, struct vtn_type *type,
+ int member, enum gl_access_qualifier access)
+{
+ type->members[member] = vtn_type_copy(b, type->members[member]);
+ type = type->members[member];
+
+ type->access |= access;
+}
+
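+/* Decoration callback that records an explicit ArrayStride on the type. */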
+static void
+array_stride_decoration_cb(struct vtn_builder *b,
+ struct vtn_value *val, int member,
+ const struct vtn_decoration *dec, void *void_ctx)
+{
+ struct vtn_type *type = val->type;
+
+ if (dec->decoration == SpvDecorationArrayStride) {
+ vtn_fail_if(dec->literals[0] == 0, "ArrayStride must be non-zero");
+ type->stride = dec->literals[0];
+ }
+}
+
static void
struct_member_decoration_cb(struct vtn_builder *b,
struct vtn_value *val, int member,
assert(member < ctx->num_fields);
switch (dec->decoration) {
+ case SpvDecorationRelaxedPrecision:
+ case SpvDecorationUniform:
+ break; /* FIXME: Do nothing with this for now. */
case SpvDecorationNonWritable:
+ vtn_handle_access_qualifier(b, ctx->type, member, ACCESS_NON_WRITEABLE);
+ break;
case SpvDecorationNonReadable:
- case SpvDecorationRelaxedPrecision:
+ vtn_handle_access_qualifier(b, ctx->type, member, ACCESS_NON_READABLE);
+ break;
case SpvDecorationVolatile:
+ vtn_handle_access_qualifier(b, ctx->type, member, ACCESS_VOLATILE);
+ break;
case SpvDecorationCoherent:
- case SpvDecorationUniform:
- break; /* FIXME: Do nothing with this for now. */
+ vtn_handle_access_qualifier(b, ctx->type, member, ACCESS_COHERENT);
+ break;
case SpvDecorationNoPerspective:
ctx->fields[member].interpolation = INTERP_MODE_NOPERSPECTIVE;
break;
break;
case SpvDecorationOffset:
ctx->type->offsets[member] = dec->literals[0];
+ ctx->fields[member].offset = dec->literals[0];
break;
case SpvDecorationMatrixStride:
/* Handled as a second pass */
spirv_decoration_to_string(dec->decoration));
break;
+ case SpvDecorationHlslSemanticGOOGLE:
+ /* HLSL semantic decorations can safely be ignored by the driver. */
+ break;
+
default:
vtn_fail("Unhandled decoration");
}
}
+/** Chases the array type all the way down to the tail and rewrites the
+ * glsl_types to be based off the tail's glsl_type.
+ */
+static void
+vtn_array_type_rewrite_glsl_type(struct vtn_type *type)
+{
+ if (type->base_type != vtn_base_type_array)
+ return;
+
+ vtn_array_type_rewrite_glsl_type(type->array_element);
+
+ type->type = glsl_array_type(type->array_element->type,
+ type->length, type->stride);
+}
+
/* Matrix strides are handled as a separate pass because we need to know
* whether the matrix is row-major or not first.
*/
vtn_fail_if(member < 0,
"The MatrixStride decoration is only allowed on members "
"of OpTypeStruct");
+ vtn_fail_if(dec->literals[0] == 0, "MatrixStride must be non-zero");
struct member_decoration_ctx *ctx = void_ctx;
mat_type->array_element = vtn_type_copy(b, mat_type->array_element);
mat_type->stride = mat_type->array_element->stride;
mat_type->array_element->stride = dec->literals[0];
+
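+ /* Rebuild the glsl_type with the explicit stride and a row-major layout,
+ * and keep the column type in sync.
+ */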
+ mat_type->type = glsl_explicit_matrix_type(mat_type->type,
+ dec->literals[0], true);
+ mat_type->array_element->type = glsl_get_column_type(mat_type->type);
} else {
vtn_assert(mat_type->array_element->stride > 0);
mat_type->stride = dec->literals[0];
+
+ mat_type->type = glsl_explicit_matrix_type(mat_type->type,
+ dec->literals[0], false);
}
+
+ /* Now that we've replaced the glsl_type with a properly strided matrix
+ * type, rewrite the member type so that it's an array of the proper kind
+ * of glsl_type.
+ */
+ vtn_array_type_rewrite_glsl_type(ctx->type->members[member]);
+ ctx->fields[member].type = ctx->type->members[member]->type;
}
static void
switch (dec->decoration) {
case SpvDecorationArrayStride:
- vtn_assert(type->base_type == vtn_base_type_matrix ||
- type->base_type == vtn_base_type_array ||
+ vtn_assert(type->base_type == vtn_base_type_array ||
type->base_type == vtn_base_type_pointer);
- type->stride = dec->literals[0];
break;
case SpvDecorationBlock:
vtn_assert(type->base_type == vtn_base_type_struct);
case SpvDecorationNonWritable:
case SpvDecorationNonReadable:
case SpvDecorationUniform:
- case SpvDecorationStream:
case SpvDecorationLocation:
case SpvDecorationComponent:
case SpvDecorationOffset:
case SpvDecorationXfbBuffer:
case SpvDecorationXfbStride:
+ case SpvDecorationHlslSemanticGOOGLE:
vtn_warn("Decoration only allowed for struct members: %s",
spirv_decoration_to_string(dec->decoration));
break;
+ case SpvDecorationStream:
+ /* We don't need to do anything here: the stream is picked up when the
+ * decoration is applied to a variable.  Just check that, when it is not on
+ * a struct member, the decorated type is a struct.
+ */
+ vtn_assert(type->base_type == vtn_base_type_struct);
+ break;
+
case SpvDecorationRelaxedPrecision:
case SpvDecorationSpecId:
case SpvDecorationInvariant:
}
val->type->base_type = vtn_base_type_array;
- val->type->type = glsl_array_type(array_element->type, val->type->length);
val->type->array_element = array_element;
val->type->stride = 0;
+
+ vtn_foreach_decoration(b, val, array_stride_decoration_cb, NULL);
+ val->type->type = glsl_array_type(array_element->type, val->type->length,
+ val->type->stride);
break;
}
val->type->storage_class = storage_class;
val->type->deref = deref_type;
- if (storage_class == SpvStorageClassUniform ||
- storage_class == SpvStorageClassStorageBuffer) {
- /* These can actually be stored to nir_variables and used as SSA
- * values so they need a real glsl_type.
- */
- val->type->type = glsl_vector_type(GLSL_TYPE_UINT, 2);
- }
-
- if (storage_class == SpvStorageClassPushConstant) {
- /* These can actually be stored to nir_variables and used as SSA
- * values so they need a real glsl_type.
- */
- val->type->type = glsl_uint_type();
- }
+ vtn_foreach_decoration(b, val, array_stride_decoration_cb, NULL);
- if (storage_class == SpvStorageClassWorkgroup &&
- b->options->lower_workgroup_access_to_offsets) {
- uint32_t size, align;
- val->type->deref = vtn_type_layout_std430(b, val->type->deref,
- &size, &align);
- val->type->length = size;
- val->type->align = align;
- /* These can actually be stored to nir_variables and used as SSA
- * values so they need a real glsl_type.
+ /* These can actually be stored to nir_variables and used as SSA
+ * values so they need a real glsl_type.
+ */
+ switch (storage_class) {
+ case SpvStorageClassUniform:
+ val->type->type = b->options->ubo_ptr_type;
+ break;
+ case SpvStorageClassStorageBuffer:
+ val->type->type = b->options->ssbo_ptr_type;
+ break;
+ case SpvStorageClassPushConstant:
+ val->type->type = b->options->push_const_ptr_type;
+ break;
+ case SpvStorageClassWorkgroup:
+ val->type->type = b->options->shared_ptr_type;
+ if (b->options->lower_workgroup_access_to_offsets) {
+ uint32_t size, align;
+ val->type->deref = vtn_type_layout_std430(b, val->type->deref,
+ &size, &align);
+ val->type->length = size;
+ val->type->align = align;
+ }
+ break;
+ default:
+ /* In this case, no variable pointers are allowed, so all deref chains are
+ * complete back to the variable.  It doesn't matter what type gets used,
+ * so we leave it NULL.
*/
- val->type->type = glsl_uint_type();
+ break;
}
break;
}
}
vtn_foreach_decoration(b, val, type_decoration_cb, NULL);
+
+ if (val->type->base_type == vtn_base_type_struct &&
+ (val->type->block || val->type->buffer_block)) {
+ for (unsigned i = 0; i < val->type->length; i++) {
+ vtn_fail_if(vtn_type_contains_block(b, val->type->members[i]),
+ "Block and BufferBlock decorations cannot decorate a "
+ "structure type that is nested at any level inside "
+ "another structure type decorated with Block or "
+ "BufferBlock.");
+ }
+ }
}
static nir_constant *
opcode == SpvOpSpecConstantFalse)
int_val = get_specialization(b, val, int_val);
- val->constant->values[0].u32[0] = int_val ? NIR_TRUE : NIR_FALSE;
+ val->constant->values[0].b[0] = int_val != 0;
break;
}
case 8:
val->constant->values[0].u8[i] = elems[i]->values[0].u8[0];
break;
+ case 1:
+ val->constant->values[0].b[i] = elems[i]->values[0].b[0];
+ break;
default:
vtn_fail("Invalid SpvOpConstantComposite bit size");
}
case 8:
val->constant->values[0].u8[i] = (*c)->values[col].u8[elem + i];
break;
+ case 1:
+ val->constant->values[0].b[i] = (*c)->values[col].b[elem + i];
+ break;
default:
vtn_fail("Invalid SpvOpCompositeExtract bit size");
}
case 8:
(*c)->values[col].u8[elem + i] = insert->constant->values[0].u8[i];
break;
+ case 1:
+ (*c)->values[col].b[elem + i] = insert->constant->values[0].b[i];
+ break;
default:
vtn_fail("Invalid SpvOpCompositeInsert bit size");
}
nir_const_value src[4];
for (unsigned i = 0; i < count - 4; i++) {
- nir_constant *c =
- vtn_value(b, w[4 + i], vtn_value_type_constant)->constant;
+ struct vtn_value *src_val =
+ vtn_value(b, w[4 + i], vtn_value_type_constant);
+
+ /* If this is an unsized source, pull the bit size from the
+ * source; otherwise, we'll use the bit size from the destination.
+ */
+ if (!nir_alu_type_get_type_size(nir_op_infos[op].input_types[i]))
+ bit_size = glsl_get_bit_size(src_val->type->type);
unsigned j = swap ? 1 - i : i;
- src[j] = c->values[0];
+ src[j] = src_val->constant->values[0];
+ }
+
+ /* Fix up fixed-size sources: NIR shift instructions always take a 32-bit
+ * shift count, so copy the constant into the 32-bit channel when it was
+ * parsed at a different bit size.
+ */
+ switch (op) {
+ case nir_op_ishl:
+ case nir_op_ishr:
+ case nir_op_ushr: {
+ if (bit_size == 32)
+ break;
+ for (unsigned i = 0; i < num_components; ++i) {
+ switch (bit_size) {
+ case 64: src[1].u32[i] = src[1].u64[i]; break;
+ case 16: src[1].u32[i] = src[1].u16[i]; break;
+ case 8: src[1].u32[i] = src[1].u8[i]; break;
+ }
+ }
+ break;
+ }
+ default:
+ break;
}
val->constant->values[0] =
vtn_foreach_decoration(b, val, handle_workgroup_size_decoration_cb, NULL);
}
-static void
-vtn_handle_function_call(struct vtn_builder *b, SpvOp opcode,
- const uint32_t *w, unsigned count)
-{
- struct vtn_type *res_type = vtn_value(b, w[1], vtn_value_type_type)->type;
- struct vtn_function *vtn_callee =
- vtn_value(b, w[3], vtn_value_type_function)->func;
- struct nir_function *callee = vtn_callee->impl->function;
-
- vtn_callee->referenced = true;
-
- nir_call_instr *call = nir_call_instr_create(b->nb.shader, callee);
-
- unsigned param_idx = 0;
-
- nir_deref_instr *ret_deref = NULL;
- struct vtn_type *ret_type = vtn_callee->type->return_type;
- if (ret_type->base_type != vtn_base_type_void) {
- nir_variable *ret_tmp =
- nir_local_variable_create(b->nb.impl, ret_type->type, "return_tmp");
- ret_deref = nir_build_deref_var(&b->nb, ret_tmp);
- call->params[param_idx++] = nir_src_for_ssa(&ret_deref->dest.ssa);
- }
-
- for (unsigned i = 0; i < vtn_callee->type->length; i++) {
- struct vtn_type *arg_type = vtn_callee->type->params[i];
- unsigned arg_id = w[4 + i];
-
- if (arg_type->base_type == vtn_base_type_sampled_image) {
- struct vtn_sampled_image *sampled_image =
- vtn_value(b, arg_id, vtn_value_type_sampled_image)->sampled_image;
-
- call->params[param_idx++] =
- nir_src_for_ssa(&sampled_image->image->deref->dest.ssa);
- call->params[param_idx++] =
- nir_src_for_ssa(&sampled_image->sampler->deref->dest.ssa);
- } else if (arg_type->base_type == vtn_base_type_pointer ||
- arg_type->base_type == vtn_base_type_image ||
- arg_type->base_type == vtn_base_type_sampler) {
- struct vtn_pointer *pointer =
- vtn_value(b, arg_id, vtn_value_type_pointer)->pointer;
- call->params[param_idx++] =
- nir_src_for_ssa(vtn_pointer_to_ssa(b, pointer));
- } else {
- /* This is a regular SSA value and we need a temporary */
- nir_variable *tmp =
- nir_local_variable_create(b->nb.impl, arg_type->type, "arg_tmp");
- nir_deref_instr *tmp_deref = nir_build_deref_var(&b->nb, tmp);
- vtn_local_store(b, vtn_ssa_value(b, arg_id), tmp_deref);
- call->params[param_idx++] = nir_src_for_ssa(&tmp_deref->dest.ssa);
- }
- }
- assert(param_idx == call->num_params);
-
- nir_builder_instr_insert(&b->nb, &call->instr);
-
- if (ret_type->base_type == vtn_base_type_void) {
- vtn_push_value(b, w[2], vtn_value_type_undef);
- } else {
- vtn_push_ssa(b, w[2], res_type, vtn_local_load(b, ret_deref));
- }
-}
-
struct vtn_ssa_value *
vtn_create_ssa_value(struct vtn_builder *b, const struct glsl_type *type)
{
texop = nir_texop_txf_ms;
(*p++) = vtn_tex_src(b, w[idx++], nir_tex_src_ms_index);
}
+
+ if (operands & SpvImageOperandsMinLodMask) {
+ vtn_assert(texop == nir_texop_tex ||
+ texop == nir_texop_txb ||
+ texop == nir_texop_txd);
+ (*p++) = vtn_tex_src(b, w[idx++], nir_tex_src_min_lod);
+ }
}
/* We should have now consumed exactly all of the arguments */
vtn_assert(idx == count);
return nir_swizzle(&b->nb, coord->def, swizzle, 4, false);
}
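+/* Pads a value out to four components by repeating component 0 into the
+ * unused channels; values that are already vec4 are returned unchanged.
+ */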
+static nir_ssa_def *
+expand_to_vec4(nir_builder *b, nir_ssa_def *value)
+{
+ if (value->num_components == 4)
+ return value;
+
+ unsigned swiz[4];
+ for (unsigned i = 0; i < 4; i++)
+ swiz[i] = i < value->num_components ? i : 0;
+ return nir_swizzle(b, value, swiz, 4, false);
+}
+
static void
vtn_handle_image(struct vtn_builder *b, SpvOp opcode,
const uint32_t *w, unsigned count)
/* The image coordinate is always 4 components but we may not have that
* many. Swizzle to compensate.
*/
- unsigned swiz[4];
- for (unsigned i = 0; i < 4; i++)
- swiz[i] = i < image.coord->num_components ? i : 0;
- intrin->src[1] = nir_src_for_ssa(nir_swizzle(&b->nb, image.coord,
- swiz, 4, false));
+ intrin->src[1] = nir_src_for_ssa(expand_to_vec4(&b->nb, image.coord));
intrin->src[2] = nir_src_for_ssa(image.sample);
}
case SpvOpImageRead:
break;
case SpvOpAtomicStore:
- intrin->src[3] = nir_src_for_ssa(vtn_ssa_value(b, w[4])->def);
- break;
- case SpvOpImageWrite:
- intrin->src[3] = nir_src_for_ssa(vtn_ssa_value(b, w[3])->def);
+ case SpvOpImageWrite: {
+ const uint32_t value_id = opcode == SpvOpAtomicStore ? w[4] : w[3];
+ nir_ssa_def *value = vtn_ssa_value(b, value_id)->def;
+ /* nir_intrinsic_image_deref_store always takes a vec4 value */
+ assert(op == nir_intrinsic_image_deref_store);
+ intrin->num_components = 4;
+ intrin->src[3] = nir_src_for_ssa(expand_to_vec4(&b->nb, value));
break;
+ }
case SpvOpAtomicCompareExchange:
case SpvOpAtomicIIncrement:
vtn_fail("Invalid image opcode");
}
- if (opcode != SpvOpImageWrite) {
+ if (opcode != SpvOpImageWrite && opcode != SpvOpAtomicStore) {
struct vtn_value *val = vtn_push_value(b, w[2], vtn_value_type_ssa);
struct vtn_type *type = vtn_value(b, w[1], vtn_value_type_type)->type;
- unsigned dest_components = nir_intrinsic_dest_components(intrin);
- if (intrin->intrinsic == nir_intrinsic_image_deref_size) {
- dest_components = intrin->num_components =
- glsl_get_vector_elements(type->type);
- }
+ unsigned dest_components = glsl_get_vector_elements(type->type);
+ intrin->num_components = nir_intrinsic_infos[op].dest_components;
+ if (intrin->num_components == 0)
+ intrin->num_components = dest_components;
nir_ssa_dest_init(&intrin->instr, &intrin->dest,
- dest_components, 32, NULL);
+ intrin->num_components, 32, NULL);
nir_builder_instr_insert(&b->nb, &intrin->instr);
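+      /* If the intrinsic has a fixed destination size that differs from the
+       * SPIR-V result type, keep only the channels the result type needs.
+       */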
+ nir_ssa_def *result = &intrin->dest.ssa;
+ if (intrin->num_components != dest_components)
+ result = nir_channels(&b->nb, result, (1 << dest_components) - 1);
+
val->ssa = vtn_create_ssa_value(b, type->type);
- val->ssa->def = &intrin->dest.ssa;
+ val->ssa->def = result;
} else {
nir_builder_instr_insert(&b->nb, &intrin->instr);
}
unreachable("Invalid SPIR-V atomic");
}
- } else if (ptr->mode == vtn_variable_mode_workgroup &&
- !b->options->lower_workgroup_access_to_offsets) {
- nir_deref_instr *deref = vtn_pointer_to_deref(b, ptr);
- const struct glsl_type *deref_type = deref->type;
- nir_intrinsic_op op = get_deref_nir_atomic_op(b, opcode);
+ } else if (vtn_pointer_uses_ssa_offset(b, ptr)) {
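+ /* SSBO atomics and workgroup atomics lowered to offsets take an explicit
+ * byte offset (plus a block index for SSBOs) instead of a deref.
+ */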
+ nir_ssa_def *offset, *index;
+ offset = vtn_pointer_to_offset(b, ptr, &index);
+
+ nir_intrinsic_op op;
+ if (ptr->mode == vtn_variable_mode_ssbo) {
+ op = get_ssbo_nir_atomic_op(b, opcode);
+ } else {
+ vtn_assert(ptr->mode == vtn_variable_mode_workgroup &&
+ b->options->lower_workgroup_access_to_offsets);
+ op = get_shared_nir_atomic_op(b, opcode);
+ }
+
atomic = nir_intrinsic_instr_create(b->nb.shader, op);
- atomic->src[0] = nir_src_for_ssa(&deref->dest.ssa);
+ int src = 0;
switch (opcode) {
case SpvOpAtomicLoad:
- atomic->num_components = glsl_get_vector_elements(deref_type);
+ atomic->num_components = glsl_get_vector_elements(ptr->type->type);
+ nir_intrinsic_set_align(atomic, 4, 0);
+ if (ptr->mode == vtn_variable_mode_ssbo)
+ atomic->src[src++] = nir_src_for_ssa(index);
+ atomic->src[src++] = nir_src_for_ssa(offset);
break;
case SpvOpAtomicStore:
- atomic->num_components = glsl_get_vector_elements(deref_type);
+ atomic->num_components = glsl_get_vector_elements(ptr->type->type);
nir_intrinsic_set_write_mask(atomic, (1 << atomic->num_components) - 1);
- atomic->src[1] = nir_src_for_ssa(vtn_ssa_value(b, w[4])->def);
+ nir_intrinsic_set_align(atomic, 4, 0);
+ atomic->src[src++] = nir_src_for_ssa(vtn_ssa_value(b, w[4])->def);
+ if (ptr->mode == vtn_variable_mode_ssbo)
+ atomic->src[src++] = nir_src_for_ssa(index);
+ atomic->src[src++] = nir_src_for_ssa(offset);
break;
case SpvOpAtomicExchange:
case SpvOpAtomicAnd:
case SpvOpAtomicOr:
case SpvOpAtomicXor:
- fill_common_atomic_sources(b, opcode, w, &atomic->src[1]);
+ if (ptr->mode == vtn_variable_mode_ssbo)
+ atomic->src[src++] = nir_src_for_ssa(index);
+ atomic->src[src++] = nir_src_for_ssa(offset);
+ fill_common_atomic_sources(b, opcode, w, &atomic->src[src]);
break;
default:
vtn_fail("Invalid SPIR-V atomic");
-
}
} else {
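+ /* Everything else goes through a deref and the corresponding deref atomic
+ * intrinsic.
+ */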
- nir_ssa_def *offset, *index;
- offset = vtn_pointer_to_offset(b, ptr, &index);
-
- nir_intrinsic_op op;
- if (ptr->mode == vtn_variable_mode_ssbo) {
- op = get_ssbo_nir_atomic_op(b, opcode);
- } else {
- vtn_assert(ptr->mode == vtn_variable_mode_workgroup &&
- b->options->lower_workgroup_access_to_offsets);
- op = get_shared_nir_atomic_op(b, opcode);
- }
-
+ nir_deref_instr *deref = vtn_pointer_to_deref(b, ptr);
+ const struct glsl_type *deref_type = deref->type;
+ nir_intrinsic_op op = get_deref_nir_atomic_op(b, opcode);
atomic = nir_intrinsic_instr_create(b->nb.shader, op);
+ atomic->src[0] = nir_src_for_ssa(&deref->dest.ssa);
- int src = 0;
switch (opcode) {
case SpvOpAtomicLoad:
- atomic->num_components = glsl_get_vector_elements(ptr->type->type);
- if (ptr->mode == vtn_variable_mode_ssbo)
- atomic->src[src++] = nir_src_for_ssa(index);
- atomic->src[src++] = nir_src_for_ssa(offset);
+ atomic->num_components = glsl_get_vector_elements(deref_type);
break;
case SpvOpAtomicStore:
- atomic->num_components = glsl_get_vector_elements(ptr->type->type);
+ atomic->num_components = glsl_get_vector_elements(deref_type);
nir_intrinsic_set_write_mask(atomic, (1 << atomic->num_components) - 1);
- atomic->src[src++] = nir_src_for_ssa(vtn_ssa_value(b, w[4])->def);
- if (ptr->mode == vtn_variable_mode_ssbo)
- atomic->src[src++] = nir_src_for_ssa(index);
- atomic->src[src++] = nir_src_for_ssa(offset);
+ atomic->src[1] = nir_src_for_ssa(vtn_ssa_value(b, w[4])->def);
break;
case SpvOpAtomicExchange:
case SpvOpAtomicAnd:
case SpvOpAtomicOr:
case SpvOpAtomicXor:
- if (ptr->mode == vtn_variable_mode_ssbo)
- atomic->src[src++] = nir_src_for_ssa(index);
- atomic->src[src++] = nir_src_for_ssa(offset);
- fill_common_atomic_sources(b, opcode, w, &atomic->src[src]);
+ fill_common_atomic_sources(b, opcode, w, &atomic->src[1]);
break;
default:
nir_ssa_def *
vtn_vector_extract(struct vtn_builder *b, nir_ssa_def *src, unsigned index)
{
- unsigned swiz[4] = { index };
- return nir_swizzle(&b->nb, src, swiz, 1, false);
+ return nir_channel(&b->nb, src, index);
}
nir_ssa_def *
return &vec->dest.dest.ssa;
}
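+/* Builds an integer equality comparison against an immediate constant of
+ * matching bit size.
+ */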
+static nir_ssa_def *
+nir_ieq_imm(nir_builder *b, nir_ssa_def *x, uint64_t i)
+{
+ return nir_ieq(b, x, nir_imm_intN_t(b, i, x->bit_size));
+}
+
nir_ssa_def *
vtn_vector_extract_dynamic(struct vtn_builder *b, nir_ssa_def *src,
nir_ssa_def *index)
{
nir_ssa_def *dest = vtn_vector_extract(b, src, 0);
for (unsigned i = 1; i < src->num_components; i++)
- dest = nir_bcsel(&b->nb, nir_ieq(&b->nb, index, nir_imm_int(&b->nb, i)),
+ dest = nir_bcsel(&b->nb, nir_ieq_imm(&b->nb, index, i),
vtn_vector_extract(b, src, i), dest);
return dest;
{
nir_ssa_def *dest = vtn_vector_insert(b, src, insert, 0);
for (unsigned i = 1; i < src->num_components; i++)
- dest = nir_bcsel(&b->nb, nir_ieq(&b->nb, index, nir_imm_int(&b->nb, i)),
+ dest = nir_bcsel(&b->nb, nir_ieq_imm(&b->nb, index, i),
vtn_vector_insert(b, src, insert, i), dest);
return dest;
unsigned elems = count - 3;
assume(elems >= 1);
if (glsl_type_is_vector_or_scalar(type)) {
- nir_ssa_def *srcs[4];
+ nir_ssa_def *srcs[NIR_MAX_VEC_COMPONENTS];
for (unsigned i = 0; i < elems; i++)
srcs[i] = vtn_ssa_value(b, w[3 + i])->def;
val->ssa->def =
switch (opcode) {
case SpvOpEmitStreamVertex:
- case SpvOpEndStreamPrimitive:
- nir_intrinsic_set_stream_id(intrin, w[1]);
+ case SpvOpEndStreamPrimitive: {
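+ /* The Stream operand is the <id> of a scalar integer constant rather than
+ * a literal, so look up its value.
+ */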
+ unsigned stream = vtn_constant_value(b, w[1])->values[0].u32[0];
+ nir_intrinsic_set_stream_id(intrin, stream);
break;
+ }
+
default:
break;
}
return MESA_SHADER_FRAGMENT;
case SpvExecutionModelGLCompute:
return MESA_SHADER_COMPUTE;
+ case SpvExecutionModelKernel:
+ return MESA_SHADER_KERNEL;
default:
vtn_fail("Unsupported execution model");
}
case SpvCapabilityStorageImageExtendedFormats:
break;
- case SpvCapabilityGeometryStreams:
case SpvCapabilityLinkage:
case SpvCapabilityVector16:
case SpvCapabilityFloat16Buffer:
case SpvCapabilityFloat16:
- case SpvCapabilityInt64Atomics:
- case SpvCapabilityStorageImageMultisample:
case SpvCapabilityInt8:
case SpvCapabilitySparseResidency:
- case SpvCapabilityMinLod:
- case SpvCapabilityTransformFeedback:
vtn_warn("Unsupported SPIR-V capability: %s",
spirv_capability_to_string(cap));
break;
+ case SpvCapabilityMinLod:
+ spv_check_supported(min_lod, cap);
+ break;
+
case SpvCapabilityAtomicStorage:
spv_check_supported(atomic_storage, cap);
break;
spv_check_supported(int16, cap);
break;
+ case SpvCapabilityTransformFeedback:
+ spv_check_supported(transform_feedback, cap);
+ break;
+
+ case SpvCapabilityGeometryStreams:
+ spv_check_supported(geometry_streams, cap);
+ break;
+
+ case SpvCapabilityInt64Atomics:
+ spv_check_supported(int64_atomics, cap);
+ break;
+
+ case SpvCapabilityStorageImageMultisample:
+ spv_check_supported(storage_image_ms, cap);
+ break;
+
case SpvCapabilityAddresses:
case SpvCapabilityKernel:
case SpvCapabilityImageBasic:
case SpvCapabilityVariablePointersStorageBuffer:
case SpvCapabilityVariablePointers:
spv_check_supported(variable_pointers, cap);
+ b->variable_pointers = true;
break;
case SpvCapabilityStorageUniformBufferBlock16:
spv_check_supported(stencil_export, cap);
break;
+ case SpvCapabilitySampleMaskPostDepthCoverage:
+ spv_check_supported(post_depth_coverage, cap);
+ break;
+
default:
vtn_fail("Unhandled capability");
}
case SpvOpMemberDecorate:
case SpvOpGroupDecorate:
case SpvOpGroupMemberDecorate:
+ case SpvOpDecorateStringGOOGLE:
+ case SpvOpMemberDecorateStringGOOGLE:
vtn_handle_decoration(b, opcode, w, count);
break;
b->shader->info.fs.early_fragment_tests = true;
break;
+ case SpvExecutionModePostDepthCoverage:
+ vtn_assert(b->shader->info.stage == MESA_SHADER_FRAGMENT);
+ b->shader->info.fs.post_depth_coverage = true;
+ break;
+
case SpvExecutionModeInvocations:
vtn_assert(b->shader->info.stage == MESA_SHADER_GEOMETRY);
b->shader->info.gs.invocations = MAX2(1, mode->literals[0]);
break;
case SpvExecutionModeLocalSize:
- vtn_assert(b->shader->info.stage == MESA_SHADER_COMPUTE);
+ vtn_assert(gl_shader_stage_is_compute(b->shader->info.stage));
b->shader->info.cs.local_size[0] = mode->literals[0];
b->shader->info.cs.local_size[1] = mode->literals[1];
b->shader->info.cs.local_size[2] = mode->literals[2];
vtn_assert(b->shader->info.stage == MESA_SHADER_GEOMETRY);
b->shader->info.gs.vertices_in =
vertices_in_from_spv_execution_mode(b, mode->exec_mode);
+ b->shader->info.gs.input_primitive =
+ gl_primitive_from_spv_execution_mode(b, mode->exec_mode);
}
break;
break;
case SpvExecutionModeXfb:
- vtn_fail("Unhandled execution mode");
+ b->shader->info.has_transform_feedback_varyings = true;
break;
case SpvExecutionModeVecTypeHint:
case SpvOpMemberDecorate:
case SpvOpGroupDecorate:
case SpvOpGroupMemberDecorate:
+ case SpvOpDecorateStringGOOGLE:
+ case SpvOpMemberDecorateStringGOOGLE:
vtn_fail("Invalid opcode types and variables section");
break;
goto fail;
}
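+ /* words[2] is the generator magic number: the registered tool ID in the
+ * high 16 bits and a tool-specific version in the low 16 bits.
+ */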
+ uint16_t generator_id = words[2] >> 16;
+ uint16_t generator_version = words[2];
+
+ /* The first GLSLang version bump actually came 1.5 years after #179 was
+ * fixed, but this should at least let us shut the workaround off for
+ * modern versions of GLSLang.
+ */
+ b->wa_glslang_179 = (generator_id == 8 && generator_version == 1);
+
/* words[2] == generator magic */
unsigned value_id_bound = words[3];
if (words[4] != 0) {
progress = false;
foreach_list_typed(struct vtn_function, func, node, &b->functions) {
if (func->referenced && !func->emitted) {
- b->const_table = _mesa_hash_table_create(b, _mesa_hash_pointer,
- _mesa_key_pointer_equal);
+ b->const_table = _mesa_pointer_hash_table_create(b);
vtn_function_emit(b, func, vtn_handle_body_instruction);
progress = true;
ralloc_free(b);
+ entry_point->is_entrypoint = true;
return entry_point;
}