glsl: free uniform_map on failure path.

[mesa.git] / src / glsl / linker.cpp
diff --git a/src/glsl/linker.cpp b/src/glsl/linker.cpp

index a1bae297eaaec9bb69ba0fb939b189f400764b6e..57be4931d780291a4dbb48f9b6a649410c2e72dc 100644 (file)
--- a/src/glsl/linker.cpp
+++ b/src/glsl/linker.cpp
@@ -74,6 +74,7 @@
  #include "link_varyings.h"
  #include "ir_optimization.h"
  #include "ir_rvalue_visitor.h"
+#include "ir_uniform.h"
  
  extern "C" {
  #include "main/shaderobj.h"
@@ -249,31 +250,100 @@ public:
     }
  };
  
-
  /**
- * Visitor that determines whether or not a shader uses ir_end_primitive.
+ * Visitor that determines the highest stream id to which a (geometry) shader
+ * emits vertices. It also checks whether End{Stream}Primitive is ever called.
   */
-class find_end_primitive_visitor : public ir_hierarchical_visitor {
+class find_emit_vertex_visitor : public ir_hierarchical_visitor {
  public:
-   find_end_primitive_visitor()
-      : found(false)
+   find_emit_vertex_visitor(int max_allowed)
+      : max_stream_allowed(max_allowed),
+        invalid_stream_id(0),
+        invalid_stream_id_from_emit_vertex(false),
+        end_primitive_found(false),
+        uses_non_zero_stream(false)
     {
        /* empty */
     }
  
-   virtual ir_visitor_status visit(ir_end_primitive *)
+   virtual ir_visitor_status visit_leave(ir_emit_vertex *ir)
     {
-      found = true;
-      return visit_stop;
+      int stream_id = ir->stream_id();
+
+      if (stream_id < 0) {
+         invalid_stream_id = stream_id;
+         invalid_stream_id_from_emit_vertex = true;
+         return visit_stop;
+      }
+
+      if (stream_id > max_stream_allowed) {
+         invalid_stream_id = stream_id;
+         invalid_stream_id_from_emit_vertex = true;
+         return visit_stop;
+      }
+
+      if (stream_id != 0)
+         uses_non_zero_stream = true;
+
+      return visit_continue;
     }
  
-   bool end_primitive_found()
+   virtual ir_visitor_status visit_leave(ir_end_primitive *ir)
     {
-      return found;
+      end_primitive_found = true;
+
+      int stream_id = ir->stream_id();
+
+      if (stream_id < 0) {
+         invalid_stream_id = stream_id;
+         invalid_stream_id_from_emit_vertex = false;
+         return visit_stop;
+      }
+
+      if (stream_id > max_stream_allowed) {
+         invalid_stream_id = stream_id;
+         invalid_stream_id_from_emit_vertex = false;
+         return visit_stop;
+      }
+
+      if (stream_id != 0)
+         uses_non_zero_stream = true;
+
+      return visit_continue;
+   }
+
+   bool error()
+   {
+      return invalid_stream_id != 0;
+   }
+
+   const char *error_func()
+   {
+      return invalid_stream_id_from_emit_vertex ?
+         "EmitStreamVertex" : "EndStreamPrimitive";
+   }
+
+   int error_stream()
+   {
+      return invalid_stream_id;
+   }
+
+   bool uses_streams()
+   {
+      return uses_non_zero_stream;
+   }
+
+   bool uses_end_primitive()
+   {
+      return end_primitive_found;
     }
  
  private:
-   bool found;
+   int max_stream_allowed;
+   int invalid_stream_id;
+   bool invalid_stream_id_from_emit_vertex;
+   bool end_primitive_found;
+   bool uses_non_zero_stream;
  };
  
  } /* anonymous namespace */
@@ -367,8 +437,8 @@ parse_program_resource_name(const GLchar *name,
  void
  link_invalidate_variable_locations(exec_list *ir)
  {
-   foreach_list(node, ir) {
-      ir_variable *const var = ((ir_instruction *) node)->as_variable();
+   foreach_in_list(ir_instruction, node, ir) {
+      ir_variable *const var = node->as_variable();
  
        if (var == NULL)
           continue;
@@ -550,10 +620,58 @@ validate_geometry_shader_executable(struct gl_shader_program *prog,
  
     analyze_clip_usage(prog, shader, &prog->Geom.UsesClipDistance,
                        &prog->Geom.ClipDistanceArraySize);
+}
  
-   find_end_primitive_visitor end_primitive;
-   end_primitive.run(shader->ir);
-   prog->Geom.UsesEndPrimitive = end_primitive.end_primitive_found();
+/**
+ * Check if geometry shaders emit to non-zero streams and do corresponding
+ * validations.
+ */
+static void
+validate_geometry_shader_emissions(struct gl_context *ctx,
+                                   struct gl_shader_program *prog)
+{
+   if (prog->_LinkedShaders[MESA_SHADER_GEOMETRY] != NULL) {
+      find_emit_vertex_visitor emit_vertex(ctx->Const.MaxVertexStreams - 1);
+      emit_vertex.run(prog->_LinkedShaders[MESA_SHADER_GEOMETRY]->ir);
+      if (emit_vertex.error()) {
+         linker_error(prog, "Invalid call %s(%d). Accepted values for the "
+                      "stream parameter are in the range [0, %d].",
+                      emit_vertex.error_func(),
+                      emit_vertex.error_stream(),
+                      ctx->Const.MaxVertexStreams - 1);
+      }
+      prog->Geom.UsesStreams = emit_vertex.uses_streams();
+      prog->Geom.UsesEndPrimitive = emit_vertex.uses_end_primitive();
+
+      /* From the ARB_gpu_shader5 spec:
+       *
+       *   "Multiple vertex streams are supported only if the output primitive
+       *    type is declared to be "points".  A program will fail to link if it
+       *    contains a geometry shader calling EmitStreamVertex() or
+       *    EndStreamPrimitive() if its output primitive type is not "points".
+       *
+       * However, in the same spec:
+       *
+       *   "The function EmitVertex() is equivalent to calling EmitStreamVertex()
+       *    with <stream> set to zero."
+       *
+       * And:
+       *
+       *   "The function EndPrimitive() is equivalent to calling
+       *    EndStreamPrimitive() with <stream> set to zero."
+       *
+       * Since we can call EmitVertex() and EndPrimitive() when we output
+       * primitives other than points, calling EmitStreamVertex(0) or
+       * EmitEndPrimitive(0) should not produce errors. This it also what Nvidia
+       * does. Currently we only set prog->Geom.UsesStreams to TRUE when
+       * EmitStreamVertex() or EmitEndPrimitive() are called with a non-zero
+       * stream.
+       */
+      if (prog->Geom.UsesStreams && prog->Geom.OutputType != GL_POINTS) {
+         linker_error(prog, "EmitStreamVertex(n) and EndStreamPrimitive(n) "
+                      "with n>0 requires point output");
+      }
+   }
  }
  
  
@@ -574,8 +692,8 @@ cross_validate_globals(struct gl_shader_program *prog,
        if (shader_list[i] == NULL)
          continue;
  
-      foreach_list(node, shader_list[i]->ir) {
-        ir_variable *const var = ((ir_instruction *) node)->as_variable();
+      foreach_in_list(ir_instruction, node, shader_list[i]->ir) {
+        ir_variable *const var = node->as_variable();
  
          if (var == NULL)
             continue;
@@ -844,8 +962,7 @@ populate_symbol_table(gl_shader *sh)
  {
     sh->symbols = new(sh) glsl_symbol_table;
  
-   foreach_list(node, sh->ir) {
-      ir_instruction *const inst = (ir_instruction *) node;
+   foreach_in_list(ir_instruction, inst, sh->ir) {
        ir_variable *var;
        ir_function *func;
  
@@ -961,9 +1078,7 @@ move_non_declarations(exec_list *instructions, exec_node *last,
        temps = hash_table_ctor(0, hash_table_pointer_hash,
                               hash_table_pointer_compare);
  
-   foreach_list_safe(node, instructions) {
-      ir_instruction *inst = (ir_instruction *) node;
-
+   foreach_in_list_safe(ir_instruction, inst, instructions) {
        if (inst->as_function())
          continue;
  
@@ -1014,7 +1129,8 @@ get_main_function_signature(gl_shader *sh)
         * We don't have to check for multiple definitions of main (in multiple
         * shaders) because that would have already been caught above.
         */
-      ir_function_signature *sig = f->matching_signature(NULL, &void_parameters);
+      ir_function_signature *sig =
+         f->matching_signature(NULL, &void_parameters, false);
        if ((sig != NULL) && sig->is_defined) {
          return sig;
        }
@@ -1478,13 +1594,15 @@ link_intrastage_shaders(void *mem_ctx,
     const unsigned num_uniform_blocks =
        link_uniform_blocks(mem_ctx, prog, shader_list, num_shaders,
                            &uniform_blocks);
+   if (!prog->LinkStatus)
+      return NULL;
  
     /* Check that there is only a single definition of each function signature
      * across all shaders.
      */
     for (unsigned i = 0; i < (num_shaders - 1); i++) {
-      foreach_list(node, shader_list[i]->ir) {
-        ir_function *const f = ((ir_instruction *) node)->as_function();
+      foreach_in_list(ir_instruction, node, shader_list[i]->ir) {
+        ir_function *const f = node->as_function();
  
          if (f == NULL)
             continue;
@@ -1499,9 +1617,7 @@ link_intrastage_shaders(void *mem_ctx,
             if (other == NULL)
                continue;
  
-           foreach_list(n, &f->signatures) {
-              ir_function_signature *sig = (ir_function_signature *) n;
-
+           foreach_in_list(ir_function_signature, sig, &f->signatures) {
                if (!sig->is_defined || sig->is_builtin())
                   continue;
  
@@ -1615,8 +1731,7 @@ link_intrastage_shaders(void *mem_ctx,
     if (linked->Stage == MESA_SHADER_GEOMETRY) {
        unsigned num_vertices = vertices_per_prim(prog->Geom.InputType);
        geom_array_resize_visitor input_resize_visitor(num_vertices, prog);
-      foreach_list(n, linked->ir) {
-         ir_instruction *ir = (ir_instruction *) n;
+      foreach_in_list(ir_instruction, ir, linked->ir) {
           ir->accept(&input_resize_visitor);
        }
     }
@@ -1654,8 +1769,8 @@ update_array_sizes(struct gl_shader_program *prog)
          if (prog->_LinkedShaders[i] == NULL)
             continue;
  
-      foreach_list(node, prog->_LinkedShaders[i]->ir) {
-        ir_variable *const var = ((ir_instruction *) node)->as_variable();
+      foreach_in_list(ir_instruction, node, prog->_LinkedShaders[i]->ir) {
+        ir_variable *const var = node->as_variable();
  
          if ((var == NULL) || (var->data.mode != ir_var_uniform) ||
              !var->type->is_array())
@@ -1677,8 +1792,8 @@ update_array_sizes(struct gl_shader_program *prog)
                if (prog->_LinkedShaders[j] == NULL)
                   continue;
  
-           foreach_list(node2, prog->_LinkedShaders[j]->ir) {
-              ir_variable *other_var = ((ir_instruction *) node2)->as_variable();
+           foreach_in_list(ir_instruction, node2, prog->_LinkedShaders[j]->ir) {
+              ir_variable *other_var = node2->as_variable();
                if (!other_var)
                   continue;
  
@@ -1820,8 +1935,8 @@ assign_attribute_or_color_locations(gl_shader_program *prog,
  
     unsigned num_attr = 0;
  
-   foreach_list(node, sh->ir) {
-      ir_variable *const var = ((ir_instruction *) node)->as_variable();
+   foreach_in_list(ir_instruction, node, sh->ir) {
+      ir_variable *const var = node->as_variable();
  
        if ((var == NULL) || (var->data.mode != (unsigned) direction))
          continue;
@@ -2039,8 +2154,8 @@ assign_attribute_or_color_locations(gl_shader_program *prog,
  void
  demote_shader_inputs_and_outputs(gl_shader *sh, enum ir_variable_mode mode)
  {
-   foreach_list(node, sh->ir) {
-      ir_variable *const var = ((ir_instruction *) node)->as_variable();
+   foreach_in_list(ir_instruction, node, sh->ir) {
+      ir_variable *const var = node->as_variable();
  
        if ((var == NULL) || (var->data.mode != int(mode)))
          continue;
@@ -2075,8 +2190,8 @@ store_fragdepth_layout(struct gl_shader_program *prog)
      * We're only interested in the cases where the variable is NOT removed
      * from the IR.
      */
-   foreach_list(node, ir) {
-      ir_variable *const var = ((ir_instruction *) node)->as_variable();
+   foreach_in_list(ir_instruction, node, ir) {
+      ir_variable *const var = node->as_variable();
  
        if (var == NULL || var->data.mode != ir_var_shader_out) {
           continue;
@@ -2207,8 +2322,8 @@ check_image_resources(struct gl_context *ctx, struct gl_shader_program *prog)
           total_image_units += sh->NumImages;
  
           if (i == MESA_SHADER_FRAGMENT) {
-            foreach_list(node, sh->ir) {
-               ir_variable *var = ((ir_instruction *)node)->as_variable();
+            foreach_in_list(ir_instruction, node, sh->ir) {
+               ir_variable *var = node->as_variable();
                 if (var && var->data.mode == ir_var_shader_out)
                    fragment_outputs += var->type->count_attribute_slots();
              }
@@ -2224,6 +2339,117 @@ check_image_resources(struct gl_context *ctx, struct gl_shader_program *prog)
        linker_error(prog, "Too many combined image uniforms and fragment outputs");
  }
  
+
+/**
+ * Initializes explicit location slots to INACTIVE_UNIFORM_EXPLICIT_LOCATION
+ * for a variable, checks for overlaps between other uniforms using explicit
+ * locations.
+ */
+static bool
+reserve_explicit_locations(struct gl_shader_program *prog,
+                           string_to_uint_map *map, ir_variable *var)
+{
+   unsigned slots = var->type->uniform_locations();
+   unsigned max_loc = var->data.location + slots - 1;
+
+   /* Resize remap table if locations do not fit in the current one. */
+   if (max_loc + 1 > prog->NumUniformRemapTable) {
+      prog->UniformRemapTable =
+         reralloc(prog, prog->UniformRemapTable,
+                  gl_uniform_storage *,
+                  max_loc + 1);
+
+      if (!prog->UniformRemapTable) {
+         linker_error(prog, "Out of memory during linking.");
+         return false;
+      }
+
+      /* Initialize allocated space. */
+      for (unsigned i = prog->NumUniformRemapTable; i < max_loc + 1; i++)
+         prog->UniformRemapTable[i] = NULL;
+
+      prog->NumUniformRemapTable = max_loc + 1;
+   }
+
+   for (unsigned i = 0; i < slots; i++) {
+      unsigned loc = var->data.location + i;
+
+      /* Check if location is already used. */
+      if (prog->UniformRemapTable[loc] == INACTIVE_UNIFORM_EXPLICIT_LOCATION) {
+
+         /* Possibly same uniform from a different stage, this is ok. */
+         unsigned hash_loc;
+         if (map->get(hash_loc, var->name) && hash_loc == loc - i)
+               continue;
+
+         /* ARB_explicit_uniform_location specification states:
+          *
+          *     "No two default-block uniform variables in the program can have
+          *     the same location, even if they are unused, otherwise a compiler
+          *     or linker error will be generated."
+          */
+         linker_error(prog,
+                      "location qualifier for uniform %s overlaps"
+                      "previously used location",
+                      var->name);
+         return false;
+      }
+
+      /* Initialize location as inactive before optimization
+       * rounds and location assignment.
+       */
+      prog->UniformRemapTable[loc] = INACTIVE_UNIFORM_EXPLICIT_LOCATION;
+   }
+
+   /* Note, base location used for arrays. */
+   map->put(var->data.location, var->name);
+
+   return true;
+}
+
+/**
+ * Check and reserve all explicit uniform locations, called before
+ * any optimizations happen to handle also inactive uniforms and
+ * inactive array elements that may get trimmed away.
+ */
+static void
+check_explicit_uniform_locations(struct gl_context *ctx,
+                                 struct gl_shader_program *prog)
+{
+   if (!ctx->Extensions.ARB_explicit_uniform_location)
+      return;
+
+   /* This map is used to detect if overlapping explicit locations
+    * occur with the same uniform (from different stage) or a different one.
+    */
+   string_to_uint_map *uniform_map = new string_to_uint_map;
+
+   if (!uniform_map) {
+      linker_error(prog, "Out of memory during linking.");
+      return;
+   }
+
+   for (unsigned i = 0; i < MESA_SHADER_STAGES; i++) {
+      struct gl_shader *sh = prog->_LinkedShaders[i];
+
+      if (!sh)
+         continue;
+
+      foreach_in_list(ir_instruction, node, sh->ir) {
+         ir_variable *var = node->as_variable();
+         if ((var && var->data.mode == ir_var_uniform) &&
+             var->data.explicit_location) {
+            if (!reserve_explicit_locations(prog, uniform_map, var)) {
+               delete uniform_map;
+               return;
+            }
+         }
+      }
+   }
+
+   delete uniform_map;
+}
+
  void
  link_shaders(struct gl_context *ctx, struct gl_shader_program *prog)
  {
@@ -2300,7 +2526,8 @@ link_shaders(struct gl_context *ctx, struct gl_shader_program *prog)
     /* Geometry shaders have to be linked with vertex shaders.
      */
     if (num_shaders[MESA_SHADER_GEOMETRY] > 0 &&
-       num_shaders[MESA_SHADER_VERTEX] == 0) {
+       num_shaders[MESA_SHADER_VERTEX] == 0 &&
+       !prog->SeparateShader) {
        linker_error(prog, "Geometry shader must be linked with "
                    "vertex shader\n");
        goto done;
@@ -2371,6 +2598,10 @@ link_shaders(struct gl_context *ctx, struct gl_shader_program *prog)
           break;
     }
  
+   check_explicit_uniform_locations(ctx, prog);
+   if (!prog->LinkStatus)
+      goto done;
+
     /* Validate the inputs of each stage with the output of the preceding
      * stage.
      */
@@ -2431,16 +2662,19 @@ link_shaders(struct gl_context *ctx, struct gl_shader_program *prog)
        if (!prog->LinkStatus)
          goto done;
  
-      if (ctx->ShaderCompilerOptions[i].LowerClipDistance) {
+      if (ctx->Const.ShaderCompilerOptions[i].LowerClipDistance) {
           lower_clip_distance(prog->_LinkedShaders[i]);
        }
  
        while (do_common_optimization(prog->_LinkedShaders[i]->ir, true, false,
-                                    &ctx->ShaderCompilerOptions[i],
+                                    &ctx->Const.ShaderCompilerOptions[i],
                                      ctx->Const.NativeIntegers))
          ;
     }
  
+   /* Check and validate stream emissions in geometry shaders */
+   validate_geometry_shader_emissions(ctx, prog);
+
     /* Mark all generic shader inputs and outputs as unpaired. */
     for (unsigned i = MESA_SHADER_VERTEX; i <= MESA_SHADER_FRAGMENT; i++) {
        if (prog->_LinkedShaders[i] != NULL) {
@@ -2502,7 +2736,7 @@ link_shaders(struct gl_context *ctx, struct gl_shader_program *prog)
     if (last >= 0 && last < MESA_SHADER_FRAGMENT) {
        gl_shader *const sh = prog->_LinkedShaders[last];
  
-      if (num_tfeedback_decls != 0) {
+      if (num_tfeedback_decls != 0 || prog->SeparateShader) {
           /* There was no fragment shader, but we still have to assign varying
            * locations for use by transform feedback.
            */
@@ -2516,7 +2750,8 @@ link_shaders(struct gl_context *ctx, struct gl_shader_program *prog)
        do_dead_builtin_varyings(ctx, sh, NULL,
                                 num_tfeedback_decls, tfeedback_decls);
  
-      demote_shader_inputs_and_outputs(sh, ir_var_shader_out);
+      if (!prog->SeparateShader)
+         demote_shader_inputs_and_outputs(sh, ir_var_shader_out);
  
        /* Eliminate code that is now dead due to unused outputs being demoted.
         */
@@ -2531,7 +2766,16 @@ link_shaders(struct gl_context *ctx, struct gl_shader_program *prog)
        do_dead_builtin_varyings(ctx, NULL, sh,
                                 num_tfeedback_decls, tfeedback_decls);
  
-      demote_shader_inputs_and_outputs(sh, ir_var_shader_in);
+      if (prog->SeparateShader) {
+         if (!assign_varying_locations(ctx, mem_ctx, prog,
+                                       NULL /* producer */,
+                                       sh /* consumer */,
+                                       0 /* num_tfeedback_decls */,
+                                       NULL /* tfeedback_decls */,
+                                       0 /* gs_input_vertices */))
+            goto done;
+      } else
+         demote_shader_inputs_and_outputs(sh, ir_var_shader_in);
  
        while (do_dead_code(sh->ir, false))
           ;
@@ -2579,7 +2823,7 @@ link_shaders(struct gl_context *ctx, struct gl_shader_program *prog)
        goto done;
  
     update_array_sizes(prog);
-   link_assign_uniform_locations(prog);
+   link_assign_uniform_locations(prog, ctx->Const.UniformBooleanTrue);
     link_assign_atomic_counter_resources(ctx, prog);
     store_fragdepth_layout(prog);
  
@@ -2596,7 +2840,7 @@ link_shaders(struct gl_context *ctx, struct gl_shader_program *prog)
      * fragment shader) is absent. So, the extension shouldn't change the
      * behavior specified in GLSL specification.
      */
-   if (!prog->InternalSeparateShader && ctx->API == API_OPENGLES2) {
+   if (!prog->SeparateShader && ctx->API == API_OPENGLES2) {
        if (prog->_LinkedShaders[MESA_SHADER_VERTEX] == NULL) {
          linker_error(prog, "program lacks a vertex shader\n");
        } else if (prog->_LinkedShaders[MESA_SHADER_FRAGMENT] == NULL) {