Merge branch 'master' of ../mesa into vulkan

[mesa.git] / src / mesa / program / ir_to_mesa.cpp
diff --git a/src/mesa/program/ir_to_mesa.cpp b/src/mesa/program/ir_to_mesa.cpp

index ae4a6e2dec67fafa38f93bcecdd41e725a88ba59..1cfcf9119f97c2508219a0fc7508b826a05d1b92 100644 (file)
--- a/src/mesa/program/ir_to_mesa.cpp
+++ b/src/mesa/program/ir_to_mesa.cpp
@@ -43,19 +43,18 @@
  #include "linker.h"
  
  #include "main/mtypes.h"
+#include "main/shaderapi.h"
  #include "main/shaderobj.h"
  #include "main/uniforms.h"
-#include "program/hash_table.h"
  
-extern "C" {
-#include "main/shaderapi.h"
+#include "program/hash_table.h"
  #include "program/prog_instruction.h"
  #include "program/prog_optimize.h"
  #include "program/prog_print.h"
  #include "program/program.h"
  #include "program/prog_parameter.h"
  #include "program/sampler.h"
-}
+
  
  static int swizzle_for_size(int size);
  
@@ -229,7 +228,7 @@ public:
  
     int next_temp;
  
-   variable_storage *find_variable_storage(ir_variable *var);
+   variable_storage *find_variable_storage(const ir_variable *var);
  
     src_reg get_temp(const glsl_type *type);
     void reladdr_to_temp(ir_instruction *ir, src_reg *reg, int *num_reladdr);
@@ -263,6 +262,7 @@ public:
     virtual void visit(ir_if *);
     virtual void visit(ir_emit_vertex *);
     virtual void visit(ir_end_primitive *);
+   virtual void visit(ir_barrier *);
     /*@}*/
  
     src_reg result;
@@ -304,14 +304,10 @@ public:
     void emit_scalar(ir_instruction *ir, enum prog_opcode op,
                     dst_reg dst, src_reg src0, src_reg src1);
  
-   void emit_scs(ir_instruction *ir, enum prog_opcode op,
-                dst_reg dst, const src_reg &src);
-
     bool try_emit_mad(ir_expression *ir,
                           int mul_operand);
     bool try_emit_mad_for_and_not(ir_expression *ir,
                                  int mul_operand);
-   bool try_emit_sat(ir_expression *ir);
  
     void emit_swz(ir_expression *ir);
  
@@ -410,7 +406,7 @@ ir_to_mesa_visitor::emit_dp(ir_instruction *ir,
                             dst_reg dst, src_reg src0, src_reg src1,
                             unsigned elements)
  {
-   static const gl_inst_opcode dot_opcodes[] = {
+   static const enum prog_opcode dot_opcodes[] = {
        OPCODE_DP2, OPCODE_DP3, OPCODE_DP4
     };
  
@@ -481,101 +477,6 @@ ir_to_mesa_visitor::emit_scalar(ir_instruction *ir, enum prog_opcode op,
     emit_scalar(ir, op, dst, src0, undef);
  }
  
-/**
- * Emit an OPCODE_SCS instruction
- *
- * The \c SCS opcode functions a bit differently than the other Mesa (or
- * ARB_fragment_program) opcodes.  Instead of splatting its result across all
- * four components of the destination, it writes one value to the \c x
- * component and another value to the \c y component.
- *
- * \param ir        IR instruction being processed
- * \param op        Either \c OPCODE_SIN or \c OPCODE_COS depending on which
- *                  value is desired.
- * \param dst       Destination register
- * \param src       Source register
- */
-void
-ir_to_mesa_visitor::emit_scs(ir_instruction *ir, enum prog_opcode op,
-                            dst_reg dst,
-                            const src_reg &src)
-{
-   /* Vertex programs cannot use the SCS opcode.
-    */
-   if (this->prog->Target == GL_VERTEX_PROGRAM_ARB) {
-      emit_scalar(ir, op, dst, src);
-      return;
-   }
-
-   const unsigned component = (op == OPCODE_SIN) ? 0 : 1;
-   const unsigned scs_mask = (1U << component);
-   int done_mask = ~dst.writemask;
-   src_reg tmp;
-
-   assert(op == OPCODE_SIN || op == OPCODE_COS);
-
-   /* If there are compnents in the destination that differ from the component
-    * that will be written by the SCS instrution, we'll need a temporary.
-    */
-   if (scs_mask != unsigned(dst.writemask)) {
-      tmp = get_temp(glsl_type::vec4_type);
-   }
-
-   for (unsigned i = 0; i < 4; i++) {
-      unsigned this_mask = (1U << i);
-      src_reg src0 = src;
-
-      if ((done_mask & this_mask) != 0)
-        continue;
-
-      /* The source swizzle specified which component of the source generates
-       * sine / cosine for the current component in the destination.  The SCS
-       * instruction requires that this value be swizzle to the X component.
-       * Replace the current swizzle with a swizzle that puts the source in
-       * the X component.
-       */
-      unsigned src0_swiz = GET_SWZ(src.swizzle, i);
-
-      src0.swizzle = MAKE_SWIZZLE4(src0_swiz, src0_swiz,
-                                  src0_swiz, src0_swiz);
-      for (unsigned j = i + 1; j < 4; j++) {
-        /* If there is another enabled component in the destination that is
-         * derived from the same inputs, generate its value on this pass as
-         * well.
-         */
-        if (!(done_mask & (1 << j)) &&
-            GET_SWZ(src0.swizzle, j) == src0_swiz) {
-           this_mask |= (1 << j);
-        }
-      }
-
-      if (this_mask != scs_mask) {
-        ir_to_mesa_instruction *inst;
-        dst_reg tmp_dst = dst_reg(tmp);
-
-        /* Emit the SCS instruction.
-         */
-        inst = emit(ir, OPCODE_SCS, tmp_dst, src0);
-        inst->dst.writemask = scs_mask;
-
-        /* Move the result of the SCS instruction to the desired location in
-         * the destination.
-         */
-        tmp.swizzle = MAKE_SWIZZLE4(component, component,
-                                    component, component);
-        inst = emit(ir, OPCODE_SCS, dst, tmp);
-        inst->dst.writemask = this_mask;
-      } else {
-        /* Emit the SCS instruction to write directly to the destination.
-         */
-        ir_to_mesa_instruction *inst = emit(ir, OPCODE_SCS, dst, src0);
-        inst->dst.writemask = scs_mask;
-      }
-
-      done_mask |= this_mask;
-   }
-}
-
  src_reg
  ir_to_mesa_visitor::src_reg_for_float(float val)
  {
@@ -608,6 +509,20 @@ type_size(const struct glsl_type *type)
           */
          return 1;
        }
+      break;
+   case GLSL_TYPE_DOUBLE:
+      if (type->is_matrix()) {
+         if (type->vector_elements > 2)
+            return type->matrix_columns * 2;
+         else
+            return type->matrix_columns;
+      } else {
+         if (type->vector_elements > 2)
+            return 2;
+         else
+            return 1;
+      }
+      break;
     case GLSL_TYPE_ARRAY:
        assert(type->length > 0);
        return type_size(type->fields.array) * type->length;
@@ -618,6 +533,8 @@ type_size(const struct glsl_type *type)
        }
        return size;
     case GLSL_TYPE_SAMPLER:
+   case GLSL_TYPE_IMAGE:
+   case GLSL_TYPE_SUBROUTINE:
        /* Samplers take up one slot in UNIFORMS[], but they're baked in
         * at link time.
         */
@@ -626,6 +543,7 @@ type_size(const struct glsl_type *type)
     case GLSL_TYPE_VOID:
     case GLSL_TYPE_ERROR:
     case GLSL_TYPE_INTERFACE:
+   case GLSL_TYPE_FUNCTION:
        assert(!"Invalid type in type_size");
        break;
     }
@@ -660,14 +578,9 @@ ir_to_mesa_visitor::get_temp(const glsl_type *type)
  }
  
  variable_storage *
-ir_to_mesa_visitor::find_variable_storage(ir_variable *var)
+ir_to_mesa_visitor::find_variable_storage(const ir_variable *var)
  {
-   
-   variable_storage *entry;
-
-   foreach_iter(exec_list_iterator, iter, this->variables) {
-      entry = (variable_storage *)iter.get();
-
+   foreach_in_list(variable_storage, entry, &this->variables) {
        if (entry->var == var)
          return entry;
     }
@@ -687,8 +600,8 @@ ir_to_mesa_visitor::visit(ir_variable *ir)
  
     if (ir->data.mode == ir_var_uniform && strncmp(ir->name, "gl_", 3) == 0) {
        unsigned int i;
-      const ir_state_slot *const slots = ir->state_slots;
-      assert(ir->state_slots != NULL);
+      const ir_state_slot *const slots = ir->get_state_slots();
+      assert(slots != NULL);
  
        /* Check if this statevar's setup in the STATE file exactly
         * matches how we'll want to reference it as a
@@ -696,7 +609,7 @@ ir_to_mesa_visitor::visit(ir_variable *ir)
         * temporary storage and hope that it'll get copy-propagated
         * out.
         */
-      for (i = 0; i < ir->num_state_slots; i++) {
+      for (i = 0; i < ir->get_num_state_slots(); i++) {
          if (slots[i].swizzle != SWIZZLE_XYZW) {
             break;
          }
@@ -704,7 +617,7 @@ ir_to_mesa_visitor::visit(ir_variable *ir)
  
        variable_storage *storage;
        dst_reg dst;
-      if (i == ir->num_state_slots) {
+      if (i == ir->get_num_state_slots()) {
          /* We'll set the index later. */
          storage = new(mem_ctx) variable_storage(ir, PROGRAM_STATE_VAR, -1);
          this->variables.push_tail(storage);
@@ -715,7 +628,7 @@ ir_to_mesa_visitor::visit(ir_variable *ir)
           * of the type.  However, this had better match the number of state
           * elements that we're going to copy into the new temporary.
           */
-        assert((int) ir->num_state_slots == type_size(ir->type));
+        assert((int) ir->get_num_state_slots() == type_size(ir->type));
  
          storage = new(mem_ctx) variable_storage(ir, PROGRAM_TEMPORARY,
                                                  this->next_temp);
@@ -726,7 +639,7 @@ ir_to_mesa_visitor::visit(ir_variable *ir)
        }
  
  
-      for (unsigned int i = 0; i < ir->num_state_slots; i++) {
+      for (unsigned int i = 0; i < ir->get_num_state_slots(); i++) {
          int index = _mesa_add_state_reference(this->prog->Parameters,
                                                (gl_state_index *)slots[i].tokens);
  
@@ -746,7 +659,7 @@ ir_to_mesa_visitor::visit(ir_variable *ir)
        }
  
        if (storage->file == PROGRAM_TEMPORARY &&
-         dst.index != storage->index + (int) ir->num_state_slots) {
+         dst.index != storage->index + (int) ir->get_num_state_slots()) {
          linker_error(this->shader_program,
                       "failed to load builtin uniform `%s' "
                       "(%d/%d regs loaded)\n",
@@ -797,13 +710,11 @@ ir_to_mesa_visitor::visit(ir_function *ir)
        const ir_function_signature *sig;
        exec_list empty;
  
-      sig = ir->matching_signature(NULL, &empty);
+      sig = ir->matching_signature(NULL, &empty, false);
  
        assert(sig);
  
-      foreach_iter(exec_list_iterator, iter, sig->body) {
-        ir_instruction *ir = (ir_instruction *)iter.get();
-
+      foreach_in_list(ir_instruction, ir, &sig->body) {
          ir->accept(this);
        }
     }
@@ -872,50 +783,6 @@ ir_to_mesa_visitor::try_emit_mad_for_and_not(ir_expression *ir, int try_operand)
     return true;
  }
  
-bool
-ir_to_mesa_visitor::try_emit_sat(ir_expression *ir)
-{
-   /* Saturates were only introduced to vertex programs in
-    * NV_vertex_program3, so don't give them to drivers in the VP.
-    */
-   if (this->prog->Target == GL_VERTEX_PROGRAM_ARB)
-      return false;
-
-   ir_rvalue *sat_src = ir->as_rvalue_to_saturate();
-   if (!sat_src)
-      return false;
-
-   sat_src->accept(this);
-   src_reg src = this->result;
-
-   /* If we generated an expression instruction into a temporary in
-    * processing the saturate's operand, apply the saturate to that
-    * instruction.  Otherwise, generate a MOV to do the saturate.
-    *
-    * Note that we have to be careful to only do this optimization if
-    * the instruction in question was what generated src->result.  For
-    * example, ir_dereference_array might generate a MUL instruction
-    * to create the reladdr, and return us a src reg using that
-    * reladdr.  That MUL result is not the value we're trying to
-    * saturate.
-    */
-   ir_expression *sat_src_expr = sat_src->as_expression();
-   ir_to_mesa_instruction *new_inst;
-   new_inst = (ir_to_mesa_instruction *)this->instructions.get_tail();
-   if (sat_src_expr && (sat_src_expr->operation == ir_binop_mul ||
-                       sat_src_expr->operation == ir_binop_add ||
-                       sat_src_expr->operation == ir_binop_dot)) {
-      new_inst->saturate = true;
-   } else {
-      this->result = get_temp(ir->type);
-      ir_to_mesa_instruction *inst;
-      inst = emit(ir, OPCODE_MOV, dst_reg(this->result), src);
-      inst->saturate = true;
-   }
-
-   return true;
-}
-
  void
  ir_to_mesa_visitor::reladdr_to_temp(ir_instruction *ir,
                                     src_reg *reg, int *num_reladdr)
@@ -1056,7 +923,7 @@ void
  ir_to_mesa_visitor::visit(ir_expression *ir)
  {
     unsigned int operand;
-   src_reg op[Elements(ir->operands)];
+   src_reg op[ARRAY_SIZE(ir->operands)];
     src_reg result_src;
     dst_reg result_dst;
  
@@ -1078,9 +945,6 @@ ir_to_mesa_visitor::visit(ir_expression *ir)
          return;
     }
  
-   if (try_emit_sat(ir))
-      return;
-
     if (ir->operation == ir_quadop_vector) {
        this->emit_swz(ir);
        return;
@@ -1163,12 +1027,6 @@ ir_to_mesa_visitor::visit(ir_expression *ir)
     case ir_unop_cos:
        emit_scalar(ir, OPCODE_COS, result_dst, op[0]);
        break;
-   case ir_unop_sin_reduced:
-      emit_scs(ir, OPCODE_SIN, result_dst, op[0]);
-      break;
-   case ir_unop_cos_reduced:
-      emit_scs(ir, OPCODE_COS, result_dst, op[0]);
-      break;
  
     case ir_unop_dFdx:
        emit(ir, OPCODE_DDX, result_dst, op[0]);
@@ -1177,6 +1035,12 @@ ir_to_mesa_visitor::visit(ir_expression *ir)
        emit(ir, OPCODE_DDY, result_dst, op[0]);
        break;
  
+   case ir_unop_saturate: {
+      ir_to_mesa_instruction *inst = emit(ir, OPCODE_MOV,
+                                          result_dst, op[0]);
+      inst->saturate = true;
+      break;
+   }
     case ir_unop_noise: {
        const enum prog_opcode opcode =
          prog_opcode(OPCODE_NOISE1
@@ -1201,7 +1065,7 @@ ir_to_mesa_visitor::visit(ir_expression *ir)
        assert(!"not reached: should be handled by ir_div_to_mul_rcp");
        break;
     case ir_binop_mod:
-      /* Floating point should be lowered by MOD_TO_FRACT in the compiler. */
+      /* Floating point should be lowered by MOD_TO_FLOOR in the compiler. */
        assert(ir->type->is_integer());
        emit(ir, OPCODE_MUL, result_dst, op[0], op[1]);
        break;
@@ -1397,6 +1261,7 @@ ir_to_mesa_visitor::visit(ir_expression *ir)
     case ir_unop_pack_unorm_2x16:
     case ir_unop_pack_unorm_4x8:
     case ir_unop_pack_half_2x16:
+   case ir_unop_pack_double_2x32:
     case ir_unop_unpack_snorm_2x16:
     case ir_unop_unpack_snorm_4x8:
     case ir_unop_unpack_unorm_2x16:
@@ -1404,11 +1269,21 @@ ir_to_mesa_visitor::visit(ir_expression *ir)
     case ir_unop_unpack_half_2x16:
     case ir_unop_unpack_half_2x16_split_x:
     case ir_unop_unpack_half_2x16_split_y:
+   case ir_unop_unpack_double_2x32:
     case ir_binop_pack_half_2x16_split:
     case ir_unop_bitfield_reverse:
     case ir_unop_bit_count:
     case ir_unop_find_msb:
     case ir_unop_find_lsb:
+   case ir_unop_d2f:
+   case ir_unop_f2d:
+   case ir_unop_d2i:
+   case ir_unop_i2d:
+   case ir_unop_d2u:
+   case ir_unop_u2d:
+   case ir_unop_d2b:
+   case ir_unop_frexp_sig:
+   case ir_unop_frexp_exp:
        assert(!"not supported");
        break;
     case ir_binop_min:
@@ -1462,9 +1337,19 @@ ir_to_mesa_visitor::visit(ir_expression *ir)
     case ir_binop_carry:
     case ir_binop_borrow:
     case ir_binop_imul_high:
+   case ir_unop_interpolate_at_centroid:
+   case ir_binop_interpolate_at_offset:
+   case ir_binop_interpolate_at_sample:
+   case ir_unop_dFdx_coarse:
+   case ir_unop_dFdx_fine:
+   case ir_unop_dFdy_coarse:
+   case ir_unop_dFdy_fine:
+   case ir_unop_subroutine_to_int:
+   case ir_unop_get_buffer_size:
        assert(!"not supported");
        break;
  
+   case ir_unop_ssbo_unsized_array_length:
     case ir_quadop_vector:
        /* This operation should have already been handled.
         */
@@ -1491,6 +1376,7 @@ ir_to_mesa_visitor::visit(ir_swizzle *ir)
     ir->val->accept(this);
     src = this->result;
     assert(src.file != PROGRAM_UNDEFINED);
+   assert(ir->type->vector_elements > 0);
  
     for (i = 0; i < 4; i++) {
        if (i < ir->type->vector_elements) {
@@ -1868,8 +1754,7 @@ ir_to_mesa_visitor::visit(ir_constant *ir)
        src_reg temp_base = get_temp(ir->type);
        dst_reg temp = dst_reg(temp_base);
  
-      foreach_iter(exec_list_iterator, iter, ir->components) {
-        ir_constant *field_value = (ir_constant *)iter.get();
+      foreach_in_list(ir_constant, field_value, &ir->components) {
          int size = type_size(field_value->type);
  
          assert(size > 0);
@@ -1963,7 +1848,7 @@ ir_to_mesa_visitor::visit(ir_constant *ir)
  }
  
  void
-ir_to_mesa_visitor::visit(ir_call *ir)
+ir_to_mesa_visitor::visit(ir_call *)
  {
     assert(!"ir_to_mesa: All function calls should have been inlined by now.");
  }
@@ -2037,6 +1922,8 @@ ir_to_mesa_visitor::visit(ir_texture *ir)
     case ir_query_levels:
        assert(!"Unexpected ir_query_levels opcode");
        break;
+   case ir_texture_samples:
+      unreachable("Unexpected ir_texture_samples opcode");
     }
  
     const glsl_type *sampler_type = ir->sampler->type;
@@ -2227,17 +2114,23 @@ ir_to_mesa_visitor::visit(ir_if *ir)
  }
  
  void
-ir_to_mesa_visitor::visit(ir_emit_vertex *ir)
+ir_to_mesa_visitor::visit(ir_emit_vertex *)
  {
     assert(!"Geometry shaders not supported.");
  }
  
  void
-ir_to_mesa_visitor::visit(ir_end_primitive *ir)
+ir_to_mesa_visitor::visit(ir_end_primitive *)
  {
     assert(!"Geometry shaders not supported.");
  }
  
+void
+ir_to_mesa_visitor::visit(ir_barrier *)
+{
+   unreachable("GLSL barrier() not supported.");
+}
+
  ir_to_mesa_visitor::ir_to_mesa_visitor()
  {
     result.file = PROGRAM_UNDEFINED;
@@ -2338,9 +2231,7 @@ set_branchtargets(ir_to_mesa_visitor *v,
          mesa_instructions[loop_stack[loop_stack_pos]].BranchTarget = i;
          break;
        case OPCODE_CAL:
-        foreach_iter(exec_list_iterator, iter, v->function_signatures) {
-           function_entry *entry = (function_entry *)iter.get();
-
+        foreach_in_list(function_entry, entry, &v->function_signatures) {
             if (entry->sig_id == mesa_instructions[i].BranchTarget) {
                mesa_instructions[i].BranchTarget = entry->inst;
                break;
@@ -2429,13 +2320,14 @@ add_uniform_to_shader::visit_field(const glsl_type *type, const char *name,
  
     if (type->is_vector() || type->is_scalar()) {
        size = type->vector_elements;
+      if (type->is_double())
+         size *= 2;
     } else {
        size = type_size(type) * 4;
     }
  
     gl_register_file file;
-   if (type->is_sampler() ||
-       (type->is_array() && type->fields.array->is_sampler())) {
+   if (type->without_array()->is_sampler()) {
        file = PROGRAM_SAMPLER;
     } else {
        file = PROGRAM_UNIFORM;
@@ -2493,14 +2385,13 @@ _mesa_generate_parameters_list_for_uniforms(struct gl_shader_program
                                             struct gl_program_parameter_list
                                             *params)
  {
-   add_uniform_to_shader add(shader_program, params,
-                             _mesa_shader_enum_to_shader_stage(sh->Type));
+   add_uniform_to_shader add(shader_program, params, sh->Stage);
  
-   foreach_list(node, sh->ir) {
-      ir_variable *var = ((ir_instruction *) node)->as_variable();
+   foreach_in_list(ir_instruction, node, sh->ir) {
+      ir_variable *var = node->as_variable();
  
        if ((var == NULL) || (var->data.mode != ir_var_uniform)
-         || var->is_in_uniform_block() || (strncmp(var->name, "gl_", 3) == 0))
+         || var->is_in_buffer_block() || (strncmp(var->name, "gl_", 3) == 0))
          continue;
  
        add.process(var);
@@ -2529,12 +2420,18 @@ _mesa_associate_uniform_storage(struct gl_context *ctx,
        if (!found)
          continue;
  
+      struct gl_uniform_storage *storage =
+         &shader_program->UniformStorage[location];
+
+      /* Do not associate any uniform storage to built-in uniforms */
+      if (storage->builtin)
+         continue;
+
        if (location != last_location) {
-        struct gl_uniform_storage *storage =
-           &shader_program->UniformStorage[location];
          enum gl_uniform_driver_format format = uniform_native;
  
          unsigned columns = 0;
+        int dmul = 4 * sizeof(float);
          switch (storage->type->base_type) {
          case GLSL_TYPE_UINT:
             assert(ctx->Const.NativeIntegers);
@@ -2546,20 +2443,22 @@ _mesa_associate_uniform_storage(struct gl_context *ctx,
                (ctx->Const.NativeIntegers) ? uniform_native : uniform_int_float;
             columns = 1;
             break;
+
+        case GLSL_TYPE_DOUBLE:
+           if (storage->type->vector_elements > 2)
+               dmul *= 2;
+           /* fallthrough */
          case GLSL_TYPE_FLOAT:
             format = uniform_native;
             columns = storage->type->matrix_columns;
             break;
          case GLSL_TYPE_BOOL:
-           if (ctx->Const.NativeIntegers) {
-              format = (ctx->Const.UniformBooleanTrue == 1)
-                 ? uniform_bool_int_0_1 : uniform_bool_int_0_not0;
-           } else {
-              format = uniform_bool_float;
-           }
+           format = uniform_native;
             columns = 1;
             break;
          case GLSL_TYPE_SAMPLER:
+        case GLSL_TYPE_IMAGE:
+         case GLSL_TYPE_SUBROUTINE:
             format = uniform_native;
             columns = 1;
             break;
@@ -2569,13 +2468,14 @@ _mesa_associate_uniform_storage(struct gl_context *ctx,
           case GLSL_TYPE_STRUCT:
           case GLSL_TYPE_ERROR:
           case GLSL_TYPE_INTERFACE:
+         case GLSL_TYPE_FUNCTION:
             assert(!"Should not get here.");
             break;
          }
  
          _mesa_uniform_attach_driver_storage(storage,
-                                            4 * sizeof(float) * columns,
-                                            4 * sizeof(float),
+                                            dmul * columns,
+                                            dmul,
                                              format,
                                              &params->ParameterValues[i]);
  
@@ -2621,9 +2521,7 @@ ir_to_mesa_visitor::copy_propagate(void)
     int *acp_level = rzalloc_array(mem_ctx, int, this->next_temp * 4);
     int level = 0;
  
-   foreach_iter(exec_list_iterator, iter, this->instructions) {
-      ir_to_mesa_instruction *inst = (ir_to_mesa_instruction *)iter.get();
-
+   foreach_in_list(ir_to_mesa_instruction, inst, &this->instructions) {
        assert(inst->dst.file != PROGRAM_TEMPORARY
              || inst->dst.index < this->next_temp);
  
@@ -2800,25 +2698,10 @@ get_mesa_program(struct gl_context *ctx,
     ir_instruction **mesa_instruction_annotation;
     int i;
     struct gl_program *prog;
-   GLenum target;
-   const char *target_string = _mesa_progshader_enum_to_string(shader->Type);
+   GLenum target = _mesa_shader_stage_to_program(shader->Stage);
+   const char *target_string = _mesa_shader_stage_to_string(shader->Stage);
     struct gl_shader_compiler_options *options =
-         &ctx->ShaderCompilerOptions[_mesa_shader_enum_to_shader_stage(shader->Type)];
-
-   switch (shader->Type) {
-   case GL_VERTEX_SHADER:
-      target = GL_VERTEX_PROGRAM_ARB;
-      break;
-   case GL_FRAGMENT_SHADER:
-      target = GL_FRAGMENT_PROGRAM_ARB;
-      break;
-   case GL_GEOMETRY_SHADER:
-      target = GL_GEOMETRY_PROGRAM_NV;
-      break;
-   default:
-      assert(!"should not be reached");
-      return NULL;
-   }
+         &ctx->Const.ShaderCompilerOptions[shader->Stage];
  
     validate_ir_tree(shader->ir);
  
@@ -2840,10 +2723,7 @@ get_mesa_program(struct gl_context *ctx,
  
     prog->NumTemporaries = v.next_temp;
  
-   int num_instructions = 0;
-   foreach_iter(exec_list_iterator, iter, v.instructions) {
-      num_instructions++;
-   }
+   unsigned num_instructions = v.instructions.length();
  
     mesa_instructions =
        (struct prog_instruction *)calloc(num_instructions,
@@ -2857,13 +2737,11 @@ get_mesa_program(struct gl_context *ctx,
      */
     mesa_inst = mesa_instructions;
     i = 0;
-   foreach_iter(exec_list_iterator, iter, v.instructions) {
-      const ir_to_mesa_instruction *inst = (ir_to_mesa_instruction *)iter.get();
-
+   foreach_in_list(const ir_to_mesa_instruction, inst, &v.instructions) {
        mesa_inst->Opcode = inst->op;
        mesa_inst->CondUpdate = inst->cond_update;
        if (inst->saturate)
-        mesa_inst->SaturateMode = SATURATE_ZERO_ONE;
+        mesa_inst->Saturate = GL_TRUE;
        mesa_inst->DstReg.File = inst->dst.file;
        mesa_inst->DstReg.Index = inst->dst.index;
        mesa_inst->DstReg.CondMask = inst->dst.cond_mask;
@@ -2931,17 +2809,18 @@ get_mesa_program(struct gl_context *ctx,
  
     set_branchtargets(&v, mesa_instructions, num_instructions);
  
-   if (ctx->Shader.Flags & GLSL_DUMP) {
-      printf("\n");
-      printf("GLSL IR for linked %s program %d:\n", target_string,
-            shader_program->Name);
-      _mesa_print_ir(shader->ir, NULL);
-      printf("\n");
-      printf("\n");
-      printf("Mesa IR for linked %s program %d:\n", target_string,
-            shader_program->Name);
+   if (ctx->_Shader->Flags & GLSL_DUMP) {
+      fprintf(stderr, "\n");
+      fprintf(stderr, "GLSL IR for linked %s program %d:\n", target_string,
+             shader_program->Name);
+      _mesa_print_ir(stderr, shader->ir, NULL);
+      fprintf(stderr, "\n");
+      fprintf(stderr, "\n");
+      fprintf(stderr, "Mesa IR for linked %s program %d:\n", target_string,
+             shader_program->Name);
        print_program(mesa_instructions, mesa_instruction_annotation,
                     num_instructions);
+      fflush(stderr);
     }
  
     prog->Instructions = mesa_instructions;
@@ -2952,7 +2831,7 @@ get_mesa_program(struct gl_context *ctx,
      */
     mesa_instructions = NULL;
  
-   do_set_program_inouts(shader->ir, prog, shader->Type);
+   do_set_program_inouts(shader->ir, prog, shader->Stage);
  
     prog->SamplersUsed = shader->active_samplers;
     prog->ShadowSamplers = shader->shadow_samplers;
@@ -2966,7 +2845,7 @@ get_mesa_program(struct gl_context *ctx,
  
     _mesa_reference_program(ctx, &shader->Program, prog);
  
-   if ((ctx->Shader.Flags & GLSL_NO_OPT) == 0) {
+   if ((ctx->_Shader->Flags & GLSL_NO_OPT) == 0) {
        _mesa_optimize_program(ctx, prog);
     }
  
@@ -3007,22 +2886,21 @@ _mesa_ir_link_shader(struct gl_context *ctx, struct gl_shader_program *prog)
        bool progress;
        exec_list *ir = prog->_LinkedShaders[i]->ir;
        const struct gl_shader_compiler_options *options =
-            &ctx->ShaderCompilerOptions[_mesa_shader_enum_to_shader_stage(prog->_LinkedShaders[i]->Type)];
+            &ctx->Const.ShaderCompilerOptions[prog->_LinkedShaders[i]->Stage];
  
        do {
          progress = false;
  
          /* Lowering */
          do_mat_op_to_vec(ir);
-        lower_instructions(ir, (MOD_TO_FRACT | DIV_TO_MUL_RCP | EXP_TO_EXP2
+        lower_instructions(ir, (MOD_TO_FLOOR | DIV_TO_MUL_RCP | EXP_TO_EXP2
                                  | LOG_TO_LOG2 | INT_DIV_TO_MUL_RCP
                                  | ((options->EmitNoPow) ? POW_TO_EXP2 : 0)));
  
          progress = do_lower_jumps(ir, true, true, options->EmitNoMainReturn, options->EmitNoCont, options->EmitNoLoops) || progress;
  
          progress = do_common_optimization(ir, true, true,
-                                          options->MaxUnrollIterations,
-                                           options)
+                                           options, ctx->Const.NativeIntegers)
            || progress;
  
          progress = lower_quadop_vector(ir, true) || progress;
@@ -3041,7 +2919,7 @@ _mesa_ir_link_shader(struct gl_context *ctx, struct gl_shader_program *prog)
          if (options->EmitNoIndirectInput || options->EmitNoIndirectOutput
              || options->EmitNoIndirectTemp || options->EmitNoIndirectUniform)
            progress =
-            lower_variable_index_to_cond_assign(ir,
+            lower_variable_index_to_cond_assign(prog->_LinkedShaders[i]->Stage, ir,
                                                  options->EmitNoIndirectInput,
                                                  options->EmitNoIndirectOutput,
                                                  options->EmitNoIndirectTemp,
@@ -3069,7 +2947,7 @@ _mesa_ir_link_shader(struct gl_context *ctx, struct gl_shader_program *prog)
          _mesa_reference_program(ctx, &prog->_LinkedShaders[i]->Program,
                                  linked_prog);
           if (!ctx->Driver.ProgramStringNotify(ctx,
-                                              _mesa_program_index_to_target(i),
+                                              _mesa_shader_stage_to_program(i),
                                                linked_prog)) {
              return GL_FALSE;
           }
@@ -3089,7 +2967,7 @@ _mesa_glsl_link_shader(struct gl_context *ctx, struct gl_shader_program *prog)
  {
     unsigned int i;
  
-   _mesa_clear_shader_program_data(ctx, prog);
+   _mesa_clear_shader_program_data(prog);
  
     prog->LinkStatus = GL_TRUE;
  
@@ -3106,17 +2984,19 @@ _mesa_glsl_link_shader(struct gl_context *ctx, struct gl_shader_program *prog)
     if (prog->LinkStatus) {
        if (!ctx->Driver.LinkShader(ctx, prog)) {
          prog->LinkStatus = GL_FALSE;
+      } else {
+         build_program_resource_list(prog);
        }
     }
  
-   if (ctx->Shader.Flags & GLSL_DUMP) {
+   if (ctx->_Shader->Flags & GLSL_DUMP) {
        if (!prog->LinkStatus) {
-        printf("GLSL shader program %d failed to link\n", prog->Name);
+        fprintf(stderr, "GLSL shader program %d failed to link\n", prog->Name);
        }
  
        if (prog->InfoLog && prog->InfoLog[0] != 0) {
-        printf("GLSL shader program %d info log:\n", prog->Name);
-        printf("%s\n", prog->InfoLog);
+        fprintf(stderr, "GLSL shader program %d info log:\n", prog->Name);
+        fprintf(stderr, "%s\n", prog->InfoLog);
        }
     }
  }