glsl/mesa: split gl_shader in two

[mesa.git] / src / mesa / program / ir_to_mesa.cpp
diff --git a/src/mesa/program/ir_to_mesa.cpp b/src/mesa/program/ir_to_mesa.cpp

index c5b67ad706a931369b2f42ac0a24e46884fed7ff..e74d94f84f7a35baa3dbd889c43f2ee5776771b4 100644 (file)
--- a/src/mesa/program/ir_to_mesa.cpp
+++ b/src/mesa/program/ir_to_mesa.cpp
@@ -304,6 +304,22 @@ public:
  
     void emit_swz(ir_expression *ir);
  
+   void emit_equality_comparison(ir_expression *ir, enum prog_opcode op,
+                                 dst_reg dst,
+                                 const src_reg &src0, const src_reg &src1);
+
+   inline void emit_sne(ir_expression *ir, dst_reg dst,
+                        const src_reg &src0, const src_reg &src1)
+   {
+      emit_equality_comparison(ir, OPCODE_SLT, dst, src0, src1);
+   }
+
+   inline void emit_seq(ir_expression *ir, dst_reg dst,
+                        const src_reg &src0, const src_reg &src1)
+   {
+      emit_equality_comparison(ir, OPCODE_SGE, dst, src0, src1);
+   }
+
     bool process_move_condition(ir_rvalue *ir);
  
     void copy_propagate(void);
@@ -912,6 +928,46 @@ ir_to_mesa_visitor::emit_swz(ir_expression *ir)
     this->result = result_src;
  }
  
+void
+ir_to_mesa_visitor::emit_equality_comparison(ir_expression *ir,
+                                             enum prog_opcode op,
+                                             dst_reg dst,
+                                             const src_reg &src0,
+                                             const src_reg &src1)
+{
+   src_reg difference;
+   src_reg abs_difference = get_temp(glsl_type::vec4_type);
+   const src_reg zero = src_reg_for_float(0.0);
+
+   /* x == y is equivalent to -abs(x-y) >= 0.  Since all of the code that
+    * consumes the generated IR is pretty dumb, take special care when one
+    * of the operands is zero.
+    *
+    * Similarly, x != y is equivalent to -abs(x-y) < 0.
+    */
+   if (src0.file == zero.file &&
+       src0.index == zero.index &&
+       src0.swizzle == zero.swizzle) {
+      difference = src1;
+   } else if (src1.file == zero.file &&
+              src1.index == zero.index &&
+              src1.swizzle == zero.swizzle) {
+      difference = src0;
+   } else {
+      difference = get_temp(glsl_type::vec4_type);
+
+      src_reg tmp_src = src0;
+      tmp_src.negate = ~tmp_src.negate;
+
+      emit(ir, OPCODE_ADD, dst_reg(difference), tmp_src, src1);
+   }
+
+   emit(ir, OPCODE_ABS, dst_reg(abs_difference), difference);
+
+   abs_difference.negate = ~abs_difference.negate;
+   emit(ir, op, dst, abs_difference, zero);
+}
+
  void
  ir_to_mesa_visitor::visit(ir_expression *ir)
  {
@@ -1086,17 +1142,17 @@ ir_to_mesa_visitor::visit(ir_expression *ir)
        emit(ir, OPCODE_SGE, result_dst, op[0], op[1]);
        break;
     case ir_binop_equal:
-      emit(ir, OPCODE_SEQ, result_dst, op[0], op[1]);
+      emit_seq(ir, result_dst, op[0], op[1]);
        break;
     case ir_binop_nequal:
-      emit(ir, OPCODE_SNE, result_dst, op[0], op[1]);
+      emit_sne(ir, result_dst, op[0], op[1]);
        break;
     case ir_binop_all_equal:
        /* "==" operator producing a scalar boolean. */
        if (ir->operands[0]->type->is_vector() ||
           ir->operands[1]->type->is_vector()) {
          src_reg temp = get_temp(glsl_type::vec4_type);
-        emit(ir, OPCODE_SNE, dst_reg(temp), op[0], op[1]);
+         emit_sne(ir, dst_reg(temp), op[0], op[1]);
  
          /* After the dot-product, the value will be an integer on the
           * range [0,4].  Zero becomes 1.0, and positive values become zero.
@@ -1111,7 +1167,7 @@ ir_to_mesa_visitor::visit(ir_expression *ir)
          sge_src.negate = ~sge_src.negate;
          emit(ir, OPCODE_SGE, result_dst, sge_src, src_reg_for_float(0.0));
        } else {
-        emit(ir, OPCODE_SEQ, result_dst, op[0], op[1]);
+         emit_seq(ir, result_dst, op[0], op[1]);
        }
        break;
     case ir_binop_any_nequal:
@@ -1124,7 +1180,7 @@ ir_to_mesa_visitor::visit(ir_expression *ir)
               ir->operands[1]->as_constant()->is_zero()) {
              temp = op[0];
           } else {
-            emit(ir, OPCODE_SNE, dst_reg(temp), op[0], op[1]);
+            emit_sne(ir, dst_reg(temp), op[0], op[1]);
           }
  
          /* After the dot-product, the value will be an integer on the
@@ -1147,33 +1203,29 @@ ir_to_mesa_visitor::visit(ir_expression *ir)
             emit(ir, OPCODE_SLT, result_dst, slt_src, src_reg_for_float(0.0));
          }
        } else {
-        emit(ir, OPCODE_SNE, result_dst, op[0], op[1]);
+         emit_sne(ir, result_dst, op[0], op[1]);
        }
        break;
  
     case ir_binop_logic_xor:
-      emit(ir, OPCODE_SNE, result_dst, op[0], op[1]);
+      emit_sne(ir, result_dst, op[0], op[1]);
        break;
  
     case ir_binop_logic_or: {
-      /* After the addition, the value will be an integer on the
-       * range [0,2].  Zero stays zero, and positive values become 1.0.
-       */
-      ir_to_mesa_instruction *add =
-        emit(ir, OPCODE_ADD, result_dst, op[0], op[1]);
        if (this->prog->Target == GL_FRAGMENT_PROGRAM_ARB) {
-        /* The clamping to [0,1] can be done for free in the fragment
-         * shader with a saturate.
-         */
+         /* After the addition, the value will be an integer on the
+          * range [0,2].  Zero stays zero, and positive values become 1.0.
+          */
+         ir_to_mesa_instruction *add =
+            emit(ir, OPCODE_ADD, result_dst, op[0], op[1]);
          add->saturate = true;
        } else {
-        /* Negating the result of the addition gives values on the range
-         * [-2, 0].  Zero stays zero, and negative values become 1.0.  This
-         * is achieved using SLT.
-         */
-        src_reg slt_src = result_src;
-        slt_src.negate = ~slt_src.negate;
-        emit(ir, OPCODE_SLT, result_dst, slt_src, src_reg_for_float(0.0));
+         /* The Boolean arguments are stored as float 0.0 and 1.0.  If either
+          * value is 1.0, the result of the logcal-or should be 1.0.  If both
+          * values are 0.0, the result should be 0.0.  This is exactly what
+          * MAX does.
+          */
+         emit(ir, OPCODE_MAX, result_dst, op[0], op[1]);
        }
        break;
     }
@@ -1217,8 +1269,7 @@ ir_to_mesa_visitor::visit(ir_expression *ir)
        break;
     case ir_unop_f2b:
     case ir_unop_i2b:
-      emit(ir, OPCODE_SNE, result_dst,
-                         op[0], src_reg_for_float(0.0));
+      emit_sne(ir, result_dst, op[0], src_reg_for_float(0.0));
        break;
     case ir_unop_bitcast_f2i: // Ignore these 4, they can't happen here anyway
     case ir_unop_bitcast_f2u:
@@ -1324,6 +1375,9 @@ ir_to_mesa_visitor::visit(ir_expression *ir)
     case ir_unop_dFdy_fine:
     case ir_unop_subroutine_to_int:
     case ir_unop_get_buffer_size:
+   case ir_unop_vote_any:
+   case ir_unop_vote_all:
+   case ir_unop_vote_eq:
        assert(!"not supported");
        break;
  
@@ -1921,7 +1975,7 @@ ir_to_mesa_visitor::visit(ir_texture *ir)
        ir->coordinate->accept(this);
  
     /* Put our coords in a temp.  We'll need to modify them for shadow,
-    * projection, or LOD, so the only case we'd use it as is is if
+    * projection, or LOD, so the only case we'd use it as-is is if
      * we're doing plain old texturing.  Mesa IR optimization should
      * handle cleaning up our mess in that case.
      */
@@ -2353,7 +2407,7 @@ add_uniform_to_shader::visit_field(const glsl_type *type, const char *name,
  
     if (type->is_vector() || type->is_scalar()) {
        size = type->vector_elements;
-      if (type->is_double())
+      if (type->is_64bit())
           size *= 2;
     } else {
        size = type_size(type) * 4;
@@ -2415,7 +2469,7 @@ add_uniform_to_shader::visit_field(const glsl_type *type, const char *name,
  void
  _mesa_generate_parameters_list_for_uniforms(struct gl_shader_program
                                             *shader_program,
-                                           struct gl_shader *sh,
+                                           struct gl_linked_shader *sh,
                                             struct gl_program_parameter_list
                                             *params)
  {
@@ -2725,7 +2779,7 @@ ir_to_mesa_visitor::copy_propagate(void)
  static struct gl_program *
  get_mesa_program(struct gl_context *ctx,
                   struct gl_shader_program *shader_program,
-                struct gl_shader *shader)
+                struct gl_linked_shader *shader)
  {
     ir_to_mesa_visitor v;
     struct prog_instruction *mesa_instructions, *mesa_inst;