i965: fs: fix gen6+ math operands in one place

author Chris Forbes <chrisf@ijw.co.nz>

Wed, 28 Nov 2012 19:39:08 +0000 (08:39 +1300)

committer Eric Anholt <eric@anholt.net>

Fri, 14 Dec 2012 23:26:35 +0000 (15:26 -0800)
author Chris Forbes <chrisf@ijw.co.nz>
Wed, 28 Nov 2012 19:39:08 +0000 (08:39 +1300)
committer Eric Anholt <eric@anholt.net>
Fri, 14 Dec 2012 23:26:35 +0000 (15:26 -0800)
diff --git a/src/mesa/drivers/dri/i965/brw_fs.cpp b/src/mesa/drivers/dri/i965/brw_fs.cpp

index 83128117328c031f6c4d5e7ac435da119cf4e6fe..b7cdadf60874ec1bb6f6ad02e2b8b0bbb93d3f06 100644 (file)
--- a/src/mesa/drivers/dri/i965/brw_fs.cpp
+++ b/src/mesa/drivers/dri/i965/brw_fs.cpp
@@ -1067,6 +1067,33 @@ fs_visitor::emit_frontfacing_interpolation(ir_variable *ir)
     return reg;
  }
  
+fs_reg
+fs_visitor::fix_math_operand(fs_reg src)
+{
+   /* Returns src unchanged when it can be fed to a math instruction as
+    * is; otherwise copies it into a fresh temporary with a MOV and
+    * returns that temporary instead.
+    *
+    * Gen6 math can't do hstride == 0 args, and the hardware ignores source
+    * modifiers (negate and abs) on math instructions, so on gen6 a UNIFORM
+    * or IMM source, or one with abs/negate set, takes the copy. Doing
+    * execsize = 1 math and expanding the result may be better (masking!).
+    */
+   if (intel->gen == 6 && src.file != UNIFORM && src.file != IMM &&
+       !src.abs && !src.negate)
+      return src;
+
+   /* Gen7 relaxes most of the above restrictions, but still can't use IMM
+    * operands to math, so only IMM sources take the copy there.
+    */
+   if (intel->gen >= 7 && src.file != IMM)
+      return src;
+
+   fs_reg expanded = fs_reg(this, glsl_type::float_type);
+   expanded.type = src.type;   /* temp is created as float; adopt src's type */
+   emit(BRW_OPCODE_MOV, expanded, src);
+   return expanded;
+}
+
  fs_inst *
  fs_visitor::emit_math(enum opcode opcode, fs_reg dst, fs_reg src)
  {
@@ -1092,13 +1119,8 @@ fs_visitor::emit_math(enum opcode opcode, fs_reg dst, fs_reg src)
      * Gen 6 hardware ignores source modifiers (negate and abs) on math
      * instructions, so we also move to a temp to set those up.
      */
-   if (intel->gen == 6 && (src.file == UNIFORM ||
-                          src.abs ||
-                          src.negate)) {
-      fs_reg expanded = fs_reg(this, glsl_type::float_type);
-      emit(BRW_OPCODE_MOV, expanded, src);
-      src = expanded;
-   }
+   if (intel->gen >= 6)
+      src = fix_math_operand(src);
  
     fs_inst *inst = emit(opcode, dst, src);
  
@@ -1126,27 +1148,9 @@ fs_visitor::emit_math(enum opcode opcode, fs_reg dst, fs_reg src0, fs_reg src1)
        return NULL;
     }
  
-   if (intel->gen >= 7) {
-      inst = emit(opcode, dst, src0, src1);
-   } else if (intel->gen == 6) {
-      /* Can't do hstride == 0 args to gen6 math, so expand it out.
-       *
-       * The hardware ignores source modifiers (negate and abs) on math
-       * instructions, so we also move to a temp to set those up.
-       */
-      if (src0.file == UNIFORM || src0.abs || src0.negate) {
-        fs_reg expanded = fs_reg(this, glsl_type::float_type);
-        expanded.type = src0.type;
-        emit(BRW_OPCODE_MOV, expanded, src0);
-        src0 = expanded;
-      }
-
-      if (src1.file == UNIFORM || src1.abs || src1.negate) {
-        fs_reg expanded = fs_reg(this, glsl_type::float_type);
-        expanded.type = src1.type;
-        emit(BRW_OPCODE_MOV, expanded, src1);
-        src1 = expanded;
-      }
+   if (intel->gen >= 6) {
+      src0 = fix_math_operand(src0);
+      src1 = fix_math_operand(src1);
  
        inst = emit(opcode, dst, src0, src1);
     } else {
diff --git a/src/mesa/drivers/dri/i965/brw_fs.h b/src/mesa/drivers/dri/i965/brw_fs.h

index 87257123f27d2a3a52555d3405a166abca37b748..ca242df3d7487e3d6bb27249fd6097f4be9aa9f5 100644 (file)
--- a/src/mesa/drivers/dri/i965/brw_fs.h
+++ b/src/mesa/drivers/dri/i965/brw_fs.h
@@ -353,6 +353,7 @@ public:
                               fs_reg shadow_comp, fs_reg lod, fs_reg lod2);
     fs_inst *emit_texture_gen7(ir_texture *ir, fs_reg dst, fs_reg coordinate,
                               fs_reg shadow_comp, fs_reg lod, fs_reg lod2);
+   fs_reg fix_math_operand(fs_reg src);
     fs_inst *emit_math(enum opcode op, fs_reg dst, fs_reg src0);
     fs_inst *emit_math(enum opcode op, fs_reg dst, fs_reg src0, fs_reg src1);
     void emit_minmax(uint32_t conditionalmod, fs_reg dst,
author	Chris Forbes <chrisf@ijw.co.nz>
	Wed, 28 Nov 2012 19:39:08 +0000 (08:39 +1300)
committer	Eric Anholt <eric@anholt.net>
	Fri, 14 Dec 2012 23:26:35 +0000 (15:26 -0800)
src/mesa/drivers/dri/i965/brw_fs.cpp		patch \| blob \| history
src/mesa/drivers/dri/i965/brw_fs.h		patch \| blob \| history