i965: Fix fp-dst-aliasing-[12].vpfp.
authorEric Anholt <eric@anholt.net>
Fri, 8 Jul 2011 00:08:04 +0000 (17:08 -0700)
committerEric Anholt <eric@anholt.net>
Mon, 11 Jul 2011 15:58:37 +0000 (08:58 -0700)
There's no pretty way to avoid the overwriting of the src operands, so
just use a temporary destination and rely on the MOV optimization.

Reviewed-by: Ian Romanick <ian.d.romanick@intel.com>
src/mesa/drivers/dri/i965/brw_wm_fp.c

index 87eabf1fba137fdb388edfd4e3155f9465fd13ab..7cd3edad23588d52fbd9448cce6d77b1a017d70e 100644 (file)
@@ -563,13 +563,14 @@ static void precalc_dst( struct brw_wm_compile *c,
    struct prog_src_register src0 = inst->SrcReg[0];
    struct prog_src_register src1 = inst->SrcReg[1];
    struct prog_dst_register dst = inst->DstReg;
-   
+   struct prog_dst_register temp = get_temp(c);
+
    if (dst.WriteMask & WRITEMASK_Y) {      
       /* dst.y = mul src0.y, src1.y
        */
       emit_op(c,
              OPCODE_MUL,
-             dst_mask(dst, WRITEMASK_Y),
+             dst_mask(temp, WRITEMASK_Y),
              inst->SaturateMode,
              src0,
              src1,
@@ -584,7 +585,7 @@ static void precalc_dst( struct brw_wm_compile *c,
        */
       swz = emit_op(c,
                    OPCODE_SWZ,
-                   dst_mask(dst, WRITEMASK_XZ),
+                   dst_mask(temp, WRITEMASK_XZ),
                    inst->SaturateMode,
                    src_swizzle(src0, SWIZZLE_ONE, z, z, z),
                    src_undef(),
@@ -597,12 +598,26 @@ static void precalc_dst( struct brw_wm_compile *c,
        */
       emit_op(c,
              OPCODE_MOV,
-             dst_mask(dst, WRITEMASK_W),
+             dst_mask(temp, WRITEMASK_W),
              inst->SaturateMode,
              src1,
              src_undef(),
              src_undef());
    }
+
+   /* This will get optimized out in general, but it ensures that we
+    * don't overwrite src operands in our channel-wise splitting
+    * above.  See piglit fp-dst-aliasing-[12].
+    */
+   emit_op(c,
+          OPCODE_MOV,
+          dst,
+          0,
+          src_reg_from_dst(temp),
+          src_undef(),
+          src_undef());
+
+   release_temp(c, temp);
 }