r300/compiler: Introduce control flow instructions and refactor dataflow
[mesa.git] / src / mesa / drivers / dri / r300 / compiler / r3xx_fragprog.c
index 014c5fbac0194fdc9eec1c5b23a7900461442e5c..590201a9bab4cf593ffd2bce495f202aba469ba2 100644 (file)
 
 #include "radeon_compiler.h"
 
-#include "shader/prog_parameter.h"
-#include "shader/prog_print.h"
-#include "shader/prog_statevars.h"
+#include <stdio.h>
 
-#include "radeon_nqssadce.h"
+#include "radeon_dataflow.h"
 #include "radeon_program_alu.h"
 #include "r300_fragprog.h"
 #include "r300_fragprog_swizzle.h"
 #include "r500_fragprog.h"
 
 
-static void nqssadce_init(struct nqssadce_state* s)
+static void dataflow_outputs_mark_use(void * userdata, void * data,
+               void (*callback)(void *, unsigned int, unsigned int))
 {
-       s->Outputs[FRAG_RESULT_COLOR].Sourced = WRITEMASK_XYZW;
-       s->Outputs[FRAG_RESULT_DEPTH].Sourced = WRITEMASK_W;
+       struct r300_fragment_program_compiler * c = userdata;
+       callback(data, c->OutputColor, RC_MASK_XYZW);
+       callback(data, c->OutputDepth, RC_MASK_W);
 }
 
-/**
- * Transform the program to support fragment.position.
- *
- * Introduce a small fragment at the start of the program that will be
- * the only code that directly reads the FRAG_ATTRIB_WPOS input.
- * All other code pieces that reference that input will be rewritten
- * to read from a newly allocated temporary.
- *
- */
-static void insert_WPOS_trailer(struct r300_fragment_program_compiler *compiler)
-{
-       int i;
-
-       if (!(compiler->Base.Program.InputsRead & FRAG_BIT_WPOS)) {
-               compiler->code->wpos_attr = FRAG_ATTRIB_MAX;
-               return;
-       }
-
-       for (i = FRAG_ATTRIB_TEX0; i <= FRAG_ATTRIB_TEX7; ++i)
-       {
-               if (!(compiler->Base.Program.InputsRead & (1 << i))) {
-                       compiler->code->wpos_attr = i;
-                       break;
-               }
-       }
-
-       rc_transform_fragment_wpos(&compiler->Base, FRAG_ATTRIB_WPOS, compiler->code->wpos_attr);
-}
-
-/**
- * Rewrite fragment.fogcoord to use a texture coordinate slot.
- * Note that fogcoord is forced into an X001 pattern, and this enforcement
- * is done here.
- *
- * See also the counterpart rewriting for vertex programs.
- */
-static void rewriteFog(struct r300_fragment_program_compiler *compiler)
-{
-       struct rX00_fragment_program_code *code = compiler->code;
-       struct prog_src_register src;
-       int i;
-
-       if (!(compiler->Base.Program.InputsRead & FRAG_BIT_FOGC)) {
-               code->fog_attr = FRAG_ATTRIB_MAX;
-               return;
-       }
-
-       for (i = FRAG_ATTRIB_TEX0; i <= FRAG_ATTRIB_TEX7; ++i)
-       {
-               if (!(compiler->Base.Program.InputsRead & (1 << i))) {
-                       code->fog_attr = i;
-                       break;
-               }
-       }
-
-       reset_srcreg(&src);
-       src.File = PROGRAM_INPUT;
-       src.Index = code->fog_attr;
-       src.Swizzle = MAKE_SWIZZLE4(SWIZZLE_X, SWIZZLE_ZERO, SWIZZLE_ZERO, SWIZZLE_ONE);
-       rc_move_input(&compiler->Base, FRAG_ATTRIB_FOGC, src);
-}
-
-
 static void rewrite_depth_out(struct r300_fragment_program_compiler * c)
 {
        struct rc_instruction *rci;
 
        for (rci = c->Base.Program.Instructions.Next; rci != &c->Base.Program.Instructions; rci = rci->Next) {
-               struct prog_instruction * inst = &rci->I;
+               struct rc_sub_instruction * inst = &rci->I;
 
-               if (inst->DstReg.File != PROGRAM_OUTPUT || inst->DstReg.Index != FRAG_RESULT_DEPTH)
+               if (inst->DstReg.File != RC_FILE_OUTPUT || inst->DstReg.Index != c->OutputDepth)
                        continue;
 
-               if (inst->DstReg.WriteMask & WRITEMASK_Z) {
-                       inst->DstReg.WriteMask = WRITEMASK_W;
+               if (inst->DstReg.WriteMask & RC_MASK_Z) {
+                       inst->DstReg.WriteMask = RC_MASK_W;
                } else {
                        inst->DstReg.WriteMask = 0;
                        continue;
                }
 
                switch (inst->Opcode) {
-                       case OPCODE_FRC:
-                       case OPCODE_MOV:
-                               inst->SrcReg[0] = lmul_swizzle(SWIZZLE_ZZZZ, inst->SrcReg[0]);
+                       case RC_OPCODE_FRC:
+                       case RC_OPCODE_MOV:
+                               inst->SrcReg[0] = lmul_swizzle(RC_SWIZZLE_ZZZZ, inst->SrcReg[0]);
                                break;
-                       case OPCODE_ADD:
-                       case OPCODE_MAX:
-                       case OPCODE_MIN:
-                       case OPCODE_MUL:
-                               inst->SrcReg[0] = lmul_swizzle(SWIZZLE_ZZZZ, inst->SrcReg[0]);
-                               inst->SrcReg[1] = lmul_swizzle(SWIZZLE_ZZZZ, inst->SrcReg[1]);
+                       case RC_OPCODE_ADD:
+                       case RC_OPCODE_MAX:
+                       case RC_OPCODE_MIN:
+                       case RC_OPCODE_MUL:
+                               inst->SrcReg[0] = lmul_swizzle(RC_SWIZZLE_ZZZZ, inst->SrcReg[0]);
+                               inst->SrcReg[1] = lmul_swizzle(RC_SWIZZLE_ZZZZ, inst->SrcReg[1]);
                                break;
-                       case OPCODE_CMP:
-                       case OPCODE_MAD:
-                               inst->SrcReg[0] = lmul_swizzle(SWIZZLE_ZZZZ, inst->SrcReg[0]);
-                               inst->SrcReg[1] = lmul_swizzle(SWIZZLE_ZZZZ, inst->SrcReg[1]);
-                               inst->SrcReg[2] = lmul_swizzle(SWIZZLE_ZZZZ, inst->SrcReg[2]);
+                       case RC_OPCODE_CMP:
+                       case RC_OPCODE_MAD:
+                               inst->SrcReg[0] = lmul_swizzle(RC_SWIZZLE_ZZZZ, inst->SrcReg[0]);
+                               inst->SrcReg[1] = lmul_swizzle(RC_SWIZZLE_ZZZZ, inst->SrcReg[1]);
+                               inst->SrcReg[2] = lmul_swizzle(RC_SWIZZLE_ZZZZ, inst->SrcReg[2]);
                                break;
                        default:
                                // Scalar instructions needn't be reswizzled
@@ -146,19 +83,6 @@ static void rewrite_depth_out(struct r300_fragment_program_compiler * c)
 
 void r3xx_compile_fragment_program(struct r300_fragment_program_compiler* c)
 {
-       if (c->Base.Debug) {
-               fflush(stdout);
-               _mesa_printf("Fragment Program: Initial program:\n");
-               _mesa_print_program(c->program);
-               fflush(stdout);
-       }
-
-       rc_mesa_to_rc_program(&c->Base, c->program);
-
-       insert_WPOS_trailer(c);
-
-       rewriteFog(c);
-
        rewrite_depth_out(c);
 
        if (c->is_r500) {
@@ -169,6 +93,8 @@ void r3xx_compile_fragment_program(struct r300_fragment_program_compiler* c)
                        { &radeonTransformTrigScale, 0 }
                };
                radeonLocalTransform(&c->Base, 4, transformations);
+
+               c->Base.SwizzleCaps = &r500_swizzle_caps;
        } else {
                struct radeon_program_transformation transformations[] = {
                        { &r300_transform_TEX, c },
@@ -176,34 +102,30 @@ void r3xx_compile_fragment_program(struct r300_fragment_program_compiler* c)
                        { &radeonTransformTrigSimple, 0 }
                };
                radeonLocalTransform(&c->Base, 3, transformations);
+
+               c->Base.SwizzleCaps = &r300_swizzle_caps;
        }
 
        if (c->Base.Debug) {
-               _mesa_printf("Fragment Program: After native rewrite:\n");
+               fprintf(stderr, "Fragment Program: After native rewrite:\n");
                rc_print_program(&c->Base.Program);
-               fflush(stdout);
+               fflush(stderr);
        }
 
-       if (c->is_r500) {
-               struct radeon_nqssadce_descr nqssadce = {
-                       .Init = &nqssadce_init,
-                       .IsNativeSwizzle = &r500FPIsNativeSwizzle,
-                       .BuildSwizzle = &r500FPBuildSwizzle
-               };
-               radeonNqssaDce(&c->Base, &nqssadce, 0);
-       } else {
-               struct radeon_nqssadce_descr nqssadce = {
-                       .Init = &nqssadce_init,
-                       .IsNativeSwizzle = &r300FPIsNativeSwizzle,
-                       .BuildSwizzle = &r300FPBuildSwizzle
-               };
-               radeonNqssaDce(&c->Base, &nqssadce, 0);
+       rc_dataflow_deadcode(&c->Base, &dataflow_outputs_mark_use, c);
+
+       if (c->Base.Debug) {
+               fprintf(stderr, "Fragment Program: After deadcode:\n");
+               rc_print_program(&c->Base.Program);
+               fflush(stderr);
        }
 
+       rc_dataflow_swizzles(&c->Base);
+
        if (c->Base.Debug) {
-               _mesa_printf("Compiler: after NqSSA-DCE:\n");
+               fprintf(stderr, "Compiler: after dataflow passes:\n");
                rc_print_program(&c->Base.Program);
-               fflush(stdout);
+               fflush(stderr);
        }
 
        if (c->is_r500) {