i965g: Add missing va_end.

[mesa.git] / src / gallium / drivers / i965 / brw_wm_emit.c
diff --git a/src/gallium/drivers/i965/brw_wm_emit.c b/src/gallium/drivers/i965/brw_wm_emit.c

index fec33f74ebc2e74aebb1b1547a0bd2473aa281dc..8f983a60ae86fbcd3b3bc3ad261e48b232aa788e 100644 (file)
--- a/src/gallium/drivers/i965/brw_wm_emit.c
+++ b/src/gallium/drivers/i965/brw_wm_emit.c
@@ -28,10 +28,14 @@
    * Authors:
    *   Keith Whitwell <keith@tungstengraphics.com>
    */
-               
+
+#include "util/u_math.h"
+#include "tgsi/tgsi_info.h"
  
  #include "brw_context.h"
  #include "brw_wm.h"
+#include "brw_debug.h"
+#include "brw_disasm.h"
  
  /* Not quite sure how correct this is - need to understand horiz
   * vs. vertical strides a little better.
@@ -45,15 +49,15 @@ static INLINE struct brw_reg sechalf( struct brw_reg reg )
  
  /* Payload R0:
   *
- * R0.0 -- pixel mask, one bit for each of 4 pixels in 4 tiles,
+ * R0.0 -- pixel mask, one bit for each of 4 pixels in 4 quads,
   *         corresponding to each of the 16 execution channels.
   * R0.1..8 -- ?
   * R1.0 -- triangle vertex 0.X
   * R1.1 -- triangle vertex 0.Y
- * R1.2 -- tile 0 x,y coords (2 packed uwords)
- * R1.3 -- tile 1 x,y coords (2 packed uwords)
- * R1.4 -- tile 2 x,y coords (2 packed uwords)
- * R1.5 -- tile 3 x,y coords (2 packed uwords)
+ * R1.2 -- quad 0 x,y coords (2 packed uwords)
+ * R1.3 -- quad 1 x,y coords (2 packed uwords)
+ * R1.4 -- quad 2 x,y coords (2 packed uwords)
+ * R1.5 -- quad 3 x,y coords (2 packed uwords)
   * R1.6 -- ?
   * R1.7 -- ?
   * R1.8 -- ?
@@ -72,14 +76,14 @@ static void emit_pixel_xy(struct brw_compile *p,
     /* Calculate pixel centers by adding 1 or 0 to each of the
      * micro-tile coordinates passed in r1.
      */
-   if (mask & WRITEMASK_X) {
+   if (mask & BRW_WRITEMASK_X) {
        brw_ADD(p,
               vec16(retype(dst[0], BRW_REGISTER_TYPE_UW)),
               stride(suboffset(r1_uw, 4), 2, 4, 0),
               brw_imm_v(0x10101010));
     }
  
-   if (mask & WRITEMASK_Y) {
+   if (mask & BRW_WRITEMASK_Y) {
        brw_ADD(p,
               vec16(retype(dst[1], BRW_REGISTER_TYPE_UW)),
               stride(suboffset(r1_uw,5), 2, 4, 0),
@@ -101,14 +105,14 @@ static void emit_delta_xy(struct brw_compile *p,
     /* Calc delta X,Y by subtracting origin in r1 from the pixel
      * centers.
      */
-   if (mask & WRITEMASK_X) {
+   if (mask & BRW_WRITEMASK_X) {
        brw_ADD(p,
               dst[0],
               retype(arg0[0], BRW_REGISTER_TYPE_UW),
               negate(r1));
     }
  
-   if (mask & WRITEMASK_Y) {
+   if (mask & BRW_WRITEMASK_Y) {
        brw_ADD(p,
               dst[1],
               retype(arg0[1], BRW_REGISTER_TYPE_UW),
@@ -124,7 +128,7 @@ static void emit_wpos_xy(struct brw_wm_compile *c,
  {
     struct brw_compile *p = &c->func;
  
-   if (mask & WRITEMASK_X) {
+   if (mask & BRW_WRITEMASK_X) {
        /* X' = X */
        brw_MOV(p,
               dst[0],
@@ -133,12 +137,18 @@ static void emit_wpos_xy(struct brw_wm_compile *c,
  
     /* XXX: is this needed any more, or is this a NOOP?
      */
-   if (mask & WRITEMASK_Y) {
+   if (mask & BRW_WRITEMASK_Y) {
+#if 0
        /* Y' = height - 1 - Y */
        brw_ADD(p,
               dst[1],
               negate(retype(arg0[1], BRW_REGISTER_TYPE_W)),
               brw_imm_d(c->key.drawable_height - 1));
+#else
+      brw_MOV(p,
+             dst[0],
+             retype(arg0[0], BRW_REGISTER_TYPE_W));
+#endif
     }
  }
  
@@ -152,7 +162,7 @@ static void emit_pixel_w( struct brw_compile *p,
     /* Don't need this if all you are doing is interpolating color, for
      * instance.
      */
-   if (mask & WRITEMASK_W) {      
+   if (mask & BRW_WRITEMASK_W) {      
        struct brw_reg interp3 = brw_vec1_grf(arg0[0].nr+1, 4);
  
        /* Calc 1/w - just linterp wpos[3] optimized by putting the
@@ -255,7 +265,7 @@ static void emit_frontfacing( struct brw_compile *p,
     struct brw_reg r1_6ud = retype(brw_vec1_grf(1, 6), BRW_REGISTER_TYPE_UD);
     GLuint i;
  
-   if (!(mask & WRITEMASK_XYZW))
+   if (!(mask & BRW_WRITEMASK_XYZW))
        return;
  
     for (i = 0; i < 4; i++) {
@@ -279,28 +289,28 @@ static void emit_frontfacing( struct brw_compile *p,
  /* For OPCODE_DDX and OPCODE_DDY, per channel of output we've got input
   * looking like:
   *
- * arg0: ss0.tl ss0.tr ss0.bl ss0.br ss1.tl ss1.tr ss1.bl ss1.br
+ * arg0: q0.tl q0.tr q0.bl q0.br q1.tl q1.tr q1.bl q1.br
   *
   * and we're trying to produce:
   *
   *           DDX                     DDY
- * dst: (ss0.tr - ss0.tl)     (ss0.tl - ss0.bl)
- *      (ss0.tr - ss0.tl)     (ss0.tr - ss0.br)
- *      (ss0.br - ss0.bl)     (ss0.tl - ss0.bl)
- *      (ss0.br - ss0.bl)     (ss0.tr - ss0.br)
- *      (ss1.tr - ss1.tl)     (ss1.tl - ss1.bl)
- *      (ss1.tr - ss1.tl)     (ss1.tr - ss1.br)
- *      (ss1.br - ss1.bl)     (ss1.tl - ss1.bl)
- *      (ss1.br - ss1.bl)     (ss1.tr - ss1.br)
+ * dst: (q0.tr - q0.tl)     (q0.tl - q0.bl)
+ *      (q0.tr - q0.tl)     (q0.tr - q0.br)
+ *      (q0.br - q0.bl)     (q0.tl - q0.bl)
+ *      (q0.br - q0.bl)     (q0.tr - q0.br)
+ *      (q1.tr - q1.tl)     (q1.tl - q1.bl)
+ *      (q1.tr - q1.tl)     (q1.tr - q1.br)
+ *      (q1.br - q1.bl)     (q1.tl - q1.bl)
+ *      (q1.br - q1.bl)     (q1.tr - q1.br)
   *
- * and add another set of two more subspans if in 16-pixel dispatch mode.
+ * and add two more quads if in 16-pixel dispatch mode.
   *
   * For DDX, it ends up being easy: width = 2, horiz=0 gets us the same result
   * for each pair, and vertstride = 2 jumps us 2 elements after processing a
   * pair. But for DDY, it's harder, as we want to produce the pairs swizzled
   * between each other.  We could probably do it like ddx and swizzle the right
   * order later, but bail for now and just produce
- * ((ss0.tl - ss0.bl)x4 (ss1.tl - ss1.bl)x4)
+ * ((q0.tl - q0.bl)x4 (q1.tl - q1.bl)x4)
   */
  void emit_ddxy(struct brw_compile *p,
                const struct brw_reg *dst,
@@ -321,26 +331,26 @@ void emit_ddxy(struct brw_compile *p,
                            BRW_VERTICAL_STRIDE_2,
                            BRW_WIDTH_2,
                            BRW_HORIZONTAL_STRIDE_0,
-                          BRW_SWIZZLE_XYZW, WRITEMASK_XYZW);
+                          BRW_SWIZZLE_XYZW, BRW_WRITEMASK_XYZW);
             src1 = brw_reg(arg0[i].file, arg0[i].nr, 0,
                            BRW_REGISTER_TYPE_F,
                            BRW_VERTICAL_STRIDE_2,
                            BRW_WIDTH_2,
                            BRW_HORIZONTAL_STRIDE_0,
-                          BRW_SWIZZLE_XYZW, WRITEMASK_XYZW);
+                          BRW_SWIZZLE_XYZW, BRW_WRITEMASK_XYZW);
          } else {
             src0 = brw_reg(arg0[i].file, arg0[i].nr, 0,
                            BRW_REGISTER_TYPE_F,
                            BRW_VERTICAL_STRIDE_4,
                            BRW_WIDTH_4,
                            BRW_HORIZONTAL_STRIDE_0,
-                          BRW_SWIZZLE_XYZW, WRITEMASK_XYZW);
+                          BRW_SWIZZLE_XYZW, BRW_WRITEMASK_XYZW);
             src1 = brw_reg(arg0[i].file, arg0[i].nr, 2,
                            BRW_REGISTER_TYPE_F,
                            BRW_VERTICAL_STRIDE_4,
                            BRW_WIDTH_4,
                            BRW_HORIZONTAL_STRIDE_0,
-                          BRW_SWIZZLE_XYZW, WRITEMASK_XYZW);
+                          BRW_SWIZZLE_XYZW, BRW_WRITEMASK_XYZW);
          }
          brw_ADD(p, dst[i], src0, negate(src1));
        }
@@ -611,12 +621,12 @@ static void emit_dp3( struct brw_compile *p,
                       const struct brw_reg *arg0,
                       const struct brw_reg *arg1 )
  {
-   int dst_chan = _mesa_ffs(mask & WRITEMASK_XYZW) - 1;
+   int dst_chan = ffs(mask & BRW_WRITEMASK_XYZW) - 1;
  
-   if (!(mask & WRITEMASK_XYZW))
+   if (!(mask & BRW_WRITEMASK_XYZW))
        return; /* Do not emit dead code */
  
-   assert(is_power_of_two(mask & WRITEMASK_XYZW));
+   assert(util_is_power_of_two(mask & BRW_WRITEMASK_XYZW));
  
     brw_MUL(p, brw_null_reg(), arg0[0], arg1[0]);
     brw_MAC(p, brw_null_reg(), arg0[1], arg1[1]);
@@ -633,12 +643,12 @@ static void emit_dp4( struct brw_compile *p,
                       const struct brw_reg *arg0,
                       const struct brw_reg *arg1 )
  {
-   int dst_chan = _mesa_ffs(mask & WRITEMASK_XYZW) - 1;
+   int dst_chan = ffs(mask & BRW_WRITEMASK_XYZW) - 1;
  
-   if (!(mask & WRITEMASK_XYZW))
+   if (!(mask & BRW_WRITEMASK_XYZW))
        return; /* Do not emit dead code */
  
-   assert(is_power_of_two(mask & WRITEMASK_XYZW));
+   assert(util_is_power_of_two(mask & BRW_WRITEMASK_XYZW));
  
     brw_MUL(p, brw_null_reg(), arg0[0], arg1[0]);
     brw_MAC(p, brw_null_reg(), arg0[1], arg1[1]);
@@ -656,12 +666,12 @@ static void emit_dph( struct brw_compile *p,
                       const struct brw_reg *arg0,
                       const struct brw_reg *arg1 )
  {
-   const int dst_chan = _mesa_ffs(mask & WRITEMASK_XYZW) - 1;
+   const int dst_chan = ffs(mask & BRW_WRITEMASK_XYZW) - 1;
  
-   if (!(mask & WRITEMASK_XYZW))
+   if (!(mask & BRW_WRITEMASK_XYZW))
        return; /* Do not emit dead code */
  
-   assert(is_power_of_two(mask & WRITEMASK_XYZW));
+   assert(util_is_power_of_two(mask & BRW_WRITEMASK_XYZW));
  
     brw_MUL(p, brw_null_reg(), arg0[0], arg1[0]);
     brw_MAC(p, brw_null_reg(), arg0[1], arg1[1]);
@@ -681,7 +691,7 @@ static void emit_xpd( struct brw_compile *p,
  {
     GLuint i;
  
-   assert(!(mask & WRITEMASK_W) == WRITEMASK_X);
+   assert((mask & BRW_WRITEMASK_W) != BRW_WRITEMASK_W);
     
     for (i = 0 ; i < 3; i++) {
        if (mask & (1<<i)) {
@@ -704,12 +714,12 @@ static void emit_math1( struct brw_compile *p,
                         GLuint mask,
                         const struct brw_reg *arg0 )
  {
-   int dst_chan = _mesa_ffs(mask & WRITEMASK_XYZW) - 1;
+   int dst_chan = ffs(mask & BRW_WRITEMASK_XYZW) - 1;
  
-   if (!(mask & WRITEMASK_XYZW))
+   if (!(mask & BRW_WRITEMASK_XYZW))
        return; /* Do not emit dead code */
  
-   assert(is_power_of_two(mask & WRITEMASK_XYZW));
+   assert(util_is_power_of_two(mask & BRW_WRITEMASK_XYZW));
  
     brw_MOV(p, brw_message_reg(2), arg0[0]);
  
@@ -732,12 +742,12 @@ static void emit_math2( struct brw_compile *p,
                         const struct brw_reg *arg0,
                         const struct brw_reg *arg1)
  {
-   int dst_chan = _mesa_ffs(mask & WRITEMASK_XYZW) - 1;
+   int dst_chan = ffs(mask & BRW_WRITEMASK_XYZW) - 1;
  
-   if (!(mask & WRITEMASK_XYZW))
+   if (!(mask & BRW_WRITEMASK_XYZW))
        return; /* Do not emit dead code */
  
-   assert(is_power_of_two(mask & WRITEMASK_XYZW));
+   assert(util_is_power_of_two(mask & BRW_WRITEMASK_XYZW));
  
     brw_push_insn_state(p);
  
@@ -783,29 +793,41 @@ static void emit_tex( struct brw_wm_compile *c,
                       const struct brw_wm_instruction *inst,
                       struct brw_reg *dst,
                       GLuint dst_flags,
-                     struct brw_reg *arg )
+                     struct brw_reg *coord,
+                     GLuint sampler)
  {
     struct brw_compile *p = &c->func;
     GLuint msgLength, responseLength;
     GLuint i, nr;
     GLuint emit;
     GLuint msg_type;
+   GLboolean shadow = FALSE;
  
     /* How many input regs are there?
      */
-   switch (inst->tex_idx) {
-   case TEXTURE_1D_INDEX:
-      emit = WRITEMASK_X;
+   switch (inst->target) {
+   case TGSI_TEXTURE_1D:
+      emit = BRW_WRITEMASK_X;
        nr = 1;
        break;
-   case TEXTURE_2D_INDEX:
-   case TEXTURE_RECT_INDEX:
-      emit = WRITEMASK_XY;
+   case TGSI_TEXTURE_SHADOW1D:
+      emit = BRW_WRITEMASK_XW;
+      nr = 4;
+      shadow = TRUE;
+      break;
+   case TGSI_TEXTURE_2D:
+      emit = BRW_WRITEMASK_XY;
        nr = 2;
        break;
-   case TEXTURE_3D_INDEX:
-   case TEXTURE_CUBE_INDEX:
-      emit = WRITEMASK_XYZ;
+   case TGSI_TEXTURE_SHADOW2D:
+   case TGSI_TEXTURE_SHADOWRECT:
+      emit = BRW_WRITEMASK_XYW;
+      nr = 4;
+      shadow = TRUE;
+      break;
+   case TGSI_TEXTURE_3D:
+   case TGSI_TEXTURE_CUBE:
+      emit = BRW_WRITEMASK_XYZ;
        nr = 3;
        break;
     default:
@@ -813,17 +835,12 @@ static void emit_tex( struct brw_wm_compile *c,
        abort();
     }
  
-   if (inst->tex_shadow) {
-      nr = 4;
-      emit |= WRITEMASK_W;
-   }
-
     msgLength = 1;
  
     for (i = 0; i < nr; i++) {
        static const GLuint swz[4] = {0,1,2,2};
        if (emit & (1<<i)) 
-        brw_MOV(p, brw_message_reg(msgLength+1), arg[swz[i]]);
+        brw_MOV(p, brw_message_reg(msgLength+1), coord[swz[i]]);
        else
          brw_MOV(p, brw_message_reg(msgLength+1), brw_imm_f(0));
        msgLength += 2;
@@ -832,12 +849,12 @@ static void emit_tex( struct brw_wm_compile *c,
     responseLength = 8;         /* always */
  
     if (BRW_IS_IGDNG(p->brw)) {
-       if (inst->tex_shadow)
+       if (shadow)
             msg_type = BRW_SAMPLER_MESSAGE_SIMD16_SAMPLE_COMPARE_IGDNG;
         else
             msg_type = BRW_SAMPLER_MESSAGE_SIMD16_SAMPLE_IGDNG;
     } else {
-       if (inst->tex_shadow)
+       if (shadow)
             msg_type = BRW_SAMPLER_MESSAGE_SIMD16_SAMPLE_COMPARE;
         else
             msg_type = BRW_SAMPLER_MESSAGE_SIMD16_SAMPLE;
@@ -847,8 +864,8 @@ static void emit_tex( struct brw_wm_compile *c,
               retype(vec16(dst[0]), BRW_REGISTER_TYPE_UW),
               1,
               retype(c->payload.depth[0].hw_reg, BRW_REGISTER_TYPE_UW),
-              SURF_INDEX_TEXTURE(inst->tex_unit),
-             inst->tex_unit,     /* sampler */
+              BTI_TEXTURE(inst->tex_unit),
+             sampler,          /* sampler index */
               inst->writemask,
               msg_type, 
               responseLength,
@@ -863,37 +880,41 @@ static void emit_txb( struct brw_wm_compile *c,
                       const struct brw_wm_instruction *inst,
                       struct brw_reg *dst,
                       GLuint dst_flags,
-                     struct brw_reg *arg )
+                     struct brw_reg *coord,
+                     GLuint sampler )
  {
     struct brw_compile *p = &c->func;
     GLuint msgLength;
     GLuint msg_type;
     /* Shadow ignored for txb.
      */
-   switch (inst->tex_idx) {
-   case TEXTURE_1D_INDEX:
-      brw_MOV(p, brw_message_reg(2), arg[0]);
+   switch (inst->target) {
+   case TGSI_TEXTURE_1D:
+   case TGSI_TEXTURE_SHADOW1D:
+      brw_MOV(p, brw_message_reg(2), coord[0]);
        brw_MOV(p, brw_message_reg(4), brw_imm_f(0));
        brw_MOV(p, brw_message_reg(6), brw_imm_f(0));
        break;
-   case TEXTURE_2D_INDEX:
-   case TEXTURE_RECT_INDEX:
-      brw_MOV(p, brw_message_reg(2), arg[0]);
-      brw_MOV(p, brw_message_reg(4), arg[1]);
+   case TGSI_TEXTURE_2D:
+   case TGSI_TEXTURE_RECT:
+   case TGSI_TEXTURE_SHADOW2D:
+   case TGSI_TEXTURE_SHADOWRECT:
+      brw_MOV(p, brw_message_reg(2), coord[0]);
+      brw_MOV(p, brw_message_reg(4), coord[1]);
        brw_MOV(p, brw_message_reg(6), brw_imm_f(0));
        break;
-   case TEXTURE_3D_INDEX:
-   case TEXTURE_CUBE_INDEX:
-      brw_MOV(p, brw_message_reg(2), arg[0]);
-      brw_MOV(p, brw_message_reg(4), arg[1]);
-      brw_MOV(p, brw_message_reg(6), arg[2]);
+   case TGSI_TEXTURE_3D:
+   case TGSI_TEXTURE_CUBE:
+      brw_MOV(p, brw_message_reg(2), coord[0]);
+      brw_MOV(p, brw_message_reg(4), coord[1]);
+      brw_MOV(p, brw_message_reg(6), coord[2]);
        break;
     default:
        /* unexpected target */
        abort();
     }
  
-   brw_MOV(p, brw_message_reg(8), arg[3]);
+   brw_MOV(p, brw_message_reg(8), coord[3]);
     msgLength = 9;
  
     if (BRW_IS_IGDNG(p->brw))
@@ -905,8 +926,8 @@ static void emit_txb( struct brw_wm_compile *c,
               retype(vec16(dst[0]), BRW_REGISTER_TYPE_UW),
               1,
               retype(c->payload.depth[0].hw_reg, BRW_REGISTER_TYPE_UW),
-              SURF_INDEX_TEXTURE(inst->tex_unit),
-             inst->tex_unit,     /* sampler */
+              BTI_TEXTURE(inst->tex_unit),
+             sampler,          /* sampler index */
               inst->writemask,
               msg_type,
               8,                /* responseLength */
@@ -922,18 +943,18 @@ static void emit_lit( struct brw_compile *p,
                       GLuint mask,
                       const struct brw_reg *arg0 )
  {
-   assert((mask & WRITEMASK_XW) == 0);
+   assert((mask & BRW_WRITEMASK_XW) == 0);
  
-   if (mask & WRITEMASK_Y) {
+   if (mask & BRW_WRITEMASK_Y) {
        brw_set_saturate(p, (mask & SATURATE) ? 1 : 0);
        brw_MOV(p, dst[1], arg0[0]);
        brw_set_saturate(p, 0);
     }
  
-   if (mask & WRITEMASK_Z) {
+   if (mask & BRW_WRITEMASK_Z) {
        emit_math2(p, BRW_MATH_FUNCTION_POW,
                  &dst[2],
-                WRITEMASK_X | (mask & SATURATE),
+                BRW_WRITEMASK_X | (mask & SATURATE),
                  &arg0[1],
                  &arg0[3]);
     }
@@ -944,10 +965,10 @@ static void emit_lit( struct brw_compile *p,
      */
     brw_CMP(p, brw_null_reg(), BRW_CONDITIONAL_LE, arg0[0], brw_imm_f(0));
     {
-      if (mask & WRITEMASK_Y) 
+      if (mask & BRW_WRITEMASK_Y) 
          brw_MOV(p, dst[1], brw_imm_f(0));
  
-      if (mask & WRITEMASK_Z) 
+      if (mask & BRW_WRITEMASK_Z) 
          brw_MOV(p, dst[2], brw_imm_f(0)); 
     }
     brw_set_predicate_control(p, BRW_PREDICATE_NONE);
@@ -976,17 +997,17 @@ static void emit_kil( struct brw_wm_compile *c,
     }
  }
  
-/* KIL_NV kills the pixels that are currently executing, not based on a test
+/* KILLP kills the pixels that are currently executing, not based on a test
   * of the arguments.
   */
-static void emit_kil_nv( struct brw_wm_compile *c )
+static void emit_killp( struct brw_wm_compile *c )
  {
     struct brw_compile *p = &c->func;
     struct brw_reg r0uw = retype(brw_vec1_grf(0, 0), BRW_REGISTER_TYPE_UW);
  
     brw_push_insn_state(p);
     brw_set_mask_control(p, BRW_MASK_DISABLE);
-   brw_NOT(p, c->emit_mask_reg, brw_mask_reg(1)); //IMASK
+   brw_NOT(p, c->emit_mask_reg, brw_mask_reg(1)); /* IMASK */
     brw_AND(p, r0uw, c->emit_mask_reg, r0uw);
     brw_pop_insn_state(p);
  }
@@ -1259,7 +1280,7 @@ void brw_wm_emit( struct brw_wm_compile *c )
      */
     spill_values(c, c->payload.depth, 4);
     spill_values(c, c->creg, c->nr_creg);
-   spill_values(c, c->payload.input_interp, FRAG_ATTRIB_MAX);
+   spill_values(c, c->payload.input_interp, PIPE_MAX_SHADER_INPUTS);
     
  
     for (insn = 0; insn < c->nr_insns; insn++) {
@@ -1328,163 +1349,162 @@ void brw_wm_emit( struct brw_wm_compile *c )
  
          /* Straightforward arithmetic:
           */
-      case OPCODE_ADD:
+      case TGSI_OPCODE_ADD:
          emit_alu2(p, brw_ADD, dst, dst_flags, args[0], args[1]);
          break;
  
-      case OPCODE_FRC:
+      case TGSI_OPCODE_FRC:
          emit_alu1(p, brw_FRC, dst, dst_flags, args[0]);
          break;
  
-      case OPCODE_FLR:
+      case TGSI_OPCODE_FLR:
          emit_alu1(p, brw_RNDD, dst, dst_flags, args[0]);
          break;
  
-      case OPCODE_DDX:
+      case TGSI_OPCODE_DDX:
          emit_ddxy(p, dst, dst_flags, GL_TRUE, args[0]);
          break;
  
-      case OPCODE_DDY:
+      case TGSI_OPCODE_DDY:
          emit_ddxy(p, dst, dst_flags, GL_FALSE, args[0]);
          break;
  
-      case OPCODE_DP3:
+      case TGSI_OPCODE_DP3:
          emit_dp3(p, dst, dst_flags, args[0], args[1]);
          break;
  
-      case OPCODE_DP4:
+      case TGSI_OPCODE_DP4:
          emit_dp4(p, dst, dst_flags, args[0], args[1]);
          break;
  
-      case OPCODE_DPH:
+      case TGSI_OPCODE_DPH:
          emit_dph(p, dst, dst_flags, args[0], args[1]);
          break;
  
-      case OPCODE_TRUNC:
+      case TGSI_OPCODE_TRUNC:
          emit_trunc(p, dst, dst_flags, args[0]);
          break;
  
-      case OPCODE_LRP:
+      case TGSI_OPCODE_LRP:
          emit_lrp(p, dst, dst_flags, args[0], args[1], args[2]);
          break;
  
-      case OPCODE_MAD: 
+      case TGSI_OPCODE_MAD:    
          emit_mad(p, dst, dst_flags, args[0], args[1], args[2]);
          break;
  
-      case OPCODE_MOV:
+      case TGSI_OPCODE_MOV:
          emit_alu1(p, brw_MOV, dst, dst_flags, args[0]);
          break;
  
-      case OPCODE_MUL:
+      case TGSI_OPCODE_MUL:
          emit_alu2(p, brw_MUL, dst, dst_flags, args[0], args[1]);
          break;
  
-      case OPCODE_XPD:
+      case TGSI_OPCODE_XPD:
          emit_xpd(p, dst, dst_flags, args[0], args[1]);
          break;
  
          /* Higher math functions:
           */
-      case OPCODE_RCP:
+      case TGSI_OPCODE_RCP:
          emit_math1(p, BRW_MATH_FUNCTION_INV, dst, dst_flags, args[0]);
          break;
  
-      case OPCODE_RSQ:
+      case TGSI_OPCODE_RSQ:
          emit_math1(p, BRW_MATH_FUNCTION_RSQ, dst, dst_flags, args[0]);
          break;
  
-      case OPCODE_SIN:
+      case TGSI_OPCODE_SIN:
          emit_math1(p, BRW_MATH_FUNCTION_SIN, dst, dst_flags, args[0]);
          break;
  
-      case OPCODE_COS:
+      case TGSI_OPCODE_COS:
          emit_math1(p, BRW_MATH_FUNCTION_COS, dst, dst_flags, args[0]);
          break;
  
-      case OPCODE_EX2:
+      case TGSI_OPCODE_EX2:
          emit_math1(p, BRW_MATH_FUNCTION_EXP, dst, dst_flags, args[0]);
          break;
  
-      case OPCODE_LG2:
+      case TGSI_OPCODE_LG2:
          emit_math1(p, BRW_MATH_FUNCTION_LOG, dst, dst_flags, args[0]);
          break;
  
-      case OPCODE_SCS:
+      case TGSI_OPCODE_SCS:
          /* There is an scs math function, but it would need some
           * fixup for 16-element execution.
           */
-        if (dst_flags & WRITEMASK_X)
-           emit_math1(p, BRW_MATH_FUNCTION_COS, dst, (dst_flags&SATURATE)|WRITEMASK_X, args[0]);
-        if (dst_flags & WRITEMASK_Y)
-           emit_math1(p, BRW_MATH_FUNCTION_SIN, dst+1, (dst_flags&SATURATE)|WRITEMASK_X, args[0]);
+        if (dst_flags & BRW_WRITEMASK_X)
+           emit_math1(p, BRW_MATH_FUNCTION_COS, dst, (dst_flags&SATURATE)|BRW_WRITEMASK_X, args[0]);
+        if (dst_flags & BRW_WRITEMASK_Y)
+           emit_math1(p, BRW_MATH_FUNCTION_SIN, dst+1, (dst_flags&SATURATE)|BRW_WRITEMASK_X, args[0]);
          break;
  
-      case OPCODE_POW:
+      case TGSI_OPCODE_POW:
          emit_math2(p, BRW_MATH_FUNCTION_POW, dst, dst_flags, args[0], args[1]);
          break;
  
          /* Comparisons:
           */
-      case OPCODE_CMP:
+      case TGSI_OPCODE_CMP:
          emit_cmp(p, dst, dst_flags, args[0], args[1], args[2]);
          break;
  
-      case OPCODE_MAX:
+      case TGSI_OPCODE_MAX:
          emit_max(p, dst, dst_flags, args[0], args[1]);
          break;
  
-      case OPCODE_MIN:
+      case TGSI_OPCODE_MIN:
          emit_min(p, dst, dst_flags, args[0], args[1]);
          break;
  
-      case OPCODE_SLT:
+      case TGSI_OPCODE_SLT:
          emit_slt(p, dst, dst_flags, args[0], args[1]);
          break;
  
-      case OPCODE_SLE:
+      case TGSI_OPCODE_SLE:
          emit_sle(p, dst, dst_flags, args[0], args[1]);
         break;
-      case OPCODE_SGT:
+      case TGSI_OPCODE_SGT:
          emit_sgt(p, dst, dst_flags, args[0], args[1]);
         break;
-      case OPCODE_SGE:
+      case TGSI_OPCODE_SGE:
          emit_sge(p, dst, dst_flags, args[0], args[1]);
          break;
-      case OPCODE_SEQ:
+      case TGSI_OPCODE_SEQ:
          emit_seq(p, dst, dst_flags, args[0], args[1]);
         break;
-      case OPCODE_SNE:
+      case TGSI_OPCODE_SNE:
          emit_sne(p, dst, dst_flags, args[0], args[1]);
         break;
  
-      case OPCODE_LIT:
+      case TGSI_OPCODE_LIT:
          emit_lit(p, dst, dst_flags, args[0]);
          break;
  
          /* Texturing operations:
           */
-      case OPCODE_TEX:
-        emit_tex(c, inst, dst, dst_flags, args[0]);
+      case TGSI_OPCODE_TEX:
+        emit_tex(c, inst, dst, dst_flags, args[0], inst->sampler);
          break;
  
-      case OPCODE_TXB:
-        emit_txb(c, inst, dst, dst_flags, args[0]);
+      case TGSI_OPCODE_TXB:
+        emit_txb(c, inst, dst, dst_flags, args[0], inst->sampler);
          break;
  
-      case OPCODE_KIL:
+      case TGSI_OPCODE_KIL:
          emit_kil(c, args[0]);
          break;
  
-      case OPCODE_KIL_NV:
-        emit_kil_nv(c);
+      case TGSI_OPCODE_KILP:
+        emit_killp(c);
          break;
  
        default:
-        _mesa_printf("Unsupported opcode %i (%s) in fragment shader\n",
-                     inst->opcode, inst->opcode < MAX_OPCODE ?
-                                   _mesa_opcode_string(inst->opcode) :
-                                   "unknown");
+        debug_printf("Unsupported opcode %i (%s) in fragment shader\n",
+                     inst->opcode, 
+                     tgsi_get_opcode_info(inst->opcode)->mnemonic);
        }
        
        for (i = 0; i < 4; i++)
@@ -1494,12 +1514,8 @@ void brw_wm_emit( struct brw_wm_compile *c )
                       inst->dst[i]->spill_slot);
     }
  
-   if (INTEL_DEBUG & DEBUG_WM) {
-      int i;
-
-      _mesa_printf("wm-native:\n");
-      for (i = 0; i < p->nr_insn; i++)
-        brw_disasm(stderr, &p->store[i]);
-      _mesa_printf("\n");
+   if (BRW_DEBUG & DEBUG_WM) {
+      debug_printf("wm-native:\n");
+      brw_disasm(stderr, p->store, p->nr_insn);
     }
  }