Move the remaining format pf_get_* functions to u_format.h.

[mesa.git] / src / gallium / drivers / llvmpipe / lp_setup.c
diff --git a/src/gallium/drivers/llvmpipe/lp_setup.c b/src/gallium/drivers/llvmpipe/lp_setup.c

index 2d2fc19a65fe00f806867690d85623004dade7ff..b18f17c0cd34a2ef76f1b01e360d0f58b9d612d3 100644 (file)
--- a/src/gallium/drivers/llvmpipe/lp_setup.c
+++ b/src/gallium/drivers/llvmpipe/lp_setup.c
@@ -33,7 +33,6 @@
   */
  
  #include "lp_context.h"
-#include "lp_prim_setup.h"
  #include "lp_quad.h"
  #include "lp_setup.h"
  #include "lp_state.h"
@@ -42,6 +41,7 @@
  #include "draw/draw_vertex.h"
  #include "pipe/p_shader_tokens.h"
  #include "pipe/p_thread.h"
+#include "util/u_format.h"
  #include "util/u_math.h"
  #include "util/u_memory.h"
  #include "lp_bld_debug.h"
@@ -90,6 +90,8 @@ struct setup_context {
     float oneoverarea;
     int facing;
  
+   float pixel_offset;
+
     struct quad_header quad[MAX_QUADS];
     struct quad_header *quad_ptrs[MAX_QUADS];
     unsigned count;
@@ -115,6 +117,7 @@ struct setup_context {
  /**
   * Execute fragment shader for the four fragments in the quad.
   */
+ALIGN_STACK
  static void
  shade_quads(struct llvmpipe_context *llvmpipe,
              struct quad_header *quads[],
@@ -124,7 +127,7 @@ shade_quads(struct llvmpipe_context *llvmpipe,
     struct quad_header *quad = quads[0];
     const unsigned x = quad->input.x0;
     const unsigned y = quad->input.y0;
-   uint8_t *tile = lp_get_cached_tile(llvmpipe->cbuf_cache[0], x, y);
+   uint8_t *tile;
     uint8_t *color;
     void *depth;
     uint32_t ALIGN16_ATTRIB mask[4][NUM_CHANNELS];
@@ -150,7 +153,13 @@ shade_quads(struct llvmpipe_context *llvmpipe,
           mask[q][chan_index] = quads[q]->inout.mask & (1 << chan_index) ? ~0 : 0;
  
     /* color buffer */
-   color = &TILE_PIXEL(tile, x & (TILE_SIZE-1), y & (TILE_SIZE-1), 0);
+   if(llvmpipe->framebuffer.nr_cbufs >= 1 &&
+      llvmpipe->framebuffer.cbufs[0]) {
+      tile = lp_get_cached_tile(llvmpipe->cbuf_cache[0], x, y);
+      color = &TILE_PIXEL(tile, x & (TILE_SIZE-1), y & (TILE_SIZE-1), 0);
+   }
+   else
+      color = NULL;
  
     /* depth buffer */
     if(llvmpipe->zsbuf_map) {
@@ -158,7 +167,7 @@ shade_quads(struct llvmpipe_context *llvmpipe,
        assert((y % 2) == 0);
        depth = llvmpipe->zsbuf_map +
                y*llvmpipe->zsbuf_transfer->stride +
-              2*x*llvmpipe->zsbuf_transfer->block.size;
+              2*x*util_format_get_blocksize(llvmpipe->zsbuf_transfer->texture->format);
     }
     else
        depth = NULL;
@@ -271,11 +280,13 @@ clip_emit_quad( struct setup_context *setup, struct quad_header *quad )
         * until we codegenerate single-quad variants of the fragment pipeline
         * we need this hack. */
        const unsigned nr_quads = TILE_VECTOR_HEIGHT*TILE_VECTOR_WIDTH/QUAD_SIZE;
-      struct quad_header quads[nr_quads];
-      struct quad_header *quad_ptrs[nr_quads];
+      struct quad_header quads[4];
+      struct quad_header *quad_ptrs[4];
        int x0 = block_x(quad->input.x0);
        unsigned i;
  
+      assert(nr_quads == 4);
+
        for(i = 0; i < nr_quads; ++i) {
           int x = x0 + 2*i;
           if(x == quad->input.x0)
@@ -474,6 +485,16 @@ static boolean setup_sort_vertices( struct setup_context *setup,
        ((det > 0.0) ^ 
         (setup->llvmpipe->rasterizer->front_winding == PIPE_WINDING_CW));
  
+   /* Prepare pixel offset for rasterisation:
+    *  - pixel center (0.5, 0.5) for GL, or
+    *  - assume (0.0, 0.0) for other APIs.
+    */
+   if (setup->llvmpipe->rasterizer->gl_rasterization_rules) {
+      setup->pixel_offset = 0.5f;
+   } else {
+      setup->pixel_offset = 0.0f;
+   }
+
     return TRUE;
  }
  
@@ -499,7 +520,7 @@ static void tri_pos_coeff( struct setup_context *setup,
  
     /* calculate a0 as the value which would be sampled for the
      * fragment at (0,0), taking into account that we want to sample at
-    * pixel centers, in other words (0.5, 0.5).
+    * pixel centers, in other words (pixel_offset, pixel_offset).
      *
      * this is neat but unfortunately not a good way to do things for
      * triangles with very large values of dadx or dady as it will
@@ -510,8 +531,8 @@ static void tri_pos_coeff( struct setup_context *setup,
      * instead - i'll switch to this later.
      */
     setup->coef.a0[0][i] = (setup->vmin[vertSlot][i] -
-                           (dadx * (setup->vmin[0][0] - 0.5f) +
-                            dady * (setup->vmin[0][1] - 0.5f)));
+                           (dadx * (setup->vmin[0][0] - setup->pixel_offset) +
+                            dady * (setup->vmin[0][1] - setup->pixel_offset)));
  
     /*
     debug_printf("attr[%d].%c: %f dx:%f dy:%f\n",
@@ -600,8 +621,8 @@ static void tri_linear_coeff( struct setup_context *setup,
         * instead - i'll switch to this later.
         */
        setup->coef.a0[1 + attrib][i] = (setup->vmin[vertSlot][i] -
-                     (dadx * (setup->vmin[0][0] - 0.5f) +
-                      dady * (setup->vmin[0][1] - 0.5f)));
+                     (dadx * (setup->vmin[0][0] - setup->pixel_offset) +
+                      dady * (setup->vmin[0][1] - setup->pixel_offset)));
  
        /*
        debug_printf("attr[%d].%c: %f dx:%f dy:%f\n",
@@ -652,8 +673,8 @@ static void tri_persp_coeff( struct setup_context *setup,
        setup->coef.dadx[1 + attrib][i] = dadx;
        setup->coef.dady[1 + attrib][i] = dady;
        setup->coef.a0[1 + attrib][i] = (mina -
-                     (dadx * (setup->vmin[0][0] - 0.5f) +
-                      dady * (setup->vmin[0][1] - 0.5f)));
+                     (dadx * (setup->vmin[0][0] - setup->pixel_offset) +
+                      dady * (setup->vmin[0][1] - setup->pixel_offset)));
     }
  }
  
@@ -737,12 +758,12 @@ static void setup_tri_coefficients( struct setup_context *setup )
  
  static void setup_tri_edges( struct setup_context *setup )
  {
-   float vmin_x = setup->vmin[0][0] + 0.5f;
-   float vmid_x = setup->vmid[0][0] + 0.5f;
+   float vmin_x = setup->vmin[0][0] + setup->pixel_offset;
+   float vmid_x = setup->vmid[0][0] + setup->pixel_offset;
  
-   float vmin_y = setup->vmin[0][1] - 0.5f;
-   float vmid_y = setup->vmid[0][1] - 0.5f;
-   float vmax_y = setup->vmax[0][1] - 0.5f;
+   float vmin_y = setup->vmin[0][1] - setup->pixel_offset;
+   float vmid_y = setup->vmid[0][1] - setup->pixel_offset;
+   float vmax_y = setup->vmax[0][1] - setup->pixel_offset;
  
     setup->emaj.sy = ceilf(vmin_y);
     setup->emaj.lines = (int) ceilf(vmax_y - setup->emaj.sy);
@@ -941,8 +962,8 @@ linear_pos_coeff(struct setup_context *setup,
     setup->coef.dadx[0][i] = dadx;
     setup->coef.dady[0][i] = dady;
     setup->coef.a0[0][i] = (setup->vmin[vertSlot][i] -
-                           (dadx * (setup->vmin[0][0] - 0.5f) +
-                            dady * (setup->vmin[0][1] - 0.5f)));
+                           (dadx * (setup->vmin[0][0] - setup->pixel_offset) +
+                            dady * (setup->vmin[0][1] - setup->pixel_offset)));
  }
  
  
@@ -963,8 +984,8 @@ line_linear_coeff(struct setup_context *setup,
        setup->coef.dadx[1 + attrib][i] = dadx;
        setup->coef.dady[1 + attrib][i] = dady;
        setup->coef.a0[1 + attrib][i] = (setup->vmin[vertSlot][i] -
-                     (dadx * (setup->vmin[0][0] - 0.5f) +
-                      dady * (setup->vmin[0][1] - 0.5f)));
+                     (dadx * (setup->vmin[0][0] - setup->pixel_offset) +
+                      dady * (setup->vmin[0][1] - setup->pixel_offset)));
     }
  }
  
@@ -989,8 +1010,8 @@ line_persp_coeff(struct setup_context *setup,
        setup->coef.dadx[1 + attrib][i] = dadx;
        setup->coef.dady[1 + attrib][i] = dady;
        setup->coef.a0[1 + attrib][i] = (setup->vmin[vertSlot][i] -
-                     (dadx * (setup->vmin[0][0] - 0.5f) +
-                      dady * (setup->vmin[0][1] - 0.5f)));
+                     (dadx * (setup->vmin[0][0] - setup->pixel_offset) +
+                      dady * (setup->vmin[0][1] - setup->pixel_offset)));
     }
  }