*
**************************************************************************/
+/**
+ * The rast code is concerned with rasterization of command bins.
+ * Each screen tile has a bin associated with it. To render the
+ * scene we iterate over the tile bins and execute the commands
+ * in each bin.
+ * We'll do that with multiple threads...
+ */
+
+
#ifndef LP_RAST_H
#define LP_RAST_H
#include "pipe/p_compiler.h"
+#include "util/u_pack_color.h"
#include "lp_jit.h"
-/* Initially create and program a single rasterizer directly. Later
- * will want multiple of these, one or two per core. At that stage
- * will probably pass command buffers into the rasterizers rather than
- * individual function calls like this.
- */
+
struct lp_rasterizer;
-struct pipe_screen;
+struct lp_scene;
+struct lp_fence;
+struct cmd_bin;
-#define FIXED_ORDER 4
+#define FIXED_TYPE_WIDTH 64
+/** For sub-pixel positioning */
+#define FIXED_ORDER 8
#define FIXED_ONE (1<<FIXED_ORDER)
-#define TILE_ORDER 6
-#define TILESIZE (1<<TILE_ORDER)
+#define FIXED_SHIFT (FIXED_TYPE_WIDTH - 1)
+/** Maximum length of an edge in a primitive in pixels.
+ * If the framebuffer is large we have to think about fixed-point
+ * integer overflow. Coordinates need ((FIXED_TYPE_WIDTH/2) - 1) bits
+ * to be able to fit product of two such coordinates inside
+ * FIXED_TYPE_WIDTH, any larger and we could overflow a
+ * FIXED_TYPE_WIDTH-bit int.
+ */
+#define MAX_FIXED_LENGTH (1 << (((FIXED_TYPE_WIDTH/2) - 1) - FIXED_ORDER))
+
+#define MAX_FIXED_LENGTH32 (1 << (((32/2) - 1) - FIXED_ORDER))
+
+/* Rasterizer output size going to jit fs, width/height */
+#define LP_RASTER_BLOCK_SIZE 4
+
+#define LP_MAX_ACTIVE_BINNED_QUERIES 64
+
+#define IMUL64(a, b) (((int64_t)(a)) * ((int64_t)(b)))
+struct lp_rasterizer_task;
+
+/**
+ * Rasterization state.
+ * Objects of this type are put into the shared data bin and pointed
+ * to by commands in the per-tile bins.
+ */
struct lp_rast_state {
- /* State for the shader:
+ /* State for the shader. This also contains state which feeds into
+ * the fragment shader, such as blend color and alpha ref value.
*/
struct lp_jit_context jit_context;
/* The shader itself. Probably we also need to pass a pointer to
- * the tile color/z/stencil data somehow:
- */
- lp_jit_frag_func jit_function;
-
+ * the tile color/z/stencil data somehow
+ */
+ struct lp_fragment_shader_variant *variant;
};
-/* Coefficients necessary to run the shader at a given location:
+
+/**
+ * Coefficients necessary to run the shader at a given location.
+ * First coefficient is position.
+ * These pointers point into the bin data buffer.
*/
struct lp_rast_shader_inputs {
+ unsigned frontfacing:1; /** True for front-facing */
+ unsigned disable:1; /** Partially binned, disable this command */
+ unsigned opaque:1; /** Is opaque */
+ unsigned pad0:29; /* wasted space */
+ unsigned stride; /* how much to advance data between a0, dadx, dady */
+ unsigned layer; /* the layer to render to (from gs, already clamped) */
+ unsigned viewport_index; /* the active viewport index (from gs, already clamped) */
+ /* followed by a0, dadx, dady and planes[] */
+};
- /* Current rasterizer state:
- */
- const struct lp_rast_state *state;
+struct lp_rast_plane {
+ /* edge function values at minx,miny ?? */
+ int64_t c;
- /* Attribute interpolation:
- *
- * First coefficient is position.
- *
- * FIXME: reduce memory waste!
- */
- float a0[1 + PIPE_MAX_SHADER_INPUTS][4];
- float dadx[1 + PIPE_MAX_SHADER_INPUTS][4];
- float dady[1 + PIPE_MAX_SHADER_INPUTS][4];
-};
+ int32_t dcdx;
+ int32_t dcdy;
+ /* one-pixel sized trivial reject offsets for each plane */
+ int64_t eo;
+};
-/* Rasterization information for a triangle known to be in this bin,
+/**
+ * Rasterization information for a triangle known to be in this bin,
* plus inputs to run the shader:
+ * These fields are tile- and bin-independent.
+ * Objects of this type are put into the lp_setup_context::data buffer.
*/
struct lp_rast_triangle {
- int minx;
- int maxx;
- int miny;
- int maxy;
-
- /* one-pixel sized trivial accept offsets for each plane */
- int ei1;
- int ei2;
- int ei3;
-
- /* one-pixel sized trivial reject offsets for each plane */
- int eo1;
- int eo2;
- int eo3;
-
- /* y deltas for vertex pairs */
- int dy12;
- int dy23;
- int dy31;
-
- /* x deltas for vertex pairs */
- int dx12;
- int dx23;
- int dx31;
-
- /* edge function values at minx,miny ?? */
- int c1;
- int c2;
- int c3;
-
- /* XXX: this is only used inside lp_setup_tri.c, don't really
- * need it here:
- */
- float oneoverarea;
+#ifdef DEBUG
+ float v[3][2];
+ float pad0;
+ float pad1;
+#endif
/* inputs for the shader */
struct lp_rast_shader_inputs inputs;
+ /* planes are also allocated here */
};
+struct lp_rast_clear_rb {
+ union util_color color_val;
+ unsigned cbuf;
+};
-struct lp_rasterizer *lp_rast_create( struct pipe_screen *screen );
-boolean lp_rast_begin( struct lp_rasterizer *rast,
- struct pipe_surface *cbuf,
- struct pipe_surface *zsbuf,
- boolean write_color,
- boolean write_zstencil,
- unsigned width,
- unsigned height );
+#define GET_A0(inputs) ((float (*)[4])((inputs)+1)) /* float[4] rows starting directly after the inputs struct */
+#define GET_DADX(inputs) ((float (*)[4])((char *)((inputs) + 1) + (inputs)->stride)) /* stride bytes past GET_A0; evaluates inputs twice */
+#define GET_DADY(inputs) ((float (*)[4])((char *)((inputs) + 1) + 2 * (inputs)->stride)) /* 2 * stride bytes past GET_A0; evaluates inputs twice */
+#define GET_PLANES(tri) ((struct lp_rast_plane *)((char *)(&(tri)->inputs + 1) + 3 * (tri)->inputs.stride)) /* 3 * stride bytes past the end of tri->inputs; evaluates tri twice */
-void lp_rast_end( struct lp_rasterizer * );
-/* Begining of each tile:
- */
-void lp_rast_start_tile( struct lp_rasterizer *,
- unsigned x,
- unsigned y );
+struct lp_rasterizer *
+lp_rast_create( unsigned num_threads );
+
+void
+lp_rast_destroy( struct lp_rasterizer * );
+
+void
+lp_rast_queue_scene( struct lp_rasterizer *rast,
+ struct lp_scene *scene );
+
+void
+lp_rast_finish( struct lp_rasterizer *rast );
union lp_rast_cmd_arg {
const struct lp_rast_shader_inputs *shade_tile;
- const struct lp_rast_triangle *triangle;
+ struct {
+ const struct lp_rast_triangle *tri;
+ unsigned plane_mask;
+ } triangle;
const struct lp_rast_state *set_state;
- uint8_t clear_color[4];
- unsigned clear_zstencil;
+ const struct lp_rast_clear_rb *clear_rb;
+ struct {
+ uint64_t value;
+ uint64_t mask;
+ } clear_zstencil;
+ const struct lp_rast_state *state;
+ struct lp_fence *fence;
+ struct llvmpipe_query *query_obj;
};
+
/* Cast wrappers. Hopefully these compile to noops!
*/
-static INLINE const union lp_rast_cmd_arg
+static INLINE union lp_rast_cmd_arg
lp_rast_arg_inputs( const struct lp_rast_shader_inputs *shade_tile )
{
   union lp_rast_cmd_arg arg;
   /* Wrap the shader-inputs pointer in a command argument.  The pointer
    * must be stored in the shade_tile member before returning; otherwise
    * the caller receives an indeterminate union value.
    */
   arg.shade_tile = shade_tile;
   return arg;
}
-static INLINE const union lp_rast_cmd_arg
-lp_rast_arg_triangle( const struct lp_rast_triangle *triangle )
+static INLINE union lp_rast_cmd_arg
+lp_rast_arg_triangle( const struct lp_rast_triangle *triangle,
+ unsigned plane_mask)
+{
+ union lp_rast_cmd_arg arg;
+ arg.triangle.tri = triangle;
+ arg.triangle.plane_mask = plane_mask;
+ return arg;
+}
+
+/**
+ * Build argument for a contained triangle.
+ *
+ * All planes are enabled, so instead of the plane mask we pass the upper
+ * left coordinates of a block that fully encloses the triangle.
+ */
+static INLINE union lp_rast_cmd_arg
+lp_rast_arg_triangle_contained( const struct lp_rast_triangle *triangle,
+ unsigned x, unsigned y)
{
union lp_rast_cmd_arg arg;
- arg.triangle = triangle;
+ arg.triangle.tri = triangle;
+ arg.triangle.plane_mask = x | (y << 8); /* x in the low bits, y shifted up by 8; x is not masked here, so this assumes x < 256 - TODO confirm against callers */
return arg;
}
-static INLINE const union lp_rast_cmd_arg
+static INLINE union lp_rast_cmd_arg
lp_rast_arg_state( const struct lp_rast_state *state )
{
   union lp_rast_cmd_arg arg;
   /* Wrap the rasterizer-state pointer in a command argument.  The
    * pointer must be stored before returning; otherwise the caller
    * receives an indeterminate union value.  set_state is the same
    * member lp_rast_arg_null() writes.
    */
   arg.set_state = state;
   return arg;
}
-static INLINE const union lp_rast_cmd_arg
-lp_rast_arg_null( void )
+static INLINE union lp_rast_cmd_arg
+lp_rast_arg_fence( struct lp_fence *fence )
{
union lp_rast_cmd_arg arg;
- arg.set_state = NULL;
+ arg.fence = fence;
return arg;
}
+static INLINE union lp_rast_cmd_arg
+lp_rast_arg_clearzs( uint64_t value, uint64_t mask )
+{
+ union lp_rast_cmd_arg arg;
+ arg.clear_zstencil.value = value;
+ arg.clear_zstencil.mask = mask;
+ return arg;
+}
+static INLINE union lp_rast_cmd_arg
+lp_rast_arg_query( struct llvmpipe_query *pq )
+{
+ union lp_rast_cmd_arg arg;
+ arg.query_obj = pq;
+ return arg;
+}
-/* Binnable Commands:
- */
-void lp_rast_clear_color( struct lp_rasterizer *,
- const union lp_rast_cmd_arg );
-
-void lp_rast_clear_zstencil( struct lp_rasterizer *,
- const union lp_rast_cmd_arg );
-
-void lp_rast_load_color( struct lp_rasterizer *,
- const union lp_rast_cmd_arg );
-
-void lp_rast_load_zstencil( struct lp_rasterizer *,
- const union lp_rast_cmd_arg );
-
-void lp_rast_set_state( struct lp_rasterizer *,
- const union lp_rast_cmd_arg );
-
-void lp_rast_triangle( struct lp_rasterizer *,
- const union lp_rast_cmd_arg );
-
-void lp_rast_shade_tile( struct lp_rasterizer *,
- const union lp_rast_cmd_arg );
-
-
-/* End of tile:
- */
+static INLINE union lp_rast_cmd_arg
+lp_rast_arg_null( void )
+{
+ union lp_rast_cmd_arg arg;
+ arg.set_state = NULL;
+ return arg;
+}
-void lp_rast_end_tile( struct lp_rasterizer *rast );
-/* Shutdown:
+/**
+ * Binnable Commands.
+ * These get put into bins by the setup code and are called when
+ * the bins are executed.
*/
-void lp_rast_destroy( struct lp_rasterizer * );
+#define LP_RAST_OP_CLEAR_COLOR 0x0
+#define LP_RAST_OP_CLEAR_ZSTENCIL 0x1
+#define LP_RAST_OP_TRIANGLE_1 0x2
+#define LP_RAST_OP_TRIANGLE_2 0x3
+#define LP_RAST_OP_TRIANGLE_3 0x4
+#define LP_RAST_OP_TRIANGLE_4 0x5
+#define LP_RAST_OP_TRIANGLE_5 0x6
+#define LP_RAST_OP_TRIANGLE_6 0x7
+#define LP_RAST_OP_TRIANGLE_7 0x8
+#define LP_RAST_OP_TRIANGLE_8 0x9
+#define LP_RAST_OP_TRIANGLE_3_4 0xa
+#define LP_RAST_OP_TRIANGLE_3_16 0xb
+#define LP_RAST_OP_TRIANGLE_4_16 0xc
+#define LP_RAST_OP_SHADE_TILE 0xd
+#define LP_RAST_OP_SHADE_TILE_OPAQUE 0xe
+#define LP_RAST_OP_BEGIN_QUERY 0xf
+#define LP_RAST_OP_END_QUERY 0x10
+#define LP_RAST_OP_SET_STATE 0x11
+#define LP_RAST_OP_TRIANGLE_32_1 0x12
+#define LP_RAST_OP_TRIANGLE_32_2 0x13
+#define LP_RAST_OP_TRIANGLE_32_3 0x14
+#define LP_RAST_OP_TRIANGLE_32_4 0x15
+#define LP_RAST_OP_TRIANGLE_32_5 0x16
+#define LP_RAST_OP_TRIANGLE_32_6 0x17
+#define LP_RAST_OP_TRIANGLE_32_7 0x18
+#define LP_RAST_OP_TRIANGLE_32_8 0x19
+#define LP_RAST_OP_TRIANGLE_32_3_4 0x1a
+#define LP_RAST_OP_TRIANGLE_32_3_16 0x1b
+#define LP_RAST_OP_TRIANGLE_32_4_16 0x1c
+
+#define LP_RAST_OP_MAX 0x1d /* one more than the highest opcode defined above (0x1c) */
+#define LP_RAST_OP_MASK 0xff
+
+void
+lp_debug_bins( struct lp_scene *scene );
+void
+lp_debug_draw_bins_by_cmd_length( struct lp_scene *scene );
+void
+lp_debug_draw_bins_by_coverage( struct lp_scene *scene );
+
+
+#ifdef PIPE_ARCH_SSE
+#include <emmintrin.h>
+#include "util/u_sse.h"
+
+static INLINE __m128i
+lp_plane_to_m128i(const struct lp_rast_plane *plane)
+{ /* Pack c, dcdx, dcdy, eo (in that order, first argument in the lowest lane) into one __m128i. */
+ return _mm_setr_epi32((int32_t)plane->c, (int32_t)plane->dcdx, /* c is int64_t in the struct: narrowed to 32 bits here */
+ (int32_t)plane->dcdy, (int32_t)plane->eo); /* eo is int64_t in the struct: narrowed to 32 bits here */
+}
+#endif
#endif