1 /**************************************************************************
3 * Copyright 2009 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
/**
 * The rast code is concerned with rasterization of command bins.
 * Each screen tile has a bin associated with it.  To render the
 * scene we iterate over the tile bins and execute the commands
 * in each bin.
 * We'll do that with multiple threads...
 */
40 #include "pipe/p_compiler.h"
/** Width, in bits, of the integer type used for fixed-point math. */
#define FIXED_TYPE_WIDTH 32
/** For sub-pixel positioning */
/* NOTE(review): FIXED_ORDER is used by the macros below, but its definition
 * is not visible in this span -- confirm it is defined before they expand.
 */
#define FIXED_ONE (1<<FIXED_ORDER)
/** Maximum length of an edge in a primitive in pixels.
 *  If the framebuffer is large we have to think about fixed-point
 *  integer overflow. Coordinates need ((FIXED_TYPE_WIDTH/2) - 1) bits
 *  to be able to fit the product of two such coordinates inside
 *  FIXED_TYPE_WIDTH; any larger and we could overflow a
 *  FIXED_TYPE_WIDTH-bit int.
 */
#define MAX_FIXED_LENGTH (1 << (((FIXED_TYPE_WIDTH/2) - 1) - FIXED_ORDER))

/* Rasterizer output size going to jit fs, width/height */
#define LP_RASTER_BLOCK_SIZE 4

#define LP_MAX_ACTIVE_BINNED_QUERIES 16
68 struct lp_rasterizer_task
;
72 * Rasterization state.
73 * Objects of this type are put into the shared data bin and pointed
74 * to by commands in the per-tile bins.
76 struct lp_rast_state
{
77 /* State for the shader. This also contains state which feeds into
78 * the fragment shader, such as blend color and alpha ref value.
80 struct lp_jit_context jit_context
;
82 /* The shader itself. Probably we also need to pass a pointer to
83 * the tile color/z/stencil data somehow
85 struct lp_fragment_shader_variant
*variant
;
/**
 * Coefficients necessary to run the shader at a given location.
 * First coefficient is position.
 * These pointers point into the bin data buffer.
 *
 * This struct is only a fixed-size header: the a0, dadx and dady arrays
 * and the planes are stored directly after it (see the trailing comment).
 */
struct lp_rast_shader_inputs {
   unsigned frontfacing:1;      /** True for front-facing */
   unsigned disable:1;          /** Partially binned, disable this command */
   unsigned opaque:1;           /** Is opaque */
   unsigned pad0:29;            /* wasted space */
   unsigned stride;             /* how much to advance data between a0, dadx, dady */
   unsigned layer;              /* the layer to render to (from gs, already clamped) */
   unsigned pad2;               /* wasted space */
   /* followed by a0, dadx, dady and planes[] */
};
/* Note: the order of these values is important as they are loaded by
 * sse code in rasterization:
 */
108 struct lp_rast_plane
{
109 /* edge function values at minx,miny ?? */
115 /* one-pixel sized trivial reject offsets for each plane */
/**
 * Rasterization information for a triangle known to be in this bin,
 * plus inputs to run the shader:
 * These fields are tile- and bin-independent.
 * Objects of this type are put into the lp_setup_context::data buffer.
 */
125 struct lp_rast_triangle
{
132 /* inputs for the shader */
133 struct lp_rast_shader_inputs inputs
;
134 /* planes are also allocated here */
/*
 * Accessors for the variable-length data stored immediately after a
 * struct lp_rast_shader_inputs header.  The a0, dadx and dady arrays are
 * laid out back to back, each (inputs)->stride bytes long (the offsets are
 * applied to a char pointer), and the planes start after the third array.
 *
 * GET_A0/GET_DADX/GET_DADY take a pointer to the inputs header; GET_PLANES
 * takes a pointer to the enclosing triangle.  The arguments are evaluated
 * more than once, so do not pass expressions with side effects.
 */
#define GET_A0(inputs) ((float (*)[4])((inputs)+1))
#define GET_DADX(inputs) ((float (*)[4])((char *)((inputs) + 1) + (inputs)->stride))
#define GET_DADY(inputs) ((float (*)[4])((char *)((inputs) + 1) + 2 * (inputs)->stride))
#define GET_PLANES(tri) ((struct lp_rast_plane *)((char *)(&(tri)->inputs + 1) + 3 * (tri)->inputs.stride))
/**
 * Create a rasterizer and return a pointer to it.
 * NOTE(review): num_threads is presumably the number of worker threads to
 * use; the implementation is not visible here -- confirm, including what
 * is returned on failure.
 */
struct lp_rasterizer *
lp_rast_create( unsigned num_threads );
149 lp_rast_destroy( struct lp_rasterizer
* );
152 lp_rast_queue_scene( struct lp_rasterizer
*rast
,
153 struct lp_scene
*scene
);
156 lp_rast_finish( struct lp_rasterizer
*rast
);
159 union lp_rast_cmd_arg
{
160 const struct lp_rast_shader_inputs
*shade_tile
;
162 const struct lp_rast_triangle
*tri
;
165 const struct lp_rast_state
*set_state
;
166 union pipe_color_union clear_color
;
171 const struct lp_rast_state
*state
;
172 struct lp_fence
*fence
;
173 struct llvmpipe_query
*query_obj
;
/* Cast wrappers.  Hopefully these compile to noops!
 */
179 static INLINE
union lp_rast_cmd_arg
180 lp_rast_arg_inputs( const struct lp_rast_shader_inputs
*shade_tile
)
182 union lp_rast_cmd_arg arg
;
183 arg
.shade_tile
= shade_tile
;
187 static INLINE
union lp_rast_cmd_arg
188 lp_rast_arg_triangle( const struct lp_rast_triangle
*triangle
,
191 union lp_rast_cmd_arg arg
;
192 arg
.triangle
.tri
= triangle
;
193 arg
.triangle
.plane_mask
= plane_mask
;
198 * Build argument for a contained triangle.
200 * All planes are enabled, so instead of the plane mask we pass the upper
201 * left coordinates of the a block that fully encloses the triangle.
203 static INLINE
union lp_rast_cmd_arg
204 lp_rast_arg_triangle_contained( const struct lp_rast_triangle
*triangle
,
205 unsigned x
, unsigned y
)
207 union lp_rast_cmd_arg arg
;
208 arg
.triangle
.tri
= triangle
;
209 arg
.triangle
.plane_mask
= x
| (y
<< 8);
213 static INLINE
union lp_rast_cmd_arg
214 lp_rast_arg_state( const struct lp_rast_state
*state
)
216 union lp_rast_cmd_arg arg
;
217 arg
.set_state
= state
;
221 static INLINE
union lp_rast_cmd_arg
222 lp_rast_arg_fence( struct lp_fence
*fence
)
224 union lp_rast_cmd_arg arg
;
230 static INLINE
union lp_rast_cmd_arg
231 lp_rast_arg_clearzs( uint64_t value
, uint64_t mask
)
233 union lp_rast_cmd_arg arg
;
234 arg
.clear_zstencil
.value
= value
;
235 arg
.clear_zstencil
.mask
= mask
;
240 static INLINE
union lp_rast_cmd_arg
241 lp_rast_arg_query( struct llvmpipe_query
*pq
)
243 union lp_rast_cmd_arg arg
;
248 static INLINE
union lp_rast_cmd_arg
249 lp_rast_arg_null( void )
251 union lp_rast_cmd_arg arg
;
252 arg
.set_state
= NULL
;
/*
 * Binned command opcodes.
 * These get put into bins by the setup code and are called when
 * the bins are executed.
 */
#define LP_RAST_OP_CLEAR_COLOR       0x0
#define LP_RAST_OP_CLEAR_ZSTENCIL    0x1
#define LP_RAST_OP_TRIANGLE_1        0x2
#define LP_RAST_OP_TRIANGLE_2        0x3
#define LP_RAST_OP_TRIANGLE_3        0x4
#define LP_RAST_OP_TRIANGLE_4        0x5
#define LP_RAST_OP_TRIANGLE_5        0x6
#define LP_RAST_OP_TRIANGLE_6        0x7
#define LP_RAST_OP_TRIANGLE_7        0x8
#define LP_RAST_OP_TRIANGLE_8        0x9
#define LP_RAST_OP_TRIANGLE_3_4      0xa
#define LP_RAST_OP_TRIANGLE_3_16     0xb
#define LP_RAST_OP_TRIANGLE_4_16     0xc
#define LP_RAST_OP_SHADE_TILE        0xd
#define LP_RAST_OP_SHADE_TILE_OPAQUE 0xe
#define LP_RAST_OP_BEGIN_QUERY       0xf
#define LP_RAST_OP_END_QUERY         0x10
#define LP_RAST_OP_SET_STATE         0x11

/* One past the highest opcode above. */
#define LP_RAST_OP_MAX               0x12
/* NOTE(review): presumably the bits of a command word that hold the opcode;
 * the users are not visible here -- confirm.
 */
#define LP_RAST_OP_MASK              0xff
285 lp_debug_bins( struct lp_scene
*scene
);
287 lp_debug_draw_bins_by_cmd_length( struct lp_scene
*scene
);
289 lp_debug_draw_bins_by_coverage( struct lp_scene
*scene
);