Merge remote-tracking branch 'jekstrand/wip/i965-uniforms' into vulkan
[mesa.git] / src / gallium / drivers / llvmpipe / lp_rast.h
1 /**************************************************************************
2 *
3 * Copyright 2009 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /**
29 * The rast code is concerned with rasterization of command bins.
30 * Each screen tile has a bin associated with it. To render the
31 * scene we iterate over the tile bins and execute the commands
32 * in each bin.
33 * We'll do that with multiple threads...
34 */
35
36
37 #ifndef LP_RAST_H
38 #define LP_RAST_H
39
40 #include "pipe/p_compiler.h"
41 #include "util/u_pack_color.h"
42 #include "lp_jit.h"
43
44
/* Forward declarations of types that are defined elsewhere. */
struct lp_rasterizer;
struct lp_scene;
struct lp_fence;
struct cmd_bin;
49
/** Width, in bits, of the integer type the fixed-point limits below are sized for. */
#define FIXED_TYPE_WIDTH 64
/** For sub-pixel positioning */
#define FIXED_ORDER 8
/** 1 << FIXED_ORDER, i.e. 256. */
#define FIXED_ONE (1<<FIXED_ORDER)
/** FIXED_TYPE_WIDTH - 1, i.e. 63. */
#define FIXED_SHIFT (FIXED_TYPE_WIDTH - 1)
/** Maximum length of an edge in a primitive in pixels.
 *  If the framebuffer is large we have to think about fixed-point
 *  integer overflow. Coordinates need ((FIXED_TYPE_WIDTH/2) - 1) bits
 *  to be able to fit the product of two such coordinates inside
 *  FIXED_TYPE_WIDTH; any larger and we could overflow a
 *  FIXED_TYPE_WIDTH-bit int.
 */
#define MAX_FIXED_LENGTH (1 << (((FIXED_TYPE_WIDTH/2) - 1) - FIXED_ORDER))

/** Same limit as MAX_FIXED_LENGTH, computed for a 32-bit type (evaluates to 128). */
#define MAX_FIXED_LENGTH32 (1 << (((32/2) - 1) - FIXED_ORDER))

/* Rasterizer output size going to jit fs, width/height */
#define LP_RASTER_BLOCK_SIZE 4

#define LP_MAX_ACTIVE_BINNED_QUERIES 64

/** Multiply two values after widening both to int64_t. */
#define IMUL64(a, b) (((int64_t)(a)) * ((int64_t)(b)))

struct lp_rasterizer_task;
74
75
76 /**
77 * Rasterization state.
78 * Objects of this type are put into the shared data bin and pointed
79 * to by commands in the per-tile bins.
80 */
81 struct lp_rast_state {
82 /* State for the shader. This also contains state which feeds into
83 * the fragment shader, such as blend color and alpha ref value.
84 */
85 struct lp_jit_context jit_context;
86
87 /* The shader itself. Probably we also need to pass a pointer to
88 * the tile color/z/stencil data somehow
89 */
90 struct lp_fragment_shader_variant *variant;
91 };
92
93
/**
 * Coefficients necessary to run the shader at a given location.
 * First coefficient is position.
 * These pointers point into the bin data buffer.
 *
 * This struct is only a header: the a0, dadx and dady arrays (and the
 * planes) are stored directly after it and are reached through the
 * GET_A0/GET_DADX/GET_DADY/GET_PLANES macros.
 */
struct lp_rast_shader_inputs {
   unsigned frontfacing:1;      /**< True for front-facing */
   unsigned disable:1;          /**< Partially binned, disable this command */
   unsigned opaque:1;           /**< Is opaque */
   unsigned pad0:29;            /* wasted space */
   unsigned stride;             /* how much to advance data between a0, dadx, dady */
   unsigned layer;              /* the layer to render to (from gs, already clamped) */
   unsigned viewport_index;     /* the active viewport index (from gs, already clamped) */
   /* followed by a0, dadx, dady and planes[] */
};
109
/**
 * One edge plane of a primitive: a 64-bit constant term, two 32-bit
 * per-axis steps and a trivial-reject offset.
 */
struct lp_rast_plane {
   /* edge function values at minx,miny ?? */
   int64_t c;

   /* NOTE(review): presumably the change in c per step in x and in y --
    * confirm against the setup code.
    */
   int32_t dcdx;
   int32_t dcdy;

   /* one-pixel sized trivial reject offsets for each plane */
   uint32_t eo;
};
120
121 /**
122 * Rasterization information for a triangle known to be in this bin,
123 * plus inputs to run the shader:
124 * These fields are tile- and bin-independent.
125 * Objects of this type are put into the lp_setup_context::data buffer.
126 */
127 struct lp_rast_triangle {
128 #ifdef DEBUG
129 float v[3][2];
130 float pad0;
131 float pad1;
132 #endif
133
134 /* inputs for the shader */
135 struct lp_rast_shader_inputs inputs;
136 /* planes are also allocated here */
137 };
138
139
140 struct lp_rast_clear_rb {
141 union util_color color_val;
142 unsigned cbuf;
143 };
144
145
/*
 * Accessors for the variable-length data stored after a
 * struct lp_rast_shader_inputs header.  With stride = inputs->stride
 * (a byte count), the layout is:
 *
 *    header | a0 | dadx | dady | planes
 *             +0   +stride  +2*stride  +3*stride
 *
 * GET_A0/GET_DADX/GET_DADY take a pointer to the inputs header and yield
 * a pointer to arrays of float[4]; GET_PLANES takes a pointer to the
 * enclosing triangle.  Each macro evaluates its argument more than once
 * (except GET_A0), so do not pass expressions with side effects.
 */
#define GET_A0(inputs) ((float (*)[4])((inputs)+1))
#define GET_DADX(inputs) ((float (*)[4])((char *)((inputs) + 1) + (inputs)->stride))
#define GET_DADY(inputs) ((float (*)[4])((char *)((inputs) + 1) + 2 * (inputs)->stride))
#define GET_PLANES(tri) ((struct lp_rast_plane *)((char *)(&(tri)->inputs + 1) + 3 * (tri)->inputs.stride))
150
151
152
/*
 * Rasterizer lifecycle and scene submission entry points.  The
 * implementations are not part of this header.
 * NOTE(review): num_threads presumably selects the number of worker
 * threads, and lp_rast_finish presumably waits for queued scenes to
 * complete -- confirm against the implementation.
 */
struct lp_rasterizer *
lp_rast_create( unsigned num_threads );

void
lp_rast_destroy( struct lp_rasterizer *rast );

void
lp_rast_queue_scene( struct lp_rasterizer *rast,
                     struct lp_scene *scene );

void
lp_rast_finish( struct lp_rasterizer *rast );
165
166
/**
 * Argument carried by a binned command.  Exactly one member is meaningful
 * for a given command; use the lp_rast_arg_*() helpers to build values.
 */
union lp_rast_cmd_arg {
   const struct lp_rast_shader_inputs *shade_tile;
   struct {
      const struct lp_rast_triangle *tri;
      /* Plane mask; lp_rast_arg_triangle_contained() stores packed
       * x/y block coordinates here instead.
       */
      unsigned plane_mask;
   } triangle;
   const struct lp_rast_state *set_state;
   const struct lp_rast_clear_rb *clear_rb;
   struct {
      uint64_t value;
      uint64_t mask;
   } clear_zstencil;
   const struct lp_rast_state *state;
   struct lp_fence *fence;
   struct llvmpipe_query *query_obj;
};
183
184
185 /* Cast wrappers. Hopefully these compile to noops!
186 */
187 static inline union lp_rast_cmd_arg
188 lp_rast_arg_inputs( const struct lp_rast_shader_inputs *shade_tile )
189 {
190 union lp_rast_cmd_arg arg;
191 arg.shade_tile = shade_tile;
192 return arg;
193 }
194
195 static inline union lp_rast_cmd_arg
196 lp_rast_arg_triangle( const struct lp_rast_triangle *triangle,
197 unsigned plane_mask)
198 {
199 union lp_rast_cmd_arg arg;
200 arg.triangle.tri = triangle;
201 arg.triangle.plane_mask = plane_mask;
202 return arg;
203 }
204
205 /**
206 * Build argument for a contained triangle.
207 *
208 * All planes are enabled, so instead of the plane mask we pass the upper
209 * left coordinates of the a block that fully encloses the triangle.
210 */
211 static inline union lp_rast_cmd_arg
212 lp_rast_arg_triangle_contained( const struct lp_rast_triangle *triangle,
213 unsigned x, unsigned y)
214 {
215 union lp_rast_cmd_arg arg;
216 arg.triangle.tri = triangle;
217 arg.triangle.plane_mask = x | (y << 8);
218 return arg;
219 }
220
221 static inline union lp_rast_cmd_arg
222 lp_rast_arg_state( const struct lp_rast_state *state )
223 {
224 union lp_rast_cmd_arg arg;
225 arg.set_state = state;
226 return arg;
227 }
228
229 static inline union lp_rast_cmd_arg
230 lp_rast_arg_fence( struct lp_fence *fence )
231 {
232 union lp_rast_cmd_arg arg;
233 arg.fence = fence;
234 return arg;
235 }
236
237
238 static inline union lp_rast_cmd_arg
239 lp_rast_arg_clearzs( uint64_t value, uint64_t mask )
240 {
241 union lp_rast_cmd_arg arg;
242 arg.clear_zstencil.value = value;
243 arg.clear_zstencil.mask = mask;
244 return arg;
245 }
246
247
248 static inline union lp_rast_cmd_arg
249 lp_rast_arg_query( struct llvmpipe_query *pq )
250 {
251 union lp_rast_cmd_arg arg;
252 arg.query_obj = pq;
253 return arg;
254 }
255
256 static inline union lp_rast_cmd_arg
257 lp_rast_arg_null( void )
258 {
259 union lp_rast_cmd_arg arg;
260 arg.set_state = NULL;
261 return arg;
262 }
263
264
/**
 * Binnable Commands.
 * These get put into bins by the setup code and are called when
 * the bins are executed.
 *
 * Opcode values are consecutive, starting at 0; LP_RAST_OP_MAX is one past
 * the last opcode.
 */
#define LP_RAST_OP_CLEAR_COLOR       0x0
#define LP_RAST_OP_CLEAR_ZSTENCIL    0x1
#define LP_RAST_OP_TRIANGLE_1        0x2
#define LP_RAST_OP_TRIANGLE_2        0x3
#define LP_RAST_OP_TRIANGLE_3        0x4
#define LP_RAST_OP_TRIANGLE_4        0x5
#define LP_RAST_OP_TRIANGLE_5        0x6
#define LP_RAST_OP_TRIANGLE_6        0x7
#define LP_RAST_OP_TRIANGLE_7        0x8
#define LP_RAST_OP_TRIANGLE_8        0x9
#define LP_RAST_OP_TRIANGLE_3_4      0xa
#define LP_RAST_OP_TRIANGLE_3_16     0xb
#define LP_RAST_OP_TRIANGLE_4_16     0xc
#define LP_RAST_OP_SHADE_TILE        0xd
#define LP_RAST_OP_SHADE_TILE_OPAQUE 0xe
#define LP_RAST_OP_BEGIN_QUERY       0xf
#define LP_RAST_OP_END_QUERY         0x10
#define LP_RAST_OP_SET_STATE         0x11
#define LP_RAST_OP_TRIANGLE_32_1     0x12
#define LP_RAST_OP_TRIANGLE_32_2     0x13
#define LP_RAST_OP_TRIANGLE_32_3     0x14
#define LP_RAST_OP_TRIANGLE_32_4     0x15
#define LP_RAST_OP_TRIANGLE_32_5     0x16
#define LP_RAST_OP_TRIANGLE_32_6     0x17
#define LP_RAST_OP_TRIANGLE_32_7     0x18
#define LP_RAST_OP_TRIANGLE_32_8     0x19
#define LP_RAST_OP_TRIANGLE_32_3_4   0x1a
#define LP_RAST_OP_TRIANGLE_32_3_16  0x1b
#define LP_RAST_OP_TRIANGLE_32_4_16  0x1c

#define LP_RAST_OP_MAX               0x1d
#define LP_RAST_OP_MASK              0xff
302
/*
 * Debug helpers operating on a scene's bins.  The implementations are not
 * part of this header.
 * NOTE(review): judging by the names these dump or visualise bin contents,
 * command-list length and coverage -- confirm against the implementation.
 */
void
lp_debug_bins( struct lp_scene *scene );
void
lp_debug_draw_bins_by_cmd_length( struct lp_scene *scene );
void
lp_debug_draw_bins_by_coverage( struct lp_scene *scene );
309
310
#ifdef PIPE_ARCH_SSE
#include <emmintrin.h>
#include "util/u_sse.h"

/**
 * Pack a plane into one SSE register of four 32-bit lanes.
 *
 * Lanes, from lowest to highest, hold c, dcdx, dcdy and eo.  The 64-bit
 * c is narrowed to 32 bits by the cast, so only use this where the plane
 * constant is known to fit.
 *
 * \param plane  plane to read; not modified
 */
static inline __m128i
lp_plane_to_m128i(const struct lp_rast_plane *plane)
{
   return _mm_setr_epi32((int32_t)plane->c, (int32_t)plane->dcdx,
                         (int32_t)plane->dcdy, (int32_t)plane->eo);
}

#endif
323
324 #endif