draw: clean up d3d style point clipping
[mesa.git] / src / gallium / auxiliary / draw / draw_pt_fetch_shade_pipeline.c
1 /**************************************************************************
2 *
3 * Copyright 2007 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 #include "util/u_math.h"
29 #include "util/u_memory.h"
30 #include "util/u_prim.h"
31 #include "draw/draw_context.h"
32 #include "draw/draw_vbuf.h"
33 #include "draw/draw_vertex.h"
34 #include "draw/draw_prim_assembler.h"
35 #include "draw/draw_pt.h"
36 #include "draw/draw_vs.h"
37 #include "draw/draw_gs.h"
38
39
40 struct fetch_pipeline_middle_end {
41 struct draw_pt_middle_end base;
42 struct draw_context *draw;
43
44 struct pt_emit *emit;
45 struct pt_so_emit *so_emit;
46 struct pt_fetch *fetch;
47 struct pt_post_vs *post_vs;
48
49 unsigned vertex_data_offset;
50 unsigned vertex_size;
51 unsigned input_prim;
52 unsigned opt;
53 };
54
55
56 /**
57 * Prepare/validate middle part of the vertex pipeline.
58 * NOTE: if you change this function, also look at the LLVM
59 * function llvm_middle_end_prepare() for similar changes.
60 */
61 static void fetch_pipeline_prepare( struct draw_pt_middle_end *middle,
62 unsigned prim,
63 unsigned opt,
64 unsigned *max_vertices )
65 {
66 struct fetch_pipeline_middle_end *fpme = (struct fetch_pipeline_middle_end *)middle;
67 struct draw_context *draw = fpme->draw;
68 struct draw_vertex_shader *vs = draw->vs.vertex_shader;
69 struct draw_geometry_shader *gs = draw->gs.geometry_shader;
70 unsigned i;
71 unsigned instance_id_index = ~0;
72
73 const unsigned gs_out_prim = (gs ? gs->output_primitive :
74 u_assembled_prim(prim));
75 unsigned nr = MAX2(vs->info.num_inputs,
76 draw_total_vs_outputs(draw));
77 unsigned point_clip = draw->rasterizer->fill_front == PIPE_POLYGON_MODE_POINT ||
78 gs_out_prim == PIPE_PRIM_POINTS;
79
80 if (gs) {
81 nr = MAX2(nr, gs->info.num_outputs + 1);
82 }
83
84 /* Scan for instanceID system value.
85 */
86 for (i = 0; i < vs->info.num_inputs; i++) {
87 if (vs->info.input_semantic_name[i] == TGSI_SEMANTIC_INSTANCEID) {
88 instance_id_index = i;
89 break;
90 }
91 }
92
93 fpme->input_prim = prim;
94 fpme->opt = opt;
95
96 /* Always leave room for the vertex header whether we need it or
97 * not. It's hard to get rid of it in particular because of the
98 * viewport code in draw_pt_post_vs.c.
99 */
100 fpme->vertex_size = sizeof(struct vertex_header) + nr * 4 * sizeof(float);
101
102
103 draw_pt_fetch_prepare( fpme->fetch,
104 vs->info.num_inputs,
105 fpme->vertex_size,
106 instance_id_index );
107 draw_pt_post_vs_prepare( fpme->post_vs,
108 draw->clip_xy,
109 draw->clip_z,
110 draw->clip_user,
111 point_clip ? draw->guard_band_points_xy :
112 draw->guard_band_xy,
113 draw->identity_viewport,
114 draw->rasterizer->clip_halfz,
115 (draw->vs.edgeflag_output ? TRUE : FALSE) );
116
117 draw_pt_so_emit_prepare( fpme->so_emit, FALSE );
118
119 if (!(opt & PT_PIPELINE)) {
120 draw_pt_emit_prepare( fpme->emit,
121 gs_out_prim,
122 max_vertices );
123
124 *max_vertices = MAX2( *max_vertices, 4096 );
125 }
126 else {
127 /* limit max fetches by limiting max_vertices */
128 *max_vertices = 4096;
129 }
130
131 /* No need to prepare the shader.
132 */
133 vs->prepare(vs, draw);
134 }
135
136
/**
 * bind_parameters hook for this middle end.
 *
 * Intentionally empty: the vertex shader executor and the drawing pipeline
 * just grab the constants, viewport, etc. from the draw context state.
 */
static void
fetch_pipeline_bind_parameters(struct draw_pt_middle_end *middle)
{
   (void) middle;
}
144
145
146 static void fetch( struct pt_fetch *fetch,
147 const struct draw_fetch_info *fetch_info,
148 char *output)
149 {
150 if (fetch_info->linear) {
151 draw_pt_fetch_run_linear( fetch,
152 fetch_info->start,
153 fetch_info->count,
154 output );
155 }
156 else {
157 draw_pt_fetch_run( fetch,
158 fetch_info->elts,
159 fetch_info->count,
160 output );
161 }
162 }
163
164
165 static void pipeline(struct fetch_pipeline_middle_end *fpme,
166 const struct draw_vertex_info *vert_info,
167 const struct draw_prim_info *prim_info)
168 {
169 if (prim_info->linear)
170 draw_pipeline_run_linear( fpme->draw,
171 vert_info,
172 prim_info);
173 else
174 draw_pipeline_run( fpme->draw,
175 vert_info,
176 prim_info );
177 }
178
179 static void emit(struct pt_emit *emit,
180 const struct draw_vertex_info *vert_info,
181 const struct draw_prim_info *prim_info)
182 {
183 if (prim_info->linear) {
184 draw_pt_emit_linear(emit, vert_info, prim_info);
185 }
186 else {
187 draw_pt_emit(emit, vert_info, prim_info);
188 }
189 }
190
191
192 static void draw_vertex_shader_run(struct draw_vertex_shader *vshader,
193 const void *constants[PIPE_MAX_CONSTANT_BUFFERS],
194 unsigned const_size[PIPE_MAX_CONSTANT_BUFFERS],
195 const struct draw_vertex_info *input_verts,
196 struct draw_vertex_info *output_verts )
197 {
198 output_verts->vertex_size = input_verts->vertex_size;
199 output_verts->stride = input_verts->vertex_size;
200 output_verts->count = input_verts->count;
201 output_verts->verts =
202 (struct vertex_header *)MALLOC(output_verts->vertex_size *
203 align(output_verts->count, 4));
204
205 vshader->run_linear(vshader,
206 (const float (*)[4])input_verts->verts->data,
207 ( float (*)[4])output_verts->verts->data,
208 constants,
209 const_size,
210 input_verts->count,
211 input_verts->vertex_size,
212 input_verts->vertex_size);
213 }
214
215 static void fetch_pipeline_generic( struct draw_pt_middle_end *middle,
216 const struct draw_fetch_info *fetch_info,
217 const struct draw_prim_info *in_prim_info )
218 {
219 struct fetch_pipeline_middle_end *fpme = (struct fetch_pipeline_middle_end *)middle;
220 struct draw_context *draw = fpme->draw;
221 struct draw_vertex_shader *vshader = draw->vs.vertex_shader;
222 struct draw_geometry_shader *gshader = draw->gs.geometry_shader;
223 struct draw_prim_info gs_prim_info;
224 struct draw_vertex_info fetched_vert_info;
225 struct draw_vertex_info vs_vert_info;
226 struct draw_vertex_info gs_vert_info;
227 struct draw_vertex_info *vert_info;
228 struct draw_prim_info ia_prim_info;
229 struct draw_vertex_info ia_vert_info;
230 const struct draw_prim_info *prim_info = in_prim_info;
231 boolean free_prim_info = FALSE;
232 unsigned opt = fpme->opt;
233
234 fetched_vert_info.count = fetch_info->count;
235 fetched_vert_info.vertex_size = fpme->vertex_size;
236 fetched_vert_info.stride = fpme->vertex_size;
237 fetched_vert_info.verts =
238 (struct vertex_header *)MALLOC(fpme->vertex_size *
239 align(fetch_info->count, 4));
240 if (!fetched_vert_info.verts) {
241 assert(0);
242 return;
243 }
244 if (draw->collect_statistics) {
245 draw->statistics.ia_vertices += prim_info->count;
246 draw->statistics.ia_primitives +=
247 u_decomposed_prims_for_vertices(prim_info->prim, fetch_info->count);
248 draw->statistics.vs_invocations += fetch_info->count;
249 }
250
251 /* Fetch into our vertex buffer.
252 */
253 fetch( fpme->fetch, fetch_info, (char *)fetched_vert_info.verts );
254
255 /* Finished with fetch:
256 */
257 fetch_info = NULL;
258 vert_info = &fetched_vert_info;
259
260 /* Run the shader, note that this overwrites the data[] parts of
261 * the pipeline verts.
262 */
263 if (fpme->opt & PT_SHADE) {
264 draw_vertex_shader_run(vshader,
265 draw->pt.user.vs_constants,
266 draw->pt.user.vs_constants_size,
267 vert_info,
268 &vs_vert_info);
269
270 FREE(vert_info->verts);
271 vert_info = &vs_vert_info;
272 }
273
274 if ((fpme->opt & PT_SHADE) && gshader) {
275 draw_geometry_shader_run(gshader,
276 draw->pt.user.gs_constants,
277 draw->pt.user.gs_constants_size,
278 vert_info,
279 prim_info,
280 &vshader->info,
281 &gs_vert_info,
282 &gs_prim_info);
283
284 FREE(vert_info->verts);
285 vert_info = &gs_vert_info;
286 prim_info = &gs_prim_info;
287 } else {
288 if (draw_prim_assembler_is_required(draw, prim_info, vert_info)) {
289 draw_prim_assembler_run(draw, prim_info, vert_info,
290 &ia_prim_info, &ia_vert_info);
291
292 if (ia_vert_info.count) {
293 FREE(vert_info->verts);
294 vert_info = &ia_vert_info;
295 prim_info = &ia_prim_info;
296 free_prim_info = TRUE;
297 }
298 }
299 }
300 if (prim_info->count == 0) {
301 debug_printf("GS/IA didn't emit any vertices!\n");
302
303 FREE(vert_info->verts);
304 if (free_prim_info) {
305 FREE(prim_info->primitive_lengths);
306 }
307 return;
308 }
309
310
311 /* Stream output needs to be done before clipping.
312 *
313 * XXX: Stream output surely needs to respect the prim_info->elt
314 * lists.
315 */
316 draw_pt_so_emit( fpme->so_emit, vert_info, prim_info );
317
318 draw_stats_clipper_primitives(draw, prim_info);
319
320 /*
321 * if there's no position, need to stop now, or the latter stages
322 * will try to access non-existent position output.
323 */
324 if (draw_current_shader_position_output(draw) != -1) {
325
326 if (draw_pt_post_vs_run( fpme->post_vs, vert_info, prim_info ))
327 {
328 opt |= PT_PIPELINE;
329 }
330
331 /* Do we need to run the pipeline?
332 */
333 if (opt & PT_PIPELINE) {
334 pipeline( fpme, vert_info, prim_info );
335 }
336 else {
337 emit( fpme->emit, vert_info, prim_info );
338 }
339 }
340 FREE(vert_info->verts);
341 if (free_prim_info) {
342 FREE(prim_info->primitive_lengths);
343 }
344 }
345
346 static void fetch_pipeline_run( struct draw_pt_middle_end *middle,
347 const unsigned *fetch_elts,
348 unsigned fetch_count,
349 const ushort *draw_elts,
350 unsigned draw_count,
351 unsigned prim_flags )
352 {
353 struct fetch_pipeline_middle_end *fpme = (struct fetch_pipeline_middle_end *)middle;
354 struct draw_fetch_info fetch_info;
355 struct draw_prim_info prim_info;
356
357 fetch_info.linear = FALSE;
358 fetch_info.start = 0;
359 fetch_info.elts = fetch_elts;
360 fetch_info.count = fetch_count;
361
362 prim_info.linear = FALSE;
363 prim_info.start = 0;
364 prim_info.count = draw_count;
365 prim_info.elts = draw_elts;
366 prim_info.prim = fpme->input_prim;
367 prim_info.flags = prim_flags;
368 prim_info.primitive_count = 1;
369 prim_info.primitive_lengths = &draw_count;
370
371 fetch_pipeline_generic( middle, &fetch_info, &prim_info );
372 }
373
374
375 static void fetch_pipeline_linear_run( struct draw_pt_middle_end *middle,
376 unsigned start,
377 unsigned count,
378 unsigned prim_flags)
379 {
380 struct fetch_pipeline_middle_end *fpme = (struct fetch_pipeline_middle_end *)middle;
381 struct draw_fetch_info fetch_info;
382 struct draw_prim_info prim_info;
383
384 fetch_info.linear = TRUE;
385 fetch_info.start = start;
386 fetch_info.count = count;
387 fetch_info.elts = NULL;
388
389 prim_info.linear = TRUE;
390 prim_info.start = 0;
391 prim_info.count = count;
392 prim_info.elts = NULL;
393 prim_info.prim = fpme->input_prim;
394 prim_info.flags = prim_flags;
395 prim_info.primitive_count = 1;
396 prim_info.primitive_lengths = &count;
397
398 fetch_pipeline_generic( middle, &fetch_info, &prim_info );
399 }
400
401
402
403 static boolean fetch_pipeline_linear_run_elts( struct draw_pt_middle_end *middle,
404 unsigned start,
405 unsigned count,
406 const ushort *draw_elts,
407 unsigned draw_count,
408 unsigned prim_flags )
409 {
410 struct fetch_pipeline_middle_end *fpme = (struct fetch_pipeline_middle_end *)middle;
411 struct draw_fetch_info fetch_info;
412 struct draw_prim_info prim_info;
413
414 fetch_info.linear = TRUE;
415 fetch_info.start = start;
416 fetch_info.count = count;
417 fetch_info.elts = NULL;
418
419 prim_info.linear = FALSE;
420 prim_info.start = 0;
421 prim_info.count = draw_count;
422 prim_info.elts = draw_elts;
423 prim_info.prim = fpme->input_prim;
424 prim_info.flags = prim_flags;
425 prim_info.primitive_count = 1;
426 prim_info.primitive_lengths = &draw_count;
427
428 fetch_pipeline_generic( middle, &fetch_info, &prim_info );
429
430 return TRUE;
431 }
432
433
434
/**
 * finish hook for this middle end; there is nothing to do.
 */
static void
fetch_pipeline_finish(struct draw_pt_middle_end *middle)
{
   (void) middle;
}
439
440 static void fetch_pipeline_destroy( struct draw_pt_middle_end *middle )
441 {
442 struct fetch_pipeline_middle_end *fpme = (struct fetch_pipeline_middle_end *)middle;
443
444 if (fpme->fetch)
445 draw_pt_fetch_destroy( fpme->fetch );
446
447 if (fpme->emit)
448 draw_pt_emit_destroy( fpme->emit );
449
450 if (fpme->so_emit)
451 draw_pt_so_emit_destroy( fpme->so_emit );
452
453 if (fpme->post_vs)
454 draw_pt_post_vs_destroy( fpme->post_vs );
455
456 FREE(middle);
457 }
458
459
460 struct draw_pt_middle_end *draw_pt_fetch_pipeline_or_emit( struct draw_context *draw )
461 {
462 struct fetch_pipeline_middle_end *fpme = CALLOC_STRUCT( fetch_pipeline_middle_end );
463 if (!fpme)
464 goto fail;
465
466 fpme->base.prepare = fetch_pipeline_prepare;
467 fpme->base.bind_parameters = fetch_pipeline_bind_parameters;
468 fpme->base.run = fetch_pipeline_run;
469 fpme->base.run_linear = fetch_pipeline_linear_run;
470 fpme->base.run_linear_elts = fetch_pipeline_linear_run_elts;
471 fpme->base.finish = fetch_pipeline_finish;
472 fpme->base.destroy = fetch_pipeline_destroy;
473
474 fpme->draw = draw;
475
476 fpme->fetch = draw_pt_fetch_create( draw );
477 if (!fpme->fetch)
478 goto fail;
479
480 fpme->post_vs = draw_pt_post_vs_create( draw );
481 if (!fpme->post_vs)
482 goto fail;
483
484 fpme->emit = draw_pt_emit_create( draw );
485 if (!fpme->emit)
486 goto fail;
487
488 fpme->so_emit = draw_pt_so_emit_create( draw );
489 if (!fpme->so_emit)
490 goto fail;
491
492 return &fpme->base;
493
494 fail:
495 if (fpme)
496 fetch_pipeline_destroy( &fpme->base );
497
498 return NULL;
499 }