llvmpipe: add support for nested / overlapping queries
[mesa.git] / src / gallium / drivers / llvmpipe / lp_setup.c
1 /**************************************************************************
2 *
3 * Copyright 2007 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /**
29 * Tiling engine.
30 *
31 * Builds per-tile display lists and executes them on calls to
32 * lp_setup_flush().
33 */
34
35 #include <limits.h>
36
37 #include "pipe/p_defines.h"
38 #include "util/u_framebuffer.h"
39 #include "util/u_inlines.h"
40 #include "util/u_memory.h"
41 #include "util/u_pack_color.h"
42 #include "draw/draw_pipe.h"
43 #include "lp_context.h"
44 #include "lp_memory.h"
45 #include "lp_scene.h"
46 #include "lp_texture.h"
47 #include "lp_debug.h"
48 #include "lp_fence.h"
49 #include "lp_query.h"
50 #include "lp_rast.h"
51 #include "lp_setup_context.h"
52 #include "lp_screen.h"
53 #include "lp_state.h"
54 #include "state_tracker/sw_winsys.h"
55
56 #include "draw/draw_context.h"
57 #include "draw/draw_vbuf.h"
58
59
60 static boolean set_scene_state( struct lp_setup_context *, enum setup_state,
61 const char *reason);
62 static boolean try_update_scene_state( struct lp_setup_context *setup );
63
64
65 static void
66 lp_setup_get_empty_scene(struct lp_setup_context *setup)
67 {
68 struct llvmpipe_context *lp = llvmpipe_context(setup->pipe);
69 boolean discard = lp->rasterizer ? lp->rasterizer->rasterizer_discard : FALSE;
70
71 assert(setup->scene == NULL);
72
73 setup->scene_idx++;
74 setup->scene_idx %= Elements(setup->scenes);
75
76 setup->scene = setup->scenes[setup->scene_idx];
77
78 if (setup->scene->fence) {
79 if (LP_DEBUG & DEBUG_SETUP)
80 debug_printf("%s: wait for scene %d\n",
81 __FUNCTION__, setup->scene->fence->id);
82
83 lp_fence_wait(setup->scene->fence);
84 }
85
86 lp_scene_begin_binning(setup->scene, &setup->fb, discard);
87
88 }
89
90
91 static void
92 first_triangle( struct lp_setup_context *setup,
93 const float (*v0)[4],
94 const float (*v1)[4],
95 const float (*v2)[4])
96 {
97 assert(setup->state == SETUP_ACTIVE);
98 lp_setup_choose_triangle( setup );
99 setup->triangle( setup, v0, v1, v2 );
100 }
101
102 static void
103 first_line( struct lp_setup_context *setup,
104 const float (*v0)[4],
105 const float (*v1)[4])
106 {
107 assert(setup->state == SETUP_ACTIVE);
108 lp_setup_choose_line( setup );
109 setup->line( setup, v0, v1 );
110 }
111
112 static void
113 first_point( struct lp_setup_context *setup,
114 const float (*v0)[4])
115 {
116 assert(setup->state == SETUP_ACTIVE);
117 lp_setup_choose_point( setup );
118 setup->point( setup, v0 );
119 }
120
121 void lp_setup_reset( struct lp_setup_context *setup )
122 {
123 unsigned i;
124
125 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
126
127 /* Reset derived state */
128 for (i = 0; i < Elements(setup->constants); ++i) {
129 setup->constants[i].stored_size = 0;
130 setup->constants[i].stored_data = NULL;
131 }
132 setup->fs.stored = NULL;
133 setup->dirty = ~0;
134
135 /* no current bin */
136 setup->scene = NULL;
137
138 /* Reset some state:
139 */
140 memset(&setup->clear, 0, sizeof setup->clear);
141
142 /* Have an explicit "start-binning" call and get rid of this
143 * pointer twiddling?
144 */
145 setup->line = first_line;
146 setup->point = first_point;
147 setup->triangle = first_triangle;
148 }
149
150
151 /** Rasterize all scene's bins */
152 static void
153 lp_setup_rasterize_scene( struct lp_setup_context *setup )
154 {
155 struct lp_scene *scene = setup->scene;
156 struct llvmpipe_screen *screen = llvmpipe_screen(scene->pipe->screen);
157
158 scene->num_active_queries = setup->active_binned_queries;
159 memcpy(scene->active_queries, setup->active_queries,
160 scene->num_active_queries * sizeof(scene->active_queries[0]));
161
162 lp_scene_end_binning(scene);
163
164 lp_fence_reference(&setup->last_fence, scene->fence);
165
166 if (setup->last_fence)
167 setup->last_fence->issued = TRUE;
168
169 pipe_mutex_lock(screen->rast_mutex);
170 lp_rast_queue_scene(screen->rast, scene);
171 lp_rast_finish(screen->rast);
172 pipe_mutex_unlock(screen->rast_mutex);
173
174 lp_scene_end_rasterization(setup->scene);
175 lp_setup_reset( setup );
176
177 LP_DBG(DEBUG_SETUP, "%s done \n", __FUNCTION__);
178 }
179
180
181
182 static boolean
183 begin_binning( struct lp_setup_context *setup )
184 {
185 struct lp_scene *scene = setup->scene;
186 boolean need_zsload = FALSE;
187 boolean ok;
188
189 assert(scene);
190 assert(scene->fence == NULL);
191
192 /* Always create a fence:
193 */
194 scene->fence = lp_fence_create(MAX2(1, setup->num_threads));
195 if (!scene->fence)
196 return FALSE;
197
198 ok = try_update_scene_state(setup);
199 if (!ok)
200 return FALSE;
201
202 if (setup->fb.zsbuf &&
203 ((setup->clear.flags & PIPE_CLEAR_DEPTHSTENCIL) != PIPE_CLEAR_DEPTHSTENCIL) &&
204 util_format_is_depth_and_stencil(setup->fb.zsbuf->format))
205 need_zsload = TRUE;
206
207 LP_DBG(DEBUG_SETUP, "%s color: %s depth: %s\n", __FUNCTION__,
208 (setup->clear.flags & PIPE_CLEAR_COLOR) ? "clear": "load",
209 need_zsload ? "clear": "load");
210
211 if (setup->fb.nr_cbufs) {
212 if (setup->clear.flags & PIPE_CLEAR_COLOR) {
213 ok = lp_scene_bin_everywhere( scene,
214 LP_RAST_OP_CLEAR_COLOR,
215 setup->clear.color );
216 if (!ok)
217 return FALSE;
218 }
219 }
220
221 if (setup->fb.zsbuf) {
222 if (setup->clear.flags & PIPE_CLEAR_DEPTHSTENCIL) {
223 if (!need_zsload)
224 scene->has_depthstencil_clear = TRUE;
225
226 ok = lp_scene_bin_everywhere( scene,
227 LP_RAST_OP_CLEAR_ZSTENCIL,
228 lp_rast_arg_clearzs(
229 setup->clear.zsvalue,
230 setup->clear.zsmask));
231 if (!ok)
232 return FALSE;
233 }
234 }
235
236 setup->clear.flags = 0;
237 setup->clear.zsmask = 0;
238 setup->clear.zsvalue = 0;
239
240 LP_DBG(DEBUG_SETUP, "%s done\n", __FUNCTION__);
241 return TRUE;
242 }
243
244
245 /* This basically bins and then flushes any outstanding full-screen
246 * clears.
247 *
248 * TODO: fast path for fullscreen clears and no triangles.
249 */
250 static boolean
251 execute_clears( struct lp_setup_context *setup )
252 {
253 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
254
255 return begin_binning( setup );
256 }
257
/*
 * Printable names for the setup states, indexed by state value.  Only used
 * for debug output in this file, so keep it file-local and read-only rather
 * than exporting a mutable global with such a generic name.
 */
static const char *const states[] = {
   "FLUSHED",
   "CLEARED",
   "ACTIVE "
};
263
264
265 static boolean
266 set_scene_state( struct lp_setup_context *setup,
267 enum setup_state new_state,
268 const char *reason)
269 {
270 unsigned old_state = setup->state;
271
272 if (old_state == new_state)
273 return TRUE;
274
275 if (LP_DEBUG & DEBUG_SCENE) {
276 debug_printf("%s old %s new %s%s%s\n",
277 __FUNCTION__,
278 states[old_state],
279 states[new_state],
280 (new_state == SETUP_FLUSHED) ? ": " : "",
281 (new_state == SETUP_FLUSHED) ? reason : "");
282
283 if (new_state == SETUP_FLUSHED && setup->scene)
284 lp_debug_draw_bins_by_cmd_length(setup->scene);
285 }
286
287 /* wait for a free/empty scene
288 */
289 if (old_state == SETUP_FLUSHED)
290 lp_setup_get_empty_scene(setup);
291
292 switch (new_state) {
293 case SETUP_CLEARED:
294 break;
295
296 case SETUP_ACTIVE:
297 if (!begin_binning( setup ))
298 goto fail;
299 break;
300
301 case SETUP_FLUSHED:
302 if (old_state == SETUP_CLEARED)
303 if (!execute_clears( setup ))
304 goto fail;
305
306 lp_setup_rasterize_scene( setup );
307 assert(setup->scene == NULL);
308 break;
309
310 default:
311 assert(0 && "invalid setup state mode");
312 goto fail;
313 }
314
315 setup->state = new_state;
316 return TRUE;
317
318 fail:
319 if (setup->scene) {
320 lp_scene_end_rasterization(setup->scene);
321 setup->scene = NULL;
322 }
323
324 setup->state = SETUP_FLUSHED;
325 lp_setup_reset( setup );
326 return FALSE;
327 }
328
329
330 void
331 lp_setup_flush( struct lp_setup_context *setup,
332 struct pipe_fence_handle **fence,
333 const char *reason)
334 {
335 set_scene_state( setup, SETUP_FLUSHED, reason );
336
337 if (fence) {
338 lp_fence_reference((struct lp_fence **)fence, setup->last_fence);
339 }
340 }
341
342
343 void
344 lp_setup_bind_framebuffer( struct lp_setup_context *setup,
345 const struct pipe_framebuffer_state *fb )
346 {
347 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
348
349 /* Flush any old scene.
350 */
351 set_scene_state( setup, SETUP_FLUSHED, __FUNCTION__ );
352
353 /*
354 * Ensure the old scene is not reused.
355 */
356 assert(!setup->scene);
357
358 /* Set new state. This will be picked up later when we next need a
359 * scene.
360 */
361 util_copy_framebuffer_state(&setup->fb, fb);
362 setup->framebuffer.x0 = 0;
363 setup->framebuffer.y0 = 0;
364 setup->framebuffer.x1 = fb->width-1;
365 setup->framebuffer.y1 = fb->height-1;
366 setup->dirty |= LP_SETUP_NEW_SCISSOR;
367 }
368
369
370 static boolean
371 lp_setup_try_clear( struct lp_setup_context *setup,
372 const union pipe_color_union *color,
373 double depth,
374 unsigned stencil,
375 unsigned flags )
376 {
377 uint64_t zsmask = 0;
378 uint64_t zsvalue = 0;
379 union lp_rast_cmd_arg color_arg;
380 unsigned i;
381
382 LP_DBG(DEBUG_SETUP, "%s state %d\n", __FUNCTION__, setup->state);
383
384 if (flags & PIPE_CLEAR_COLOR) {
385 for (i = 0; i < 4; i++)
386 color_arg.clear_color.i[i] = color->i[i];
387 }
388
389 if (flags & PIPE_CLEAR_DEPTHSTENCIL) {
390 uint32_t zmask = (flags & PIPE_CLEAR_DEPTH) ? ~0 : 0;
391 uint8_t smask = (flags & PIPE_CLEAR_STENCIL) ? ~0 : 0;
392
393 zsvalue = util_pack64_z_stencil(setup->fb.zsbuf->format,
394 depth,
395 stencil);
396
397
398 zsmask = util_pack64_mask_z_stencil(setup->fb.zsbuf->format,
399 zmask,
400 smask);
401
402 zsvalue &= zsmask;
403 }
404
405 if (setup->state == SETUP_ACTIVE) {
406 struct lp_scene *scene = setup->scene;
407
408 /* Add the clear to existing scene. In the unusual case where
409 * both color and depth-stencil are being cleared when there's
410 * already been some rendering, we could discard the currently
411 * binned scene and start again, but I don't see that as being
412 * a common usage.
413 */
414 if (flags & PIPE_CLEAR_COLOR) {
415 if (!lp_scene_bin_everywhere( scene,
416 LP_RAST_OP_CLEAR_COLOR,
417 color_arg ))
418 return FALSE;
419 }
420
421 if (flags & PIPE_CLEAR_DEPTHSTENCIL) {
422 if (!lp_scene_bin_everywhere( scene,
423 LP_RAST_OP_CLEAR_ZSTENCIL,
424 lp_rast_arg_clearzs(zsvalue, zsmask) ))
425 return FALSE;
426 }
427 }
428 else {
429 /* Put ourselves into the 'pre-clear' state, specifically to try
430 * and accumulate multiple clears to color and depth_stencil
431 * buffers which the app or state-tracker might issue
432 * separately.
433 */
434 set_scene_state( setup, SETUP_CLEARED, __FUNCTION__ );
435
436 setup->clear.flags |= flags;
437
438 if (flags & PIPE_CLEAR_DEPTHSTENCIL) {
439 setup->clear.zsmask |= zsmask;
440 setup->clear.zsvalue =
441 (setup->clear.zsvalue & ~zsmask) | (zsvalue & zsmask);
442 }
443
444 if (flags & PIPE_CLEAR_COLOR) {
445 memcpy(&setup->clear.color.clear_color,
446 &color_arg,
447 sizeof setup->clear.color.clear_color);
448 }
449 }
450
451 return TRUE;
452 }
453
454 void
455 lp_setup_clear( struct lp_setup_context *setup,
456 const union pipe_color_union *color,
457 double depth,
458 unsigned stencil,
459 unsigned flags )
460 {
461 if (!lp_setup_try_clear( setup, color, depth, stencil, flags )) {
462 lp_setup_flush(setup, NULL, __FUNCTION__);
463
464 if (!lp_setup_try_clear( setup, color, depth, stencil, flags ))
465 assert(0);
466 }
467 }
468
469
470
471
472
473 void
474 lp_setup_set_triangle_state( struct lp_setup_context *setup,
475 unsigned cull_mode,
476 boolean ccw_is_frontface,
477 boolean scissor,
478 boolean half_pixel_center,
479 boolean bottom_edge_rule)
480 {
481 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
482
483 setup->ccw_is_frontface = ccw_is_frontface;
484 setup->cullmode = cull_mode;
485 setup->triangle = first_triangle;
486 setup->pixel_offset = half_pixel_center ? 0.5f : 0.0f;
487 setup->bottom_edge_rule = bottom_edge_rule;
488
489 if (setup->scissor_test != scissor) {
490 setup->dirty |= LP_SETUP_NEW_SCISSOR;
491 setup->scissor_test = scissor;
492 }
493 }
494
495 void
496 lp_setup_set_line_state( struct lp_setup_context *setup,
497 float line_width)
498 {
499 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
500
501 setup->line_width = line_width;
502 }
503
504 void
505 lp_setup_set_point_state( struct lp_setup_context *setup,
506 float point_size,
507 boolean point_size_per_vertex,
508 uint sprite_coord_enable,
509 uint sprite_coord_origin)
510 {
511 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
512
513 setup->point_size = point_size;
514 setup->sprite_coord_enable = sprite_coord_enable;
515 setup->sprite_coord_origin = sprite_coord_origin;
516 setup->point_size_per_vertex = point_size_per_vertex;
517 }
518
519 void
520 lp_setup_set_setup_variant( struct lp_setup_context *setup,
521 const struct lp_setup_variant *variant)
522 {
523 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
524
525 setup->setup.variant = variant;
526 }
527
528 void
529 lp_setup_set_fs_variant( struct lp_setup_context *setup,
530 struct lp_fragment_shader_variant *variant)
531 {
532 LP_DBG(DEBUG_SETUP, "%s %p\n", __FUNCTION__,
533 variant);
534 /* FIXME: reference count */
535
536 setup->fs.current.variant = variant;
537 setup->dirty |= LP_SETUP_NEW_FS;
538 }
539
540 void
541 lp_setup_set_fs_constants(struct lp_setup_context *setup,
542 unsigned num,
543 struct pipe_constant_buffer *buffers)
544 {
545 unsigned i;
546
547 LP_DBG(DEBUG_SETUP, "%s %p\n", __FUNCTION__, (void *) buffers);
548
549 assert(num <= Elements(setup->constants));
550
551 for (i = 0; i < num; ++i) {
552 util_copy_constant_buffer(&setup->constants[i].current, &buffers[i]);
553 }
554 for (; i < Elements(setup->constants); i++) {
555 util_copy_constant_buffer(&setup->constants[i].current, NULL);
556 }
557 setup->dirty |= LP_SETUP_NEW_CONSTANTS;
558 }
559
560
561 void
562 lp_setup_set_alpha_ref_value( struct lp_setup_context *setup,
563 float alpha_ref_value )
564 {
565 LP_DBG(DEBUG_SETUP, "%s %f\n", __FUNCTION__, alpha_ref_value);
566
567 if(setup->fs.current.jit_context.alpha_ref_value != alpha_ref_value) {
568 setup->fs.current.jit_context.alpha_ref_value = alpha_ref_value;
569 setup->dirty |= LP_SETUP_NEW_FS;
570 }
571 }
572
573 void
574 lp_setup_set_stencil_ref_values( struct lp_setup_context *setup,
575 const ubyte refs[2] )
576 {
577 LP_DBG(DEBUG_SETUP, "%s %d %d\n", __FUNCTION__, refs[0], refs[1]);
578
579 if (setup->fs.current.jit_context.stencil_ref_front != refs[0] ||
580 setup->fs.current.jit_context.stencil_ref_back != refs[1]) {
581 setup->fs.current.jit_context.stencil_ref_front = refs[0];
582 setup->fs.current.jit_context.stencil_ref_back = refs[1];
583 setup->dirty |= LP_SETUP_NEW_FS;
584 }
585 }
586
587 void
588 lp_setup_set_blend_color( struct lp_setup_context *setup,
589 const struct pipe_blend_color *blend_color )
590 {
591 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
592
593 assert(blend_color);
594
595 if(memcmp(&setup->blend_color.current, blend_color, sizeof *blend_color) != 0) {
596 memcpy(&setup->blend_color.current, blend_color, sizeof *blend_color);
597 setup->dirty |= LP_SETUP_NEW_BLEND_COLOR;
598 }
599 }
600
601
602 void
603 lp_setup_set_scissors( struct lp_setup_context *setup,
604 const struct pipe_scissor_state *scissors )
605 {
606 unsigned i;
607 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
608
609 assert(scissors);
610
611 for (i = 0; i < PIPE_MAX_VIEWPORTS; ++i) {
612 setup->scissors[i].x0 = scissors[i].minx;
613 setup->scissors[i].x1 = scissors[i].maxx-1;
614 setup->scissors[i].y0 = scissors[i].miny;
615 setup->scissors[i].y1 = scissors[i].maxy-1;
616 }
617 setup->dirty |= LP_SETUP_NEW_SCISSOR;
618 }
619
620
621 void
622 lp_setup_set_flatshade_first( struct lp_setup_context *setup,
623 boolean flatshade_first )
624 {
625 setup->flatshade_first = flatshade_first;
626 }
627
628 void
629 lp_setup_set_rasterizer_discard( struct lp_setup_context *setup,
630 boolean rasterizer_discard )
631 {
632 if (setup->rasterizer_discard != rasterizer_discard) {
633 setup->rasterizer_discard = rasterizer_discard;
634 set_scene_state( setup, SETUP_FLUSHED, __FUNCTION__ );
635 }
636 }
637
638 void
639 lp_setup_set_vertex_info( struct lp_setup_context *setup,
640 struct vertex_info *vertex_info )
641 {
642 /* XXX: just silently holding onto the pointer:
643 */
644 setup->vertex_info = vertex_info;
645 }
646
647
648 /**
649 * Called during state validation when LP_NEW_SAMPLER_VIEW is set.
650 */
651 void
652 lp_setup_set_fragment_sampler_views(struct lp_setup_context *setup,
653 unsigned num,
654 struct pipe_sampler_view **views)
655 {
656 unsigned i;
657
658 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
659
660 assert(num <= PIPE_MAX_SHADER_SAMPLER_VIEWS);
661
662 for (i = 0; i < PIPE_MAX_SHADER_SAMPLER_VIEWS; i++) {
663 struct pipe_sampler_view *view = i < num ? views[i] : NULL;
664
665 if (view) {
666 struct pipe_resource *res = view->texture;
667 struct llvmpipe_resource *lp_tex = llvmpipe_resource(res);
668 struct lp_jit_texture *jit_tex;
669 jit_tex = &setup->fs.current.jit_context.textures[i];
670
671 /* We're referencing the texture's internal data, so save a
672 * reference to it.
673 */
674 pipe_resource_reference(&setup->fs.current_tex[i], res);
675
676 if (!lp_tex->dt) {
677 /* regular texture - setup array of mipmap level offsets */
678 void *mip_ptr;
679 int j;
680 unsigned first_level = 0;
681 unsigned last_level = 0;
682
683 if (llvmpipe_resource_is_texture(res)) {
684 first_level = view->u.tex.first_level;
685 last_level = view->u.tex.last_level;
686 assert(first_level <= last_level);
687 assert(last_level <= res->last_level);
688
689 /*
690 * The complexity here should no longer be necessary.
691 */
692 mip_ptr = llvmpipe_get_texture_image_all(lp_tex, first_level,
693 LP_TEX_USAGE_READ);
694 jit_tex->base = lp_tex->linear_img.data;
695 }
696 else {
697 mip_ptr = lp_tex->data;
698 jit_tex->base = mip_ptr;
699 }
700
701 if ((LP_PERF & PERF_TEX_MEM) || !mip_ptr) {
702 /* out of memory - use dummy tile memory */
703 /* Note if using PERF_TEX_MEM will also skip tile conversion */
704 jit_tex->base = lp_dummy_tile;
705 jit_tex->width = TILE_SIZE/8;
706 jit_tex->height = TILE_SIZE/8;
707 jit_tex->depth = 1;
708 jit_tex->first_level = 0;
709 jit_tex->last_level = 0;
710 jit_tex->mip_offsets[0] = 0;
711 jit_tex->row_stride[0] = 0;
712 jit_tex->img_stride[0] = 0;
713 }
714 else {
715 jit_tex->width = res->width0;
716 jit_tex->height = res->height0;
717 jit_tex->depth = res->depth0;
718 jit_tex->first_level = first_level;
719 jit_tex->last_level = last_level;
720
721 if (llvmpipe_resource_is_texture(res)) {
722 for (j = first_level; j <= last_level; j++) {
723 mip_ptr = llvmpipe_get_texture_image_all(lp_tex, j,
724 LP_TEX_USAGE_READ);
725 jit_tex->mip_offsets[j] = (uint8_t *)mip_ptr - (uint8_t *)jit_tex->base;
726 /*
727 * could get mip offset directly but need call above to
728 * invoke tiled->linear conversion.
729 */
730 assert(lp_tex->linear_mip_offsets[j] == jit_tex->mip_offsets[j]);
731 jit_tex->row_stride[j] = lp_tex->row_stride[j];
732 jit_tex->img_stride[j] = lp_tex->img_stride[j];
733 }
734
735 if (res->target == PIPE_TEXTURE_1D_ARRAY ||
736 res->target == PIPE_TEXTURE_2D_ARRAY) {
737 /*
738 * For array textures, we don't have first_layer, instead
739 * adjust last_layer (stored as depth) plus the mip level offsets
740 * (as we have mip-first layout can't just adjust base ptr).
741 * XXX For mip levels, could do something similar.
742 */
743 jit_tex->depth = view->u.tex.last_layer - view->u.tex.first_layer + 1;
744 for (j = first_level; j <= last_level; j++) {
745 jit_tex->mip_offsets[j] += view->u.tex.first_layer *
746 lp_tex->img_stride[j];
747 }
748 assert(view->u.tex.first_layer <= view->u.tex.last_layer);
749 assert(view->u.tex.last_layer < res->array_size);
750 }
751 }
752 else {
753 /*
754 * For buffers, we don't have first_element, instead adjust
755 * last_element (stored as width) plus the base pointer.
756 */
757 unsigned view_blocksize = util_format_get_blocksize(view->format);
758 /* probably don't really need to fill that out */
759 jit_tex->mip_offsets[0] = 0;
760 jit_tex->row_stride[0] = 0;
761 jit_tex->row_stride[0] = 0;
762
763 /* everything specified in number of elements here. */
764 jit_tex->width = view->u.buf.last_element - view->u.buf.first_element + 1;
765 jit_tex->base = (uint8_t *)jit_tex->base + view->u.buf.first_element *
766 view_blocksize;
767 /* XXX Unsure if we need to sanitize parameters? */
768 assert(view->u.buf.first_element <= view->u.buf.last_element);
769 assert(view->u.buf.last_element * view_blocksize < res->width0);
770 }
771 }
772 }
773 else {
774 /* display target texture/surface */
775 /*
776 * XXX: Where should this be unmapped?
777 */
778 struct llvmpipe_screen *screen = llvmpipe_screen(res->screen);
779 struct sw_winsys *winsys = screen->winsys;
780 jit_tex->base = winsys->displaytarget_map(winsys, lp_tex->dt,
781 PIPE_TRANSFER_READ);
782 jit_tex->row_stride[0] = lp_tex->row_stride[0];
783 jit_tex->img_stride[0] = lp_tex->img_stride[0];
784 jit_tex->mip_offsets[0] = 0;
785 jit_tex->width = res->width0;
786 jit_tex->height = res->height0;
787 jit_tex->depth = res->depth0;
788 jit_tex->first_level = jit_tex->last_level = 0;
789 assert(jit_tex->base);
790 }
791 }
792 }
793
794 setup->dirty |= LP_SETUP_NEW_FS;
795 }
796
797
798 /**
799 * Called during state validation when LP_NEW_SAMPLER is set.
800 */
801 void
802 lp_setup_set_fragment_sampler_state(struct lp_setup_context *setup,
803 unsigned num,
804 struct pipe_sampler_state **samplers)
805 {
806 unsigned i;
807
808 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
809
810 assert(num <= PIPE_MAX_SAMPLERS);
811
812 for (i = 0; i < PIPE_MAX_SAMPLERS; i++) {
813 const struct pipe_sampler_state *sampler = i < num ? samplers[i] : NULL;
814
815 if (sampler) {
816 struct lp_jit_sampler *jit_sam;
817 jit_sam = &setup->fs.current.jit_context.samplers[i];
818
819 jit_sam->min_lod = sampler->min_lod;
820 jit_sam->max_lod = sampler->max_lod;
821 jit_sam->lod_bias = sampler->lod_bias;
822 COPY_4V(jit_sam->border_color, sampler->border_color.f);
823 }
824 }
825
826 setup->dirty |= LP_SETUP_NEW_FS;
827 }
828
829
830 /**
831 * Is the given texture referenced by any scene?
832 * Note: we have to check all scenes including any scenes currently
833 * being rendered and the current scene being built.
834 */
835 unsigned
836 lp_setup_is_resource_referenced( const struct lp_setup_context *setup,
837 const struct pipe_resource *texture )
838 {
839 unsigned i;
840
841 /* check the render targets */
842 for (i = 0; i < setup->fb.nr_cbufs; i++) {
843 if (setup->fb.cbufs[i]->texture == texture)
844 return LP_REFERENCED_FOR_READ | LP_REFERENCED_FOR_WRITE;
845 }
846 if (setup->fb.zsbuf && setup->fb.zsbuf->texture == texture) {
847 return LP_REFERENCED_FOR_READ | LP_REFERENCED_FOR_WRITE;
848 }
849
850 /* check textures referenced by the scene */
851 for (i = 0; i < Elements(setup->scenes); i++) {
852 if (lp_scene_is_resource_referenced(setup->scenes[i], texture)) {
853 return LP_REFERENCED_FOR_READ;
854 }
855 }
856
857 return LP_UNREFERENCED;
858 }
859
860
861 /**
862 * Called by vbuf code when we're about to draw something.
863 */
864 static boolean
865 try_update_scene_state( struct lp_setup_context *setup )
866 {
867 boolean new_scene = (setup->fs.stored == NULL);
868 struct lp_scene *scene = setup->scene;
869 unsigned i;
870
871 assert(scene);
872
873 if(setup->dirty & LP_SETUP_NEW_BLEND_COLOR) {
874 uint8_t *stored;
875 float* fstored;
876 unsigned i, j;
877 unsigned size;
878
879 /* Alloc u8_blend_color (16 x i8) and f_blend_color (4 or 8 x f32) */
880 size = 4 * 16 * sizeof(uint8_t);
881 size += (LP_MAX_VECTOR_LENGTH / 4) * sizeof(float);
882 stored = lp_scene_alloc_aligned(scene, size, LP_MAX_VECTOR_LENGTH);
883
884 if (!stored) {
885 assert(!new_scene);
886 return FALSE;
887 }
888
889 /* Store floating point colour */
890 fstored = (float*)(stored + 4*16);
891 for (i = 0; i < (LP_MAX_VECTOR_LENGTH / 4); ++i) {
892 fstored[i] = setup->blend_color.current.color[i % 4];
893 }
894
895 /* smear each blend color component across 16 ubyte elements */
896 for (i = 0; i < 4; ++i) {
897 uint8_t c = float_to_ubyte(setup->blend_color.current.color[i]);
898 for (j = 0; j < 16; ++j)
899 stored[i*16 + j] = c;
900 }
901
902 setup->blend_color.stored = stored;
903 setup->fs.current.jit_context.u8_blend_color = stored;
904 setup->fs.current.jit_context.f_blend_color = fstored;
905 setup->dirty |= LP_SETUP_NEW_FS;
906 }
907
908 if (setup->dirty & LP_SETUP_NEW_CONSTANTS) {
909 for (i = 0; i < Elements(setup->constants); ++i) {
910 struct pipe_resource *buffer = setup->constants[i].current.buffer;
911 const unsigned current_size = setup->constants[i].current.buffer_size;
912 const ubyte *current_data = NULL;
913
914 if (buffer) {
915 /* resource buffer */
916 current_data = (ubyte *) llvmpipe_resource_data(buffer);
917 }
918 else if (setup->constants[i].current.user_buffer) {
919 /* user-space buffer */
920 current_data = (ubyte *) setup->constants[i].current.user_buffer;
921 }
922
923 if (current_data) {
924 current_data += setup->constants[i].current.buffer_offset;
925
926 /* TODO: copy only the actually used constants? */
927
928 if (setup->constants[i].stored_size != current_size ||
929 !setup->constants[i].stored_data ||
930 memcmp(setup->constants[i].stored_data,
931 current_data,
932 current_size) != 0) {
933 void *stored;
934
935 stored = lp_scene_alloc(scene, current_size);
936 if (!stored) {
937 assert(!new_scene);
938 return FALSE;
939 }
940
941 memcpy(stored,
942 current_data,
943 current_size);
944 setup->constants[i].stored_size = current_size;
945 setup->constants[i].stored_data = stored;
946 }
947 }
948 else {
949 setup->constants[i].stored_size = 0;
950 setup->constants[i].stored_data = NULL;
951 }
952
953 setup->fs.current.jit_context.constants[i] = setup->constants[i].stored_data;
954 setup->dirty |= LP_SETUP_NEW_FS;
955 }
956 }
957
958
959 if (setup->dirty & LP_SETUP_NEW_FS) {
960 if (!setup->fs.stored ||
961 memcmp(setup->fs.stored,
962 &setup->fs.current,
963 sizeof setup->fs.current) != 0)
964 {
965 struct lp_rast_state *stored;
966
967 /* The fs state that's been stored in the scene is different from
968 * the new, current state. So allocate a new lp_rast_state object
969 * and append it to the bin's setup data buffer.
970 */
971 stored = (struct lp_rast_state *) lp_scene_alloc(scene, sizeof *stored);
972 if (!stored) {
973 assert(!new_scene);
974 return FALSE;
975 }
976
977 memcpy(stored,
978 &setup->fs.current,
979 sizeof setup->fs.current);
980 setup->fs.stored = stored;
981
982 /* The scene now references the textures in the rasterization
983 * state record. Note that now.
984 */
985 for (i = 0; i < Elements(setup->fs.current_tex); i++) {
986 if (setup->fs.current_tex[i]) {
987 if (!lp_scene_add_resource_reference(scene,
988 setup->fs.current_tex[i],
989 new_scene)) {
990 assert(!new_scene);
991 return FALSE;
992 }
993 }
994 }
995 }
996 }
997
998 if (setup->dirty & LP_SETUP_NEW_SCISSOR) {
999 unsigned i;
1000 for (i = 0; i < PIPE_MAX_VIEWPORTS; ++i) {
1001 setup->draw_regions[i] = setup->framebuffer;
1002 if (setup->scissor_test) {
1003 u_rect_possible_intersection(&setup->scissors[i],
1004 &setup->draw_regions[i]);
1005 }
1006 }
1007 /* If the framebuffer is large we have to think about fixed-point
1008 * integer overflow. For 2K by 2K images, coordinates need 15 bits
1009 * (2^11 + 4 subpixel bits). The product of two such numbers would
1010 * use 30 bits. Any larger and we could overflow a 32-bit int.
1011 *
1012 * To cope with this problem we check if triangles are large and
1013 * subdivide them if needed.
1014 */
1015 setup->subdivide_large_triangles = (setup->fb.width > 2048 &&
1016 setup->fb.height > 2048);
1017 }
1018
1019 setup->dirty = 0;
1020
1021 assert(setup->fs.stored);
1022 return TRUE;
1023 }
1024
1025 boolean
1026 lp_setup_update_state( struct lp_setup_context *setup,
1027 boolean update_scene )
1028 {
1029 /* Some of the 'draw' pipeline stages may have changed some driver state.
1030 * Make sure we've processed those state changes before anything else.
1031 *
1032 * XXX this is the only place where llvmpipe_context is used in the
1033 * setup code. This may get refactored/changed...
1034 */
1035 {
1036 struct llvmpipe_context *lp = llvmpipe_context(setup->pipe);
1037 if (lp->dirty) {
1038 llvmpipe_update_derived(lp);
1039 }
1040
1041 if (lp->setup->dirty) {
1042 llvmpipe_update_setup(lp);
1043 }
1044
1045 assert(setup->setup.variant);
1046
1047 /* Will probably need to move this somewhere else, just need
1048 * to know about vertex shader point size attribute.
1049 */
1050 setup->psize = lp->psize_slot;
1051 setup->viewport_index_slot = lp->viewport_index_slot;
1052 setup->layer_slot = lp->layer_slot;
1053
1054 assert(lp->dirty == 0);
1055
1056 assert(lp->setup_variant.key.size ==
1057 setup->setup.variant->key.size);
1058
1059 assert(memcmp(&lp->setup_variant.key,
1060 &setup->setup.variant->key,
1061 setup->setup.variant->key.size) == 0);
1062 }
1063
1064 if (update_scene && setup->state != SETUP_ACTIVE) {
1065 if (!set_scene_state( setup, SETUP_ACTIVE, __FUNCTION__ ))
1066 return FALSE;
1067 }
1068
1069 /* Only call into update_scene_state() if we already have a
1070 * scene:
1071 */
1072 if (update_scene && setup->scene) {
1073 assert(setup->state == SETUP_ACTIVE);
1074
1075 if (try_update_scene_state(setup))
1076 return TRUE;
1077
1078 /* Update failed, try to restart the scene.
1079 *
1080 * Cannot call lp_setup_flush_and_restart() directly here
1081 * because of potential recursion.
1082 */
1083 if (!set_scene_state(setup, SETUP_FLUSHED, __FUNCTION__))
1084 return FALSE;
1085
1086 if (!set_scene_state(setup, SETUP_ACTIVE, __FUNCTION__))
1087 return FALSE;
1088
1089 if (!setup->scene)
1090 return FALSE;
1091
1092 return try_update_scene_state(setup);
1093 }
1094
1095 return TRUE;
1096 }
1097
1098
1099
1100 /* Only caller is lp_setup_vbuf_destroy()
1101 */
1102 void
1103 lp_setup_destroy( struct lp_setup_context *setup )
1104 {
1105 uint i;
1106
1107 lp_setup_reset( setup );
1108
1109 util_unreference_framebuffer_state(&setup->fb);
1110
1111 for (i = 0; i < Elements(setup->fs.current_tex); i++) {
1112 pipe_resource_reference(&setup->fs.current_tex[i], NULL);
1113 }
1114
1115 for (i = 0; i < Elements(setup->constants); i++) {
1116 pipe_resource_reference(&setup->constants[i].current.buffer, NULL);
1117 }
1118
1119 /* free the scenes in the 'empty' queue */
1120 for (i = 0; i < Elements(setup->scenes); i++) {
1121 struct lp_scene *scene = setup->scenes[i];
1122
1123 if (scene->fence)
1124 lp_fence_wait(scene->fence);
1125
1126 lp_scene_destroy(scene);
1127 }
1128
1129 lp_fence_reference(&setup->last_fence, NULL);
1130
1131 FREE( setup );
1132 }
1133
1134
1135 /**
1136 * Create a new primitive tiling engine. Plug it into the backend of
1137 * the draw module. Currently also creates a rasterizer to use with
1138 * it.
1139 */
1140 struct lp_setup_context *
1141 lp_setup_create( struct pipe_context *pipe,
1142 struct draw_context *draw )
1143 {
1144 struct llvmpipe_screen *screen = llvmpipe_screen(pipe->screen);
1145 struct lp_setup_context *setup;
1146 unsigned i;
1147
1148 setup = CALLOC_STRUCT(lp_setup_context);
1149 if (!setup) {
1150 goto no_setup;
1151 }
1152
1153 lp_setup_init_vbuf(setup);
1154
1155 /* Used only in update_state():
1156 */
1157 setup->pipe = pipe;
1158
1159
1160 setup->num_threads = screen->num_threads;
1161 setup->vbuf = draw_vbuf_stage(draw, &setup->base);
1162 if (!setup->vbuf) {
1163 goto no_vbuf;
1164 }
1165
1166 draw_set_rasterize_stage(draw, setup->vbuf);
1167 draw_set_render(draw, &setup->base);
1168
1169 /* create some empty scenes */
1170 for (i = 0; i < MAX_SCENES; i++) {
1171 setup->scenes[i] = lp_scene_create( pipe );
1172 if (!setup->scenes[i]) {
1173 goto no_scenes;
1174 }
1175 }
1176
1177 setup->triangle = first_triangle;
1178 setup->line = first_line;
1179 setup->point = first_point;
1180
1181 setup->dirty = ~0;
1182
1183 return setup;
1184
1185 no_scenes:
1186 for (i = 0; i < MAX_SCENES; i++) {
1187 if (setup->scenes[i]) {
1188 lp_scene_destroy(setup->scenes[i]);
1189 }
1190 }
1191
1192 setup->vbuf->destroy(setup->vbuf);
1193 no_vbuf:
1194 FREE(setup);
1195 no_setup:
1196 return NULL;
1197 }
1198
1199
1200 /**
1201 * Put a BeginQuery command into all bins.
1202 */
1203 void
1204 lp_setup_begin_query(struct lp_setup_context *setup,
1205 struct llvmpipe_query *pq)
1206 {
1207
1208 set_scene_state(setup, SETUP_ACTIVE, "begin_query");
1209
1210 if (!(pq->type == PIPE_QUERY_OCCLUSION_COUNTER ||
1211 pq->type == PIPE_QUERY_OCCLUSION_PREDICATE ||
1212 pq->type == PIPE_QUERY_PIPELINE_STATISTICS))
1213 return;
1214
1215 /* init the query to its beginning state */
1216 assert(setup->active_binned_queries < LP_MAX_ACTIVE_BINNED_QUERIES);
1217 /* exceeding list size so just ignore the query */
1218 if (setup->active_binned_queries >= LP_MAX_ACTIVE_BINNED_QUERIES) {
1219 return;
1220 }
1221 assert(setup->active_queries[setup->active_binned_queries] == NULL);
1222 setup->active_queries[setup->active_binned_queries] = pq;
1223 setup->active_binned_queries++;
1224
1225 assert(setup->scene);
1226 if (setup->scene) {
1227 if (!lp_scene_bin_everywhere(setup->scene,
1228 LP_RAST_OP_BEGIN_QUERY,
1229 lp_rast_arg_query(pq))) {
1230
1231 if (!lp_setup_flush_and_restart(setup))
1232 return;
1233
1234 if (!lp_scene_bin_everywhere(setup->scene,
1235 LP_RAST_OP_BEGIN_QUERY,
1236 lp_rast_arg_query(pq))) {
1237 return;
1238 }
1239 }
1240 }
1241 }
1242
1243
1244 /**
1245 * Put an EndQuery command into all bins.
1246 */
1247 void
1248 lp_setup_end_query(struct lp_setup_context *setup, struct llvmpipe_query *pq)
1249 {
1250 set_scene_state(setup, SETUP_ACTIVE, "end_query");
1251
1252 assert(setup->scene);
1253 if (setup->scene) {
1254 /* pq->fence should be the fence of the *last* scene which
1255 * contributed to the query result.
1256 */
1257 lp_fence_reference(&pq->fence, setup->scene->fence);
1258
1259 if (pq->type == PIPE_QUERY_OCCLUSION_COUNTER ||
1260 pq->type == PIPE_QUERY_OCCLUSION_PREDICATE ||
1261 pq->type == PIPE_QUERY_PIPELINE_STATISTICS ||
1262 pq->type == PIPE_QUERY_TIMESTAMP) {
1263 if (!lp_scene_bin_everywhere(setup->scene,
1264 LP_RAST_OP_END_QUERY,
1265 lp_rast_arg_query(pq))) {
1266 if (!lp_setup_flush_and_restart(setup))
1267 goto fail;
1268
1269 if (!lp_scene_bin_everywhere(setup->scene,
1270 LP_RAST_OP_END_QUERY,
1271 lp_rast_arg_query(pq))) {
1272 goto fail;
1273 }
1274 }
1275 }
1276 }
1277 else {
1278 lp_fence_reference(&pq->fence, setup->last_fence);
1279 }
1280
1281 fail:
1282 /* Need to do this now not earlier since it still needs to be marked as
1283 * active when binning it would cause a flush.
1284 */
1285 if (pq->type == PIPE_QUERY_OCCLUSION_COUNTER ||
1286 pq->type == PIPE_QUERY_OCCLUSION_PREDICATE ||
1287 pq->type == PIPE_QUERY_PIPELINE_STATISTICS) {
1288 unsigned i;
1289
1290 /* remove from active binned query list */
1291 for (i = 0; i < setup->active_binned_queries; i++) {
1292 if (setup->active_queries[i] == pq)
1293 break;
1294 }
1295 assert(i < setup->active_binned_queries);
1296 if (i == setup->active_binned_queries)
1297 return;
1298 setup->active_binned_queries--;
1299 setup->active_queries[i] = setup->active_queries[setup->active_binned_queries];
1300 setup->active_queries[setup->active_binned_queries] = NULL;
1301 }
1302 }
1303
1304
1305 boolean
1306 lp_setup_flush_and_restart(struct lp_setup_context *setup)
1307 {
1308 if (0) debug_printf("%s\n", __FUNCTION__);
1309
1310 assert(setup->state == SETUP_ACTIVE);
1311
1312 if (!set_scene_state(setup, SETUP_FLUSHED, __FUNCTION__))
1313 return FALSE;
1314
1315 if (!lp_setup_update_state(setup, TRUE))
1316 return FALSE;
1317
1318 return TRUE;
1319 }
1320
1321