49962af7bb231c72cb5d2728f72af1851fa96bef
[mesa.git] / src / gallium / drivers / llvmpipe / lp_setup.c
1 /**************************************************************************
2 *
3 * Copyright 2007 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /**
29 * Tiling engine.
30 *
31 * Builds per-tile display lists and executes them on calls to
32 * lp_setup_flush().
33 */
34
35 #include <limits.h>
36
37 #include "pipe/p_defines.h"
38 #include "util/u_framebuffer.h"
39 #include "util/u_inlines.h"
40 #include "util/u_memory.h"
41 #include "util/u_pack_color.h"
42 #include "draw/draw_pipe.h"
43 #include "os/os_time.h"
44 #include "lp_context.h"
45 #include "lp_memory.h"
46 #include "lp_scene.h"
47 #include "lp_texture.h"
48 #include "lp_debug.h"
49 #include "lp_fence.h"
50 #include "lp_query.h"
51 #include "lp_rast.h"
52 #include "lp_setup_context.h"
53 #include "lp_screen.h"
54 #include "lp_state.h"
55 #include "state_tracker/sw_winsys.h"
56
57 #include "draw/draw_context.h"
58 #include "draw/draw_vbuf.h"
59
60
/* Forward declarations of static helpers that are defined later in this
 * file.
 */
static boolean set_scene_state( struct lp_setup_context *, enum setup_state,
                                const char *reason);
static boolean try_update_scene_state( struct lp_setup_context *setup );
64
65
66 static void
67 lp_setup_get_empty_scene(struct lp_setup_context *setup)
68 {
69 struct llvmpipe_context *lp = llvmpipe_context(setup->pipe);
70 boolean discard = lp->rasterizer ? lp->rasterizer->rasterizer_discard : FALSE;
71
72 assert(setup->scene == NULL);
73
74 setup->scene_idx++;
75 setup->scene_idx %= Elements(setup->scenes);
76
77 setup->scene = setup->scenes[setup->scene_idx];
78
79 if (setup->scene->fence) {
80 if (LP_DEBUG & DEBUG_SETUP)
81 debug_printf("%s: wait for scene %d\n",
82 __FUNCTION__, setup->scene->fence->id);
83
84 lp_fence_wait(setup->scene->fence);
85 }
86
87 lp_scene_begin_binning(setup->scene, &setup->fb, discard);
88
89 }
90
91
92 static void
93 first_triangle( struct lp_setup_context *setup,
94 const float (*v0)[4],
95 const float (*v1)[4],
96 const float (*v2)[4])
97 {
98 assert(setup->state == SETUP_ACTIVE);
99 lp_setup_choose_triangle( setup );
100 setup->triangle( setup, v0, v1, v2 );
101 }
102
103 static void
104 first_line( struct lp_setup_context *setup,
105 const float (*v0)[4],
106 const float (*v1)[4])
107 {
108 assert(setup->state == SETUP_ACTIVE);
109 lp_setup_choose_line( setup );
110 setup->line( setup, v0, v1 );
111 }
112
113 static void
114 first_point( struct lp_setup_context *setup,
115 const float (*v0)[4])
116 {
117 assert(setup->state == SETUP_ACTIVE);
118 lp_setup_choose_point( setup );
119 setup->point( setup, v0 );
120 }
121
122 void lp_setup_reset( struct lp_setup_context *setup )
123 {
124 unsigned i;
125
126 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
127
128 /* Reset derived state */
129 for (i = 0; i < Elements(setup->constants); ++i) {
130 setup->constants[i].stored_size = 0;
131 setup->constants[i].stored_data = NULL;
132 }
133 setup->fs.stored = NULL;
134 setup->dirty = ~0;
135
136 /* no current bin */
137 setup->scene = NULL;
138
139 /* Reset some state:
140 */
141 memset(&setup->clear, 0, sizeof setup->clear);
142
143 /* Have an explicit "start-binning" call and get rid of this
144 * pointer twiddling?
145 */
146 setup->line = first_line;
147 setup->point = first_point;
148 setup->triangle = first_triangle;
149 }
150
151
152 /** Rasterize all scene's bins */
153 static void
154 lp_setup_rasterize_scene( struct lp_setup_context *setup )
155 {
156 struct lp_scene *scene = setup->scene;
157 struct llvmpipe_screen *screen = llvmpipe_screen(scene->pipe->screen);
158
159 scene->num_active_queries = setup->active_binned_queries;
160 memcpy(scene->active_queries, setup->active_queries,
161 scene->num_active_queries * sizeof(scene->active_queries[0]));
162
163 lp_scene_end_binning(scene);
164
165 lp_fence_reference(&setup->last_fence, scene->fence);
166
167 if (setup->last_fence)
168 setup->last_fence->issued = TRUE;
169
170 pipe_mutex_lock(screen->rast_mutex);
171 lp_rast_queue_scene(screen->rast, scene);
172 lp_rast_finish(screen->rast);
173 pipe_mutex_unlock(screen->rast_mutex);
174
175 lp_scene_end_rasterization(setup->scene);
176 lp_setup_reset( setup );
177
178 LP_DBG(DEBUG_SETUP, "%s done \n", __FUNCTION__);
179 }
180
181
182
183 static boolean
184 begin_binning( struct lp_setup_context *setup )
185 {
186 struct lp_scene *scene = setup->scene;
187 boolean need_zsload = FALSE;
188 boolean ok;
189
190 assert(scene);
191 assert(scene->fence == NULL);
192
193 /* Always create a fence:
194 */
195 scene->fence = lp_fence_create(MAX2(1, setup->num_threads));
196 if (!scene->fence)
197 return FALSE;
198
199 ok = try_update_scene_state(setup);
200 if (!ok)
201 return FALSE;
202
203 if (setup->fb.zsbuf &&
204 ((setup->clear.flags & PIPE_CLEAR_DEPTHSTENCIL) != PIPE_CLEAR_DEPTHSTENCIL) &&
205 util_format_is_depth_and_stencil(setup->fb.zsbuf->format))
206 need_zsload = TRUE;
207
208 LP_DBG(DEBUG_SETUP, "%s color: %s depth: %s\n", __FUNCTION__,
209 (setup->clear.flags & PIPE_CLEAR_COLOR) ? "clear": "load",
210 need_zsload ? "clear": "load");
211
212 if (setup->fb.nr_cbufs) {
213 if (setup->clear.flags & PIPE_CLEAR_COLOR) {
214 ok = lp_scene_bin_everywhere( scene,
215 LP_RAST_OP_CLEAR_COLOR,
216 setup->clear.color );
217 if (!ok)
218 return FALSE;
219 }
220 }
221
222 if (setup->fb.zsbuf) {
223 if (setup->clear.flags & PIPE_CLEAR_DEPTHSTENCIL) {
224 if (!need_zsload)
225 scene->has_depthstencil_clear = TRUE;
226
227 ok = lp_scene_bin_everywhere( scene,
228 LP_RAST_OP_CLEAR_ZSTENCIL,
229 lp_rast_arg_clearzs(
230 setup->clear.zsvalue,
231 setup->clear.zsmask));
232 if (!ok)
233 return FALSE;
234 }
235 }
236
237 setup->clear.flags = 0;
238 setup->clear.zsmask = 0;
239 setup->clear.zsvalue = 0;
240
241 scene->had_queries = !!setup->active_binned_queries;
242
243 LP_DBG(DEBUG_SETUP, "%s done\n", __FUNCTION__);
244 return TRUE;
245 }
246
247
248 /* This basically bins and then flushes any outstanding full-screen
249 * clears.
250 *
251 * TODO: fast path for fullscreen clears and no triangles.
252 */
253 static boolean
254 execute_clears( struct lp_setup_context *setup )
255 {
256 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
257
258 return begin_binning( setup );
259 }
260
/* Human-readable names of the setup states, used for debug output.
 *
 * set_scene_state() indexes this table directly with setup state values, so
 * the entry order presumably mirrors enum setup_state (FLUSHED, CLEARED,
 * ACTIVE) -- confirm against the enum declaration before editing.
 */
const char *states[] = {
   "FLUSHED",
   "CLEARED",
   "ACTIVE "
};
266
267
268 static boolean
269 set_scene_state( struct lp_setup_context *setup,
270 enum setup_state new_state,
271 const char *reason)
272 {
273 unsigned old_state = setup->state;
274
275 if (old_state == new_state)
276 return TRUE;
277
278 if (LP_DEBUG & DEBUG_SCENE) {
279 debug_printf("%s old %s new %s%s%s\n",
280 __FUNCTION__,
281 states[old_state],
282 states[new_state],
283 (new_state == SETUP_FLUSHED) ? ": " : "",
284 (new_state == SETUP_FLUSHED) ? reason : "");
285
286 if (new_state == SETUP_FLUSHED && setup->scene)
287 lp_debug_draw_bins_by_cmd_length(setup->scene);
288 }
289
290 /* wait for a free/empty scene
291 */
292 if (old_state == SETUP_FLUSHED)
293 lp_setup_get_empty_scene(setup);
294
295 switch (new_state) {
296 case SETUP_CLEARED:
297 break;
298
299 case SETUP_ACTIVE:
300 if (!begin_binning( setup ))
301 goto fail;
302 break;
303
304 case SETUP_FLUSHED:
305 if (old_state == SETUP_CLEARED)
306 if (!execute_clears( setup ))
307 goto fail;
308
309 lp_setup_rasterize_scene( setup );
310 assert(setup->scene == NULL);
311 break;
312
313 default:
314 assert(0 && "invalid setup state mode");
315 goto fail;
316 }
317
318 setup->state = new_state;
319 return TRUE;
320
321 fail:
322 if (setup->scene) {
323 lp_scene_end_rasterization(setup->scene);
324 setup->scene = NULL;
325 }
326
327 setup->state = SETUP_FLUSHED;
328 lp_setup_reset( setup );
329 return FALSE;
330 }
331
332
333 void
334 lp_setup_flush( struct lp_setup_context *setup,
335 struct pipe_fence_handle **fence,
336 const char *reason)
337 {
338 set_scene_state( setup, SETUP_FLUSHED, reason );
339
340 if (fence) {
341 lp_fence_reference((struct lp_fence **)fence, setup->last_fence);
342 }
343 }
344
345
346 void
347 lp_setup_bind_framebuffer( struct lp_setup_context *setup,
348 const struct pipe_framebuffer_state *fb )
349 {
350 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
351
352 /* Flush any old scene.
353 */
354 set_scene_state( setup, SETUP_FLUSHED, __FUNCTION__ );
355
356 /*
357 * Ensure the old scene is not reused.
358 */
359 assert(!setup->scene);
360
361 /* Set new state. This will be picked up later when we next need a
362 * scene.
363 */
364 util_copy_framebuffer_state(&setup->fb, fb);
365 setup->framebuffer.x0 = 0;
366 setup->framebuffer.y0 = 0;
367 setup->framebuffer.x1 = fb->width-1;
368 setup->framebuffer.y1 = fb->height-1;
369 setup->dirty |= LP_SETUP_NEW_SCISSOR;
370 }
371
372
373 static boolean
374 lp_setup_try_clear( struct lp_setup_context *setup,
375 const union pipe_color_union *color,
376 double depth,
377 unsigned stencil,
378 unsigned flags )
379 {
380 uint64_t zsmask = 0;
381 uint64_t zsvalue = 0;
382 union lp_rast_cmd_arg color_arg;
383 unsigned i;
384
385 LP_DBG(DEBUG_SETUP, "%s state %d\n", __FUNCTION__, setup->state);
386
387 if (flags & PIPE_CLEAR_COLOR) {
388 for (i = 0; i < 4; i++)
389 color_arg.clear_color.i[i] = color->i[i];
390 }
391
392 if (flags & PIPE_CLEAR_DEPTHSTENCIL) {
393 uint32_t zmask = (flags & PIPE_CLEAR_DEPTH) ? ~0 : 0;
394 uint8_t smask = (flags & PIPE_CLEAR_STENCIL) ? ~0 : 0;
395
396 zsvalue = util_pack64_z_stencil(setup->fb.zsbuf->format,
397 depth,
398 stencil);
399
400
401 zsmask = util_pack64_mask_z_stencil(setup->fb.zsbuf->format,
402 zmask,
403 smask);
404
405 zsvalue &= zsmask;
406 }
407
408 if (setup->state == SETUP_ACTIVE) {
409 struct lp_scene *scene = setup->scene;
410
411 /* Add the clear to existing scene. In the unusual case where
412 * both color and depth-stencil are being cleared when there's
413 * already been some rendering, we could discard the currently
414 * binned scene and start again, but I don't see that as being
415 * a common usage.
416 */
417 if (flags & PIPE_CLEAR_COLOR) {
418 if (!lp_scene_bin_everywhere( scene,
419 LP_RAST_OP_CLEAR_COLOR,
420 color_arg ))
421 return FALSE;
422 }
423
424 if (flags & PIPE_CLEAR_DEPTHSTENCIL) {
425 if (!lp_scene_bin_everywhere( scene,
426 LP_RAST_OP_CLEAR_ZSTENCIL,
427 lp_rast_arg_clearzs(zsvalue, zsmask) ))
428 return FALSE;
429 }
430 }
431 else {
432 /* Put ourselves into the 'pre-clear' state, specifically to try
433 * and accumulate multiple clears to color and depth_stencil
434 * buffers which the app or state-tracker might issue
435 * separately.
436 */
437 set_scene_state( setup, SETUP_CLEARED, __FUNCTION__ );
438
439 setup->clear.flags |= flags;
440
441 if (flags & PIPE_CLEAR_DEPTHSTENCIL) {
442 setup->clear.zsmask |= zsmask;
443 setup->clear.zsvalue =
444 (setup->clear.zsvalue & ~zsmask) | (zsvalue & zsmask);
445 }
446
447 if (flags & PIPE_CLEAR_COLOR) {
448 memcpy(&setup->clear.color.clear_color,
449 &color_arg,
450 sizeof setup->clear.color.clear_color);
451 }
452 }
453
454 return TRUE;
455 }
456
/**
 * Clear the color and/or depth-stencil buffers selected by flags.
 *
 * If the clear cannot be recorded on the first attempt, the current scene
 * is flushed and the clear is attempted once more; a second failure trips
 * an assertion.
 */
void
lp_setup_clear(struct lp_setup_context *setup,
               const union pipe_color_union *color,
               double depth,
               unsigned stencil,
               unsigned flags)
{
   if (lp_setup_try_clear(setup, color, depth, stencil, flags)) {
      return;
   }

   /* First attempt failed: flush and retry. */
   lp_setup_flush(setup, NULL, __FUNCTION__);

   if (!lp_setup_try_clear(setup, color, depth, stencil, flags)) {
      assert(0);
   }
}
471
472
473
474
475
476 void
477 lp_setup_set_triangle_state( struct lp_setup_context *setup,
478 unsigned cull_mode,
479 boolean ccw_is_frontface,
480 boolean scissor,
481 boolean half_pixel_center,
482 boolean bottom_edge_rule)
483 {
484 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
485
486 setup->ccw_is_frontface = ccw_is_frontface;
487 setup->cullmode = cull_mode;
488 setup->triangle = first_triangle;
489 setup->pixel_offset = half_pixel_center ? 0.5f : 0.0f;
490 setup->bottom_edge_rule = bottom_edge_rule;
491
492 if (setup->scissor_test != scissor) {
493 setup->dirty |= LP_SETUP_NEW_SCISSOR;
494 setup->scissor_test = scissor;
495 }
496 }
497
498 void
499 lp_setup_set_line_state( struct lp_setup_context *setup,
500 float line_width)
501 {
502 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
503
504 setup->line_width = line_width;
505 }
506
507 void
508 lp_setup_set_point_state( struct lp_setup_context *setup,
509 float point_size,
510 boolean point_size_per_vertex,
511 uint sprite_coord_enable,
512 uint sprite_coord_origin)
513 {
514 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
515
516 setup->point_size = point_size;
517 setup->sprite_coord_enable = sprite_coord_enable;
518 setup->sprite_coord_origin = sprite_coord_origin;
519 setup->point_size_per_vertex = point_size_per_vertex;
520 }
521
522 void
523 lp_setup_set_setup_variant( struct lp_setup_context *setup,
524 const struct lp_setup_variant *variant)
525 {
526 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
527
528 setup->setup.variant = variant;
529 }
530
531 void
532 lp_setup_set_fs_variant( struct lp_setup_context *setup,
533 struct lp_fragment_shader_variant *variant)
534 {
535 LP_DBG(DEBUG_SETUP, "%s %p\n", __FUNCTION__,
536 variant);
537 /* FIXME: reference count */
538
539 setup->fs.current.variant = variant;
540 setup->dirty |= LP_SETUP_NEW_FS;
541 }
542
543 void
544 lp_setup_set_fs_constants(struct lp_setup_context *setup,
545 unsigned num,
546 struct pipe_constant_buffer *buffers)
547 {
548 unsigned i;
549
550 LP_DBG(DEBUG_SETUP, "%s %p\n", __FUNCTION__, (void *) buffers);
551
552 assert(num <= Elements(setup->constants));
553
554 for (i = 0; i < num; ++i) {
555 util_copy_constant_buffer(&setup->constants[i].current, &buffers[i]);
556 }
557 for (; i < Elements(setup->constants); i++) {
558 util_copy_constant_buffer(&setup->constants[i].current, NULL);
559 }
560 setup->dirty |= LP_SETUP_NEW_CONSTANTS;
561 }
562
563
564 void
565 lp_setup_set_alpha_ref_value( struct lp_setup_context *setup,
566 float alpha_ref_value )
567 {
568 LP_DBG(DEBUG_SETUP, "%s %f\n", __FUNCTION__, alpha_ref_value);
569
570 if(setup->fs.current.jit_context.alpha_ref_value != alpha_ref_value) {
571 setup->fs.current.jit_context.alpha_ref_value = alpha_ref_value;
572 setup->dirty |= LP_SETUP_NEW_FS;
573 }
574 }
575
576 void
577 lp_setup_set_stencil_ref_values( struct lp_setup_context *setup,
578 const ubyte refs[2] )
579 {
580 LP_DBG(DEBUG_SETUP, "%s %d %d\n", __FUNCTION__, refs[0], refs[1]);
581
582 if (setup->fs.current.jit_context.stencil_ref_front != refs[0] ||
583 setup->fs.current.jit_context.stencil_ref_back != refs[1]) {
584 setup->fs.current.jit_context.stencil_ref_front = refs[0];
585 setup->fs.current.jit_context.stencil_ref_back = refs[1];
586 setup->dirty |= LP_SETUP_NEW_FS;
587 }
588 }
589
590 void
591 lp_setup_set_blend_color( struct lp_setup_context *setup,
592 const struct pipe_blend_color *blend_color )
593 {
594 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
595
596 assert(blend_color);
597
598 if(memcmp(&setup->blend_color.current, blend_color, sizeof *blend_color) != 0) {
599 memcpy(&setup->blend_color.current, blend_color, sizeof *blend_color);
600 setup->dirty |= LP_SETUP_NEW_BLEND_COLOR;
601 }
602 }
603
604
605 void
606 lp_setup_set_scissors( struct lp_setup_context *setup,
607 const struct pipe_scissor_state *scissors )
608 {
609 unsigned i;
610 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
611
612 assert(scissors);
613
614 for (i = 0; i < PIPE_MAX_VIEWPORTS; ++i) {
615 setup->scissors[i].x0 = scissors[i].minx;
616 setup->scissors[i].x1 = scissors[i].maxx-1;
617 setup->scissors[i].y0 = scissors[i].miny;
618 setup->scissors[i].y1 = scissors[i].maxy-1;
619 }
620 setup->dirty |= LP_SETUP_NEW_SCISSOR;
621 }
622
623
624 void
625 lp_setup_set_flatshade_first( struct lp_setup_context *setup,
626 boolean flatshade_first )
627 {
628 setup->flatshade_first = flatshade_first;
629 }
630
631 void
632 lp_setup_set_rasterizer_discard( struct lp_setup_context *setup,
633 boolean rasterizer_discard )
634 {
635 if (setup->rasterizer_discard != rasterizer_discard) {
636 setup->rasterizer_discard = rasterizer_discard;
637 set_scene_state( setup, SETUP_FLUSHED, __FUNCTION__ );
638 }
639 }
640
641 void
642 lp_setup_set_vertex_info( struct lp_setup_context *setup,
643 struct vertex_info *vertex_info )
644 {
645 /* XXX: just silently holding onto the pointer:
646 */
647 setup->vertex_info = vertex_info;
648 }
649
650
651 /**
652 * Called during state validation when LP_NEW_VIEWPORT is set.
653 */
654 void
655 lp_setup_set_viewports(struct lp_setup_context *setup,
656 unsigned num_viewports,
657 const struct pipe_viewport_state *viewports)
658 {
659 struct llvmpipe_context *lp = llvmpipe_context(setup->pipe);
660 unsigned i;
661
662 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
663
664 assert(num_viewports <= PIPE_MAX_VIEWPORTS);
665 assert(viewports);
666
667 /*
668 * For use in lp_state_fs.c, propagate the viewport values for all viewports.
669 */
670 for (i = 0; i < num_viewports; i++) {
671 float min_depth;
672 float max_depth;
673
674 if (lp->rasterizer->clip_halfz == 0) {
675 float half_depth = viewports[i].scale[2];
676 min_depth = viewports[i].translate[2] - half_depth;
677 max_depth = min_depth + half_depth * 2.0f;
678 } else {
679 min_depth = viewports[i].translate[2];
680 max_depth = min_depth + viewports[i].scale[2];
681 }
682
683 if (setup->viewports[i].min_depth != min_depth ||
684 setup->viewports[i].max_depth != max_depth) {
685 setup->viewports[i].min_depth = min_depth;
686 setup->viewports[i].max_depth = max_depth;
687 setup->dirty |= LP_SETUP_NEW_VIEWPORTS;
688 }
689 }
690 }
691
692
693 /**
694 * Called during state validation when LP_NEW_SAMPLER_VIEW is set.
695 */
696 void
697 lp_setup_set_fragment_sampler_views(struct lp_setup_context *setup,
698 unsigned num,
699 struct pipe_sampler_view **views)
700 {
701 unsigned i;
702
703 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
704
705 assert(num <= PIPE_MAX_SHADER_SAMPLER_VIEWS);
706
707 for (i = 0; i < PIPE_MAX_SHADER_SAMPLER_VIEWS; i++) {
708 struct pipe_sampler_view *view = i < num ? views[i] : NULL;
709
710 if (view) {
711 struct pipe_resource *res = view->texture;
712 struct llvmpipe_resource *lp_tex = llvmpipe_resource(res);
713 struct lp_jit_texture *jit_tex;
714 jit_tex = &setup->fs.current.jit_context.textures[i];
715
716 /* We're referencing the texture's internal data, so save a
717 * reference to it.
718 */
719 pipe_resource_reference(&setup->fs.current_tex[i], res);
720
721 if (!lp_tex->dt) {
722 /* regular texture - setup array of mipmap level offsets */
723 void *mip_ptr;
724 int j;
725 unsigned first_level = 0;
726 unsigned last_level = 0;
727
728 if (llvmpipe_resource_is_texture(res)) {
729 first_level = view->u.tex.first_level;
730 last_level = view->u.tex.last_level;
731 assert(first_level <= last_level);
732 assert(last_level <= res->last_level);
733
734 /*
735 * The complexity here should no longer be necessary.
736 */
737 mip_ptr = llvmpipe_get_texture_image_all(lp_tex, first_level,
738 LP_TEX_USAGE_READ);
739 jit_tex->base = lp_tex->linear_img.data;
740 }
741 else {
742 mip_ptr = lp_tex->data;
743 jit_tex->base = mip_ptr;
744 }
745
746 if ((LP_PERF & PERF_TEX_MEM) || !mip_ptr) {
747 /* out of memory - use dummy tile memory */
748 /* Note if using PERF_TEX_MEM will also skip tile conversion */
749 jit_tex->base = lp_dummy_tile;
750 jit_tex->width = TILE_SIZE/8;
751 jit_tex->height = TILE_SIZE/8;
752 jit_tex->depth = 1;
753 jit_tex->first_level = 0;
754 jit_tex->last_level = 0;
755 jit_tex->mip_offsets[0] = 0;
756 jit_tex->row_stride[0] = 0;
757 jit_tex->img_stride[0] = 0;
758 }
759 else {
760 jit_tex->width = res->width0;
761 jit_tex->height = res->height0;
762 jit_tex->depth = res->depth0;
763 jit_tex->first_level = first_level;
764 jit_tex->last_level = last_level;
765
766 if (llvmpipe_resource_is_texture(res)) {
767 for (j = first_level; j <= last_level; j++) {
768 mip_ptr = llvmpipe_get_texture_image_all(lp_tex, j,
769 LP_TEX_USAGE_READ);
770 jit_tex->mip_offsets[j] = (uint8_t *)mip_ptr - (uint8_t *)jit_tex->base;
771 /*
772 * could get mip offset directly but need call above to
773 * invoke tiled->linear conversion.
774 */
775 assert(lp_tex->linear_mip_offsets[j] == jit_tex->mip_offsets[j]);
776 jit_tex->row_stride[j] = lp_tex->row_stride[j];
777 jit_tex->img_stride[j] = lp_tex->img_stride[j];
778 }
779
780 if (res->target == PIPE_TEXTURE_1D_ARRAY ||
781 res->target == PIPE_TEXTURE_2D_ARRAY) {
782 /*
783 * For array textures, we don't have first_layer, instead
784 * adjust last_layer (stored as depth) plus the mip level offsets
785 * (as we have mip-first layout can't just adjust base ptr).
786 * XXX For mip levels, could do something similar.
787 */
788 jit_tex->depth = view->u.tex.last_layer - view->u.tex.first_layer + 1;
789 for (j = first_level; j <= last_level; j++) {
790 jit_tex->mip_offsets[j] += view->u.tex.first_layer *
791 lp_tex->img_stride[j];
792 }
793 assert(view->u.tex.first_layer <= view->u.tex.last_layer);
794 assert(view->u.tex.last_layer < res->array_size);
795 }
796 }
797 else {
798 /*
799 * For buffers, we don't have first_element, instead adjust
800 * last_element (stored as width) plus the base pointer.
801 */
802 unsigned view_blocksize = util_format_get_blocksize(view->format);
803 /* probably don't really need to fill that out */
804 jit_tex->mip_offsets[0] = 0;
805 jit_tex->row_stride[0] = 0;
806 jit_tex->row_stride[0] = 0;
807
808 /* everything specified in number of elements here. */
809 jit_tex->width = view->u.buf.last_element - view->u.buf.first_element + 1;
810 jit_tex->base = (uint8_t *)jit_tex->base + view->u.buf.first_element *
811 view_blocksize;
812 /* XXX Unsure if we need to sanitize parameters? */
813 assert(view->u.buf.first_element <= view->u.buf.last_element);
814 assert(view->u.buf.last_element * view_blocksize < res->width0);
815 }
816 }
817 }
818 else {
819 /* display target texture/surface */
820 /*
821 * XXX: Where should this be unmapped?
822 */
823 struct llvmpipe_screen *screen = llvmpipe_screen(res->screen);
824 struct sw_winsys *winsys = screen->winsys;
825 jit_tex->base = winsys->displaytarget_map(winsys, lp_tex->dt,
826 PIPE_TRANSFER_READ);
827 jit_tex->row_stride[0] = lp_tex->row_stride[0];
828 jit_tex->img_stride[0] = lp_tex->img_stride[0];
829 jit_tex->mip_offsets[0] = 0;
830 jit_tex->width = res->width0;
831 jit_tex->height = res->height0;
832 jit_tex->depth = res->depth0;
833 jit_tex->first_level = jit_tex->last_level = 0;
834 assert(jit_tex->base);
835 }
836 }
837 }
838
839 setup->dirty |= LP_SETUP_NEW_FS;
840 }
841
842
843 /**
844 * Called during state validation when LP_NEW_SAMPLER is set.
845 */
846 void
847 lp_setup_set_fragment_sampler_state(struct lp_setup_context *setup,
848 unsigned num,
849 struct pipe_sampler_state **samplers)
850 {
851 unsigned i;
852
853 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
854
855 assert(num <= PIPE_MAX_SAMPLERS);
856
857 for (i = 0; i < PIPE_MAX_SAMPLERS; i++) {
858 const struct pipe_sampler_state *sampler = i < num ? samplers[i] : NULL;
859
860 if (sampler) {
861 struct lp_jit_sampler *jit_sam;
862 jit_sam = &setup->fs.current.jit_context.samplers[i];
863
864 jit_sam->min_lod = sampler->min_lod;
865 jit_sam->max_lod = sampler->max_lod;
866 jit_sam->lod_bias = sampler->lod_bias;
867 COPY_4V(jit_sam->border_color, sampler->border_color.f);
868 }
869 }
870
871 setup->dirty |= LP_SETUP_NEW_FS;
872 }
873
874
875 /**
876 * Is the given texture referenced by any scene?
877 * Note: we have to check all scenes including any scenes currently
878 * being rendered and the current scene being built.
879 */
880 unsigned
881 lp_setup_is_resource_referenced( const struct lp_setup_context *setup,
882 const struct pipe_resource *texture )
883 {
884 unsigned i;
885
886 /* check the render targets */
887 for (i = 0; i < setup->fb.nr_cbufs; i++) {
888 if (setup->fb.cbufs[i]->texture == texture)
889 return LP_REFERENCED_FOR_READ | LP_REFERENCED_FOR_WRITE;
890 }
891 if (setup->fb.zsbuf && setup->fb.zsbuf->texture == texture) {
892 return LP_REFERENCED_FOR_READ | LP_REFERENCED_FOR_WRITE;
893 }
894
895 /* check textures referenced by the scene */
896 for (i = 0; i < Elements(setup->scenes); i++) {
897 if (lp_scene_is_resource_referenced(setup->scenes[i], texture)) {
898 return LP_REFERENCED_FOR_READ;
899 }
900 }
901
902 return LP_UNREFERENCED;
903 }
904
905
/**
 * Called by vbuf code when we're about to draw something.
 *
 * This function stores all dirty state in the current scene's display list
 * memory, via lp_scene_alloc().  We can not pass pointers of mutable state to
 * the JIT functions, as the JIT functions will be called later on, most likely
 * on a different thread.
 *
 * When processing dirty state it is imperative that we don't refer to any
 * pointers previously allocated with lp_scene_alloc() in this function (or any
 * function) as they may belong to a scene freed since then.
 *
 * Within this file it is called from begin_binning() and
 * lp_setup_update_state().
 *
 * \return TRUE when all dirty state has been processed; setup->dirty is
 *         cleared only in that case. FALSE as soon as a scene allocation
 *         or a resource reference fails, in which case the dirty flags are
 *         left set.
 */
static boolean
try_update_scene_state( struct lp_setup_context *setup )
{
   /* No fragment shader state stored yet: treated as a new scene, for
    * which the asserts below expect every allocation to succeed.
    */
   boolean new_scene = (setup->fs.stored == NULL);
   struct lp_scene *scene = setup->scene;
   unsigned i;

   assert(scene);

   if (setup->dirty & LP_SETUP_NEW_VIEWPORTS) {
      /*
       * Record new depth range state for changes due to viewport updates.
       *
       * TODO: Collapse the existing viewport and depth range information
       *       into one structure, for access by JIT.
       */
      struct lp_jit_viewport *stored;

      stored = (struct lp_jit_viewport *)
         lp_scene_alloc(scene, sizeof setup->viewports);

      if (!stored) {
         assert(!new_scene);
         return FALSE;
      }

      memcpy(stored, setup->viewports, sizeof setup->viewports);

      /* The JIT context changed, so the fs state must be re-stored too. */
      setup->fs.current.jit_context.viewports = stored;
      setup->dirty |= LP_SETUP_NEW_FS;
   }

   if(setup->dirty & LP_SETUP_NEW_BLEND_COLOR) {
      uint8_t *stored;
      float* fstored;
      /* Note: this 'i' shadows the function-level 'i'. */
      unsigned i, j;
      unsigned size;

      /* Alloc u8_blend_color (16 x i8) and f_blend_color (4 or 8 x f32) */
      size  = 4 * 16 * sizeof(uint8_t);
      size += (LP_MAX_VECTOR_LENGTH / 4) * sizeof(float);
      stored = lp_scene_alloc_aligned(scene, size, LP_MAX_VECTOR_LENGTH);

      if (!stored) {
         assert(!new_scene);
         return FALSE;
      }

      /* Store floating point colour */
      /* The float copy is placed right after the 4*16 byte u8 copy. */
      fstored = (float*)(stored + 4*16);
      for (i = 0; i < (LP_MAX_VECTOR_LENGTH / 4); ++i) {
         fstored[i] = setup->blend_color.current.color[i % 4];
      }

      /* smear each blend color component across 16 ubyte elements */
      for (i = 0; i < 4; ++i) {
         uint8_t c = float_to_ubyte(setup->blend_color.current.color[i]);
         for (j = 0; j < 16; ++j)
            stored[i*16 + j] = c;
      }

      setup->blend_color.stored = stored;
      setup->fs.current.jit_context.u8_blend_color = stored;
      setup->fs.current.jit_context.f_blend_color = fstored;
      setup->dirty |= LP_SETUP_NEW_FS;
   }

   if (setup->dirty & LP_SETUP_NEW_CONSTANTS) {
      for (i = 0; i < Elements(setup->constants); ++i) {
         struct pipe_resource *buffer = setup->constants[i].current.buffer;
         const unsigned current_size = setup->constants[i].current.buffer_size;
         const ubyte *current_data = NULL;

         if (buffer) {
            /* resource buffer */
            current_data = (ubyte *) llvmpipe_resource_data(buffer);
         }
         else if (setup->constants[i].current.user_buffer) {
            /* user-space buffer */
            current_data = (ubyte *) setup->constants[i].current.user_buffer;
         }

         if (current_data) {
            current_data += setup->constants[i].current.buffer_offset;

            /* TODO: copy only the actually used constants? */

            /* Copy into the scene only when nothing is stored yet or the
             * stored copy differs in size or contents.
             */
            if (setup->constants[i].stored_size != current_size ||
               !setup->constants[i].stored_data ||
               memcmp(setup->constants[i].stored_data,
                      current_data,
                      current_size) != 0) {
               void *stored;

               stored = lp_scene_alloc(scene, current_size);
               if (!stored) {
                  assert(!new_scene);
                  return FALSE;
               }

               memcpy(stored,
                      current_data,
                      current_size);
               setup->constants[i].stored_size = current_size;
               setup->constants[i].stored_data = stored;
            }
         }
         else {
            /* Nothing bound in this slot. */
            setup->constants[i].stored_size = 0;
            setup->constants[i].stored_data = NULL;
         }

         setup->fs.current.jit_context.constants[i] = setup->constants[i].stored_data;
         setup->dirty |= LP_SETUP_NEW_FS;
      }
   }


   if (setup->dirty & LP_SETUP_NEW_FS) {
      if (!setup->fs.stored ||
          memcmp(setup->fs.stored,
                 &setup->fs.current,
                 sizeof setup->fs.current) != 0)
      {
         struct lp_rast_state *stored;

         /* The fs state that's been stored in the scene is different from
          * the new, current state.  So allocate a new lp_rast_state object
          * and append it to the bin's setup data buffer.
          */
         stored = (struct lp_rast_state *) lp_scene_alloc(scene, sizeof *stored);
         if (!stored) {
            assert(!new_scene);
            return FALSE;
         }

         memcpy(stored,
                &setup->fs.current,
                sizeof setup->fs.current);
         setup->fs.stored = stored;

         /* The scene now references the textures in the rasterization
          * state record.  Note that now.
          */
         for (i = 0; i < Elements(setup->fs.current_tex); i++) {
            if (setup->fs.current_tex[i]) {
               if (!lp_scene_add_resource_reference(scene,
                                                    setup->fs.current_tex[i],
                                                    new_scene)) {
                  assert(!new_scene);
                  return FALSE;
               }
            }
         }
      }
   }

   if (setup->dirty & LP_SETUP_NEW_SCISSOR) {
      /* Note: this 'i' shadows the function-level 'i'. */
      unsigned i;
      /* Each draw region starts out as the whole framebuffer and is
       * combined with the viewport's scissor rectangle when scissoring is
       * enabled.
       */
      for (i = 0; i < PIPE_MAX_VIEWPORTS; ++i) {
         setup->draw_regions[i] = setup->framebuffer;
         if (setup->scissor_test) {
            u_rect_possible_intersection(&setup->scissors[i],
                                         &setup->draw_regions[i]);
         }
      }
      /*
       * Subdivide triangles if the framebuffer is larger than the
       * MAX_FIXED_LENGTH.
       */
      setup->subdivide_large_triangles = (setup->fb.width > MAX_FIXED_LENGTH ||
                                          setup->fb.height > MAX_FIXED_LENGTH);
   }

   /* Everything has been processed. */
   setup->dirty = 0;

   assert(setup->fs.stored);
   return TRUE;
}
1097
1098 boolean
1099 lp_setup_update_state( struct lp_setup_context *setup,
1100 boolean update_scene )
1101 {
1102 /* Some of the 'draw' pipeline stages may have changed some driver state.
1103 * Make sure we've processed those state changes before anything else.
1104 *
1105 * XXX this is the only place where llvmpipe_context is used in the
1106 * setup code. This may get refactored/changed...
1107 */
1108 {
1109 struct llvmpipe_context *lp = llvmpipe_context(setup->pipe);
1110 if (lp->dirty) {
1111 llvmpipe_update_derived(lp);
1112 }
1113
1114 if (lp->setup->dirty) {
1115 llvmpipe_update_setup(lp);
1116 }
1117
1118 assert(setup->setup.variant);
1119
1120 /* Will probably need to move this somewhere else, just need
1121 * to know about vertex shader point size attribute.
1122 */
1123 setup->psize = lp->psize_slot;
1124 setup->viewport_index_slot = lp->viewport_index_slot;
1125 setup->layer_slot = lp->layer_slot;
1126 setup->face_slot = lp->face_slot;
1127
1128 assert(lp->dirty == 0);
1129
1130 assert(lp->setup_variant.key.size ==
1131 setup->setup.variant->key.size);
1132
1133 assert(memcmp(&lp->setup_variant.key,
1134 &setup->setup.variant->key,
1135 setup->setup.variant->key.size) == 0);
1136 }
1137
1138 if (update_scene && setup->state != SETUP_ACTIVE) {
1139 if (!set_scene_state( setup, SETUP_ACTIVE, __FUNCTION__ ))
1140 return FALSE;
1141 }
1142
1143 /* Only call into update_scene_state() if we already have a
1144 * scene:
1145 */
1146 if (update_scene && setup->scene) {
1147 assert(setup->state == SETUP_ACTIVE);
1148
1149 if (try_update_scene_state(setup))
1150 return TRUE;
1151
1152 /* Update failed, try to restart the scene.
1153 *
1154 * Cannot call lp_setup_flush_and_restart() directly here
1155 * because of potential recursion.
1156 */
1157 if (!set_scene_state(setup, SETUP_FLUSHED, __FUNCTION__))
1158 return FALSE;
1159
1160 if (!set_scene_state(setup, SETUP_ACTIVE, __FUNCTION__))
1161 return FALSE;
1162
1163 if (!setup->scene)
1164 return FALSE;
1165
1166 return try_update_scene_state(setup);
1167 }
1168
1169 return TRUE;
1170 }
1171
1172
1173
1174 /* Only caller is lp_setup_vbuf_destroy()
1175 */
1176 void
1177 lp_setup_destroy( struct lp_setup_context *setup )
1178 {
1179 uint i;
1180
1181 lp_setup_reset( setup );
1182
1183 util_unreference_framebuffer_state(&setup->fb);
1184
1185 for (i = 0; i < Elements(setup->fs.current_tex); i++) {
1186 pipe_resource_reference(&setup->fs.current_tex[i], NULL);
1187 }
1188
1189 for (i = 0; i < Elements(setup->constants); i++) {
1190 pipe_resource_reference(&setup->constants[i].current.buffer, NULL);
1191 }
1192
1193 /* free the scenes in the 'empty' queue */
1194 for (i = 0; i < Elements(setup->scenes); i++) {
1195 struct lp_scene *scene = setup->scenes[i];
1196
1197 if (scene->fence)
1198 lp_fence_wait(scene->fence);
1199
1200 lp_scene_destroy(scene);
1201 }
1202
1203 lp_fence_reference(&setup->last_fence, NULL);
1204
1205 FREE( setup );
1206 }
1207
1208
1209 /**
1210 * Create a new primitive tiling engine. Plug it into the backend of
1211 * the draw module. Currently also creates a rasterizer to use with
1212 * it.
1213 */
1214 struct lp_setup_context *
1215 lp_setup_create( struct pipe_context *pipe,
1216 struct draw_context *draw )
1217 {
1218 struct llvmpipe_screen *screen = llvmpipe_screen(pipe->screen);
1219 struct lp_setup_context *setup;
1220 unsigned i;
1221
1222 setup = CALLOC_STRUCT(lp_setup_context);
1223 if (!setup) {
1224 goto no_setup;
1225 }
1226
1227 lp_setup_init_vbuf(setup);
1228
1229 /* Used only in update_state():
1230 */
1231 setup->pipe = pipe;
1232
1233
1234 setup->num_threads = screen->num_threads;
1235 setup->vbuf = draw_vbuf_stage(draw, &setup->base);
1236 if (!setup->vbuf) {
1237 goto no_vbuf;
1238 }
1239
1240 draw_set_rasterize_stage(draw, setup->vbuf);
1241 draw_set_render(draw, &setup->base);
1242
1243 /* create some empty scenes */
1244 for (i = 0; i < MAX_SCENES; i++) {
1245 setup->scenes[i] = lp_scene_create( pipe );
1246 if (!setup->scenes[i]) {
1247 goto no_scenes;
1248 }
1249 }
1250
1251 setup->triangle = first_triangle;
1252 setup->line = first_line;
1253 setup->point = first_point;
1254
1255 setup->dirty = ~0;
1256
1257 return setup;
1258
1259 no_scenes:
1260 for (i = 0; i < MAX_SCENES; i++) {
1261 if (setup->scenes[i]) {
1262 lp_scene_destroy(setup->scenes[i]);
1263 }
1264 }
1265
1266 setup->vbuf->destroy(setup->vbuf);
1267 no_vbuf:
1268 FREE(setup);
1269 no_setup:
1270 return NULL;
1271 }
1272
1273
1274 /**
1275 * Put a BeginQuery command into all bins.
1276 */
1277 void
1278 lp_setup_begin_query(struct lp_setup_context *setup,
1279 struct llvmpipe_query *pq)
1280 {
1281
1282 set_scene_state(setup, SETUP_ACTIVE, "begin_query");
1283
1284 if (!(pq->type == PIPE_QUERY_OCCLUSION_COUNTER ||
1285 pq->type == PIPE_QUERY_OCCLUSION_PREDICATE ||
1286 pq->type == PIPE_QUERY_PIPELINE_STATISTICS))
1287 return;
1288
1289 /* init the query to its beginning state */
1290 assert(setup->active_binned_queries < LP_MAX_ACTIVE_BINNED_QUERIES);
1291 /* exceeding list size so just ignore the query */
1292 if (setup->active_binned_queries >= LP_MAX_ACTIVE_BINNED_QUERIES) {
1293 return;
1294 }
1295 assert(setup->active_queries[setup->active_binned_queries] == NULL);
1296 setup->active_queries[setup->active_binned_queries] = pq;
1297 setup->active_binned_queries++;
1298
1299 assert(setup->scene);
1300 if (setup->scene) {
1301 if (!lp_scene_bin_everywhere(setup->scene,
1302 LP_RAST_OP_BEGIN_QUERY,
1303 lp_rast_arg_query(pq))) {
1304
1305 if (!lp_setup_flush_and_restart(setup))
1306 return;
1307
1308 if (!lp_scene_bin_everywhere(setup->scene,
1309 LP_RAST_OP_BEGIN_QUERY,
1310 lp_rast_arg_query(pq))) {
1311 return;
1312 }
1313 }
1314 setup->scene->had_queries |= TRUE;
1315 }
1316 }
1317
1318
1319 /**
1320 * Put an EndQuery command into all bins.
1321 */
1322 void
1323 lp_setup_end_query(struct lp_setup_context *setup, struct llvmpipe_query *pq)
1324 {
1325 set_scene_state(setup, SETUP_ACTIVE, "end_query");
1326
1327 assert(setup->scene);
1328 if (setup->scene) {
1329 /* pq->fence should be the fence of the *last* scene which
1330 * contributed to the query result.
1331 */
1332 lp_fence_reference(&pq->fence, setup->scene->fence);
1333
1334 if (pq->type == PIPE_QUERY_OCCLUSION_COUNTER ||
1335 pq->type == PIPE_QUERY_OCCLUSION_PREDICATE ||
1336 pq->type == PIPE_QUERY_PIPELINE_STATISTICS ||
1337 pq->type == PIPE_QUERY_TIMESTAMP) {
1338 if (pq->type == PIPE_QUERY_TIMESTAMP &&
1339 !(setup->scene->tiles_x | setup->scene->tiles_y)) {
1340 /*
1341 * If there's a zero width/height framebuffer, there's no bins and
1342 * hence no rast task is ever run. So fill in something here instead.
1343 */
1344 pq->end[0] = os_time_get_nano();
1345 }
1346
1347 if (!lp_scene_bin_everywhere(setup->scene,
1348 LP_RAST_OP_END_QUERY,
1349 lp_rast_arg_query(pq))) {
1350 if (!lp_setup_flush_and_restart(setup))
1351 goto fail;
1352
1353 if (!lp_scene_bin_everywhere(setup->scene,
1354 LP_RAST_OP_END_QUERY,
1355 lp_rast_arg_query(pq))) {
1356 goto fail;
1357 }
1358 }
1359 setup->scene->had_queries |= TRUE;
1360 }
1361 }
1362 else {
1363 lp_fence_reference(&pq->fence, setup->last_fence);
1364 }
1365
1366 fail:
1367 /* Need to do this now not earlier since it still needs to be marked as
1368 * active when binning it would cause a flush.
1369 */
1370 if (pq->type == PIPE_QUERY_OCCLUSION_COUNTER ||
1371 pq->type == PIPE_QUERY_OCCLUSION_PREDICATE ||
1372 pq->type == PIPE_QUERY_PIPELINE_STATISTICS) {
1373 unsigned i;
1374
1375 /* remove from active binned query list */
1376 for (i = 0; i < setup->active_binned_queries; i++) {
1377 if (setup->active_queries[i] == pq)
1378 break;
1379 }
1380 assert(i < setup->active_binned_queries);
1381 if (i == setup->active_binned_queries)
1382 return;
1383 setup->active_binned_queries--;
1384 setup->active_queries[i] = setup->active_queries[setup->active_binned_queries];
1385 setup->active_queries[setup->active_binned_queries] = NULL;
1386 }
1387 }
1388
1389
1390 boolean
1391 lp_setup_flush_and_restart(struct lp_setup_context *setup)
1392 {
1393 if (0) debug_printf("%s\n", __FUNCTION__);
1394
1395 assert(setup->state == SETUP_ACTIVE);
1396
1397 if (!set_scene_state(setup, SETUP_FLUSHED, __FUNCTION__))
1398 return FALSE;
1399
1400 if (!lp_setup_update_state(setup, TRUE))
1401 return FALSE;
1402
1403 return TRUE;
1404 }
1405
1406