82c006d78b0b35331b5e4b28b029198e69185b80
1 /**************************************************************************
3 * Copyright 2009 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
29 #include "util/u_memory.h"
30 #include "util/u_math.h"
31 #include "util/u_cpu_detect.h"
32 #include "util/u_surface.h"
34 #include "lp_scene_queue.h"
39 #include "lp_rast_priv.h"
40 #include "lp_tile_soa.h"
41 #include "gallivm/lp_bld_debug.h"
46 * Begin the rasterization phase.
47 * Map the framebuffer surfaces. Initialize the 'rast' state.
50 lp_rast_begin( struct lp_rasterizer
*rast
,
51 const struct pipe_framebuffer_state
*fb
,
53 boolean write_zstencil
)
55 struct pipe_screen
*screen
= rast
->screen
;
56 struct pipe_surface
*cbuf
, *zsbuf
;
59 LP_DBG(DEBUG_RAST
, "%s\n", __FUNCTION__
);
61 util_copy_framebuffer_state(&rast
->state
.fb
, fb
);
63 rast
->state
.write_zstencil
= write_zstencil
;
64 rast
->state
.write_color
= write_color
;
66 rast
->check_for_clipped_tiles
= (fb
->width
% TILE_SIZE
!= 0 ||
67 fb
->height
% TILE_SIZE
!= 0);
70 for (i
= 0; i
< rast
->state
.fb
.nr_cbufs
; i
++) {
71 cbuf
= rast
->state
.fb
.cbufs
[i
];
73 rast
->cbuf_transfer
[i
] = screen
->get_tex_transfer(rast
->screen
,
78 PIPE_TRANSFER_READ_WRITE
,
82 if (!rast
->cbuf_transfer
[i
])
85 rast
->cbuf_map
[i
] = screen
->transfer_map(rast
->screen
,
86 rast
->cbuf_transfer
[i
]);
87 if (!rast
->cbuf_map
[i
])
92 zsbuf
= rast
->state
.fb
.zsbuf
;
94 rast
->zsbuf_transfer
= screen
->get_tex_transfer(rast
->screen
,
99 PIPE_TRANSFER_READ_WRITE
,
103 if (!rast
->zsbuf_transfer
)
106 rast
->zsbuf_map
= screen
->transfer_map(rast
->screen
,
107 rast
->zsbuf_transfer
);
108 if (!rast
->zsbuf_map
)
115 /* Unmap and release transfers?
122 * Finish the rasterization phase.
123 * Unmap framebuffer surfaces.
126 lp_rast_end( struct lp_rasterizer
*rast
)
128 struct pipe_screen
*screen
= rast
->screen
;
131 for (i
= 0; i
< rast
->state
.fb
.nr_cbufs
; i
++) {
132 if (rast
->cbuf_map
[i
])
133 screen
->transfer_unmap(screen
, rast
->cbuf_transfer
[i
]);
135 if (rast
->cbuf_transfer
[i
])
136 screen
->tex_transfer_destroy(rast
->cbuf_transfer
[i
]);
138 rast
->cbuf_transfer
[i
] = NULL
;
139 rast
->cbuf_map
[i
] = NULL
;
143 screen
->transfer_unmap(screen
, rast
->zsbuf_transfer
);
145 if (rast
->zsbuf_transfer
)
146 screen
->tex_transfer_destroy(rast
->zsbuf_transfer
);
148 rast
->zsbuf_transfer
= NULL
;
149 rast
->zsbuf_map
= NULL
;
154 * Begining rasterization of a tile.
155 * \param x window X position of the tile, in pixels
156 * \param y window Y position of the tile, in pixels
159 lp_rast_start_tile(struct lp_rasterizer_task
*task
,
160 unsigned x
, unsigned y
)
162 LP_DBG(DEBUG_RAST
, "%s %d,%d\n", __FUNCTION__
, x
, y
);
170 * Clear the rasterizer's current color tile.
171 * This is a bin command called during bin processing.
174 lp_rast_clear_color(struct lp_rasterizer_task
*task
,
175 const union lp_rast_cmd_arg arg
)
177 struct lp_rasterizer
*rast
= task
->rast
;
178 const uint8_t *clear_color
= arg
.clear_color
;
179 uint8_t **color_tile
= task
->tile
.color
;
182 LP_DBG(DEBUG_RAST
, "%s 0x%x,0x%x,0x%x,0x%x\n", __FUNCTION__
,
188 if (clear_color
[0] == clear_color
[1] &&
189 clear_color
[1] == clear_color
[2] &&
190 clear_color
[2] == clear_color
[3]) {
191 /* clear to grayscale value {x, x, x, x} */
192 for (i
= 0; i
< rast
->state
.fb
.nr_cbufs
; i
++) {
193 memset(color_tile
[i
], clear_color
[0], TILE_SIZE
* TILE_SIZE
* 4);
198 * Note: if the swizzled tile layout changes (see TILE_PIXEL) this code
199 * will need to change. It'll be pretty obvious when clearing no longer
202 const unsigned chunk
= TILE_SIZE
/ 4;
203 for (i
= 0; i
< rast
->state
.fb
.nr_cbufs
; i
++) {
204 uint8_t *c
= color_tile
[i
];
206 for (j
= 0; j
< 4 * TILE_SIZE
; j
++) {
207 memset(c
, clear_color
[0], chunk
);
209 memset(c
, clear_color
[1], chunk
);
211 memset(c
, clear_color
[2], chunk
);
213 memset(c
, clear_color
[3], chunk
);
216 assert(c
- color_tile
[i
] == TILE_SIZE
* TILE_SIZE
* 4);
220 LP_COUNT(nr_color_tile_clear
);
225 * Clear the rasterizer's current z/stencil tile.
226 * This is a bin command called during bin processing.
229 lp_rast_clear_zstencil(struct lp_rasterizer_task
*task
,
230 const union lp_rast_cmd_arg arg
)
232 struct lp_rasterizer
*rast
= task
->rast
;
233 const unsigned tile_x
= task
->x
;
234 const unsigned tile_y
= task
->y
;
235 const unsigned height
= TILE_SIZE
/TILE_VECTOR_HEIGHT
;
236 const unsigned width
= TILE_SIZE
*TILE_VECTOR_HEIGHT
;
237 unsigned block_size
= util_format_get_blocksize(rast
->zsbuf_transfer
->texture
->format
);
239 unsigned dst_stride
= rast
->zsbuf_transfer
->stride
*TILE_VECTOR_HEIGHT
;
242 LP_DBG(DEBUG_RAST
, "%s 0x%x\n", __FUNCTION__
, arg
.clear_zstencil
);
244 assert(rast
->zsbuf_map
);
245 if (!rast
->zsbuf_map
)
248 LP_DBG(DEBUG_RAST
, "%s\n", __FUNCTION__
);
251 * Clear the aera of the swizzled depth/depth buffer matching this tile, in
252 * stripes of TILE_VECTOR_HEIGHT x TILE_SIZE at a time.
254 * The swizzled depth format is such that the depths for
255 * TILE_VECTOR_HEIGHT x TILE_VECTOR_WIDTH pixels have consecutive offsets.
258 dst
= lp_rast_depth_pointer(rast
, tile_x
, tile_y
);
260 switch (block_size
) {
262 memset(dst
, (uint8_t) arg
.clear_zstencil
, height
* width
);
265 for (i
= 0; i
< height
; i
++) {
266 uint16_t *row
= (uint16_t *)dst
;
267 for (j
= 0; j
< width
; j
++)
268 *row
++ = (uint16_t) arg
.clear_zstencil
;
273 for (i
= 0; i
< height
; i
++) {
274 uint32_t *row
= (uint32_t *)dst
;
275 for (j
= 0; j
< width
; j
++)
276 *row
++ = arg
.clear_zstencil
;
288 * Load tile color from the framebuffer surface.
289 * This is a bin command called during bin processing.
292 lp_rast_load_color(struct lp_rasterizer_task
*task
,
293 const union lp_rast_cmd_arg arg
)
295 struct lp_rasterizer
*rast
= task
->rast
;
296 const unsigned x
= task
->x
, y
= task
->y
;
299 LP_DBG(DEBUG_RAST
, "%s at %u, %u\n", __FUNCTION__
, x
, y
);
301 for (i
= 0; i
< rast
->state
.fb
.nr_cbufs
; i
++) {
302 struct pipe_transfer
*transfer
= rast
->cbuf_transfer
[i
];
306 if (x
>= transfer
->width
|| y
>= transfer
->height
)
311 assert(w
<= TILE_SIZE
);
312 assert(h
<= TILE_SIZE
);
314 lp_tile_read_4ub(transfer
->texture
->format
,
321 LP_COUNT(nr_color_tile_load
);
327 lp_rast_set_state(struct lp_rasterizer_task
*task
,
328 const union lp_rast_cmd_arg arg
)
330 const struct lp_rast_state
*state
= arg
.set_state
;
332 LP_DBG(DEBUG_RAST
, "%s %p\n", __FUNCTION__
, (void *) state
);
334 /* just set the current state pointer for this rasterizer */
335 task
->current_state
= state
;
341 * Run the shader on all blocks in a tile. This is used when a tile is
342 * completely contained inside a triangle.
343 * This is a bin command called during bin processing.
346 lp_rast_shade_tile(struct lp_rasterizer_task
*task
,
347 const union lp_rast_cmd_arg arg
)
349 struct lp_rasterizer
*rast
= task
->rast
;
350 const struct lp_rast_state
*state
= task
->current_state
;
351 struct lp_rast_tile
*tile
= &task
->tile
;
352 const struct lp_rast_shader_inputs
*inputs
= arg
.shade_tile
;
353 const unsigned tile_x
= task
->x
, tile_y
= task
->y
;
356 LP_DBG(DEBUG_RAST
, "%s\n", __FUNCTION__
);
358 /* render the whole 64x64 tile in 4x4 chunks */
359 for (y
= 0; y
< TILE_SIZE
; y
+= 4){
360 for (x
= 0; x
< TILE_SIZE
; x
+= 4) {
361 uint8_t *color
[PIPE_MAX_COLOR_BUFS
];
363 unsigned block_offset
, i
;
365 /* offset of the 16x16 pixel block within the tile */
366 block_offset
= ((y
/ 4) * (16 * 16) + (x
/ 4) * 16);
369 for (i
= 0; i
< rast
->state
.fb
.nr_cbufs
; i
++)
370 color
[i
] = tile
->color
[i
] + 4 * block_offset
;
373 depth
= lp_rast_depth_pointer(rast
, tile_x
+ x
, tile_y
+ y
);
376 state
->jit_function
[0]( &state
->jit_context
,
377 tile_x
+ x
, tile_y
+ y
,
383 INT_MIN
, INT_MIN
, INT_MIN
,
391 * Compute shading for a 4x4 block of pixels.
392 * This is a bin command called during bin processing.
394 void lp_rast_shade_quads( struct lp_rasterizer_task
*task
,
395 const struct lp_rast_shader_inputs
*inputs
,
396 unsigned x
, unsigned y
,
397 int32_t c1
, int32_t c2
, int32_t c3
)
399 const struct lp_rast_state
*state
= task
->current_state
;
400 struct lp_rasterizer
*rast
= task
->rast
;
401 struct lp_rast_tile
*tile
= &task
->tile
;
402 uint8_t *color
[PIPE_MAX_COLOR_BUFS
];
412 assert(x
% TILE_VECTOR_WIDTH
== 0);
413 assert(y
% TILE_VECTOR_HEIGHT
== 0);
415 assert((x
% 4) == 0);
416 assert((y
% 4) == 0);
422 /* offset of the 16x16 pixel block within the tile */
423 block_offset
= ((iy
/ 4) * (16 * 16) + (ix
/ 4) * 16);
426 for (i
= 0; i
< rast
->state
.fb
.nr_cbufs
; i
++)
427 color
[i
] = tile
->color
[i
] + 4 * block_offset
;
430 depth
= lp_rast_depth_pointer(rast
, x
, y
);
435 assert(lp_check_alignment(tile
->color
[0], 16));
436 assert(lp_check_alignment(state
->jit_context
.blend_color
, 16));
438 assert(lp_check_alignment(inputs
->step
[0], 16));
439 assert(lp_check_alignment(inputs
->step
[1], 16));
440 assert(lp_check_alignment(inputs
->step
[2], 16));
444 state
->jit_function
[1]( &state
->jit_context
,
452 inputs
->step
[0], inputs
->step
[1], inputs
->step
[2]);
457 * Set top row and left column of the tile's pixels to white. For debugging.
460 outline_tile(uint8_t *tile
)
462 const uint8_t val
= 0xff;
465 for (i
= 0; i
< TILE_SIZE
; i
++) {
466 TILE_PIXEL(tile
, i
, 0, 0) = val
;
467 TILE_PIXEL(tile
, i
, 0, 1) = val
;
468 TILE_PIXEL(tile
, i
, 0, 2) = val
;
469 TILE_PIXEL(tile
, i
, 0, 3) = val
;
471 TILE_PIXEL(tile
, 0, i
, 0) = val
;
472 TILE_PIXEL(tile
, 0, i
, 1) = val
;
473 TILE_PIXEL(tile
, 0, i
, 2) = val
;
474 TILE_PIXEL(tile
, 0, i
, 3) = val
;
480 * Draw grid of gray lines at 16-pixel intervals across the tile to
481 * show the sub-tile boundaries. For debugging.
484 outline_subtiles(uint8_t *tile
)
486 const uint8_t val
= 0x80;
487 const unsigned step
= 16;
490 for (i
= 0; i
< TILE_SIZE
; i
+= step
) {
491 for (j
= 0; j
< TILE_SIZE
; j
++) {
492 TILE_PIXEL(tile
, i
, j
, 0) = val
;
493 TILE_PIXEL(tile
, i
, j
, 1) = val
;
494 TILE_PIXEL(tile
, i
, j
, 2) = val
;
495 TILE_PIXEL(tile
, i
, j
, 3) = val
;
497 TILE_PIXEL(tile
, j
, i
, 0) = val
;
498 TILE_PIXEL(tile
, j
, i
, 1) = val
;
499 TILE_PIXEL(tile
, j
, i
, 2) = val
;
500 TILE_PIXEL(tile
, j
, i
, 3) = val
;
510 * Write the rasterizer's color tile to the framebuffer.
513 lp_rast_store_color(struct lp_rasterizer_task
*task
)
515 struct lp_rasterizer
*rast
= task
->rast
;
516 const unsigned x
= task
->x
, y
= task
->y
;
519 for (i
= 0; i
< rast
->state
.fb
.nr_cbufs
; i
++) {
520 struct pipe_transfer
*transfer
= rast
->cbuf_transfer
[i
];
524 if (x
>= transfer
->width
)
527 if (y
>= transfer
->height
)
530 LP_DBG(DEBUG_RAST
, "%s [%u] %d,%d %dx%d\n", __FUNCTION__
,
531 task
->thread_index
, x
, y
, w
, h
);
533 if (LP_DEBUG
& DEBUG_SHOW_SUBTILES
)
534 outline_subtiles(task
->tile
.color
[i
]);
535 else if (LP_DEBUG
& DEBUG_SHOW_TILES
)
536 outline_tile(task
->tile
.color
[i
]);
538 lp_tile_write_4ub(transfer
->texture
->format
,
545 LP_COUNT(nr_color_tile_store
);
551 * Write the rasterizer's tiles to the framebuffer.
554 lp_rast_end_tile(struct lp_rasterizer_task
*task
)
556 struct lp_rasterizer
*rast
= task
->rast
;
558 LP_DBG(DEBUG_RAST
, "%s\n", __FUNCTION__
);
560 if (rast
->state
.write_color
)
561 lp_rast_store_color(task
);
566 * Signal on a fence. This is called during bin execution/rasterization.
570 lp_rast_fence(struct lp_rasterizer_task
*task
,
571 const union lp_rast_cmd_arg arg
)
573 struct lp_fence
*fence
= arg
.fence
;
575 pipe_mutex_lock( fence
->mutex
);
578 assert(fence
->count
<= fence
->rank
);
580 LP_DBG(DEBUG_RAST
, "%s count=%u rank=%u\n", __FUNCTION__
,
581 fence
->count
, fence
->rank
);
583 pipe_condvar_signal( fence
->signalled
);
585 pipe_mutex_unlock( fence
->mutex
);
590 * When all the threads are done rasterizing a scene, one thread will
591 * call this function to reset the scene and put it onto the empty queue.
594 release_scene( struct lp_rasterizer
*rast
,
595 struct lp_scene
*scene
)
597 util_unreference_framebuffer_state( &scene
->fb
);
599 lp_scene_reset( scene
);
601 assert(lp_scene_is_empty(scene
));
603 lp_scene_enqueue( rast
->empty_scenes
, scene
);
604 rast
->curr_scene
= NULL
;
609 * Rasterize commands for a single bin.
610 * \param x, y position of the bin's tile in the framebuffer
611 * Must be called between lp_rast_begin() and lp_rast_end().
615 rasterize_bin(struct lp_rasterizer_task
*task
,
616 const struct cmd_bin
*bin
,
619 const struct cmd_block_list
*commands
= &bin
->commands
;
620 struct cmd_block
*block
;
623 lp_rast_start_tile( task
, x
, y
);
625 /* simply execute each of the commands in the block list */
626 for (block
= commands
->head
; block
; block
= block
->next
) {
627 for (k
= 0; k
< block
->count
; k
++) {
628 block
->cmd
[k
]( task
, block
->arg
[k
] );
632 lp_rast_end_tile( task
);
636 #define RAST(x) { lp_rast_##x, #x }
645 RAST(clear_zstencil
),
653 debug_bin( const struct cmd_bin
*bin
)
655 const struct cmd_block
*head
= bin
->commands
.head
;
658 for (i
= 0; i
< head
->count
; i
++) {
659 debug_printf("%d: ", i
);
660 for (j
= 0; j
< Elements(cmd_names
); j
++) {
661 if (head
->cmd
[i
] == cmd_names
[j
].cmd
) {
662 debug_printf("%s\n", cmd_names
[j
].name
);
666 if (j
== Elements(cmd_names
))
667 debug_printf("...other\n");
672 /* An empty bin is one that just loads the contents of the tile and
673 * stores them again unchanged. This typically happens when bins have
674 * been flushed for some reason in the middle of a frame, or when
675 * incremental updates are being made to a render target.
677 * Try to avoid doing pointless work in this case.
680 is_empty_bin( const struct cmd_bin
*bin
)
682 const struct cmd_block
*head
= bin
->commands
.head
;
688 /* We emit at most two load-tile commands at the start of the first
689 * command block. In addition we seem to emit a couple of
690 * set-state commands even in empty bins.
692 * As a heuristic, if a bin has more than 4 commands, consider it
695 if (head
->next
!= NULL
||
700 for (i
= 0; i
< head
->count
; i
++)
701 if (head
->cmd
[i
] != lp_rast_load_color
&&
702 head
->cmd
[i
] != lp_rast_set_state
) {
712 * Rasterize/execute all bins within a scene.
716 rasterize_scene(struct lp_rasterizer_task
*task
,
717 struct lp_scene
*scene
,
720 /* loop over scene bins, rasterize each */
724 for (i
= 0; i
< scene
->tiles_x
; i
++) {
725 for (j
= 0; j
< scene
->tiles_y
; j
++) {
726 struct cmd_bin
*bin
= lp_scene_get_bin(scene
, i
, j
);
727 rasterize_bin(task
, bin
, i
* TILE_SIZE
, j
* TILE_SIZE
);
737 while ((bin
= lp_scene_bin_iter_next(scene
, &x
, &y
))) {
738 if (!is_empty_bin( bin
))
739 rasterize_bin(task
, bin
, x
* TILE_SIZE
, y
* TILE_SIZE
);
747 * Called by setup module when it has something for us to render.
750 lp_rasterize_scene( struct lp_rasterizer
*rast
,
751 struct lp_scene
*scene
,
752 const struct pipe_framebuffer_state
*fb
,
755 boolean debug
= false;
757 LP_DBG(DEBUG_SETUP
, "%s\n", __FUNCTION__
);
761 debug_printf("rasterize scene:\n");
762 debug_printf(" data size: %u\n", lp_scene_data_size(scene
));
763 for (y
= 0; y
< scene
->tiles_y
; y
++) {
764 for (x
= 0; x
< scene
->tiles_x
; x
++) {
765 debug_printf(" bin %u, %u size: %u\n", x
, y
,
766 lp_scene_bin_size(scene
, x
, y
));
771 /* save framebuffer state in the bin */
772 util_copy_framebuffer_state(&scene
->fb
, fb
);
773 scene
->write_depth
= write_depth
;
775 if (rast
->num_threads
== 0) {
778 lp_rast_begin( rast
, fb
,
779 fb
->nr_cbufs
!= 0, /* always write color if cbufs present */
780 fb
->zsbuf
!= NULL
&& write_depth
);
782 lp_scene_bin_iter_begin( scene
);
783 rasterize_scene( &rast
->tasks
[0], scene
, write_depth
);
785 release_scene( rast
, scene
);
790 /* threaded rendering! */
793 lp_scene_enqueue( rast
->full_scenes
, scene
);
795 /* signal the threads that there's work to do */
796 for (i
= 0; i
< rast
->num_threads
; i
++) {
797 pipe_semaphore_signal(&rast
->tasks
[i
].work_ready
);
800 /* wait for work to complete */
801 for (i
= 0; i
< rast
->num_threads
; i
++) {
802 pipe_semaphore_wait(&rast
->tasks
[i
].work_done
);
806 LP_DBG(DEBUG_SETUP
, "%s done \n", __FUNCTION__
);
811 * This is the thread's main entrypoint.
812 * It's a simple loop:
815 * 3. signal that we're done
817 static PIPE_THREAD_ROUTINE( thread_func
, init_data
)
819 struct lp_rasterizer_task
*task
= (struct lp_rasterizer_task
*) init_data
;
820 struct lp_rasterizer
*rast
= task
->rast
;
821 boolean debug
= false;
826 debug_printf("thread %d waiting for work\n", task
->thread_index
);
827 pipe_semaphore_wait(&task
->work_ready
);
832 if (task
->thread_index
== 0) {
834 * - get next scene to rasterize
835 * - map the framebuffer surfaces
837 const struct pipe_framebuffer_state
*fb
;
840 rast
->curr_scene
= lp_scene_dequeue( rast
->full_scenes
, TRUE
);
842 lp_scene_bin_iter_begin( rast
->curr_scene
);
844 fb
= &rast
->curr_scene
->fb
;
845 write_depth
= rast
->curr_scene
->write_depth
;
847 lp_rast_begin( rast
, fb
,
849 fb
->zsbuf
!= NULL
&& write_depth
);
852 /* Wait for all threads to get here so that threads[1+] don't
853 * get a null rast->curr_scene pointer.
855 pipe_barrier_wait( &rast
->barrier
);
859 debug_printf("thread %d doing work\n", task
->thread_index
);
860 rasterize_scene(task
,
862 rast
->curr_scene
->write_depth
);
864 /* wait for all threads to finish with this scene */
865 pipe_barrier_wait( &rast
->barrier
);
867 if (task
->thread_index
== 0) {
869 * - release the scene object
870 * - unmap the framebuffer surfaces
872 release_scene( rast
, rast
->curr_scene
);
876 /* signal done with work */
878 debug_printf("thread %d done working\n", task
->thread_index
);
879 pipe_semaphore_signal(&task
->work_done
);
887 * Initialize semaphores and spawn the threads.
890 create_rast_threads(struct lp_rasterizer
*rast
)
894 #ifdef PIPE_OS_WINDOWS
895 /* Multithreading not supported on windows until conditions and barriers are
896 * properly implemented. */
897 rast
->num_threads
= 0;
899 rast
->num_threads
= util_cpu_caps
.nr_cpus
;
900 rast
->num_threads
= debug_get_num_option("LP_NUM_THREADS", rast
->num_threads
);
901 rast
->num_threads
= MIN2(rast
->num_threads
, MAX_THREADS
);
904 /* NOTE: if num_threads is zero, we won't use any threads */
905 for (i
= 0; i
< rast
->num_threads
; i
++) {
906 pipe_semaphore_init(&rast
->tasks
[i
].work_ready
, 0);
907 pipe_semaphore_init(&rast
->tasks
[i
].work_done
, 0);
908 rast
->threads
[i
] = pipe_thread_create(thread_func
,
909 (void *) &rast
->tasks
[i
]);
916 * Create new lp_rasterizer.
917 * \param empty the queue to put empty scenes on after we've finished
920 struct lp_rasterizer
*
921 lp_rast_create( struct pipe_screen
*screen
, struct lp_scene_queue
*empty
)
923 struct lp_rasterizer
*rast
;
926 rast
= CALLOC_STRUCT(lp_rasterizer
);
930 rast
->screen
= screen
;
932 rast
->empty_scenes
= empty
;
933 rast
->full_scenes
= lp_scene_queue_create();
935 for (i
= 0; i
< Elements(rast
->tasks
); i
++) {
936 struct lp_rasterizer_task
*task
= &rast
->tasks
[i
];
938 for (cbuf
= 0; cbuf
< PIPE_MAX_COLOR_BUFS
; cbuf
++ )
939 task
->tile
.color
[cbuf
] = align_malloc(TILE_SIZE
* TILE_SIZE
* 4, 16);
942 task
->thread_index
= i
;
945 create_rast_threads(rast
);
947 /* for synchronizing rasterization threads */
948 pipe_barrier_init( &rast
->barrier
, rast
->num_threads
);
956 void lp_rast_destroy( struct lp_rasterizer
*rast
)
960 util_unreference_framebuffer_state(&rast
->state
.fb
);
962 for (i
= 0; i
< Elements(rast
->tasks
); i
++) {
963 for (cbuf
= 0; cbuf
< PIPE_MAX_COLOR_BUFS
; cbuf
++ )
964 align_free(rast
->tasks
[i
].tile
.color
[cbuf
]);
967 /* Set exit_flag and signal each thread's work_ready semaphore.
968 * Each thread will be woken up, notice that the exit_flag is set and
969 * break out of its main loop. The thread will then exit.
971 rast
->exit_flag
= TRUE
;
972 for (i
= 0; i
< rast
->num_threads
; i
++) {
973 pipe_semaphore_signal(&rast
->tasks
[i
].work_ready
);
976 for (i
= 0; i
< rast
->num_threads
; i
++) {
977 pipe_semaphore_destroy(&rast
->tasks
[i
].work_ready
);
978 pipe_semaphore_destroy(&rast
->tasks
[i
].work_done
);
981 /* for synchronizing rasterization threads */
982 pipe_barrier_destroy( &rast
->barrier
);
988 /** Return number of rasterization threads */
990 lp_rast_get_num_threads( struct lp_rasterizer
*rast
)
992 return rast
->num_threads
;