1 /**************************************************************************
3 * Copyright 2007 Tungsten Graphics, Inc., Cedar Park, Texas.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
30 * Vertex buffer drawing stage.
32 * \author José Fonseca <jrfonsec@tungstengraphics.com>
33 * \author Keith Whitwell <keith@tungstengraphics.com>
37 #include "pipe/p_debug.h"
38 #include "util/u_math.h"
39 #include "util/u_memory.h"
41 #include "draw_vbuf.h"
42 #include "draw_private.h"
43 #include "draw_vertex.h"
44 #include "draw_pipe.h"
45 #include "translate/translate.h"
46 #include "translate/translate_cache.h"
50 * Vertex buffer emit stage.
53 struct draw_stage stage
; /**< This must be first (base class) */
55 struct vbuf_render
*render
;
57 const struct vertex_info
*vinfo
;
59 /** Vertex size in bytes */
62 struct translate
*translate
;
64 /* FIXME: we have no guarantee that 'unsigned' is 32bit */
66 /** Vertices in hardware format */
69 unsigned max_vertices
;
77 /* Cache point size somewhere it's address won't change:
81 struct translate_cache
*cache
;
86 * Basically a cast wrapper.
88 static INLINE
struct vbuf_stage
*
89 vbuf_stage( struct draw_stage
*stage
)
92 return (struct vbuf_stage
*)stage
;
/* Forward declarations: these helpers are used before they are defined. */
static void
vbuf_flush_indices( struct vbuf_stage *vbuf );

static void
vbuf_flush_vertices( struct vbuf_stage *vbuf );

static void
vbuf_alloc_vertices( struct vbuf_stage *vbuf );
101 static INLINE boolean
102 overflow( void *map
, void *ptr
, unsigned bytes
, unsigned bufsz
)
104 unsigned long used
= (unsigned long) ((char *)ptr
- (char *)map
);
105 return (used
+ bytes
) > bufsz
;
110 check_space( struct vbuf_stage
*vbuf
, unsigned nr
)
112 if (vbuf
->nr_vertices
+ nr
> vbuf
->max_vertices
) {
113 vbuf_flush_vertices(vbuf
);
114 vbuf_alloc_vertices(vbuf
);
117 if (vbuf
->nr_indices
+ nr
> vbuf
->max_indices
)
118 vbuf_flush_indices(vbuf
);
125 * Extract the needed fields from post-transformed vertex and emit
126 * a hardware(driver) vertex.
127 * Recall that the vertices are constructed by the 'draw' module and
128 * have a couple of slots at the beginning (1-dword header, 4-dword
129 * clip pos) that we ignore here. We only use the vertex->data[] fields.
132 emit_vertex( struct vbuf_stage
*vbuf
,
133 struct vertex_header
*vertex
)
135 if(vertex
->vertex_id
== UNDEFINED_VERTEX_ID
) {
136 /* Hmm - vertices are emitted one at a time - better make sure
137 * set_buffer is efficient. Consider a special one-shot mode for
140 /* Note: we really do want data[0] here, not data[pos]:
142 vbuf
->translate
->set_buffer(vbuf
->translate
, 0, vertex
->data
[0], 0);
143 vbuf
->translate
->run(vbuf
->translate
, 0, 1, vbuf
->vertex_ptr
);
145 if (0) draw_dump_emitted_vertex(vbuf
->vinfo
, (uint8_t *)vbuf
->vertex_ptr
);
147 vbuf
->vertex_ptr
+= vbuf
->vertex_size
/4;
148 vertex
->vertex_id
= vbuf
->nr_vertices
++;
151 return (ushort
)vertex
->vertex_id
;
156 vbuf_tri( struct draw_stage
*stage
,
157 struct prim_header
*prim
)
159 struct vbuf_stage
*vbuf
= vbuf_stage( stage
);
162 check_space( vbuf
, 3 );
164 for (i
= 0; i
< 3; i
++) {
165 vbuf
->indices
[vbuf
->nr_indices
++] = emit_vertex( vbuf
, prim
->v
[i
] );
171 vbuf_line( struct draw_stage
*stage
,
172 struct prim_header
*prim
)
174 struct vbuf_stage
*vbuf
= vbuf_stage( stage
);
177 check_space( vbuf
, 2 );
179 for (i
= 0; i
< 2; i
++) {
180 vbuf
->indices
[vbuf
->nr_indices
++] = emit_vertex( vbuf
, prim
->v
[i
] );
186 vbuf_point( struct draw_stage
*stage
,
187 struct prim_header
*prim
)
189 struct vbuf_stage
*vbuf
= vbuf_stage( stage
);
191 check_space( vbuf
, 1 );
193 vbuf
->indices
[vbuf
->nr_indices
++] = emit_vertex( vbuf
, prim
->v
[0] );
200 * Set the prim type for subsequent vertices.
201 * This may result in a new vertex size. The existing vbuffer (if any)
202 * will be flushed if needed and a new one allocated.
205 vbuf_set_prim( struct vbuf_stage
*vbuf
, uint prim
)
207 struct translate_key hw_key
;
211 vbuf
->render
->set_primitive(vbuf
->render
, prim
);
213 /* Must do this after set_primitive() above:
215 * XXX: need some state managment to track when this needs to be
216 * recalculated. The driver should tell us whether there was a
219 vbuf
->vinfo
= vbuf
->render
->get_vertex_info(vbuf
->render
);
221 if (vbuf
->vertex_size
!= vbuf
->vinfo
->size
* sizeof(float)) {
222 vbuf_flush_vertices(vbuf
);
223 vbuf
->vertex_size
= vbuf
->vinfo
->size
* sizeof(float);
226 /* Translate from pipeline vertices to hw vertices.
230 for (i
= 0; i
< vbuf
->vinfo
->num_attribs
; i
++) {
231 unsigned emit_sz
= 0;
232 unsigned src_buffer
= 0;
233 unsigned output_format
;
234 unsigned src_offset
= (vbuf
->vinfo
->attrib
[i
].src_index
* 4 * sizeof(float) );
236 switch (vbuf
->vinfo
->attrib
[i
].emit
) {
238 output_format
= PIPE_FORMAT_R32G32B32A32_FLOAT
;
239 emit_sz
= 4 * sizeof(float);
242 output_format
= PIPE_FORMAT_R32G32B32_FLOAT
;
243 emit_sz
= 3 * sizeof(float);
246 output_format
= PIPE_FORMAT_R32G32_FLOAT
;
247 emit_sz
= 2 * sizeof(float);
250 output_format
= PIPE_FORMAT_R32_FLOAT
;
251 emit_sz
= 1 * sizeof(float);
254 output_format
= PIPE_FORMAT_R32_FLOAT
;
255 emit_sz
= 1 * sizeof(float);
260 output_format
= PIPE_FORMAT_B8G8R8A8_UNORM
;
261 emit_sz
= 4 * sizeof(ubyte
);
265 output_format
= PIPE_FORMAT_NONE
;
270 hw_key
.element
[i
].input_format
= PIPE_FORMAT_R32G32B32A32_FLOAT
;
271 hw_key
.element
[i
].input_buffer
= src_buffer
;
272 hw_key
.element
[i
].input_offset
= src_offset
;
273 hw_key
.element
[i
].output_format
= output_format
;
274 hw_key
.element
[i
].output_offset
= dst_offset
;
276 dst_offset
+= emit_sz
;
279 hw_key
.nr_elements
= vbuf
->vinfo
->num_attribs
;
280 hw_key
.output_stride
= vbuf
->vinfo
->size
* 4;
282 /* Don't bother with caching at this stage:
284 if (!vbuf
->translate
||
285 translate_key_compare(&vbuf
->translate
->key
, &hw_key
) != 0)
287 translate_key_sanitize(&hw_key
);
288 vbuf
->translate
= translate_cache_find(vbuf
->cache
, &hw_key
);
290 vbuf
->translate
->set_buffer(vbuf
->translate
, 1, &vbuf
->point_size
, 0);
293 vbuf
->point_size
= vbuf
->stage
.draw
->rasterizer
->point_size
;
295 /* Allocate new buffer?
298 vbuf_alloc_vertices(vbuf
);
303 vbuf_first_tri( struct draw_stage
*stage
,
304 struct prim_header
*prim
)
306 struct vbuf_stage
*vbuf
= vbuf_stage( stage
);
308 vbuf_flush_indices( vbuf
);
309 stage
->tri
= vbuf_tri
;
310 vbuf_set_prim(vbuf
, PIPE_PRIM_TRIANGLES
);
311 stage
->tri( stage
, prim
);
316 vbuf_first_line( struct draw_stage
*stage
,
317 struct prim_header
*prim
)
319 struct vbuf_stage
*vbuf
= vbuf_stage( stage
);
321 vbuf_flush_indices( vbuf
);
322 stage
->line
= vbuf_line
;
323 vbuf_set_prim(vbuf
, PIPE_PRIM_LINES
);
324 stage
->line( stage
, prim
);
329 vbuf_first_point( struct draw_stage
*stage
,
330 struct prim_header
*prim
)
332 struct vbuf_stage
*vbuf
= vbuf_stage( stage
);
334 vbuf_flush_indices( vbuf
);
335 stage
->point
= vbuf_point
;
336 vbuf_set_prim(vbuf
, PIPE_PRIM_POINTS
);
337 stage
->point( stage
, prim
);
342 vbuf_flush_indices( struct vbuf_stage
*vbuf
)
344 if(!vbuf
->nr_indices
)
347 assert((uint
) (vbuf
->vertex_ptr
- vbuf
->vertices
) ==
348 vbuf
->nr_vertices
* vbuf
->vertex_size
/ sizeof(unsigned));
350 vbuf
->render
->draw(vbuf
->render
, vbuf
->indices
, vbuf
->nr_indices
);
352 vbuf
->nr_indices
= 0;
357 * Flush existing vertex buffer and allocate a new one.
359 * XXX: We separate flush-on-index-full and flush-on-vb-full, but may
360 * raise issues uploading vertices if the hardware wants to flush when
364 vbuf_flush_vertices( struct vbuf_stage
*vbuf
)
367 vbuf_flush_indices(vbuf
);
369 /* Reset temporary vertices ids */
370 if(vbuf
->nr_vertices
)
371 draw_reset_vertex_ids( vbuf
->stage
.draw
);
373 /* Free the vertex buffer */
374 vbuf
->render
->release_vertices(vbuf
->render
,
378 vbuf
->max_vertices
= vbuf
->nr_vertices
= 0;
379 vbuf
->vertex_ptr
= vbuf
->vertices
= NULL
;
386 vbuf_alloc_vertices( struct vbuf_stage
*vbuf
)
388 assert(!vbuf
->nr_indices
);
389 assert(!vbuf
->vertices
);
391 /* Allocate a new vertex buffer */
392 vbuf
->max_vertices
= vbuf
->render
->max_vertex_buffer_bytes
/ vbuf
->vertex_size
;
395 vbuf
->max_vertices
= vbuf
->max_vertices
& ~1;
397 /* Must always succeed -- driver gives us a
398 * 'max_vertex_buffer_bytes' which it guarantees it can allocate,
399 * and it will flush itself if necessary to do so. If this does
400 * fail, we are basically without usable hardware.
402 assert(vbuf
->max_vertices
< UNDEFINED_VERTEX_ID
);
404 vbuf
->vertices
= (uint
*) vbuf
->render
->allocate_vertices(vbuf
->render
,
405 (ushort
) vbuf
->vertex_size
,
406 (ushort
) vbuf
->max_vertices
);
407 vbuf
->vertex_ptr
= vbuf
->vertices
;
413 vbuf_flush( struct draw_stage
*stage
, unsigned flags
)
415 struct vbuf_stage
*vbuf
= vbuf_stage( stage
);
417 vbuf_flush_indices( vbuf
);
419 stage
->point
= vbuf_first_point
;
420 stage
->line
= vbuf_first_line
;
421 stage
->tri
= vbuf_first_tri
;
423 if (flags
& DRAW_FLUSH_BACKEND
)
424 vbuf_flush_vertices( vbuf
);
/**
 * Stage callback for resetting the line stipple counter.
 * Currently a no-op.
 */
static void
vbuf_reset_stipple_counter( struct draw_stage *stage )
{
   /* XXX: Need to do something here for hardware with linestipple.
    */
   (void) stage;
}
437 static void vbuf_destroy( struct draw_stage
*stage
)
439 struct vbuf_stage
*vbuf
= vbuf_stage( stage
);
442 align_free( vbuf
->indices
);
445 vbuf
->render
->destroy( vbuf
->render
);
448 translate_cache_destroy(vbuf
->cache
);
455 * Create a new primitive vbuf/render stage.
457 struct draw_stage
*draw_vbuf_stage( struct draw_context
*draw
,
458 struct vbuf_render
*render
)
460 struct vbuf_stage
*vbuf
= CALLOC_STRUCT(vbuf_stage
);
464 vbuf
->stage
.draw
= draw
;
465 vbuf
->stage
.point
= vbuf_first_point
;
466 vbuf
->stage
.line
= vbuf_first_line
;
467 vbuf
->stage
.tri
= vbuf_first_tri
;
468 vbuf
->stage
.flush
= vbuf_flush
;
469 vbuf
->stage
.reset_stipple_counter
= vbuf_reset_stipple_counter
;
470 vbuf
->stage
.destroy
= vbuf_destroy
;
472 vbuf
->render
= render
;
473 vbuf
->max_indices
= MAX2(render
->max_indices
, UNDEFINED_VERTEX_ID
-1);
475 vbuf
->indices
= (ushort
*) align_malloc( vbuf
->max_indices
*
476 sizeof(vbuf
->indices
[0]),
481 vbuf
->cache
= translate_cache_create();
486 vbuf
->vertices
= NULL
;
487 vbuf
->vertex_ptr
= vbuf
->vertices
;
493 vbuf_destroy(&vbuf
->stage
);