1 /**************************************************************************
3 * Copyright 2011 Marek Olšák <maraeo@gmail.com>
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
29 * This module uploads user buffers and translates the vertex buffers which
30 * contain incompatible vertices (i.e. not supported by the driver/hardware)
31 * into compatible ones, based on the Gallium CAPs.
33 * It does not upload index buffers.
35 * The module heavily uses bitmasks to represent per-buffer and
36 * per-vertex-element flags to avoid looping over the list of buffers just
37 * to see if there's a non-zero stride, or user buffer, or unsupported format,
40 * There are 3 categories of vertex elements, which are processed separately:
41 * - per-vertex attribs (stride != 0, instance_divisor == 0)
42 * - instanced attribs (stride != 0, instance_divisor > 0)
43 * - constant attribs (stride == 0)
45 * All needed uploads and translations are performed every draw command, but
46 * only the subset of vertices needed for that draw command is uploaded or
47 * translated. (the module never translates whole buffers)
50 * The module consists of two main parts:
53 * 1) Translate (u_vbuf_translate_begin/end)
55 * This is pretty much a vertex fetch fallback. It translates vertices from
56 * one vertex buffer to another in an unused vertex buffer slot. It does
57 * whatever is needed to make the vertices readable by the hardware (changes
58 * vertex formats and aligns offsets and strides). The translate module is
61 * Each of the 3 categories is translated to a separate buffer.
62 * Only the [min_index, max_index] range is translated. For instanced attribs,
63 * the range is [start_instance, start_instance+instance_count]. For constant
64 * attribs, the range is [0, 1].
67 * 2) User buffer uploading (u_vbuf_upload_buffers)
69 * Only the [min_index, max_index] range is uploaded (just like Translate)
70 * with a single memcpy.
72 * This method works best for non-indexed draw operations or indexed draw
73 * operations where the [min_index, max_index] range is not being way bigger
74 * than the vertex count.
76 * If the range is too big (e.g. one triangle with indices {0, 1, 10000}),
77 * the per-vertex attribs are uploaded via the translate module, all packed
78 * into one vertex buffer, and the indexed draw call is turned into
79 * a non-indexed one in the process. This adds additional complexity
80 * to the translate part, but it prevents bad apps from bringing your frame
84 * If there is nothing to do, it forwards every command to the driver.
85 * The module also has its own CSO cache of vertex element states.
88 #include "util/u_vbuf.h"
90 #include "util/u_dump.h"
91 #include "util/u_format.h"
92 #include "util/u_inlines.h"
93 #include "util/u_memory.h"
94 #include "util/u_upload_mgr.h"
95 #include "translate/translate.h"
96 #include "translate/translate_cache.h"
97 #include "cso_cache/cso_cache.h"
98 #include "cso_cache/cso_hash.h"
100 struct u_vbuf_elements
{
102 struct pipe_vertex_element ve
[PIPE_MAX_ATTRIBS
];
104 unsigned src_format_size
[PIPE_MAX_ATTRIBS
];
106 /* If (velem[i].src_format != native_format[i]), the vertex buffer
107 * referenced by the vertex element cannot be used for rendering and
108 * its vertex data must be translated to native_format[i]. */
109 enum pipe_format native_format
[PIPE_MAX_ATTRIBS
];
110 unsigned native_format_size
[PIPE_MAX_ATTRIBS
];
112 /* Which buffers are used by the vertex element state. */
113 uint32_t used_vb_mask
;
114 /* This might mean two things:
115 * - src_format != native_format, as discussed above.
116 * - src_offset % 4 != 0 (if the caps don't allow such an offset). */
117 uint32_t incompatible_elem_mask
; /* each bit describes a corresp. attrib */
118 /* Which buffer has at least one vertex element referencing it
120 uint32_t incompatible_vb_mask_any
;
121 /* Which buffer has all vertex elements referencing it incompatible. */
122 uint32_t incompatible_vb_mask_all
;
123 /* Which buffer has at least one vertex element referencing it
125 uint32_t compatible_vb_mask_any
;
126 /* Which buffer has all vertex elements referencing it compatible. */
127 uint32_t compatible_vb_mask_all
;
129 /* Which buffer has at least one vertex element referencing it
131 uint32_t noninstance_vb_mask_any
;
144 struct u_vbuf_caps caps
;
146 struct pipe_context
*pipe
;
147 struct translate_cache
*translate_cache
;
148 struct cso_cache
*cso_cache
;
149 struct u_upload_mgr
*uploader
;
151 /* This is what was set in set_vertex_buffers.
152 * May contain user buffers. */
153 struct pipe_vertex_buffer vertex_buffer
[PIPE_MAX_ATTRIBS
];
154 uint32_t enabled_vb_mask
;
156 /* Saved vertex buffer. */
157 unsigned aux_vertex_buffer_slot
;
158 struct pipe_vertex_buffer aux_vertex_buffer_saved
;
160 /* Vertex buffers for the driver.
161 * There are usually no user buffers. */
162 struct pipe_vertex_buffer real_vertex_buffer
[PIPE_MAX_ATTRIBS
];
163 uint32_t dirty_real_vb_mask
; /* which buffers are dirty since the last
164 call of set_vertex_buffers */
166 /* The index buffer. */
167 struct pipe_index_buffer index_buffer
;
169 /* Vertex elements. */
170 struct u_vbuf_elements
*ve
, *ve_saved
;
172 /* Vertex elements used for the translate fallback. */
173 struct pipe_vertex_element fallback_velems
[PIPE_MAX_ATTRIBS
];
174 /* If non-NULL, this is a vertex element state used for the translate
175 * fallback and therefore used for rendering too. */
176 boolean using_translate
;
177 /* The vertex buffer slot index where translated vertices have been
179 unsigned fallback_vbs
[VB_NUM
];
181 /* Which buffer is a user buffer. */
182 uint32_t user_vb_mask
; /* each bit describes a corresp. buffer */
183 /* Which buffer is incompatible (unaligned). */
184 uint32_t incompatible_vb_mask
; /* each bit describes a corresp. buffer */
185 /* Which buffer has a non-zero stride. */
186 uint32_t nonzero_stride_vb_mask
; /* each bit describes a corresp. buffer */
190 u_vbuf_create_vertex_elements(struct u_vbuf
*mgr
, unsigned count
,
191 const struct pipe_vertex_element
*attribs
);
192 static void u_vbuf_delete_vertex_elements(struct u_vbuf
*mgr
, void *cso
);
194 static const struct {
195 enum pipe_format from
, to
;
196 } vbuf_format_fallbacks
[] = {
197 { PIPE_FORMAT_R32_FIXED
, PIPE_FORMAT_R32_FLOAT
},
198 { PIPE_FORMAT_R32G32_FIXED
, PIPE_FORMAT_R32G32_FLOAT
},
199 { PIPE_FORMAT_R32G32B32_FIXED
, PIPE_FORMAT_R32G32B32_FLOAT
},
200 { PIPE_FORMAT_R32G32B32A32_FIXED
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
201 { PIPE_FORMAT_R16_FLOAT
, PIPE_FORMAT_R32_FLOAT
},
202 { PIPE_FORMAT_R16G16_FLOAT
, PIPE_FORMAT_R32G32_FLOAT
},
203 { PIPE_FORMAT_R16G16B16_FLOAT
, PIPE_FORMAT_R32G32B32_FLOAT
},
204 { PIPE_FORMAT_R16G16B16A16_FLOAT
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
205 { PIPE_FORMAT_R64_FLOAT
, PIPE_FORMAT_R32_FLOAT
},
206 { PIPE_FORMAT_R64G64_FLOAT
, PIPE_FORMAT_R32G32_FLOAT
},
207 { PIPE_FORMAT_R64G64B64_FLOAT
, PIPE_FORMAT_R32G32B32_FLOAT
},
208 { PIPE_FORMAT_R64G64B64A64_FLOAT
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
209 { PIPE_FORMAT_R32_UNORM
, PIPE_FORMAT_R32_FLOAT
},
210 { PIPE_FORMAT_R32G32_UNORM
, PIPE_FORMAT_R32G32_FLOAT
},
211 { PIPE_FORMAT_R32G32B32_UNORM
, PIPE_FORMAT_R32G32B32_FLOAT
},
212 { PIPE_FORMAT_R32G32B32A32_UNORM
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
213 { PIPE_FORMAT_R32_SNORM
, PIPE_FORMAT_R32_FLOAT
},
214 { PIPE_FORMAT_R32G32_SNORM
, PIPE_FORMAT_R32G32_FLOAT
},
215 { PIPE_FORMAT_R32G32B32_SNORM
, PIPE_FORMAT_R32G32B32_FLOAT
},
216 { PIPE_FORMAT_R32G32B32A32_SNORM
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
217 { PIPE_FORMAT_R32_USCALED
, PIPE_FORMAT_R32_FLOAT
},
218 { PIPE_FORMAT_R32G32_USCALED
, PIPE_FORMAT_R32G32_FLOAT
},
219 { PIPE_FORMAT_R32G32B32_USCALED
, PIPE_FORMAT_R32G32B32_FLOAT
},
220 { PIPE_FORMAT_R32G32B32A32_USCALED
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
221 { PIPE_FORMAT_R32_SSCALED
, PIPE_FORMAT_R32_FLOAT
},
222 { PIPE_FORMAT_R32G32_SSCALED
, PIPE_FORMAT_R32G32_FLOAT
},
223 { PIPE_FORMAT_R32G32B32_SSCALED
, PIPE_FORMAT_R32G32B32_FLOAT
},
224 { PIPE_FORMAT_R32G32B32A32_SSCALED
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
225 { PIPE_FORMAT_R16_UNORM
, PIPE_FORMAT_R32_FLOAT
},
226 { PIPE_FORMAT_R16G16_UNORM
, PIPE_FORMAT_R32G32_FLOAT
},
227 { PIPE_FORMAT_R16G16B16_UNORM
, PIPE_FORMAT_R32G32B32_FLOAT
},
228 { PIPE_FORMAT_R16G16B16A16_UNORM
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
229 { PIPE_FORMAT_R16_SNORM
, PIPE_FORMAT_R32_FLOAT
},
230 { PIPE_FORMAT_R16G16_SNORM
, PIPE_FORMAT_R32G32_FLOAT
},
231 { PIPE_FORMAT_R16G16B16_SNORM
, PIPE_FORMAT_R32G32B32_FLOAT
},
232 { PIPE_FORMAT_R16G16B16A16_SNORM
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
233 { PIPE_FORMAT_R16_USCALED
, PIPE_FORMAT_R32_FLOAT
},
234 { PIPE_FORMAT_R16G16_USCALED
, PIPE_FORMAT_R32G32_FLOAT
},
235 { PIPE_FORMAT_R16G16B16_USCALED
, PIPE_FORMAT_R32G32B32_FLOAT
},
236 { PIPE_FORMAT_R16G16B16A16_USCALED
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
237 { PIPE_FORMAT_R16_SSCALED
, PIPE_FORMAT_R32_FLOAT
},
238 { PIPE_FORMAT_R16G16_SSCALED
, PIPE_FORMAT_R32G32_FLOAT
},
239 { PIPE_FORMAT_R16G16B16_SSCALED
, PIPE_FORMAT_R32G32B32_FLOAT
},
240 { PIPE_FORMAT_R16G16B16A16_SSCALED
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
241 { PIPE_FORMAT_R8_UNORM
, PIPE_FORMAT_R32_FLOAT
},
242 { PIPE_FORMAT_R8G8_UNORM
, PIPE_FORMAT_R32G32_FLOAT
},
243 { PIPE_FORMAT_R8G8B8_UNORM
, PIPE_FORMAT_R32G32B32_FLOAT
},
244 { PIPE_FORMAT_R8G8B8A8_UNORM
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
245 { PIPE_FORMAT_R8_SNORM
, PIPE_FORMAT_R32_FLOAT
},
246 { PIPE_FORMAT_R8G8_SNORM
, PIPE_FORMAT_R32G32_FLOAT
},
247 { PIPE_FORMAT_R8G8B8_SNORM
, PIPE_FORMAT_R32G32B32_FLOAT
},
248 { PIPE_FORMAT_R8G8B8A8_SNORM
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
249 { PIPE_FORMAT_R8_USCALED
, PIPE_FORMAT_R32_FLOAT
},
250 { PIPE_FORMAT_R8G8_USCALED
, PIPE_FORMAT_R32G32_FLOAT
},
251 { PIPE_FORMAT_R8G8B8_USCALED
, PIPE_FORMAT_R32G32B32_FLOAT
},
252 { PIPE_FORMAT_R8G8B8A8_USCALED
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
253 { PIPE_FORMAT_R8_SSCALED
, PIPE_FORMAT_R32_FLOAT
},
254 { PIPE_FORMAT_R8G8_SSCALED
, PIPE_FORMAT_R32G32_FLOAT
},
255 { PIPE_FORMAT_R8G8B8_SSCALED
, PIPE_FORMAT_R32G32B32_FLOAT
},
256 { PIPE_FORMAT_R8G8B8A8_SSCALED
, PIPE_FORMAT_R32G32B32A32_FLOAT
},
259 boolean
u_vbuf_get_caps(struct pipe_screen
*screen
, struct u_vbuf_caps
*caps
)
262 boolean fallback
= FALSE
;
264 /* I'd rather have a bitfield of which formats are supported and a static
265 * table of the translations indexed by format, but since we don't have C99
266 * we can't easily make a sparsely-populated table indexed by format. So,
267 * we construct the sparse table here.
269 for (i
= 0; i
< PIPE_FORMAT_COUNT
; i
++)
270 caps
->format_translation
[i
] = i
;
272 for (i
= 0; i
< Elements(vbuf_format_fallbacks
); i
++) {
273 enum pipe_format format
= vbuf_format_fallbacks
[i
].from
;
275 if (!screen
->is_format_supported(screen
, format
, PIPE_BUFFER
, 0,
276 PIPE_BIND_VERTEX_BUFFER
)) {
277 caps
->format_translation
[format
] = vbuf_format_fallbacks
[i
].to
;
282 caps
->buffer_offset_unaligned
=
283 !screen
->get_param(screen
,
284 PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY
);
285 caps
->buffer_stride_unaligned
=
286 !screen
->get_param(screen
,
287 PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY
);
288 caps
->velem_src_offset_unaligned
=
289 !screen
->get_param(screen
,
290 PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY
);
291 caps
->user_vertex_buffers
=
292 screen
->get_param(screen
, PIPE_CAP_USER_VERTEX_BUFFERS
);
294 if (!caps
->buffer_offset_unaligned
||
295 !caps
->buffer_stride_unaligned
||
296 !caps
->velem_src_offset_unaligned
||
297 !caps
->user_vertex_buffers
) {
305 u_vbuf_create(struct pipe_context
*pipe
,
306 struct u_vbuf_caps
*caps
, unsigned aux_vertex_buffer_index
)
308 struct u_vbuf
*mgr
= CALLOC_STRUCT(u_vbuf
);
311 mgr
->aux_vertex_buffer_slot
= aux_vertex_buffer_index
;
313 mgr
->cso_cache
= cso_cache_create();
314 mgr
->translate_cache
= translate_cache_create();
315 memset(mgr
->fallback_vbs
, ~0, sizeof(mgr
->fallback_vbs
));
317 mgr
->uploader
= u_upload_create(pipe
, 1024 * 1024, 4,
318 PIPE_BIND_VERTEX_BUFFER
);
323 /* u_vbuf uses its own caching for vertex elements, because it needs to keep
324 * its own preprocessed state per vertex element CSO. */
325 static struct u_vbuf_elements
*
326 u_vbuf_set_vertex_elements_internal(struct u_vbuf
*mgr
, unsigned count
,
327 const struct pipe_vertex_element
*states
)
329 struct pipe_context
*pipe
= mgr
->pipe
;
330 unsigned key_size
, hash_key
;
331 struct cso_hash_iter iter
;
332 struct u_vbuf_elements
*ve
;
333 struct cso_velems_state velems_state
;
335 /* need to include the count into the stored state data too. */
336 key_size
= sizeof(struct pipe_vertex_element
) * count
+ sizeof(unsigned);
337 velems_state
.count
= count
;
338 memcpy(velems_state
.velems
, states
,
339 sizeof(struct pipe_vertex_element
) * count
);
340 hash_key
= cso_construct_key((void*)&velems_state
, key_size
);
341 iter
= cso_find_state_template(mgr
->cso_cache
, hash_key
, CSO_VELEMENTS
,
342 (void*)&velems_state
, key_size
);
344 if (cso_hash_iter_is_null(iter
)) {
345 struct cso_velements
*cso
= MALLOC_STRUCT(cso_velements
);
346 memcpy(&cso
->state
, &velems_state
, key_size
);
347 cso
->data
= u_vbuf_create_vertex_elements(mgr
, count
, states
);
348 cso
->delete_state
= (cso_state_callback
)u_vbuf_delete_vertex_elements
;
349 cso
->context
= (void*)mgr
;
351 iter
= cso_insert_state(mgr
->cso_cache
, hash_key
, CSO_VELEMENTS
, cso
);
354 ve
= ((struct cso_velements
*)cso_hash_iter_data(iter
))->data
;
360 pipe
->bind_vertex_elements_state(pipe
, ve
->driver_cso
);
365 void u_vbuf_set_vertex_elements(struct u_vbuf
*mgr
, unsigned count
,
366 const struct pipe_vertex_element
*states
)
368 mgr
->ve
= u_vbuf_set_vertex_elements_internal(mgr
, count
, states
);
371 void u_vbuf_destroy(struct u_vbuf
*mgr
)
373 struct pipe_screen
*screen
= mgr
->pipe
->screen
;
375 unsigned num_vb
= screen
->get_shader_param(screen
, PIPE_SHADER_VERTEX
,
376 PIPE_SHADER_CAP_MAX_INPUTS
);
378 mgr
->pipe
->set_index_buffer(mgr
->pipe
, NULL
);
379 pipe_resource_reference(&mgr
->index_buffer
.buffer
, NULL
);
381 mgr
->pipe
->set_vertex_buffers(mgr
->pipe
, 0, num_vb
, NULL
);
383 for (i
= 0; i
< PIPE_MAX_ATTRIBS
; i
++) {
384 pipe_resource_reference(&mgr
->vertex_buffer
[i
].buffer
, NULL
);
386 for (i
= 0; i
< PIPE_MAX_ATTRIBS
; i
++) {
387 pipe_resource_reference(&mgr
->real_vertex_buffer
[i
].buffer
, NULL
);
389 pipe_resource_reference(&mgr
->aux_vertex_buffer_saved
.buffer
, NULL
);
391 translate_cache_destroy(mgr
->translate_cache
);
392 u_upload_destroy(mgr
->uploader
);
393 cso_cache_delete(mgr
->cso_cache
);
397 static enum pipe_error
398 u_vbuf_translate_buffers(struct u_vbuf
*mgr
, struct translate_key
*key
,
399 unsigned vb_mask
, unsigned out_vb
,
400 int start_vertex
, unsigned num_vertices
,
401 int start_index
, unsigned num_indices
, int min_index
,
402 boolean unroll_indices
)
404 struct translate
*tr
;
405 struct pipe_transfer
*vb_transfer
[PIPE_MAX_ATTRIBS
] = {0};
406 struct pipe_resource
*out_buffer
= NULL
;
408 unsigned out_offset
, mask
;
410 /* Get a translate object. */
411 tr
= translate_cache_find(mgr
->translate_cache
, key
);
413 /* Map buffers we want to translate. */
416 struct pipe_vertex_buffer
*vb
;
419 unsigned i
= u_bit_scan(&mask
);
421 vb
= &mgr
->vertex_buffer
[i
];
422 offset
= vb
->buffer_offset
+ vb
->stride
* start_vertex
;
424 if (vb
->user_buffer
) {
425 map
= (uint8_t*)vb
->user_buffer
+ offset
;
427 unsigned size
= vb
->stride
? num_vertices
* vb
->stride
430 if (offset
+size
> vb
->buffer
->width0
) {
431 size
= vb
->buffer
->width0
- offset
;
434 map
= pipe_buffer_map_range(mgr
->pipe
, vb
->buffer
, offset
, size
,
435 PIPE_TRANSFER_READ
, &vb_transfer
[i
]);
438 /* Subtract min_index so that indexing with the index buffer works. */
439 if (unroll_indices
) {
440 map
-= (ptrdiff_t)vb
->stride
* min_index
;
443 tr
->set_buffer(tr
, i
, map
, vb
->stride
, ~0);
447 if (unroll_indices
) {
448 struct pipe_index_buffer
*ib
= &mgr
->index_buffer
;
449 struct pipe_transfer
*transfer
= NULL
;
450 unsigned offset
= ib
->offset
+ start_index
* ib
->index_size
;
453 assert((ib
->buffer
|| ib
->user_buffer
) && ib
->index_size
);
455 /* Create and map the output buffer. */
456 u_upload_alloc(mgr
->uploader
, 0,
457 key
->output_stride
* num_indices
,
458 &out_offset
, &out_buffer
,
461 return PIPE_ERROR_OUT_OF_MEMORY
;
463 if (ib
->user_buffer
) {
464 map
= (uint8_t*)ib
->user_buffer
+ offset
;
466 map
= pipe_buffer_map_range(mgr
->pipe
, ib
->buffer
, offset
,
467 num_indices
* ib
->index_size
,
468 PIPE_TRANSFER_READ
, &transfer
);
471 switch (ib
->index_size
) {
473 tr
->run_elts(tr
, (unsigned*)map
, num_indices
, 0, 0, out_map
);
476 tr
->run_elts16(tr
, (uint16_t*)map
, num_indices
, 0, 0, out_map
);
479 tr
->run_elts8(tr
, map
, num_indices
, 0, 0, out_map
);
484 pipe_buffer_unmap(mgr
->pipe
, transfer
);
487 /* Create and map the output buffer. */
488 u_upload_alloc(mgr
->uploader
,
489 key
->output_stride
* start_vertex
,
490 key
->output_stride
* num_vertices
,
491 &out_offset
, &out_buffer
,
494 return PIPE_ERROR_OUT_OF_MEMORY
;
496 out_offset
-= key
->output_stride
* start_vertex
;
498 tr
->run(tr
, 0, num_vertices
, 0, 0, out_map
);
501 /* Unmap all buffers. */
504 unsigned i
= u_bit_scan(&mask
);
506 if (vb_transfer
[i
]) {
507 pipe_buffer_unmap(mgr
->pipe
, vb_transfer
[i
]);
511 /* Setup the new vertex buffer. */
512 mgr
->real_vertex_buffer
[out_vb
].buffer_offset
= out_offset
;
513 mgr
->real_vertex_buffer
[out_vb
].stride
= key
->output_stride
;
515 /* Move the buffer reference. */
516 pipe_resource_reference(
517 &mgr
->real_vertex_buffer
[out_vb
].buffer
, NULL
);
518 mgr
->real_vertex_buffer
[out_vb
].buffer
= out_buffer
;
524 u_vbuf_translate_find_free_vb_slots(struct u_vbuf
*mgr
,
525 unsigned mask
[VB_NUM
])
528 unsigned fallback_vbs
[VB_NUM
];
529 /* Set the bit for each buffer which is incompatible, or isn't set. */
530 uint32_t unused_vb_mask
=
531 mgr
->ve
->incompatible_vb_mask_all
| mgr
->incompatible_vb_mask
|
532 ~mgr
->enabled_vb_mask
;
534 memset(fallback_vbs
, ~0, sizeof(fallback_vbs
));
536 /* Find free slots for each type if needed. */
537 for (type
= 0; type
< VB_NUM
; type
++) {
541 if (!unused_vb_mask
) {
545 index
= ffs(unused_vb_mask
) - 1;
546 fallback_vbs
[type
] = index
;
547 unused_vb_mask
&= ~(1 << index
);
548 /*printf("found slot=%i for type=%i\n", index, type);*/
552 for (type
= 0; type
< VB_NUM
; type
++) {
554 mgr
->dirty_real_vb_mask
|= 1 << fallback_vbs
[type
];
558 memcpy(mgr
->fallback_vbs
, fallback_vbs
, sizeof(fallback_vbs
));
563 u_vbuf_translate_begin(struct u_vbuf
*mgr
,
564 int start_vertex
, unsigned num_vertices
,
565 int start_instance
, unsigned num_instances
,
566 int start_index
, unsigned num_indices
, int min_index
,
567 boolean unroll_indices
)
569 unsigned mask
[VB_NUM
] = {0};
570 struct translate_key key
[VB_NUM
];
571 unsigned elem_index
[VB_NUM
][PIPE_MAX_ATTRIBS
]; /* ... into key.elements */
573 unsigned incompatible_vb_mask
= mgr
->incompatible_vb_mask
&
574 mgr
->ve
->used_vb_mask
;
576 int start
[VB_NUM
] = {
577 start_vertex
, /* VERTEX */
578 start_instance
, /* INSTANCE */
582 unsigned num
[VB_NUM
] = {
583 num_vertices
, /* VERTEX */
584 num_instances
, /* INSTANCE */
588 memset(key
, 0, sizeof(key
));
589 memset(elem_index
, ~0, sizeof(elem_index
));
591 /* See if there are vertex attribs of each type to translate and
593 for (i
= 0; i
< mgr
->ve
->count
; i
++) {
594 unsigned vb_index
= mgr
->ve
->ve
[i
].vertex_buffer_index
;
596 if (!mgr
->vertex_buffer
[vb_index
].stride
) {
597 if (!(mgr
->ve
->incompatible_elem_mask
& (1 << i
)) &&
598 !(incompatible_vb_mask
& (1 << vb_index
))) {
601 mask
[VB_CONST
] |= 1 << vb_index
;
602 } else if (mgr
->ve
->ve
[i
].instance_divisor
) {
603 if (!(mgr
->ve
->incompatible_elem_mask
& (1 << i
)) &&
604 !(incompatible_vb_mask
& (1 << vb_index
))) {
607 mask
[VB_INSTANCE
] |= 1 << vb_index
;
609 if (!unroll_indices
&&
610 !(mgr
->ve
->incompatible_elem_mask
& (1 << i
)) &&
611 !(incompatible_vb_mask
& (1 << vb_index
))) {
614 mask
[VB_VERTEX
] |= 1 << vb_index
;
618 assert(mask
[VB_VERTEX
] || mask
[VB_INSTANCE
] || mask
[VB_CONST
]);
620 /* Find free vertex buffer slots. */
621 if (!u_vbuf_translate_find_free_vb_slots(mgr
, mask
)) {
625 /* Initialize the translate keys. */
626 for (i
= 0; i
< mgr
->ve
->count
; i
++) {
627 struct translate_key
*k
;
628 struct translate_element
*te
;
629 unsigned bit
, vb_index
= mgr
->ve
->ve
[i
].vertex_buffer_index
;
632 if (!(mgr
->ve
->incompatible_elem_mask
& (1 << i
)) &&
633 !(incompatible_vb_mask
& (1 << vb_index
)) &&
634 (!unroll_indices
|| !(mask
[VB_VERTEX
] & bit
))) {
638 /* Set type to what we will translate.
639 * Whether vertex, instance, or constant attribs. */
640 for (type
= 0; type
< VB_NUM
; type
++) {
641 if (mask
[type
] & bit
) {
645 assert(type
< VB_NUM
);
646 assert(translate_is_output_format_supported(mgr
->ve
->native_format
[i
]));
647 /*printf("velem=%i type=%i\n", i, type);*/
649 /* Add the vertex element. */
651 elem_index
[type
][i
] = k
->nr_elements
;
653 te
= &k
->element
[k
->nr_elements
];
654 te
->type
= TRANSLATE_ELEMENT_NORMAL
;
655 te
->instance_divisor
= 0;
656 te
->input_buffer
= vb_index
;
657 te
->input_format
= mgr
->ve
->ve
[i
].src_format
;
658 te
->input_offset
= mgr
->ve
->ve
[i
].src_offset
;
659 te
->output_format
= mgr
->ve
->native_format
[i
];
660 te
->output_offset
= k
->output_stride
;
662 k
->output_stride
+= mgr
->ve
->native_format_size
[i
];
666 /* Translate buffers. */
667 for (type
= 0; type
< VB_NUM
; type
++) {
668 if (key
[type
].nr_elements
) {
670 err
= u_vbuf_translate_buffers(mgr
, &key
[type
], mask
[type
],
671 mgr
->fallback_vbs
[type
],
672 start
[type
], num
[type
],
673 start_index
, num_indices
, min_index
,
674 unroll_indices
&& type
== VB_VERTEX
);
678 /* Fixup the stride for constant attribs. */
679 if (type
== VB_CONST
) {
680 mgr
->real_vertex_buffer
[mgr
->fallback_vbs
[VB_CONST
]].stride
= 0;
685 /* Setup new vertex elements. */
686 for (i
= 0; i
< mgr
->ve
->count
; i
++) {
687 for (type
= 0; type
< VB_NUM
; type
++) {
688 if (elem_index
[type
][i
] < key
[type
].nr_elements
) {
689 struct translate_element
*te
= &key
[type
].element
[elem_index
[type
][i
]];
690 mgr
->fallback_velems
[i
].instance_divisor
= mgr
->ve
->ve
[i
].instance_divisor
;
691 mgr
->fallback_velems
[i
].src_format
= te
->output_format
;
692 mgr
->fallback_velems
[i
].src_offset
= te
->output_offset
;
693 mgr
->fallback_velems
[i
].vertex_buffer_index
= mgr
->fallback_vbs
[type
];
695 /* elem_index[type][i] can only be set for one type. */
696 assert(type
> VB_INSTANCE
|| elem_index
[type
+1][i
] == ~0);
697 assert(type
> VB_VERTEX
|| elem_index
[type
+2][i
] == ~0);
701 /* No translating, just copy the original vertex element over. */
702 if (type
== VB_NUM
) {
703 memcpy(&mgr
->fallback_velems
[i
], &mgr
->ve
->ve
[i
],
704 sizeof(struct pipe_vertex_element
));
708 u_vbuf_set_vertex_elements_internal(mgr
, mgr
->ve
->count
,
709 mgr
->fallback_velems
);
710 mgr
->using_translate
= TRUE
;
714 static void u_vbuf_translate_end(struct u_vbuf
*mgr
)
718 /* Restore vertex elements. */
719 mgr
->pipe
->bind_vertex_elements_state(mgr
->pipe
, mgr
->ve
->driver_cso
);
720 mgr
->using_translate
= FALSE
;
722 /* Unreference the now-unused VBOs. */
723 for (i
= 0; i
< VB_NUM
; i
++) {
724 unsigned vb
= mgr
->fallback_vbs
[i
];
726 pipe_resource_reference(&mgr
->real_vertex_buffer
[vb
].buffer
, NULL
);
727 mgr
->fallback_vbs
[i
] = ~0;
729 /* This will cause the buffer to be unbound in the driver later. */
730 mgr
->dirty_real_vb_mask
|= 1 << vb
;
736 u_vbuf_create_vertex_elements(struct u_vbuf
*mgr
, unsigned count
,
737 const struct pipe_vertex_element
*attribs
)
739 struct pipe_context
*pipe
= mgr
->pipe
;
741 struct pipe_vertex_element driver_attribs
[PIPE_MAX_ATTRIBS
];
742 struct u_vbuf_elements
*ve
= CALLOC_STRUCT(u_vbuf_elements
);
743 uint32_t used_buffers
= 0;
747 memcpy(ve
->ve
, attribs
, sizeof(struct pipe_vertex_element
) * count
);
748 memcpy(driver_attribs
, attribs
, sizeof(struct pipe_vertex_element
) * count
);
750 /* Set the best native format in case the original format is not
752 for (i
= 0; i
< count
; i
++) {
753 enum pipe_format format
= ve
->ve
[i
].src_format
;
755 ve
->src_format_size
[i
] = util_format_get_blocksize(format
);
757 used_buffers
|= 1 << ve
->ve
[i
].vertex_buffer_index
;
759 if (!ve
->ve
[i
].instance_divisor
) {
760 ve
->noninstance_vb_mask_any
|= 1 << ve
->ve
[i
].vertex_buffer_index
;
763 format
= mgr
->caps
.format_translation
[format
];
765 driver_attribs
[i
].src_format
= format
;
766 ve
->native_format
[i
] = format
;
767 ve
->native_format_size
[i
] =
768 util_format_get_blocksize(ve
->native_format
[i
]);
770 if (ve
->ve
[i
].src_format
!= format
||
771 (!mgr
->caps
.velem_src_offset_unaligned
&&
772 ve
->ve
[i
].src_offset
% 4 != 0)) {
773 ve
->incompatible_elem_mask
|= 1 << i
;
774 ve
->incompatible_vb_mask_any
|= 1 << ve
->ve
[i
].vertex_buffer_index
;
776 ve
->compatible_vb_mask_any
|= 1 << ve
->ve
[i
].vertex_buffer_index
;
780 ve
->used_vb_mask
= used_buffers
;
781 ve
->compatible_vb_mask_all
= ~ve
->incompatible_vb_mask_any
& used_buffers
;
782 ve
->incompatible_vb_mask_all
= ~ve
->compatible_vb_mask_any
& used_buffers
;
784 /* Align the formats and offsets to the size of DWORD if needed. */
785 if (!mgr
->caps
.velem_src_offset_unaligned
) {
786 for (i
= 0; i
< count
; i
++) {
787 ve
->native_format_size
[i
] = align(ve
->native_format_size
[i
], 4);
788 driver_attribs
[i
].src_offset
= align(ve
->ve
[i
].src_offset
, 4);
793 pipe
->create_vertex_elements_state(pipe
, count
, driver_attribs
);
797 static void u_vbuf_delete_vertex_elements(struct u_vbuf
*mgr
, void *cso
)
799 struct pipe_context
*pipe
= mgr
->pipe
;
800 struct u_vbuf_elements
*ve
= cso
;
802 pipe
->delete_vertex_elements_state(pipe
, ve
->driver_cso
);
806 void u_vbuf_set_vertex_buffers(struct u_vbuf
*mgr
,
807 unsigned start_slot
, unsigned count
,
808 const struct pipe_vertex_buffer
*bufs
)
811 /* which buffers are enabled */
812 uint32_t enabled_vb_mask
= 0;
813 /* which buffers are in user memory */
814 uint32_t user_vb_mask
= 0;
815 /* which buffers are incompatible with the driver */
816 uint32_t incompatible_vb_mask
= 0;
817 /* which buffers have a non-zero stride */
818 uint32_t nonzero_stride_vb_mask
= 0;
819 uint32_t mask
= ~(((1ull << count
) - 1) << start_slot
);
821 /* Zero out the bits we are going to rewrite completely. */
822 mgr
->user_vb_mask
&= mask
;
823 mgr
->incompatible_vb_mask
&= mask
;
824 mgr
->nonzero_stride_vb_mask
&= mask
;
825 mgr
->enabled_vb_mask
&= mask
;
828 struct pipe_context
*pipe
= mgr
->pipe
;
830 mgr
->dirty_real_vb_mask
&= mask
;
832 for (i
= 0; i
< count
; i
++) {
833 unsigned dst_index
= start_slot
+ i
;
835 pipe_resource_reference(&mgr
->vertex_buffer
[dst_index
].buffer
, NULL
);
836 pipe_resource_reference(&mgr
->real_vertex_buffer
[dst_index
].buffer
,
840 pipe
->set_vertex_buffers(pipe
, start_slot
, count
, NULL
);
844 for (i
= 0; i
< count
; i
++) {
845 unsigned dst_index
= start_slot
+ i
;
846 const struct pipe_vertex_buffer
*vb
= &bufs
[i
];
847 struct pipe_vertex_buffer
*orig_vb
= &mgr
->vertex_buffer
[dst_index
];
848 struct pipe_vertex_buffer
*real_vb
= &mgr
->real_vertex_buffer
[dst_index
];
850 if (!vb
->buffer
&& !vb
->user_buffer
) {
851 pipe_resource_reference(&orig_vb
->buffer
, NULL
);
852 pipe_resource_reference(&real_vb
->buffer
, NULL
);
853 real_vb
->user_buffer
= NULL
;
857 pipe_resource_reference(&orig_vb
->buffer
, vb
->buffer
);
858 orig_vb
->user_buffer
= vb
->user_buffer
;
860 real_vb
->buffer_offset
= orig_vb
->buffer_offset
= vb
->buffer_offset
;
861 real_vb
->stride
= orig_vb
->stride
= vb
->stride
;
864 nonzero_stride_vb_mask
|= 1 << dst_index
;
866 enabled_vb_mask
|= 1 << dst_index
;
868 if ((!mgr
->caps
.buffer_offset_unaligned
&& vb
->buffer_offset
% 4 != 0) ||
869 (!mgr
->caps
.buffer_stride_unaligned
&& vb
->stride
% 4 != 0)) {
870 incompatible_vb_mask
|= 1 << dst_index
;
871 pipe_resource_reference(&real_vb
->buffer
, NULL
);
875 if (!mgr
->caps
.user_vertex_buffers
&& vb
->user_buffer
) {
876 user_vb_mask
|= 1 << dst_index
;
877 pipe_resource_reference(&real_vb
->buffer
, NULL
);
881 pipe_resource_reference(&real_vb
->buffer
, vb
->buffer
);
882 real_vb
->user_buffer
= vb
->user_buffer
;
885 mgr
->user_vb_mask
|= user_vb_mask
;
886 mgr
->incompatible_vb_mask
|= incompatible_vb_mask
;
887 mgr
->nonzero_stride_vb_mask
|= nonzero_stride_vb_mask
;
888 mgr
->enabled_vb_mask
|= enabled_vb_mask
;
890 /* All changed buffers are marked as dirty, even the NULL ones,
891 * which will cause the NULL buffers to be unbound in the driver later. */
892 mgr
->dirty_real_vb_mask
|= ~mask
;
895 void u_vbuf_set_index_buffer(struct u_vbuf
*mgr
,
896 const struct pipe_index_buffer
*ib
)
898 struct pipe_context
*pipe
= mgr
->pipe
;
901 assert(ib
->offset
% ib
->index_size
== 0);
902 pipe_resource_reference(&mgr
->index_buffer
.buffer
, ib
->buffer
);
903 memcpy(&mgr
->index_buffer
, ib
, sizeof(*ib
));
905 pipe_resource_reference(&mgr
->index_buffer
.buffer
, NULL
);
908 pipe
->set_index_buffer(pipe
, ib
);
911 static enum pipe_error
912 u_vbuf_upload_buffers(struct u_vbuf
*mgr
,
913 int start_vertex
, unsigned num_vertices
,
914 int start_instance
, unsigned num_instances
)
917 unsigned nr_velems
= mgr
->ve
->count
;
918 struct pipe_vertex_element
*velems
=
919 mgr
->using_translate
? mgr
->fallback_velems
: mgr
->ve
->ve
;
920 unsigned start_offset
[PIPE_MAX_ATTRIBS
];
921 unsigned end_offset
[PIPE_MAX_ATTRIBS
];
922 uint32_t buffer_mask
= 0;
924 /* Determine how much data needs to be uploaded. */
925 for (i
= 0; i
< nr_velems
; i
++) {
926 struct pipe_vertex_element
*velem
= &velems
[i
];
927 unsigned index
= velem
->vertex_buffer_index
;
928 struct pipe_vertex_buffer
*vb
= &mgr
->vertex_buffer
[index
];
929 unsigned instance_div
, first
, size
, index_bit
;
931 /* Skip the buffers generated by translate. */
932 if (index
== mgr
->fallback_vbs
[VB_VERTEX
] ||
933 index
== mgr
->fallback_vbs
[VB_INSTANCE
] ||
934 index
== mgr
->fallback_vbs
[VB_CONST
]) {
938 if (!vb
->user_buffer
) {
942 instance_div
= velem
->instance_divisor
;
943 first
= vb
->buffer_offset
+ velem
->src_offset
;
946 /* Constant attrib. */
947 size
= mgr
->ve
->src_format_size
[i
];
948 } else if (instance_div
) {
949 /* Per-instance attrib. */
950 unsigned count
= (num_instances
+ instance_div
- 1) / instance_div
;
951 first
+= vb
->stride
* start_instance
;
952 size
= vb
->stride
* (count
- 1) + mgr
->ve
->src_format_size
[i
];
954 /* Per-vertex attrib. */
955 first
+= vb
->stride
* start_vertex
;
956 size
= vb
->stride
* (num_vertices
- 1) + mgr
->ve
->src_format_size
[i
];
959 index_bit
= 1 << index
;
961 /* Update offsets. */
962 if (!(buffer_mask
& index_bit
)) {
963 start_offset
[index
] = first
;
964 end_offset
[index
] = first
+ size
;
966 if (first
< start_offset
[index
])
967 start_offset
[index
] = first
;
968 if (first
+ size
> end_offset
[index
])
969 end_offset
[index
] = first
+ size
;
972 buffer_mask
|= index_bit
;
975 /* Upload buffers. */
976 while (buffer_mask
) {
978 struct pipe_vertex_buffer
*real_vb
;
981 i
= u_bit_scan(&buffer_mask
);
983 start
= start_offset
[i
];
987 real_vb
= &mgr
->real_vertex_buffer
[i
];
988 ptr
= mgr
->vertex_buffer
[i
].user_buffer
;
990 u_upload_data(mgr
->uploader
, start
, end
- start
, ptr
+ start
,
991 &real_vb
->buffer_offset
, &real_vb
->buffer
);
992 if (!real_vb
->buffer
)
993 return PIPE_ERROR_OUT_OF_MEMORY
;
995 real_vb
->buffer_offset
-= start
;
1001 static boolean
u_vbuf_need_minmax_index(const struct u_vbuf
*mgr
)
1003 /* See if there are any per-vertex attribs which will be uploaded or
1004 * translated. Use bitmasks to get the info instead of looping over vertex
1006 return (mgr
->ve
->used_vb_mask
&
1007 ((mgr
->user_vb_mask
| mgr
->incompatible_vb_mask
|
1008 mgr
->ve
->incompatible_vb_mask_any
) &
1009 mgr
->ve
->noninstance_vb_mask_any
& mgr
->nonzero_stride_vb_mask
)) != 0;
1012 static boolean
u_vbuf_mapping_vertex_buffer_blocks(const struct u_vbuf
*mgr
)
1014 /* Return true if there are hw buffers which don't need to be translated.
1016 * We could query whether each buffer is busy, but that would
1017 * be way more costly than this. */
1018 return (mgr
->ve
->used_vb_mask
&
1019 (~mgr
->user_vb_mask
& ~mgr
->incompatible_vb_mask
&
1020 mgr
->ve
->compatible_vb_mask_all
& mgr
->ve
->noninstance_vb_mask_any
&
1021 mgr
->nonzero_stride_vb_mask
)) != 0;
1024 static void u_vbuf_get_minmax_index(struct pipe_context
*pipe
,
1025 struct pipe_index_buffer
*ib
,
1026 boolean primitive_restart
,
1027 unsigned restart_index
,
1028 unsigned start
, unsigned count
,
1032 struct pipe_transfer
*transfer
= NULL
;
1033 const void *indices
;
1036 if (ib
->user_buffer
) {
1037 indices
= (uint8_t*)ib
->user_buffer
+
1038 ib
->offset
+ start
* ib
->index_size
;
1040 indices
= pipe_buffer_map_range(pipe
, ib
->buffer
,
1041 ib
->offset
+ start
* ib
->index_size
,
1042 count
* ib
->index_size
,
1043 PIPE_TRANSFER_READ
, &transfer
);
1046 switch (ib
->index_size
) {
1048 const unsigned *ui_indices
= (const unsigned*)indices
;
1049 unsigned max_ui
= 0;
1050 unsigned min_ui
= ~0U;
1051 if (primitive_restart
) {
1052 for (i
= 0; i
< count
; i
++) {
1053 if (ui_indices
[i
] != restart_index
) {
1054 if (ui_indices
[i
] > max_ui
) max_ui
= ui_indices
[i
];
1055 if (ui_indices
[i
] < min_ui
) min_ui
= ui_indices
[i
];
1060 for (i
= 0; i
< count
; i
++) {
1061 if (ui_indices
[i
] > max_ui
) max_ui
= ui_indices
[i
];
1062 if (ui_indices
[i
] < min_ui
) min_ui
= ui_indices
[i
];
1065 *out_min_index
= min_ui
;
1066 *out_max_index
= max_ui
;
1070 const unsigned short *us_indices
= (const unsigned short*)indices
;
1071 unsigned max_us
= 0;
1072 unsigned min_us
= ~0U;
1073 if (primitive_restart
) {
1074 for (i
= 0; i
< count
; i
++) {
1075 if (us_indices
[i
] != restart_index
) {
1076 if (us_indices
[i
] > max_us
) max_us
= us_indices
[i
];
1077 if (us_indices
[i
] < min_us
) min_us
= us_indices
[i
];
1082 for (i
= 0; i
< count
; i
++) {
1083 if (us_indices
[i
] > max_us
) max_us
= us_indices
[i
];
1084 if (us_indices
[i
] < min_us
) min_us
= us_indices
[i
];
1087 *out_min_index
= min_us
;
1088 *out_max_index
= max_us
;
1092 const unsigned char *ub_indices
= (const unsigned char*)indices
;
1093 unsigned max_ub
= 0;
1094 unsigned min_ub
= ~0U;
1095 if (primitive_restart
) {
1096 for (i
= 0; i
< count
; i
++) {
1097 if (ub_indices
[i
] != restart_index
) {
1098 if (ub_indices
[i
] > max_ub
) max_ub
= ub_indices
[i
];
1099 if (ub_indices
[i
] < min_ub
) min_ub
= ub_indices
[i
];
1104 for (i
= 0; i
< count
; i
++) {
1105 if (ub_indices
[i
] > max_ub
) max_ub
= ub_indices
[i
];
1106 if (ub_indices
[i
] < min_ub
) min_ub
= ub_indices
[i
];
1109 *out_min_index
= min_ub
;
1110 *out_max_index
= max_ub
;
1120 pipe_buffer_unmap(pipe
, transfer
);
1124 static void u_vbuf_set_driver_vertex_buffers(struct u_vbuf
*mgr
)
1126 struct pipe_context
*pipe
= mgr
->pipe
;
1127 unsigned start_slot
, count
;
1129 start_slot
= ffs(mgr
->dirty_real_vb_mask
) - 1;
1130 count
= util_last_bit(mgr
->dirty_real_vb_mask
>> start_slot
);
1132 pipe
->set_vertex_buffers(pipe
, start_slot
, count
,
1133 mgr
->real_vertex_buffer
+ start_slot
);
1134 mgr
->dirty_real_vb_mask
= 0;
1137 void u_vbuf_draw_vbo(struct u_vbuf
*mgr
, const struct pipe_draw_info
*info
)
1139 struct pipe_context
*pipe
= mgr
->pipe
;
1140 int start_vertex
, min_index
;
1141 unsigned num_vertices
;
1142 boolean unroll_indices
= FALSE
;
1143 uint32_t used_vb_mask
= mgr
->ve
->used_vb_mask
;
1144 uint32_t user_vb_mask
= mgr
->user_vb_mask
& used_vb_mask
;
1145 uint32_t incompatible_vb_mask
= mgr
->incompatible_vb_mask
& used_vb_mask
;
1146 struct pipe_draw_info new_info
;
1148 /* Normal draw. No fallback and no user buffers. */
1149 if (!incompatible_vb_mask
&&
1150 !mgr
->ve
->incompatible_elem_mask
&&
1153 /* Set vertex buffers if needed. */
1154 if (mgr
->dirty_real_vb_mask
& used_vb_mask
) {
1155 u_vbuf_set_driver_vertex_buffers(mgr
);
1158 pipe
->draw_vbo(pipe
, info
);
1164 /* Fallback. We need to know all the parameters. */
1165 if (new_info
.indirect
) {
1166 struct pipe_transfer
*transfer
= NULL
;
1169 if (new_info
.indexed
) {
1170 data
= pipe_buffer_map_range(pipe
, new_info
.indirect
,
1171 new_info
.indirect_offset
, 20,
1172 PIPE_TRANSFER_READ
, &transfer
);
1173 new_info
.index_bias
= data
[3];
1174 new_info
.start_instance
= data
[4];
1177 data
= pipe_buffer_map_range(pipe
, new_info
.indirect
,
1178 new_info
.indirect_offset
, 16,
1179 PIPE_TRANSFER_READ
, &transfer
);
1180 new_info
.start_instance
= data
[3];
1183 new_info
.count
= data
[0];
1184 new_info
.instance_count
= data
[1];
1185 new_info
.start
= data
[2];
1186 pipe_buffer_unmap(pipe
, transfer
);
1187 new_info
.indirect
= NULL
;
1190 if (new_info
.indexed
) {
1191 /* See if anything needs to be done for per-vertex attribs. */
1192 if (u_vbuf_need_minmax_index(mgr
)) {
1195 if (new_info
.max_index
!= ~0) {
1196 min_index
= new_info
.min_index
;
1197 max_index
= new_info
.max_index
;
1199 u_vbuf_get_minmax_index(mgr
->pipe
, &mgr
->index_buffer
,
1200 new_info
.primitive_restart
,
1201 new_info
.restart_index
, new_info
.start
,
1202 new_info
.count
, &min_index
, &max_index
);
1205 assert(min_index
<= max_index
);
1207 start_vertex
= min_index
+ new_info
.index_bias
;
1208 num_vertices
= max_index
+ 1 - min_index
;
1210 /* Primitive restart doesn't work when unrolling indices.
1211 * We would have to break this drawing operation into several ones. */
1212 /* Use some heuristic to see if unrolling indices improves
1214 if (!new_info
.primitive_restart
&&
1215 num_vertices
> new_info
.count
*2 &&
1216 num_vertices
- new_info
.count
> 32 &&
1217 !u_vbuf_mapping_vertex_buffer_blocks(mgr
)) {
1218 unroll_indices
= TRUE
;
1219 user_vb_mask
&= ~(mgr
->nonzero_stride_vb_mask
&
1220 mgr
->ve
->noninstance_vb_mask_any
);
1223 /* Nothing to do for per-vertex attribs. */
1229 start_vertex
= new_info
.start
;
1230 num_vertices
= new_info
.count
;
1234 /* Translate vertices with non-native layouts or formats. */
1235 if (unroll_indices
||
1236 incompatible_vb_mask
||
1237 mgr
->ve
->incompatible_elem_mask
) {
1238 if (!u_vbuf_translate_begin(mgr
, start_vertex
, num_vertices
,
1239 new_info
.start_instance
,
1240 new_info
.instance_count
, new_info
.start
,
1241 new_info
.count
, min_index
, unroll_indices
)) {
1242 debug_warn_once("u_vbuf_translate_begin() failed");
1246 if (unroll_indices
) {
1247 new_info
.indexed
= FALSE
;
1248 new_info
.index_bias
= 0;
1249 new_info
.min_index
= 0;
1250 new_info
.max_index
= new_info
.count
- 1;
1254 user_vb_mask
&= ~(incompatible_vb_mask
|
1255 mgr
->ve
->incompatible_vb_mask_all
);
1258 /* Upload user buffers. */
1260 if (u_vbuf_upload_buffers(mgr
, start_vertex
, num_vertices
,
1261 new_info
.start_instance
,
1262 new_info
.instance_count
) != PIPE_OK
) {
1263 debug_warn_once("u_vbuf_upload_buffers() failed");
1267 mgr
->dirty_real_vb_mask
|= user_vb_mask
;
1271 if (unroll_indices) {
1272 printf("unrolling indices: start_vertex = %i, num_vertices = %i\n",
1273 start_vertex, num_vertices);
1274 util_dump_draw_info(stdout, info);
1279 for (i = 0; i < mgr->nr_vertex_buffers; i++) {
1280 printf("input %i: ", i);
1281 util_dump_vertex_buffer(stdout, mgr->vertex_buffer+i);
1284 for (i = 0; i < mgr->nr_real_vertex_buffers; i++) {
1285 printf("real %i: ", i);
1286 util_dump_vertex_buffer(stdout, mgr->real_vertex_buffer+i);
1291 u_upload_unmap(mgr
->uploader
);
1292 u_vbuf_set_driver_vertex_buffers(mgr
);
1294 pipe
->draw_vbo(pipe
, &new_info
);
1296 if (mgr
->using_translate
) {
1297 u_vbuf_translate_end(mgr
);
1301 void u_vbuf_save_vertex_elements(struct u_vbuf
*mgr
)
1303 assert(!mgr
->ve_saved
);
1304 mgr
->ve_saved
= mgr
->ve
;
1307 void u_vbuf_restore_vertex_elements(struct u_vbuf
*mgr
)
1309 if (mgr
->ve
!= mgr
->ve_saved
) {
1310 struct pipe_context
*pipe
= mgr
->pipe
;
1312 mgr
->ve
= mgr
->ve_saved
;
1313 pipe
->bind_vertex_elements_state(pipe
,
1314 mgr
->ve
? mgr
->ve
->driver_cso
: NULL
);
1316 mgr
->ve_saved
= NULL
;
1319 void u_vbuf_save_aux_vertex_buffer_slot(struct u_vbuf
*mgr
)
1321 struct pipe_vertex_buffer
*vb
=
1322 &mgr
->vertex_buffer
[mgr
->aux_vertex_buffer_slot
];
1324 pipe_resource_reference(&mgr
->aux_vertex_buffer_saved
.buffer
, vb
->buffer
);
1325 memcpy(&mgr
->aux_vertex_buffer_saved
, vb
, sizeof(*vb
));
1328 void u_vbuf_restore_aux_vertex_buffer_slot(struct u_vbuf
*mgr
)
1330 u_vbuf_set_vertex_buffers(mgr
, mgr
->aux_vertex_buffer_slot
, 1,
1331 &mgr
->aux_vertex_buffer_saved
);
1332 pipe_resource_reference(&mgr
->aux_vertex_buffer_saved
.buffer
, NULL
);