2 * Mesa 3-D graphics library
4 * Copyright (C) 1999-2008 Brian Paul All Rights Reserved.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
13 * The above copyright notice and this permission notice shall be included
14 * in all copies or substantial portions of the Software.
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
17 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22 * OTHER DEALINGS IN THE SOFTWARE.
25 * Keith Whitwell <keithw@vmware.com>
30 #include "main/glheader.h"
31 #include "main/bufferobj.h"
32 #include "main/compiler.h"
33 #include "main/context.h"
34 #include "main/enums.h"
35 #include "main/state.h"
36 #include "main/vtxfmt.h"
38 #include "vbo_context.h"
43 vbo_exec_debug_verts( struct vbo_exec_context
*exec
)
45 GLuint count
= exec
->vtx
.vert_count
;
48 printf("%s: %u vertices %d primitives, %d vertsize\n",
52 exec
->vtx
.vertex_size
);
54 for (i
= 0 ; i
< exec
->vtx
.prim_count
; i
++) {
55 struct _mesa_prim
*prim
= &exec
->vtx
.prim
[i
];
56 printf(" prim %d: %s%s %d..%d %s %s\n",
58 _mesa_lookup_prim_by_nr(prim
->mode
),
59 prim
->weak
? " (weak)" : "",
61 prim
->start
+ prim
->count
,
62 prim
->begin
? "BEGIN" : "(wrap)",
63 prim
->end
? "END" : "(wrap)");
69 * Copy zero, one or two vertices from the current vertex buffer into
70 * the temporary "copy" buffer.
71 * This is used when a single primitive overflows a vertex buffer and
72 * we need to continue the primitive in a new vertex buffer.
73 * The temporary "copy" buffer holds the vertices which need to get
74 * copied from the old buffer to the new one.
77 vbo_copy_vertices( struct vbo_exec_context
*exec
)
79 struct _mesa_prim
*last_prim
= &exec
->vtx
.prim
[exec
->vtx
.prim_count
- 1];
80 const GLuint nr
= last_prim
->count
;
82 const GLuint sz
= exec
->vtx
.vertex_size
;
83 fi_type
*dst
= exec
->vtx
.copied
.buffer
;
84 const fi_type
*src
= exec
->vtx
.buffer_map
+ last_prim
->start
* sz
;
86 switch (exec
->ctx
->Driver
.CurrentExecPrimitive
) {
91 for (i
= 0 ; i
< ovf
; i
++)
92 memcpy( dst
+i
*sz
, src
+(nr
-ovf
+i
)*sz
, sz
* sizeof(GLfloat
) );
96 for (i
= 0 ; i
< ovf
; i
++)
97 memcpy( dst
+i
*sz
, src
+(nr
-ovf
+i
)*sz
, sz
* sizeof(GLfloat
) );
101 for (i
= 0 ; i
< ovf
; i
++)
102 memcpy( dst
+i
*sz
, src
+(nr
-ovf
+i
)*sz
, sz
* sizeof(GLfloat
) );
109 memcpy( dst
, src
+(nr
-1)*sz
, sz
* sizeof(GLfloat
) );
113 if (last_prim
->begin
== 0) {
114 /* We're dealing with the second or later section of a split/wrapped
115 * GL_LINE_LOOP. Since we're converting line loops to line strips,
116 * we've already increment the last_prim->start counter by one to
117 * skip the 0th vertex in the loop. We need to undo that (effectively
118 * subtract one from last_prim->start) so that we copy the 0th vertex
119 * to the next vertex buffer.
121 assert(last_prim
->start
> 0);
125 case GL_TRIANGLE_FAN
:
131 memcpy( dst
, src
+0, sz
* sizeof(GLfloat
) );
135 memcpy( dst
, src
+0, sz
* sizeof(GLfloat
) );
136 memcpy( dst
+sz
, src
+(nr
-1)*sz
, sz
* sizeof(GLfloat
) );
139 case GL_TRIANGLE_STRIP
:
140 /* no parity issue, but need to make sure the tri is not drawn twice */
157 for (i
= 0 ; i
< ovf
; i
++)
158 memcpy( dst
+i
*sz
, src
+(nr
-ovf
+i
)*sz
, sz
* sizeof(GLfloat
) );
160 case PRIM_OUTSIDE_BEGIN_END
:
170 /* TODO: populate these as the vertex is defined:
173 vbo_exec_bind_arrays( struct gl_context
*ctx
)
175 struct vbo_context
*vbo
= vbo_context(ctx
);
176 struct vbo_exec_context
*exec
= &vbo
->exec
;
177 struct gl_client_array
*arrays
= exec
->vtx
.arrays
;
180 GLbitfield64 varying_inputs
= 0x0;
181 bool swap_pos
= false;
183 /* Install the default (ie Current) attributes first, then overlay
186 switch (get_program_mode(exec
->ctx
)) {
188 for (attr
= 0; attr
< VERT_ATTRIB_FF_MAX
; attr
++) {
189 exec
->vtx
.inputs
[attr
] = &vbo
->currval
[VBO_ATTRIB_POS
+attr
];
191 for (attr
= 0; attr
< MAT_ATTRIB_MAX
; attr
++) {
192 assert(VERT_ATTRIB_GENERIC(attr
) < ARRAY_SIZE(exec
->vtx
.inputs
));
193 exec
->vtx
.inputs
[VERT_ATTRIB_GENERIC(attr
)] =
194 &vbo
->currval
[VBO_ATTRIB_MAT_FRONT_AMBIENT
+attr
];
196 map
= vbo
->map_vp_none
;
199 for (attr
= 0; attr
< VERT_ATTRIB_FF_MAX
; attr
++) {
200 exec
->vtx
.inputs
[attr
] = &vbo
->currval
[VBO_ATTRIB_POS
+attr
];
202 for (attr
= 0; attr
< VERT_ATTRIB_GENERIC_MAX
; attr
++) {
203 assert(VERT_ATTRIB_GENERIC(attr
) < ARRAY_SIZE(exec
->vtx
.inputs
));
204 exec
->vtx
.inputs
[VERT_ATTRIB_GENERIC(attr
)] =
205 &vbo
->currval
[VBO_ATTRIB_GENERIC0
+attr
];
207 map
= vbo
->map_vp_arb
;
209 /* check if VERT_ATTRIB_POS is not read but VERT_BIT_GENERIC0 is read.
210 * In that case we effectively need to route the data from
211 * glVertexAttrib(0, val) calls to feed into the GENERIC0 input.
212 * The original state gets essentially restored below.
214 if ((ctx
->VertexProgram
._Current
->InputsRead
& VERT_BIT_POS
) == 0 &&
215 (ctx
->VertexProgram
._Current
->InputsRead
& VERT_BIT_GENERIC0
)) {
217 exec
->vtx
.inputs
[VERT_ATTRIB_GENERIC0
] = exec
->vtx
.inputs
[0];
218 exec
->vtx
.attrsz
[VERT_ATTRIB_GENERIC0
] = exec
->vtx
.attrsz
[0];
219 exec
->vtx
.attrtype
[VERT_ATTRIB_GENERIC0
] = exec
->vtx
.attrtype
[0];
220 exec
->vtx
.attrptr
[VERT_ATTRIB_GENERIC0
] = exec
->vtx
.attrptr
[0];
221 exec
->vtx
.attrsz
[0] = 0;
228 for (attr
= 0; attr
< VERT_ATTRIB_MAX
; attr
++) {
229 const GLuint src
= map
[attr
];
231 if (exec
->vtx
.attrsz
[src
]) {
232 GLsizeiptr offset
= (GLbyte
*)exec
->vtx
.attrptr
[src
] -
233 (GLbyte
*)exec
->vtx
.vertex
;
235 /* override the default array set above */
236 assert(attr
< ARRAY_SIZE(exec
->vtx
.inputs
));
237 assert(attr
< ARRAY_SIZE(exec
->vtx
.arrays
)); /* arrays[] */
238 exec
->vtx
.inputs
[attr
] = &arrays
[attr
];
240 if (_mesa_is_bufferobj(exec
->vtx
.bufferobj
)) {
241 /* a real buffer obj: Ptr is an offset, not a pointer */
242 assert(exec
->vtx
.bufferobj
->Mappings
[MAP_INTERNAL
].Pointer
);
244 arrays
[attr
].Ptr
= (GLubyte
*)
245 exec
->vtx
.bufferobj
->Mappings
[MAP_INTERNAL
].Offset
+ offset
;
248 /* Ptr into ordinary app memory */
249 arrays
[attr
].Ptr
= (GLubyte
*)exec
->vtx
.buffer_map
+ offset
;
251 arrays
[attr
].Size
= exec
->vtx
.attrsz
[src
];
252 arrays
[attr
].StrideB
= exec
->vtx
.vertex_size
* sizeof(GLfloat
);
253 arrays
[attr
].Type
= exec
->vtx
.attrtype
[src
];
254 arrays
[attr
].Integer
=
255 vbo_attrtype_to_integer_flag(exec
->vtx
.attrtype
[src
]);
256 arrays
[attr
].Format
= GL_RGBA
;
257 arrays
[attr
]._ElementSize
= arrays
[attr
].Size
* sizeof(GLfloat
);
258 _mesa_reference_buffer_object(ctx
,
259 &arrays
[attr
].BufferObj
,
260 exec
->vtx
.bufferobj
);
262 varying_inputs
|= VERT_BIT(attr
);
266 /* In case we swapped the position and generic0 attribute.
267 * Restore the original setting of the vtx.* variables.
268 * They are still needed with the original order and settings in case
269 * of a split primitive.
272 exec
->vtx
.attrsz
[0] = exec
->vtx
.attrsz
[VERT_ATTRIB_GENERIC0
];
273 exec
->vtx
.attrsz
[VERT_ATTRIB_GENERIC0
] = 0;
276 _mesa_set_varying_vp_inputs( ctx
, varying_inputs
);
277 ctx
->NewDriverState
|= ctx
->DriverFlags
.NewArray
;
282 * Unmap the VBO. This is called before drawing.
285 vbo_exec_vtx_unmap( struct vbo_exec_context
*exec
)
287 if (_mesa_is_bufferobj(exec
->vtx
.bufferobj
)) {
288 struct gl_context
*ctx
= exec
->ctx
;
290 if (ctx
->Driver
.FlushMappedBufferRange
) {
291 GLintptr offset
= exec
->vtx
.buffer_used
-
292 exec
->vtx
.bufferobj
->Mappings
[MAP_INTERNAL
].Offset
;
293 GLsizeiptr length
= (exec
->vtx
.buffer_ptr
- exec
->vtx
.buffer_map
) *
297 ctx
->Driver
.FlushMappedBufferRange(ctx
, offset
, length
,
302 exec
->vtx
.buffer_used
+= (exec
->vtx
.buffer_ptr
-
303 exec
->vtx
.buffer_map
) * sizeof(float);
305 assert(exec
->vtx
.buffer_used
<= VBO_VERT_BUFFER_SIZE
);
306 assert(exec
->vtx
.buffer_ptr
!= NULL
);
308 ctx
->Driver
.UnmapBuffer(ctx
, exec
->vtx
.bufferobj
, MAP_INTERNAL
);
309 exec
->vtx
.buffer_map
= NULL
;
310 exec
->vtx
.buffer_ptr
= NULL
;
311 exec
->vtx
.max_vert
= 0;
317 * Map the vertex buffer to begin storing glVertex, glColor, etc data.
320 vbo_exec_vtx_map( struct vbo_exec_context
*exec
)
322 struct gl_context
*ctx
= exec
->ctx
;
323 const GLenum accessRange
= GL_MAP_WRITE_BIT
| /* for MapBufferRange */
324 GL_MAP_INVALIDATE_RANGE_BIT
|
325 GL_MAP_UNSYNCHRONIZED_BIT
|
326 GL_MAP_FLUSH_EXPLICIT_BIT
|
328 const GLenum usage
= GL_STREAM_DRAW_ARB
;
330 if (!_mesa_is_bufferobj(exec
->vtx
.bufferobj
))
333 assert(!exec
->vtx
.buffer_map
);
334 assert(!exec
->vtx
.buffer_ptr
);
336 if (VBO_VERT_BUFFER_SIZE
> exec
->vtx
.buffer_used
+ 1024) {
337 /* The VBO exists and there's room for more */
338 if (exec
->vtx
.bufferobj
->Size
> 0) {
339 exec
->vtx
.buffer_map
=
340 (fi_type
*)ctx
->Driver
.MapBufferRange(ctx
,
341 exec
->vtx
.buffer_used
,
342 (VBO_VERT_BUFFER_SIZE
-
343 exec
->vtx
.buffer_used
),
347 exec
->vtx
.buffer_ptr
= exec
->vtx
.buffer_map
;
350 exec
->vtx
.buffer_ptr
= exec
->vtx
.buffer_map
= NULL
;
354 if (!exec
->vtx
.buffer_map
) {
355 /* Need to allocate a new VBO */
356 exec
->vtx
.buffer_used
= 0;
358 if (ctx
->Driver
.BufferData(ctx
, GL_ARRAY_BUFFER_ARB
,
359 VBO_VERT_BUFFER_SIZE
,
362 GL_DYNAMIC_STORAGE_BIT
|
363 GL_CLIENT_STORAGE_BIT
,
364 exec
->vtx
.bufferobj
)) {
365 /* buffer allocation worked, now map the buffer */
366 exec
->vtx
.buffer_map
=
367 (fi_type
*)ctx
->Driver
.MapBufferRange(ctx
,
368 0, VBO_VERT_BUFFER_SIZE
,
374 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "VBO allocation");
375 exec
->vtx
.buffer_map
= NULL
;
379 exec
->vtx
.buffer_ptr
= exec
->vtx
.buffer_map
;
381 if (!exec
->vtx
.buffer_map
) {
383 _mesa_install_exec_vtxfmt( ctx
, &exec
->vtxfmt_noop
);
386 if (_mesa_using_noop_vtxfmt(ctx
->Exec
)) {
387 /* The no-op functions are installed so switch back to regular
388 * functions. We do this test just to avoid frequent and needless
389 * calls to _mesa_install_exec_vtxfmt().
391 _mesa_install_exec_vtxfmt(ctx
, &exec
->vtxfmt
);
396 printf("map %d..\n", exec
->vtx
.buffer_used
);
402 * Execute the buffer and save copied verts.
403 * \param keep_unmapped if true, leave the VBO unmapped when we're done.
406 vbo_exec_vtx_flush(struct vbo_exec_context
*exec
, GLboolean keepUnmapped
)
409 vbo_exec_debug_verts( exec
);
411 if (exec
->vtx
.prim_count
&&
412 exec
->vtx
.vert_count
) {
414 exec
->vtx
.copied
.nr
= vbo_copy_vertices( exec
);
416 if (exec
->vtx
.copied
.nr
!= exec
->vtx
.vert_count
) {
417 struct gl_context
*ctx
= exec
->ctx
;
419 /* Before the update_state() as this may raise _NEW_VARYING_VP_INPUTS
420 * from _mesa_set_varying_vp_inputs().
422 vbo_exec_bind_arrays( ctx
);
425 _mesa_update_state( ctx
);
427 if (_mesa_is_bufferobj(exec
->vtx
.bufferobj
)) {
428 vbo_exec_vtx_unmap( exec
);
432 printf("%s %d %d\n", __func__
, exec
->vtx
.prim_count
,
433 exec
->vtx
.vert_count
);
435 vbo_context(ctx
)->draw_prims( ctx
,
437 exec
->vtx
.prim_count
,
441 exec
->vtx
.vert_count
- 1,
444 /* If using a real VBO, get new storage -- unless asked not to.
446 if (_mesa_is_bufferobj(exec
->vtx
.bufferobj
) && !keepUnmapped
) {
447 vbo_exec_vtx_map( exec
);
452 /* May have to unmap explicitly if we didn't draw:
455 _mesa_is_bufferobj(exec
->vtx
.bufferobj
) &&
456 exec
->vtx
.buffer_map
) {
457 vbo_exec_vtx_unmap( exec
);
460 if (keepUnmapped
|| exec
->vtx
.vertex_size
== 0)
461 exec
->vtx
.max_vert
= 0;
463 exec
->vtx
.max_vert
= vbo_compute_max_verts(exec
);
465 exec
->vtx
.buffer_ptr
= exec
->vtx
.buffer_map
;
466 exec
->vtx
.prim_count
= 0;
467 exec
->vtx
.vert_count
= 0;