gallium: make p_winsys internal
[mesa.git] / src / gallium / drivers / i915simple / i915_prim_vbuf.c
1 /**************************************************************************
2 *
3 * Copyright 2007 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /**
29 * \file
30 * Build post-transformation, post-clipping vertex buffers and element
31 * lists by hooking into the end of the primitive pipeline and
32 * manipulating the vertex_id field in the vertex headers.
33 *
34 * XXX: work in progress
35 *
36 * \author José Fonseca <jrfonseca@tungstengraphics.com>
37 * \author Keith Whitwell <keith@tungstengraphics.com>
38 */
39
40
41 #include "draw/draw_context.h"
42 #include "draw/draw_vbuf.h"
43 #include "pipe/p_debug.h"
44 #include "pipe/p_inlines.h"
45 #include "pipe/internal/p_winsys_screen.h"
46 #include "util/u_math.h"
47 #include "util/u_memory.h"
48
49 #include "i915_context.h"
50 #include "i915_reg.h"
51 #include "i915_winsys.h"
52 #include "i915_batch.h"
53 #include "i915_state.h"
54
55
56 /**
57 * Primitive renderer for i915.
58 */
59 struct i915_vbuf_render {
60 struct vbuf_render base;
61
62 struct i915_context *i915;
63
64 /** Vertex size in bytes */
65 unsigned vertex_size;
66
67 /** Software primitive */
68 unsigned prim;
69
70 /** Hardware primitive */
71 unsigned hwprim;
72
73 /** Genereate a vertex list */
74 unsigned fallback;
75
76 /* Stuff for the vbo */
77 struct pipe_buffer *vbo;
78 size_t vbo_size;
79 size_t vbo_offset;
80 void *vbo_ptr;
81 size_t vbo_alloc_size;
82 };
83
84
85 /**
86 * Basically a cast wrapper.
87 */
88 static INLINE struct i915_vbuf_render *
89 i915_vbuf_render( struct vbuf_render *render )
90 {
91 assert(render);
92 return (struct i915_vbuf_render *)render;
93 }
94
95
96 static const struct vertex_info *
97 i915_vbuf_render_get_vertex_info( struct vbuf_render *render )
98 {
99 struct i915_vbuf_render *i915_render = i915_vbuf_render(render);
100 struct i915_context *i915 = i915_render->i915;
101
102 if (i915->dirty) {
103 /* make sure we have up to date vertex layout */
104 i915_update_derived( i915 );
105 }
106
107 return &i915->current.vertex_info;
108 }
109
110
111 static void *
112 i915_vbuf_render_allocate_vertices( struct vbuf_render *render,
113 ushort vertex_size,
114 ushort nr_vertices )
115 {
116 struct i915_vbuf_render *i915_render = i915_vbuf_render(render);
117 struct i915_context *i915 = i915_render->i915;
118 struct pipe_screen *screen = i915->pipe.screen;
119 size_t size = (size_t)vertex_size * (size_t)nr_vertices;
120
121 /* FIXME: handle failure */
122 assert(!i915->vbo);
123
124 if (i915_render->vbo_size > size + i915_render->vbo_offset && !i915->vbo_flushed) {
125 } else {
126 i915->vbo_flushed = 0;
127 pipe_buffer_reference(screen, &i915_render->vbo, NULL);
128 }
129
130 if (!i915_render->vbo) {
131 i915_render->vbo_size = MAX2(size, i915_render->vbo_alloc_size);
132 i915_render->vbo_offset = 0;
133 i915_render->vbo = pipe_buffer_create(screen,
134 64,
135 I915_BUFFER_USAGE_LIT_VERTEX,
136 i915_render->vbo_size);
137 i915_render->vbo_ptr = pipe_buffer_map(screen,
138 i915_render->vbo,
139 PIPE_BUFFER_USAGE_CPU_WRITE);
140 pipe_buffer_unmap(screen, i915_render->vbo);
141 }
142
143 i915->vbo = i915_render->vbo;
144 i915->vbo_offset = i915_render->vbo_offset;
145 i915->dirty |= I915_NEW_VBO;
146
147 return (unsigned char *)i915_render->vbo_ptr + i915->vbo_offset;
148 }
149
150
151 static boolean
152 i915_vbuf_render_set_primitive( struct vbuf_render *render,
153 unsigned prim )
154 {
155 struct i915_vbuf_render *i915_render = i915_vbuf_render(render);
156 i915_render->prim = prim;
157
158 switch(prim) {
159 case PIPE_PRIM_POINTS:
160 i915_render->hwprim = PRIM3D_POINTLIST;
161 i915_render->fallback = 0;
162 return TRUE;
163 case PIPE_PRIM_LINES:
164 i915_render->hwprim = PRIM3D_LINELIST;
165 i915_render->fallback = 0;
166 return TRUE;
167 case PIPE_PRIM_LINE_LOOP:
168 i915_render->hwprim = PRIM3D_LINELIST;
169 i915_render->fallback = PIPE_PRIM_LINE_LOOP;
170 return TRUE;
171 case PIPE_PRIM_LINE_STRIP:
172 i915_render->hwprim = PRIM3D_LINESTRIP;
173 i915_render->fallback = 0;
174 return TRUE;
175 case PIPE_PRIM_TRIANGLES:
176 i915_render->hwprim = PRIM3D_TRILIST;
177 i915_render->fallback = 0;
178 return TRUE;
179 case PIPE_PRIM_TRIANGLE_STRIP:
180 i915_render->hwprim = PRIM3D_TRISTRIP;
181 i915_render->fallback = 0;
182 return TRUE;
183 case PIPE_PRIM_TRIANGLE_FAN:
184 i915_render->hwprim = PRIM3D_TRIFAN;
185 i915_render->fallback = 0;
186 return TRUE;
187 case PIPE_PRIM_QUADS:
188 i915_render->hwprim = PRIM3D_TRILIST;
189 i915_render->fallback = PIPE_PRIM_QUADS;
190 return TRUE;
191 case PIPE_PRIM_QUAD_STRIP:
192 i915_render->hwprim = PRIM3D_TRILIST;
193 i915_render->fallback = PIPE_PRIM_QUAD_STRIP;
194 return TRUE;
195 case PIPE_PRIM_POLYGON:
196 i915_render->hwprim = PRIM3D_POLY;
197 i915_render->fallback = 0;
198 return TRUE;
199 default:
200 /* FIXME: Actually, can handle a lot more just fine... */
201 return FALSE;
202 }
203 }
204
205
206
207 /**
208 * Used for fallbacks in draw_arrays
209 */
210 static void
211 draw_arrays_generate_indices( struct vbuf_render *render,
212 unsigned start, uint nr,
213 unsigned type )
214 {
215 struct i915_vbuf_render *i915_render = i915_vbuf_render(render);
216 struct i915_context *i915 = i915_render->i915;
217 unsigned i;
218 unsigned end = start + nr;
219 switch(type) {
220 case 0:
221 for (i = start; i+1 < end; i += 2)
222 OUT_BATCH( (i+0) | (i+1) << 16 );
223 if (i < end)
224 OUT_BATCH( i );
225 break;
226 case PIPE_PRIM_LINE_LOOP:
227 if (nr >= 2) {
228 for (i = start + 1; i < end; i++)
229 OUT_BATCH( (i-0) | (i+0) << 16 );
230 OUT_BATCH( (i-0) | ( start) << 16 );
231 }
232 break;
233 case PIPE_PRIM_QUADS:
234 for (i = start; i + 3 < end; i += 4) {
235 OUT_BATCH( (i+0) | (i+1) << 16 );
236 OUT_BATCH( (i+3) | (i+1) << 16 );
237 OUT_BATCH( (i+2) | (i+3) << 16 );
238 }
239 break;
240 case PIPE_PRIM_QUAD_STRIP:
241 for (i = start; i + 3 < end; i += 2) {
242 OUT_BATCH( (i+0) | (i+1) << 16 );
243 OUT_BATCH( (i+3) | (i+2) << 16 );
244 OUT_BATCH( (i+0) | (i+3) << 16 );
245 }
246 break;
247 default:
248 assert(0);
249 }
250 }
251
252 static unsigned
253 draw_arrays_calc_nr_indices( uint nr, unsigned type )
254 {
255 switch (type) {
256 case 0:
257 return nr;
258 case PIPE_PRIM_LINE_LOOP:
259 if (nr >= 2)
260 return nr * 2;
261 else
262 return 0;
263 case PIPE_PRIM_QUADS:
264 return (nr / 4) * 6;
265 case PIPE_PRIM_QUAD_STRIP:
266 return ((nr - 2) / 2) * 6;
267 default:
268 assert(0);
269 return 0;
270 }
271 }
272
273 static void
274 draw_arrays_fallback( struct vbuf_render *render,
275 unsigned start,
276 uint nr )
277 {
278 struct i915_vbuf_render *i915_render = i915_vbuf_render(render);
279 struct i915_context *i915 = i915_render->i915;
280 unsigned nr_indices;
281
282 if (i915->dirty)
283 i915_update_derived( i915 );
284
285 if (i915->hardware_dirty)
286 i915_emit_hardware_state( i915 );
287
288 nr_indices = draw_arrays_calc_nr_indices( nr, i915_render->fallback );
289 if (!nr_indices)
290 return;
291
292 if (!BEGIN_BATCH( 1 + (nr_indices + 1)/2, 1 )) {
293 FLUSH_BATCH(NULL);
294
295 /* Make sure state is re-emitted after a flush:
296 */
297 i915_update_derived( i915 );
298 i915_emit_hardware_state( i915 );
299 i915->vbo_flushed = 1;
300
301 if (!BEGIN_BATCH( 1 + (nr_indices + 1)/2, 1 )) {
302 assert(0);
303 goto out;
304 }
305 }
306 OUT_BATCH( _3DPRIMITIVE |
307 PRIM_INDIRECT |
308 i915_render->hwprim |
309 PRIM_INDIRECT_ELTS |
310 nr_indices );
311
312 draw_arrays_generate_indices( render, start, nr, i915_render->fallback );
313
314 out:
315 return;
316 }
317
318 static void
319 i915_vbuf_render_draw_arrays( struct vbuf_render *render,
320 unsigned start,
321 uint nr )
322 {
323 struct i915_vbuf_render *i915_render = i915_vbuf_render(render);
324
325 if (i915_render->fallback) {
326 draw_arrays_fallback( render, start, nr );
327 return;
328 }
329
330 /* JB: TODO submit direct cmds */
331 draw_arrays_fallback( render, start, nr );
332 }
333
334 /**
335 * Used for normal and fallback emitting of indices
336 * If type is zero normal operation assumed.
337 */
338 static void
339 draw_generate_indices( struct vbuf_render *render,
340 const ushort *indices,
341 uint nr_indices,
342 unsigned type )
343 {
344 struct i915_vbuf_render *i915_render = i915_vbuf_render(render);
345 struct i915_context *i915 = i915_render->i915;
346 unsigned i;
347
348 switch(type) {
349 case 0:
350 for (i = 0; i + 1 < nr_indices; i += 2) {
351 OUT_BATCH( indices[i] | indices[i+1] << 16 );
352 }
353 if (i < nr_indices) {
354 OUT_BATCH( indices[i] );
355 }
356 break;
357 case PIPE_PRIM_LINE_LOOP:
358 if (nr_indices >= 2) {
359 for (i = 1; i < nr_indices; i++)
360 OUT_BATCH( indices[i-1] | indices[i] << 16 );
361 OUT_BATCH( indices[i-1] | indices[0] << 16 );
362 }
363 break;
364 case PIPE_PRIM_QUADS:
365 for (i = 0; i + 3 < nr_indices; i += 4) {
366 OUT_BATCH( indices[i+0] | indices[i+1] << 16 );
367 OUT_BATCH( indices[i+3] | indices[i+1] << 16 );
368 OUT_BATCH( indices[i+2] | indices[i+3] << 16 );
369 }
370 break;
371 case PIPE_PRIM_QUAD_STRIP:
372 for (i = 0; i + 3 < nr_indices; i += 2) {
373 OUT_BATCH( indices[i+0] | indices[i+1] << 16 );
374 OUT_BATCH( indices[i+3] | indices[i+2] << 16 );
375 OUT_BATCH( indices[i+0] | indices[i+3] << 16 );
376 }
377 break;
378 default:
379 assert(0);
380 break;
381 }
382 }
383
384 static unsigned
385 draw_calc_nr_indices( uint nr_indices, unsigned type )
386 {
387 switch (type) {
388 case 0:
389 return nr_indices;
390 case PIPE_PRIM_LINE_LOOP:
391 if (nr_indices >= 2)
392 return nr_indices * 2;
393 else
394 return 0;
395 case PIPE_PRIM_QUADS:
396 return (nr_indices / 4) * 6;
397 case PIPE_PRIM_QUAD_STRIP:
398 return ((nr_indices - 2) / 2) * 6;
399 default:
400 assert(0);
401 return 0;
402 }
403 }
404
405 static void
406 i915_vbuf_render_draw( struct vbuf_render *render,
407 const ushort *indices,
408 uint nr_indices)
409 {
410 struct i915_vbuf_render *i915_render = i915_vbuf_render(render);
411 struct i915_context *i915 = i915_render->i915;
412 unsigned save_nr_indices;
413
414 save_nr_indices = nr_indices;
415
416 nr_indices = draw_calc_nr_indices( nr_indices, i915_render->fallback );
417 if (!nr_indices)
418 return;
419
420 if (i915->dirty)
421 i915_update_derived( i915 );
422
423 if (i915->hardware_dirty)
424 i915_emit_hardware_state( i915 );
425
426 if (!BEGIN_BATCH( 1 + (nr_indices + 1)/2, 1 )) {
427 FLUSH_BATCH(NULL);
428
429 /* Make sure state is re-emitted after a flush:
430 */
431 i915_update_derived( i915 );
432 i915_emit_hardware_state( i915 );
433 i915->vbo_flushed = 1;
434
435 if (!BEGIN_BATCH( 1 + (nr_indices + 1)/2, 1 )) {
436 assert(0);
437 goto out;
438 }
439 }
440
441 OUT_BATCH( _3DPRIMITIVE |
442 PRIM_INDIRECT |
443 i915_render->hwprim |
444 PRIM_INDIRECT_ELTS |
445 nr_indices );
446 draw_generate_indices( render,
447 indices,
448 save_nr_indices,
449 i915_render->fallback );
450
451 out:
452 return;
453 }
454
455
456 static void
457 i915_vbuf_render_release_vertices( struct vbuf_render *render,
458 void *vertices,
459 unsigned vertex_size,
460 unsigned vertices_used )
461 {
462 struct i915_vbuf_render *i915_render = i915_vbuf_render(render);
463 struct i915_context *i915 = i915_render->i915;
464 size_t size = (size_t)vertex_size * (size_t)vertices_used;
465
466 assert(i915->vbo);
467
468 i915_render->vbo_offset += size;
469 i915->vbo = NULL;
470 i915->dirty |= I915_NEW_VBO;
471 }
472
473
474 static void
475 i915_vbuf_render_destroy( struct vbuf_render *render )
476 {
477 struct i915_vbuf_render *i915_render = i915_vbuf_render(render);
478 FREE(i915_render);
479 }
480
481
482 /**
483 * Create a new primitive render.
484 */
485 static struct vbuf_render *
486 i915_vbuf_render_create( struct i915_context *i915 )
487 {
488 struct i915_vbuf_render *i915_render = CALLOC_STRUCT(i915_vbuf_render);
489 struct pipe_screen *screen = i915->pipe.screen;
490
491 i915_render->i915 = i915;
492
493 i915_render->base.max_vertex_buffer_bytes = 128*1024;
494
495 /* NOTE: it must be such that state and vertices indices fit in a single
496 * batch buffer.
497 */
498 i915_render->base.max_indices = 16*1024;
499
500 i915_render->base.get_vertex_info = i915_vbuf_render_get_vertex_info;
501 i915_render->base.allocate_vertices = i915_vbuf_render_allocate_vertices;
502 i915_render->base.set_primitive = i915_vbuf_render_set_primitive;
503 i915_render->base.draw = i915_vbuf_render_draw;
504 i915_render->base.draw_arrays = i915_vbuf_render_draw_arrays;
505 i915_render->base.release_vertices = i915_vbuf_render_release_vertices;
506 i915_render->base.destroy = i915_vbuf_render_destroy;
507
508 i915_render->vbo_alloc_size = 128 * 4096;
509 i915_render->vbo_size = i915_render->vbo_alloc_size;
510 i915_render->vbo_offset = 0;
511 i915_render->vbo = pipe_buffer_create(screen,
512 64,
513 I915_BUFFER_USAGE_LIT_VERTEX,
514 i915_render->vbo_size);
515 i915_render->vbo_ptr = pipe_buffer_map(screen,
516 i915_render->vbo,
517 PIPE_BUFFER_USAGE_CPU_WRITE);
518 pipe_buffer_unmap(screen, i915_render->vbo);
519
520 return &i915_render->base;
521 }
522
523
524 /**
525 * Create a new primitive vbuf/render stage.
526 */
527 struct draw_stage *i915_draw_vbuf_stage( struct i915_context *i915 )
528 {
529 struct vbuf_render *render;
530 struct draw_stage *stage;
531
532 render = i915_vbuf_render_create(i915);
533 if(!render)
534 return NULL;
535
536 stage = draw_vbuf_stage( i915->draw, render );
537 if(!stage) {
538 render->destroy(render);
539 return NULL;
540 }
541 /** TODO JB: this shouldn't be here */
542 draw_set_render(i915->draw, render);
543
544 return stage;
545 }