gallium: a lot more complete implementation of stream output
[mesa.git] / src / gallium / auxiliary / draw / draw_pt_emit.c
1 /**************************************************************************
2 *
3 * Copyright 2008 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 #include "util/u_memory.h"
29 #include "draw/draw_context.h"
30 #include "draw/draw_private.h"
31 #include "draw/draw_vbuf.h"
32 #include "draw/draw_vertex.h"
33 #include "draw/draw_pt.h"
34 #include "translate/translate.h"
35 #include "translate/translate_cache.h"
36 #include "util/u_format.h"
37
/**
 * Private state of the emit stage: converts pipeline vertices into the
 * render backend's vertex layout and hands them to the backend.
 */
struct pt_emit {
   /* Owning draw context; assigned in draw_pt_emit_create(). */
   struct draw_context *draw;

   /* Translate object currently in use; looked up from 'cache' by
    * draw_pt_emit_prepare().
    */
   struct translate *translate;

   /* Cache of translate objects; created in draw_pt_emit_create() and
    * destroyed in draw_pt_emit_destroy().
    */
   struct translate_cache *cache;

   /* Primitive recorded by draw_pt_emit_prepare() and re-sent to the
    * render backend by the emit functions.
    */
   unsigned prim;

   /* Vertex layout obtained from the render backend's get_vertex_info(). */
   const struct vertex_info *vinfo;
};
48
49 void draw_pt_emit_prepare( struct pt_emit *emit,
50 unsigned prim,
51 unsigned *max_vertices )
52 {
53 struct draw_context *draw = emit->draw;
54 const struct vertex_info *vinfo;
55 unsigned dst_offset;
56 struct translate_key hw_key;
57 unsigned i;
58 boolean ok;
59
60 /* XXX: need to flush to get prim_vbuf.c to release its allocation??
61 */
62 draw_do_flush( draw, DRAW_FLUSH_BACKEND );
63
64
65 /* XXX: may need to defensively reset this later on as clipping can
66 * clobber this state in the render backend.
67 */
68 emit->prim = prim;
69
70 ok = draw->render->set_primitive(draw->render, emit->prim);
71 if (!ok) {
72 assert(0);
73 return;
74 }
75
76 /* Must do this after set_primitive() above:
77 */
78 emit->vinfo = vinfo = draw->render->get_vertex_info(draw->render);
79
80
81 /* Translate from pipeline vertices to hw vertices.
82 */
83 dst_offset = 0;
84 for (i = 0; i < vinfo->num_attribs; i++) {
85 unsigned emit_sz = 0;
86 unsigned src_buffer = 0;
87 unsigned output_format;
88 unsigned src_offset = (vinfo->attrib[i].src_index * 4 * sizeof(float) );
89
90 output_format = draw_translate_vinfo_format(vinfo->attrib[i].emit);
91 emit_sz = draw_translate_vinfo_size(vinfo->attrib[i].emit);
92
93 /* doesn't handle EMIT_OMIT */
94 assert(emit_sz != 0);
95
96 if (vinfo->attrib[i].emit == EMIT_1F_PSIZE) {
97 src_buffer = 1;
98 src_offset = 0;
99 }
100
101 hw_key.element[i].type = TRANSLATE_ELEMENT_NORMAL;
102 hw_key.element[i].input_format = PIPE_FORMAT_R32G32B32A32_FLOAT;
103 hw_key.element[i].input_buffer = src_buffer;
104 hw_key.element[i].input_offset = src_offset;
105 hw_key.element[i].instance_divisor = 0;
106 hw_key.element[i].output_format = output_format;
107 hw_key.element[i].output_offset = dst_offset;
108
109 dst_offset += emit_sz;
110 }
111
112 hw_key.nr_elements = vinfo->num_attribs;
113 hw_key.output_stride = vinfo->size * 4;
114
115 if (!emit->translate ||
116 translate_key_compare(&emit->translate->key, &hw_key) != 0)
117 {
118 translate_key_sanitize(&hw_key);
119 emit->translate = translate_cache_find(emit->cache, &hw_key);
120 }
121
122 *max_vertices = (draw->render->max_vertex_buffer_bytes /
123 (vinfo->size * 4));
124
125 /* even number */
126 *max_vertices = *max_vertices & ~1;
127 }
128
129
130 void draw_pt_emit( struct pt_emit *emit,
131 const float (*vertex_data)[4],
132 unsigned vertex_count,
133 unsigned stride,
134 const ushort *elts,
135 unsigned count )
136 {
137 struct draw_context *draw = emit->draw;
138 struct translate *translate = emit->translate;
139 struct vbuf_render *render = draw->render;
140 void *hw_verts;
141
142 /* XXX: need to flush to get prim_vbuf.c to release its allocation??
143 */
144 draw_do_flush( draw, DRAW_FLUSH_BACKEND );
145
146 if (vertex_count == 0)
147 return;
148
149 if (vertex_count >= UNDEFINED_VERTEX_ID) {
150 assert(0);
151 return;
152 }
153
154 /* XXX: and work out some way to coordinate the render primitive
155 * between vbuf.c and here...
156 */
157 if (!draw->render->set_primitive(draw->render, emit->prim)) {
158 assert(0);
159 return;
160 }
161
162 render->allocate_vertices(render,
163 (ushort)translate->key.output_stride,
164 (ushort)vertex_count);
165
166 hw_verts = render->map_vertices( render );
167 if (!hw_verts) {
168 assert(0);
169 return;
170 }
171
172 translate->set_buffer(translate,
173 0,
174 vertex_data,
175 stride,
176 ~0);
177
178 translate->set_buffer(translate,
179 1,
180 &draw->rasterizer->point_size,
181 0,
182 ~0);
183
184 translate->run( translate,
185 0,
186 vertex_count,
187 draw->instance_id,
188 hw_verts );
189
190 render->unmap_vertices( render,
191 0,
192 vertex_count - 1 );
193
194 render->draw_elements(render,
195 elts,
196 count);
197
198 render->release_vertices(render);
199 }
200
201
202 void draw_pt_emit_linear(struct pt_emit *emit,
203 const float (*vertex_data)[4],
204 unsigned stride,
205 unsigned count)
206 {
207 struct draw_context *draw = emit->draw;
208 struct translate *translate = emit->translate;
209 struct vbuf_render *render = draw->render;
210 void *hw_verts;
211
212 #if 0
213 debug_printf("Linear emit\n");
214 #endif
215 /* XXX: need to flush to get prim_vbuf.c to release its allocation??
216 */
217 draw_do_flush( draw, DRAW_FLUSH_BACKEND );
218
219 if (count >= UNDEFINED_VERTEX_ID)
220 goto fail;
221
222 /* XXX: and work out some way to coordinate the render primitive
223 * between vbuf.c and here...
224 */
225 if (!draw->render->set_primitive(draw->render, emit->prim))
226 goto fail;
227
228 if (!render->allocate_vertices(render,
229 (ushort)translate->key.output_stride,
230 (ushort)count))
231 goto fail;
232
233 hw_verts = render->map_vertices( render );
234 if (!hw_verts)
235 goto fail;
236
237 translate->set_buffer(translate, 0,
238 vertex_data, stride, count - 1);
239
240 translate->set_buffer(translate, 1,
241 &draw->rasterizer->point_size,
242 0, ~0);
243
244 translate->run(translate,
245 0,
246 count,
247 draw->instance_id,
248 hw_verts);
249
250 if (0) {
251 unsigned i;
252 for (i = 0; i < count; i++) {
253 debug_printf("\n\n%s vertex %d:\n", __FUNCTION__, i);
254 draw_dump_emitted_vertex( emit->vinfo,
255 (const uint8_t *)hw_verts +
256 translate->key.output_stride * i );
257 }
258 }
259
260 render->unmap_vertices( render, 0, count - 1 );
261
262 render->draw_arrays(render, 0, count);
263
264 render->release_vertices(render);
265
266 return;
267
268 fail:
269 assert(0);
270 return;
271 }
272
273 struct pt_emit *draw_pt_emit_create( struct draw_context *draw )
274 {
275 struct pt_emit *emit = CALLOC_STRUCT(pt_emit);
276 if (!emit)
277 return NULL;
278
279 emit->draw = draw;
280 emit->cache = translate_cache_create();
281 if (!emit->cache) {
282 FREE(emit);
283 return NULL;
284 }
285
286 return emit;
287 }
288
289 void draw_pt_emit_destroy( struct pt_emit *emit )
290 {
291 if (emit->cache)
292 translate_cache_destroy(emit->cache);
293
294 FREE(emit);
295 }