svga: try blitting with copy region in more cases
[mesa.git] / src / gallium / drivers / svga / svga_swtnl_backend.c
1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
3 *
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 *
24 **********************************************************/
25
26 #include "draw/draw_vbuf.h"
27 #include "draw/draw_context.h"
28 #include "draw/draw_vertex.h"
29
30 #include "util/u_debug.h"
31 #include "util/u_inlines.h"
32 #include "util/u_math.h"
33 #include "util/u_memory.h"
34
35 #include "svga_context.h"
36 #include "svga_state.h"
37 #include "svga_swtnl.h"
38
39 #include "svga_types.h"
40 #include "svga_reg.h"
41 #include "svga3d_reg.h"
42 #include "svga_draw.h"
43 #include "svga_shader.h"
44 #include "svga_swtnl_private.h"
45
46
47 static const struct vertex_info *
48 svga_vbuf_render_get_vertex_info( struct vbuf_render *render )
49 {
50 struct svga_vbuf_render *svga_render = svga_vbuf_render(render);
51 struct svga_context *svga = svga_render->svga;
52
53 svga_swtnl_update_vdecl(svga);
54
55 return &svga_render->vertex_info;
56 }
57
58
59 static boolean
60 svga_vbuf_render_allocate_vertices( struct vbuf_render *render,
61 ushort vertex_size,
62 ushort nr_vertices )
63 {
64 struct svga_vbuf_render *svga_render = svga_vbuf_render(render);
65 struct svga_context *svga = svga_render->svga;
66 struct pipe_screen *screen = svga->pipe.screen;
67 size_t size = (size_t)nr_vertices * (size_t)vertex_size;
68 boolean new_vbuf = FALSE;
69 boolean new_ibuf = FALSE;
70
71 if (svga_render->vertex_size != vertex_size)
72 svga->swtnl.new_vdecl = TRUE;
73 svga_render->vertex_size = (size_t)vertex_size;
74
75 if (svga->swtnl.new_vbuf)
76 new_ibuf = new_vbuf = TRUE;
77 svga->swtnl.new_vbuf = FALSE;
78
79 if (svga_render->vbuf_size < svga_render->vbuf_offset + svga_render->vbuf_used + size)
80 new_vbuf = TRUE;
81
82 if (new_vbuf)
83 pipe_resource_reference(&svga_render->vbuf, NULL);
84 if (new_ibuf)
85 pipe_resource_reference(&svga_render->ibuf, NULL);
86
87 if (!svga_render->vbuf) {
88 svga_render->vbuf_size = MAX2(size, svga_render->vbuf_alloc_size);
89 svga_render->vbuf = pipe_buffer_create(screen,
90 PIPE_BIND_VERTEX_BUFFER,
91 PIPE_USAGE_STREAM,
92 svga_render->vbuf_size);
93 if(!svga_render->vbuf) {
94 svga_context_flush(svga, NULL);
95 assert(!svga_render->vbuf);
96 svga_render->vbuf = pipe_buffer_create(screen,
97 PIPE_BIND_VERTEX_BUFFER,
98 PIPE_USAGE_STREAM,
99 svga_render->vbuf_size);
100 /* The buffer allocation may fail if we run out of memory.
101 * The draw module's vbuf code should handle that without crashing.
102 */
103 }
104
105 svga->swtnl.new_vdecl = TRUE;
106 svga_render->vbuf_offset = 0;
107 } else {
108 svga_render->vbuf_offset += svga_render->vbuf_used;
109 }
110
111 svga_render->vbuf_used = 0;
112
113 if (svga->swtnl.new_vdecl)
114 svga_render->vdecl_offset = svga_render->vbuf_offset;
115
116 return TRUE;
117 }
118
119 static void *
120 svga_vbuf_render_map_vertices( struct vbuf_render *render )
121 {
122 struct svga_vbuf_render *svga_render = svga_vbuf_render(render);
123 struct svga_context *svga = svga_render->svga;
124
125 if (svga_render->vbuf) {
126 char *ptr = (char*)pipe_buffer_map(&svga->pipe,
127 svga_render->vbuf,
128 PIPE_TRANSFER_WRITE |
129 PIPE_TRANSFER_FLUSH_EXPLICIT |
130 PIPE_TRANSFER_DISCARD_RANGE |
131 PIPE_TRANSFER_UNSYNCHRONIZED,
132 &svga_render->vbuf_transfer);
133 if (ptr) {
134 svga_render->vbuf_ptr = ptr;
135 return ptr + svga_render->vbuf_offset;
136 }
137 else {
138 svga_render->vbuf_ptr = NULL;
139 svga_render->vbuf_transfer = NULL;
140 return NULL;
141 }
142 }
143 else {
144 /* we probably ran out of memory when allocating the vertex buffer */
145 return NULL;
146 }
147 }
148
149 static void
150 svga_vbuf_render_unmap_vertices( struct vbuf_render *render,
151 ushort min_index,
152 ushort max_index )
153 {
154 struct svga_vbuf_render *svga_render = svga_vbuf_render(render);
155 struct svga_context *svga = svga_render->svga;
156 unsigned offset, length;
157 size_t used = svga_render->vertex_size * ((size_t)max_index + 1);
158
159 offset = svga_render->vbuf_offset + svga_render->vertex_size * min_index;
160 length = svga_render->vertex_size * (max_index + 1 - min_index);
161
162 if (0) {
163 /* dump vertex data */
164 const float *f = (const float *) ((char *) svga_render->vbuf_ptr +
165 svga_render->vbuf_offset);
166 unsigned i;
167 debug_printf("swtnl vertex data:\n");
168 for (i = 0; i < length / 4; i += 4) {
169 debug_printf("%u: %f %f %f %f\n", i, f[i], f[i+1], f[i+2], f[i+3]);
170 }
171 }
172
173 pipe_buffer_flush_mapped_range(&svga->pipe,
174 svga_render->vbuf_transfer,
175 offset, length);
176 pipe_buffer_unmap(&svga->pipe, svga_render->vbuf_transfer);
177 svga_render->min_index = min_index;
178 svga_render->max_index = max_index;
179 svga_render->vbuf_used = MAX2(svga_render->vbuf_used, used);
180 }
181
182 static void
183 svga_vbuf_render_set_primitive( struct vbuf_render *render,
184 enum pipe_prim_type prim )
185 {
186 struct svga_vbuf_render *svga_render = svga_vbuf_render(render);
187 svga_render->prim = prim;
188 }
189
190 static void
191 svga_vbuf_submit_state( struct svga_vbuf_render *svga_render )
192 {
193 struct svga_context *svga = svga_render->svga;
194 SVGA3dVertexDecl vdecl[PIPE_MAX_ATTRIBS];
195 enum pipe_error ret;
196 unsigned i;
197 static const unsigned zero[PIPE_MAX_ATTRIBS] = {0};
198
199 /* if the vdecl or vbuf hasn't changed do nothing */
200 if (!svga->swtnl.new_vdecl)
201 return;
202
203 memcpy(vdecl, svga_render->vdecl, sizeof(vdecl));
204
205 /* flush the hw state */
206 ret = svga_hwtnl_flush(svga->hwtnl);
207 if (ret != PIPE_OK) {
208 svga_context_flush(svga, NULL);
209 ret = svga_hwtnl_flush(svga->hwtnl);
210 /* if we hit this path we might become synced with hw */
211 svga->swtnl.new_vbuf = TRUE;
212 assert(ret == PIPE_OK);
213 }
214
215 for (i = 0; i < svga_render->vdecl_count; i++) {
216 vdecl[i].array.offset += svga_render->vdecl_offset;
217 }
218
219 svga_hwtnl_vertex_decls(svga->hwtnl,
220 svga_render->vdecl_count,
221 vdecl,
222 zero,
223 svga_render->layout_id);
224
225 /* Specify the vertex buffer (there's only ever one) */
226 {
227 struct pipe_vertex_buffer vb;
228 vb.buffer = svga_render->vbuf;
229 vb.buffer_offset = svga_render->vdecl_offset;
230 vb.stride = vdecl[0].array.stride;
231 vb.user_buffer = NULL;
232 svga_hwtnl_vertex_buffers(svga->hwtnl, 1, &vb);
233 }
234
235 /* We have already taken care of flatshading, so let the hwtnl
236 * module use whatever is most convenient:
237 */
238 if (svga->state.sw.need_pipeline) {
239 svga_hwtnl_set_flatshade(svga->hwtnl, FALSE, FALSE);
240 svga_hwtnl_set_fillmode(svga->hwtnl, PIPE_POLYGON_MODE_FILL);
241 }
242 else {
243 svga_hwtnl_set_flatshade( svga->hwtnl,
244 svga->curr.rast->templ.flatshade ||
245 svga->state.hw_draw.fs->uses_flat_interp,
246 svga->curr.rast->templ.flatshade_first );
247
248 svga_hwtnl_set_fillmode(svga->hwtnl, svga->curr.rast->hw_fillmode);
249 }
250
251 svga->swtnl.new_vdecl = FALSE;
252 }
253
254 static void
255 svga_vbuf_render_draw_arrays( struct vbuf_render *render,
256 unsigned start, uint nr )
257 {
258 struct svga_vbuf_render *svga_render = svga_vbuf_render(render);
259 struct svga_context *svga = svga_render->svga;
260 unsigned bias = (svga_render->vbuf_offset - svga_render->vdecl_offset) / svga_render->vertex_size;
261 enum pipe_error ret = PIPE_OK;
262 /* instancing will already have been resolved at this point by 'draw' */
263 const unsigned start_instance = 0;
264 const unsigned instance_count = 1;
265
266 /* off to hardware */
267 svga_vbuf_submit_state(svga_render);
268
269 /* Need to call update_state() again as the draw module may have
270 * altered some of our state behind our backs. Testcase:
271 * redbook/polys.c
272 */
273 svga_update_state_retry( svga, SVGA_STATE_HW_DRAW );
274
275 ret = svga_hwtnl_draw_arrays(svga->hwtnl, svga_render->prim, start + bias, nr,
276 start_instance, instance_count);
277 if (ret != PIPE_OK) {
278 svga_context_flush(svga, NULL);
279 ret = svga_hwtnl_draw_arrays(svga->hwtnl, svga_render->prim,
280 start + bias, nr,
281 start_instance, instance_count);
282 svga->swtnl.new_vbuf = TRUE;
283 assert(ret == PIPE_OK);
284 }
285 }
286
287
288 static void
289 svga_vbuf_render_draw_elements( struct vbuf_render *render,
290 const ushort *indices,
291 uint nr_indices)
292 {
293 struct svga_vbuf_render *svga_render = svga_vbuf_render(render);
294 struct svga_context *svga = svga_render->svga;
295 struct pipe_screen *screen = svga->pipe.screen;
296 int bias = (svga_render->vbuf_offset - svga_render->vdecl_offset) / svga_render->vertex_size;
297 boolean ret;
298 size_t size = 2 * nr_indices;
299 /* instancing will already have been resolved at this point by 'draw' */
300 const unsigned start_instance = 0;
301 const unsigned instance_count = 1;
302
303 assert(( svga_render->vbuf_offset - svga_render->vdecl_offset) % svga_render->vertex_size == 0);
304
305 if (svga_render->ibuf_size < svga_render->ibuf_offset + size)
306 pipe_resource_reference(&svga_render->ibuf, NULL);
307
308 if (!svga_render->ibuf) {
309 svga_render->ibuf_size = MAX2(size, svga_render->ibuf_alloc_size);
310 svga_render->ibuf = pipe_buffer_create(screen,
311 PIPE_BIND_INDEX_BUFFER,
312 PIPE_USAGE_STREAM,
313 svga_render->ibuf_size);
314 svga_render->ibuf_offset = 0;
315 }
316
317 pipe_buffer_write_nooverlap(&svga->pipe, svga_render->ibuf,
318 svga_render->ibuf_offset, 2 * nr_indices, indices);
319
320 /* off to hardware */
321 svga_vbuf_submit_state(svga_render);
322
323 /* Need to call update_state() again as the draw module may have
324 * altered some of our state behind our backs. Testcase:
325 * redbook/polys.c
326 */
327 svga_update_state_retry( svga, SVGA_STATE_HW_DRAW );
328
329 ret = svga_hwtnl_draw_range_elements(svga->hwtnl,
330 svga_render->ibuf,
331 2,
332 bias,
333 svga_render->min_index,
334 svga_render->max_index,
335 svga_render->prim,
336 svga_render->ibuf_offset / 2, nr_indices,
337 start_instance, instance_count);
338 if(ret != PIPE_OK) {
339 svga_context_flush(svga, NULL);
340 ret = svga_hwtnl_draw_range_elements(svga->hwtnl,
341 svga_render->ibuf,
342 2,
343 bias,
344 svga_render->min_index,
345 svga_render->max_index,
346 svga_render->prim,
347 svga_render->ibuf_offset / 2,
348 nr_indices,
349 start_instance, instance_count);
350 svga->swtnl.new_vbuf = TRUE;
351 assert(ret == PIPE_OK);
352 }
353
354 svga_render->ibuf_offset += size;
355 }
356
357
/**
 * vbuf_render::release_vertices hook.
 *
 * Intentionally a no-op: this function releases nothing.  The vertex
 * buffer reference is dropped in the allocate_vertices and destroy hooks.
 */
static void
svga_vbuf_render_release_vertices(struct vbuf_render *render)
{
   (void) render;
}
363
364
365 static void
366 svga_vbuf_render_destroy( struct vbuf_render *render )
367 {
368 struct svga_vbuf_render *svga_render = svga_vbuf_render(render);
369
370 pipe_resource_reference(&svga_render->vbuf, NULL);
371 pipe_resource_reference(&svga_render->ibuf, NULL);
372 FREE(svga_render);
373 }
374
375
376 /**
377 * Create a new primitive render.
378 */
379 struct vbuf_render *
380 svga_vbuf_render_create( struct svga_context *svga )
381 {
382 struct svga_vbuf_render *svga_render = CALLOC_STRUCT(svga_vbuf_render);
383
384 svga_render->svga = svga;
385 svga_render->ibuf_size = 0;
386 svga_render->vbuf_size = 0;
387 svga_render->ibuf_alloc_size = 4*1024;
388 svga_render->vbuf_alloc_size = 64*1024;
389 svga_render->layout_id = SVGA3D_INVALID_ID;
390 svga_render->base.max_vertex_buffer_bytes = 64*1024/10;
391 svga_render->base.max_indices = 65536;
392 svga_render->base.get_vertex_info = svga_vbuf_render_get_vertex_info;
393 svga_render->base.allocate_vertices = svga_vbuf_render_allocate_vertices;
394 svga_render->base.map_vertices = svga_vbuf_render_map_vertices;
395 svga_render->base.unmap_vertices = svga_vbuf_render_unmap_vertices;
396 svga_render->base.set_primitive = svga_vbuf_render_set_primitive;
397 svga_render->base.draw_elements = svga_vbuf_render_draw_elements;
398 svga_render->base.draw_arrays = svga_vbuf_render_draw_arrays;
399 svga_render->base.release_vertices = svga_vbuf_render_release_vertices;
400 svga_render->base.destroy = svga_vbuf_render_destroy;
401
402 return &svga_render->base;
403 }