draw/translate: fix instancing
[mesa.git] / src / gallium / auxiliary / translate / translate_generic.c
1 /**************************************************************************
2 *
3 * Copyright 2007 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /*
29 * Authors:
30 * Keith Whitwell <keith@tungstengraphics.com>
31 */
32
33 #include "util/u_memory.h"
34 #include "util/u_format.h"
35 #include "util/u_half.h"
36 #include "util/u_math.h"
37 #include "pipe/p_state.h"
38 #include "translate.h"
39
40
/* Debug switch; nothing in the code shown here tests it. */
#define DRAW_DBG 0

/**
 * Unpacks one source attribute.
 *
 * dst receives the unpacked components (this file always hands it a
 * four-element scratch array), src points at the packed source element.
 * Every call in this file passes 0 for both i and j.
 */
typedef void (*fetch_func)(void *dst,
                           const uint8_t *src,
                           unsigned i, unsigned j);

/**
 * Converts the unpacked components at attrib into the output format and
 * stores the result at ptr (a location inside the output vertex).
 */
typedef void (*emit_func)(const void *attrib, void *ptr);
47
48
49
/**
 * Generic (non-JIT) translate object.
 *
 * The base struct translate must stay the first member: translate_generic()
 * converts between the two with a plain pointer cast.
 */
struct translate_generic {
   struct translate translate;

   /* Per-attribute state, one entry per element of the translate key. */
   struct {
      /* Regular vertex data or the instance id. */
      enum translate_element_type type;

      /* Unpacks the source element; only used on the conversion path. */
      fetch_func fetch;
      /* Index of the vertex buffer this attribute reads from. */
      unsigned buffer;
      /* Byte offset of the attribute inside one source element. */
      unsigned input_offset;
      /* Zero for per-vertex data, otherwise instances per source element. */
      unsigned instance_divisor;

      /* Packs the converted value; NULL when copy_size >= 0. */
      emit_func emit;
      /* Byte offset of the attribute inside one output vertex. */
      unsigned output_offset;

      /* Filled in by generic_set_buffer(): buffer base + input_offset. */
      const uint8_t *input_ptr;
      unsigned input_stride;
      /* Largest index allowed for non-instanced fetches. */
      unsigned max_index;

      /* Selects between the raw-copy path and the fetch/emit path:
       *
       *  -1: a normal element whose output_format differs from its
       *      input_format; u_format fetch plus an emit function perform
       *      a full conversion.
       *
       * >=0: number of bytes to memcpy; used when output_format equals
       *      input_format, and for 32-bit instance ids.
       */
      int copy_size;

   } attrib[PIPE_MAX_ATTRIBS];

   /* Number of valid entries in attrib[]. */
   unsigned nr_attrib;
};
80
81
/**
 * Downcast a generic translate handle to the translate_generic that
 * contains it (the base struct is the first member).
 */
static struct translate_generic *translate_generic( struct translate *translate )
{
   struct translate_generic *tg = (struct translate_generic *)translate;

   return tg;
}
86
/**
 * Generate an emit_<NAME>() function with the emit_func signature.
 *
 * The generated function reads SZ components of type SRCTYPE from
 * 'attrib' (the unpacked attribute), converts each one with the
 * TO() macro/function and stores the results as consecutive DSTTYPE
 * values at 'ptr'.
 *
 * Similar conversion code is probably needed/duplicated elsewhere, e.g.
 * format conversion, texture sampling etc.
 */
#define ATTRIB( NAME, SZ, SRCTYPE, DSTTYPE, TO )        \
static void                                             \
emit_##NAME(const void *attrib, void *ptr)              \
{                                                       \
   const SRCTYPE *in = (const SRCTYPE *)attrib;         \
   DSTTYPE *out = (DSTTYPE *)ptr;                       \
   unsigned i;                                          \
                                                        \
   for (i = 0; i < (SZ); i++) {                         \
      out[i] = TO(in[i]);                               \
   }                                                    \
}
106
107
/*
 * Per-component conversions used by the ATTRIB() emitters.
 *
 * Every argument is parenthesized so that an expression can be passed
 * safely.
 *
 * The 32-bit normalized scale factors are double constants on purpose:
 * 4294967295 and 2147483647 are not representable in single precision
 * (they round up to 2^32 and 2^31), so with float constants an input of
 * 1.0 produced a value outside the destination range, and converting
 * that to an integer is undefined.
 *
 * The 8-bit signed conversions go through 'signed char' because plain
 * 'char' is unsigned on some ABIs, where converting a negative float to
 * it is undefined.
 *
 * No clamping is done here; inputs are expected to be in range already.
 */
#define TO_64_FLOAT(x)   ((double) (x))
#define TO_32_FLOAT(x)   (x)
#define TO_16_FLOAT(x)   util_float_to_half(x)

#define TO_8_USCALED(x)  ((unsigned char) (x))
#define TO_16_USCALED(x) ((unsigned short) (x))
#define TO_32_USCALED(x) ((unsigned int) (x))

#define TO_8_SSCALED(x)  ((signed char) (x))
#define TO_16_SSCALED(x) ((short) (x))
#define TO_32_SSCALED(x) ((int) (x))

#define TO_8_UNORM(x)    ((unsigned char) ((x) * 255.0f))
#define TO_16_UNORM(x)   ((unsigned short) ((x) * 65535.0f))
#define TO_32_UNORM(x)   ((unsigned int) ((x) * 4294967295.0))

#define TO_8_SNORM(x)    ((signed char) ((x) * 127.0f))
#define TO_16_SNORM(x)   ((short) ((x) * 32767.0f))
#define TO_32_SNORM(x)   ((int) ((x) * 2147483647.0))

#define TO_32_FIXED(x)   ((int) ((x) * 65536.0f))

#define TO_INT(x)        (x)
131
132
/*
 * Emit functions generated with ATTRIB().  Each line defines
 * emit_<first argument>(); the remaining arguments are the component
 * count, the type read from the unpacked attribute, the type written to
 * the output vertex and the per-component conversion.
 */

/* Float source -> 64-bit float output. */
ATTRIB( R64G64B64A64_FLOAT, 4, float, double, TO_64_FLOAT )
ATTRIB( R64G64B64_FLOAT, 3, float, double, TO_64_FLOAT )
ATTRIB( R64G64_FLOAT, 2, float, double, TO_64_FLOAT )
ATTRIB( R64_FLOAT, 1, float, double, TO_64_FLOAT )

/* Float source -> 32-bit float output (plain copy of each component). */
ATTRIB( R32G32B32A32_FLOAT, 4, float, float, TO_32_FLOAT )
ATTRIB( R32G32B32_FLOAT, 3, float, float, TO_32_FLOAT )
ATTRIB( R32G32_FLOAT, 2, float, float, TO_32_FLOAT )
ATTRIB( R32_FLOAT, 1, float, float, TO_32_FLOAT )

/* Float source -> half float output, stored as 16-bit words. */
ATTRIB( R16G16B16A16_FLOAT, 4, float, ushort, TO_16_FLOAT )
ATTRIB( R16G16B16_FLOAT, 3, float, ushort, TO_16_FLOAT )
ATTRIB( R16G16_FLOAT, 2, float, ushort, TO_16_FLOAT )
ATTRIB( R16_FLOAT, 1, float, ushort, TO_16_FLOAT )

/* Float source -> 32-bit integer outputs (scaled and normalized). */
ATTRIB( R32G32B32A32_USCALED, 4, float, unsigned, TO_32_USCALED )
ATTRIB( R32G32B32_USCALED, 3, float, unsigned, TO_32_USCALED )
ATTRIB( R32G32_USCALED, 2, float, unsigned, TO_32_USCALED )
ATTRIB( R32_USCALED, 1, float, unsigned, TO_32_USCALED )

ATTRIB( R32G32B32A32_SSCALED, 4, float, int, TO_32_SSCALED )
ATTRIB( R32G32B32_SSCALED, 3, float, int, TO_32_SSCALED )
ATTRIB( R32G32_SSCALED, 2, float, int, TO_32_SSCALED )
ATTRIB( R32_SSCALED, 1, float, int, TO_32_SSCALED )

ATTRIB( R32G32B32A32_UNORM, 4, float, unsigned, TO_32_UNORM )
ATTRIB( R32G32B32_UNORM, 3, float, unsigned, TO_32_UNORM )
ATTRIB( R32G32_UNORM, 2, float, unsigned, TO_32_UNORM )
ATTRIB( R32_UNORM, 1, float, unsigned, TO_32_UNORM )

ATTRIB( R32G32B32A32_SNORM, 4, float, int, TO_32_SNORM )
ATTRIB( R32G32B32_SNORM, 3, float, int, TO_32_SNORM )
ATTRIB( R32G32_SNORM, 2, float, int, TO_32_SNORM )
ATTRIB( R32_SNORM, 1, float, int, TO_32_SNORM )

/* Float source -> 16-bit integer outputs (scaled and normalized). */
ATTRIB( R16G16B16A16_USCALED, 4, float, ushort, TO_16_USCALED )
ATTRIB( R16G16B16_USCALED, 3, float, ushort, TO_16_USCALED )
ATTRIB( R16G16_USCALED, 2, float, ushort, TO_16_USCALED )
ATTRIB( R16_USCALED, 1, float, ushort, TO_16_USCALED )

ATTRIB( R16G16B16A16_SSCALED, 4, float, short, TO_16_SSCALED )
ATTRIB( R16G16B16_SSCALED, 3, float, short, TO_16_SSCALED )
ATTRIB( R16G16_SSCALED, 2, float, short, TO_16_SSCALED )
ATTRIB( R16_SSCALED, 1, float, short, TO_16_SSCALED )

ATTRIB( R16G16B16A16_UNORM, 4, float, ushort, TO_16_UNORM )
ATTRIB( R16G16B16_UNORM, 3, float, ushort, TO_16_UNORM )
ATTRIB( R16G16_UNORM, 2, float, ushort, TO_16_UNORM )
ATTRIB( R16_UNORM, 1, float, ushort, TO_16_UNORM )

ATTRIB( R16G16B16A16_SNORM, 4, float, short, TO_16_SNORM )
ATTRIB( R16G16B16_SNORM, 3, float, short, TO_16_SNORM )
ATTRIB( R16G16_SNORM, 2, float, short, TO_16_SNORM )
ATTRIB( R16_SNORM, 1, float, short, TO_16_SNORM )

/* Float source -> 8-bit integer outputs (scaled and normalized). */
ATTRIB( R8G8B8A8_USCALED, 4, float, ubyte, TO_8_USCALED )
ATTRIB( R8G8B8_USCALED, 3, float, ubyte, TO_8_USCALED )
ATTRIB( R8G8_USCALED, 2, float, ubyte, TO_8_USCALED )
ATTRIB( R8_USCALED, 1, float, ubyte, TO_8_USCALED )

ATTRIB( R8G8B8A8_SSCALED, 4, float, char, TO_8_SSCALED )
ATTRIB( R8G8B8_SSCALED, 3, float, char, TO_8_SSCALED )
ATTRIB( R8G8_SSCALED, 2, float, char, TO_8_SSCALED )
ATTRIB( R8_SSCALED, 1, float, char, TO_8_SSCALED )

ATTRIB( R8G8B8A8_UNORM, 4, float, ubyte, TO_8_UNORM )
ATTRIB( R8G8B8_UNORM, 3, float, ubyte, TO_8_UNORM )
ATTRIB( R8G8_UNORM, 2, float, ubyte, TO_8_UNORM )
ATTRIB( R8_UNORM, 1, float, ubyte, TO_8_UNORM )

ATTRIB( R8G8B8A8_SNORM, 4, float, char, TO_8_SNORM )
ATTRIB( R8G8B8_SNORM, 3, float, char, TO_8_SNORM )
ATTRIB( R8G8_SNORM, 2, float, char, TO_8_SNORM )
ATTRIB( R8_SNORM, 1, float, char, TO_8_SNORM )

/* Pure integer outputs: the source components are 32-bit unsigned
 * integers and are stored by plain assignment, so the 16- and 8-bit
 * variants keep only the low bits.
 */
ATTRIB( R32G32B32A32_UINT, 4, uint32_t, unsigned, TO_INT )
ATTRIB( R32G32B32_UINT, 3, uint32_t, unsigned, TO_INT )
ATTRIB( R32G32_UINT, 2, uint32_t, unsigned, TO_INT )
ATTRIB( R32_UINT, 1, uint32_t, unsigned, TO_INT )

ATTRIB( R16G16B16A16_UINT, 4, uint32_t, ushort, TO_INT )
ATTRIB( R16G16B16_UINT, 3, uint32_t, ushort, TO_INT )
ATTRIB( R16G16_UINT, 2, uint32_t, ushort, TO_INT )
ATTRIB( R16_UINT, 1, uint32_t, ushort, TO_INT )

ATTRIB( R8G8B8A8_UINT, 4, uint32_t, ubyte, TO_INT )
ATTRIB( R8G8B8_UINT, 3, uint32_t, ubyte, TO_INT )
ATTRIB( R8G8_UINT, 2, uint32_t, ubyte, TO_INT )
ATTRIB( R8_UINT, 1, uint32_t, ubyte, TO_INT )

/* Same as above for 32-bit signed integer sources. */
ATTRIB( R32G32B32A32_SINT, 4, int32_t, int, TO_INT )
ATTRIB( R32G32B32_SINT, 3, int32_t, int, TO_INT )
ATTRIB( R32G32_SINT, 2, int32_t, int, TO_INT )
ATTRIB( R32_SINT, 1, int32_t, int, TO_INT )

ATTRIB( R16G16B16A16_SINT, 4, int32_t, short, TO_INT )
ATTRIB( R16G16B16_SINT, 3, int32_t, short, TO_INT )
ATTRIB( R16G16_SINT, 2, int32_t, short, TO_INT )
ATTRIB( R16_SINT, 1, int32_t, short, TO_INT )

ATTRIB( R8G8B8A8_SINT, 4, int32_t, char, TO_INT )
ATTRIB( R8G8B8_SINT, 3, int32_t, char, TO_INT )
ATTRIB( R8G8_SINT, 2, int32_t, char, TO_INT )
ATTRIB( R8_SINT, 1, int32_t, char, TO_INT )
237
238 static void
239 emit_A8R8G8B8_UNORM( const void *attrib, void *ptr)
240 {
241 float *in = (float *)attrib;
242 ubyte *out = (ubyte *)ptr;
243 out[0] = TO_8_UNORM(in[3]);
244 out[1] = TO_8_UNORM(in[0]);
245 out[2] = TO_8_UNORM(in[1]);
246 out[3] = TO_8_UNORM(in[2]);
247 }
248
249 static void
250 emit_B8G8R8A8_UNORM( const void *attrib, void *ptr)
251 {
252 float *in = (float *)attrib;
253 ubyte *out = (ubyte *)ptr;
254 out[2] = TO_8_UNORM(in[0]);
255 out[1] = TO_8_UNORM(in[1]);
256 out[0] = TO_8_UNORM(in[2]);
257 out[3] = TO_8_UNORM(in[3]);
258 }
259
/**
 * Pack an unpacked float[4] attribute into one B10G10R10A2_UNORM dword.
 *
 * \param attrib  source components (index 0..3 = R, G, B, A); read only
 * \param ptr     destination; receives the packed 32-bit value
 *
 * Each component is clamped to [0, 1] and scaled to its field width.
 * Blue lands in bits 0-9, green in 10-19, red in 20-29, alpha in 30-31.
 *
 * The previous version had the two arguments swapped: it read the floats
 * from the destination and stored the result over the (const) source.
 */
static void
emit_B10G10R10A2_UNORM( const void *attrib, void *ptr )
{
   /* Source component stored in each field, lowest bits first. */
   static const unsigned chan[4] = { 2, 1, 0, 3 };
   static const float scale[4] = { 1023.0f, 1023.0f, 1023.0f, 3.0f };
   const float *src = (const float *)attrib;
   uint32_t value = 0;
   unsigned i;

   for (i = 0; i < 4; i++) {
      float f = src[chan[i]];

      f = f < 0.0f ? 0.0f : (f > 1.0f ? 1.0f : f);
      value |= (uint32_t)(f * scale[i]) << (10 * i);
   }
#ifdef PIPE_ARCH_BIG_ENDIAN
   value = util_bswap32(value);
#endif
   *(uint32_t *)ptr = value;
}
274
/**
 * Pack an unpacked float[4] attribute into one B10G10R10A2_USCALED dword.
 *
 * \param attrib  source components (index 0..3 = R, G, B, A); read only
 * \param ptr     destination; receives the packed 32-bit value
 *
 * The colour components are clamped to [0, 1023] and alpha to [0, 3],
 * then truncated to integers.  Blue lands in bits 0-9, green in 10-19,
 * red in 20-29, alpha in 30-31.
 *
 * The previous version had the two arguments swapped: it read the floats
 * from the destination and stored the result over the (const) source.
 */
static void
emit_B10G10R10A2_USCALED( const void *attrib, void *ptr )
{
   /* Source component stored in each field, lowest bits first. */
   static const unsigned chan[4] = { 2, 1, 0, 3 };
   static const float limit[4] = { 1023.0f, 1023.0f, 1023.0f, 3.0f };
   const float *src = (const float *)attrib;
   uint32_t value = 0;
   unsigned i;

   for (i = 0; i < 4; i++) {
      float f = src[chan[i]];

      f = f < 0.0f ? 0.0f : (f > limit[i] ? limit[i] : f);
      value |= (uint32_t)f << (10 * i);
   }
#ifdef PIPE_ARCH_BIG_ENDIAN
   value = util_bswap32(value);
#endif
   *(uint32_t *)ptr = value;
}
289
/**
 * Pack an unpacked float[4] attribute into one B10G10R10A2_SNORM dword.
 *
 * \param attrib  source components (index 0..3 = R, G, B, A); read only
 * \param ptr     destination; receives the packed 32-bit value
 *
 * Each component is clamped to [-1, 1]; colours are scaled by 511 and
 * alpha by 1, and the results are stored as two's complement fields.
 * Blue lands in bits 0-9, green in 10-19, red in 20-29, alpha in 30-31.
 *
 * Two defects of the previous version are fixed: the arguments were
 * swapped (floats read from the destination, result stored over the
 * const source), and negative floats were converted straight to
 * uint32_t, which is undefined.  The value now goes through int32_t.
 */
static void
emit_B10G10R10A2_SNORM( const void *attrib, void *ptr )
{
   /* Source component stored in each field, lowest bits first. */
   static const unsigned chan[4] = { 2, 1, 0, 3 };
   static const float scale[4] = { 511.0f, 511.0f, 511.0f, 1.0f };
   static const uint32_t mask[4] = { 0x3ff, 0x3ff, 0x3ff, 0x3 };
   const float *src = (const float *)attrib;
   uint32_t value = 0;
   unsigned i;

   for (i = 0; i < 4; i++) {
      float f = src[chan[i]];

      f = f < -1.0f ? -1.0f : (f > 1.0f ? 1.0f : f);
      value |= ((uint32_t)(int32_t)(f * scale[i]) & mask[i]) << (10 * i);
   }
#ifdef PIPE_ARCH_BIG_ENDIAN
   value = util_bswap32(value);
#endif
   *(uint32_t *)ptr = value;
}
304
/**
 * Pack an unpacked float[4] attribute into one B10G10R10A2_SSCALED dword.
 *
 * \param attrib  source components (index 0..3 = R, G, B, A); read only
 * \param ptr     destination; receives the packed 32-bit value
 *
 * The colour components are clamped to [-512, 511] and alpha to [-2, 1],
 * truncated to integers and stored as two's complement fields.  Blue
 * lands in bits 0-9, green in 10-19, red in 20-29, alpha in 30-31.
 *
 * Two defects of the previous version are fixed: the arguments were
 * swapped (floats read from the destination, result stored over the
 * const source), and negative floats were converted straight to
 * uint32_t, which is undefined.  The value now goes through int32_t.
 */
static void
emit_B10G10R10A2_SSCALED( const void *attrib, void *ptr )
{
   /* Source component stored in each field, lowest bits first. */
   static const unsigned chan[4] = { 2, 1, 0, 3 };
   static const float lo[4] = { -512.0f, -512.0f, -512.0f, -2.0f };
   static const float hi[4] = { 511.0f, 511.0f, 511.0f, 1.0f };
   static const uint32_t mask[4] = { 0x3ff, 0x3ff, 0x3ff, 0x3 };
   const float *src = (const float *)attrib;
   uint32_t value = 0;
   unsigned i;

   for (i = 0; i < 4; i++) {
      float f = src[chan[i]];

      f = f < lo[i] ? lo[i] : (f > hi[i] ? hi[i] : f);
      value |= ((uint32_t)(int32_t)f & mask[i]) << (10 * i);
   }
#ifdef PIPE_ARCH_BIG_ENDIAN
   value = util_bswap32(value);
#endif
   *(uint32_t *)ptr = value;
}
319
/**
 * Pack an unpacked float[4] attribute into one R10G10B10A2_UNORM dword.
 *
 * \param attrib  source components (index 0..3 = R, G, B, A); read only
 * \param ptr     destination; receives the packed 32-bit value
 *
 * Each component is clamped to [0, 1] and scaled to its field width.
 * Red lands in bits 0-9, green in 10-19, blue in 20-29, alpha in 30-31.
 *
 * The previous version had the two arguments swapped: it read the floats
 * from the destination and stored the result over the (const) source.
 */
static void
emit_R10G10B10A2_UNORM( const void *attrib, void *ptr )
{
   static const float scale[4] = { 1023.0f, 1023.0f, 1023.0f, 3.0f };
   const float *src = (const float *)attrib;
   uint32_t value = 0;
   unsigned i;

   for (i = 0; i < 4; i++) {
      float f = src[i];

      f = f < 0.0f ? 0.0f : (f > 1.0f ? 1.0f : f);
      value |= (uint32_t)(f * scale[i]) << (10 * i);
   }
#ifdef PIPE_ARCH_BIG_ENDIAN
   value = util_bswap32(value);
#endif
   *(uint32_t *)ptr = value;
}
334
/**
 * Pack an unpacked float[4] attribute into one R10G10B10A2_USCALED dword.
 *
 * \param attrib  source components (index 0..3 = R, G, B, A); read only
 * \param ptr     destination; receives the packed 32-bit value
 *
 * The colour components are clamped to [0, 1023] and alpha to [0, 3],
 * then truncated to integers.  Red lands in bits 0-9, green in 10-19,
 * blue in 20-29, alpha in 30-31.
 *
 * The previous version had the two arguments swapped: it read the floats
 * from the destination and stored the result over the (const) source.
 */
static void
emit_R10G10B10A2_USCALED( const void *attrib, void *ptr )
{
   static const float limit[4] = { 1023.0f, 1023.0f, 1023.0f, 3.0f };
   const float *src = (const float *)attrib;
   uint32_t value = 0;
   unsigned i;

   for (i = 0; i < 4; i++) {
      float f = src[i];

      f = f < 0.0f ? 0.0f : (f > limit[i] ? limit[i] : f);
      value |= (uint32_t)f << (10 * i);
   }
#ifdef PIPE_ARCH_BIG_ENDIAN
   value = util_bswap32(value);
#endif
   *(uint32_t *)ptr = value;
}
349
/**
 * Pack an unpacked float[4] attribute into one R10G10B10A2_SNORM dword.
 *
 * \param attrib  source components (index 0..3 = R, G, B, A); read only
 * \param ptr     destination; receives the packed 32-bit value
 *
 * Each component is clamped to [-1, 1]; colours are scaled by 511 and
 * alpha by 1, and the results are stored as two's complement fields.
 * Red lands in bits 0-9, green in 10-19, blue in 20-29, alpha in 30-31.
 *
 * Two defects of the previous version are fixed: the arguments were
 * swapped (floats read from the destination, result stored over the
 * const source), and negative floats were converted straight to
 * uint32_t, which is undefined.  The value now goes through int32_t.
 */
static void
emit_R10G10B10A2_SNORM( const void *attrib, void *ptr )
{
   static const float scale[4] = { 511.0f, 511.0f, 511.0f, 1.0f };
   static const uint32_t mask[4] = { 0x3ff, 0x3ff, 0x3ff, 0x3 };
   const float *src = (const float *)attrib;
   uint32_t value = 0;
   unsigned i;

   for (i = 0; i < 4; i++) {
      float f = src[i];

      f = f < -1.0f ? -1.0f : (f > 1.0f ? 1.0f : f);
      value |= ((uint32_t)(int32_t)(f * scale[i]) & mask[i]) << (10 * i);
   }
#ifdef PIPE_ARCH_BIG_ENDIAN
   value = util_bswap32(value);
#endif
   *(uint32_t *)ptr = value;
}
364
/**
 * Pack an unpacked float[4] attribute into one R10G10B10A2_SSCALED dword.
 *
 * \param attrib  source components (index 0..3 = R, G, B, A); read only
 * \param ptr     destination; receives the packed 32-bit value
 *
 * The colour components are clamped to [-512, 511] and alpha to [-2, 1],
 * truncated to integers and stored as two's complement fields.  Red
 * lands in bits 0-9, green in 10-19, blue in 20-29, alpha in 30-31.
 *
 * Two defects of the previous version are fixed: the arguments were
 * swapped (floats read from the destination, result stored over the
 * const source), and negative floats were converted straight to
 * uint32_t, which is undefined.  The value now goes through int32_t.
 */
static void
emit_R10G10B10A2_SSCALED( const void *attrib, void *ptr)
{
   static const float lo[4] = { -512.0f, -512.0f, -512.0f, -2.0f };
   static const float hi[4] = { 511.0f, 511.0f, 511.0f, 1.0f };
   static const uint32_t mask[4] = { 0x3ff, 0x3ff, 0x3ff, 0x3 };
   const float *src = (const float *)attrib;
   uint32_t value = 0;
   unsigned i;

   for (i = 0; i < 4; i++) {
      float f = src[i];

      f = f < lo[i] ? lo[i] : (f > hi[i] ? hi[i] : f);
      value |= ((uint32_t)(int32_t)f & mask[i]) << (10 * i);
   }
#ifdef PIPE_ARCH_BIG_ENDIAN
   value = util_bswap32(value);
#endif
   *(uint32_t *)ptr = value;
}
379
/**
 * Fallback emitter returned for unknown output formats: leaves both the
 * source and the destination untouched.
 */
static void
emit_NULL( const void *attrib, void *ptr )
{
   /* Intentionally empty; ignoring the request is the only sane choice. */
   (void)attrib;
   (void)ptr;
}
385
386 static emit_func get_emit_func( enum pipe_format format )
387 {
388 switch (format) {
389 case PIPE_FORMAT_R64_FLOAT:
390 return &emit_R64_FLOAT;
391 case PIPE_FORMAT_R64G64_FLOAT:
392 return &emit_R64G64_FLOAT;
393 case PIPE_FORMAT_R64G64B64_FLOAT:
394 return &emit_R64G64B64_FLOAT;
395 case PIPE_FORMAT_R64G64B64A64_FLOAT:
396 return &emit_R64G64B64A64_FLOAT;
397
398 case PIPE_FORMAT_R32_FLOAT:
399 return &emit_R32_FLOAT;
400 case PIPE_FORMAT_R32G32_FLOAT:
401 return &emit_R32G32_FLOAT;
402 case PIPE_FORMAT_R32G32B32_FLOAT:
403 return &emit_R32G32B32_FLOAT;
404 case PIPE_FORMAT_R32G32B32A32_FLOAT:
405 return &emit_R32G32B32A32_FLOAT;
406
407 case PIPE_FORMAT_R16_FLOAT:
408 return &emit_R16_FLOAT;
409 case PIPE_FORMAT_R16G16_FLOAT:
410 return &emit_R16G16_FLOAT;
411 case PIPE_FORMAT_R16G16B16_FLOAT:
412 return &emit_R16G16B16_FLOAT;
413 case PIPE_FORMAT_R16G16B16A16_FLOAT:
414 return &emit_R16G16B16A16_FLOAT;
415
416 case PIPE_FORMAT_R32_UNORM:
417 return &emit_R32_UNORM;
418 case PIPE_FORMAT_R32G32_UNORM:
419 return &emit_R32G32_UNORM;
420 case PIPE_FORMAT_R32G32B32_UNORM:
421 return &emit_R32G32B32_UNORM;
422 case PIPE_FORMAT_R32G32B32A32_UNORM:
423 return &emit_R32G32B32A32_UNORM;
424
425 case PIPE_FORMAT_R32_USCALED:
426 return &emit_R32_USCALED;
427 case PIPE_FORMAT_R32G32_USCALED:
428 return &emit_R32G32_USCALED;
429 case PIPE_FORMAT_R32G32B32_USCALED:
430 return &emit_R32G32B32_USCALED;
431 case PIPE_FORMAT_R32G32B32A32_USCALED:
432 return &emit_R32G32B32A32_USCALED;
433
434 case PIPE_FORMAT_R32_SNORM:
435 return &emit_R32_SNORM;
436 case PIPE_FORMAT_R32G32_SNORM:
437 return &emit_R32G32_SNORM;
438 case PIPE_FORMAT_R32G32B32_SNORM:
439 return &emit_R32G32B32_SNORM;
440 case PIPE_FORMAT_R32G32B32A32_SNORM:
441 return &emit_R32G32B32A32_SNORM;
442
443 case PIPE_FORMAT_R32_SSCALED:
444 return &emit_R32_SSCALED;
445 case PIPE_FORMAT_R32G32_SSCALED:
446 return &emit_R32G32_SSCALED;
447 case PIPE_FORMAT_R32G32B32_SSCALED:
448 return &emit_R32G32B32_SSCALED;
449 case PIPE_FORMAT_R32G32B32A32_SSCALED:
450 return &emit_R32G32B32A32_SSCALED;
451
452 case PIPE_FORMAT_R16_UNORM:
453 return &emit_R16_UNORM;
454 case PIPE_FORMAT_R16G16_UNORM:
455 return &emit_R16G16_UNORM;
456 case PIPE_FORMAT_R16G16B16_UNORM:
457 return &emit_R16G16B16_UNORM;
458 case PIPE_FORMAT_R16G16B16A16_UNORM:
459 return &emit_R16G16B16A16_UNORM;
460
461 case PIPE_FORMAT_R16_USCALED:
462 return &emit_R16_USCALED;
463 case PIPE_FORMAT_R16G16_USCALED:
464 return &emit_R16G16_USCALED;
465 case PIPE_FORMAT_R16G16B16_USCALED:
466 return &emit_R16G16B16_USCALED;
467 case PIPE_FORMAT_R16G16B16A16_USCALED:
468 return &emit_R16G16B16A16_USCALED;
469
470 case PIPE_FORMAT_R16_SNORM:
471 return &emit_R16_SNORM;
472 case PIPE_FORMAT_R16G16_SNORM:
473 return &emit_R16G16_SNORM;
474 case PIPE_FORMAT_R16G16B16_SNORM:
475 return &emit_R16G16B16_SNORM;
476 case PIPE_FORMAT_R16G16B16A16_SNORM:
477 return &emit_R16G16B16A16_SNORM;
478
479 case PIPE_FORMAT_R16_SSCALED:
480 return &emit_R16_SSCALED;
481 case PIPE_FORMAT_R16G16_SSCALED:
482 return &emit_R16G16_SSCALED;
483 case PIPE_FORMAT_R16G16B16_SSCALED:
484 return &emit_R16G16B16_SSCALED;
485 case PIPE_FORMAT_R16G16B16A16_SSCALED:
486 return &emit_R16G16B16A16_SSCALED;
487
488 case PIPE_FORMAT_R8_UNORM:
489 return &emit_R8_UNORM;
490 case PIPE_FORMAT_R8G8_UNORM:
491 return &emit_R8G8_UNORM;
492 case PIPE_FORMAT_R8G8B8_UNORM:
493 return &emit_R8G8B8_UNORM;
494 case PIPE_FORMAT_R8G8B8A8_UNORM:
495 return &emit_R8G8B8A8_UNORM;
496
497 case PIPE_FORMAT_R8_USCALED:
498 return &emit_R8_USCALED;
499 case PIPE_FORMAT_R8G8_USCALED:
500 return &emit_R8G8_USCALED;
501 case PIPE_FORMAT_R8G8B8_USCALED:
502 return &emit_R8G8B8_USCALED;
503 case PIPE_FORMAT_R8G8B8A8_USCALED:
504 return &emit_R8G8B8A8_USCALED;
505
506 case PIPE_FORMAT_R8_SNORM:
507 return &emit_R8_SNORM;
508 case PIPE_FORMAT_R8G8_SNORM:
509 return &emit_R8G8_SNORM;
510 case PIPE_FORMAT_R8G8B8_SNORM:
511 return &emit_R8G8B8_SNORM;
512 case PIPE_FORMAT_R8G8B8A8_SNORM:
513 return &emit_R8G8B8A8_SNORM;
514
515 case PIPE_FORMAT_R8_SSCALED:
516 return &emit_R8_SSCALED;
517 case PIPE_FORMAT_R8G8_SSCALED:
518 return &emit_R8G8_SSCALED;
519 case PIPE_FORMAT_R8G8B8_SSCALED:
520 return &emit_R8G8B8_SSCALED;
521 case PIPE_FORMAT_R8G8B8A8_SSCALED:
522 return &emit_R8G8B8A8_SSCALED;
523
524 case PIPE_FORMAT_B8G8R8A8_UNORM:
525 return &emit_B8G8R8A8_UNORM;
526
527 case PIPE_FORMAT_A8R8G8B8_UNORM:
528 return &emit_A8R8G8B8_UNORM;
529
530 case PIPE_FORMAT_R32_UINT:
531 return &emit_R32_UINT;
532 case PIPE_FORMAT_R32G32_UINT:
533 return &emit_R32G32_UINT;
534 case PIPE_FORMAT_R32G32B32_UINT:
535 return &emit_R32G32B32_UINT;
536 case PIPE_FORMAT_R32G32B32A32_UINT:
537 return &emit_R32G32B32A32_UINT;
538
539 case PIPE_FORMAT_R16_UINT:
540 return &emit_R16_UINT;
541 case PIPE_FORMAT_R16G16_UINT:
542 return &emit_R16G16_UINT;
543 case PIPE_FORMAT_R16G16B16_UINT:
544 return &emit_R16G16B16_UINT;
545 case PIPE_FORMAT_R16G16B16A16_UINT:
546 return &emit_R16G16B16A16_UINT;
547
548 case PIPE_FORMAT_R8_UINT:
549 return &emit_R8_UINT;
550 case PIPE_FORMAT_R8G8_UINT:
551 return &emit_R8G8_UINT;
552 case PIPE_FORMAT_R8G8B8_UINT:
553 return &emit_R8G8B8_UINT;
554 case PIPE_FORMAT_R8G8B8A8_UINT:
555 return &emit_R8G8B8A8_UINT;
556
557 case PIPE_FORMAT_R32_SINT:
558 return &emit_R32_SINT;
559 case PIPE_FORMAT_R32G32_SINT:
560 return &emit_R32G32_SINT;
561 case PIPE_FORMAT_R32G32B32_SINT:
562 return &emit_R32G32B32_SINT;
563 case PIPE_FORMAT_R32G32B32A32_SINT:
564 return &emit_R32G32B32A32_SINT;
565
566 case PIPE_FORMAT_R16_SINT:
567 return &emit_R16_SINT;
568 case PIPE_FORMAT_R16G16_SINT:
569 return &emit_R16G16_SINT;
570 case PIPE_FORMAT_R16G16B16_SINT:
571 return &emit_R16G16B16_SINT;
572 case PIPE_FORMAT_R16G16B16A16_SINT:
573 return &emit_R16G16B16A16_SINT;
574
575 case PIPE_FORMAT_R8_SINT:
576 return &emit_R8_SINT;
577 case PIPE_FORMAT_R8G8_SINT:
578 return &emit_R8G8_SINT;
579 case PIPE_FORMAT_R8G8B8_SINT:
580 return &emit_R8G8B8_SINT;
581 case PIPE_FORMAT_R8G8B8A8_SINT:
582 return &emit_R8G8B8A8_SINT;
583
584 case PIPE_FORMAT_B10G10R10A2_UNORM:
585 return &emit_B10G10R10A2_UNORM;
586 case PIPE_FORMAT_B10G10R10A2_USCALED:
587 return &emit_B10G10R10A2_USCALED;
588 case PIPE_FORMAT_B10G10R10A2_SNORM:
589 return &emit_B10G10R10A2_SNORM;
590 case PIPE_FORMAT_B10G10R10A2_SSCALED:
591 return &emit_B10G10R10A2_SSCALED;
592
593 case PIPE_FORMAT_R10G10B10A2_UNORM:
594 return &emit_R10G10B10A2_UNORM;
595 case PIPE_FORMAT_R10G10B10A2_USCALED:
596 return &emit_R10G10B10A2_USCALED;
597 case PIPE_FORMAT_R10G10B10A2_SNORM:
598 return &emit_R10G10B10A2_SNORM;
599 case PIPE_FORMAT_R10G10B10A2_SSCALED:
600 return &emit_R10G10B10A2_SSCALED;
601
602 default:
603 assert(0);
604 return &emit_NULL;
605 }
606 }
607
608 static ALWAYS_INLINE void PIPE_CDECL generic_run_one( struct translate_generic *tg,
609 unsigned elt,
610 unsigned start_instance,
611 unsigned instance_id,
612 void *vert )
613 {
614 unsigned nr_attrs = tg->nr_attrib;
615 unsigned attr;
616
617 for (attr = 0; attr < nr_attrs; attr++) {
618 float data[4];
619 uint8_t *dst = (uint8_t *)vert + tg->attrib[attr].output_offset;
620
621 if (tg->attrib[attr].type == TRANSLATE_ELEMENT_NORMAL) {
622 const uint8_t *src;
623 unsigned index;
624 int copy_size;
625
626 if (tg->attrib[attr].instance_divisor) {
627 index = start_instance;
628 index += (instance_id - start_instance) /
629 tg->attrib[attr].instance_divisor;
630 /* XXX we need to clamp the index here too, but to a
631 * per-array max value, not the draw->pt.max_index value
632 * that's being given to us via translate->set_buffer().
633 */
634 }
635 else {
636 index = elt;
637 /* clamp to avoid going out of bounds */
638 index = MIN2(index, tg->attrib[attr].max_index);
639 }
640
641 src = tg->attrib[attr].input_ptr +
642 tg->attrib[attr].input_stride * index;
643
644 copy_size = tg->attrib[attr].copy_size;
645 if(likely(copy_size >= 0))
646 memcpy(dst, src, copy_size);
647 else
648 {
649 tg->attrib[attr].fetch( data, src, 0, 0 );
650
651 if (0)
652 debug_printf("Fetch linear attr %d from %p stride %d index %d: "
653 " %f, %f, %f, %f \n",
654 attr,
655 tg->attrib[attr].input_ptr,
656 tg->attrib[attr].input_stride,
657 index,
658 data[0], data[1],data[2], data[3]);
659
660 tg->attrib[attr].emit( data, dst );
661 }
662 } else {
663 if(likely(tg->attrib[attr].copy_size >= 0))
664 memcpy(data, &instance_id, 4);
665 else
666 {
667 data[0] = (float)instance_id;
668 tg->attrib[attr].emit( data, dst );
669 }
670 }
671 }
672 }
673
674 /**
675 * Fetch vertex attributes for 'count' vertices.
676 */
677 static void PIPE_CDECL generic_run_elts( struct translate *translate,
678 const unsigned *elts,
679 unsigned count,
680 unsigned start_instance,
681 unsigned instance_id,
682 void *output_buffer )
683 {
684 struct translate_generic *tg = translate_generic(translate);
685 char *vert = output_buffer;
686 unsigned i;
687
688 for (i = 0; i < count; i++) {
689 generic_run_one(tg, *elts++, start_instance, instance_id, vert);
690 vert += tg->translate.key.output_stride;
691 }
692 }
693
694 static void PIPE_CDECL generic_run_elts16( struct translate *translate,
695 const uint16_t *elts,
696 unsigned count,
697 unsigned start_instance,
698 unsigned instance_id,
699 void *output_buffer )
700 {
701 struct translate_generic *tg = translate_generic(translate);
702 char *vert = output_buffer;
703 unsigned i;
704
705 for (i = 0; i < count; i++) {
706 generic_run_one(tg, *elts++, start_instance, instance_id, vert);
707 vert += tg->translate.key.output_stride;
708 }
709 }
710
711 static void PIPE_CDECL generic_run_elts8( struct translate *translate,
712 const uint8_t *elts,
713 unsigned count,
714 unsigned start_instance,
715 unsigned instance_id,
716 void *output_buffer )
717 {
718 struct translate_generic *tg = translate_generic(translate);
719 char *vert = output_buffer;
720 unsigned i;
721
722 for (i = 0; i < count; i++) {
723 generic_run_one(tg, *elts++, start_instance, instance_id, vert);
724 vert += tg->translate.key.output_stride;
725 }
726 }
727
728 static void PIPE_CDECL generic_run( struct translate *translate,
729 unsigned start,
730 unsigned count,
731 unsigned start_instance,
732 unsigned instance_id,
733 void *output_buffer )
734 {
735 struct translate_generic *tg = translate_generic(translate);
736 char *vert = output_buffer;
737 unsigned i;
738
739 for (i = 0; i < count; i++) {
740 generic_run_one(tg, start + i, start_instance, instance_id, vert);
741 vert += tg->translate.key.output_stride;
742 }
743 }
744
745
746
747 static void generic_set_buffer( struct translate *translate,
748 unsigned buf,
749 const void *ptr,
750 unsigned stride,
751 unsigned max_index )
752 {
753 struct translate_generic *tg = translate_generic(translate);
754 unsigned i;
755
756 for (i = 0; i < tg->nr_attrib; i++) {
757 if (tg->attrib[i].buffer == buf) {
758 tg->attrib[i].input_ptr = ((const uint8_t *)ptr +
759 tg->attrib[i].input_offset);
760 tg->attrib[i].input_stride = stride;
761 tg->attrib[i].max_index = max_index;
762 }
763 }
764 }
765
766
/**
 * Destroy a translate object created by translate_generic_create().
 */
static void generic_release( struct translate *translate )
{
   struct translate_generic *tg = translate_generic(translate);

   /* Refcount? */
   FREE(tg);
}
773
774 static boolean
775 is_legal_int_format_combo( const struct util_format_description *src,
776 const struct util_format_description *dst )
777 {
778 unsigned i;
779 unsigned nr = MIN2(src->nr_channels, dst->nr_channels);
780
781 for (i = 0; i < nr; i++) {
782 /* The signs must match. */
783 if (src->channel[i].type != dst->channel[i].type) {
784 return FALSE;
785 }
786
787 /* Integers must not lose precision at any point in the pipeline. */
788 if (src->channel[i].size > dst->channel[i].size) {
789 return FALSE;
790 }
791 }
792 return TRUE;
793 }
794
795 struct translate *translate_generic_create( const struct translate_key *key )
796 {
797 struct translate_generic *tg = CALLOC_STRUCT(translate_generic);
798 unsigned i;
799
800 if (tg == NULL)
801 return NULL;
802
803 tg->translate.key = *key;
804 tg->translate.release = generic_release;
805 tg->translate.set_buffer = generic_set_buffer;
806 tg->translate.run_elts = generic_run_elts;
807 tg->translate.run_elts16 = generic_run_elts16;
808 tg->translate.run_elts8 = generic_run_elts8;
809 tg->translate.run = generic_run;
810
811 for (i = 0; i < key->nr_elements; i++) {
812 const struct util_format_description *format_desc =
813 util_format_description(key->element[i].input_format);
814
815 assert(format_desc);
816
817 tg->attrib[i].type = key->element[i].type;
818
819 if (format_desc->channel[0].pure_integer) {
820 const struct util_format_description *out_format_desc =
821 util_format_description(key->element[i].output_format);
822
823 if (!is_legal_int_format_combo(format_desc, out_format_desc)) {
824 FREE(tg);
825 return NULL;
826 }
827
828 if (format_desc->channel[0].type == UTIL_FORMAT_TYPE_SIGNED) {
829 assert(format_desc->fetch_rgba_sint);
830 tg->attrib[i].fetch = (fetch_func)format_desc->fetch_rgba_sint;
831 } else {
832 assert(format_desc->fetch_rgba_uint);
833 tg->attrib[i].fetch = (fetch_func)format_desc->fetch_rgba_uint;
834 }
835 } else {
836 assert(format_desc->fetch_rgba_float);
837 tg->attrib[i].fetch = (fetch_func)format_desc->fetch_rgba_float;
838 }
839
840 tg->attrib[i].buffer = key->element[i].input_buffer;
841 tg->attrib[i].input_offset = key->element[i].input_offset;
842 tg->attrib[i].instance_divisor = key->element[i].instance_divisor;
843
844 tg->attrib[i].output_offset = key->element[i].output_offset;
845
846 tg->attrib[i].copy_size = -1;
847 if (tg->attrib[i].type == TRANSLATE_ELEMENT_INSTANCE_ID)
848 {
849 if(key->element[i].output_format == PIPE_FORMAT_R32_USCALED
850 || key->element[i].output_format == PIPE_FORMAT_R32_SSCALED)
851 tg->attrib[i].copy_size = 4;
852 }
853 else
854 {
855 if(key->element[i].input_format == key->element[i].output_format
856 && format_desc->block.width == 1
857 && format_desc->block.height == 1
858 && !(format_desc->block.bits & 7))
859 tg->attrib[i].copy_size = format_desc->block.bits >> 3;
860 }
861
862 if(tg->attrib[i].copy_size < 0)
863 tg->attrib[i].emit = get_emit_func(key->element[i].output_format);
864 else
865 tg->attrib[i].emit = NULL;
866 }
867
868 tg->nr_attrib = key->nr_elements;
869
870
871 return &tg->translate;
872 }
873
874 boolean translate_generic_is_output_format_supported(enum pipe_format format)
875 {
876 switch(format)
877 {
878 case PIPE_FORMAT_R64G64B64A64_FLOAT: return TRUE;
879 case PIPE_FORMAT_R64G64B64_FLOAT: return TRUE;
880 case PIPE_FORMAT_R64G64_FLOAT: return TRUE;
881 case PIPE_FORMAT_R64_FLOAT: return TRUE;
882
883 case PIPE_FORMAT_R32G32B32A32_FLOAT: return TRUE;
884 case PIPE_FORMAT_R32G32B32_FLOAT: return TRUE;
885 case PIPE_FORMAT_R32G32_FLOAT: return TRUE;
886 case PIPE_FORMAT_R32_FLOAT: return TRUE;
887
888 case PIPE_FORMAT_R16G16B16A16_FLOAT: return TRUE;
889 case PIPE_FORMAT_R16G16B16_FLOAT: return TRUE;
890 case PIPE_FORMAT_R16G16_FLOAT: return TRUE;
891 case PIPE_FORMAT_R16_FLOAT: return TRUE;
892
893 case PIPE_FORMAT_R32G32B32A32_USCALED: return TRUE;
894 case PIPE_FORMAT_R32G32B32_USCALED: return TRUE;
895 case PIPE_FORMAT_R32G32_USCALED: return TRUE;
896 case PIPE_FORMAT_R32_USCALED: return TRUE;
897
898 case PIPE_FORMAT_R32G32B32A32_SSCALED: return TRUE;
899 case PIPE_FORMAT_R32G32B32_SSCALED: return TRUE;
900 case PIPE_FORMAT_R32G32_SSCALED: return TRUE;
901 case PIPE_FORMAT_R32_SSCALED: return TRUE;
902
903 case PIPE_FORMAT_R32G32B32A32_UNORM: return TRUE;
904 case PIPE_FORMAT_R32G32B32_UNORM: return TRUE;
905 case PIPE_FORMAT_R32G32_UNORM: return TRUE;
906 case PIPE_FORMAT_R32_UNORM: return TRUE;
907
908 case PIPE_FORMAT_R32G32B32A32_SNORM: return TRUE;
909 case PIPE_FORMAT_R32G32B32_SNORM: return TRUE;
910 case PIPE_FORMAT_R32G32_SNORM: return TRUE;
911 case PIPE_FORMAT_R32_SNORM: return TRUE;
912
913 case PIPE_FORMAT_R16G16B16A16_USCALED: return TRUE;
914 case PIPE_FORMAT_R16G16B16_USCALED: return TRUE;
915 case PIPE_FORMAT_R16G16_USCALED: return TRUE;
916 case PIPE_FORMAT_R16_USCALED: return TRUE;
917
918 case PIPE_FORMAT_R16G16B16A16_SSCALED: return TRUE;
919 case PIPE_FORMAT_R16G16B16_SSCALED: return TRUE;
920 case PIPE_FORMAT_R16G16_SSCALED: return TRUE;
921 case PIPE_FORMAT_R16_SSCALED: return TRUE;
922
923 case PIPE_FORMAT_R16G16B16A16_UNORM: return TRUE;
924 case PIPE_FORMAT_R16G16B16_UNORM: return TRUE;
925 case PIPE_FORMAT_R16G16_UNORM: return TRUE;
926 case PIPE_FORMAT_R16_UNORM: return TRUE;
927
928 case PIPE_FORMAT_R16G16B16A16_SNORM: return TRUE;
929 case PIPE_FORMAT_R16G16B16_SNORM: return TRUE;
930 case PIPE_FORMAT_R16G16_SNORM: return TRUE;
931 case PIPE_FORMAT_R16_SNORM: return TRUE;
932
933 case PIPE_FORMAT_R8G8B8A8_USCALED: return TRUE;
934 case PIPE_FORMAT_R8G8B8_USCALED: return TRUE;
935 case PIPE_FORMAT_R8G8_USCALED: return TRUE;
936 case PIPE_FORMAT_R8_USCALED: return TRUE;
937
938 case PIPE_FORMAT_R8G8B8A8_SSCALED: return TRUE;
939 case PIPE_FORMAT_R8G8B8_SSCALED: return TRUE;
940 case PIPE_FORMAT_R8G8_SSCALED: return TRUE;
941 case PIPE_FORMAT_R8_SSCALED: return TRUE;
942
943 case PIPE_FORMAT_R8G8B8A8_UNORM: return TRUE;
944 case PIPE_FORMAT_R8G8B8_UNORM: return TRUE;
945 case PIPE_FORMAT_R8G8_UNORM: return TRUE;
946 case PIPE_FORMAT_R8_UNORM: return TRUE;
947
948 case PIPE_FORMAT_R8G8B8A8_SNORM: return TRUE;
949 case PIPE_FORMAT_R8G8B8_SNORM: return TRUE;
950 case PIPE_FORMAT_R8G8_SNORM: return TRUE;
951 case PIPE_FORMAT_R8_SNORM: return TRUE;
952
953 case PIPE_FORMAT_A8R8G8B8_UNORM: return TRUE;
954 case PIPE_FORMAT_B8G8R8A8_UNORM: return TRUE;
955
956 case PIPE_FORMAT_R32G32B32A32_UINT: return TRUE;
957 case PIPE_FORMAT_R32G32B32_UINT: return TRUE;
958 case PIPE_FORMAT_R32G32_UINT: return TRUE;
959 case PIPE_FORMAT_R32_UINT: return TRUE;
960
961 case PIPE_FORMAT_R16G16B16A16_UINT: return TRUE;
962 case PIPE_FORMAT_R16G16B16_UINT: return TRUE;
963 case PIPE_FORMAT_R16G16_UINT: return TRUE;
964 case PIPE_FORMAT_R16_UINT: return TRUE;
965
966 case PIPE_FORMAT_R8G8B8A8_UINT: return TRUE;
967 case PIPE_FORMAT_R8G8B8_UINT: return TRUE;
968 case PIPE_FORMAT_R8G8_UINT: return TRUE;
969 case PIPE_FORMAT_R8_UINT: return TRUE;
970
971 case PIPE_FORMAT_R32G32B32A32_SINT: return TRUE;
972 case PIPE_FORMAT_R32G32B32_SINT: return TRUE;
973 case PIPE_FORMAT_R32G32_SINT: return TRUE;
974 case PIPE_FORMAT_R32_SINT: return TRUE;
975
976 case PIPE_FORMAT_R16G16B16A16_SINT: return TRUE;
977 case PIPE_FORMAT_R16G16B16_SINT: return TRUE;
978 case PIPE_FORMAT_R16G16_SINT: return TRUE;
979 case PIPE_FORMAT_R16_SINT: return TRUE;
980
981 case PIPE_FORMAT_R8G8B8A8_SINT: return TRUE;
982 case PIPE_FORMAT_R8G8B8_SINT: return TRUE;
983 case PIPE_FORMAT_R8G8_SINT: return TRUE;
984 case PIPE_FORMAT_R8_SINT: return TRUE;
985
986 case PIPE_FORMAT_B10G10R10A2_UNORM: return TRUE;
987 case PIPE_FORMAT_B10G10R10A2_USCALED: return TRUE;
988 case PIPE_FORMAT_B10G10R10A2_SNORM: return TRUE;
989 case PIPE_FORMAT_B10G10R10A2_SSCALED: return TRUE;
990
991 case PIPE_FORMAT_R10G10B10A2_UNORM: return TRUE;
992 case PIPE_FORMAT_R10G10B10A2_USCALED: return TRUE;
993 case PIPE_FORMAT_R10G10B10A2_SNORM: return TRUE;
994 case PIPE_FORMAT_R10G10B10A2_SSCALED: return TRUE;
995
996 default: return FALSE;
997 }
998 }