fdab0f34a1a944225cb36b1bb3c7fbeded2e54cf
[mesa.git] / src / gallium / auxiliary / translate / translate_generic.c
1 /**************************************************************************
2 *
3 * Copyright 2007 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /*
29 * Authors:
30 * Keith Whitwell <keith@tungstengraphics.com>
31 */
32
33 #include "util/u_memory.h"
34 #include "util/u_format.h"
35 #include "util/u_half.h"
36 #include "util/u_math.h"
37 #include "pipe/p_state.h"
38 #include "translate.h"
39
40
/* Debug switch; nothing in the visible part of this file tests it. */
#define DRAW_DBG 0

/**
 * Fetch callback, taken from a util_format description in
 * translate_generic_create().  It decodes the source data at \p src into
 * \p dst; this file always calls it with i == 0 and j == 0.
 */
typedef void (*fetch_func)(void *dst,
                           const uint8_t *src,
                           unsigned i, unsigned j);

/**
 * Emit callback: converts the fetched attribute values at \p attrib and
 * stores the result at \p ptr (a location inside the output vertex).
 */
typedef void (*emit_func)(const void *attrib, void *ptr);
47
48
49
/**
 * State of the generic translate implementation: the public translate
 * object followed by one record per vertex element of the key.
 */
struct translate_generic {
   /* Public object; translate_generic() casts a pointer to it back to this
    * struct, so it has to remain the first member.
    */
   struct translate translate;

   struct {
      /* Element type copied from the key (normal element or instance id). */
      enum translate_element_type type;

      /* Decoder for the input format. */
      fetch_func fetch;
      /* Index of the vertex buffer this attribute reads from. */
      unsigned buffer;
      /* Byte offset added to the buffer pointer in generic_set_buffer(). */
      unsigned input_offset;
      /* When non-zero, the fetch index is derived from the instance id. */
      unsigned instance_divisor;

      /* Encoder for the output format; NULL when copy_size >= 0. */
      emit_func emit;
      /* Byte offset of this attribute inside an output vertex. */
      unsigned output_offset;

      /* The next three fields are filled in by generic_set_buffer(). */
      const uint8_t *input_ptr;
      unsigned input_stride;
      /* Upper bound used to clamp the index of non-instanced elements. */
      unsigned max_index;

      /* this value is set to -1 if this is a normal element with output_format != input_format:
       * in this case, u_format is used to do a full conversion
       *
       * this value is set to the format size in bytes if output_format == input_format or for 32-bit instance ids:
       * in this case, memcpy is used to copy this amount of bytes
       */
      int copy_size;

   } attrib[PIPE_MAX_ATTRIBS];

   /* Number of valid entries in attrib[]. */
   unsigned nr_attrib;
};
80
81
/**
 * Recover the translate_generic object from a pointer to its public
 * 'translate' member.  The member is the first field of the struct, so the
 * two share one address and a plain cast is enough.
 */
static struct translate_generic *translate_generic( struct translate *translate )
{
   struct translate_generic *generic = (struct translate_generic *)translate;

   return generic;
}
86
/**
 * Define emit_<NAME>(), an emit_func that writes one vertex attribute.
 *
 * The generated function reads SZ consecutive SRCTYPE values from 'attrib'
 * (the already fetched attribute), converts each one with the TO() macro
 * and stores the results as consecutive DSTTYPE values at 'ptr'.
 *
 * This is probably needed/duplicated elsewhere, eg format
 * conversion, texture sampling etc.
 */
#define ATTRIB( NAME, SZ, SRCTYPE, DSTTYPE, TO )        \
static void                                             \
emit_##NAME(const void *attrib, void *ptr)              \
{                                                       \
   unsigned i;                                          \
   const SRCTYPE *in = (const SRCTYPE *)attrib;         \
   DSTTYPE *out = (DSTTYPE *)ptr;                       \
                                                        \
   for (i = 0; i < (SZ); i++) {                         \
      out[i] = TO(in[i]);                               \
   }                                                    \
}
106
107
/*
 * Per-channel conversions used by the ATTRIB() emitters.  Each macro takes
 * the fetched channel value and yields the value to store.
 *
 * Every argument is parenthesized so that expressions such as a + b convert
 * as a whole.
 */
#define TO_64_FLOAT(x)   ((double) (x))
#define TO_32_FLOAT(x)   (x)
#define TO_16_FLOAT(x)   util_float_to_half(x)

#define TO_8_USCALED(x)  ((unsigned char) (x))
#define TO_16_USCALED(x) ((unsigned short) (x))
#define TO_32_USCALED(x) ((unsigned int) (x))

/* 'signed char' rather than plain 'char': plain char may be unsigned, and
 * converting a negative float to an unsigned type is undefined.
 */
#define TO_8_SSCALED(x)  ((signed char) (x))
#define TO_16_SSCALED(x) ((short) (x))
#define TO_32_SSCALED(x) ((int) (x))

#define TO_8_UNORM(x)    ((unsigned char) ((x) * 255.0f))
#define TO_16_UNORM(x)   ((unsigned short) ((x) * 65535.0f))
/* The 32-bit maxima are not representable in float (they round up to 2^32
 * and 2^31), which would push an input of 1.0 out of range of the target
 * type.  Scale in double, where both constants are exact.
 */
#define TO_32_UNORM(x)   ((unsigned int) ((double) (x) * 4294967295.0))

#define TO_8_SNORM(x)    ((signed char) ((x) * 127.0f))
#define TO_16_SNORM(x)   ((short) ((x) * 32767.0f))
#define TO_32_SNORM(x)   ((int) ((double) (x) * 2147483647.0))

#define TO_32_FIXED(x)   ((int) ((x) * 65536.0f))

#define TO_INT(x)        (x)
131
132
/*
 * Emitters generated with ATTRIB().  Each line defines emit_<FORMAT>() for
 * the named output format; the second argument is the channel count.
 */

/* Float source -> 64-bit float output. */
ATTRIB( R64G64B64A64_FLOAT, 4, float, double, TO_64_FLOAT )
ATTRIB( R64G64B64_FLOAT, 3, float, double, TO_64_FLOAT )
ATTRIB( R64G64_FLOAT, 2, float, double, TO_64_FLOAT )
ATTRIB( R64_FLOAT, 1, float, double, TO_64_FLOAT )

/* Float source -> 32-bit float output. */
ATTRIB( R32G32B32A32_FLOAT, 4, float, float, TO_32_FLOAT )
ATTRIB( R32G32B32_FLOAT, 3, float, float, TO_32_FLOAT )
ATTRIB( R32G32_FLOAT, 2, float, float, TO_32_FLOAT )
ATTRIB( R32_FLOAT, 1, float, float, TO_32_FLOAT )

/* Float source -> 16-bit half float output (stored as ushort). */
ATTRIB( R16G16B16A16_FLOAT, 4, float, ushort, TO_16_FLOAT )
ATTRIB( R16G16B16_FLOAT, 3, float, ushort, TO_16_FLOAT )
ATTRIB( R16G16_FLOAT, 2, float, ushort, TO_16_FLOAT )
ATTRIB( R16_FLOAT, 1, float, ushort, TO_16_FLOAT )

/* Float source -> 32-bit scaled / normalized integer outputs. */
ATTRIB( R32G32B32A32_USCALED, 4, float, unsigned, TO_32_USCALED )
ATTRIB( R32G32B32_USCALED, 3, float, unsigned, TO_32_USCALED )
ATTRIB( R32G32_USCALED, 2, float, unsigned, TO_32_USCALED )
ATTRIB( R32_USCALED, 1, float, unsigned, TO_32_USCALED )

ATTRIB( R32G32B32A32_SSCALED, 4, float, int, TO_32_SSCALED )
ATTRIB( R32G32B32_SSCALED, 3, float, int, TO_32_SSCALED )
ATTRIB( R32G32_SSCALED, 2, float, int, TO_32_SSCALED )
ATTRIB( R32_SSCALED, 1, float, int, TO_32_SSCALED )

ATTRIB( R32G32B32A32_UNORM, 4, float, unsigned, TO_32_UNORM )
ATTRIB( R32G32B32_UNORM, 3, float, unsigned, TO_32_UNORM )
ATTRIB( R32G32_UNORM, 2, float, unsigned, TO_32_UNORM )
ATTRIB( R32_UNORM, 1, float, unsigned, TO_32_UNORM )

ATTRIB( R32G32B32A32_SNORM, 4, float, int, TO_32_SNORM )
ATTRIB( R32G32B32_SNORM, 3, float, int, TO_32_SNORM )
ATTRIB( R32G32_SNORM, 2, float, int, TO_32_SNORM )
ATTRIB( R32_SNORM, 1, float, int, TO_32_SNORM )

/* Float source -> 16-bit scaled / normalized integer outputs. */
ATTRIB( R16G16B16A16_USCALED, 4, float, ushort, TO_16_USCALED )
ATTRIB( R16G16B16_USCALED, 3, float, ushort, TO_16_USCALED )
ATTRIB( R16G16_USCALED, 2, float, ushort, TO_16_USCALED )
ATTRIB( R16_USCALED, 1, float, ushort, TO_16_USCALED )

ATTRIB( R16G16B16A16_SSCALED, 4, float, short, TO_16_SSCALED )
ATTRIB( R16G16B16_SSCALED, 3, float, short, TO_16_SSCALED )
ATTRIB( R16G16_SSCALED, 2, float, short, TO_16_SSCALED )
ATTRIB( R16_SSCALED, 1, float, short, TO_16_SSCALED )

ATTRIB( R16G16B16A16_UNORM, 4, float, ushort, TO_16_UNORM )
ATTRIB( R16G16B16_UNORM, 3, float, ushort, TO_16_UNORM )
ATTRIB( R16G16_UNORM, 2, float, ushort, TO_16_UNORM )
ATTRIB( R16_UNORM, 1, float, ushort, TO_16_UNORM )

ATTRIB( R16G16B16A16_SNORM, 4, float, short, TO_16_SNORM )
ATTRIB( R16G16B16_SNORM, 3, float, short, TO_16_SNORM )
ATTRIB( R16G16_SNORM, 2, float, short, TO_16_SNORM )
ATTRIB( R16_SNORM, 1, float, short, TO_16_SNORM )

/* Float source -> 8-bit scaled / normalized integer outputs. */
ATTRIB( R8G8B8A8_USCALED, 4, float, ubyte, TO_8_USCALED )
ATTRIB( R8G8B8_USCALED, 3, float, ubyte, TO_8_USCALED )
ATTRIB( R8G8_USCALED, 2, float, ubyte, TO_8_USCALED )
ATTRIB( R8_USCALED, 1, float, ubyte, TO_8_USCALED )

ATTRIB( R8G8B8A8_SSCALED, 4, float, char, TO_8_SSCALED )
ATTRIB( R8G8B8_SSCALED, 3, float, char, TO_8_SSCALED )
ATTRIB( R8G8_SSCALED, 2, float, char, TO_8_SSCALED )
ATTRIB( R8_SSCALED, 1, float, char, TO_8_SSCALED )

ATTRIB( R8G8B8A8_UNORM, 4, float, ubyte, TO_8_UNORM )
ATTRIB( R8G8B8_UNORM, 3, float, ubyte, TO_8_UNORM )
ATTRIB( R8G8_UNORM, 2, float, ubyte, TO_8_UNORM )
ATTRIB( R8_UNORM, 1, float, ubyte, TO_8_UNORM )

ATTRIB( R8G8B8A8_SNORM, 4, float, char, TO_8_SNORM )
ATTRIB( R8G8B8_SNORM, 3, float, char, TO_8_SNORM )
ATTRIB( R8G8_SNORM, 2, float, char, TO_8_SNORM )
ATTRIB( R8_SNORM, 1, float, char, TO_8_SNORM )

/* 32-bit unsigned integer source -> unsigned integer outputs; TO_INT adds
 * no conversion, the assignment to the narrower type does the truncation.
 */
ATTRIB( R32G32B32A32_UINT, 4, uint32_t, unsigned, TO_INT )
ATTRIB( R32G32B32_UINT, 3, uint32_t, unsigned, TO_INT )
ATTRIB( R32G32_UINT, 2, uint32_t, unsigned, TO_INT )
ATTRIB( R32_UINT, 1, uint32_t, unsigned, TO_INT )

ATTRIB( R16G16B16A16_UINT, 4, uint32_t, ushort, TO_INT )
ATTRIB( R16G16B16_UINT, 3, uint32_t, ushort, TO_INT )
ATTRIB( R16G16_UINT, 2, uint32_t, ushort, TO_INT )
ATTRIB( R16_UINT, 1, uint32_t, ushort, TO_INT )

ATTRIB( R8G8B8A8_UINT, 4, uint32_t, ubyte, TO_INT )
ATTRIB( R8G8B8_UINT, 3, uint32_t, ubyte, TO_INT )
ATTRIB( R8G8_UINT, 2, uint32_t, ubyte, TO_INT )
ATTRIB( R8_UINT, 1, uint32_t, ubyte, TO_INT )

/* 32-bit signed integer source -> signed integer outputs. */
ATTRIB( R32G32B32A32_SINT, 4, int32_t, int, TO_INT )
ATTRIB( R32G32B32_SINT, 3, int32_t, int, TO_INT )
ATTRIB( R32G32_SINT, 2, int32_t, int, TO_INT )
ATTRIB( R32_SINT, 1, int32_t, int, TO_INT )

ATTRIB( R16G16B16A16_SINT, 4, int32_t, short, TO_INT )
ATTRIB( R16G16B16_SINT, 3, int32_t, short, TO_INT )
ATTRIB( R16G16_SINT, 2, int32_t, short, TO_INT )
ATTRIB( R16_SINT, 1, int32_t, short, TO_INT )

ATTRIB( R8G8B8A8_SINT, 4, int32_t, char, TO_INT )
ATTRIB( R8G8B8_SINT, 3, int32_t, char, TO_INT )
ATTRIB( R8G8_SINT, 2, int32_t, char, TO_INT )
ATTRIB( R8_SINT, 1, int32_t, char, TO_INT )
237
238 static void
239 emit_A8R8G8B8_UNORM( const void *attrib, void *ptr)
240 {
241 float *in = (float *)attrib;
242 ubyte *out = (ubyte *)ptr;
243 out[0] = TO_8_UNORM(in[3]);
244 out[1] = TO_8_UNORM(in[0]);
245 out[2] = TO_8_UNORM(in[1]);
246 out[3] = TO_8_UNORM(in[2]);
247 }
248
249 static void
250 emit_B8G8R8A8_UNORM( const void *attrib, void *ptr)
251 {
252 float *in = (float *)attrib;
253 ubyte *out = (ubyte *)ptr;
254 out[2] = TO_8_UNORM(in[0]);
255 out[1] = TO_8_UNORM(in[1]);
256 out[0] = TO_8_UNORM(in[2]);
257 out[3] = TO_8_UNORM(in[3]);
258 }
259
/*
 * Emitters for the packed 10/10/10/2 formats.
 *
 * Like every other emit_func, these read four float channels from 'attrib'
 * and write the packed 32-bit word to 'ptr'.  (They used to do the
 * opposite: read from 'ptr' and store into the const 'attrib' buffer, so
 * the output vertex was never written.)
 */

/**
 * Clamp x to [lo, hi].  NaN fails every comparison and is mapped to lo so
 * that the integer conversion done by the callers is always defined.
 */
static float
clamp_10_10_10_2( float x, float lo, float hi )
{
   if (!(x >= lo))
      return lo;
   return (x > hi) ? hi : x;
}

/**
 * Convert one channel to an unsigned bit-field: clamp to [0, hi], multiply
 * by scale, truncate towards zero and keep the bits selected by mask.
 */
static uint32_t
pack_unsigned_channel( float x, float hi, float scale, uint32_t mask )
{
   return (uint32_t)(clamp_10_10_10_2(x, 0.0f, hi) * scale) & mask;
}

/**
 * Convert one channel to a two's complement bit-field: clamp to [lo, hi],
 * multiply by scale, truncate towards zero and keep the bits selected by
 * mask.
 */
static uint32_t
pack_signed_channel( float x, float lo, float hi, float scale, uint32_t mask )
{
   /* Go through int32_t first: converting a negative float directly to an
    * unsigned type is undefined behaviour.
    */
   return (uint32_t)(int32_t)(clamp_10_10_10_2(x, lo, hi) * scale) & mask;
}

/**
 * Combine the four bit-fields (x in bits 0-9, y in 10-19, z in 20-29, w in
 * 30-31) and store the word at ptr, byte-swapped on big-endian hosts.
 */
static void
store_10_10_10_2( void *ptr, uint32_t x, uint32_t y, uint32_t z, uint32_t w )
{
   uint32_t value = x | (y << 10) | (z << 20) | (w << 30);
#ifdef PIPE_ARCH_BIG_ENDIAN
   value = util_bswap32(value);
#endif
   /* memcpy: the output offset is not known to be 4-byte aligned. */
   memcpy(ptr, &value, sizeof value);
}

static void
emit_B10G10R10A2_UNORM( const void *attrib, void *ptr )
{
   const float *src = (const float *)attrib;

   store_10_10_10_2(ptr,
                    pack_unsigned_channel(src[2], 1.0f, 1023.0f, 0x3ff),
                    pack_unsigned_channel(src[1], 1.0f, 1023.0f, 0x3ff),
                    pack_unsigned_channel(src[0], 1.0f, 1023.0f, 0x3ff),
                    pack_unsigned_channel(src[3], 1.0f, 3.0f, 0x3));
}

static void
emit_B10G10R10A2_USCALED( const void *attrib, void *ptr )
{
   const float *src = (const float *)attrib;

   store_10_10_10_2(ptr,
                    pack_unsigned_channel(src[2], 1023.0f, 1.0f, 0x3ff),
                    pack_unsigned_channel(src[1], 1023.0f, 1.0f, 0x3ff),
                    pack_unsigned_channel(src[0], 1023.0f, 1.0f, 0x3ff),
                    pack_unsigned_channel(src[3], 3.0f, 1.0f, 0x3));
}

static void
emit_B10G10R10A2_SNORM( const void *attrib, void *ptr )
{
   const float *src = (const float *)attrib;

   store_10_10_10_2(ptr,
                    pack_signed_channel(src[2], -1.0f, 1.0f, 511.0f, 0x3ff),
                    pack_signed_channel(src[1], -1.0f, 1.0f, 511.0f, 0x3ff),
                    pack_signed_channel(src[0], -1.0f, 1.0f, 511.0f, 0x3ff),
                    pack_signed_channel(src[3], -1.0f, 1.0f, 1.0f, 0x3));
}

static void
emit_B10G10R10A2_SSCALED( const void *attrib, void *ptr )
{
   const float *src = (const float *)attrib;

   store_10_10_10_2(ptr,
                    pack_signed_channel(src[2], -512.0f, 511.0f, 1.0f, 0x3ff),
                    pack_signed_channel(src[1], -512.0f, 511.0f, 1.0f, 0x3ff),
                    pack_signed_channel(src[0], -512.0f, 511.0f, 1.0f, 0x3ff),
                    pack_signed_channel(src[3], -2.0f, 1.0f, 1.0f, 0x3));
}

static void
emit_R10G10B10A2_UNORM( const void *attrib, void *ptr )
{
   const float *src = (const float *)attrib;

   store_10_10_10_2(ptr,
                    pack_unsigned_channel(src[0], 1.0f, 1023.0f, 0x3ff),
                    pack_unsigned_channel(src[1], 1.0f, 1023.0f, 0x3ff),
                    pack_unsigned_channel(src[2], 1.0f, 1023.0f, 0x3ff),
                    pack_unsigned_channel(src[3], 1.0f, 3.0f, 0x3));
}

static void
emit_R10G10B10A2_USCALED( const void *attrib, void *ptr )
{
   const float *src = (const float *)attrib;

   store_10_10_10_2(ptr,
                    pack_unsigned_channel(src[0], 1023.0f, 1.0f, 0x3ff),
                    pack_unsigned_channel(src[1], 1023.0f, 1.0f, 0x3ff),
                    pack_unsigned_channel(src[2], 1023.0f, 1.0f, 0x3ff),
                    pack_unsigned_channel(src[3], 3.0f, 1.0f, 0x3));
}

static void
emit_R10G10B10A2_SNORM( const void *attrib, void *ptr )
{
   const float *src = (const float *)attrib;

   store_10_10_10_2(ptr,
                    pack_signed_channel(src[0], -1.0f, 1.0f, 511.0f, 0x3ff),
                    pack_signed_channel(src[1], -1.0f, 1.0f, 511.0f, 0x3ff),
                    pack_signed_channel(src[2], -1.0f, 1.0f, 511.0f, 0x3ff),
                    pack_signed_channel(src[3], -1.0f, 1.0f, 1.0f, 0x3));
}

static void
emit_R10G10B10A2_SSCALED( const void *attrib, void *ptr)
{
   const float *src = (const float *)attrib;

   store_10_10_10_2(ptr,
                    pack_signed_channel(src[0], -512.0f, 511.0f, 1.0f, 0x3ff),
                    pack_signed_channel(src[1], -512.0f, 511.0f, 1.0f, 0x3ff),
                    pack_signed_channel(src[2], -512.0f, 511.0f, 1.0f, 0x3ff),
                    pack_signed_channel(src[3], -2.0f, 1.0f, 1.0f, 0x3));
}
379
/**
 * Fallback emitter for output formats without a real emit function.
 * Doing nothing is the only sensible option, so both arguments are ignored.
 */
static void
emit_NULL( const void *attrib, void *ptr )
{
   (void)attrib;
   (void)ptr;
}
385
386 static emit_func get_emit_func( enum pipe_format format )
387 {
388 switch (format) {
389 case PIPE_FORMAT_R64_FLOAT:
390 return &emit_R64_FLOAT;
391 case PIPE_FORMAT_R64G64_FLOAT:
392 return &emit_R64G64_FLOAT;
393 case PIPE_FORMAT_R64G64B64_FLOAT:
394 return &emit_R64G64B64_FLOAT;
395 case PIPE_FORMAT_R64G64B64A64_FLOAT:
396 return &emit_R64G64B64A64_FLOAT;
397
398 case PIPE_FORMAT_R32_FLOAT:
399 return &emit_R32_FLOAT;
400 case PIPE_FORMAT_R32G32_FLOAT:
401 return &emit_R32G32_FLOAT;
402 case PIPE_FORMAT_R32G32B32_FLOAT:
403 return &emit_R32G32B32_FLOAT;
404 case PIPE_FORMAT_R32G32B32A32_FLOAT:
405 return &emit_R32G32B32A32_FLOAT;
406
407 case PIPE_FORMAT_R16_FLOAT:
408 return &emit_R16_FLOAT;
409 case PIPE_FORMAT_R16G16_FLOAT:
410 return &emit_R16G16_FLOAT;
411 case PIPE_FORMAT_R16G16B16_FLOAT:
412 return &emit_R16G16B16_FLOAT;
413 case PIPE_FORMAT_R16G16B16A16_FLOAT:
414 return &emit_R16G16B16A16_FLOAT;
415
416 case PIPE_FORMAT_R32_UNORM:
417 return &emit_R32_UNORM;
418 case PIPE_FORMAT_R32G32_UNORM:
419 return &emit_R32G32_UNORM;
420 case PIPE_FORMAT_R32G32B32_UNORM:
421 return &emit_R32G32B32_UNORM;
422 case PIPE_FORMAT_R32G32B32A32_UNORM:
423 return &emit_R32G32B32A32_UNORM;
424
425 case PIPE_FORMAT_R32_USCALED:
426 return &emit_R32_USCALED;
427 case PIPE_FORMAT_R32G32_USCALED:
428 return &emit_R32G32_USCALED;
429 case PIPE_FORMAT_R32G32B32_USCALED:
430 return &emit_R32G32B32_USCALED;
431 case PIPE_FORMAT_R32G32B32A32_USCALED:
432 return &emit_R32G32B32A32_USCALED;
433
434 case PIPE_FORMAT_R32_SNORM:
435 return &emit_R32_SNORM;
436 case PIPE_FORMAT_R32G32_SNORM:
437 return &emit_R32G32_SNORM;
438 case PIPE_FORMAT_R32G32B32_SNORM:
439 return &emit_R32G32B32_SNORM;
440 case PIPE_FORMAT_R32G32B32A32_SNORM:
441 return &emit_R32G32B32A32_SNORM;
442
443 case PIPE_FORMAT_R32_SSCALED:
444 return &emit_R32_SSCALED;
445 case PIPE_FORMAT_R32G32_SSCALED:
446 return &emit_R32G32_SSCALED;
447 case PIPE_FORMAT_R32G32B32_SSCALED:
448 return &emit_R32G32B32_SSCALED;
449 case PIPE_FORMAT_R32G32B32A32_SSCALED:
450 return &emit_R32G32B32A32_SSCALED;
451
452 case PIPE_FORMAT_R16_UNORM:
453 return &emit_R16_UNORM;
454 case PIPE_FORMAT_R16G16_UNORM:
455 return &emit_R16G16_UNORM;
456 case PIPE_FORMAT_R16G16B16_UNORM:
457 return &emit_R16G16B16_UNORM;
458 case PIPE_FORMAT_R16G16B16A16_UNORM:
459 return &emit_R16G16B16A16_UNORM;
460
461 case PIPE_FORMAT_R16_USCALED:
462 return &emit_R16_USCALED;
463 case PIPE_FORMAT_R16G16_USCALED:
464 return &emit_R16G16_USCALED;
465 case PIPE_FORMAT_R16G16B16_USCALED:
466 return &emit_R16G16B16_USCALED;
467 case PIPE_FORMAT_R16G16B16A16_USCALED:
468 return &emit_R16G16B16A16_USCALED;
469
470 case PIPE_FORMAT_R16_SNORM:
471 return &emit_R16_SNORM;
472 case PIPE_FORMAT_R16G16_SNORM:
473 return &emit_R16G16_SNORM;
474 case PIPE_FORMAT_R16G16B16_SNORM:
475 return &emit_R16G16B16_SNORM;
476 case PIPE_FORMAT_R16G16B16A16_SNORM:
477 return &emit_R16G16B16A16_SNORM;
478
479 case PIPE_FORMAT_R16_SSCALED:
480 return &emit_R16_SSCALED;
481 case PIPE_FORMAT_R16G16_SSCALED:
482 return &emit_R16G16_SSCALED;
483 case PIPE_FORMAT_R16G16B16_SSCALED:
484 return &emit_R16G16B16_SSCALED;
485 case PIPE_FORMAT_R16G16B16A16_SSCALED:
486 return &emit_R16G16B16A16_SSCALED;
487
488 case PIPE_FORMAT_R8_UNORM:
489 return &emit_R8_UNORM;
490 case PIPE_FORMAT_R8G8_UNORM:
491 return &emit_R8G8_UNORM;
492 case PIPE_FORMAT_R8G8B8_UNORM:
493 return &emit_R8G8B8_UNORM;
494 case PIPE_FORMAT_R8G8B8A8_UNORM:
495 return &emit_R8G8B8A8_UNORM;
496
497 case PIPE_FORMAT_R8_USCALED:
498 return &emit_R8_USCALED;
499 case PIPE_FORMAT_R8G8_USCALED:
500 return &emit_R8G8_USCALED;
501 case PIPE_FORMAT_R8G8B8_USCALED:
502 return &emit_R8G8B8_USCALED;
503 case PIPE_FORMAT_R8G8B8A8_USCALED:
504 return &emit_R8G8B8A8_USCALED;
505
506 case PIPE_FORMAT_R8_SNORM:
507 return &emit_R8_SNORM;
508 case PIPE_FORMAT_R8G8_SNORM:
509 return &emit_R8G8_SNORM;
510 case PIPE_FORMAT_R8G8B8_SNORM:
511 return &emit_R8G8B8_SNORM;
512 case PIPE_FORMAT_R8G8B8A8_SNORM:
513 return &emit_R8G8B8A8_SNORM;
514
515 case PIPE_FORMAT_R8_SSCALED:
516 return &emit_R8_SSCALED;
517 case PIPE_FORMAT_R8G8_SSCALED:
518 return &emit_R8G8_SSCALED;
519 case PIPE_FORMAT_R8G8B8_SSCALED:
520 return &emit_R8G8B8_SSCALED;
521 case PIPE_FORMAT_R8G8B8A8_SSCALED:
522 return &emit_R8G8B8A8_SSCALED;
523
524 case PIPE_FORMAT_B8G8R8A8_UNORM:
525 return &emit_B8G8R8A8_UNORM;
526
527 case PIPE_FORMAT_A8R8G8B8_UNORM:
528 return &emit_A8R8G8B8_UNORM;
529
530 case PIPE_FORMAT_R32_UINT:
531 return &emit_R32_UINT;
532 case PIPE_FORMAT_R32G32_UINT:
533 return &emit_R32G32_UINT;
534 case PIPE_FORMAT_R32G32B32_UINT:
535 return &emit_R32G32B32_UINT;
536 case PIPE_FORMAT_R32G32B32A32_UINT:
537 return &emit_R32G32B32A32_UINT;
538
539 case PIPE_FORMAT_R16_UINT:
540 return &emit_R16_UINT;
541 case PIPE_FORMAT_R16G16_UINT:
542 return &emit_R16G16_UINT;
543 case PIPE_FORMAT_R16G16B16_UINT:
544 return &emit_R16G16B16_UINT;
545 case PIPE_FORMAT_R16G16B16A16_UINT:
546 return &emit_R16G16B16A16_UINT;
547
548 case PIPE_FORMAT_R8_UINT:
549 return &emit_R8_UINT;
550 case PIPE_FORMAT_R8G8_UINT:
551 return &emit_R8G8_UINT;
552 case PIPE_FORMAT_R8G8B8_UINT:
553 return &emit_R8G8B8_UINT;
554 case PIPE_FORMAT_R8G8B8A8_UINT:
555 return &emit_R8G8B8A8_UINT;
556
557 case PIPE_FORMAT_R32_SINT:
558 return &emit_R32_SINT;
559 case PIPE_FORMAT_R32G32_SINT:
560 return &emit_R32G32_SINT;
561 case PIPE_FORMAT_R32G32B32_SINT:
562 return &emit_R32G32B32_SINT;
563 case PIPE_FORMAT_R32G32B32A32_SINT:
564 return &emit_R32G32B32A32_SINT;
565
566 case PIPE_FORMAT_R16_SINT:
567 return &emit_R16_SINT;
568 case PIPE_FORMAT_R16G16_SINT:
569 return &emit_R16G16_SINT;
570 case PIPE_FORMAT_R16G16B16_SINT:
571 return &emit_R16G16B16_SINT;
572 case PIPE_FORMAT_R16G16B16A16_SINT:
573 return &emit_R16G16B16A16_SINT;
574
575 case PIPE_FORMAT_R8_SINT:
576 return &emit_R8_SINT;
577 case PIPE_FORMAT_R8G8_SINT:
578 return &emit_R8G8_SINT;
579 case PIPE_FORMAT_R8G8B8_SINT:
580 return &emit_R8G8B8_SINT;
581 case PIPE_FORMAT_R8G8B8A8_SINT:
582 return &emit_R8G8B8A8_SINT;
583
584 case PIPE_FORMAT_B10G10R10A2_UNORM:
585 return &emit_B10G10R10A2_UNORM;
586 case PIPE_FORMAT_B10G10R10A2_USCALED:
587 return &emit_B10G10R10A2_USCALED;
588 case PIPE_FORMAT_B10G10R10A2_SNORM:
589 return &emit_B10G10R10A2_SNORM;
590 case PIPE_FORMAT_B10G10R10A2_SSCALED:
591 return &emit_B10G10R10A2_SSCALED;
592
593 case PIPE_FORMAT_R10G10B10A2_UNORM:
594 return &emit_R10G10B10A2_UNORM;
595 case PIPE_FORMAT_R10G10B10A2_USCALED:
596 return &emit_R10G10B10A2_USCALED;
597 case PIPE_FORMAT_R10G10B10A2_SNORM:
598 return &emit_R10G10B10A2_SNORM;
599 case PIPE_FORMAT_R10G10B10A2_SSCALED:
600 return &emit_R10G10B10A2_SSCALED;
601
602 default:
603 assert(0);
604 return &emit_NULL;
605 }
606 }
607
608 static ALWAYS_INLINE void PIPE_CDECL generic_run_one( struct translate_generic *tg,
609 unsigned elt,
610 unsigned start_instance,
611 unsigned instance_id,
612 void *vert )
613 {
614 unsigned nr_attrs = tg->nr_attrib;
615 unsigned attr;
616
617 for (attr = 0; attr < nr_attrs; attr++) {
618 float data[4];
619 uint8_t *dst = (uint8_t *)vert + tg->attrib[attr].output_offset;
620
621 if (tg->attrib[attr].type == TRANSLATE_ELEMENT_NORMAL) {
622 const uint8_t *src;
623 unsigned index;
624 int copy_size;
625
626 if (tg->attrib[attr].instance_divisor) {
627 index = start_instance;
628 index += (instance_id / tg->attrib[attr].instance_divisor);
629 /* XXX we need to clamp the index here too, but to a
630 * per-array max value, not the draw->pt.max_index value
631 * that's being given to us via translate->set_buffer().
632 */
633 }
634 else {
635 index = elt;
636 /* clamp to avoid going out of bounds */
637 index = MIN2(index, tg->attrib[attr].max_index);
638 }
639
640 src = tg->attrib[attr].input_ptr +
641 tg->attrib[attr].input_stride * index;
642
643 copy_size = tg->attrib[attr].copy_size;
644 if(likely(copy_size >= 0))
645 memcpy(dst, src, copy_size);
646 else
647 {
648 tg->attrib[attr].fetch( data, src, 0, 0 );
649
650 if (0)
651 debug_printf("Fetch linear attr %d from %p stride %d index %d: "
652 " %f, %f, %f, %f \n",
653 attr,
654 tg->attrib[attr].input_ptr,
655 tg->attrib[attr].input_stride,
656 index,
657 data[0], data[1],data[2], data[3]);
658
659 tg->attrib[attr].emit( data, dst );
660 }
661 } else {
662 if(likely(tg->attrib[attr].copy_size >= 0))
663 memcpy(data, &instance_id, 4);
664 else
665 {
666 data[0] = (float)instance_id;
667 tg->attrib[attr].emit( data, dst );
668 }
669 }
670 }
671 }
672
673 /**
674 * Fetch vertex attributes for 'count' vertices.
675 */
676 static void PIPE_CDECL generic_run_elts( struct translate *translate,
677 const unsigned *elts,
678 unsigned count,
679 unsigned start_instance,
680 unsigned instance_id,
681 void *output_buffer )
682 {
683 struct translate_generic *tg = translate_generic(translate);
684 char *vert = output_buffer;
685 unsigned i;
686
687 for (i = 0; i < count; i++) {
688 generic_run_one(tg, *elts++, start_instance, instance_id, vert);
689 vert += tg->translate.key.output_stride;
690 }
691 }
692
693 static void PIPE_CDECL generic_run_elts16( struct translate *translate,
694 const uint16_t *elts,
695 unsigned count,
696 unsigned start_instance,
697 unsigned instance_id,
698 void *output_buffer )
699 {
700 struct translate_generic *tg = translate_generic(translate);
701 char *vert = output_buffer;
702 unsigned i;
703
704 for (i = 0; i < count; i++) {
705 generic_run_one(tg, *elts++, start_instance, instance_id, vert);
706 vert += tg->translate.key.output_stride;
707 }
708 }
709
710 static void PIPE_CDECL generic_run_elts8( struct translate *translate,
711 const uint8_t *elts,
712 unsigned count,
713 unsigned start_instance,
714 unsigned instance_id,
715 void *output_buffer )
716 {
717 struct translate_generic *tg = translate_generic(translate);
718 char *vert = output_buffer;
719 unsigned i;
720
721 for (i = 0; i < count; i++) {
722 generic_run_one(tg, *elts++, start_instance, instance_id, vert);
723 vert += tg->translate.key.output_stride;
724 }
725 }
726
727 static void PIPE_CDECL generic_run( struct translate *translate,
728 unsigned start,
729 unsigned count,
730 unsigned start_instance,
731 unsigned instance_id,
732 void *output_buffer )
733 {
734 struct translate_generic *tg = translate_generic(translate);
735 char *vert = output_buffer;
736 unsigned i;
737
738 for (i = 0; i < count; i++) {
739 generic_run_one(tg, start + i, start_instance, instance_id, vert);
740 vert += tg->translate.key.output_stride;
741 }
742 }
743
744
745
746 static void generic_set_buffer( struct translate *translate,
747 unsigned buf,
748 const void *ptr,
749 unsigned stride,
750 unsigned max_index )
751 {
752 struct translate_generic *tg = translate_generic(translate);
753 unsigned i;
754
755 for (i = 0; i < tg->nr_attrib; i++) {
756 if (tg->attrib[i].buffer == buf) {
757 tg->attrib[i].input_ptr = ((const uint8_t *)ptr +
758 tg->attrib[i].input_offset);
759 tg->attrib[i].input_stride = stride;
760 tg->attrib[i].max_index = max_index;
761 }
762 }
763 }
764
765
/**
 * Destroy a translate object created by translate_generic_create().
 *
 * The object is freed unconditionally; there is no reference counting
 * (the original author left that as an open question).
 */
static void generic_release( struct translate *translate )
{
   FREE(translate);
}
772
773 static boolean
774 is_legal_int_format_combo( const struct util_format_description *src,
775 const struct util_format_description *dst )
776 {
777 unsigned i;
778 unsigned nr = MIN2(src->nr_channels, dst->nr_channels);
779
780 for (i = 0; i < nr; i++) {
781 /* The signs must match. */
782 if (src->channel[i].type != dst->channel[i].type) {
783 return FALSE;
784 }
785
786 /* Integers must not lose precision at any point in the pipeline. */
787 if (src->channel[i].size > dst->channel[i].size) {
788 return FALSE;
789 }
790 }
791 return TRUE;
792 }
793
794 struct translate *translate_generic_create( const struct translate_key *key )
795 {
796 struct translate_generic *tg = CALLOC_STRUCT(translate_generic);
797 unsigned i;
798
799 if (tg == NULL)
800 return NULL;
801
802 tg->translate.key = *key;
803 tg->translate.release = generic_release;
804 tg->translate.set_buffer = generic_set_buffer;
805 tg->translate.run_elts = generic_run_elts;
806 tg->translate.run_elts16 = generic_run_elts16;
807 tg->translate.run_elts8 = generic_run_elts8;
808 tg->translate.run = generic_run;
809
810 for (i = 0; i < key->nr_elements; i++) {
811 const struct util_format_description *format_desc =
812 util_format_description(key->element[i].input_format);
813
814 assert(format_desc);
815
816 tg->attrib[i].type = key->element[i].type;
817
818 if (format_desc->channel[0].pure_integer) {
819 const struct util_format_description *out_format_desc =
820 util_format_description(key->element[i].output_format);
821
822 if (!is_legal_int_format_combo(format_desc, out_format_desc)) {
823 FREE(tg);
824 return NULL;
825 }
826
827 if (format_desc->channel[0].type == UTIL_FORMAT_TYPE_SIGNED) {
828 assert(format_desc->fetch_rgba_sint);
829 tg->attrib[i].fetch = (fetch_func)format_desc->fetch_rgba_sint;
830 } else {
831 assert(format_desc->fetch_rgba_uint);
832 tg->attrib[i].fetch = (fetch_func)format_desc->fetch_rgba_uint;
833 }
834 } else {
835 assert(format_desc->fetch_rgba_float);
836 tg->attrib[i].fetch = (fetch_func)format_desc->fetch_rgba_float;
837 }
838
839 tg->attrib[i].buffer = key->element[i].input_buffer;
840 tg->attrib[i].input_offset = key->element[i].input_offset;
841 tg->attrib[i].instance_divisor = key->element[i].instance_divisor;
842
843 tg->attrib[i].output_offset = key->element[i].output_offset;
844
845 tg->attrib[i].copy_size = -1;
846 if (tg->attrib[i].type == TRANSLATE_ELEMENT_INSTANCE_ID)
847 {
848 if(key->element[i].output_format == PIPE_FORMAT_R32_USCALED
849 || key->element[i].output_format == PIPE_FORMAT_R32_SSCALED)
850 tg->attrib[i].copy_size = 4;
851 }
852 else
853 {
854 if(key->element[i].input_format == key->element[i].output_format
855 && format_desc->block.width == 1
856 && format_desc->block.height == 1
857 && !(format_desc->block.bits & 7))
858 tg->attrib[i].copy_size = format_desc->block.bits >> 3;
859 }
860
861 if(tg->attrib[i].copy_size < 0)
862 tg->attrib[i].emit = get_emit_func(key->element[i].output_format);
863 else
864 tg->attrib[i].emit = NULL;
865 }
866
867 tg->nr_attrib = key->nr_elements;
868
869
870 return &tg->translate;
871 }
872
873 boolean translate_generic_is_output_format_supported(enum pipe_format format)
874 {
875 switch(format)
876 {
877 case PIPE_FORMAT_R64G64B64A64_FLOAT: return TRUE;
878 case PIPE_FORMAT_R64G64B64_FLOAT: return TRUE;
879 case PIPE_FORMAT_R64G64_FLOAT: return TRUE;
880 case PIPE_FORMAT_R64_FLOAT: return TRUE;
881
882 case PIPE_FORMAT_R32G32B32A32_FLOAT: return TRUE;
883 case PIPE_FORMAT_R32G32B32_FLOAT: return TRUE;
884 case PIPE_FORMAT_R32G32_FLOAT: return TRUE;
885 case PIPE_FORMAT_R32_FLOAT: return TRUE;
886
887 case PIPE_FORMAT_R16G16B16A16_FLOAT: return TRUE;
888 case PIPE_FORMAT_R16G16B16_FLOAT: return TRUE;
889 case PIPE_FORMAT_R16G16_FLOAT: return TRUE;
890 case PIPE_FORMAT_R16_FLOAT: return TRUE;
891
892 case PIPE_FORMAT_R32G32B32A32_USCALED: return TRUE;
893 case PIPE_FORMAT_R32G32B32_USCALED: return TRUE;
894 case PIPE_FORMAT_R32G32_USCALED: return TRUE;
895 case PIPE_FORMAT_R32_USCALED: return TRUE;
896
897 case PIPE_FORMAT_R32G32B32A32_SSCALED: return TRUE;
898 case PIPE_FORMAT_R32G32B32_SSCALED: return TRUE;
899 case PIPE_FORMAT_R32G32_SSCALED: return TRUE;
900 case PIPE_FORMAT_R32_SSCALED: return TRUE;
901
902 case PIPE_FORMAT_R32G32B32A32_UNORM: return TRUE;
903 case PIPE_FORMAT_R32G32B32_UNORM: return TRUE;
904 case PIPE_FORMAT_R32G32_UNORM: return TRUE;
905 case PIPE_FORMAT_R32_UNORM: return TRUE;
906
907 case PIPE_FORMAT_R32G32B32A32_SNORM: return TRUE;
908 case PIPE_FORMAT_R32G32B32_SNORM: return TRUE;
909 case PIPE_FORMAT_R32G32_SNORM: return TRUE;
910 case PIPE_FORMAT_R32_SNORM: return TRUE;
911
912 case PIPE_FORMAT_R16G16B16A16_USCALED: return TRUE;
913 case PIPE_FORMAT_R16G16B16_USCALED: return TRUE;
914 case PIPE_FORMAT_R16G16_USCALED: return TRUE;
915 case PIPE_FORMAT_R16_USCALED: return TRUE;
916
917 case PIPE_FORMAT_R16G16B16A16_SSCALED: return TRUE;
918 case PIPE_FORMAT_R16G16B16_SSCALED: return TRUE;
919 case PIPE_FORMAT_R16G16_SSCALED: return TRUE;
920 case PIPE_FORMAT_R16_SSCALED: return TRUE;
921
922 case PIPE_FORMAT_R16G16B16A16_UNORM: return TRUE;
923 case PIPE_FORMAT_R16G16B16_UNORM: return TRUE;
924 case PIPE_FORMAT_R16G16_UNORM: return TRUE;
925 case PIPE_FORMAT_R16_UNORM: return TRUE;
926
927 case PIPE_FORMAT_R16G16B16A16_SNORM: return TRUE;
928 case PIPE_FORMAT_R16G16B16_SNORM: return TRUE;
929 case PIPE_FORMAT_R16G16_SNORM: return TRUE;
930 case PIPE_FORMAT_R16_SNORM: return TRUE;
931
932 case PIPE_FORMAT_R8G8B8A8_USCALED: return TRUE;
933 case PIPE_FORMAT_R8G8B8_USCALED: return TRUE;
934 case PIPE_FORMAT_R8G8_USCALED: return TRUE;
935 case PIPE_FORMAT_R8_USCALED: return TRUE;
936
937 case PIPE_FORMAT_R8G8B8A8_SSCALED: return TRUE;
938 case PIPE_FORMAT_R8G8B8_SSCALED: return TRUE;
939 case PIPE_FORMAT_R8G8_SSCALED: return TRUE;
940 case PIPE_FORMAT_R8_SSCALED: return TRUE;
941
942 case PIPE_FORMAT_R8G8B8A8_UNORM: return TRUE;
943 case PIPE_FORMAT_R8G8B8_UNORM: return TRUE;
944 case PIPE_FORMAT_R8G8_UNORM: return TRUE;
945 case PIPE_FORMAT_R8_UNORM: return TRUE;
946
947 case PIPE_FORMAT_R8G8B8A8_SNORM: return TRUE;
948 case PIPE_FORMAT_R8G8B8_SNORM: return TRUE;
949 case PIPE_FORMAT_R8G8_SNORM: return TRUE;
950 case PIPE_FORMAT_R8_SNORM: return TRUE;
951
952 case PIPE_FORMAT_A8R8G8B8_UNORM: return TRUE;
953 case PIPE_FORMAT_B8G8R8A8_UNORM: return TRUE;
954
955 case PIPE_FORMAT_R32G32B32A32_UINT: return TRUE;
956 case PIPE_FORMAT_R32G32B32_UINT: return TRUE;
957 case PIPE_FORMAT_R32G32_UINT: return TRUE;
958 case PIPE_FORMAT_R32_UINT: return TRUE;
959
960 case PIPE_FORMAT_R16G16B16A16_UINT: return TRUE;
961 case PIPE_FORMAT_R16G16B16_UINT: return TRUE;
962 case PIPE_FORMAT_R16G16_UINT: return TRUE;
963 case PIPE_FORMAT_R16_UINT: return TRUE;
964
965 case PIPE_FORMAT_R8G8B8A8_UINT: return TRUE;
966 case PIPE_FORMAT_R8G8B8_UINT: return TRUE;
967 case PIPE_FORMAT_R8G8_UINT: return TRUE;
968 case PIPE_FORMAT_R8_UINT: return TRUE;
969
970 case PIPE_FORMAT_R32G32B32A32_SINT: return TRUE;
971 case PIPE_FORMAT_R32G32B32_SINT: return TRUE;
972 case PIPE_FORMAT_R32G32_SINT: return TRUE;
973 case PIPE_FORMAT_R32_SINT: return TRUE;
974
975 case PIPE_FORMAT_R16G16B16A16_SINT: return TRUE;
976 case PIPE_FORMAT_R16G16B16_SINT: return TRUE;
977 case PIPE_FORMAT_R16G16_SINT: return TRUE;
978 case PIPE_FORMAT_R16_SINT: return TRUE;
979
980 case PIPE_FORMAT_R8G8B8A8_SINT: return TRUE;
981 case PIPE_FORMAT_R8G8B8_SINT: return TRUE;
982 case PIPE_FORMAT_R8G8_SINT: return TRUE;
983 case PIPE_FORMAT_R8_SINT: return TRUE;
984
985 case PIPE_FORMAT_B10G10R10A2_UNORM: return TRUE;
986 case PIPE_FORMAT_B10G10R10A2_USCALED: return TRUE;
987 case PIPE_FORMAT_B10G10R10A2_SNORM: return TRUE;
988 case PIPE_FORMAT_B10G10R10A2_SSCALED: return TRUE;
989
990 case PIPE_FORMAT_R10G10B10A2_UNORM: return TRUE;
991 case PIPE_FORMAT_R10G10B10A2_USCALED: return TRUE;
992 case PIPE_FORMAT_R10G10B10A2_SNORM: return TRUE;
993 case PIPE_FORMAT_R10G10B10A2_SSCALED: return TRUE;
994
995 default: return FALSE;
996 }
997 }