1 /**************************************************************************
3 * Copyright 2007 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
30 * Keith Whitwell <keithw@vmware.com>
33 #include "util/u_memory.h"
34 #include "util/format/u_format.h"
35 #include "util/u_half.h"
36 #include "util/u_math.h"
37 #include "pipe/p_state.h"
38 #include "translate.h"
43 typedef void (*emit_func
)(const void *attrib
, void *ptr
);
47 struct translate_generic
{
48 struct translate translate
;
51 enum translate_element_type type
;
53 util_format_fetch_rgba_func_ptr fetch
;
55 unsigned input_offset
;
56 unsigned instance_divisor
;
59 unsigned output_offset
;
61 const uint8_t *input_ptr
;
62 unsigned input_stride
;
65 /* this value is set to -1 if this is a normal element with
66 * output_format != input_format: in this case, u_format is used
67 * to do a full conversion
69 * this value is set to the format size in bytes if
70 * output_format == input_format or for 32-bit instance ids:
71 * in this case, memcpy is used to copy this amount of bytes
75 } attrib
[TRANSLATE_MAX_ATTRIBS
];
81 static struct translate_generic
*
82 translate_generic(struct translate
*translate
)
84 return (struct translate_generic
*)translate
;
89 * Fetch a dword[4] vertex attribute from memory, doing format/type
90 * conversion as needed.
92 * This is probably needed/dupliocated elsewhere, eg format
93 * conversion, texture sampling etc.
95 #define ATTRIB(NAME, SZ, SRCTYPE, DSTTYPE, TO) \
97 emit_##NAME(const void *attrib, void *ptr) \
100 SRCTYPE *in = (SRCTYPE *)attrib; \
101 DSTTYPE *out = (DSTTYPE *)ptr; \
103 for (i = 0; i < SZ; i++) { \
104 out[i] = TO(in[i]); \
109 #define TO_64_FLOAT(x) ((double) x)
110 #define TO_32_FLOAT(x) (x)
111 #define TO_16_FLOAT(x) util_float_to_half(x)
113 #define TO_8_USCALED(x) ((unsigned char) x)
114 #define TO_16_USCALED(x) ((unsigned short) x)
115 #define TO_32_USCALED(x) ((unsigned int) x)
117 #define TO_8_SSCALED(x) ((char) x)
118 #define TO_16_SSCALED(x) ((short) x)
119 #define TO_32_SSCALED(x) ((int) x)
121 #define TO_8_UNORM(x) ((unsigned char) (x * 255.0f))
122 #define TO_16_UNORM(x) ((unsigned short) (x * 65535.0f))
123 #define TO_32_UNORM(x) ((unsigned int) (x * 4294967295.0f))
125 #define TO_8_SNORM(x) ((char) (x * 127.0f))
126 #define TO_16_SNORM(x) ((short) (x * 32767.0f))
127 #define TO_32_SNORM(x) ((int) (x * 2147483647.0f))
129 #define TO_32_FIXED(x) ((int) (x * 65536.0f))
131 #define TO_INT(x) (x)
134 ATTRIB(R64G64B64A64_FLOAT
, 4, float, double, TO_64_FLOAT
)
135 ATTRIB(R64G64B64_FLOAT
, 3, float, double, TO_64_FLOAT
)
136 ATTRIB(R64G64_FLOAT
, 2, float, double, TO_64_FLOAT
)
137 ATTRIB(R64_FLOAT
, 1, float, double, TO_64_FLOAT
)
139 ATTRIB(R32G32B32A32_FLOAT
, 4, float, float, TO_32_FLOAT
)
140 ATTRIB(R32G32B32_FLOAT
, 3, float, float, TO_32_FLOAT
)
141 ATTRIB(R32G32_FLOAT
, 2, float, float, TO_32_FLOAT
)
142 ATTRIB(R32_FLOAT
, 1, float, float, TO_32_FLOAT
)
144 ATTRIB(R16G16B16A16_FLOAT
, 4, float, ushort
, TO_16_FLOAT
)
145 ATTRIB(R16G16B16_FLOAT
, 3, float, ushort
, TO_16_FLOAT
)
146 ATTRIB(R16G16_FLOAT
, 2, float, ushort
, TO_16_FLOAT
)
147 ATTRIB(R16_FLOAT
, 1, float, ushort
, TO_16_FLOAT
)
149 ATTRIB(R32G32B32A32_USCALED
, 4, float, unsigned, TO_32_USCALED
)
150 ATTRIB(R32G32B32_USCALED
, 3, float, unsigned, TO_32_USCALED
)
151 ATTRIB(R32G32_USCALED
, 2, float, unsigned, TO_32_USCALED
)
152 ATTRIB(R32_USCALED
, 1, float, unsigned, TO_32_USCALED
)
154 ATTRIB(R32G32B32A32_SSCALED
, 4, float, int, TO_32_SSCALED
)
155 ATTRIB(R32G32B32_SSCALED
, 3, float, int, TO_32_SSCALED
)
156 ATTRIB(R32G32_SSCALED
, 2, float, int, TO_32_SSCALED
)
157 ATTRIB(R32_SSCALED
, 1, float, int, TO_32_SSCALED
)
159 ATTRIB(R32G32B32A32_UNORM
, 4, float, unsigned, TO_32_UNORM
)
160 ATTRIB(R32G32B32_UNORM
, 3, float, unsigned, TO_32_UNORM
)
161 ATTRIB(R32G32_UNORM
, 2, float, unsigned, TO_32_UNORM
)
162 ATTRIB(R32_UNORM
, 1, float, unsigned, TO_32_UNORM
)
164 ATTRIB(R32G32B32A32_SNORM
, 4, float, int, TO_32_SNORM
)
165 ATTRIB(R32G32B32_SNORM
, 3, float, int, TO_32_SNORM
)
166 ATTRIB(R32G32_SNORM
, 2, float, int, TO_32_SNORM
)
167 ATTRIB(R32_SNORM
, 1, float, int, TO_32_SNORM
)
169 ATTRIB(R16G16B16A16_USCALED
, 4, float, ushort
, TO_16_USCALED
)
170 ATTRIB(R16G16B16_USCALED
, 3, float, ushort
, TO_16_USCALED
)
171 ATTRIB(R16G16_USCALED
, 2, float, ushort
, TO_16_USCALED
)
172 ATTRIB(R16_USCALED
, 1, float, ushort
, TO_16_USCALED
)
174 ATTRIB(R16G16B16A16_SSCALED
, 4, float, short, TO_16_SSCALED
)
175 ATTRIB(R16G16B16_SSCALED
, 3, float, short, TO_16_SSCALED
)
176 ATTRIB(R16G16_SSCALED
, 2, float, short, TO_16_SSCALED
)
177 ATTRIB(R16_SSCALED
, 1, float, short, TO_16_SSCALED
)
179 ATTRIB(R16G16B16A16_UNORM
, 4, float, ushort
, TO_16_UNORM
)
180 ATTRIB(R16G16B16_UNORM
, 3, float, ushort
, TO_16_UNORM
)
181 ATTRIB(R16G16_UNORM
, 2, float, ushort
, TO_16_UNORM
)
182 ATTRIB(R16_UNORM
, 1, float, ushort
, TO_16_UNORM
)
184 ATTRIB(R16G16B16A16_SNORM
, 4, float, short, TO_16_SNORM
)
185 ATTRIB(R16G16B16_SNORM
, 3, float, short, TO_16_SNORM
)
186 ATTRIB(R16G16_SNORM
, 2, float, short, TO_16_SNORM
)
187 ATTRIB(R16_SNORM
, 1, float, short, TO_16_SNORM
)
189 ATTRIB(R8G8B8A8_USCALED
, 4, float, ubyte
, TO_8_USCALED
)
190 ATTRIB(R8G8B8_USCALED
, 3, float, ubyte
, TO_8_USCALED
)
191 ATTRIB(R8G8_USCALED
, 2, float, ubyte
, TO_8_USCALED
)
192 ATTRIB(R8_USCALED
, 1, float, ubyte
, TO_8_USCALED
)
194 ATTRIB(R8G8B8A8_SSCALED
, 4, float, char, TO_8_SSCALED
)
195 ATTRIB(R8G8B8_SSCALED
, 3, float, char, TO_8_SSCALED
)
196 ATTRIB(R8G8_SSCALED
, 2, float, char, TO_8_SSCALED
)
197 ATTRIB(R8_SSCALED
, 1, float, char, TO_8_SSCALED
)
199 ATTRIB(R8G8B8A8_UNORM
, 4, float, ubyte
, TO_8_UNORM
)
200 ATTRIB(R8G8B8_UNORM
, 3, float, ubyte
, TO_8_UNORM
)
201 ATTRIB(R8G8_UNORM
, 2, float, ubyte
, TO_8_UNORM
)
202 ATTRIB(R8_UNORM
, 1, float, ubyte
, TO_8_UNORM
)
204 ATTRIB(R8G8B8A8_SNORM
, 4, float, char, TO_8_SNORM
)
205 ATTRIB(R8G8B8_SNORM
, 3, float, char, TO_8_SNORM
)
206 ATTRIB(R8G8_SNORM
, 2, float, char, TO_8_SNORM
)
207 ATTRIB(R8_SNORM
, 1, float, char, TO_8_SNORM
)
209 ATTRIB(R32G32B32A32_UINT
, 4, uint32_t, unsigned, TO_INT
)
210 ATTRIB(R32G32B32_UINT
, 3, uint32_t, unsigned, TO_INT
)
211 ATTRIB(R32G32_UINT
, 2, uint32_t, unsigned, TO_INT
)
212 ATTRIB(R32_UINT
, 1, uint32_t, unsigned, TO_INT
)
214 ATTRIB(R16G16B16A16_UINT
, 4, uint32_t, ushort
, TO_INT
)
215 ATTRIB(R16G16B16_UINT
, 3, uint32_t, ushort
, TO_INT
)
216 ATTRIB(R16G16_UINT
, 2, uint32_t, ushort
, TO_INT
)
217 ATTRIB(R16_UINT
, 1, uint32_t, ushort
, TO_INT
)
219 ATTRIB(R8G8B8A8_UINT
, 4, uint32_t, ubyte
, TO_INT
)
220 ATTRIB(R8G8B8_UINT
, 3, uint32_t, ubyte
, TO_INT
)
221 ATTRIB(R8G8_UINT
, 2, uint32_t, ubyte
, TO_INT
)
222 ATTRIB(R8_UINT
, 1, uint32_t, ubyte
, TO_INT
)
224 ATTRIB(R32G32B32A32_SINT
, 4, int32_t, int, TO_INT
)
225 ATTRIB(R32G32B32_SINT
, 3, int32_t, int, TO_INT
)
226 ATTRIB(R32G32_SINT
, 2, int32_t, int, TO_INT
)
227 ATTRIB(R32_SINT
, 1, int32_t, int, TO_INT
)
229 ATTRIB(R16G16B16A16_SINT
, 4, int32_t, short, TO_INT
)
230 ATTRIB(R16G16B16_SINT
, 3, int32_t, short, TO_INT
)
231 ATTRIB(R16G16_SINT
, 2, int32_t, short, TO_INT
)
232 ATTRIB(R16_SINT
, 1, int32_t, short, TO_INT
)
234 ATTRIB(R8G8B8A8_SINT
, 4, int32_t, char, TO_INT
)
235 ATTRIB(R8G8B8_SINT
, 3, int32_t, char, TO_INT
)
236 ATTRIB(R8G8_SINT
, 2, int32_t, char, TO_INT
)
237 ATTRIB(R8_SINT
, 1, int32_t, char, TO_INT
)
240 emit_A8R8G8B8_UNORM(const void *attrib
, void *ptr
)
242 float *in
= (float *)attrib
;
243 ubyte
*out
= (ubyte
*)ptr
;
244 out
[0] = TO_8_UNORM(in
[3]);
245 out
[1] = TO_8_UNORM(in
[0]);
246 out
[2] = TO_8_UNORM(in
[1]);
247 out
[3] = TO_8_UNORM(in
[2]);
251 emit_B8G8R8A8_UNORM(const void *attrib
, void *ptr
)
253 float *in
= (float *)attrib
;
254 ubyte
*out
= (ubyte
*)ptr
;
255 out
[2] = TO_8_UNORM(in
[0]);
256 out
[1] = TO_8_UNORM(in
[1]);
257 out
[0] = TO_8_UNORM(in
[2]);
258 out
[3] = TO_8_UNORM(in
[3]);
262 emit_B10G10R10A2_UNORM(const void *attrib
, void *ptr
)
264 float *src
= (float *)ptr
;
266 value
|= ((uint32_t)(CLAMP(src
[2], 0, 1) * 0x3ff)) & 0x3ff;
267 value
|= (((uint32_t)(CLAMP(src
[1], 0, 1) * 0x3ff)) & 0x3ff) << 10;
268 value
|= (((uint32_t)(CLAMP(src
[0], 0, 1) * 0x3ff)) & 0x3ff) << 20;
269 value
|= ((uint32_t)(CLAMP(src
[3], 0, 1) * 0x3)) << 30;
270 *(uint32_t *)attrib
= util_le32_to_cpu(value
);
274 emit_B10G10R10A2_USCALED(const void *attrib
, void *ptr
)
276 float *src
= (float *)ptr
;
278 value
|= ((uint32_t)CLAMP(src
[2], 0, 1023)) & 0x3ff;
279 value
|= (((uint32_t)CLAMP(src
[1], 0, 1023)) & 0x3ff) << 10;
280 value
|= (((uint32_t)CLAMP(src
[0], 0, 1023)) & 0x3ff) << 20;
281 value
|= ((uint32_t)CLAMP(src
[3], 0, 3)) << 30;
282 *(uint32_t *)attrib
= util_le32_to_cpu(value
);
286 emit_B10G10R10A2_SNORM(const void *attrib
, void *ptr
)
288 float *src
= (float *)ptr
;
290 value
|= (uint32_t)(((uint32_t)(CLAMP(src
[2], -1, 1) * 0x1ff)) & 0x3ff) ;
291 value
|= (uint32_t)((((uint32_t)(CLAMP(src
[1], -1, 1) * 0x1ff)) & 0x3ff) << 10) ;
292 value
|= (uint32_t)((((uint32_t)(CLAMP(src
[0], -1, 1) * 0x1ff)) & 0x3ff) << 20) ;
293 value
|= (uint32_t)(((uint32_t)(CLAMP(src
[3], -1, 1) * 0x1)) << 30) ;
294 *(uint32_t *)attrib
= util_le32_to_cpu(value
);
298 emit_B10G10R10A2_SSCALED(const void *attrib
, void *ptr
)
300 float *src
= (float *)ptr
;
302 value
|= (uint32_t)(((uint32_t)CLAMP(src
[2], -512, 511)) & 0x3ff) ;
303 value
|= (uint32_t)((((uint32_t)CLAMP(src
[1], -512, 511)) & 0x3ff) << 10) ;
304 value
|= (uint32_t)((((uint32_t)CLAMP(src
[0], -512, 511)) & 0x3ff) << 20) ;
305 value
|= (uint32_t)(((uint32_t)CLAMP(src
[3], -2, 1)) << 30) ;
306 *(uint32_t *)attrib
= util_le32_to_cpu(value
);
310 emit_R10G10B10A2_UNORM(const void *attrib
, void *ptr
)
312 float *src
= (float *)ptr
;
314 value
|= ((uint32_t)(CLAMP(src
[0], 0, 1) * 0x3ff)) & 0x3ff;
315 value
|= (((uint32_t)(CLAMP(src
[1], 0, 1) * 0x3ff)) & 0x3ff) << 10;
316 value
|= (((uint32_t)(CLAMP(src
[2], 0, 1) * 0x3ff)) & 0x3ff) << 20;
317 value
|= ((uint32_t)(CLAMP(src
[3], 0, 1) * 0x3)) << 30;
318 *(uint32_t *)attrib
= util_le32_to_cpu(value
);
322 emit_R10G10B10A2_USCALED(const void *attrib
, void *ptr
)
324 float *src
= (float *)ptr
;
326 value
|= ((uint32_t)CLAMP(src
[0], 0, 1023)) & 0x3ff;
327 value
|= (((uint32_t)CLAMP(src
[1], 0, 1023)) & 0x3ff) << 10;
328 value
|= (((uint32_t)CLAMP(src
[2], 0, 1023)) & 0x3ff) << 20;
329 value
|= ((uint32_t)CLAMP(src
[3], 0, 3)) << 30;
330 *(uint32_t *)attrib
= util_le32_to_cpu(value
);
334 emit_R10G10B10A2_SNORM(const void *attrib
, void *ptr
)
336 float *src
= (float *)ptr
;
338 value
|= (uint32_t)(((uint32_t)(CLAMP(src
[0], -1, 1) * 0x1ff)) & 0x3ff) ;
339 value
|= (uint32_t)((((uint32_t)(CLAMP(src
[1], -1, 1) * 0x1ff)) & 0x3ff) << 10) ;
340 value
|= (uint32_t)((((uint32_t)(CLAMP(src
[2], -1, 1) * 0x1ff)) & 0x3ff) << 20) ;
341 value
|= (uint32_t)(((uint32_t)(CLAMP(src
[3], -1, 1) * 0x1)) << 30) ;
342 *(uint32_t *)attrib
= util_le32_to_cpu(value
);
346 emit_R10G10B10A2_SSCALED(const void *attrib
, void *ptr
)
348 float *src
= (float *)ptr
;
350 value
|= (uint32_t)(((uint32_t)CLAMP(src
[0], -512, 511)) & 0x3ff) ;
351 value
|= (uint32_t)((((uint32_t)CLAMP(src
[1], -512, 511)) & 0x3ff) << 10) ;
352 value
|= (uint32_t)((((uint32_t)CLAMP(src
[2], -512, 511)) & 0x3ff) << 20) ;
353 value
|= (uint32_t)(((uint32_t)CLAMP(src
[3], -2, 1)) << 30) ;
354 *(uint32_t *)attrib
= util_le32_to_cpu(value
);
358 emit_NULL(const void *attrib
, void *ptr
)
360 /* do nothing is the only sensible option */
364 get_emit_func(enum pipe_format format
)
367 case PIPE_FORMAT_R64_FLOAT
:
368 return &emit_R64_FLOAT
;
369 case PIPE_FORMAT_R64G64_FLOAT
:
370 return &emit_R64G64_FLOAT
;
371 case PIPE_FORMAT_R64G64B64_FLOAT
:
372 return &emit_R64G64B64_FLOAT
;
373 case PIPE_FORMAT_R64G64B64A64_FLOAT
:
374 return &emit_R64G64B64A64_FLOAT
;
376 case PIPE_FORMAT_R32_FLOAT
:
377 return &emit_R32_FLOAT
;
378 case PIPE_FORMAT_R32G32_FLOAT
:
379 return &emit_R32G32_FLOAT
;
380 case PIPE_FORMAT_R32G32B32_FLOAT
:
381 return &emit_R32G32B32_FLOAT
;
382 case PIPE_FORMAT_R32G32B32A32_FLOAT
:
383 return &emit_R32G32B32A32_FLOAT
;
385 case PIPE_FORMAT_R16_FLOAT
:
386 return &emit_R16_FLOAT
;
387 case PIPE_FORMAT_R16G16_FLOAT
:
388 return &emit_R16G16_FLOAT
;
389 case PIPE_FORMAT_R16G16B16_FLOAT
:
390 return &emit_R16G16B16_FLOAT
;
391 case PIPE_FORMAT_R16G16B16A16_FLOAT
:
392 return &emit_R16G16B16A16_FLOAT
;
394 case PIPE_FORMAT_R32_UNORM
:
395 return &emit_R32_UNORM
;
396 case PIPE_FORMAT_R32G32_UNORM
:
397 return &emit_R32G32_UNORM
;
398 case PIPE_FORMAT_R32G32B32_UNORM
:
399 return &emit_R32G32B32_UNORM
;
400 case PIPE_FORMAT_R32G32B32A32_UNORM
:
401 return &emit_R32G32B32A32_UNORM
;
403 case PIPE_FORMAT_R32_USCALED
:
404 return &emit_R32_USCALED
;
405 case PIPE_FORMAT_R32G32_USCALED
:
406 return &emit_R32G32_USCALED
;
407 case PIPE_FORMAT_R32G32B32_USCALED
:
408 return &emit_R32G32B32_USCALED
;
409 case PIPE_FORMAT_R32G32B32A32_USCALED
:
410 return &emit_R32G32B32A32_USCALED
;
412 case PIPE_FORMAT_R32_SNORM
:
413 return &emit_R32_SNORM
;
414 case PIPE_FORMAT_R32G32_SNORM
:
415 return &emit_R32G32_SNORM
;
416 case PIPE_FORMAT_R32G32B32_SNORM
:
417 return &emit_R32G32B32_SNORM
;
418 case PIPE_FORMAT_R32G32B32A32_SNORM
:
419 return &emit_R32G32B32A32_SNORM
;
421 case PIPE_FORMAT_R32_SSCALED
:
422 return &emit_R32_SSCALED
;
423 case PIPE_FORMAT_R32G32_SSCALED
:
424 return &emit_R32G32_SSCALED
;
425 case PIPE_FORMAT_R32G32B32_SSCALED
:
426 return &emit_R32G32B32_SSCALED
;
427 case PIPE_FORMAT_R32G32B32A32_SSCALED
:
428 return &emit_R32G32B32A32_SSCALED
;
430 case PIPE_FORMAT_R16_UNORM
:
431 return &emit_R16_UNORM
;
432 case PIPE_FORMAT_R16G16_UNORM
:
433 return &emit_R16G16_UNORM
;
434 case PIPE_FORMAT_R16G16B16_UNORM
:
435 return &emit_R16G16B16_UNORM
;
436 case PIPE_FORMAT_R16G16B16A16_UNORM
:
437 return &emit_R16G16B16A16_UNORM
;
439 case PIPE_FORMAT_R16_USCALED
:
440 return &emit_R16_USCALED
;
441 case PIPE_FORMAT_R16G16_USCALED
:
442 return &emit_R16G16_USCALED
;
443 case PIPE_FORMAT_R16G16B16_USCALED
:
444 return &emit_R16G16B16_USCALED
;
445 case PIPE_FORMAT_R16G16B16A16_USCALED
:
446 return &emit_R16G16B16A16_USCALED
;
448 case PIPE_FORMAT_R16_SNORM
:
449 return &emit_R16_SNORM
;
450 case PIPE_FORMAT_R16G16_SNORM
:
451 return &emit_R16G16_SNORM
;
452 case PIPE_FORMAT_R16G16B16_SNORM
:
453 return &emit_R16G16B16_SNORM
;
454 case PIPE_FORMAT_R16G16B16A16_SNORM
:
455 return &emit_R16G16B16A16_SNORM
;
457 case PIPE_FORMAT_R16_SSCALED
:
458 return &emit_R16_SSCALED
;
459 case PIPE_FORMAT_R16G16_SSCALED
:
460 return &emit_R16G16_SSCALED
;
461 case PIPE_FORMAT_R16G16B16_SSCALED
:
462 return &emit_R16G16B16_SSCALED
;
463 case PIPE_FORMAT_R16G16B16A16_SSCALED
:
464 return &emit_R16G16B16A16_SSCALED
;
466 case PIPE_FORMAT_R8_UNORM
:
467 return &emit_R8_UNORM
;
468 case PIPE_FORMAT_R8G8_UNORM
:
469 return &emit_R8G8_UNORM
;
470 case PIPE_FORMAT_R8G8B8_UNORM
:
471 return &emit_R8G8B8_UNORM
;
472 case PIPE_FORMAT_R8G8B8A8_UNORM
:
473 return &emit_R8G8B8A8_UNORM
;
475 case PIPE_FORMAT_R8_USCALED
:
476 return &emit_R8_USCALED
;
477 case PIPE_FORMAT_R8G8_USCALED
:
478 return &emit_R8G8_USCALED
;
479 case PIPE_FORMAT_R8G8B8_USCALED
:
480 return &emit_R8G8B8_USCALED
;
481 case PIPE_FORMAT_R8G8B8A8_USCALED
:
482 return &emit_R8G8B8A8_USCALED
;
484 case PIPE_FORMAT_R8_SNORM
:
485 return &emit_R8_SNORM
;
486 case PIPE_FORMAT_R8G8_SNORM
:
487 return &emit_R8G8_SNORM
;
488 case PIPE_FORMAT_R8G8B8_SNORM
:
489 return &emit_R8G8B8_SNORM
;
490 case PIPE_FORMAT_R8G8B8A8_SNORM
:
491 return &emit_R8G8B8A8_SNORM
;
493 case PIPE_FORMAT_R8_SSCALED
:
494 return &emit_R8_SSCALED
;
495 case PIPE_FORMAT_R8G8_SSCALED
:
496 return &emit_R8G8_SSCALED
;
497 case PIPE_FORMAT_R8G8B8_SSCALED
:
498 return &emit_R8G8B8_SSCALED
;
499 case PIPE_FORMAT_R8G8B8A8_SSCALED
:
500 return &emit_R8G8B8A8_SSCALED
;
502 case PIPE_FORMAT_B8G8R8A8_UNORM
:
503 return &emit_B8G8R8A8_UNORM
;
505 case PIPE_FORMAT_A8R8G8B8_UNORM
:
506 return &emit_A8R8G8B8_UNORM
;
508 case PIPE_FORMAT_R32_UINT
:
509 return &emit_R32_UINT
;
510 case PIPE_FORMAT_R32G32_UINT
:
511 return &emit_R32G32_UINT
;
512 case PIPE_FORMAT_R32G32B32_UINT
:
513 return &emit_R32G32B32_UINT
;
514 case PIPE_FORMAT_R32G32B32A32_UINT
:
515 return &emit_R32G32B32A32_UINT
;
517 case PIPE_FORMAT_R16_UINT
:
518 return &emit_R16_UINT
;
519 case PIPE_FORMAT_R16G16_UINT
:
520 return &emit_R16G16_UINT
;
521 case PIPE_FORMAT_R16G16B16_UINT
:
522 return &emit_R16G16B16_UINT
;
523 case PIPE_FORMAT_R16G16B16A16_UINT
:
524 return &emit_R16G16B16A16_UINT
;
526 case PIPE_FORMAT_R8_UINT
:
527 return &emit_R8_UINT
;
528 case PIPE_FORMAT_R8G8_UINT
:
529 return &emit_R8G8_UINT
;
530 case PIPE_FORMAT_R8G8B8_UINT
:
531 return &emit_R8G8B8_UINT
;
532 case PIPE_FORMAT_R8G8B8A8_UINT
:
533 return &emit_R8G8B8A8_UINT
;
535 case PIPE_FORMAT_R32_SINT
:
536 return &emit_R32_SINT
;
537 case PIPE_FORMAT_R32G32_SINT
:
538 return &emit_R32G32_SINT
;
539 case PIPE_FORMAT_R32G32B32_SINT
:
540 return &emit_R32G32B32_SINT
;
541 case PIPE_FORMAT_R32G32B32A32_SINT
:
542 return &emit_R32G32B32A32_SINT
;
544 case PIPE_FORMAT_R16_SINT
:
545 return &emit_R16_SINT
;
546 case PIPE_FORMAT_R16G16_SINT
:
547 return &emit_R16G16_SINT
;
548 case PIPE_FORMAT_R16G16B16_SINT
:
549 return &emit_R16G16B16_SINT
;
550 case PIPE_FORMAT_R16G16B16A16_SINT
:
551 return &emit_R16G16B16A16_SINT
;
553 case PIPE_FORMAT_R8_SINT
:
554 return &emit_R8_SINT
;
555 case PIPE_FORMAT_R8G8_SINT
:
556 return &emit_R8G8_SINT
;
557 case PIPE_FORMAT_R8G8B8_SINT
:
558 return &emit_R8G8B8_SINT
;
559 case PIPE_FORMAT_R8G8B8A8_SINT
:
560 return &emit_R8G8B8A8_SINT
;
562 case PIPE_FORMAT_B10G10R10A2_UNORM
:
563 return &emit_B10G10R10A2_UNORM
;
564 case PIPE_FORMAT_B10G10R10A2_USCALED
:
565 return &emit_B10G10R10A2_USCALED
;
566 case PIPE_FORMAT_B10G10R10A2_SNORM
:
567 return &emit_B10G10R10A2_SNORM
;
568 case PIPE_FORMAT_B10G10R10A2_SSCALED
:
569 return &emit_B10G10R10A2_SSCALED
;
571 case PIPE_FORMAT_R10G10B10A2_UNORM
:
572 return &emit_R10G10B10A2_UNORM
;
573 case PIPE_FORMAT_R10G10B10A2_USCALED
:
574 return &emit_R10G10B10A2_USCALED
;
575 case PIPE_FORMAT_R10G10B10A2_SNORM
:
576 return &emit_R10G10B10A2_SNORM
;
577 case PIPE_FORMAT_R10G10B10A2_SSCALED
:
578 return &emit_R10G10B10A2_SSCALED
;
586 static ALWAYS_INLINE
void PIPE_CDECL
587 generic_run_one(struct translate_generic
*tg
,
589 unsigned start_instance
,
590 unsigned instance_id
,
593 unsigned nr_attrs
= tg
->nr_attrib
;
596 for (attr
= 0; attr
< nr_attrs
; attr
++) {
598 uint8_t *dst
= (uint8_t *)vert
+ tg
->attrib
[attr
].output_offset
;
600 if (tg
->attrib
[attr
].type
== TRANSLATE_ELEMENT_NORMAL
) {
605 if (tg
->attrib
[attr
].instance_divisor
) {
606 index
= start_instance
;
607 index
+= (instance_id
/ tg
->attrib
[attr
].instance_divisor
);
608 /* XXX we need to clamp the index here too, but to a
609 * per-array max value, not the draw->pt.max_index value
610 * that's being given to us via translate->set_buffer().
615 /* clamp to avoid going out of bounds */
616 index
= MIN2(index
, tg
->attrib
[attr
].max_index
);
619 src
= tg
->attrib
[attr
].input_ptr
+
620 (ptrdiff_t)tg
->attrib
[attr
].input_stride
* index
;
622 copy_size
= tg
->attrib
[attr
].copy_size
;
623 if (likely(copy_size
>= 0)) {
624 memcpy(dst
, src
, copy_size
);
626 tg
->attrib
[attr
].fetch(data
, src
, 0, 0);
629 debug_printf("Fetch linear attr %d from %p stride %d index %d: "
630 " %f, %f, %f, %f \n",
632 tg
->attrib
[attr
].input_ptr
,
633 tg
->attrib
[attr
].input_stride
,
635 data
[0], data
[1],data
[2], data
[3]);
637 tg
->attrib
[attr
].emit(data
, dst
);
640 if (likely(tg
->attrib
[attr
].copy_size
>= 0)) {
641 memcpy(data
, &instance_id
, 4);
643 data
[0] = (float)instance_id
;
644 tg
->attrib
[attr
].emit(data
, dst
);
651 * Fetch vertex attributes for 'count' vertices.
653 static void PIPE_CDECL
654 generic_run_elts(struct translate
*translate
,
655 const unsigned *elts
,
657 unsigned start_instance
,
658 unsigned instance_id
,
661 struct translate_generic
*tg
= translate_generic(translate
);
662 char *vert
= output_buffer
;
665 for (i
= 0; i
< count
; i
++) {
666 generic_run_one(tg
, *elts
++, start_instance
, instance_id
, vert
);
667 vert
+= tg
->translate
.key
.output_stride
;
671 static void PIPE_CDECL
672 generic_run_elts16(struct translate
*translate
,
673 const uint16_t *elts
,
675 unsigned start_instance
,
676 unsigned instance_id
,
679 struct translate_generic
*tg
= translate_generic(translate
);
680 char *vert
= output_buffer
;
683 for (i
= 0; i
< count
; i
++) {
684 generic_run_one(tg
, *elts
++, start_instance
, instance_id
, vert
);
685 vert
+= tg
->translate
.key
.output_stride
;
689 static void PIPE_CDECL
690 generic_run_elts8(struct translate
*translate
,
693 unsigned start_instance
,
694 unsigned instance_id
,
697 struct translate_generic
*tg
= translate_generic(translate
);
698 char *vert
= output_buffer
;
701 for (i
= 0; i
< count
; i
++) {
702 generic_run_one(tg
, *elts
++, start_instance
, instance_id
, vert
);
703 vert
+= tg
->translate
.key
.output_stride
;
707 static void PIPE_CDECL
708 generic_run(struct translate
*translate
,
711 unsigned start_instance
,
712 unsigned instance_id
,
715 struct translate_generic
*tg
= translate_generic(translate
);
716 char *vert
= output_buffer
;
719 for (i
= 0; i
< count
; i
++) {
720 generic_run_one(tg
, start
+ i
, start_instance
, instance_id
, vert
);
721 vert
+= tg
->translate
.key
.output_stride
;
728 generic_set_buffer(struct translate
*translate
,
734 struct translate_generic
*tg
= translate_generic(translate
);
737 for (i
= 0; i
< tg
->nr_attrib
; i
++) {
738 if (tg
->attrib
[i
].buffer
== buf
) {
739 tg
->attrib
[i
].input_ptr
= ((const uint8_t *)ptr
+
740 tg
->attrib
[i
].input_offset
);
741 tg
->attrib
[i
].input_stride
= stride
;
742 tg
->attrib
[i
].max_index
= max_index
;
749 generic_release(struct translate
*translate
)
757 is_legal_int_format_combo(const struct util_format_description
*src
,
758 const struct util_format_description
*dst
)
761 unsigned nr
= MIN2(src
->nr_channels
, dst
->nr_channels
);
763 for (i
= 0; i
< nr
; i
++) {
764 /* The signs must match. */
765 if (src
->channel
[i
].type
!= dst
->channel
[i
].type
) {
769 /* Integers must not lose precision at any point in the pipeline. */
770 if (src
->channel
[i
].size
> dst
->channel
[i
].size
) {
778 translate_generic_create(const struct translate_key
*key
)
780 struct translate_generic
*tg
= CALLOC_STRUCT(translate_generic
);
786 assert(key
->nr_elements
<= TRANSLATE_MAX_ATTRIBS
);
788 tg
->translate
.key
= *key
;
789 tg
->translate
.release
= generic_release
;
790 tg
->translate
.set_buffer
= generic_set_buffer
;
791 tg
->translate
.run_elts
= generic_run_elts
;
792 tg
->translate
.run_elts16
= generic_run_elts16
;
793 tg
->translate
.run_elts8
= generic_run_elts8
;
794 tg
->translate
.run
= generic_run
;
796 for (i
= 0; i
< key
->nr_elements
; i
++) {
797 const struct util_format_description
*format_desc
=
798 util_format_description(key
->element
[i
].input_format
);
802 tg
->attrib
[i
].type
= key
->element
[i
].type
;
804 if (format_desc
->channel
[0].pure_integer
) {
805 const struct util_format_description
*out_format_desc
=
806 util_format_description(key
->element
[i
].output_format
);
808 if (!is_legal_int_format_combo(format_desc
, out_format_desc
)) {
814 tg
->attrib
[i
].fetch
=
815 util_format_fetch_rgba_func(key
->element
[i
].input_format
);
816 tg
->attrib
[i
].buffer
= key
->element
[i
].input_buffer
;
817 tg
->attrib
[i
].input_offset
= key
->element
[i
].input_offset
;
818 tg
->attrib
[i
].instance_divisor
= key
->element
[i
].instance_divisor
;
820 tg
->attrib
[i
].output_offset
= key
->element
[i
].output_offset
;
822 tg
->attrib
[i
].copy_size
= -1;
823 if (tg
->attrib
[i
].type
== TRANSLATE_ELEMENT_INSTANCE_ID
) {
824 if (key
->element
[i
].output_format
== PIPE_FORMAT_R32_USCALED
825 || key
->element
[i
].output_format
== PIPE_FORMAT_R32_SSCALED
)
826 tg
->attrib
[i
].copy_size
= 4;
828 if (key
->element
[i
].input_format
== key
->element
[i
].output_format
829 && format_desc
->block
.width
== 1
830 && format_desc
->block
.height
== 1
831 && !(format_desc
->block
.bits
& 7))
832 tg
->attrib
[i
].copy_size
= format_desc
->block
.bits
>> 3;
835 if (tg
->attrib
[i
].copy_size
< 0)
836 tg
->attrib
[i
].emit
= get_emit_func(key
->element
[i
].output_format
);
838 tg
->attrib
[i
].emit
= NULL
;
841 tg
->nr_attrib
= key
->nr_elements
;
843 return &tg
->translate
;
847 translate_generic_is_output_format_supported(enum pipe_format format
)
850 case PIPE_FORMAT_R64G64B64A64_FLOAT
: return TRUE
;
851 case PIPE_FORMAT_R64G64B64_FLOAT
: return TRUE
;
852 case PIPE_FORMAT_R64G64_FLOAT
: return TRUE
;
853 case PIPE_FORMAT_R64_FLOAT
: return TRUE
;
855 case PIPE_FORMAT_R32G32B32A32_FLOAT
: return TRUE
;
856 case PIPE_FORMAT_R32G32B32_FLOAT
: return TRUE
;
857 case PIPE_FORMAT_R32G32_FLOAT
: return TRUE
;
858 case PIPE_FORMAT_R32_FLOAT
: return TRUE
;
860 case PIPE_FORMAT_R16G16B16A16_FLOAT
: return TRUE
;
861 case PIPE_FORMAT_R16G16B16_FLOAT
: return TRUE
;
862 case PIPE_FORMAT_R16G16_FLOAT
: return TRUE
;
863 case PIPE_FORMAT_R16_FLOAT
: return TRUE
;
865 case PIPE_FORMAT_R32G32B32A32_USCALED
: return TRUE
;
866 case PIPE_FORMAT_R32G32B32_USCALED
: return TRUE
;
867 case PIPE_FORMAT_R32G32_USCALED
: return TRUE
;
868 case PIPE_FORMAT_R32_USCALED
: return TRUE
;
870 case PIPE_FORMAT_R32G32B32A32_SSCALED
: return TRUE
;
871 case PIPE_FORMAT_R32G32B32_SSCALED
: return TRUE
;
872 case PIPE_FORMAT_R32G32_SSCALED
: return TRUE
;
873 case PIPE_FORMAT_R32_SSCALED
: return TRUE
;
875 case PIPE_FORMAT_R32G32B32A32_UNORM
: return TRUE
;
876 case PIPE_FORMAT_R32G32B32_UNORM
: return TRUE
;
877 case PIPE_FORMAT_R32G32_UNORM
: return TRUE
;
878 case PIPE_FORMAT_R32_UNORM
: return TRUE
;
880 case PIPE_FORMAT_R32G32B32A32_SNORM
: return TRUE
;
881 case PIPE_FORMAT_R32G32B32_SNORM
: return TRUE
;
882 case PIPE_FORMAT_R32G32_SNORM
: return TRUE
;
883 case PIPE_FORMAT_R32_SNORM
: return TRUE
;
885 case PIPE_FORMAT_R16G16B16A16_USCALED
: return TRUE
;
886 case PIPE_FORMAT_R16G16B16_USCALED
: return TRUE
;
887 case PIPE_FORMAT_R16G16_USCALED
: return TRUE
;
888 case PIPE_FORMAT_R16_USCALED
: return TRUE
;
890 case PIPE_FORMAT_R16G16B16A16_SSCALED
: return TRUE
;
891 case PIPE_FORMAT_R16G16B16_SSCALED
: return TRUE
;
892 case PIPE_FORMAT_R16G16_SSCALED
: return TRUE
;
893 case PIPE_FORMAT_R16_SSCALED
: return TRUE
;
895 case PIPE_FORMAT_R16G16B16A16_UNORM
: return TRUE
;
896 case PIPE_FORMAT_R16G16B16_UNORM
: return TRUE
;
897 case PIPE_FORMAT_R16G16_UNORM
: return TRUE
;
898 case PIPE_FORMAT_R16_UNORM
: return TRUE
;
900 case PIPE_FORMAT_R16G16B16A16_SNORM
: return TRUE
;
901 case PIPE_FORMAT_R16G16B16_SNORM
: return TRUE
;
902 case PIPE_FORMAT_R16G16_SNORM
: return TRUE
;
903 case PIPE_FORMAT_R16_SNORM
: return TRUE
;
905 case PIPE_FORMAT_R8G8B8A8_USCALED
: return TRUE
;
906 case PIPE_FORMAT_R8G8B8_USCALED
: return TRUE
;
907 case PIPE_FORMAT_R8G8_USCALED
: return TRUE
;
908 case PIPE_FORMAT_R8_USCALED
: return TRUE
;
910 case PIPE_FORMAT_R8G8B8A8_SSCALED
: return TRUE
;
911 case PIPE_FORMAT_R8G8B8_SSCALED
: return TRUE
;
912 case PIPE_FORMAT_R8G8_SSCALED
: return TRUE
;
913 case PIPE_FORMAT_R8_SSCALED
: return TRUE
;
915 case PIPE_FORMAT_R8G8B8A8_UNORM
: return TRUE
;
916 case PIPE_FORMAT_R8G8B8_UNORM
: return TRUE
;
917 case PIPE_FORMAT_R8G8_UNORM
: return TRUE
;
918 case PIPE_FORMAT_R8_UNORM
: return TRUE
;
920 case PIPE_FORMAT_R8G8B8A8_SNORM
: return TRUE
;
921 case PIPE_FORMAT_R8G8B8_SNORM
: return TRUE
;
922 case PIPE_FORMAT_R8G8_SNORM
: return TRUE
;
923 case PIPE_FORMAT_R8_SNORM
: return TRUE
;
925 case PIPE_FORMAT_A8R8G8B8_UNORM
: return TRUE
;
926 case PIPE_FORMAT_B8G8R8A8_UNORM
: return TRUE
;
928 case PIPE_FORMAT_R32G32B32A32_UINT
: return TRUE
;
929 case PIPE_FORMAT_R32G32B32_UINT
: return TRUE
;
930 case PIPE_FORMAT_R32G32_UINT
: return TRUE
;
931 case PIPE_FORMAT_R32_UINT
: return TRUE
;
933 case PIPE_FORMAT_R16G16B16A16_UINT
: return TRUE
;
934 case PIPE_FORMAT_R16G16B16_UINT
: return TRUE
;
935 case PIPE_FORMAT_R16G16_UINT
: return TRUE
;
936 case PIPE_FORMAT_R16_UINT
: return TRUE
;
938 case PIPE_FORMAT_R8G8B8A8_UINT
: return TRUE
;
939 case PIPE_FORMAT_R8G8B8_UINT
: return TRUE
;
940 case PIPE_FORMAT_R8G8_UINT
: return TRUE
;
941 case PIPE_FORMAT_R8_UINT
: return TRUE
;
943 case PIPE_FORMAT_R32G32B32A32_SINT
: return TRUE
;
944 case PIPE_FORMAT_R32G32B32_SINT
: return TRUE
;
945 case PIPE_FORMAT_R32G32_SINT
: return TRUE
;
946 case PIPE_FORMAT_R32_SINT
: return TRUE
;
948 case PIPE_FORMAT_R16G16B16A16_SINT
: return TRUE
;
949 case PIPE_FORMAT_R16G16B16_SINT
: return TRUE
;
950 case PIPE_FORMAT_R16G16_SINT
: return TRUE
;
951 case PIPE_FORMAT_R16_SINT
: return TRUE
;
953 case PIPE_FORMAT_R8G8B8A8_SINT
: return TRUE
;
954 case PIPE_FORMAT_R8G8B8_SINT
: return TRUE
;
955 case PIPE_FORMAT_R8G8_SINT
: return TRUE
;
956 case PIPE_FORMAT_R8_SINT
: return TRUE
;
958 case PIPE_FORMAT_B10G10R10A2_UNORM
: return TRUE
;
959 case PIPE_FORMAT_B10G10R10A2_USCALED
: return TRUE
;
960 case PIPE_FORMAT_B10G10R10A2_SNORM
: return TRUE
;
961 case PIPE_FORMAT_B10G10R10A2_SSCALED
: return TRUE
;
963 case PIPE_FORMAT_R10G10B10A2_UNORM
: return TRUE
;
964 case PIPE_FORMAT_R10G10B10A2_USCALED
: return TRUE
;
965 case PIPE_FORMAT_R10G10B10A2_SNORM
: return TRUE
;
966 case PIPE_FORMAT_R10G10B10A2_SSCALED
: return TRUE
;
968 default: return FALSE
;