freedreno/a3xx: only enable blend clamp for non-float formats
[mesa.git] / src / gallium / drivers / freedreno / a3xx / fd3_util.c
/* -*- mode: C; c-file-style: "k&r"; tab-width: 4; indent-tabs-mode: t; -*- */
2
3 /*
4 * Copyright (C) 2013 Rob Clark <robclark@freedesktop.org>
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice (including the next
14 * paragraph) shall be included in all copies or substantial portions of the
15 * Software.
16 *
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
23 * SOFTWARE.
24 *
25 * Authors:
26 * Rob Clark <robclark@freedesktop.org>
27 */
28
29 #include "pipe/p_defines.h"
30 #include "util/u_format.h"
31
32 #include "fd3_util.h"
33
34 /* convert pipe format to vertex buffer format: */
35 enum a3xx_vtx_fmt
36 fd3_pipe2vtx(enum pipe_format format)
37 {
38 switch (format) {
39 /* 8-bit buffers. */
40 case PIPE_FORMAT_R8_UNORM:
41 return VFMT_NORM_UBYTE_8;
42
43 case PIPE_FORMAT_R8_SNORM:
44 return VFMT_NORM_BYTE_8;
45
46 case PIPE_FORMAT_R8_UINT:
47 case PIPE_FORMAT_R8_USCALED:
48 return VFMT_UBYTE_8;
49
50 case PIPE_FORMAT_R8_SINT:
51 case PIPE_FORMAT_R8_SSCALED:
52 return VFMT_BYTE_8;
53
54 /* 16-bit buffers. */
55 case PIPE_FORMAT_R16_UNORM:
56 case PIPE_FORMAT_Z16_UNORM:
57 return VFMT_NORM_USHORT_16;
58
59 case PIPE_FORMAT_R16_SNORM:
60 return VFMT_NORM_SHORT_16;
61
62 case PIPE_FORMAT_R16_UINT:
63 case PIPE_FORMAT_R16_USCALED:
64 return VFMT_USHORT_16;
65
66 case PIPE_FORMAT_R16_SINT:
67 case PIPE_FORMAT_R16_SSCALED:
68 return VFMT_SHORT_16;
69
70 case PIPE_FORMAT_R16_FLOAT:
71 return VFMT_FLOAT_16;
72
73 case PIPE_FORMAT_R8G8_UNORM:
74 return VFMT_NORM_UBYTE_8_8;
75
76 case PIPE_FORMAT_R8G8_SNORM:
77 return VFMT_NORM_BYTE_8_8;
78
79 case PIPE_FORMAT_R8G8_UINT:
80 case PIPE_FORMAT_R8G8_USCALED:
81 return VFMT_UBYTE_8_8;
82
83 case PIPE_FORMAT_R8G8_SINT:
84 case PIPE_FORMAT_R8G8_SSCALED:
85 return VFMT_BYTE_8_8;
86
87 /* 24-bit buffers. */
88 case PIPE_FORMAT_R8G8B8_UNORM:
89 return VFMT_NORM_UBYTE_8_8_8;
90
91 case PIPE_FORMAT_R8G8B8_SNORM:
92 return VFMT_NORM_BYTE_8_8_8;
93
94 case PIPE_FORMAT_R8G8B8_UINT:
95 case PIPE_FORMAT_R8G8B8_USCALED:
96 return VFMT_UBYTE_8_8_8;
97
98 case PIPE_FORMAT_R8G8B8_SINT:
99 case PIPE_FORMAT_R8G8B8_SSCALED:
100 return VFMT_BYTE_8_8_8;
101
102 /* 32-bit buffers. */
103 case PIPE_FORMAT_A8B8G8R8_UNORM:
104 case PIPE_FORMAT_A8R8G8B8_UNORM:
105 case PIPE_FORMAT_B8G8R8A8_UNORM:
106 case PIPE_FORMAT_R8G8B8A8_UNORM:
107 return VFMT_NORM_UBYTE_8_8_8_8;
108
109 case PIPE_FORMAT_R8G8B8A8_SNORM:
110 return VFMT_NORM_BYTE_8_8_8_8;
111
112 case PIPE_FORMAT_R8G8B8A8_UINT:
113 case PIPE_FORMAT_R8G8B8A8_USCALED:
114 return VFMT_UBYTE_8_8_8_8;
115
116 case PIPE_FORMAT_R8G8B8A8_SINT:
117 case PIPE_FORMAT_R8G8B8A8_SSCALED:
118 return VFMT_BYTE_8_8_8_8;
119
120 case PIPE_FORMAT_R16G16_SSCALED:
121 case PIPE_FORMAT_R16G16_SINT:
122 return VFMT_SHORT_16_16;
123
124 case PIPE_FORMAT_R16G16_FLOAT:
125 return VFMT_FLOAT_16_16;
126
127 case PIPE_FORMAT_R16G16_UINT:
128 case PIPE_FORMAT_R16G16_USCALED:
129 return VFMT_USHORT_16_16;
130
131 case PIPE_FORMAT_R16G16_UNORM:
132 return VFMT_NORM_USHORT_16_16;
133
134 case PIPE_FORMAT_R16G16_SNORM:
135 return VFMT_NORM_SHORT_16_16;
136
137 case PIPE_FORMAT_R32_UINT:
138 case PIPE_FORMAT_R32_USCALED:
139 return VFMT_UINT_32;
140
141 case PIPE_FORMAT_R32_SINT:
142 case PIPE_FORMAT_R32_SSCALED:
143 return VFMT_INT_32;
144
145 case PIPE_FORMAT_R10G10B10A2_UNORM:
146 return VFMT_NORM_UINT_10_10_10_2;
147
148 case PIPE_FORMAT_R10G10B10A2_SNORM:
149 return VFMT_NORM_INT_10_10_10_2;
150
151 case PIPE_FORMAT_R10G10B10A2_UINT:
152 case PIPE_FORMAT_R10G10B10A2_USCALED:
153 return VFMT_UINT_10_10_10_2;
154
155 case PIPE_FORMAT_R10G10B10A2_SSCALED:
156 return VFMT_INT_10_10_10_2;
157
158 /* 48-bit buffers. */
159 case PIPE_FORMAT_R16G16B16_FLOAT:
160 return VFMT_FLOAT_16_16_16;
161
162 case PIPE_FORMAT_R16G16B16_SINT:
163 case PIPE_FORMAT_R16G16B16_SSCALED:
164 return VFMT_SHORT_16_16_16;
165
166 case PIPE_FORMAT_R16G16B16_UINT:
167 case PIPE_FORMAT_R16G16B16_USCALED:
168 return VFMT_USHORT_16_16_16;
169
170 case PIPE_FORMAT_R16G16B16_SNORM:
171 return VFMT_NORM_SHORT_16_16_16;
172
173 case PIPE_FORMAT_R16G16B16_UNORM:
174 return VFMT_NORM_USHORT_16_16_16;
175
176 case PIPE_FORMAT_R32_FLOAT:
177 case PIPE_FORMAT_Z32_FLOAT:
178 return VFMT_FLOAT_32;
179
180 case PIPE_FORMAT_R32_FIXED:
181 return VFMT_FIXED_32;
182
183 /* 64-bit buffers. */
184 case PIPE_FORMAT_R16G16B16A16_UNORM:
185 return VFMT_NORM_USHORT_16_16_16_16;
186
187 case PIPE_FORMAT_R16G16B16A16_SNORM:
188 return VFMT_NORM_SHORT_16_16_16_16;
189
190 case PIPE_FORMAT_R16G16B16A16_UINT:
191 case PIPE_FORMAT_R16G16B16A16_USCALED:
192 return VFMT_USHORT_16_16_16_16;
193
194 case PIPE_FORMAT_R16G16B16A16_SINT:
195 case PIPE_FORMAT_R16G16B16A16_SSCALED:
196 return VFMT_SHORT_16_16_16_16;
197
198 case PIPE_FORMAT_R32G32_FLOAT:
199 return VFMT_FLOAT_32_32;
200
201 case PIPE_FORMAT_R32G32_FIXED:
202 return VFMT_FIXED_32_32;
203
204 case PIPE_FORMAT_R16G16B16A16_FLOAT:
205 return VFMT_FLOAT_16_16_16_16;
206
207 case PIPE_FORMAT_R32G32_UINT:
208 case PIPE_FORMAT_R32G32_USCALED:
209 return VFMT_UINT_32_32;
210
211 case PIPE_FORMAT_R32G32_SINT:
212 case PIPE_FORMAT_R32G32_SSCALED:
213 return VFMT_INT_32_32;
214
215 /* 96-bit buffers. */
216 case PIPE_FORMAT_R32G32B32_FLOAT:
217 return VFMT_FLOAT_32_32_32;
218
219 case PIPE_FORMAT_R32G32B32_FIXED:
220 return VFMT_FIXED_32_32_32;
221
222 case PIPE_FORMAT_R32G32B32_UINT:
223 case PIPE_FORMAT_R32G32B32_USCALED:
224 return VFMT_UINT_32_32_32;
225
226 case PIPE_FORMAT_R32G32B32_SINT:
227 case PIPE_FORMAT_R32G32B32_SSCALED:
228 return VFMT_INT_32_32_32;
229
230 /* 128-bit buffers. */
231 case PIPE_FORMAT_R32G32B32A32_FLOAT:
232 return VFMT_FLOAT_32_32_32_32;
233
234 case PIPE_FORMAT_R32G32B32A32_FIXED:
235 return VFMT_FIXED_32_32_32_32;
236
237 case PIPE_FORMAT_R32G32B32A32_UINT:
238 case PIPE_FORMAT_R32G32B32A32_USCALED:
239 return VFMT_UINT_32_32_32_32;
240
241 case PIPE_FORMAT_R32G32B32A32_SINT:
242 case PIPE_FORMAT_R32G32B32A32_SSCALED:
243 return VFMT_INT_32_32_32_32;
244
245 /* TODO normalized 32bit int formats do not appear to be supported
246 * natively.. will require either shader variant or VFD_DECODE
247 * gymnastics like the blob driver does..
248 case PIPE_FORMAT_R32G32B32A32_SNORM:
249 case PIPE_FORMAT_R32G32B32A32_UNORM:
250 */
251
252 default:
253 return ~0;
254 }
255 }
256
257 /* convert pipe format to texture sampler format: */
258 enum a3xx_tex_fmt
259 fd3_pipe2tex(enum pipe_format format)
260 {
261 switch (format) {
262 case PIPE_FORMAT_L8_UNORM:
263 case PIPE_FORMAT_A8_UNORM:
264 case PIPE_FORMAT_I8_UNORM:
265 return TFMT_NORM_UINT_8;
266
267 case PIPE_FORMAT_R8G8_UNORM:
268 return TFMT_NORM_UINT_8_8;
269
270 case PIPE_FORMAT_B8G8R8A8_UNORM:
271 case PIPE_FORMAT_B8G8R8X8_UNORM:
272 case PIPE_FORMAT_R8G8B8A8_UNORM:
273 case PIPE_FORMAT_R8G8B8X8_UNORM:
274 case PIPE_FORMAT_B8G8R8A8_SRGB:
275 case PIPE_FORMAT_B8G8R8X8_SRGB:
276 case PIPE_FORMAT_R8G8B8A8_SRGB:
277 case PIPE_FORMAT_R8G8B8X8_SRGB:
278 return TFMT_NORM_UINT_8_8_8_8;
279
280 case PIPE_FORMAT_Z24X8_UNORM:
281 case PIPE_FORMAT_Z24_UNORM_S8_UINT:
282 return TFMT_NORM_UINT_X8Z24;
283
284 case PIPE_FORMAT_Z16_UNORM:
285 return TFMT_NORM_USHORT_Z16;
286
287 case PIPE_FORMAT_R16G16B16A16_FLOAT:
288 case PIPE_FORMAT_R16G16B16X16_FLOAT:
289 return TFMT_FLOAT_16_16_16_16;
290
291 case PIPE_FORMAT_R32G32B32A32_FLOAT:
292 case PIPE_FORMAT_R32G32B32X32_FLOAT:
293 return TFMT_FLOAT_32_32_32_32;
294
295 // TODO add more..
296
297 default:
298 return ~0;
299 }
300 }
301
302 enum a3xx_tex_fetchsize
303 fd3_pipe2fetchsize(enum pipe_format format)
304 {
305 switch (format) {
306 case PIPE_FORMAT_L8_UNORM:
307 case PIPE_FORMAT_A8_UNORM:
308 case PIPE_FORMAT_I8_UNORM:
309 return TFETCH_1_BYTE;
310
311 case PIPE_FORMAT_Z16_UNORM:
312 return TFETCH_2_BYTE;
313
314 case PIPE_FORMAT_B8G8R8A8_UNORM:
315 case PIPE_FORMAT_B8G8R8X8_UNORM:
316 case PIPE_FORMAT_R8G8B8A8_UNORM:
317 case PIPE_FORMAT_R8G8B8X8_UNORM:
318 case PIPE_FORMAT_B8G8R8A8_SRGB:
319 case PIPE_FORMAT_B8G8R8X8_SRGB:
320 case PIPE_FORMAT_R8G8B8A8_SRGB:
321 case PIPE_FORMAT_R8G8B8X8_SRGB:
322 case PIPE_FORMAT_Z24X8_UNORM:
323 case PIPE_FORMAT_Z24_UNORM_S8_UINT:
324 return TFETCH_4_BYTE;
325
326 // TODO add more..
327
328 default:
329 return TFETCH_DISABLE; /* safe default */
330 }
331 }
332
333 /* convert pipe format to MRT / copydest format used for render-target: */
334 enum a3xx_color_fmt
335 fd3_pipe2color(enum pipe_format format)
336 {
337 switch (format) {
338 case PIPE_FORMAT_B8G8R8A8_UNORM:
339 case PIPE_FORMAT_B8G8R8X8_UNORM:
340 case PIPE_FORMAT_R8G8B8A8_UNORM:
341 return RB_R8G8B8A8_UNORM;
342
343 case PIPE_FORMAT_Z16_UNORM:
344 return RB_R8G8_UNORM;
345
346 case PIPE_FORMAT_Z24X8_UNORM:
347 case PIPE_FORMAT_Z24_UNORM_S8_UINT:
348 /* for DEPTHX_24_8, blob driver also seems to use R8G8B8A8 fmt.. */
349 return RB_R8G8B8A8_UNORM;
350
351 case PIPE_FORMAT_R8_UNORM:
352 case PIPE_FORMAT_L8_UNORM:
353 return RB_R8_UNORM;
354
355 case PIPE_FORMAT_A8_UNORM:
356 return RB_A8_UNORM;
357
358 case PIPE_FORMAT_R16G16B16A16_FLOAT:
359 case PIPE_FORMAT_R16G16B16X16_FLOAT:
360 return RB_R16G16B16A16_FLOAT;
361
362 case PIPE_FORMAT_R32G32B32A32_FLOAT:
363 case PIPE_FORMAT_R32G32B32X32_FLOAT:
364 return RB_R32G32B32A32_FLOAT;
365
366 // TODO add more..
367
368 default:
369 return ~0;
370 }
371 }
372
373 /* we need to special case a bit the depth/stencil restore, because we are
374 * using the texture sampler to blit into the depth/stencil buffer, *not*
375 * into a color buffer. Otherwise fd3_tex_swiz() will do the wrong thing,
376 * as it is assuming that you are sampling into normal render target..
377 */
378 enum pipe_format
379 fd3_gmem_restore_format(enum pipe_format format)
380 {
381 switch (format) {
382 case PIPE_FORMAT_Z24X8_UNORM:
383 case PIPE_FORMAT_Z24_UNORM_S8_UINT:
384 return PIPE_FORMAT_R8G8B8A8_UNORM;
385 case PIPE_FORMAT_Z16_UNORM:
386 return PIPE_FORMAT_R8G8_UNORM;
387 default:
388 return format;
389 }
390 }
391
392 enum a3xx_color_swap
393 fd3_pipe2swap(enum pipe_format format)
394 {
395 switch (format) {
396 case PIPE_FORMAT_B8G8R8A8_UNORM:
397 case PIPE_FORMAT_B8G8R8X8_UNORM:
398 case PIPE_FORMAT_B8G8R8A8_SRGB:
399 case PIPE_FORMAT_B8G8R8X8_SRGB:
400 return WXYZ;
401
402 case PIPE_FORMAT_A8R8G8B8_UNORM:
403 case PIPE_FORMAT_X8R8G8B8_UNORM:
404 case PIPE_FORMAT_A8R8G8B8_SRGB:
405 case PIPE_FORMAT_X8R8G8B8_SRGB:
406 return ZYXW;
407
408 case PIPE_FORMAT_A8B8G8R8_UNORM:
409 case PIPE_FORMAT_X8B8G8R8_UNORM:
410 case PIPE_FORMAT_A8B8G8R8_SRGB:
411 case PIPE_FORMAT_X8B8G8R8_SRGB:
412 return XYZW;
413
414 case PIPE_FORMAT_R8G8B8A8_UNORM:
415 case PIPE_FORMAT_R8G8B8X8_UNORM:
416 case PIPE_FORMAT_Z24X8_UNORM:
417 case PIPE_FORMAT_Z24_UNORM_S8_UINT:
418 default:
419 return WZYX;
420 }
421 }
422
423 static inline enum a3xx_tex_swiz
424 tex_swiz(unsigned swiz)
425 {
426 switch (swiz) {
427 default:
428 case PIPE_SWIZZLE_RED: return A3XX_TEX_X;
429 case PIPE_SWIZZLE_GREEN: return A3XX_TEX_Y;
430 case PIPE_SWIZZLE_BLUE: return A3XX_TEX_Z;
431 case PIPE_SWIZZLE_ALPHA: return A3XX_TEX_W;
432 case PIPE_SWIZZLE_ZERO: return A3XX_TEX_ZERO;
433 case PIPE_SWIZZLE_ONE: return A3XX_TEX_ONE;
434 }
435 }
436
437 uint32_t
438 fd3_tex_swiz(enum pipe_format format, unsigned swizzle_r, unsigned swizzle_g,
439 unsigned swizzle_b, unsigned swizzle_a)
440 {
441 const struct util_format_description *desc =
442 util_format_description(format);
443 unsigned char swiz[4] = {
444 swizzle_r, swizzle_g, swizzle_b, swizzle_a,
445 }, rswiz[4];
446
447 util_format_compose_swizzles(desc->swizzle, swiz, rswiz);
448
449 return A3XX_TEX_CONST_0_SWIZ_X(tex_swiz(rswiz[0])) |
450 A3XX_TEX_CONST_0_SWIZ_Y(tex_swiz(rswiz[1])) |
451 A3XX_TEX_CONST_0_SWIZ_Z(tex_swiz(rswiz[2])) |
452 A3XX_TEX_CONST_0_SWIZ_W(tex_swiz(rswiz[3]));
453 }