92b88ef0e0093985853aa78be8dd488a0bdc3f23
[mesa.git] / src / gallium / drivers / vc5 / vc5_formats.c
1 /*
2 * Copyright © 2014-2017 Broadcom
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 /**
25 * @file vc5_formats.c
26 *
27 * Contains the table and accessors for VC5 texture and render target format
28 * support.
29 *
30 * The hardware has limited support for texture formats, and extremely limited
31 * support for render target formats. As a result, we emulate other formats
32 * in our shader code, and this stores the table for doing so.
33 */
34
35 #include "util/u_format.h"
36 #include "util/macros.h"
37
38 #include "vc5_context.h"
39 #include "broadcom/cle/v3d_packet_v33_pack.h"
40
/* Sentinel stored in vc5_format::rt_type for formats that cannot be used
 * as a render target.
 */
#define OUTPUT_IMAGE_FORMAT_NO 255

/**
 * One row of the format table, describing how a pipe format maps onto
 * the hardware's render target and texture formats.
 *
 * The member order matters: table rows may be written as positional
 * initializers, so do not reorder these fields.
 */
struct vc5_format {
        /** True for rows that were explicitly listed in the table. */
        bool present;

        /** A V3D33_OUTPUT_IMAGE_FORMAT_* value, or OUTPUT_IMAGE_FORMAT_NO
         * when the format is not renderable.
         */
        uint8_t rt_type;

        /** A V3D33_TEXTURE_DATA_FORMAT_* value. */
        uint8_t tex_type;

        /**
         * Channel swizzle.  It is used in three places: mapping the RGBA
         * shader output onto the tile buffer on store, mapping the RGBA
         * tile buffer back to shader input (for blending), and mapping
         * the rgba8888 texture sampler return value onto shader rgba
         * values.
         */
        uint8_t swizzle[4];

        /* Width of the texture return value: 16 for 16F/I/UI, 32 for
         * 32F/I/UI.
         */
        uint8_t return_size;

        /* Number of channels texturing returns when return_size == 32.
         * With return_size == 16 the return is always 2 pairs of 16 bit
         * values.
         */
        uint8_t return_channels;
};
69
/* Expands to a brace initializer for a 4-entry swizzle array; each argument
 * is the suffix of a PIPE_SWIZZLE_* name (X, Y, Z, W, 0 or 1).
 */
#define SWIZ(x, y, z, w) {                                      \
        PIPE_SWIZZLE_##x, PIPE_SWIZZLE_##y,                     \
        PIPE_SWIZZLE_##z, PIPE_SWIZZLE_##w,                     \
}

/* Expands to one table row, placed at index PIPE_FORMAT_<pipe> and marked
 * present.  rt and tex are suffixes of OUTPUT_IMAGE_FORMAT_* and
 * TEXTURE_DATA_FORMAT_* names respectively.
 *
 * The last two parameters are deliberately not called return_size /
 * return_channels: a macro parameter with the same spelling as a member
 * designator would be substituted into the designator as well.
 */
#define FORMAT(pipe, rt, tex, swiz, ret_size, ret_channels)     \
        [PIPE_FORMAT_##pipe] = {                                \
                .present = true,                                \
                .rt_type = OUTPUT_IMAGE_FORMAT_##rt,            \
                .tex_type = TEXTURE_DATA_FORMAT_##tex,          \
                .swizzle = swiz,                                \
                .return_size = ret_size,                        \
                .return_channels = ret_channels,                \
        }

/* Shorthand for the swizzles used by the format table. */
#define SWIZ_X001 SWIZ(X, 0, 0, 1)
#define SWIZ_XY01 SWIZ(X, Y, 0, 1)
#define SWIZ_XYZ1 SWIZ(X, Y, Z, 1)
#define SWIZ_XYZW SWIZ(X, Y, Z, W)
#define SWIZ_YZWX SWIZ(Y, Z, W, X)
#define SWIZ_YZW1 SWIZ(Y, Z, W, 1)
#define SWIZ_ZYXW SWIZ(Z, Y, X, W)
#define SWIZ_ZYX1 SWIZ(Z, Y, X, 1)
#define SWIZ_XXXY SWIZ(X, X, X, Y)
#define SWIZ_XXX1 SWIZ(X, X, X, 1)
#define SWIZ_XXXX SWIZ(X, X, X, X)
#define SWIZ_000X SWIZ(0, 0, 0, X)
99
100 static const struct vc5_format vc5_format_table[] = {
101 FORMAT(B8G8R8A8_UNORM, RGBA8, RGBA8, SWIZ_ZYXW, 16, 0),
102 FORMAT(B8G8R8X8_UNORM, RGBX8, RGBA8, SWIZ_ZYX1, 16, 0),
103 FORMAT(B8G8R8A8_SRGB, SRGB8_ALPHA8, RGBA8, SWIZ_ZYXW, 16, 0),
104 FORMAT(B8G8R8X8_SRGB, SRGBX8, RGBA8, SWIZ_ZYX1, 16, 0),
105 FORMAT(R8G8B8A8_UNORM, RGBA8, RGBA8, SWIZ_XYZW, 16, 0),
106 FORMAT(R8G8B8X8_UNORM, RGBX8, RGBA8, SWIZ_XYZ1, 16, 0),
107 FORMAT(R8G8B8A8_SNORM, NO, RGBA8_SNORM, SWIZ_XYZW, 16, 0),
108 FORMAT(R8G8B8X8_SNORM, NO, RGBA8_SNORM, SWIZ_XYZ1, 16, 0),
109 FORMAT(R10G10B10A2_UNORM, RGB10_A2, RGB10_A2, SWIZ_XYZW, 16, 0),
110
111 FORMAT(B4G4R4A4_UNORM, ABGR4444, RGBA4, SWIZ_YZWX, 16, 0),
112 FORMAT(B4G4R4X4_UNORM, ABGR4444, RGBA4, SWIZ_YZW1, 16, 0),
113
114 FORMAT(A1B5G5R5_UNORM, ABGR1555, RGB5_A1, SWIZ_XYZW, 16, 0),
115 FORMAT(X1B5G5R5_UNORM, ABGR1555, RGB5_A1, SWIZ_XYZ1, 16, 0),
116 FORMAT(B5G6R5_UNORM, BGR565, RGB565, SWIZ_XYZ1, 16, 0),
117
118 FORMAT(R8_UNORM, R8, R8, SWIZ_X001, 16, 0),
119 FORMAT(R8_SNORM, NO, R8_SNORM, SWIZ_X001, 16, 0),
120 FORMAT(R8G8_UNORM, RG8, RG8, SWIZ_XY01, 16, 0),
121 FORMAT(R8G8_SNORM, NO, RG8_SNORM, SWIZ_XY01, 16, 0),
122
123 FORMAT(R16_UNORM, NO, R16, SWIZ_X001, 32, 1),
124 FORMAT(R16_SNORM, NO, R16_SNORM, SWIZ_X001, 32, 1),
125 FORMAT(R16_FLOAT, R16F, R16F, SWIZ_X001, 16, 0),
126 FORMAT(R32_FLOAT, R32F, R32F, SWIZ_X001, 32, 1),
127
128 FORMAT(R16G16_UNORM, NO, RG16, SWIZ_XY01, 32, 2),
129 FORMAT(R16G16_SNORM, NO, RG16_SNORM, SWIZ_XY01, 32, 2),
130 FORMAT(R16G16_FLOAT, RG16F, RG16F, SWIZ_XY01, 16, 0),
131 FORMAT(R32G32_FLOAT, RG32F, RG32F, SWIZ_XY01, 32, 2),
132
133 FORMAT(R16G16B16A16_UNORM, NO, RGBA16, SWIZ_XYZW, 32, 4),
134 FORMAT(R16G16B16A16_SNORM, NO, RGBA16_SNORM, SWIZ_XYZW, 32, 4),
135 FORMAT(R16G16B16A16_FLOAT, RGBA16F, RGBA16F, SWIZ_XYZW, 16, 0),
136 FORMAT(R32G32B32A32_FLOAT, RGBA32F, RGBA32F, SWIZ_XYZW, 32, 4),
137
138 /* If we don't have L/A/LA16, mesa/st will fall back to RGBA16. */
139 FORMAT(L16_UNORM, NO, R16, SWIZ_XXX1, 32, 1),
140 FORMAT(L16_SNORM, NO, R16_SNORM, SWIZ_XXX1, 32, 1),
141 FORMAT(I16_UNORM, NO, R16, SWIZ_XXXX, 32, 1),
142 FORMAT(I16_SNORM, NO, R16_SNORM, SWIZ_XXXX, 32, 1),
143 FORMAT(A16_UNORM, NO, R16, SWIZ_000X, 32, 1),
144 FORMAT(A16_SNORM, NO, R16_SNORM, SWIZ_000X, 32, 1),
145 FORMAT(L16A16_UNORM, NO, RG16, SWIZ_XXXY, 32, 2),
146 FORMAT(L16A16_SNORM, NO, RG16_SNORM, SWIZ_XXXY, 32, 2),
147
148 FORMAT(A8_UNORM, NO, R8, SWIZ_000X, 16, 0),
149 FORMAT(L8_UNORM, NO, R8, SWIZ_XXX1, 16, 0),
150 FORMAT(I8_UNORM, NO, R8, SWIZ_XXXX, 16, 0),
151 FORMAT(L8A8_UNORM, NO, RG8, SWIZ_XXXY, 16, 0),
152
153 FORMAT(R8_SINT, R8I, S8, SWIZ_X001, 16, 0),
154 FORMAT(R8_UINT, R8UI, S8, SWIZ_X001, 16, 0),
155 FORMAT(R8G8_SINT, RG8I, S16, SWIZ_XY01, 16, 0),
156 FORMAT(R8G8_UINT, RG8UI, S16, SWIZ_XY01, 16, 0),
157 FORMAT(R8G8B8A8_SINT, RGBA8I, R32F, SWIZ_XYZW, 16, 0),
158 FORMAT(R8G8B8A8_UINT, RGBA8UI, R32F, SWIZ_XYZW, 16, 0),
159
160 FORMAT(R16_SINT, R16I, S16, SWIZ_X001, 16, 0),
161 FORMAT(R16_UINT, R16UI, S16, SWIZ_X001, 16, 0),
162 FORMAT(R16G16_SINT, RG16I, R32F, SWIZ_XY01, 16, 0),
163 FORMAT(R16G16_UINT, RG16UI, R32F, SWIZ_XY01, 16, 0),
164 FORMAT(R16G16B16A16_SINT, RGBA16I, RG32F, SWIZ_XYZW, 16, 0),
165 FORMAT(R16G16B16A16_UINT, RGBA16UI, RG32F, SWIZ_XYZW, 16, 0),
166
167 FORMAT(R32_SINT, R32I, R32F, SWIZ_X001, 16, 0),
168 FORMAT(R32_UINT, R32UI, R32F, SWIZ_X001, 16, 0),
169 FORMAT(R32G32_SINT, RG32I, RG32F, SWIZ_XY01, 16, 0),
170 FORMAT(R32G32_UINT, RG32UI, RG32F, SWIZ_XY01, 16, 0),
171 FORMAT(R32G32B32A32_SINT, RGBA32I, RGBA32F, SWIZ_XYZW, 16, 0),
172 FORMAT(R32G32B32A32_UINT, RGBA32UI, RGBA32F, SWIZ_XYZW, 16, 0),
173
174 FORMAT(A8_SINT, R8I, S8, SWIZ_000X, 16, 0),
175 FORMAT(A8_UINT, R8UI, S8, SWIZ_000X, 16, 0),
176 FORMAT(A16_SINT, R16I, S16, SWIZ_000X, 16, 0),
177 FORMAT(A16_UINT, R16UI, S16, SWIZ_000X, 16, 0),
178 FORMAT(A32_SINT, R32I, R32F, SWIZ_000X, 16, 0),
179 FORMAT(A32_UINT, R32UI, R32F, SWIZ_000X, 16, 0),
180
181 FORMAT(R11G11B10_FLOAT, R11F_G11F_B10F, R11F_G11F_B10F, SWIZ_XYZW, 16, 0),
182 FORMAT(R9G9B9E5_FLOAT, NO, RGB9_E5, SWIZ_XYZW, 16, 0),
183
184 FORMAT(S8_UINT_Z24_UNORM, DEPTH24_STENCIL8, DEPTH24_X8, SWIZ_X001, 32, 1),
185 FORMAT(X8Z24_UNORM, DEPTH24_STENCIL8, DEPTH24_X8, SWIZ_X001, 32, 1),
186 FORMAT(S8X24_UINT, NO, R32F, SWIZ_X001, 32, 1),
187 FORMAT(Z32_FLOAT, DEPTH_COMPONENT32F, R32F, SWIZ_X001, 32, 1),
188 FORMAT(Z16_UNORM, DEPTH_COMPONENT16, DEPTH_COMP16, SWIZ_X001, 32, 1),
189
190 /* Pretend we support this, but it'll be separate Z32F depth and S8. */
191 FORMAT(Z32_FLOAT_S8X24_UINT, DEPTH_COMPONENT32F, R32F, SWIZ_X001, 32, 1),
192
193 FORMAT(ETC2_RGB8, NO, RGB8_ETC2, SWIZ_XYZ1, 16, 0),
194 FORMAT(ETC2_SRGB8, NO, RGB8_ETC2, SWIZ_XYZ1, 16, 0),
195 FORMAT(ETC2_RGB8A1, NO, RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, 0),
196 FORMAT(ETC2_SRGB8A1, NO, RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, 0),
197 FORMAT(ETC2_RGBA8, NO, RGBA8_ETC2_EAC, SWIZ_XYZW, 16, 0),
198 FORMAT(ETC2_SRGBA8, NO, RGBA8_ETC2_EAC, SWIZ_XYZW, 16, 0),
199 FORMAT(ETC2_R11_UNORM, NO, R11_EAC, SWIZ_X001, 16, 0),
200 FORMAT(ETC2_R11_SNORM, NO, SIGNED_R11_EAC, SWIZ_X001, 16, 0),
201 FORMAT(ETC2_RG11_UNORM, NO, RG11_EAC, SWIZ_XY01, 16, 0),
202 FORMAT(ETC2_RG11_SNORM, NO, SIGNED_RG11_EAC, SWIZ_XY01, 16, 0),
203
204 FORMAT(DXT1_RGB, NO, BC1, SWIZ_XYZ1, 16, 0),
205 FORMAT(DXT3_RGBA, NO, BC2, SWIZ_XYZ1, 16, 0),
206 FORMAT(DXT5_RGBA, NO, BC3, SWIZ_XYZ1, 16, 0),
207 };
208
209 static const struct vc5_format *
210 get_format(enum pipe_format f)
211 {
212 if (f >= ARRAY_SIZE(vc5_format_table) ||
213 !vc5_format_table[f].present)
214 return NULL;
215 else
216 return &vc5_format_table[f];
217 }
218
219 bool
220 vc5_rt_format_supported(enum pipe_format f)
221 {
222 const struct vc5_format *vf = get_format(f);
223
224 if (!vf)
225 return false;
226
227 return vf->rt_type != OUTPUT_IMAGE_FORMAT_NO;
228 }
229
230 uint8_t
231 vc5_get_rt_format(enum pipe_format f)
232 {
233 const struct vc5_format *vf = get_format(f);
234
235 if (!vf)
236 return 0;
237
238 return vf->rt_type;
239 }
240
241 bool
242 vc5_tex_format_supported(enum pipe_format f)
243 {
244 const struct vc5_format *vf = get_format(f);
245
246 return vf != NULL;
247 }
248
249 uint8_t
250 vc5_get_tex_format(enum pipe_format f)
251 {
252 const struct vc5_format *vf = get_format(f);
253
254 if (!vf)
255 return 0;
256
257 return vf->tex_type;
258 }
259
260 uint8_t
261 vc5_get_tex_return_size(enum pipe_format f)
262 {
263 const struct vc5_format *vf = get_format(f);
264
265 if (!vf)
266 return 0;
267
268 return vf->return_size;
269 }
270
271 uint8_t
272 vc5_get_tex_return_channels(enum pipe_format f)
273 {
274 const struct vc5_format *vf = get_format(f);
275
276 if (!vf)
277 return 0;
278
279 return vf->return_channels;
280 }
281
282 const uint8_t *
283 vc5_get_format_swizzle(enum pipe_format f)
284 {
285 const struct vc5_format *vf = get_format(f);
286 static const uint8_t fallback[] = {0, 1, 2, 3};
287
288 if (!vf)
289 return fallback;
290
291 return vf->swizzle;
292 }
293
294 void
295 vc5_get_internal_type_bpp_for_output_format(uint32_t format,
296 uint32_t *type,
297 uint32_t *bpp)
298 {
299 switch (format) {
300 case OUTPUT_IMAGE_FORMAT_RGBA8:
301 case OUTPUT_IMAGE_FORMAT_RGBX8:
302 case OUTPUT_IMAGE_FORMAT_RGB8:
303 case OUTPUT_IMAGE_FORMAT_RG8:
304 case OUTPUT_IMAGE_FORMAT_R8:
305 case OUTPUT_IMAGE_FORMAT_ABGR4444:
306 case OUTPUT_IMAGE_FORMAT_BGR565:
307 case OUTPUT_IMAGE_FORMAT_ABGR1555:
308 *type = INTERNAL_TYPE_8;
309 *bpp = INTERNAL_BPP_32;
310 break;
311
312 case OUTPUT_IMAGE_FORMAT_RGBA8I:
313 case OUTPUT_IMAGE_FORMAT_RG8I:
314 case OUTPUT_IMAGE_FORMAT_R8I:
315 *type = INTERNAL_TYPE_8I;
316 *bpp = INTERNAL_BPP_32;
317 break;
318
319 case OUTPUT_IMAGE_FORMAT_RGBA8UI:
320 case OUTPUT_IMAGE_FORMAT_RG8UI:
321 case OUTPUT_IMAGE_FORMAT_R8UI:
322 *type = INTERNAL_TYPE_8UI;
323 *bpp = INTERNAL_BPP_32;
324 break;
325
326 case OUTPUT_IMAGE_FORMAT_SRGB8_ALPHA8:
327 case OUTPUT_IMAGE_FORMAT_SRGB:
328 case OUTPUT_IMAGE_FORMAT_RGB10_A2:
329 case OUTPUT_IMAGE_FORMAT_R11F_G11F_B10F:
330 case OUTPUT_IMAGE_FORMAT_SRGBX8:
331 case OUTPUT_IMAGE_FORMAT_RGBA16F:
332 /* Note that sRGB RTs are stored in the tile buffer at 16F,
333 * and the conversion to sRGB happens at tilebuffer
334 * load/store.
335 */
336 *type = INTERNAL_TYPE_16F;
337 *bpp = INTERNAL_BPP_64;
338 break;
339
340 case OUTPUT_IMAGE_FORMAT_RG16F:
341 case OUTPUT_IMAGE_FORMAT_R16F:
342 *type = INTERNAL_TYPE_16F;
343 /* Use 64bpp to make sure the TLB doesn't throw away the alpha
344 * channel before alpha test happens.
345 */
346 *bpp = INTERNAL_BPP_64;
347 break;
348
349 case OUTPUT_IMAGE_FORMAT_RGBA16I:
350 *type = INTERNAL_TYPE_16I;
351 *bpp = INTERNAL_BPP_64;
352 break;
353 case OUTPUT_IMAGE_FORMAT_RG16I:
354 case OUTPUT_IMAGE_FORMAT_R16I:
355 *type = INTERNAL_TYPE_16I;
356 *bpp = INTERNAL_BPP_32;
357 break;
358
359 case OUTPUT_IMAGE_FORMAT_RGBA16UI:
360 *type = INTERNAL_TYPE_16UI;
361 *bpp = INTERNAL_BPP_64;
362 break;
363 case OUTPUT_IMAGE_FORMAT_RG16UI:
364 case OUTPUT_IMAGE_FORMAT_R16UI:
365 *type = INTERNAL_TYPE_16UI;
366 *bpp = INTERNAL_BPP_32;
367 break;
368
369 case OUTPUT_IMAGE_FORMAT_RGBA32I:
370 *type = INTERNAL_TYPE_32I;
371 *bpp = INTERNAL_BPP_128;
372 break;
373 case OUTPUT_IMAGE_FORMAT_RG32I:
374 *type = INTERNAL_TYPE_32I;
375 *bpp = INTERNAL_BPP_64;
376 break;
377 case OUTPUT_IMAGE_FORMAT_R32I:
378 *type = INTERNAL_TYPE_32I;
379 *bpp = INTERNAL_BPP_32;
380 break;
381
382 case OUTPUT_IMAGE_FORMAT_RGBA32UI:
383 *type = INTERNAL_TYPE_32UI;
384 *bpp = INTERNAL_BPP_128;
385 break;
386 case OUTPUT_IMAGE_FORMAT_RG32UI:
387 *type = INTERNAL_TYPE_32UI;
388 *bpp = INTERNAL_BPP_64;
389 break;
390 case OUTPUT_IMAGE_FORMAT_R32UI:
391 *type = INTERNAL_TYPE_32UI;
392 *bpp = INTERNAL_BPP_32;
393 break;
394
395 case OUTPUT_IMAGE_FORMAT_RGBA32F:
396 *type = INTERNAL_TYPE_32F;
397 *bpp = INTERNAL_BPP_128;
398 break;
399 case OUTPUT_IMAGE_FORMAT_RG32F:
400 *type = INTERNAL_TYPE_32F;
401 *bpp = INTERNAL_BPP_64;
402 break;
403 case OUTPUT_IMAGE_FORMAT_R32F:
404 *type = INTERNAL_TYPE_32F;
405 *bpp = INTERNAL_BPP_32;
406 break;
407
408 default:
409 /* Provide some default values, as we'll be called at RB
410 * creation time, even if an RB with this format isn't
411 * supported.
412 */
413 *type = INTERNAL_TYPE_8;
414 *bpp = INTERNAL_BPP_32;
415 break;
416 }
417 }