08e1dd0383d3685cb3abe7ae4eb422891933bf79
[mesa.git] / src / gallium / drivers / vc5 / vc5_formats.c
1 /*
2 * Copyright © 2014-2017 Broadcom
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 /**
25 * @file vc5_formats.c
26 *
27 * Contains the table and accessors for VC5 texture and render target format
28 * support.
29 *
30 * The hardware has limited support for texture formats, and extremely limited
31 * support for render target formats. As a result, we emulate other formats
32 * in our shader code, and this stores the table for doing so.
33 */
34
35 #include "util/u_format.h"
36 #include "util/macros.h"
37
38 #include "vc5_context.h"
39 #include "broadcom/cle/v3d_packet_v33_pack.h"
40
/*
 * Sentinel stored in vc5_format::rt_type for pipe formats that have a table
 * entry but cannot be used as a render target.
 */
#define V3D_OUTPUT_IMAGE_FORMAT_NO 255
42
/** One entry of the pipe-format lookup table. */
struct vc5_format {
        /**
         * True when the pipe format has an entry in the table; slots that
         * were never filled in are left zero-initialized.
         */
        bool present;

        /**
         * Render target format: one of V3D_OUTPUT_IMAGE_FORMAT_*, or
         * V3D_OUTPUT_IMAGE_FORMAT_NO when the format can't be rendered to.
         */
        uint8_t rt_type;

        /** Texture format: one of TEXTURE_DATA_FORMAT_*. */
        uint8_t tex_type;

        /**
         * Swizzle (PIPE_SWIZZLE_* per channel) used in three places: on the
         * RGBA shader output when storing to the tile buffer, on the RGBA
         * tile buffer contents when producing shader input (for blending),
         * and on the rgba8888 texture sampler return value when turning it
         * into shader rgba values.
         */
        uint8_t swizzle[4];

        /** Width of the texture return value: 16 (16F/I/UI) or 32 (32F/I/UI). */
        uint8_t return_size;

        /**
         * When return_size == 32, the number of channels returned by
         * texturing.  A 16-bit return always yields 2 pairs of 16 bit
         * values.
         */
        uint8_t return_channels;
};
69
/*
 * Expands to a 4-element brace initializer of PIPE_SWIZZLE_* values.  Each
 * argument is the suffix of a PIPE_SWIZZLE_ constant (X, Y, Z, W, 0 or 1).
 */
#define SWIZ(c0, c1, c2, c3)                                            \
        { PIPE_SWIZZLE_##c0, PIPE_SWIZZLE_##c1,                         \
          PIPE_SWIZZLE_##c2, PIPE_SWIZZLE_##c3 }
76
/*
 * Builds one vc5_format_table[] entry at index PIPE_FORMAT_<pipe>.
 *
 *   pipe         - suffix of the PIPE_FORMAT_ enum value being described
 *   rt           - suffix of the V3D_OUTPUT_IMAGE_FORMAT_ value (NO if the
 *                  format can't be a render target)
 *   tex          - suffix of the TEXTURE_DATA_FORMAT_ value
 *   swiz         - brace initializer for the 4-entry swizzle (a SWIZ_* macro)
 *   ret_size     - texture return size, 16 or 32
 *   ret_channels - channels returned when ret_size is 32
 *
 * Fields are set by name so that the entry doesn't depend on the member
 * order of struct vc5_format.  The last two parameters are deliberately not
 * called return_size/return_channels: a macro parameter with the same
 * spelling as a member would also be substituted inside the designator.
 */
#define FORMAT(pipe, rt, tex, swiz, ret_size, ret_channels)             \
        [PIPE_FORMAT_##pipe] = {                                        \
                .present = true,                                        \
                .rt_type = V3D_OUTPUT_IMAGE_FORMAT_##rt,                \
                .tex_type = TEXTURE_DATA_FORMAT_##tex,                  \
                .swizzle = swiz,                                        \
                .return_size = ret_size,                                \
                .return_channels = ret_channels,                        \
        }
86
/*
 * Named shorthands for the swizzles used by the format table.  The suffix of
 * each name spells out the four SWIZ() arguments in order.
 */
#define SWIZ_X001       SWIZ(X, 0, 0, 1)
#define SWIZ_XY01       SWIZ(X, Y, 0, 1)
#define SWIZ_XYZ1       SWIZ(X, Y, Z, 1)
#define SWIZ_XYZW       SWIZ(X, Y, Z, W)
#define SWIZ_YZWX       SWIZ(Y, Z, W, X)
#define SWIZ_YZW1       SWIZ(Y, Z, W, 1)
#define SWIZ_ZYXW       SWIZ(Z, Y, X, W)
#define SWIZ_ZYX1       SWIZ(Z, Y, X, 1)
#define SWIZ_XXXY       SWIZ(X, X, X, Y)
#define SWIZ_XXX1       SWIZ(X, X, X, 1)
#define SWIZ_XXXX       SWIZ(X, X, X, X)
#define SWIZ_000X       SWIZ(0, 0, 0, X)
99
100 static const struct vc5_format vc5_format_table[] = {
101 FORMAT(B8G8R8A8_UNORM, RGBA8, RGBA8, SWIZ_ZYXW, 16, 0),
102 FORMAT(B8G8R8X8_UNORM, RGBX8, RGBA8, SWIZ_ZYX1, 16, 0),
103 FORMAT(B8G8R8A8_SRGB, SRGB8_ALPHA8, RGBA8, SWIZ_ZYXW, 16, 0),
104 FORMAT(B8G8R8X8_SRGB, SRGBX8, RGBA8, SWIZ_ZYX1, 16, 0),
105 FORMAT(R8G8B8A8_UNORM, RGBA8, RGBA8, SWIZ_XYZW, 16, 0),
106 FORMAT(R8G8B8X8_UNORM, RGBX8, RGBA8, SWIZ_XYZ1, 16, 0),
107 FORMAT(R8G8B8A8_SNORM, NO, RGBA8_SNORM, SWIZ_XYZW, 16, 0),
108 FORMAT(R8G8B8X8_SNORM, NO, RGBA8_SNORM, SWIZ_XYZ1, 16, 0),
109 FORMAT(R10G10B10A2_UNORM, RGB10_A2, RGB10_A2, SWIZ_XYZW, 16, 0),
110 FORMAT(B10G10R10A2_UINT, RGB10_A2UI, RGB10_A2UI, SWIZ_ZYXW, 16, 0),
111
112 FORMAT(B4G4R4A4_UNORM, ABGR4444, RGBA4, SWIZ_YZWX, 16, 0),
113 FORMAT(B4G4R4X4_UNORM, ABGR4444, RGBA4, SWIZ_YZW1, 16, 0),
114
115 FORMAT(A1B5G5R5_UNORM, ABGR1555, RGB5_A1, SWIZ_XYZW, 16, 0),
116 FORMAT(X1B5G5R5_UNORM, ABGR1555, RGB5_A1, SWIZ_XYZ1, 16, 0),
117 FORMAT(B5G6R5_UNORM, BGR565, RGB565, SWIZ_XYZ1, 16, 0),
118
119 FORMAT(R8_UNORM, R8, R8, SWIZ_X001, 16, 0),
120 FORMAT(R8_SNORM, NO, R8_SNORM, SWIZ_X001, 16, 0),
121 FORMAT(R8G8_UNORM, RG8, RG8, SWIZ_XY01, 16, 0),
122 FORMAT(R8G8_SNORM, NO, RG8_SNORM, SWIZ_XY01, 16, 0),
123
124 FORMAT(R16_UNORM, NO, R16, SWIZ_X001, 32, 1),
125 FORMAT(R16_SNORM, NO, R16_SNORM, SWIZ_X001, 32, 1),
126 FORMAT(R16_FLOAT, R16F, R16F, SWIZ_X001, 16, 0),
127 FORMAT(R32_FLOAT, R32F, R32F, SWIZ_X001, 32, 1),
128
129 FORMAT(R16G16_UNORM, NO, RG16, SWIZ_XY01, 32, 2),
130 FORMAT(R16G16_SNORM, NO, RG16_SNORM, SWIZ_XY01, 32, 2),
131 FORMAT(R16G16_FLOAT, RG16F, RG16F, SWIZ_XY01, 16, 0),
132 FORMAT(R32G32_FLOAT, RG32F, RG32F, SWIZ_XY01, 32, 2),
133
134 FORMAT(R16G16B16A16_UNORM, NO, RGBA16, SWIZ_XYZW, 32, 4),
135 FORMAT(R16G16B16A16_SNORM, NO, RGBA16_SNORM, SWIZ_XYZW, 32, 4),
136 FORMAT(R16G16B16A16_FLOAT, RGBA16F, RGBA16F, SWIZ_XYZW, 16, 0),
137 FORMAT(R32G32B32A32_FLOAT, RGBA32F, RGBA32F, SWIZ_XYZW, 32, 4),
138
139 /* If we don't have L/A/LA16, mesa/st will fall back to RGBA16. */
140 FORMAT(L16_UNORM, NO, R16, SWIZ_XXX1, 32, 1),
141 FORMAT(L16_SNORM, NO, R16_SNORM, SWIZ_XXX1, 32, 1),
142 FORMAT(I16_UNORM, NO, R16, SWIZ_XXXX, 32, 1),
143 FORMAT(I16_SNORM, NO, R16_SNORM, SWIZ_XXXX, 32, 1),
144 FORMAT(A16_UNORM, NO, R16, SWIZ_000X, 32, 1),
145 FORMAT(A16_SNORM, NO, R16_SNORM, SWIZ_000X, 32, 1),
146 FORMAT(L16A16_UNORM, NO, RG16, SWIZ_XXXY, 32, 2),
147 FORMAT(L16A16_SNORM, NO, RG16_SNORM, SWIZ_XXXY, 32, 2),
148
149 FORMAT(A8_UNORM, NO, R8, SWIZ_000X, 16, 0),
150 FORMAT(L8_UNORM, NO, R8, SWIZ_XXX1, 16, 0),
151 FORMAT(I8_UNORM, NO, R8, SWIZ_XXXX, 16, 0),
152 FORMAT(L8A8_UNORM, NO, RG8, SWIZ_XXXY, 16, 0),
153
154 FORMAT(R8_SINT, R8I, R8I, SWIZ_X001, 16, 0),
155 FORMAT(R8_UINT, R8UI, R8UI, SWIZ_X001, 16, 0),
156 FORMAT(R8G8_SINT, RG8I, RG8I, SWIZ_XY01, 16, 0),
157 FORMAT(R8G8_UINT, RG8UI, RG8UI, SWIZ_XY01, 16, 0),
158 FORMAT(R8G8B8A8_SINT, RGBA8I, RGBA8I, SWIZ_XYZW, 16, 0),
159 FORMAT(R8G8B8A8_UINT, RGBA8UI, RGBA8UI, SWIZ_XYZW, 16, 0),
160
161 FORMAT(R16_SINT, R16I, R16I, SWIZ_X001, 16, 0),
162 FORMAT(R16_UINT, R16UI, R16UI, SWIZ_X001, 16, 0),
163 FORMAT(R16G16_SINT, RG16I, R16I, SWIZ_XY01, 16, 0),
164 FORMAT(R16G16_UINT, RG16UI, R16UI, SWIZ_XY01, 16, 0),
165 FORMAT(R16G16B16A16_SINT, RGBA16I, RGBA16I, SWIZ_XYZW, 16, 0),
166 FORMAT(R16G16B16A16_UINT, RGBA16UI, RGBA16UI, SWIZ_XYZW, 16, 0),
167
168 FORMAT(R32_SINT, R32I, R32I, SWIZ_X001, 32, 1),
169 FORMAT(R32_UINT, R32UI, R32UI, SWIZ_X001, 32, 1),
170 FORMAT(R32G32_SINT, RG32I, RG32I, SWIZ_XY01, 32, 2),
171 FORMAT(R32G32_UINT, RG32UI, RG32UI, SWIZ_XY01, 32, 2),
172 FORMAT(R32G32B32A32_SINT, RGBA32I, RGBA32I, SWIZ_XYZW, 32, 4),
173 FORMAT(R32G32B32A32_UINT, RGBA32UI, RGBA32UI, SWIZ_XYZW, 32, 4),
174
175 FORMAT(A8_SINT, R8I, R8I, SWIZ_000X, 16, 0),
176 FORMAT(A8_UINT, R8UI, R8UI, SWIZ_000X, 16, 0),
177 FORMAT(A16_SINT, R16I, R16I, SWIZ_000X, 16, 0),
178 FORMAT(A16_UINT, R16UI, R16UI, SWIZ_000X, 16, 0),
179 FORMAT(A32_SINT, R32I, R32I, SWIZ_000X, 32, 1),
180 FORMAT(A32_UINT, R32UI, R32UI, SWIZ_000X, 32, 1),
181
182 FORMAT(R11G11B10_FLOAT, R11F_G11F_B10F, R11F_G11F_B10F, SWIZ_XYZW, 16, 0),
183 FORMAT(R9G9B9E5_FLOAT, NO, RGB9_E5, SWIZ_XYZW, 16, 0),
184
185 FORMAT(S8_UINT_Z24_UNORM, ZS_DEPTH24_STENCIL8, DEPTH24_X8, SWIZ_XXXX, 32, 1),
186 FORMAT(X8Z24_UNORM, ZS_DEPTH24_STENCIL8, DEPTH24_X8, SWIZ_XXXX, 32, 1),
187 FORMAT(S8X24_UINT, NO, R32F, SWIZ_XXXX, 32, 1),
188 FORMAT(Z32_FLOAT, ZS_DEPTH_COMPONENT32F, R32F, SWIZ_XXXX, 32, 1),
189 FORMAT(Z16_UNORM, ZS_DEPTH_COMPONENT16, DEPTH_COMP16, SWIZ_XXXX, 32, 1),
190
191 /* Pretend we support this, but it'll be separate Z32F depth and S8. */
192 FORMAT(Z32_FLOAT_S8X24_UINT, ZS_DEPTH_COMPONENT32F, R32F, SWIZ_XXXX, 32, 1),
193
194 FORMAT(ETC2_RGB8, NO, RGB8_ETC2, SWIZ_XYZ1, 16, 0),
195 FORMAT(ETC2_SRGB8, NO, RGB8_ETC2, SWIZ_XYZ1, 16, 0),
196 FORMAT(ETC2_RGB8A1, NO, RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, 0),
197 FORMAT(ETC2_SRGB8A1, NO, RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, 0),
198 FORMAT(ETC2_RGBA8, NO, RGBA8_ETC2_EAC, SWIZ_XYZW, 16, 0),
199 FORMAT(ETC2_SRGBA8, NO, RGBA8_ETC2_EAC, SWIZ_XYZW, 16, 0),
200 FORMAT(ETC2_R11_UNORM, NO, R11_EAC, SWIZ_X001, 16, 0),
201 FORMAT(ETC2_R11_SNORM, NO, SIGNED_R11_EAC, SWIZ_X001, 16, 0),
202 FORMAT(ETC2_RG11_UNORM, NO, RG11_EAC, SWIZ_XY01, 16, 0),
203 FORMAT(ETC2_RG11_SNORM, NO, SIGNED_RG11_EAC, SWIZ_XY01, 16, 0),
204
205 FORMAT(DXT1_RGB, NO, BC1, SWIZ_XYZ1, 16, 0),
206 FORMAT(DXT3_RGBA, NO, BC2, SWIZ_XYZ1, 16, 0),
207 FORMAT(DXT5_RGBA, NO, BC3, SWIZ_XYZ1, 16, 0),
208 };
209
210 static const struct vc5_format *
211 get_format(enum pipe_format f)
212 {
213 if (f >= ARRAY_SIZE(vc5_format_table) ||
214 !vc5_format_table[f].present)
215 return NULL;
216 else
217 return &vc5_format_table[f];
218 }
219
220 bool
221 vc5_rt_format_supported(enum pipe_format f)
222 {
223 const struct vc5_format *vf = get_format(f);
224
225 if (!vf)
226 return false;
227
228 return vf->rt_type != V3D_OUTPUT_IMAGE_FORMAT_NO;
229 }
230
231 uint8_t
232 vc5_get_rt_format(enum pipe_format f)
233 {
234 const struct vc5_format *vf = get_format(f);
235
236 if (!vf)
237 return 0;
238
239 return vf->rt_type;
240 }
241
242 bool
243 vc5_tex_format_supported(enum pipe_format f)
244 {
245 const struct vc5_format *vf = get_format(f);
246
247 return vf != NULL;
248 }
249
250 uint8_t
251 vc5_get_tex_format(enum pipe_format f)
252 {
253 const struct vc5_format *vf = get_format(f);
254
255 if (!vf)
256 return 0;
257
258 return vf->tex_type;
259 }
260
261 uint8_t
262 vc5_get_tex_return_size(enum pipe_format f, enum pipe_tex_compare compare)
263 {
264 const struct vc5_format *vf = get_format(f);
265
266 if (!vf)
267 return 0;
268
269 if (compare == PIPE_TEX_COMPARE_R_TO_TEXTURE)
270 return 16;
271
272 return vf->return_size;
273 }
274
275 uint8_t
276 vc5_get_tex_return_channels(enum pipe_format f)
277 {
278 const struct vc5_format *vf = get_format(f);
279
280 if (!vf)
281 return 0;
282
283 return vf->return_channels;
284 }
285
286 const uint8_t *
287 vc5_get_format_swizzle(enum pipe_format f)
288 {
289 const struct vc5_format *vf = get_format(f);
290 static const uint8_t fallback[] = {0, 1, 2, 3};
291
292 if (!vf)
293 return fallback;
294
295 return vf->swizzle;
296 }
297
298 void
299 vc5_get_internal_type_bpp_for_output_format(uint32_t format,
300 uint32_t *type,
301 uint32_t *bpp)
302 {
303 switch (format) {
304 case V3D_OUTPUT_IMAGE_FORMAT_RGBA8:
305 case V3D_OUTPUT_IMAGE_FORMAT_RGBX8:
306 case V3D_OUTPUT_IMAGE_FORMAT_RGB8:
307 case V3D_OUTPUT_IMAGE_FORMAT_RG8:
308 case V3D_OUTPUT_IMAGE_FORMAT_R8:
309 case V3D_OUTPUT_IMAGE_FORMAT_ABGR4444:
310 case V3D_OUTPUT_IMAGE_FORMAT_BGR565:
311 case V3D_OUTPUT_IMAGE_FORMAT_ABGR1555:
312 *type = V3D_INTERNAL_TYPE_8;
313 *bpp = V3D_INTERNAL_BPP_32;
314 break;
315
316 case V3D_OUTPUT_IMAGE_FORMAT_RGBA8I:
317 case V3D_OUTPUT_IMAGE_FORMAT_RG8I:
318 case V3D_OUTPUT_IMAGE_FORMAT_R8I:
319 *type = V3D_INTERNAL_TYPE_8I;
320 *bpp = V3D_INTERNAL_BPP_32;
321 break;
322
323 case V3D_OUTPUT_IMAGE_FORMAT_RGBA8UI:
324 case V3D_OUTPUT_IMAGE_FORMAT_RG8UI:
325 case V3D_OUTPUT_IMAGE_FORMAT_R8UI:
326 *type = V3D_INTERNAL_TYPE_8UI;
327 *bpp = V3D_INTERNAL_BPP_32;
328 break;
329
330 case V3D_OUTPUT_IMAGE_FORMAT_SRGB8_ALPHA8:
331 case V3D_OUTPUT_IMAGE_FORMAT_SRGB:
332 case V3D_OUTPUT_IMAGE_FORMAT_RGB10_A2:
333 case V3D_OUTPUT_IMAGE_FORMAT_R11F_G11F_B10F:
334 case V3D_OUTPUT_IMAGE_FORMAT_SRGBX8:
335 case V3D_OUTPUT_IMAGE_FORMAT_RGBA16F:
336 /* Note that sRGB RTs are stored in the tile buffer at 16F,
337 * and the conversion to sRGB happens at tilebuffer
338 * load/store.
339 */
340 *type = V3D_INTERNAL_TYPE_16F;
341 *bpp = V3D_INTERNAL_BPP_64;
342 break;
343
344 case V3D_OUTPUT_IMAGE_FORMAT_RG16F:
345 case V3D_OUTPUT_IMAGE_FORMAT_R16F:
346 *type = V3D_INTERNAL_TYPE_16F;
347 /* Use 64bpp to make sure the TLB doesn't throw away the alpha
348 * channel before alpha test happens.
349 */
350 *bpp = V3D_INTERNAL_BPP_64;
351 break;
352
353 case V3D_OUTPUT_IMAGE_FORMAT_RGBA16I:
354 *type = V3D_INTERNAL_TYPE_16I;
355 *bpp = V3D_INTERNAL_BPP_64;
356 break;
357 case V3D_OUTPUT_IMAGE_FORMAT_RG16I:
358 case V3D_OUTPUT_IMAGE_FORMAT_R16I:
359 *type = V3D_INTERNAL_TYPE_16I;
360 *bpp = V3D_INTERNAL_BPP_32;
361 break;
362
363 case V3D_OUTPUT_IMAGE_FORMAT_RGB10_A2UI:
364 case V3D_OUTPUT_IMAGE_FORMAT_RGBA16UI:
365 *type = V3D_INTERNAL_TYPE_16UI;
366 *bpp = V3D_INTERNAL_BPP_64;
367 break;
368 case V3D_OUTPUT_IMAGE_FORMAT_RG16UI:
369 case V3D_OUTPUT_IMAGE_FORMAT_R16UI:
370 *type = V3D_INTERNAL_TYPE_16UI;
371 *bpp = V3D_INTERNAL_BPP_32;
372 break;
373
374 case V3D_OUTPUT_IMAGE_FORMAT_RGBA32I:
375 *type = V3D_INTERNAL_TYPE_32I;
376 *bpp = V3D_INTERNAL_BPP_128;
377 break;
378 case V3D_OUTPUT_IMAGE_FORMAT_RG32I:
379 *type = V3D_INTERNAL_TYPE_32I;
380 *bpp = V3D_INTERNAL_BPP_64;
381 break;
382 case V3D_OUTPUT_IMAGE_FORMAT_R32I:
383 *type = V3D_INTERNAL_TYPE_32I;
384 *bpp = V3D_INTERNAL_BPP_32;
385 break;
386
387 case V3D_OUTPUT_IMAGE_FORMAT_RGBA32UI:
388 *type = V3D_INTERNAL_TYPE_32UI;
389 *bpp = V3D_INTERNAL_BPP_128;
390 break;
391 case V3D_OUTPUT_IMAGE_FORMAT_RG32UI:
392 *type = V3D_INTERNAL_TYPE_32UI;
393 *bpp = V3D_INTERNAL_BPP_64;
394 break;
395 case V3D_OUTPUT_IMAGE_FORMAT_R32UI:
396 *type = V3D_INTERNAL_TYPE_32UI;
397 *bpp = V3D_INTERNAL_BPP_32;
398 break;
399
400 case V3D_OUTPUT_IMAGE_FORMAT_RGBA32F:
401 *type = V3D_INTERNAL_TYPE_32F;
402 *bpp = V3D_INTERNAL_BPP_128;
403 break;
404 case V3D_OUTPUT_IMAGE_FORMAT_RG32F:
405 *type = V3D_INTERNAL_TYPE_32F;
406 *bpp = V3D_INTERNAL_BPP_64;
407 break;
408 case V3D_OUTPUT_IMAGE_FORMAT_R32F:
409 *type = V3D_INTERNAL_TYPE_32F;
410 *bpp = V3D_INTERNAL_BPP_32;
411 break;
412
413 default:
414 /* Provide some default values, as we'll be called at RB
415 * creation time, even if an RB with this format isn't
416 * supported.
417 */
418 *type = V3D_INTERNAL_TYPE_8;
419 *bpp = V3D_INTERNAL_BPP_32;
420 break;
421 }
422 }