i915g: make gears run again.
[mesa.git] / src / gallium / drivers / vc5 / vc5_formats.c
1 /*
2 * Copyright © 2014-2017 Broadcom
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 /**
25 * @file vc5_formats.c
26 *
27 * Contains the table and accessors for VC5 texture and render target format
28 * support.
29 *
30 * The hardware has limited support for texture formats, and extremely limited
31 * support for render target formats. As a result, we emulate other formats
32 * in our shader code, and this stores the table for doing so.
33 */
34
35 #include "util/u_format.h"
36 #include "util/macros.h"
37
38 #include "vc5_context.h"
39 #include "broadcom/cle/v3d_packet_v33_pack.h"
40
/**
 * Sentinel stored in vc5_format::rt_type for pipe formats that have no
 * render target output format.  It shares the OUTPUT_IMAGE_FORMAT_ prefix so
 * that FORMAT(..., NO, ...) can name it through token pasting.
 *
 * NOTE(review): assumes 255 does not collide with any real
 * OUTPUT_IMAGE_FORMAT_* value from the packet header -- confirm.
 */
#define OUTPUT_IMAGE_FORMAT_NO 255
42
/**
 * One row of the format table, describing how a single gallium pipe format
 * is rendered to and sampled from.
 *
 * The field order matters: it must stay in sync with any positional
 * initializer used to fill the table.
 */
struct vc5_format {
        /** True for table slots that were filled in by a FORMAT() entry. */
        bool present;

        /**
         * Render target output image format (an OUTPUT_IMAGE_FORMAT_* value),
         * or OUTPUT_IMAGE_FORMAT_NO when the format cannot be rendered to.
         */
        uint8_t rt_type;

        /** Texture data format (a TEXTURE_DATA_FORMAT_* value). */
        uint8_t tex_type;

        /**
         * Channel swizzle, used in three places: on the RGBA shader output
         * when storing to the tile buffer, on the RGBA tile buffer contents
         * when producing shader input for blending, and on the rgba8888
         * texture sampler return value to obtain the shader's rgba values.
         */
        uint8_t swizzle[4];

        /** Texture return size: 16 (16F/I/UI) or 32 (32F/I/UI). */
        uint8_t return_size;

        /**
         * Number of channels returned by texturing when return_size is 32.
         * A return_size of 16 always yields 2 pairs of 16 bit values, so
         * this field is not meaningful there.
         */
        uint8_t return_channels;
};
69
/**
 * Expands to a braced four-element initializer of PIPE_SWIZZLE_* values.
 * Each argument is the suffix of a PIPE_SWIZZLE_ name (X, Y, Z, W, 0 or 1
 * are the ones used in this file).
 */
#define SWIZ(x, y, z, w) \
        { PIPE_SWIZZLE_##x, PIPE_SWIZZLE_##y, PIPE_SWIZZLE_##z, PIPE_SWIZZLE_##w }
76
/**
 * Builds one designated-index entry of the format table.
 *
 * @param pipe          Suffix of the PIPE_FORMAT_* enum used as array index.
 * @param rt            Suffix of the OUTPUT_IMAGE_FORMAT_* render target
 *                      format, or NO for OUTPUT_IMAGE_FORMAT_NO.
 * @param tex           Suffix of the TEXTURE_DATA_FORMAT_* texture format.
 * @param swiz          Braced four-element swizzle initializer (a SWIZ_*
 *                      macro).
 * @param ret_size      Texture return size, 16 or 32.
 * @param ret_channels  Channels returned when ret_size is 32.
 *
 * Fields are named explicitly so the entry stays correct if struct
 * vc5_format gains or reorders members.  The last two parameters are
 * deliberately not called return_size/return_channels: a macro parameter
 * with the same spelling as a field would also be substituted inside the
 * ".field =" designator.
 */
#define FORMAT(pipe, rt, tex, swiz, ret_size, ret_channels)             \
        [PIPE_FORMAT_##pipe] = {                                        \
                .present = true,                                        \
                .rt_type = OUTPUT_IMAGE_FORMAT_##rt,                    \
                .tex_type = TEXTURE_DATA_FORMAT_##tex,                  \
                .swizzle = swiz,                                        \
                .return_size = ret_size,                                \
                .return_channels = ret_channels,                        \
        }
86
/*
 * Named shorthands for the swizzles used by the format table.  Each letter
 * or digit in the name is, in order, the PIPE_SWIZZLE_* suffix of one of the
 * four entries.
 */

/* Straight channel order, with missing channels filled by 0 / 1. */
#define SWIZ_X001       SWIZ(X, 0, 0, 1)
#define SWIZ_XY01       SWIZ(X, Y, 0, 1)
#define SWIZ_XYZ1       SWIZ(X, Y, Z, 1)
#define SWIZ_XYZW       SWIZ(X, Y, Z, W)

/* Rotated and reversed channel orders. */
#define SWIZ_YZWX       SWIZ(Y, Z, W, X)
#define SWIZ_YZW1       SWIZ(Y, Z, W, 1)
#define SWIZ_ZYXW       SWIZ(Z, Y, X, W)
#define SWIZ_ZYX1       SWIZ(Z, Y, X, 1)

/* Replicated X channel and X-in-last-slot forms. */
#define SWIZ_XXXY       SWIZ(X, X, X, Y)
#define SWIZ_XXX1       SWIZ(X, X, X, 1)
#define SWIZ_XXXX       SWIZ(X, X, X, X)
#define SWIZ_000X       SWIZ(0, 0, 0, X)
99
100 static const struct vc5_format vc5_format_table[] = {
101 FORMAT(B8G8R8A8_UNORM, RGBA8, RGBA8, SWIZ_ZYXW, 16, 0),
102 FORMAT(B8G8R8X8_UNORM, RGBX8, RGBA8, SWIZ_ZYX1, 16, 0),
103 FORMAT(B8G8R8A8_SRGB, SRGB8_ALPHA8, RGBA8, SWIZ_ZYXW, 16, 0),
104 FORMAT(B8G8R8X8_SRGB, SRGBX8, RGBA8, SWIZ_ZYX1, 16, 0),
105 FORMAT(R8G8B8A8_UNORM, RGBA8, RGBA8, SWIZ_XYZW, 16, 0),
106 FORMAT(R8G8B8X8_UNORM, RGBX8, RGBA8, SWIZ_XYZ1, 16, 0),
107 FORMAT(R8G8B8A8_SNORM, NO, RGBA8_SNORM, SWIZ_XYZW, 16, 0),
108 FORMAT(R8G8B8X8_SNORM, NO, RGBA8_SNORM, SWIZ_XYZ1, 16, 0),
109 FORMAT(R10G10B10A2_UNORM, RGB10_A2, RGB10_A2, SWIZ_XYZW, 16, 0),
110
111 FORMAT(B4G4R4A4_UNORM, ABGR4444, RGBA4, SWIZ_YZWX, 16, 0),
112 FORMAT(B4G4R4X4_UNORM, ABGR4444, RGBA4, SWIZ_YZW1, 16, 0),
113
114 FORMAT(A1B5G5R5_UNORM, ABGR1555, RGB5_A1, SWIZ_XYZW, 16, 0),
115 FORMAT(X1B5G5R5_UNORM, ABGR1555, RGB5_A1, SWIZ_XYZ1, 16, 0),
116 FORMAT(B5G6R5_UNORM, BGR565, RGB565, SWIZ_XYZ1, 16, 0),
117
118 FORMAT(R8_UNORM, R8, R8, SWIZ_X001, 16, 0),
119 FORMAT(R8_SNORM, NO, R8_SNORM, SWIZ_X001, 16, 0),
120 FORMAT(R8G8_UNORM, RG8, RG8, SWIZ_XY01, 16, 0),
121 FORMAT(R8G8_SNORM, NO, RG8_SNORM, SWIZ_XY01, 16, 0),
122
123 FORMAT(R16_UNORM, NO, R16, SWIZ_X001, 32, 1),
124 FORMAT(R16_SNORM, NO, R16_SNORM, SWIZ_X001, 32, 1),
125 FORMAT(R16_FLOAT, R16F, R16F, SWIZ_X001, 16, 0),
126 FORMAT(R32_FLOAT, R32F, R32F, SWIZ_X001, 32, 1),
127
128 FORMAT(R16G16_UNORM, NO, RG16, SWIZ_XY01, 32, 2),
129 FORMAT(R16G16_SNORM, NO, RG16_SNORM, SWIZ_XY01, 32, 2),
130 FORMAT(R16G16_FLOAT, RG16F, RG16F, SWIZ_XY01, 16, 0),
131 FORMAT(R32G32_FLOAT, RG32F, RG32F, SWIZ_XY01, 32, 2),
132
133 FORMAT(R16G16B16A16_UNORM, NO, RGBA16, SWIZ_XYZW, 32, 4),
134 FORMAT(R16G16B16A16_SNORM, NO, RGBA16_SNORM, SWIZ_XYZW, 32, 4),
135 FORMAT(R16G16B16A16_FLOAT, RGBA16F, RGBA16F, SWIZ_XYZW, 16, 0),
136 FORMAT(R32G32B32A32_FLOAT, RGBA32F, RGBA32F, SWIZ_XYZW, 32, 4),
137
138 /* If we don't have L/A/LA16, mesa/st will fall back to RGBA16. */
139 FORMAT(L16_UNORM, NO, R16, SWIZ_XXX1, 32, 1),
140 FORMAT(L16_SNORM, NO, R16_SNORM, SWIZ_XXX1, 32, 1),
141 FORMAT(I16_UNORM, NO, R16, SWIZ_XXXX, 32, 1),
142 FORMAT(I16_SNORM, NO, R16_SNORM, SWIZ_XXXX, 32, 1),
143 FORMAT(A16_UNORM, NO, R16, SWIZ_000X, 32, 1),
144 FORMAT(A16_SNORM, NO, R16_SNORM, SWIZ_000X, 32, 1),
145 FORMAT(L16A16_UNORM, NO, RG16, SWIZ_XXXY, 32, 2),
146 FORMAT(L16A16_SNORM, NO, RG16_SNORM, SWIZ_XXXY, 32, 2),
147
148 FORMAT(A8_UNORM, NO, R8, SWIZ_000X, 16, 0),
149 FORMAT(L8_UNORM, NO, R8, SWIZ_XXX1, 16, 0),
150 FORMAT(I8_UNORM, NO, R8, SWIZ_XXXX, 16, 0),
151 FORMAT(L8A8_UNORM, NO, RG8, SWIZ_XXXY, 16, 0),
152
153 FORMAT(R8_SINT, R8I, S8, SWIZ_X001, 16, 0),
154 FORMAT(R8_UINT, R8UI, S8, SWIZ_X001, 16, 0),
155 FORMAT(R8G8_SINT, RG8I, S16, SWIZ_XY01, 16, 0),
156 FORMAT(R8G8_UINT, RG8UI, S16, SWIZ_XY01, 16, 0),
157 FORMAT(R8G8B8A8_SINT, RGBA8I, R32F, SWIZ_XYZW, 16, 0),
158 FORMAT(R8G8B8A8_UINT, RGBA8UI, R32F, SWIZ_XYZW, 16, 0),
159
160 FORMAT(R16_SINT, R16I, S16, SWIZ_X001, 16, 0),
161 FORMAT(R16_UINT, R16UI, S16, SWIZ_X001, 16, 0),
162 FORMAT(R16G16_SINT, RG16I, R32F, SWIZ_XY01, 16, 0),
163 FORMAT(R16G16_UINT, RG16UI, R32F, SWIZ_XY01, 16, 0),
164 FORMAT(R16G16B16A16_SINT, RGBA16I, RG32F, SWIZ_XYZW, 16, 0),
165 FORMAT(R16G16B16A16_UINT, RGBA16UI, RG32F, SWIZ_XYZW, 16, 0),
166
167 FORMAT(R32_SINT, R32I, R32F, SWIZ_X001, 16, 0),
168 FORMAT(R32_UINT, R32UI, R32F, SWIZ_X001, 16, 0),
169 FORMAT(R32G32_SINT, RG32I, RG32F, SWIZ_XY01, 16, 0),
170 FORMAT(R32G32_UINT, RG32UI, RG32F, SWIZ_XY01, 16, 0),
171 FORMAT(R32G32B32A32_SINT, RGBA32I, RGBA32F, SWIZ_XYZW, 16, 0),
172 FORMAT(R32G32B32A32_UINT, RGBA32UI, RGBA32F, SWIZ_XYZW, 16, 0),
173
174 FORMAT(A8_SINT, R8I, S8, SWIZ_000X, 16, 0),
175 FORMAT(A8_UINT, R8UI, S8, SWIZ_000X, 16, 0),
176 FORMAT(A16_SINT, R16I, S16, SWIZ_000X, 16, 0),
177 FORMAT(A16_UINT, R16UI, S16, SWIZ_000X, 16, 0),
178 FORMAT(A32_SINT, R32I, R32F, SWIZ_000X, 16, 0),
179 FORMAT(A32_UINT, R32UI, R32F, SWIZ_000X, 16, 0),
180
181 FORMAT(R11G11B10_FLOAT, R11F_G11F_B10F, R11F_G11F_B10F, SWIZ_XYZW, 16, 0),
182 FORMAT(R9G9B9E5_FLOAT, NO, RGB9_E5, SWIZ_XYZW, 16, 0),
183
184 FORMAT(S8_UINT_Z24_UNORM, DEPTH24_STENCIL8, DEPTH24_X8, SWIZ_X001, 32, 1),
185 FORMAT(X8Z24_UNORM, DEPTH_COMPONENT24, DEPTH24_X8, SWIZ_X001, 32, 1),
186 FORMAT(S8X24_UINT, NO, R32F, SWIZ_X001, 32, 1),
187 FORMAT(Z32_FLOAT, DEPTH_COMPONENT32F, R32F, SWIZ_X001, 32, 1),
188 FORMAT(Z16_UNORM, DEPTH_COMPONENT16, DEPTH_COMP16, SWIZ_X001, 32, 1),
189
190 /* Pretend we support this, but it'll be separate Z32F depth and S8. */
191 FORMAT(Z32_FLOAT_S8X24_UINT, DEPTH_COMPONENT32F, R32F, SWIZ_X001, 32, 1),
192
193 FORMAT(ETC2_RGB8, NO, RGB8_ETC2, SWIZ_XYZ1, 16, 0),
194 FORMAT(ETC2_SRGB8, NO, RGB8_ETC2, SWIZ_XYZ1, 16, 0),
195 FORMAT(ETC2_RGB8A1, NO, RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, 0),
196 FORMAT(ETC2_SRGB8A1, NO, RGB8_PUNCHTHROUGH_ALPHA1, SWIZ_XYZW, 16, 0),
197 FORMAT(ETC2_RGBA8, NO, RGBA8_ETC2_EAC, SWIZ_XYZW, 16, 0),
198 FORMAT(ETC2_R11_UNORM, NO, R11_EAC, SWIZ_X001, 16, 0),
199 FORMAT(ETC2_R11_SNORM, NO, SIGNED_R11_EAC, SWIZ_X001, 16, 0),
200 FORMAT(ETC2_RG11_UNORM, NO, RG11_EAC, SWIZ_XY01, 16, 0),
201 FORMAT(ETC2_RG11_SNORM, NO, SIGNED_RG11_EAC, SWIZ_XY01, 16, 0),
202
203 FORMAT(DXT1_RGB, NO, BC1, SWIZ_XYZ1, 16, 0),
204 FORMAT(DXT3_RGBA, NO, BC2, SWIZ_XYZ1, 16, 0),
205 FORMAT(DXT5_RGBA, NO, BC3, SWIZ_XYZ1, 16, 0),
206 };
207
208 static const struct vc5_format *
209 get_format(enum pipe_format f)
210 {
211 if (f >= ARRAY_SIZE(vc5_format_table) ||
212 !vc5_format_table[f].present)
213 return NULL;
214 else
215 return &vc5_format_table[f];
216 }
217
218 bool
219 vc5_rt_format_supported(enum pipe_format f)
220 {
221 const struct vc5_format *vf = get_format(f);
222
223 if (!vf)
224 return false;
225
226 return vf->rt_type != OUTPUT_IMAGE_FORMAT_NO;
227 }
228
229 uint8_t
230 vc5_get_rt_format(enum pipe_format f)
231 {
232 const struct vc5_format *vf = get_format(f);
233
234 if (!vf)
235 return 0;
236
237 return vf->rt_type;
238 }
239
240 bool
241 vc5_tex_format_supported(enum pipe_format f)
242 {
243 const struct vc5_format *vf = get_format(f);
244
245 return vf != NULL;
246 }
247
248 uint8_t
249 vc5_get_tex_format(enum pipe_format f)
250 {
251 const struct vc5_format *vf = get_format(f);
252
253 if (!vf)
254 return 0;
255
256 return vf->tex_type;
257 }
258
259 uint8_t
260 vc5_get_tex_return_size(enum pipe_format f)
261 {
262 const struct vc5_format *vf = get_format(f);
263
264 if (!vf)
265 return 0;
266
267 return vf->return_size;
268 }
269
270 uint8_t
271 vc5_get_tex_return_channels(enum pipe_format f)
272 {
273 const struct vc5_format *vf = get_format(f);
274
275 if (!vf)
276 return 0;
277
278 return vf->return_channels;
279 }
280
281 const uint8_t *
282 vc5_get_format_swizzle(enum pipe_format f)
283 {
284 const struct vc5_format *vf = get_format(f);
285 static const uint8_t fallback[] = {0, 1, 2, 3};
286
287 if (!vf)
288 return fallback;
289
290 return vf->swizzle;
291 }
292
293 void
294 vc5_get_internal_type_bpp_for_output_format(uint32_t format,
295 uint32_t *type,
296 uint32_t *bpp)
297 {
298 switch (format) {
299 case OUTPUT_IMAGE_FORMAT_RGBA8:
300 case OUTPUT_IMAGE_FORMAT_RGBX8:
301 case OUTPUT_IMAGE_FORMAT_RGB8:
302 case OUTPUT_IMAGE_FORMAT_RG8:
303 case OUTPUT_IMAGE_FORMAT_R8:
304 case OUTPUT_IMAGE_FORMAT_ABGR4444:
305 case OUTPUT_IMAGE_FORMAT_BGR565:
306 case OUTPUT_IMAGE_FORMAT_ABGR1555:
307 *type = INTERNAL_TYPE_8;
308 *bpp = INTERNAL_BPP_32;
309 break;
310
311 case OUTPUT_IMAGE_FORMAT_RGBA8I:
312 case OUTPUT_IMAGE_FORMAT_RG8I:
313 case OUTPUT_IMAGE_FORMAT_R8I:
314 *type = INTERNAL_TYPE_8I;
315 *bpp = INTERNAL_BPP_32;
316 break;
317
318 case OUTPUT_IMAGE_FORMAT_RGBA8UI:
319 case OUTPUT_IMAGE_FORMAT_RG8UI:
320 case OUTPUT_IMAGE_FORMAT_R8UI:
321 *type = INTERNAL_TYPE_8UI;
322 *bpp = INTERNAL_BPP_32;
323 break;
324
325 case OUTPUT_IMAGE_FORMAT_SRGB8_ALPHA8:
326 case OUTPUT_IMAGE_FORMAT_SRGB:
327 case OUTPUT_IMAGE_FORMAT_RGB10_A2:
328 case OUTPUT_IMAGE_FORMAT_R11F_G11F_B10F:
329 case OUTPUT_IMAGE_FORMAT_SRGBX8:
330 case OUTPUT_IMAGE_FORMAT_RGBA16F:
331 /* Note that sRGB RTs are stored in the tile buffer at 16F,
332 * and the conversion to sRGB happens at tilebuffer
333 * load/store.
334 */
335 *type = INTERNAL_TYPE_16F;
336 *bpp = INTERNAL_BPP_64;
337 break;
338
339 case OUTPUT_IMAGE_FORMAT_RG16F:
340 case OUTPUT_IMAGE_FORMAT_R16F:
341 *type = INTERNAL_TYPE_16F;
342 /* Use 64bpp to make sure the TLB doesn't throw away the alpha
343 * channel before alpha test happens.
344 */
345 *bpp = INTERNAL_BPP_64;
346 break;
347
348 case OUTPUT_IMAGE_FORMAT_RGBA16I:
349 *type = INTERNAL_TYPE_16I;
350 *bpp = INTERNAL_BPP_64;
351 break;
352 case OUTPUT_IMAGE_FORMAT_RG16I:
353 case OUTPUT_IMAGE_FORMAT_R16I:
354 *type = INTERNAL_TYPE_16I;
355 *bpp = INTERNAL_BPP_32;
356 break;
357
358 case OUTPUT_IMAGE_FORMAT_RGBA16UI:
359 *type = INTERNAL_TYPE_16UI;
360 *bpp = INTERNAL_BPP_64;
361 break;
362 case OUTPUT_IMAGE_FORMAT_RG16UI:
363 case OUTPUT_IMAGE_FORMAT_R16UI:
364 *type = INTERNAL_TYPE_16UI;
365 *bpp = INTERNAL_BPP_32;
366 break;
367
368 case OUTPUT_IMAGE_FORMAT_RGBA32I:
369 *type = INTERNAL_TYPE_32I;
370 *bpp = INTERNAL_BPP_128;
371 break;
372 case OUTPUT_IMAGE_FORMAT_RG32I:
373 *type = INTERNAL_TYPE_32I;
374 *bpp = INTERNAL_BPP_64;
375 break;
376 case OUTPUT_IMAGE_FORMAT_R32I:
377 *type = INTERNAL_TYPE_32I;
378 *bpp = INTERNAL_BPP_32;
379 break;
380
381 case OUTPUT_IMAGE_FORMAT_RGBA32UI:
382 *type = INTERNAL_TYPE_32UI;
383 *bpp = INTERNAL_BPP_128;
384 break;
385 case OUTPUT_IMAGE_FORMAT_RG32UI:
386 *type = INTERNAL_TYPE_32UI;
387 *bpp = INTERNAL_BPP_64;
388 break;
389 case OUTPUT_IMAGE_FORMAT_R32UI:
390 *type = INTERNAL_TYPE_32UI;
391 *bpp = INTERNAL_BPP_32;
392 break;
393
394 case OUTPUT_IMAGE_FORMAT_RGBA32F:
395 *type = INTERNAL_TYPE_32F;
396 *bpp = INTERNAL_BPP_128;
397 break;
398 case OUTPUT_IMAGE_FORMAT_RG32F:
399 *type = INTERNAL_TYPE_32F;
400 *bpp = INTERNAL_BPP_64;
401 break;
402 case OUTPUT_IMAGE_FORMAT_R32F:
403 *type = INTERNAL_TYPE_32F;
404 *bpp = INTERNAL_BPP_32;
405 break;
406
407 default:
408 /* Provide some default values, as we'll be called at RB
409 * creation time, even if an RB with this format isn't
410 * supported.
411 */
412 *type = INTERNAL_TYPE_8;
413 *bpp = INTERNAL_BPP_32;
414 break;
415 }
416 }