ir3: Rewrite UBO push analysis to support bindless
[mesa.git] / src / freedreno / vulkan / tu_formats.c
1
2 /*
3 * Copyright © 2016 Red Hat.
4 * Copyright © 2016 Bas Nieuwenhuizen
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice (including the next
14 * paragraph) shall be included in all copies or substantial portions of the
15 * Software.
16 *
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
22 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
23 * DEALINGS IN THE SOFTWARE.
24 */
25
26 #include "tu_private.h"
27
28 #include "registers/adreno_common.xml.h"
29 #include "registers/a6xx.xml.h"
30
31 #include "vk_format.h"
32 #include "vk_util.h"
33 #include "drm-uapi/drm_fourcc.h"
34
/* Placeholder hardware format used by table rows that have no usable
 * hardware format.  TU6_FMT() reaches it by pasting "x" onto the FMT6_
 * prefix.  Parenthesized so the negative literal stays a single operand
 * wherever the macro is expanded.
 */
#define FMT6_x (-1)

/* Emit one designated initializer for the format table, indexed by the
 * VK_FORMAT_* enumerator.
 *
 *   vkfmt   - VkFormat name without the VK_FORMAT_ prefix
 *   hwfmt   - hardware format name without the FMT6_ prefix
 *   swapfmt - value stored in .swap
 *   valid   - mask of FMT_VERTEX / FMT_TEXTURE / FMT_COLOR bits, or 0
 */
#define TU6_FMT(vkfmt, hwfmt, swapfmt, valid) \
   [VK_FORMAT_##vkfmt] = {                    \
      .fmt = FMT6_##hwfmt,                    \
      .swap = (swapfmt),                      \
      .supported = (valid),                   \
   }

/* Shorthands named after the capabilities they enable:
 * V = vertex fetch, T = texture sampling, C = color attachment,
 * x = capability absent.
 */
#define TU6_VTC(vk, fmt, swap) TU6_FMT(vk, fmt, swap, FMT_VERTEX | FMT_TEXTURE | FMT_COLOR)
#define TU6_xTC(vk, fmt, swap) TU6_FMT(vk, fmt, swap, FMT_TEXTURE | FMT_COLOR)
#define TU6_Vxx(vk, fmt, swap) TU6_FMT(vk, fmt, swap, FMT_VERTEX)
#define TU6_xTx(vk, fmt, swap) TU6_FMT(vk, fmt, swap, FMT_TEXTURE)
/* Unsupported format: the fmt and swap arguments are ignored, and the entry
 * is emitted with FMT6_x, WZYX and an empty capability mask.
 */
#define TU6_xxx(vk, fmt, swap) TU6_FMT(vk, x, WZYX, 0)
49
50 static const struct tu_native_format tu6_format_table[] = {
51 TU6_xxx(UNDEFINED, x, x), /* 0 */
52
53 /* 8-bit packed */
54 TU6_xxx(R4G4_UNORM_PACK8, 4_4_UNORM, WZXY), /* 1 */
55
56 /* 16-bit packed */
57 TU6_xTC(R4G4B4A4_UNORM_PACK16, 4_4_4_4_UNORM, XYZW), /* 2 */
58 TU6_xTC(B4G4R4A4_UNORM_PACK16, 4_4_4_4_UNORM, ZYXW), /* 3 */
59 TU6_xTC(R5G6B5_UNORM_PACK16, 5_6_5_UNORM, WXYZ), /* 4 */
60 TU6_xTC(B5G6R5_UNORM_PACK16, 5_6_5_UNORM, WZYX), /* 5 */
61 TU6_xTC(R5G5B5A1_UNORM_PACK16, 5_5_5_1_UNORM, XYZW), /* 6 */
62 TU6_xTC(B5G5R5A1_UNORM_PACK16, 5_5_5_1_UNORM, ZYXW), /* 7 */
63 TU6_xTC(A1R5G5B5_UNORM_PACK16, 5_5_5_1_UNORM, WXYZ), /* 8 */
64
65 /* 8-bit R */
66 TU6_VTC(R8_UNORM, 8_UNORM, WZYX), /* 9 */
67 TU6_VTC(R8_SNORM, 8_SNORM, WZYX), /* 10 */
68 TU6_Vxx(R8_USCALED, 8_UINT, WZYX), /* 11 */
69 TU6_Vxx(R8_SSCALED, 8_SINT, WZYX), /* 12 */
70 TU6_VTC(R8_UINT, 8_UINT, WZYX), /* 13 */
71 TU6_VTC(R8_SINT, 8_SINT, WZYX), /* 14 */
72 TU6_xTC(R8_SRGB, 8_UNORM, WZYX), /* 15 */
73
74 /* 16-bit RG */
75 TU6_VTC(R8G8_UNORM, 8_8_UNORM, WZYX), /* 16 */
76 TU6_VTC(R8G8_SNORM, 8_8_SNORM, WZYX), /* 17 */
77 TU6_Vxx(R8G8_USCALED, 8_8_UINT, WZYX), /* 18 */
78 TU6_Vxx(R8G8_SSCALED, 8_8_SINT, WZYX), /* 19 */
79 TU6_VTC(R8G8_UINT, 8_8_UINT, WZYX), /* 20 */
80 TU6_VTC(R8G8_SINT, 8_8_SINT, WZYX), /* 21 */
81 TU6_xTC(R8G8_SRGB, 8_8_UNORM, WZYX), /* 22 */
82
83 /* 24-bit RGB */
84 TU6_Vxx(R8G8B8_UNORM, 8_8_8_UNORM, WZYX), /* 23 */
85 TU6_Vxx(R8G8B8_SNORM, 8_8_8_SNORM, WZYX), /* 24 */
86 TU6_Vxx(R8G8B8_USCALED, 8_8_8_UINT, WZYX), /* 25 */
87 TU6_Vxx(R8G8B8_SSCALED, 8_8_8_SINT, WZYX), /* 26 */
88 TU6_Vxx(R8G8B8_UINT, 8_8_8_UINT, WZYX), /* 27 */
89 TU6_Vxx(R8G8B8_SINT, 8_8_8_SINT, WZYX), /* 28 */
90 TU6_xxx(R8G8B8_SRGB, 8_8_8_UNORM, WZYX), /* 29 */
91
92 /* 24-bit BGR */
93 TU6_xxx(B8G8R8_UNORM, 8_8_8_UNORM, WXYZ), /* 30 */
94 TU6_xxx(B8G8R8_SNORM, 8_8_8_SNORM, WXYZ), /* 31 */
95 TU6_xxx(B8G8R8_USCALED, 8_8_8_UINT, WXYZ), /* 32 */
96 TU6_xxx(B8G8R8_SSCALED, 8_8_8_SINT, WXYZ), /* 33 */
97 TU6_xxx(B8G8R8_UINT, 8_8_8_UINT, WXYZ), /* 34 */
98 TU6_xxx(B8G8R8_SINT, 8_8_8_SINT, WXYZ), /* 35 */
99 TU6_xxx(B8G8R8_SRGB, 8_8_8_UNORM, WXYZ), /* 36 */
100
101 /* 32-bit RGBA */
102 TU6_VTC(R8G8B8A8_UNORM, 8_8_8_8_UNORM, WZYX), /* 37 */
103 TU6_VTC(R8G8B8A8_SNORM, 8_8_8_8_SNORM, WZYX), /* 38 */
104 TU6_Vxx(R8G8B8A8_USCALED, 8_8_8_8_UINT, WZYX), /* 39 */
105 TU6_Vxx(R8G8B8A8_SSCALED, 8_8_8_8_SINT, WZYX), /* 40 */
106 TU6_VTC(R8G8B8A8_UINT, 8_8_8_8_UINT, WZYX), /* 41 */
107 TU6_VTC(R8G8B8A8_SINT, 8_8_8_8_SINT, WZYX), /* 42 */
108 TU6_xTC(R8G8B8A8_SRGB, 8_8_8_8_UNORM, WZYX), /* 43 */
109
110 /* 32-bit BGRA */
111 TU6_VTC(B8G8R8A8_UNORM, 8_8_8_8_UNORM, WXYZ), /* 44 */
112 TU6_VTC(B8G8R8A8_SNORM, 8_8_8_8_SNORM, WXYZ), /* 45 */
113 TU6_Vxx(B8G8R8A8_USCALED, 8_8_8_8_UINT, WXYZ), /* 46 */
114 TU6_Vxx(B8G8R8A8_SSCALED, 8_8_8_8_SINT, WXYZ), /* 47 */
115 TU6_VTC(B8G8R8A8_UINT, 8_8_8_8_UINT, WXYZ), /* 48 */
116 TU6_VTC(B8G8R8A8_SINT, 8_8_8_8_SINT, WXYZ), /* 49 */
117 TU6_xTC(B8G8R8A8_SRGB, 8_8_8_8_UNORM, WXYZ), /* 50 */
118
119 /* 32-bit packed */
120 TU6_VTC(A8B8G8R8_UNORM_PACK32, 8_8_8_8_UNORM, WZYX), /* 51 */
121 TU6_VTC(A8B8G8R8_SNORM_PACK32, 8_8_8_8_SNORM, WZYX), /* 52 */
122 TU6_Vxx(A8B8G8R8_USCALED_PACK32, 8_8_8_8_UINT, WZYX), /* 53 */
123 TU6_Vxx(A8B8G8R8_SSCALED_PACK32, 8_8_8_8_SINT, WZYX), /* 54 */
124 TU6_VTC(A8B8G8R8_UINT_PACK32, 8_8_8_8_UINT, WZYX), /* 55 */
125 TU6_VTC(A8B8G8R8_SINT_PACK32, 8_8_8_8_SINT, WZYX), /* 56 */
126 TU6_xTC(A8B8G8R8_SRGB_PACK32, 8_8_8_8_UNORM, WZYX), /* 57 */
127 TU6_VTC(A2R10G10B10_UNORM_PACK32, 10_10_10_2_UNORM, WXYZ), /* 58 */
128 TU6_Vxx(A2R10G10B10_SNORM_PACK32, 10_10_10_2_SNORM, WXYZ), /* 59 */
129 TU6_Vxx(A2R10G10B10_USCALED_PACK32, 10_10_10_2_UINT, WXYZ), /* 60 */
130 TU6_Vxx(A2R10G10B10_SSCALED_PACK32, 10_10_10_2_SINT, WXYZ), /* 61 */
131 TU6_VTC(A2R10G10B10_UINT_PACK32, 10_10_10_2_UINT, WXYZ), /* 62 */
132 TU6_Vxx(A2R10G10B10_SINT_PACK32, 10_10_10_2_SINT, WXYZ), /* 63 */
133 TU6_VTC(A2B10G10R10_UNORM_PACK32, 10_10_10_2_UNORM, WZYX), /* 64 */
134 TU6_Vxx(A2B10G10R10_SNORM_PACK32, 10_10_10_2_SNORM, WZYX), /* 65 */
135 TU6_Vxx(A2B10G10R10_USCALED_PACK32, 10_10_10_2_UINT, WZYX), /* 66 */
136 TU6_Vxx(A2B10G10R10_SSCALED_PACK32, 10_10_10_2_SINT, WZYX), /* 67 */
137 TU6_VTC(A2B10G10R10_UINT_PACK32, 10_10_10_2_UINT, WZYX), /* 68 */
138 TU6_Vxx(A2B10G10R10_SINT_PACK32, 10_10_10_2_SINT, WZYX), /* 69 */
139
140 /* 16-bit R */
141 TU6_VTC(R16_UNORM, 16_UNORM, WZYX), /* 70 */
142 TU6_VTC(R16_SNORM, 16_SNORM, WZYX), /* 71 */
143 TU6_Vxx(R16_USCALED, 16_UINT, WZYX), /* 72 */
144 TU6_Vxx(R16_SSCALED, 16_SINT, WZYX), /* 73 */
145 TU6_VTC(R16_UINT, 16_UINT, WZYX), /* 74 */
146 TU6_VTC(R16_SINT, 16_SINT, WZYX), /* 75 */
147 TU6_VTC(R16_SFLOAT, 16_FLOAT, WZYX), /* 76 */
148
149 /* 32-bit RG */
150 TU6_VTC(R16G16_UNORM, 16_16_UNORM, WZYX), /* 77 */
151 TU6_VTC(R16G16_SNORM, 16_16_SNORM, WZYX), /* 78 */
152 TU6_Vxx(R16G16_USCALED, 16_16_UINT, WZYX), /* 79 */
153 TU6_Vxx(R16G16_SSCALED, 16_16_SINT, WZYX), /* 80 */
154 TU6_VTC(R16G16_UINT, 16_16_UINT, WZYX), /* 81 */
155 TU6_VTC(R16G16_SINT, 16_16_SINT, WZYX), /* 82 */
156 TU6_VTC(R16G16_SFLOAT, 16_16_FLOAT, WZYX), /* 83 */
157
158 /* 48-bit RGB */
159 TU6_Vxx(R16G16B16_UNORM, 16_16_16_UNORM, WZYX), /* 84 */
160 TU6_Vxx(R16G16B16_SNORM, 16_16_16_SNORM, WZYX), /* 85 */
161 TU6_Vxx(R16G16B16_USCALED, 16_16_16_UINT, WZYX), /* 86 */
162 TU6_Vxx(R16G16B16_SSCALED, 16_16_16_SINT, WZYX), /* 87 */
163 TU6_Vxx(R16G16B16_UINT, 16_16_16_UINT, WZYX), /* 88 */
164 TU6_Vxx(R16G16B16_SINT, 16_16_16_SINT, WZYX), /* 89 */
165 TU6_Vxx(R16G16B16_SFLOAT, 16_16_16_FLOAT, WZYX), /* 90 */
166
167 /* 64-bit RGBA */
168 TU6_VTC(R16G16B16A16_UNORM, 16_16_16_16_UNORM, WZYX), /* 91 */
169 TU6_VTC(R16G16B16A16_SNORM, 16_16_16_16_SNORM, WZYX), /* 92 */
170 TU6_Vxx(R16G16B16A16_USCALED, 16_16_16_16_UINT, WZYX), /* 93 */
171 TU6_Vxx(R16G16B16A16_SSCALED, 16_16_16_16_SINT, WZYX), /* 94 */
172 TU6_VTC(R16G16B16A16_UINT, 16_16_16_16_UINT, WZYX), /* 95 */
173 TU6_VTC(R16G16B16A16_SINT, 16_16_16_16_SINT, WZYX), /* 96 */
174 TU6_VTC(R16G16B16A16_SFLOAT, 16_16_16_16_FLOAT, WZYX), /* 97 */
175
176 /* 32-bit R */
177 TU6_VTC(R32_UINT, 32_UINT, WZYX), /* 98 */
178 TU6_VTC(R32_SINT, 32_SINT, WZYX), /* 99 */
179 TU6_VTC(R32_SFLOAT, 32_FLOAT, WZYX), /* 100 */
180
181 /* 64-bit RG */
182 TU6_VTC(R32G32_UINT, 32_32_UINT, WZYX), /* 101 */
183 TU6_VTC(R32G32_SINT, 32_32_SINT, WZYX), /* 102 */
184 TU6_VTC(R32G32_SFLOAT, 32_32_FLOAT, WZYX), /* 103 */
185
186 /* 96-bit RGB */
187 TU6_Vxx(R32G32B32_UINT, 32_32_32_UINT, WZYX), /* 104 */
188 TU6_Vxx(R32G32B32_SINT, 32_32_32_SINT, WZYX), /* 105 */
189 TU6_Vxx(R32G32B32_SFLOAT, 32_32_32_FLOAT, WZYX), /* 106 */
190
191 /* 128-bit RGBA */
192 TU6_VTC(R32G32B32A32_UINT, 32_32_32_32_UINT, WZYX), /* 107 */
193 TU6_VTC(R32G32B32A32_SINT, 32_32_32_32_SINT, WZYX), /* 108 */
194 TU6_VTC(R32G32B32A32_SFLOAT, 32_32_32_32_FLOAT, WZYX), /* 109 */
195
196 /* 64-bit R */
197 TU6_xxx(R64_UINT, 64_UINT, WZYX), /* 110 */
198 TU6_xxx(R64_SINT, 64_SINT, WZYX), /* 111 */
199 TU6_xxx(R64_SFLOAT, 64_FLOAT, WZYX), /* 112 */
200
201 /* 128-bit RG */
202 TU6_xxx(R64G64_UINT, 64_64_UINT, WZYX), /* 113 */
203 TU6_xxx(R64G64_SINT, 64_64_SINT, WZYX), /* 114 */
204 TU6_xxx(R64G64_SFLOAT, 64_64_FLOAT, WZYX), /* 115 */
205
206 /* 192-bit RGB */
207 TU6_xxx(R64G64B64_UINT, 64_64_64_UINT, WZYX), /* 116 */
208 TU6_xxx(R64G64B64_SINT, 64_64_64_SINT, WZYX), /* 117 */
209 TU6_xxx(R64G64B64_SFLOAT, 64_64_64_FLOAT, WZYX), /* 118 */
210
211 /* 256-bit RGBA */
212 TU6_xxx(R64G64B64A64_UINT, 64_64_64_64_UINT, WZYX), /* 119 */
213 TU6_xxx(R64G64B64A64_SINT, 64_64_64_64_SINT, WZYX), /* 120 */
214 TU6_xxx(R64G64B64A64_SFLOAT, 64_64_64_64_FLOAT, WZYX), /* 121 */
215
216 /* 32-bit packed float */
217 TU6_VTC(B10G11R11_UFLOAT_PACK32, 11_11_10_FLOAT, WZYX), /* 122 */
218 TU6_xTx(E5B9G9R9_UFLOAT_PACK32, 9_9_9_E5_FLOAT, WZYX), /* 123 */
219
220 /* depth/stencil */
221 TU6_xTC(D16_UNORM, 16_UNORM, WZYX), /* 124 */
222 TU6_xTC(X8_D24_UNORM_PACK32, Z24_UNORM_S8_UINT_AS_R8G8B8A8, WZYX), /* 125 */
223 TU6_xTC(D32_SFLOAT, 32_FLOAT, WZYX), /* 126 */
224 TU6_xTC(S8_UINT, 8_UINT, WZYX), /* 127 */
225 TU6_xxx(D16_UNORM_S8_UINT, X8Z16_UNORM, WZYX), /* 128 */
226 TU6_xTC(D24_UNORM_S8_UINT, Z24_UNORM_S8_UINT_AS_R8G8B8A8, WZYX), /* 129 */
227 TU6_xxx(D32_SFLOAT_S8_UINT, x, WZYX), /* 130 */
228
229 /* compressed */
230 TU6_xTx(BC1_RGB_UNORM_BLOCK, DXT1, WZYX), /* 131 */
231 TU6_xTx(BC1_RGB_SRGB_BLOCK, DXT1, WZYX), /* 132 */
232 TU6_xTx(BC1_RGBA_UNORM_BLOCK, DXT1, WZYX), /* 133 */
233 TU6_xTx(BC1_RGBA_SRGB_BLOCK, DXT1, WZYX), /* 134 */
234 TU6_xTx(BC2_UNORM_BLOCK, DXT3, WZYX), /* 135 */
235 TU6_xTx(BC2_SRGB_BLOCK, DXT3, WZYX), /* 136 */
236 TU6_xTx(BC3_UNORM_BLOCK, DXT5, WZYX), /* 137 */
237 TU6_xTx(BC3_SRGB_BLOCK, DXT5, WZYX), /* 138 */
238 TU6_xTx(BC4_UNORM_BLOCK, RGTC1_UNORM, WZYX), /* 139 */
239 TU6_xTx(BC4_SNORM_BLOCK, RGTC1_SNORM, WZYX), /* 140 */
240 TU6_xTx(BC5_UNORM_BLOCK, RGTC2_UNORM, WZYX), /* 141 */
241 TU6_xTx(BC5_SNORM_BLOCK, RGTC2_SNORM, WZYX), /* 142 */
242 TU6_xTx(BC6H_UFLOAT_BLOCK, BPTC_UFLOAT, WZYX), /* 143 */
243 TU6_xTx(BC6H_SFLOAT_BLOCK, BPTC_FLOAT, WZYX), /* 144 */
244 TU6_xTx(BC7_UNORM_BLOCK, BPTC, WZYX), /* 145 */
245 TU6_xTx(BC7_SRGB_BLOCK, BPTC, WZYX), /* 146 */
246 TU6_xTx(ETC2_R8G8B8_UNORM_BLOCK, ETC2_RGB8, WZYX), /* 147 */
247 TU6_xTx(ETC2_R8G8B8_SRGB_BLOCK, ETC2_RGB8, WZYX), /* 148 */
248 TU6_xTx(ETC2_R8G8B8A1_UNORM_BLOCK, ETC2_RGB8A1, WZYX), /* 149 */
249 TU6_xTx(ETC2_R8G8B8A1_SRGB_BLOCK, ETC2_RGB8A1, WZYX), /* 150 */
250 TU6_xTx(ETC2_R8G8B8A8_UNORM_BLOCK, ETC2_RGBA8, WZYX), /* 151 */
251 TU6_xTx(ETC2_R8G8B8A8_SRGB_BLOCK, ETC2_RGBA8, WZYX), /* 152 */
252 TU6_xTx(EAC_R11_UNORM_BLOCK, ETC2_R11_UNORM, WZYX), /* 153 */
253 TU6_xTx(EAC_R11_SNORM_BLOCK, ETC2_R11_SNORM, WZYX), /* 154 */
254 TU6_xTx(EAC_R11G11_UNORM_BLOCK, ETC2_RG11_UNORM, WZYX), /* 155 */
255 TU6_xTx(EAC_R11G11_SNORM_BLOCK, ETC2_RG11_SNORM, WZYX), /* 156 */
256 TU6_xTx(ASTC_4x4_UNORM_BLOCK, ASTC_4x4, WZYX), /* 157 */
257 TU6_xTx(ASTC_4x4_SRGB_BLOCK, ASTC_4x4, WZYX), /* 158 */
258 TU6_xTx(ASTC_5x4_UNORM_BLOCK, ASTC_5x4, WZYX), /* 159 */
259 TU6_xTx(ASTC_5x4_SRGB_BLOCK, ASTC_5x4, WZYX), /* 160 */
260 TU6_xTx(ASTC_5x5_UNORM_BLOCK, ASTC_5x5, WZYX), /* 161 */
261 TU6_xTx(ASTC_5x5_SRGB_BLOCK, ASTC_5x5, WZYX), /* 162 */
262 TU6_xTx(ASTC_6x5_UNORM_BLOCK, ASTC_6x5, WZYX), /* 163 */
263 TU6_xTx(ASTC_6x5_SRGB_BLOCK, ASTC_6x5, WZYX), /* 164 */
264 TU6_xTx(ASTC_6x6_UNORM_BLOCK, ASTC_6x6, WZYX), /* 165 */
265 TU6_xTx(ASTC_6x6_SRGB_BLOCK, ASTC_6x6, WZYX), /* 166 */
266 TU6_xTx(ASTC_8x5_UNORM_BLOCK, ASTC_8x5, WZYX), /* 167 */
267 TU6_xTx(ASTC_8x5_SRGB_BLOCK, ASTC_8x5, WZYX), /* 168 */
268 TU6_xTx(ASTC_8x6_UNORM_BLOCK, ASTC_8x6, WZYX), /* 169 */
269 TU6_xTx(ASTC_8x6_SRGB_BLOCK, ASTC_8x6, WZYX), /* 170 */
270 TU6_xTx(ASTC_8x8_UNORM_BLOCK, ASTC_8x8, WZYX), /* 171 */
271 TU6_xTx(ASTC_8x8_SRGB_BLOCK, ASTC_8x8, WZYX), /* 172 */
272 TU6_xTx(ASTC_10x5_UNORM_BLOCK, ASTC_10x5, WZYX), /* 173 */
273 TU6_xTx(ASTC_10x5_SRGB_BLOCK, ASTC_10x5, WZYX), /* 174 */
274 TU6_xTx(ASTC_10x6_UNORM_BLOCK, ASTC_10x6, WZYX), /* 175 */
275 TU6_xTx(ASTC_10x6_SRGB_BLOCK, ASTC_10x6, WZYX), /* 176 */
276 TU6_xTx(ASTC_10x8_UNORM_BLOCK, ASTC_10x8, WZYX), /* 177 */
277 TU6_xTx(ASTC_10x8_SRGB_BLOCK, ASTC_10x8, WZYX), /* 178 */
278 TU6_xTx(ASTC_10x10_UNORM_BLOCK, ASTC_10x10, WZYX), /* 179 */
279 TU6_xTx(ASTC_10x10_SRGB_BLOCK, ASTC_10x10, WZYX), /* 180 */
280 TU6_xTx(ASTC_12x10_UNORM_BLOCK, ASTC_12x10, WZYX), /* 181 */
281 TU6_xTx(ASTC_12x10_SRGB_BLOCK, ASTC_12x10, WZYX), /* 182 */
282 TU6_xTx(ASTC_12x12_UNORM_BLOCK, ASTC_12x12, WZYX), /* 183 */
283 TU6_xTx(ASTC_12x12_SRGB_BLOCK, ASTC_12x12, WZYX), /* 184 */
284 };
285
286 static struct tu_native_format
287 tu6_get_native_format(VkFormat format)
288 {
289 struct tu_native_format fmt = {};
290
291 if (format >= ARRAY_SIZE(tu6_format_table))
292 return fmt;
293
294 if (!tu6_format_table[format].supported)
295 return fmt;
296
297 if (vk_format_to_pipe_format(format) == PIPE_FORMAT_NONE) {
298 tu_finishme("vk_format %d missing matching pipe format.\n", format);
299 return fmt;
300 }
301
302 return tu6_format_table[format];
303 }
304
305 struct tu_native_format
306 tu6_format_vtx(VkFormat format)
307 {
308 struct tu_native_format fmt = tu6_get_native_format(format);
309 assert(fmt.supported & FMT_VERTEX);
310 return fmt;
311 }
312
313 struct tu_native_format
314 tu6_format_color(VkFormat format, enum a6xx_tile_mode tile_mode)
315 {
316 struct tu_native_format fmt = tu6_get_native_format(format);
317 assert(fmt.supported & FMT_COLOR);
318
319 if (fmt.fmt == FMT6_10_10_10_2_UNORM)
320 fmt.fmt = FMT6_10_10_10_2_UNORM_DEST;
321
322 if (tile_mode)
323 fmt.swap = WZYX;
324
325 return fmt;
326 }
327
328 struct tu_native_format
329 tu6_format_texture(VkFormat format, enum a6xx_tile_mode tile_mode)
330 {
331 struct tu_native_format fmt = tu6_get_native_format(format);
332 assert(fmt.supported & FMT_TEXTURE);
333
334 if (!tile_mode) {
335 /* different from format table when used as linear src */
336 if (format == VK_FORMAT_R5G5B5A1_UNORM_PACK16)
337 fmt.fmt = FMT6_1_5_5_5_UNORM, fmt.swap = WXYZ;
338 if (format == VK_FORMAT_B5G5R5A1_UNORM_PACK16)
339 fmt.fmt = FMT6_1_5_5_5_UNORM, fmt.swap = WZYX;
340 } else {
341 fmt.swap = WZYX;
342 }
343
344 return fmt;
345 }
346
347 enum a6xx_depth_format
348 tu6_pipe2depth(VkFormat format)
349 {
350 switch (format) {
351 case VK_FORMAT_D16_UNORM:
352 return DEPTH6_16;
353 case VK_FORMAT_X8_D24_UNORM_PACK32:
354 case VK_FORMAT_D24_UNORM_S8_UINT:
355 return DEPTH6_24_8;
356 case VK_FORMAT_D32_SFLOAT:
357 return DEPTH6_32;
358 default:
359 return ~0;
360 }
361 }
362
363 static void
364 tu_physical_device_get_format_properties(
365 struct tu_physical_device *physical_device,
366 VkFormat format,
367 VkFormatProperties *out_properties)
368 {
369 VkFormatFeatureFlags linear = 0, optimal = 0, buffer = 0;
370 const struct util_format_description *desc = vk_format_description(format);
371 const struct tu_native_format native_fmt = tu6_get_native_format(format);
372 if (!desc || !native_fmt.supported) {
373 goto end;
374 }
375
376 buffer |= VK_FORMAT_FEATURE_TRANSFER_SRC_BIT | VK_FORMAT_FEATURE_TRANSFER_DST_BIT;
377 if (native_fmt.supported & FMT_VERTEX)
378 buffer |= VK_FORMAT_FEATURE_VERTEX_BUFFER_BIT;
379
380 if (native_fmt.supported & FMT_TEXTURE) {
381 optimal |= VK_FORMAT_FEATURE_TRANSFER_SRC_BIT |
382 VK_FORMAT_FEATURE_TRANSFER_DST_BIT |
383 VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT |
384 VK_FORMAT_FEATURE_SAMPLED_IMAGE_FILTER_LINEAR_BIT;
385 buffer |= VK_FORMAT_FEATURE_UNIFORM_TEXEL_BUFFER_BIT;
386 }
387
388 if (native_fmt.supported & FMT_COLOR) {
389 assert(native_fmt.supported & FMT_TEXTURE);
390 optimal |= VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT |
391 VK_FORMAT_FEATURE_BLIT_SRC_BIT |
392 VK_FORMAT_FEATURE_BLIT_DST_BIT;
393 }
394
395 /* For the most part, we can do anything with a linear image that we could
396 * do with a tiled image. However, we can't support sysmem rendering with a
397 * linear depth texture, because we don't know if there's a bit to control
398 * the tiling of the depth buffer in BYPASS mode, and the blob also
399 * disables linear depth rendering, so there's no way to discover it. We
400 * also can't force GMEM mode, because there are other situations where we
401 * have to use sysmem rendering. So follow the blob here, and only enable
402 * DEPTH_STENCIL_ATTACHMENT_BIT for the optimal features.
403 */
404 linear = optimal;
405 if (tu6_pipe2depth(format) != (enum a6xx_depth_format)~0)
406 optimal |= VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT;
407
408 end:
409 out_properties->linearTilingFeatures = linear;
410 out_properties->optimalTilingFeatures = optimal;
411 out_properties->bufferFeatures = buffer;
412 }
413
414 void
415 tu_GetPhysicalDeviceFormatProperties(VkPhysicalDevice physicalDevice,
416 VkFormat format,
417 VkFormatProperties *pFormatProperties)
418 {
419 TU_FROM_HANDLE(tu_physical_device, physical_device, physicalDevice);
420
421 tu_physical_device_get_format_properties(physical_device, format,
422 pFormatProperties);
423 }
424
425 void
426 tu_GetPhysicalDeviceFormatProperties2(
427 VkPhysicalDevice physicalDevice,
428 VkFormat format,
429 VkFormatProperties2 *pFormatProperties)
430 {
431 TU_FROM_HANDLE(tu_physical_device, physical_device, physicalDevice);
432
433 tu_physical_device_get_format_properties(
434 physical_device, format, &pFormatProperties->formatProperties);
435
436 VkDrmFormatModifierPropertiesListEXT *list =
437 vk_find_struct(pFormatProperties->pNext, DRM_FORMAT_MODIFIER_PROPERTIES_LIST_EXT);
438 if (list) {
439 VK_OUTARRAY_MAKE(out, list->pDrmFormatModifierProperties,
440 &list->drmFormatModifierCount);
441
442 vk_outarray_append(&out, mod_props) {
443 mod_props->drmFormatModifier = DRM_FORMAT_MOD_LINEAR;
444 mod_props->drmFormatModifierPlaneCount = 1;
445 }
446
447 /* TODO: any cases where this should be disabled? */
448 vk_outarray_append(&out, mod_props) {
449 mod_props->drmFormatModifier = DRM_FORMAT_MOD_QCOM_COMPRESSED;
450 mod_props->drmFormatModifierPlaneCount = 1;
451 }
452 }
453 }
454
455 static VkResult
456 tu_get_image_format_properties(
457 struct tu_physical_device *physical_device,
458 const VkPhysicalDeviceImageFormatInfo2 *info,
459 VkImageFormatProperties *pImageFormatProperties)
460
461 {
462 VkFormatProperties format_props;
463 VkFormatFeatureFlags format_feature_flags;
464 VkExtent3D maxExtent;
465 uint32_t maxMipLevels;
466 uint32_t maxArraySize;
467 VkSampleCountFlags sampleCounts = VK_SAMPLE_COUNT_1_BIT;
468
469 tu_physical_device_get_format_properties(physical_device, info->format,
470 &format_props);
471
472 switch (info->tiling) {
473 case VK_IMAGE_TILING_LINEAR:
474 format_feature_flags = format_props.linearTilingFeatures;
475 break;
476
477 case VK_IMAGE_TILING_DRM_FORMAT_MODIFIER_EXT:
478 /* The only difference between optimal and linear is currently whether
479 * depth/stencil attachments are allowed on depth/stencil formats.
480 * There's no reason to allow importing depth/stencil textures, so just
481 * disallow it and then this annoying edge case goes away.
482 *
483 * TODO: If anyone cares, we could enable this by looking at the
484 * modifier and checking if it's LINEAR or not.
485 */
486 if (vk_format_is_depth_or_stencil(info->format))
487 goto unsupported;
488
489 assert(format_props.optimalTilingFeatures == format_props.linearTilingFeatures);
490 /* fallthrough */
491 case VK_IMAGE_TILING_OPTIMAL:
492 format_feature_flags = format_props.optimalTilingFeatures;
493 break;
494 default:
495 unreachable("bad VkPhysicalDeviceImageFormatInfo2");
496 }
497
498 if (format_feature_flags == 0)
499 goto unsupported;
500
501 if (info->type != VK_IMAGE_TYPE_2D &&
502 vk_format_is_depth_or_stencil(info->format))
503 goto unsupported;
504
505 switch (info->type) {
506 default:
507 unreachable("bad vkimage type\n");
508 case VK_IMAGE_TYPE_1D:
509 maxExtent.width = 16384;
510 maxExtent.height = 1;
511 maxExtent.depth = 1;
512 maxMipLevels = 15; /* log2(maxWidth) + 1 */
513 maxArraySize = 2048;
514 break;
515 case VK_IMAGE_TYPE_2D:
516 maxExtent.width = 16384;
517 maxExtent.height = 16384;
518 maxExtent.depth = 1;
519 maxMipLevels = 15; /* log2(maxWidth) + 1 */
520 maxArraySize = 2048;
521 break;
522 case VK_IMAGE_TYPE_3D:
523 maxExtent.width = 2048;
524 maxExtent.height = 2048;
525 maxExtent.depth = 2048;
526 maxMipLevels = 12; /* log2(maxWidth) + 1 */
527 maxArraySize = 1;
528 break;
529 }
530
531 if (info->tiling == VK_IMAGE_TILING_OPTIMAL &&
532 info->type == VK_IMAGE_TYPE_2D &&
533 (format_feature_flags &
534 (VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT |
535 VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT)) &&
536 !(info->flags & VK_IMAGE_CREATE_CUBE_COMPATIBLE_BIT) &&
537 !(info->usage & VK_IMAGE_USAGE_STORAGE_BIT)) {
538 sampleCounts |= VK_SAMPLE_COUNT_2_BIT | VK_SAMPLE_COUNT_4_BIT;
539 /* note: most operations support 8 samples (GMEM render/resolve do at least)
540 * but some do not (which ones?), just disable 8 samples completely,
541 * (no 8x msaa matches the blob driver behavior)
542 */
543 }
544
545 if (info->usage & VK_IMAGE_USAGE_SAMPLED_BIT) {
546 if (!(format_feature_flags & VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT)) {
547 goto unsupported;
548 }
549 }
550
551 if (info->usage & VK_IMAGE_USAGE_STORAGE_BIT) {
552 if (!(format_feature_flags & VK_FORMAT_FEATURE_STORAGE_IMAGE_BIT)) {
553 goto unsupported;
554 }
555 }
556
557 if (info->usage & VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT) {
558 if (!(format_feature_flags & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT)) {
559 goto unsupported;
560 }
561 }
562
563 if (info->usage & VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT) {
564 if (!(format_feature_flags &
565 VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT)) {
566 goto unsupported;
567 }
568 }
569
570 *pImageFormatProperties = (VkImageFormatProperties) {
571 .maxExtent = maxExtent,
572 .maxMipLevels = maxMipLevels,
573 .maxArrayLayers = maxArraySize,
574 .sampleCounts = sampleCounts,
575
576 /* FINISHME: Accurately calculate
577 * VkImageFormatProperties::maxResourceSize.
578 */
579 .maxResourceSize = UINT32_MAX,
580 };
581
582 return VK_SUCCESS;
583 unsupported:
584 *pImageFormatProperties = (VkImageFormatProperties) {
585 .maxExtent = { 0, 0, 0 },
586 .maxMipLevels = 0,
587 .maxArrayLayers = 0,
588 .sampleCounts = 0,
589 .maxResourceSize = 0,
590 };
591
592 return VK_ERROR_FORMAT_NOT_SUPPORTED;
593 }
594
595 VkResult
596 tu_GetPhysicalDeviceImageFormatProperties(
597 VkPhysicalDevice physicalDevice,
598 VkFormat format,
599 VkImageType type,
600 VkImageTiling tiling,
601 VkImageUsageFlags usage,
602 VkImageCreateFlags createFlags,
603 VkImageFormatProperties *pImageFormatProperties)
604 {
605 TU_FROM_HANDLE(tu_physical_device, physical_device, physicalDevice);
606
607 const VkPhysicalDeviceImageFormatInfo2 info = {
608 .sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_IMAGE_FORMAT_INFO_2,
609 .pNext = NULL,
610 .format = format,
611 .type = type,
612 .tiling = tiling,
613 .usage = usage,
614 .flags = createFlags,
615 };
616
617 return tu_get_image_format_properties(physical_device, &info,
618 pImageFormatProperties);
619 }
620
621 static VkResult
622 tu_get_external_image_format_properties(
623 const struct tu_physical_device *physical_device,
624 const VkPhysicalDeviceImageFormatInfo2 *pImageFormatInfo,
625 VkExternalMemoryHandleTypeFlagBits handleType,
626 VkExternalMemoryProperties *external_properties)
627 {
628 VkExternalMemoryFeatureFlagBits flags = 0;
629 VkExternalMemoryHandleTypeFlags export_flags = 0;
630 VkExternalMemoryHandleTypeFlags compat_flags = 0;
631
632 /* From the Vulkan 1.1.98 spec:
633 *
634 * If handleType is not compatible with the format, type, tiling,
635 * usage, and flags specified in VkPhysicalDeviceImageFormatInfo2,
636 * then vkGetPhysicalDeviceImageFormatProperties2 returns
637 * VK_ERROR_FORMAT_NOT_SUPPORTED.
638 */
639
640 switch (handleType) {
641 case VK_EXTERNAL_MEMORY_HANDLE_TYPE_OPAQUE_FD_BIT:
642 case VK_EXTERNAL_MEMORY_HANDLE_TYPE_DMA_BUF_BIT_EXT:
643 switch (pImageFormatInfo->type) {
644 case VK_IMAGE_TYPE_2D:
645 flags = VK_EXTERNAL_MEMORY_FEATURE_DEDICATED_ONLY_BIT |
646 VK_EXTERNAL_MEMORY_FEATURE_EXPORTABLE_BIT |
647 VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT;
648 compat_flags = export_flags =
649 VK_EXTERNAL_MEMORY_HANDLE_TYPE_OPAQUE_FD_BIT |
650 VK_EXTERNAL_MEMORY_HANDLE_TYPE_DMA_BUF_BIT_EXT;
651 break;
652 default:
653 return vk_errorf(physical_device->instance, VK_ERROR_FORMAT_NOT_SUPPORTED,
654 "VkExternalMemoryTypeFlagBits(0x%x) unsupported for VkImageType(%d)",
655 handleType, pImageFormatInfo->type);
656 }
657 break;
658 case VK_EXTERNAL_MEMORY_HANDLE_TYPE_HOST_ALLOCATION_BIT_EXT:
659 flags = VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT;
660 compat_flags = VK_EXTERNAL_MEMORY_HANDLE_TYPE_HOST_ALLOCATION_BIT_EXT;
661 break;
662 default:
663 return vk_errorf(physical_device->instance, VK_ERROR_FORMAT_NOT_SUPPORTED,
664 "VkExternalMemoryTypeFlagBits(0x%x) unsupported",
665 handleType);
666 }
667
668 *external_properties = (VkExternalMemoryProperties) {
669 .externalMemoryFeatures = flags,
670 .exportFromImportedHandleTypes = export_flags,
671 .compatibleHandleTypes = compat_flags,
672 };
673
674 return VK_SUCCESS;
675 }
676
677 VkResult
678 tu_GetPhysicalDeviceImageFormatProperties2(
679 VkPhysicalDevice physicalDevice,
680 const VkPhysicalDeviceImageFormatInfo2 *base_info,
681 VkImageFormatProperties2 *base_props)
682 {
683 TU_FROM_HANDLE(tu_physical_device, physical_device, physicalDevice);
684 const VkPhysicalDeviceExternalImageFormatInfo *external_info = NULL;
685 VkExternalImageFormatProperties *external_props = NULL;
686 VkResult result;
687
688 result = tu_get_image_format_properties(
689 physical_device, base_info, &base_props->imageFormatProperties);
690 if (result != VK_SUCCESS)
691 return result;
692
693 /* Extract input structs */
694 vk_foreach_struct_const(s, base_info->pNext)
695 {
696 switch (s->sType) {
697 case VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_EXTERNAL_IMAGE_FORMAT_INFO:
698 external_info = (const void *) s;
699 break;
700 default:
701 break;
702 }
703 }
704
705 /* Extract output structs */
706 vk_foreach_struct(s, base_props->pNext)
707 {
708 switch (s->sType) {
709 case VK_STRUCTURE_TYPE_EXTERNAL_IMAGE_FORMAT_PROPERTIES:
710 external_props = (void *) s;
711 break;
712 default:
713 break;
714 }
715 }
716
717 /* From the Vulkan 1.0.42 spec:
718 *
719 * If handleType is 0, vkGetPhysicalDeviceImageFormatProperties2 will
720 * behave as if VkPhysicalDeviceExternalImageFormatInfo was not
721 * present and VkExternalImageFormatProperties will be ignored.
722 */
723 if (external_info && external_info->handleType != 0) {
724 result = tu_get_external_image_format_properties(
725 physical_device, base_info, external_info->handleType,
726 &external_props->externalMemoryProperties);
727 if (result != VK_SUCCESS)
728 goto fail;
729 }
730
731 return VK_SUCCESS;
732
733 fail:
734 if (result == VK_ERROR_FORMAT_NOT_SUPPORTED) {
735 /* From the Vulkan 1.0.42 spec:
736 *
737 * If the combination of parameters to
738 * vkGetPhysicalDeviceImageFormatProperties2 is not supported by
739 * the implementation for use in vkCreateImage, then all members of
740 * imageFormatProperties will be filled with zero.
741 */
742 base_props->imageFormatProperties = (VkImageFormatProperties) { 0 };
743 }
744
745 return result;
746 }
747
748 void
749 tu_GetPhysicalDeviceSparseImageFormatProperties(
750 VkPhysicalDevice physicalDevice,
751 VkFormat format,
752 VkImageType type,
753 uint32_t samples,
754 VkImageUsageFlags usage,
755 VkImageTiling tiling,
756 uint32_t *pNumProperties,
757 VkSparseImageFormatProperties *pProperties)
758 {
759 /* Sparse images are not yet supported. */
760 *pNumProperties = 0;
761 }
762
763 void
764 tu_GetPhysicalDeviceSparseImageFormatProperties2(
765 VkPhysicalDevice physicalDevice,
766 const VkPhysicalDeviceSparseImageFormatInfo2 *pFormatInfo,
767 uint32_t *pPropertyCount,
768 VkSparseImageFormatProperties2 *pProperties)
769 {
770 /* Sparse images are not yet supported. */
771 *pPropertyCount = 0;
772 }
773
774 void
775 tu_GetPhysicalDeviceExternalBufferProperties(
776 VkPhysicalDevice physicalDevice,
777 const VkPhysicalDeviceExternalBufferInfo *pExternalBufferInfo,
778 VkExternalBufferProperties *pExternalBufferProperties)
779 {
780 VkExternalMemoryFeatureFlagBits flags = 0;
781 VkExternalMemoryHandleTypeFlags export_flags = 0;
782 VkExternalMemoryHandleTypeFlags compat_flags = 0;
783 switch (pExternalBufferInfo->handleType) {
784 case VK_EXTERNAL_MEMORY_HANDLE_TYPE_OPAQUE_FD_BIT:
785 case VK_EXTERNAL_MEMORY_HANDLE_TYPE_DMA_BUF_BIT_EXT:
786 flags = VK_EXTERNAL_MEMORY_FEATURE_EXPORTABLE_BIT |
787 VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT;
788 compat_flags = export_flags =
789 VK_EXTERNAL_MEMORY_HANDLE_TYPE_OPAQUE_FD_BIT |
790 VK_EXTERNAL_MEMORY_HANDLE_TYPE_DMA_BUF_BIT_EXT;
791 break;
792 case VK_EXTERNAL_MEMORY_HANDLE_TYPE_HOST_ALLOCATION_BIT_EXT:
793 flags = VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT;
794 compat_flags = VK_EXTERNAL_MEMORY_HANDLE_TYPE_HOST_ALLOCATION_BIT_EXT;
795 break;
796 default:
797 break;
798 }
799 pExternalBufferProperties->externalMemoryProperties =
800 (VkExternalMemoryProperties) {
801 .externalMemoryFeatures = flags,
802 .exportFromImportedHandleTypes = export_flags,
803 .compatibleHandleTypes = compat_flags,
804 };
805 }