a650e2f133f2c32be9eb365f83571800cb766d95
[mesa.git] / src / freedreno / vulkan / tu_formats.c
1
2 /*
3 * Copyright © 2016 Red Hat.
4 * Copyright © 2016 Bas Nieuwenhuizen
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice (including the next
14 * paragraph) shall be included in all copies or substantial portions of the
15 * Software.
16 *
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
22 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
23 * DEALINGS IN THE SOFTWARE.
24 */
25
26 #include "tu_private.h"
27
28 #include "registers/adreno_common.xml.h"
29 #include "registers/a6xx.xml.h"
30
31 #include "util/format_r11g11b10f.h"
32 #include "util/format_rgb9e5.h"
33 #include "util/format_srgb.h"
34 #include "util/u_half.h"
35 #include "vk_format.h"
36 #include "vk_util.h"
37
/**
 * Declare a format table: an array of tu_native_format that covers one
 * consecutive range of VkFormat values, together with two companion
 * constants, <name>_first and <name>_last, that record the bounds of the
 * range.
 *
 * TU_FORMAT_TABLE_FIRST and TU_FORMAT_TABLE_LAST must be defined, as the
 * first and last VkFormat of the range, at the point where the macro is
 * expanded.  The two #undef lines below drop any definition that is active
 * here, so each table has to supply its own pair.
 */
#define TU_FORMAT_TABLE(tbl)                                                 \
   static const VkFormat tbl##_first = TU_FORMAT_TABLE_FIRST;                \
   static const VkFormat tbl##_last = TU_FORMAT_TABLE_LAST;                  \
   static const struct tu_native_format                                      \
      tbl[TU_FORMAT_TABLE_LAST - TU_FORMAT_TABLE_FIRST + 1]
#undef TU_FORMAT_TABLE_FIRST
#undef TU_FORMAT_TABLE_LAST
52
/*
 * "x" is the placeholder used in the table for "no hardware format".  Token
 * pasting turns it into one of the names below, all of which are -1, so a
 * populated field can be recognised with a ">= 0" test.
 */
#define VFMT6_x -1
#define TFMT6_x -1
#define RB6_x -1

/*
 * Emit one designated initializer for a format table.
 *
 *   vk_name   VkFormat name without the VK_FORMAT_ prefix (selects the slot)
 *   vtx_name  suffix pasted onto VFMT6_ for the .vtx field
 *   tex_name  suffix pasted onto TFMT6_ for the .tex field
 *   rb_name   suffix pasted onto RB6_ for the .rb field
 *   swap_val  value stored in .swap
 *   is_valid  value stored in .present
 */
#define TU6_FMT(vk_name, vtx_name, tex_name, rb_name, swap_val, is_valid)    \
   [VK_FORMAT_##vk_name - TU_FORMAT_TABLE_FIRST] = {                         \
      .vtx = VFMT6_##vtx_name,                                               \
      .tex = TFMT6_##tex_name,                                               \
      .rb = RB6_##rb_name,                                                   \
      .swap = swap_val,                                                      \
      .present = is_valid,                                                   \
   }
65
/**
 * Row macros for the format table.  Every variant takes the same four
 * arguments (Vulkan name, hardware format name, render-buffer format name,
 * swap); these are derived mechanically from the VkFormat and need not name
 * anything that exists.  Which variant is used for a row is what decides
 * whether, and how, the VkFormat is supported:
 *
 *   TU6_VTC  fills .vtx, .tex and .rb
 *   TU6_xTC  fills .tex and .rb
 *   TU6_VTx  fills .vtx and .tex
 *   TU6_Vxx  fills .vtx only
 *   TU6_xTx  fills .tex only
 *   TU6_xxx  fills nothing, ignores its format/swap arguments and marks the
 *            entry as not present
 */
#define TU6_VTC(vkfmt, hwfmt, rbfmt, swz) TU6_FMT(vkfmt, hwfmt, hwfmt, rbfmt, swz, true)
#define TU6_xTC(vkfmt, hwfmt, rbfmt, swz) TU6_FMT(vkfmt, x, hwfmt, rbfmt, swz, true)
#define TU6_VTx(vkfmt, hwfmt, rbfmt, swz) TU6_FMT(vkfmt, hwfmt, hwfmt, x, swz, true)
#define TU6_Vxx(vkfmt, hwfmt, rbfmt, swz) TU6_FMT(vkfmt, hwfmt, x, x, swz, true)
#define TU6_xTx(vkfmt, hwfmt, rbfmt, swz) TU6_FMT(vkfmt, x, hwfmt, x, swz, true)
#define TU6_xxx(vkfmt, hwfmt, rbfmt, swz) TU6_FMT(vkfmt, x, x, x, WZYX, false)
77
/*
 * Native format table for the VkFormat range VK_FORMAT_UNDEFINED through
 * VK_FORMAT_ASTC_12x12_SRGB_BLOCK.  Each row is a designated initializer, so
 * the slot is chosen by the VkFormat name and not by the row's position.
 *
 * Row arguments: the VkFormat name without its VK_FORMAT_ prefix, the suffix
 * pasted onto VFMT6_/TFMT6_, the suffix pasted onto RB6_, and the swap value.
 * The row macro (TU6_VTC, TU6_xTC, ...) selects which of the vtx/tex/rb
 * fields are filled in.  TU6_xxx rows are stored as "not present" and their
 * remaining arguments are ignored, so tu6_get_native_format() returns NULL
 * for them.
 *
 * The trailing numeric comment on each row appears to be the numeric value
 * of the VkFormat.
 */
78 #define TU_FORMAT_TABLE_FIRST VK_FORMAT_UNDEFINED
79 #define TU_FORMAT_TABLE_LAST VK_FORMAT_ASTC_12x12_SRGB_BLOCK
80 TU_FORMAT_TABLE(tu6_format_table0) = {
81 TU6_xxx(UNDEFINED, x, x, x), /* 0 */
82
83 /* 8-bit packed */
84 TU6_xxx(R4G4_UNORM_PACK8, 4_4_UNORM, R4G4_UNORM, WZXY), /* 1 */
85
86 /* 16-bit packed */
87 TU6_xTC(R4G4B4A4_UNORM_PACK16, 4_4_4_4_UNORM, R4G4B4A4_UNORM, XYZW), /* 2 */
88 TU6_xTC(B4G4R4A4_UNORM_PACK16, 4_4_4_4_UNORM, R4G4B4A4_UNORM, ZYXW), /* 3 */
89 TU6_xTC(R5G6B5_UNORM_PACK16, 5_6_5_UNORM, R5G6B5_UNORM, WXYZ), /* 4 */
90 TU6_xTC(B5G6R5_UNORM_PACK16, 5_6_5_UNORM, R5G6B5_UNORM, WZYX), /* 5 */
91 TU6_xxx(R5G5B5A1_UNORM_PACK16, 1_5_5_5_UNORM, A1R5G5B5_UNORM, XYZW), /* 6 */
92 TU6_xxx(B5G5R5A1_UNORM_PACK16, 1_5_5_5_UNORM, A1R5G5B5_UNORM, XYZW), /* 7 */
93 TU6_xTC(A1R5G5B5_UNORM_PACK16, 5_5_5_1_UNORM, R5G5B5A1_UNORM, WXYZ), /* 8 */
94
95 /* 8-bit R */
96 TU6_VTC(R8_UNORM, 8_UNORM, R8_UNORM, WZYX), /* 9 */
97 TU6_VTC(R8_SNORM, 8_SNORM, R8_SNORM, WZYX), /* 10 */
98 TU6_Vxx(R8_USCALED, 8_UINT, R8_UINT, WZYX), /* 11 */
99 TU6_Vxx(R8_SSCALED, 8_SINT, R8_SINT, WZYX), /* 12 */
100 TU6_VTC(R8_UINT, 8_UINT, R8_UINT, WZYX), /* 13 */
101 TU6_VTC(R8_SINT, 8_SINT, R8_SINT, WZYX), /* 14 */
102 TU6_xTC(R8_SRGB, 8_UNORM, R8_UNORM, WZYX), /* 15 */
103
104 /* 16-bit RG */
105 TU6_VTC(R8G8_UNORM, 8_8_UNORM, R8G8_UNORM, WZYX), /* 16 */
106 TU6_VTC(R8G8_SNORM, 8_8_SNORM, R8G8_SNORM, WZYX), /* 17 */
107 TU6_Vxx(R8G8_USCALED, 8_8_UINT, R8G8_UINT, WZYX), /* 18 */
108 TU6_Vxx(R8G8_SSCALED, 8_8_SINT, R8G8_SINT, WZYX), /* 19 */
109 TU6_VTC(R8G8_UINT, 8_8_UINT, R8G8_UINT, WZYX), /* 20 */
110 TU6_VTC(R8G8_SINT, 8_8_SINT, R8G8_SINT, WZYX), /* 21 */
111 TU6_xTC(R8G8_SRGB, 8_8_UNORM, R8G8_UNORM, WZYX), /* 22 */
112
113 /* 24-bit RGB */
114 TU6_Vxx(R8G8B8_UNORM, 8_8_8_UNORM, R8G8B8_UNORM, WZYX), /* 23 */
115 TU6_Vxx(R8G8B8_SNORM, 8_8_8_SNORM, R8G8B8_SNORM, WZYX), /* 24 */
116 TU6_Vxx(R8G8B8_USCALED, 8_8_8_UINT, R8G8B8_UINT, WZYX), /* 25 */
117 TU6_Vxx(R8G8B8_SSCALED, 8_8_8_SINT, R8G8B8_SINT, WZYX), /* 26 */
118 TU6_Vxx(R8G8B8_UINT, 8_8_8_UINT, R8G8B8_UINT, WZYX), /* 27 */
119 TU6_Vxx(R8G8B8_SINT, 8_8_8_SINT, R8G8B8_SINT, WZYX), /* 28 */
120 TU6_xxx(R8G8B8_SRGB, 8_8_8_UNORM, R8G8B8_UNORM, WZYX), /* 29 */
121
122 /* 24-bit BGR */
123 TU6_Vxx(B8G8R8_UNORM, 8_8_8_UNORM, R8G8B8_UNORM, WXYZ), /* 30 */
124 TU6_Vxx(B8G8R8_SNORM, 8_8_8_SNORM, R8G8B8_SNORM, WXYZ), /* 31 */
125 TU6_Vxx(B8G8R8_USCALED, 8_8_8_UINT, R8G8B8_UINT, WXYZ), /* 32 */
126 TU6_Vxx(B8G8R8_SSCALED, 8_8_8_SINT, R8G8B8_SINT, WXYZ), /* 33 */
127 TU6_Vxx(B8G8R8_UINT, 8_8_8_UINT, R8G8B8_UINT, WXYZ), /* 34 */
128 TU6_Vxx(B8G8R8_SINT, 8_8_8_SINT, R8G8B8_SINT, WXYZ), /* 35 */
129 TU6_xxx(B8G8R8_SRGB, 8_8_8_UNORM, R8G8B8_UNORM, WXYZ), /* 36 */
130
131 /* 32-bit RGBA */
132 TU6_VTC(R8G8B8A8_UNORM, 8_8_8_8_UNORM, R8G8B8A8_UNORM, WZYX), /* 37 */
133 TU6_VTC(R8G8B8A8_SNORM, 8_8_8_8_SNORM, R8G8B8A8_SNORM, WZYX), /* 38 */
134 TU6_Vxx(R8G8B8A8_USCALED, 8_8_8_8_UINT, R8G8B8A8_UINT, WZYX), /* 39 */
135 TU6_Vxx(R8G8B8A8_SSCALED, 8_8_8_8_SINT, R8G8B8A8_SINT, WZYX), /* 40 */
136 TU6_VTC(R8G8B8A8_UINT, 8_8_8_8_UINT, R8G8B8A8_UINT, WZYX), /* 41 */
137 TU6_VTC(R8G8B8A8_SINT, 8_8_8_8_SINT, R8G8B8A8_SINT, WZYX), /* 42 */
138 TU6_xTC(R8G8B8A8_SRGB, 8_8_8_8_UNORM, R8G8B8A8_UNORM, WZYX), /* 43 */
139
140 /* 32-bit BGRA */
141 TU6_VTC(B8G8R8A8_UNORM, 8_8_8_8_UNORM, R8G8B8A8_UNORM, WXYZ), /* 44 */
142 TU6_VTC(B8G8R8A8_SNORM, 8_8_8_8_SNORM, R8G8B8A8_SNORM, WXYZ), /* 45 */
143 TU6_Vxx(B8G8R8A8_USCALED, 8_8_8_8_UINT, R8G8B8A8_UINT, WXYZ), /* 46 */
144 TU6_Vxx(B8G8R8A8_SSCALED, 8_8_8_8_SINT, R8G8B8A8_SINT, WXYZ), /* 47 */
145 TU6_VTC(B8G8R8A8_UINT, 8_8_8_8_UINT, R8G8B8A8_UINT, WXYZ), /* 48 */
146 TU6_VTC(B8G8R8A8_SINT, 8_8_8_8_SINT, R8G8B8A8_SINT, WXYZ), /* 49 */
147 TU6_xTC(B8G8R8A8_SRGB, 8_8_8_8_UNORM, R8G8B8A8_UNORM, WXYZ), /* 50 */
148
149 /* 32-bit packed */
150 TU6_VTC(A8B8G8R8_UNORM_PACK32, 8_8_8_8_UNORM, R8G8B8A8_UNORM, WZYX), /* 51 */
151 TU6_VTC(A8B8G8R8_SNORM_PACK32, 8_8_8_8_SNORM, R8G8B8A8_SNORM, WZYX), /* 52 */
152 TU6_Vxx(A8B8G8R8_USCALED_PACK32, 8_8_8_8_UINT, R8G8B8A8_UINT, WZYX), /* 53 */
153 TU6_Vxx(A8B8G8R8_SSCALED_PACK32, 8_8_8_8_SINT, R8G8B8A8_SINT, WZYX), /* 54 */
154 TU6_VTC(A8B8G8R8_UINT_PACK32, 8_8_8_8_UINT, R8G8B8A8_UINT, WZYX), /* 55 */
155 TU6_VTC(A8B8G8R8_SINT_PACK32, 8_8_8_8_SINT, R8G8B8A8_SINT, WZYX), /* 56 */
156 TU6_xTC(A8B8G8R8_SRGB_PACK32, 8_8_8_8_UNORM, R8G8B8A8_UNORM, WZYX), /* 57 */
157 TU6_VTC(A2R10G10B10_UNORM_PACK32, 10_10_10_2_UNORM, R10G10B10A2_UNORM, WXYZ), /* 58 */
158 TU6_Vxx(A2R10G10B10_SNORM_PACK32, 10_10_10_2_SNORM, R10G10B10A2_SNORM, WXYZ), /* 59 */
159 TU6_Vxx(A2R10G10B10_USCALED_PACK32, 10_10_10_2_UINT, R10G10B10A2_UINT, WXYZ), /* 60 */
160 TU6_Vxx(A2R10G10B10_SSCALED_PACK32, 10_10_10_2_SINT, R10G10B10A2_SINT, WXYZ), /* 61 */
161 TU6_VTC(A2R10G10B10_UINT_PACK32, 10_10_10_2_UINT, R10G10B10A2_UINT, WXYZ), /* 62 */
162 TU6_Vxx(A2R10G10B10_SINT_PACK32, 10_10_10_2_SINT, R10G10B10A2_SINT, WXYZ), /* 63 */
163 TU6_VTC(A2B10G10R10_UNORM_PACK32, 10_10_10_2_UNORM, R10G10B10A2_UNORM, WZYX), /* 64 */
164 TU6_Vxx(A2B10G10R10_SNORM_PACK32, 10_10_10_2_SNORM, R10G10B10A2_SNORM, WZYX), /* 65 */
165 TU6_Vxx(A2B10G10R10_USCALED_PACK32, 10_10_10_2_UINT, R10G10B10A2_UINT, WZYX), /* 66 */
166 TU6_Vxx(A2B10G10R10_SSCALED_PACK32, 10_10_10_2_SINT, R10G10B10A2_SINT, WZYX), /* 67 */
167 TU6_VTC(A2B10G10R10_UINT_PACK32, 10_10_10_2_UINT, R10G10B10A2_UINT, WZYX), /* 68 */
168 TU6_Vxx(A2B10G10R10_SINT_PACK32, 10_10_10_2_SINT, R10G10B10A2_SINT, WZYX), /* 69 */
169
170 /* 16-bit R */
171 TU6_VTC(R16_UNORM, 16_UNORM, R16_UNORM, WZYX), /* 70 */
172 TU6_VTC(R16_SNORM, 16_SNORM, R16_SNORM, WZYX), /* 71 */
173 TU6_Vxx(R16_USCALED, 16_UINT, R16_UINT, WZYX), /* 72 */
174 TU6_Vxx(R16_SSCALED, 16_SINT, R16_SINT, WZYX), /* 73 */
175 TU6_VTC(R16_UINT, 16_UINT, R16_UINT, WZYX), /* 74 */
176 TU6_VTC(R16_SINT, 16_SINT, R16_SINT, WZYX), /* 75 */
177 TU6_VTC(R16_SFLOAT, 16_FLOAT, R16_FLOAT, WZYX), /* 76 */
178
179 /* 32-bit RG */
180 TU6_VTC(R16G16_UNORM, 16_16_UNORM, R16G16_UNORM, WZYX), /* 77 */
181 TU6_VTC(R16G16_SNORM, 16_16_SNORM, R16G16_SNORM, WZYX), /* 78 */
182 TU6_Vxx(R16G16_USCALED, 16_16_UINT, R16G16_UINT, WZYX), /* 79 */
183 TU6_Vxx(R16G16_SSCALED, 16_16_SINT, R16G16_SINT, WZYX), /* 80 */
184 TU6_VTC(R16G16_UINT, 16_16_UINT, R16G16_UINT, WZYX), /* 81 */
185 TU6_VTC(R16G16_SINT, 16_16_SINT, R16G16_SINT, WZYX), /* 82 */
186 TU6_VTC(R16G16_SFLOAT, 16_16_FLOAT, R16G16_FLOAT, WZYX), /* 83 */
187
188 /* 48-bit RGB */
189 TU6_Vxx(R16G16B16_UNORM, 16_16_16_UNORM, R16G16B16_UNORM, WZYX), /* 84 */
190 TU6_Vxx(R16G16B16_SNORM, 16_16_16_SNORM, R16G16B16_SNORM, WZYX), /* 85 */
191 TU6_Vxx(R16G16B16_USCALED, 16_16_16_UINT, R16G16B16_UINT, WZYX), /* 86 */
192 TU6_Vxx(R16G16B16_SSCALED, 16_16_16_SINT, R16G16B16_SINT, WZYX), /* 87 */
193 TU6_Vxx(R16G16B16_UINT, 16_16_16_UINT, R16G16B16_UINT, WZYX), /* 88 */
194 TU6_Vxx(R16G16B16_SINT, 16_16_16_SINT, R16G16B16_SINT, WZYX), /* 89 */
195 TU6_Vxx(R16G16B16_SFLOAT, 16_16_16_FLOAT, R16G16B16_FLOAT, WZYX), /* 90 */
196
197 /* 64-bit RGBA */
198 TU6_VTC(R16G16B16A16_UNORM, 16_16_16_16_UNORM, R16G16B16A16_UNORM, WZYX), /* 91 */
199 TU6_VTC(R16G16B16A16_SNORM, 16_16_16_16_SNORM, R16G16B16A16_SNORM, WZYX), /* 92 */
200 TU6_Vxx(R16G16B16A16_USCALED, 16_16_16_16_UINT, R16G16B16A16_UINT, WZYX), /* 93 */
201 TU6_Vxx(R16G16B16A16_SSCALED, 16_16_16_16_SINT, R16G16B16A16_SINT, WZYX), /* 94 */
202 TU6_VTC(R16G16B16A16_UINT, 16_16_16_16_UINT, R16G16B16A16_UINT, WZYX), /* 95 */
203 TU6_VTC(R16G16B16A16_SINT, 16_16_16_16_SINT, R16G16B16A16_SINT, WZYX), /* 96 */
204 TU6_VTC(R16G16B16A16_SFLOAT, 16_16_16_16_FLOAT, R16G16B16A16_FLOAT, WZYX), /* 97 */
205
206 /* 32-bit R */
207 TU6_VTC(R32_UINT, 32_UINT, R32_UINT, WZYX), /* 98 */
208 TU6_VTC(R32_SINT, 32_SINT, R32_SINT, WZYX), /* 99 */
209 TU6_VTC(R32_SFLOAT, 32_FLOAT, R32_FLOAT, WZYX), /* 100 */
210
211 /* 64-bit RG */
212 TU6_VTC(R32G32_UINT, 32_32_UINT, R32G32_UINT, WZYX), /* 101 */
213 TU6_VTC(R32G32_SINT, 32_32_SINT, R32G32_SINT, WZYX), /* 102 */
214 TU6_VTC(R32G32_SFLOAT, 32_32_FLOAT, R32G32_FLOAT, WZYX), /* 103 */
215
216 /* 96-bit RGB */
217 TU6_Vxx(R32G32B32_UINT, 32_32_32_UINT, R32G32B32_UINT, WZYX), /* 104 */
218 TU6_Vxx(R32G32B32_SINT, 32_32_32_SINT, R32G32B32_SINT, WZYX), /* 105 */
219 TU6_Vxx(R32G32B32_SFLOAT, 32_32_32_FLOAT, R32G32B32_FLOAT, WZYX), /* 106 */
220
221 /* 128-bit RGBA */
222 TU6_VTC(R32G32B32A32_UINT, 32_32_32_32_UINT, R32G32B32A32_UINT, WZYX), /* 107 */
223 TU6_VTC(R32G32B32A32_SINT, 32_32_32_32_SINT, R32G32B32A32_SINT, WZYX), /* 108 */
224 TU6_VTC(R32G32B32A32_SFLOAT, 32_32_32_32_FLOAT, R32G32B32A32_FLOAT, WZYX), /* 109 */
225
226 /* 64-bit R */
227 TU6_xxx(R64_UINT, 64_UINT, R64_UINT, WZYX), /* 110 */
228 TU6_xxx(R64_SINT, 64_SINT, R64_SINT, WZYX), /* 111 */
229 TU6_xxx(R64_SFLOAT, 64_FLOAT, R64_FLOAT, WZYX), /* 112 */
230
231 /* 128-bit RG */
232 TU6_xxx(R64G64_UINT, 64_64_UINT, R64G64_UINT, WZYX), /* 113 */
233 TU6_xxx(R64G64_SINT, 64_64_SINT, R64G64_SINT, WZYX), /* 114 */
234 TU6_xxx(R64G64_SFLOAT, 64_64_FLOAT, R64G64_FLOAT, WZYX), /* 115 */
235
236 /* 192-bit RGB */
237 TU6_xxx(R64G64B64_UINT, 64_64_64_UINT, R64G64B64_UINT, WZYX), /* 116 */
238 TU6_xxx(R64G64B64_SINT, 64_64_64_SINT, R64G64B64_SINT, WZYX), /* 117 */
239 TU6_xxx(R64G64B64_SFLOAT, 64_64_64_FLOAT, R64G64B64_FLOAT, WZYX), /* 118 */
240
241 /* 256-bit RGBA */
242 TU6_xxx(R64G64B64A64_UINT, 64_64_64_64_UINT, R64G64B64A64_UINT, WZYX), /* 119 */
243 TU6_xxx(R64G64B64A64_SINT, 64_64_64_64_SINT, R64G64B64A64_SINT, WZYX), /* 120 */
244 TU6_xxx(R64G64B64A64_SFLOAT, 64_64_64_64_FLOAT, R64G64B64A64_FLOAT, WZYX), /* 121 */
245
246 /* 32-bit packed float */
247 TU6_VTC(B10G11R11_UFLOAT_PACK32, 11_11_10_FLOAT, R11G11B10_FLOAT, WZYX), /* 122 */
248 TU6_xTx(E5B9G9R9_UFLOAT_PACK32, 9_9_9_E5_FLOAT, R9G9B9E5_FLOAT, WZYX), /* 123 */
249
250 /* depth/stencil */
251 TU6_xTC(D16_UNORM, 16_UNORM, R16_UNORM, WZYX), /* 124 */
252 TU6_xTC(X8_D24_UNORM_PACK32, Z24_UNORM_S8_UINT, Z24_UNORM_S8_UINT, WZYX), /* 125 */
253 TU6_xTC(D32_SFLOAT, 32_FLOAT, R32_FLOAT, WZYX), /* 126 */
254 TU6_xTC(S8_UINT, 8_UINT, R8_UINT, WZYX), /* 127 */
255 TU6_xxx(D16_UNORM_S8_UINT, X8Z16_UNORM, X8Z16_UNORM, WZYX), /* 128 */
256 TU6_xTC(D24_UNORM_S8_UINT, Z24_UNORM_S8_UINT, Z24_UNORM_S8_UINT, WZYX), /* 129 */
257 TU6_xxx(D32_SFLOAT_S8_UINT, x, x, WZYX), /* 130 */
258
259 /* compressed */
260 TU6_xTx(BC1_RGB_UNORM_BLOCK, DXT1, DXT1, WZYX), /* 131 */
261 TU6_xTx(BC1_RGB_SRGB_BLOCK, DXT1, DXT1, WZYX), /* 132 */
262 TU6_xTx(BC1_RGBA_UNORM_BLOCK, DXT1, DXT1, WZYX), /* 133 */
263 TU6_xTx(BC1_RGBA_SRGB_BLOCK, DXT1, DXT1, WZYX), /* 134 */
264 TU6_xTx(BC2_UNORM_BLOCK, DXT3, DXT3, WZYX), /* 135 */
265 TU6_xTx(BC2_SRGB_BLOCK, DXT3, DXT3, WZYX), /* 136 */
266 TU6_xTx(BC3_UNORM_BLOCK, DXT5, DXT5, WZYX), /* 137 */
267 TU6_xTx(BC3_SRGB_BLOCK, DXT5, DXT5, WZYX), /* 138 */
268 TU6_xTx(BC4_UNORM_BLOCK, RGTC1_UNORM, RGTC1_UNORM, WZYX), /* 139 */
269 TU6_xTx(BC4_SNORM_BLOCK, RGTC1_SNORM, RGTC1_SNORM, WZYX), /* 140 */
270 TU6_xTx(BC5_UNORM_BLOCK, RGTC2_UNORM, RGTC2_UNORM, WZYX), /* 141 */
271 TU6_xTx(BC5_SNORM_BLOCK, RGTC2_SNORM, RGTC2_SNORM, WZYX), /* 142 */
272 TU6_xTx(BC6H_UFLOAT_BLOCK, BPTC_UFLOAT, BPTC_UFLOAT, WZYX), /* 143 */
273 TU6_xTx(BC6H_SFLOAT_BLOCK, BPTC_FLOAT, BPTC_FLOAT, WZYX), /* 144 */
274 TU6_xTx(BC7_UNORM_BLOCK, BPTC, BPTC, WZYX), /* 145 */
275 TU6_xTx(BC7_SRGB_BLOCK, BPTC, BPTC, WZYX), /* 146 */
276 TU6_xTx(ETC2_R8G8B8_UNORM_BLOCK, ETC2_RGB8, ETC2_RGB8, WZYX), /* 147 */
277 TU6_xTx(ETC2_R8G8B8_SRGB_BLOCK, ETC2_RGB8, ETC2_RGB8, WZYX), /* 148 */
278 TU6_xTx(ETC2_R8G8B8A1_UNORM_BLOCK, ETC2_RGB8A1, ETC2_RGB8A1, WZYX), /* 149 */
279 TU6_xTx(ETC2_R8G8B8A1_SRGB_BLOCK, ETC2_RGB8A1, ETC2_RGB8A1, WZYX), /* 150 */
280 TU6_xTx(ETC2_R8G8B8A8_UNORM_BLOCK, ETC2_RGBA8, ETC2_RGBA8, WZYX), /* 151 */
281 TU6_xTx(ETC2_R8G8B8A8_SRGB_BLOCK, ETC2_RGBA8, ETC2_RGBA8, WZYX), /* 152 */
282 TU6_xTx(EAC_R11_UNORM_BLOCK, ETC2_R11_UNORM, ETC2_R11_UNORM, WZYX), /* 153 */
283 TU6_xTx(EAC_R11_SNORM_BLOCK, ETC2_R11_SNORM, ETC2_R11_SNORM, WZYX), /* 154 */
284 TU6_xTx(EAC_R11G11_UNORM_BLOCK, ETC2_RG11_UNORM, ETC2_RG11_UNORM, WZYX), /* 155 */
285 TU6_xTx(EAC_R11G11_SNORM_BLOCK, ETC2_RG11_SNORM, ETC2_RG11_SNORM, WZYX), /* 156 */
286 TU6_xTx(ASTC_4x4_UNORM_BLOCK, ASTC_4x4, ASTC_4x4, WZYX), /* 157 */
287 TU6_xTx(ASTC_4x4_SRGB_BLOCK, ASTC_4x4, ASTC_4x4, WZYX), /* 158 */
288 TU6_xTx(ASTC_5x4_UNORM_BLOCK, ASTC_5x4, ASTC_5x4, WZYX), /* 159 */
289 TU6_xTx(ASTC_5x4_SRGB_BLOCK, ASTC_5x4, ASTC_5x4, WZYX), /* 160 */
290 TU6_xTx(ASTC_5x5_UNORM_BLOCK, ASTC_5x5, ASTC_5x5, WZYX), /* 161 */
291 TU6_xTx(ASTC_5x5_SRGB_BLOCK, ASTC_5x5, ASTC_5x5, WZYX), /* 162 */
292 TU6_xTx(ASTC_6x5_UNORM_BLOCK, ASTC_6x5, ASTC_6x5, WZYX), /* 163 */
293 TU6_xTx(ASTC_6x5_SRGB_BLOCK, ASTC_6x5, ASTC_6x5, WZYX), /* 164 */
294 TU6_xTx(ASTC_6x6_UNORM_BLOCK, ASTC_6x6, ASTC_6x6, WZYX), /* 165 */
295 TU6_xTx(ASTC_6x6_SRGB_BLOCK, ASTC_6x6, ASTC_6x6, WZYX), /* 166 */
296 TU6_xTx(ASTC_8x5_UNORM_BLOCK, ASTC_8x5, ASTC_8x5, WZYX), /* 167 */
297 TU6_xTx(ASTC_8x5_SRGB_BLOCK, ASTC_8x5, ASTC_8x5, WZYX), /* 168 */
298 TU6_xTx(ASTC_8x6_UNORM_BLOCK, ASTC_8x6, ASTC_8x6, WZYX), /* 169 */
299 TU6_xTx(ASTC_8x6_SRGB_BLOCK, ASTC_8x6, ASTC_8x6, WZYX), /* 170 */
300 TU6_xTx(ASTC_8x8_UNORM_BLOCK, ASTC_8x8, ASTC_8x8, WZYX), /* 171 */
301 TU6_xTx(ASTC_8x8_SRGB_BLOCK, ASTC_8x8, ASTC_8x8, WZYX), /* 172 */
302 TU6_xTx(ASTC_10x5_UNORM_BLOCK, ASTC_10x5, ASTC_10x5, WZYX), /* 173 */
303 TU6_xTx(ASTC_10x5_SRGB_BLOCK, ASTC_10x5, ASTC_10x5, WZYX), /* 174 */
304 TU6_xTx(ASTC_10x6_UNORM_BLOCK, ASTC_10x6, ASTC_10x6, WZYX), /* 175 */
305 TU6_xTx(ASTC_10x6_SRGB_BLOCK, ASTC_10x6, ASTC_10x6, WZYX), /* 176 */
306 TU6_xTx(ASTC_10x8_UNORM_BLOCK, ASTC_10x8, ASTC_10x8, WZYX), /* 177 */
307 TU6_xTx(ASTC_10x8_SRGB_BLOCK, ASTC_10x8, ASTC_10x8, WZYX), /* 178 */
308 TU6_xTx(ASTC_10x10_UNORM_BLOCK, ASTC_10x10, ASTC_10x10, WZYX), /* 179 */
309 TU6_xTx(ASTC_10x10_SRGB_BLOCK, ASTC_10x10, ASTC_10x10, WZYX), /* 180 */
310 TU6_xTx(ASTC_12x10_UNORM_BLOCK, ASTC_12x10, ASTC_12x10, WZYX), /* 181 */
311 TU6_xTx(ASTC_12x10_SRGB_BLOCK, ASTC_12x10, ASTC_12x10, WZYX), /* 182 */
312 TU6_xTx(ASTC_12x12_UNORM_BLOCK, ASTC_12x12, ASTC_12x12, WZYX), /* 183 */
313 TU6_xTx(ASTC_12x12_SRGB_BLOCK, ASTC_12x12, ASTC_12x12, WZYX), /* 184 */
314 };
315 #undef TU_FORMAT_TABLE_FIRST
316 #undef TU_FORMAT_TABLE_LAST
317
318 const struct tu_native_format *
319 tu6_get_native_format(VkFormat format)
320 {
321 const struct tu_native_format *fmt = NULL;
322
323 if (format >= tu6_format_table0_first && format <= tu6_format_table0_last)
324 fmt = &tu6_format_table0[format - tu6_format_table0_first];
325
326 return (fmt && fmt->present) ? fmt : NULL;
327 }
328
329 enum a6xx_2d_ifmt
330 tu6_rb_fmt_to_ifmt(enum a6xx_color_fmt fmt)
331 {
332 switch (fmt) {
333 case RB6_A8_UNORM:
334 case RB6_R8_UNORM:
335 case RB6_R8_SNORM:
336 case RB6_R8G8_UNORM:
337 case RB6_R8G8_SNORM:
338 case RB6_R8G8B8A8_UNORM:
339 case RB6_R8G8B8_UNORM:
340 case RB6_R8G8B8A8_SNORM:
341 case RB6_R4G4B4A4_UNORM:
342 case RB6_R5G5B5A1_UNORM:
343 case RB6_R5G6B5_UNORM:
344 case RB6_Z24_UNORM_S8_UINT:
345 case RB6_Z24_UNORM_S8_UINT_AS_R8G8B8A8:
346 return R2D_UNORM8;
347
348 case RB6_R32_UINT:
349 case RB6_R32_SINT:
350 case RB6_R32G32_UINT:
351 case RB6_R32G32_SINT:
352 case RB6_R32G32B32A32_UINT:
353 case RB6_R32G32B32A32_SINT:
354 return R2D_INT32;
355
356 case RB6_R16_UINT:
357 case RB6_R16_SINT:
358 case RB6_R16G16_UINT:
359 case RB6_R16G16_SINT:
360 case RB6_R16G16B16A16_UINT:
361 case RB6_R16G16B16A16_SINT:
362 case RB6_R10G10B10A2_UINT:
363 return R2D_INT16;
364
365 case RB6_R8_UINT:
366 case RB6_R8_SINT:
367 case RB6_R8G8_UINT:
368 case RB6_R8G8_SINT:
369 case RB6_R8G8B8A8_UINT:
370 case RB6_R8G8B8A8_SINT:
371 return R2D_INT8;
372
373 case RB6_R16_UNORM:
374 case RB6_R16_SNORM:
375 case RB6_R16G16_UNORM:
376 case RB6_R16G16_SNORM:
377 case RB6_R16G16B16A16_UNORM:
378 case RB6_R16G16B16A16_SNORM:
379 case RB6_R32_FLOAT:
380 case RB6_R32G32_FLOAT:
381 case RB6_R32G32B32A32_FLOAT:
382 return R2D_FLOAT32;
383
384 case RB6_R16_FLOAT:
385 case RB6_R16G16_FLOAT:
386 case RB6_R16G16B16A16_FLOAT:
387 case RB6_R11G11B10_FLOAT:
388 case RB6_R10G10B10A2_UNORM:
389 return R2D_FLOAT16;
390
391 default:
392 unreachable("bad format");
393 return 0;
394 }
395 }
396
397 enum a6xx_depth_format
398 tu6_pipe2depth(VkFormat format)
399 {
400 switch (format) {
401 case VK_FORMAT_D16_UNORM:
402 return DEPTH6_16;
403 case VK_FORMAT_X8_D24_UNORM_PACK32:
404 case VK_FORMAT_D24_UNORM_S8_UINT:
405 return DEPTH6_24_8;
406 case VK_FORMAT_D32_SFLOAT:
407 return DEPTH6_32;
408 default:
409 return ~0;
410 }
411 }
412
/**
 * Return a mask with the low \a bits bits set.
 *
 * \a bits must be in [0, 32]; 0 yields an empty mask and 32 yields
 * 0xffffffff.
 */
static uint32_t
tu_pack_mask(int bits)
{
   /* A negative shift count is undefined behaviour, so check the lower bound
    * as well; the signed helpers call this with "bits - 1".
    */
   assert(bits >= 0 && bits <= 32);

   /* shift in 64 bits so that bits == 32 is well defined */
   return (uint32_t) ((1ull << bits) - 1);
}
419
/**
 * Convert a float to an unsigned normalized integer of \a bits bits.
 *
 * Values below 0 map to 0 and values above 1 map to the all-ones value;
 * everything else is scaled by the maximum and rounded with
 * _mesa_lroundevenf().
 */
static uint32_t
tu_pack_float32_for_unorm(float val, int bits)
{
   const uint32_t all_ones = tu_pack_mask(bits);

   if (val < 0.0f)
      return 0;
   if (val > 1.0f)
      return all_ones;

   return _mesa_lroundevenf(val * (float) all_ones);
}
431
/**
 * Convert a float to a signed normalized integer of \a bits bits, returned
 * as a two's complement bit pattern masked to \a bits bits.
 *
 * The input is clamped to [-1, 1]; -1 maps to -(2^(bits-1) - 1), so the most
 * negative code is never produced.
 */
static uint32_t
tu_pack_float32_for_snorm(float val, int bits)
{
   const int32_t limit = tu_pack_mask(bits - 1);
   int32_t fixed;

   if (val > 1.0f) {
      fixed = limit;
   } else if (val < -1.0f) {
      fixed = -limit;
   } else {
      fixed = _mesa_lroundevenf(val * (float) limit);
   }

   /* keep only the low bits so negative values do not spill over */
   const uint32_t field = tu_pack_mask(bits);
   return fixed & field;
}
446
/**
 * Convert a float to an unsigned "scaled" integer of \a bits bits: the value
 * is clamped to [0, 2^bits - 1] and truncated towards zero.
 *
 * NaN is packed as 0.
 */
static uint32_t
tu_pack_float32_for_uscaled(float val, int bits)
{
   const uint32_t max = tu_pack_mask(bits);

   /* Written as a negated test so that NaN also takes this branch; casting
    * NaN to an integer is undefined behaviour.
    */
   if (!(val > 0.0f))
      return 0;

   /* ">=" rather than ">": for wide fields (float) max rounds up to 2^bits,
    * and a value equal to it would not fit in the field (or, at 32 bits, in
    * uint32_t at all).
    */
   if (val >= (float) max)
      return max;

   return (uint32_t) val;
}
458
/**
 * Convert a float to a signed "scaled" integer of \a bits bits, returned as
 * a two's complement bit pattern masked to \a bits bits.  The value is
 * clamped to [-2^(bits-1), 2^(bits-1) - 1] and truncated towards zero.
 *
 * NaN is packed as 0.
 */
static uint32_t
tu_pack_float32_for_sscaled(float val, int bits)
{
   const int32_t max = tu_pack_mask(bits - 1);
   const int32_t min = -max - 1;
   int32_t tmp;

   if (val != val) {
      /* only NaN compares unequal to itself; casting it would be undefined */
      tmp = 0;
   } else if (val <= (float) min) {
      tmp = min;
   } else if (val >= (float) max) {
      /* ">=" rather than ">": for wide fields (float) max rounds up to
       * 2^(bits-1), which is out of range for the cast below.
       */
      tmp = max;
   } else {
      tmp = (int32_t) val;
   }

   return tmp & tu_pack_mask(bits);
}
474
/**
 * Pack an unsigned integer into \a bits bits by discarding the upper bits.
 */
static uint32_t
tu_pack_uint32_for_uint(uint32_t val, int bits)
{
   const uint32_t field = tu_pack_mask(bits);

   return val & field;
}
480
/**
 * Pack a signed integer into \a bits bits: the two's complement pattern is
 * kept and the upper bits are discarded.
 */
static uint32_t
tu_pack_int32_for_sint(int32_t val, int bits)
{
   const uint32_t pattern = (uint32_t) val;

   return pattern & tu_pack_mask(bits);
}
486
/**
 * Pack a float as a 16-bit or 32-bit floating-point bit pattern.
 *
 * \a bits must be 16 (converted with util_float_to_half) or 32 (the raw
 * bits, via fui).
 */
static uint32_t
tu_pack_float32_for_sfloat(float val, int bits)
{
   assert(bits == 16 || bits == 32);

   if (bits == 16)
      return util_float_to_half(val);

   return fui(val);
}
493
/*
 * One component of a clear value, held as 32 bits that can be read as a
 * float, a signed integer or an unsigned integer.  Which member is meaningful
 * depends on the type of the destination channel.
 */
494 union tu_clear_component_value {
495 float float32; /* read for normalized, scaled and float channels */
496 int32_t int32; /* read for signed pure-integer channels */
497 uint32_t uint32; /* read for unsigned pure-integer channels */
498 };
499
500 static uint32_t
501 tu_pack_clear_component_value(union tu_clear_component_value val,
502 const struct vk_format_channel_description *ch)
503 {
504 uint32_t packed;
505
506 switch (ch->type) {
507 case VK_FORMAT_TYPE_UNSIGNED:
508 /* normalized, scaled, or pure integer */
509 assert(ch->normalized + ch->scaled + ch->pure_integer == 1);
510 if (ch->normalized)
511 packed = tu_pack_float32_for_unorm(val.float32, ch->size);
512 else if (ch->scaled)
513 packed = tu_pack_float32_for_uscaled(val.float32, ch->size);
514 else
515 packed = tu_pack_uint32_for_uint(val.uint32, ch->size);
516 break;
517 case VK_FORMAT_TYPE_SIGNED:
518 /* normalized, scaled, or pure integer */
519 assert(ch->normalized + ch->scaled + ch->pure_integer == 1);
520 if (ch->normalized)
521 packed = tu_pack_float32_for_snorm(val.float32, ch->size);
522 else if (ch->scaled)
523 packed = tu_pack_float32_for_sscaled(val.float32, ch->size);
524 else
525 packed = tu_pack_int32_for_sint(val.int32, ch->size);
526 break;
527 case VK_FORMAT_TYPE_FLOAT:
528 packed = tu_pack_float32_for_sfloat(val.float32, ch->size);
529 break;
530 default:
531 unreachable("unexpected channel type");
532 packed = 0;
533 break;
534 }
535
536 assert((packed & tu_pack_mask(ch->size)) == packed);
537 return packed;
538 }
539
540 static const struct vk_format_channel_description *
541 tu_get_format_channel_description(const struct vk_format_description *desc,
542 int comp)
543 {
544 switch (desc->swizzle[comp]) {
545 case VK_SWIZZLE_X:
546 return &desc->channel[0];
547 case VK_SWIZZLE_Y:
548 return &desc->channel[1];
549 case VK_SWIZZLE_Z:
550 return &desc->channel[2];
551 case VK_SWIZZLE_W:
552 return &desc->channel[3];
553 default:
554 return NULL;
555 }
556 }
557
558 static union tu_clear_component_value
559 tu_get_clear_component_value(const VkClearValue *val, int comp,
560 enum vk_format_colorspace colorspace)
561 {
562 assert(comp < 4);
563
564 union tu_clear_component_value tmp;
565 switch (colorspace) {
566 case VK_FORMAT_COLORSPACE_ZS:
567 assert(comp < 2);
568 if (comp == 0)
569 tmp.float32 = val->depthStencil.depth;
570 else
571 tmp.uint32 = val->depthStencil.stencil;
572 break;
573 case VK_FORMAT_COLORSPACE_SRGB:
574 if (comp < 3) {
575 tmp.float32 = util_format_linear_to_srgb_float(val->color.float32[comp]);
576 break;
577 }
578 default:
579 assert(comp < 4);
580 tmp.uint32 = val->color.uint32[comp];
581 break;
582 }
583
584 return tmp;
585 }
586
587 /**
588 * Pack a VkClearValue into a 128-bit buffer. \a format is respected except
589 * for the component order. The components are always packed in WZYX order
590 * (i.e., msb is white and lsb is red).
591 *
592 * Return the number of uint32_t's used.
593 */
594 void
595 tu_pack_clear_value(const VkClearValue *val, VkFormat format, uint32_t buf[4])
596 {
597 const struct vk_format_description *desc = vk_format_description(format);
598
599 switch (format) {
600 case VK_FORMAT_B10G11R11_UFLOAT_PACK32:
601 buf[0] = float3_to_r11g11b10f(val->color.float32);
602 return;
603 case VK_FORMAT_E5B9G9R9_UFLOAT_PACK32:
604 buf[0] = float3_to_rgb9e5(val->color.float32);
605 return;
606 default:
607 break;
608 }
609
610 assert(desc && desc->layout == VK_FORMAT_LAYOUT_PLAIN);
611
612 /* S8_UINT is special and has no depth */
613 const int max_components =
614 format == VK_FORMAT_S8_UINT ? 2 : desc->nr_channels;
615
616 int buf_offset = 0;
617 int bit_shift = 0;
618 for (int comp = 0; comp < max_components; comp++) {
619 const struct vk_format_channel_description *ch =
620 tu_get_format_channel_description(desc, comp);
621 if (!ch) {
622 assert((format == VK_FORMAT_S8_UINT && comp == 0) ||
623 (format == VK_FORMAT_X8_D24_UNORM_PACK32 && comp == 1));
624 continue;
625 }
626
627 union tu_clear_component_value v = tu_get_clear_component_value(
628 val, comp, desc->colorspace);
629
630 /* move to the next uint32_t when there is not enough space */
631 assert(ch->size <= 32);
632 if (bit_shift + ch->size > 32) {
633 buf_offset++;
634 bit_shift = 0;
635 }
636
637 if (bit_shift == 0)
638 buf[buf_offset] = 0;
639
640 buf[buf_offset] |= tu_pack_clear_component_value(v, ch) << bit_shift;
641 bit_shift += ch->size;
642 }
643 }
644
645 void
646 tu_2d_clear_color(const VkClearColorValue *val, VkFormat format, uint32_t buf[4])
647 {
648 const struct vk_format_description *desc = vk_format_description(format);
649
650 /* not supported by 2D engine, cleared as U32 */
651 if (format == VK_FORMAT_E5B9G9R9_UFLOAT_PACK32) {
652 buf[0] = float3_to_rgb9e5(val->float32);
653 return;
654 }
655
656 enum a6xx_2d_ifmt ifmt = tu6_rb_fmt_to_ifmt(tu6_get_native_format(format)->rb);
657
658 assert(desc && desc->layout == VK_FORMAT_LAYOUT_PLAIN);
659
660 for (unsigned i = 0; i < desc->nr_channels; i++) {
661 const struct vk_format_channel_description *ch = &desc->channel[i];
662
663 switch (ifmt) {
664 case R2D_INT32:
665 case R2D_INT16:
666 case R2D_INT8:
667 case R2D_FLOAT32:
668 buf[i] = val->uint32[i];
669 break;
670 case R2D_FLOAT16:
671 buf[i] = util_float_to_half(val->float32[i]);
672 break;
673 case R2D_UNORM8: {
674 float linear = val->float32[i];
675 if (desc->colorspace == VK_FORMAT_COLORSPACE_SRGB && i < 3)
676 linear = util_format_linear_to_srgb_float(val->float32[i]);
677
678 if (ch->type == VK_FORMAT_TYPE_SIGNED)
679 buf[i] = tu_pack_float32_for_snorm(linear, 8);
680 else
681 buf[i] = tu_pack_float32_for_unorm(linear, 8);
682 } break;
683 default:
684 unreachable("unexpected ifmt");
685 break;
686 }
687 }
688 }
689
690 void
691 tu_2d_clear_zs(const VkClearDepthStencilValue *val, VkFormat format, uint32_t buf[4])
692 {
693 switch (format) {
694 case VK_FORMAT_X8_D24_UNORM_PACK32:
695 case VK_FORMAT_D24_UNORM_S8_UINT:
696 buf[0] = tu_pack_float32_for_unorm(val->depth, 24);
697 buf[1] = buf[0] >> 8;
698 buf[2] = buf[0] >> 16;
699 buf[3] = val->stencil;
700 return;
701 case VK_FORMAT_D16_UNORM:
702 case VK_FORMAT_D32_SFLOAT:
703 buf[0] = fui(val->depth);
704 return;
705 case VK_FORMAT_S8_UINT:
706 buf[0] = val->stencil;
707 return;
708 default:
709 unreachable("unexpected zs format");
710 break;
711 }
712 }
713
714 static void
715 tu_physical_device_get_format_properties(
716 struct tu_physical_device *physical_device,
717 VkFormat format,
718 VkFormatProperties *out_properties)
719 {
720 VkFormatFeatureFlags linear = 0, tiled = 0, buffer = 0;
721 const struct vk_format_description *desc = vk_format_description(format);
722 const struct tu_native_format *native_fmt = tu6_get_native_format(format);
723 if (!desc || !native_fmt) {
724 goto end;
725 }
726
727 buffer |= VK_FORMAT_FEATURE_TRANSFER_SRC_BIT | VK_FORMAT_FEATURE_TRANSFER_DST_BIT;
728 if (native_fmt->vtx >= 0) {
729 buffer |= VK_FORMAT_FEATURE_VERTEX_BUFFER_BIT;
730 }
731
732 if (native_fmt->tex >= 0 || native_fmt->rb >= 0) {
733 linear |= VK_FORMAT_FEATURE_TRANSFER_SRC_BIT | VK_FORMAT_FEATURE_TRANSFER_DST_BIT;
734 tiled |= VK_FORMAT_FEATURE_TRANSFER_SRC_BIT | VK_FORMAT_FEATURE_TRANSFER_DST_BIT;
735 }
736
737 if (native_fmt->tex >= 0) {
738 linear |= VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT | VK_FORMAT_FEATURE_SAMPLED_IMAGE_FILTER_LINEAR_BIT;
739 tiled |= VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT | VK_FORMAT_FEATURE_SAMPLED_IMAGE_FILTER_LINEAR_BIT;
740 buffer |= VK_FORMAT_FEATURE_UNIFORM_TEXEL_BUFFER_BIT;
741 }
742
743 if (native_fmt->rb >= 0) {
744 linear |= VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT | VK_FORMAT_FEATURE_BLIT_SRC_BIT | VK_FORMAT_FEATURE_BLIT_DST_BIT;
745 tiled |= VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT | VK_FORMAT_FEATURE_BLIT_SRC_BIT | VK_FORMAT_FEATURE_BLIT_DST_BIT;
746 }
747
748 if (tu6_pipe2depth(format) != (enum a6xx_depth_format)~0) {
749 linear |= VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT;
750 tiled |= VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT;
751 }
752
753 end:
754 out_properties->linearTilingFeatures = linear;
755 out_properties->optimalTilingFeatures = tiled;
756 out_properties->bufferFeatures = buffer;
757 }
758
759 void
760 tu_GetPhysicalDeviceFormatProperties(VkPhysicalDevice physicalDevice,
761 VkFormat format,
762 VkFormatProperties *pFormatProperties)
763 {
764 TU_FROM_HANDLE(tu_physical_device, physical_device, physicalDevice);
765
766 tu_physical_device_get_format_properties(physical_device, format,
767 pFormatProperties);
768 }
769
770 void
771 tu_GetPhysicalDeviceFormatProperties2(
772 VkPhysicalDevice physicalDevice,
773 VkFormat format,
774 VkFormatProperties2 *pFormatProperties)
775 {
776 TU_FROM_HANDLE(tu_physical_device, physical_device, physicalDevice);
777
778 tu_physical_device_get_format_properties(
779 physical_device, format, &pFormatProperties->formatProperties);
780 }
781
782 static VkResult
783 tu_get_image_format_properties(
784 struct tu_physical_device *physical_device,
785 const VkPhysicalDeviceImageFormatInfo2 *info,
786 VkImageFormatProperties *pImageFormatProperties)
787
788 {
789 VkFormatProperties format_props;
790 VkFormatFeatureFlags format_feature_flags;
791 VkExtent3D maxExtent;
792 uint32_t maxMipLevels;
793 uint32_t maxArraySize;
794 VkSampleCountFlags sampleCounts = VK_SAMPLE_COUNT_1_BIT;
795
796 tu_physical_device_get_format_properties(physical_device, info->format,
797 &format_props);
798 if (info->tiling == VK_IMAGE_TILING_LINEAR) {
799 format_feature_flags = format_props.linearTilingFeatures;
800 } else if (info->tiling == VK_IMAGE_TILING_OPTIMAL) {
801 format_feature_flags = format_props.optimalTilingFeatures;
802 } else {
803 unreachable("bad VkImageTiling");
804 }
805
806 if (format_feature_flags == 0)
807 goto unsupported;
808
809 if (info->type != VK_IMAGE_TYPE_2D &&
810 vk_format_is_depth_or_stencil(info->format))
811 goto unsupported;
812
813 switch (info->type) {
814 default:
815 unreachable("bad vkimage type\n");
816 case VK_IMAGE_TYPE_1D:
817 maxExtent.width = 16384;
818 maxExtent.height = 1;
819 maxExtent.depth = 1;
820 maxMipLevels = 15; /* log2(maxWidth) + 1 */
821 maxArraySize = 2048;
822 break;
823 case VK_IMAGE_TYPE_2D:
824 maxExtent.width = 16384;
825 maxExtent.height = 16384;
826 maxExtent.depth = 1;
827 maxMipLevels = 15; /* log2(maxWidth) + 1 */
828 maxArraySize = 2048;
829 break;
830 case VK_IMAGE_TYPE_3D:
831 maxExtent.width = 2048;
832 maxExtent.height = 2048;
833 maxExtent.depth = 2048;
834 maxMipLevels = 12; /* log2(maxWidth) + 1 */
835 maxArraySize = 1;
836 break;
837 }
838
839 if (info->tiling == VK_IMAGE_TILING_OPTIMAL &&
840 info->type == VK_IMAGE_TYPE_2D &&
841 (format_feature_flags &
842 (VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT |
843 VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT)) &&
844 !(info->flags & VK_IMAGE_CREATE_CUBE_COMPATIBLE_BIT) &&
845 !(info->usage & VK_IMAGE_USAGE_STORAGE_BIT)) {
846 sampleCounts |= VK_SAMPLE_COUNT_2_BIT | VK_SAMPLE_COUNT_4_BIT |
847 VK_SAMPLE_COUNT_8_BIT;
848 }
849
850 if (info->usage & VK_IMAGE_USAGE_SAMPLED_BIT) {
851 if (!(format_feature_flags & VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT)) {
852 goto unsupported;
853 }
854 }
855
856 if (info->usage & VK_IMAGE_USAGE_STORAGE_BIT) {
857 if (!(format_feature_flags & VK_FORMAT_FEATURE_STORAGE_IMAGE_BIT)) {
858 goto unsupported;
859 }
860 }
861
862 if (info->usage & VK_IMAGE_USAGE_COLOR_ATTACHMENT_BIT) {
863 if (!(format_feature_flags & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT)) {
864 goto unsupported;
865 }
866 }
867
868 if (info->usage & VK_IMAGE_USAGE_DEPTH_STENCIL_ATTACHMENT_BIT) {
869 if (!(format_feature_flags &
870 VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT)) {
871 goto unsupported;
872 }
873 }
874
875 *pImageFormatProperties = (VkImageFormatProperties) {
876 .maxExtent = maxExtent,
877 .maxMipLevels = maxMipLevels,
878 .maxArrayLayers = maxArraySize,
879 .sampleCounts = sampleCounts,
880
881 /* FINISHME: Accurately calculate
882 * VkImageFormatProperties::maxResourceSize.
883 */
884 .maxResourceSize = UINT32_MAX,
885 };
886
887 return VK_SUCCESS;
888 unsupported:
889 *pImageFormatProperties = (VkImageFormatProperties) {
890 .maxExtent = { 0, 0, 0 },
891 .maxMipLevels = 0,
892 .maxArrayLayers = 0,
893 .sampleCounts = 0,
894 .maxResourceSize = 0,
895 };
896
897 return VK_ERROR_FORMAT_NOT_SUPPORTED;
898 }
899
900 VkResult
901 tu_GetPhysicalDeviceImageFormatProperties(
902 VkPhysicalDevice physicalDevice,
903 VkFormat format,
904 VkImageType type,
905 VkImageTiling tiling,
906 VkImageUsageFlags usage,
907 VkImageCreateFlags createFlags,
908 VkImageFormatProperties *pImageFormatProperties)
909 {
910 TU_FROM_HANDLE(tu_physical_device, physical_device, physicalDevice);
911
912 const VkPhysicalDeviceImageFormatInfo2 info = {
913 .sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_IMAGE_FORMAT_INFO_2,
914 .pNext = NULL,
915 .format = format,
916 .type = type,
917 .tiling = tiling,
918 .usage = usage,
919 .flags = createFlags,
920 };
921
922 return tu_get_image_format_properties(physical_device, &info,
923 pImageFormatProperties);
924 }
925
926 static VkResult
927 tu_get_external_image_format_properties(
928 const struct tu_physical_device *physical_device,
929 const VkPhysicalDeviceImageFormatInfo2 *pImageFormatInfo,
930 VkExternalMemoryHandleTypeFlagBits handleType,
931 VkExternalMemoryProperties *external_properties)
932 {
933 VkExternalMemoryFeatureFlagBits flags = 0;
934 VkExternalMemoryHandleTypeFlags export_flags = 0;
935 VkExternalMemoryHandleTypeFlags compat_flags = 0;
936
937 /* From the Vulkan 1.1.98 spec:
938 *
939 * If handleType is not compatible with the format, type, tiling,
940 * usage, and flags specified in VkPhysicalDeviceImageFormatInfo2,
941 * then vkGetPhysicalDeviceImageFormatProperties2 returns
942 * VK_ERROR_FORMAT_NOT_SUPPORTED.
943 */
944
945 switch (handleType) {
946 case VK_EXTERNAL_MEMORY_HANDLE_TYPE_OPAQUE_FD_BIT:
947 case VK_EXTERNAL_MEMORY_HANDLE_TYPE_DMA_BUF_BIT_EXT:
948 switch (pImageFormatInfo->type) {
949 case VK_IMAGE_TYPE_2D:
950 flags = VK_EXTERNAL_MEMORY_FEATURE_DEDICATED_ONLY_BIT |
951 VK_EXTERNAL_MEMORY_FEATURE_EXPORTABLE_BIT |
952 VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT;
953 compat_flags = export_flags =
954 VK_EXTERNAL_MEMORY_HANDLE_TYPE_OPAQUE_FD_BIT |
955 VK_EXTERNAL_MEMORY_HANDLE_TYPE_DMA_BUF_BIT_EXT;
956 break;
957 default:
958 return vk_errorf(physical_device->instance, VK_ERROR_FORMAT_NOT_SUPPORTED,
959 "VkExternalMemoryTypeFlagBits(0x%x) unsupported for VkImageType(%d)",
960 handleType, pImageFormatInfo->type);
961 }
962 break;
963 case VK_EXTERNAL_MEMORY_HANDLE_TYPE_HOST_ALLOCATION_BIT_EXT:
964 flags = VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT;
965 compat_flags = VK_EXTERNAL_MEMORY_HANDLE_TYPE_HOST_ALLOCATION_BIT_EXT;
966 break;
967 default:
968 return vk_errorf(physical_device->instance, VK_ERROR_FORMAT_NOT_SUPPORTED,
969 "VkExternalMemoryTypeFlagBits(0x%x) unsupported",
970 handleType);
971 }
972
973 *external_properties = (VkExternalMemoryProperties) {
974 .externalMemoryFeatures = flags,
975 .exportFromImportedHandleTypes = export_flags,
976 .compatibleHandleTypes = compat_flags,
977 };
978
979 return VK_SUCCESS;
980 }
981
982 VkResult
983 tu_GetPhysicalDeviceImageFormatProperties2(
984 VkPhysicalDevice physicalDevice,
985 const VkPhysicalDeviceImageFormatInfo2 *base_info,
986 VkImageFormatProperties2 *base_props)
987 {
988 TU_FROM_HANDLE(tu_physical_device, physical_device, physicalDevice);
989 const VkPhysicalDeviceExternalImageFormatInfo *external_info = NULL;
990 VkExternalImageFormatProperties *external_props = NULL;
991 VkResult result;
992
993 result = tu_get_image_format_properties(
994 physical_device, base_info, &base_props->imageFormatProperties);
995 if (result != VK_SUCCESS)
996 return result;
997
998 /* Extract input structs */
999 vk_foreach_struct_const(s, base_info->pNext)
1000 {
1001 switch (s->sType) {
1002 case VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_EXTERNAL_IMAGE_FORMAT_INFO:
1003 external_info = (const void *) s;
1004 break;
1005 default:
1006 break;
1007 }
1008 }
1009
1010 /* Extract output structs */
1011 vk_foreach_struct(s, base_props->pNext)
1012 {
1013 switch (s->sType) {
1014 case VK_STRUCTURE_TYPE_EXTERNAL_IMAGE_FORMAT_PROPERTIES:
1015 external_props = (void *) s;
1016 break;
1017 default:
1018 break;
1019 }
1020 }
1021
1022 /* From the Vulkan 1.0.42 spec:
1023 *
1024 * If handleType is 0, vkGetPhysicalDeviceImageFormatProperties2 will
1025 * behave as if VkPhysicalDeviceExternalImageFormatInfo was not
1026 * present and VkExternalImageFormatProperties will be ignored.
1027 */
1028 if (external_info && external_info->handleType != 0) {
1029 result = tu_get_external_image_format_properties(
1030 physical_device, base_info, external_info->handleType,
1031 &external_props->externalMemoryProperties);
1032 if (result != VK_SUCCESS)
1033 goto fail;
1034 }
1035
1036 return VK_SUCCESS;
1037
1038 fail:
1039 if (result == VK_ERROR_FORMAT_NOT_SUPPORTED) {
1040 /* From the Vulkan 1.0.42 spec:
1041 *
1042 * If the combination of parameters to
1043 * vkGetPhysicalDeviceImageFormatProperties2 is not supported by
1044 * the implementation for use in vkCreateImage, then all members of
1045 * imageFormatProperties will be filled with zero.
1046 */
1047 base_props->imageFormatProperties = (VkImageFormatProperties) { 0 };
1048 }
1049
1050 return result;
1051 }
1052
1053 void
1054 tu_GetPhysicalDeviceSparseImageFormatProperties(
1055 VkPhysicalDevice physicalDevice,
1056 VkFormat format,
1057 VkImageType type,
1058 uint32_t samples,
1059 VkImageUsageFlags usage,
1060 VkImageTiling tiling,
1061 uint32_t *pNumProperties,
1062 VkSparseImageFormatProperties *pProperties)
1063 {
1064 /* Sparse images are not yet supported. */
1065 *pNumProperties = 0;
1066 }
1067
1068 void
1069 tu_GetPhysicalDeviceSparseImageFormatProperties2(
1070 VkPhysicalDevice physicalDevice,
1071 const VkPhysicalDeviceSparseImageFormatInfo2 *pFormatInfo,
1072 uint32_t *pPropertyCount,
1073 VkSparseImageFormatProperties2 *pProperties)
1074 {
1075 /* Sparse images are not yet supported. */
1076 *pPropertyCount = 0;
1077 }
1078
1079 void
1080 tu_GetPhysicalDeviceExternalBufferProperties(
1081 VkPhysicalDevice physicalDevice,
1082 const VkPhysicalDeviceExternalBufferInfo *pExternalBufferInfo,
1083 VkExternalBufferProperties *pExternalBufferProperties)
1084 {
1085 VkExternalMemoryFeatureFlagBits flags = 0;
1086 VkExternalMemoryHandleTypeFlags export_flags = 0;
1087 VkExternalMemoryHandleTypeFlags compat_flags = 0;
1088 switch (pExternalBufferInfo->handleType) {
1089 case VK_EXTERNAL_MEMORY_HANDLE_TYPE_OPAQUE_FD_BIT:
1090 case VK_EXTERNAL_MEMORY_HANDLE_TYPE_DMA_BUF_BIT_EXT:
1091 flags = VK_EXTERNAL_MEMORY_FEATURE_EXPORTABLE_BIT |
1092 VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT;
1093 compat_flags = export_flags =
1094 VK_EXTERNAL_MEMORY_HANDLE_TYPE_OPAQUE_FD_BIT |
1095 VK_EXTERNAL_MEMORY_HANDLE_TYPE_DMA_BUF_BIT_EXT;
1096 break;
1097 case VK_EXTERNAL_MEMORY_HANDLE_TYPE_HOST_ALLOCATION_BIT_EXT:
1098 flags = VK_EXTERNAL_MEMORY_FEATURE_IMPORTABLE_BIT;
1099 compat_flags = VK_EXTERNAL_MEMORY_HANDLE_TYPE_HOST_ALLOCATION_BIT_EXT;
1100 break;
1101 default:
1102 break;
1103 }
1104 pExternalBufferProperties->externalMemoryProperties =
1105 (VkExternalMemoryProperties) {
1106 .externalMemoryFeatures = flags,
1107 .exportFromImportedHandleTypes = export_flags,
1108 .compatibleHandleTypes = compat_flags,
1109 };
1110 }