intel: Implement Gen12 workaround for array textures of size 1
[mesa.git] / src / intel / isl / isl_format.c
1 /*
2 * Copyright 2015 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 #include <assert.h>
25
26 #include "isl.h"
27 #include "isl_priv.h"
28 #include "dev/gen_device_info.h"
29
30 #include "main/macros.h" /* Needed for MAX3 and MAX2 for format_rgb9e5 */
31 #include "util/format_srgb.h"
32 #include "util/format_rgb9e5.h"
33 #include "util/format_r11g11b10f.h"
34
35 /* Header-only format conversion include */
36 #include "main/format_utils.h"
37
/**
 * Capability record for one surface format.
 *
 * `exists` marks entries that were actually written by the SF() macro.
 * Every other field is a threshold on the scale returned by format_gen();
 * the query helpers in this file report a capability when
 * format_gen(devinfo) >= field.
 *
 * The field order is significant: it follows the column order of the SF()
 * macro and of the format table.
 */
struct surface_format_info {
   bool exists;                  /* true for formats listed in the table */
   uint8_t sampling;             /* smpl:  Sampling Engine */
   uint8_t filtering;            /* filt:  Sampling Engine Filtering */
   uint8_t shadow_compare;       /* shad:  Sampling Engine Shadow Map */
   uint8_t chroma_key;           /* CK:    Sampling Engine Chroma Key */
   uint8_t render_target;        /* RT:    Render Target */
   uint8_t alpha_blend;          /* AB:    Alpha Blend Render Target */
   uint8_t input_vb;             /* VB:    Input Vertex Buffer */
   uint8_t streamed_output_vb;   /* SO:    Streamed Output Vertex Buffers */
   uint8_t color_processing;     /* color: Color Processing */
   uint8_t typed_write;          /* TW:    typed writes */
   uint8_t typed_read;           /* TR:    typed reads */
   uint8_t ccs_e;                /* ccs_e: Lossless Compression Support */
};
53
/* Emits one format table entry, indexed by ISL_FORMAT_<fmt>.
 *
 * The arguments arrive in the column order of the PRM table so that rows
 * can be written almost as they appear there; the macro maps each column
 * onto the matching surface_format_info field and marks the entry as
 * existing.  Parameter names are deliberately different from the field
 * names so that the designators are not rewritten during expansion.
 */
#define SF(smpl, filt, shad, ck, rt, ab, vb, so, color, tw, tr, ccs, fmt) \
   [ISL_FORMAT_##fmt] = {                                                  \
      .exists = true,                                                      \
      .sampling = smpl,                                                    \
      .filtering = filt,                                                   \
      .shadow_compare = shad,                                              \
      .chroma_key = ck,                                                    \
      .render_target = rt,                                                 \
      .alpha_blend = ab,                                                   \
      .input_vb = vb,                                                      \
      .streamed_output_vb = so,                                            \
      .color_processing = color,                                           \
      .typed_write = tw,                                                   \
      .typed_read = tr,                                                    \
      .ccs_e = ccs,                                                        \
   },
59
/* Shorthand for the format table cells.  A cell is a threshold that the
 * query helpers compare as format_gen(devinfo) >= cell.
 */
#define Y   0   /* threshold 0: satisfied by every format_gen() value */
#define x 255   /* largest uint8_t: above every generation value in the table */
62 /**
63 * This is the table of support for surface (texture, renderbuffer, and vertex
64 * buffer, but not depthbuffer) formats across the various hardware generations.
65 *
66 * The table is formatted to match the documentation, except that the docs have
67 * this ridiculous mapping of Y[*+~^#&] for "supported on DevWhatever". To put
68 * it in our table, here's the mapping:
69 *
70 * Y*: 45
71 * Y+: 45 (g45/gm45)
72 * Y~: 50 (gen5)
73 * Y^: 60 (gen6)
74 * Y#: 70 (gen7)
75 *
76 * The abbreviations in the header below are:
77 * smpl - Sampling Engine
78 * filt - Sampling Engine Filtering
79 * shad - Sampling Engine Shadow Map
80 * CK - Sampling Engine Chroma Key
81 * RT - Render Target
82 * AB - Alpha Blend Render Target
83 * VB - Input Vertex Buffer
84 * SO - Steamed Output Vertex Buffers (transform feedback)
85 * color - Color Processing
86 * ccs_e - Lossless Compression Support (gen9+ only)
87 * sf - Surface Format
88 *
89 * See page 88 of the Sandybridge PRM VOL4_Part1 PDF.
90 *
91 * As of Ivybridge, the columns are no longer in that table and the
92 * information can be found spread across:
93 *
94 * - VOL2_Part1 section 2.5.11 Format Conversion (vertex fetch).
95 * - VOL4_Part1 section 2.12.2.1.2 Sampler Output Channel Mapping.
96 * - VOL4_Part1 section 3.9.11 Render Target Write.
97 * - Render Target Surface Types [SKL+]
98 */
99 static const struct surface_format_info format_info[] = {
100 /* smpl filt shad CK RT AB VB SO color TW TR ccs_e */
101 SF( Y, 50, x, x, Y, Y, Y, Y, x, 70, 90, 90, R32G32B32A32_FLOAT)
102 SF( Y, x, x, x, Y, x, Y, Y, x, 70, 90, 90, R32G32B32A32_SINT)
103 SF( Y, x, x, x, Y, x, Y, Y, x, 70, 90, 90, R32G32B32A32_UINT)
104 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32G32B32A32_UNORM)
105 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32G32B32A32_SNORM)
106 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R64G64_FLOAT)
107 SF( Y, 50, x, x, 100, 100, x, x, x, x, x, 100, R32G32B32X32_FLOAT)
108 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32G32B32A32_SSCALED)
109 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32G32B32A32_USCALED)
110 SF( x, x, x, x, x, x, 75, x, x, x, x, x, R32G32B32A32_SFIXED)
111 SF( x, x, x, x, x, x, 80, x, x, x, x, x, R64G64_PASSTHRU)
112 SF( Y, 50, x, x, x, x, Y, Y, x, x, x, x, R32G32B32_FLOAT)
113 SF( Y, x, x, x, x, x, Y, Y, x, x, x, x, R32G32B32_SINT)
114 SF( Y, x, x, x, x, x, Y, Y, x, x, x, x, R32G32B32_UINT)
115 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32G32B32_UNORM)
116 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32G32B32_SNORM)
117 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32G32B32_SSCALED)
118 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32G32B32_USCALED)
119 SF( x, x, x, x, x, x, 75, x, x, x, x, x, R32G32B32_SFIXED)
120 SF( Y, Y, x, x, Y, 45, Y, x, 60, 70, 110, 90, R16G16B16A16_UNORM)
121 SF( Y, Y, x, x, Y, 60, Y, x, x, 70, 110, 90, R16G16B16A16_SNORM)
122 SF( Y, x, x, x, Y, x, Y, x, x, 70, 90, 90, R16G16B16A16_SINT)
123 SF( Y, x, x, x, Y, x, Y, x, x, 70, 75, 90, R16G16B16A16_UINT)
124 SF( Y, Y, x, x, Y, Y, Y, x, x, 70, 90, 90, R16G16B16A16_FLOAT)
125 SF( Y, 50, x, x, Y, Y, Y, Y, x, 70, 90, 90, R32G32_FLOAT)
126 SF( Y, 70, x, x, Y, Y, Y, Y, x, x, x, x, R32G32_FLOAT_LD)
127 SF( Y, x, x, x, Y, x, Y, Y, x, 70, 90, 90, R32G32_SINT)
128 SF( Y, x, x, x, Y, x, Y, Y, x, 70, 90, 90, R32G32_UINT)
129 SF( Y, 50, Y, x, x, x, x, x, x, x, x, x, R32_FLOAT_X8X24_TYPELESS)
130 SF( Y, x, x, x, x, x, x, x, x, x, x, x, X32_TYPELESS_G8X24_UINT)
131 SF( Y, 50, x, x, x, x, x, x, x, x, x, x, L32A32_FLOAT)
132 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32G32_UNORM)
133 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32G32_SNORM)
134 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R64_FLOAT)
135 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, R16G16B16X16_UNORM)
136 SF( Y, Y, x, x, 90, 90, x, x, x, x, x, 90, R16G16B16X16_FLOAT)
137 SF( Y, 50, x, x, x, x, x, x, x, x, x, x, A32X32_FLOAT)
138 SF( Y, 50, x, x, x, x, x, x, x, x, x, x, L32X32_FLOAT)
139 SF( Y, 50, x, x, x, x, x, x, x, x, x, x, I32X32_FLOAT)
140 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R16G16B16A16_SSCALED)
141 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R16G16B16A16_USCALED)
142 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32G32_SSCALED)
143 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32G32_USCALED)
144 SF( x, x, x, x, x, x, 75, x, x, x, x, x, R32G32_SFIXED)
145 SF( x, x, x, x, x, x, 80, x, x, x, x, x, R64_PASSTHRU)
146 SF( Y, Y, x, Y, Y, Y, Y, x, 60, 70, x, 90, B8G8R8A8_UNORM)
147 SF( Y, Y, x, x, Y, Y, x, x, x, x, x, 100, B8G8R8A8_UNORM_SRGB)
148 /* smpl filt shad CK RT AB VB SO color TW TR ccs_e */
149 SF( Y, Y, x, x, Y, Y, Y, x, 60, 70, x, 100, R10G10B10A2_UNORM)
150 SF( Y, Y, x, x, x, x, x, x, 60, x, x, 120, R10G10B10A2_UNORM_SRGB)
151 SF( Y, x, x, x, Y, x, Y, x, x, 70, x, 100, R10G10B10A2_UINT)
152 SF( Y, Y, x, x, x, x, Y, x, x, x, x, x, R10G10B10_SNORM_A2_UNORM)
153 SF( Y, Y, x, x, Y, Y, Y, x, 60, 70, 110, 90, R8G8B8A8_UNORM)
154 SF( Y, Y, x, x, Y, Y, x, x, 60, x, x, 100, R8G8B8A8_UNORM_SRGB)
155 SF( Y, Y, x, x, Y, 60, Y, x, x, 70, 110, 90, R8G8B8A8_SNORM)
156 SF( Y, x, x, x, Y, x, Y, x, x, 70, 90, 90, R8G8B8A8_SINT)
157 SF( Y, x, x, x, Y, x, Y, x, x, 70, 75, 90, R8G8B8A8_UINT)
158 SF( Y, Y, x, x, Y, 45, Y, x, x, 70, 110, 90, R16G16_UNORM)
159 SF( Y, Y, x, x, Y, 60, Y, x, x, 70, 110, 90, R16G16_SNORM)
160 SF( Y, x, x, x, Y, x, Y, x, x, 70, 90, 90, R16G16_SINT)
161 SF( Y, x, x, x, Y, x, Y, x, x, 70, 75, 90, R16G16_UINT)
162 SF( Y, Y, x, x, Y, Y, Y, x, x, 70, 90, 90, R16G16_FLOAT)
163 SF( Y, Y, x, x, Y, Y, 75, x, 60, 70, x, 100, B10G10R10A2_UNORM)
164 SF( Y, Y, x, x, Y, Y, x, x, 60, x, x, 100, B10G10R10A2_UNORM_SRGB)
165 SF( Y, Y, x, x, Y, Y, Y, x, x, 70, x, 100, R11G11B10_FLOAT)
166 SF(120, 120, x, x, 120, 120, x, x, x, x, x, 120, R10G10B10_FLOAT_A2_UNORM)
167 SF( Y, x, x, x, Y, x, Y, Y, x, 70, 70, 90, R32_SINT)
168 SF( Y, x, x, x, Y, x, Y, Y, x, 70, 70, 90, R32_UINT)
169 SF( Y, 50, Y, x, Y, Y, Y, Y, x, 70, 70, 90, R32_FLOAT)
170 SF( Y, 50, Y, x, x, x, x, x, x, x, x, 120, R24_UNORM_X8_TYPELESS)
171 SF( Y, x, x, x, x, x, x, x, x, x, x, x, X24_TYPELESS_G8_UINT)
172 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, L16A16_UNORM)
173 SF( Y, 50, Y, x, x, x, x, x, x, x, x, x, I24X8_UNORM)
174 SF( Y, 50, Y, x, x, x, x, x, x, x, x, x, L24X8_UNORM)
175 SF( Y, 50, Y, x, x, x, x, x, x, x, x, x, A24X8_UNORM)
176 SF( Y, 50, Y, x, x, x, x, x, x, x, x, x, I32_FLOAT)
177 SF( Y, 50, Y, x, x, x, x, x, x, x, x, x, L32_FLOAT)
178 SF( Y, 50, Y, x, x, x, x, x, x, x, x, x, A32_FLOAT)
179 SF( Y, Y, x, Y, 80, 80, x, x, 60, x, x, 90, B8G8R8X8_UNORM)
180 SF( Y, Y, x, x, 80, 80, x, x, x, x, x, 100, B8G8R8X8_UNORM_SRGB)
181 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, R8G8B8X8_UNORM)
182 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, R8G8B8X8_UNORM_SRGB)
183 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, R9G9B9E5_SHAREDEXP)
184 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, B10G10R10X2_UNORM)
185 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, L16A16_FLOAT)
186 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32_UNORM)
187 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32_SNORM)
188 /* smpl filt shad CK RT AB VB SO color TW TR ccs_e */
189 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R10G10B10X2_USCALED)
190 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R8G8B8A8_SSCALED)
191 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R8G8B8A8_USCALED)
192 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R16G16_SSCALED)
193 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R16G16_USCALED)
194 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32_SSCALED)
195 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R32_USCALED)
196 SF( Y, Y, x, Y, Y, Y, x, x, x, 70, x, 120, B5G6R5_UNORM)
197 SF( Y, Y, x, x, Y, Y, x, x, x, x, x, 120, B5G6R5_UNORM_SRGB)
198 SF( Y, Y, x, Y, Y, Y, x, x, x, 70, x, 120, B5G5R5A1_UNORM)
199 SF( Y, Y, x, x, Y, Y, x, x, x, x, x, 120, B5G5R5A1_UNORM_SRGB)
200 SF( Y, Y, x, Y, Y, Y, x, x, x, 70, x, 120, B4G4R4A4_UNORM)
201 SF( Y, Y, x, x, Y, Y, x, x, x, x, x, 120, B4G4R4A4_UNORM_SRGB)
202 SF( Y, Y, x, x, Y, Y, Y, x, x, 70, 110, 120, R8G8_UNORM)
203 SF( Y, Y, x, Y, Y, 60, Y, x, x, 70, 110, 120, R8G8_SNORM)
204 SF( Y, x, x, x, Y, x, Y, x, x, 70, 90, 120, R8G8_SINT)
205 SF( Y, x, x, x, Y, x, Y, x, x, 70, 75, 120, R8G8_UINT)
206 SF( Y, Y, Y, x, Y, 45, Y, x, 70, 70, 110, 120, R16_UNORM)
207 SF( Y, Y, x, x, Y, 60, Y, x, x, 70, 110, 120, R16_SNORM)
208 SF( Y, x, x, x, Y, x, Y, x, x, 70, 90, 120, R16_SINT)
209 SF( Y, x, x, x, Y, x, Y, x, x, 70, 75, 120, R16_UINT)
210 SF( Y, Y, x, x, Y, Y, Y, x, x, 70, 90, 120, R16_FLOAT)
211 SF( 50, 50, x, x, x, x, x, x, x, x, x, x, A8P8_UNORM_PALETTE0)
212 SF( 50, 50, x, x, x, x, x, x, x, x, x, x, A8P8_UNORM_PALETTE1)
213 SF( Y, Y, Y, x, x, x, x, x, x, x, x, x, I16_UNORM)
214 SF( Y, Y, Y, x, x, x, x, x, x, x, x, x, L16_UNORM)
215 SF( Y, Y, Y, x, x, x, x, x, x, x, x, x, A16_UNORM)
216 SF( Y, Y, x, Y, x, x, x, x, x, x, x, x, L8A8_UNORM)
217 SF( Y, Y, Y, x, x, x, x, x, x, x, x, x, I16_FLOAT)
218 SF( Y, Y, Y, x, x, x, x, x, x, x, x, x, L16_FLOAT)
219 SF( Y, Y, Y, x, x, x, x, x, x, x, x, x, A16_FLOAT)
220 SF( 45, 45, x, x, x, x, x, x, x, x, x, x, L8A8_UNORM_SRGB)
221 SF( Y, Y, x, Y, x, x, x, x, x, x, x, x, R5G5_SNORM_B6_UNORM)
222 SF( x, x, x, x, Y, Y, x, x, x, 70, x, 120, B5G5R5X1_UNORM)
223 SF( x, x, x, x, Y, Y, x, x, x, x, x, 120, B5G5R5X1_UNORM_SRGB)
224 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R8G8_SSCALED)
225 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R8G8_USCALED)
226 /* smpl filt shad CK RT AB VB SO color TW TR ccs_e */
227 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R16_SSCALED)
228 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R16_USCALED)
229 SF( 50, 50, x, x, x, x, x, x, x, x, x, x, P8A8_UNORM_PALETTE0)
230 SF( 50, 50, x, x, x, x, x, x, x, x, x, x, P8A8_UNORM_PALETTE1)
231 SF(120, 120, x, x, 120, 120, x, x, x, x, x, 120, A1B5G5R5_UNORM)
232 /* According to the PRM, A4B4G4R4_UNORM isn't supported until Sky Lake
233 * but empirical testing indicates that at least sampling works just fine
234 * on Broadwell.
235 */
236 SF( 80, 80, x, x, 90, 120, x, x, x, x, x, 120, A4B4G4R4_UNORM)
237 SF( 90, x, x, x, x, x, x, x, x, x, x, x, L8A8_UINT)
238 SF( 90, x, x, x, x, x, x, x, x, x, x, x, L8A8_SINT)
239 SF( Y, Y, x, 45, Y, Y, Y, x, x, 70, 110, 120, R8_UNORM)
240 SF( Y, Y, x, x, Y, 60, Y, x, x, 70, 110, 120, R8_SNORM)
241 SF( Y, x, x, x, Y, x, Y, x, x, 70, 90, 120, R8_SINT)
242 SF( Y, x, x, x, Y, x, Y, x, x, 70, 75, 120, R8_UINT)
243 SF( Y, Y, x, Y, Y, Y, x, x, x, 70, 110, 120, A8_UNORM)
244 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, I8_UNORM)
245 SF( Y, Y, x, Y, x, x, x, x, x, x, x, x, L8_UNORM)
246 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, P4A4_UNORM_PALETTE0)
247 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, A4P4_UNORM_PALETTE0)
248 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R8_SSCALED)
249 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R8_USCALED)
250 SF( 45, 45, x, x, x, x, x, x, x, x, x, x, P8_UNORM_PALETTE0)
251 SF( 45, 45, x, x, x, x, x, x, x, x, x, x, L8_UNORM_SRGB)
252 SF( 45, 45, x, x, x, x, x, x, x, x, x, x, P8_UNORM_PALETTE1)
253 SF( 45, 45, x, x, x, x, x, x, x, x, x, x, P4A4_UNORM_PALETTE1)
254 SF( 45, 45, x, x, x, x, x, x, x, x, x, x, A4P4_UNORM_PALETTE1)
255 SF( x, x, x, x, x, x, x, x, x, x, x, x, Y8_UNORM)
256 SF( 90, x, x, x, x, x, x, x, x, x, x, x, L8_UINT)
257 SF( 90, x, x, x, x, x, x, x, x, x, x, x, L8_SINT)
258 SF( 90, x, x, x, x, x, x, x, x, x, x, x, I8_UINT)
259 SF( 90, x, x, x, x, x, x, x, x, x, x, x, I8_SINT)
260 SF( 45, 45, x, x, x, x, x, x, x, x, x, x, DXT1_RGB_SRGB)
261 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, R1_UNORM)
262 SF( Y, Y, x, Y, Y, x, x, x, 60, x, x, x, YCRCB_NORMAL)
263 SF( Y, Y, x, Y, Y, x, x, x, 60, x, x, x, YCRCB_SWAPUVY)
264 SF( 45, 45, x, x, x, x, x, x, x, x, x, x, P2_UNORM_PALETTE0)
265 SF( 45, 45, x, x, x, x, x, x, x, x, x, x, P2_UNORM_PALETTE1)
266 SF( Y, Y, x, Y, x, x, x, x, x, x, x, x, BC1_UNORM)
267 SF( Y, Y, x, Y, x, x, x, x, x, x, x, x, BC2_UNORM)
268 SF( Y, Y, x, Y, x, x, x, x, x, x, x, x, BC3_UNORM)
269 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, BC4_UNORM)
270 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, BC5_UNORM)
271 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, BC1_UNORM_SRGB)
272 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, BC2_UNORM_SRGB)
273 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, BC3_UNORM_SRGB)
274 SF( Y, x, x, x, x, x, x, x, x, x, x, x, MONO8)
275 SF( Y, Y, x, x, Y, x, x, x, 60, x, x, x, YCRCB_SWAPUV)
276 SF( Y, Y, x, x, Y, x, x, x, 60, x, x, x, YCRCB_SWAPY)
277 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, DXT1_RGB)
278 /* smpl filt shad CK RT AB VB SO color TW TR ccs_e */
279 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, FXT1)
280 SF( 75, 75, x, x, x, x, Y, x, x, x, x, x, R8G8B8_UNORM)
281 SF( 75, 75, x, x, x, x, Y, x, x, x, x, x, R8G8B8_SNORM)
282 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R8G8B8_SSCALED)
283 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R8G8B8_USCALED)
284 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R64G64B64A64_FLOAT)
285 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R64G64B64_FLOAT)
286 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, BC4_SNORM)
287 SF( Y, Y, x, x, x, x, x, x, x, x, x, x, BC5_SNORM)
288 SF( 50, 50, x, x, x, x, 60, x, x, x, x, x, R16G16B16_FLOAT)
289 SF( 75, 75, x, x, x, x, Y, x, x, x, x, x, R16G16B16_UNORM)
290 SF( 75, 75, x, x, x, x, Y, x, x, x, x, x, R16G16B16_SNORM)
291 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R16G16B16_SSCALED)
292 SF( x, x, x, x, x, x, Y, x, x, x, x, x, R16G16B16_USCALED)
293 SF( 70, 70, x, x, x, x, x, x, x, x, x, x, BC6H_SF16)
294 SF( 70, 70, x, x, x, x, x, x, x, x, x, x, BC7_UNORM)
295 SF( 70, 70, x, x, x, x, x, x, x, x, x, x, BC7_UNORM_SRGB)
296 SF( 70, 70, x, x, x, x, x, x, x, x, x, x, BC6H_UF16)
297 SF( x, x, x, x, x, x, x, x, x, x, x, x, PLANAR_420_8)
298 /* The format enum for R8G8B8_UNORM_SRGB first shows up in the HSW PRM but
299 * empirical testing indicates that it doesn't actually sRGB decode and
300 * acts identical to R8G8B8_UNORM. It does work on gen8+.
301 */
302 SF( 80, 80, x, x, x, x, x, x, x, x, x, x, R8G8B8_UNORM_SRGB)
303 SF( 80, 80, x, x, x, x, x, x, x, x, x, x, ETC1_RGB8)
304 SF( 80, 80, x, x, x, x, x, x, x, x, x, x, ETC2_RGB8)
305 SF( 80, 80, x, x, x, x, x, x, x, x, x, x, EAC_R11)
306 SF( 80, 80, x, x, x, x, x, x, x, x, x, x, EAC_RG11)
307 SF( 80, 80, x, x, x, x, x, x, x, x, x, x, EAC_SIGNED_R11)
308 SF( 80, 80, x, x, x, x, x, x, x, x, x, x, EAC_SIGNED_RG11)
309 SF( 80, 80, x, x, x, x, x, x, x, x, x, x, ETC2_SRGB8)
310 SF( 90, x, x, x, x, x, 75, x, x, x, x, x, R16G16B16_UINT)
311 SF( 90, x, x, x, x, x, 75, x, x, x, x, x, R16G16B16_SINT)
312 SF( x, x, x, x, x, x, 75, x, x, x, x, x, R32_SFIXED)
313 SF( x, x, x, x, x, x, 75, x, x, x, x, x, R10G10B10A2_SNORM)
314 SF( x, x, x, x, x, x, 75, x, x, x, x, x, R10G10B10A2_USCALED)
315 SF( x, x, x, x, x, x, 75, x, x, x, x, x, R10G10B10A2_SSCALED)
316 SF( x, x, x, x, x, x, 75, x, x, x, x, x, R10G10B10A2_SINT)
317 SF( x, x, x, x, x, x, 75, x, x, x, x, x, B10G10R10A2_SNORM)
318 SF( x, x, x, x, x, x, 75, x, x, x, x, x, B10G10R10A2_USCALED)
319 SF( x, x, x, x, x, x, 75, x, x, x, x, x, B10G10R10A2_SSCALED)
320 SF( x, x, x, x, x, x, 75, x, x, x, x, x, B10G10R10A2_UINT)
321 SF( x, x, x, x, x, x, 75, x, x, x, x, x, B10G10R10A2_SINT)
322 SF( x, x, x, x, x, x, 80, x, x, x, x, x, R64G64B64A64_PASSTHRU)
323 SF( x, x, x, x, x, x, 80, x, x, x, x, x, R64G64B64_PASSTHRU)
324 SF( 80, 80, x, x, x, x, x, x, x, x, x, x, ETC2_RGB8_PTA)
325 SF( 80, 80, x, x, x, x, x, x, x, x, x, x, ETC2_SRGB8_PTA)
326 SF( 80, 80, x, x, x, x, x, x, x, x, x, x, ETC2_EAC_RGBA8)
327 SF( 80, 80, x, x, x, x, x, x, x, x, x, x, ETC2_EAC_SRGB8_A8)
328 SF( 90, x, x, x, x, x, 75, x, x, x, x, x, R8G8B8_UINT)
329 SF( 90, x, x, x, x, x, 75, x, x, x, x, x, R8G8B8_SINT)
330 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_4X4_FLT16)
331 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_5X4_FLT16)
332 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_5X5_FLT16)
333 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_6X5_FLT16)
334 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_6X6_FLT16)
335 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_8X5_FLT16)
336 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_8X6_FLT16)
337 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_8X8_FLT16)
338 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_10X5_FLT16)
339 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_10X6_FLT16)
340 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_10X8_FLT16)
341 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_10X10_FLT16)
342 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_12X10_FLT16)
343 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_12X12_FLT16)
344 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_4X4_U8SRGB)
345 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_5X4_U8SRGB)
346 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_5X5_U8SRGB)
347 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_6X5_U8SRGB)
348 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_6X6_U8SRGB)
349 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_8X5_U8SRGB)
350 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_8X6_U8SRGB)
351 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_8X8_U8SRGB)
352 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_10X5_U8SRGB)
353 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_10X6_U8SRGB)
354 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_10X8_U8SRGB)
355 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_10X10_U8SRGB)
356 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_12X10_U8SRGB)
357 SF( 90, 90, x, x, x, x, x, x, x, x, x, x, ASTC_LDR_2D_12X12_U8SRGB)
358 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_4X4_FLT16)
359 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_5X4_FLT16)
360 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_5X5_FLT16)
361 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_6X5_FLT16)
362 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_6X6_FLT16)
363 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_8X5_FLT16)
364 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_8X6_FLT16)
365 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_8X8_FLT16)
366 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_10X5_FLT16)
367 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_10X6_FLT16)
368 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_10X8_FLT16)
369 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_10X10_FLT16)
370 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_12X10_FLT16)
371 SF(100, 100, x, x, x, x, x, x, x, x, x, x, ASTC_HDR_2D_12X12_FLT16)
372 };
373 #undef x
374 #undef Y
375
376 static unsigned
377 format_gen(const struct gen_device_info *devinfo)
378 {
379 return devinfo->gen * 10 + (devinfo->is_g4x || devinfo->is_haswell) * 5;
380 }
381
382 static bool
383 format_info_exists(enum isl_format format)
384 {
385 assert(format != ISL_FORMAT_UNSUPPORTED);
386 assert(format < ISL_NUM_FORMATS);
387 return format < ARRAY_SIZE(format_info) && format_info[format].exists;
388 }
389
390 bool
391 isl_format_supports_rendering(const struct gen_device_info *devinfo,
392 enum isl_format format)
393 {
394 if (!format_info_exists(format))
395 return false;
396
397 return format_gen(devinfo) >= format_info[format].render_target;
398 }
399
400 bool
401 isl_format_supports_alpha_blending(const struct gen_device_info *devinfo,
402 enum isl_format format)
403 {
404 if (!format_info_exists(format))
405 return false;
406
407 return format_gen(devinfo) >= format_info[format].alpha_blend;
408 }
409
410 bool
411 isl_format_supports_sampling(const struct gen_device_info *devinfo,
412 enum isl_format format)
413 {
414 if (!format_info_exists(format))
415 return false;
416
417 if (devinfo->is_baytrail) {
418 const struct isl_format_layout *fmtl = isl_format_get_layout(format);
419 /* Support for ETC1 and ETC2 exists on Bay Trail even though big-core
420 * GPUs didn't get it until Broadwell.
421 */
422 if (fmtl->txc == ISL_TXC_ETC1 || fmtl->txc == ISL_TXC_ETC2)
423 return true;
424 } else if (devinfo->is_cherryview) {
425 const struct isl_format_layout *fmtl = isl_format_get_layout(format);
426 /* Support for ASTC LDR exists on Cherry View even though big-core
427 * GPUs didn't get it until Skylake.
428 */
429 if (fmtl->txc == ISL_TXC_ASTC)
430 return format < ISL_FORMAT_ASTC_HDR_2D_4X4_FLT16;
431 } else if (gen_device_info_is_9lp(devinfo)) {
432 const struct isl_format_layout *fmtl = isl_format_get_layout(format);
433 /* Support for ASTC HDR exists on Broxton even though big-core
434 * GPUs didn't get it until Cannonlake.
435 */
436 if (fmtl->txc == ISL_TXC_ASTC)
437 return true;
438 }
439
440 return format_gen(devinfo) >= format_info[format].sampling;
441 }
442
443 bool
444 isl_format_supports_filtering(const struct gen_device_info *devinfo,
445 enum isl_format format)
446 {
447 if (!format_info_exists(format))
448 return false;
449
450 if (devinfo->is_baytrail) {
451 const struct isl_format_layout *fmtl = isl_format_get_layout(format);
452 /* Support for ETC1 and ETC2 exists on Bay Trail even though big-core
453 * GPUs didn't get it until Broadwell.
454 */
455 if (fmtl->txc == ISL_TXC_ETC1 || fmtl->txc == ISL_TXC_ETC2)
456 return true;
457 } else if (devinfo->is_cherryview) {
458 const struct isl_format_layout *fmtl = isl_format_get_layout(format);
459 /* Support for ASTC LDR exists on Cherry View even though big-core
460 * GPUs didn't get it until Skylake.
461 */
462 if (fmtl->txc == ISL_TXC_ASTC)
463 return format < ISL_FORMAT_ASTC_HDR_2D_4X4_FLT16;
464 } else if (gen_device_info_is_9lp(devinfo)) {
465 const struct isl_format_layout *fmtl = isl_format_get_layout(format);
466 /* Support for ASTC HDR exists on Broxton even though big-core
467 * GPUs didn't get it until Cannonlake.
468 */
469 if (fmtl->txc == ISL_TXC_ASTC)
470 return true;
471 }
472
473 return format_gen(devinfo) >= format_info[format].filtering;
474 }
475
476 bool
477 isl_format_supports_vertex_fetch(const struct gen_device_info *devinfo,
478 enum isl_format format)
479 {
480 if (!format_info_exists(format))
481 return false;
482
483 /* For vertex fetch, Bay Trail supports the same set of formats as Haswell
484 * but is a superset of Ivy Bridge.
485 */
486 if (devinfo->is_baytrail)
487 return 75 >= format_info[format].input_vb;
488
489 return format_gen(devinfo) >= format_info[format].input_vb;
490 }
491
492 /**
493 * Returns true if the given format can support typed writes.
494 */
495 bool
496 isl_format_supports_typed_writes(const struct gen_device_info *devinfo,
497 enum isl_format format)
498 {
499 if (!format_info_exists(format))
500 return false;
501
502 return format_gen(devinfo) >= format_info[format].typed_write;
503 }
504
505
506 /**
507 * Returns true if the given format can support typed reads with format
508 * conversion fully handled by hardware. On Sky Lake, all formats which are
509 * supported for typed writes also support typed reads but some of them return
510 * the raw image data and don't provide format conversion.
511 *
512 * For anyone looking to find this data in the PRM, the easiest way to find
513 * format tables is to search for R11G11B10. There are only a few
514 * occurrences.
515 */
516 bool
517 isl_format_supports_typed_reads(const struct gen_device_info *devinfo,
518 enum isl_format format)
519 {
520 if (!format_info_exists(format))
521 return false;
522
523 return format_gen(devinfo) >= format_info[format].typed_read;
524 }
525
526 /**
527 * Returns true if the given format can support single-sample fast clears.
528 * This function only checks the format. In order to determine if a surface
529 * supports CCS_E, several other factors need to be considered such as tiling
530 * and sample count. See isl_surf_get_ccs_surf for details.
531 */
532 bool
533 isl_format_supports_ccs_d(const struct gen_device_info *devinfo,
534 enum isl_format format)
535 {
536 /* Clear-only compression was first added on Ivy Bridge and was last
537 * implemented on Ice lake (see BSpec: 43862).
538 */
539 if (devinfo->gen < 7 || devinfo->gen > 11)
540 return false;
541
542 if (!isl_format_supports_rendering(devinfo, format))
543 return false;
544
545 const struct isl_format_layout *fmtl = isl_format_get_layout(format);
546
547 return fmtl->bpb == 32 || fmtl->bpb == 64 || fmtl->bpb == 128;
548 }
549
550 /**
551 * Returns true if the given format can support single-sample color
552 * compression. This function only checks the format. In order to determine
553 * if a surface supports CCS_E, several other factors need to be considered
554 * such as tiling and sample count. See isl_surf_get_ccs_surf for details.
555 */
556 bool
557 isl_format_supports_ccs_e(const struct gen_device_info *devinfo,
558 enum isl_format format)
559 {
560 if (!format_info_exists(format))
561 return false;
562
563 /* For simplicity, only report that a format supports CCS_E if blorp can
564 * perform bit-for-bit copies with an image of that format while compressed.
565 * Unfortunately, R11G11B10_FLOAT is in a compression class of its own and
566 * there is no way to copy to/from it which doesn't potentially loose data
567 * if one of the bit patterns being copied isn't valid finite floats.
568 */
569 if (format == ISL_FORMAT_R11G11B10_FLOAT)
570 return false;
571
572 return format_gen(devinfo) >= format_info[format].ccs_e;
573 }
574
575 bool
576 isl_format_supports_multisampling(const struct gen_device_info *devinfo,
577 enum isl_format format)
578 {
579 /* From the Sandybridge PRM, Volume 4 Part 1 p72, SURFACE_STATE, Surface
580 * Format:
581 *
582 * If Number of Multisamples is set to a value other than
583 * MULTISAMPLECOUNT_1, this field cannot be set to the following
584 * formats:
585 *
586 * - any format with greater than 64 bits per element
587 * - any compressed texture format (BC*)
588 * - any YCRCB* format
589 *
590 * The restriction on the format's size is removed on Broadwell. Moreover,
591 * empirically it looks that even IvyBridge can handle multisampled surfaces
592 * with format sizes all the way to 128-bits (RGBA32F, RGBA32I, RGBA32UI).
593 *
594 * Also, there is an exception for HiZ which we treat as a compressed
595 * format and is allowed to be multisampled on Broadwell and earlier.
596 */
597 if (format == ISL_FORMAT_HIZ) {
598 /* On SKL+, HiZ is always single-sampled even when the primary surface
599 * is multisampled. See also isl_surf_get_hiz_surf().
600 */
601 return devinfo->gen <= 8;
602 } else if (devinfo->gen < 7 && isl_format_get_layout(format)->bpb > 64) {
603 return false;
604 } else if (isl_format_is_compressed(format)) {
605 return false;
606 } else if (isl_format_is_yuv(format)) {
607 return false;
608 } else {
609 return true;
610 }
611 }
612
613 /**
614 * Returns true if the two formats are "CCS_E compatible" meaning that you can
615 * render in one format with CCS_E enabled and then texture using the other
616 * format without needing a resolve.
617 *
618 * Note: Even if the formats are compatible, special care must be taken if a
619 * clear color is involved because the encoding of the clear color is heavily
620 * format-dependent.
621 */
622 bool
623 isl_formats_are_ccs_e_compatible(const struct gen_device_info *devinfo,
624 enum isl_format format1,
625 enum isl_format format2)
626 {
627 /* They must support CCS_E */
628 if (!isl_format_supports_ccs_e(devinfo, format1) ||
629 !isl_format_supports_ccs_e(devinfo, format2))
630 return false;
631
632 const struct isl_format_layout *fmtl1 = isl_format_get_layout(format1);
633 const struct isl_format_layout *fmtl2 = isl_format_get_layout(format2);
634
635 /* The compression used by CCS is not dependent on the actual data encoding
636 * of the format but only depends on the bit-layout of the channels.
637 */
638 return fmtl1->channels.r.bits == fmtl2->channels.r.bits &&
639 fmtl1->channels.g.bits == fmtl2->channels.g.bits &&
640 fmtl1->channels.b.bits == fmtl2->channels.b.bits &&
641 fmtl1->channels.a.bits == fmtl2->channels.a.bits;
642 }
643
644 static bool
645 isl_format_has_channel_type(enum isl_format fmt, enum isl_base_type type)
646 {
647 const struct isl_format_layout *fmtl = isl_format_get_layout(fmt);
648
649 return fmtl->channels.r.type == type ||
650 fmtl->channels.g.type == type ||
651 fmtl->channels.b.type == type ||
652 fmtl->channels.a.type == type ||
653 fmtl->channels.l.type == type ||
654 fmtl->channels.i.type == type ||
655 fmtl->channels.p.type == type;
656 }
657
658 bool
659 isl_format_has_unorm_channel(enum isl_format fmt)
660 {
661 return isl_format_has_channel_type(fmt, ISL_UNORM);
662 }
663
664 bool
665 isl_format_has_snorm_channel(enum isl_format fmt)
666 {
667 return isl_format_has_channel_type(fmt, ISL_SNORM);
668 }
669
670 bool
671 isl_format_has_ufloat_channel(enum isl_format fmt)
672 {
673 return isl_format_has_channel_type(fmt, ISL_UFLOAT);
674 }
675
676 bool
677 isl_format_has_sfloat_channel(enum isl_format fmt)
678 {
679 return isl_format_has_channel_type(fmt, ISL_SFLOAT);
680 }
681
682 bool
683 isl_format_has_uint_channel(enum isl_format fmt)
684 {
685 return isl_format_has_channel_type(fmt, ISL_UINT);
686 }
687
688 bool
689 isl_format_has_sint_channel(enum isl_format fmt)
690 {
691 return isl_format_has_channel_type(fmt, ISL_SINT);
692 }
693
694 bool
695 isl_format_has_color_component(enum isl_format fmt, int component)
696 {
697 const struct isl_format_layout *fmtl = isl_format_get_layout(fmt);
698 const uint8_t intensity = fmtl->channels.i.bits;
699 const uint8_t luminance = fmtl->channels.l.bits;
700
701 switch (component) {
702 case 0:
703 return (fmtl->channels.r.bits + intensity + luminance) > 0;
704 case 1:
705 return (fmtl->channels.g.bits + intensity + luminance) > 0;
706 case 2:
707 return (fmtl->channels.b.bits + intensity + luminance) > 0;
708 case 3:
709 return (fmtl->channels.a.bits + intensity) > 0;
710 default:
711 assert(!"Invalid color component: must be 0..3");
712 return false;
713 }
714 }
715
716 unsigned
717 isl_format_get_num_channels(enum isl_format fmt)
718 {
719 const struct isl_format_layout *fmtl = isl_format_get_layout(fmt);
720
721 assert(fmtl->channels.p.bits == 0);
722
723 return (fmtl->channels.r.bits > 0) +
724 (fmtl->channels.g.bits > 0) +
725 (fmtl->channels.b.bits > 0) +
726 (fmtl->channels.a.bits > 0) +
727 (fmtl->channels.l.bits > 0) +
728 (fmtl->channels.i.bits > 0);
729 }
730
731 uint32_t
732 isl_format_get_depth_format(enum isl_format fmt, bool has_stencil)
733 {
734 switch (fmt) {
735 default:
736 unreachable("bad isl depth format");
737 case ISL_FORMAT_R32_FLOAT_X8X24_TYPELESS:
738 assert(has_stencil);
739 return 0; /* D32_FLOAT_S8X24_UINT */
740 case ISL_FORMAT_R32_FLOAT:
741 assert(!has_stencil);
742 return 1; /* D32_FLOAT */
743 case ISL_FORMAT_R24_UNORM_X8_TYPELESS:
744 if (has_stencil) {
745 return 2; /* D24_UNORM_S8_UINT */
746 } else {
747 return 3; /* D24_UNORM_X8_UINT */
748 }
749 case ISL_FORMAT_R16_UNORM:
750 assert(!has_stencil);
751 return 5; /* D16_UNORM */
752 }
753 }
754
755 enum isl_format
756 isl_format_rgb_to_rgba(enum isl_format rgb)
757 {
758 assert(isl_format_is_rgb(rgb));
759
760 switch (rgb) {
761 case ISL_FORMAT_R32G32B32_FLOAT: return ISL_FORMAT_R32G32B32A32_FLOAT;
762 case ISL_FORMAT_R32G32B32_SINT: return ISL_FORMAT_R32G32B32A32_SINT;
763 case ISL_FORMAT_R32G32B32_UINT: return ISL_FORMAT_R32G32B32A32_UINT;
764 case ISL_FORMAT_R32G32B32_UNORM: return ISL_FORMAT_R32G32B32A32_UNORM;
765 case ISL_FORMAT_R32G32B32_SNORM: return ISL_FORMAT_R32G32B32A32_SNORM;
766 case ISL_FORMAT_R32G32B32_SSCALED: return ISL_FORMAT_R32G32B32A32_SSCALED;
767 case ISL_FORMAT_R32G32B32_USCALED: return ISL_FORMAT_R32G32B32A32_USCALED;
768 case ISL_FORMAT_R32G32B32_SFIXED: return ISL_FORMAT_R32G32B32A32_SFIXED;
769 case ISL_FORMAT_R8G8B8_UNORM: return ISL_FORMAT_R8G8B8A8_UNORM;
770 case ISL_FORMAT_R8G8B8_SNORM: return ISL_FORMAT_R8G8B8A8_SNORM;
771 case ISL_FORMAT_R8G8B8_SSCALED: return ISL_FORMAT_R8G8B8A8_SSCALED;
772 case ISL_FORMAT_R8G8B8_USCALED: return ISL_FORMAT_R8G8B8A8_USCALED;
773 case ISL_FORMAT_R16G16B16_FLOAT: return ISL_FORMAT_R16G16B16A16_FLOAT;
774 case ISL_FORMAT_R16G16B16_UNORM: return ISL_FORMAT_R16G16B16A16_UNORM;
775 case ISL_FORMAT_R16G16B16_SNORM: return ISL_FORMAT_R16G16B16A16_SNORM;
776 case ISL_FORMAT_R16G16B16_SSCALED: return ISL_FORMAT_R16G16B16A16_SSCALED;
777 case ISL_FORMAT_R16G16B16_USCALED: return ISL_FORMAT_R16G16B16A16_USCALED;
778 case ISL_FORMAT_R8G8B8_UNORM_SRGB: return ISL_FORMAT_R8G8B8A8_UNORM_SRGB;
779 case ISL_FORMAT_R16G16B16_UINT: return ISL_FORMAT_R16G16B16A16_UINT;
780 case ISL_FORMAT_R16G16B16_SINT: return ISL_FORMAT_R16G16B16A16_SINT;
781 case ISL_FORMAT_R8G8B8_UINT: return ISL_FORMAT_R8G8B8A8_UINT;
782 case ISL_FORMAT_R8G8B8_SINT: return ISL_FORMAT_R8G8B8A8_SINT;
783 default:
784 return ISL_FORMAT_UNSUPPORTED;
785 }
786 }
787
788 enum isl_format
789 isl_format_rgb_to_rgbx(enum isl_format rgb)
790 {
791 assert(isl_format_is_rgb(rgb));
792
793 switch (rgb) {
794 case ISL_FORMAT_R32G32B32_FLOAT:
795 return ISL_FORMAT_R32G32B32X32_FLOAT;
796 case ISL_FORMAT_R16G16B16_UNORM:
797 return ISL_FORMAT_R16G16B16X16_UNORM;
798 case ISL_FORMAT_R16G16B16_FLOAT:
799 return ISL_FORMAT_R16G16B16X16_FLOAT;
800 case ISL_FORMAT_R8G8B8_UNORM:
801 return ISL_FORMAT_R8G8B8X8_UNORM;
802 case ISL_FORMAT_R8G8B8_UNORM_SRGB:
803 return ISL_FORMAT_R8G8B8X8_UNORM_SRGB;
804 default:
805 return ISL_FORMAT_UNSUPPORTED;
806 }
807 }
808
809 enum isl_format
810 isl_format_rgbx_to_rgba(enum isl_format rgbx)
811 {
812 assert(isl_format_is_rgbx(rgbx));
813
814 switch (rgbx) {
815 case ISL_FORMAT_R32G32B32X32_FLOAT:
816 return ISL_FORMAT_R32G32B32A32_FLOAT;
817 case ISL_FORMAT_R16G16B16X16_UNORM:
818 return ISL_FORMAT_R16G16B16A16_UNORM;
819 case ISL_FORMAT_R16G16B16X16_FLOAT:
820 return ISL_FORMAT_R16G16B16A16_FLOAT;
821 case ISL_FORMAT_B8G8R8X8_UNORM:
822 return ISL_FORMAT_B8G8R8A8_UNORM;
823 case ISL_FORMAT_B8G8R8X8_UNORM_SRGB:
824 return ISL_FORMAT_B8G8R8A8_UNORM_SRGB;
825 case ISL_FORMAT_R8G8B8X8_UNORM:
826 return ISL_FORMAT_R8G8B8A8_UNORM;
827 case ISL_FORMAT_R8G8B8X8_UNORM_SRGB:
828 return ISL_FORMAT_R8G8B8A8_UNORM_SRGB;
829 case ISL_FORMAT_B10G10R10X2_UNORM:
830 return ISL_FORMAT_B10G10R10A2_UNORM;
831 case ISL_FORMAT_B5G5R5X1_UNORM:
832 return ISL_FORMAT_B5G5R5A1_UNORM;
833 case ISL_FORMAT_B5G5R5X1_UNORM_SRGB:
834 return ISL_FORMAT_B5G5R5A1_UNORM_SRGB;
835 default:
836 assert(!"Invalid RGBX format");
837 return rgbx;
838 }
839 }
840
841 static inline void
842 pack_channel(const union isl_color_value *value, unsigned i,
843 const struct isl_channel_layout *layout,
844 enum isl_colorspace colorspace,
845 uint32_t data_out[4])
846 {
847 if (layout->type == ISL_VOID)
848 return;
849
850 if (colorspace == ISL_COLORSPACE_SRGB)
851 assert(layout->type == ISL_UNORM);
852
853 uint32_t packed;
854 switch (layout->type) {
855 case ISL_UNORM:
856 if (colorspace == ISL_COLORSPACE_SRGB) {
857 if (layout->bits == 8) {
858 packed = util_format_linear_float_to_srgb_8unorm(value->f32[i]);
859 } else {
860 float srgb = util_format_linear_to_srgb_float(value->f32[i]);
861 packed = _mesa_float_to_unorm(srgb, layout->bits);
862 }
863 } else {
864 packed = _mesa_float_to_unorm(value->f32[i], layout->bits);
865 }
866 break;
867 case ISL_SNORM:
868 packed = _mesa_float_to_snorm(value->f32[i], layout->bits);
869 break;
870 case ISL_SFLOAT:
871 assert(layout->bits == 16 || layout->bits == 32);
872 if (layout->bits == 16) {
873 packed = _mesa_float_to_half(value->f32[i]);
874 } else {
875 packed = value->u32[i];
876 }
877 break;
878 case ISL_UINT:
879 packed = MIN(value->u32[i], MAX_UINT(layout->bits));
880 break;
881 case ISL_SINT:
882 packed = MIN(MAX(value->u32[i], MIN_INT(layout->bits)),
883 MAX_INT(layout->bits));
884 break;
885
886 default:
887 unreachable("Invalid channel type");
888 }
889
890 unsigned dword = layout->start_bit / 32;
891 unsigned bit = layout->start_bit % 32;
892 assert(bit + layout->bits <= 32);
893 data_out[dword] |= (packed & MAX_UINT(layout->bits)) << bit;
894 }
895
896 /**
897 * Take an isl_color_value and pack it into the actual bits as specified by
898 * the isl_format. This function is very slow for a format conversion
899 * function but should be fine for a single pixel worth of data.
900 */
901 void
902 isl_color_value_pack(const union isl_color_value *value,
903 enum isl_format format,
904 uint32_t *data_out)
905 {
906 const struct isl_format_layout *fmtl = isl_format_get_layout(format);
907 assert(fmtl->colorspace == ISL_COLORSPACE_LINEAR ||
908 fmtl->colorspace == ISL_COLORSPACE_SRGB);
909 assert(!isl_format_is_compressed(format));
910
911 memset(data_out, 0, isl_align(fmtl->bpb, 32) / 8);
912
913 if (format == ISL_FORMAT_R9G9B9E5_SHAREDEXP) {
914 data_out[0] = float3_to_rgb9e5(value->f32);
915 return;
916 } else if (format == ISL_FORMAT_R11G11B10_FLOAT) {
917 data_out[0] = float3_to_r11g11b10f(value->f32);
918 return;
919 }
920
921 pack_channel(value, 0, &fmtl->channels.r, fmtl->colorspace, data_out);
922 pack_channel(value, 1, &fmtl->channels.g, fmtl->colorspace, data_out);
923 pack_channel(value, 2, &fmtl->channels.b, fmtl->colorspace, data_out);
924 pack_channel(value, 3, &fmtl->channels.a, ISL_COLORSPACE_LINEAR, data_out);
925 pack_channel(value, 0, &fmtl->channels.l, fmtl->colorspace, data_out);
926 pack_channel(value, 0, &fmtl->channels.i, ISL_COLORSPACE_LINEAR, data_out);
927 assert(fmtl->channels.p.bits == 0);
928 }
929
/**
 * Extend an N-bit signed integer to 32 bits.
 *
 * Only the low `bits` bits of x are significant; anything above them is
 * discarded and replaced by copies of bit (bits - 1).  A width of 32 or more
 * returns x unchanged and a width of 0 yields 0.
 */
static inline int32_t
sign_extend(int32_t x, unsigned bits)
{
   if (bits >= 32)
      return x;

   /* A zero-width field carries no value; handling it here also keeps the
    * shift count below the width of the type.
    */
   if (bits == 0)
      return 0;

   const unsigned shift = 32 - bits;

   /* Shift left as unsigned: left-shifting a signed value that is negative
    * or whose result overflows is undefined behaviour.  The right shift is
    * done on the signed type so that the sign bit is replicated.
    */
   return (int32_t)((uint32_t)x << shift) >> shift;
}
941
942 static inline void
943 unpack_channel(union isl_color_value *value,
944 unsigned start, unsigned count,
945 const struct isl_channel_layout *layout,
946 enum isl_colorspace colorspace,
947 const uint32_t *data_in)
948 {
949 if (layout->type == ISL_VOID)
950 return;
951
952 unsigned dword = layout->start_bit / 32;
953 unsigned bit = layout->start_bit % 32;
954 assert(bit + layout->bits <= 32);
955 uint32_t packed = (data_in[dword] >> bit) & MAX_UINT(layout->bits);
956
957 union {
958 uint32_t u32;
959 float f32;
960 } unpacked;
961
962 if (colorspace == ISL_COLORSPACE_SRGB)
963 assert(layout->type == ISL_UNORM);
964
965 switch (layout->type) {
966 case ISL_UNORM:
967 unpacked.f32 = _mesa_unorm_to_float(packed, layout->bits);
968 if (colorspace == ISL_COLORSPACE_SRGB) {
969 if (layout->bits == 8) {
970 unpacked.f32 = util_format_srgb_8unorm_to_linear_float(packed);
971 } else {
972 float srgb = _mesa_unorm_to_float(packed, layout->bits);
973 unpacked.f32 = util_format_srgb_to_linear_float(srgb);
974 }
975 } else {
976 unpacked.f32 = _mesa_unorm_to_float(packed, layout->bits);
977 }
978 break;
979 case ISL_SNORM:
980 unpacked.f32 = _mesa_snorm_to_float(sign_extend(packed, layout->bits),
981 layout->bits);
982 break;
983 case ISL_SFLOAT:
984 assert(layout->bits == 16 || layout->bits == 32);
985 if (layout->bits == 16) {
986 unpacked.f32 = _mesa_half_to_float(packed);
987 } else {
988 unpacked.u32 = packed;
989 }
990 break;
991 case ISL_UINT:
992 unpacked.u32 = packed;
993 break;
994 case ISL_SINT:
995 unpacked.u32 = sign_extend(packed, layout->bits);
996 break;
997
998 default:
999 unreachable("Invalid channel type");
1000 }
1001
1002 for (unsigned i = 0; i < count; i++)
1003 value->u32[start + i] = unpacked.u32;
1004 }
1005
1006 /**
1007 * Take unpack an isl_color_value from the actual bits as specified by
1008 * the isl_format. This function is very slow for a format conversion
1009 * function but should be fine for a single pixel worth of data.
1010 */
1011 void
1012 isl_color_value_unpack(union isl_color_value *value,
1013 enum isl_format format,
1014 const uint32_t data_in[4])
1015 {
1016 const struct isl_format_layout *fmtl = isl_format_get_layout(format);
1017 assert(fmtl->colorspace == ISL_COLORSPACE_LINEAR ||
1018 fmtl->colorspace == ISL_COLORSPACE_SRGB);
1019 assert(!isl_format_is_compressed(format));
1020
1021 /* Default to opaque black. */
1022 memset(value, 0, sizeof(*value));
1023 if (isl_format_has_int_channel(format)) {
1024 value->u32[3] = 1u;
1025 } else {
1026 value->f32[3] = 1.0f;
1027 }
1028
1029 if (format == ISL_FORMAT_R9G9B9E5_SHAREDEXP) {
1030 rgb9e5_to_float3(data_in[0], value->f32);
1031 return;
1032 } else if (format == ISL_FORMAT_R11G11B10_FLOAT) {
1033 r11g11b10f_to_float3(data_in[0], value->f32);
1034 return;
1035 }
1036
1037 unpack_channel(value, 0, 1, &fmtl->channels.r, fmtl->colorspace, data_in);
1038 unpack_channel(value, 1, 1, &fmtl->channels.g, fmtl->colorspace, data_in);
1039 unpack_channel(value, 2, 1, &fmtl->channels.b, fmtl->colorspace, data_in);
1040 unpack_channel(value, 3, 1, &fmtl->channels.a, ISL_COLORSPACE_LINEAR, data_in);
1041 unpack_channel(value, 0, 3, &fmtl->channels.l, fmtl->colorspace, data_in);
1042 unpack_channel(value, 0, 4, &fmtl->channels.i, ISL_COLORSPACE_LINEAR, data_in);
1043 assert(fmtl->channels.p.bits == 0);
1044 }