Merge remote-tracking branch 'mesa-public/master' into vulkan
[mesa.git] / src / mesa / drivers / dri / i965 / brw_defines.h
1 /*
2 Copyright (C) Intel Corp. 2006. All Rights Reserved.
3 Intel funded Tungsten Graphics to
4 develop this 3D driver.
5
6 Permission is hereby granted, free of charge, to any person obtaining
7 a copy of this software and associated documentation files (the
8 "Software"), to deal in the Software without restriction, including
9 without limitation the rights to use, copy, modify, merge, publish,
10 distribute, sublicense, and/or sell copies of the Software, and to
11 permit persons to whom the Software is furnished to do so, subject to
12 the following conditions:
13
14 The above copyright notice and this permission notice (including the
15 next paragraph) shall be included in all copies or substantial
16 portions of the Software.
17
18 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
19 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
21 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
22 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
23 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
24 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25
26 **********************************************************************/
27 /*
28 * Authors:
29 * Keith Whitwell <keithw@vmware.com>
30 */
31
/* Build a 32-bit mask with bits low..high (inclusive) set.
 *
 * Requires 0 <= low <= high <= 31.  The computation is done entirely on an
 * unsigned constant: shifting a signed 1 so that the result reaches bit 31
 * (e.g. INTEL_MASK(31, 29)), or shifting by the full width for
 * INTEL_MASK(31, 0), is undefined behavior in C.  The result has unsigned
 * type.
 */
#define INTEL_MASK(high, low) \
   ((0xFFFFFFFFu >> (31 - ((high) - (low)))) << (low))
/* Position `value` inside the bitfield named `field` and yield the result
 * as a uint32_t.
 *
 * `field` is a name prefix: the macro pastes it onto _SHIFT and _MASK, so
 * both field_SHIFT and field_MASK must be defined.  An assert fires if the
 * shifted value has any bit set outside field_MASK.
 *
 * `value` is converted to uint32_t *before* shifting so that a plain int
 * argument is never shifted into the sign bit (undefined behavior).  The
 * temporary has a deliberately unusual name so that an argument expression
 * mentioning a caller variable called `fieldval` is not captured by it.
 *
 * Uses the GNU statement expression extension.
 */
#define SET_FIELD(value, field)                                            \
   ({                                                                      \
      uint32_t set_field_tmp_ = (uint32_t)(value) << field ## _SHIFT;      \
      assert((set_field_tmp_ & ~ field ## _MASK) == 0);                    \
      set_field_tmp_ & field ## _MASK;                                     \
   })
40
/* Extract bits low..high (inclusive) of `data`, shifted down so that bit
 * `low` lands in bit 0.  `data` is parenthesized so that an argument such
 * as `a | b` is masked as a whole rather than only its right operand.
 */
#define GET_BITS(data, high, low) \
   (((data) & INTEL_MASK((high), (low))) >> (low))
/* Read the bitfield named `field` out of `word`: mask with field_MASK, then
 * shift right by field_SHIFT.  Both names are formed by token pasting.
 */
#define GET_FIELD(word, field) \
   (((word) & field##_MASK) >> field##_SHIFT)
43
44 #ifndef BRW_DEFINES_H
45 #define BRW_DEFINES_H
46
47 /* 3D state:
48 */
49 #define CMD_3D_PRIM 0x7b00 /* 3DPRIMITIVE */
50 /* DW0 */
51 # define GEN4_3DPRIM_TOPOLOGY_TYPE_SHIFT 10
52 # define GEN4_3DPRIM_VERTEXBUFFER_ACCESS_SEQUENTIAL (0 << 15)
53 # define GEN4_3DPRIM_VERTEXBUFFER_ACCESS_RANDOM (1 << 15)
54 # define GEN7_3DPRIM_INDIRECT_PARAMETER_ENABLE (1 << 10)
55 # define GEN7_3DPRIM_PREDICATE_ENABLE (1 << 8)
56 /* DW1 */
57 # define GEN7_3DPRIM_VERTEXBUFFER_ACCESS_SEQUENTIAL (0 << 8)
58 # define GEN7_3DPRIM_VERTEXBUFFER_ACCESS_RANDOM (1 << 8)
59
60 #ifndef _3DPRIM_POINTLIST /* FIXME: Avoid clashing with defines from bdw_pack.h */
61 #define _3DPRIM_POINTLIST 0x01
62 #define _3DPRIM_LINELIST 0x02
63 #define _3DPRIM_LINESTRIP 0x03
64 #define _3DPRIM_TRILIST 0x04
65 #define _3DPRIM_TRISTRIP 0x05
66 #define _3DPRIM_TRIFAN 0x06
67 #define _3DPRIM_QUADLIST 0x07
68 #define _3DPRIM_QUADSTRIP 0x08
69 #define _3DPRIM_LINELIST_ADJ 0x09 /* G45+ */
70 #define _3DPRIM_LINESTRIP_ADJ 0x0A /* G45+ */
71 #define _3DPRIM_TRILIST_ADJ 0x0B /* G45+ */
72 #define _3DPRIM_TRISTRIP_ADJ 0x0C /* G45+ */
73 #define _3DPRIM_TRISTRIP_REVERSE 0x0D
74 #define _3DPRIM_POLYGON 0x0E
75 #define _3DPRIM_RECTLIST 0x0F
76 #define _3DPRIM_LINELOOP 0x10
77 #define _3DPRIM_POINTLIST_BF 0x11
78 #define _3DPRIM_LINESTRIP_CONT 0x12
79 #define _3DPRIM_LINESTRIP_BF 0x13
80 #define _3DPRIM_LINESTRIP_CONT_BF 0x14
81 #define _3DPRIM_TRIFAN_NOSTIPPLE 0x16
/* Value for patch list number n: 0x20 for n == 1 up to 0x3F for n == 32.
 * n outside 1..32 trips the assert.  The argument is parenthesized so that
 * expressions such as `1 << k` are handled correctly; note that it is still
 * evaluated more than once, so it must be free of side effects.
 * Uses the GNU statement expression extension.
 */
#define _3DPRIM_PATCHLIST(n) \
   ({ assert((n) > 0 && (n) <= 32); 0x20 + ((n) - 1); })
83
84 #endif /* bdw_pack.h */
85
/* We use this offset to be able to pass native primitive types in struct
 * _mesa_prim::mode. Native primitive types are BRW_PRIM_OFFSET +
 * native_type, which should be different from all GL types and still fit in
 * the 8 bits available. */
90
91 #define BRW_PRIM_OFFSET 0x80
92
93 #define BRW_ANISORATIO_2 0
94 #define BRW_ANISORATIO_4 1
95 #define BRW_ANISORATIO_6 2
96 #define BRW_ANISORATIO_8 3
97 #define BRW_ANISORATIO_10 4
98 #define BRW_ANISORATIO_12 5
99 #define BRW_ANISORATIO_14 6
100 #define BRW_ANISORATIO_16 7
101
102 #define BRW_BLENDFACTOR_ONE 0x1
103 #define BRW_BLENDFACTOR_SRC_COLOR 0x2
104 #define BRW_BLENDFACTOR_SRC_ALPHA 0x3
105 #define BRW_BLENDFACTOR_DST_ALPHA 0x4
106 #define BRW_BLENDFACTOR_DST_COLOR 0x5
107 #define BRW_BLENDFACTOR_SRC_ALPHA_SATURATE 0x6
108 #define BRW_BLENDFACTOR_CONST_COLOR 0x7
109 #define BRW_BLENDFACTOR_CONST_ALPHA 0x8
110 #define BRW_BLENDFACTOR_SRC1_COLOR 0x9
111 #define BRW_BLENDFACTOR_SRC1_ALPHA 0x0A
112 #define BRW_BLENDFACTOR_ZERO 0x11
113 #define BRW_BLENDFACTOR_INV_SRC_COLOR 0x12
114 #define BRW_BLENDFACTOR_INV_SRC_ALPHA 0x13
115 #define BRW_BLENDFACTOR_INV_DST_ALPHA 0x14
116 #define BRW_BLENDFACTOR_INV_DST_COLOR 0x15
117 #define BRW_BLENDFACTOR_INV_CONST_COLOR 0x17
118 #define BRW_BLENDFACTOR_INV_CONST_ALPHA 0x18
119 #define BRW_BLENDFACTOR_INV_SRC1_COLOR 0x19
120 #define BRW_BLENDFACTOR_INV_SRC1_ALPHA 0x1A
121
122 #define BRW_BLENDFUNCTION_ADD 0
123 #define BRW_BLENDFUNCTION_SUBTRACT 1
124 #define BRW_BLENDFUNCTION_REVERSE_SUBTRACT 2
125 #define BRW_BLENDFUNCTION_MIN 3
126 #define BRW_BLENDFUNCTION_MAX 4
127
128 #define BRW_ALPHATEST_FORMAT_UNORM8 0
129 #define BRW_ALPHATEST_FORMAT_FLOAT32 1
130
131 #define BRW_CHROMAKEY_KILL_ON_ANY_MATCH 0
132 #define BRW_CHROMAKEY_REPLACE_BLACK 1
133
134 #define BRW_CLIP_API_OGL 0
135 #define BRW_CLIP_API_DX 1
136
137 #define BRW_CLIPMODE_NORMAL 0
138 #define BRW_CLIPMODE_CLIP_ALL 1
139 #define BRW_CLIPMODE_CLIP_NON_REJECTED 2
140 #define BRW_CLIPMODE_REJECT_ALL 3
141 #define BRW_CLIPMODE_ACCEPT_ALL 4
142 #define BRW_CLIPMODE_KERNEL_CLIP 5
143
144 #define BRW_CLIP_NDCSPACE 0
145 #define BRW_CLIP_SCREENSPACE 1
146
147 #define BRW_COMPAREFUNCTION_ALWAYS 0
148 #define BRW_COMPAREFUNCTION_NEVER 1
149 #define BRW_COMPAREFUNCTION_LESS 2
150 #define BRW_COMPAREFUNCTION_EQUAL 3
151 #define BRW_COMPAREFUNCTION_LEQUAL 4
152 #define BRW_COMPAREFUNCTION_GREATER 5
153 #define BRW_COMPAREFUNCTION_NOTEQUAL 6
154 #define BRW_COMPAREFUNCTION_GEQUAL 7
155
156 #define BRW_COVERAGE_PIXELS_HALF 0
157 #define BRW_COVERAGE_PIXELS_1 1
158 #define BRW_COVERAGE_PIXELS_2 2
159 #define BRW_COVERAGE_PIXELS_4 3
160
161 #define BRW_CULLMODE_BOTH 0
162 #define BRW_CULLMODE_NONE 1
163 #define BRW_CULLMODE_FRONT 2
164 #define BRW_CULLMODE_BACK 3
165
166 #define BRW_DEFAULTCOLOR_R8G8B8A8_UNORM 0
167 #define BRW_DEFAULTCOLOR_R32G32B32A32_FLOAT 1
168
169 #define BRW_DEPTHFORMAT_D32_FLOAT_S8X24_UINT 0
170 #define BRW_DEPTHFORMAT_D32_FLOAT 1
171 #define BRW_DEPTHFORMAT_D24_UNORM_S8_UINT 2
172 #define BRW_DEPTHFORMAT_D24_UNORM_X8_UINT 3 /* GEN5 */
173 #define BRW_DEPTHFORMAT_D16_UNORM 5
174
175 #define BRW_FLOATING_POINT_IEEE_754 0
176 #define BRW_FLOATING_POINT_NON_IEEE_754 1
177
178 #define BRW_FRONTWINDING_CW 0
179 #define BRW_FRONTWINDING_CCW 1
180
181 #define BRW_SPRITE_POINT_ENABLE 16
182
183 #define BRW_CUT_INDEX_ENABLE (1 << 10)
184
185 #define BRW_INDEX_BYTE 0
186 #define BRW_INDEX_WORD 1
187 #define BRW_INDEX_DWORD 2
188
189 #define BRW_LOGICOPFUNCTION_CLEAR 0
190 #define BRW_LOGICOPFUNCTION_NOR 1
191 #define BRW_LOGICOPFUNCTION_AND_INVERTED 2
192 #define BRW_LOGICOPFUNCTION_COPY_INVERTED 3
193 #define BRW_LOGICOPFUNCTION_AND_REVERSE 4
194 #define BRW_LOGICOPFUNCTION_INVERT 5
195 #define BRW_LOGICOPFUNCTION_XOR 6
196 #define BRW_LOGICOPFUNCTION_NAND 7
197 #define BRW_LOGICOPFUNCTION_AND 8
198 #define BRW_LOGICOPFUNCTION_EQUIV 9
199 #define BRW_LOGICOPFUNCTION_NOOP 10
200 #define BRW_LOGICOPFUNCTION_OR_INVERTED 11
201 #define BRW_LOGICOPFUNCTION_COPY 12
202 #define BRW_LOGICOPFUNCTION_OR_REVERSE 13
203 #define BRW_LOGICOPFUNCTION_OR 14
204 #define BRW_LOGICOPFUNCTION_SET 15
205
206 #define BRW_MAPFILTER_NEAREST 0x0
207 #define BRW_MAPFILTER_LINEAR 0x1
208 #define BRW_MAPFILTER_ANISOTROPIC 0x2
209
210 #define BRW_MIPFILTER_NONE 0
211 #define BRW_MIPFILTER_NEAREST 1
212 #define BRW_MIPFILTER_LINEAR 3
213
214 #define BRW_ADDRESS_ROUNDING_ENABLE_U_MAG 0x20
215 #define BRW_ADDRESS_ROUNDING_ENABLE_U_MIN 0x10
216 #define BRW_ADDRESS_ROUNDING_ENABLE_V_MAG 0x08
217 #define BRW_ADDRESS_ROUNDING_ENABLE_V_MIN 0x04
218 #define BRW_ADDRESS_ROUNDING_ENABLE_R_MAG 0x02
219 #define BRW_ADDRESS_ROUNDING_ENABLE_R_MIN 0x01
220
221 #define BRW_POLYGON_FRONT_FACING 0
222 #define BRW_POLYGON_BACK_FACING 1
223
224 #define BRW_PREFILTER_ALWAYS 0x0
225 #define BRW_PREFILTER_NEVER 0x1
226 #define BRW_PREFILTER_LESS 0x2
227 #define BRW_PREFILTER_EQUAL 0x3
228 #define BRW_PREFILTER_LEQUAL 0x4
229 #define BRW_PREFILTER_GREATER 0x5
230 #define BRW_PREFILTER_NOTEQUAL 0x6
231 #define BRW_PREFILTER_GEQUAL 0x7
232
233 #define BRW_PROVOKING_VERTEX_0 0
234 #define BRW_PROVOKING_VERTEX_1 1
235 #define BRW_PROVOKING_VERTEX_2 2
236
237 #define BRW_RASTRULE_UPPER_LEFT 0
238 #define BRW_RASTRULE_UPPER_RIGHT 1
/* These are listed as "Reserved, but not seen as useful"
 * in Intel documentation (page 212, "Point Rasterization Rule",
 * section 7.4 "SF Pipeline State Summary", of document
 * "Intel® 965 Express Chipset Family and Intel® G35 Express
 * Chipset Graphics Controller Programmer's Reference Manual,
 * Volume 2: 3D/Media", Revision 1.0b as of January 2008,
 * available at
 * http://intellinuxgraphics.org/documentation.html
 * at the time of this writing).
 *
 * These appear to be supported on at least some
 * i965-family devices, and the BRW_RASTRULE_LOWER_RIGHT
 * is useful when using OpenGL to render to a FBO
 * (which has the pixel coordinate Y orientation inverted
 * with respect to the normal OpenGL pixel coordinate system).
 */
255 #define BRW_RASTRULE_LOWER_LEFT 2
256 #define BRW_RASTRULE_LOWER_RIGHT 3
257
258 #define BRW_RENDERTARGET_CLAMPRANGE_UNORM 0
259 #define BRW_RENDERTARGET_CLAMPRANGE_SNORM 1
260 #define BRW_RENDERTARGET_CLAMPRANGE_FORMAT 2
261
262 #define BRW_STENCILOP_KEEP 0
263 #define BRW_STENCILOP_ZERO 1
264 #define BRW_STENCILOP_REPLACE 2
265 #define BRW_STENCILOP_INCRSAT 3
266 #define BRW_STENCILOP_DECRSAT 4
267 #define BRW_STENCILOP_INCR 5
268 #define BRW_STENCILOP_DECR 6
269 #define BRW_STENCILOP_INVERT 7
270
271 /* Surface state DW0 */
272 #define GEN8_SURFACE_IS_ARRAY (1 << 28)
273 #define GEN8_SURFACE_VALIGN_4 (1 << 16)
274 #define GEN8_SURFACE_VALIGN_8 (2 << 16)
275 #define GEN8_SURFACE_VALIGN_16 (3 << 16)
276 #define GEN8_SURFACE_HALIGN_4 (1 << 14)
277 #define GEN8_SURFACE_HALIGN_8 (2 << 14)
278 #define GEN8_SURFACE_HALIGN_16 (3 << 14)
279 #define GEN8_SURFACE_TILING_NONE (0 << 12)
280 #define GEN8_SURFACE_TILING_W (1 << 12)
281 #define GEN8_SURFACE_TILING_X (2 << 12)
282 #define GEN8_SURFACE_TILING_Y (3 << 12)
283 #define GEN8_SURFACE_SAMPLER_L2_BYPASS_DISABLE (1 << 9)
284 #define BRW_SURFACE_RC_READ_WRITE (1 << 8)
285 #define BRW_SURFACE_MIPLAYOUT_SHIFT 10
286 #define BRW_SURFACE_MIPMAPLAYOUT_BELOW 0
287 #define BRW_SURFACE_MIPMAPLAYOUT_RIGHT 1
288 #define BRW_SURFACE_CUBEFACE_ENABLES 0x3f
289 #define BRW_SURFACE_BLEND_ENABLED (1 << 13)
290 #define BRW_SURFACE_WRITEDISABLE_B_SHIFT 14
291 #define BRW_SURFACE_WRITEDISABLE_G_SHIFT 15
292 #define BRW_SURFACE_WRITEDISABLE_R_SHIFT 16
293 #define BRW_SURFACE_WRITEDISABLE_A_SHIFT 17
294
295 #define BRW_SURFACEFORMAT_R32G32B32A32_FLOAT 0x000
296 #define BRW_SURFACEFORMAT_R32G32B32A32_SINT 0x001
297 #define BRW_SURFACEFORMAT_R32G32B32A32_UINT 0x002
298 #define BRW_SURFACEFORMAT_R32G32B32A32_UNORM 0x003
299 #define BRW_SURFACEFORMAT_R32G32B32A32_SNORM 0x004
300 #define BRW_SURFACEFORMAT_R64G64_FLOAT 0x005
301 #define BRW_SURFACEFORMAT_R32G32B32X32_FLOAT 0x006
302 #define BRW_SURFACEFORMAT_R32G32B32A32_SSCALED 0x007
303 #define BRW_SURFACEFORMAT_R32G32B32A32_USCALED 0x008
304 #define BRW_SURFACEFORMAT_R32G32B32A32_SFIXED 0x020
305 #define BRW_SURFACEFORMAT_R64G64_PASSTHRU 0x021
306 #define BRW_SURFACEFORMAT_R32G32B32_FLOAT 0x040
307 #define BRW_SURFACEFORMAT_R32G32B32_SINT 0x041
308 #define BRW_SURFACEFORMAT_R32G32B32_UINT 0x042
309 #define BRW_SURFACEFORMAT_R32G32B32_UNORM 0x043
310 #define BRW_SURFACEFORMAT_R32G32B32_SNORM 0x044
311 #define BRW_SURFACEFORMAT_R32G32B32_SSCALED 0x045
312 #define BRW_SURFACEFORMAT_R32G32B32_USCALED 0x046
313 #define BRW_SURFACEFORMAT_R32G32B32_SFIXED 0x050
314 #define BRW_SURFACEFORMAT_R16G16B16A16_UNORM 0x080
315 #define BRW_SURFACEFORMAT_R16G16B16A16_SNORM 0x081
316 #define BRW_SURFACEFORMAT_R16G16B16A16_SINT 0x082
317 #define BRW_SURFACEFORMAT_R16G16B16A16_UINT 0x083
318 #define BRW_SURFACEFORMAT_R16G16B16A16_FLOAT 0x084
319 #define BRW_SURFACEFORMAT_R32G32_FLOAT 0x085
320 #define BRW_SURFACEFORMAT_R32G32_SINT 0x086
321 #define BRW_SURFACEFORMAT_R32G32_UINT 0x087
322 #define BRW_SURFACEFORMAT_R32_FLOAT_X8X24_TYPELESS 0x088
323 #define BRW_SURFACEFORMAT_X32_TYPELESS_G8X24_UINT 0x089
324 #define BRW_SURFACEFORMAT_L32A32_FLOAT 0x08A
325 #define BRW_SURFACEFORMAT_R32G32_UNORM 0x08B
326 #define BRW_SURFACEFORMAT_R32G32_SNORM 0x08C
327 #define BRW_SURFACEFORMAT_R64_FLOAT 0x08D
328 #define BRW_SURFACEFORMAT_R16G16B16X16_UNORM 0x08E
329 #define BRW_SURFACEFORMAT_R16G16B16X16_FLOAT 0x08F
330 #define BRW_SURFACEFORMAT_A32X32_FLOAT 0x090
331 #define BRW_SURFACEFORMAT_L32X32_FLOAT 0x091
332 #define BRW_SURFACEFORMAT_I32X32_FLOAT 0x092
333 #define BRW_SURFACEFORMAT_R16G16B16A16_SSCALED 0x093
334 #define BRW_SURFACEFORMAT_R16G16B16A16_USCALED 0x094
335 #define BRW_SURFACEFORMAT_R32G32_SSCALED 0x095
336 #define BRW_SURFACEFORMAT_R32G32_USCALED 0x096
337 #define BRW_SURFACEFORMAT_R32G32_FLOAT_LD 0x097
338 #define BRW_SURFACEFORMAT_R32G32_SFIXED 0x0A0
339 #define BRW_SURFACEFORMAT_R64_PASSTHRU 0x0A1
340 #define BRW_SURFACEFORMAT_B8G8R8A8_UNORM 0x0C0
341 #define BRW_SURFACEFORMAT_B8G8R8A8_UNORM_SRGB 0x0C1
342 #define BRW_SURFACEFORMAT_R10G10B10A2_UNORM 0x0C2
343 #define BRW_SURFACEFORMAT_R10G10B10A2_UNORM_SRGB 0x0C3
344 #define BRW_SURFACEFORMAT_R10G10B10A2_UINT 0x0C4
345 #define BRW_SURFACEFORMAT_R10G10B10_SNORM_A2_UNORM 0x0C5
346 #define BRW_SURFACEFORMAT_R8G8B8A8_UNORM 0x0C7
347 #define BRW_SURFACEFORMAT_R8G8B8A8_UNORM_SRGB 0x0C8
348 #define BRW_SURFACEFORMAT_R8G8B8A8_SNORM 0x0C9
349 #define BRW_SURFACEFORMAT_R8G8B8A8_SINT 0x0CA
350 #define BRW_SURFACEFORMAT_R8G8B8A8_UINT 0x0CB
351 #define BRW_SURFACEFORMAT_R16G16_UNORM 0x0CC
352 #define BRW_SURFACEFORMAT_R16G16_SNORM 0x0CD
353 #define BRW_SURFACEFORMAT_R16G16_SINT 0x0CE
354 #define BRW_SURFACEFORMAT_R16G16_UINT 0x0CF
355 #define BRW_SURFACEFORMAT_R16G16_FLOAT 0x0D0
356 #define BRW_SURFACEFORMAT_B10G10R10A2_UNORM 0x0D1
357 #define BRW_SURFACEFORMAT_B10G10R10A2_UNORM_SRGB 0x0D2
358 #define BRW_SURFACEFORMAT_R11G11B10_FLOAT 0x0D3
359 #define BRW_SURFACEFORMAT_R32_SINT 0x0D6
360 #define BRW_SURFACEFORMAT_R32_UINT 0x0D7
361 #define BRW_SURFACEFORMAT_R32_FLOAT 0x0D8
362 #define BRW_SURFACEFORMAT_R24_UNORM_X8_TYPELESS 0x0D9
363 #define BRW_SURFACEFORMAT_X24_TYPELESS_G8_UINT 0x0DA
364 #define BRW_SURFACEFORMAT_L16A16_UNORM 0x0DF
365 #define BRW_SURFACEFORMAT_I24X8_UNORM 0x0E0
366 #define BRW_SURFACEFORMAT_L24X8_UNORM 0x0E1
367 #define BRW_SURFACEFORMAT_A24X8_UNORM 0x0E2
368 #define BRW_SURFACEFORMAT_I32_FLOAT 0x0E3
369 #define BRW_SURFACEFORMAT_L32_FLOAT 0x0E4
370 #define BRW_SURFACEFORMAT_A32_FLOAT 0x0E5
371 #define BRW_SURFACEFORMAT_B8G8R8X8_UNORM 0x0E9
372 #define BRW_SURFACEFORMAT_B8G8R8X8_UNORM_SRGB 0x0EA
373 #define BRW_SURFACEFORMAT_R8G8B8X8_UNORM 0x0EB
374 #define BRW_SURFACEFORMAT_R8G8B8X8_UNORM_SRGB 0x0EC
375 #define BRW_SURFACEFORMAT_R9G9B9E5_SHAREDEXP 0x0ED
376 #define BRW_SURFACEFORMAT_B10G10R10X2_UNORM 0x0EE
377 #define BRW_SURFACEFORMAT_L16A16_FLOAT 0x0F0
378 #define BRW_SURFACEFORMAT_R32_UNORM 0x0F1
379 #define BRW_SURFACEFORMAT_R32_SNORM 0x0F2
380 #define BRW_SURFACEFORMAT_R10G10B10X2_USCALED 0x0F3
381 #define BRW_SURFACEFORMAT_R8G8B8A8_SSCALED 0x0F4
382 #define BRW_SURFACEFORMAT_R8G8B8A8_USCALED 0x0F5
383 #define BRW_SURFACEFORMAT_R16G16_SSCALED 0x0F6
384 #define BRW_SURFACEFORMAT_R16G16_USCALED 0x0F7
385 #define BRW_SURFACEFORMAT_R32_SSCALED 0x0F8
386 #define BRW_SURFACEFORMAT_R32_USCALED 0x0F9
387 #define BRW_SURFACEFORMAT_B5G6R5_UNORM 0x100
388 #define BRW_SURFACEFORMAT_B5G6R5_UNORM_SRGB 0x101
389 #define BRW_SURFACEFORMAT_B5G5R5A1_UNORM 0x102
390 #define BRW_SURFACEFORMAT_B5G5R5A1_UNORM_SRGB 0x103
391 #define BRW_SURFACEFORMAT_B4G4R4A4_UNORM 0x104
392 #define BRW_SURFACEFORMAT_B4G4R4A4_UNORM_SRGB 0x105
393 #define BRW_SURFACEFORMAT_R8G8_UNORM 0x106
394 #define BRW_SURFACEFORMAT_R8G8_SNORM 0x107
395 #define BRW_SURFACEFORMAT_R8G8_SINT 0x108
396 #define BRW_SURFACEFORMAT_R8G8_UINT 0x109
397 #define BRW_SURFACEFORMAT_R16_UNORM 0x10A
398 #define BRW_SURFACEFORMAT_R16_SNORM 0x10B
399 #define BRW_SURFACEFORMAT_R16_SINT 0x10C
400 #define BRW_SURFACEFORMAT_R16_UINT 0x10D
401 #define BRW_SURFACEFORMAT_R16_FLOAT 0x10E
402 #define BRW_SURFACEFORMAT_A8P8_UNORM_PALETTE0 0x10F
403 #define BRW_SURFACEFORMAT_A8P8_UNORM_PALETTE1 0x110
404 #define BRW_SURFACEFORMAT_I16_UNORM 0x111
405 #define BRW_SURFACEFORMAT_L16_UNORM 0x112
406 #define BRW_SURFACEFORMAT_A16_UNORM 0x113
407 #define BRW_SURFACEFORMAT_L8A8_UNORM 0x114
408 #define BRW_SURFACEFORMAT_I16_FLOAT 0x115
409 #define BRW_SURFACEFORMAT_L16_FLOAT 0x116
410 #define BRW_SURFACEFORMAT_A16_FLOAT 0x117
411 #define BRW_SURFACEFORMAT_L8A8_UNORM_SRGB 0x118
412 #define BRW_SURFACEFORMAT_R5G5_SNORM_B6_UNORM 0x119
413 #define BRW_SURFACEFORMAT_B5G5R5X1_UNORM 0x11A
414 #define BRW_SURFACEFORMAT_B5G5R5X1_UNORM_SRGB 0x11B
415 #define BRW_SURFACEFORMAT_R8G8_SSCALED 0x11C
416 #define BRW_SURFACEFORMAT_R8G8_USCALED 0x11D
417 #define BRW_SURFACEFORMAT_R16_SSCALED 0x11E
418 #define BRW_SURFACEFORMAT_R16_USCALED 0x11F
419 #define BRW_SURFACEFORMAT_P8A8_UNORM_PALETTE0 0x122
420 #define BRW_SURFACEFORMAT_P8A8_UNORM_PALETTE1 0x123
421 #define BRW_SURFACEFORMAT_A1B5G5R5_UNORM 0x124
422 #define BRW_SURFACEFORMAT_A4B4G4R4_UNORM 0x125
423 #define BRW_SURFACEFORMAT_L8A8_UINT 0x126
424 #define BRW_SURFACEFORMAT_L8A8_SINT 0x127
425 #define BRW_SURFACEFORMAT_R8_UNORM 0x140
426 #define BRW_SURFACEFORMAT_R8_SNORM 0x141
427 #define BRW_SURFACEFORMAT_R8_SINT 0x142
428 #define BRW_SURFACEFORMAT_R8_UINT 0x143
429 #define BRW_SURFACEFORMAT_A8_UNORM 0x144
430 #define BRW_SURFACEFORMAT_I8_UNORM 0x145
431 #define BRW_SURFACEFORMAT_L8_UNORM 0x146
432 #define BRW_SURFACEFORMAT_P4A4_UNORM 0x147
433 #define BRW_SURFACEFORMAT_A4P4_UNORM 0x148
434 #define BRW_SURFACEFORMAT_R8_SSCALED 0x149
435 #define BRW_SURFACEFORMAT_R8_USCALED 0x14A
436 #define BRW_SURFACEFORMAT_P8_UNORM_PALETTE0 0x14B
437 #define BRW_SURFACEFORMAT_L8_UNORM_SRGB 0x14C
438 #define BRW_SURFACEFORMAT_P8_UNORM_PALETTE1 0x14D
439 #define BRW_SURFACEFORMAT_P4A4_UNORM_PALETTE1 0x14E
440 #define BRW_SURFACEFORMAT_A4P4_UNORM_PALETTE1 0x14F
441 #define BRW_SURFACEFORMAT_Y8_SNORM 0x150
442 #define BRW_SURFACEFORMAT_L8_UINT 0x152
443 #define BRW_SURFACEFORMAT_L8_SINT 0x153
444 #define BRW_SURFACEFORMAT_I8_UINT 0x154
445 #define BRW_SURFACEFORMAT_I8_SINT 0x155
446 #define BRW_SURFACEFORMAT_DXT1_RGB_SRGB 0x180
447 #define BRW_SURFACEFORMAT_R1_UINT 0x181
448 #define BRW_SURFACEFORMAT_YCRCB_NORMAL 0x182
449 #define BRW_SURFACEFORMAT_YCRCB_SWAPUVY 0x183
450 #define BRW_SURFACEFORMAT_P2_UNORM_PALETTE0 0x184
451 #define BRW_SURFACEFORMAT_P2_UNORM_PALETTE1 0x185
452 #define BRW_SURFACEFORMAT_BC1_UNORM 0x186
453 #define BRW_SURFACEFORMAT_BC2_UNORM 0x187
454 #define BRW_SURFACEFORMAT_BC3_UNORM 0x188
455 #define BRW_SURFACEFORMAT_BC4_UNORM 0x189
456 #define BRW_SURFACEFORMAT_BC5_UNORM 0x18A
457 #define BRW_SURFACEFORMAT_BC1_UNORM_SRGB 0x18B
458 #define BRW_SURFACEFORMAT_BC2_UNORM_SRGB 0x18C
459 #define BRW_SURFACEFORMAT_BC3_UNORM_SRGB 0x18D
460 #define BRW_SURFACEFORMAT_MONO8 0x18E
461 #define BRW_SURFACEFORMAT_YCRCB_SWAPUV 0x18F
462 #define BRW_SURFACEFORMAT_YCRCB_SWAPY 0x190
463 #define BRW_SURFACEFORMAT_DXT1_RGB 0x191
464 #define BRW_SURFACEFORMAT_FXT1 0x192
465 #define BRW_SURFACEFORMAT_R8G8B8_UNORM 0x193
466 #define BRW_SURFACEFORMAT_R8G8B8_SNORM 0x194
467 #define BRW_SURFACEFORMAT_R8G8B8_SSCALED 0x195
468 #define BRW_SURFACEFORMAT_R8G8B8_USCALED 0x196
469 #define BRW_SURFACEFORMAT_R64G64B64A64_FLOAT 0x197
470 #define BRW_SURFACEFORMAT_R64G64B64_FLOAT 0x198
471 #define BRW_SURFACEFORMAT_BC4_SNORM 0x199
472 #define BRW_SURFACEFORMAT_BC5_SNORM 0x19A
473 #define BRW_SURFACEFORMAT_R16G16B16_FLOAT 0x19B
474 #define BRW_SURFACEFORMAT_R16G16B16_UNORM 0x19C
475 #define BRW_SURFACEFORMAT_R16G16B16_SNORM 0x19D
476 #define BRW_SURFACEFORMAT_R16G16B16_SSCALED 0x19E
477 #define BRW_SURFACEFORMAT_R16G16B16_USCALED 0x19F
478 #define BRW_SURFACEFORMAT_BC6H_SF16 0x1A1
479 #define BRW_SURFACEFORMAT_BC7_UNORM 0x1A2
480 #define BRW_SURFACEFORMAT_BC7_UNORM_SRGB 0x1A3
481 #define BRW_SURFACEFORMAT_BC6H_UF16 0x1A4
482 #define BRW_SURFACEFORMAT_PLANAR_420_8 0x1A5
483 #define BRW_SURFACEFORMAT_R8G8B8_UNORM_SRGB 0x1A8
484 #define BRW_SURFACEFORMAT_ETC1_RGB8 0x1A9
485 #define BRW_SURFACEFORMAT_ETC2_RGB8 0x1AA
486 #define BRW_SURFACEFORMAT_EAC_R11 0x1AB
487 #define BRW_SURFACEFORMAT_EAC_RG11 0x1AC
488 #define BRW_SURFACEFORMAT_EAC_SIGNED_R11 0x1AD
489 #define BRW_SURFACEFORMAT_EAC_SIGNED_RG11 0x1AE
490 #define BRW_SURFACEFORMAT_ETC2_SRGB8 0x1AF
491 #define BRW_SURFACEFORMAT_R16G16B16_UINT 0x1B0
492 #define BRW_SURFACEFORMAT_R16G16B16_SINT 0x1B1
493 #define BRW_SURFACEFORMAT_R32_SFIXED 0x1B2
494 #define BRW_SURFACEFORMAT_R10G10B10A2_SNORM 0x1B3
495 #define BRW_SURFACEFORMAT_R10G10B10A2_USCALED 0x1B4
496 #define BRW_SURFACEFORMAT_R10G10B10A2_SSCALED 0x1B5
497 #define BRW_SURFACEFORMAT_R10G10B10A2_SINT 0x1B6
498 #define BRW_SURFACEFORMAT_B10G10R10A2_SNORM 0x1B7
499 #define BRW_SURFACEFORMAT_B10G10R10A2_USCALED 0x1B8
500 #define BRW_SURFACEFORMAT_B10G10R10A2_SSCALED 0x1B9
501 #define BRW_SURFACEFORMAT_B10G10R10A2_UINT 0x1BA
502 #define BRW_SURFACEFORMAT_B10G10R10A2_SINT 0x1BB
503 #define BRW_SURFACEFORMAT_R64G64B64A64_PASSTHRU 0x1BC
504 #define BRW_SURFACEFORMAT_R64G64B64_PASSTHRU 0x1BD
505 #define BRW_SURFACEFORMAT_ETC2_RGB8_PTA 0x1C0
506 #define BRW_SURFACEFORMAT_ETC2_SRGB8_PTA 0x1C1
507 #define BRW_SURFACEFORMAT_ETC2_EAC_RGBA8 0x1C2
508 #define BRW_SURFACEFORMAT_ETC2_EAC_SRGB8_A8 0x1C3
509 #define BRW_SURFACEFORMAT_R8G8B8_UINT 0x1C8
510 #define BRW_SURFACEFORMAT_R8G8B8_SINT 0x1C9
511 #define BRW_SURFACEFORMAT_RAW 0x1FF
512
513 #define GEN9_SURFACE_ASTC_HDR_FORMAT_BIT 0x100
514
515 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_4x4_U8sRGB 0x200
516 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_5x4_U8sRGB 0x208
517 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_5x5_U8sRGB 0x209
518 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_6x5_U8sRGB 0x211
519 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_6x6_U8sRGB 0x212
520 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_8x5_U8sRGB 0x221
521 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_8x6_U8sRGB 0x222
522 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_8x8_U8sRGB 0x224
523 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_10x5_U8sRGB 0x231
524 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_10x6_U8sRGB 0x232
525 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_10x8_U8sRGB 0x234
526 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_10x10_U8sRGB 0x236
527 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_12x10_U8sRGB 0x23E
528 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_12x12_U8sRGB 0x23F
529 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_4x4_FLT16 0x240
530 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_5x4_FLT16 0x248
531 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_5x5_FLT16 0x249
532 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_6x5_FLT16 0x251
533 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_6x6_FLT16 0x252
534 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_8x5_FLT16 0x261
535 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_8x6_FLT16 0x262
536 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_8x8_FLT16 0x264
537 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_10x5_FLT16 0x271
538 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_10x6_FLT16 0x272
539 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_10x8_FLT16 0x274
540 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_10x10_FLT16 0x276
541 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_12x10_FLT16 0x27E
542 #define BRW_SURFACEFORMAT_ASTC_LDR_2D_12x12_FLT16 0x27F
543
544 #define BRW_SURFACE_FORMAT_SHIFT 18
545 #define BRW_SURFACE_FORMAT_MASK INTEL_MASK(26, 18)
546
547 #define BRW_SURFACERETURNFORMAT_FLOAT32 0
548 #define BRW_SURFACERETURNFORMAT_S1 1
549
550 #define BRW_SURFACE_TYPE_SHIFT 29
551 #define BRW_SURFACE_TYPE_MASK INTEL_MASK(31, 29)
552 #define BRW_SURFACE_1D 0
553 #define BRW_SURFACE_2D 1
554 #define BRW_SURFACE_3D 2
555 #define BRW_SURFACE_CUBE 3
556 #define BRW_SURFACE_BUFFER 4
557 #define BRW_SURFACE_NULL 7
558
559 #define GEN7_SURFACE_IS_ARRAY (1 << 28)
560 #define GEN7_SURFACE_VALIGN_2 (0 << 16)
561 #define GEN7_SURFACE_VALIGN_4 (1 << 16)
562 #define GEN7_SURFACE_HALIGN_4 (0 << 15)
563 #define GEN7_SURFACE_HALIGN_8 (1 << 15)
564 #define GEN7_SURFACE_TILING_NONE (0 << 13)
565 #define GEN7_SURFACE_TILING_X (2 << 13)
566 #define GEN7_SURFACE_TILING_Y (3 << 13)
567 #define GEN7_SURFACE_ARYSPC_FULL (0 << 10)
568 #define GEN7_SURFACE_ARYSPC_LOD0 (1 << 10)
569
570 /* Surface state DW1 */
571 #define GEN8_SURFACE_MOCS_SHIFT 24
572 #define GEN8_SURFACE_MOCS_MASK INTEL_MASK(30, 24)
573 #define GEN8_SURFACE_QPITCH_SHIFT 0
574 #define GEN8_SURFACE_QPITCH_MASK INTEL_MASK(14, 0)
575
576 /* Surface state DW2 */
577 #define BRW_SURFACE_HEIGHT_SHIFT 19
578 #define BRW_SURFACE_HEIGHT_MASK INTEL_MASK(31, 19)
579 #define BRW_SURFACE_WIDTH_SHIFT 6
580 #define BRW_SURFACE_WIDTH_MASK INTEL_MASK(18, 6)
581 #define BRW_SURFACE_LOD_SHIFT 2
582 #define BRW_SURFACE_LOD_MASK INTEL_MASK(5, 2)
583 #define GEN7_SURFACE_HEIGHT_SHIFT 16
584 #define GEN7_SURFACE_HEIGHT_MASK INTEL_MASK(29, 16)
585 #define GEN7_SURFACE_WIDTH_SHIFT 0
586 #define GEN7_SURFACE_WIDTH_MASK INTEL_MASK(13, 0)
587
588 /* Surface state DW3 */
589 #define BRW_SURFACE_DEPTH_SHIFT 21
590 #define BRW_SURFACE_DEPTH_MASK INTEL_MASK(31, 21)
591 #define BRW_SURFACE_PITCH_SHIFT 3
592 #define BRW_SURFACE_PITCH_MASK INTEL_MASK(19, 3)
593 #define BRW_SURFACE_TILED (1 << 1)
594 #define BRW_SURFACE_TILED_Y (1 << 0)
595 #define HSW_SURFACE_IS_INTEGER_FORMAT (1 << 18)
596
597 /* Surface state DW4 */
598 #define BRW_SURFACE_MIN_LOD_SHIFT 28
599 #define BRW_SURFACE_MIN_LOD_MASK INTEL_MASK(31, 28)
600 #define BRW_SURFACE_MIN_ARRAY_ELEMENT_SHIFT 17
601 #define BRW_SURFACE_MIN_ARRAY_ELEMENT_MASK INTEL_MASK(27, 17)
602 #define BRW_SURFACE_RENDER_TARGET_VIEW_EXTENT_SHIFT 8
603 #define BRW_SURFACE_RENDER_TARGET_VIEW_EXTENT_MASK INTEL_MASK(16, 8)
604 #define BRW_SURFACE_MULTISAMPLECOUNT_1 (0 << 4)
605 #define BRW_SURFACE_MULTISAMPLECOUNT_4 (2 << 4)
606 #define GEN7_SURFACE_MULTISAMPLECOUNT_1 (0 << 3)
607 #define GEN8_SURFACE_MULTISAMPLECOUNT_2 (1 << 3)
608 #define GEN7_SURFACE_MULTISAMPLECOUNT_4 (2 << 3)
609 #define GEN7_SURFACE_MULTISAMPLECOUNT_8 (3 << 3)
610 #define GEN8_SURFACE_MULTISAMPLECOUNT_16 (4 << 3)
611 #define GEN7_SURFACE_MSFMT_MSS (0 << 6)
612 #define GEN7_SURFACE_MSFMT_DEPTH_STENCIL (1 << 6)
613 #define GEN7_SURFACE_MIN_ARRAY_ELEMENT_SHIFT 18
614 #define GEN7_SURFACE_MIN_ARRAY_ELEMENT_MASK INTEL_MASK(28, 18)
615 #define GEN7_SURFACE_RENDER_TARGET_VIEW_EXTENT_SHIFT 7
616 #define GEN7_SURFACE_RENDER_TARGET_VIEW_EXTENT_MASK INTEL_MASK(17, 7)
617
618 /* Surface state DW5 */
619 #define BRW_SURFACE_X_OFFSET_SHIFT 25
620 #define BRW_SURFACE_X_OFFSET_MASK INTEL_MASK(31, 25)
621 #define BRW_SURFACE_VERTICAL_ALIGN_ENABLE (1 << 24)
622 #define BRW_SURFACE_Y_OFFSET_SHIFT 20
623 #define BRW_SURFACE_Y_OFFSET_MASK INTEL_MASK(23, 20)
624 #define GEN7_SURFACE_MIN_LOD_SHIFT 4
625 #define GEN7_SURFACE_MIN_LOD_MASK INTEL_MASK(7, 4)
626 #define GEN8_SURFACE_Y_OFFSET_SHIFT 21
627 #define GEN8_SURFACE_Y_OFFSET_MASK INTEL_MASK(23, 21)
628
629 #define GEN7_SURFACE_MOCS_SHIFT 16
630 #define GEN7_SURFACE_MOCS_MASK INTEL_MASK(19, 16)
631
632 #define GEN9_SURFACE_TRMODE_SHIFT 18
633 #define GEN9_SURFACE_TRMODE_MASK INTEL_MASK(19, 18)
634 #define GEN9_SURFACE_TRMODE_NONE 0
635 #define GEN9_SURFACE_TRMODE_TILEYF 1
636 #define GEN9_SURFACE_TRMODE_TILEYS 2
637
638 #define GEN9_SURFACE_MIP_TAIL_START_LOD_SHIFT 8
639 #define GEN9_SURFACE_MIP_TAIL_START_LOD_MASK INTEL_MASK(11, 8)
640
641 /* Surface state DW6 */
642 #define GEN7_SURFACE_MCS_ENABLE (1 << 0)
643 #define GEN7_SURFACE_MCS_PITCH_SHIFT 3
644 #define GEN7_SURFACE_MCS_PITCH_MASK INTEL_MASK(11, 3)
645 #define GEN8_SURFACE_AUX_QPITCH_SHIFT 16
646 #define GEN8_SURFACE_AUX_QPITCH_MASK INTEL_MASK(30, 16)
647 #define GEN8_SURFACE_AUX_PITCH_SHIFT 3
648 #define GEN8_SURFACE_AUX_PITCH_MASK INTEL_MASK(11, 3)
649 #define GEN8_SURFACE_AUX_MODE_MASK INTEL_MASK(2, 0)
650
651 #define GEN8_SURFACE_AUX_MODE_NONE 0
652 #define GEN8_SURFACE_AUX_MODE_MCS 1
653 #define GEN8_SURFACE_AUX_MODE_APPEND 2
654 #define GEN8_SURFACE_AUX_MODE_HIZ 3
655
656 /* Surface state DW7 */
657 #define GEN9_SURFACE_RT_COMPRESSION_SHIFT 30
658 #define GEN9_SURFACE_RT_COMPRESSION_MASK INTEL_MASK(30, 30)
659 #define GEN7_SURFACE_CLEAR_COLOR_SHIFT 28
660 #define GEN7_SURFACE_SCS_R_SHIFT 25
661 #define GEN7_SURFACE_SCS_R_MASK INTEL_MASK(27, 25)
662 #define GEN7_SURFACE_SCS_G_SHIFT 22
663 #define GEN7_SURFACE_SCS_G_MASK INTEL_MASK(24, 22)
664 #define GEN7_SURFACE_SCS_B_SHIFT 19
665 #define GEN7_SURFACE_SCS_B_MASK INTEL_MASK(21, 19)
666 #define GEN7_SURFACE_SCS_A_SHIFT 16
667 #define GEN7_SURFACE_SCS_A_MASK INTEL_MASK(18, 16)
668
669 /* The actual swizzle values/what channel to use */
670 #define HSW_SCS_ZERO 0
671 #define HSW_SCS_ONE 1
672 #define HSW_SCS_RED 4
673 #define HSW_SCS_GREEN 5
674 #define HSW_SCS_BLUE 6
675 #define HSW_SCS_ALPHA 7
676
677 /* SAMPLER_STATE DW0 */
/* Bit 31 of SAMPLER_STATE DW0.  Written with an unsigned 1 because
 * `1 << 31` overflows a 32-bit signed int, which is undefined behavior. */
#define BRW_SAMPLER_DISABLE                     (1u << 31)
679 #define BRW_SAMPLER_LOD_PRECLAMP_ENABLE (1 << 28)
680 #define GEN6_SAMPLER_MIN_MAG_NOT_EQUAL (1 << 27) /* Gen6 only */
681 #define BRW_SAMPLER_BASE_MIPLEVEL_MASK INTEL_MASK(26, 22)
682 #define BRW_SAMPLER_BASE_MIPLEVEL_SHIFT 22
683 #define BRW_SAMPLER_MIP_FILTER_MASK INTEL_MASK(21, 20)
684 #define BRW_SAMPLER_MIP_FILTER_SHIFT 20
685 #define BRW_SAMPLER_MAG_FILTER_MASK INTEL_MASK(19, 17)
686 #define BRW_SAMPLER_MAG_FILTER_SHIFT 17
687 #define BRW_SAMPLER_MIN_FILTER_MASK INTEL_MASK(16, 14)
688 #define BRW_SAMPLER_MIN_FILTER_SHIFT 14
689 #define GEN4_SAMPLER_LOD_BIAS_MASK INTEL_MASK(13, 3)
690 #define GEN4_SAMPLER_LOD_BIAS_SHIFT 3
691 #define GEN4_SAMPLER_SHADOW_FUNCTION_MASK INTEL_MASK(2, 0)
692 #define GEN4_SAMPLER_SHADOW_FUNCTION_SHIFT 0
693
694 #define GEN7_SAMPLER_LOD_BIAS_MASK INTEL_MASK(13, 1)
695 #define GEN7_SAMPLER_LOD_BIAS_SHIFT 1
696 #define GEN7_SAMPLER_EWA_ANISOTROPIC_ALGORITHM (1 << 0)
697
698 /* SAMPLER_STATE DW1 */
699 #define GEN4_SAMPLER_MIN_LOD_MASK INTEL_MASK(31, 22)
700 #define GEN4_SAMPLER_MIN_LOD_SHIFT 22
701 #define GEN4_SAMPLER_MAX_LOD_MASK INTEL_MASK(21, 12)
702 #define GEN4_SAMPLER_MAX_LOD_SHIFT 12
703 #define GEN4_SAMPLER_CUBE_CONTROL_OVERRIDE (1 << 9)
704 /* Wrap modes are in DW1 on Gen4-6 and DW3 on Gen7+ */
705 #define BRW_SAMPLER_TCX_WRAP_MODE_MASK INTEL_MASK(8, 6)
706 #define BRW_SAMPLER_TCX_WRAP_MODE_SHIFT 6
707 #define BRW_SAMPLER_TCY_WRAP_MODE_MASK INTEL_MASK(5, 3)
708 #define BRW_SAMPLER_TCY_WRAP_MODE_SHIFT 3
709 #define BRW_SAMPLER_TCZ_WRAP_MODE_MASK INTEL_MASK(2, 0)
710 #define BRW_SAMPLER_TCZ_WRAP_MODE_SHIFT 0
711
712 #define GEN7_SAMPLER_MIN_LOD_MASK INTEL_MASK(31, 20)
713 #define GEN7_SAMPLER_MIN_LOD_SHIFT 20
714 #define GEN7_SAMPLER_MAX_LOD_MASK INTEL_MASK(19, 8)
715 #define GEN7_SAMPLER_MAX_LOD_SHIFT 8
716 #define GEN7_SAMPLER_SHADOW_FUNCTION_MASK INTEL_MASK(3, 1)
717 #define GEN7_SAMPLER_SHADOW_FUNCTION_SHIFT 1
718 #define GEN7_SAMPLER_CUBE_CONTROL_OVERRIDE (1 << 0)
719
720 /* SAMPLER_STATE DW2 - border color pointer */
721
722 /* SAMPLER_STATE DW3 */
723 #define BRW_SAMPLER_MAX_ANISOTROPY_MASK INTEL_MASK(21, 19)
724 #define BRW_SAMPLER_MAX_ANISOTROPY_SHIFT 19
725 #define BRW_SAMPLER_ADDRESS_ROUNDING_MASK INTEL_MASK(18, 13)
726 #define BRW_SAMPLER_ADDRESS_ROUNDING_SHIFT 13
727 #define GEN7_SAMPLER_NON_NORMALIZED_COORDINATES (1 << 10)
728 /* Gen7+ wrap modes reuse the same BRW_SAMPLER_TC*_WRAP_MODE enums. */
729 #define GEN6_SAMPLER_NON_NORMALIZED_COORDINATES (1 << 0)
730
/* Texture coordinate wrap modes.
 * NOTE(review): presumably these are the values stored in the
 * BRW_SAMPLER_TC{X,Y,Z}_WRAP_MODE fields -- confirm against the callers.
 * Values are spelled out explicitly rather than left to implicit
 * enumeration so that inserting an entry cannot renumber the others.
 */
enum brw_wrap_mode {
   BRW_TEXCOORDMODE_WRAP          = 0x0,
   BRW_TEXCOORDMODE_MIRROR        = 0x1,
   BRW_TEXCOORDMODE_CLAMP         = 0x2,
   BRW_TEXCOORDMODE_CUBE          = 0x3,
   BRW_TEXCOORDMODE_CLAMP_BORDER  = 0x4,
   BRW_TEXCOORDMODE_MIRROR_ONCE   = 0x5,
   GEN8_TEXCOORDMODE_HALF_BORDER  = 0x6,
};
740
741 #define BRW_THREAD_PRIORITY_NORMAL 0
742 #define BRW_THREAD_PRIORITY_HIGH 1
743
744 #define BRW_TILEWALK_XMAJOR 0
745 #define BRW_TILEWALK_YMAJOR 1
746
747 #define BRW_VERTEX_SUBPIXEL_PRECISION_8BITS 0
748 #define BRW_VERTEX_SUBPIXEL_PRECISION_4BITS 1
749
750 /* Execution Unit (EU) defines
751 */
752
753 #define BRW_ALIGN_1 0
754 #define BRW_ALIGN_16 1
755
756 #define BRW_ADDRESS_DIRECT 0
757 #define BRW_ADDRESS_REGISTER_INDIRECT_REGISTER 1
758
759 #define BRW_CHANNEL_X 0
760 #define BRW_CHANNEL_Y 1
761 #define BRW_CHANNEL_Z 2
762 #define BRW_CHANNEL_W 3
763
764 enum brw_compression {
765 BRW_COMPRESSION_NONE = 0,
766 BRW_COMPRESSION_2NDHALF = 1,
767 BRW_COMPRESSION_COMPRESSED = 2,
768 };
769
770 #define GEN6_COMPRESSION_1Q 0
771 #define GEN6_COMPRESSION_2Q 1
772 #define GEN6_COMPRESSION_3Q 2
773 #define GEN6_COMPRESSION_4Q 3
774 #define GEN6_COMPRESSION_1H 0 /* same encoding as GEN6_COMPRESSION_1Q */
775 #define GEN6_COMPRESSION_2H 2 /* same encoding as GEN6_COMPRESSION_3Q */
776
777 enum PACKED brw_conditional_mod { /* Conditional-modifier encodings; EQ/NEQ are aliases sharing the values of Z/NZ. */
778 BRW_CONDITIONAL_NONE = 0,
779 BRW_CONDITIONAL_Z = 1,
780 BRW_CONDITIONAL_NZ = 2,
781 BRW_CONDITIONAL_EQ = 1, /* same encoding as BRW_CONDITIONAL_Z */
782 BRW_CONDITIONAL_NEQ = 2, /* same encoding as BRW_CONDITIONAL_NZ */
783 BRW_CONDITIONAL_G = 3,
784 BRW_CONDITIONAL_GE = 4,
785 BRW_CONDITIONAL_L = 5,
786 BRW_CONDITIONAL_LE = 6,
787 BRW_CONDITIONAL_R = 7, /* Gen <= 5 */
788 BRW_CONDITIONAL_O = 8,
789 BRW_CONDITIONAL_U = 9,
790 };
791
792 #define BRW_DEBUG_NONE 0
793 #define BRW_DEBUG_BREAKPOINT 1
794
795 #define BRW_DEPENDENCY_NORMAL 0
796 #define BRW_DEPENDENCY_NOTCLEARED 1
797 #define BRW_DEPENDENCY_NOTCHECKED 2
798 #define BRW_DEPENDENCY_DISABLE 3
799
800 enum PACKED brw_execution_size { /* Each encoding is log2 of the channel count in its name. */
801 BRW_EXECUTE_1 = 0,
802 BRW_EXECUTE_2 = 1,
803 BRW_EXECUTE_4 = 2,
804 BRW_EXECUTE_8 = 3,
805 BRW_EXECUTE_16 = 4,
806 BRW_EXECUTE_32 = 5,
807 };
808
809 enum PACKED brw_horizontal_stride { /* Stride 0 encodes as 0; a stride of N (1, 2, 4) encodes as log2(N) + 1. */
810 BRW_HORIZONTAL_STRIDE_0 = 0,
811 BRW_HORIZONTAL_STRIDE_1 = 1,
812 BRW_HORIZONTAL_STRIDE_2 = 2,
813 BRW_HORIZONTAL_STRIDE_4 = 3,
814 };
815
816 #define BRW_INSTRUCTION_NORMAL 0
817 #define BRW_INSTRUCTION_SATURATE 1
818
819 #define BRW_MASK_ENABLE 0
820 #define BRW_MASK_DISABLE 1
821
822 /** @{
823 *
824 * Gen6 has replaced "mask enable/disable" with WECtrl, which is
825 * effectively the same but much simpler to think about. Now, there
826 * are two contributors ANDed together to decide whether channels are
827 * executed: The predication on the instruction, and the channel write
828 * enable.
829 */
830 /**
831 * This is the default value. It means that a channel's write enable is set
832 * if the per-channel IP is pointing at this instruction.
833 */
834 #define BRW_WE_NORMAL 0
835 /**
836 * This is used like BRW_MASK_DISABLE, and causes all channels to have
837 * their write enable set. Note that predication still contributes to
838 * whether the channel actually gets written.
839 */
840 #define BRW_WE_ALL 1
841 /** @} */
842
843 enum opcode {
844 /* These are the actual hardware opcodes. */
845 BRW_OPCODE_ILLEGAL = 0,
846 BRW_OPCODE_MOV = 1,
847 BRW_OPCODE_SEL = 2,
848 BRW_OPCODE_MOVI = 3, /**< G45+ */
849 BRW_OPCODE_NOT = 4,
850 BRW_OPCODE_AND = 5,
851 BRW_OPCODE_OR = 6,
852 BRW_OPCODE_XOR = 7,
853 BRW_OPCODE_SHR = 8,
854 BRW_OPCODE_SHL = 9,
855 // BRW_OPCODE_DIM = 10, /**< Gen7.5 only */ /* Reused */
856 // BRW_OPCODE_SMOV = 10, /**< Gen8+ */ /* Reused */
857 /* Reserved - 11 */
858 BRW_OPCODE_ASR = 12,
859 /* Reserved - 13-15 */
860 BRW_OPCODE_CMP = 16,
861 BRW_OPCODE_CMPN = 17,
862 BRW_OPCODE_CSEL = 18, /**< Gen8+ */
863 BRW_OPCODE_F32TO16 = 19, /**< Gen7 only */
864 BRW_OPCODE_F16TO32 = 20, /**< Gen7 only */
865 /* Reserved - 21-22 */
866 BRW_OPCODE_BFREV = 23, /**< Gen7+ */
867 BRW_OPCODE_BFE = 24, /**< Gen7+ */
868 BRW_OPCODE_BFI1 = 25, /**< Gen7+ */
869 BRW_OPCODE_BFI2 = 26, /**< Gen7+ */
870 /* Reserved - 27-31 */
871 BRW_OPCODE_JMPI = 32,
872 // BRW_OPCODE_BRD = 33, /**< Gen7+ */
873 BRW_OPCODE_IF = 34,
874 BRW_OPCODE_IFF = 35, /**< Pre-Gen6 */ /* Reused */
875 // BRW_OPCODE_BRC = 35, /**< Gen7+ */ /* Reused */
876 BRW_OPCODE_ELSE = 36,
877 BRW_OPCODE_ENDIF = 37,
878 BRW_OPCODE_DO = 38, /**< Pre-Gen6 */ /* Reused */
879 // BRW_OPCODE_CASE = 38, /**< Gen6 only */ /* Reused */
880 BRW_OPCODE_WHILE = 39,
881 BRW_OPCODE_BREAK = 40,
882 BRW_OPCODE_CONTINUE = 41,
883 BRW_OPCODE_HALT = 42,
884 // BRW_OPCODE_CALLA = 43, /**< Gen7.5+ */
885 // BRW_OPCODE_MSAVE = 44, /**< Pre-Gen6 */ /* Reused */
886 // BRW_OPCODE_CALL = 44, /**< Gen6+ */ /* Reused */
887 // BRW_OPCODE_MREST = 45, /**< Pre-Gen6 */ /* Reused */
888 // BRW_OPCODE_RET = 45, /**< Gen6+ */ /* Reused */
889 // BRW_OPCODE_PUSH = 46, /**< Pre-Gen6 */ /* Reused */
890 // BRW_OPCODE_FORK = 46, /**< Gen6 only */ /* Reused */
891 // BRW_OPCODE_GOTO = 46, /**< Gen8+ */ /* Reused */
892 // BRW_OPCODE_POP = 47, /**< Pre-Gen6 */
893 BRW_OPCODE_WAIT = 48,
894 BRW_OPCODE_SEND = 49,
895 BRW_OPCODE_SENDC = 50,
896 BRW_OPCODE_SENDS = 51, /**< Gen9+ */
897 BRW_OPCODE_SENDSC = 52, /**< Gen9+ */
898 /* Reserved 53-55 */
899 BRW_OPCODE_MATH = 56, /**< Gen6+ */
900 /* Reserved 57-63 */
901 BRW_OPCODE_ADD = 64,
902 BRW_OPCODE_MUL = 65,
903 BRW_OPCODE_AVG = 66,
904 BRW_OPCODE_FRC = 67,
905 BRW_OPCODE_RNDU = 68,
906 BRW_OPCODE_RNDD = 69,
907 BRW_OPCODE_RNDE = 70,
908 BRW_OPCODE_RNDZ = 71,
909 BRW_OPCODE_MAC = 72,
910 BRW_OPCODE_MACH = 73,
911 BRW_OPCODE_LZD = 74,
912 BRW_OPCODE_FBH = 75, /**< Gen7+ */
913 BRW_OPCODE_FBL = 76, /**< Gen7+ */
914 BRW_OPCODE_CBIT = 77, /**< Gen7+ */
915 BRW_OPCODE_ADDC = 78, /**< Gen7+ */
916 BRW_OPCODE_SUBB = 79, /**< Gen7+ */
917 BRW_OPCODE_SAD2 = 80,
918 BRW_OPCODE_SADA2 = 81,
919 /* Reserved 82-83 */
920 BRW_OPCODE_DP4 = 84,
921 BRW_OPCODE_DPH = 85,
922 BRW_OPCODE_DP3 = 86,
923 BRW_OPCODE_DP2 = 87,
924 /* Reserved 88 */
925 BRW_OPCODE_LINE = 89,
926 BRW_OPCODE_PLN = 90, /**< G45+ */
927 BRW_OPCODE_MAD = 91, /**< Gen6+ */
928 BRW_OPCODE_LRP = 92, /**< Gen6+ */
929 // BRW_OPCODE_MADM = 93, /**< Gen8+ */
930 /* Reserved 94-124 */
931 BRW_OPCODE_NENOP = 125, /**< G45 only */
932 BRW_OPCODE_NOP = 126,
933 /* Reserved 127 */
934
935 /* These are compiler backend opcodes that get translated into other
936 * instructions.
937 */
938 FS_OPCODE_FB_WRITE = 128,
939
940 /**
941 * Same as FS_OPCODE_FB_WRITE but expects its arguments separately as
942 * individual sources instead of as a single payload blob. The
943 * position/ordering of the arguments are defined by the enum
944 * fb_write_logical_srcs.
945 */
946 FS_OPCODE_FB_WRITE_LOGICAL,
947
948 FS_OPCODE_BLORP_FB_WRITE,
949 FS_OPCODE_REP_FB_WRITE,
950 FS_OPCODE_PACK_STENCIL_REF,
951 SHADER_OPCODE_RCP,
952 SHADER_OPCODE_RSQ,
953 SHADER_OPCODE_SQRT,
954 SHADER_OPCODE_EXP2,
955 SHADER_OPCODE_LOG2,
956 SHADER_OPCODE_POW,
957 SHADER_OPCODE_INT_QUOTIENT,
958 SHADER_OPCODE_INT_REMAINDER,
959 SHADER_OPCODE_SIN,
960 SHADER_OPCODE_COS,
961
962 /**
963 * Texture sampling opcodes.
964 *
965 * LOGICAL opcodes are eventually translated to the matching non-LOGICAL
966 * opcode but instead of taking a single payload blob they expect their
967 * arguments separately as individual sources:
968 *
969 * Source 0: [optional] Texture coordinates.
970 * Source 1: [optional] Shadow comparator.
971 * Source 2: [optional] dPdx if the operation takes explicit derivatives,
972 * otherwise LOD value.
973 * Source 3: [optional] dPdy if the operation takes explicit derivatives.
974 * Source 4: [optional] Sample index.
975 * Source 5: [optional] MCS data.
976 * Source 6: [required] Texture sampler.
977 * Source 7: [optional] Texel offset.
978 * Source 8: [required] Number of coordinate components (as UD immediate).
979 * Source 9: [required] Number of derivative components (as UD immediate).
980 */
981 SHADER_OPCODE_TEX,
982 SHADER_OPCODE_TEX_LOGICAL,
983 SHADER_OPCODE_TXD,
984 SHADER_OPCODE_TXD_LOGICAL,
985 SHADER_OPCODE_TXF,
986 SHADER_OPCODE_TXF_LOGICAL,
987 SHADER_OPCODE_TXL,
988 SHADER_OPCODE_TXL_LOGICAL,
989 SHADER_OPCODE_TXS,
990 SHADER_OPCODE_TXS_LOGICAL,
991 FS_OPCODE_TXB,
992 FS_OPCODE_TXB_LOGICAL,
993 SHADER_OPCODE_TXF_CMS,
994 SHADER_OPCODE_TXF_CMS_LOGICAL,
995 SHADER_OPCODE_TXF_CMS_W,
996 SHADER_OPCODE_TXF_CMS_W_LOGICAL,
997 SHADER_OPCODE_TXF_UMS,
998 SHADER_OPCODE_TXF_UMS_LOGICAL,
999 SHADER_OPCODE_TXF_MCS,
1000 SHADER_OPCODE_TXF_MCS_LOGICAL,
1001 SHADER_OPCODE_LOD,
1002 SHADER_OPCODE_LOD_LOGICAL,
1003 SHADER_OPCODE_TG4,
1004 SHADER_OPCODE_TG4_LOGICAL,
1005 SHADER_OPCODE_TG4_OFFSET,
1006 SHADER_OPCODE_TG4_OFFSET_LOGICAL,
1007 SHADER_OPCODE_SAMPLEINFO,
1008
1009 /**
1010 * Combines multiple sources of size 1 into a larger virtual GRF.
1011 * For example, parameters for a send-from-GRF message. Or, updating
1012 * channels of a size 4 VGRF used to store vec4s such as texturing results.
1013 *
1014 * This will be lowered into MOVs from each source to consecutive reg_offsets
1015 * of the destination VGRF.
1016 *
1017 * src[0] may be BAD_FILE. If so, the lowering pass skips emitting the MOV,
1018 * but still reserves the first channel of the destination VGRF. This can be
1019 * used to reserve space for, say, a message header set up by the generators.
1020 */
1021 SHADER_OPCODE_LOAD_PAYLOAD,
1022
1023 SHADER_OPCODE_SHADER_TIME_ADD,
1024
1025 /**
1026 * Typed and untyped surface access opcodes.
1027 *
1028 * LOGICAL opcodes are eventually translated to the matching non-LOGICAL
1029 * opcode but instead of taking a single payload blob they expect their
1030 * arguments separately as individual sources:
1031 *
1032 * Source 0: [required] Surface coordinates.
1033 * Source 1: [optional] Operation source.
1034 * Source 2: [required] Surface index.
1035 * Source 3: [required] Number of coordinate components (as UD immediate).
1036 * Source 4: [required] Opcode-specific control immediate, same as source 2
1037 * of the matching non-LOGICAL opcode.
1038 */
1039 SHADER_OPCODE_UNTYPED_ATOMIC,
1040 SHADER_OPCODE_UNTYPED_ATOMIC_LOGICAL,
1041 SHADER_OPCODE_UNTYPED_SURFACE_READ,
1042 SHADER_OPCODE_UNTYPED_SURFACE_READ_LOGICAL,
1043 SHADER_OPCODE_UNTYPED_SURFACE_WRITE,
1044 SHADER_OPCODE_UNTYPED_SURFACE_WRITE_LOGICAL,
1045
1046 SHADER_OPCODE_TYPED_ATOMIC,
1047 SHADER_OPCODE_TYPED_ATOMIC_LOGICAL,
1048 SHADER_OPCODE_TYPED_SURFACE_READ,
1049 SHADER_OPCODE_TYPED_SURFACE_READ_LOGICAL,
1050 SHADER_OPCODE_TYPED_SURFACE_WRITE,
1051 SHADER_OPCODE_TYPED_SURFACE_WRITE_LOGICAL,
1052
1053 SHADER_OPCODE_MEMORY_FENCE,
1054
1055 SHADER_OPCODE_GEN4_SCRATCH_READ,
1056 SHADER_OPCODE_GEN4_SCRATCH_WRITE,
1057 SHADER_OPCODE_GEN7_SCRATCH_READ,
1058
1059 /**
1060 * Gen8+ SIMD8 URB Read messages.
1061 */
1062 SHADER_OPCODE_URB_READ_SIMD8,
1063 SHADER_OPCODE_URB_READ_SIMD8_PER_SLOT,
1064
1065 SHADER_OPCODE_URB_WRITE_SIMD8,
1066 SHADER_OPCODE_URB_WRITE_SIMD8_PER_SLOT,
1067 SHADER_OPCODE_URB_WRITE_SIMD8_MASKED,
1068 SHADER_OPCODE_URB_WRITE_SIMD8_MASKED_PER_SLOT,
1069
1070 /**
1071 * Return the index of an arbitrary live channel (i.e. one of the channels
1072 * enabled in the current execution mask) and assign it to the first
1073 * component of the destination. Expected to be used as input for the
1074 * BROADCAST pseudo-opcode.
1075 */
1076 SHADER_OPCODE_FIND_LIVE_CHANNEL,
1077
1078 /**
1079 * Pick the channel from its first source register given by the index
1080 * specified as second source. Useful for variable indexing of surfaces.
1081 */
1082 SHADER_OPCODE_BROADCAST,
1083
1084 VEC4_OPCODE_MOV_BYTES,
1085 VEC4_OPCODE_PACK_BYTES,
1086 VEC4_OPCODE_UNPACK_UNIFORM,
1087
1088 FS_OPCODE_DDX_COARSE,
1089 FS_OPCODE_DDX_FINE,
1090 /**
1091 * Compute dFdy(), dFdyCoarse(), or dFdyFine().
1092 * src1 is an immediate storing the key->render_to_fbo boolean.
1093 */
1094 FS_OPCODE_DDY_COARSE,
1095 FS_OPCODE_DDY_FINE,
1096 FS_OPCODE_CINTERP,
1097 FS_OPCODE_LINTERP,
1098 FS_OPCODE_PIXEL_X,
1099 FS_OPCODE_PIXEL_Y,
1100 FS_OPCODE_UNIFORM_PULL_CONSTANT_LOAD,
1101 FS_OPCODE_UNIFORM_PULL_CONSTANT_LOAD_GEN7,
1102 FS_OPCODE_VARYING_PULL_CONSTANT_LOAD,
1103 FS_OPCODE_VARYING_PULL_CONSTANT_LOAD_GEN7,
1104 FS_OPCODE_GET_BUFFER_SIZE,
1105 FS_OPCODE_MOV_DISPATCH_TO_FLAGS,
1106 FS_OPCODE_DISCARD_JUMP,
1107 FS_OPCODE_SET_SAMPLE_ID,
1108 FS_OPCODE_SET_SIMD4X2_OFFSET,
1109 FS_OPCODE_PACK_HALF_2x16_SPLIT,
1110 FS_OPCODE_UNPACK_HALF_2x16_SPLIT_X,
1111 FS_OPCODE_UNPACK_HALF_2x16_SPLIT_Y,
1112 FS_OPCODE_PLACEHOLDER_HALT,
1113 FS_OPCODE_INTERPOLATE_AT_CENTROID,
1114 FS_OPCODE_INTERPOLATE_AT_SAMPLE,
1115 FS_OPCODE_INTERPOLATE_AT_SHARED_OFFSET,
1116 FS_OPCODE_INTERPOLATE_AT_PER_SLOT_OFFSET,
1117
1118 VS_OPCODE_URB_WRITE,
1119 VS_OPCODE_PULL_CONSTANT_LOAD,
1120 VS_OPCODE_PULL_CONSTANT_LOAD_GEN7,
1121 VS_OPCODE_SET_SIMD4X2_HEADER_GEN9,
1122
1123 VS_OPCODE_GET_BUFFER_SIZE,
1124
1125 VS_OPCODE_UNPACK_FLAGS_SIMD4X2,
1126
1127 /**
1128 * Write geometry shader output data to the URB.
1129 *
1130 * Unlike VS_OPCODE_URB_WRITE, this opcode doesn't do an implied move from
1131 * R0 to the first MRF. This allows the geometry shader to override the
1132 * "Slot {0,1} Offset" fields in the message header.
1133 */
1134 GS_OPCODE_URB_WRITE,
1135
1136 /**
1137 * Write geometry shader output data to the URB and request a new URB
1138 * handle (gen6).
1139 *
1140 * This opcode doesn't do an implied move from R0 to the first MRF.
1141 */
1142 GS_OPCODE_URB_WRITE_ALLOCATE,
1143
1144 /**
1145 * Terminate the geometry shader thread by doing an empty URB write.
1146 *
1147 * This opcode doesn't do an implied move from R0 to the first MRF. This
1148 * allows the geometry shader to override the "GS Number of Output Vertices
1149 * for Slot {0,1}" fields in the message header.
1150 */
1151 GS_OPCODE_THREAD_END,
1152
1153 /**
1154 * Set the "Slot {0,1} Offset" fields of a URB_WRITE message header.
1155 *
1156 * - dst is the MRF containing the message header.
1157 *
1158 * - src0.x indicates which portion of the URB should be written to (e.g. a
1159 * vertex number)
1160 *
1161 * - src1 is an immediate multiplier which will be applied to src0
1162 * (e.g. the size of a single vertex in the URB).
1163 *
1164 * Note: the hardware will apply this offset *in addition to* the offset in
1165 * vec4_instruction::offset.
1166 */
1167 GS_OPCODE_SET_WRITE_OFFSET,
1168
1169 /**
1170 * Set the "GS Number of Output Vertices for Slot {0,1}" fields of a
1171 * URB_WRITE message header.
1172 *
1173 * - dst is the MRF containing the message header.
1174 *
1175 * - src0.x is the vertex count. The upper 16 bits will be ignored.
1176 */
1177 GS_OPCODE_SET_VERTEX_COUNT,
1178
1179 /**
1180 * Set DWORD 2 of dst to the value in src.
1181 */
1182 GS_OPCODE_SET_DWORD_2,
1183
1184 /**
1185 * Prepare the dst register for storage in the "Channel Mask" fields of a
1186 * URB_WRITE message header.
1187 *
1188 * DWORD 4 of dst is shifted left by 4 bits, so that later,
1189 * GS_OPCODE_SET_CHANNEL_MASKS can OR DWORDs 0 and 4 together to form the
1190 * final channel mask.
1191 *
1192 * Note: since GS_OPCODE_SET_CHANNEL_MASKS ORs DWORDs 0 and 4 together to
1193 * form the final channel mask, DWORDs 0 and 4 of the dst register must not
1194 * have any extraneous bits set prior to execution of this opcode (that is,
1195 * they should be in the range 0x0 to 0xf).
1196 */
1197 GS_OPCODE_PREPARE_CHANNEL_MASKS,
1198
1199 /**
1200 * Set the "Channel Mask" fields of a URB_WRITE message header.
1201 *
1202 * - dst is the MRF containing the message header.
1203 *
1204 * - src.x is the channel mask, as prepared by
1205 * GS_OPCODE_PREPARE_CHANNEL_MASKS. DWORDs 0 and 4 are OR'ed together to
1206 * form the final channel mask.
1207 */
1208 GS_OPCODE_SET_CHANNEL_MASKS,
1209
1210 /**
1211 * Get the "Instance ID" fields from the payload.
1212 *
1213 * - dst is the GRF for gl_InvocationID.
1214 */
1215 GS_OPCODE_GET_INSTANCE_ID,
1216
1217 /**
1218 * Send a FF_SYNC message to allocate initial URB handles (gen6).
1219 *
1220 * - dst will be used as the writeback register for the FF_SYNC operation.
1221 *
1222 * - src0 is the number of primitives written.
1223 *
1224 * - src1 is the value to hold in M0.0: number of SO vertices to write
1225 * and number of SO primitives needed. Its value will be overwritten
1226 * with the SVBI values if transform feedback is enabled.
1227 *
1228 * Note: This opcode uses an implicit MRF register for the ff_sync message
1229 * header, so the caller is expected to set inst->base_mrf and initialize
1230 * that MRF register to r0. This opcode will also write to this MRF register
1231 * to include the allocated URB handle so it can then be reused directly as
1232 * the header in the URB write operation we are allocating the handle for.
1233 */
1234 GS_OPCODE_FF_SYNC,
1235
1236 /**
1237 * Move r0.1 (which holds PrimitiveID information in gen6) to a separate
1238 * register.
1239 *
1240 * - dst is the GRF where PrimitiveID information will be moved.
1241 */
1242 GS_OPCODE_SET_PRIMITIVE_ID,
1243
1244 /**
1245 * Write transform feedback data to the SVB by sending a SVB WRITE message.
1246 * Used in gen6.
1247 *
1248 * - dst is the MRF register containing the message header.
1249 *
1250 * - src0 is the register where the vertex data is going to be copied from.
1251 *
1252 * - src1 is the destination register when write commit occurs.
1253 */
1254 GS_OPCODE_SVB_WRITE,
1255
1256 /**
1257 * Set destination index in the SVB write message payload (M0.5). Used
1258 * in gen6 for transform feedback.
1259 *
1260 * - dst is the header to save the destination indices for SVB WRITE.
1261 * - src is the register that holds the destination indices value.
1262 */
1263 GS_OPCODE_SVB_SET_DST_INDEX,
1264
1265 /**
1266 * Prepare Mx.0 subregister for being used in the FF_SYNC message header.
1267 * Used in gen6 for transform feedback.
1268 *
1269 * - dst will hold the register with the final Mx.0 value.
1270 *
1271 * - src0 has the number of vertices emitted in SO (NumSOVertsToWrite)
1272 *
1273 * - src1 has the number of needed primitives for SO (NumSOPrimsNeeded)
1274 *
1275 * - src2 is the value to hold in M0: number of SO vertices to write
1276 * and number of SO primitives needed.
1277 */
1278 GS_OPCODE_FF_SYNC_SET_PRIMITIVES,
1279
1280 /**
1281 * Terminate the compute shader.
1282 */
1283 CS_OPCODE_CS_TERMINATE,
1284
1285 /**
1286 * GLSL barrier()
1287 */
1288 SHADER_OPCODE_BARRIER,
1289
1290 /**
1291 * Calculate the high 32-bits of a 32x32 multiply.
1292 */
1293 SHADER_OPCODE_MULH,
1294 };
1295
1296 enum brw_urb_write_flags { /* Bit flags: every basic flag below is a distinct single bit, so flags can be ORed. */
1297 BRW_URB_WRITE_NO_FLAGS = 0,
1298
1299 /**
1300 * Causes a new URB entry to be allocated, and its address stored in the
1301 * destination register (gen < 7).
1302 */
1303 BRW_URB_WRITE_ALLOCATE = 0x1,
1304
1305 /**
1306 * Causes the current URB entry to be deallocated (gen < 7).
1307 */
1308 BRW_URB_WRITE_UNUSED = 0x2,
1309
1310 /**
1311 * Causes the thread to terminate.
1312 */
1313 BRW_URB_WRITE_EOT = 0x4,
1314
1315 /**
1316 * Indicates that the given URB entry is complete, and may be sent further
1317 * down the 3D pipeline (gen < 7).
1318 */
1319 BRW_URB_WRITE_COMPLETE = 0x8,
1320
1321 /**
1322 * Indicates that an additional offset (which may be different for the two
1323 * vec4 slots) is stored in the message header (gen == 7).
1324 */
1325 BRW_URB_WRITE_PER_SLOT_OFFSET = 0x10,
1326
1327 /**
1328 * Indicates that the channel masks in the URB_WRITE message header should
1329 * not be overridden to 0xff (gen == 7).
1330 */
1331 BRW_URB_WRITE_USE_CHANNEL_MASKS = 0x20,
1332
1333 /**
1334 * Indicates that the data should be sent to the URB using the
1335 * URB_WRITE_OWORD message rather than URB_WRITE_HWORD (gen == 7). This
1336 * causes offsets to be interpreted as multiples of an OWORD instead of an
1337 * HWORD, and only allows one OWORD to be written.
1338 */
1339 BRW_URB_WRITE_OWORD = 0x40,
1340
1341 /**
1342 * Convenient combination of flags: end the thread while simultaneously
1343 * marking the given URB entry as complete.
1344 */
1345 BRW_URB_WRITE_EOT_COMPLETE = BRW_URB_WRITE_EOT | BRW_URB_WRITE_COMPLETE, /* = 0xc */
1346
1347 /**
1348 * Convenient combination of flags: mark the given URB entry as complete
1349 * and simultaneously allocate a new one.
1350 */
1351 BRW_URB_WRITE_ALLOCATE_COMPLETE =
1352 BRW_URB_WRITE_ALLOCATE | BRW_URB_WRITE_COMPLETE, /* = 0x9 */
1353 };
1354
1355 enum fb_write_logical_srcs { /* Source positions for FS_OPCODE_FB_WRITE_LOGICAL; enumerators number 0..7 implicitly. */
1356 FB_WRITE_LOGICAL_SRC_COLOR0, /* REQUIRED */
1357 FB_WRITE_LOGICAL_SRC_COLOR1, /* for dual source blend messages */
1358 FB_WRITE_LOGICAL_SRC_SRC0_ALPHA,
1359 FB_WRITE_LOGICAL_SRC_SRC_DEPTH, /* gl_FragDepth */
1360 FB_WRITE_LOGICAL_SRC_DST_DEPTH, /* GEN4-5: passthrough from thread */
1361 FB_WRITE_LOGICAL_SRC_SRC_STENCIL, /* gl_FragStencilRefARB */
1362 FB_WRITE_LOGICAL_SRC_OMASK, /* Sample Mask (gl_SampleMask) */
1363 FB_WRITE_LOGICAL_SRC_COMPONENTS, /* REQUIRED */
1364 };
1365
1366 #ifdef __cplusplus /* the overload below is only compiled as C++ */
1367 /**
1368 * Allow brw_urb_write_flags enums to be ORed together and stay typed as brw_urb_write_flags.
1369 */
1370 inline brw_urb_write_flags
1371 operator|(brw_urb_write_flags x, brw_urb_write_flags y)
1372 {
1373 return static_cast<brw_urb_write_flags>(static_cast<int>(x) | /* OR the two operands as plain ints ... */
1374 static_cast<int>(y)); /* ... then cast the result back to the enum type */
1375 }
1376 #endif /* __cplusplus */
1377
1378 enum PACKED brw_predicate { /* Predicate-control encodings; the ALIGN1_* and ALIGN16_* sets share values 2-7. */
1379 BRW_PREDICATE_NONE = 0,
1380 BRW_PREDICATE_NORMAL = 1,
1381 BRW_PREDICATE_ALIGN1_ANYV = 2,
1382 BRW_PREDICATE_ALIGN1_ALLV = 3,
1383 BRW_PREDICATE_ALIGN1_ANY2H = 4,
1384 BRW_PREDICATE_ALIGN1_ALL2H = 5,
1385 BRW_PREDICATE_ALIGN1_ANY4H = 6,
1386 BRW_PREDICATE_ALIGN1_ALL4H = 7,
1387 BRW_PREDICATE_ALIGN1_ANY8H = 8,
1388 BRW_PREDICATE_ALIGN1_ALL8H = 9,
1389 BRW_PREDICATE_ALIGN1_ANY16H = 10,
1390 BRW_PREDICATE_ALIGN1_ALL16H = 11,
1391 BRW_PREDICATE_ALIGN1_ANY32H = 12,
1392 BRW_PREDICATE_ALIGN1_ALL32H = 13,
1393 BRW_PREDICATE_ALIGN16_REPLICATE_X = 2, /* ALIGN16 set restarts at 2, overlapping ALIGN1_ANYV..ALIGN1_ALL4H */
1394 BRW_PREDICATE_ALIGN16_REPLICATE_Y = 3,
1395 BRW_PREDICATE_ALIGN16_REPLICATE_Z = 4,
1396 BRW_PREDICATE_ALIGN16_REPLICATE_W = 5,
1397 BRW_PREDICATE_ALIGN16_ANY4H = 6, /* NOTE(review): which set a value means presumably depends on BRW_ALIGN_1 vs BRW_ALIGN_16 -- confirm */
1398 BRW_PREDICATE_ALIGN16_ALL4H = 7,
1399 };
1400
1401 enum PACKED brw_reg_file { /* Register files: encodings 0-3, short aliases for them, then software-only files. */
1402 BRW_ARCHITECTURE_REGISTER_FILE = 0,
1403 BRW_GENERAL_REGISTER_FILE = 1,
1404 BRW_MESSAGE_REGISTER_FILE = 2,
1405 BRW_IMMEDIATE_VALUE = 3,
1406
1407 ARF = BRW_ARCHITECTURE_REGISTER_FILE,
1408 FIXED_GRF = BRW_GENERAL_REGISTER_FILE,
1409 MRF = BRW_MESSAGE_REGISTER_FILE,
1410 IMM = BRW_IMMEDIATE_VALUE,
1411
1412 /* These are not hardware values; numbering continues implicitly after IMM (3) */
1413 VGRF, /* = 4 */
1414 ATTR, /* = 5 */
1415 UNIFORM, /* = 6; prog_data->params[reg] */
1416 BAD_FILE, /* = 7 */
1417 };
1418
1419 #define BRW_HW_REG_TYPE_UD 0
1420 #define BRW_HW_REG_TYPE_D 1
1421 #define BRW_HW_REG_TYPE_UW 2
1422 #define BRW_HW_REG_TYPE_W 3
1423 #define BRW_HW_REG_TYPE_F 7
1424 #define GEN8_HW_REG_TYPE_UQ 8
1425 #define GEN8_HW_REG_TYPE_Q 9
1426
1427 #define BRW_HW_REG_NON_IMM_TYPE_UB 4
1428 #define BRW_HW_REG_NON_IMM_TYPE_B 5
1429 #define GEN7_HW_REG_NON_IMM_TYPE_DF 6
1430 #define GEN8_HW_REG_NON_IMM_TYPE_HF 10
1431
1432 #define BRW_HW_REG_IMM_TYPE_UV 4 /* Gen6+ packed unsigned immediate vector */
1433 #define BRW_HW_REG_IMM_TYPE_VF 5 /* packed float immediate vector */
1434 #define BRW_HW_REG_IMM_TYPE_V 6 /* packed int imm. vector; uword dest only */
1435 #define GEN8_HW_REG_IMM_TYPE_DF 10
1436 #define GEN8_HW_REG_IMM_TYPE_HF 11
1437
1438 /* SNB adds 3-src instructions (MAD and LRP) that only operate on floats, so
1439 * the types were implied. IVB adds BFE and BFI2 that operate on doublewords
1440 * and unsigned doublewords, so a new field is also available in the da3src
1441 * struct (part of struct brw_instruction.bits1 in brw_structs.h) to select
1442 * dst and shared-src types. The values are different from BRW_REGISTER_TYPE_*.
1443 */
1444 #define BRW_3SRC_TYPE_F 0
1445 #define BRW_3SRC_TYPE_D 1
1446 #define BRW_3SRC_TYPE_UD 2
1447 #define BRW_3SRC_TYPE_DF 3
1448
1449 #define BRW_ARF_NULL 0x00
1450 #define BRW_ARF_ADDRESS 0x10
1451 #define BRW_ARF_ACCUMULATOR 0x20
1452 #define BRW_ARF_FLAG 0x30
1453 #define BRW_ARF_MASK 0x40
1454 #define BRW_ARF_MASK_STACK 0x50
1455 #define BRW_ARF_MASK_STACK_DEPTH 0x60
1456 #define BRW_ARF_STATE 0x70
1457 #define BRW_ARF_CONTROL 0x80
1458 #define BRW_ARF_NOTIFICATION_COUNT 0x90
1459 #define BRW_ARF_IP 0xA0
1460 #define BRW_ARF_TDR 0xB0
1461 #define BRW_ARF_TIMESTAMP 0xC0
1462
1463 #define BRW_MRF_COMPR4 (1 << 7)
1464
1465 #define BRW_AMASK 0
1466 #define BRW_IMASK 1
1467 #define BRW_LMASK 2
1468 #define BRW_CMASK 3
1469
1470
1471
1472 #define BRW_THREAD_NORMAL 0
1473 #define BRW_THREAD_ATOMIC 1
1474 #define BRW_THREAD_SWITCH 2
1475
1476 enum PACKED brw_vertical_stride { /* Stride 0 encodes as 0; a stride of N (1..32) encodes as log2(N) + 1. */
1477 BRW_VERTICAL_STRIDE_0 = 0,
1478 BRW_VERTICAL_STRIDE_1 = 1,
1479 BRW_VERTICAL_STRIDE_2 = 2,
1480 BRW_VERTICAL_STRIDE_4 = 3,
1481 BRW_VERTICAL_STRIDE_8 = 4,
1482 BRW_VERTICAL_STRIDE_16 = 5,
1483 BRW_VERTICAL_STRIDE_32 = 6,
1484 BRW_VERTICAL_STRIDE_ONE_DIMENSIONAL = 0xF, /* special encoding, outside the 0-6 range used for numeric strides */
1485 };
1486
1487 enum PACKED brw_width { /* Each encoding is log2 of the width in its name. */
1488 BRW_WIDTH_1 = 0,
1489 BRW_WIDTH_2 = 1,
1490 BRW_WIDTH_4 = 2,
1491 BRW_WIDTH_8 = 3,
1492 BRW_WIDTH_16 = 4,
1493 };
1494
1495 #define BRW_STATELESS_BUFFER_BOUNDARY_1K 0
1496 #define BRW_STATELESS_BUFFER_BOUNDARY_2K 1
1497 #define BRW_STATELESS_BUFFER_BOUNDARY_4K 2
1498 #define BRW_STATELESS_BUFFER_BOUNDARY_8K 3
1499 #define BRW_STATELESS_BUFFER_BOUNDARY_16K 4
1500 #define BRW_STATELESS_BUFFER_BOUNDARY_32K 5
1501 #define BRW_STATELESS_BUFFER_BOUNDARY_64K 6
1502 #define BRW_STATELESS_BUFFER_BOUNDARY_128K 7
1503 #define BRW_STATELESS_BUFFER_BOUNDARY_256K 8
1504 #define BRW_STATELESS_BUFFER_BOUNDARY_512K 9
1505 #define BRW_STATELESS_BUFFER_BOUNDARY_1M 10
1506 #define BRW_STATELESS_BUFFER_BOUNDARY_2M 11
1507
1508 #define BRW_POLYGON_FACING_FRONT 0
1509 #define BRW_POLYGON_FACING_BACK 1
1510
1511 /**
1512 * Message target: Shared Function ID for where to SEND a message.
1513 *
1514 * These are enumerated in the ISA reference under "send - Send Message".
1515 * In particular, see the following tables:
1516 * - G45 PRM, Volume 4, Table 14-15 "Message Descriptor Definition"
1517 * - Sandybridge PRM, Volume 4 Part 2, Table 8-16 "Extended Message Descriptor"
1518 * - Ivybridge PRM, Volume 1 Part 1, section 3.2.7 "GPE Function IDs"
1519 */
1520 enum brw_message_target {
1521 BRW_SFID_NULL = 0,
1522 BRW_SFID_MATH = 1, /* Only valid on Gen4-5 */
1523 BRW_SFID_SAMPLER = 2,
1524 BRW_SFID_MESSAGE_GATEWAY = 3,
1525 BRW_SFID_DATAPORT_READ = 4,
1526 BRW_SFID_DATAPORT_WRITE = 5,
1527 BRW_SFID_URB = 6,
1528 BRW_SFID_THREAD_SPAWNER = 7,
1529 BRW_SFID_VME = 8,
1530
1531 GEN6_SFID_DATAPORT_SAMPLER_CACHE = 4, /* same value as BRW_SFID_DATAPORT_READ */
1532 GEN6_SFID_DATAPORT_RENDER_CACHE = 5, /* same value as BRW_SFID_DATAPORT_WRITE */
1533 GEN6_SFID_DATAPORT_CONSTANT_CACHE = 9,
1534
1535 GEN7_SFID_DATAPORT_DATA_CACHE = 10, /* same value as the GEN7_MESSAGE_TARGET_DP_DATA_CACHE macro */
1536 GEN7_SFID_PIXEL_INTERPOLATOR = 11,
1537 HSW_SFID_DATAPORT_DATA_CACHE_1 = 12,
1538 HSW_SFID_CRE = 13,
1539 };
1540
1541 #define GEN7_MESSAGE_TARGET_DP_DATA_CACHE 10
1542
1543 #define BRW_SAMPLER_RETURN_FORMAT_FLOAT32 0
1544 #define BRW_SAMPLER_RETURN_FORMAT_UINT32 2
1545 #define BRW_SAMPLER_RETURN_FORMAT_SINT32 3
1546
1547 #define BRW_SAMPLER_MESSAGE_SIMD8_SAMPLE 0
1548 #define BRW_SAMPLER_MESSAGE_SIMD16_SAMPLE 0
1549 #define BRW_SAMPLER_MESSAGE_SIMD16_SAMPLE_BIAS 0
1550 #define BRW_SAMPLER_MESSAGE_SIMD8_KILLPIX 1
1551 #define BRW_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_LOD 1
1552 #define BRW_SAMPLER_MESSAGE_SIMD16_SAMPLE_LOD 1
1553 #define BRW_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_GRADIENTS 2
1554 #define BRW_SAMPLER_MESSAGE_SIMD8_SAMPLE_GRADIENTS 2
1555 #define BRW_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_COMPARE 0
1556 #define BRW_SAMPLER_MESSAGE_SIMD16_SAMPLE_COMPARE 2
1557 #define BRW_SAMPLER_MESSAGE_SIMD8_SAMPLE_BIAS_COMPARE 0
1558 #define BRW_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_LOD_COMPARE 1
1559 #define BRW_SAMPLER_MESSAGE_SIMD8_SAMPLE_LOD_COMPARE 1
1560 #define BRW_SAMPLER_MESSAGE_SIMD4X2_RESINFO 2
1561 #define BRW_SAMPLER_MESSAGE_SIMD16_RESINFO 2
1562 #define BRW_SAMPLER_MESSAGE_SIMD4X2_LD 3
1563 #define BRW_SAMPLER_MESSAGE_SIMD8_LD 3
1564 #define BRW_SAMPLER_MESSAGE_SIMD16_LD 3
1565
1566 #define GEN5_SAMPLER_MESSAGE_SAMPLE 0
1567 #define GEN5_SAMPLER_MESSAGE_SAMPLE_BIAS 1
1568 #define GEN5_SAMPLER_MESSAGE_SAMPLE_LOD 2
1569 #define GEN5_SAMPLER_MESSAGE_SAMPLE_COMPARE 3
1570 #define GEN5_SAMPLER_MESSAGE_SAMPLE_DERIVS 4
1571 #define GEN5_SAMPLER_MESSAGE_SAMPLE_BIAS_COMPARE 5
1572 #define GEN5_SAMPLER_MESSAGE_SAMPLE_LOD_COMPARE 6
1573 #define GEN5_SAMPLER_MESSAGE_SAMPLE_LD 7
1574 #define GEN7_SAMPLER_MESSAGE_SAMPLE_GATHER4 8
1575 #define GEN5_SAMPLER_MESSAGE_LOD 9
1576 #define GEN5_SAMPLER_MESSAGE_SAMPLE_RESINFO 10
1577 #define GEN6_SAMPLER_MESSAGE_SAMPLE_SAMPLEINFO 11
1578 #define GEN7_SAMPLER_MESSAGE_SAMPLE_GATHER4_C 16
1579 #define GEN7_SAMPLER_MESSAGE_SAMPLE_GATHER4_PO 17
1580 #define GEN7_SAMPLER_MESSAGE_SAMPLE_GATHER4_PO_C 18
1581 #define HSW_SAMPLER_MESSAGE_SAMPLE_DERIV_COMPARE 20
1582 #define GEN9_SAMPLER_MESSAGE_SAMPLE_LD2DMS_W 28
1583 #define GEN7_SAMPLER_MESSAGE_SAMPLE_LD_MCS 29
1584 #define GEN7_SAMPLER_MESSAGE_SAMPLE_LD2DMS 30
1585 #define GEN7_SAMPLER_MESSAGE_SAMPLE_LD2DSS 31
1586
1587 /* for GEN5 only */
1588 #define BRW_SAMPLER_SIMD_MODE_SIMD4X2 0
1589 #define BRW_SAMPLER_SIMD_MODE_SIMD8 1
1590 #define BRW_SAMPLER_SIMD_MODE_SIMD16 2
1591 #define BRW_SAMPLER_SIMD_MODE_SIMD32_64 3
1592
1593 /* GEN9 changes SIMD mode 0 to mean SIMD8D, but lets us get the SIMD4x2
1594 * behavior by setting bit 22 of dword 2 in the message header. */
1595 #define GEN9_SAMPLER_SIMD_MODE_SIMD8D 0
1596 #define GEN9_SAMPLER_SIMD_MODE_EXTENSION_SIMD4X2 (1 << 22)
1597
1598 #define BRW_DATAPORT_OWORD_BLOCK_1_OWORDLOW 0
1599 #define BRW_DATAPORT_OWORD_BLOCK_1_OWORDHIGH 1
1600 #define BRW_DATAPORT_OWORD_BLOCK_2_OWORDS 2
1601 #define BRW_DATAPORT_OWORD_BLOCK_4_OWORDS 3
1602 #define BRW_DATAPORT_OWORD_BLOCK_8_OWORDS 4
1603
1604 #define BRW_DATAPORT_OWORD_DUAL_BLOCK_1OWORD 0
1605 #define BRW_DATAPORT_OWORD_DUAL_BLOCK_4OWORDS 2
1606
1607 #define BRW_DATAPORT_DWORD_SCATTERED_BLOCK_8DWORDS 2
1608 #define BRW_DATAPORT_DWORD_SCATTERED_BLOCK_16DWORDS 3
1609
1610 /* This one stays the same across generations. */
1611 #define BRW_DATAPORT_READ_MESSAGE_OWORD_BLOCK_READ 0
1612 /* GEN4 */
1613 #define BRW_DATAPORT_READ_MESSAGE_OWORD_DUAL_BLOCK_READ 1
1614 #define BRW_DATAPORT_READ_MESSAGE_MEDIA_BLOCK_READ 2
1615 #define BRW_DATAPORT_READ_MESSAGE_DWORD_SCATTERED_READ 3
1616 /* G45, GEN5 */
1617 #define G45_DATAPORT_READ_MESSAGE_RENDER_UNORM_READ 1
1618 #define G45_DATAPORT_READ_MESSAGE_OWORD_DUAL_BLOCK_READ 2
1619 #define G45_DATAPORT_READ_MESSAGE_AVC_LOOP_FILTER_READ 3
1620 #define G45_DATAPORT_READ_MESSAGE_MEDIA_BLOCK_READ 4
1621 #define G45_DATAPORT_READ_MESSAGE_DWORD_SCATTERED_READ 6
1622 /* GEN6 */
1623 #define GEN6_DATAPORT_READ_MESSAGE_RENDER_UNORM_READ 1
1624 #define GEN6_DATAPORT_READ_MESSAGE_OWORD_DUAL_BLOCK_READ 2
1625 #define GEN6_DATAPORT_READ_MESSAGE_MEDIA_BLOCK_READ 4
1626 #define GEN6_DATAPORT_READ_MESSAGE_OWORD_UNALIGN_BLOCK_READ 5
1627 #define GEN6_DATAPORT_READ_MESSAGE_DWORD_SCATTERED_READ 6
1628
1629 #define BRW_DATAPORT_READ_TARGET_DATA_CACHE 0
1630 #define BRW_DATAPORT_READ_TARGET_RENDER_CACHE 1
1631 #define BRW_DATAPORT_READ_TARGET_SAMPLER_CACHE 2
1632
1633 #define BRW_DATAPORT_RENDER_TARGET_WRITE_SIMD16_SINGLE_SOURCE 0
1634 #define BRW_DATAPORT_RENDER_TARGET_WRITE_SIMD16_SINGLE_SOURCE_REPLICATED 1
1635 #define BRW_DATAPORT_RENDER_TARGET_WRITE_SIMD8_DUAL_SOURCE_SUBSPAN01 2
1636 #define BRW_DATAPORT_RENDER_TARGET_WRITE_SIMD8_DUAL_SOURCE_SUBSPAN23 3
1637 #define BRW_DATAPORT_RENDER_TARGET_WRITE_SIMD8_SINGLE_SOURCE_SUBSPAN01 4
1638
1639 #define BRW_DATAPORT_WRITE_MESSAGE_OWORD_BLOCK_WRITE 0
1640 #define BRW_DATAPORT_WRITE_MESSAGE_OWORD_DUAL_BLOCK_WRITE 1
1641 #define BRW_DATAPORT_WRITE_MESSAGE_MEDIA_BLOCK_WRITE 2
1642 #define BRW_DATAPORT_WRITE_MESSAGE_DWORD_SCATTERED_WRITE 3
1643 #define BRW_DATAPORT_WRITE_MESSAGE_RENDER_TARGET_WRITE 4
1644 #define BRW_DATAPORT_WRITE_MESSAGE_STREAMED_VERTEX_BUFFER_WRITE 5
1645 #define BRW_DATAPORT_WRITE_MESSAGE_FLUSH_RENDER_CACHE 7
1646
1647 /* GEN6 */
1648 #define GEN6_DATAPORT_WRITE_MESSAGE_DWORD_ATOMIC_WRITE 7
1649 #define GEN6_DATAPORT_WRITE_MESSAGE_OWORD_BLOCK_WRITE 8
1650 #define GEN6_DATAPORT_WRITE_MESSAGE_OWORD_DUAL_BLOCK_WRITE 9
1651 #define GEN6_DATAPORT_WRITE_MESSAGE_MEDIA_BLOCK_WRITE 10
1652 #define GEN6_DATAPORT_WRITE_MESSAGE_DWORD_SCATTERED_WRITE 11
1653 #define GEN6_DATAPORT_WRITE_MESSAGE_RENDER_TARGET_WRITE 12
1654 #define GEN6_DATAPORT_WRITE_MESSAGE_STREAMED_VB_WRITE 13
1655 #define GEN6_DATAPORT_WRITE_MESSAGE_RENDER_TARGET_UNORM_WRITE 14
1656
/* GEN7: data-port message identifiers.  The RC_ and DC_ groups are
 * numbered independently, so the same value appears in both.
 */
#define GEN7_DATAPORT_RC_MEDIA_BLOCK_READ           4
#define GEN7_DATAPORT_RC_TYPED_SURFACE_READ         5
#define GEN7_DATAPORT_RC_TYPED_ATOMIC_OP            6
#define GEN7_DATAPORT_RC_MEMORY_FENCE               7
#define GEN7_DATAPORT_RC_MEDIA_BLOCK_WRITE          10
#define GEN7_DATAPORT_RC_RENDER_TARGET_WRITE        12
#define GEN7_DATAPORT_RC_TYPED_SURFACE_WRITE        13
#define GEN7_DATAPORT_DC_OWORD_BLOCK_READ           0
#define GEN7_DATAPORT_DC_UNALIGNED_OWORD_BLOCK_READ 1
#define GEN7_DATAPORT_DC_OWORD_DUAL_BLOCK_READ      2
#define GEN7_DATAPORT_DC_DWORD_SCATTERED_READ       3
#define GEN7_DATAPORT_DC_BYTE_SCATTERED_READ        4
#define GEN7_DATAPORT_DC_UNTYPED_SURFACE_READ       5
#define GEN7_DATAPORT_DC_UNTYPED_ATOMIC_OP          6
#define GEN7_DATAPORT_DC_MEMORY_FENCE               7
#define GEN7_DATAPORT_DC_OWORD_BLOCK_WRITE          8
#define GEN7_DATAPORT_DC_OWORD_DUAL_BLOCK_WRITE     10
#define GEN7_DATAPORT_DC_DWORD_SCATTERED_WRITE      11
#define GEN7_DATAPORT_DC_BYTE_SCATTERED_WRITE       12
#define GEN7_DATAPORT_DC_UNTYPED_SURFACE_WRITE      13

/* Scratch read/write: bit 18 is set for both; bit 17 distinguishes a
 * write (1) from a read (0).
 */
#define GEN7_DATAPORT_SCRATCH_READ  ((1 << 18) | \
                                     (0 << 17))
#define GEN7_DATAPORT_SCRATCH_WRITE ((1 << 18) | \
                                     (1 << 17))
#define GEN7_DATAPORT_SCRATCH_NUM_REGS_SHIFT 12

/* Pixel interpolator location selectors. */
#define GEN7_PIXEL_INTERPOLATOR_LOC_SHARED_OFFSET   0
#define GEN7_PIXEL_INTERPOLATOR_LOC_SAMPLE          1
#define GEN7_PIXEL_INTERPOLATOR_LOC_CENTROID        2
#define GEN7_PIXEL_INTERPOLATOR_LOC_PER_SLOT_OFFSET 3
1689
/* HSW: data-port message identifiers, split into PORT0 and PORT1 groups
 * that are numbered independently.
 */
#define HSW_DATAPORT_DC_PORT0_OWORD_BLOCK_READ           0
#define HSW_DATAPORT_DC_PORT0_UNALIGNED_OWORD_BLOCK_READ 1
#define HSW_DATAPORT_DC_PORT0_OWORD_DUAL_BLOCK_READ      2
#define HSW_DATAPORT_DC_PORT0_DWORD_SCATTERED_READ       3
#define HSW_DATAPORT_DC_PORT0_BYTE_SCATTERED_READ        4
#define HSW_DATAPORT_DC_PORT0_MEMORY_FENCE               7
#define HSW_DATAPORT_DC_PORT0_OWORD_BLOCK_WRITE          8
#define HSW_DATAPORT_DC_PORT0_OWORD_DUAL_BLOCK_WRITE     10
#define HSW_DATAPORT_DC_PORT0_DWORD_SCATTERED_WRITE      11
#define HSW_DATAPORT_DC_PORT0_BYTE_SCATTERED_WRITE       12

#define HSW_DATAPORT_DC_PORT1_UNTYPED_SURFACE_READ       1
#define HSW_DATAPORT_DC_PORT1_UNTYPED_ATOMIC_OP          2
#define HSW_DATAPORT_DC_PORT1_UNTYPED_ATOMIC_OP_SIMD4X2  3
#define HSW_DATAPORT_DC_PORT1_MEDIA_BLOCK_READ           4
#define HSW_DATAPORT_DC_PORT1_TYPED_SURFACE_READ         5
#define HSW_DATAPORT_DC_PORT1_TYPED_ATOMIC_OP            6
#define HSW_DATAPORT_DC_PORT1_TYPED_ATOMIC_OP_SIMD4X2    7
#define HSW_DATAPORT_DC_PORT1_UNTYPED_SURFACE_WRITE      9
#define HSW_DATAPORT_DC_PORT1_MEDIA_BLOCK_WRITE          10
#define HSW_DATAPORT_DC_PORT1_ATOMIC_COUNTER_OP          11
#define HSW_DATAPORT_DC_PORT1_ATOMIC_COUNTER_OP_SIMD4X2  12
#define HSW_DATAPORT_DC_PORT1_TYPED_SURFACE_WRITE        13
1714
/* Data-port atomic operation codes. */
#define BRW_AOP_AND    1
#define BRW_AOP_OR     2
#define BRW_AOP_XOR    3
#define BRW_AOP_MOV    4
#define BRW_AOP_INC    5
#define BRW_AOP_DEC    6
#define BRW_AOP_ADD    7
#define BRW_AOP_SUB    8
#define BRW_AOP_REVSUB 9
#define BRW_AOP_IMAX   10
#define BRW_AOP_IMIN   11
#define BRW_AOP_UMAX   12
#define BRW_AOP_UMIN   13
#define BRW_AOP_CMPWR  14
#define BRW_AOP_PREDEC 15
1731
/* Math function selectors. */
#define BRW_MATH_FUNCTION_INV                            1
#define BRW_MATH_FUNCTION_LOG                            2
#define BRW_MATH_FUNCTION_EXP                            3
#define BRW_MATH_FUNCTION_SQRT                           4
#define BRW_MATH_FUNCTION_RSQ                            5
#define BRW_MATH_FUNCTION_SIN                            6
#define BRW_MATH_FUNCTION_COS                            7
#define BRW_MATH_FUNCTION_SINCOS                         8 /* gen4, gen5 */
#define BRW_MATH_FUNCTION_FDIV                           9 /* gen6+ */
#define BRW_MATH_FUNCTION_POW                            10
#define BRW_MATH_FUNCTION_INT_DIV_QUOTIENT_AND_REMAINDER 11
#define BRW_MATH_FUNCTION_INT_DIV_QUOTIENT               12
#define BRW_MATH_FUNCTION_INT_DIV_REMAINDER              13
#define GEN8_MATH_FUNCTION_INVM                          14
#define GEN8_MATH_FUNCTION_RSQRTM                        15

/* Two-valued math message options. */
#define BRW_MATH_INTEGER_UNSIGNED 0
#define BRW_MATH_INTEGER_SIGNED   1

#define BRW_MATH_PRECISION_FULL    0
#define BRW_MATH_PRECISION_PARTIAL 1

#define BRW_MATH_SATURATE_NONE     0
#define BRW_MATH_SATURATE_SATURATE 1

#define BRW_MATH_DATA_VECTOR 0
#define BRW_MATH_DATA_SCALAR 1
1759
/* URB message opcodes. */
#define BRW_URB_OPCODE_WRITE_HWORD  0
#define BRW_URB_OPCODE_WRITE_OWORD  1
#define BRW_URB_OPCODE_READ_HWORD   2
#define BRW_URB_OPCODE_READ_OWORD   3
#define GEN7_URB_OPCODE_ATOMIC_MOV  4
#define GEN7_URB_OPCODE_ATOMIC_INC  5
#define GEN8_URB_OPCODE_ATOMIC_ADD  6
#define GEN8_URB_OPCODE_SIMD8_WRITE 7
#define GEN8_URB_OPCODE_SIMD8_READ  8

/* URB swizzle controls. */
#define BRW_URB_SWIZZLE_NONE       0
#define BRW_URB_SWIZZLE_INTERLEAVE 1
#define BRW_URB_SWIZZLE_TRANSPOSE  2

/* Scratch space size encodings: each step doubles the size, from 1K (0)
 * up to 2M (11).
 */
#define BRW_SCRATCH_SPACE_SIZE_1K   0
#define BRW_SCRATCH_SPACE_SIZE_2K   1
#define BRW_SCRATCH_SPACE_SIZE_4K   2
#define BRW_SCRATCH_SPACE_SIZE_8K   3
#define BRW_SCRATCH_SPACE_SIZE_16K  4
#define BRW_SCRATCH_SPACE_SIZE_32K  5
#define BRW_SCRATCH_SPACE_SIZE_64K  6
#define BRW_SCRATCH_SPACE_SIZE_128K 7
#define BRW_SCRATCH_SPACE_SIZE_256K 8
#define BRW_SCRATCH_SPACE_SIZE_512K 9
#define BRW_SCRATCH_SPACE_SIZE_1M   10
#define BRW_SCRATCH_SPACE_SIZE_2M   11

/* Message gateway sub-function identifiers. */
#define BRW_MESSAGE_GATEWAY_SFID_OPEN_GATEWAY         0
#define BRW_MESSAGE_GATEWAY_SFID_CLOSE_GATEWAY        1
#define BRW_MESSAGE_GATEWAY_SFID_FORWARD_MSG          2
#define BRW_MESSAGE_GATEWAY_SFID_GET_TIMESTAMP        3
#define BRW_MESSAGE_GATEWAY_SFID_BARRIER_MSG          4
#define BRW_MESSAGE_GATEWAY_SFID_UPDATE_GATEWAY_STATE 5
#define BRW_MESSAGE_GATEWAY_SFID_MMIO_READ_WRITE      6
1794
1795
/* Command opcodes. */
#define CMD_URB_FENCE    0x6000
#define CMD_CS_URB_STATE 0x6001
#define CMD_CONST_BUFFER 0x6002

#define CMD_STATE_BASE_ADDRESS   0x6101
#define CMD_STATE_SIP            0x6102
#define CMD_PIPELINE_SELECT_965  0x6104
#define CMD_PIPELINE_SELECT_GM45 0x6904

#define _3DSTATE_PIPELINED_POINTERS     0x7800
#define _3DSTATE_BINDING_TABLE_POINTERS 0x7801
/* GEN6 per-stage "modify" flags for 3DSTATE_BINDING_TABLE_POINTERS. */
# define GEN6_BINDING_TABLE_MODIFY_VS (1 << 8)
# define GEN6_BINDING_TABLE_MODIFY_GS (1 << 9)
# define GEN6_BINDING_TABLE_MODIFY_PS (1 << 12)

/* GEN7+ uses one binding-table-pointer command per shader stage. */
#define _3DSTATE_BINDING_TABLE_POINTERS_VS 0x7826 /* GEN7+ */
#define _3DSTATE_BINDING_TABLE_POINTERS_HS 0x7827 /* GEN7+ */
#define _3DSTATE_BINDING_TABLE_POINTERS_DS 0x7828 /* GEN7+ */
#define _3DSTATE_BINDING_TABLE_POINTERS_GS 0x7829 /* GEN7+ */
#define _3DSTATE_BINDING_TABLE_POINTERS_PS 0x782A /* GEN7+ */
1816
#define _3DSTATE_BINDING_TABLE_POOL_ALLOC 0x7919 /* GEN7.5+ */
#define BRW_HW_BINDING_TABLE_ENABLE (1 << 11)
#define GEN7_HW_BT_POOL_MOCS_SHIFT 7
#define GEN7_HW_BT_POOL_MOCS_MASK INTEL_MASK(10, 7)
#define GEN8_HW_BT_POOL_MOCS_SHIFT 0
#define GEN8_HW_BT_POOL_MOCS_MASK INTEL_MASK(6, 0)
/* Only required in HSW */
#define HSW_BT_POOL_ALLOC_MUST_BE_ONE (3 << 5)

#define _3DSTATE_BINDING_TABLE_EDIT_VS 0x7843 /* GEN7.5 */
#define _3DSTATE_BINDING_TABLE_EDIT_GS 0x7844 /* GEN7.5 */
#define _3DSTATE_BINDING_TABLE_EDIT_HS 0x7845 /* GEN7.5 */
#define _3DSTATE_BINDING_TABLE_EDIT_DS 0x7846 /* GEN7.5 */
#define _3DSTATE_BINDING_TABLE_EDIT_PS 0x7847 /* GEN7.5 */
#define BRW_BINDING_TABLE_INDEX_SHIFT 16
#define BRW_BINDING_TABLE_INDEX_MASK INTEL_MASK(23, 16)

#define BRW_BINDING_TABLE_EDIT_TARGET_ALL   3
#define BRW_BINDING_TABLE_EDIT_TARGET_CORE1 2
#define BRW_BINDING_TABLE_EDIT_TARGET_CORE0 1
/* In HSW, when editing binding table entries to surface state offsets,
 * the surface state offset is a 16-bit value aligned to 32 bytes. But
 * Surface State Pointer in dword 2 is [15:0]. Right shift surf_offset
 * by 5 bits so it won't disturb bit 16 (which is used as the binding
 * table index entry), otherwise it would hang the GPU.
 *
 * The argument is parenthesized so that an expression such as `a | b`
 * is shifted as a whole rather than only its last operand.
 */
#define HSW_SURFACE_STATE_EDIT(value) ((value) >> 5)
/* Same as Haswell, but surface state offsets are now aligned to 64 bytes. */
#define GEN8_SURFACE_STATE_EDIT(value) ((value) >> 6)
1846
#define _3DSTATE_SAMPLER_STATE_POINTERS 0x7802 /* GEN6+ */
/* Per-stage change flags; the pointers themselves follow in DW1..DW3. */
# define PS_SAMPLER_STATE_CHANGE (1 << 12)
# define GS_SAMPLER_STATE_CHANGE (1 << 9)
# define VS_SAMPLER_STATE_CHANGE (1 << 8)
/* DW1: VS */
/* DW2: GS */
/* DW3: PS */

/* GEN7+ uses one sampler-state-pointer command per shader stage. */
#define _3DSTATE_SAMPLER_STATE_POINTERS_VS 0x782B /* GEN7+ */
#define _3DSTATE_SAMPLER_STATE_POINTERS_HS 0x782C /* GEN7+ */
#define _3DSTATE_SAMPLER_STATE_POINTERS_DS 0x782D /* GEN7+ */
#define _3DSTATE_SAMPLER_STATE_POINTERS_GS 0x782E /* GEN7+ */
#define _3DSTATE_SAMPLER_STATE_POINTERS_PS 0x782F /* GEN7+ */
1860
#define _3DSTATE_VERTEX_BUFFERS 0x7808
/* The BRW_ and GEN6_ variants place the same fields at different bits. */
# define BRW_VB0_INDEX_SHIFT 27
# define GEN6_VB0_INDEX_SHIFT 26
# define BRW_VB0_ACCESS_VERTEXDATA (0 << 26)
# define BRW_VB0_ACCESS_INSTANCEDATA (1 << 26)
# define GEN6_VB0_ACCESS_VERTEXDATA (0 << 20)
# define GEN6_VB0_ACCESS_INSTANCEDATA (1 << 20)
# define GEN7_VB0_ADDRESS_MODIFYENABLE (1 << 14)
# define BRW_VB0_PITCH_SHIFT 0

#define _3DSTATE_VERTEX_ELEMENTS 0x7809
# define BRW_VE0_INDEX_SHIFT 27
# define GEN6_VE0_INDEX_SHIFT 26
# define BRW_VE0_FORMAT_SHIFT 16
# define BRW_VE0_VALID (1 << 26)
# define GEN6_VE0_VALID (1 << 25)
# define GEN6_VE0_EDGE_FLAG_ENABLE (1 << 15)
# define BRW_VE0_SRC_OFFSET_SHIFT 0
/* Component control values, placed with the BRW_VE1_COMPONENT_n_SHIFTs. */
# define BRW_VE1_COMPONENT_NOSTORE 0
# define BRW_VE1_COMPONENT_STORE_SRC 1
# define BRW_VE1_COMPONENT_STORE_0 2
# define BRW_VE1_COMPONENT_STORE_1_FLT 3
# define BRW_VE1_COMPONENT_STORE_1_INT 4
# define BRW_VE1_COMPONENT_STORE_VID 5
# define BRW_VE1_COMPONENT_STORE_IID 6
# define BRW_VE1_COMPONENT_STORE_PID 7
# define BRW_VE1_COMPONENT_0_SHIFT 28
# define BRW_VE1_COMPONENT_1_SHIFT 24
# define BRW_VE1_COMPONENT_2_SHIFT 20
# define BRW_VE1_COMPONENT_3_SHIFT 16
# define BRW_VE1_DST_OFFSET_SHIFT 0
1892
#define CMD_INDEX_BUFFER 0x780a
#define GEN4_3DSTATE_VF_STATISTICS 0x780b
#define GM45_3DSTATE_VF_STATISTICS 0x680b
#define _3DSTATE_CC_STATE_POINTERS 0x780e /* GEN6+ */
#define _3DSTATE_BLEND_STATE_POINTERS 0x7824 /* GEN7+ */
#define _3DSTATE_DEPTH_STENCIL_STATE_POINTERS 0x7825 /* GEN7+ */

#define _3DSTATE_URB 0x7805 /* GEN6 */
# define GEN6_URB_VS_SIZE_SHIFT 16
# define GEN6_URB_VS_ENTRIES_SHIFT 0
# define GEN6_URB_GS_ENTRIES_SHIFT 8
# define GEN6_URB_GS_SIZE_SHIFT 0

#define _3DSTATE_VF 0x780c /* GEN7.5+ */
#define HSW_CUT_INDEX_ENABLE (1 << 8)

#define _3DSTATE_VF_INSTANCING 0x7849 /* GEN8+ */
# define GEN8_VF_INSTANCING_ENABLE (1 << 8)

#define _3DSTATE_VF_SGVS 0x784a /* GEN8+ */
/* Bit 31 uses an unsigned literal: `1 << 31` overflows a 32-bit int. */
# define GEN8_SGVS_ENABLE_INSTANCE_ID (1u << 31)
# define GEN8_SGVS_INSTANCE_ID_COMPONENT_SHIFT 29
# define GEN8_SGVS_INSTANCE_ID_ELEMENT_OFFSET_SHIFT 16
# define GEN8_SGVS_ENABLE_VERTEX_ID (1 << 15)
# define GEN8_SGVS_VERTEX_ID_COMPONENT_SHIFT 13
# define GEN8_SGVS_VERTEX_ID_ELEMENT_OFFSET_SHIFT 0

#define _3DSTATE_VF_TOPOLOGY 0x784b /* GEN8+ */

#define _3DSTATE_WM_CHROMAKEY 0x784c /* GEN8+ */
1923
/* GEN7+ uses one URB allocation command per shader stage. */
#define _3DSTATE_URB_VS 0x7830 /* GEN7+ */
#define _3DSTATE_URB_HS 0x7831 /* GEN7+ */
#define _3DSTATE_URB_DS 0x7832 /* GEN7+ */
#define _3DSTATE_URB_GS 0x7833 /* GEN7+ */
# define GEN7_URB_ENTRY_SIZE_SHIFT 16
# define GEN7_URB_STARTING_ADDRESS_SHIFT 25

/* Gen7 "GS URB Entry Allocation Size" is a U9-1 field, so the maximum gs_size
 * is 2^9, or 512. It's counted in multiples of 64 bytes.
 */
#define GEN7_MAX_GS_URB_ENTRY_SIZE_BYTES (512*64)
/* Gen6 "GS URB Entry Allocation Size" is defined as a number of 1024-bit
 * (128 bytes) URB rows and the maximum allowed value is 5 rows.
 */
#define GEN6_MAX_GS_URB_ENTRY_SIZE_BYTES (5*128)

#define _3DSTATE_PUSH_CONSTANT_ALLOC_VS 0x7912 /* GEN7+ */
#define _3DSTATE_PUSH_CONSTANT_ALLOC_HS 0x7913 /* GEN7+ */
#define _3DSTATE_PUSH_CONSTANT_ALLOC_DS 0x7914 /* GEN7+ */
#define _3DSTATE_PUSH_CONSTANT_ALLOC_GS 0x7915 /* GEN7+ */
#define _3DSTATE_PUSH_CONSTANT_ALLOC_PS 0x7916 /* GEN7+ */
# define GEN7_PUSH_CONSTANT_BUFFER_OFFSET_SHIFT 16

#define _3DSTATE_VIEWPORT_STATE_POINTERS 0x780d /* GEN6+ */
# define GEN6_CC_VIEWPORT_MODIFY (1 << 12)
# define GEN6_SF_VIEWPORT_MODIFY (1 << 11)
# define GEN6_CLIP_VIEWPORT_MODIFY (1 << 10)
# define GEN6_NUM_VIEWPORTS 16

#define _3DSTATE_VIEWPORT_STATE_POINTERS_CC 0x7823 /* GEN7+ */
#define _3DSTATE_VIEWPORT_STATE_POINTERS_SF_CL 0x7821 /* GEN7+ */

#define _3DSTATE_SCISSOR_STATE_POINTERS 0x780f /* GEN6+ */
1957
/* 3DSTATE_VS command opcode and field definitions, grouped by dword. */
#define _3DSTATE_VS 0x7810 /* GEN6+ */
/* DW2 */
/* Bit 31 uses an unsigned literal: `1 << 31` overflows a 32-bit int. */
# define GEN6_VS_SPF_MODE (1u << 31)
# define GEN6_VS_VECTOR_MASK_ENABLE (1 << 30)
# define GEN6_VS_SAMPLER_COUNT_SHIFT 27
# define GEN6_VS_BINDING_TABLE_ENTRY_COUNT_SHIFT 18
# define GEN6_VS_FLOATING_POINT_MODE_IEEE_754 (0 << 16)
# define GEN6_VS_FLOATING_POINT_MODE_ALT (1 << 16)
# define HSW_VS_UAV_ACCESS_ENABLE (1 << 12)
/* DW4 */
# define GEN6_VS_DISPATCH_START_GRF_SHIFT 20
# define GEN6_VS_URB_READ_LENGTH_SHIFT 11
# define GEN6_VS_URB_ENTRY_READ_OFFSET_SHIFT 4
/* DW5 */
# define GEN6_VS_MAX_THREADS_SHIFT 25
# define HSW_VS_MAX_THREADS_SHIFT 23
# define GEN6_VS_STATISTICS_ENABLE (1 << 10)
# define GEN6_VS_CACHE_DISABLE (1 << 1)
# define GEN6_VS_ENABLE (1 << 0)
/* Gen8+ DW7 */
# define GEN8_VS_SIMD8_ENABLE (1 << 2)
/* Gen8+ DW8 */
# define GEN8_VS_URB_ENTRY_OUTPUT_OFFSET_SHIFT 21
# define GEN8_VS_URB_OUTPUT_LENGTH_SHIFT 16
# define GEN8_VS_USER_CLIP_DISTANCE_SHIFT 8
1983
/* 3DSTATE_GS command opcode and field definitions, grouped by dword. */
#define _3DSTATE_GS 0x7811 /* GEN6+ */
/* DW2 */
/* Bit 31 uses an unsigned literal: `1 << 31` overflows a 32-bit int. */
# define GEN6_GS_SPF_MODE (1u << 31)
# define GEN6_GS_VECTOR_MASK_ENABLE (1 << 30)
# define GEN6_GS_SAMPLER_COUNT_SHIFT 27
# define GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT 18
# define GEN6_GS_FLOATING_POINT_MODE_IEEE_754 (0 << 16)
# define GEN6_GS_FLOATING_POINT_MODE_ALT (1 << 16)
# define HSW_GS_UAV_ACCESS_ENABLE (1 << 12)
/* DW4 */
# define GEN7_GS_OUTPUT_VERTEX_SIZE_SHIFT 23
# define GEN7_GS_OUTPUT_TOPOLOGY_SHIFT 17
# define GEN6_GS_URB_READ_LENGTH_SHIFT 11
# define GEN7_GS_INCLUDE_VERTEX_HANDLES (1 << 10)
# define GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT 4
# define GEN6_GS_DISPATCH_START_GRF_SHIFT 0
/* DW5 */
# define GEN6_GS_MAX_THREADS_SHIFT 25
# define HSW_GS_MAX_THREADS_SHIFT 24
# define IVB_GS_CONTROL_DATA_FORMAT_SHIFT 24
# define GEN7_GS_CONTROL_DATA_FORMAT_GSCTL_CUT 0
# define GEN7_GS_CONTROL_DATA_FORMAT_GSCTL_SID 1
# define GEN7_GS_CONTROL_DATA_HEADER_SIZE_SHIFT 20
# define GEN7_GS_INSTANCE_CONTROL_SHIFT 15
# define GEN7_GS_DISPATCH_MODE_SHIFT 11
# define GEN7_GS_DISPATCH_MODE_MASK INTEL_MASK(12, 11)
# define GEN6_GS_STATISTICS_ENABLE (1 << 10)
# define GEN6_GS_SO_STATISTICS_ENABLE (1 << 9)
# define GEN6_GS_RENDERING_ENABLE (1 << 8)
# define GEN7_GS_INCLUDE_PRIMITIVE_ID (1 << 4)
# define GEN7_GS_REORDER_TRAILING (1 << 2)
# define GEN7_GS_ENABLE (1 << 0)
/* DW6 */
# define HSW_GS_CONTROL_DATA_FORMAT_SHIFT 31
# define GEN6_GS_REORDER (1 << 30)
# define GEN6_GS_DISCARD_ADJACENCY (1 << 29)
# define GEN6_GS_SVBI_PAYLOAD_ENABLE (1 << 28)
# define GEN6_GS_SVBI_POSTINCREMENT_ENABLE (1 << 27)
# define GEN6_GS_SVBI_POSTINCREMENT_VALUE_SHIFT 16
# define GEN6_GS_SVBI_POSTINCREMENT_VALUE_MASK INTEL_MASK(25, 16)
# define GEN6_GS_ENABLE (1 << 15)

/* Gen8+ DW8 */
# define GEN8_GS_STATIC_OUTPUT (1 << 30)
# define GEN8_GS_STATIC_VERTEX_COUNT_SHIFT 16
# define GEN8_GS_STATIC_VERTEX_COUNT_MASK INTEL_MASK(26, 16)

/* Gen8+ DW9 */
# define GEN8_GS_URB_ENTRY_OUTPUT_OFFSET_SHIFT 21
# define GEN8_GS_URB_OUTPUT_LENGTH_SHIFT 16
# define GEN8_GS_USER_CLIP_DISTANCE_SHIFT 8

# define BRW_GS_EDGE_INDICATOR_0 (1 << 8)
# define BRW_GS_EDGE_INDICATOR_1 (1 << 9)

/* GS Thread Payload
 */
/* R0 */
# define GEN7_GS_PAYLOAD_INSTANCE_ID_SHIFT 27

/* 3DSTATE_GS "Output Vertex Size" has an effective maximum of 62. It's
 * counted in multiples of 16 bytes.
 */
#define GEN7_MAX_GS_OUTPUT_VERTEX_SIZE_BYTES (62*16)
2048
/* 3DSTATE_HS command opcode and field definitions, grouped by dword. */
#define _3DSTATE_HS 0x781B /* GEN7+ */
/* DW1 */
# define GEN7_HS_SAMPLER_COUNT_MASK INTEL_MASK(29, 27)
# define GEN7_HS_SAMPLER_COUNT_SHIFT 27
# define GEN7_HS_BINDING_TABLE_ENTRY_COUNT_MASK INTEL_MASK(25, 18)
# define GEN7_HS_BINDING_TABLE_ENTRY_COUNT_SHIFT 18
# define GEN7_HS_FLOATING_POINT_MODE_IEEE_754 (0 << 16)
# define GEN7_HS_FLOATING_POINT_MODE_ALT (1 << 16)
# define GEN7_HS_MAX_THREADS_SHIFT 0
/* DW2 */
/* Bit 31 uses an unsigned literal: `1 << 31` overflows a 32-bit int. */
# define GEN7_HS_ENABLE (1u << 31)
# define GEN7_HS_STATISTICS_ENABLE (1 << 29)
# define GEN8_HS_MAX_THREADS_SHIFT 8
# define GEN7_HS_INSTANCE_COUNT_MASK INTEL_MASK(3, 0)
# define GEN7_HS_INSTANCE_COUNT_SHIFT 0
/* DW5 */
# define GEN7_HS_SINGLE_PROGRAM_FLOW (1 << 27)
# define GEN7_HS_VECTOR_MASK_ENABLE (1 << 26)
# define HSW_HS_ACCESSES_UAV (1 << 25)
# define GEN7_HS_INCLUDE_VERTEX_HANDLES (1 << 24)
# define GEN7_HS_DISPATCH_START_GRF_MASK INTEL_MASK(23, 19)
# define GEN7_HS_DISPATCH_START_GRF_SHIFT 19
# define GEN7_HS_URB_READ_LENGTH_MASK INTEL_MASK(16, 11)
# define GEN7_HS_URB_READ_LENGTH_SHIFT 11
# define GEN7_HS_URB_ENTRY_READ_OFFSET_MASK INTEL_MASK(9, 4)
# define GEN7_HS_URB_ENTRY_READ_OFFSET_SHIFT 4
2075
/* 3DSTATE_TE command opcode and DW1 field definitions. */
#define _3DSTATE_TE 0x781C /* GEN7+ */
/* DW1 */
# define GEN7_TE_PARTITIONING_SHIFT 12
# define GEN7_TE_OUTPUT_TOPOLOGY_SHIFT 8
# define GEN7_TE_DOMAIN_SHIFT 4
/* GEN7_TE_MODE_SW (1 << 1) is deliberately not defined; it was already
 * commented out in this header.
 */
# define GEN7_TE_ENABLE (1 << 0)
2083
/* 3DSTATE_DS command opcode and field definitions, grouped by dword. */
#define _3DSTATE_DS 0x781D /* GEN7+ */
/* DW2 */
/* Bit 31 uses an unsigned literal: `1 << 31` overflows a 32-bit int. */
# define GEN7_DS_SINGLE_DOMAIN_POINT_DISPATCH (1u << 31)
# define GEN7_DS_VECTOR_MASK_ENABLE (1 << 30)
# define GEN7_DS_SAMPLER_COUNT_MASK INTEL_MASK(29, 27)
# define GEN7_DS_SAMPLER_COUNT_SHIFT 27
# define GEN7_DS_BINDING_TABLE_ENTRY_COUNT_MASK INTEL_MASK(25, 18)
# define GEN7_DS_BINDING_TABLE_ENTRY_COUNT_SHIFT 18
# define GEN7_DS_FLOATING_POINT_MODE_IEEE_754 (0 << 16)
# define GEN7_DS_FLOATING_POINT_MODE_ALT (1 << 16)
# define HSW_DS_ACCESSES_UAV (1 << 14)
/* DW4 */
# define GEN7_DS_DISPATCH_START_GRF_MASK INTEL_MASK(24, 20)
# define GEN7_DS_DISPATCH_START_GRF_SHIFT 20
# define GEN7_DS_URB_READ_LENGTH_MASK INTEL_MASK(17, 11)
# define GEN7_DS_URB_READ_LENGTH_SHIFT 11
# define GEN7_DS_URB_ENTRY_READ_OFFSET_MASK INTEL_MASK(9, 4)
# define GEN7_DS_URB_ENTRY_READ_OFFSET_SHIFT 4
/* DW5 */
# define GEN7_DS_MAX_THREADS_SHIFT 25
# define HSW_DS_MAX_THREADS_SHIFT 21
# define GEN7_DS_STATISTICS_ENABLE (1 << 10)
# define GEN7_DS_SIMD8_DISPATCH_ENABLE (1 << 3)
# define GEN7_DS_COMPUTE_W_COORDINATE_ENABLE (1 << 2)
# define GEN7_DS_CACHE_DISABLE (1 << 1)
# define GEN7_DS_ENABLE (1 << 0)
/* Gen8+ DW8 */
# define GEN8_DS_URB_ENTRY_OUTPUT_OFFSET_MASK INTEL_MASK(26, 21)
# define GEN8_DS_URB_ENTRY_OUTPUT_OFFSET_SHIFT 21
# define GEN8_DS_URB_OUTPUT_LENGTH_MASK INTEL_MASK(20, 16)
# define GEN8_DS_URB_OUTPUT_LENGTH_SHIFT 16
# define GEN8_DS_USER_CLIP_DISTANCE_MASK INTEL_MASK(15, 8)
# define GEN8_DS_USER_CLIP_DISTANCE_SHIFT 8
# define GEN8_DS_USER_CULL_DISTANCE_MASK INTEL_MASK(7, 0)
# define GEN8_DS_USER_CULL_DISTANCE_SHIFT 0
2119
2120
/* 3DSTATE_CLIP command opcode and field definitions, grouped by dword. */
#define _3DSTATE_CLIP 0x7812 /* GEN6+ */
/* DW1 */
# define GEN7_CLIP_WINDING_CW (0 << 20)
# define GEN7_CLIP_WINDING_CCW (1 << 20)
# define GEN7_CLIP_VERTEX_SUBPIXEL_PRECISION_8 (0 << 19)
# define GEN7_CLIP_VERTEX_SUBPIXEL_PRECISION_4 (1 << 19)
# define GEN7_CLIP_EARLY_CULL (1 << 18)
# define GEN7_CLIP_CULLMODE_BOTH (0 << 16)
# define GEN7_CLIP_CULLMODE_NONE (1 << 16)
# define GEN7_CLIP_CULLMODE_FRONT (2 << 16)
# define GEN7_CLIP_CULLMODE_BACK (3 << 16)
# define GEN6_CLIP_STATISTICS_ENABLE (1 << 10)
/**
 * Just does cheap culling based on the clip distance. Bits must be
 * disjoint with USER_CLIP_CLIP_DISTANCE bits.
 */
# define GEN6_USER_CLIP_CULL_DISTANCES_SHIFT 0
/* DW2 */
/* Bit 31 uses an unsigned literal: `1 << 31` overflows a 32-bit int. */
# define GEN6_CLIP_ENABLE (1u << 31)
# define GEN6_CLIP_API_OGL (0 << 30)
# define GEN6_CLIP_API_D3D (1 << 30)
# define GEN6_CLIP_XY_TEST (1 << 28)
# define GEN6_CLIP_Z_TEST (1 << 27)
# define GEN6_CLIP_GB_TEST (1 << 26)
/** 8-bit field of which user clip distances to clip against. */
# define GEN6_USER_CLIP_CLIP_DISTANCES_SHIFT 16
# define GEN6_CLIP_MODE_NORMAL (0 << 13)
# define GEN6_CLIP_MODE_REJECT_ALL (3 << 13)
# define GEN6_CLIP_MODE_ACCEPT_ALL (4 << 13)
# define GEN6_CLIP_PERSPECTIVE_DIVIDE_DISABLE (1 << 9)
# define GEN6_CLIP_NON_PERSPECTIVE_BARYCENTRIC_ENABLE (1 << 8)
# define GEN6_CLIP_TRI_PROVOKE_SHIFT 4
# define GEN6_CLIP_LINE_PROVOKE_SHIFT 2
# define GEN6_CLIP_TRIFAN_PROVOKE_SHIFT 0
/* DW3 */
# define GEN6_CLIP_MIN_POINT_WIDTH_SHIFT 17
# define GEN6_CLIP_MAX_POINT_WIDTH_SHIFT 6
# define GEN6_CLIP_FORCE_ZERO_RTAINDEX (1 << 5)
# define GEN6_CLIP_MAX_VP_INDEX_MASK INTEL_MASK(3, 0)
2160
/* 3DSTATE_SF command opcode and field definitions, grouped by dword. */
#define _3DSTATE_SF 0x7813 /* GEN6+ */
/* DW1 (for gen6) */
# define GEN6_SF_NUM_OUTPUTS_SHIFT 22
# define GEN6_SF_SWIZZLE_ENABLE (1 << 21)
# define GEN6_SF_POINT_SPRITE_UPPERLEFT (0 << 20)
# define GEN6_SF_POINT_SPRITE_LOWERLEFT (1 << 20)
# define GEN9_SF_LINE_WIDTH_SHIFT 12 /* U11.7 */
# define GEN6_SF_URB_ENTRY_READ_LENGTH_SHIFT 11
# define GEN6_SF_URB_ENTRY_READ_OFFSET_SHIFT 4
/* DW2 */
# define GEN6_SF_LEGACY_GLOBAL_DEPTH_BIAS (1 << 11)
# define GEN6_SF_STATISTICS_ENABLE (1 << 10)
# define GEN6_SF_GLOBAL_DEPTH_OFFSET_SOLID (1 << 9)
# define GEN6_SF_GLOBAL_DEPTH_OFFSET_WIREFRAME (1 << 8)
# define GEN6_SF_GLOBAL_DEPTH_OFFSET_POINT (1 << 7)
# define GEN6_SF_FRONT_SOLID (0 << 5)
# define GEN6_SF_FRONT_WIREFRAME (1 << 5)
# define GEN6_SF_FRONT_POINT (2 << 5)
# define GEN6_SF_BACK_SOLID (0 << 3)
# define GEN6_SF_BACK_WIREFRAME (1 << 3)
# define GEN6_SF_BACK_POINT (2 << 3)
# define GEN6_SF_VIEWPORT_TRANSFORM_ENABLE (1 << 1)
# define GEN6_SF_WINDING_CCW (1 << 0)
/* DW3 */
/* Bit 31 uses an unsigned literal: `1 << 31` overflows a 32-bit int. */
# define GEN6_SF_LINE_AA_ENABLE (1u << 31)
# define GEN6_SF_CULL_BOTH (0 << 29)
# define GEN6_SF_CULL_NONE (1 << 29)
# define GEN6_SF_CULL_FRONT (2 << 29)
# define GEN6_SF_CULL_BACK (3 << 29)
# define GEN6_SF_LINE_WIDTH_SHIFT 18 /* U3.7 */
# define GEN6_SF_LINE_END_CAP_WIDTH_0_5 (0 << 16)
# define GEN6_SF_LINE_END_CAP_WIDTH_1_0 (1 << 16)
# define GEN6_SF_LINE_END_CAP_WIDTH_2_0 (2 << 16)
# define GEN6_SF_LINE_END_CAP_WIDTH_4_0 (3 << 16)
# define GEN6_SF_SCISSOR_ENABLE (1 << 11)
# define GEN6_SF_MSRAST_OFF_PIXEL (0 << 8)
# define GEN6_SF_MSRAST_OFF_PATTERN (1 << 8)
# define GEN6_SF_MSRAST_ON_PIXEL (2 << 8)
# define GEN6_SF_MSRAST_ON_PATTERN (3 << 8)
/* DW4 */
# define GEN6_SF_TRI_PROVOKE_SHIFT 29
# define GEN6_SF_LINE_PROVOKE_SHIFT 27
# define GEN6_SF_TRIFAN_PROVOKE_SHIFT 25
# define GEN6_SF_LINE_AA_MODE_MANHATTAN (0 << 14)
# define GEN6_SF_LINE_AA_MODE_TRUE (1 << 14)
# define GEN6_SF_VERTEX_SUBPIXEL_8BITS (0 << 12)
# define GEN6_SF_VERTEX_SUBPIXEL_4BITS (1 << 12)
# define GEN6_SF_USE_STATE_POINT_WIDTH (1 << 11)
# define GEN6_SF_POINT_WIDTH_SHIFT 0 /* U8.3 */
/* DW5: depth offset constant */
/* DW6: depth offset scale */
/* DW7: depth offset clamp */
/* DW8 */
/* Each attribute-setup dword packs two attributes: ATTRIBUTE_0 in the
 * low 16 bits and ATTRIBUTE_1 in the high 16 bits.
 */
# define ATTRIBUTE_1_OVERRIDE_W (1u << 31)
# define ATTRIBUTE_1_OVERRIDE_Z (1 << 30)
# define ATTRIBUTE_1_OVERRIDE_Y (1 << 29)
# define ATTRIBUTE_1_OVERRIDE_X (1 << 28)
# define ATTRIBUTE_1_CONST_SOURCE_SHIFT 25
# define ATTRIBUTE_1_SWIZZLE_SHIFT 22
# define ATTRIBUTE_1_SOURCE_SHIFT 16
# define ATTRIBUTE_0_OVERRIDE_W (1 << 15)
# define ATTRIBUTE_0_OVERRIDE_Z (1 << 14)
# define ATTRIBUTE_0_OVERRIDE_Y (1 << 13)
# define ATTRIBUTE_0_OVERRIDE_X (1 << 12)
# define ATTRIBUTE_0_CONST_SOURCE_SHIFT 9
# define ATTRIBUTE_CONST_0000 0
# define ATTRIBUTE_CONST_0001_FLOAT 1
# define ATTRIBUTE_CONST_1111_FLOAT 2
# define ATTRIBUTE_CONST_PRIM_ID 3
# define ATTRIBUTE_0_SWIZZLE_SHIFT 6
# define ATTRIBUTE_0_SOURCE_SHIFT 0

# define ATTRIBUTE_SWIZZLE_INPUTATTR 0
# define ATTRIBUTE_SWIZZLE_INPUTATTR_FACING 1
# define ATTRIBUTE_SWIZZLE_INPUTATTR_W 2
# define ATTRIBUTE_SWIZZLE_INPUTATTR_FACING_W 3
# define ATTRIBUTE_SWIZZLE_SHIFT 6

/* DW16: Point sprite texture coordinate enables */
/* DW17: Constant interpolation enables */
/* DW18: attr 0-7 wrap shortest enables */
/* DW19: attr 8-15 wrap shortest enables */

/* On GEN7, many fields of 3DSTATE_SF were split out into a new command:
 * 3DSTATE_SBE. The remaining fields live in different DWords, but retain
 * the same bit-offset. The only new field:
 */
/* GEN7/DW1: */
# define GEN7_SF_DEPTH_BUFFER_SURFACE_FORMAT_SHIFT 12
/* GEN7/DW2: */
# define HSW_SF_LINE_STIPPLE_ENABLE (1 << 14)

# define GEN8_SF_SMOOTH_POINT_ENABLE (1 << 13)
2254
/* 3DSTATE_SBE command opcode and field definitions. */
#define _3DSTATE_SBE 0x781F /* GEN7+ */
/* DW1 */
# define GEN8_SBE_FORCE_URB_ENTRY_READ_LENGTH (1 << 29)
# define GEN8_SBE_FORCE_URB_ENTRY_READ_OFFSET (1 << 28)
# define GEN7_SBE_SWIZZLE_CONTROL_MODE (1 << 28)
# define GEN7_SBE_NUM_OUTPUTS_SHIFT 22
# define GEN7_SBE_SWIZZLE_ENABLE (1 << 21)
# define GEN7_SBE_POINT_SPRITE_LOWERLEFT (1 << 20)
# define GEN7_SBE_URB_ENTRY_READ_LENGTH_SHIFT 11
# define GEN7_SBE_URB_ENTRY_READ_OFFSET_SHIFT 4
# define GEN8_SBE_URB_ENTRY_READ_OFFSET_SHIFT 5
/* DW2-9: Attribute setup (same as DW8-15 of gen6 _3DSTATE_SF) */
/* DW10: Point sprite texture coordinate enables */
/* DW11: Constant interpolation enables */
/* DW12: attr 0-7 wrap shortest enables */
/* DW13: attr 8-15 wrap shortest enables */

/* DW4-5: Attribute active components (gen9) */
#define GEN9_SBE_ACTIVE_COMPONENT_NONE 0
#define GEN9_SBE_ACTIVE_COMPONENT_XY 1
#define GEN9_SBE_ACTIVE_COMPONENT_XYZ 2
#define GEN9_SBE_ACTIVE_COMPONENT_XYZW 3

#define _3DSTATE_SBE_SWIZ 0x7851 /* GEN8+ */
2279
/* 3DSTATE_RASTER command opcode and DW1 field definitions. */
#define _3DSTATE_RASTER 0x7850 /* GEN8+ */
/* DW1 */
# define GEN9_RASTER_VIEWPORT_Z_FAR_CLIP_TEST_ENABLE (1 << 26)
# define GEN8_RASTER_FRONT_WINDING_CCW (1 << 21)
# define GEN8_RASTER_CULL_BOTH (0 << 16)
# define GEN8_RASTER_CULL_NONE (1 << 16)
# define GEN8_RASTER_CULL_FRONT (2 << 16)
# define GEN8_RASTER_CULL_BACK (3 << 16)
# define GEN8_RASTER_SMOOTH_POINT_ENABLE (1 << 13)
# define GEN8_RASTER_API_MULTISAMPLE_ENABLE (1 << 12)
# define GEN8_RASTER_LINE_AA_ENABLE (1 << 2)
# define GEN8_RASTER_SCISSOR_ENABLE (1 << 1)
/* The GEN8 Z clip test and the GEN9 near-Z clip test share bit 0. */
# define GEN8_RASTER_VIEWPORT_Z_CLIP_TEST_ENABLE (1 << 0)
# define GEN9_RASTER_VIEWPORT_Z_NEAR_CLIP_TEST_ENABLE (1 << 0)
2294
/* Gen8 BLEND_STATE */
/* Bit-31 flags below use unsigned literals: `1 << 31` overflows a
 * 32-bit int.
 */
/* DW0 */
#define GEN8_BLEND_ALPHA_TO_COVERAGE_ENABLE (1u << 31)
#define GEN8_BLEND_INDEPENDENT_ALPHA_BLEND_ENABLE (1 << 30)
#define GEN8_BLEND_ALPHA_TO_ONE_ENABLE (1 << 29)
#define GEN8_BLEND_ALPHA_TO_COVERAGE_DITHER_ENABLE (1 << 28)
#define GEN8_BLEND_ALPHA_TEST_ENABLE (1 << 27)
#define GEN8_BLEND_ALPHA_TEST_FUNCTION_MASK INTEL_MASK(26, 24)
#define GEN8_BLEND_ALPHA_TEST_FUNCTION_SHIFT 24
#define GEN8_BLEND_COLOR_DITHER_ENABLE (1 << 23)
#define GEN8_BLEND_X_DITHER_OFFSET_MASK INTEL_MASK(22, 21)
#define GEN8_BLEND_X_DITHER_OFFSET_SHIFT 21
#define GEN8_BLEND_Y_DITHER_OFFSET_MASK INTEL_MASK(20, 19)
#define GEN8_BLEND_Y_DITHER_OFFSET_SHIFT 19
/* DW1 + 2n */
#define GEN8_BLEND_COLOR_BUFFER_BLEND_ENABLE (1u << 31)
#define GEN8_BLEND_SRC_BLEND_FACTOR_MASK INTEL_MASK(30, 26)
#define GEN8_BLEND_SRC_BLEND_FACTOR_SHIFT 26
#define GEN8_BLEND_DST_BLEND_FACTOR_MASK INTEL_MASK(25, 21)
#define GEN8_BLEND_DST_BLEND_FACTOR_SHIFT 21
#define GEN8_BLEND_COLOR_BLEND_FUNCTION_MASK INTEL_MASK(20, 18)
#define GEN8_BLEND_COLOR_BLEND_FUNCTION_SHIFT 18
#define GEN8_BLEND_SRC_ALPHA_BLEND_FACTOR_MASK INTEL_MASK(17, 13)
#define GEN8_BLEND_SRC_ALPHA_BLEND_FACTOR_SHIFT 13
#define GEN8_BLEND_DST_ALPHA_BLEND_FACTOR_MASK INTEL_MASK(12, 8)
#define GEN8_BLEND_DST_ALPHA_BLEND_FACTOR_SHIFT 8
#define GEN8_BLEND_ALPHA_BLEND_FUNCTION_MASK INTEL_MASK(7, 5)
#define GEN8_BLEND_ALPHA_BLEND_FUNCTION_SHIFT 5
#define GEN8_BLEND_WRITE_DISABLE_ALPHA (1 << 3)
#define GEN8_BLEND_WRITE_DISABLE_RED (1 << 2)
#define GEN8_BLEND_WRITE_DISABLE_GREEN (1 << 1)
#define GEN8_BLEND_WRITE_DISABLE_BLUE (1 << 0)
/* DW1 + 2n + 1 */
#define GEN8_BLEND_LOGIC_OP_ENABLE (1u << 31)
#define GEN8_BLEND_LOGIC_OP_FUNCTION_MASK INTEL_MASK(30, 27)
#define GEN8_BLEND_LOGIC_OP_FUNCTION_SHIFT 27
#define GEN8_BLEND_PRE_BLEND_SRC_ONLY_CLAMP_ENABLE (1 << 4)
#define GEN8_BLEND_COLOR_CLAMP_RANGE_RTFORMAT (2 << 2)
#define GEN8_BLEND_PRE_BLEND_COLOR_CLAMP_ENABLE (1 << 1)
#define GEN8_BLEND_POST_BLEND_COLOR_CLAMP_ENABLE (1 << 0)
2335
/* 3DSTATE_WM_HZ_OP command opcode and field definitions, by dword. */
#define _3DSTATE_WM_HZ_OP 0x7852 /* GEN8+ */
/* DW1 */
/* Bit 31 uses an unsigned literal: `1 << 31` overflows a 32-bit int. */
# define GEN8_WM_HZ_STENCIL_CLEAR (1u << 31)
# define GEN8_WM_HZ_DEPTH_CLEAR (1 << 30)
# define GEN8_WM_HZ_DEPTH_RESOLVE (1 << 28)
# define GEN8_WM_HZ_HIZ_RESOLVE (1 << 27)
# define GEN8_WM_HZ_PIXEL_OFFSET_ENABLE (1 << 26)
# define GEN8_WM_HZ_FULL_SURFACE_DEPTH_CLEAR (1 << 25)
# define GEN8_WM_HZ_STENCIL_CLEAR_VALUE_MASK INTEL_MASK(23, 16)
# define GEN8_WM_HZ_STENCIL_CLEAR_VALUE_SHIFT 16
# define GEN8_WM_HZ_NUM_SAMPLES_MASK INTEL_MASK(15, 13)
# define GEN8_WM_HZ_NUM_SAMPLES_SHIFT 13
/* DW2 */
# define GEN8_WM_HZ_CLEAR_RECTANGLE_Y_MIN_MASK INTEL_MASK(31, 16)
# define GEN8_WM_HZ_CLEAR_RECTANGLE_Y_MIN_SHIFT 16
# define GEN8_WM_HZ_CLEAR_RECTANGLE_X_MIN_MASK INTEL_MASK(15, 0)
# define GEN8_WM_HZ_CLEAR_RECTANGLE_X_MIN_SHIFT 0
/* DW3 */
# define GEN8_WM_HZ_CLEAR_RECTANGLE_Y_MAX_MASK INTEL_MASK(31, 16)
# define GEN8_WM_HZ_CLEAR_RECTANGLE_Y_MAX_SHIFT 16
# define GEN8_WM_HZ_CLEAR_RECTANGLE_X_MAX_MASK INTEL_MASK(15, 0)
# define GEN8_WM_HZ_CLEAR_RECTANGLE_X_MAX_SHIFT 0
/* DW4 */
# define GEN8_WM_HZ_SAMPLE_MASK_MASK INTEL_MASK(15, 0)
# define GEN8_WM_HZ_SAMPLE_MASK_SHIFT 0
2361
2362
/* 3DSTATE_PS_BLEND command opcode and DW1 field definitions. */
#define _3DSTATE_PS_BLEND 0x784D /* GEN8+ */
/* DW1 */
/* Bit 31 uses an unsigned literal: `1 << 31` overflows a 32-bit int. */
# define GEN8_PS_BLEND_ALPHA_TO_COVERAGE_ENABLE (1u << 31)
# define GEN8_PS_BLEND_HAS_WRITEABLE_RT (1 << 30)
# define GEN8_PS_BLEND_COLOR_BUFFER_BLEND_ENABLE (1 << 29)
# define GEN8_PS_BLEND_SRC_ALPHA_BLEND_FACTOR_MASK INTEL_MASK(28, 24)
# define GEN8_PS_BLEND_SRC_ALPHA_BLEND_FACTOR_SHIFT 24
# define GEN8_PS_BLEND_DST_ALPHA_BLEND_FACTOR_MASK INTEL_MASK(23, 19)
# define GEN8_PS_BLEND_DST_ALPHA_BLEND_FACTOR_SHIFT 19
# define GEN8_PS_BLEND_SRC_BLEND_FACTOR_MASK INTEL_MASK(18, 14)
# define GEN8_PS_BLEND_SRC_BLEND_FACTOR_SHIFT 14
# define GEN8_PS_BLEND_DST_BLEND_FACTOR_MASK INTEL_MASK(13, 9)
# define GEN8_PS_BLEND_DST_BLEND_FACTOR_SHIFT 9
# define GEN8_PS_BLEND_ALPHA_TEST_ENABLE (1 << 8)
# define GEN8_PS_BLEND_INDEPENDENT_ALPHA_BLEND_ENABLE (1 << 7)
2378
/* 3DSTATE_WM_DEPTH_STENCIL command opcode and field definitions, by
 * dword.  "BF" names are the back-face counterparts of the plain fields.
 */
#define _3DSTATE_WM_DEPTH_STENCIL 0x784E /* GEN8+ */
/* DW1 */
# define GEN8_WM_DS_STENCIL_FAIL_OP_SHIFT 29
# define GEN8_WM_DS_Z_FAIL_OP_SHIFT 26
# define GEN8_WM_DS_Z_PASS_OP_SHIFT 23
# define GEN8_WM_DS_BF_STENCIL_FUNC_SHIFT 20
# define GEN8_WM_DS_BF_STENCIL_FAIL_OP_SHIFT 17
# define GEN8_WM_DS_BF_Z_FAIL_OP_SHIFT 14
# define GEN8_WM_DS_BF_Z_PASS_OP_SHIFT 11
# define GEN8_WM_DS_STENCIL_FUNC_SHIFT 8
# define GEN8_WM_DS_DEPTH_FUNC_SHIFT 5
# define GEN8_WM_DS_DOUBLE_SIDED_STENCIL_ENABLE (1 << 4)
# define GEN8_WM_DS_STENCIL_TEST_ENABLE (1 << 3)
# define GEN8_WM_DS_STENCIL_BUFFER_WRITE_ENABLE (1 << 2)
# define GEN8_WM_DS_DEPTH_TEST_ENABLE (1 << 1)
# define GEN8_WM_DS_DEPTH_BUFFER_WRITE_ENABLE (1 << 0)
/* DW2 */
# define GEN8_WM_DS_STENCIL_TEST_MASK_MASK INTEL_MASK(31, 24)
# define GEN8_WM_DS_STENCIL_TEST_MASK_SHIFT 24
# define GEN8_WM_DS_STENCIL_WRITE_MASK_MASK INTEL_MASK(23, 16)
# define GEN8_WM_DS_STENCIL_WRITE_MASK_SHIFT 16
# define GEN8_WM_DS_BF_STENCIL_TEST_MASK_MASK INTEL_MASK(15, 8)
# define GEN8_WM_DS_BF_STENCIL_TEST_MASK_SHIFT 8
# define GEN8_WM_DS_BF_STENCIL_WRITE_MASK_MASK INTEL_MASK(7, 0)
# define GEN8_WM_DS_BF_STENCIL_WRITE_MASK_SHIFT 0
/* DW3 */
# define GEN9_WM_DS_STENCIL_REF_MASK INTEL_MASK(15, 8)
# define GEN9_WM_DS_STENCIL_REF_SHIFT 8
# define GEN9_WM_DS_BF_STENCIL_REF_MASK INTEL_MASK(7, 0)
# define GEN9_WM_DS_BF_STENCIL_REF_SHIFT 0
2409
/* How the pixel shader (PS) relates to the depth value. */
enum brw_pixel_shader_computed_depth_mode {
   /* PS does not compute depth */
   BRW_PSCDEPTH_OFF = 0,

   /* PS computes depth; no guarantee about value */
   BRW_PSCDEPTH_ON = 1,

   /* PS guarantees output depth >= source depth */
   BRW_PSCDEPTH_ON_GE = 2,

   /* PS guarantees output depth <= source depth */
   BRW_PSCDEPTH_ON_LE = 3,
};
2416
/* Pixel shader input coverage mask modes. */
enum brw_pixel_shader_coverage_mask_mode {
   /* PS does not use input coverage masks. */
   BRW_PSICMS_OFF = 0,

   /* Input Coverage masks based on outer conservatism and factors in
    * SAMPLE_MASK.  If Pixel is conservatively covered, all samples are
    * enabled.
    */
   BRW_PSICMS_NORMAL = 1,

   /* Input Coverage masks based on inner conservatism and factors in
    * SAMPLE_MASK.  If Pixel is conservatively *FULLY* covered, all samples
    * are enabled.
    */
   BRW_PSICMS_INNER = 2,

   /* Mode 3.  NOTE(review): this header carries no description of the
    * mode; presumably a depth-based coverage mask -- confirm against the
    * hardware documentation.
    */
   BRW_PSICMS_DEPTH = 3,

   /* Original (misspelled, "PCICMS") name of BRW_PSICMS_DEPTH, retained so
    * existing users keep compiling.  Prefer BRW_PSICMS_DEPTH in new code.
    */
   BRW_PCICMS_DEPTH = BRW_PSICMS_DEPTH,
};
2431
/* 3DSTATE_PS_EXTRA (GEN8+) */
#define _3DSTATE_PS_EXTRA                               0x784F
/* DW1: GEN9-prefixed entries are the bits named for GEN9 in this header */
# define GEN8_PSX_PIXEL_SHADER_VALID                    (1 << 31)
# define GEN8_PSX_PIXEL_SHADER_NO_RT_WRITE              (1 << 30)
# define GEN8_PSX_OMASK_TO_RENDER_TARGET                (1 << 29)
# define GEN8_PSX_KILL_ENABLE                           (1 << 28)
# define GEN8_PSX_COMPUTED_DEPTH_MODE_SHIFT             26
# define GEN8_PSX_FORCE_COMPUTED_DEPTH                  (1 << 25)
# define GEN8_PSX_USES_SOURCE_DEPTH                     (1 << 24)
# define GEN8_PSX_USES_SOURCE_W                         (1 << 23)
# define GEN8_PSX_ATTRIBUTE_ENABLE                      (1 << 8)
# define GEN8_PSX_SHADER_DISABLES_ALPHA_TO_COVERAGE     (1 << 7)
# define GEN8_PSX_SHADER_IS_PER_SAMPLE                  (1 << 6)
# define GEN9_PSX_SHADER_COMPUTES_STENCIL               (1 << 5)
# define GEN9_PSX_SHADER_PULLS_BARY                     (1 << 3)
# define GEN8_PSX_SHADER_HAS_UAV                        (1 << 2)
# define GEN8_PSX_SHADER_USES_INPUT_COVERAGE_MASK       (1 << 1)
# define GEN9_PSX_SHADER_NORMAL_COVERAGE_MASK_SHIFT     0
2450
/* Barycentric interpolation modes.  The numeric values double as bit
 * positions in BRW_WM_NONPERSPECTIVE_BARYCENTRIC_BITS.
 */
enum brw_wm_barycentric_interp_mode {
   BRW_WM_PERSPECTIVE_PIXEL_BARYCENTRIC       = 0,
   BRW_WM_PERSPECTIVE_CENTROID_BARYCENTRIC    = 1,
   BRW_WM_PERSPECTIVE_SAMPLE_BARYCENTRIC      = 2,
   BRW_WM_NONPERSPECTIVE_PIXEL_BARYCENTRIC    = 3,
   BRW_WM_NONPERSPECTIVE_CENTROID_BARYCENTRIC = 4,
   BRW_WM_NONPERSPECTIVE_SAMPLE_BARYCENTRIC   = 5,
   /* Number of modes above; not itself a mode. */
   BRW_WM_BARYCENTRIC_INTERP_MODE_COUNT       = 6
};

/* Bitmask with one bit set for each of the three non-perspective modes. */
#define BRW_WM_NONPERSPECTIVE_BARYCENTRIC_BITS \
   ((1 << BRW_WM_NONPERSPECTIVE_PIXEL_BARYCENTRIC) | \
    (1 << BRW_WM_NONPERSPECTIVE_CENTROID_BARYCENTRIC) | \
    (1 << BRW_WM_NONPERSPECTIVE_SAMPLE_BARYCENTRIC))
2464
/* 3DSTATE_WM (GEN6+) */
#define _3DSTATE_WM                                     0x7814
/* DW1: kernel pointer */
/* DW2 */
# define GEN6_WM_SPF_MODE                               (1 << 31)
# define GEN6_WM_VECTOR_MASK_ENABLE                     (1 << 30)
# define GEN6_WM_SAMPLER_COUNT_SHIFT                    27
# define GEN6_WM_BINDING_TABLE_ENTRY_COUNT_SHIFT        18
# define GEN6_WM_FLOATING_POINT_MODE_IEEE_754           (0 << 16)
# define GEN6_WM_FLOATING_POINT_MODE_ALT                (1 << 16)
/* DW3: scratch space */
/* DW4 */
# define GEN6_WM_STATISTICS_ENABLE                      (1 << 31)
# define GEN6_WM_DEPTH_CLEAR                            (1 << 30)
# define GEN6_WM_DEPTH_RESOLVE                          (1 << 28)
# define GEN6_WM_HIERARCHICAL_DEPTH_RESOLVE             (1 << 27)
# define GEN6_WM_DISPATCH_START_GRF_SHIFT_0             16
# define GEN6_WM_DISPATCH_START_GRF_SHIFT_1             8
# define GEN6_WM_DISPATCH_START_GRF_SHIFT_2             0
/* DW5 */
# define GEN6_WM_MAX_THREADS_SHIFT                      25
# define GEN6_WM_KILL_ENABLE                            (1 << 22)
# define GEN6_WM_COMPUTED_DEPTH                         (1 << 21)
# define GEN6_WM_USES_SOURCE_DEPTH                      (1 << 20)
# define GEN6_WM_DISPATCH_ENABLE                        (1 << 19)
# define GEN6_WM_LINE_END_CAP_AA_WIDTH_0_5              (0 << 16)
# define GEN6_WM_LINE_END_CAP_AA_WIDTH_1_0              (1 << 16)
# define GEN6_WM_LINE_END_CAP_AA_WIDTH_2_0              (2 << 16)
# define GEN6_WM_LINE_END_CAP_AA_WIDTH_4_0              (3 << 16)
# define GEN6_WM_LINE_AA_WIDTH_0_5                      (0 << 14)
# define GEN6_WM_LINE_AA_WIDTH_1_0                      (1 << 14)
# define GEN6_WM_LINE_AA_WIDTH_2_0                      (2 << 14)
# define GEN6_WM_LINE_AA_WIDTH_4_0                      (3 << 14)
# define GEN6_WM_POLYGON_STIPPLE_ENABLE                 (1 << 13)
# define GEN6_WM_LINE_STIPPLE_ENABLE                    (1 << 11)
# define GEN6_WM_OMASK_TO_RENDER_TARGET                 (1 << 9)
# define GEN6_WM_USES_SOURCE_W                          (1 << 8)
# define GEN6_WM_DUAL_SOURCE_BLEND_ENABLE               (1 << 7)
# define GEN6_WM_32_DISPATCH_ENABLE                     (1 << 2)
# define GEN6_WM_16_DISPATCH_ENABLE                     (1 << 1)
# define GEN6_WM_8_DISPATCH_ENABLE                      (1 << 0)
/* DW6 */
# define GEN6_WM_NUM_SF_OUTPUTS_SHIFT                   20
# define GEN6_WM_POSOFFSET_NONE                         (0 << 18)
# define GEN6_WM_POSOFFSET_CENTROID                     (2 << 18)
# define GEN6_WM_POSOFFSET_SAMPLE                       (3 << 18)
# define GEN6_WM_POSITION_ZW_PIXEL                      (0 << 16)
# define GEN6_WM_POSITION_ZW_CENTROID                   (2 << 16)
# define GEN6_WM_POSITION_ZW_SAMPLE                     (3 << 16)
/* One bit per barycentric mode, occupying bits 15:10; the lowest bit sits
 * at GEN6_WM_BARYCENTRIC_INTERPOLATION_MODE_SHIFT.
 */
# define GEN6_WM_NONPERSPECTIVE_SAMPLE_BARYCENTRIC      (1 << 15)
# define GEN6_WM_NONPERSPECTIVE_CENTROID_BARYCENTRIC    (1 << 14)
# define GEN6_WM_NONPERSPECTIVE_PIXEL_BARYCENTRIC       (1 << 13)
# define GEN6_WM_PERSPECTIVE_SAMPLE_BARYCENTRIC         (1 << 12)
# define GEN6_WM_PERSPECTIVE_CENTROID_BARYCENTRIC       (1 << 11)
# define GEN6_WM_PERSPECTIVE_PIXEL_BARYCENTRIC          (1 << 10)
# define GEN6_WM_BARYCENTRIC_INTERPOLATION_MODE_SHIFT   10
# define GEN6_WM_POINT_RASTRULE_UPPER_RIGHT             (1 << 9)
# define GEN6_WM_MSRAST_OFF_PIXEL                       (0 << 1)
# define GEN6_WM_MSRAST_OFF_PATTERN                     (1 << 1)
# define GEN6_WM_MSRAST_ON_PIXEL                        (2 << 1)
# define GEN6_WM_MSRAST_ON_PATTERN                      (3 << 1)
# define GEN6_WM_MSDISPMODE_PERSAMPLE                   (0 << 0)
# define GEN6_WM_MSDISPMODE_PERPIXEL                    (1 << 0)
/* DW7: kernel 1 pointer */
/* DW8: kernel 2 pointer */
2529
/* 3DSTATE_CONSTANT_{VS,GS,PS} (GEN6+) and their buffer-enable bits */
#define _3DSTATE_CONSTANT_VS                            0x7815
#define _3DSTATE_CONSTANT_GS                            0x7816
#define _3DSTATE_CONSTANT_PS                            0x7817
# define GEN6_CONSTANT_BUFFER_3_ENABLE                  (1 << 15)
# define GEN6_CONSTANT_BUFFER_2_ENABLE                  (1 << 14)
# define GEN6_CONSTANT_BUFFER_1_ENABLE                  (1 << 13)
# define GEN6_CONSTANT_BUFFER_0_ENABLE                  (1 << 12)

/* 3DSTATE_CONSTANT_{HS,DS} (GEN7+) */
#define _3DSTATE_CONSTANT_HS                            0x7819
#define _3DSTATE_CONSTANT_DS                            0x781A
2540
/* 3DSTATE_STREAMOUT (GEN7+) */
#define _3DSTATE_STREAMOUT                              0x781e
/* DW1 */
# define SO_FUNCTION_ENABLE                             (1 << 31)
# define SO_RENDERING_DISABLE                           (1 << 30)
/* Chooses which incoming rendering stream continues down the pipeline.
 * Unless special cases in the GS state define otherwise, the rendering
 * stream is 0.
 */
# define SO_RENDER_STREAM_SELECT_SHIFT                  27
# define SO_RENDER_STREAM_SELECT_MASK                   INTEL_MASK(28, 27)
/* Governs how TRISTRIP_* elements are reordered in stream output (this
 * does not affect rendering).
 */
# define SO_REORDER_TRAILING                            (1 << 26)
/* Gates SO_NUM_PRIMS_WRITTEN_* and SO_PRIM_STORAGE_* */
# define SO_STATISTICS_ENABLE                           (1 << 25)
/* Enable bit for buffer n; buffer 0 is bit 8 */
# define SO_BUFFER_ENABLE(n)                            (1 << (8 + (n)))
/* DW2: per-stream vertex read offset (1 bit) and read length (5 bits) */
# define SO_STREAM_3_VERTEX_READ_OFFSET_SHIFT           29
# define SO_STREAM_3_VERTEX_READ_OFFSET_MASK            INTEL_MASK(29, 29)
# define SO_STREAM_3_VERTEX_READ_LENGTH_SHIFT           24
# define SO_STREAM_3_VERTEX_READ_LENGTH_MASK            INTEL_MASK(28, 24)
# define SO_STREAM_2_VERTEX_READ_OFFSET_SHIFT           21
# define SO_STREAM_2_VERTEX_READ_OFFSET_MASK            INTEL_MASK(21, 21)
# define SO_STREAM_2_VERTEX_READ_LENGTH_SHIFT           16
# define SO_STREAM_2_VERTEX_READ_LENGTH_MASK            INTEL_MASK(20, 16)
# define SO_STREAM_1_VERTEX_READ_OFFSET_SHIFT           13
# define SO_STREAM_1_VERTEX_READ_OFFSET_MASK            INTEL_MASK(13, 13)
# define SO_STREAM_1_VERTEX_READ_LENGTH_SHIFT           8
# define SO_STREAM_1_VERTEX_READ_LENGTH_MASK            INTEL_MASK(12, 8)
# define SO_STREAM_0_VERTEX_READ_OFFSET_SHIFT           5
# define SO_STREAM_0_VERTEX_READ_OFFSET_MASK            INTEL_MASK(5, 5)
# define SO_STREAM_0_VERTEX_READ_LENGTH_SHIFT           0
# define SO_STREAM_0_VERTEX_READ_LENGTH_MASK            INTEL_MASK(4, 0)
2573
/* Gen7 layout of 3DSTATE_WM */
/* DW1 */
# define GEN7_WM_STATISTICS_ENABLE                      (1 << 31)
# define GEN7_WM_DEPTH_CLEAR                            (1 << 30)
# define GEN7_WM_DISPATCH_ENABLE                        (1 << 29)
# define GEN7_WM_DEPTH_RESOLVE                          (1 << 28)
# define GEN7_WM_HIERARCHICAL_DEPTH_RESOLVE             (1 << 27)
# define GEN7_WM_KILL_ENABLE                            (1 << 25)
# define GEN7_WM_COMPUTED_DEPTH_MODE_SHIFT              23
# define GEN7_WM_EARLY_DS_CONTROL_NORMAL                (0 << 21)
# define GEN7_WM_EARLY_DS_CONTROL_PSEXEC                (1 << 21)
# define GEN7_WM_EARLY_DS_CONTROL_PREPS                 (2 << 21)
# define GEN7_WM_USES_SOURCE_DEPTH                      (1 << 20)
# define GEN7_WM_USES_SOURCE_W                          (1 << 19)
# define GEN7_WM_POSITION_ZW_PIXEL                      (0 << 17)
# define GEN7_WM_POSITION_ZW_CENTROID                   (2 << 17)
# define GEN7_WM_POSITION_ZW_SAMPLE                     (3 << 17)
# define GEN7_WM_BARYCENTRIC_INTERPOLATION_MODE_SHIFT   11
# define GEN7_WM_USES_INPUT_COVERAGE_MASK               (1 << 10)
# define GEN7_WM_LINE_END_CAP_AA_WIDTH_0_5              (0 << 8)
# define GEN7_WM_LINE_END_CAP_AA_WIDTH_1_0              (1 << 8)
# define GEN7_WM_LINE_END_CAP_AA_WIDTH_2_0              (2 << 8)
# define GEN7_WM_LINE_END_CAP_AA_WIDTH_4_0              (3 << 8)
# define GEN7_WM_LINE_AA_WIDTH_0_5                      (0 << 6)
# define GEN7_WM_LINE_AA_WIDTH_1_0                      (1 << 6)
# define GEN7_WM_LINE_AA_WIDTH_2_0                      (2 << 6)
# define GEN7_WM_LINE_AA_WIDTH_4_0                      (3 << 6)
# define GEN7_WM_POLYGON_STIPPLE_ENABLE                 (1 << 4)
# define GEN7_WM_LINE_STIPPLE_ENABLE                    (1 << 3)
# define GEN7_WM_POINT_RASTRULE_UPPER_RIGHT             (1 << 2)
# define GEN7_WM_MSRAST_OFF_PIXEL                       (0 << 0)
# define GEN7_WM_MSRAST_OFF_PATTERN                     (1 << 0)
# define GEN7_WM_MSRAST_ON_PIXEL                        (2 << 0)
# define GEN7_WM_MSRAST_ON_PATTERN                      (3 << 0)
/* DW2 */
# define GEN7_WM_MSDISPMODE_PERSAMPLE                   (0 << 31)
# define GEN7_WM_MSDISPMODE_PERPIXEL                    (1 << 31)
# define HSW_WM_UAV_ONLY                                (1 << 30)
2612
/* 3DSTATE_PS (GEN7+) */
#define _3DSTATE_PS                                     0x7820
/* DW1: kernel pointer */
/* DW2 */
# define GEN7_PS_SPF_MODE                               (1 << 31)
# define GEN7_PS_VECTOR_MASK_ENABLE                     (1 << 30)
# define GEN7_PS_SAMPLER_COUNT_SHIFT                    27
# define GEN7_PS_SAMPLER_COUNT_MASK                     INTEL_MASK(29, 27)
# define GEN7_PS_BINDING_TABLE_ENTRY_COUNT_SHIFT        18
# define GEN7_PS_FLOATING_POINT_MODE_IEEE_754           (0 << 16)
# define GEN7_PS_FLOATING_POINT_MODE_ALT                (1 << 16)
/* DW3: scratch space */
/* DW4: the max-threads shift differs between the IVB_ and HSW_ variants */
# define IVB_PS_MAX_THREADS_SHIFT                       24
# define HSW_PS_MAX_THREADS_SHIFT                       23
# define HSW_PS_SAMPLE_MASK_SHIFT                       12
# define HSW_PS_SAMPLE_MASK_MASK                        INTEL_MASK(19, 12)
# define GEN7_PS_PUSH_CONSTANT_ENABLE                   (1 << 11)
# define GEN7_PS_ATTRIBUTE_ENABLE                       (1 << 10)
# define GEN7_PS_OMASK_TO_RENDER_TARGET                 (1 << 9)
# define GEN7_PS_RENDER_TARGET_FAST_CLEAR_ENABLE        (1 << 8)
# define GEN7_PS_DUAL_SOURCE_BLEND_ENABLE               (1 << 7)
# define GEN7_PS_RENDER_TARGET_RESOLVE_ENABLE           (1 << 6)
# define HSW_PS_UAV_ACCESS_ENABLE                       (1 << 5)
# define GEN7_PS_POSOFFSET_NONE                         (0 << 3)
# define GEN7_PS_POSOFFSET_CENTROID                     (2 << 3)
# define GEN7_PS_POSOFFSET_SAMPLE                       (3 << 3)
# define GEN7_PS_32_DISPATCH_ENABLE                     (1 << 2)
# define GEN7_PS_16_DISPATCH_ENABLE                     (1 << 1)
# define GEN7_PS_8_DISPATCH_ENABLE                      (1 << 0)
/* DW5 */
# define GEN7_PS_DISPATCH_START_GRF_SHIFT_0             16
# define GEN7_PS_DISPATCH_START_GRF_SHIFT_1             8
# define GEN7_PS_DISPATCH_START_GRF_SHIFT_2             0
/* DW6: kernel 1 pointer */
/* DW7: kernel 2 pointer */
2648
/* GEN6+ */
#define _3DSTATE_SAMPLE_MASK                            0x7818

#define _3DSTATE_DRAWING_RECTANGLE                      0x7900
#define _3DSTATE_BLEND_CONSTANT_COLOR                   0x7901
#define _3DSTATE_CHROMA_KEY                             0x7904
/* GEN4-6 */
#define _3DSTATE_DEPTH_BUFFER                           0x7905
#define _3DSTATE_POLY_STIPPLE_OFFSET                    0x7906
#define _3DSTATE_POLY_STIPPLE_PATTERN                   0x7907
#define _3DSTATE_LINE_STIPPLE_PATTERN                   0x7908
#define _3DSTATE_GLOBAL_DEPTH_OFFSET_CLAMP              0x7909
/* G45+ */
#define _3DSTATE_AA_LINE_PARAMETERS                     0x790a
2660
/* 3DSTATE_GS_SVB_INDEX (CTG+) */
#define _3DSTATE_GS_SVB_INDEX                           0x790b
/* DW1 */
# define SVB_INDEX_SHIFT                                29
/* SNB+ */
# define SVB_LOAD_INTERNAL_VERTEX_COUNT                 (1 << 0)
/* DW2: SVB index */
/* DW3: SVB maximum index */
2667
/* 3DSTATE_MULTISAMPLE: GEN6+ value, and the separate GEN8+ value */
#define _3DSTATE_MULTISAMPLE                            0x790d
#define GEN8_3DSTATE_MULTISAMPLE                        0x780d
/* DW1: pixel location select (bit 4) and sample-count encoding (from bit 1) */
# define MS_PIXEL_LOCATION_CENTER                       (0 << 4)
# define MS_PIXEL_LOCATION_UPPER_LEFT                   (1 << 4)
# define MS_NUMSAMPLES_1                                (0 << 1)
# define MS_NUMSAMPLES_2                                (1 << 1)
# define MS_NUMSAMPLES_4                                (2 << 1)
# define MS_NUMSAMPLES_8                                (3 << 1)
# define MS_NUMSAMPLES_16                               (4 << 1)
2678
#define _3DSTATE_SAMPLE_PATTERN                         0x791c

/* ILK, SNB */
#define _3DSTATE_STENCIL_BUFFER                         0x790e
#define _3DSTATE_HIER_DEPTH_BUFFER                      0x790f

/* GEN7-prefixed values for the clear-params, depth, stencil and
 * hierarchical depth buffer state.
 */
#define GEN7_3DSTATE_CLEAR_PARAMS                       0x7804
#define GEN7_3DSTATE_DEPTH_BUFFER                       0x7805
#define GEN7_3DSTATE_STENCIL_BUFFER                     0x7806
# define HSW_STENCIL_ENABLED                            (1 << 31)
#define GEN7_3DSTATE_HIER_DEPTH_BUFFER                  0x7807
2689
/* 3DSTATE_CLEAR_PARAMS (ILK, SNB) */
#define _3DSTATE_CLEAR_PARAMS                           0x7910
# define GEN5_DEPTH_CLEAR_VALID                         (1 << 15)
/* DW1: depth clear value */
/* DW2 */
# define GEN7_DEPTH_CLEAR_VALID                         (1 << 0)
2695
/* 3DSTATE_SO_DECL_LIST (GEN7+) */
#define _3DSTATE_SO_DECL_LIST                           0x7917
/* DW1: a 4-bit buffer-select field for each of streams 0..3 */
# define SO_STREAM_TO_BUFFER_SELECTS_3_SHIFT            12
# define SO_STREAM_TO_BUFFER_SELECTS_3_MASK             INTEL_MASK(15, 12)
# define SO_STREAM_TO_BUFFER_SELECTS_2_SHIFT            8
# define SO_STREAM_TO_BUFFER_SELECTS_2_MASK             INTEL_MASK(11, 8)
# define SO_STREAM_TO_BUFFER_SELECTS_1_SHIFT            4
# define SO_STREAM_TO_BUFFER_SELECTS_1_MASK             INTEL_MASK(7, 4)
# define SO_STREAM_TO_BUFFER_SELECTS_0_SHIFT            0
# define SO_STREAM_TO_BUFFER_SELECTS_0_MASK             INTEL_MASK(3, 0)
/* DW2: an 8-bit entry count for each of streams 0..3 */
# define SO_NUM_ENTRIES_3_SHIFT                         24
# define SO_NUM_ENTRIES_3_MASK                          INTEL_MASK(31, 24)
# define SO_NUM_ENTRIES_2_SHIFT                         16
# define SO_NUM_ENTRIES_2_MASK                          INTEL_MASK(23, 16)
# define SO_NUM_ENTRIES_1_SHIFT                         8
# define SO_NUM_ENTRIES_1_MASK                          INTEL_MASK(15, 8)
# define SO_NUM_ENTRIES_0_SHIFT                         0
# define SO_NUM_ENTRIES_0_MASK                          INTEL_MASK(7, 0)

/* SO_DECL DW0 */
# define SO_DECL_OUTPUT_BUFFER_SLOT_SHIFT               12
# define SO_DECL_OUTPUT_BUFFER_SLOT_MASK                INTEL_MASK(13, 12)
# define SO_DECL_HOLE_FLAG                              (1 << 11)
# define SO_DECL_REGISTER_INDEX_SHIFT                   4
# define SO_DECL_REGISTER_INDEX_MASK                    INTEL_MASK(9, 4)
# define SO_DECL_COMPONENT_MASK_SHIFT                   0
# define SO_DECL_COMPONENT_MASK_MASK                    INTEL_MASK(3, 0)
2724
/* 3DSTATE_SO_BUFFER (GEN7+) */
#define _3DSTATE_SO_BUFFER                              0x7918
/* DW1 */
# define GEN8_SO_BUFFER_ENABLE                          (1 << 31)
# define SO_BUFFER_INDEX_SHIFT                          29
# define SO_BUFFER_INDEX_MASK                           INTEL_MASK(30, 29)
# define GEN8_SO_BUFFER_OFFSET_WRITE_ENABLE             (1 << 21)
# define GEN8_SO_BUFFER_OFFSET_ADDRESS_ENABLE           (1 << 20)
# define SO_BUFFER_PITCH_SHIFT                          0
# define SO_BUFFER_PITCH_MASK                           INTEL_MASK(11, 0)
/* DW2: start address */
/* DW3: end address. */
2736
#define CMD_MI_FLUSH                                    0x0200

/* BLT coordinate packing: X in the low 16 bits, Y in the high 16 bits */
# define BLT_X_SHIFT                                    0
# define BLT_X_MASK                                     INTEL_MASK(15, 0)
# define BLT_Y_SHIFT                                    16
# define BLT_Y_MASK                                     INTEL_MASK(31, 16)
2743
/* MI_REPORT_PERF_COUNT, GEN5 encoding: 0x26 in bits 23 and up, with
 * (3 - 2) OR'ed into the low bits.
 */
#define GEN5_MI_REPORT_PERF_COUNT                       ((0x26 << 23) | (3 - 2))
/* DW0 */
# define GEN5_MI_COUNTER_SET_0                          (0 << 6)
# define GEN5_MI_COUNTER_SET_1                          (1 << 6)
/* DW1 */
# define MI_COUNTER_ADDRESS_GTT                         (1 << 0)
/* DW2: a user-defined report ID (written to the buffer but can be anything) */

/* GEN6 encoding: same shape, 0x28 instead of 0x26 */
#define GEN6_MI_REPORT_PERF_COUNT                       ((0x28 << 23) | (3 - 2))
2753
/* URB_WRITE message header, DW2 bitfields */
#define URB_WRITE_PRIM_END                              0x1
#define URB_WRITE_PRIM_START                            0x2
#define URB_WRITE_PRIM_TYPE_SHIFT                       2
2758
2759
/* Upper bound on the number of entries addressable through a binding
 * table pointer of type SURFTYPE_BUFFER.
 */
#define BRW_MAX_NUM_BUFFER_ENTRIES                      (1 << 27)
2764
/* Memory Object Control State (MOCS):
 * A zero L3 field means "uncached in L3", at least on Haswell and
 * Baytrail, because no PTE flags exist there for L3 cacheability.
 * Ivybridge PTEs do carry a cache-in-L3 bit, so a MOCS of 0 may still
 * honor that bit.
 */
#define GEN7_MOCS_L3                                    1

/* Ivybridge only: cache in LLC.
 * Zero means "use the PTE values set by the kernel"; a non-zero value
 * overrides the PTE values.
 */
#define IVB_MOCS_LLC                                    (1 << 1)

/* Baytrail only: snoop in CPU cache */
#define BYT_MOCS_SNOOP                                  (1 << 1)

/* Haswell only: LLC/eLLC controls (write-back or uncached).
 * Zero means "use the PTE values set by the kernel", which is useful
 * because the PTEs offer additional control (write-through caching and
 * age).  A non-zero value overrides the PTE values.
 */
#define HSW_MOCS_UC_LLC_UC_ELLC                         (1 << 1)
#define HSW_MOCS_WB_LLC_WB_ELLC                         (2 << 1)
#define HSW_MOCS_UC_LLC_WB_ELLC                         (3 << 1)

/* Broadwell: each of these uses every available cache (L3, LLC, eLLC) and
 * either forces write-back (WB) or write-through (WT) caching, or defers
 * to the page table entry (PTE) specified by the kernel.
 */
#define BDW_MOCS_WB                                     0x78
#define BDW_MOCS_WT                                     0x58
#define BDW_MOCS_PTE                                    0x18

/* Skylake: MOCS is now an index into an array of 62 different caching
 * configurations programmed by the kernel.
 */
/* TC=LLC/eLLC, LeCC=WB, LRUM=3, L3CC=WB */
#define SKL_MOCS_WB                                     (2 << 1)
/* TC=LLC/eLLC, LeCC=PTE, LRUM=3, L3CC=WB */
#define SKL_MOCS_PTE                                    (1 << 1)
2806
#define MEDIA_VFE_STATE                                 0x7000
/* GEN7 DW2, GEN8+ DW3 */
# define MEDIA_VFE_STATE_MAX_THREADS_SHIFT              16
# define MEDIA_VFE_STATE_MAX_THREADS_MASK               INTEL_MASK(31, 16)
# define MEDIA_VFE_STATE_URB_ENTRIES_SHIFT              8
# define MEDIA_VFE_STATE_URB_ENTRIES_MASK               INTEL_MASK(15, 8)
# define MEDIA_VFE_STATE_RESET_GTW_TIMER_SHIFT          7
# define MEDIA_VFE_STATE_RESET_GTW_TIMER_MASK           INTEL_MASK(7, 7)
# define MEDIA_VFE_STATE_BYPASS_GTW_SHIFT               6
# define MEDIA_VFE_STATE_BYPASS_GTW_MASK                INTEL_MASK(6, 6)
# define GEN7_MEDIA_VFE_STATE_GPGPU_MODE_SHIFT          2
# define GEN7_MEDIA_VFE_STATE_GPGPU_MODE_MASK           INTEL_MASK(2, 2)
/* GEN7 DW4, GEN8+ DW5: URB and CURBE allocation, 16 bits each */
# define MEDIA_VFE_STATE_URB_ALLOC_SHIFT                16
# define MEDIA_VFE_STATE_URB_ALLOC_MASK                 INTEL_MASK(31, 16)
# define MEDIA_VFE_STATE_CURBE_ALLOC_SHIFT              0
# define MEDIA_VFE_STATE_CURBE_ALLOC_MASK               INTEL_MASK(15, 0)
2824
#define MEDIA_CURBE_LOAD                                0x7001
#define MEDIA_INTERFACE_DESCRIPTOR_LOAD                 0x7002
/* GEN7 DW4, GEN8+ DW5: CURBE read length and offset, 16 bits each */
# define MEDIA_CURBE_READ_LENGTH_SHIFT                  16
# define MEDIA_CURBE_READ_LENGTH_MASK                   INTEL_MASK(31, 16)
# define MEDIA_CURBE_READ_OFFSET_SHIFT                  0
# define MEDIA_CURBE_READ_OFFSET_MASK                   INTEL_MASK(15, 0)
/* GEN7 DW5, GEN8+ DW6: the GEN8_ thread-count mask is 10 bits wide, the
 * unprefixed one 8 bits.
 */
# define MEDIA_BARRIER_ENABLE_SHIFT                     21
# define MEDIA_BARRIER_ENABLE_MASK                      INTEL_MASK(21, 21)
# define MEDIA_GPGPU_THREAD_COUNT_SHIFT                 0
# define MEDIA_GPGPU_THREAD_COUNT_MASK                  INTEL_MASK(7, 0)
# define GEN8_MEDIA_GPGPU_THREAD_COUNT_SHIFT            0
# define GEN8_MEDIA_GPGPU_THREAD_COUNT_MASK             INTEL_MASK(9, 0)
#define MEDIA_STATE_FLUSH                               0x7004
#define GPGPU_WALKER                                    0x7105
/* GEN7 DW0 */
# define GEN7_GPGPU_INDIRECT_PARAMETER_ENABLE           (1 << 10)
/* GEN8+ DW2 */
# define GPGPU_WALKER_INDIRECT_LENGTH_SHIFT             0
# define GPGPU_WALKER_INDIRECT_LENGTH_MASK              INTEL_MASK(15, 0)
/* GEN7 DW2, GEN8+ DW4
 *
 * This dword packs SIMD size (31:30) together with the thread depth
 * (21:16), height (13:8) and width (5:0) maximums.  The height mask must
 * stop at bit 13: a wider mask would overlap the depth and SIMD-size
 * fields, so SET_FIELD's range assertion could no longer catch an
 * oversized height value and GET_FIELD would return bits from the
 * neighbouring fields.
 */
# define GPGPU_WALKER_SIMD_SIZE_SHIFT                   30
# define GPGPU_WALKER_SIMD_SIZE_MASK                    INTEL_MASK(31, 30)
# define GPGPU_WALKER_THREAD_DEPTH_MAX_SHIFT            16
# define GPGPU_WALKER_THREAD_DEPTH_MAX_MASK             INTEL_MASK(21, 16)
# define GPGPU_WALKER_THREAD_HEIGHT_MAX_SHIFT           8
# define GPGPU_WALKER_THREAD_HEIGHT_MAX_MASK            INTEL_MASK(13, 8)
# define GPGPU_WALKER_THREAD_WIDTH_MAX_SHIFT            0
# define GPGPU_WALKER_THREAD_WIDTH_MAX_MASK             INTEL_MASK(5, 0)
2855
2856 #endif