i965: remove unused macros from brw_defines.h
[mesa.git] / src / mesa / drivers / dri / i965 / brw_defines.h
1 /*
2 Copyright (C) Intel Corp. 2006. All Rights Reserved.
3 Intel funded Tungsten Graphics to
4 develop this 3D driver.
5
6 Permission is hereby granted, free of charge, to any person obtaining
7 a copy of this software and associated documentation files (the
8 "Software"), to deal in the Software without restriction, including
9 without limitation the rights to use, copy, modify, merge, publish,
10 distribute, sublicense, and/or sell copies of the Software, and to
11 permit persons to whom the Software is furnished to do so, subject to
12 the following conditions:
13
14 The above copyright notice and this permission notice (including the
15 next paragraph) shall be included in all copies or substantial
16 portions of the Software.
17
18 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
19 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
21 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
22 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
23 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
24 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25
26 **********************************************************************/
27 /*
28 * Authors:
29 * Keith Whitwell <keithw@vmware.com>
30 */
31
32 #include "util/macros.h"
33
34 #define INTEL_MASK(high, low) (((1u<<((high)-(low)+1))-1)<<(low))
35 /* Using the GNU statement expression extension */
36 #define SET_FIELD(value, field) \
37 ({ \
38 uint32_t fieldval = (value) << field ## _SHIFT; \
39 assert((fieldval & ~ field ## _MASK) == 0); \
40 fieldval & field ## _MASK; \
41 })
42
43 #define GET_BITS(data, high, low) ((data & INTEL_MASK((high), (low))) >> (low))
44 #define GET_FIELD(word, field) (((word) & field ## _MASK) >> field ## _SHIFT)
45
46 /**
47 * For use with masked MMIO registers where the upper 16 bits control which
48 * of the lower bits are committed to the register.
49 */
50 #define REG_MASK(value) ((value) << 16)
51
52 #ifndef BRW_DEFINES_H
53 #define BRW_DEFINES_H
54
55 /* 3D state:
56 */
57 #define CMD_3D_PRIM 0x7b00 /* 3DPRIMITIVE */
58 /* DW0 */
59 # define GEN4_3DPRIM_TOPOLOGY_TYPE_SHIFT 10
60 # define GEN4_3DPRIM_VERTEXBUFFER_ACCESS_SEQUENTIAL (0 << 15)
61 # define GEN4_3DPRIM_VERTEXBUFFER_ACCESS_RANDOM (1 << 15)
62 # define GEN7_3DPRIM_INDIRECT_PARAMETER_ENABLE (1 << 10)
63 # define GEN7_3DPRIM_PREDICATE_ENABLE (1 << 8)
64 /* DW1 */
65 # define GEN7_3DPRIM_VERTEXBUFFER_ACCESS_SEQUENTIAL (0 << 8)
66 # define GEN7_3DPRIM_VERTEXBUFFER_ACCESS_RANDOM (1 << 8)
67
68 #define _3DPRIM_POINTLIST 0x01
69 #define _3DPRIM_LINELIST 0x02
70 #define _3DPRIM_LINESTRIP 0x03
71 #define _3DPRIM_TRILIST 0x04
72 #define _3DPRIM_TRISTRIP 0x05
73 #define _3DPRIM_TRIFAN 0x06
74 #define _3DPRIM_QUADLIST 0x07
75 #define _3DPRIM_QUADSTRIP 0x08
76 #define _3DPRIM_LINELIST_ADJ 0x09 /* G45+ */
77 #define _3DPRIM_LINESTRIP_ADJ 0x0A /* G45+ */
78 #define _3DPRIM_TRILIST_ADJ 0x0B /* G45+ */
79 #define _3DPRIM_TRISTRIP_ADJ 0x0C /* G45+ */
80 #define _3DPRIM_TRISTRIP_REVERSE 0x0D
81 #define _3DPRIM_POLYGON 0x0E
82 #define _3DPRIM_RECTLIST 0x0F
83 #define _3DPRIM_LINELOOP 0x10
84 #define _3DPRIM_POINTLIST_BF 0x11
85 #define _3DPRIM_LINESTRIP_CONT 0x12
86 #define _3DPRIM_LINESTRIP_BF 0x13
87 #define _3DPRIM_LINESTRIP_CONT_BF 0x14
88 #define _3DPRIM_TRIFAN_NOSTIPPLE 0x16
89 #define _3DPRIM_PATCHLIST(n) ({ assert(n > 0 && n <= 32); 0x20 + (n - 1); })
90
91 #define BRW_ANISORATIO_2 0
92 #define BRW_ANISORATIO_4 1
93 #define BRW_ANISORATIO_6 2
94 #define BRW_ANISORATIO_8 3
95 #define BRW_ANISORATIO_10 4
96 #define BRW_ANISORATIO_12 5
97 #define BRW_ANISORATIO_14 6
98 #define BRW_ANISORATIO_16 7
99
100 #define BRW_BLENDFACTOR_ONE 0x1
101 #define BRW_BLENDFACTOR_SRC_COLOR 0x2
102 #define BRW_BLENDFACTOR_SRC_ALPHA 0x3
103 #define BRW_BLENDFACTOR_DST_ALPHA 0x4
104 #define BRW_BLENDFACTOR_DST_COLOR 0x5
105 #define BRW_BLENDFACTOR_SRC_ALPHA_SATURATE 0x6
106 #define BRW_BLENDFACTOR_CONST_COLOR 0x7
107 #define BRW_BLENDFACTOR_CONST_ALPHA 0x8
108 #define BRW_BLENDFACTOR_SRC1_COLOR 0x9
109 #define BRW_BLENDFACTOR_SRC1_ALPHA 0x0A
110 #define BRW_BLENDFACTOR_ZERO 0x11
111 #define BRW_BLENDFACTOR_INV_SRC_COLOR 0x12
112 #define BRW_BLENDFACTOR_INV_SRC_ALPHA 0x13
113 #define BRW_BLENDFACTOR_INV_DST_ALPHA 0x14
114 #define BRW_BLENDFACTOR_INV_DST_COLOR 0x15
115 #define BRW_BLENDFACTOR_INV_CONST_COLOR 0x17
116 #define BRW_BLENDFACTOR_INV_CONST_ALPHA 0x18
117 #define BRW_BLENDFACTOR_INV_SRC1_COLOR 0x19
118 #define BRW_BLENDFACTOR_INV_SRC1_ALPHA 0x1A
119
120 #define BRW_BLENDFUNCTION_ADD 0
121 #define BRW_BLENDFUNCTION_SUBTRACT 1
122 #define BRW_BLENDFUNCTION_REVERSE_SUBTRACT 2
123 #define BRW_BLENDFUNCTION_MIN 3
124 #define BRW_BLENDFUNCTION_MAX 4
125
126 #define BRW_ALPHATEST_FORMAT_UNORM8 0
127 #define BRW_ALPHATEST_FORMAT_FLOAT32 1
128
129 #define BRW_CHROMAKEY_KILL_ON_ANY_MATCH 0
130 #define BRW_CHROMAKEY_REPLACE_BLACK 1
131
132 #define BRW_CLIP_API_OGL 0
133 #define BRW_CLIP_API_DX 1
134
135 #define BRW_CLIPMODE_NORMAL 0
136 #define BRW_CLIPMODE_CLIP_ALL 1
137 #define BRW_CLIPMODE_CLIP_NON_REJECTED 2
138 #define BRW_CLIPMODE_REJECT_ALL 3
139 #define BRW_CLIPMODE_ACCEPT_ALL 4
140 #define BRW_CLIPMODE_KERNEL_CLIP 5
141
142 #define BRW_CLIP_NDCSPACE 0
143 #define BRW_CLIP_SCREENSPACE 1
144
145 #define BRW_COMPAREFUNCTION_ALWAYS 0
146 #define BRW_COMPAREFUNCTION_NEVER 1
147 #define BRW_COMPAREFUNCTION_LESS 2
148 #define BRW_COMPAREFUNCTION_EQUAL 3
149 #define BRW_COMPAREFUNCTION_LEQUAL 4
150 #define BRW_COMPAREFUNCTION_GREATER 5
151 #define BRW_COMPAREFUNCTION_NOTEQUAL 6
152 #define BRW_COMPAREFUNCTION_GEQUAL 7
153
154 #define BRW_COVERAGE_PIXELS_HALF 0
155 #define BRW_COVERAGE_PIXELS_1 1
156 #define BRW_COVERAGE_PIXELS_2 2
157 #define BRW_COVERAGE_PIXELS_4 3
158
159 #define BRW_CULLMODE_BOTH 0
160 #define BRW_CULLMODE_NONE 1
161 #define BRW_CULLMODE_FRONT 2
162 #define BRW_CULLMODE_BACK 3
163
164 #define BRW_DEFAULTCOLOR_R8G8B8A8_UNORM 0
165 #define BRW_DEFAULTCOLOR_R32G32B32A32_FLOAT 1
166
167 #define BRW_DEPTHFORMAT_D32_FLOAT_S8X24_UINT 0
168 #define BRW_DEPTHFORMAT_D32_FLOAT 1
169 #define BRW_DEPTHFORMAT_D24_UNORM_S8_UINT 2
170 #define BRW_DEPTHFORMAT_D24_UNORM_X8_UINT 3 /* GEN5 */
171 #define BRW_DEPTHFORMAT_D16_UNORM 5
172
173 #define BRW_FLOATING_POINT_IEEE_754 0
174 #define BRW_FLOATING_POINT_NON_IEEE_754 1
175
176 #define BRW_FRONTWINDING_CW 0
177 #define BRW_FRONTWINDING_CCW 1
178
179 #define BRW_SPRITE_POINT_ENABLE 16
180
181 #define BRW_CUT_INDEX_ENABLE (1 << 10)
182
183 #define BRW_INDEX_BYTE 0
184 #define BRW_INDEX_WORD 1
185 #define BRW_INDEX_DWORD 2
186
187 #define BRW_LOGICOPFUNCTION_CLEAR 0
188 #define BRW_LOGICOPFUNCTION_NOR 1
189 #define BRW_LOGICOPFUNCTION_AND_INVERTED 2
190 #define BRW_LOGICOPFUNCTION_COPY_INVERTED 3
191 #define BRW_LOGICOPFUNCTION_AND_REVERSE 4
192 #define BRW_LOGICOPFUNCTION_INVERT 5
193 #define BRW_LOGICOPFUNCTION_XOR 6
194 #define BRW_LOGICOPFUNCTION_NAND 7
195 #define BRW_LOGICOPFUNCTION_AND 8
196 #define BRW_LOGICOPFUNCTION_EQUIV 9
197 #define BRW_LOGICOPFUNCTION_NOOP 10
198 #define BRW_LOGICOPFUNCTION_OR_INVERTED 11
199 #define BRW_LOGICOPFUNCTION_COPY 12
200 #define BRW_LOGICOPFUNCTION_OR_REVERSE 13
201 #define BRW_LOGICOPFUNCTION_OR 14
202 #define BRW_LOGICOPFUNCTION_SET 15
203
204 #define BRW_MAPFILTER_NEAREST 0x0
205 #define BRW_MAPFILTER_LINEAR 0x1
206 #define BRW_MAPFILTER_ANISOTROPIC 0x2
207
208 #define BRW_MIPFILTER_NONE 0
209 #define BRW_MIPFILTER_NEAREST 1
210 #define BRW_MIPFILTER_LINEAR 3
211
212 #define BRW_ADDRESS_ROUNDING_ENABLE_U_MAG 0x20
213 #define BRW_ADDRESS_ROUNDING_ENABLE_U_MIN 0x10
214 #define BRW_ADDRESS_ROUNDING_ENABLE_V_MAG 0x08
215 #define BRW_ADDRESS_ROUNDING_ENABLE_V_MIN 0x04
216 #define BRW_ADDRESS_ROUNDING_ENABLE_R_MAG 0x02
217 #define BRW_ADDRESS_ROUNDING_ENABLE_R_MIN 0x01
218
219 #define BRW_PREFILTER_ALWAYS 0x0
220 #define BRW_PREFILTER_NEVER 0x1
221 #define BRW_PREFILTER_LESS 0x2
222 #define BRW_PREFILTER_EQUAL 0x3
223 #define BRW_PREFILTER_LEQUAL 0x4
224 #define BRW_PREFILTER_GREATER 0x5
225 #define BRW_PREFILTER_NOTEQUAL 0x6
226 #define BRW_PREFILTER_GEQUAL 0x7
227
228 #define BRW_PROVOKING_VERTEX_0 0
229 #define BRW_PROVOKING_VERTEX_1 1
230 #define BRW_PROVOKING_VERTEX_2 2
231
232 #define BRW_RASTRULE_UPPER_LEFT 0
233 #define BRW_RASTRULE_UPPER_RIGHT 1
234 /* These are listed as "Reserved, but not seen as useful"
235 * in Intel documentation (page 212, "Point Rasterization Rule",
236 * section 7.4 "SF Pipeline State Summary", of document
237 * "IntelĀ® 965 Express Chipset Family and IntelĀ® G35 Express
238 * Chipset Graphics Controller Programmer's Reference Manual,
239 * Volume 2: 3D/Media", Revision 1.0b as of January 2008,
240 * available at
241 * https://01.org/linuxgraphics/documentation/hardware-specification-prms
242 * at the time of this writing).
243 *
244 * These appear to be supported on at least some
245 * i965-family devices, and the BRW_RASTRULE_LOWER_RIGHT
246 * is useful when using OpenGL to render to a FBO
247 * (which has the pixel coordinate Y orientation inverted
248 * with respect to the normal OpenGL pixel coordinate system).
249 */
250 #define BRW_RASTRULE_LOWER_LEFT 2
251 #define BRW_RASTRULE_LOWER_RIGHT 3
252
253 #define BRW_RENDERTARGET_CLAMPRANGE_UNORM 0
254 #define BRW_RENDERTARGET_CLAMPRANGE_SNORM 1
255 #define BRW_RENDERTARGET_CLAMPRANGE_FORMAT 2
256
257 #define BRW_STENCILOP_KEEP 0
258 #define BRW_STENCILOP_ZERO 1
259 #define BRW_STENCILOP_REPLACE 2
260 #define BRW_STENCILOP_INCRSAT 3
261 #define BRW_STENCILOP_DECRSAT 4
262 #define BRW_STENCILOP_INCR 5
263 #define BRW_STENCILOP_DECR 6
264 #define BRW_STENCILOP_INVERT 7
265
266 /* Surface state DW0 */
267 #define GEN8_SURFACE_IS_ARRAY (1 << 28)
268 #define GEN8_SURFACE_VALIGN_4 (1 << 16)
269 #define GEN8_SURFACE_VALIGN_8 (2 << 16)
270 #define GEN8_SURFACE_VALIGN_16 (3 << 16)
271 #define GEN8_SURFACE_HALIGN_4 (1 << 14)
272 #define GEN8_SURFACE_HALIGN_8 (2 << 14)
273 #define GEN8_SURFACE_HALIGN_16 (3 << 14)
274 #define GEN8_SURFACE_TILING_NONE (0 << 12)
275 #define GEN8_SURFACE_TILING_W (1 << 12)
276 #define GEN8_SURFACE_TILING_X (2 << 12)
277 #define GEN8_SURFACE_TILING_Y (3 << 12)
278 #define GEN8_SURFACE_SAMPLER_L2_BYPASS_DISABLE (1 << 9)
279 #define BRW_SURFACE_RC_READ_WRITE (1 << 8)
280 #define BRW_SURFACE_MIPLAYOUT_SHIFT 10
281 #define BRW_SURFACE_MIPMAPLAYOUT_BELOW 0
282 #define BRW_SURFACE_MIPMAPLAYOUT_RIGHT 1
283 #define BRW_SURFACE_CUBEFACE_ENABLES 0x3f
284 #define BRW_SURFACE_BLEND_ENABLED (1 << 13)
285 #define BRW_SURFACE_WRITEDISABLE_B_SHIFT 14
286 #define BRW_SURFACE_WRITEDISABLE_G_SHIFT 15
287 #define BRW_SURFACE_WRITEDISABLE_R_SHIFT 16
288 #define BRW_SURFACE_WRITEDISABLE_A_SHIFT 17
289
290 #define GEN9_SURFACE_ASTC_HDR_FORMAT_BIT 0x100
291
292 #define BRW_SURFACE_FORMAT_SHIFT 18
293 #define BRW_SURFACE_FORMAT_MASK INTEL_MASK(26, 18)
294
295 #define BRW_SURFACERETURNFORMAT_FLOAT32 0
296 #define BRW_SURFACERETURNFORMAT_S1 1
297
298 #define BRW_SURFACE_TYPE_SHIFT 29
299 #define BRW_SURFACE_TYPE_MASK INTEL_MASK(31, 29)
300 #define BRW_SURFACE_1D 0
301 #define BRW_SURFACE_2D 1
302 #define BRW_SURFACE_3D 2
303 #define BRW_SURFACE_CUBE 3
304 #define BRW_SURFACE_BUFFER 4
305 #define BRW_SURFACE_NULL 7
306
307 #define GEN7_SURFACE_IS_ARRAY (1 << 28)
308 #define GEN7_SURFACE_VALIGN_2 (0 << 16)
309 #define GEN7_SURFACE_VALIGN_4 (1 << 16)
310 #define GEN7_SURFACE_HALIGN_4 (0 << 15)
311 #define GEN7_SURFACE_HALIGN_8 (1 << 15)
312 #define GEN7_SURFACE_TILING_NONE (0 << 13)
313 #define GEN7_SURFACE_TILING_X (2 << 13)
314 #define GEN7_SURFACE_TILING_Y (3 << 13)
315 #define GEN7_SURFACE_ARYSPC_FULL (0 << 10)
316 #define GEN7_SURFACE_ARYSPC_LOD0 (1 << 10)
317
318 /* Surface state DW1 */
319 #define GEN8_SURFACE_MOCS_SHIFT 24
320 #define GEN8_SURFACE_MOCS_MASK INTEL_MASK(30, 24)
321 #define GEN8_SURFACE_QPITCH_SHIFT 0
322 #define GEN8_SURFACE_QPITCH_MASK INTEL_MASK(14, 0)
323
324 /* Surface state DW2 */
325 #define BRW_SURFACE_HEIGHT_SHIFT 19
326 #define BRW_SURFACE_HEIGHT_MASK INTEL_MASK(31, 19)
327 #define BRW_SURFACE_WIDTH_SHIFT 6
328 #define BRW_SURFACE_WIDTH_MASK INTEL_MASK(18, 6)
329 #define BRW_SURFACE_LOD_SHIFT 2
330 #define BRW_SURFACE_LOD_MASK INTEL_MASK(5, 2)
331 #define GEN7_SURFACE_HEIGHT_SHIFT 16
332 #define GEN7_SURFACE_HEIGHT_MASK INTEL_MASK(29, 16)
333 #define GEN7_SURFACE_WIDTH_SHIFT 0
334 #define GEN7_SURFACE_WIDTH_MASK INTEL_MASK(13, 0)
335
336 /* Surface state DW3 */
337 #define BRW_SURFACE_DEPTH_SHIFT 21
338 #define BRW_SURFACE_DEPTH_MASK INTEL_MASK(31, 21)
339 #define BRW_SURFACE_PITCH_SHIFT 3
340 #define BRW_SURFACE_PITCH_MASK INTEL_MASK(19, 3)
341 #define BRW_SURFACE_TILED (1 << 1)
342 #define BRW_SURFACE_TILED_Y (1 << 0)
343 #define HSW_SURFACE_IS_INTEGER_FORMAT (1 << 18)
344
345 /* Surface state DW4 */
346 #define BRW_SURFACE_MIN_LOD_SHIFT 28
347 #define BRW_SURFACE_MIN_LOD_MASK INTEL_MASK(31, 28)
348 #define BRW_SURFACE_MIN_ARRAY_ELEMENT_SHIFT 17
349 #define BRW_SURFACE_MIN_ARRAY_ELEMENT_MASK INTEL_MASK(27, 17)
350 #define BRW_SURFACE_RENDER_TARGET_VIEW_EXTENT_SHIFT 8
351 #define BRW_SURFACE_RENDER_TARGET_VIEW_EXTENT_MASK INTEL_MASK(16, 8)
352 #define BRW_SURFACE_MULTISAMPLECOUNT_1 (0 << 4)
353 #define BRW_SURFACE_MULTISAMPLECOUNT_4 (2 << 4)
354 #define GEN7_SURFACE_MULTISAMPLECOUNT_1 (0 << 3)
355 #define GEN8_SURFACE_MULTISAMPLECOUNT_2 (1 << 3)
356 #define GEN7_SURFACE_MULTISAMPLECOUNT_4 (2 << 3)
357 #define GEN7_SURFACE_MULTISAMPLECOUNT_8 (3 << 3)
358 #define GEN8_SURFACE_MULTISAMPLECOUNT_16 (4 << 3)
359 #define GEN7_SURFACE_MSFMT_MSS (0 << 6)
360 #define GEN7_SURFACE_MSFMT_DEPTH_STENCIL (1 << 6)
361 #define GEN7_SURFACE_MIN_ARRAY_ELEMENT_SHIFT 18
362 #define GEN7_SURFACE_MIN_ARRAY_ELEMENT_MASK INTEL_MASK(28, 18)
363 #define GEN7_SURFACE_RENDER_TARGET_VIEW_EXTENT_SHIFT 7
364 #define GEN7_SURFACE_RENDER_TARGET_VIEW_EXTENT_MASK INTEL_MASK(17, 7)
365
366 /* Surface state DW5 */
367 #define BRW_SURFACE_X_OFFSET_SHIFT 25
368 #define BRW_SURFACE_X_OFFSET_MASK INTEL_MASK(31, 25)
369 #define BRW_SURFACE_VERTICAL_ALIGN_ENABLE (1 << 24)
370 #define BRW_SURFACE_Y_OFFSET_SHIFT 20
371 #define BRW_SURFACE_Y_OFFSET_MASK INTEL_MASK(23, 20)
372 #define GEN7_SURFACE_MIN_LOD_SHIFT 4
373 #define GEN7_SURFACE_MIN_LOD_MASK INTEL_MASK(7, 4)
374 #define GEN8_SURFACE_Y_OFFSET_SHIFT 21
375 #define GEN8_SURFACE_Y_OFFSET_MASK INTEL_MASK(23, 21)
376
377 #define GEN7_SURFACE_MOCS_SHIFT 16
378 #define GEN7_SURFACE_MOCS_MASK INTEL_MASK(19, 16)
379
380 #define GEN9_SURFACE_TRMODE_SHIFT 18
381 #define GEN9_SURFACE_TRMODE_MASK INTEL_MASK(19, 18)
382 #define GEN9_SURFACE_TRMODE_NONE 0
383 #define GEN9_SURFACE_TRMODE_TILEYF 1
384 #define GEN9_SURFACE_TRMODE_TILEYS 2
385
386 #define GEN9_SURFACE_MIP_TAIL_START_LOD_SHIFT 8
387 #define GEN9_SURFACE_MIP_TAIL_START_LOD_MASK INTEL_MASK(11, 8)
388
389 /* Surface state DW6 */
390 #define GEN7_SURFACE_MCS_ENABLE (1 << 0)
391 #define GEN7_SURFACE_MCS_PITCH_SHIFT 3
392 #define GEN7_SURFACE_MCS_PITCH_MASK INTEL_MASK(11, 3)
393 #define GEN8_SURFACE_AUX_QPITCH_SHIFT 16
394 #define GEN8_SURFACE_AUX_QPITCH_MASK INTEL_MASK(30, 16)
395 #define GEN8_SURFACE_AUX_PITCH_SHIFT 3
396 #define GEN8_SURFACE_AUX_PITCH_MASK INTEL_MASK(11, 3)
397 #define GEN8_SURFACE_AUX_MODE_MASK INTEL_MASK(2, 0)
398
399 #define GEN8_SURFACE_AUX_MODE_NONE 0
400 #define GEN8_SURFACE_AUX_MODE_MCS 1
401 #define GEN8_SURFACE_AUX_MODE_APPEND 2
402 #define GEN8_SURFACE_AUX_MODE_HIZ 3
403 #define GEN9_SURFACE_AUX_MODE_CCS_E 5
404
405 /* Surface state DW7 */
406 #define GEN9_SURFACE_RT_COMPRESSION_SHIFT 30
407 #define GEN9_SURFACE_RT_COMPRESSION_MASK INTEL_MASK(30, 30)
408 #define GEN7_SURFACE_CLEAR_COLOR_SHIFT 28
409 #define GEN7_SURFACE_SCS_R_SHIFT 25
410 #define GEN7_SURFACE_SCS_R_MASK INTEL_MASK(27, 25)
411 #define GEN7_SURFACE_SCS_G_SHIFT 22
412 #define GEN7_SURFACE_SCS_G_MASK INTEL_MASK(24, 22)
413 #define GEN7_SURFACE_SCS_B_SHIFT 19
414 #define GEN7_SURFACE_SCS_B_MASK INTEL_MASK(21, 19)
415 #define GEN7_SURFACE_SCS_A_SHIFT 16
416 #define GEN7_SURFACE_SCS_A_MASK INTEL_MASK(18, 16)
417
418 /* The actual swizzle values/what channel to use */
419 #define HSW_SCS_ZERO 0
420 #define HSW_SCS_ONE 1
421 #define HSW_SCS_RED 4
422 #define HSW_SCS_GREEN 5
423 #define HSW_SCS_BLUE 6
424 #define HSW_SCS_ALPHA 7
425
426 /* SAMPLER_STATE DW0 */
427 #define BRW_SAMPLER_DISABLE (1 << 31)
428 #define BRW_SAMPLER_LOD_PRECLAMP_ENABLE (1 << 28)
429 #define GEN6_SAMPLER_MIN_MAG_NOT_EQUAL (1 << 27) /* Gen6 only */
430 #define BRW_SAMPLER_BASE_MIPLEVEL_MASK INTEL_MASK(26, 22)
431 #define BRW_SAMPLER_BASE_MIPLEVEL_SHIFT 22
432 #define BRW_SAMPLER_MIP_FILTER_MASK INTEL_MASK(21, 20)
433 #define BRW_SAMPLER_MIP_FILTER_SHIFT 20
434 #define BRW_SAMPLER_MAG_FILTER_MASK INTEL_MASK(19, 17)
435 #define BRW_SAMPLER_MAG_FILTER_SHIFT 17
436 #define BRW_SAMPLER_MIN_FILTER_MASK INTEL_MASK(16, 14)
437 #define BRW_SAMPLER_MIN_FILTER_SHIFT 14
438 #define GEN4_SAMPLER_LOD_BIAS_MASK INTEL_MASK(13, 3)
439 #define GEN4_SAMPLER_LOD_BIAS_SHIFT 3
440 #define GEN4_SAMPLER_SHADOW_FUNCTION_MASK INTEL_MASK(2, 0)
441 #define GEN4_SAMPLER_SHADOW_FUNCTION_SHIFT 0
442
443 #define GEN7_SAMPLER_LOD_BIAS_MASK INTEL_MASK(13, 1)
444 #define GEN7_SAMPLER_LOD_BIAS_SHIFT 1
445 #define GEN7_SAMPLER_EWA_ANISOTROPIC_ALGORITHM (1 << 0)
446
447 /* SAMPLER_STATE DW1 */
448 #define GEN4_SAMPLER_MIN_LOD_MASK INTEL_MASK(31, 22)
449 #define GEN4_SAMPLER_MIN_LOD_SHIFT 22
450 #define GEN4_SAMPLER_MAX_LOD_MASK INTEL_MASK(21, 12)
451 #define GEN4_SAMPLER_MAX_LOD_SHIFT 12
452 #define GEN4_SAMPLER_CUBE_CONTROL_OVERRIDE (1 << 9)
453 /* Wrap modes are in DW1 on Gen4-6 and DW3 on Gen7+ */
454 #define BRW_SAMPLER_TCX_WRAP_MODE_MASK INTEL_MASK(8, 6)
455 #define BRW_SAMPLER_TCX_WRAP_MODE_SHIFT 6
456 #define BRW_SAMPLER_TCY_WRAP_MODE_MASK INTEL_MASK(5, 3)
457 #define BRW_SAMPLER_TCY_WRAP_MODE_SHIFT 3
458 #define BRW_SAMPLER_TCZ_WRAP_MODE_MASK INTEL_MASK(2, 0)
459 #define BRW_SAMPLER_TCZ_WRAP_MODE_SHIFT 0
460
461 #define GEN7_SAMPLER_MIN_LOD_MASK INTEL_MASK(31, 20)
462 #define GEN7_SAMPLER_MIN_LOD_SHIFT 20
463 #define GEN7_SAMPLER_MAX_LOD_MASK INTEL_MASK(19, 8)
464 #define GEN7_SAMPLER_MAX_LOD_SHIFT 8
465 #define GEN7_SAMPLER_SHADOW_FUNCTION_MASK INTEL_MASK(3, 1)
466 #define GEN7_SAMPLER_SHADOW_FUNCTION_SHIFT 1
467 #define GEN7_SAMPLER_CUBE_CONTROL_OVERRIDE (1 << 0)
468
469 /* SAMPLER_STATE DW2 - border color pointer */
470
471 /* SAMPLER_STATE DW3 */
472 #define BRW_SAMPLER_MAX_ANISOTROPY_MASK INTEL_MASK(21, 19)
473 #define BRW_SAMPLER_MAX_ANISOTROPY_SHIFT 19
474 #define BRW_SAMPLER_ADDRESS_ROUNDING_MASK INTEL_MASK(18, 13)
475 #define BRW_SAMPLER_ADDRESS_ROUNDING_SHIFT 13
476 #define GEN7_SAMPLER_NON_NORMALIZED_COORDINATES (1 << 10)
477 /* Gen7+ wrap modes reuse the same BRW_SAMPLER_TC*_WRAP_MODE enums. */
478 #define GEN6_SAMPLER_NON_NORMALIZED_COORDINATES (1 << 0)
479
480 enum brw_wrap_mode {
481 BRW_TEXCOORDMODE_WRAP = 0,
482 BRW_TEXCOORDMODE_MIRROR = 1,
483 BRW_TEXCOORDMODE_CLAMP = 2,
484 BRW_TEXCOORDMODE_CUBE = 3,
485 BRW_TEXCOORDMODE_CLAMP_BORDER = 4,
486 BRW_TEXCOORDMODE_MIRROR_ONCE = 5,
487 GEN8_TEXCOORDMODE_HALF_BORDER = 6,
488 };
489
490 #define BRW_THREAD_PRIORITY_NORMAL 0
491 #define BRW_THREAD_PRIORITY_HIGH 1
492
493 #define BRW_TILEWALK_XMAJOR 0
494 #define BRW_TILEWALK_YMAJOR 1
495
496 #define BRW_VERTEX_SUBPIXEL_PRECISION_8BITS 0
497 #define BRW_VERTEX_SUBPIXEL_PRECISION_4BITS 1
498
499
500 /* Execution Unit (EU) defines
501 */
502
503 #define BRW_ALIGN_1 0
504 #define BRW_ALIGN_16 1
505
506 #define BRW_ADDRESS_DIRECT 0
507 #define BRW_ADDRESS_REGISTER_INDIRECT_REGISTER 1
508
509 #define BRW_CHANNEL_X 0
510 #define BRW_CHANNEL_Y 1
511 #define BRW_CHANNEL_Z 2
512 #define BRW_CHANNEL_W 3
513
514 enum brw_compression {
515 BRW_COMPRESSION_NONE = 0,
516 BRW_COMPRESSION_2NDHALF = 1,
517 BRW_COMPRESSION_COMPRESSED = 2,
518 };
519
520 #define GEN6_COMPRESSION_1Q 0
521 #define GEN6_COMPRESSION_2Q 1
522 #define GEN6_COMPRESSION_3Q 2
523 #define GEN6_COMPRESSION_4Q 3
524 #define GEN6_COMPRESSION_1H 0
525 #define GEN6_COMPRESSION_2H 2
526
527 enum PACKED brw_conditional_mod {
528 BRW_CONDITIONAL_NONE = 0,
529 BRW_CONDITIONAL_Z = 1,
530 BRW_CONDITIONAL_NZ = 2,
531 BRW_CONDITIONAL_EQ = 1, /* Z */
532 BRW_CONDITIONAL_NEQ = 2, /* NZ */
533 BRW_CONDITIONAL_G = 3,
534 BRW_CONDITIONAL_GE = 4,
535 BRW_CONDITIONAL_L = 5,
536 BRW_CONDITIONAL_LE = 6,
537 BRW_CONDITIONAL_R = 7, /* Gen <= 5 */
538 BRW_CONDITIONAL_O = 8,
539 BRW_CONDITIONAL_U = 9,
540 };
541
542 #define BRW_DEBUG_NONE 0
543 #define BRW_DEBUG_BREAKPOINT 1
544
545 #define BRW_DEPENDENCY_NORMAL 0
546 #define BRW_DEPENDENCY_NOTCLEARED 1
547 #define BRW_DEPENDENCY_NOTCHECKED 2
548 #define BRW_DEPENDENCY_DISABLE 3
549
550 enum PACKED brw_execution_size {
551 BRW_EXECUTE_1 = 0,
552 BRW_EXECUTE_2 = 1,
553 BRW_EXECUTE_4 = 2,
554 BRW_EXECUTE_8 = 3,
555 BRW_EXECUTE_16 = 4,
556 BRW_EXECUTE_32 = 5,
557 };
558
559 enum PACKED brw_horizontal_stride {
560 BRW_HORIZONTAL_STRIDE_0 = 0,
561 BRW_HORIZONTAL_STRIDE_1 = 1,
562 BRW_HORIZONTAL_STRIDE_2 = 2,
563 BRW_HORIZONTAL_STRIDE_4 = 3,
564 };
565
566 #define BRW_INSTRUCTION_NORMAL 0
567 #define BRW_INSTRUCTION_SATURATE 1
568
569 #define BRW_MASK_ENABLE 0
570 #define BRW_MASK_DISABLE 1
571
572 /** @{
573 *
574 * Gen6 has replaced "mask enable/disable" with WECtrl, which is
575 * effectively the same but much simpler to think about. Now, there
576 * are two contributors ANDed together to whether channels are
577 * executed: The predication on the instruction, and the channel write
578 * enable.
579 */
580 /**
581 * This is the default value. It means that a channel's write enable is set
582 * if the per-channel IP is pointing at this instruction.
583 */
584 #define BRW_WE_NORMAL 0
585 /**
586 * This is used like BRW_MASK_DISABLE, and causes all channels to have
587 * their write enable set. Note that predication still contributes to
588 * whether the channel actually gets written.
589 */
590 #define BRW_WE_ALL 1
591 /** @} */
592
593 enum opcode {
594 /* These are the actual hardware opcodes. */
595 BRW_OPCODE_ILLEGAL = 0,
596 BRW_OPCODE_MOV = 1,
597 BRW_OPCODE_SEL = 2,
598 BRW_OPCODE_MOVI = 3, /**< G45+ */
599 BRW_OPCODE_NOT = 4,
600 BRW_OPCODE_AND = 5,
601 BRW_OPCODE_OR = 6,
602 BRW_OPCODE_XOR = 7,
603 BRW_OPCODE_SHR = 8,
604 BRW_OPCODE_SHL = 9,
605 BRW_OPCODE_DIM = 10, /**< Gen7.5 only */ /* Reused */
606 // BRW_OPCODE_SMOV = 10, /**< Gen8+ */ /* Reused */
607 /* Reserved - 11 */
608 BRW_OPCODE_ASR = 12,
609 /* Reserved - 13-15 */
610 BRW_OPCODE_CMP = 16,
611 BRW_OPCODE_CMPN = 17,
612 BRW_OPCODE_CSEL = 18, /**< Gen8+ */
613 BRW_OPCODE_F32TO16 = 19, /**< Gen7 only */
614 BRW_OPCODE_F16TO32 = 20, /**< Gen7 only */
615 /* Reserved - 21-22 */
616 BRW_OPCODE_BFREV = 23, /**< Gen7+ */
617 BRW_OPCODE_BFE = 24, /**< Gen7+ */
618 BRW_OPCODE_BFI1 = 25, /**< Gen7+ */
619 BRW_OPCODE_BFI2 = 26, /**< Gen7+ */
620 /* Reserved - 27-31 */
621 BRW_OPCODE_JMPI = 32,
622 // BRW_OPCODE_BRD = 33, /**< Gen7+ */
623 BRW_OPCODE_IF = 34,
624 BRW_OPCODE_IFF = 35, /**< Pre-Gen6 */ /* Reused */
625 // BRW_OPCODE_BRC = 35, /**< Gen7+ */ /* Reused */
626 BRW_OPCODE_ELSE = 36,
627 BRW_OPCODE_ENDIF = 37,
628 BRW_OPCODE_DO = 38, /**< Pre-Gen6 */ /* Reused */
629 // BRW_OPCODE_CASE = 38, /**< Gen6 only */ /* Reused */
630 BRW_OPCODE_WHILE = 39,
631 BRW_OPCODE_BREAK = 40,
632 BRW_OPCODE_CONTINUE = 41,
633 BRW_OPCODE_HALT = 42,
634 // BRW_OPCODE_CALLA = 43, /**< Gen7.5+ */
635 // BRW_OPCODE_MSAVE = 44, /**< Pre-Gen6 */ /* Reused */
636 // BRW_OPCODE_CALL = 44, /**< Gen6+ */ /* Reused */
637 // BRW_OPCODE_MREST = 45, /**< Pre-Gen6 */ /* Reused */
638 // BRW_OPCODE_RET = 45, /**< Gen6+ */ /* Reused */
639 // BRW_OPCODE_PUSH = 46, /**< Pre-Gen6 */ /* Reused */
640 // BRW_OPCODE_FORK = 46, /**< Gen6 only */ /* Reused */
641 // BRW_OPCODE_GOTO = 46, /**< Gen8+ */ /* Reused */
642 // BRW_OPCODE_POP = 47, /**< Pre-Gen6 */
643 BRW_OPCODE_WAIT = 48,
644 BRW_OPCODE_SEND = 49,
645 BRW_OPCODE_SENDC = 50,
646 BRW_OPCODE_SENDS = 51, /**< Gen9+ */
647 BRW_OPCODE_SENDSC = 52, /**< Gen9+ */
648 /* Reserved 53-55 */
649 BRW_OPCODE_MATH = 56, /**< Gen6+ */
650 /* Reserved 57-63 */
651 BRW_OPCODE_ADD = 64,
652 BRW_OPCODE_MUL = 65,
653 BRW_OPCODE_AVG = 66,
654 BRW_OPCODE_FRC = 67,
655 BRW_OPCODE_RNDU = 68,
656 BRW_OPCODE_RNDD = 69,
657 BRW_OPCODE_RNDE = 70,
658 BRW_OPCODE_RNDZ = 71,
659 BRW_OPCODE_MAC = 72,
660 BRW_OPCODE_MACH = 73,
661 BRW_OPCODE_LZD = 74,
662 BRW_OPCODE_FBH = 75, /**< Gen7+ */
663 BRW_OPCODE_FBL = 76, /**< Gen7+ */
664 BRW_OPCODE_CBIT = 77, /**< Gen7+ */
665 BRW_OPCODE_ADDC = 78, /**< Gen7+ */
666 BRW_OPCODE_SUBB = 79, /**< Gen7+ */
667 BRW_OPCODE_SAD2 = 80,
668 BRW_OPCODE_SADA2 = 81,
669 /* Reserved 82-83 */
670 BRW_OPCODE_DP4 = 84,
671 BRW_OPCODE_DPH = 85,
672 BRW_OPCODE_DP3 = 86,
673 BRW_OPCODE_DP2 = 87,
674 /* Reserved 88 */
675 BRW_OPCODE_LINE = 89,
676 BRW_OPCODE_PLN = 90, /**< G45+ */
677 BRW_OPCODE_MAD = 91, /**< Gen6+ */
678 BRW_OPCODE_LRP = 92, /**< Gen6+ */
679 // BRW_OPCODE_MADM = 93, /**< Gen8+ */
680 /* Reserved 94-124 */
681 BRW_OPCODE_NENOP = 125, /**< G45 only */
682 BRW_OPCODE_NOP = 126,
683 /* Reserved 127 */
684
685 /* These are compiler backend opcodes that get translated into other
686 * instructions.
687 */
688 FS_OPCODE_FB_WRITE = 128,
689
690 /**
691 * Same as FS_OPCODE_FB_WRITE but expects its arguments separately as
692 * individual sources instead of as a single payload blob. The
693 * position/ordering of the arguments are defined by the enum
694 * fb_write_logical_srcs.
695 */
696 FS_OPCODE_FB_WRITE_LOGICAL,
697
698 FS_OPCODE_REP_FB_WRITE,
699
700 FS_OPCODE_FB_READ,
701 FS_OPCODE_FB_READ_LOGICAL,
702
703 SHADER_OPCODE_RCP,
704 SHADER_OPCODE_RSQ,
705 SHADER_OPCODE_SQRT,
706 SHADER_OPCODE_EXP2,
707 SHADER_OPCODE_LOG2,
708 SHADER_OPCODE_POW,
709 SHADER_OPCODE_INT_QUOTIENT,
710 SHADER_OPCODE_INT_REMAINDER,
711 SHADER_OPCODE_SIN,
712 SHADER_OPCODE_COS,
713
714 /**
715 * Texture sampling opcodes.
716 *
717 * LOGICAL opcodes are eventually translated to the matching non-LOGICAL
718 * opcode but instead of taking a single payload blob they expect their
719 * arguments separately as individual sources. The position/ordering of the
720 * arguments are defined by the enum tex_logical_srcs.
721 */
722 SHADER_OPCODE_TEX,
723 SHADER_OPCODE_TEX_LOGICAL,
724 SHADER_OPCODE_TXD,
725 SHADER_OPCODE_TXD_LOGICAL,
726 SHADER_OPCODE_TXF,
727 SHADER_OPCODE_TXF_LOGICAL,
728 SHADER_OPCODE_TXF_LZ,
729 SHADER_OPCODE_TXL,
730 SHADER_OPCODE_TXL_LOGICAL,
731 SHADER_OPCODE_TXL_LZ,
732 SHADER_OPCODE_TXS,
733 SHADER_OPCODE_TXS_LOGICAL,
734 FS_OPCODE_TXB,
735 FS_OPCODE_TXB_LOGICAL,
736 SHADER_OPCODE_TXF_CMS,
737 SHADER_OPCODE_TXF_CMS_LOGICAL,
738 SHADER_OPCODE_TXF_CMS_W,
739 SHADER_OPCODE_TXF_CMS_W_LOGICAL,
740 SHADER_OPCODE_TXF_UMS,
741 SHADER_OPCODE_TXF_UMS_LOGICAL,
742 SHADER_OPCODE_TXF_MCS,
743 SHADER_OPCODE_TXF_MCS_LOGICAL,
744 SHADER_OPCODE_LOD,
745 SHADER_OPCODE_LOD_LOGICAL,
746 SHADER_OPCODE_TG4,
747 SHADER_OPCODE_TG4_LOGICAL,
748 SHADER_OPCODE_TG4_OFFSET,
749 SHADER_OPCODE_TG4_OFFSET_LOGICAL,
750 SHADER_OPCODE_SAMPLEINFO,
751 SHADER_OPCODE_SAMPLEINFO_LOGICAL,
752
753 /**
754 * Combines multiple sources of size 1 into a larger virtual GRF.
755 * For example, parameters for a send-from-GRF message. Or, updating
756 * channels of a size 4 VGRF used to store vec4s such as texturing results.
757 *
758 * This will be lowered into MOVs from each source to consecutive offsets
759 * of the destination VGRF.
760 *
761 * src[0] may be BAD_FILE. If so, the lowering pass skips emitting the MOV,
762 * but still reserves the first channel of the destination VGRF. This can be
763 * used to reserve space for, say, a message header set up by the generators.
764 */
765 SHADER_OPCODE_LOAD_PAYLOAD,
766
767 /**
768 * Packs a number of sources into a single value. Unlike LOAD_PAYLOAD, this
769 * acts intra-channel, obtaining the final value for each channel by
770 * combining the sources values for the same channel, the first source
771 * occupying the lowest bits and the last source occupying the highest
772 * bits.
773 */
774 FS_OPCODE_PACK,
775
776 SHADER_OPCODE_SHADER_TIME_ADD,
777
778 /**
779 * Typed and untyped surface access opcodes.
780 *
781 * LOGICAL opcodes are eventually translated to the matching non-LOGICAL
782 * opcode but instead of taking a single payload blob they expect their
783 * arguments separately as individual sources:
784 *
785 * Source 0: [required] Surface coordinates.
786 * Source 1: [optional] Operation source.
787 * Source 2: [required] Surface index.
788 * Source 3: [required] Number of coordinate components (as UD immediate).
789 * Source 4: [required] Opcode-specific control immediate, same as source 2
790 * of the matching non-LOGICAL opcode.
791 */
792 SHADER_OPCODE_UNTYPED_ATOMIC,
793 SHADER_OPCODE_UNTYPED_ATOMIC_LOGICAL,
794 SHADER_OPCODE_UNTYPED_SURFACE_READ,
795 SHADER_OPCODE_UNTYPED_SURFACE_READ_LOGICAL,
796 SHADER_OPCODE_UNTYPED_SURFACE_WRITE,
797 SHADER_OPCODE_UNTYPED_SURFACE_WRITE_LOGICAL,
798
799 SHADER_OPCODE_TYPED_ATOMIC,
800 SHADER_OPCODE_TYPED_ATOMIC_LOGICAL,
801 SHADER_OPCODE_TYPED_SURFACE_READ,
802 SHADER_OPCODE_TYPED_SURFACE_READ_LOGICAL,
803 SHADER_OPCODE_TYPED_SURFACE_WRITE,
804 SHADER_OPCODE_TYPED_SURFACE_WRITE_LOGICAL,
805
806 SHADER_OPCODE_MEMORY_FENCE,
807
808 SHADER_OPCODE_GEN4_SCRATCH_READ,
809 SHADER_OPCODE_GEN4_SCRATCH_WRITE,
810 SHADER_OPCODE_GEN7_SCRATCH_READ,
811
812 /**
813 * Gen8+ SIMD8 URB Read messages.
814 */
815 SHADER_OPCODE_URB_READ_SIMD8,
816 SHADER_OPCODE_URB_READ_SIMD8_PER_SLOT,
817
818 SHADER_OPCODE_URB_WRITE_SIMD8,
819 SHADER_OPCODE_URB_WRITE_SIMD8_PER_SLOT,
820 SHADER_OPCODE_URB_WRITE_SIMD8_MASKED,
821 SHADER_OPCODE_URB_WRITE_SIMD8_MASKED_PER_SLOT,
822
823 /**
824 * Return the index of an arbitrary live channel (i.e. one of the channels
825 * enabled in the current execution mask) and assign it to the first
826 * component of the destination. Expected to be used as input for the
827 * BROADCAST pseudo-opcode.
828 */
829 SHADER_OPCODE_FIND_LIVE_CHANNEL,
830
831 /**
832 * Pick the channel from its first source register given by the index
833 * specified as second source. Useful for variable indexing of surfaces.
834 *
835 * Note that because the result of this instruction is by definition
836 * uniform and it can always be splatted to multiple channels using a
837 * scalar regioning mode, only the first channel of the destination region
838 * is guaranteed to be updated, which implies that BROADCAST instructions
839 * should usually be marked force_writemask_all.
840 */
841 SHADER_OPCODE_BROADCAST,
842
843 VEC4_OPCODE_MOV_BYTES,
844 VEC4_OPCODE_PACK_BYTES,
845 VEC4_OPCODE_UNPACK_UNIFORM,
846 VEC4_OPCODE_FROM_DOUBLE,
847 VEC4_OPCODE_TO_DOUBLE,
848 VEC4_OPCODE_PICK_LOW_32BIT,
849 VEC4_OPCODE_PICK_HIGH_32BIT,
850 VEC4_OPCODE_SET_LOW_32BIT,
851 VEC4_OPCODE_SET_HIGH_32BIT,
852
853 FS_OPCODE_DDX_COARSE,
854 FS_OPCODE_DDX_FINE,
855 /**
856 * Compute dFdy(), dFdyCoarse(), or dFdyFine().
857 */
858 FS_OPCODE_DDY_COARSE,
859 FS_OPCODE_DDY_FINE,
860 FS_OPCODE_CINTERP,
861 FS_OPCODE_LINTERP,
862 FS_OPCODE_PIXEL_X,
863 FS_OPCODE_PIXEL_Y,
864 FS_OPCODE_UNIFORM_PULL_CONSTANT_LOAD,
865 FS_OPCODE_UNIFORM_PULL_CONSTANT_LOAD_GEN7,
866 FS_OPCODE_VARYING_PULL_CONSTANT_LOAD_GEN4,
867 FS_OPCODE_VARYING_PULL_CONSTANT_LOAD_GEN7,
868 FS_OPCODE_VARYING_PULL_CONSTANT_LOAD_LOGICAL,
869 FS_OPCODE_GET_BUFFER_SIZE,
870 FS_OPCODE_MOV_DISPATCH_TO_FLAGS,
871 FS_OPCODE_DISCARD_JUMP,
872 FS_OPCODE_SET_SAMPLE_ID,
873 FS_OPCODE_PACK_HALF_2x16_SPLIT,
874 FS_OPCODE_UNPACK_HALF_2x16_SPLIT_X,
875 FS_OPCODE_UNPACK_HALF_2x16_SPLIT_Y,
876 FS_OPCODE_PLACEHOLDER_HALT,
877 FS_OPCODE_INTERPOLATE_AT_SAMPLE,
878 FS_OPCODE_INTERPOLATE_AT_SHARED_OFFSET,
879 FS_OPCODE_INTERPOLATE_AT_PER_SLOT_OFFSET,
880
881 VS_OPCODE_URB_WRITE,
882 VS_OPCODE_PULL_CONSTANT_LOAD,
883 VS_OPCODE_PULL_CONSTANT_LOAD_GEN7,
884 VS_OPCODE_SET_SIMD4X2_HEADER_GEN9,
885
886 VS_OPCODE_GET_BUFFER_SIZE,
887
888 VS_OPCODE_UNPACK_FLAGS_SIMD4X2,
889
890 /**
891 * Write geometry shader output data to the URB.
892 *
893 * Unlike VS_OPCODE_URB_WRITE, this opcode doesn't do an implied move from
894 * R0 to the first MRF. This allows the geometry shader to override the
895 * "Slot {0,1} Offset" fields in the message header.
896 */
897 GS_OPCODE_URB_WRITE,
898
899 /**
900 * Write geometry shader output data to the URB and request a new URB
901 * handle (gen6).
902 *
903 * This opcode doesn't do an implied move from R0 to the first MRF.
904 */
905 GS_OPCODE_URB_WRITE_ALLOCATE,
906
907 /**
908 * Terminate the geometry shader thread by doing an empty URB write.
909 *
910 * This opcode doesn't do an implied move from R0 to the first MRF. This
911 * allows the geometry shader to override the "GS Number of Output Vertices
912 * for Slot {0,1}" fields in the message header.
913 */
914 GS_OPCODE_THREAD_END,
915
916 /**
917 * Set the "Slot {0,1} Offset" fields of a URB_WRITE message header.
918 *
919 * - dst is the MRF containing the message header.
920 *
921 * - src0.x indicates which portion of the URB should be written to (e.g. a
922 * vertex number)
923 *
924 * - src1 is an immediate multiplier which will be applied to src0
925 * (e.g. the size of a single vertex in the URB).
926 *
927 * Note: the hardware will apply this offset *in addition to* the offset in
928 * vec4_instruction::offset.
929 */
930 GS_OPCODE_SET_WRITE_OFFSET,
931
932 /**
933 * Set the "GS Number of Output Vertices for Slot {0,1}" fields of a
934 * URB_WRITE message header.
935 *
936 * - dst is the MRF containing the message header.
937 *
938 * - src0.x is the vertex count. The upper 16 bits will be ignored.
939 */
940 GS_OPCODE_SET_VERTEX_COUNT,
941
942 /**
943 * Set DWORD 2 of dst to the value in src.
944 */
945 GS_OPCODE_SET_DWORD_2,
946
947 /**
948 * Prepare the dst register for storage in the "Channel Mask" fields of a
949 * URB_WRITE message header.
950 *
951 * DWORD 4 of dst is shifted left by 4 bits, so that later,
952 * GS_OPCODE_SET_CHANNEL_MASKS can OR DWORDs 0 and 4 together to form the
953 * final channel mask.
954 *
955 * Note: since GS_OPCODE_SET_CHANNEL_MASKS ORs DWORDs 0 and 4 together to
956 * form the final channel mask, DWORDs 0 and 4 of the dst register must not
957 * have any extraneous bits set prior to execution of this opcode (that is,
958 * they should be in the range 0x0 to 0xf).
959 */
960 GS_OPCODE_PREPARE_CHANNEL_MASKS,
961
962 /**
963 * Set the "Channel Mask" fields of a URB_WRITE message header.
964 *
965 * - dst is the MRF containing the message header.
966 *
967 * - src.x is the channel mask, as prepared by
968 * GS_OPCODE_PREPARE_CHANNEL_MASKS. DWORDs 0 and 4 are OR'ed together to
969 * form the final channel mask.
970 */
971 GS_OPCODE_SET_CHANNEL_MASKS,
972
973 /**
974 * Get the "Instance ID" fields from the payload.
975 *
976 * - dst is the GRF for gl_InvocationID.
977 */
978 GS_OPCODE_GET_INSTANCE_ID,
979
980 /**
981 * Send a FF_SYNC message to allocate initial URB handles (gen6).
982 *
983 * - dst will be used as the writeback register for the FF_SYNC operation.
984 *
985 * - src0 is the number of primitives written.
986 *
987 * - src1 is the value to hold in M0.0: number of SO vertices to write
988 * and number of SO primitives needed. Its value will be overwritten
989 * with the SVBI values if transform feedback is enabled.
990 *
991 * Note: This opcode uses an implicit MRF register for the ff_sync message
992 * header, so the caller is expected to set inst->base_mrf and initialize
993 * that MRF register to r0. This opcode will also write to this MRF register
994 * to include the allocated URB handle so it can then be reused directly as
995 * the header in the URB write operation we are allocating the handle for.
996 */
997 GS_OPCODE_FF_SYNC,
998
999 /**
1000 * Move r0.1 (which holds PrimitiveID information in gen6) to a separate
1001 * register.
1002 *
1003 * - dst is the GRF where PrimitiveID information will be moved.
1004 */
1005 GS_OPCODE_SET_PRIMITIVE_ID,
1006
1007 /**
1008 * Write transform feedback data to the SVB by sending a SVB WRITE message.
1009 * Used in gen6.
1010 *
1011 * - dst is the MRF register containing the message header.
1012 *
1013 * - src0 is the register where the vertex data is going to be copied from.
1014 *
1015 * - src1 is the destination register when write commit occurs.
1016 */
1017 GS_OPCODE_SVB_WRITE,
1018
1019 /**
1020 * Set destination index in the SVB write message payload (M0.5). Used
1021 * in gen6 for transform feedback.
1022 *
1023 * - dst is the header to save the destination indices for SVB WRITE.
1024 * - src is the register that holds the destination indices value.
1025 */
1026 GS_OPCODE_SVB_SET_DST_INDEX,
1027
1028 /**
1029 * Prepare Mx.0 subregister for being used in the FF_SYNC message header.
1030 * Used in gen6 for transform feedback.
1031 *
1032 * - dst will hold the register with the final Mx.0 value.
1033 *
1034 * - src0 has the number of vertices emitted in SO (NumSOVertsToWrite)
1035 *
1036 * - src1 has the number of needed primitives for SO (NumSOPrimsNeeded)
1037 *
1038 * - src2 is the value to hold in M0: number of SO vertices to write
1039 * and number of SO primitives needed.
1040 */
1041 GS_OPCODE_FF_SYNC_SET_PRIMITIVES,
1042
1043 /**
1044 * Terminate the compute shader.
1045 */
1046 CS_OPCODE_CS_TERMINATE,
1047
1048 /**
1049 * GLSL barrier()
1050 */
1051 SHADER_OPCODE_BARRIER,
1052
1053 /**
1054 * Calculate the high 32-bits of a 32x32 multiply.
1055 */
1056 SHADER_OPCODE_MULH,
1057
1058 /**
1059 * A MOV that uses VxH indirect addressing.
1060 *
1061 * Source 0: A register to start from (HW_REG).
1062 * Source 1: An indirect offset (in bytes, UD GRF).
1063 * Source 2: The length of the region that could be accessed (in bytes,
1064 * UD immediate).
1065 */
1066 SHADER_OPCODE_MOV_INDIRECT,
1067
1068 VEC4_OPCODE_URB_READ,
1069 TCS_OPCODE_GET_INSTANCE_ID,
1070 TCS_OPCODE_URB_WRITE,
1071 TCS_OPCODE_SET_INPUT_URB_OFFSETS,
1072 TCS_OPCODE_SET_OUTPUT_URB_OFFSETS,
1073 TCS_OPCODE_GET_PRIMITIVE_ID,
1074 TCS_OPCODE_CREATE_BARRIER_HEADER,
1075 TCS_OPCODE_SRC0_010_IS_ZERO,
1076 TCS_OPCODE_RELEASE_INPUT,
1077 TCS_OPCODE_THREAD_END,
1078
1079 TES_OPCODE_GET_PRIMITIVE_ID,
1080 TES_OPCODE_CREATE_INPUT_READ_HEADER,
1081 TES_OPCODE_ADD_INDIRECT_URB_OFFSET,
1082 };
1083
1084 enum brw_urb_write_flags {
1085 BRW_URB_WRITE_NO_FLAGS = 0,
1086
1087 /**
1088 * Causes a new URB entry to be allocated, and its address stored in the
1089 * destination register (gen < 7).
1090 */
1091 BRW_URB_WRITE_ALLOCATE = 0x1,
1092
1093 /**
1094 * Causes the current URB entry to be deallocated (gen < 7).
1095 */
1096 BRW_URB_WRITE_UNUSED = 0x2,
1097
1098 /**
1099 * Causes the thread to terminate.
1100 */
1101 BRW_URB_WRITE_EOT = 0x4,
1102
1103 /**
1104 * Indicates that the given URB entry is complete, and may be sent further
1105 * down the 3D pipeline (gen < 7).
1106 */
1107 BRW_URB_WRITE_COMPLETE = 0x8,
1108
1109 /**
1110 * Indicates that an additional offset (which may be different for the two
1111 * vec4 slots) is stored in the message header (gen == 7).
1112 */
1113 BRW_URB_WRITE_PER_SLOT_OFFSET = 0x10,
1114
1115 /**
1116 * Indicates that the channel masks in the URB_WRITE message header should
1117 * not be overridden to 0xff (gen == 7).
1118 */
1119 BRW_URB_WRITE_USE_CHANNEL_MASKS = 0x20,
1120
1121 /**
1122 * Indicates that the data should be sent to the URB using the
1123 * URB_WRITE_OWORD message rather than URB_WRITE_HWORD (gen == 7). This
1124 * causes offsets to be interpreted as multiples of an OWORD instead of an
1125 * HWORD, and only allows one OWORD to be written.
1126 */
1127 BRW_URB_WRITE_OWORD = 0x40,
1128
1129 /**
1130 * Convenient combination of flags: end the thread while simultaneously
1131 * marking the given URB entry as complete.
1132 */
1133 BRW_URB_WRITE_EOT_COMPLETE = BRW_URB_WRITE_EOT | BRW_URB_WRITE_COMPLETE,
1134
1135 /**
1136 * Convenient combination of flags: mark the given URB entry as complete
1137 * and simultaneously allocate a new one.
1138 */
1139 BRW_URB_WRITE_ALLOCATE_COMPLETE =
1140 BRW_URB_WRITE_ALLOCATE | BRW_URB_WRITE_COMPLETE,
1141 };
1142
1143 enum fb_write_logical_srcs {
1144 FB_WRITE_LOGICAL_SRC_COLOR0, /* REQUIRED */
1145 FB_WRITE_LOGICAL_SRC_COLOR1, /* for dual source blend messages */
1146 FB_WRITE_LOGICAL_SRC_SRC0_ALPHA,
1147 FB_WRITE_LOGICAL_SRC_SRC_DEPTH, /* gl_FragDepth */
1148 FB_WRITE_LOGICAL_SRC_DST_DEPTH, /* GEN4-5: passthrough from thread */
1149 FB_WRITE_LOGICAL_SRC_SRC_STENCIL, /* gl_FragStencilRefARB */
1150 FB_WRITE_LOGICAL_SRC_OMASK, /* Sample Mask (gl_SampleMask) */
1151 FB_WRITE_LOGICAL_SRC_COMPONENTS, /* REQUIRED */
1152 FB_WRITE_LOGICAL_NUM_SRCS
1153 };
1154
1155 enum tex_logical_srcs {
1156 /** Texture coordinates */
1157 TEX_LOGICAL_SRC_COORDINATE,
1158 /** Shadow comparator */
1159 TEX_LOGICAL_SRC_SHADOW_C,
1160 /** dPdx if the operation takes explicit derivatives, otherwise LOD value */
1161 TEX_LOGICAL_SRC_LOD,
1162 /** dPdy if the operation takes explicit derivatives */
1163 TEX_LOGICAL_SRC_LOD2,
1164 /** Sample index */
1165 TEX_LOGICAL_SRC_SAMPLE_INDEX,
1166 /** MCS data */
1167 TEX_LOGICAL_SRC_MCS,
1168 /** REQUIRED: Texture surface index */
1169 TEX_LOGICAL_SRC_SURFACE,
1170 /** Texture sampler index */
1171 TEX_LOGICAL_SRC_SAMPLER,
1172 /** Texel offset for gathers */
1173 TEX_LOGICAL_SRC_TG4_OFFSET,
1174 /** REQUIRED: Number of coordinate components (as UD immediate) */
1175 TEX_LOGICAL_SRC_COORD_COMPONENTS,
1176 /** REQUIRED: Number of derivative components (as UD immediate) */
1177 TEX_LOGICAL_SRC_GRAD_COMPONENTS,
1178
1179 TEX_LOGICAL_NUM_SRCS,
1180 };
1181
1182 #ifdef __cplusplus
1183 /**
1184 * Allow brw_urb_write_flags enums to be ORed together.
1185 */
1186 inline brw_urb_write_flags
1187 operator|(brw_urb_write_flags x, brw_urb_write_flags y)
1188 {
1189 return static_cast<brw_urb_write_flags>(static_cast<int>(x) |
1190 static_cast<int>(y));
1191 }
1192 #endif
1193
1194 enum PACKED brw_predicate {
1195 BRW_PREDICATE_NONE = 0,
1196 BRW_PREDICATE_NORMAL = 1,
1197 BRW_PREDICATE_ALIGN1_ANYV = 2,
1198 BRW_PREDICATE_ALIGN1_ALLV = 3,
1199 BRW_PREDICATE_ALIGN1_ANY2H = 4,
1200 BRW_PREDICATE_ALIGN1_ALL2H = 5,
1201 BRW_PREDICATE_ALIGN1_ANY4H = 6,
1202 BRW_PREDICATE_ALIGN1_ALL4H = 7,
1203 BRW_PREDICATE_ALIGN1_ANY8H = 8,
1204 BRW_PREDICATE_ALIGN1_ALL8H = 9,
1205 BRW_PREDICATE_ALIGN1_ANY16H = 10,
1206 BRW_PREDICATE_ALIGN1_ALL16H = 11,
1207 BRW_PREDICATE_ALIGN1_ANY32H = 12,
1208 BRW_PREDICATE_ALIGN1_ALL32H = 13,
1209 BRW_PREDICATE_ALIGN16_REPLICATE_X = 2,
1210 BRW_PREDICATE_ALIGN16_REPLICATE_Y = 3,
1211 BRW_PREDICATE_ALIGN16_REPLICATE_Z = 4,
1212 BRW_PREDICATE_ALIGN16_REPLICATE_W = 5,
1213 BRW_PREDICATE_ALIGN16_ANY4H = 6,
1214 BRW_PREDICATE_ALIGN16_ALL4H = 7,
1215 };
1216
1217 enum PACKED brw_reg_file {
1218 BRW_ARCHITECTURE_REGISTER_FILE = 0,
1219 BRW_GENERAL_REGISTER_FILE = 1,
1220 BRW_MESSAGE_REGISTER_FILE = 2,
1221 BRW_IMMEDIATE_VALUE = 3,
1222
1223 ARF = BRW_ARCHITECTURE_REGISTER_FILE,
1224 FIXED_GRF = BRW_GENERAL_REGISTER_FILE,
1225 MRF = BRW_MESSAGE_REGISTER_FILE,
1226 IMM = BRW_IMMEDIATE_VALUE,
1227
1228 /* These are not hardware values */
1229 VGRF,
1230 ATTR,
1231 UNIFORM, /* prog_data->params[reg] */
1232 BAD_FILE,
1233 };
1234
1235 #define BRW_HW_REG_TYPE_UD 0
1236 #define BRW_HW_REG_TYPE_D 1
1237 #define BRW_HW_REG_TYPE_UW 2
1238 #define BRW_HW_REG_TYPE_W 3
1239 #define BRW_HW_REG_TYPE_F 7
1240 #define GEN8_HW_REG_TYPE_UQ 8
1241 #define GEN8_HW_REG_TYPE_Q 9
1242
1243 #define BRW_HW_REG_NON_IMM_TYPE_UB 4
1244 #define BRW_HW_REG_NON_IMM_TYPE_B 5
1245 #define GEN7_HW_REG_NON_IMM_TYPE_DF 6
1246 #define GEN8_HW_REG_NON_IMM_TYPE_HF 10
1247
1248 #define BRW_HW_REG_IMM_TYPE_UV 4 /* Gen6+ packed unsigned immediate vector */
1249 #define BRW_HW_REG_IMM_TYPE_VF 5 /* packed float immediate vector */
1250 #define BRW_HW_REG_IMM_TYPE_V 6 /* packed int imm. vector; uword dest only */
1251 #define GEN8_HW_REG_IMM_TYPE_DF 10
1252 #define GEN8_HW_REG_IMM_TYPE_HF 11
1253
1254 /* SNB adds 3-src instructions (MAD and LRP) that only operate on floats, so
1255 * the types were implied. IVB adds BFE and BFI2 that operate on doublewords
1256 * and unsigned doublewords, so a new field is also available in the da3src
1257 * struct (part of struct brw_instruction.bits1 in brw_structs.h) to select
1258 * dst and shared-src types. The values are different from BRW_REGISTER_TYPE_*.
1259 */
1260 #define BRW_3SRC_TYPE_F 0
1261 #define BRW_3SRC_TYPE_D 1
1262 #define BRW_3SRC_TYPE_UD 2
1263 #define BRW_3SRC_TYPE_DF 3
1264
1265 #define BRW_ARF_NULL 0x00
1266 #define BRW_ARF_ADDRESS 0x10
1267 #define BRW_ARF_ACCUMULATOR 0x20
1268 #define BRW_ARF_FLAG 0x30
1269 #define BRW_ARF_MASK 0x40
1270 #define BRW_ARF_MASK_STACK 0x50
1271 #define BRW_ARF_MASK_STACK_DEPTH 0x60
1272 #define BRW_ARF_STATE 0x70
1273 #define BRW_ARF_CONTROL 0x80
1274 #define BRW_ARF_NOTIFICATION_COUNT 0x90
1275 #define BRW_ARF_IP 0xA0
1276 #define BRW_ARF_TDR 0xB0
1277 #define BRW_ARF_TIMESTAMP 0xC0
1278
1279 #define BRW_MRF_COMPR4 (1 << 7)
1280
1281 #define BRW_AMASK 0
1282 #define BRW_IMASK 1
1283 #define BRW_LMASK 2
1284 #define BRW_CMASK 3
1285
1286
1287
1288 #define BRW_THREAD_NORMAL 0
1289 #define BRW_THREAD_ATOMIC 1
1290 #define BRW_THREAD_SWITCH 2
1291
1292 enum PACKED brw_vertical_stride {
1293 BRW_VERTICAL_STRIDE_0 = 0,
1294 BRW_VERTICAL_STRIDE_1 = 1,
1295 BRW_VERTICAL_STRIDE_2 = 2,
1296 BRW_VERTICAL_STRIDE_4 = 3,
1297 BRW_VERTICAL_STRIDE_8 = 4,
1298 BRW_VERTICAL_STRIDE_16 = 5,
1299 BRW_VERTICAL_STRIDE_32 = 6,
1300 BRW_VERTICAL_STRIDE_ONE_DIMENSIONAL = 0xF,
1301 };
1302
1303 enum PACKED brw_width {
1304 BRW_WIDTH_1 = 0,
1305 BRW_WIDTH_2 = 1,
1306 BRW_WIDTH_4 = 2,
1307 BRW_WIDTH_8 = 3,
1308 BRW_WIDTH_16 = 4,
1309 };
1310
1311 /**
1312 * Message target: Shared Function ID for where to SEND a message.
1313 *
1314 * These are enumerated in the ISA reference under "send - Send Message".
1315 * In particular, see the following tables:
1316 * - G45 PRM, Volume 4, Table 14-15 "Message Descriptor Definition"
1317 * - Sandybridge PRM, Volume 4 Part 2, Table 8-16 "Extended Message Descriptor"
1318 * - Ivybridge PRM, Volume 1 Part 1, section 3.2.7 "GPE Function IDs"
1319 */
1320 enum brw_message_target {
1321 BRW_SFID_NULL = 0,
1322 BRW_SFID_MATH = 1, /* Only valid on Gen4-5 */
1323 BRW_SFID_SAMPLER = 2,
1324 BRW_SFID_MESSAGE_GATEWAY = 3,
1325 BRW_SFID_DATAPORT_READ = 4,
1326 BRW_SFID_DATAPORT_WRITE = 5,
1327 BRW_SFID_URB = 6,
1328 BRW_SFID_THREAD_SPAWNER = 7,
1329 BRW_SFID_VME = 8,
1330
1331 GEN6_SFID_DATAPORT_SAMPLER_CACHE = 4,
1332 GEN6_SFID_DATAPORT_RENDER_CACHE = 5,
1333 GEN6_SFID_DATAPORT_CONSTANT_CACHE = 9,
1334
1335 GEN7_SFID_DATAPORT_DATA_CACHE = 10,
1336 GEN7_SFID_PIXEL_INTERPOLATOR = 11,
1337 HSW_SFID_DATAPORT_DATA_CACHE_1 = 12,
1338 HSW_SFID_CRE = 13,
1339 };
1340
1341 #define GEN7_MESSAGE_TARGET_DP_DATA_CACHE 10
1342
1343 #define BRW_SAMPLER_RETURN_FORMAT_FLOAT32 0
1344 #define BRW_SAMPLER_RETURN_FORMAT_UINT32 2
1345 #define BRW_SAMPLER_RETURN_FORMAT_SINT32 3
1346
1347 #define BRW_SAMPLER_MESSAGE_SIMD8_SAMPLE 0
1348 #define BRW_SAMPLER_MESSAGE_SIMD16_SAMPLE 0
1349 #define BRW_SAMPLER_MESSAGE_SIMD16_SAMPLE_BIAS 0
1350 #define BRW_SAMPLER_MESSAGE_SIMD8_KILLPIX 1
1351 #define BRW_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_LOD 1
1352 #define BRW_SAMPLER_MESSAGE_SIMD16_SAMPLE_LOD 1
1353 #define BRW_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_GRADIENTS 2
1354 #define BRW_SAMPLER_MESSAGE_SIMD8_SAMPLE_GRADIENTS 2
1355 #define BRW_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_COMPARE 0
1356 #define BRW_SAMPLER_MESSAGE_SIMD16_SAMPLE_COMPARE 2
1357 #define BRW_SAMPLER_MESSAGE_SIMD8_SAMPLE_BIAS_COMPARE 0
1358 #define BRW_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_LOD_COMPARE 1
1359 #define BRW_SAMPLER_MESSAGE_SIMD8_SAMPLE_LOD_COMPARE 1
1360 #define BRW_SAMPLER_MESSAGE_SIMD4X2_RESINFO 2
1361 #define BRW_SAMPLER_MESSAGE_SIMD16_RESINFO 2
1362 #define BRW_SAMPLER_MESSAGE_SIMD4X2_LD 3
1363 #define BRW_SAMPLER_MESSAGE_SIMD8_LD 3
1364 #define BRW_SAMPLER_MESSAGE_SIMD16_LD 3
1365
1366 #define GEN5_SAMPLER_MESSAGE_SAMPLE 0
1367 #define GEN5_SAMPLER_MESSAGE_SAMPLE_BIAS 1
1368 #define GEN5_SAMPLER_MESSAGE_SAMPLE_LOD 2
1369 #define GEN5_SAMPLER_MESSAGE_SAMPLE_COMPARE 3
1370 #define GEN5_SAMPLER_MESSAGE_SAMPLE_DERIVS 4
1371 #define GEN5_SAMPLER_MESSAGE_SAMPLE_BIAS_COMPARE 5
1372 #define GEN5_SAMPLER_MESSAGE_SAMPLE_LOD_COMPARE 6
1373 #define GEN5_SAMPLER_MESSAGE_SAMPLE_LD 7
1374 #define GEN7_SAMPLER_MESSAGE_SAMPLE_GATHER4 8
1375 #define GEN5_SAMPLER_MESSAGE_LOD 9
1376 #define GEN5_SAMPLER_MESSAGE_SAMPLE_RESINFO 10
1377 #define GEN6_SAMPLER_MESSAGE_SAMPLE_SAMPLEINFO 11
1378 #define GEN7_SAMPLER_MESSAGE_SAMPLE_GATHER4_C 16
1379 #define GEN7_SAMPLER_MESSAGE_SAMPLE_GATHER4_PO 17
1380 #define GEN7_SAMPLER_MESSAGE_SAMPLE_GATHER4_PO_C 18
1381 #define HSW_SAMPLER_MESSAGE_SAMPLE_DERIV_COMPARE 20
1382 #define GEN9_SAMPLER_MESSAGE_SAMPLE_LZ 24
1383 #define GEN9_SAMPLER_MESSAGE_SAMPLE_C_LZ 25
1384 #define GEN9_SAMPLER_MESSAGE_SAMPLE_LD_LZ 26
1385 #define GEN9_SAMPLER_MESSAGE_SAMPLE_LD2DMS_W 28
1386 #define GEN7_SAMPLER_MESSAGE_SAMPLE_LD_MCS 29
1387 #define GEN7_SAMPLER_MESSAGE_SAMPLE_LD2DMS 30
1388 #define GEN7_SAMPLER_MESSAGE_SAMPLE_LD2DSS 31
1389
1390 /* for GEN5 only */
1391 #define BRW_SAMPLER_SIMD_MODE_SIMD4X2 0
1392 #define BRW_SAMPLER_SIMD_MODE_SIMD8 1
1393 #define BRW_SAMPLER_SIMD_MODE_SIMD16 2
1394 #define BRW_SAMPLER_SIMD_MODE_SIMD32_64 3
1395
1396 /* GEN9 changes SIMD mode 0 to mean SIMD8D, but lets us get the SIMD4x2
1397 * behavior by setting bit 22 of dword 2 in the message header. */
1398 #define GEN9_SAMPLER_SIMD_MODE_SIMD8D 0
1399 #define GEN9_SAMPLER_SIMD_MODE_EXTENSION_SIMD4X2 (1 << 22)
1400
1401 #define BRW_DATAPORT_OWORD_BLOCK_1_OWORDLOW 0
1402 #define BRW_DATAPORT_OWORD_BLOCK_1_OWORDHIGH 1
1403 #define BRW_DATAPORT_OWORD_BLOCK_2_OWORDS 2
1404 #define BRW_DATAPORT_OWORD_BLOCK_4_OWORDS 3
1405 #define BRW_DATAPORT_OWORD_BLOCK_8_OWORDS 4
1406 #define BRW_DATAPORT_OWORD_BLOCK_DWORDS(n) \
1407 ((n) == 4 ? BRW_DATAPORT_OWORD_BLOCK_1_OWORDLOW : \
1408 (n) == 8 ? BRW_DATAPORT_OWORD_BLOCK_2_OWORDS : \
1409 (n) == 16 ? BRW_DATAPORT_OWORD_BLOCK_4_OWORDS : \
1410 (n) == 32 ? BRW_DATAPORT_OWORD_BLOCK_8_OWORDS : \
1411 (abort(), ~0))
1412
1413 #define BRW_DATAPORT_OWORD_DUAL_BLOCK_1OWORD 0
1414 #define BRW_DATAPORT_OWORD_DUAL_BLOCK_4OWORDS 2
1415
1416 #define BRW_DATAPORT_DWORD_SCATTERED_BLOCK_8DWORDS 2
1417 #define BRW_DATAPORT_DWORD_SCATTERED_BLOCK_16DWORDS 3
1418
1419 /* This one stays the same across generations. */
1420 #define BRW_DATAPORT_READ_MESSAGE_OWORD_BLOCK_READ 0
1421 /* GEN4 */
1422 #define BRW_DATAPORT_READ_MESSAGE_OWORD_DUAL_BLOCK_READ 1
1423 #define BRW_DATAPORT_READ_MESSAGE_MEDIA_BLOCK_READ 2
1424 #define BRW_DATAPORT_READ_MESSAGE_DWORD_SCATTERED_READ 3
1425 /* G45, GEN5 */
1426 #define G45_DATAPORT_READ_MESSAGE_RENDER_UNORM_READ 1
1427 #define G45_DATAPORT_READ_MESSAGE_OWORD_DUAL_BLOCK_READ 2
1428 #define G45_DATAPORT_READ_MESSAGE_AVC_LOOP_FILTER_READ 3
1429 #define G45_DATAPORT_READ_MESSAGE_MEDIA_BLOCK_READ 4
1430 #define G45_DATAPORT_READ_MESSAGE_DWORD_SCATTERED_READ 6
1431 /* GEN6 */
1432 #define GEN6_DATAPORT_READ_MESSAGE_RENDER_UNORM_READ 1
1433 #define GEN6_DATAPORT_READ_MESSAGE_OWORD_DUAL_BLOCK_READ 2
1434 #define GEN6_DATAPORT_READ_MESSAGE_MEDIA_BLOCK_READ 4
1435 #define GEN6_DATAPORT_READ_MESSAGE_OWORD_UNALIGN_BLOCK_READ 5
1436 #define GEN6_DATAPORT_READ_MESSAGE_DWORD_SCATTERED_READ 6
1437
1438 #define BRW_DATAPORT_READ_TARGET_DATA_CACHE 0
1439 #define BRW_DATAPORT_READ_TARGET_RENDER_CACHE 1
1440 #define BRW_DATAPORT_READ_TARGET_SAMPLER_CACHE 2
1441
1442 #define BRW_DATAPORT_RENDER_TARGET_WRITE_SIMD16_SINGLE_SOURCE 0
1443 #define BRW_DATAPORT_RENDER_TARGET_WRITE_SIMD16_SINGLE_SOURCE_REPLICATED 1
1444 #define BRW_DATAPORT_RENDER_TARGET_WRITE_SIMD8_DUAL_SOURCE_SUBSPAN01 2
1445 #define BRW_DATAPORT_RENDER_TARGET_WRITE_SIMD8_DUAL_SOURCE_SUBSPAN23 3
1446 #define BRW_DATAPORT_RENDER_TARGET_WRITE_SIMD8_SINGLE_SOURCE_SUBSPAN01 4
1447
1448 #define BRW_DATAPORT_WRITE_MESSAGE_OWORD_BLOCK_WRITE 0
1449 #define BRW_DATAPORT_WRITE_MESSAGE_OWORD_DUAL_BLOCK_WRITE 1
1450 #define BRW_DATAPORT_WRITE_MESSAGE_MEDIA_BLOCK_WRITE 2
1451 #define BRW_DATAPORT_WRITE_MESSAGE_DWORD_SCATTERED_WRITE 3
1452 #define BRW_DATAPORT_WRITE_MESSAGE_RENDER_TARGET_WRITE 4
1453 #define BRW_DATAPORT_WRITE_MESSAGE_STREAMED_VERTEX_BUFFER_WRITE 5
1454 #define BRW_DATAPORT_WRITE_MESSAGE_FLUSH_RENDER_CACHE 7
1455
1456 /* GEN6 */
1457 #define GEN6_DATAPORT_WRITE_MESSAGE_DWORD_ATOMIC_WRITE 7
1458 #define GEN6_DATAPORT_WRITE_MESSAGE_OWORD_BLOCK_WRITE 8
1459 #define GEN6_DATAPORT_WRITE_MESSAGE_OWORD_DUAL_BLOCK_WRITE 9
1460 #define GEN6_DATAPORT_WRITE_MESSAGE_MEDIA_BLOCK_WRITE 10
1461 #define GEN6_DATAPORT_WRITE_MESSAGE_DWORD_SCATTERED_WRITE 11
1462 #define GEN6_DATAPORT_WRITE_MESSAGE_RENDER_TARGET_WRITE 12
1463 #define GEN6_DATAPORT_WRITE_MESSAGE_STREAMED_VB_WRITE 13
1464 #define GEN6_DATAPORT_WRITE_MESSAGE_RENDER_TARGET_UNORM_WRITE 14
1465
1466 /* GEN7 */
1467 #define GEN7_DATAPORT_RC_MEDIA_BLOCK_READ 4
1468 #define GEN7_DATAPORT_RC_TYPED_SURFACE_READ 5
1469 #define GEN7_DATAPORT_RC_TYPED_ATOMIC_OP 6
1470 #define GEN7_DATAPORT_RC_MEMORY_FENCE 7
1471 #define GEN7_DATAPORT_RC_MEDIA_BLOCK_WRITE 10
1472 #define GEN7_DATAPORT_RC_RENDER_TARGET_WRITE 12
1473 #define GEN7_DATAPORT_RC_TYPED_SURFACE_WRITE 13
1474 #define GEN7_DATAPORT_DC_OWORD_BLOCK_READ 0
1475 #define GEN7_DATAPORT_DC_UNALIGNED_OWORD_BLOCK_READ 1
1476 #define GEN7_DATAPORT_DC_OWORD_DUAL_BLOCK_READ 2
1477 #define GEN7_DATAPORT_DC_DWORD_SCATTERED_READ 3
1478 #define GEN7_DATAPORT_DC_BYTE_SCATTERED_READ 4
1479 #define GEN7_DATAPORT_DC_UNTYPED_SURFACE_READ 5
1480 #define GEN7_DATAPORT_DC_UNTYPED_ATOMIC_OP 6
1481 #define GEN7_DATAPORT_DC_MEMORY_FENCE 7
1482 #define GEN7_DATAPORT_DC_OWORD_BLOCK_WRITE 8
1483 #define GEN7_DATAPORT_DC_OWORD_DUAL_BLOCK_WRITE 10
1484 #define GEN7_DATAPORT_DC_DWORD_SCATTERED_WRITE 11
1485 #define GEN7_DATAPORT_DC_BYTE_SCATTERED_WRITE 12
1486 #define GEN7_DATAPORT_DC_UNTYPED_SURFACE_WRITE 13
1487
1488 #define GEN7_DATAPORT_SCRATCH_READ ((1 << 18) | \
1489 (0 << 17))
1490 #define GEN7_DATAPORT_SCRATCH_WRITE ((1 << 18) | \
1491 (1 << 17))
1492 #define GEN7_DATAPORT_SCRATCH_NUM_REGS_SHIFT 12
1493
1494 #define GEN7_PIXEL_INTERPOLATOR_LOC_SHARED_OFFSET 0
1495 #define GEN7_PIXEL_INTERPOLATOR_LOC_SAMPLE 1
1496 #define GEN7_PIXEL_INTERPOLATOR_LOC_CENTROID 2
1497 #define GEN7_PIXEL_INTERPOLATOR_LOC_PER_SLOT_OFFSET 3
1498
1499 /* HSW */
1500 #define HSW_DATAPORT_DC_PORT0_OWORD_BLOCK_READ 0
1501 #define HSW_DATAPORT_DC_PORT0_UNALIGNED_OWORD_BLOCK_READ 1
1502 #define HSW_DATAPORT_DC_PORT0_OWORD_DUAL_BLOCK_READ 2
1503 #define HSW_DATAPORT_DC_PORT0_DWORD_SCATTERED_READ 3
1504 #define HSW_DATAPORT_DC_PORT0_BYTE_SCATTERED_READ 4
1505 #define HSW_DATAPORT_DC_PORT0_MEMORY_FENCE 7
1506 #define HSW_DATAPORT_DC_PORT0_OWORD_BLOCK_WRITE 8
1507 #define HSW_DATAPORT_DC_PORT0_OWORD_DUAL_BLOCK_WRITE 10
1508 #define HSW_DATAPORT_DC_PORT0_DWORD_SCATTERED_WRITE 11
1509 #define HSW_DATAPORT_DC_PORT0_BYTE_SCATTERED_WRITE 12
1510
1511 #define HSW_DATAPORT_DC_PORT1_UNTYPED_SURFACE_READ 1
1512 #define HSW_DATAPORT_DC_PORT1_UNTYPED_ATOMIC_OP 2
1513 #define HSW_DATAPORT_DC_PORT1_UNTYPED_ATOMIC_OP_SIMD4X2 3
1514 #define HSW_DATAPORT_DC_PORT1_MEDIA_BLOCK_READ 4
1515 #define HSW_DATAPORT_DC_PORT1_TYPED_SURFACE_READ 5
1516 #define HSW_DATAPORT_DC_PORT1_TYPED_ATOMIC_OP 6
1517 #define HSW_DATAPORT_DC_PORT1_TYPED_ATOMIC_OP_SIMD4X2 7
1518 #define HSW_DATAPORT_DC_PORT1_UNTYPED_SURFACE_WRITE 9
1519 #define HSW_DATAPORT_DC_PORT1_MEDIA_BLOCK_WRITE 10
1520 #define HSW_DATAPORT_DC_PORT1_ATOMIC_COUNTER_OP 11
1521 #define HSW_DATAPORT_DC_PORT1_ATOMIC_COUNTER_OP_SIMD4X2 12
1522 #define HSW_DATAPORT_DC_PORT1_TYPED_SURFACE_WRITE 13
1523
1524 /* GEN9 */
1525 #define GEN9_DATAPORT_RC_RENDER_TARGET_WRITE 12
1526 #define GEN9_DATAPORT_RC_RENDER_TARGET_READ 13
1527
1528 /* Dataport special binding table indices: */
1529 #define BRW_BTI_STATELESS 255
1530 #define GEN7_BTI_SLM 254
1531 /* Note that on Gen8+ BTI 255 was redefined to be IA-coherent according to the
1532 * hardware spec, however because the DRM sets bit 4 of HDC_CHICKEN0 on BDW,
1533 * CHV and at least some pre-production steppings of SKL due to
1534 * WaForceEnableNonCoherent, HDC memory access may have been overridden by the
1535 * kernel to be non-coherent (matching the behavior of the same BTI on
1536 * pre-Gen8 hardware) and BTI 255 may actually be an alias for BTI 253.
1537 */
1538 #define GEN8_BTI_STATELESS_IA_COHERENT 255
1539 #define GEN8_BTI_STATELESS_NON_COHERENT 253
1540
1541 /* dataport atomic operations. */
1542 #define BRW_AOP_AND 1
1543 #define BRW_AOP_OR 2
1544 #define BRW_AOP_XOR 3
1545 #define BRW_AOP_MOV 4
1546 #define BRW_AOP_INC 5
1547 #define BRW_AOP_DEC 6
1548 #define BRW_AOP_ADD 7
1549 #define BRW_AOP_SUB 8
1550 #define BRW_AOP_REVSUB 9
1551 #define BRW_AOP_IMAX 10
1552 #define BRW_AOP_IMIN 11
1553 #define BRW_AOP_UMAX 12
1554 #define BRW_AOP_UMIN 13
1555 #define BRW_AOP_CMPWR 14
1556 #define BRW_AOP_PREDEC 15
1557
1558 #define BRW_MATH_FUNCTION_INV 1
1559 #define BRW_MATH_FUNCTION_LOG 2
1560 #define BRW_MATH_FUNCTION_EXP 3
1561 #define BRW_MATH_FUNCTION_SQRT 4
1562 #define BRW_MATH_FUNCTION_RSQ 5
1563 #define BRW_MATH_FUNCTION_SIN 6
1564 #define BRW_MATH_FUNCTION_COS 7
1565 #define BRW_MATH_FUNCTION_SINCOS 8 /* gen4, gen5 */
1566 #define BRW_MATH_FUNCTION_FDIV 9 /* gen6+ */
1567 #define BRW_MATH_FUNCTION_POW 10
1568 #define BRW_MATH_FUNCTION_INT_DIV_QUOTIENT_AND_REMAINDER 11
1569 #define BRW_MATH_FUNCTION_INT_DIV_QUOTIENT 12
1570 #define BRW_MATH_FUNCTION_INT_DIV_REMAINDER 13
1571 #define GEN8_MATH_FUNCTION_INVM 14
1572 #define GEN8_MATH_FUNCTION_RSQRTM 15
1573
1574 #define BRW_MATH_INTEGER_UNSIGNED 0
1575 #define BRW_MATH_INTEGER_SIGNED 1
1576
1577 #define BRW_MATH_PRECISION_FULL 0
1578 #define BRW_MATH_PRECISION_PARTIAL 1
1579
1580 #define BRW_MATH_SATURATE_NONE 0
1581 #define BRW_MATH_SATURATE_SATURATE 1
1582
1583 #define BRW_MATH_DATA_VECTOR 0
1584 #define BRW_MATH_DATA_SCALAR 1
1585
1586 #define BRW_URB_OPCODE_WRITE_HWORD 0
1587 #define BRW_URB_OPCODE_WRITE_OWORD 1
1588 #define BRW_URB_OPCODE_READ_HWORD 2
1589 #define BRW_URB_OPCODE_READ_OWORD 3
1590 #define GEN7_URB_OPCODE_ATOMIC_MOV 4
1591 #define GEN7_URB_OPCODE_ATOMIC_INC 5
1592 #define GEN8_URB_OPCODE_ATOMIC_ADD 6
1593 #define GEN8_URB_OPCODE_SIMD8_WRITE 7
1594 #define GEN8_URB_OPCODE_SIMD8_READ 8
1595
1596 #define BRW_URB_SWIZZLE_NONE 0
1597 #define BRW_URB_SWIZZLE_INTERLEAVE 1
1598 #define BRW_URB_SWIZZLE_TRANSPOSE 2
1599
1600 #define BRW_SCRATCH_SPACE_SIZE_1K 0
1601 #define BRW_SCRATCH_SPACE_SIZE_2K 1
1602 #define BRW_SCRATCH_SPACE_SIZE_4K 2
1603 #define BRW_SCRATCH_SPACE_SIZE_8K 3
1604 #define BRW_SCRATCH_SPACE_SIZE_16K 4
1605 #define BRW_SCRATCH_SPACE_SIZE_32K 5
1606 #define BRW_SCRATCH_SPACE_SIZE_64K 6
1607 #define BRW_SCRATCH_SPACE_SIZE_128K 7
1608 #define BRW_SCRATCH_SPACE_SIZE_256K 8
1609 #define BRW_SCRATCH_SPACE_SIZE_512K 9
1610 #define BRW_SCRATCH_SPACE_SIZE_1M 10
1611 #define BRW_SCRATCH_SPACE_SIZE_2M 11
1612
1613 #define BRW_MESSAGE_GATEWAY_SFID_OPEN_GATEWAY 0
1614 #define BRW_MESSAGE_GATEWAY_SFID_CLOSE_GATEWAY 1
1615 #define BRW_MESSAGE_GATEWAY_SFID_FORWARD_MSG 2
1616 #define BRW_MESSAGE_GATEWAY_SFID_GET_TIMESTAMP 3
1617 #define BRW_MESSAGE_GATEWAY_SFID_BARRIER_MSG 4
1618 #define BRW_MESSAGE_GATEWAY_SFID_UPDATE_GATEWAY_STATE 5
1619 #define BRW_MESSAGE_GATEWAY_SFID_MMIO_READ_WRITE 6
1620
1621
1622 #define CMD_URB_FENCE 0x6000
1623 #define CMD_CS_URB_STATE 0x6001
1624 #define CMD_CONST_BUFFER 0x6002
1625
1626 #define CMD_STATE_BASE_ADDRESS 0x6101
1627 #define CMD_STATE_SIP 0x6102
1628 #define CMD_PIPELINE_SELECT_965 0x6104
1629 #define CMD_PIPELINE_SELECT_GM45 0x6904
1630
1631 #define _3DSTATE_PIPELINED_POINTERS 0x7800
1632 #define _3DSTATE_BINDING_TABLE_POINTERS 0x7801
1633 # define GEN6_BINDING_TABLE_MODIFY_VS (1 << 8)
1634 # define GEN6_BINDING_TABLE_MODIFY_GS (1 << 9)
1635 # define GEN6_BINDING_TABLE_MODIFY_PS (1 << 12)
1636
1637 #define _3DSTATE_BINDING_TABLE_POINTERS_VS 0x7826 /* GEN7+ */
1638 #define _3DSTATE_BINDING_TABLE_POINTERS_HS 0x7827 /* GEN7+ */
1639 #define _3DSTATE_BINDING_TABLE_POINTERS_DS 0x7828 /* GEN7+ */
1640 #define _3DSTATE_BINDING_TABLE_POINTERS_GS 0x7829 /* GEN7+ */
1641 #define _3DSTATE_BINDING_TABLE_POINTERS_PS 0x782A /* GEN7+ */
1642
1643 #define _3DSTATE_SAMPLER_STATE_POINTERS 0x7802 /* GEN6+ */
1644 # define PS_SAMPLER_STATE_CHANGE (1 << 12)
1645 # define GS_SAMPLER_STATE_CHANGE (1 << 9)
1646 # define VS_SAMPLER_STATE_CHANGE (1 << 8)
1647 /* DW1: VS */
1648 /* DW2: GS */
1649 /* DW3: PS */
1650
1651 #define _3DSTATE_SAMPLER_STATE_POINTERS_VS 0x782B /* GEN7+ */
1652 #define _3DSTATE_SAMPLER_STATE_POINTERS_HS 0x782C /* GEN7+ */
1653 #define _3DSTATE_SAMPLER_STATE_POINTERS_DS 0x782D /* GEN7+ */
1654 #define _3DSTATE_SAMPLER_STATE_POINTERS_GS 0x782E /* GEN7+ */
1655 #define _3DSTATE_SAMPLER_STATE_POINTERS_PS 0x782F /* GEN7+ */
1656
1657 #define _3DSTATE_VERTEX_BUFFERS 0x7808
1658 # define BRW_VB0_INDEX_SHIFT 27
1659 # define GEN6_VB0_INDEX_SHIFT 26
1660 # define BRW_VB0_ACCESS_VERTEXDATA (0 << 26)
1661 # define BRW_VB0_ACCESS_INSTANCEDATA (1 << 26)
1662 # define GEN6_VB0_ACCESS_VERTEXDATA (0 << 20)
1663 # define GEN6_VB0_ACCESS_INSTANCEDATA (1 << 20)
1664 # define GEN7_VB0_ADDRESS_MODIFYENABLE (1 << 14)
1665 # define BRW_VB0_PITCH_SHIFT 0
1666
1667 #define _3DSTATE_VERTEX_ELEMENTS 0x7809
1668 # define BRW_VE0_INDEX_SHIFT 27
1669 # define GEN6_VE0_INDEX_SHIFT 26
1670 # define BRW_VE0_FORMAT_SHIFT 16
1671 # define BRW_VE0_VALID (1 << 26)
1672 # define GEN6_VE0_VALID (1 << 25)
1673 # define GEN6_VE0_EDGE_FLAG_ENABLE (1 << 15)
1674 # define BRW_VE0_SRC_OFFSET_SHIFT 0
1675 # define BRW_VE1_COMPONENT_NOSTORE 0
1676 # define BRW_VE1_COMPONENT_STORE_SRC 1
1677 # define BRW_VE1_COMPONENT_STORE_0 2
1678 # define BRW_VE1_COMPONENT_STORE_1_FLT 3
1679 # define BRW_VE1_COMPONENT_STORE_1_INT 4
1680 # define BRW_VE1_COMPONENT_STORE_VID 5
1681 # define BRW_VE1_COMPONENT_STORE_IID 6
1682 # define BRW_VE1_COMPONENT_STORE_PID 7
1683 # define BRW_VE1_COMPONENT_0_SHIFT 28
1684 # define BRW_VE1_COMPONENT_1_SHIFT 24
1685 # define BRW_VE1_COMPONENT_2_SHIFT 20
1686 # define BRW_VE1_COMPONENT_3_SHIFT 16
1687 # define BRW_VE1_DST_OFFSET_SHIFT 0
1688
1689 #define CMD_INDEX_BUFFER 0x780a
1690 #define GEN4_3DSTATE_VF_STATISTICS 0x780b
1691 #define GM45_3DSTATE_VF_STATISTICS 0x680b
1692 #define _3DSTATE_CC_STATE_POINTERS 0x780e /* GEN6+ */
1693 #define _3DSTATE_BLEND_STATE_POINTERS 0x7824 /* GEN7+ */
1694 #define _3DSTATE_DEPTH_STENCIL_STATE_POINTERS 0x7825 /* GEN7+ */
1695
1696 #define _3DSTATE_URB 0x7805 /* GEN6 */
1697 # define GEN6_URB_VS_SIZE_SHIFT 16
1698 # define GEN6_URB_VS_ENTRIES_SHIFT 0
1699 # define GEN6_URB_GS_ENTRIES_SHIFT 8
1700 # define GEN6_URB_GS_SIZE_SHIFT 0
1701
1702 #define _3DSTATE_VF 0x780c /* GEN7.5+ */
1703 #define HSW_CUT_INDEX_ENABLE (1 << 8)
1704
1705 #define _3DSTATE_VF_INSTANCING 0x7849 /* GEN8+ */
1706 # define GEN8_VF_INSTANCING_ENABLE (1 << 8)
1707
1708 #define _3DSTATE_VF_SGVS 0x784a /* GEN8+ */
1709 # define GEN8_SGVS_ENABLE_INSTANCE_ID (1 << 31)
1710 # define GEN8_SGVS_INSTANCE_ID_COMPONENT_SHIFT 29
1711 # define GEN8_SGVS_INSTANCE_ID_ELEMENT_OFFSET_SHIFT 16
1712 # define GEN8_SGVS_ENABLE_VERTEX_ID (1 << 15)
1713 # define GEN8_SGVS_VERTEX_ID_COMPONENT_SHIFT 13
1714 # define GEN8_SGVS_VERTEX_ID_ELEMENT_OFFSET_SHIFT 0
1715
1716 #define _3DSTATE_VF_TOPOLOGY 0x784b /* GEN8+ */
1717
1718 #define _3DSTATE_WM_CHROMAKEY 0x784c /* GEN8+ */
1719
1720 #define _3DSTATE_URB_VS 0x7830 /* GEN7+ */
1721 #define _3DSTATE_URB_HS 0x7831 /* GEN7+ */
1722 #define _3DSTATE_URB_DS 0x7832 /* GEN7+ */
1723 #define _3DSTATE_URB_GS 0x7833 /* GEN7+ */
1724 # define GEN7_URB_ENTRY_SIZE_SHIFT 16
1725 # define GEN7_URB_STARTING_ADDRESS_SHIFT 25
1726
1727 /* Gen7 "GS URB Entry Allocation Size" is a U9-1 field, so the maximum gs_size
1728 * is 2^9, or 512. It's counted in multiples of 64 bytes.
1729 *
1730 * Identical for VS, DS, and HS.
1731 */
1732 #define GEN7_MAX_GS_URB_ENTRY_SIZE_BYTES (512*64)
1733 #define GEN7_MAX_DS_URB_ENTRY_SIZE_BYTES (512*64)
1734 #define GEN7_MAX_HS_URB_ENTRY_SIZE_BYTES (512*64)
1735 #define GEN7_MAX_VS_URB_ENTRY_SIZE_BYTES (512*64)
1736
1737 /* Gen6 "GS URB Entry Allocation Size" is defined as a number of 1024-bit
1738 * (128 bytes) URB rows and the maximum allowed value is 5 rows.
1739 */
1740 #define GEN6_MAX_GS_URB_ENTRY_SIZE_BYTES (5*128)
1741
1742 #define _3DSTATE_PUSH_CONSTANT_ALLOC_VS 0x7912 /* GEN7+ */
1743 #define _3DSTATE_PUSH_CONSTANT_ALLOC_HS 0x7913 /* GEN7+ */
1744 #define _3DSTATE_PUSH_CONSTANT_ALLOC_DS 0x7914 /* GEN7+ */
1745 #define _3DSTATE_PUSH_CONSTANT_ALLOC_GS 0x7915 /* GEN7+ */
1746 #define _3DSTATE_PUSH_CONSTANT_ALLOC_PS 0x7916 /* GEN7+ */
1747 # define GEN7_PUSH_CONSTANT_BUFFER_OFFSET_SHIFT 16
1748
1749 #define _3DSTATE_VIEWPORT_STATE_POINTERS 0x780d /* GEN6+ */
1750 # define GEN6_CC_VIEWPORT_MODIFY (1 << 12)
1751 # define GEN6_SF_VIEWPORT_MODIFY (1 << 11)
1752 # define GEN6_CLIP_VIEWPORT_MODIFY (1 << 10)
1753 # define GEN6_NUM_VIEWPORTS 16
1754
1755 #define _3DSTATE_VIEWPORT_STATE_POINTERS_CC 0x7823 /* GEN7+ */
1756 #define _3DSTATE_VIEWPORT_STATE_POINTERS_SF_CL 0x7821 /* GEN7+ */
1757
1758 #define _3DSTATE_SCISSOR_STATE_POINTERS 0x780f /* GEN6+ */
1759
1760 #define _3DSTATE_VS 0x7810 /* GEN6+ */
1761 /* DW2 */
1762 # define GEN6_VS_SPF_MODE (1 << 31)
1763 # define GEN6_VS_VECTOR_MASK_ENABLE (1 << 30)
1764 # define GEN6_VS_SAMPLER_COUNT_SHIFT 27
1765 # define GEN6_VS_BINDING_TABLE_ENTRY_COUNT_SHIFT 18
1766 # define GEN6_VS_FLOATING_POINT_MODE_IEEE_754 (0 << 16)
1767 # define GEN6_VS_FLOATING_POINT_MODE_ALT (1 << 16)
1768 # define HSW_VS_UAV_ACCESS_ENABLE (1 << 12)
1769 /* DW4 */
1770 # define GEN6_VS_DISPATCH_START_GRF_SHIFT 20
1771 # define GEN6_VS_URB_READ_LENGTH_SHIFT 11
1772 # define GEN6_VS_URB_ENTRY_READ_OFFSET_SHIFT 4
1773 /* DW5 */
1774 # define GEN6_VS_MAX_THREADS_SHIFT 25
1775 # define HSW_VS_MAX_THREADS_SHIFT 23
1776 # define GEN6_VS_STATISTICS_ENABLE (1 << 10)
1777 # define GEN6_VS_CACHE_DISABLE (1 << 1)
1778 # define GEN6_VS_ENABLE (1 << 0)
1779 /* Gen8+ DW7 */
1780 # define GEN8_VS_SIMD8_ENABLE (1 << 2)
1781 /* Gen8+ DW8 */
1782 # define GEN8_VS_URB_ENTRY_OUTPUT_OFFSET_SHIFT 21
1783 # define GEN8_VS_URB_OUTPUT_LENGTH_SHIFT 16
1784 # define GEN8_VS_USER_CLIP_DISTANCE_SHIFT 8
1785
1786 #define _3DSTATE_GS 0x7811 /* GEN6+ */
1787 /* DW2 */
1788 # define GEN6_GS_SPF_MODE (1 << 31)
1789 # define GEN6_GS_VECTOR_MASK_ENABLE (1 << 30)
1790 # define GEN6_GS_SAMPLER_COUNT_SHIFT 27
1791 # define GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT 18
1792 # define GEN6_GS_FLOATING_POINT_MODE_IEEE_754 (0 << 16)
1793 # define GEN6_GS_FLOATING_POINT_MODE_ALT (1 << 16)
1794 # define HSW_GS_UAV_ACCESS_ENABLE (1 << 12)
1795 /* DW4 */
1796 # define GEN7_GS_OUTPUT_VERTEX_SIZE_SHIFT 23
1797 # define GEN7_GS_OUTPUT_TOPOLOGY_SHIFT 17
1798 # define GEN6_GS_URB_READ_LENGTH_SHIFT 11
1799 # define GEN7_GS_INCLUDE_VERTEX_HANDLES (1 << 10)
1800 # define GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT 4
1801 # define GEN6_GS_DISPATCH_START_GRF_SHIFT 0
1802 /* DW5 */
1803 # define GEN6_GS_MAX_THREADS_SHIFT 25
1804 # define HSW_GS_MAX_THREADS_SHIFT 24
1805 # define IVB_GS_CONTROL_DATA_FORMAT_SHIFT 24
1806 # define GEN7_GS_CONTROL_DATA_FORMAT_GSCTL_CUT 0
1807 # define GEN7_GS_CONTROL_DATA_FORMAT_GSCTL_SID 1
1808 # define GEN7_GS_CONTROL_DATA_HEADER_SIZE_SHIFT 20
1809 # define GEN7_GS_INSTANCE_CONTROL_SHIFT 15
1810 # define GEN7_GS_DISPATCH_MODE_SHIFT 11
1811 # define GEN7_GS_DISPATCH_MODE_MASK INTEL_MASK(12, 11)
1812 # define GEN6_GS_STATISTICS_ENABLE (1 << 10)
1813 # define GEN6_GS_SO_STATISTICS_ENABLE (1 << 9)
1814 # define GEN6_GS_RENDERING_ENABLE (1 << 8)
1815 # define GEN7_GS_INCLUDE_PRIMITIVE_ID (1 << 4)
1816 # define GEN7_GS_REORDER_TRAILING (1 << 2)
1817 # define GEN7_GS_ENABLE (1 << 0)
1818 /* DW6 */
1819 # define HSW_GS_CONTROL_DATA_FORMAT_SHIFT 31
1820 # define GEN6_GS_REORDER (1 << 30)
1821 # define GEN6_GS_DISCARD_ADJACENCY (1 << 29)
1822 # define GEN6_GS_SVBI_PAYLOAD_ENABLE (1 << 28)
1823 # define GEN6_GS_SVBI_POSTINCREMENT_ENABLE (1 << 27)
1824 # define GEN6_GS_SVBI_POSTINCREMENT_VALUE_SHIFT 16
1825 # define GEN6_GS_SVBI_POSTINCREMENT_VALUE_MASK INTEL_MASK(25, 16)
1826 # define GEN6_GS_ENABLE (1 << 15)
1827
1828 /* Gen8+ DW8 */
1829 # define GEN8_GS_STATIC_OUTPUT (1 << 30)
1830 # define GEN8_GS_STATIC_VERTEX_COUNT_SHIFT 16
1831 # define GEN8_GS_STATIC_VERTEX_COUNT_MASK INTEL_MASK(26, 16)
1832
1833 /* Gen8+ DW9 */
1834 # define GEN8_GS_URB_ENTRY_OUTPUT_OFFSET_SHIFT 21
1835 # define GEN8_GS_URB_OUTPUT_LENGTH_SHIFT 16
1836 # define GEN8_GS_USER_CLIP_DISTANCE_SHIFT 8
1837
1838 # define BRW_GS_EDGE_INDICATOR_0 (1 << 8)
1839 # define BRW_GS_EDGE_INDICATOR_1 (1 << 9)
1840
1841 /* GS Thread Payload
1842 */
1843 /* R0 */
1844 # define GEN7_GS_PAYLOAD_INSTANCE_ID_SHIFT 27
1845
1846 /* 3DSTATE_GS "Output Vertex Size" has an effective maximum of 62. It's
1847 * counted in multiples of 16 bytes.
1848 */
1849 #define GEN7_MAX_GS_OUTPUT_VERTEX_SIZE_BYTES (62*16)
1850
1851 #define _3DSTATE_HS 0x781B /* GEN7+ */
1852 /* DW1 */
1853 # define GEN7_HS_SAMPLER_COUNT_MASK INTEL_MASK(29, 27)
1854 # define GEN7_HS_SAMPLER_COUNT_SHIFT 27
1855 # define GEN7_HS_BINDING_TABLE_ENTRY_COUNT_MASK INTEL_MASK(25, 18)
1856 # define GEN7_HS_BINDING_TABLE_ENTRY_COUNT_SHIFT 18
1857 # define GEN7_HS_FLOATING_POINT_MODE_IEEE_754 (0 << 16)
1858 # define GEN7_HS_FLOATING_POINT_MODE_ALT (1 << 16)
1859 # define GEN7_HS_MAX_THREADS_SHIFT 0
1860 /* DW2 */
1861 # define GEN7_HS_ENABLE (1 << 31)
1862 # define GEN7_HS_STATISTICS_ENABLE (1 << 29)
1863 # define GEN8_HS_MAX_THREADS_SHIFT 8
1864 # define GEN7_HS_INSTANCE_COUNT_MASK INTEL_MASK(3, 0)
1865 # define GEN7_HS_INSTANCE_COUNT_SHIFT 0
1866 /* DW5 */
1867 # define GEN7_HS_SINGLE_PROGRAM_FLOW (1 << 27)
1868 # define GEN7_HS_VECTOR_MASK_ENABLE (1 << 26)
1869 # define HSW_HS_ACCESSES_UAV (1 << 25)
1870 # define GEN7_HS_INCLUDE_VERTEX_HANDLES (1 << 24)
1871 # define GEN7_HS_DISPATCH_START_GRF_MASK INTEL_MASK(23, 19)
1872 # define GEN7_HS_DISPATCH_START_GRF_SHIFT 19
1873 # define GEN7_HS_URB_READ_LENGTH_MASK INTEL_MASK(16, 11)
1874 # define GEN7_HS_URB_READ_LENGTH_SHIFT 11
1875 # define GEN7_HS_URB_ENTRY_READ_OFFSET_MASK INTEL_MASK(9, 4)
1876 # define GEN7_HS_URB_ENTRY_READ_OFFSET_SHIFT 4
1877
1878 #define _3DSTATE_TE 0x781C /* GEN7+ */
1879 /* DW1 */
1880 # define GEN7_TE_PARTITIONING_SHIFT 12
1881 # define GEN7_TE_OUTPUT_TOPOLOGY_SHIFT 8
1882 # define GEN7_TE_DOMAIN_SHIFT 4
1883 //# define GEN7_TE_MODE_SW (1 << 1)
1884 # define GEN7_TE_ENABLE (1 << 0)
1885
1886 #define _3DSTATE_DS 0x781D /* GEN7+ */
1887 /* DW2 */
1888 # define GEN7_DS_SINGLE_DOMAIN_POINT_DISPATCH (1 << 31)
1889 # define GEN7_DS_VECTOR_MASK_ENABLE (1 << 30)
1890 # define GEN7_DS_SAMPLER_COUNT_MASK INTEL_MASK(29, 27)
1891 # define GEN7_DS_SAMPLER_COUNT_SHIFT 27
1892 # define GEN7_DS_BINDING_TABLE_ENTRY_COUNT_MASK INTEL_MASK(25, 18)
1893 # define GEN7_DS_BINDING_TABLE_ENTRY_COUNT_SHIFT 18
1894 # define GEN7_DS_FLOATING_POINT_MODE_IEEE_754 (0 << 16)
1895 # define GEN7_DS_FLOATING_POINT_MODE_ALT (1 << 16)
1896 # define HSW_DS_ACCESSES_UAV (1 << 14)
1897 /* DW4 */
1898 # define GEN7_DS_DISPATCH_START_GRF_MASK INTEL_MASK(24, 20)
1899 # define GEN7_DS_DISPATCH_START_GRF_SHIFT 20
1900 # define GEN7_DS_URB_READ_LENGTH_MASK INTEL_MASK(17, 11)
1901 # define GEN7_DS_URB_READ_LENGTH_SHIFT 11
1902 # define GEN7_DS_URB_ENTRY_READ_OFFSET_MASK INTEL_MASK(9, 4)
1903 # define GEN7_DS_URB_ENTRY_READ_OFFSET_SHIFT 4
1904 /* DW5 */
1905 # define GEN7_DS_MAX_THREADS_SHIFT 25
1906 # define HSW_DS_MAX_THREADS_SHIFT 21
1907 # define GEN7_DS_STATISTICS_ENABLE (1 << 10)
1908 # define GEN7_DS_SIMD8_DISPATCH_ENABLE (1 << 3)
1909 # define GEN7_DS_COMPUTE_W_COORDINATE_ENABLE (1 << 2)
1910 # define GEN7_DS_CACHE_DISABLE (1 << 1)
1911 # define GEN7_DS_ENABLE (1 << 0)
1912 /* Gen8+ DW8 */
1913 # define GEN8_DS_URB_ENTRY_OUTPUT_OFFSET_MASK INTEL_MASK(26, 21)
1914 # define GEN8_DS_URB_ENTRY_OUTPUT_OFFSET_SHIFT 21
1915 # define GEN8_DS_URB_OUTPUT_LENGTH_MASK INTEL_MASK(20, 16)
1916 # define GEN8_DS_URB_OUTPUT_LENGTH_SHIFT 16
1917 # define GEN8_DS_USER_CLIP_DISTANCE_MASK INTEL_MASK(15, 8)
1918 # define GEN8_DS_USER_CLIP_DISTANCE_SHIFT 8
1919 # define GEN8_DS_USER_CULL_DISTANCE_MASK INTEL_MASK(7, 0)
1920 # define GEN8_DS_USER_CULL_DISTANCE_SHIFT 0
1921
1922
1923 #define _3DSTATE_CLIP 0x7812 /* GEN6+ */
1924 /* DW1 */
1925 # define GEN7_CLIP_WINDING_CW (0 << 20)
1926 # define GEN7_CLIP_WINDING_CCW (1 << 20)
1927 # define GEN7_CLIP_VERTEX_SUBPIXEL_PRECISION_8 (0 << 19)
1928 # define GEN7_CLIP_VERTEX_SUBPIXEL_PRECISION_4 (1 << 19)
1929 # define GEN7_CLIP_EARLY_CULL (1 << 18)
1930 # define GEN8_CLIP_FORCE_USER_CLIP_DISTANCE_BITMASK (1 << 17)
1931 # define GEN7_CLIP_CULLMODE_BOTH (0 << 16)
1932 # define GEN7_CLIP_CULLMODE_NONE (1 << 16)
1933 # define GEN7_CLIP_CULLMODE_FRONT (2 << 16)
1934 # define GEN7_CLIP_CULLMODE_BACK (3 << 16)
1935 # define GEN6_CLIP_STATISTICS_ENABLE (1 << 10)
1936 /**
1937 * Just does cheap culling based on the clip distance. Bits must be
1938 * disjoint with USER_CLIP_CLIP_DISTANCE bits.
1939 */
1940 # define GEN6_USER_CLIP_CULL_DISTANCES_SHIFT 0
1941 /* DW2 */
1942 # define GEN6_CLIP_ENABLE (1 << 31)
1943 # define GEN6_CLIP_API_OGL (0 << 30)
1944 # define GEN6_CLIP_API_D3D (1 << 30)
1945 # define GEN6_CLIP_XY_TEST (1 << 28)
1946 # define GEN6_CLIP_Z_TEST (1 << 27)
1947 # define GEN6_CLIP_GB_TEST (1 << 26)
1948 /** 8-bit field of which user clip distances to clip aganist. */
1949 # define GEN6_USER_CLIP_CLIP_DISTANCES_SHIFT 16
1950 # define GEN6_CLIP_MODE_NORMAL (0 << 13)
1951 # define GEN6_CLIP_MODE_REJECT_ALL (3 << 13)
1952 # define GEN6_CLIP_MODE_ACCEPT_ALL (4 << 13)
1953 # define GEN6_CLIP_PERSPECTIVE_DIVIDE_DISABLE (1 << 9)
1954 # define GEN6_CLIP_NON_PERSPECTIVE_BARYCENTRIC_ENABLE (1 << 8)
1955 # define GEN6_CLIP_TRI_PROVOKE_SHIFT 4
1956 # define GEN6_CLIP_LINE_PROVOKE_SHIFT 2
1957 # define GEN6_CLIP_TRIFAN_PROVOKE_SHIFT 0
1958 /* DW3 */
1959 # define GEN6_CLIP_MIN_POINT_WIDTH_SHIFT 17
1960 # define GEN6_CLIP_MAX_POINT_WIDTH_SHIFT 6
1961 # define GEN6_CLIP_FORCE_ZERO_RTAINDEX (1 << 5)
1962 # define GEN6_CLIP_MAX_VP_INDEX_MASK INTEL_MASK(3, 0)
1963
1964 #define _3DSTATE_SF 0x7813 /* GEN6+ */
1965 /* DW1 (for gen6) */
1966 # define GEN6_SF_NUM_OUTPUTS_SHIFT 22
1967 # define GEN6_SF_SWIZZLE_ENABLE (1 << 21)
1968 # define GEN6_SF_POINT_SPRITE_UPPERLEFT (0 << 20)
1969 # define GEN6_SF_POINT_SPRITE_LOWERLEFT (1 << 20)
1970 # define GEN9_SF_LINE_WIDTH_SHIFT 12 /* U11.7 */
1971 # define GEN6_SF_URB_ENTRY_READ_LENGTH_SHIFT 11
1972 # define GEN6_SF_URB_ENTRY_READ_OFFSET_SHIFT 4
1973 /* DW2 */
1974 # define GEN6_SF_LEGACY_GLOBAL_DEPTH_BIAS (1 << 11)
1975 # define GEN6_SF_STATISTICS_ENABLE (1 << 10)
1976 # define GEN6_SF_GLOBAL_DEPTH_OFFSET_SOLID (1 << 9)
1977 # define GEN6_SF_GLOBAL_DEPTH_OFFSET_WIREFRAME (1 << 8)
1978 # define GEN6_SF_GLOBAL_DEPTH_OFFSET_POINT (1 << 7)
1979 # define GEN6_SF_FRONT_SOLID (0 << 5)
1980 # define GEN6_SF_FRONT_WIREFRAME (1 << 5)
1981 # define GEN6_SF_FRONT_POINT (2 << 5)
1982 # define GEN6_SF_BACK_SOLID (0 << 3)
1983 # define GEN6_SF_BACK_WIREFRAME (1 << 3)
1984 # define GEN6_SF_BACK_POINT (2 << 3)
1985 # define GEN6_SF_VIEWPORT_TRANSFORM_ENABLE (1 << 1)
1986 # define GEN6_SF_WINDING_CCW (1 << 0)
1987 /* DW3 */
1988 # define GEN6_SF_LINE_AA_ENABLE (1 << 31)
1989 # define GEN6_SF_CULL_BOTH (0 << 29)
1990 # define GEN6_SF_CULL_NONE (1 << 29)
1991 # define GEN6_SF_CULL_FRONT (2 << 29)
1992 # define GEN6_SF_CULL_BACK (3 << 29)
1993 # define GEN6_SF_LINE_WIDTH_SHIFT 18 /* U3.7 */
1994 # define GEN6_SF_LINE_END_CAP_WIDTH_0_5 (0 << 16)
1995 # define GEN6_SF_LINE_END_CAP_WIDTH_1_0 (1 << 16)
1996 # define GEN6_SF_LINE_END_CAP_WIDTH_2_0 (2 << 16)
1997 # define GEN6_SF_LINE_END_CAP_WIDTH_4_0 (3 << 16)
1998 # define GEN6_SF_SCISSOR_ENABLE (1 << 11)
1999 # define GEN6_SF_MSRAST_OFF_PIXEL (0 << 8)
2000 # define GEN6_SF_MSRAST_OFF_PATTERN (1 << 8)
2001 # define GEN6_SF_MSRAST_ON_PIXEL (2 << 8)
2002 # define GEN6_SF_MSRAST_ON_PATTERN (3 << 8)
2003 /* DW4 */
2004 # define GEN6_SF_TRI_PROVOKE_SHIFT 29
2005 # define GEN6_SF_LINE_PROVOKE_SHIFT 27
2006 # define GEN6_SF_TRIFAN_PROVOKE_SHIFT 25
2007 # define GEN6_SF_LINE_AA_MODE_MANHATTAN (0 << 14)
2008 # define GEN6_SF_LINE_AA_MODE_TRUE (1 << 14)
2009 # define GEN6_SF_VERTEX_SUBPIXEL_8BITS (0 << 12)
2010 # define GEN6_SF_VERTEX_SUBPIXEL_4BITS (1 << 12)
2011 # define GEN6_SF_USE_STATE_POINT_WIDTH (1 << 11)
2012 # define GEN6_SF_POINT_WIDTH_SHIFT 0 /* U8.3 */
2013 /* DW5: depth offset constant */
2014 /* DW6: depth offset scale */
2015 /* DW7: depth offset clamp */
2016 /* DW8 */
2017 # define ATTRIBUTE_1_OVERRIDE_W (1 << 31)
2018 # define ATTRIBUTE_1_OVERRIDE_Z (1 << 30)
2019 # define ATTRIBUTE_1_OVERRIDE_Y (1 << 29)
2020 # define ATTRIBUTE_1_OVERRIDE_X (1 << 28)
2021 # define ATTRIBUTE_1_CONST_SOURCE_SHIFT 25
2022 # define ATTRIBUTE_1_SWIZZLE_SHIFT 22
2023 # define ATTRIBUTE_1_SOURCE_SHIFT 16
2024 # define ATTRIBUTE_0_OVERRIDE_W (1 << 15)
2025 # define ATTRIBUTE_0_OVERRIDE_Z (1 << 14)
2026 # define ATTRIBUTE_0_OVERRIDE_Y (1 << 13)
2027 # define ATTRIBUTE_0_OVERRIDE_X (1 << 12)
2028 # define ATTRIBUTE_0_CONST_SOURCE_SHIFT 9
2029 # define ATTRIBUTE_CONST_0000 0
2030 # define ATTRIBUTE_CONST_0001_FLOAT 1
2031 # define ATTRIBUTE_CONST_1111_FLOAT 2
2032 # define ATTRIBUTE_CONST_PRIM_ID 3
2033 # define ATTRIBUTE_0_SWIZZLE_SHIFT 6
2034 # define ATTRIBUTE_0_SOURCE_SHIFT 0
2035
2036 # define ATTRIBUTE_SWIZZLE_INPUTATTR 0
2037 # define ATTRIBUTE_SWIZZLE_INPUTATTR_FACING 1
2038 # define ATTRIBUTE_SWIZZLE_INPUTATTR_W 2
2039 # define ATTRIBUTE_SWIZZLE_INPUTATTR_FACING_W 3
2040 # define ATTRIBUTE_SWIZZLE_SHIFT 6
2041
2042 /* DW16: Point sprite texture coordinate enables */
2043 /* DW17: Constant interpolation enables */
2044 /* DW18: attr 0-7 wrap shortest enables */
2045 /* DW19: attr 8-16 wrap shortest enables */
2046
2047 /* On GEN7, many fields of 3DSTATE_SF were split out into a new command:
2048 * 3DSTATE_SBE. The remaining fields live in different DWords, but retain
2049 * the same bit-offset. The only new field:
2050 */
2051 /* GEN7/DW1: */
2052 # define GEN7_SF_DEPTH_BUFFER_SURFACE_FORMAT_SHIFT 12
2053 /* GEN7/DW2: */
2054 # define HSW_SF_LINE_STIPPLE_ENABLE (1 << 14)
2055
2056 # define GEN8_SF_SMOOTH_POINT_ENABLE (1 << 13)
2057
2058 #define _3DSTATE_SBE 0x781F /* GEN7+ */
2059 /* DW1 */
2060 # define GEN8_SBE_FORCE_URB_ENTRY_READ_LENGTH (1 << 29)
2061 # define GEN8_SBE_FORCE_URB_ENTRY_READ_OFFSET (1 << 28)
2062 # define GEN7_SBE_SWIZZLE_CONTROL_MODE (1 << 28)
2063 # define GEN7_SBE_NUM_OUTPUTS_SHIFT 22
2064 # define GEN7_SBE_SWIZZLE_ENABLE (1 << 21)
2065 # define GEN7_SBE_POINT_SPRITE_LOWERLEFT (1 << 20)
2066 # define GEN7_SBE_URB_ENTRY_READ_LENGTH_SHIFT 11
2067 # define GEN7_SBE_URB_ENTRY_READ_OFFSET_SHIFT 4
2068 # define GEN8_SBE_URB_ENTRY_READ_OFFSET_SHIFT 5
2069 /* DW2-9: Attribute setup (same as DW8-15 of gen6 _3DSTATE_SF) */
2070 /* DW10: Point sprite texture coordinate enables */
2071 /* DW11: Constant interpolation enables */
2072 /* DW12: attr 0-7 wrap shortest enables */
2073 /* DW13: attr 8-16 wrap shortest enables */
2074
2075 /* DW4-5: Attribute active components (gen9) */
2076 #define GEN9_SBE_ACTIVE_COMPONENT_NONE 0
2077 #define GEN9_SBE_ACTIVE_COMPONENT_XY 1
2078 #define GEN9_SBE_ACTIVE_COMPONENT_XYZ 2
2079 #define GEN9_SBE_ACTIVE_COMPONENT_XYZW 3
2080
2081 #define _3DSTATE_SBE_SWIZ 0x7851 /* GEN8+ */
2082
2083 #define _3DSTATE_RASTER 0x7850 /* GEN8+ */
2084 /* DW1 */
2085 # define GEN9_RASTER_VIEWPORT_Z_FAR_CLIP_TEST_ENABLE (1 << 26)
2086 # define GEN9_RASTER_CONSERVATIVE_RASTERIZATION_ENABLE (1 << 24)
2087 # define GEN8_RASTER_FRONT_WINDING_CCW (1 << 21)
2088 # define GEN8_RASTER_CULL_BOTH (0 << 16)
2089 # define GEN8_RASTER_CULL_NONE (1 << 16)
2090 # define GEN8_RASTER_CULL_FRONT (2 << 16)
2091 # define GEN8_RASTER_CULL_BACK (3 << 16)
2092 # define GEN8_RASTER_SMOOTH_POINT_ENABLE (1 << 13)
2093 # define GEN8_RASTER_API_MULTISAMPLE_ENABLE (1 << 12)
2094 # define GEN8_RASTER_LINE_AA_ENABLE (1 << 2)
2095 # define GEN8_RASTER_SCISSOR_ENABLE (1 << 1)
2096 # define GEN8_RASTER_VIEWPORT_Z_CLIP_TEST_ENABLE (1 << 0)
2097 # define GEN9_RASTER_VIEWPORT_Z_NEAR_CLIP_TEST_ENABLE (1 << 0)
2098
2099 /* Gen8 BLEND_STATE */
2100 /* DW0 */
2101 #define GEN8_BLEND_ALPHA_TO_COVERAGE_ENABLE (1 << 31)
2102 #define GEN8_BLEND_INDEPENDENT_ALPHA_BLEND_ENABLE (1 << 30)
2103 #define GEN8_BLEND_ALPHA_TO_ONE_ENABLE (1 << 29)
2104 #define GEN8_BLEND_ALPHA_TO_COVERAGE_DITHER_ENABLE (1 << 28)
2105 #define GEN8_BLEND_ALPHA_TEST_ENABLE (1 << 27)
2106 #define GEN8_BLEND_ALPHA_TEST_FUNCTION_MASK INTEL_MASK(26, 24)
2107 #define GEN8_BLEND_ALPHA_TEST_FUNCTION_SHIFT 24
2108 #define GEN8_BLEND_COLOR_DITHER_ENABLE (1 << 23)
2109 #define GEN8_BLEND_X_DITHER_OFFSET_MASK INTEL_MASK(22, 21)
2110 #define GEN8_BLEND_X_DITHER_OFFSET_SHIFT 21
2111 #define GEN8_BLEND_Y_DITHER_OFFSET_MASK INTEL_MASK(20, 19)
2112 #define GEN8_BLEND_Y_DITHER_OFFSET_SHIFT 19
2113 /* DW1 + 2n */
2114 #define GEN8_BLEND_COLOR_BUFFER_BLEND_ENABLE (1 << 31)
2115 #define GEN8_BLEND_SRC_BLEND_FACTOR_MASK INTEL_MASK(30, 26)
2116 #define GEN8_BLEND_SRC_BLEND_FACTOR_SHIFT 26
2117 #define GEN8_BLEND_DST_BLEND_FACTOR_MASK INTEL_MASK(25, 21)
2118 #define GEN8_BLEND_DST_BLEND_FACTOR_SHIFT 21
2119 #define GEN8_BLEND_COLOR_BLEND_FUNCTION_MASK INTEL_MASK(20, 18)
2120 #define GEN8_BLEND_COLOR_BLEND_FUNCTION_SHIFT 18
2121 #define GEN8_BLEND_SRC_ALPHA_BLEND_FACTOR_MASK INTEL_MASK(17, 13)
2122 #define GEN8_BLEND_SRC_ALPHA_BLEND_FACTOR_SHIFT 13
2123 #define GEN8_BLEND_DST_ALPHA_BLEND_FACTOR_MASK INTEL_MASK(12, 8)
2124 #define GEN8_BLEND_DST_ALPHA_BLEND_FACTOR_SHIFT 8
2125 #define GEN8_BLEND_ALPHA_BLEND_FUNCTION_MASK INTEL_MASK(7, 5)
2126 #define GEN8_BLEND_ALPHA_BLEND_FUNCTION_SHIFT 5
2127 #define GEN8_BLEND_WRITE_DISABLE_ALPHA (1 << 3)
2128 #define GEN8_BLEND_WRITE_DISABLE_RED (1 << 2)
2129 #define GEN8_BLEND_WRITE_DISABLE_GREEN (1 << 1)
2130 #define GEN8_BLEND_WRITE_DISABLE_BLUE (1 << 0)
2131 /* DW1 + 2n + 1 */
2132 #define GEN8_BLEND_LOGIC_OP_ENABLE (1 << 31)
2133 #define GEN8_BLEND_LOGIC_OP_FUNCTION_MASK INTEL_MASK(30, 27)
2134 #define GEN8_BLEND_LOGIC_OP_FUNCTION_SHIFT 27
2135 #define GEN8_BLEND_PRE_BLEND_SRC_ONLY_CLAMP_ENABLE (1 << 4)
2136 #define GEN8_BLEND_COLOR_CLAMP_RANGE_RTFORMAT (2 << 2)
2137 #define GEN8_BLEND_PRE_BLEND_COLOR_CLAMP_ENABLE (1 << 1)
2138 #define GEN8_BLEND_POST_BLEND_COLOR_CLAMP_ENABLE (1 << 0)
2139
2140 #define _3DSTATE_WM_HZ_OP 0x7852 /* GEN8+ */
2141 /* DW1 */
2142 # define GEN8_WM_HZ_STENCIL_CLEAR (1 << 31)
2143 # define GEN8_WM_HZ_DEPTH_CLEAR (1 << 30)
2144 # define GEN8_WM_HZ_DEPTH_RESOLVE (1 << 28)
2145 # define GEN8_WM_HZ_HIZ_RESOLVE (1 << 27)
2146 # define GEN8_WM_HZ_PIXEL_OFFSET_ENABLE (1 << 26)
2147 # define GEN8_WM_HZ_FULL_SURFACE_DEPTH_CLEAR (1 << 25)
2148 # define GEN8_WM_HZ_STENCIL_CLEAR_VALUE_MASK INTEL_MASK(23, 16)
2149 # define GEN8_WM_HZ_STENCIL_CLEAR_VALUE_SHIFT 16
2150 # define GEN8_WM_HZ_NUM_SAMPLES_MASK INTEL_MASK(15, 13)
2151 # define GEN8_WM_HZ_NUM_SAMPLES_SHIFT 13
2152 /* DW2 */
2153 # define GEN8_WM_HZ_CLEAR_RECTANGLE_Y_MIN_MASK INTEL_MASK(31, 16)
2154 # define GEN8_WM_HZ_CLEAR_RECTANGLE_Y_MIN_SHIFT 16
2155 # define GEN8_WM_HZ_CLEAR_RECTANGLE_X_MIN_MASK INTEL_MASK(15, 0)
2156 # define GEN8_WM_HZ_CLEAR_RECTANGLE_X_MIN_SHIFT 0
2157 /* DW3 */
2158 # define GEN8_WM_HZ_CLEAR_RECTANGLE_Y_MAX_MASK INTEL_MASK(31, 16)
2159 # define GEN8_WM_HZ_CLEAR_RECTANGLE_Y_MAX_SHIFT 16
2160 # define GEN8_WM_HZ_CLEAR_RECTANGLE_X_MAX_MASK INTEL_MASK(15, 0)
2161 # define GEN8_WM_HZ_CLEAR_RECTANGLE_X_MAX_SHIFT 0
2162 /* DW4 */
2163 # define GEN8_WM_HZ_SAMPLE_MASK_MASK INTEL_MASK(15, 0)
2164 # define GEN8_WM_HZ_SAMPLE_MASK_SHIFT 0
2165
2166
2167 #define _3DSTATE_PS_BLEND 0x784D /* GEN8+ */
2168 /* DW1 */
2169 # define GEN8_PS_BLEND_ALPHA_TO_COVERAGE_ENABLE (1 << 31)
2170 # define GEN8_PS_BLEND_HAS_WRITEABLE_RT (1 << 30)
2171 # define GEN8_PS_BLEND_COLOR_BUFFER_BLEND_ENABLE (1 << 29)
2172 # define GEN8_PS_BLEND_SRC_ALPHA_BLEND_FACTOR_MASK INTEL_MASK(28, 24)
2173 # define GEN8_PS_BLEND_SRC_ALPHA_BLEND_FACTOR_SHIFT 24
2174 # define GEN8_PS_BLEND_DST_ALPHA_BLEND_FACTOR_MASK INTEL_MASK(23, 19)
2175 # define GEN8_PS_BLEND_DST_ALPHA_BLEND_FACTOR_SHIFT 19
2176 # define GEN8_PS_BLEND_SRC_BLEND_FACTOR_MASK INTEL_MASK(18, 14)
2177 # define GEN8_PS_BLEND_SRC_BLEND_FACTOR_SHIFT 14
2178 # define GEN8_PS_BLEND_DST_BLEND_FACTOR_MASK INTEL_MASK(13, 9)
2179 # define GEN8_PS_BLEND_DST_BLEND_FACTOR_SHIFT 9
2180 # define GEN8_PS_BLEND_ALPHA_TEST_ENABLE (1 << 8)
2181 # define GEN8_PS_BLEND_INDEPENDENT_ALPHA_BLEND_ENABLE (1 << 7)
2182
2183 #define _3DSTATE_WM_DEPTH_STENCIL 0x784E /* GEN8+ */
2184 /* DW1 */
2185 # define GEN8_WM_DS_STENCIL_FAIL_OP_SHIFT 29
2186 # define GEN8_WM_DS_Z_FAIL_OP_SHIFT 26
2187 # define GEN8_WM_DS_Z_PASS_OP_SHIFT 23
2188 # define GEN8_WM_DS_BF_STENCIL_FUNC_SHIFT 20
2189 # define GEN8_WM_DS_BF_STENCIL_FAIL_OP_SHIFT 17
2190 # define GEN8_WM_DS_BF_Z_FAIL_OP_SHIFT 14
2191 # define GEN8_WM_DS_BF_Z_PASS_OP_SHIFT 11
2192 # define GEN8_WM_DS_STENCIL_FUNC_SHIFT 8
2193 # define GEN8_WM_DS_DEPTH_FUNC_SHIFT 5
2194 # define GEN8_WM_DS_DOUBLE_SIDED_STENCIL_ENABLE (1 << 4)
2195 # define GEN8_WM_DS_STENCIL_TEST_ENABLE (1 << 3)
2196 # define GEN8_WM_DS_STENCIL_BUFFER_WRITE_ENABLE (1 << 2)
2197 # define GEN8_WM_DS_DEPTH_TEST_ENABLE (1 << 1)
2198 # define GEN8_WM_DS_DEPTH_BUFFER_WRITE_ENABLE (1 << 0)
2199 /* DW2 */
2200 # define GEN8_WM_DS_STENCIL_TEST_MASK_MASK INTEL_MASK(31, 24)
2201 # define GEN8_WM_DS_STENCIL_TEST_MASK_SHIFT 24
2202 # define GEN8_WM_DS_STENCIL_WRITE_MASK_MASK INTEL_MASK(23, 16)
2203 # define GEN8_WM_DS_STENCIL_WRITE_MASK_SHIFT 16
2204 # define GEN8_WM_DS_BF_STENCIL_TEST_MASK_MASK INTEL_MASK(15, 8)
2205 # define GEN8_WM_DS_BF_STENCIL_TEST_MASK_SHIFT 8
2206 # define GEN8_WM_DS_BF_STENCIL_WRITE_MASK_MASK INTEL_MASK(7, 0)
2207 # define GEN8_WM_DS_BF_STENCIL_WRITE_MASK_SHIFT 0
2208 /* DW3 */
2209 # define GEN9_WM_DS_STENCIL_REF_MASK INTEL_MASK(15, 8)
2210 # define GEN9_WM_DS_STENCIL_REF_SHIFT 8
2211 # define GEN9_WM_DS_BF_STENCIL_REF_MASK INTEL_MASK(7, 0)
2212 # define GEN9_WM_DS_BF_STENCIL_REF_SHIFT 0
2213
2214 enum brw_pixel_shader_computed_depth_mode {
2215 BRW_PSCDEPTH_OFF = 0, /* PS does not compute depth */
2216 BRW_PSCDEPTH_ON = 1, /* PS computes depth; no guarantee about value */
2217 BRW_PSCDEPTH_ON_GE = 2, /* PS guarantees output depth >= source depth */
2218 BRW_PSCDEPTH_ON_LE = 3, /* PS guarantees output depth <= source depth */
2219 };
2220
2221 enum brw_pixel_shader_coverage_mask_mode {
2222 BRW_PSICMS_OFF = 0, /* PS does not use input coverage masks. */
2223 BRW_PSICMS_NORMAL = 1, /* Input Coverage masks based on outer conservatism
2224 * and factors in SAMPLE_MASK. If Pixel is
2225 * conservatively covered, all samples are enabled.
2226 */
2227
2228 BRW_PSICMS_INNER = 2, /* Input Coverage masks based on inner conservatism
2229 * and factors in SAMPLE_MASK. If Pixel is
2230 * conservatively *FULLY* covered, all samples are
2231 * enabled.
2232 */
2233 BRW_PCICMS_DEPTH = 3,
2234 };
2235
2236 #define _3DSTATE_PS_EXTRA 0x784F /* GEN8+ */
2237 /* DW1 */
2238 # define GEN8_PSX_PIXEL_SHADER_VALID (1 << 31)
2239 # define GEN8_PSX_PIXEL_SHADER_NO_RT_WRITE (1 << 30)
2240 # define GEN8_PSX_OMASK_TO_RENDER_TARGET (1 << 29)
2241 # define GEN8_PSX_KILL_ENABLE (1 << 28)
2242 # define GEN8_PSX_COMPUTED_DEPTH_MODE_SHIFT 26
2243 # define GEN8_PSX_FORCE_COMPUTED_DEPTH (1 << 25)
2244 # define GEN8_PSX_USES_SOURCE_DEPTH (1 << 24)
2245 # define GEN8_PSX_USES_SOURCE_W (1 << 23)
2246 # define GEN8_PSX_ATTRIBUTE_ENABLE (1 << 8)
2247 # define GEN8_PSX_SHADER_DISABLES_ALPHA_TO_COVERAGE (1 << 7)
2248 # define GEN8_PSX_SHADER_IS_PER_SAMPLE (1 << 6)
2249 # define GEN9_PSX_SHADER_COMPUTES_STENCIL (1 << 5)
2250 # define GEN9_PSX_SHADER_PULLS_BARY (1 << 3)
2251 # define GEN8_PSX_SHADER_HAS_UAV (1 << 2)
2252 # define GEN8_PSX_SHADER_USES_INPUT_COVERAGE_MASK (1 << 1)
2253 # define GEN9_PSX_SHADER_NORMAL_COVERAGE_MASK_SHIFT 0
2254
2255 enum brw_barycentric_mode {
2256 BRW_BARYCENTRIC_PERSPECTIVE_PIXEL = 0,
2257 BRW_BARYCENTRIC_PERSPECTIVE_CENTROID = 1,
2258 BRW_BARYCENTRIC_PERSPECTIVE_SAMPLE = 2,
2259 BRW_BARYCENTRIC_NONPERSPECTIVE_PIXEL = 3,
2260 BRW_BARYCENTRIC_NONPERSPECTIVE_CENTROID = 4,
2261 BRW_BARYCENTRIC_NONPERSPECTIVE_SAMPLE = 5,
2262 BRW_BARYCENTRIC_MODE_COUNT = 6
2263 };
2264 #define BRW_BARYCENTRIC_NONPERSPECTIVE_BITS \
2265 ((1 << BRW_BARYCENTRIC_NONPERSPECTIVE_PIXEL) | \
2266 (1 << BRW_BARYCENTRIC_NONPERSPECTIVE_CENTROID) | \
2267 (1 << BRW_BARYCENTRIC_NONPERSPECTIVE_SAMPLE))
2268
2269 #define _3DSTATE_WM 0x7814 /* GEN6+ */
2270 /* DW1: kernel pointer */
2271 /* DW2 */
2272 # define GEN6_WM_SPF_MODE (1 << 31)
2273 # define GEN6_WM_VECTOR_MASK_ENABLE (1 << 30)
2274 # define GEN6_WM_SAMPLER_COUNT_SHIFT 27
2275 # define GEN6_WM_BINDING_TABLE_ENTRY_COUNT_SHIFT 18
2276 # define GEN6_WM_FLOATING_POINT_MODE_IEEE_754 (0 << 16)
2277 # define GEN6_WM_FLOATING_POINT_MODE_ALT (1 << 16)
2278 /* DW3: scratch space */
2279 /* DW4 */
2280 # define GEN6_WM_STATISTICS_ENABLE (1 << 31)
2281 # define GEN6_WM_DEPTH_CLEAR (1 << 30)
2282 # define GEN6_WM_DEPTH_RESOLVE (1 << 28)
2283 # define GEN6_WM_HIERARCHICAL_DEPTH_RESOLVE (1 << 27)
2284 # define GEN6_WM_DISPATCH_START_GRF_SHIFT_0 16
2285 # define GEN6_WM_DISPATCH_START_GRF_SHIFT_1 8
2286 # define GEN6_WM_DISPATCH_START_GRF_SHIFT_2 0
2287 /* DW5 */
2288 # define GEN6_WM_MAX_THREADS_SHIFT 25
2289 # define GEN6_WM_KILL_ENABLE (1 << 22)
2290 # define GEN6_WM_COMPUTED_DEPTH (1 << 21)
2291 # define GEN6_WM_USES_SOURCE_DEPTH (1 << 20)
2292 # define GEN6_WM_DISPATCH_ENABLE (1 << 19)
2293 # define GEN6_WM_LINE_END_CAP_AA_WIDTH_0_5 (0 << 16)
2294 # define GEN6_WM_LINE_END_CAP_AA_WIDTH_1_0 (1 << 16)
2295 # define GEN6_WM_LINE_END_CAP_AA_WIDTH_2_0 (2 << 16)
2296 # define GEN6_WM_LINE_END_CAP_AA_WIDTH_4_0 (3 << 16)
2297 # define GEN6_WM_LINE_AA_WIDTH_0_5 (0 << 14)
2298 # define GEN6_WM_LINE_AA_WIDTH_1_0 (1 << 14)
2299 # define GEN6_WM_LINE_AA_WIDTH_2_0 (2 << 14)
2300 # define GEN6_WM_LINE_AA_WIDTH_4_0 (3 << 14)
2301 # define GEN6_WM_POLYGON_STIPPLE_ENABLE (1 << 13)
2302 # define GEN6_WM_LINE_STIPPLE_ENABLE (1 << 11)
2303 # define GEN6_WM_OMASK_TO_RENDER_TARGET (1 << 9)
2304 # define GEN6_WM_USES_SOURCE_W (1 << 8)
2305 # define GEN6_WM_DUAL_SOURCE_BLEND_ENABLE (1 << 7)
2306 # define GEN6_WM_32_DISPATCH_ENABLE (1 << 2)
2307 # define GEN6_WM_16_DISPATCH_ENABLE (1 << 1)
2308 # define GEN6_WM_8_DISPATCH_ENABLE (1 << 0)
2309 /* DW6 */
2310 # define GEN6_WM_NUM_SF_OUTPUTS_SHIFT 20
2311 # define GEN6_WM_POSOFFSET_NONE (0 << 18)
2312 # define GEN6_WM_POSOFFSET_CENTROID (2 << 18)
2313 # define GEN6_WM_POSOFFSET_SAMPLE (3 << 18)
2314 # define GEN6_WM_POSITION_ZW_PIXEL (0 << 16)
2315 # define GEN6_WM_POSITION_ZW_CENTROID (2 << 16)
2316 # define GEN6_WM_POSITION_ZW_SAMPLE (3 << 16)
2317 # define GEN6_WM_NONPERSPECTIVE_SAMPLE_BARYCENTRIC (1 << 15)
2318 # define GEN6_WM_NONPERSPECTIVE_CENTROID_BARYCENTRIC (1 << 14)
2319 # define GEN6_WM_NONPERSPECTIVE_PIXEL_BARYCENTRIC (1 << 13)
2320 # define GEN6_WM_PERSPECTIVE_SAMPLE_BARYCENTRIC (1 << 12)
2321 # define GEN6_WM_PERSPECTIVE_CENTROID_BARYCENTRIC (1 << 11)
2322 # define GEN6_WM_PERSPECTIVE_PIXEL_BARYCENTRIC (1 << 10)
2323 # define GEN6_WM_BARYCENTRIC_INTERPOLATION_MODE_SHIFT 10
2324 # define GEN6_WM_POINT_RASTRULE_UPPER_RIGHT (1 << 9)
2325 # define GEN6_WM_MSRAST_OFF_PIXEL (0 << 1)
2326 # define GEN6_WM_MSRAST_OFF_PATTERN (1 << 1)
2327 # define GEN6_WM_MSRAST_ON_PIXEL (2 << 1)
2328 # define GEN6_WM_MSRAST_ON_PATTERN (3 << 1)
2329 # define GEN6_WM_MSDISPMODE_PERSAMPLE (0 << 0)
2330 # define GEN6_WM_MSDISPMODE_PERPIXEL (1 << 0)
2331 /* DW7: kernel 1 pointer */
2332 /* DW8: kernel 2 pointer */
2333
2334 #define _3DSTATE_CONSTANT_VS 0x7815 /* GEN6+ */
2335 #define _3DSTATE_CONSTANT_GS 0x7816 /* GEN6+ */
2336 #define _3DSTATE_CONSTANT_PS 0x7817 /* GEN6+ */
2337 # define GEN6_CONSTANT_BUFFER_3_ENABLE (1 << 15)
2338 # define GEN6_CONSTANT_BUFFER_2_ENABLE (1 << 14)
2339 # define GEN6_CONSTANT_BUFFER_1_ENABLE (1 << 13)
2340 # define GEN6_CONSTANT_BUFFER_0_ENABLE (1 << 12)
2341
2342 #define _3DSTATE_CONSTANT_HS 0x7819 /* GEN7+ */
2343 #define _3DSTATE_CONSTANT_DS 0x781A /* GEN7+ */
2344
2345 #define _3DSTATE_STREAMOUT 0x781e /* GEN7+ */
2346 /* DW1 */
2347 # define SO_FUNCTION_ENABLE (1 << 31)
2348 # define SO_RENDERING_DISABLE (1 << 30)
2349 /* This selects which incoming rendering stream goes down the pipeline. The
2350 * rendering stream is 0 if not defined by special cases in the GS state.
2351 */
2352 # define SO_RENDER_STREAM_SELECT_SHIFT 27
2353 # define SO_RENDER_STREAM_SELECT_MASK INTEL_MASK(28, 27)
2354 /* Controls reordering of TRISTRIP_* elements in stream output (not rendering).
2355 */
2356 # define SO_REORDER_TRAILING (1 << 26)
2357 /* Controls SO_NUM_PRIMS_WRITTEN_* and SO_PRIM_STORAGE_* */
2358 # define SO_STATISTICS_ENABLE (1 << 25)
2359 # define SO_BUFFER_ENABLE(n) (1 << (8 + (n)))
2360 /* DW2 */
2361 # define SO_STREAM_3_VERTEX_READ_OFFSET_SHIFT 29
2362 # define SO_STREAM_3_VERTEX_READ_OFFSET_MASK INTEL_MASK(29, 29)
2363 # define SO_STREAM_3_VERTEX_READ_LENGTH_SHIFT 24
2364 # define SO_STREAM_3_VERTEX_READ_LENGTH_MASK INTEL_MASK(28, 24)
2365 # define SO_STREAM_2_VERTEX_READ_OFFSET_SHIFT 21
2366 # define SO_STREAM_2_VERTEX_READ_OFFSET_MASK INTEL_MASK(21, 21)
2367 # define SO_STREAM_2_VERTEX_READ_LENGTH_SHIFT 16
2368 # define SO_STREAM_2_VERTEX_READ_LENGTH_MASK INTEL_MASK(20, 16)
2369 # define SO_STREAM_1_VERTEX_READ_OFFSET_SHIFT 13
2370 # define SO_STREAM_1_VERTEX_READ_OFFSET_MASK INTEL_MASK(13, 13)
2371 # define SO_STREAM_1_VERTEX_READ_LENGTH_SHIFT 8
2372 # define SO_STREAM_1_VERTEX_READ_LENGTH_MASK INTEL_MASK(12, 8)
2373 # define SO_STREAM_0_VERTEX_READ_OFFSET_SHIFT 5
2374 # define SO_STREAM_0_VERTEX_READ_OFFSET_MASK INTEL_MASK(5, 5)
2375 # define SO_STREAM_0_VERTEX_READ_LENGTH_SHIFT 0
2376 # define SO_STREAM_0_VERTEX_READ_LENGTH_MASK INTEL_MASK(4, 0)
2377
2378 /* 3DSTATE_WM for Gen7 */
2379 /* DW1 */
2380 # define GEN7_WM_STATISTICS_ENABLE (1 << 31)
2381 # define GEN7_WM_DEPTH_CLEAR (1 << 30)
2382 # define GEN7_WM_DISPATCH_ENABLE (1 << 29)
2383 # define GEN7_WM_DEPTH_RESOLVE (1 << 28)
2384 # define GEN7_WM_HIERARCHICAL_DEPTH_RESOLVE (1 << 27)
2385 # define GEN7_WM_KILL_ENABLE (1 << 25)
2386 # define GEN7_WM_COMPUTED_DEPTH_MODE_SHIFT 23
2387 # define GEN7_WM_USES_SOURCE_DEPTH (1 << 20)
2388 # define GEN7_WM_EARLY_DS_CONTROL_NORMAL (0 << 21)
2389 # define GEN7_WM_EARLY_DS_CONTROL_PSEXEC (1 << 21)
2390 # define GEN7_WM_EARLY_DS_CONTROL_PREPS (2 << 21)
2391 # define GEN7_WM_USES_SOURCE_W (1 << 19)
2392 # define GEN7_WM_POSITION_ZW_PIXEL (0 << 17)
2393 # define GEN7_WM_POSITION_ZW_CENTROID (2 << 17)
2394 # define GEN7_WM_POSITION_ZW_SAMPLE (3 << 17)
2395 # define GEN7_WM_BARYCENTRIC_INTERPOLATION_MODE_SHIFT 11
2396 # define GEN7_WM_USES_INPUT_COVERAGE_MASK (1 << 10)
2397 # define GEN7_WM_LINE_END_CAP_AA_WIDTH_0_5 (0 << 8)
2398 # define GEN7_WM_LINE_END_CAP_AA_WIDTH_1_0 (1 << 8)
2399 # define GEN7_WM_LINE_END_CAP_AA_WIDTH_2_0 (2 << 8)
2400 # define GEN7_WM_LINE_END_CAP_AA_WIDTH_4_0 (3 << 8)
2401 # define GEN7_WM_LINE_AA_WIDTH_0_5 (0 << 6)
2402 # define GEN7_WM_LINE_AA_WIDTH_1_0 (1 << 6)
2403 # define GEN7_WM_LINE_AA_WIDTH_2_0 (2 << 6)
2404 # define GEN7_WM_LINE_AA_WIDTH_4_0 (3 << 6)
2405 # define GEN7_WM_POLYGON_STIPPLE_ENABLE (1 << 4)
2406 # define GEN7_WM_LINE_STIPPLE_ENABLE (1 << 3)
2407 # define GEN7_WM_POINT_RASTRULE_UPPER_RIGHT (1 << 2)
2408 # define GEN7_WM_MSRAST_OFF_PIXEL (0 << 0)
2409 # define GEN7_WM_MSRAST_OFF_PATTERN (1 << 0)
2410 # define GEN7_WM_MSRAST_ON_PIXEL (2 << 0)
2411 # define GEN7_WM_MSRAST_ON_PATTERN (3 << 0)
2412 /* DW2 */
2413 # define GEN7_WM_MSDISPMODE_PERSAMPLE (0 << 31)
2414 # define GEN7_WM_MSDISPMODE_PERPIXEL (1 << 31)
2415 # define HSW_WM_UAV_ONLY (1 << 30)
2416
2417 #define _3DSTATE_PS 0x7820 /* GEN7+ */
2418 /* DW1: kernel pointer */
2419 /* DW2 */
2420 # define GEN7_PS_SPF_MODE (1 << 31)
2421 # define GEN7_PS_VECTOR_MASK_ENABLE (1 << 30)
2422 # define GEN7_PS_SAMPLER_COUNT_SHIFT 27
2423 # define GEN7_PS_SAMPLER_COUNT_MASK INTEL_MASK(29, 27)
2424 # define GEN7_PS_BINDING_TABLE_ENTRY_COUNT_SHIFT 18
2425 # define GEN7_PS_FLOATING_POINT_MODE_IEEE_754 (0 << 16)
2426 # define GEN7_PS_FLOATING_POINT_MODE_ALT (1 << 16)
2427 /* DW3: scratch space */
2428 /* DW4 */
2429 # define IVB_PS_MAX_THREADS_SHIFT 24
2430 # define HSW_PS_MAX_THREADS_SHIFT 23
2431 # define HSW_PS_SAMPLE_MASK_SHIFT 12
2432 # define HSW_PS_SAMPLE_MASK_MASK INTEL_MASK(19, 12)
2433 # define GEN7_PS_PUSH_CONSTANT_ENABLE (1 << 11)
2434 # define GEN7_PS_ATTRIBUTE_ENABLE (1 << 10)
2435 # define GEN7_PS_OMASK_TO_RENDER_TARGET (1 << 9)
2436 # define GEN7_PS_RENDER_TARGET_FAST_CLEAR_ENABLE (1 << 8)
2437 # define GEN7_PS_DUAL_SOURCE_BLEND_ENABLE (1 << 7)
2438 # define GEN7_PS_RENDER_TARGET_RESOLVE_ENABLE (1 << 6)
2439 # define GEN9_PS_RENDER_TARGET_RESOLVE_FULL (3 << 6)
2440 # define HSW_PS_UAV_ACCESS_ENABLE (1 << 5)
2441 # define GEN7_PS_POSOFFSET_NONE (0 << 3)
2442 # define GEN7_PS_POSOFFSET_CENTROID (2 << 3)
2443 # define GEN7_PS_POSOFFSET_SAMPLE (3 << 3)
2444 # define GEN7_PS_32_DISPATCH_ENABLE (1 << 2)
2445 # define GEN7_PS_16_DISPATCH_ENABLE (1 << 1)
2446 # define GEN7_PS_8_DISPATCH_ENABLE (1 << 0)
2447 /* DW5 */
2448 # define GEN7_PS_DISPATCH_START_GRF_SHIFT_0 16
2449 # define GEN7_PS_DISPATCH_START_GRF_SHIFT_1 8
2450 # define GEN7_PS_DISPATCH_START_GRF_SHIFT_2 0
2451 /* DW6: kernel 1 pointer */
2452 /* DW7: kernel 2 pointer */
2453
2454 #define _3DSTATE_SAMPLE_MASK 0x7818 /* GEN6+ */
2455
2456 #define _3DSTATE_DRAWING_RECTANGLE 0x7900
2457 #define _3DSTATE_BLEND_CONSTANT_COLOR 0x7901
2458 #define _3DSTATE_CHROMA_KEY 0x7904
2459 #define _3DSTATE_DEPTH_BUFFER 0x7905 /* GEN4-6 */
2460 #define _3DSTATE_POLY_STIPPLE_OFFSET 0x7906
2461 #define _3DSTATE_POLY_STIPPLE_PATTERN 0x7907
2462 #define _3DSTATE_LINE_STIPPLE_PATTERN 0x7908
2463 #define _3DSTATE_GLOBAL_DEPTH_OFFSET_CLAMP 0x7909
2464 #define _3DSTATE_AA_LINE_PARAMETERS 0x790a /* G45+ */
2465
2466 #define _3DSTATE_GS_SVB_INDEX 0x790b /* CTG+ */
2467 /* DW1 */
2468 # define SVB_INDEX_SHIFT 29
2469 # define SVB_LOAD_INTERNAL_VERTEX_COUNT (1 << 0) /* SNB+ */
2470 /* DW2: SVB index */
2471 /* DW3: SVB maximum index */
2472
2473 #define _3DSTATE_MULTISAMPLE 0x790d /* GEN6+ */
2474 #define GEN8_3DSTATE_MULTISAMPLE 0x780d /* GEN8+ */
2475 /* DW1 */
2476 # define MS_PIXEL_LOCATION_CENTER (0 << 4)
2477 # define MS_PIXEL_LOCATION_UPPER_LEFT (1 << 4)
2478 # define MS_NUMSAMPLES_1 (0 << 1)
2479 # define MS_NUMSAMPLES_2 (1 << 1)
2480 # define MS_NUMSAMPLES_4 (2 << 1)
2481 # define MS_NUMSAMPLES_8 (3 << 1)
2482 # define MS_NUMSAMPLES_16 (4 << 1)
2483
2484 #define _3DSTATE_SAMPLE_PATTERN 0x791c
2485
2486 #define _3DSTATE_STENCIL_BUFFER 0x790e /* ILK, SNB */
2487 #define _3DSTATE_HIER_DEPTH_BUFFER 0x790f /* ILK, SNB */
2488
2489 #define GEN7_3DSTATE_CLEAR_PARAMS 0x7804
2490 #define GEN7_3DSTATE_DEPTH_BUFFER 0x7805
2491 #define GEN7_3DSTATE_STENCIL_BUFFER 0x7806
2492 # define HSW_STENCIL_ENABLED (1 << 31)
2493 #define GEN7_3DSTATE_HIER_DEPTH_BUFFER 0x7807
2494
2495 #define _3DSTATE_CLEAR_PARAMS 0x7910 /* ILK, SNB */
2496 # define GEN5_DEPTH_CLEAR_VALID (1 << 15)
2497 /* DW1: depth clear value */
2498 /* DW2 */
2499 # define GEN7_DEPTH_CLEAR_VALID (1 << 0)
2500
2501 #define _3DSTATE_SO_DECL_LIST 0x7917 /* GEN7+ */
2502 /* DW1 */
2503 # define SO_STREAM_TO_BUFFER_SELECTS_3_SHIFT 12
2504 # define SO_STREAM_TO_BUFFER_SELECTS_3_MASK INTEL_MASK(15, 12)
2505 # define SO_STREAM_TO_BUFFER_SELECTS_2_SHIFT 8
2506 # define SO_STREAM_TO_BUFFER_SELECTS_2_MASK INTEL_MASK(11, 8)
2507 # define SO_STREAM_TO_BUFFER_SELECTS_1_SHIFT 4
2508 # define SO_STREAM_TO_BUFFER_SELECTS_1_MASK INTEL_MASK(7, 4)
2509 # define SO_STREAM_TO_BUFFER_SELECTS_0_SHIFT 0
2510 # define SO_STREAM_TO_BUFFER_SELECTS_0_MASK INTEL_MASK(3, 0)
2511 /* DW2 */
2512 # define SO_NUM_ENTRIES_3_SHIFT 24
2513 # define SO_NUM_ENTRIES_3_MASK INTEL_MASK(31, 24)
2514 # define SO_NUM_ENTRIES_2_SHIFT 16
2515 # define SO_NUM_ENTRIES_2_MASK INTEL_MASK(23, 16)
2516 # define SO_NUM_ENTRIES_1_SHIFT 8
2517 # define SO_NUM_ENTRIES_1_MASK INTEL_MASK(15, 8)
2518 # define SO_NUM_ENTRIES_0_SHIFT 0
2519 # define SO_NUM_ENTRIES_0_MASK INTEL_MASK(7, 0)
2520
2521 /* SO_DECL DW0 */
2522 # define SO_DECL_OUTPUT_BUFFER_SLOT_SHIFT 12
2523 # define SO_DECL_OUTPUT_BUFFER_SLOT_MASK INTEL_MASK(13, 12)
2524 # define SO_DECL_HOLE_FLAG (1 << 11)
2525 # define SO_DECL_REGISTER_INDEX_SHIFT 4
2526 # define SO_DECL_REGISTER_INDEX_MASK INTEL_MASK(9, 4)
2527 # define SO_DECL_COMPONENT_MASK_SHIFT 0
2528 # define SO_DECL_COMPONENT_MASK_MASK INTEL_MASK(3, 0)
2529
2530 #define _3DSTATE_SO_BUFFER 0x7918 /* GEN7+ */
2531 /* DW1 */
2532 # define GEN8_SO_BUFFER_ENABLE (1 << 31)
2533 # define SO_BUFFER_INDEX_SHIFT 29
2534 # define SO_BUFFER_INDEX_MASK INTEL_MASK(30, 29)
2535 # define GEN8_SO_BUFFER_OFFSET_WRITE_ENABLE (1 << 21)
2536 # define GEN8_SO_BUFFER_OFFSET_ADDRESS_ENABLE (1 << 20)
2537 # define SO_BUFFER_PITCH_SHIFT 0
2538 # define SO_BUFFER_PITCH_MASK INTEL_MASK(11, 0)
2539 /* DW2: start address */
2540 /* DW3: end address. */
2541
2542 #define CMD_MI_FLUSH 0x0200
2543
2544 # define BLT_X_SHIFT 0
2545 # define BLT_X_MASK INTEL_MASK(15, 0)
2546 # define BLT_Y_SHIFT 16
2547 # define BLT_Y_MASK INTEL_MASK(31, 16)
2548
2549 #define GEN5_MI_REPORT_PERF_COUNT ((0x26 << 23) | (3 - 2))
2550 /* DW0 */
2551 # define GEN5_MI_COUNTER_SET_0 (0 << 6)
2552 # define GEN5_MI_COUNTER_SET_1 (1 << 6)
2553 /* DW1 */
2554 # define MI_COUNTER_ADDRESS_GTT (1 << 0)
2555 /* DW2: a user-defined report ID (written to the buffer but can be anything) */
2556
2557 #define GEN6_MI_REPORT_PERF_COUNT ((0x28 << 23) | (3 - 2))
2558
2559 /* Bitfields for the URB_WRITE message, DW2 of message header: */
2560 #define URB_WRITE_PRIM_END 0x1
2561 #define URB_WRITE_PRIM_START 0x2
2562 #define URB_WRITE_PRIM_TYPE_SHIFT 2
2563
2564
2565 /* Maximum number of entries that can be addressed using a binding table
2566 * pointer of type SURFTYPE_BUFFER
2567 */
2568 #define BRW_MAX_NUM_BUFFER_ENTRIES (1 << 27)
2569
2570 /* Memory Object Control State:
2571 * Specifying zero for L3 means "uncached in L3", at least on Haswell
2572 * and Baytrail, since there are no PTE flags for setting L3 cacheability.
2573 * On Ivybridge, the PTEs do have a cache-in-L3 bit, so setting MOCS to 0
2574 * may still respect that.
2575 */
2576 #define GEN7_MOCS_L3 1
2577
2578 /* Ivybridge only: cache in LLC.
2579 * Specifying zero here means to use the PTE values set by the kernel;
2580 * non-zero overrides the PTE values.
2581 */
2582 #define IVB_MOCS_LLC (1 << 1)
2583
2584 /* Baytrail only: snoop in CPU cache */
2585 #define BYT_MOCS_SNOOP (1 << 1)
2586
2587 /* Haswell only: LLC/eLLC controls (write-back or uncached).
2588 * Specifying zero here means to use the PTE values set by the kernel,
2589 * which is useful since it offers additional control (write-through
2590 * cacheing and age). Non-zero overrides the PTE values.
2591 */
2592 #define HSW_MOCS_UC_LLC_UC_ELLC (1 << 1)
2593 #define HSW_MOCS_WB_LLC_WB_ELLC (2 << 1)
2594 #define HSW_MOCS_UC_LLC_WB_ELLC (3 << 1)
2595
2596 /* Broadwell: these defines always use all available caches (L3, LLC, eLLC),
2597 * and let you force write-back (WB) or write-through (WT) caching, or leave
2598 * it up to the page table entry (PTE) specified by the kernel.
2599 */
2600 #define BDW_MOCS_WB 0x78
2601 #define BDW_MOCS_WT 0x58
2602 #define BDW_MOCS_PTE 0x18
2603
2604 /* Skylake: MOCS is now an index into an array of 62 different caching
2605 * configurations programmed by the kernel.
2606 */
2607 /* TC=LLC/eLLC, LeCC=WB, LRUM=3, L3CC=WB */
2608 #define SKL_MOCS_WB (2 << 1)
2609 /* TC=LLC/eLLC, LeCC=PTE, LRUM=3, L3CC=WB */
2610 #define SKL_MOCS_PTE (1 << 1)
2611
2612 #define MEDIA_VFE_STATE 0x7000
2613 /* GEN7 DW2, GEN8+ DW3 */
2614 # define MEDIA_VFE_STATE_MAX_THREADS_SHIFT 16
2615 # define MEDIA_VFE_STATE_MAX_THREADS_MASK INTEL_MASK(31, 16)
2616 # define MEDIA_VFE_STATE_URB_ENTRIES_SHIFT 8
2617 # define MEDIA_VFE_STATE_URB_ENTRIES_MASK INTEL_MASK(15, 8)
2618 # define MEDIA_VFE_STATE_RESET_GTW_TIMER_SHIFT 7
2619 # define MEDIA_VFE_STATE_RESET_GTW_TIMER_MASK INTEL_MASK(7, 7)
2620 # define MEDIA_VFE_STATE_BYPASS_GTW_SHIFT 6
2621 # define MEDIA_VFE_STATE_BYPASS_GTW_MASK INTEL_MASK(6, 6)
2622 # define GEN7_MEDIA_VFE_STATE_GPGPU_MODE_SHIFT 2
2623 # define GEN7_MEDIA_VFE_STATE_GPGPU_MODE_MASK INTEL_MASK(2, 2)
2624 /* GEN7 DW4, GEN8+ DW5 */
2625 # define MEDIA_VFE_STATE_URB_ALLOC_SHIFT 16
2626 # define MEDIA_VFE_STATE_URB_ALLOC_MASK INTEL_MASK(31, 16)
2627 # define MEDIA_VFE_STATE_CURBE_ALLOC_SHIFT 0
2628 # define MEDIA_VFE_STATE_CURBE_ALLOC_MASK INTEL_MASK(15, 0)
2629
2630 #define MEDIA_CURBE_LOAD 0x7001
2631 #define MEDIA_INTERFACE_DESCRIPTOR_LOAD 0x7002
2632 /* GEN7 DW4, GEN8+ DW5 */
2633 # define MEDIA_CURBE_READ_LENGTH_SHIFT 16
2634 # define MEDIA_CURBE_READ_LENGTH_MASK INTEL_MASK(31, 16)
2635 # define MEDIA_CURBE_READ_OFFSET_SHIFT 0
2636 # define MEDIA_CURBE_READ_OFFSET_MASK INTEL_MASK(15, 0)
2637 /* GEN7 DW5, GEN8+ DW6 */
2638 # define MEDIA_BARRIER_ENABLE_SHIFT 21
2639 # define MEDIA_BARRIER_ENABLE_MASK INTEL_MASK(21, 21)
2640 # define MEDIA_SHARED_LOCAL_MEMORY_SIZE_SHIFT 16
2641 # define MEDIA_SHARED_LOCAL_MEMORY_SIZE_MASK INTEL_MASK(20, 16)
2642 # define MEDIA_GPGPU_THREAD_COUNT_SHIFT 0
2643 # define MEDIA_GPGPU_THREAD_COUNT_MASK INTEL_MASK(7, 0)
2644 # define GEN8_MEDIA_GPGPU_THREAD_COUNT_SHIFT 0
2645 # define GEN8_MEDIA_GPGPU_THREAD_COUNT_MASK INTEL_MASK(9, 0)
2646 /* GEN7 DW6, GEN8+ DW7 */
2647 # define CROSS_THREAD_READ_LENGTH_SHIFT 0
2648 # define CROSS_THREAD_READ_LENGTH_MASK INTEL_MASK(7, 0)
2649 #define MEDIA_STATE_FLUSH 0x7004
2650 #define GPGPU_WALKER 0x7105
2651 /* GEN7 DW0 */
2652 # define GEN7_GPGPU_INDIRECT_PARAMETER_ENABLE (1 << 10)
2653 # define GEN7_GPGPU_PREDICATE_ENABLE (1 << 8)
2654 /* GEN8+ DW2 */
2655 # define GPGPU_WALKER_INDIRECT_LENGTH_SHIFT 0
2656 # define GPGPU_WALKER_INDIRECT_LENGTH_MASK INTEL_MASK(15, 0)
2657 /* GEN7 DW2, GEN8+ DW4 */
2658 # define GPGPU_WALKER_SIMD_SIZE_SHIFT 30
2659 # define GPGPU_WALKER_SIMD_SIZE_MASK INTEL_MASK(31, 30)
2660 # define GPGPU_WALKER_THREAD_DEPTH_MAX_SHIFT 16
2661 # define GPGPU_WALKER_THREAD_DEPTH_MAX_MASK INTEL_MASK(21, 16)
2662 # define GPGPU_WALKER_THREAD_HEIGHT_MAX_SHIFT 8
2663 # define GPGPU_WALKER_THREAD_HEIGHT_MAX_MASK INTEL_MASK(31, 8)
2664 # define GPGPU_WALKER_THREAD_WIDTH_MAX_SHIFT 0
2665 # define GPGPU_WALKER_THREAD_WIDTH_MAX_MASK INTEL_MASK(5, 0)
2666
2667 #define CMD_MI (0x0 << 29)
2668 #define CMD_2D (0x2 << 29)
2669 #define CMD_3D (0x3 << 29)
2670
2671 #define MI_NOOP (CMD_MI | 0)
2672
2673 #define MI_BATCH_BUFFER_END (CMD_MI | 0xA << 23)
2674
2675 #define MI_FLUSH (CMD_MI | (4 << 23))
2676 #define FLUSH_MAP_CACHE (1 << 0)
2677 #define INHIBIT_FLUSH_RENDER_CACHE (1 << 2)
2678
2679 #define MI_STORE_DATA_IMM (CMD_MI | (0x20 << 23))
2680 #define MI_LOAD_REGISTER_IMM (CMD_MI | (0x22 << 23))
2681 #define MI_LOAD_REGISTER_REG (CMD_MI | (0x2A << 23))
2682
2683 #define MI_FLUSH_DW (CMD_MI | (0x26 << 23) | 2)
2684
2685 #define MI_STORE_REGISTER_MEM (CMD_MI | (0x24 << 23))
2686 # define MI_STORE_REGISTER_MEM_USE_GGTT (1 << 22)
2687 # define MI_STORE_REGISTER_MEM_PREDICATE (1 << 21)
2688
2689 /* Load a value from memory into a register. Only available on Gen7+. */
2690 #define GEN7_MI_LOAD_REGISTER_MEM (CMD_MI | (0x29 << 23))
2691 # define MI_LOAD_REGISTER_MEM_USE_GGTT (1 << 22)
2692
2693 /* Manipulate the predicate bit based on some register values. Only on Gen7+ */
2694 #define GEN7_MI_PREDICATE (CMD_MI | (0xC << 23))
2695 # define MI_PREDICATE_LOADOP_KEEP (0 << 6)
2696 # define MI_PREDICATE_LOADOP_LOAD (2 << 6)
2697 # define MI_PREDICATE_LOADOP_LOADINV (3 << 6)
2698 # define MI_PREDICATE_COMBINEOP_SET (0 << 3)
2699 # define MI_PREDICATE_COMBINEOP_AND (1 << 3)
2700 # define MI_PREDICATE_COMBINEOP_OR (2 << 3)
2701 # define MI_PREDICATE_COMBINEOP_XOR (3 << 3)
2702 # define MI_PREDICATE_COMPAREOP_TRUE (0 << 0)
2703 # define MI_PREDICATE_COMPAREOP_FALSE (1 << 0)
2704 # define MI_PREDICATE_COMPAREOP_SRCS_EQUAL (2 << 0)
2705 # define MI_PREDICATE_COMPAREOP_DELTAS_EQUAL (3 << 0)
2706
2707 #define HSW_MI_MATH (CMD_MI | (0x1a << 23))
2708
2709 #define MI_MATH_ALU2(opcode, operand1, operand2) \
2710 ( ((MI_MATH_OPCODE_##opcode) << 20) | ((MI_MATH_OPERAND_##operand1) << 10) | \
2711 ((MI_MATH_OPERAND_##operand2) << 0) )
2712
2713 #define MI_MATH_ALU1(opcode, operand1) \
2714 ( ((MI_MATH_OPCODE_##opcode) << 20) | ((MI_MATH_OPERAND_##operand1) << 10) )
2715
2716 #define MI_MATH_ALU0(opcode) \
2717 ( ((MI_MATH_OPCODE_##opcode) << 20) )
2718
2719 #define MI_MATH_OPCODE_NOOP 0x000
2720 #define MI_MATH_OPCODE_LOAD 0x080
2721 #define MI_MATH_OPCODE_LOADINV 0x480
2722 #define MI_MATH_OPCODE_LOAD0 0x081
2723 #define MI_MATH_OPCODE_LOAD1 0x481
2724 #define MI_MATH_OPCODE_ADD 0x100
2725 #define MI_MATH_OPCODE_SUB 0x101
2726 #define MI_MATH_OPCODE_AND 0x102
2727 #define MI_MATH_OPCODE_OR 0x103
2728 #define MI_MATH_OPCODE_XOR 0x104
2729 #define MI_MATH_OPCODE_STORE 0x180
2730 #define MI_MATH_OPCODE_STOREINV 0x580
2731
2732 #define MI_MATH_OPERAND_R0 0x00
2733 #define MI_MATH_OPERAND_R1 0x01
2734 #define MI_MATH_OPERAND_R2 0x02
2735 #define MI_MATH_OPERAND_R3 0x03
2736 #define MI_MATH_OPERAND_R4 0x04
2737 #define MI_MATH_OPERAND_SRCA 0x20
2738 #define MI_MATH_OPERAND_SRCB 0x21
2739 #define MI_MATH_OPERAND_ACCU 0x31
2740 #define MI_MATH_OPERAND_ZF 0x32
2741 #define MI_MATH_OPERAND_CF 0x33
2742
2743 /** @{
2744 *
2745 * PIPE_CONTROL operation, a combination MI_FLUSH and register write with
2746 * additional flushing control.
2747 */
2748 #define _3DSTATE_PIPE_CONTROL (CMD_3D | (3 << 27) | (2 << 24))
2749 #define PIPE_CONTROL_CS_STALL (1 << 20)
2750 #define PIPE_CONTROL_GLOBAL_SNAPSHOT_COUNT_RESET (1 << 19)
2751 #define PIPE_CONTROL_TLB_INVALIDATE (1 << 18)
2752 #define PIPE_CONTROL_SYNC_GFDT (1 << 17)
2753 #define PIPE_CONTROL_MEDIA_STATE_CLEAR (1 << 16)
2754 #define PIPE_CONTROL_NO_WRITE (0 << 14)
2755 #define PIPE_CONTROL_WRITE_IMMEDIATE (1 << 14)
2756 #define PIPE_CONTROL_WRITE_DEPTH_COUNT (2 << 14)
2757 #define PIPE_CONTROL_WRITE_TIMESTAMP (3 << 14)
2758 #define PIPE_CONTROL_DEPTH_STALL (1 << 13)
2759 #define PIPE_CONTROL_RENDER_TARGET_FLUSH (1 << 12)
2760 #define PIPE_CONTROL_INSTRUCTION_INVALIDATE (1 << 11)
2761 #define PIPE_CONTROL_TEXTURE_CACHE_INVALIDATE (1 << 10) /* GM45+ only */
2762 #define PIPE_CONTROL_ISP_DIS (1 << 9)
2763 #define PIPE_CONTROL_INTERRUPT_ENABLE (1 << 8)
2764 #define PIPE_CONTROL_FLUSH_ENABLE (1 << 7) /* Gen7+ only */
2765 /* GT */
2766 #define PIPE_CONTROL_DATA_CACHE_FLUSH (1 << 5)
2767 #define PIPE_CONTROL_VF_CACHE_INVALIDATE (1 << 4)
2768 #define PIPE_CONTROL_CONST_CACHE_INVALIDATE (1 << 3)
2769 #define PIPE_CONTROL_STATE_CACHE_INVALIDATE (1 << 2)
2770 #define PIPE_CONTROL_STALL_AT_SCOREBOARD (1 << 1)
2771 #define PIPE_CONTROL_DEPTH_CACHE_FLUSH (1 << 0)
2772 #define PIPE_CONTROL_PPGTT_WRITE (0 << 2)
2773 #define PIPE_CONTROL_GLOBAL_GTT_WRITE (1 << 2)
2774
2775 #define PIPE_CONTROL_CACHE_FLUSH_BITS \
2776 (PIPE_CONTROL_DEPTH_CACHE_FLUSH | PIPE_CONTROL_DATA_CACHE_FLUSH | \
2777 PIPE_CONTROL_RENDER_TARGET_FLUSH)
2778
2779 #define PIPE_CONTROL_CACHE_INVALIDATE_BITS \
2780 (PIPE_CONTROL_STATE_CACHE_INVALIDATE | PIPE_CONTROL_CONST_CACHE_INVALIDATE | \
2781 PIPE_CONTROL_VF_CACHE_INVALIDATE | PIPE_CONTROL_TEXTURE_CACHE_INVALIDATE | \
2782 PIPE_CONTROL_INSTRUCTION_INVALIDATE)
2783
2784 /** @} */
2785
2786 #define XY_SETUP_BLT_CMD (CMD_2D | (0x01 << 22))
2787
2788 #define XY_COLOR_BLT_CMD (CMD_2D | (0x50 << 22))
2789
2790 #define XY_SRC_COPY_BLT_CMD (CMD_2D | (0x53 << 22))
2791
2792 #define XY_FAST_COPY_BLT_CMD (CMD_2D | (0x42 << 22))
2793
2794 #define XY_TEXT_IMMEDIATE_BLIT_CMD (CMD_2D | (0x31 << 22))
2795 # define XY_TEXT_BYTE_PACKED (1 << 16)
2796
2797 /* BR00 */
2798 #define XY_BLT_WRITE_ALPHA (1 << 21)
2799 #define XY_BLT_WRITE_RGB (1 << 20)
2800 #define XY_SRC_TILED (1 << 15)
2801 #define XY_DST_TILED (1 << 11)
2802
2803 /* BR00 */
2804 #define XY_FAST_SRC_TILED_64K (3 << 20)
2805 #define XY_FAST_SRC_TILED_Y (2 << 20)
2806 #define XY_FAST_SRC_TILED_X (1 << 20)
2807
2808 #define XY_FAST_DST_TILED_64K (3 << 13)
2809 #define XY_FAST_DST_TILED_Y (2 << 13)
2810 #define XY_FAST_DST_TILED_X (1 << 13)
2811
2812 /* BR13 */
2813 #define BR13_8 (0x0 << 24)
2814 #define BR13_565 (0x1 << 24)
2815 #define BR13_8888 (0x3 << 24)
2816 #define BR13_16161616 (0x4 << 24)
2817 #define BR13_32323232 (0x5 << 24)
2818
2819 #define XY_FAST_SRC_TRMODE_YF (1 << 31)
2820 #define XY_FAST_DST_TRMODE_YF (1 << 30)
2821
2822 /* Pipeline Statistics Counter Registers */
2823 #define IA_VERTICES_COUNT 0x2310
2824 #define IA_PRIMITIVES_COUNT 0x2318
2825 #define VS_INVOCATION_COUNT 0x2320
2826 #define HS_INVOCATION_COUNT 0x2300
2827 #define DS_INVOCATION_COUNT 0x2308
2828 #define GS_INVOCATION_COUNT 0x2328
2829 #define GS_PRIMITIVES_COUNT 0x2330
2830 #define CL_INVOCATION_COUNT 0x2338
2831 #define CL_PRIMITIVES_COUNT 0x2340
2832 #define PS_INVOCATION_COUNT 0x2348
2833 #define CS_INVOCATION_COUNT 0x2290
2834 #define PS_DEPTH_COUNT 0x2350
2835
2836 #define GEN6_SO_PRIM_STORAGE_NEEDED 0x2280
2837 #define GEN7_SO_PRIM_STORAGE_NEEDED(n) (0x5240 + (n) * 8)
2838
2839 #define GEN6_SO_NUM_PRIMS_WRITTEN 0x2288
2840 #define GEN7_SO_NUM_PRIMS_WRITTEN(n) (0x5200 + (n) * 8)
2841
2842 #define GEN7_SO_WRITE_OFFSET(n) (0x5280 + (n) * 4)
2843
2844 #define TIMESTAMP 0x2358
2845
2846 #define BCS_SWCTRL 0x22200
2847 # define BCS_SWCTRL_SRC_Y (1 << 0)
2848 # define BCS_SWCTRL_DST_Y (1 << 1)
2849
2850 #define OACONTROL 0x2360
2851 # define OACONTROL_COUNTER_SELECT_SHIFT 2
2852 # define OACONTROL_ENABLE_COUNTERS (1 << 0)
2853
2854 /* Auto-Draw / Indirect Registers */
2855 #define GEN7_3DPRIM_END_OFFSET 0x2420
2856 #define GEN7_3DPRIM_START_VERTEX 0x2430
2857 #define GEN7_3DPRIM_VERTEX_COUNT 0x2434
2858 #define GEN7_3DPRIM_INSTANCE_COUNT 0x2438
2859 #define GEN7_3DPRIM_START_INSTANCE 0x243C
2860 #define GEN7_3DPRIM_BASE_VERTEX 0x2440
2861
2862 /* Auto-Compute / Indirect Registers */
2863 #define GEN7_GPGPU_DISPATCHDIMX 0x2500
2864 #define GEN7_GPGPU_DISPATCHDIMY 0x2504
2865 #define GEN7_GPGPU_DISPATCHDIMZ 0x2508
2866
2867 #define GEN7_CACHE_MODE_1 0x7004
2868 # define GEN8_HIZ_NP_PMA_FIX_ENABLE (1 << 11)
2869 # define GEN8_HIZ_NP_EARLY_Z_FAILS_DISABLE (1 << 13)
2870 # define GEN9_PARTIAL_RESOLVE_DISABLE_IN_VC (1 << 1)
2871 # define GEN8_HIZ_PMA_MASK_BITS \
2872 REG_MASK(GEN8_HIZ_NP_PMA_FIX_ENABLE | GEN8_HIZ_NP_EARLY_Z_FAILS_DISABLE)
2873
2874 /* Predicate registers */
2875 #define MI_PREDICATE_SRC0 0x2400
2876 #define MI_PREDICATE_SRC1 0x2408
2877 #define MI_PREDICATE_DATA 0x2410
2878 #define MI_PREDICATE_RESULT 0x2418
2879 #define MI_PREDICATE_RESULT_1 0x241C
2880 #define MI_PREDICATE_RESULT_2 0x2214
2881
2882 #define HSW_CS_GPR(n) (0x2600 + (n) * 8)
2883
2884 /* L3 cache control registers. */
2885 #define GEN7_L3SQCREG1 0xb010
2886 /* L3SQ general and high priority credit initialization. */
2887 # define IVB_L3SQCREG1_SQGHPCI_DEFAULT 0x00730000
2888 # define VLV_L3SQCREG1_SQGHPCI_DEFAULT 0x00d30000
2889 # define HSW_L3SQCREG1_SQGHPCI_DEFAULT 0x00610000
2890 # define GEN7_L3SQCREG1_CONV_DC_UC (1 << 24)
2891 # define GEN7_L3SQCREG1_CONV_IS_UC (1 << 25)
2892 # define GEN7_L3SQCREG1_CONV_C_UC (1 << 26)
2893 # define GEN7_L3SQCREG1_CONV_T_UC (1 << 27)
2894
2895 #define GEN7_L3CNTLREG2 0xb020
2896 # define GEN7_L3CNTLREG2_SLM_ENABLE (1 << 0)
2897 # define GEN7_L3CNTLREG2_URB_ALLOC_SHIFT 1
2898 # define GEN7_L3CNTLREG2_URB_ALLOC_MASK INTEL_MASK(6, 1)
2899 # define GEN7_L3CNTLREG2_URB_LOW_BW (1 << 7)
2900 # define GEN7_L3CNTLREG2_ALL_ALLOC_SHIFT 8
2901 # define GEN7_L3CNTLREG2_ALL_ALLOC_MASK INTEL_MASK(13, 8)
2902 # define GEN7_L3CNTLREG2_RO_ALLOC_SHIFT 14
2903 # define GEN7_L3CNTLREG2_RO_ALLOC_MASK INTEL_MASK(19, 14)
2904 # define GEN7_L3CNTLREG2_RO_LOW_BW (1 << 20)
2905 # define GEN7_L3CNTLREG2_DC_ALLOC_SHIFT 21
2906 # define GEN7_L3CNTLREG2_DC_ALLOC_MASK INTEL_MASK(26, 21)
2907 # define GEN7_L3CNTLREG2_DC_LOW_BW (1 << 27)
2908
2909 #define GEN7_L3CNTLREG3 0xb024
2910 # define GEN7_L3CNTLREG3_IS_ALLOC_SHIFT 1
2911 # define GEN7_L3CNTLREG3_IS_ALLOC_MASK INTEL_MASK(6, 1)
2912 # define GEN7_L3CNTLREG3_IS_LOW_BW (1 << 7)
2913 # define GEN7_L3CNTLREG3_C_ALLOC_SHIFT 8
2914 # define GEN7_L3CNTLREG3_C_ALLOC_MASK INTEL_MASK(13, 8)
2915 # define GEN7_L3CNTLREG3_C_LOW_BW (1 << 14)
2916 # define GEN7_L3CNTLREG3_T_ALLOC_SHIFT 15
2917 # define GEN7_L3CNTLREG3_T_ALLOC_MASK INTEL_MASK(20, 15)
2918 # define GEN7_L3CNTLREG3_T_LOW_BW (1 << 21)
2919
2920 #define HSW_SCRATCH1 0xb038
2921 #define HSW_SCRATCH1_L3_ATOMIC_DISABLE (1 << 27)
2922
2923 #define HSW_ROW_CHICKEN3 0xe49c
2924 #define HSW_ROW_CHICKEN3_L3_ATOMIC_DISABLE (1 << 6)
2925
2926 #define GEN8_L3CNTLREG 0x7034
2927 # define GEN8_L3CNTLREG_SLM_ENABLE (1 << 0)
2928 # define GEN8_L3CNTLREG_URB_ALLOC_SHIFT 1
2929 # define GEN8_L3CNTLREG_URB_ALLOC_MASK INTEL_MASK(7, 1)
2930 # define GEN8_L3CNTLREG_RO_ALLOC_SHIFT 11
2931 # define GEN8_L3CNTLREG_RO_ALLOC_MASK INTEL_MASK(17, 11)
2932 # define GEN8_L3CNTLREG_DC_ALLOC_SHIFT 18
2933 # define GEN8_L3CNTLREG_DC_ALLOC_MASK INTEL_MASK(24, 18)
2934 # define GEN8_L3CNTLREG_ALL_ALLOC_SHIFT 25
2935 # define GEN8_L3CNTLREG_ALL_ALLOC_MASK INTEL_MASK(31, 25)
2936
2937 #endif