spirv/nir: keep track of SPV_KHR_float_controls execution modes
[mesa.git] / src / compiler / shader_info.h
1 /*
2 * Copyright © 2016 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 *
23 */
24
25 #ifndef SHADER_INFO_H
26 #define SHADER_INFO_H
27
28 #include "shader_enums.h"
29 #include <stdint.h>
30
31 #ifdef __cplusplus
32 extern "C" {
33 #endif
34
/**
 * Set of boolean flags, one per SPIR-V capability or extension named by the
 * member.
 *
 * NOTE(review): judging by the struct name, a flag set to true means the
 * corresponding capability is supported by whoever fills the struct in —
 * confirm against the users of this struct.
 */
struct spirv_supported_capabilities {
   bool address;
   bool atomic_storage;
   bool demote_to_helper_invocation;
   bool derivative_group;
   bool descriptor_array_dynamic_indexing;
   bool descriptor_array_non_uniform_indexing;
   bool descriptor_indexing;
   bool device_group;
   bool draw_parameters;
   bool float64;
   bool fragment_shader_sample_interlock;
   bool fragment_shader_pixel_interlock;
   bool geometry_streams;
   bool image_ms_array;
   bool image_read_without_format;
   bool image_write_without_format;
   bool int8;
   bool int16;
   bool int64;
   bool int64_atomics;
   bool kernel;
   bool min_lod;
   bool multiview;
   bool physical_storage_buffer_address;
   bool post_depth_coverage;
   bool runtime_descriptor_array;
   bool float_controls;
   bool shader_viewport_index_layer;
   bool stencil_export;
   bool storage_8bit;
   bool storage_16bit;
   bool storage_image_ms;
   bool subgroup_arithmetic;
   bool subgroup_ballot;
   bool subgroup_basic;
   bool subgroup_quad;
   bool subgroup_shuffle;
   bool subgroup_vote;
   bool tessellation;
   bool transform_feedback;
   bool variable_pointers;
   bool float16;
   bool amd_gcn_shader;
   bool amd_shader_ballot;
   bool amd_trinary_minmax;
};
82
83 typedef struct shader_info {
84 const char *name;
85
86 /* Descriptive name provided by the client; may be NULL */
87 const char *label;
88
89 /** The shader stage, such as MESA_SHADER_VERTEX. */
90 gl_shader_stage stage;
91
92 /** The shader stage in a non SSO linked program that follows this stage,
93 * such as MESA_SHADER_FRAGMENT.
94 */
95 gl_shader_stage next_stage;
96
97 /* Number of textures used by this shader */
98 unsigned num_textures;
99 /* Number of uniform buffers used by this shader */
100 unsigned num_ubos;
101 /* Number of atomic buffers used by this shader */
102 unsigned num_abos;
103 /* Number of shader storage buffers used by this shader */
104 unsigned num_ssbos;
105 /* Number of images used by this shader */
106 unsigned num_images;
107
108 /* Which inputs are actually read */
109 uint64_t inputs_read;
110 /* Which outputs are actually written */
111 uint64_t outputs_written;
112 /* Which outputs are actually read */
113 uint64_t outputs_read;
114 /* Which system values are actually read */
115 uint64_t system_values_read;
116
117 /* Which patch inputs are actually read */
118 uint32_t patch_inputs_read;
119 /* Which patch outputs are actually written */
120 uint32_t patch_outputs_written;
121 /* Which patch outputs are read */
122 uint32_t patch_outputs_read;
123
124 /* Whether or not this shader ever uses textureGather() */
125 bool uses_texture_gather;
126
127 /** Bitfield of which textures are used */
128 uint32_t textures_used;
129
130 /** Bitfield of which textures are used by texelFetch() */
131 uint32_t textures_used_by_txf;
132
133 /**
134 * True if this shader uses the fddx/fddy opcodes.
135 *
136 * Note that this does not include the "fine" and "coarse" variants.
137 */
138 bool uses_fddx_fddy;
139
140 /**
141 * True if this shader uses 64-bit ALU operations
142 */
143 bool uses_64bit;
144
145 /* The size of the gl_ClipDistance[] array, if declared. */
146 unsigned clip_distance_array_size;
147
148 /* The size of the gl_CullDistance[] array, if declared. */
149 unsigned cull_distance_array_size;
150
151 /* Whether or not separate shader objects were used */
152 bool separate_shader;
153
154 /** Was this shader linked with any transform feedback varyings? */
155 bool has_transform_feedback_varyings;
156
157 /* SPV_KHR_float_controls: execution mode for floating point ops */
158 unsigned float_controls_execution_mode;
159
160 union {
161 struct {
162 /* Which inputs are doubles */
163 uint64_t double_inputs;
164
165 /* For AMD-specific driver-internal shaders. It replaces vertex
166 * buffer loads with code generating VS inputs from scalar registers.
167 *
168 * Valid values: SI_VS_BLIT_SGPRS_POS_*
169 */
170 unsigned blit_sgprs_amd;
171
172 /* True if the shader writes position in window space coordinates pre-transform */
173 bool window_space_position;
174 } vs;
175
176 struct {
177 /** The number of vertices recieves per input primitive */
178 unsigned vertices_in;
179
180 /** The output primitive type (GL enum value) */
181 unsigned output_primitive;
182
183 /** The input primitive type (GL enum value) */
184 unsigned input_primitive;
185
186 /** The maximum number of vertices the geometry shader might write. */
187 unsigned vertices_out;
188
189 /** 1 .. MAX_GEOMETRY_SHADER_INVOCATIONS */
190 unsigned invocations;
191
192 /** Whether or not this shader uses EndPrimitive */
193 bool uses_end_primitive;
194
195 /** Whether or not this shader uses non-zero streams */
196 bool uses_streams;
197 } gs;
198
199 struct {
200 bool uses_discard;
201
202 /**
203 * True if this fragment shader requires helper invocations. This
204 * can be caused by the use of ALU derivative ops, texture
205 * instructions which do implicit derivatives, and the use of quad
206 * subgroup operations.
207 */
208 bool needs_helper_invocations;
209
210 /**
211 * Whether any inputs are declared with the "sample" qualifier.
212 */
213 bool uses_sample_qualifier;
214
215 /**
216 * Whether early fragment tests are enabled as defined by
217 * ARB_shader_image_load_store.
218 */
219 bool early_fragment_tests;
220
221 /**
222 * Defined by INTEL_conservative_rasterization.
223 */
224 bool inner_coverage;
225
226 bool post_depth_coverage;
227
228 /**
229 * \name ARB_fragment_coord_conventions
230 * @{
231 */
232 bool pixel_center_integer;
233 bool origin_upper_left;
234 /*@}*/
235
236 bool pixel_interlock_ordered;
237 bool pixel_interlock_unordered;
238 bool sample_interlock_ordered;
239 bool sample_interlock_unordered;
240
241 /**
242 * Flags whether NIR's base types on the FS color outputs should be
243 * ignored.
244 *
245 * GLSL requires that fragment shader output base types match the
246 * render target's base types for the behavior to be defined. From
247 * the GL 4.6 spec:
248 *
249 * "If the values written by the fragment shader do not match the
250 * format(s) of the corresponding color buffer(s), the result is
251 * undefined."
252 *
253 * However, for NIR shaders translated from TGSI, we don't have the
254 * output types any more, so the driver will need to do whatever
255 * fixups are necessary to handle effectively untyped data being
256 * output from the FS.
257 */
258 bool untyped_color_outputs;
259
260 /** gl_FragDepth layout for ARB_conservative_depth. */
261 enum gl_frag_depth_layout depth_layout;
262 } fs;
263
264 struct {
265 unsigned local_size[3];
266
267 bool local_size_variable;
268 char user_data_components_amd;
269
270 /**
271 * Size of shared variables accessed by the compute shader.
272 */
273 unsigned shared_size;
274
275
276 /**
277 * pointer size is:
278 * AddressingModelLogical: 0 (default)
279 * AddressingModelPhysical32: 32
280 * AddressingModelPhysical64: 64
281 */
282 unsigned ptr_size;
283
284 /*
285 * Arrangement of invocations used to calculate derivatives in a compute
286 * shader. From NV_compute_shader_derivatives.
287 */
288 enum gl_derivative_group derivative_group;
289 } cs;
290
291 /* Applies to both TCS and TES. */
292 struct {
293 /** The number of vertices in the TCS output patch. */
294 unsigned tcs_vertices_out;
295
296 uint32_t primitive_mode; /* GL_TRIANGLES, GL_QUADS or GL_ISOLINES */
297 enum gl_tess_spacing spacing;
298 /** Is the vertex order counterclockwise? */
299 bool ccw;
300 bool point_mode;
301 } tess;
302 };
303 } shader_info;
304
305 #ifdef __cplusplus
306 }
307 #endif
308
309 #endif /* SHADER_INFO_H */