st/glsl_to_nir: copy nir compiler options to context
[mesa.git] / src / mesa / state_tracker / st_extensions.c
1 /**************************************************************************
2 *
3 * Copyright 2007 VMware, Inc.
4 * Copyright (c) 2008 VMware, Inc.
5 * All Rights Reserved.
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining a
8 * copy of this software and associated documentation files (the
9 * "Software"), to deal in the Software without restriction, including
10 * without limitation the rights to use, copy, modify, merge, publish,
11 * distribute, sub license, and/or sell copies of the Software, and to
12 * permit persons to whom the Software is furnished to do so, subject to
13 * the following conditions:
14 *
15 * The above copyright notice and this permission notice (including the
16 * next paragraph) shall be included in all copies or substantial portions
17 * of the Software.
18 *
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
20 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
21 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
22 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
23 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
24 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
25 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 *
27 **************************************************************************/
28
29 #include "compiler/nir/nir.h"
30
31 #include "main/imports.h"
32 #include "main/context.h"
33 #include "main/macros.h"
34 #include "main/version.h"
35
36 #include "pipe/p_context.h"
37 #include "pipe/p_defines.h"
38 #include "pipe/p_screen.h"
39 #include "util/u_math.h"
40
41 #include "st_context.h"
42 #include "st_debug.h"
43 #include "st_extensions.h"
44 #include "st_format.h"
45
46
/*
 * Note: we use these functions rather than the MIN2, MAX2, CLAMP macros to
 * avoid evaluating arguments (which are often function calls) more than once.
 */
51
/** Return the smaller of \c a and \c b; each argument is evaluated once. */
static unsigned _min(unsigned a, unsigned b)
{
   if (b <= a)
      return b;

   return a;
}
56
/** Return the larger of \c a and \c b; each argument is evaluated once. */
static float _maxf(float a, float b)
{
   /* Keep the "a > b" test as-is so unordered (NaN) inputs still yield b. */
   if (a > b)
      return a;

   return b;
}
61
/**
 * Limit \c a to the range [\c min, \c max].  The lower bound is tested
 * first, so \c min is returned whenever \c a is below it.
 */
static int _clamp(int a, int min, int max)
{
   return (a < min) ? min
        : (a > max) ? max
        : a;
}
71
72
73 /**
74 * Query driver to get implementation limits.
75 * Note that we have to limit/clamp against Mesa's internal limits too.
76 */
77 void st_init_limits(struct pipe_screen *screen,
78 struct gl_constants *c, struct gl_extensions *extensions)
79 {
80 int supported_irs;
81 unsigned sh;
82 boolean can_ubo = TRUE;
83 int temp;
84 bool ssbo_atomic = true;
85
86 c->MaxTextureLevels
87 = _min(screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_2D_LEVELS),
88 MAX_TEXTURE_LEVELS);
89
90 c->Max3DTextureLevels
91 = _min(screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_3D_LEVELS),
92 MAX_3D_TEXTURE_LEVELS);
93
94 c->MaxCubeTextureLevels
95 = _min(screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS),
96 MAX_CUBE_TEXTURE_LEVELS);
97
98 c->MaxTextureRectSize
99 = _min(1 << (c->MaxTextureLevels - 1), MAX_TEXTURE_RECT_SIZE);
100
101 c->MaxArrayTextureLayers
102 = screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS);
103
104 /* Define max viewport size and max renderbuffer size in terms of
105 * max texture size (note: max tex RECT size = max tex 2D size).
106 * If this isn't true for some hardware we'll need new PIPE_CAP_ queries.
107 */
108 c->MaxViewportWidth =
109 c->MaxViewportHeight =
110 c->MaxRenderbufferSize = c->MaxTextureRectSize;
111
112 c->ViewportSubpixelBits =
113 screen->get_param(screen, PIPE_CAP_VIEWPORT_SUBPIXEL_BITS);
114
115 c->MaxDrawBuffers = c->MaxColorAttachments =
116 _clamp(screen->get_param(screen, PIPE_CAP_MAX_RENDER_TARGETS),
117 1, MAX_DRAW_BUFFERS);
118
119 c->MaxDualSourceDrawBuffers =
120 _clamp(screen->get_param(screen,
121 PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS),
122 0, MAX_DRAW_BUFFERS);
123
124 c->MaxLineWidth =
125 _maxf(1.0f, screen->get_paramf(screen, PIPE_CAPF_MAX_LINE_WIDTH));
126 c->MaxLineWidthAA =
127 _maxf(1.0f, screen->get_paramf(screen, PIPE_CAPF_MAX_LINE_WIDTH_AA));
128
129 c->MaxPointSize =
130 _maxf(1.0f, screen->get_paramf(screen, PIPE_CAPF_MAX_POINT_WIDTH));
131 c->MaxPointSizeAA =
132 _maxf(1.0f, screen->get_paramf(screen, PIPE_CAPF_MAX_POINT_WIDTH_AA));
133
134 /* these are not queryable. Note that GL basically mandates a 1.0 minimum
135 * for non-aa sizes, but we can go down to 0.0 for aa points.
136 */
137 c->MinPointSize = 1.0f;
138 c->MinPointSizeAA = 0.0f;
139
140 c->MaxTextureMaxAnisotropy =
141 _maxf(2.0f,
142 screen->get_paramf(screen, PIPE_CAPF_MAX_TEXTURE_ANISOTROPY));
143
144 c->MaxTextureLodBias =
145 screen->get_paramf(screen, PIPE_CAPF_MAX_TEXTURE_LOD_BIAS);
146
147 c->QuadsFollowProvokingVertexConvention =
148 screen->get_param(screen,
149 PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION);
150
151 c->MaxUniformBlockSize =
152 screen->get_shader_param(screen, PIPE_SHADER_FRAGMENT,
153 PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE);
154 if (c->MaxUniformBlockSize < 16384) {
155 can_ubo = FALSE;
156 }
157
158 for (sh = 0; sh < PIPE_SHADER_TYPES; ++sh) {
159 struct gl_shader_compiler_options *options;
160 struct gl_program_constants *pc;
161 const nir_shader_compiler_options *nir_options = NULL;
162
163 if (screen->get_compiler_options) {
164 nir_options = (const nir_shader_compiler_options *)
165 screen->get_compiler_options(screen, PIPE_SHADER_IR_NIR, sh);
166 }
167
168 switch (sh) {
169 case PIPE_SHADER_FRAGMENT:
170 pc = &c->Program[MESA_SHADER_FRAGMENT];
171 options = &c->ShaderCompilerOptions[MESA_SHADER_FRAGMENT];
172 c->ShaderCompilerOptions[MESA_SHADER_FRAGMENT].NirOptions =
173 nir_options;
174 break;
175 case PIPE_SHADER_VERTEX:
176 pc = &c->Program[MESA_SHADER_VERTEX];
177 options = &c->ShaderCompilerOptions[MESA_SHADER_VERTEX];
178 c->ShaderCompilerOptions[MESA_SHADER_VERTEX].NirOptions =
179 nir_options;
180 break;
181 case PIPE_SHADER_GEOMETRY:
182 pc = &c->Program[MESA_SHADER_GEOMETRY];
183 options = &c->ShaderCompilerOptions[MESA_SHADER_GEOMETRY];
184 c->ShaderCompilerOptions[MESA_SHADER_GEOMETRY].NirOptions =
185 nir_options;
186 break;
187 case PIPE_SHADER_TESS_CTRL:
188 pc = &c->Program[MESA_SHADER_TESS_CTRL];
189 options = &c->ShaderCompilerOptions[MESA_SHADER_TESS_CTRL];
190 c->ShaderCompilerOptions[MESA_SHADER_TESS_CTRL].NirOptions =
191 nir_options;
192 break;
193 case PIPE_SHADER_TESS_EVAL:
194 pc = &c->Program[MESA_SHADER_TESS_EVAL];
195 options = &c->ShaderCompilerOptions[MESA_SHADER_TESS_EVAL];
196 c->ShaderCompilerOptions[MESA_SHADER_TESS_EVAL].NirOptions =
197 nir_options;
198 break;
199 case PIPE_SHADER_COMPUTE:
200 pc = &c->Program[MESA_SHADER_COMPUTE];
201 options = &c->ShaderCompilerOptions[MESA_SHADER_COMPUTE];
202 c->ShaderCompilerOptions[MESA_SHADER_COMPUTE].NirOptions =
203 nir_options;
204
205 if (!screen->get_param(screen, PIPE_CAP_COMPUTE))
206 continue;
207 supported_irs =
208 screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_SUPPORTED_IRS);
209 if (!(supported_irs & (1 << PIPE_SHADER_IR_TGSI)))
210 continue;
211 break;
212 default:
213 assert(0);
214 }
215
216 pc->MaxTextureImageUnits =
217 _min(screen->get_shader_param(screen, sh,
218 PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS),
219 MAX_TEXTURE_IMAGE_UNITS);
220
221 pc->MaxInstructions =
222 pc->MaxNativeInstructions =
223 screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_INSTRUCTIONS);
224 pc->MaxAluInstructions =
225 pc->MaxNativeAluInstructions =
226 screen->get_shader_param(screen, sh,
227 PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS);
228 pc->MaxTexInstructions =
229 pc->MaxNativeTexInstructions =
230 screen->get_shader_param(screen, sh,
231 PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS);
232 pc->MaxTexIndirections =
233 pc->MaxNativeTexIndirections =
234 screen->get_shader_param(screen, sh,
235 PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS);
236 pc->MaxAttribs =
237 pc->MaxNativeAttribs =
238 screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_INPUTS);
239 pc->MaxTemps =
240 pc->MaxNativeTemps =
241 screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_TEMPS);
242 pc->MaxAddressRegs =
243 pc->MaxNativeAddressRegs = sh == PIPE_SHADER_VERTEX ? 1 : 0;
244 pc->MaxParameters =
245 pc->MaxNativeParameters =
246 screen->get_shader_param(screen, sh,
247 PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE) / sizeof(float[4]);
248 pc->MaxInputComponents =
249 screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_INPUTS) * 4;
250 pc->MaxOutputComponents =
251 screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_OUTPUTS) * 4;
252
253 pc->MaxUniformComponents =
254 4 * MIN2(pc->MaxNativeParameters, MAX_UNIFORMS);
255
256 pc->MaxUniformBlocks =
257 screen->get_shader_param(screen, sh,
258 PIPE_SHADER_CAP_MAX_CONST_BUFFERS);
259 if (pc->MaxUniformBlocks)
260 pc->MaxUniformBlocks -= 1; /* The first one is for ordinary uniforms. */
261 pc->MaxUniformBlocks = _min(pc->MaxUniformBlocks, MAX_UNIFORM_BUFFERS);
262
263 pc->MaxCombinedUniformComponents = (pc->MaxUniformComponents +
264 c->MaxUniformBlockSize / 4 *
265 pc->MaxUniformBlocks);
266
267 temp = screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS);
268 if (temp) {
269 /*
270 * for separate atomic counters get the actual hw limits
271 * per stage on atomic counters and buffers
272 */
273 ssbo_atomic = false;
274 pc->MaxAtomicCounters = temp;
275 pc->MaxAtomicBuffers = screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS);
276 pc->MaxShaderStorageBlocks = screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_SHADER_BUFFERS);
277 } else {
278 pc->MaxAtomicCounters = MAX_ATOMIC_COUNTERS;
279 pc->MaxAtomicBuffers = screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_SHADER_BUFFERS) / 2;
280 pc->MaxShaderStorageBlocks = pc->MaxAtomicBuffers;
281 }
282 pc->MaxImageUniforms = screen->get_shader_param(
283 screen, sh, PIPE_SHADER_CAP_MAX_SHADER_IMAGES);
284
285 /* Gallium doesn't really care about local vs. env parameters so use the
286 * same limits.
287 */
288 pc->MaxLocalParams = MIN2(pc->MaxParameters, MAX_PROGRAM_LOCAL_PARAMS);
289 pc->MaxEnvParams = MIN2(pc->MaxParameters, MAX_PROGRAM_ENV_PARAMS);
290
291 if (screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_INTEGERS)) {
292 pc->LowInt.RangeMin = 31;
293 pc->LowInt.RangeMax = 30;
294 pc->LowInt.Precision = 0;
295 pc->MediumInt = pc->HighInt = pc->LowInt;
296 }
297
298 /* TODO: make these more fine-grained if anyone needs it */
299 options->MaxIfDepth =
300 screen->get_shader_param(screen, sh,
301 PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH);
302 options->EmitNoLoops =
303 !screen->get_shader_param(screen, sh,
304 PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH);
305 options->EmitNoMainReturn =
306 !screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_SUBROUTINES);
307
308 options->EmitNoCont =
309 !screen->get_shader_param(screen, sh,
310 PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED);
311
312 options->EmitNoIndirectInput =
313 !screen->get_shader_param(screen, sh,
314 PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR);
315 options->EmitNoIndirectOutput =
316 !screen->get_shader_param(screen, sh,
317 PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR);
318 options->EmitNoIndirectTemp =
319 !screen->get_shader_param(screen, sh,
320 PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR);
321 options->EmitNoIndirectUniform =
322 !screen->get_shader_param(screen, sh,
323 PIPE_SHADER_CAP_INDIRECT_CONST_ADDR);
324
325 if (pc->MaxNativeInstructions &&
326 (options->EmitNoIndirectUniform || pc->MaxUniformBlocks < 12)) {
327 can_ubo = FALSE;
328 }
329
330 if (options->EmitNoLoops)
331 options->MaxUnrollIterations =
332 MIN2(screen->get_shader_param(screen, sh,
333 PIPE_SHADER_CAP_MAX_INSTRUCTIONS),
334 65536);
335 else
336 options->MaxUnrollIterations =
337 screen->get_shader_param(screen, sh,
338 PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT);
339
340 options->LowerCombinedClipCullDistance = true;
341 options->LowerBufferInterfaceBlocks = true;
342 }
343
344 c->GLSLOptimizeConservatively =
345 screen->get_param(screen, PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY);
346 c->LowerTessLevel = true;
347 c->LowerCsDerivedVariables = true;
348 c->PrimitiveRestartForPatches =
349 screen->get_param(screen, PIPE_CAP_PRIMITIVE_RESTART_FOR_PATCHES);
350
351 c->MaxCombinedTextureImageUnits =
352 _min(c->Program[MESA_SHADER_VERTEX].MaxTextureImageUnits +
353 c->Program[MESA_SHADER_TESS_CTRL].MaxTextureImageUnits +
354 c->Program[MESA_SHADER_TESS_EVAL].MaxTextureImageUnits +
355 c->Program[MESA_SHADER_GEOMETRY].MaxTextureImageUnits +
356 c->Program[MESA_SHADER_FRAGMENT].MaxTextureImageUnits +
357 c->Program[MESA_SHADER_COMPUTE].MaxTextureImageUnits,
358 MAX_COMBINED_TEXTURE_IMAGE_UNITS);
359
360 /* This depends on program constants. */
361 c->MaxTextureCoordUnits
362 = _min(c->Program[MESA_SHADER_FRAGMENT].MaxTextureImageUnits,
363 MAX_TEXTURE_COORD_UNITS);
364
365 c->MaxTextureUnits =
366 _min(c->Program[MESA_SHADER_FRAGMENT].MaxTextureImageUnits,
367 c->MaxTextureCoordUnits);
368
369 c->Program[MESA_SHADER_VERTEX].MaxAttribs =
370 MIN2(c->Program[MESA_SHADER_VERTEX].MaxAttribs, 16);
371
372 /* PIPE_SHADER_CAP_MAX_INPUTS for the FS specifies the maximum number
373 * of inputs. It's always 2 colors + N generic inputs. */
374 c->MaxVarying = screen->get_shader_param(screen, PIPE_SHADER_FRAGMENT,
375 PIPE_SHADER_CAP_MAX_INPUTS);
376 c->MaxVarying = MIN2(c->MaxVarying, MAX_VARYING);
377 c->MaxGeometryOutputVertices =
378 screen->get_param(screen, PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES);
379 c->MaxGeometryTotalOutputComponents =
380 screen->get_param(screen, PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS);
381 c->MaxTessPatchComponents =
382 MIN2(screen->get_param(screen, PIPE_CAP_MAX_SHADER_PATCH_VARYINGS),
383 MAX_VARYING) * 4;
384
385 c->MinProgramTexelOffset =
386 screen->get_param(screen, PIPE_CAP_MIN_TEXEL_OFFSET);
387 c->MaxProgramTexelOffset =
388 screen->get_param(screen, PIPE_CAP_MAX_TEXEL_OFFSET);
389
390 c->MaxProgramTextureGatherComponents =
391 screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS);
392 c->MinProgramTextureGatherOffset =
393 screen->get_param(screen, PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET);
394 c->MaxProgramTextureGatherOffset =
395 screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET);
396
397 c->MaxTransformFeedbackBuffers =
398 screen->get_param(screen, PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS);
399 c->MaxTransformFeedbackBuffers = MIN2(c->MaxTransformFeedbackBuffers,
400 MAX_FEEDBACK_BUFFERS);
401 c->MaxTransformFeedbackSeparateComponents =
402 screen->get_param(screen, PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS);
403 c->MaxTransformFeedbackInterleavedComponents =
404 screen->get_param(screen,
405 PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS);
406 c->MaxVertexStreams =
407 MAX2(1, screen->get_param(screen, PIPE_CAP_MAX_VERTEX_STREAMS));
408
409 /* The vertex stream must fit into pipe_stream_output_info::stream */
410 assert(c->MaxVertexStreams <= 4);
411
412 c->MaxVertexAttribStride
413 = screen->get_param(screen, PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE);
414
415 c->StripTextureBorder = GL_TRUE;
416
417 c->GLSLSkipStrictMaxUniformLimitCheck =
418 screen->get_param(screen, PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS);
419
420 c->UniformBufferOffsetAlignment =
421 screen->get_param(screen, PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT);
422
423 if (can_ubo) {
424 extensions->ARB_uniform_buffer_object = GL_TRUE;
425 c->MaxCombinedUniformBlocks = c->MaxUniformBufferBindings =
426 c->Program[MESA_SHADER_VERTEX].MaxUniformBlocks +
427 c->Program[MESA_SHADER_TESS_CTRL].MaxUniformBlocks +
428 c->Program[MESA_SHADER_TESS_EVAL].MaxUniformBlocks +
429 c->Program[MESA_SHADER_GEOMETRY].MaxUniformBlocks +
430 c->Program[MESA_SHADER_FRAGMENT].MaxUniformBlocks +
431 c->Program[MESA_SHADER_COMPUTE].MaxUniformBlocks;
432 assert(c->MaxCombinedUniformBlocks <= MAX_COMBINED_UNIFORM_BUFFERS);
433 }
434
435 c->GLSLFragCoordIsSysVal =
436 screen->get_param(screen, PIPE_CAP_TGSI_FS_POSITION_IS_SYSVAL);
437 c->GLSLFrontFacingIsSysVal =
438 screen->get_param(screen, PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL);
439
440 /* GL_ARB_get_program_binary */
441 if (screen->get_disk_shader_cache && screen->get_disk_shader_cache(screen))
442 c->NumProgramBinaryFormats = 1;
443
444 c->MaxAtomicBufferBindings =
445 c->Program[MESA_SHADER_FRAGMENT].MaxAtomicBuffers;
446
447 if (!ssbo_atomic) {
448 /* for separate atomic buffers - there atomic buffer size will be
449 limited */
450 c->MaxAtomicBufferSize = c->Program[MESA_SHADER_FRAGMENT].MaxAtomicCounters * ATOMIC_COUNTER_SIZE;
451 /* on all HW with separate atomic (evergreen) the following
452 lines are true. not sure it's worth adding CAPs for this at this
453 stage. */
454 c->MaxCombinedAtomicCounters = c->Program[MESA_SHADER_FRAGMENT].MaxAtomicCounters;
455 c->MaxCombinedAtomicBuffers = c->Program[MESA_SHADER_FRAGMENT].MaxAtomicBuffers;
456 } else {
457 c->MaxCombinedAtomicBuffers =
458 c->Program[MESA_SHADER_VERTEX].MaxAtomicBuffers +
459 c->Program[MESA_SHADER_TESS_CTRL].MaxAtomicBuffers +
460 c->Program[MESA_SHADER_TESS_EVAL].MaxAtomicBuffers +
461 c->Program[MESA_SHADER_GEOMETRY].MaxAtomicBuffers +
462 c->Program[MESA_SHADER_FRAGMENT].MaxAtomicBuffers;
463 assert(c->MaxCombinedAtomicBuffers <= MAX_COMBINED_ATOMIC_BUFFERS);
464 }
465
466 if (c->MaxCombinedAtomicBuffers > 0) {
467 extensions->ARB_shader_atomic_counters = GL_TRUE;
468 extensions->ARB_shader_atomic_counter_ops = GL_TRUE;
469 }
470
471 c->MaxCombinedShaderOutputResources = c->MaxDrawBuffers;
472 c->ShaderStorageBufferOffsetAlignment =
473 screen->get_param(screen, PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT);
474 if (c->ShaderStorageBufferOffsetAlignment) {
475 /* for hw atomic counters leaves these at default for now */
476 if (ssbo_atomic)
477 c->MaxCombinedShaderStorageBlocks = c->MaxShaderStorageBufferBindings =
478 c->MaxCombinedAtomicBuffers;
479 c->MaxCombinedShaderOutputResources +=
480 c->MaxCombinedShaderStorageBlocks;
481 c->MaxShaderStorageBlockSize = 1 << 27;
482 extensions->ARB_shader_storage_buffer_object = GL_TRUE;
483 }
484
485 c->MaxCombinedImageUniforms =
486 c->Program[MESA_SHADER_VERTEX].MaxImageUniforms +
487 c->Program[MESA_SHADER_TESS_CTRL].MaxImageUniforms +
488 c->Program[MESA_SHADER_TESS_EVAL].MaxImageUniforms +
489 c->Program[MESA_SHADER_GEOMETRY].MaxImageUniforms +
490 c->Program[MESA_SHADER_FRAGMENT].MaxImageUniforms +
491 c->Program[MESA_SHADER_COMPUTE].MaxImageUniforms;
492 c->MaxCombinedShaderOutputResources += c->MaxCombinedImageUniforms;
493 c->MaxImageUnits = MAX_IMAGE_UNITS;
494 if (c->MaxCombinedImageUniforms) {
495 extensions->ARB_shader_image_load_store = GL_TRUE;
496 extensions->ARB_shader_image_size = GL_TRUE;
497 }
498
499 /* ARB_framebuffer_no_attachments */
500 c->MaxFramebufferWidth = c->MaxViewportWidth;
501 c->MaxFramebufferHeight = c->MaxViewportHeight;
502 /* NOTE: we cheat here a little by assuming that
503 * PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS has the same
504 * number of layers as we need, although we technically
505 * could have more the generality is not really useful
506 * in practicality.
507 */
508 c->MaxFramebufferLayers =
509 screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS);
510
511 c->MaxWindowRectangles =
512 screen->get_param(screen, PIPE_CAP_MAX_WINDOW_RECTANGLES);
513
514 c->SparseBufferPageSize =
515 screen->get_param(screen, PIPE_CAP_SPARSE_BUFFER_PAGE_SIZE);
516
517 c->AllowMappedBuffersDuringExecution =
518 screen->get_param(screen, PIPE_CAP_ALLOW_MAPPED_BUFFERS_DURING_EXECUTION);
519
520 c->UseSTD430AsDefaultPacking =
521 screen->get_param(screen, PIPE_CAP_LOAD_CONSTBUF);
522
523 /* limit the max combined shader output resources to a driver limit */
524 temp = screen->get_param(screen, PIPE_CAP_MAX_COMBINED_SHADER_OUTPUT_RESOURCES);
525 if (temp > 0 && c->MaxCombinedShaderOutputResources > temp)
526 c->MaxCombinedShaderOutputResources = temp;
527 }
528
529
/**
 * Shorthand for the byte offset of member \c x inside struct gl_extensions.
 */
#define o(x) offsetof(struct gl_extensions, x)
535
536
/**
 * Pairs one extension flag with a PIPE_CAP_ value.
 */
struct st_extension_cap_mapping {
   int extension_offset;   /* byte offset of the flag in struct gl_extensions */
   int cap;                /* PIPE_CAP_ value associated with the extension */
};
541
542 struct st_extension_format_mapping {
543 int extension_offset[2];
544 enum pipe_format format[32];
545
546 /* If TRUE, at least one format must be supported for the extensions to be
547 * advertised. If FALSE, all the formats must be supported. */
548 GLboolean need_at_least_one;
549 };
550
551 /**
552 * Enable extensions if certain pipe formats are supported by the driver.
553 * What extensions will be enabled and what formats must be supported is
554 * described by the array of st_extension_format_mapping.
555 *
556 * target and bind_flags are passed to is_format_supported.
557 */
558 static void
559 init_format_extensions(struct pipe_screen *screen,
560 struct gl_extensions *extensions,
561 const struct st_extension_format_mapping *mapping,
562 unsigned num_mappings,
563 enum pipe_texture_target target,
564 unsigned bind_flags)
565 {
566 GLboolean *extension_table = (GLboolean *) extensions;
567 unsigned i;
568 int j;
569 int num_formats = ARRAY_SIZE(mapping->format);
570 int num_ext = ARRAY_SIZE(mapping->extension_offset);
571
572 for (i = 0; i < num_mappings; i++) {
573 int num_supported = 0;
574
575 /* Examine each format in the list. */
576 for (j = 0; j < num_formats && mapping[i].format[j]; j++) {
577 if (screen->is_format_supported(screen, mapping[i].format[j],
578 target, 0, bind_flags)) {
579 num_supported++;
580 }
581 }
582
583 if (!num_supported ||
584 (!mapping[i].need_at_least_one && num_supported != j)) {
585 continue;
586 }
587
588 /* Enable all extensions in the list. */
589 for (j = 0; j < num_ext && mapping[i].extension_offset[j]; j++)
590 extension_table[mapping[i].extension_offset[j]] = GL_TRUE;
591 }
592 }
593
594
595 /**
596 * Given a list of formats and bind flags, return the maximum number
597 * of samples supported by any of those formats.
598 */
599 static unsigned
600 get_max_samples_for_formats(struct pipe_screen *screen,
601 unsigned num_formats,
602 const enum pipe_format *formats,
603 unsigned max_samples,
604 unsigned bind)
605 {
606 unsigned i, f;
607
608 for (i = max_samples; i > 0; --i) {
609 for (f = 0; f < num_formats; f++) {
610 if (screen->is_format_supported(screen, formats[f],
611 PIPE_TEXTURE_2D, i, bind)) {
612 return i;
613 }
614 }
615 }
616 return 0;
617 }
618
619
620 /**
621 * Use pipe_screen::get_param() to query PIPE_CAP_ values to determine
622 * which GL extensions are supported.
623 * Quite a few extensions are always supported because they are standard
624 * features or can be built on top of other gallium features.
625 * Some fine tuning may still be needed.
626 */
627 void st_init_extensions(struct pipe_screen *screen,
628 struct gl_constants *consts,
629 struct gl_extensions *extensions,
630 struct st_config_options *options,
631 gl_api api)
632 {
633 unsigned i;
634 GLboolean *extension_table = (GLboolean *) extensions;
635
636 static const struct st_extension_cap_mapping cap_mapping[] = {
637 { o(ARB_base_instance), PIPE_CAP_START_INSTANCE },
638 { o(ARB_bindless_texture), PIPE_CAP_BINDLESS_TEXTURE },
639 { o(ARB_buffer_storage), PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT },
640 { o(ARB_clear_texture), PIPE_CAP_CLEAR_TEXTURE },
641 { o(ARB_clip_control), PIPE_CAP_CLIP_HALFZ },
642 { o(ARB_color_buffer_float), PIPE_CAP_VERTEX_COLOR_UNCLAMPED },
643 { o(ARB_conditional_render_inverted), PIPE_CAP_CONDITIONAL_RENDER_INVERTED },
644 { o(ARB_copy_image), PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS },
645 { o(OES_copy_image), PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS },
646 { o(ARB_cull_distance), PIPE_CAP_CULL_DISTANCE },
647 { o(ARB_depth_clamp), PIPE_CAP_DEPTH_CLIP_DISABLE },
648 { o(ARB_derivative_control), PIPE_CAP_TGSI_FS_FINE_DERIVATIVE },
649 { o(ARB_draw_buffers_blend), PIPE_CAP_INDEP_BLEND_FUNC },
650 { o(ARB_draw_indirect), PIPE_CAP_DRAW_INDIRECT },
651 { o(ARB_draw_instanced), PIPE_CAP_TGSI_INSTANCEID },
652 { o(ARB_framebuffer_object), PIPE_CAP_MIXED_FRAMEBUFFER_SIZES },
653 { o(ARB_gpu_shader_int64), PIPE_CAP_INT64 },
654 { o(ARB_indirect_parameters), PIPE_CAP_MULTI_DRAW_INDIRECT_PARAMS },
655 { o(ARB_instanced_arrays), PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR },
656 { o(ARB_occlusion_query), PIPE_CAP_OCCLUSION_QUERY },
657 { o(ARB_occlusion_query2), PIPE_CAP_OCCLUSION_QUERY },
658 { o(ARB_pipeline_statistics_query), PIPE_CAP_QUERY_PIPELINE_STATISTICS },
659 { o(ARB_point_sprite), PIPE_CAP_POINT_SPRITE },
660 { o(ARB_polygon_offset_clamp), PIPE_CAP_POLYGON_OFFSET_CLAMP },
661 { o(ARB_post_depth_coverage), PIPE_CAP_POST_DEPTH_COVERAGE },
662 { o(ARB_query_buffer_object), PIPE_CAP_QUERY_BUFFER_OBJECT },
663 { o(ARB_robust_buffer_access_behavior), PIPE_CAP_ROBUST_BUFFER_ACCESS_BEHAVIOR },
664 { o(ARB_sample_shading), PIPE_CAP_SAMPLE_SHADING },
665 { o(ARB_seamless_cube_map), PIPE_CAP_SEAMLESS_CUBE_MAP },
666 { o(ARB_shader_ballot), PIPE_CAP_TGSI_BALLOT },
667 { o(ARB_shader_clock), PIPE_CAP_TGSI_CLOCK },
668 { o(ARB_shader_draw_parameters), PIPE_CAP_DRAW_PARAMETERS },
669 { o(ARB_shader_group_vote), PIPE_CAP_TGSI_VOTE },
670 { o(ARB_shader_stencil_export), PIPE_CAP_SHADER_STENCIL_EXPORT },
671 { o(ARB_shader_texture_image_samples), PIPE_CAP_TGSI_TXQS },
672 { o(ARB_shader_texture_lod), PIPE_CAP_SM3 },
673 { o(ARB_sparse_buffer), PIPE_CAP_SPARSE_BUFFER_PAGE_SIZE },
674 { o(ARB_texture_buffer_object), PIPE_CAP_TEXTURE_BUFFER_OBJECTS },
675 { o(ARB_texture_cube_map_array), PIPE_CAP_CUBE_MAP_ARRAY },
676 { o(ARB_texture_gather), PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS },
677 { o(ARB_texture_mirror_clamp_to_edge), PIPE_CAP_TEXTURE_MIRROR_CLAMP },
678 { o(ARB_texture_multisample), PIPE_CAP_TEXTURE_MULTISAMPLE },
679 { o(ARB_texture_non_power_of_two), PIPE_CAP_NPOT_TEXTURES },
680 { o(ARB_texture_query_lod), PIPE_CAP_TEXTURE_QUERY_LOD },
681 { o(ARB_texture_view), PIPE_CAP_SAMPLER_VIEW_TARGET },
682 { o(ARB_timer_query), PIPE_CAP_QUERY_TIMESTAMP },
683 { o(ARB_transform_feedback2), PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME },
684 { o(ARB_transform_feedback3), PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS },
685 { o(ARB_transform_feedback_overflow_query), PIPE_CAP_QUERY_SO_OVERFLOW },
686
687 { o(KHR_blend_equation_advanced), PIPE_CAP_TGSI_FS_FBFETCH },
688
689 { o(EXT_blend_equation_separate), PIPE_CAP_BLEND_EQUATION_SEPARATE },
690 { o(EXT_depth_bounds_test), PIPE_CAP_DEPTH_BOUNDS_TEST },
691 { o(EXT_draw_buffers2), PIPE_CAP_INDEP_BLEND_ENABLE },
692 { o(EXT_memory_object), PIPE_CAP_MEMOBJ },
693 { o(EXT_memory_object_fd), PIPE_CAP_MEMOBJ },
694 { o(EXT_semaphore), PIPE_CAP_FENCE_SIGNAL },
695 { o(EXT_semaphore_fd), PIPE_CAP_FENCE_SIGNAL },
696 { o(EXT_texture_array), PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS },
697 { o(EXT_texture_filter_anisotropic), PIPE_CAP_ANISOTROPIC_FILTER },
698 { o(EXT_texture_mirror_clamp), PIPE_CAP_TEXTURE_MIRROR_CLAMP },
699 { o(EXT_texture_swizzle), PIPE_CAP_TEXTURE_SWIZZLE },
700 { o(EXT_transform_feedback), PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS },
701 { o(EXT_window_rectangles), PIPE_CAP_MAX_WINDOW_RECTANGLES },
702
703 { o(AMD_pinned_memory), PIPE_CAP_RESOURCE_FROM_USER_MEMORY },
704 { o(ATI_meminfo), PIPE_CAP_QUERY_MEMORY_INFO },
705 { o(AMD_seamless_cubemap_per_texture), PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE },
706 { o(ATI_texture_mirror_once), PIPE_CAP_TEXTURE_MIRROR_CLAMP },
707 { o(MESA_tile_raster_order), PIPE_CAP_TILE_RASTER_ORDER },
708 { o(NV_conditional_render), PIPE_CAP_CONDITIONAL_RENDER },
709 { o(NV_fill_rectangle), PIPE_CAP_POLYGON_MODE_FILL_RECTANGLE },
710 { o(NV_primitive_restart), PIPE_CAP_PRIMITIVE_RESTART },
711 { o(NV_texture_barrier), PIPE_CAP_TEXTURE_BARRIER },
712 { o(NVX_gpu_memory_info), PIPE_CAP_QUERY_MEMORY_INFO },
713 /* GL_NV_point_sprite is not supported by gallium because we don't
714 * support the GL_POINT_SPRITE_R_MODE_NV option. */
715
716 { o(OES_standard_derivatives), PIPE_CAP_SM3 },
717 { o(OES_texture_float_linear), PIPE_CAP_TEXTURE_FLOAT_LINEAR },
718 { o(OES_texture_half_float_linear), PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR },
719 };
720
721 /* Required: render target and sampler support */
722 static const struct st_extension_format_mapping rendertarget_mapping[] = {
723 { { o(ARB_texture_float) },
724 { PIPE_FORMAT_R32G32B32A32_FLOAT,
725 PIPE_FORMAT_R16G16B16A16_FLOAT } },
726
727 { { o(OES_texture_float) },
728 { PIPE_FORMAT_R32G32B32A32_FLOAT } },
729
730 { { o(OES_texture_half_float) },
731 { PIPE_FORMAT_R16G16B16A16_FLOAT } },
732
733 { { o(ARB_texture_rgb10_a2ui) },
734 { PIPE_FORMAT_R10G10B10A2_UINT,
735 PIPE_FORMAT_B10G10R10A2_UINT },
736 GL_TRUE }, /* at least one format must be supported */
737
738 { { o(EXT_framebuffer_sRGB) },
739 { PIPE_FORMAT_A8B8G8R8_SRGB,
740 PIPE_FORMAT_B8G8R8A8_SRGB },
741 GL_TRUE }, /* at least one format must be supported */
742
743 { { o(EXT_packed_float) },
744 { PIPE_FORMAT_R11G11B10_FLOAT } },
745
746 { { o(EXT_texture_integer) },
747 { PIPE_FORMAT_R32G32B32A32_UINT,
748 PIPE_FORMAT_R32G32B32A32_SINT } },
749
750 { { o(ARB_texture_rg) },
751 { PIPE_FORMAT_R8_UNORM,
752 PIPE_FORMAT_R8G8_UNORM } },
753 };
754
755 /* Required: depth stencil and sampler support */
756 static const struct st_extension_format_mapping depthstencil_mapping[] = {
757 { { o(ARB_depth_buffer_float) },
758 { PIPE_FORMAT_Z32_FLOAT,
759 PIPE_FORMAT_Z32_FLOAT_S8X24_UINT } },
760 };
761
762 /* Required: sampler support */
763 static const struct st_extension_format_mapping texture_mapping[] = {
764 { { o(ARB_texture_compression_rgtc) },
765 { PIPE_FORMAT_RGTC1_UNORM,
766 PIPE_FORMAT_RGTC1_SNORM,
767 PIPE_FORMAT_RGTC2_UNORM,
768 PIPE_FORMAT_RGTC2_SNORM } },
769
770 { { o(EXT_texture_compression_latc) },
771 { PIPE_FORMAT_LATC1_UNORM,
772 PIPE_FORMAT_LATC1_SNORM,
773 PIPE_FORMAT_LATC2_UNORM,
774 PIPE_FORMAT_LATC2_SNORM } },
775
776 { { o(EXT_texture_compression_s3tc),
777 o(ANGLE_texture_compression_dxt) },
778 { PIPE_FORMAT_DXT1_RGB,
779 PIPE_FORMAT_DXT1_RGBA,
780 PIPE_FORMAT_DXT3_RGBA,
781 PIPE_FORMAT_DXT5_RGBA } },
782
783 { { o(ARB_texture_compression_bptc) },
784 { PIPE_FORMAT_BPTC_RGBA_UNORM,
785 PIPE_FORMAT_BPTC_SRGBA,
786 PIPE_FORMAT_BPTC_RGB_FLOAT,
787 PIPE_FORMAT_BPTC_RGB_UFLOAT } },
788
789 { { o(KHR_texture_compression_astc_ldr) },
790 { PIPE_FORMAT_ASTC_4x4,
791 PIPE_FORMAT_ASTC_5x4,
792 PIPE_FORMAT_ASTC_5x5,
793 PIPE_FORMAT_ASTC_6x5,
794 PIPE_FORMAT_ASTC_6x6,
795 PIPE_FORMAT_ASTC_8x5,
796 PIPE_FORMAT_ASTC_8x6,
797 PIPE_FORMAT_ASTC_8x8,
798 PIPE_FORMAT_ASTC_10x5,
799 PIPE_FORMAT_ASTC_10x6,
800 PIPE_FORMAT_ASTC_10x8,
801 PIPE_FORMAT_ASTC_10x10,
802 PIPE_FORMAT_ASTC_12x10,
803 PIPE_FORMAT_ASTC_12x12,
804 PIPE_FORMAT_ASTC_4x4_SRGB,
805 PIPE_FORMAT_ASTC_5x4_SRGB,
806 PIPE_FORMAT_ASTC_5x5_SRGB,
807 PIPE_FORMAT_ASTC_6x5_SRGB,
808 PIPE_FORMAT_ASTC_6x6_SRGB,
809 PIPE_FORMAT_ASTC_8x5_SRGB,
810 PIPE_FORMAT_ASTC_8x6_SRGB,
811 PIPE_FORMAT_ASTC_8x8_SRGB,
812 PIPE_FORMAT_ASTC_10x5_SRGB,
813 PIPE_FORMAT_ASTC_10x6_SRGB,
814 PIPE_FORMAT_ASTC_10x8_SRGB,
815 PIPE_FORMAT_ASTC_10x10_SRGB,
816 PIPE_FORMAT_ASTC_12x10_SRGB,
817 PIPE_FORMAT_ASTC_12x12_SRGB } },
818
819 { { o(EXT_texture_shared_exponent) },
820 { PIPE_FORMAT_R9G9B9E5_FLOAT } },
821
822 { { o(EXT_texture_snorm) },
823 { PIPE_FORMAT_R8G8B8A8_SNORM } },
824
825 { { o(EXT_texture_sRGB),
826 o(EXT_texture_sRGB_decode) },
827 { PIPE_FORMAT_A8B8G8R8_SRGB,
828 PIPE_FORMAT_B8G8R8A8_SRGB },
829 GL_TRUE }, /* at least one format must be supported */
830
831 { { o(EXT_texture_type_2_10_10_10_REV) },
832 { PIPE_FORMAT_R10G10B10A2_UNORM,
833 PIPE_FORMAT_B10G10R10A2_UNORM },
834 GL_TRUE }, /* at least one format must be supported */
835
836 { { o(ATI_texture_compression_3dc) },
837 { PIPE_FORMAT_LATC2_UNORM } },
838
839 { { o(MESA_ycbcr_texture) },
840 { PIPE_FORMAT_UYVY,
841 PIPE_FORMAT_YUYV },
842 GL_TRUE }, /* at least one format must be supported */
843
844 { { o(OES_compressed_ETC1_RGB8_texture) },
845 { PIPE_FORMAT_ETC1_RGB8,
846 PIPE_FORMAT_R8G8B8A8_UNORM },
847 GL_TRUE }, /* at least one format must be supported */
848
849 { { o(ARB_stencil_texturing),
850 o(ARB_texture_stencil8) },
851 { PIPE_FORMAT_X24S8_UINT,
852 PIPE_FORMAT_S8X24_UINT },
853 GL_TRUE }, /* at least one format must be supported */
854 };
855
856 /* Required: vertex fetch support. */
857 static const struct st_extension_format_mapping vertex_mapping[] = {
858 { { o(EXT_vertex_array_bgra) },
859 { PIPE_FORMAT_B8G8R8A8_UNORM } },
860 { { o(ARB_vertex_type_2_10_10_10_rev) },
861 { PIPE_FORMAT_R10G10B10A2_UNORM,
862 PIPE_FORMAT_B10G10R10A2_UNORM,
863 PIPE_FORMAT_R10G10B10A2_SNORM,
864 PIPE_FORMAT_B10G10R10A2_SNORM,
865 PIPE_FORMAT_R10G10B10A2_USCALED,
866 PIPE_FORMAT_B10G10R10A2_USCALED,
867 PIPE_FORMAT_R10G10B10A2_SSCALED,
868 PIPE_FORMAT_B10G10R10A2_SSCALED } },
869 { { o(ARB_vertex_type_10f_11f_11f_rev) },
870 { PIPE_FORMAT_R11G11B10_FLOAT } },
871 };
872
873 static const struct st_extension_format_mapping tbo_rgb32[] = {
874 { {o(ARB_texture_buffer_object_rgb32) },
875 { PIPE_FORMAT_R32G32B32_FLOAT,
876 PIPE_FORMAT_R32G32B32_UINT,
877 PIPE_FORMAT_R32G32B32_SINT,
878 } },
879 };
880
881 /*
882 * Extensions that are supported by all Gallium drivers:
883 */
884 extensions->ARB_ES2_compatibility = GL_TRUE;
885 extensions->ARB_depth_texture = GL_TRUE;
886 extensions->ARB_draw_elements_base_vertex = GL_TRUE;
887 extensions->ARB_explicit_attrib_location = GL_TRUE;
888 extensions->ARB_explicit_uniform_location = GL_TRUE;
889 extensions->ARB_fragment_coord_conventions = GL_TRUE;
890 extensions->ARB_fragment_program = GL_TRUE;
891 extensions->ARB_fragment_program_shadow = GL_TRUE;
892 extensions->ARB_fragment_shader = GL_TRUE;
893 extensions->ARB_half_float_vertex = GL_TRUE;
894 extensions->ARB_internalformat_query = GL_TRUE;
895 extensions->ARB_internalformat_query2 = GL_TRUE;
896 extensions->ARB_map_buffer_range = GL_TRUE;
897 extensions->ARB_shadow = GL_TRUE;
898 extensions->ARB_sync = GL_TRUE;
899 extensions->ARB_texture_border_clamp = GL_TRUE;
900 extensions->ARB_texture_cube_map = GL_TRUE;
901 extensions->ARB_texture_env_combine = GL_TRUE;
902 extensions->ARB_texture_env_crossbar = GL_TRUE;
903 extensions->ARB_texture_env_dot3 = GL_TRUE;
904 extensions->ARB_vertex_program = GL_TRUE;
905 extensions->ARB_vertex_shader = GL_TRUE;
906
907 extensions->EXT_blend_color = GL_TRUE;
908 extensions->EXT_blend_func_separate = GL_TRUE;
909 extensions->EXT_blend_minmax = GL_TRUE;
910 extensions->EXT_gpu_program_parameters = GL_TRUE;
911 extensions->EXT_pixel_buffer_object = GL_TRUE;
912 extensions->EXT_point_parameters = GL_TRUE;
913 extensions->EXT_provoking_vertex = GL_TRUE;
914 extensions->EXT_stencil_two_side = GL_TRUE;
915 extensions->EXT_texture_env_dot3 = GL_TRUE;
916
917 extensions->ATI_fragment_shader = GL_TRUE;
918 extensions->ATI_separate_stencil = GL_TRUE;
919 extensions->ATI_texture_env_combine3 = GL_TRUE;
920
921 extensions->MESA_pack_invert = GL_TRUE;
922
923 extensions->NV_fog_distance = GL_TRUE;
924 extensions->NV_texture_env_combine4 = GL_TRUE;
925 extensions->NV_texture_rectangle = GL_TRUE;
926
927 extensions->OES_EGL_image = GL_TRUE;
928 extensions->OES_EGL_image_external = GL_TRUE;
929 extensions->OES_draw_texture = GL_TRUE;
930
931 /* Expose the extensions which directly correspond to gallium caps. */
932 for (i = 0; i < ARRAY_SIZE(cap_mapping); i++) {
933 if (screen->get_param(screen, cap_mapping[i].cap)) {
934 extension_table[cap_mapping[i].extension_offset] = GL_TRUE;
935 }
936 }
937
938 /* Expose the extensions which directly correspond to gallium formats. */
939 init_format_extensions(screen, extensions, rendertarget_mapping,
940 ARRAY_SIZE(rendertarget_mapping), PIPE_TEXTURE_2D,
941 PIPE_BIND_RENDER_TARGET | PIPE_BIND_SAMPLER_VIEW);
942 init_format_extensions(screen, extensions, depthstencil_mapping,
943 ARRAY_SIZE(depthstencil_mapping), PIPE_TEXTURE_2D,
944 PIPE_BIND_DEPTH_STENCIL | PIPE_BIND_SAMPLER_VIEW);
945 init_format_extensions(screen, extensions, texture_mapping,
946 ARRAY_SIZE(texture_mapping), PIPE_TEXTURE_2D,
947 PIPE_BIND_SAMPLER_VIEW);
948 init_format_extensions(screen, extensions, vertex_mapping,
949 ARRAY_SIZE(vertex_mapping), PIPE_BUFFER,
950 PIPE_BIND_VERTEX_BUFFER);
951
952 /* Figure out GLSL support and set GLSLVersion to it. */
953 consts->GLSLVersion = screen->get_param(screen, PIPE_CAP_GLSL_FEATURE_LEVEL);
954
955 _mesa_override_glsl_version(consts);
956
957 if (options->force_glsl_version > 0 &&
958 options->force_glsl_version <= consts->GLSLVersion) {
959 consts->ForceGLSLVersion = options->force_glsl_version;
960 }
961
962 consts->AllowHigherCompatVersion = options->allow_higher_compat_version;
963
964 consts->ForceGLSLAbsSqrt = options->force_glsl_abs_sqrt;
965
966 consts->AllowGLSLBuiltinVariableRedeclaration = options->allow_glsl_builtin_variable_redeclaration;
967
968 consts->dri_config_options_sha1 = options->config_options_sha1;
969
970 consts->AllowGLSLCrossStageInterpolationMismatch = options->allow_glsl_cross_stage_interpolation_mismatch;
971
972 if (consts->GLSLVersion >= 400)
973 extensions->ARB_gpu_shader5 = GL_TRUE;
974 if (consts->GLSLVersion >= 410)
975 extensions->ARB_shader_precision = GL_TRUE;
976
977 /* This extension needs full OpenGL 3.2, but we don't know if that's
978 * supported at this point. Only check the GLSL version. */
979 if (consts->GLSLVersion >= 150 &&
980 screen->get_param(screen, PIPE_CAP_TGSI_VS_LAYER_VIEWPORT)) {
981 extensions->AMD_vertex_shader_layer = GL_TRUE;
982 }
983
984 if (consts->GLSLVersion >= 140) {
985 if (screen->get_param(screen, PIPE_CAP_TGSI_ARRAY_COMPONENTS))
986 extensions->ARB_enhanced_layouts = GL_TRUE;
987 }
988
989 if (consts->GLSLVersion >= 130) {
990 consts->NativeIntegers = GL_TRUE;
991 consts->MaxClipPlanes = 8;
992
993 if (screen->get_param(screen, PIPE_CAP_VERTEXID_NOBASE)) {
994 consts->VertexID_is_zero_based = GL_TRUE;
995 }
996
997 /* Extensions that either depend on GLSL 1.30 or are a subset thereof. */
998 extensions->ARB_conservative_depth = GL_TRUE;
999 extensions->ARB_shading_language_packing = GL_TRUE;
1000 extensions->OES_depth_texture_cube_map = GL_TRUE;
1001 extensions->ARB_shading_language_420pack = GL_TRUE;
1002 extensions->ARB_texture_query_levels = GL_TRUE;
1003
1004 if (!options->disable_shader_bit_encoding) {
1005 extensions->ARB_shader_bit_encoding = GL_TRUE;
1006 }
1007
1008 extensions->EXT_shader_integer_mix = GL_TRUE;
1009 extensions->ARB_arrays_of_arrays = GL_TRUE;
1010 extensions->MESA_shader_integer_functions = GL_TRUE;
1011 } else {
1012 /* Optional integer support for GLSL 1.2. */
1013 if (screen->get_shader_param(screen, PIPE_SHADER_VERTEX,
1014 PIPE_SHADER_CAP_INTEGERS) &&
1015 screen->get_shader_param(screen, PIPE_SHADER_FRAGMENT,
1016 PIPE_SHADER_CAP_INTEGERS)) {
1017 consts->NativeIntegers = GL_TRUE;
1018
1019 extensions->EXT_shader_integer_mix = GL_TRUE;
1020 }
1021
1022 /* Integer textures make no sense before GLSL 1.30 */
1023 extensions->EXT_texture_integer = GL_FALSE;
1024 }
1025
1026 consts->GLSLZeroInit = options->glsl_zero_init;
1027
1028 consts->UniformBooleanTrue = consts->NativeIntegers ? ~0U : fui(1.0f);
1029
1030 /* Below are the cases which cannot be moved into tables easily. */
1031
1032 if (screen->get_shader_param(screen, PIPE_SHADER_TESS_CTRL,
1033 PIPE_SHADER_CAP_MAX_INSTRUCTIONS) > 0) {
1034 extensions->ARB_tessellation_shader = GL_TRUE;
1035 }
1036
1037 /* What this is really checking for is the ability to support multiple
1038 * invocations of a geometry shader. There is no separate cap for that, so
1039 * we check the GLSLVersion.
1040 */
1041 if (consts->GLSLVersion >= 400 &&
1042 screen->get_shader_param(screen, PIPE_SHADER_GEOMETRY,
1043 PIPE_SHADER_CAP_MAX_INSTRUCTIONS) > 0) {
1044 extensions->OES_geometry_shader = GL_TRUE;
1045 }
1046
1047 /* Needs PIPE_CAP_SAMPLE_SHADING + all the sample-related bits of
1048 * ARB_gpu_shader5. This enables all the per-sample shading ES extensions.
1049 */
1050 extensions->OES_sample_variables = extensions->ARB_sample_shading &&
1051 extensions->ARB_gpu_shader5;
1052
1053 /* Maximum sample count. */
1054 {
1055 static const enum pipe_format color_formats[] = {
1056 PIPE_FORMAT_R8G8B8A8_UNORM,
1057 PIPE_FORMAT_B8G8R8A8_UNORM,
1058 PIPE_FORMAT_A8R8G8B8_UNORM,
1059 PIPE_FORMAT_A8B8G8R8_UNORM,
1060 };
1061 static const enum pipe_format depth_formats[] = {
1062 PIPE_FORMAT_Z16_UNORM,
1063 PIPE_FORMAT_Z24X8_UNORM,
1064 PIPE_FORMAT_X8Z24_UNORM,
1065 PIPE_FORMAT_Z32_UNORM,
1066 PIPE_FORMAT_Z32_FLOAT
1067 };
1068 static const enum pipe_format int_formats[] = {
1069 PIPE_FORMAT_R8G8B8A8_SINT
1070 };
1071 static const enum pipe_format void_formats[] = {
1072 PIPE_FORMAT_NONE
1073 };
1074
1075 consts->MaxSamples =
1076 get_max_samples_for_formats(screen, ARRAY_SIZE(color_formats),
1077 color_formats, 16,
1078 PIPE_BIND_RENDER_TARGET);
1079
1080 consts->MaxImageSamples =
1081 get_max_samples_for_formats(screen, ARRAY_SIZE(color_formats),
1082 color_formats, 16,
1083 PIPE_BIND_SHADER_IMAGE);
1084
1085 consts->MaxColorTextureSamples =
1086 get_max_samples_for_formats(screen, ARRAY_SIZE(color_formats),
1087 color_formats, consts->MaxSamples,
1088 PIPE_BIND_SAMPLER_VIEW);
1089
1090 consts->MaxDepthTextureSamples =
1091 get_max_samples_for_formats(screen, ARRAY_SIZE(depth_formats),
1092 depth_formats, consts->MaxSamples,
1093 PIPE_BIND_SAMPLER_VIEW);
1094
1095 consts->MaxIntegerSamples =
1096 get_max_samples_for_formats(screen, ARRAY_SIZE(int_formats),
1097 int_formats, consts->MaxSamples,
1098 PIPE_BIND_SAMPLER_VIEW);
1099
1100 /* ARB_framebuffer_no_attachments, assume max no. of samples 32 */
1101 consts->MaxFramebufferSamples =
1102 get_max_samples_for_formats(screen, ARRAY_SIZE(void_formats),
1103 void_formats, 32,
1104 PIPE_BIND_RENDER_TARGET);
1105 }
1106
1107 if (consts->MaxSamples >= 2) {
1108 /* Real MSAA support */
1109 extensions->EXT_framebuffer_multisample = GL_TRUE;
1110 extensions->EXT_framebuffer_multisample_blit_scaled = GL_TRUE;
1111 }
1112 else if (consts->MaxSamples > 0 &&
1113 screen->get_param(screen, PIPE_CAP_FAKE_SW_MSAA)) {
1114 /* fake MSAA support */
1115 consts->FakeSWMSAA = GL_TRUE;
1116 extensions->EXT_framebuffer_multisample = GL_TRUE;
1117 extensions->EXT_framebuffer_multisample_blit_scaled = GL_TRUE;
1118 extensions->ARB_texture_multisample = GL_TRUE;
1119 }
1120
1121 if (consts->MaxDualSourceDrawBuffers > 0 &&
1122 !options->disable_blend_func_extended)
1123 extensions->ARB_blend_func_extended = GL_TRUE;
1124
1125 if (screen->get_param(screen, PIPE_CAP_QUERY_TIME_ELAPSED) ||
1126 extensions->ARB_timer_query) {
1127 extensions->EXT_timer_query = GL_TRUE;
1128 }
1129
1130 if (extensions->ARB_transform_feedback2 &&
1131 extensions->ARB_draw_instanced) {
1132 extensions->ARB_transform_feedback_instanced = GL_TRUE;
1133 }
1134 if (options->force_glsl_extensions_warn)
1135 consts->ForceGLSLExtensionsWarn = 1;
1136
1137 if (options->disable_glsl_line_continuations)
1138 consts->DisableGLSLLineContinuations = 1;
1139
1140 if (options->allow_glsl_extension_directive_midshader)
1141 consts->AllowGLSLExtensionDirectiveMidShader = GL_TRUE;
1142
1143 consts->MinMapBufferAlignment =
1144 screen->get_param(screen, PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT);
1145
1146 /* The OpenGL Compatibility profile requires arbitrary buffer swizzling. */
1147 if (api == API_OPENGL_COMPAT &&
1148 screen->get_param(screen, PIPE_CAP_BUFFER_SAMPLER_VIEW_RGBA_ONLY))
1149 extensions->ARB_texture_buffer_object = GL_FALSE;
1150
1151 if (extensions->ARB_texture_buffer_object) {
1152 consts->MaxTextureBufferSize =
1153 _min(screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE),
1154 (1u << 31) - 1);
1155 consts->TextureBufferOffsetAlignment =
1156 screen->get_param(screen, PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT);
1157
1158 if (consts->TextureBufferOffsetAlignment)
1159 extensions->ARB_texture_buffer_range = GL_TRUE;
1160
1161 init_format_extensions(screen, extensions, tbo_rgb32,
1162 ARRAY_SIZE(tbo_rgb32), PIPE_BUFFER,
1163 PIPE_BIND_SAMPLER_VIEW);
1164 }
1165
1166 extensions->OES_texture_buffer =
1167 extensions->ARB_texture_buffer_object &&
1168 extensions->ARB_texture_buffer_range &&
1169 extensions->ARB_texture_buffer_object_rgb32 &&
1170 extensions->ARB_shader_image_load_store;
1171
1172 /* Unpacking a varying in the fragment shader costs 1 texture indirection.
1173 * If the number of available texture indirections is very limited, then we
1174 * prefer to disable varying packing rather than run the risk of varying
1175 * packing preventing a shader from running.
1176 */
1177 if (screen->get_shader_param(screen, PIPE_SHADER_FRAGMENT,
1178 PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS) <= 8) {
1179 /* We can't disable varying packing if transform feedback is available,
1180 * because transform feedback code assumes a packed varying layout.
1181 */
1182 if (!extensions->EXT_transform_feedback)
1183 consts->DisableVaryingPacking = GL_TRUE;
1184 }
1185
1186 consts->MaxViewports = screen->get_param(screen, PIPE_CAP_MAX_VIEWPORTS);
1187 if (consts->MaxViewports >= 16) {
1188 if (consts->GLSLVersion >= 400) {
1189 consts->ViewportBounds.Min = -32768.0;
1190 consts->ViewportBounds.Max = 32767.0;
1191 } else {
1192 consts->ViewportBounds.Min = -16384.0;
1193 consts->ViewportBounds.Max = 16383.0;
1194 }
1195 extensions->ARB_viewport_array = GL_TRUE;
1196 extensions->ARB_fragment_layer_viewport = GL_TRUE;
1197 if (extensions->AMD_vertex_shader_layer)
1198 extensions->AMD_vertex_shader_viewport_index = GL_TRUE;
1199 }
1200
1201 if (extensions->AMD_vertex_shader_layer &&
1202 extensions->AMD_vertex_shader_viewport_index &&
1203 screen->get_param(screen, PIPE_CAP_TGSI_TES_LAYER_VIEWPORT))
1204 extensions->ARB_shader_viewport_layer_array = GL_TRUE;
1205
1206 /* ARB_framebuffer_no_attachments */
1207 if (screen->get_param(screen, PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT) &&
1208 ((consts->MaxSamples >= 4 && consts->MaxFramebufferLayers >= 2048) ||
1209 (consts->MaxFramebufferSamples >= consts->MaxSamples &&
1210 consts->MaxFramebufferLayers >= consts->MaxArrayTextureLayers)))
1211 extensions->ARB_framebuffer_no_attachments = GL_TRUE;
1212
1213 /* GL_ARB_ES3_compatibility.
1214 *
1215 * Assume that ES3 is supported if GLSL 3.30 is supported.
1216 * (OpenGL 3.3 is a requirement for that extension.)
1217 */
1218 if (consts->GLSLVersion >= 330 &&
1219 /* Requirements for ETC2 emulation. */
1220 screen->is_format_supported(screen, PIPE_FORMAT_R8G8B8A8_UNORM,
1221 PIPE_TEXTURE_2D, 0,
1222 PIPE_BIND_SAMPLER_VIEW) &&
1223 screen->is_format_supported(screen, PIPE_FORMAT_B8G8R8A8_SRGB,
1224 PIPE_TEXTURE_2D, 0,
1225 PIPE_BIND_SAMPLER_VIEW) &&
1226 screen->is_format_supported(screen, PIPE_FORMAT_R16_UNORM,
1227 PIPE_TEXTURE_2D, 0,
1228 PIPE_BIND_SAMPLER_VIEW) &&
1229 screen->is_format_supported(screen, PIPE_FORMAT_R16G16_UNORM,
1230 PIPE_TEXTURE_2D, 0,
1231 PIPE_BIND_SAMPLER_VIEW) &&
1232 screen->is_format_supported(screen, PIPE_FORMAT_R16_SNORM,
1233 PIPE_TEXTURE_2D, 0,
1234 PIPE_BIND_SAMPLER_VIEW) &&
1235 screen->is_format_supported(screen, PIPE_FORMAT_R16G16_SNORM,
1236 PIPE_TEXTURE_2D, 0,
1237 PIPE_BIND_SAMPLER_VIEW)) {
1238 extensions->ARB_ES3_compatibility = GL_TRUE;
1239 }
1240
1241 #ifdef HAVE_ST_VDPAU
1242 if (screen->get_video_param &&
1243 screen->get_video_param(screen, PIPE_VIDEO_PROFILE_UNKNOWN,
1244 PIPE_VIDEO_ENTRYPOINT_BITSTREAM,
1245 PIPE_VIDEO_CAP_SUPPORTS_INTERLACED)) {
1246 extensions->NV_vdpau_interop = GL_TRUE;
1247 }
1248 #endif
1249
1250 if (screen->get_param(screen, PIPE_CAP_DOUBLES)) {
1251 extensions->ARB_gpu_shader_fp64 = GL_TRUE;
1252 extensions->ARB_vertex_attrib_64bit = GL_TRUE;
1253 }
1254
1255 if ((ST_DEBUG & DEBUG_GREMEDY) &&
1256 screen->get_param(screen, PIPE_CAP_STRING_MARKER))
1257 extensions->GREMEDY_string_marker = GL_TRUE;
1258
1259 if (screen->get_param(screen, PIPE_CAP_COMPUTE)) {
1260 int compute_supported_irs =
1261 screen->get_shader_param(screen, PIPE_SHADER_COMPUTE,
1262 PIPE_SHADER_CAP_SUPPORTED_IRS);
1263 if (compute_supported_irs & (1 << PIPE_SHADER_IR_TGSI)) {
1264 uint64_t grid_size[3], block_size[3];
1265 uint64_t max_local_size, max_threads_per_block;
1266
1267 screen->get_compute_param(screen, PIPE_SHADER_IR_TGSI,
1268 PIPE_COMPUTE_CAP_MAX_GRID_SIZE, grid_size);
1269 screen->get_compute_param(screen, PIPE_SHADER_IR_TGSI,
1270 PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE, block_size);
1271 screen->get_compute_param(screen, PIPE_SHADER_IR_TGSI,
1272 PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK,
1273 &max_threads_per_block);
1274 screen->get_compute_param(screen, PIPE_SHADER_IR_TGSI,
1275 PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE,
1276 &max_local_size);
1277
1278 consts->MaxComputeWorkGroupInvocations = max_threads_per_block;
1279 consts->MaxComputeSharedMemorySize = max_local_size;
1280
1281 for (i = 0; i < 3; i++) {
1282 consts->MaxComputeWorkGroupCount[i] = grid_size[i];
1283 consts->MaxComputeWorkGroupSize[i] = block_size[i];
1284 }
1285
1286 extensions->ARB_compute_shader =
1287 extensions->ARB_shader_image_load_store &&
1288 extensions->ARB_shader_atomic_counters;
1289
1290 if (extensions->ARB_compute_shader) {
1291 uint64_t max_variable_threads_per_block = 0;
1292
1293 screen->get_compute_param(screen, PIPE_SHADER_IR_TGSI,
1294 PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK,
1295 &max_variable_threads_per_block);
1296
1297 for (i = 0; i < 3; i++) {
1298 /* Clamp the values to avoid having a local work group size
1299 * greater than the maximum number of invocations.
1300 */
1301 consts->MaxComputeVariableGroupSize[i] =
1302 MIN2(consts->MaxComputeWorkGroupSize[i],
1303 max_variable_threads_per_block);
1304 }
1305 consts->MaxComputeVariableGroupInvocations =
1306 max_variable_threads_per_block;
1307
1308 extensions->ARB_compute_variable_group_size =
1309 max_variable_threads_per_block > 0;
1310 }
1311 }
1312 }
1313
1314 if (extensions->EXT_texture_filter_anisotropic &&
1315 screen->get_paramf(screen, PIPE_CAPF_MAX_TEXTURE_ANISOTROPY) >= 16.0)
1316 extensions->ARB_texture_filter_anisotropic = GL_TRUE;
1317
1318 extensions->KHR_robustness = extensions->ARB_robust_buffer_access_behavior;
1319
1320 /* If we support ES 3.1, we support the ES3_1_compatibility ext. However
1321 * there's no clean way of telling whether we would support ES 3.1 from
1322 * here, so copy the condition from compute_version_es2 here. A lot of
1323 * these are redundant, but simpler to just have a (near-)exact copy here.
1324 */
1325 extensions->ARB_ES3_1_compatibility =
1326 extensions->ARB_ES3_compatibility &&
1327 extensions->ARB_arrays_of_arrays &&
1328 extensions->ARB_compute_shader &&
1329 extensions->ARB_draw_indirect &&
1330 extensions->ARB_explicit_uniform_location &&
1331 extensions->ARB_framebuffer_no_attachments &&
1332 extensions->ARB_shader_atomic_counters &&
1333 extensions->ARB_shader_image_load_store &&
1334 extensions->ARB_shader_image_size &&
1335 extensions->ARB_shader_storage_buffer_object &&
1336 extensions->ARB_shading_language_packing &&
1337 extensions->ARB_stencil_texturing &&
1338 extensions->ARB_texture_multisample &&
1339 extensions->ARB_gpu_shader5 &&
1340 extensions->EXT_shader_integer_mix;
1341
1342 extensions->OES_texture_cube_map_array =
1343 extensions->ARB_ES3_1_compatibility &&
1344 extensions->OES_geometry_shader &&
1345 extensions->ARB_texture_cube_map_array;
1346
1347 extensions->OES_viewport_array =
1348 extensions->ARB_ES3_1_compatibility &&
1349 extensions->OES_geometry_shader &&
1350 extensions->ARB_viewport_array;
1351
1352 extensions->OES_primitive_bounding_box = extensions->ARB_ES3_1_compatibility;
1353 consts->NoPrimitiveBoundingBoxOutput = true;
1354
1355 extensions->ANDROID_extension_pack_es31a =
1356 extensions->KHR_texture_compression_astc_ldr &&
1357 extensions->KHR_blend_equation_advanced &&
1358 extensions->OES_sample_variables &&
1359 extensions->ARB_shader_image_load_store &&
1360 extensions->ARB_texture_stencil8 &&
1361 extensions->ARB_texture_multisample &&
1362 extensions->OES_copy_image &&
1363 extensions->ARB_draw_buffers_blend &&
1364 extensions->OES_geometry_shader &&
1365 extensions->ARB_gpu_shader5 &&
1366 extensions->OES_primitive_bounding_box &&
1367 extensions->ARB_tessellation_shader &&
1368 extensions->ARB_texture_border_clamp &&
1369 extensions->OES_texture_buffer &&
1370 extensions->OES_texture_cube_map_array &&
1371 extensions->EXT_texture_sRGB_decode;
1372
1373 /* Same deal as for ARB_ES3_1_compatibility - this has to be computed
1374 * before overall versions are selected. Also it's actually a subset of ES
1375 * 3.2, since it doesn't require ASTC or advanced blending.
1376 */
1377 extensions->ARB_ES3_2_compatibility =
1378 extensions->ARB_ES3_1_compatibility &&
1379 extensions->KHR_robustness &&
1380 extensions->ARB_copy_image &&
1381 extensions->ARB_draw_buffers_blend &&
1382 extensions->ARB_draw_elements_base_vertex &&
1383 extensions->OES_geometry_shader &&
1384 extensions->ARB_gpu_shader5 &&
1385 extensions->ARB_sample_shading &&
1386 extensions->ARB_tessellation_shader &&
1387 extensions->ARB_texture_border_clamp &&
1388 extensions->OES_texture_buffer &&
1389 extensions->ARB_texture_cube_map_array &&
1390 extensions->ARB_texture_stencil8 &&
1391 extensions->ARB_texture_multisample;
1392 }