st/mesa: clean up atomic vs ssbo code
[mesa.git] / src / mesa / state_tracker / st_extensions.c
1 /**************************************************************************
2 *
3 * Copyright 2007 VMware, Inc.
4 * Copyright (c) 2008 VMware, Inc.
5 * All Rights Reserved.
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining a
8 * copy of this software and associated documentation files (the
9 * "Software"), to deal in the Software without restriction, including
10 * without limitation the rights to use, copy, modify, merge, publish,
11 * distribute, sub license, and/or sell copies of the Software, and to
12 * permit persons to whom the Software is furnished to do so, subject to
13 * the following conditions:
14 *
15 * The above copyright notice and this permission notice (including the
16 * next paragraph) shall be included in all copies or substantial portions
17 * of the Software.
18 *
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
20 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
21 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
22 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
23 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
24 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
25 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 *
27 **************************************************************************/
28
29 #include "compiler/nir/nir.h"
30
31 #include "main/imports.h"
32 #include "main/context.h"
33 #include "main/macros.h"
34 #include "main/version.h"
35
36 #include "pipe/p_context.h"
37 #include "pipe/p_defines.h"
38 #include "pipe/p_screen.h"
39 #include "tgsi/tgsi_from_mesa.h"
40 #include "util/u_math.h"
41
42 #include "st_context.h"
43 #include "st_debug.h"
44 #include "st_extensions.h"
45 #include "st_format.h"
46
47
48 /*
49 * Note: we use these functions rather than the MIN2, MAX2, CLAMP macros to
50 * avoid evaluating arguments (which are often function calls) more than once.
51 */
52
/**
 * Return the smaller of two unsigned values.
 *
 * This is a real function rather than a macro so that each argument
 * expression (often a driver callback) is evaluated exactly once.
 *
 * \param a  first value
 * \param b  second value
 * \return   \c a if it is strictly less than \c b, otherwise \c b
 */
static unsigned _min(unsigned a, unsigned b)
{
   return (a < b) ? a : b;
}
57
/**
 * Return the larger of two float values.
 *
 * This is a real function rather than a macro so that each argument
 * expression (often a driver callback) is evaluated exactly once.
 *
 * \param a  first value
 * \param b  second value
 * \return   \c a if it is strictly greater than \c b, otherwise \c b
 */
static float _maxf(float a, float b)
{
   return (a > b) ? a : b;
}
62
/**
 * Clamp a signed value to the inclusive range [min, max].
 *
 * This is a real function rather than a macro so that each argument
 * expression (often a driver callback) is evaluated exactly once.
 *
 * The lower bound is tested first, so if \c min > \c max a value below
 * \c min yields \c min.
 *
 * \param a    value to clamp
 * \param min  lower bound
 * \param max  upper bound
 * \return     \c min if a < min, \c max if a > max, otherwise \c a
 */
static int _clamp(int a, int min, int max)
{
   if (a < min)
      return min;
   else if (a > max)
      return max;
   else
      return a;
}
72
73
74 /**
75 * Query driver to get implementation limits.
76 * Note that we have to limit/clamp against Mesa's internal limits too.
77 */
78 void st_init_limits(struct pipe_screen *screen,
79 struct gl_constants *c, struct gl_extensions *extensions,
80 gl_api api)
81 {
82 int supported_irs;
83 unsigned sh;
84 bool can_ubo = true;
85 int temp;
86 bool ssbo_atomic = true;
87
88 c->MaxTextureLevels
89 = _min(screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_2D_LEVELS),
90 MAX_TEXTURE_LEVELS);
91
92 c->Max3DTextureLevels
93 = _min(screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_3D_LEVELS),
94 MAX_3D_TEXTURE_LEVELS);
95
96 c->MaxCubeTextureLevels
97 = _min(screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS),
98 MAX_CUBE_TEXTURE_LEVELS);
99
100 c->MaxTextureRectSize
101 = _min(1 << (c->MaxTextureLevels - 1), MAX_TEXTURE_RECT_SIZE);
102
103 c->MaxArrayTextureLayers
104 = screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS);
105
106 /* Define max viewport size and max renderbuffer size in terms of
107 * max texture size (note: max tex RECT size = max tex 2D size).
108 * If this isn't true for some hardware we'll need new PIPE_CAP_ queries.
109 */
110 c->MaxViewportWidth =
111 c->MaxViewportHeight =
112 c->MaxRenderbufferSize = c->MaxTextureRectSize;
113
114 c->SubPixelBits =
115 c->ViewportSubpixelBits =
116 screen->get_param(screen, PIPE_CAP_VIEWPORT_SUBPIXEL_BITS);
117
118 c->MaxDrawBuffers = c->MaxColorAttachments =
119 _clamp(screen->get_param(screen, PIPE_CAP_MAX_RENDER_TARGETS),
120 1, MAX_DRAW_BUFFERS);
121
122 c->MaxDualSourceDrawBuffers =
123 _clamp(screen->get_param(screen,
124 PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS),
125 0, MAX_DRAW_BUFFERS);
126
127 c->MaxLineWidth =
128 _maxf(1.0f, screen->get_paramf(screen, PIPE_CAPF_MAX_LINE_WIDTH));
129 c->MaxLineWidthAA =
130 _maxf(1.0f, screen->get_paramf(screen, PIPE_CAPF_MAX_LINE_WIDTH_AA));
131
132 c->MaxPointSize =
133 _maxf(1.0f, screen->get_paramf(screen, PIPE_CAPF_MAX_POINT_WIDTH));
134 c->MaxPointSizeAA =
135 _maxf(1.0f, screen->get_paramf(screen, PIPE_CAPF_MAX_POINT_WIDTH_AA));
136
137 /* these are not queryable. Note that GL basically mandates a 1.0 minimum
138 * for non-aa sizes, but we can go down to 0.0 for aa points.
139 */
140 c->MinPointSize = 1.0f;
141 c->MinPointSizeAA = 0.0f;
142
143 c->MaxTextureMaxAnisotropy =
144 _maxf(2.0f,
145 screen->get_paramf(screen, PIPE_CAPF_MAX_TEXTURE_ANISOTROPY));
146
147 c->MaxTextureLodBias =
148 screen->get_paramf(screen, PIPE_CAPF_MAX_TEXTURE_LOD_BIAS);
149
150 c->QuadsFollowProvokingVertexConvention =
151 screen->get_param(screen,
152 PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION);
153
154 c->MaxUniformBlockSize =
155 screen->get_shader_param(screen, PIPE_SHADER_FRAGMENT,
156 PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE);
157 /* GL45-CTS.enhanced_layouts.ssb_member_invalid_offset_alignment fails if
158 * this is larger than INT_MAX - 100. Use a nicely aligned limit.
159 */
160 c->MaxUniformBlockSize = MIN2(c->MaxUniformBlockSize, INT_MAX - 127);
161
162 if (c->MaxUniformBlockSize < 16384) {
163 can_ubo = false;
164 }
165
166 for (sh = 0; sh < PIPE_SHADER_TYPES; ++sh) {
167 struct gl_shader_compiler_options *options;
168 struct gl_program_constants *pc;
169 const nir_shader_compiler_options *nir_options = NULL;
170
171 if (screen->get_compiler_options) {
172 nir_options = (const nir_shader_compiler_options *)
173 screen->get_compiler_options(screen, PIPE_SHADER_IR_NIR, sh);
174 }
175
176 const gl_shader_stage stage = tgsi_processor_to_shader_stage(sh);
177 pc = &c->Program[stage];
178 options = &c->ShaderCompilerOptions[stage];
179 c->ShaderCompilerOptions[stage].NirOptions = nir_options;
180
181 if (sh == PIPE_SHADER_COMPUTE) {
182 if (!screen->get_param(screen, PIPE_CAP_COMPUTE))
183 continue;
184 supported_irs =
185 screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_SUPPORTED_IRS);
186 if (!(supported_irs & (1 << PIPE_SHADER_IR_TGSI)))
187 continue;
188 }
189
190 pc->MaxTextureImageUnits =
191 _min(screen->get_shader_param(screen, sh,
192 PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS),
193 MAX_TEXTURE_IMAGE_UNITS);
194
195 pc->MaxInstructions =
196 pc->MaxNativeInstructions =
197 screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_INSTRUCTIONS);
198 pc->MaxAluInstructions =
199 pc->MaxNativeAluInstructions =
200 screen->get_shader_param(screen, sh,
201 PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS);
202 pc->MaxTexInstructions =
203 pc->MaxNativeTexInstructions =
204 screen->get_shader_param(screen, sh,
205 PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS);
206 pc->MaxTexIndirections =
207 pc->MaxNativeTexIndirections =
208 screen->get_shader_param(screen, sh,
209 PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS);
210 pc->MaxAttribs =
211 pc->MaxNativeAttribs =
212 screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_INPUTS);
213 pc->MaxTemps =
214 pc->MaxNativeTemps =
215 screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_TEMPS);
216 pc->MaxAddressRegs =
217 pc->MaxNativeAddressRegs = sh == PIPE_SHADER_VERTEX ? 1 : 0;
218
219 pc->MaxUniformComponents =
220 screen->get_shader_param(screen, sh,
221 PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE) / 4;
222 pc->MaxUniformComponents = MIN2(pc->MaxUniformComponents,
223 MAX_UNIFORMS * 4);
224
225 pc->MaxParameters =
226 pc->MaxNativeParameters = pc->MaxUniformComponents / 4;
227 pc->MaxInputComponents =
228 screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_INPUTS) * 4;
229 pc->MaxOutputComponents =
230 screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_OUTPUTS) * 4;
231
232
233 pc->MaxUniformBlocks =
234 screen->get_shader_param(screen, sh,
235 PIPE_SHADER_CAP_MAX_CONST_BUFFERS);
236 if (pc->MaxUniformBlocks)
237 pc->MaxUniformBlocks -= 1; /* The first one is for ordinary uniforms. */
238 pc->MaxUniformBlocks = _min(pc->MaxUniformBlocks, MAX_UNIFORM_BUFFERS);
239
240 pc->MaxCombinedUniformComponents =
241 pc->MaxUniformComponents +
242 (uint64_t)c->MaxUniformBlockSize / 4 * pc->MaxUniformBlocks;
243
244 pc->MaxShaderStorageBlocks =
245 screen->get_shader_param(screen, sh,
246 PIPE_SHADER_CAP_MAX_SHADER_BUFFERS);
247
248 temp = screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS);
249 if (temp) {
250 /*
251 * for separate atomic counters get the actual hw limits
252 * per stage on atomic counters and buffers
253 */
254 ssbo_atomic = false;
255 pc->MaxAtomicCounters = temp;
256 pc->MaxAtomicBuffers = screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS);
257 } else {
258 pc->MaxAtomicCounters = MAX_ATOMIC_COUNTERS;
259 /*
260 * without separate atomic counters, reserve half of the available
261 * SSBOs for atomic buffers, and the other half for normal SSBOs.
262 */
263 pc->MaxAtomicBuffers = pc->MaxShaderStorageBlocks / 2;
264 pc->MaxShaderStorageBlocks -= pc->MaxAtomicBuffers;
265 }
266 pc->MaxImageUniforms = screen->get_shader_param(
267 screen, sh, PIPE_SHADER_CAP_MAX_SHADER_IMAGES);
268
269 /* Gallium doesn't really care about local vs. env parameters so use the
270 * same limits.
271 */
272 pc->MaxLocalParams = MIN2(pc->MaxParameters, MAX_PROGRAM_LOCAL_PARAMS);
273 pc->MaxEnvParams = MIN2(pc->MaxParameters, MAX_PROGRAM_ENV_PARAMS);
274
275 if (screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_INTEGERS)) {
276 pc->LowInt.RangeMin = 31;
277 pc->LowInt.RangeMax = 30;
278 pc->LowInt.Precision = 0;
279 pc->MediumInt = pc->HighInt = pc->LowInt;
280 }
281
282 /* TODO: make these more fine-grained if anyone needs it */
283 options->MaxIfDepth =
284 screen->get_shader_param(screen, sh,
285 PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH);
286 options->EmitNoLoops =
287 !screen->get_shader_param(screen, sh,
288 PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH);
289 options->EmitNoMainReturn =
290 !screen->get_shader_param(screen, sh, PIPE_SHADER_CAP_SUBROUTINES);
291
292 options->EmitNoCont =
293 !screen->get_shader_param(screen, sh,
294 PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED);
295
296 options->EmitNoIndirectInput =
297 !screen->get_shader_param(screen, sh,
298 PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR);
299 options->EmitNoIndirectOutput =
300 !screen->get_shader_param(screen, sh,
301 PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR);
302 options->EmitNoIndirectTemp =
303 !screen->get_shader_param(screen, sh,
304 PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR);
305 options->EmitNoIndirectUniform =
306 !screen->get_shader_param(screen, sh,
307 PIPE_SHADER_CAP_INDIRECT_CONST_ADDR);
308
309 if (pc->MaxNativeInstructions &&
310 (options->EmitNoIndirectUniform || pc->MaxUniformBlocks < 12)) {
311 can_ubo = false;
312 }
313
314 if (options->EmitNoLoops)
315 options->MaxUnrollIterations =
316 MIN2(screen->get_shader_param(screen, sh,
317 PIPE_SHADER_CAP_MAX_INSTRUCTIONS),
318 65536);
319 else
320 options->MaxUnrollIterations =
321 screen->get_shader_param(screen, sh,
322 PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT);
323
324 options->LowerCombinedClipCullDistance = true;
325 options->LowerBufferInterfaceBlocks = true;
326 }
327
328 c->MaxUserAssignableUniformLocations =
329 c->Program[MESA_SHADER_VERTEX].MaxUniformComponents +
330 c->Program[MESA_SHADER_TESS_CTRL].MaxUniformComponents +
331 c->Program[MESA_SHADER_TESS_EVAL].MaxUniformComponents +
332 c->Program[MESA_SHADER_GEOMETRY].MaxUniformComponents +
333 c->Program[MESA_SHADER_FRAGMENT].MaxUniformComponents;
334
335 c->GLSLOptimizeConservatively =
336 screen->get_param(screen, PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY);
337 c->LowerTessLevel = true;
338 c->LowerCsDerivedVariables = true;
339 c->PrimitiveRestartForPatches =
340 screen->get_param(screen, PIPE_CAP_PRIMITIVE_RESTART_FOR_PATCHES);
341
342 c->MaxCombinedTextureImageUnits =
343 _min(c->Program[MESA_SHADER_VERTEX].MaxTextureImageUnits +
344 c->Program[MESA_SHADER_TESS_CTRL].MaxTextureImageUnits +
345 c->Program[MESA_SHADER_TESS_EVAL].MaxTextureImageUnits +
346 c->Program[MESA_SHADER_GEOMETRY].MaxTextureImageUnits +
347 c->Program[MESA_SHADER_FRAGMENT].MaxTextureImageUnits +
348 c->Program[MESA_SHADER_COMPUTE].MaxTextureImageUnits,
349 MAX_COMBINED_TEXTURE_IMAGE_UNITS);
350
351 /* This depends on program constants. */
352 c->MaxTextureCoordUnits
353 = _min(c->Program[MESA_SHADER_FRAGMENT].MaxTextureImageUnits,
354 MAX_TEXTURE_COORD_UNITS);
355
356 c->MaxTextureUnits =
357 _min(c->Program[MESA_SHADER_FRAGMENT].MaxTextureImageUnits,
358 c->MaxTextureCoordUnits);
359
360 c->Program[MESA_SHADER_VERTEX].MaxAttribs =
361 MIN2(c->Program[MESA_SHADER_VERTEX].MaxAttribs, 16);
362
363 /* PIPE_SHADER_CAP_MAX_INPUTS for the FS specifies the maximum number
364 * of inputs. It's always 2 colors + N generic inputs. */
365 c->MaxVarying = screen->get_shader_param(screen, PIPE_SHADER_FRAGMENT,
366 PIPE_SHADER_CAP_MAX_INPUTS);
367 c->MaxVarying = MIN2(c->MaxVarying, MAX_VARYING);
368 c->MaxGeometryOutputVertices =
369 screen->get_param(screen, PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES);
370 c->MaxGeometryTotalOutputComponents =
371 screen->get_param(screen, PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS);
372 c->MaxGeometryShaderInvocations =
373 screen->get_param(screen, PIPE_CAP_MAX_GS_INVOCATIONS);
374 c->MaxTessPatchComponents =
375 MIN2(screen->get_param(screen, PIPE_CAP_MAX_SHADER_PATCH_VARYINGS),
376 MAX_VARYING) * 4;
377
378 c->MinProgramTexelOffset =
379 screen->get_param(screen, PIPE_CAP_MIN_TEXEL_OFFSET);
380 c->MaxProgramTexelOffset =
381 screen->get_param(screen, PIPE_CAP_MAX_TEXEL_OFFSET);
382
383 c->MaxProgramTextureGatherComponents =
384 screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS);
385 c->MinProgramTextureGatherOffset =
386 screen->get_param(screen, PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET);
387 c->MaxProgramTextureGatherOffset =
388 screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET);
389
390 c->MaxTransformFeedbackBuffers =
391 screen->get_param(screen, PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS);
392 c->MaxTransformFeedbackBuffers = MIN2(c->MaxTransformFeedbackBuffers,
393 MAX_FEEDBACK_BUFFERS);
394 c->MaxTransformFeedbackSeparateComponents =
395 screen->get_param(screen, PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS);
396 c->MaxTransformFeedbackInterleavedComponents =
397 screen->get_param(screen,
398 PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS);
399 c->MaxVertexStreams =
400 MAX2(1, screen->get_param(screen, PIPE_CAP_MAX_VERTEX_STREAMS));
401
402 /* The vertex stream must fit into pipe_stream_output_info::stream */
403 assert(c->MaxVertexStreams <= 4);
404
405 c->MaxVertexAttribStride
406 = screen->get_param(screen, PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE);
407
408 c->StripTextureBorder = GL_TRUE;
409
410 c->GLSLSkipStrictMaxUniformLimitCheck =
411 screen->get_param(screen, PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS);
412
413 c->UniformBufferOffsetAlignment =
414 screen->get_param(screen, PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT);
415
416 if (can_ubo) {
417 extensions->ARB_uniform_buffer_object = GL_TRUE;
418 c->MaxCombinedUniformBlocks = c->MaxUniformBufferBindings =
419 c->Program[MESA_SHADER_VERTEX].MaxUniformBlocks +
420 c->Program[MESA_SHADER_TESS_CTRL].MaxUniformBlocks +
421 c->Program[MESA_SHADER_TESS_EVAL].MaxUniformBlocks +
422 c->Program[MESA_SHADER_GEOMETRY].MaxUniformBlocks +
423 c->Program[MESA_SHADER_FRAGMENT].MaxUniformBlocks +
424 c->Program[MESA_SHADER_COMPUTE].MaxUniformBlocks;
425 assert(c->MaxCombinedUniformBlocks <= MAX_COMBINED_UNIFORM_BUFFERS);
426 }
427
428 c->GLSLFragCoordIsSysVal =
429 screen->get_param(screen, PIPE_CAP_TGSI_FS_POSITION_IS_SYSVAL);
430 c->GLSLFrontFacingIsSysVal =
431 screen->get_param(screen, PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL);
432
433 /* GL_ARB_get_program_binary
434 *
435 * The QT framework has a bug in their shader program cache, which is built
436 * on GL_ARB_get_program_binary. In an effort to allow them to fix the bug
437 * we don't enable more than 1 binary format for compatibility profiles.
438 */
439 if (api != API_OPENGL_COMPAT &&
440 screen->get_disk_shader_cache && screen->get_disk_shader_cache(screen))
441 c->NumProgramBinaryFormats = 1;
442
443 c->MaxAtomicBufferBindings =
444 c->Program[MESA_SHADER_FRAGMENT].MaxAtomicBuffers;
445
446 if (!ssbo_atomic) {
447 /* for separate atomic buffers - there atomic buffer size will be
448 limited */
449 c->MaxAtomicBufferSize = c->Program[MESA_SHADER_FRAGMENT].MaxAtomicCounters * ATOMIC_COUNTER_SIZE;
450 /* on all HW with separate atomic (evergreen) the following
451 lines are true. not sure it's worth adding CAPs for this at this
452 stage. */
453 c->MaxCombinedAtomicCounters = c->Program[MESA_SHADER_FRAGMENT].MaxAtomicCounters;
454 c->MaxCombinedAtomicBuffers = c->Program[MESA_SHADER_FRAGMENT].MaxAtomicBuffers;
455 } else {
456 c->MaxCombinedAtomicBuffers =
457 c->Program[MESA_SHADER_VERTEX].MaxAtomicBuffers +
458 c->Program[MESA_SHADER_TESS_CTRL].MaxAtomicBuffers +
459 c->Program[MESA_SHADER_TESS_EVAL].MaxAtomicBuffers +
460 c->Program[MESA_SHADER_GEOMETRY].MaxAtomicBuffers +
461 c->Program[MESA_SHADER_FRAGMENT].MaxAtomicBuffers;
462 assert(c->MaxCombinedAtomicBuffers <= MAX_COMBINED_ATOMIC_BUFFERS);
463 }
464
465 if (c->MaxCombinedAtomicBuffers > 0) {
466 extensions->ARB_shader_atomic_counters = GL_TRUE;
467 extensions->ARB_shader_atomic_counter_ops = GL_TRUE;
468 }
469
470 c->MaxCombinedShaderOutputResources = c->MaxDrawBuffers;
471 c->ShaderStorageBufferOffsetAlignment =
472 screen->get_param(screen, PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT);
473 if (c->ShaderStorageBufferOffsetAlignment) {
474 /* for hw atomic counters leaves these at default for now */
475 if (ssbo_atomic) {
476 c->MaxCombinedShaderStorageBlocks =
477 c->Program[MESA_SHADER_VERTEX].MaxShaderStorageBlocks +
478 c->Program[MESA_SHADER_TESS_CTRL].MaxShaderStorageBlocks +
479 c->Program[MESA_SHADER_TESS_EVAL].MaxShaderStorageBlocks +
480 c->Program[MESA_SHADER_GEOMETRY].MaxShaderStorageBlocks +
481 c->Program[MESA_SHADER_FRAGMENT].MaxShaderStorageBlocks;
482 assert(c->MaxCombinedShaderStorageBlocks < MAX_COMBINED_SHADER_STORAGE_BUFFERS);
483 }
484 c->MaxShaderStorageBufferBindings = c->MaxCombinedShaderStorageBlocks;
485
486 c->MaxCombinedShaderOutputResources +=
487 c->MaxCombinedShaderStorageBlocks;
488 c->MaxShaderStorageBlockSize =
489 screen->get_param(screen, PIPE_CAP_MAX_SHADER_BUFFER_SIZE);
490 extensions->ARB_shader_storage_buffer_object = GL_TRUE;
491 }
492
493 c->MaxCombinedImageUniforms =
494 c->Program[MESA_SHADER_VERTEX].MaxImageUniforms +
495 c->Program[MESA_SHADER_TESS_CTRL].MaxImageUniforms +
496 c->Program[MESA_SHADER_TESS_EVAL].MaxImageUniforms +
497 c->Program[MESA_SHADER_GEOMETRY].MaxImageUniforms +
498 c->Program[MESA_SHADER_FRAGMENT].MaxImageUniforms +
499 c->Program[MESA_SHADER_COMPUTE].MaxImageUniforms;
500 c->MaxCombinedShaderOutputResources += c->MaxCombinedImageUniforms;
501 c->MaxImageUnits = MAX_IMAGE_UNITS;
502 if (c->MaxCombinedImageUniforms) {
503 extensions->ARB_shader_image_load_store = GL_TRUE;
504 extensions->ARB_shader_image_size = GL_TRUE;
505 }
506
507 /* ARB_framebuffer_no_attachments */
508 c->MaxFramebufferWidth = c->MaxViewportWidth;
509 c->MaxFramebufferHeight = c->MaxViewportHeight;
510 /* NOTE: we cheat here a little by assuming that
511 * PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS has the same
512 * number of layers as we need, although we technically
513 * could have more the generality is not really useful
514 * in practicality.
515 */
516 c->MaxFramebufferLayers =
517 screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS);
518
519 c->MaxWindowRectangles =
520 screen->get_param(screen, PIPE_CAP_MAX_WINDOW_RECTANGLES);
521
522 c->SparseBufferPageSize =
523 screen->get_param(screen, PIPE_CAP_SPARSE_BUFFER_PAGE_SIZE);
524
525 c->AllowMappedBuffersDuringExecution =
526 screen->get_param(screen, PIPE_CAP_ALLOW_MAPPED_BUFFERS_DURING_EXECUTION);
527
528 c->UseSTD430AsDefaultPacking =
529 screen->get_param(screen, PIPE_CAP_LOAD_CONSTBUF);
530
531 c->MaxSubpixelPrecisionBiasBits =
532 screen->get_param(screen, PIPE_CAP_MAX_CONSERVATIVE_RASTER_SUBPIXEL_PRECISION_BIAS);
533
534 c->ConservativeRasterDilateRange[0] =
535 screen->get_paramf(screen, PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE);
536 c->ConservativeRasterDilateRange[1] =
537 screen->get_paramf(screen, PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE);
538 c->ConservativeRasterDilateGranularity =
539 screen->get_paramf(screen, PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY);
540
541 /* limit the max combined shader output resources to a driver limit */
542 temp = screen->get_param(screen, PIPE_CAP_MAX_COMBINED_SHADER_OUTPUT_RESOURCES);
543 if (temp > 0 && c->MaxCombinedShaderOutputResources > temp)
544 c->MaxCombinedShaderOutputResources = temp;
545 }
546
547
/**
 * Given a member \c x of struct gl_extensions, return offset of
 * \c x in bytes.
 *
 * The resulting offsets are stored in the mapping tables below and later
 * used to index a struct gl_extensions viewed as an array of GLboolean.
 */
#define o(x) offsetof(struct gl_extensions, x)
553
554
/**
 * Associates one extension flag with one capability value.
 */
struct st_extension_cap_mapping {
   int extension_offset;   /**< byte offset of the flag, as produced by o() */
   int cap;                /**< capability identifier paired with the flag */
};
559
560 struct st_extension_format_mapping {
561 int extension_offset[2];
562 enum pipe_format format[32];
563
564 /* If TRUE, at least one format must be supported for the extensions to be
565 * advertised. If FALSE, all the formats must be supported. */
566 GLboolean need_at_least_one;
567 };
568
569 /**
570 * Enable extensions if certain pipe formats are supported by the driver.
571 * What extensions will be enabled and what formats must be supported is
572 * described by the array of st_extension_format_mapping.
573 *
574 * target and bind_flags are passed to is_format_supported.
575 */
576 static void
577 init_format_extensions(struct pipe_screen *screen,
578 struct gl_extensions *extensions,
579 const struct st_extension_format_mapping *mapping,
580 unsigned num_mappings,
581 enum pipe_texture_target target,
582 unsigned bind_flags)
583 {
584 GLboolean *extension_table = (GLboolean *) extensions;
585 unsigned i;
586 int j;
587 int num_formats = ARRAY_SIZE(mapping->format);
588 int num_ext = ARRAY_SIZE(mapping->extension_offset);
589
590 for (i = 0; i < num_mappings; i++) {
591 int num_supported = 0;
592
593 /* Examine each format in the list. */
594 for (j = 0; j < num_formats && mapping[i].format[j]; j++) {
595 if (screen->is_format_supported(screen, mapping[i].format[j],
596 target, 0, 0, bind_flags)) {
597 num_supported++;
598 }
599 }
600
601 if (!num_supported ||
602 (!mapping[i].need_at_least_one && num_supported != j)) {
603 continue;
604 }
605
606 /* Enable all extensions in the list. */
607 for (j = 0; j < num_ext && mapping[i].extension_offset[j]; j++)
608 extension_table[mapping[i].extension_offset[j]] = GL_TRUE;
609 }
610 }
611
612
613 /**
614 * Given a list of formats and bind flags, return the maximum number
615 * of samples supported by any of those formats.
616 */
617 static unsigned
618 get_max_samples_for_formats(struct pipe_screen *screen,
619 unsigned num_formats,
620 const enum pipe_format *formats,
621 unsigned max_samples,
622 unsigned bind)
623 {
624 unsigned i, f;
625
626 for (i = max_samples; i > 0; --i) {
627 for (f = 0; f < num_formats; f++) {
628 if (screen->is_format_supported(screen, formats[f],
629 PIPE_TEXTURE_2D, i, i, bind)) {
630 return i;
631 }
632 }
633 }
634 return 0;
635 }
636
637 static unsigned
638 get_max_samples_for_formats_advanced(struct pipe_screen *screen,
639 unsigned num_formats,
640 const enum pipe_format *formats,
641 unsigned max_samples,
642 unsigned num_storage_samples,
643 unsigned bind)
644 {
645 unsigned i, f;
646
647 for (i = max_samples; i > 0; --i) {
648 for (f = 0; f < num_formats; f++) {
649 if (screen->is_format_supported(screen, formats[f], PIPE_TEXTURE_2D,
650 i, num_storage_samples, bind)) {
651 return i;
652 }
653 }
654 }
655 return 0;
656 }
657
658 /**
659 * Use pipe_screen::get_param() to query PIPE_CAP_ values to determine
660 * which GL extensions are supported.
661 * Quite a few extensions are always supported because they are standard
662 * features or can be built on top of other gallium features.
663 * Some fine tuning may still be needed.
664 */
665 void st_init_extensions(struct pipe_screen *screen,
666 struct gl_constants *consts,
667 struct gl_extensions *extensions,
668 struct st_config_options *options,
669 gl_api api)
670 {
671 unsigned i;
672 GLboolean *extension_table = (GLboolean *) extensions;
673
674 static const struct st_extension_cap_mapping cap_mapping[] = {
675 { o(ARB_base_instance), PIPE_CAP_START_INSTANCE },
676 { o(ARB_bindless_texture), PIPE_CAP_BINDLESS_TEXTURE },
677 { o(ARB_buffer_storage), PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT },
678 { o(ARB_clear_texture), PIPE_CAP_CLEAR_TEXTURE },
679 { o(ARB_clip_control), PIPE_CAP_CLIP_HALFZ },
680 { o(ARB_color_buffer_float), PIPE_CAP_VERTEX_COLOR_UNCLAMPED },
681 { o(ARB_conditional_render_inverted), PIPE_CAP_CONDITIONAL_RENDER_INVERTED },
682 { o(ARB_copy_image), PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS },
683 { o(OES_copy_image), PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS },
684 { o(ARB_cull_distance), PIPE_CAP_CULL_DISTANCE },
685 { o(ARB_depth_clamp), PIPE_CAP_DEPTH_CLIP_DISABLE },
686 { o(ARB_derivative_control), PIPE_CAP_TGSI_FS_FINE_DERIVATIVE },
687 { o(ARB_draw_buffers_blend), PIPE_CAP_INDEP_BLEND_FUNC },
688 { o(ARB_draw_indirect), PIPE_CAP_DRAW_INDIRECT },
689 { o(ARB_draw_instanced), PIPE_CAP_TGSI_INSTANCEID },
690 { o(ARB_framebuffer_object), PIPE_CAP_MIXED_FRAMEBUFFER_SIZES },
691 { o(ARB_gpu_shader_int64), PIPE_CAP_INT64 },
692 { o(ARB_indirect_parameters), PIPE_CAP_MULTI_DRAW_INDIRECT_PARAMS },
693 { o(ARB_instanced_arrays), PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR },
694 { o(ARB_occlusion_query), PIPE_CAP_OCCLUSION_QUERY },
695 { o(ARB_occlusion_query2), PIPE_CAP_OCCLUSION_QUERY },
696 { o(ARB_pipeline_statistics_query), PIPE_CAP_QUERY_PIPELINE_STATISTICS },
697 { o(ARB_point_sprite), PIPE_CAP_POINT_SPRITE },
698 { o(ARB_polygon_offset_clamp), PIPE_CAP_POLYGON_OFFSET_CLAMP },
699 { o(ARB_post_depth_coverage), PIPE_CAP_POST_DEPTH_COVERAGE },
700 { o(ARB_query_buffer_object), PIPE_CAP_QUERY_BUFFER_OBJECT },
701 { o(ARB_robust_buffer_access_behavior), PIPE_CAP_ROBUST_BUFFER_ACCESS_BEHAVIOR },
702 { o(ARB_sample_shading), PIPE_CAP_SAMPLE_SHADING },
703 { o(ARB_sample_locations), PIPE_CAP_PROGRAMMABLE_SAMPLE_LOCATIONS },
704 { o(ARB_seamless_cube_map), PIPE_CAP_SEAMLESS_CUBE_MAP },
705 { o(ARB_shader_ballot), PIPE_CAP_TGSI_BALLOT },
706 { o(ARB_shader_clock), PIPE_CAP_TGSI_CLOCK },
707 { o(ARB_shader_draw_parameters), PIPE_CAP_DRAW_PARAMETERS },
708 { o(ARB_shader_group_vote), PIPE_CAP_TGSI_VOTE },
709 { o(ARB_shader_stencil_export), PIPE_CAP_SHADER_STENCIL_EXPORT },
710 { o(ARB_shader_texture_image_samples), PIPE_CAP_TGSI_TXQS },
711 { o(ARB_shader_texture_lod), PIPE_CAP_SM3 },
712 { o(ARB_sparse_buffer), PIPE_CAP_SPARSE_BUFFER_PAGE_SIZE },
713 { o(ARB_texture_buffer_object), PIPE_CAP_TEXTURE_BUFFER_OBJECTS },
714 { o(ARB_texture_cube_map_array), PIPE_CAP_CUBE_MAP_ARRAY },
715 { o(ARB_texture_gather), PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS },
716 { o(ARB_texture_mirror_clamp_to_edge), PIPE_CAP_TEXTURE_MIRROR_CLAMP_TO_EDGE },
717 { o(ARB_texture_multisample), PIPE_CAP_TEXTURE_MULTISAMPLE },
718 { o(ARB_texture_non_power_of_two), PIPE_CAP_NPOT_TEXTURES },
719 { o(ARB_texture_query_lod), PIPE_CAP_TEXTURE_QUERY_LOD },
720 { o(ARB_texture_view), PIPE_CAP_SAMPLER_VIEW_TARGET },
721 { o(ARB_timer_query), PIPE_CAP_QUERY_TIMESTAMP },
722 { o(ARB_transform_feedback2), PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME },
723 { o(ARB_transform_feedback3), PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS },
724 { o(ARB_transform_feedback_overflow_query), PIPE_CAP_QUERY_SO_OVERFLOW },
725
726 { o(KHR_blend_equation_advanced), PIPE_CAP_TGSI_FS_FBFETCH },
727
728 { o(EXT_blend_equation_separate), PIPE_CAP_BLEND_EQUATION_SEPARATE },
729 { o(EXT_depth_bounds_test), PIPE_CAP_DEPTH_BOUNDS_TEST },
730 { o(EXT_disjoint_timer_query), PIPE_CAP_QUERY_TIMESTAMP },
731 { o(EXT_draw_buffers2), PIPE_CAP_INDEP_BLEND_ENABLE },
732 { o(EXT_memory_object), PIPE_CAP_MEMOBJ },
733 { o(EXT_memory_object_fd), PIPE_CAP_MEMOBJ },
734 { o(EXT_semaphore), PIPE_CAP_FENCE_SIGNAL },
735 { o(EXT_semaphore_fd), PIPE_CAP_FENCE_SIGNAL },
736 { o(EXT_texture_array), PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS },
737 { o(EXT_texture_filter_anisotropic), PIPE_CAP_ANISOTROPIC_FILTER },
738 { o(EXT_texture_mirror_clamp), PIPE_CAP_TEXTURE_MIRROR_CLAMP },
739 { o(EXT_texture_swizzle), PIPE_CAP_TEXTURE_SWIZZLE },
740 { o(EXT_transform_feedback), PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS },
741 { o(EXT_window_rectangles), PIPE_CAP_MAX_WINDOW_RECTANGLES },
742
743 { o(AMD_framebuffer_multisample_advanced), PIPE_CAP_FRAMEBUFFER_MSAA_CONSTRAINTS },
744 { o(AMD_pinned_memory), PIPE_CAP_RESOURCE_FROM_USER_MEMORY },
745 { o(ATI_meminfo), PIPE_CAP_QUERY_MEMORY_INFO },
746 { o(AMD_seamless_cubemap_per_texture), PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE },
747 { o(ATI_texture_mirror_once), PIPE_CAP_TEXTURE_MIRROR_CLAMP },
748 { o(MESA_tile_raster_order), PIPE_CAP_TILE_RASTER_ORDER },
749 { o(NV_conditional_render), PIPE_CAP_CONDITIONAL_RENDER },
750 { o(NV_fill_rectangle), PIPE_CAP_POLYGON_MODE_FILL_RECTANGLE },
751 { o(NV_primitive_restart), PIPE_CAP_PRIMITIVE_RESTART },
752 { o(NV_texture_barrier), PIPE_CAP_TEXTURE_BARRIER },
753 { o(NVX_gpu_memory_info), PIPE_CAP_QUERY_MEMORY_INFO },
754 /* GL_NV_point_sprite is not supported by gallium because we don't
755 * support the GL_POINT_SPRITE_R_MODE_NV option. */
756
757 { o(OES_standard_derivatives), PIPE_CAP_SM3 },
758 { o(OES_texture_float_linear), PIPE_CAP_TEXTURE_FLOAT_LINEAR },
759 { o(OES_texture_half_float_linear), PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR },
760 };
761
762 /* Required: render target and sampler support */
763 static const struct st_extension_format_mapping rendertarget_mapping[] = {
764 { { o(ARB_texture_float) },
765 { PIPE_FORMAT_R32G32B32A32_FLOAT,
766 PIPE_FORMAT_R16G16B16A16_FLOAT } },
767
768 { { o(OES_texture_float) },
769 { PIPE_FORMAT_R32G32B32A32_FLOAT } },
770
771 { { o(OES_texture_half_float) },
772 { PIPE_FORMAT_R16G16B16A16_FLOAT } },
773
774 { { o(ARB_texture_rgb10_a2ui) },
775 { PIPE_FORMAT_R10G10B10A2_UINT,
776 PIPE_FORMAT_B10G10R10A2_UINT },
777 GL_TRUE }, /* at least one format must be supported */
778
779 { { o(EXT_framebuffer_sRGB) },
780 { PIPE_FORMAT_A8B8G8R8_SRGB,
781 PIPE_FORMAT_B8G8R8A8_SRGB,
782 PIPE_FORMAT_R8G8B8A8_SRGB },
783 GL_TRUE }, /* at least one format must be supported */
784
785 { { o(EXT_packed_float) },
786 { PIPE_FORMAT_R11G11B10_FLOAT } },
787
788 { { o(EXT_texture_integer) },
789 { PIPE_FORMAT_R32G32B32A32_UINT,
790 PIPE_FORMAT_R32G32B32A32_SINT } },
791
792 { { o(ARB_texture_rg) },
793 { PIPE_FORMAT_R8_UNORM,
794 PIPE_FORMAT_R8G8_UNORM } },
795 };
796
797 /* Required: depth stencil and sampler support */
798 static const struct st_extension_format_mapping depthstencil_mapping[] = {
799 { { o(ARB_depth_buffer_float) },
800 { PIPE_FORMAT_Z32_FLOAT,
801 PIPE_FORMAT_Z32_FLOAT_S8X24_UINT } },
802 };
803
804 /* Required: sampler support */
805 static const struct st_extension_format_mapping texture_mapping[] = {
806 { { o(ARB_texture_compression_rgtc) },
807 { PIPE_FORMAT_RGTC1_UNORM,
808 PIPE_FORMAT_RGTC1_SNORM,
809 PIPE_FORMAT_RGTC2_UNORM,
810 PIPE_FORMAT_RGTC2_SNORM } },
811
812 { { o(EXT_texture_compression_latc) },
813 { PIPE_FORMAT_LATC1_UNORM,
814 PIPE_FORMAT_LATC1_SNORM,
815 PIPE_FORMAT_LATC2_UNORM,
816 PIPE_FORMAT_LATC2_SNORM } },
817
818 { { o(EXT_texture_compression_s3tc),
819 o(ANGLE_texture_compression_dxt) },
820 { PIPE_FORMAT_DXT1_RGB,
821 PIPE_FORMAT_DXT1_RGBA,
822 PIPE_FORMAT_DXT3_RGBA,
823 PIPE_FORMAT_DXT5_RGBA } },
824
825 { { o(ARB_texture_compression_bptc) },
826 { PIPE_FORMAT_BPTC_RGBA_UNORM,
827 PIPE_FORMAT_BPTC_SRGBA,
828 PIPE_FORMAT_BPTC_RGB_FLOAT,
829 PIPE_FORMAT_BPTC_RGB_UFLOAT } },
830
831 { { o(KHR_texture_compression_astc_ldr),
832 o(KHR_texture_compression_astc_sliced_3d) },
833 { PIPE_FORMAT_ASTC_4x4,
834 PIPE_FORMAT_ASTC_5x4,
835 PIPE_FORMAT_ASTC_5x5,
836 PIPE_FORMAT_ASTC_6x5,
837 PIPE_FORMAT_ASTC_6x6,
838 PIPE_FORMAT_ASTC_8x5,
839 PIPE_FORMAT_ASTC_8x6,
840 PIPE_FORMAT_ASTC_8x8,
841 PIPE_FORMAT_ASTC_10x5,
842 PIPE_FORMAT_ASTC_10x6,
843 PIPE_FORMAT_ASTC_10x8,
844 PIPE_FORMAT_ASTC_10x10,
845 PIPE_FORMAT_ASTC_12x10,
846 PIPE_FORMAT_ASTC_12x12,
847 PIPE_FORMAT_ASTC_4x4_SRGB,
848 PIPE_FORMAT_ASTC_5x4_SRGB,
849 PIPE_FORMAT_ASTC_5x5_SRGB,
850 PIPE_FORMAT_ASTC_6x5_SRGB,
851 PIPE_FORMAT_ASTC_6x6_SRGB,
852 PIPE_FORMAT_ASTC_8x5_SRGB,
853 PIPE_FORMAT_ASTC_8x6_SRGB,
854 PIPE_FORMAT_ASTC_8x8_SRGB,
855 PIPE_FORMAT_ASTC_10x5_SRGB,
856 PIPE_FORMAT_ASTC_10x6_SRGB,
857 PIPE_FORMAT_ASTC_10x8_SRGB,
858 PIPE_FORMAT_ASTC_10x10_SRGB,
859 PIPE_FORMAT_ASTC_12x10_SRGB,
860 PIPE_FORMAT_ASTC_12x12_SRGB } },
861
862 /* ASTC software fallback support. */
863 { { o(KHR_texture_compression_astc_ldr),
864 o(KHR_texture_compression_astc_sliced_3d) },
865 { PIPE_FORMAT_R8G8B8A8_UNORM,
866 PIPE_FORMAT_R8G8B8A8_SRGB } },
867
868 { { o(EXT_texture_shared_exponent) },
869 { PIPE_FORMAT_R9G9B9E5_FLOAT } },
870
871 { { o(EXT_texture_snorm) },
872 { PIPE_FORMAT_R8G8B8A8_SNORM } },
873
874 { { o(EXT_texture_sRGB),
875 o(EXT_texture_sRGB_decode) },
876 { PIPE_FORMAT_A8B8G8R8_SRGB,
877 PIPE_FORMAT_B8G8R8A8_SRGB,
878 PIPE_FORMAT_A8R8G8B8_SRGB,
879 PIPE_FORMAT_R8G8B8A8_SRGB},
880 GL_TRUE }, /* at least one format must be supported */
881
882 { { o(EXT_texture_type_2_10_10_10_REV) },
883 { PIPE_FORMAT_R10G10B10A2_UNORM,
884 PIPE_FORMAT_B10G10R10A2_UNORM },
885 GL_TRUE }, /* at least one format must be supported */
886
887 { { o(ATI_texture_compression_3dc) },
888 { PIPE_FORMAT_LATC2_UNORM } },
889
890 { { o(MESA_ycbcr_texture) },
891 { PIPE_FORMAT_UYVY,
892 PIPE_FORMAT_YUYV },
893 GL_TRUE }, /* at least one format must be supported */
894
895 { { o(OES_compressed_ETC1_RGB8_texture) },
896 { PIPE_FORMAT_ETC1_RGB8,
897 PIPE_FORMAT_R8G8B8A8_UNORM },
898 GL_TRUE }, /* at least one format must be supported */
899
900 { { o(ARB_stencil_texturing),
901 o(ARB_texture_stencil8) },
902 { PIPE_FORMAT_X24S8_UINT,
903 PIPE_FORMAT_S8X24_UINT },
904 GL_TRUE }, /* at least one format must be supported */
905 };
906
907 /* Required: vertex fetch support. */
908 static const struct st_extension_format_mapping vertex_mapping[] = {
909 { { o(EXT_vertex_array_bgra) },
910 { PIPE_FORMAT_B8G8R8A8_UNORM } },
911 { { o(ARB_vertex_type_2_10_10_10_rev) },
912 { PIPE_FORMAT_R10G10B10A2_UNORM,
913 PIPE_FORMAT_B10G10R10A2_UNORM,
914 PIPE_FORMAT_R10G10B10A2_SNORM,
915 PIPE_FORMAT_B10G10R10A2_SNORM,
916 PIPE_FORMAT_R10G10B10A2_USCALED,
917 PIPE_FORMAT_B10G10R10A2_USCALED,
918 PIPE_FORMAT_R10G10B10A2_SSCALED,
919 PIPE_FORMAT_B10G10R10A2_SSCALED } },
920 { { o(ARB_vertex_type_10f_11f_11f_rev) },
921 { PIPE_FORMAT_R11G11B10_FLOAT } },
922 };
923
924 static const struct st_extension_format_mapping tbo_rgb32[] = {
925 { {o(ARB_texture_buffer_object_rgb32) },
926 { PIPE_FORMAT_R32G32B32_FLOAT,
927 PIPE_FORMAT_R32G32B32_UINT,
928 PIPE_FORMAT_R32G32B32_SINT,
929 } },
930 };
931
932 /*
933 * Extensions that are supported by all Gallium drivers:
934 */
935 extensions->ARB_ES2_compatibility = GL_TRUE;
936 extensions->ARB_depth_texture = GL_TRUE;
937 extensions->ARB_draw_elements_base_vertex = GL_TRUE;
938 extensions->ARB_explicit_attrib_location = GL_TRUE;
939 extensions->ARB_explicit_uniform_location = GL_TRUE;
940 extensions->ARB_fragment_coord_conventions = GL_TRUE;
941 extensions->ARB_fragment_program = GL_TRUE;
942 extensions->ARB_fragment_program_shadow = GL_TRUE;
943 extensions->ARB_fragment_shader = GL_TRUE;
944 extensions->ARB_half_float_vertex = GL_TRUE;
945 extensions->ARB_internalformat_query = GL_TRUE;
946 extensions->ARB_internalformat_query2 = GL_TRUE;
947 extensions->ARB_map_buffer_range = GL_TRUE;
948 extensions->ARB_shadow = GL_TRUE;
949 extensions->ARB_sync = GL_TRUE;
950 extensions->ARB_texture_border_clamp = GL_TRUE;
951 extensions->ARB_texture_cube_map = GL_TRUE;
952 extensions->ARB_texture_env_combine = GL_TRUE;
953 extensions->ARB_texture_env_crossbar = GL_TRUE;
954 extensions->ARB_texture_env_dot3 = GL_TRUE;
955 extensions->ARB_vertex_program = GL_TRUE;
956 extensions->ARB_vertex_shader = GL_TRUE;
957
958 extensions->EXT_blend_color = GL_TRUE;
959 extensions->EXT_blend_func_separate = GL_TRUE;
960 extensions->EXT_blend_minmax = GL_TRUE;
961 extensions->EXT_gpu_program_parameters = GL_TRUE;
962 extensions->EXT_pixel_buffer_object = GL_TRUE;
963 extensions->EXT_point_parameters = GL_TRUE;
964 extensions->EXT_provoking_vertex = GL_TRUE;
965 extensions->EXT_stencil_two_side = GL_TRUE;
966 extensions->EXT_texture_env_dot3 = GL_TRUE;
967
968 extensions->ATI_fragment_shader = GL_TRUE;
969 extensions->ATI_texture_env_combine3 = GL_TRUE;
970
971 extensions->MESA_pack_invert = GL_TRUE;
972
973 extensions->NV_fog_distance = GL_TRUE;
974 extensions->NV_texture_env_combine4 = GL_TRUE;
975 extensions->NV_texture_rectangle = GL_TRUE;
976
977 extensions->OES_EGL_image = GL_TRUE;
978 extensions->OES_EGL_image_external = GL_TRUE;
979 extensions->OES_draw_texture = GL_TRUE;
980
981 /* Expose the extensions which directly correspond to gallium caps. */
982 for (i = 0; i < ARRAY_SIZE(cap_mapping); i++) {
983 if (screen->get_param(screen, cap_mapping[i].cap)) {
984 extension_table[cap_mapping[i].extension_offset] = GL_TRUE;
985 }
986 }
987
988 /* Expose the extensions which directly correspond to gallium formats. */
989 init_format_extensions(screen, extensions, rendertarget_mapping,
990 ARRAY_SIZE(rendertarget_mapping), PIPE_TEXTURE_2D,
991 PIPE_BIND_RENDER_TARGET | PIPE_BIND_SAMPLER_VIEW);
992 init_format_extensions(screen, extensions, depthstencil_mapping,
993 ARRAY_SIZE(depthstencil_mapping), PIPE_TEXTURE_2D,
994 PIPE_BIND_DEPTH_STENCIL | PIPE_BIND_SAMPLER_VIEW);
995 init_format_extensions(screen, extensions, texture_mapping,
996 ARRAY_SIZE(texture_mapping), PIPE_TEXTURE_2D,
997 PIPE_BIND_SAMPLER_VIEW);
998 init_format_extensions(screen, extensions, vertex_mapping,
999 ARRAY_SIZE(vertex_mapping), PIPE_BUFFER,
1000 PIPE_BIND_VERTEX_BUFFER);
1001
1002 /* Figure out GLSL support and set GLSLVersion to it. */
1003 consts->GLSLVersion = screen->get_param(screen, PIPE_CAP_GLSL_FEATURE_LEVEL);
1004 consts->GLSLVersionCompat =
1005 screen->get_param(screen, PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY);
1006
1007 const unsigned GLSLVersion =
1008 api == API_OPENGL_COMPAT ? consts->GLSLVersionCompat :
1009 consts->GLSLVersion;
1010
1011 _mesa_override_glsl_version(consts);
1012
1013 if (options->force_glsl_version > 0 &&
1014 options->force_glsl_version <= GLSLVersion) {
1015 consts->ForceGLSLVersion = options->force_glsl_version;
1016 }
1017
1018 consts->AllowHigherCompatVersion = options->allow_higher_compat_version;
1019
1020 consts->ForceGLSLAbsSqrt = options->force_glsl_abs_sqrt;
1021
1022 consts->AllowGLSLBuiltinVariableRedeclaration = options->allow_glsl_builtin_variable_redeclaration;
1023
1024 consts->dri_config_options_sha1 = options->config_options_sha1;
1025
1026 consts->AllowGLSLCrossStageInterpolationMismatch = options->allow_glsl_cross_stage_interpolation_mismatch;
1027
1028 if (GLSLVersion >= 400)
1029 extensions->ARB_gpu_shader5 = GL_TRUE;
1030 if (GLSLVersion >= 410)
1031 extensions->ARB_shader_precision = GL_TRUE;
1032
1033 /* This extension needs full OpenGL 3.2, but we don't know if that's
1034 * supported at this point. Only check the GLSL version. */
1035 if (GLSLVersion >= 150 &&
1036 screen->get_param(screen, PIPE_CAP_TGSI_VS_LAYER_VIEWPORT)) {
1037 extensions->AMD_vertex_shader_layer = GL_TRUE;
1038 }
1039
1040 if (GLSLVersion >= 140) {
1041 if (screen->get_param(screen, PIPE_CAP_TGSI_ARRAY_COMPONENTS))
1042 extensions->ARB_enhanced_layouts = GL_TRUE;
1043 }
1044
1045 if (GLSLVersion >= 130) {
1046 consts->NativeIntegers = GL_TRUE;
1047 consts->MaxClipPlanes = 8;
1048
1049 if (screen->get_param(screen, PIPE_CAP_VERTEXID_NOBASE)) {
1050 consts->VertexID_is_zero_based = GL_TRUE;
1051 }
1052
1053 /* Extensions that either depend on GLSL 1.30 or are a subset thereof. */
1054 extensions->ARB_conservative_depth = GL_TRUE;
1055 extensions->ARB_shading_language_packing = GL_TRUE;
1056 extensions->OES_depth_texture_cube_map = GL_TRUE;
1057 extensions->ARB_shading_language_420pack = GL_TRUE;
1058 extensions->ARB_texture_query_levels = GL_TRUE;
1059
1060 extensions->ARB_shader_bit_encoding = GL_TRUE;
1061
1062 extensions->EXT_shader_integer_mix = GL_TRUE;
1063 extensions->ARB_arrays_of_arrays = GL_TRUE;
1064 extensions->MESA_shader_integer_functions = GL_TRUE;
1065 } else {
1066 /* Optional integer support for GLSL 1.2. */
1067 if (screen->get_shader_param(screen, PIPE_SHADER_VERTEX,
1068 PIPE_SHADER_CAP_INTEGERS) &&
1069 screen->get_shader_param(screen, PIPE_SHADER_FRAGMENT,
1070 PIPE_SHADER_CAP_INTEGERS)) {
1071 consts->NativeIntegers = GL_TRUE;
1072
1073 extensions->EXT_shader_integer_mix = GL_TRUE;
1074 }
1075
1076 /* Integer textures make no sense before GLSL 1.30 */
1077 extensions->EXT_texture_integer = GL_FALSE;
1078 }
1079
1080 consts->GLSLZeroInit = options->glsl_zero_init;
1081
1082 consts->UniformBooleanTrue = consts->NativeIntegers ? ~0U : fui(1.0f);
1083
1084 /* Below are the cases which cannot be moved into tables easily. */
1085
1086 /* The compatibility profile also requires GLSLVersionCompat >= 400. */
1087 if (screen->get_shader_param(screen, PIPE_SHADER_TESS_CTRL,
1088 PIPE_SHADER_CAP_MAX_INSTRUCTIONS) > 0 &&
1089 (api != API_OPENGL_COMPAT || consts->GLSLVersionCompat >= 400)) {
1090 extensions->ARB_tessellation_shader = GL_TRUE;
1091 }
1092
1093 /* What this is really checking for is the ability to support multiple
1094 * invocations of a geometry shader. There is no separate cap for that, so
1095 * we check the GLSLVersion.
1096 */
1097 if (GLSLVersion >= 400 &&
1098 screen->get_shader_param(screen, PIPE_SHADER_GEOMETRY,
1099 PIPE_SHADER_CAP_MAX_INSTRUCTIONS) > 0) {
1100 extensions->OES_geometry_shader = GL_TRUE;
1101 }
1102
1103 /* Needs PIPE_CAP_SAMPLE_SHADING + all the sample-related bits of
1104 * ARB_gpu_shader5. This enables all the per-sample shading ES extensions.
1105 */
1106 extensions->OES_sample_variables = extensions->ARB_sample_shading &&
1107 extensions->ARB_gpu_shader5;
1108
1109 /* Maximum sample count. */
1110 {
1111 static const enum pipe_format color_formats[] = {
1112 PIPE_FORMAT_R8G8B8A8_UNORM,
1113 PIPE_FORMAT_B8G8R8A8_UNORM,
1114 PIPE_FORMAT_A8R8G8B8_UNORM,
1115 PIPE_FORMAT_A8B8G8R8_UNORM,
1116 };
1117 static const enum pipe_format depth_formats[] = {
1118 PIPE_FORMAT_Z16_UNORM,
1119 PIPE_FORMAT_Z24X8_UNORM,
1120 PIPE_FORMAT_X8Z24_UNORM,
1121 PIPE_FORMAT_Z32_UNORM,
1122 PIPE_FORMAT_Z32_FLOAT
1123 };
1124 static const enum pipe_format int_formats[] = {
1125 PIPE_FORMAT_R8G8B8A8_SINT
1126 };
1127 static const enum pipe_format void_formats[] = {
1128 PIPE_FORMAT_NONE
1129 };
1130
1131 consts->MaxSamples =
1132 get_max_samples_for_formats(screen, ARRAY_SIZE(color_formats),
1133 color_formats, 16,
1134 PIPE_BIND_RENDER_TARGET);
1135
1136 consts->MaxImageSamples =
1137 get_max_samples_for_formats(screen, ARRAY_SIZE(color_formats),
1138 color_formats, 16,
1139 PIPE_BIND_SHADER_IMAGE);
1140
1141 consts->MaxColorTextureSamples =
1142 get_max_samples_for_formats(screen, ARRAY_SIZE(color_formats),
1143 color_formats, consts->MaxSamples,
1144 PIPE_BIND_SAMPLER_VIEW);
1145
1146 consts->MaxDepthTextureSamples =
1147 get_max_samples_for_formats(screen, ARRAY_SIZE(depth_formats),
1148 depth_formats, consts->MaxSamples,
1149 PIPE_BIND_SAMPLER_VIEW);
1150
1151 consts->MaxIntegerSamples =
1152 get_max_samples_for_formats(screen, ARRAY_SIZE(int_formats),
1153 int_formats, consts->MaxSamples,
1154 PIPE_BIND_SAMPLER_VIEW);
1155
1156 /* ARB_framebuffer_no_attachments, assume max no. of samples 32 */
1157 consts->MaxFramebufferSamples =
1158 get_max_samples_for_formats(screen, ARRAY_SIZE(void_formats),
1159 void_formats, 32,
1160 PIPE_BIND_RENDER_TARGET);
1161
1162 if (extensions->AMD_framebuffer_multisample_advanced) {
1163 /* AMD_framebuffer_multisample_advanced */
1164 /* This can be greater than storage samples. */
1165 consts->MaxColorFramebufferSamples =
1166 get_max_samples_for_formats_advanced(screen,
1167 ARRAY_SIZE(color_formats),
1168 color_formats, 16,
1169 consts->MaxSamples,
1170 PIPE_BIND_RENDER_TARGET);
1171
1172 /* If the driver supports N color samples, it means it supports
1173 * N samples and N storage samples. N samples >= N storage
1174 * samples.
1175 */
1176 consts->MaxColorFramebufferStorageSamples = consts->MaxSamples;
1177 consts->MaxDepthStencilFramebufferSamples =
1178 consts->MaxDepthTextureSamples;
1179
1180 assert(consts->MaxColorFramebufferSamples >=
1181 consts->MaxDepthStencilFramebufferSamples);
1182 assert(consts->MaxDepthStencilFramebufferSamples >=
1183 consts->MaxColorFramebufferStorageSamples);
1184
1185 consts->NumSupportedMultisampleModes = 0;
1186
1187 unsigned depth_samples_supported = 0;
1188
1189 for (unsigned samples = 2;
1190 samples <= consts->MaxDepthStencilFramebufferSamples;
1191 samples++) {
1192 if (screen->is_format_supported(screen, PIPE_FORMAT_Z32_FLOAT,
1193 PIPE_TEXTURE_2D, samples, samples,
1194 PIPE_BIND_DEPTH_STENCIL))
1195 depth_samples_supported |= 1 << samples;
1196 }
1197
1198 for (unsigned samples = 2;
1199 samples <= consts->MaxColorFramebufferSamples;
1200 samples++) {
1201 for (unsigned depth_samples = 2;
1202 depth_samples <= samples; depth_samples++) {
1203 if (!(depth_samples_supported & (1 << depth_samples)))
1204 continue;
1205
1206 for (unsigned storage_samples = 2;
1207 storage_samples <= depth_samples; storage_samples++) {
1208 if (screen->is_format_supported(screen,
1209 PIPE_FORMAT_R8G8B8A8_UNORM,
1210 PIPE_TEXTURE_2D,
1211 samples,
1212 storage_samples,
1213 PIPE_BIND_RENDER_TARGET)) {
1214 unsigned i = consts->NumSupportedMultisampleModes;
1215
1216 assert(i < ARRAY_SIZE(consts->SupportedMultisampleModes));
1217 consts->SupportedMultisampleModes[i].NumColorSamples =
1218 samples;
1219 consts->SupportedMultisampleModes[i].NumColorStorageSamples =
1220 storage_samples;
1221 consts->SupportedMultisampleModes[i].NumDepthStencilSamples =
1222 depth_samples;
1223 consts->NumSupportedMultisampleModes++;
1224 }
1225 }
1226 }
1227 }
1228 }
1229 }
1230
1231 if (consts->MaxSamples >= 2) {
1232 /* Real MSAA support */
1233 extensions->EXT_framebuffer_multisample = GL_TRUE;
1234 extensions->EXT_framebuffer_multisample_blit_scaled = GL_TRUE;
1235 }
1236 else if (consts->MaxSamples > 0 &&
1237 screen->get_param(screen, PIPE_CAP_FAKE_SW_MSAA)) {
1238 /* fake MSAA support */
1239 consts->FakeSWMSAA = GL_TRUE;
1240 extensions->EXT_framebuffer_multisample = GL_TRUE;
1241 extensions->EXT_framebuffer_multisample_blit_scaled = GL_TRUE;
1242 extensions->ARB_texture_multisample = GL_TRUE;
1243 }
1244
1245 if (consts->MaxDualSourceDrawBuffers > 0 &&
1246 !options->disable_blend_func_extended)
1247 extensions->ARB_blend_func_extended = GL_TRUE;
1248
1249 if (screen->get_param(screen, PIPE_CAP_QUERY_TIME_ELAPSED) ||
1250 extensions->ARB_timer_query) {
1251 extensions->EXT_timer_query = GL_TRUE;
1252 }
1253
1254 if (extensions->ARB_transform_feedback2 &&
1255 extensions->ARB_draw_instanced) {
1256 extensions->ARB_transform_feedback_instanced = GL_TRUE;
1257 }
1258 if (options->force_glsl_extensions_warn)
1259 consts->ForceGLSLExtensionsWarn = 1;
1260
1261 if (options->disable_glsl_line_continuations)
1262 consts->DisableGLSLLineContinuations = 1;
1263
1264 if (options->allow_glsl_extension_directive_midshader)
1265 consts->AllowGLSLExtensionDirectiveMidShader = GL_TRUE;
1266
1267 if (options->allow_glsl_builtin_const_expression)
1268 consts->AllowGLSLBuiltinConstantExpression = GL_TRUE;
1269
1270 if (options->allow_glsl_relaxed_es)
1271 consts->AllowGLSLRelaxedES = GL_TRUE;
1272
1273 if (options->allow_glsl_layout_qualifier_on_function_parameters)
1274 consts->AllowLayoutQualifiersOnFunctionParameters = GL_TRUE;
1275
1276 consts->MinMapBufferAlignment =
1277 screen->get_param(screen, PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT);
1278
1279 /* The OpenGL Compatibility profile requires arbitrary buffer swizzling. */
1280 if (api == API_OPENGL_COMPAT &&
1281 screen->get_param(screen, PIPE_CAP_BUFFER_SAMPLER_VIEW_RGBA_ONLY))
1282 extensions->ARB_texture_buffer_object = GL_FALSE;
1283
1284 if (extensions->ARB_texture_buffer_object) {
1285 consts->MaxTextureBufferSize =
1286 _min(screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE),
1287 (1u << 31) - 1);
1288 consts->TextureBufferOffsetAlignment =
1289 screen->get_param(screen, PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT);
1290
1291 if (consts->TextureBufferOffsetAlignment)
1292 extensions->ARB_texture_buffer_range = GL_TRUE;
1293
1294 init_format_extensions(screen, extensions, tbo_rgb32,
1295 ARRAY_SIZE(tbo_rgb32), PIPE_BUFFER,
1296 PIPE_BIND_SAMPLER_VIEW);
1297 }
1298
1299 extensions->OES_texture_buffer =
1300 extensions->ARB_texture_buffer_object &&
1301 extensions->ARB_texture_buffer_range &&
1302 extensions->ARB_texture_buffer_object_rgb32 &&
1303 extensions->ARB_shader_image_load_store;
1304
1305 /* Unpacking a varying in the fragment shader costs 1 texture indirection.
1306 * If the number of available texture indirections is very limited, then we
1307 * prefer to disable varying packing rather than run the risk of varying
1308 * packing preventing a shader from running.
1309 */
1310 if (screen->get_shader_param(screen, PIPE_SHADER_FRAGMENT,
1311 PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS) <= 8) {
1312 /* We can't disable varying packing if transform feedback is available,
1313 * because transform feedback code assumes a packed varying layout.
1314 */
1315 if (!extensions->EXT_transform_feedback)
1316 consts->DisableVaryingPacking = GL_TRUE;
1317 }
1318
1319 consts->MaxViewports = screen->get_param(screen, PIPE_CAP_MAX_VIEWPORTS);
1320 if (consts->MaxViewports >= 16) {
1321 if (GLSLVersion >= 400) {
1322 consts->ViewportBounds.Min = -32768.0;
1323 consts->ViewportBounds.Max = 32767.0;
1324 } else {
1325 consts->ViewportBounds.Min = -16384.0;
1326 consts->ViewportBounds.Max = 16383.0;
1327 }
1328 extensions->ARB_viewport_array = GL_TRUE;
1329 extensions->ARB_fragment_layer_viewport = GL_TRUE;
1330 if (extensions->AMD_vertex_shader_layer)
1331 extensions->AMD_vertex_shader_viewport_index = GL_TRUE;
1332 }
1333
1334 if (extensions->AMD_vertex_shader_layer &&
1335 extensions->AMD_vertex_shader_viewport_index &&
1336 screen->get_param(screen, PIPE_CAP_TGSI_TES_LAYER_VIEWPORT))
1337 extensions->ARB_shader_viewport_layer_array = GL_TRUE;
1338
1339 /* ARB_framebuffer_no_attachments */
1340 if (screen->get_param(screen, PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT) &&
1341 ((consts->MaxSamples >= 4 && consts->MaxFramebufferLayers >= 2048) ||
1342 (consts->MaxFramebufferSamples >= consts->MaxSamples &&
1343 consts->MaxFramebufferLayers >= consts->MaxArrayTextureLayers)))
1344 extensions->ARB_framebuffer_no_attachments = GL_TRUE;
1345
1346 /* GL_ARB_ES3_compatibility.
1347 * Check requirements for GLSL ES 3.00.
1348 */
1349 if (GLSLVersion >= 130 &&
1350 extensions->ARB_uniform_buffer_object &&
1351 extensions->ARB_shader_bit_encoding &&
1352 extensions->NV_primitive_restart &&
1353 screen->get_shader_param(screen, PIPE_SHADER_VERTEX,
1354 PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS) >= 16 &&
1355 /* Requirements for ETC2 emulation. */
1356 screen->is_format_supported(screen, PIPE_FORMAT_R8G8B8A8_UNORM,
1357 PIPE_TEXTURE_2D, 0, 0,
1358 PIPE_BIND_SAMPLER_VIEW) &&
1359 screen->is_format_supported(screen, PIPE_FORMAT_R8G8B8A8_SRGB,
1360 PIPE_TEXTURE_2D, 0, 0,
1361 PIPE_BIND_SAMPLER_VIEW) &&
1362 screen->is_format_supported(screen, PIPE_FORMAT_R16_UNORM,
1363 PIPE_TEXTURE_2D, 0, 0,
1364 PIPE_BIND_SAMPLER_VIEW) &&
1365 screen->is_format_supported(screen, PIPE_FORMAT_R16G16_UNORM,
1366 PIPE_TEXTURE_2D, 0, 0,
1367 PIPE_BIND_SAMPLER_VIEW) &&
1368 screen->is_format_supported(screen, PIPE_FORMAT_R16_SNORM,
1369 PIPE_TEXTURE_2D, 0, 0,
1370 PIPE_BIND_SAMPLER_VIEW) &&
1371 screen->is_format_supported(screen, PIPE_FORMAT_R16G16_SNORM,
1372 PIPE_TEXTURE_2D, 0, 0,
1373 PIPE_BIND_SAMPLER_VIEW)) {
1374 extensions->ARB_ES3_compatibility = GL_TRUE;
1375 }
1376
1377 #ifdef HAVE_ST_VDPAU
1378 if (screen->get_video_param &&
1379 screen->get_video_param(screen, PIPE_VIDEO_PROFILE_UNKNOWN,
1380 PIPE_VIDEO_ENTRYPOINT_BITSTREAM,
1381 PIPE_VIDEO_CAP_SUPPORTS_INTERLACED)) {
1382 extensions->NV_vdpau_interop = GL_TRUE;
1383 }
1384 #endif
1385
1386 if (screen->get_param(screen, PIPE_CAP_DOUBLES)) {
1387 extensions->ARB_gpu_shader_fp64 = GL_TRUE;
1388 extensions->ARB_vertex_attrib_64bit = GL_TRUE;
1389 }
1390
1391 if ((ST_DEBUG & DEBUG_GREMEDY) &&
1392 screen->get_param(screen, PIPE_CAP_STRING_MARKER))
1393 extensions->GREMEDY_string_marker = GL_TRUE;
1394
1395 if (screen->get_param(screen, PIPE_CAP_COMPUTE)) {
1396 int compute_supported_irs =
1397 screen->get_shader_param(screen, PIPE_SHADER_COMPUTE,
1398 PIPE_SHADER_CAP_SUPPORTED_IRS);
1399 if (compute_supported_irs & (1 << PIPE_SHADER_IR_TGSI)) {
1400 uint64_t grid_size[3], block_size[3];
1401 uint64_t max_local_size, max_threads_per_block;
1402
1403 screen->get_compute_param(screen, PIPE_SHADER_IR_TGSI,
1404 PIPE_COMPUTE_CAP_MAX_GRID_SIZE, grid_size);
1405 screen->get_compute_param(screen, PIPE_SHADER_IR_TGSI,
1406 PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE, block_size);
1407 screen->get_compute_param(screen, PIPE_SHADER_IR_TGSI,
1408 PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK,
1409 &max_threads_per_block);
1410 screen->get_compute_param(screen, PIPE_SHADER_IR_TGSI,
1411 PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE,
1412 &max_local_size);
1413
1414 consts->MaxComputeWorkGroupInvocations = max_threads_per_block;
1415 consts->MaxComputeSharedMemorySize = max_local_size;
1416
1417 for (i = 0; i < 3; i++) {
1418 consts->MaxComputeWorkGroupCount[i] = grid_size[i];
1419 consts->MaxComputeWorkGroupSize[i] = block_size[i];
1420 }
1421
1422 extensions->ARB_compute_shader =
1423 extensions->ARB_shader_image_load_store &&
1424 extensions->ARB_shader_atomic_counters;
1425
1426 if (extensions->ARB_compute_shader) {
1427 uint64_t max_variable_threads_per_block = 0;
1428
1429 screen->get_compute_param(screen, PIPE_SHADER_IR_TGSI,
1430 PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK,
1431 &max_variable_threads_per_block);
1432
1433 for (i = 0; i < 3; i++) {
1434 /* Clamp the values to avoid having a local work group size
1435 * greater than the maximum number of invocations.
1436 */
1437 consts->MaxComputeVariableGroupSize[i] =
1438 MIN2(consts->MaxComputeWorkGroupSize[i],
1439 max_variable_threads_per_block);
1440 }
1441 consts->MaxComputeVariableGroupInvocations =
1442 max_variable_threads_per_block;
1443
1444 extensions->ARB_compute_variable_group_size =
1445 max_variable_threads_per_block > 0;
1446 }
1447 }
1448 }
1449
1450 if (extensions->EXT_texture_filter_anisotropic &&
1451 screen->get_paramf(screen, PIPE_CAPF_MAX_TEXTURE_ANISOTROPY) >= 16.0)
1452 extensions->ARB_texture_filter_anisotropic = GL_TRUE;
1453
1454 extensions->KHR_robustness = extensions->ARB_robust_buffer_access_behavior;
1455
1456 /* If we support ES 3.1, we support the ES3_1_compatibility ext. However
1457 * there's no clean way of telling whether we would support ES 3.1 from
1458 * here, so copy the condition from compute_version_es2 here. A lot of
1459 * these are redundant, but it is simpler to just have a (near-)exact copy here.
1460 */
1461 extensions->ARB_ES3_1_compatibility =
1462 extensions->ARB_ES3_compatibility &&
1463 extensions->ARB_arrays_of_arrays &&
1464 extensions->ARB_compute_shader &&
1465 extensions->ARB_draw_indirect &&
1466 extensions->ARB_explicit_uniform_location &&
1467 extensions->ARB_framebuffer_no_attachments &&
1468 extensions->ARB_shader_atomic_counters &&
1469 extensions->ARB_shader_image_load_store &&
1470 extensions->ARB_shader_image_size &&
1471 extensions->ARB_shader_storage_buffer_object &&
1472 extensions->ARB_shading_language_packing &&
1473 extensions->ARB_stencil_texturing &&
1474 extensions->ARB_texture_multisample &&
1475 extensions->ARB_gpu_shader5 &&
1476 extensions->EXT_shader_integer_mix;
1477
1478 extensions->OES_texture_cube_map_array =
1479 extensions->ARB_ES3_1_compatibility &&
1480 extensions->OES_geometry_shader &&
1481 extensions->ARB_texture_cube_map_array;
1482
1483 extensions->OES_viewport_array =
1484 extensions->ARB_ES3_1_compatibility &&
1485 extensions->OES_geometry_shader &&
1486 extensions->ARB_viewport_array;
1487
1488 extensions->OES_primitive_bounding_box = extensions->ARB_ES3_1_compatibility;
1489 consts->NoPrimitiveBoundingBoxOutput = true;
1490
1491 extensions->ANDROID_extension_pack_es31a =
1492 extensions->KHR_texture_compression_astc_ldr &&
1493 extensions->KHR_blend_equation_advanced &&
1494 extensions->OES_sample_variables &&
1495 extensions->ARB_shader_image_load_store &&
1496 extensions->ARB_texture_stencil8 &&
1497 extensions->ARB_texture_multisample &&
1498 extensions->OES_copy_image &&
1499 extensions->ARB_draw_buffers_blend &&
1500 extensions->OES_geometry_shader &&
1501 extensions->ARB_gpu_shader5 &&
1502 extensions->OES_primitive_bounding_box &&
1503 extensions->ARB_tessellation_shader &&
1504 extensions->ARB_texture_border_clamp &&
1505 extensions->OES_texture_buffer &&
1506 extensions->OES_texture_cube_map_array &&
1507 extensions->EXT_texture_sRGB_decode;
1508
1509 /* Same deal as for ARB_ES3_1_compatibility - this has to be computed
1510 * before overall versions are selected. Also it's actually a subset of ES
1511 * 3.2, since it doesn't require ASTC or advanced blending.
1512 */
1513 extensions->ARB_ES3_2_compatibility =
1514 extensions->ARB_ES3_1_compatibility &&
1515 extensions->KHR_robustness &&
1516 extensions->ARB_copy_image &&
1517 extensions->ARB_draw_buffers_blend &&
1518 extensions->ARB_draw_elements_base_vertex &&
1519 extensions->OES_geometry_shader &&
1520 extensions->ARB_gpu_shader5 &&
1521 extensions->ARB_sample_shading &&
1522 extensions->ARB_tessellation_shader &&
1523 extensions->ARB_texture_border_clamp &&
1524 extensions->OES_texture_buffer &&
1525 extensions->ARB_texture_cube_map_array &&
1526 extensions->ARB_texture_stencil8 &&
1527 extensions->ARB_texture_multisample;
1528
1529 if (screen->get_param(screen, PIPE_CAP_CONSERVATIVE_RASTER_POST_SNAP_TRIANGLES) &&
1530 screen->get_param(screen, PIPE_CAP_CONSERVATIVE_RASTER_POST_SNAP_POINTS_LINES) &&
1531 screen->get_param(screen, PIPE_CAP_CONSERVATIVE_RASTER_POST_DEPTH_COVERAGE)) {
1532 float max_dilate;
1533 bool pre_snap_triangles, pre_snap_points_lines;
1534
1535 max_dilate = screen->get_paramf(screen, PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE);
1536
1537 pre_snap_triangles =
1538 screen->get_param(screen, PIPE_CAP_CONSERVATIVE_RASTER_PRE_SNAP_TRIANGLES);
1539 pre_snap_points_lines =
1540 screen->get_param(screen, PIPE_CAP_CONSERVATIVE_RASTER_PRE_SNAP_POINTS_LINES);
1541
1542 extensions->NV_conservative_raster =
1543 screen->get_param(screen, PIPE_CAP_MAX_CONSERVATIVE_RASTER_SUBPIXEL_PRECISION_BIAS) > 1;
1544
1545 if (extensions->NV_conservative_raster) {
1546 extensions->NV_conservative_raster_dilate = max_dilate >= 0.75;
1547 extensions->NV_conservative_raster_pre_snap_triangles = pre_snap_triangles;
1548 extensions->NV_conservative_raster_pre_snap =
1549 pre_snap_triangles && pre_snap_points_lines;
1550 }
1551 }
1552 }