2 * Copyright © 2013 Intel Corporation
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
24 #include "glsl_parser_extras.h"
26 #include "ir_uniform.h"
28 #include "program/hash_table.h"
29 #include "main/macros.h"
33 * Atomic counter as seen by the program.
// One atomic counter entry: active_atomic_buffer::push_back writes the
// members .uniform_loc and .var of this struct.
// NOTE(review): the member declarations and the closing brace are not visible
// in this listing -- confirm against the original file.
35 struct active_atomic_counter
{
41 * Atomic counter buffer referenced by the program. There is a one
42 * to one correspondence between these and the objects that can be
43 * queried using glGetActiveAtomicCounterBufferiv().
// Growable list of active_atomic_counter entries for one buffer, together
// with per-stage reference counts (stage_references) and a size field that
// process_atomic_variable raises to the largest offset + atomic_size() seen.
// NOTE(review): parts of this struct are not visible in this listing (the
// constructor and destructor bodies, the tail of the realloc size expression,
// whatever follows the out-of-memory report, any update of num_counters and
// the declaration of size) -- confirm against the original file.
45 struct active_atomic_buffer
{
// Constructor: null counters pointer, zero num_counters, value-initialized
// stage_references and size 0.
46 active_atomic_buffer()
47 : counters(0), num_counters(0), stage_references(), size(0)
// Destructor.
// NOTE(review): body not visible; presumably releases counters, which
// push_back obtains from realloc -- confirm.
50 ~active_atomic_buffer()
// Stores (uniform_loc, var) in the entry at index num_counters of counters.
55 void push_back(unsigned uniform_loc
, ir_variable
*var
)
57 active_atomic_counter
*new_counters
;
// The realloc result goes into a temporary so counters is not overwritten
// before the NULL check below.
// NOTE(review): the second factor of the size expression is cut off here.
59 new_counters
= (active_atomic_counter
*)
60 realloc(counters
, sizeof(active_atomic_counter
) *
// Allocation failure is reported through _mesa_error_no_memory.
63 if (new_counters
== NULL
) {
64 _mesa_error_no_memory(__func__
);
// Adopt the regrown array and fill in the entry at index num_counters.
68 counters
= new_counters
;
69 counters
[num_counters
].uniform_loc
= uniform_loc
;
70 counters
[num_counters
].var
= var
;
// Entry array and its element count.
74 active_atomic_counter
*counters
;
75 unsigned num_counters
;
// Indexed by shader stage; incremented in process_atomic_variable.
76 unsigned stage_references
[MESA_SHADER_STAGES
];
81 cmp_actives(const void *a
, const void *b
)
83 const active_atomic_counter
*const first
= (active_atomic_counter
*) a
;
84 const active_atomic_counter
*const second
= (active_atomic_counter
*) b
;
86 return int(first
->var
->data
.offset
) - int(second
->var
->data
.offset
);
90 check_atomic_counters_overlap(const ir_variable
*x
, const ir_variable
*y
)
92 return ((x
->data
.offset
>= y
->data
.offset
&&
93 x
->data
.offset
< y
->data
.offset
+ y
->type
->atomic_size()) ||
94 (y
->data
.offset
>= x
->data
.offset
&&
95 y
->data
.offset
< x
->data
.offset
+ x
->type
->atomic_size()));
// Records the atomic counter(s) of variable var, described by type t, in
// buffers[var->data.binding].
//
// When t is an array whose element type is also an array, the function calls
// itself once per outer element, passing the element type and the same
// uniform_loc, var, buffers, num_buffers and offset pointers.
// The remaining statements append (*uniform_loc, var) to the buffer, increment
// stage_references[shader_stage], raise buf->size to at least
// *offset + t->atomic_size(), store *offset in the uniform storage entry at
// index *uniform_loc and advance *offset by t->atomic_size().
//
// NOTE(review): lines are missing from this listing: the last argument of the
// recursive call, the separator between the two cases (presumably an else),
// the code belonging to the first-use comment, and anything after the final
// offset update (uniform_loc is a pointer, so it is presumably advanced
// somewhere) -- confirm against the original file.
99 process_atomic_variable(const glsl_type
*t
, struct gl_shader_program
*prog
,
100 unsigned *uniform_loc
, ir_variable
*var
,
101 active_atomic_buffer
*const buffers
,
102 unsigned *num_buffers
, int *offset
,
103 const unsigned shader_stage
)
105 /* FIXME: Arrays of arrays get counted separately. For example:
106 * x1[3][3][2] = 9 counters
107 * x2[3][2] = 3 counters
110 * However this code marks all the counters as active even when they
113 if (t
->is_array() && t
->fields
.array
->is_array()) {
114 for (unsigned i
= 0; i
< t
->length
; i
++) {
115 process_atomic_variable(t
->fields
.array
, prog
, uniform_loc
,
116 var
, buffers
, num_buffers
, offset
,
// The buffer is selected by the binding of the variable; the uniform storage
// entry is selected by the current value of *uniform_loc.
120 active_atomic_buffer
*buf
= &buffers
[var
->data
.binding
];
121 gl_uniform_storage
*const storage
=
122 &prog
->UniformStorage
[*uniform_loc
];
124 /* If this is the first time the buffer is used, increment
125 * the counter of buffers used.
130 buf
->push_back(*uniform_loc
, var
);
132 buf
->stage_references
[shader_stage
]++;
133 buf
->size
= MAX2(buf
->size
, *offset
+ t
->atomic_size());
135 storage
->offset
= *offset
;
136 *offset
+= t
->atomic_size();
// Collects the atomic counters used by a program, grouped by buffer binding.
//
// Allocates, with new[], one active_atomic_buffer per possible binding
// (ctx->Const.MaxAtomicBufferBindings).  It then walks the IR list of each
// entry of prog->_LinkedShaders and hands every variable whose type contains
// an atomic to process_atomic_variable, starting from the data.offset and
// data.location of the variable.  Finally, for each binding, the counters are
// passed to qsort and adjacent pairs are checked: a pair that overlaps
// (check_atomic_counters_overlap) while having different names produces a
// linker_error.
//
// NOTE(review): lines are missing from this listing: any initialization of
// *num_buffers, any test for a stage without a linked shader, the statement
// controlled by the size == 0 test, the comparator argument of qsort
// (presumably cmp_actives) and the return statement -- confirm against the
// original file.  Callers assign the result to an active_atomic_buffer
// pointer and index it by binding.
142 active_atomic_buffer
*
143 find_active_atomic_counters(struct gl_context
*ctx
,
144 struct gl_shader_program
*prog
,
145 unsigned *num_buffers
)
147 active_atomic_buffer
*const buffers
=
148 new active_atomic_buffer
[ctx
->Const
.MaxAtomicBufferBindings
];
// First pass: gather the atomic variables of every shader stage.
152 for (unsigned i
= 0; i
< MESA_SHADER_STAGES
; ++i
) {
153 struct gl_shader
*sh
= prog
->_LinkedShaders
[i
];
157 foreach_in_list(ir_instruction
, node
, sh
->ir
) {
158 ir_variable
*var
= node
->as_variable();
160 if (var
&& var
->type
->contains_atomic()) {
161 int offset
= var
->data
.offset
;
162 unsigned uniform_loc
= var
->data
.location
;
163 process_atomic_variable(var
->type
, prog
, &uniform_loc
,
164 var
, buffers
, num_buffers
, &offset
, i
);
// Second pass: per binding, sort the counters and look for conflicts.
169 for (unsigned i
= 0; i
< ctx
->Const
.MaxAtomicBufferBindings
; i
++) {
170 if (buffers
[i
].size
== 0)
173 qsort(buffers
[i
].counters
, buffers
[i
].num_counters
,
174 sizeof(active_atomic_counter
),
// Only neighbouring entries (j-1, j) are compared.
177 for (unsigned j
= 1; j
< buffers
[i
].num_counters
; j
++) {
178 /* If an overlapping counter found, it must be a reference to the
179 * same counter from a different shader stage.
181 if (check_atomic_counters_overlap(buffers
[i
].counters
[j
-1].var
,
182 buffers
[i
].counters
[j
].var
)
183 && strcmp(buffers
[i
].counters
[j
-1].var
->name
,
184 buffers
[i
].counters
[j
].var
->name
) != 0) {
185 linker_error(prog
, "Atomic counter %s declared at offset %d "
186 "which is already in use.",
187 buffers
[i
].counters
[j
].var
->name
,
188 buffers
[i
].counters
[j
].var
->data
.offset
);
// Assigns atomic counter buffer resources for a linked program.
// Visible steps:
//   1. find_active_atomic_counters collects the per-binding buffers (abs).
//   2. prog->AtomicBuffers is allocated with rzalloc_array and
//      prog->NumAtomicBuffers is set to num_buffers.
//   3. For every binding, the size == 0 test is applied, then one
//      gl_active_atomic_buffer (mab) is filled in from the matching
//      active_atomic_buffer (ab): Binding, MinimumSize, Uniforms,
//      NumUniforms, the uniform storage of each counter and the per-stage
//      StageReferences flags.
//   4. For every linked stage that references at least one buffer, a list
//      of buffer pointers is allocated for the stage and the opaque[stage]
//      index and active fields of each uniform of a referenced buffer are
//      assigned.
// NOTE(review): lines are missing from this listing: the declaration and
// increment of i (the index into prog->AtomicBuffers), the increment of
// binding, the statement controlled by the size == 0 test, the element counts
// passed to the first two rzalloc_array calls, the separator between the
// GL_TRUE and GL_FALSE assignments, the right-hand sides of the three
// assignments near the end and any release of abs -- confirm against the
// original file.
197 link_assign_atomic_counter_resources(struct gl_context
*ctx
,
198 struct gl_shader_program
*prog
)
200 unsigned num_buffers
;
201 unsigned num_atomic_buffers
[MESA_SHADER_STAGES
] = {};
202 active_atomic_buffer
*abs
=
203 find_active_atomic_counters(ctx
, prog
, &num_buffers
);
205 prog
->AtomicBuffers
= rzalloc_array(prog
, gl_active_atomic_buffer
,
207 prog
->NumAtomicBuffers
= num_buffers
;
210 for (unsigned binding
= 0;
211 binding
< ctx
->Const
.MaxAtomicBufferBindings
;
214 /* If the binding was not used, skip.
216 if (abs
[binding
].size
== 0)
219 active_atomic_buffer
&ab
= abs
[binding
];
220 gl_active_atomic_buffer
&mab
= prog
->AtomicBuffers
[i
];
222 /* Assign buffer-specific fields. */
223 mab
.Binding
= binding
;
224 mab
.MinimumSize
= ab
.size
;
// The Uniforms array is allocated with prog->AtomicBuffers as its first
// rzalloc_array argument.
225 mab
.Uniforms
= rzalloc_array(prog
->AtomicBuffers
, GLuint
,
227 mab
.NumUniforms
= ab
.num_counters
;
229 /* Assign counter-specific fields. */
230 for (unsigned j
= 0; j
< ab
.num_counters
; j
++) {
231 ir_variable
*const var
= ab
.counters
[j
].var
;
232 gl_uniform_storage
*const storage
=
233 &prog
->UniformStorage
[ab
.counters
[j
].uniform_loc
];
235 mab
.Uniforms
[j
] = ab
.counters
[j
].uniform_loc
;
// A variable without an explicit binding gets its binding set to i.
236 if (!var
->data
.explicit_binding
)
237 var
->data
.binding
= i
;
239 storage
->atomic_buffer_index
= i
;
240 storage
->offset
= var
->data
.offset
;
// Array stride is the atomic size of the element type for arrays, else 0.
241 storage
->array_stride
= (var
->type
->is_array() ?
242 var
->type
->without_array()->atomic_size() : 0);
243 if (!var
->type
->is_matrix())
244 storage
->matrix_stride
= 0;
247 /* Assign stage-specific fields. */
248 for (unsigned j
= 0; j
< MESA_SHADER_STAGES
; ++j
) {
249 if (ab
.stage_references
[j
]) {
250 mab
.StageReferences
[j
] = GL_TRUE
;
251 num_atomic_buffers
[j
]++;
253 mab
.StageReferences
[j
] = GL_FALSE
;
260 /* Store a list pointers to atomic buffers per stage and store the index
261 * to the intra-stage buffer list in uniform storage.
263 for (unsigned j
= 0; j
< MESA_SHADER_STAGES
; ++j
) {
264 if (prog
->_LinkedShaders
[j
] && num_atomic_buffers
[j
] > 0) {
265 prog
->_LinkedShaders
[j
]->NumAtomicBuffers
= num_atomic_buffers
[j
];
266 prog
->_LinkedShaders
[j
]->AtomicBuffers
=
267 rzalloc_array(prog
, gl_active_atomic_buffer
*,
268 num_atomic_buffers
[j
]);
// intra_stage_idx indexes the per-stage list; it starts at 0 for each stage.
270 unsigned intra_stage_idx
= 0;
271 for (unsigned i
= 0; i
< num_buffers
; i
++) {
272 struct gl_active_atomic_buffer
*atomic_buffer
=
273 &prog
->AtomicBuffers
[i
];
274 if (atomic_buffer
->StageReferences
[j
]) {
275 prog
->_LinkedShaders
[j
]->AtomicBuffers
[intra_stage_idx
] =
278 for (unsigned u
= 0; u
< atomic_buffer
->NumUniforms
; u
++) {
279 prog
->UniformStorage
[atomic_buffer
->Uniforms
[u
]].opaque
[j
].index
=
281 prog
->UniformStorage
[atomic_buffer
->Uniforms
[u
]].opaque
[j
].active
=
// Sanity check: i is expected to equal num_buffers at this point.
292 assert(i
== num_buffers
);
// Checks the atomic counter usage of a program against the limits in ctx.
//
// Using the buffers returned by find_active_atomic_counters, it accumulates
// per-stage totals (atomic_counters, atomic_buffers) and combined totals
// (total_atomic_counters, total_atomic_buffers), then calls linker_error when
// a per-stage limit (ctx->Const.Program[stage].MaxAtomicCounters or
// MaxAtomicBuffers) or a combined limit (ctx->Const.MaxCombinedAtomicCounters
// or MaxCombinedAtomicBuffers) is exceeded.
//
// NOTE(review): lines are missing from the accumulation loop in this listing
// (the statement controlled by the size == 0 test, whatever guards the sums,
// and the update of atomic_buffers), and no release of abs is visible --
// confirm against the original file.
296 link_check_atomic_counter_resources(struct gl_context
*ctx
,
297 struct gl_shader_program
*prog
)
299 unsigned num_buffers
;
300 active_atomic_buffer
*const abs
=
301 find_active_atomic_counters(ctx
, prog
, &num_buffers
);
302 unsigned atomic_counters
[MESA_SHADER_STAGES
] = {};
303 unsigned atomic_buffers
[MESA_SHADER_STAGES
] = {};
304 unsigned total_atomic_counters
= 0;
305 unsigned total_atomic_buffers
= 0;
307 /* Sum the required resources. Note that this counts buffers and
308 * counters referenced by several shader stages multiple times
309 * against the combined limit -- That's the behavior the spec
312 for (unsigned i
= 0; i
< ctx
->Const
.MaxAtomicBufferBindings
; i
++) {
313 if (abs
[i
].size
== 0)
316 for (unsigned j
= 0; j
< MESA_SHADER_STAGES
; ++j
) {
// n is the number of references stage j makes to buffer i.
317 const unsigned n
= abs
[i
].stage_references
[j
];
320 atomic_counters
[j
] += n
;
321 total_atomic_counters
+= n
;
323 total_atomic_buffers
++;
328 /* Check that they are within the supported limits. */
329 for (unsigned i
= 0; i
< MESA_SHADER_STAGES
; i
++) {
330 if (atomic_counters
[i
] > ctx
->Const
.Program
[i
].MaxAtomicCounters
)
331 linker_error(prog
, "Too many %s shader atomic counters",
332 _mesa_shader_stage_to_string(i
));
334 if (atomic_buffers
[i
] > ctx
->Const
.Program
[i
].MaxAtomicBuffers
)
335 linker_error(prog
, "Too many %s shader atomic counter buffers",
336 _mesa_shader_stage_to_string(i
));
339 if (total_atomic_counters
> ctx
->Const
.MaxCombinedAtomicCounters
)
340 linker_error(prog
, "Too many combined atomic counters");
342 if (total_atomic_buffers
> ctx
->Const
.MaxCombinedAtomicBuffers
)
343 linker_error(prog
, "Too many combined atomic buffers");