glsl: Add parser/compiler support for std430 interface packing qualifier
[mesa.git] / src / glsl / link_uniform_blocks.cpp
1 /*
2 * Copyright © 2012 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
22 */
23
24 #include "main/core.h"
25 #include "ir.h"
26 #include "linker.h"
27 #include "ir_uniform.h"
28 #include "link_uniform_block_active_visitor.h"
29 #include "util/hash_table.h"
30 #include "program.h"
31
32 namespace {
33
34 class ubo_visitor : public program_resource_visitor {
35 public:
36 ubo_visitor(void *mem_ctx, gl_uniform_buffer_variable *variables,
37 unsigned num_variables)
38 : index(0), offset(0), buffer_size(0), variables(variables),
39 num_variables(num_variables), mem_ctx(mem_ctx), is_array_instance(false)
40 {
41 /* empty */
42 }
43
44 void process(const glsl_type *type, const char *name)
45 {
46 this->offset = 0;
47 this->buffer_size = 0;
48 this->is_array_instance = strchr(name, ']') != NULL;
49 this->program_resource_visitor::process(type, name);
50 }
51
52 unsigned index;
53 unsigned offset;
54 unsigned buffer_size;
55 gl_uniform_buffer_variable *variables;
56 unsigned num_variables;
57 void *mem_ctx;
58 bool is_array_instance;
59
60 private:
61 virtual void visit_field(const glsl_type *type, const char *name,
62 bool row_major)
63 {
64 (void) type;
65 (void) name;
66 (void) row_major;
67 assert(!"Should not get here.");
68 }
69
70 virtual void enter_record(const glsl_type *type, const char *,
71 bool row_major) {
72 assert(type->is_record());
73 this->offset = glsl_align(
74 this->offset, type->std140_base_alignment(row_major));
75 }
76
77 virtual void leave_record(const glsl_type *type, const char *,
78 bool row_major) {
79 assert(type->is_record());
80
81 /* If this is the last field of a structure, apply rule #9. The
82 * GL_ARB_uniform_buffer_object spec says:
83 *
84 * "The structure may have padding at the end; the base offset of
85 * the member following the sub-structure is rounded up to the next
86 * multiple of the base alignment of the structure."
87 */
88 this->offset = glsl_align(
89 this->offset, type->std140_base_alignment(row_major));
90 }
91
92 virtual void visit_field(const glsl_type *type, const char *name,
93 bool row_major, const glsl_type *,
94 bool /* last_field */)
95 {
96 assert(this->index < this->num_variables);
97
98 gl_uniform_buffer_variable *v = &this->variables[this->index++];
99
100 v->Name = ralloc_strdup(mem_ctx, name);
101 v->Type = type;
102 v->RowMajor = type->without_array()->is_matrix() && row_major;
103
104 if (this->is_array_instance) {
105 v->IndexName = ralloc_strdup(mem_ctx, name);
106
107 char *open_bracket = strchr(v->IndexName, '[');
108 assert(open_bracket != NULL);
109
110 char *close_bracket = strchr(open_bracket, ']');
111 assert(close_bracket != NULL);
112
113 /* Length of the tail without the ']' but with the NUL.
114 */
115 unsigned len = strlen(close_bracket + 1) + 1;
116
117 memmove(open_bracket, close_bracket + 1, len);
118 } else {
119 v->IndexName = v->Name;
120 }
121
122 unsigned alignment = 0;
123 unsigned size = 0;
124
125 if (v->Type->interface_packing == GLSL_INTERFACE_PACKING_STD430) {
126 alignment = type->std430_base_alignment(v->RowMajor);
127 size = type->std430_size(v->RowMajor);
128 } else {
129 alignment = type->std140_base_alignment(v->RowMajor);
130 size = type->std140_size(v->RowMajor);
131 }
132
133 this->offset = glsl_align(this->offset, alignment);
134 v->Offset = this->offset;
135
136 this->offset += size;
137
138 /* From the GL_ARB_uniform_buffer_object spec:
139 *
140 * "For uniform blocks laid out according to [std140] rules, the
141 * minimum buffer object size returned by the
142 * UNIFORM_BLOCK_DATA_SIZE query is derived by taking the offset of
143 * the last basic machine unit consumed by the last uniform of the
144 * uniform block (including any end-of-array or end-of-structure
145 * padding), adding one, and rounding up to the next multiple of
146 * the base alignment required for a vec4."
147 */
148 this->buffer_size = glsl_align(this->offset, 16);
149 }
150 };
151
152 class count_block_size : public program_resource_visitor {
153 public:
154 count_block_size() : num_active_uniforms(0)
155 {
156 /* empty */
157 }
158
159 unsigned num_active_uniforms;
160
161 private:
162 virtual void visit_field(const glsl_type *type, const char *name,
163 bool row_major)
164 {
165 (void) type;
166 (void) name;
167 (void) row_major;
168 this->num_active_uniforms++;
169 }
170 };
171
172 } /* anonymous namespace */
173
174 struct block {
175 const glsl_type *type;
176 bool has_instance_name;
177 };
178
179 unsigned
180 link_uniform_blocks(void *mem_ctx,
181 struct gl_shader_program *prog,
182 struct gl_shader **shader_list,
183 unsigned num_shaders,
184 struct gl_uniform_block **blocks_ret)
185 {
186 /* This hash table will track all of the uniform blocks that have been
187 * encountered. Since blocks with the same block-name must be the same,
188 * the hash is organized by block-name.
189 */
190 struct hash_table *block_hash =
191 _mesa_hash_table_create(mem_ctx, _mesa_key_hash_string,
192 _mesa_key_string_equal);
193
194 if (block_hash == NULL) {
195 _mesa_error_no_memory(__func__);
196 linker_error(prog, "out of memory\n");
197 return 0;
198 }
199
200 /* Determine which uniform blocks are active.
201 */
202 link_uniform_block_active_visitor v(mem_ctx, block_hash, prog);
203 for (unsigned i = 0; i < num_shaders; i++) {
204 visit_list_elements(&v, shader_list[i]->ir);
205 }
206
207 /* Count the number of active uniform blocks. Count the total number of
208 * active slots in those uniform blocks.
209 */
210 unsigned num_blocks = 0;
211 unsigned num_variables = 0;
212 count_block_size block_size;
213 struct hash_entry *entry;
214
215 hash_table_foreach (block_hash, entry) {
216 const struct link_uniform_block_active *const b =
217 (const struct link_uniform_block_active *) entry->data;
218
219 const glsl_type *const block_type =
220 b->type->is_array() ? b->type->fields.array : b->type;
221
222 assert((b->num_array_elements > 0) == b->type->is_array());
223
224 block_size.num_active_uniforms = 0;
225 block_size.process(block_type, "");
226
227 if (b->num_array_elements > 0) {
228 num_blocks += b->num_array_elements;
229 num_variables += b->num_array_elements
230 * block_size.num_active_uniforms;
231 } else {
232 num_blocks++;
233 num_variables += block_size.num_active_uniforms;
234 }
235
236 }
237
238 if (num_blocks == 0) {
239 assert(num_variables == 0);
240 _mesa_hash_table_destroy(block_hash, NULL);
241 return 0;
242 }
243
244 assert(num_variables != 0);
245
246 /* Allocate storage to hold all of the informatation related to uniform
247 * blocks that can be queried through the API.
248 */
249 gl_uniform_block *blocks =
250 ralloc_array(mem_ctx, gl_uniform_block, num_blocks);
251 gl_uniform_buffer_variable *variables =
252 ralloc_array(blocks, gl_uniform_buffer_variable, num_variables);
253
254 /* Add each variable from each uniform block to the API tracking
255 * structures.
256 */
257 unsigned i = 0;
258 ubo_visitor parcel(blocks, variables, num_variables);
259
260 STATIC_ASSERT(unsigned(GLSL_INTERFACE_PACKING_STD140)
261 == unsigned(ubo_packing_std140));
262 STATIC_ASSERT(unsigned(GLSL_INTERFACE_PACKING_SHARED)
263 == unsigned(ubo_packing_shared));
264 STATIC_ASSERT(unsigned(GLSL_INTERFACE_PACKING_PACKED)
265 == unsigned(ubo_packing_packed));
266 STATIC_ASSERT(unsigned(GLSL_INTERFACE_PACKING_STD430)
267 == unsigned(ubo_packing_std430));
268
269 hash_table_foreach (block_hash, entry) {
270 const struct link_uniform_block_active *const b =
271 (const struct link_uniform_block_active *) entry->data;
272 const glsl_type *block_type = b->type;
273
274 if (b->num_array_elements > 0) {
275 const char *const name = block_type->fields.array->name;
276
277 assert(b->has_instance_name);
278 for (unsigned j = 0; j < b->num_array_elements; j++) {
279 blocks[i].Name = ralloc_asprintf(blocks, "%s[%u]", name,
280 b->array_elements[j]);
281 blocks[i].Uniforms = &variables[parcel.index];
282
283 /* The GL_ARB_shading_language_420pack spec says:
284 *
285 * "If the binding identifier is used with a uniform block
286 * instanced as an array then the first element of the array
287 * takes the specified block binding and each subsequent
288 * element takes the next consecutive uniform block binding
289 * point."
290 */
291 blocks[i].Binding = (b->has_binding) ? b->binding + j : 0;
292
293 blocks[i].UniformBufferSize = 0;
294 blocks[i]._Packing =
295 gl_uniform_block_packing(block_type->interface_packing);
296
297 parcel.process(block_type->fields.array,
298 blocks[i].Name);
299
300 blocks[i].UniformBufferSize = parcel.buffer_size;
301
302 blocks[i].NumUniforms =
303 (unsigned)(ptrdiff_t)(&variables[parcel.index] - blocks[i].Uniforms);
304
305 blocks[i].IsShaderStorage = b->is_shader_storage;
306
307 i++;
308 }
309 } else {
310 blocks[i].Name = ralloc_strdup(blocks, block_type->name);
311 blocks[i].Uniforms = &variables[parcel.index];
312 blocks[i].Binding = (b->has_binding) ? b->binding : 0;
313 blocks[i].UniformBufferSize = 0;
314 blocks[i]._Packing =
315 gl_uniform_block_packing(block_type->interface_packing);
316
317 parcel.process(block_type,
318 b->has_instance_name ? block_type->name : "");
319
320 blocks[i].UniformBufferSize = parcel.buffer_size;
321
322 blocks[i].NumUniforms =
323 (unsigned)(ptrdiff_t)(&variables[parcel.index] - blocks[i].Uniforms);
324
325 blocks[i].IsShaderStorage = b->is_shader_storage;
326
327 i++;
328 }
329 }
330
331 assert(parcel.index == num_variables);
332
333 _mesa_hash_table_destroy(block_hash, NULL);
334
335 *blocks_ret = blocks;
336 return num_blocks;
337 }
338
339 bool
340 link_uniform_blocks_are_compatible(const gl_uniform_block *a,
341 const gl_uniform_block *b)
342 {
343 assert(strcmp(a->Name, b->Name) == 0);
344
345 /* Page 35 (page 42 of the PDF) in section 4.3.7 of the GLSL 1.50 spec says:
346 *
347 * "Matched block names within an interface (as defined above) must
348 * match in terms of having the same number of declarations with the
349 * same sequence of types and the same sequence of member names, as
350 * well as having the same member-wise layout qualification....if a
351 * matching block is declared as an array, then the array sizes must
352 * also match... Any mismatch will generate a link error."
353 *
354 * Arrays are not yet supported, so there is no check for that.
355 */
356 if (a->NumUniforms != b->NumUniforms)
357 return false;
358
359 if (a->_Packing != b->_Packing)
360 return false;
361
362 for (unsigned i = 0; i < a->NumUniforms; i++) {
363 if (strcmp(a->Uniforms[i].Name, b->Uniforms[i].Name) != 0)
364 return false;
365
366 if (a->Uniforms[i].Type != b->Uniforms[i].Type)
367 return false;
368
369 if (a->Uniforms[i].RowMajor != b->Uniforms[i].RowMajor)
370 return false;
371 }
372
373 return true;
374 }