2 * Copyright © 2010 Intel Corporation
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
24 #include "glsl_symbol_table.h"
26 #include "compiler/glsl_types.h"
28 #include "main/core.h" /* for MIN2 */
29 #include "main/shaderobj.h"
32 convert_component(ir_rvalue
*src
, const glsl_type
*desired_type
);
35 apply_implicit_conversion(const glsl_type
*to
, ir_rvalue
* &from
,
36 struct _mesa_glsl_parse_state
*state
);
39 process_parameters(exec_list
*instructions
, exec_list
*actual_parameters
,
40 exec_list
*parameters
,
41 struct _mesa_glsl_parse_state
*state
)
45 foreach_list_typed(ast_node
, ast
, link
, parameters
) {
46 ir_rvalue
*result
= ast
->hir(instructions
, state
);
48 ir_constant
*const constant
= result
->constant_expression_value();
52 actual_parameters
->push_tail(result
);
61 * Generate a source prototype for a function signature
63 * \param return_type Return type of the function. May be \c NULL.
64 * \param name Name of the function.
65 * \param parameters List of \c ir_instruction nodes representing the
66 * parameter list for the function. This may be either a
67 * formal (\c ir_variable) or actual (\c ir_rvalue)
68 * parameter list. Only the type is used.
71 * A ralloced string representing the prototype of the function.
74 prototype_string(const glsl_type
*return_type
, const char *name
,
75 exec_list
*parameters
)
79 if (return_type
!= NULL
)
80 str
= ralloc_asprintf(NULL
, "%s ", return_type
->name
);
82 ralloc_asprintf_append(&str
, "%s(", name
);
84 const char *comma
= "";
85 foreach_in_list(const ir_variable
, param
, parameters
) {
86 ralloc_asprintf_append(&str
, "%s%s", comma
, param
->type
->name
);
90 ralloc_strcat(&str
, ")");
95 verify_image_parameter(YYLTYPE
*loc
, _mesa_glsl_parse_state
*state
,
96 const ir_variable
*formal
, const ir_variable
*actual
)
99 * From the ARB_shader_image_load_store specification:
101 * "The values of image variables qualified with coherent,
102 * volatile, restrict, readonly, or writeonly may not be passed
103 * to functions whose formal parameters lack such
104 * qualifiers. [...] It is legal to have additional qualifiers
105 * on a formal parameter, but not to have fewer."
107 if (actual
->data
.image_coherent
&& !formal
->data
.image_coherent
) {
108 _mesa_glsl_error(loc
, state
,
109 "function call parameter `%s' drops "
110 "`coherent' qualifier", formal
->name
);
114 if (actual
->data
.image_volatile
&& !formal
->data
.image_volatile
) {
115 _mesa_glsl_error(loc
, state
,
116 "function call parameter `%s' drops "
117 "`volatile' qualifier", formal
->name
);
121 if (actual
->data
.image_restrict
&& !formal
->data
.image_restrict
) {
122 _mesa_glsl_error(loc
, state
,
123 "function call parameter `%s' drops "
124 "`restrict' qualifier", formal
->name
);
128 if (actual
->data
.image_read_only
&& !formal
->data
.image_read_only
) {
129 _mesa_glsl_error(loc
, state
,
130 "function call parameter `%s' drops "
131 "`readonly' qualifier", formal
->name
);
135 if (actual
->data
.image_write_only
&& !formal
->data
.image_write_only
) {
136 _mesa_glsl_error(loc
, state
,
137 "function call parameter `%s' drops "
138 "`writeonly' qualifier", formal
->name
);
146 verify_first_atomic_parameter(YYLTYPE
*loc
, _mesa_glsl_parse_state
*state
,
150 (!var
->is_in_shader_storage_block() &&
151 var
->data
.mode
!= ir_var_shader_shared
)) {
152 _mesa_glsl_error(loc
, state
, "First argument to atomic function "
153 "must be a buffer or shared variable");
160 is_atomic_function(const char *func_name
)
162 return !strcmp(func_name
, "atomicAdd") ||
163 !strcmp(func_name
, "atomicMin") ||
164 !strcmp(func_name
, "atomicMax") ||
165 !strcmp(func_name
, "atomicAnd") ||
166 !strcmp(func_name
, "atomicOr") ||
167 !strcmp(func_name
, "atomicXor") ||
168 !strcmp(func_name
, "atomicExchange") ||
169 !strcmp(func_name
, "atomicCompSwap");
173 * Verify that 'out' and 'inout' actual parameters are lvalues. Also, verify
174 * that 'const_in' formal parameters (an extension in our IR) correspond to
175 * ir_constant actual parameters.
178 verify_parameter_modes(_mesa_glsl_parse_state
*state
,
179 ir_function_signature
*sig
,
180 exec_list
&actual_ir_parameters
,
181 exec_list
&actual_ast_parameters
)
183 exec_node
*actual_ir_node
= actual_ir_parameters
.head
;
184 exec_node
*actual_ast_node
= actual_ast_parameters
.head
;
186 foreach_in_list(const ir_variable
, formal
, &sig
->parameters
) {
187 /* The lists must be the same length. */
188 assert(!actual_ir_node
->is_tail_sentinel());
189 assert(!actual_ast_node
->is_tail_sentinel());
191 const ir_rvalue
*const actual
= (ir_rvalue
*) actual_ir_node
;
192 const ast_expression
*const actual_ast
=
193 exec_node_data(ast_expression
, actual_ast_node
, link
);
195 /* FIXME: 'loc' is incorrect (as of 2011-01-21). It is always
198 YYLTYPE loc
= actual_ast
->get_location();
200 /* Verify that 'const_in' parameters are ir_constants. */
201 if (formal
->data
.mode
== ir_var_const_in
&&
202 actual
->ir_type
!= ir_type_constant
) {
203 _mesa_glsl_error(&loc
, state
,
204 "parameter `in %s' must be a constant expression",
209 /* Verify that shader_in parameters are shader inputs */
210 if (formal
->data
.must_be_shader_input
) {
211 ir_variable
*var
= actual
->variable_referenced();
212 if (var
&& var
->data
.mode
!= ir_var_shader_in
) {
213 _mesa_glsl_error(&loc
, state
,
214 "parameter `%s` must be a shader input",
219 if (actual
->ir_type
== ir_type_swizzle
) {
220 _mesa_glsl_error(&loc
, state
,
221 "parameter `%s` must not be swizzled",
227 /* Verify that 'out' and 'inout' actual parameters are lvalues. */
228 if (formal
->data
.mode
== ir_var_function_out
229 || formal
->data
.mode
== ir_var_function_inout
) {
230 const char *mode
= NULL
;
231 switch (formal
->data
.mode
) {
232 case ir_var_function_out
: mode
= "out"; break;
233 case ir_var_function_inout
: mode
= "inout"; break;
234 default: assert(false); break;
237 /* This AST-based check catches errors like f(i++). The IR-based
238 * is_lvalue() is insufficient because the actual parameter at the
239 * IR-level is just a temporary value, which is an l-value.
241 if (actual_ast
->non_lvalue_description
!= NULL
) {
242 _mesa_glsl_error(&loc
, state
,
243 "function parameter '%s %s' references a %s",
245 actual_ast
->non_lvalue_description
);
249 ir_variable
*var
= actual
->variable_referenced();
251 var
->data
.assigned
= true;
253 if (var
&& var
->data
.read_only
) {
254 _mesa_glsl_error(&loc
, state
,
255 "function parameter '%s %s' references the "
256 "read-only variable '%s'",
258 actual
->variable_referenced()->name
);
260 } else if (!actual
->is_lvalue()) {
261 _mesa_glsl_error(&loc
, state
,
262 "function parameter '%s %s' is not an lvalue",
268 if (formal
->type
->is_image() &&
269 actual
->variable_referenced()) {
270 if (!verify_image_parameter(&loc
, state
, formal
,
271 actual
->variable_referenced()))
275 actual_ir_node
= actual_ir_node
->next
;
276 actual_ast_node
= actual_ast_node
->next
;
279 /* The first parameter of atomic functions must be a buffer variable */
280 const char *func_name
= sig
->function_name();
281 bool is_atomic
= is_atomic_function(func_name
);
283 const ir_rvalue
*const actual
= (ir_rvalue
*) actual_ir_parameters
.head
;
285 const ast_expression
*const actual_ast
=
286 exec_node_data(ast_expression
, actual_ast_parameters
.head
, link
);
287 YYLTYPE loc
= actual_ast
->get_location();
289 if (!verify_first_atomic_parameter(&loc
, state
,
290 actual
->variable_referenced())) {
299 fix_parameter(void *mem_ctx
, ir_rvalue
*actual
, const glsl_type
*formal_type
,
300 exec_list
*before_instructions
, exec_list
*after_instructions
,
301 bool parameter_is_inout
)
303 ir_expression
*const expr
= actual
->as_expression();
305 /* If the types match exactly and the parameter is not a vector-extract,
306 * nothing needs to be done to fix the parameter.
308 if (formal_type
== actual
->type
309 && (expr
== NULL
|| expr
->operation
!= ir_binop_vector_extract
))
312 /* To convert an out parameter, we need to create a temporary variable to
313 * hold the value before conversion, and then perform the conversion after
314 * the function call returns.
316 * This has the effect of transforming code like this:
322 * Into IR that's equivalent to this:
326 * int out_parameter_conversion;
327 * f(out_parameter_conversion);
328 * value = float(out_parameter_conversion);
330 * If the parameter is an ir_expression of ir_binop_vector_extract,
331 * additional conversion is needed in the post-call re-write.
334 new(mem_ctx
) ir_variable(formal_type
, "inout_tmp", ir_var_temporary
);
336 before_instructions
->push_tail(tmp
);
338 /* If the parameter is an inout parameter, copy the value of the actual
339 * parameter to the new temporary. Note that no type conversion is allowed
340 * here because inout parameters must match types exactly.
342 if (parameter_is_inout
) {
343 /* Inout parameters should never require conversion, since that would
344 * require an implicit conversion to exist both to and from the formal
345 * parameter type, and there are no bidirectional implicit conversions.
347 assert (actual
->type
== formal_type
);
349 ir_dereference_variable
*const deref_tmp_1
=
350 new(mem_ctx
) ir_dereference_variable(tmp
);
351 ir_assignment
*const assignment
=
352 new(mem_ctx
) ir_assignment(deref_tmp_1
, actual
);
353 before_instructions
->push_tail(assignment
);
356 /* Replace the parameter in the call with a dereference of the new
359 ir_dereference_variable
*const deref_tmp_2
=
360 new(mem_ctx
) ir_dereference_variable(tmp
);
361 actual
->replace_with(deref_tmp_2
);
364 /* Copy the temporary variable to the actual parameter with optional
365 * type conversion applied.
367 ir_rvalue
*rhs
= new(mem_ctx
) ir_dereference_variable(tmp
);
368 if (actual
->type
!= formal_type
)
369 rhs
= convert_component(rhs
, actual
->type
);
371 ir_rvalue
*lhs
= actual
;
372 if (expr
!= NULL
&& expr
->operation
== ir_binop_vector_extract
) {
373 lhs
= new(mem_ctx
) ir_dereference_array(expr
->operands
[0]->clone(mem_ctx
, NULL
),
374 expr
->operands
[1]->clone(mem_ctx
, NULL
));
377 ir_assignment
*const assignment_2
= new(mem_ctx
) ir_assignment(lhs
, rhs
);
378 after_instructions
->push_tail(assignment_2
);
382 * Generate a function call.
384 * For non-void functions, this returns a dereference of the temporary variable
385 * which stores the return value for the call. For void functions, this returns
389 generate_call(exec_list
*instructions
, ir_function_signature
*sig
,
390 exec_list
*actual_parameters
,
391 ir_variable
*sub_var
,
392 ir_rvalue
*array_idx
,
393 struct _mesa_glsl_parse_state
*state
)
396 exec_list post_call_conversions
;
398 /* Perform implicit conversion of arguments. For out parameters, we need
399 * to place them in a temporary variable and do the conversion after the
400 * call takes place. Since we haven't emitted the call yet, we'll place
401 * the post-call conversions in a temporary exec_list, and emit them later.
403 foreach_two_lists(formal_node
, &sig
->parameters
,
404 actual_node
, actual_parameters
) {
405 ir_rvalue
*actual
= (ir_rvalue
*) actual_node
;
406 ir_variable
*formal
= (ir_variable
*) formal_node
;
408 if (formal
->type
->is_numeric() || formal
->type
->is_boolean()) {
409 switch (formal
->data
.mode
) {
410 case ir_var_const_in
:
411 case ir_var_function_in
: {
413 = convert_component(actual
, formal
->type
);
414 actual
->replace_with(converted
);
417 case ir_var_function_out
:
418 case ir_var_function_inout
:
419 fix_parameter(ctx
, actual
, formal
->type
,
420 instructions
, &post_call_conversions
,
421 formal
->data
.mode
== ir_var_function_inout
);
424 assert (!"Illegal formal parameter mode");
430 /* Section 4.3.2 (Const) of the GLSL 1.10.59 spec says:
432 * "Initializers for const declarations must be formed from literal
433 * values, other const variables (not including function call
434 * paramaters), or expressions of these.
436 * Constructors may be used in such expressions, but function calls may
439 * Section 4.3.3 (Constant Expressions) of the GLSL 1.20.8 spec says:
441 * "A constant expression is one of
445 * - a built-in function call whose arguments are all constant
446 * expressions, with the exception of the texture lookup
447 * functions, the noise functions, and ftransform. The built-in
448 * functions dFdx, dFdy, and fwidth must return 0 when evaluated
449 * inside an initializer with an argument that is a constant
452 * Section 5.10 (Constant Expressions) of the GLSL ES 1.00.17 spec says:
454 * "A constant expression is one of
458 * - a built-in function call whose arguments are all constant
459 * expressions, with the exception of the texture lookup
462 * Section 4.3.3 (Constant Expressions) of the GLSL ES 3.00.4 spec says:
464 * "A constant expression is one of
468 * - a built-in function call whose arguments are all constant
469 * expressions, with the exception of the texture lookup
470 * functions. The built-in functions dFdx, dFdy, and fwidth must
471 * return 0 when evaluated inside an initializer with an argument
472 * that is a constant expression."
474 * If the function call is a constant expression, don't generate any
475 * instructions; just generate an ir_constant.
477 if (state
->is_version(120, 100)) {
478 ir_constant
*value
= sig
->constant_expression_value(actual_parameters
, NULL
);
484 ir_dereference_variable
*deref
= NULL
;
485 if (!sig
->return_type
->is_void()) {
486 /* Create a new temporary to hold the return value. */
487 char *const name
= ir_variable::temporaries_allocate_names
488 ? ralloc_asprintf(ctx
, "%s_retval", sig
->function_name())
493 var
= new(ctx
) ir_variable(sig
->return_type
, name
, ir_var_temporary
);
494 instructions
->push_tail(var
);
498 deref
= new(ctx
) ir_dereference_variable(var
);
501 ir_call
*call
= new(ctx
) ir_call(sig
, deref
, actual_parameters
, sub_var
, array_idx
);
502 instructions
->push_tail(call
);
504 /* Also emit any necessary out-parameter conversions. */
505 instructions
->append_list(&post_call_conversions
);
507 return deref
? deref
->clone(ctx
, NULL
) : NULL
;
511 * Given a function name and parameter list, find the matching signature.
513 static ir_function_signature
*
514 match_function_by_name(const char *name
,
515 exec_list
*actual_parameters
,
516 struct _mesa_glsl_parse_state
*state
)
519 ir_function
*f
= state
->symbols
->get_function(name
);
520 ir_function_signature
*local_sig
= NULL
;
521 ir_function_signature
*sig
= NULL
;
523 /* Is the function hidden by a record type constructor? */
524 if (state
->symbols
->get_type(name
))
525 goto done
; /* no match */
527 /* Is the function hidden by a variable (impossible in 1.10)? */
528 if (!state
->symbols
->separate_function_namespace
529 && state
->symbols
->get_variable(name
))
530 goto done
; /* no match */
533 /* In desktop GL, the presence of a user-defined signature hides any
534 * built-in signatures, so we must ignore them. In contrast, in ES2
535 * user-defined signatures add new overloads, so we must consider them.
537 bool allow_builtins
= state
->es_shader
|| !f
->has_user_signature();
539 /* Look for a match in the local shader. If exact, we're done. */
540 bool is_exact
= false;
541 sig
= local_sig
= f
->matching_signature(state
, actual_parameters
,
542 allow_builtins
, &is_exact
);
550 /* Local shader has no exact candidates; check the built-ins. */
551 _mesa_glsl_initialize_builtin_functions();
552 sig
= _mesa_glsl_find_builtin_function(state
, name
, actual_parameters
);
556 /* If the match is from a linked built-in shader, import the prototype. */
557 if (sig
!= local_sig
) {
559 f
= new(ctx
) ir_function(name
);
560 state
->symbols
->add_global_function(f
);
561 emit_function(state
, f
);
563 sig
= sig
->clone_prototype(f
, NULL
);
564 f
->add_signature(sig
);
570 static ir_function_signature
*
571 match_subroutine_by_name(const char *name
,
572 exec_list
*actual_parameters
,
573 struct _mesa_glsl_parse_state
*state
,
577 ir_function_signature
*sig
= NULL
;
578 ir_function
*f
, *found
= NULL
;
579 const char *new_name
;
581 bool is_exact
= false;
583 new_name
= ralloc_asprintf(ctx
, "%s_%s", _mesa_shader_stage_to_subroutine_prefix(state
->stage
), name
);
584 var
= state
->symbols
->get_variable(new_name
);
588 for (int i
= 0; i
< state
->num_subroutine_types
; i
++) {
589 f
= state
->subroutine_types
[i
];
590 if (strcmp(f
->name
, var
->type
->without_array()->name
))
599 sig
= found
->matching_signature(state
, actual_parameters
,
605 generate_array_index(void *mem_ctx
, exec_list
*instructions
,
606 struct _mesa_glsl_parse_state
*state
, YYLTYPE loc
,
607 const ast_expression
*array
, ast_expression
*idx
,
608 const char **function_name
, exec_list
*actual_parameters
)
610 if (array
->oper
== ast_array_index
) {
611 /* This handles arrays of arrays */
612 ir_rvalue
*outer_array
= generate_array_index(mem_ctx
, instructions
,
614 array
->subexpressions
[0],
615 array
->subexpressions
[1],
616 function_name
, actual_parameters
);
617 ir_rvalue
*outer_array_idx
= idx
->hir(instructions
, state
);
619 YYLTYPE index_loc
= idx
->get_location();
620 return _mesa_ast_array_index_to_hir(mem_ctx
, state
, outer_array
,
621 outer_array_idx
, loc
,
624 ir_variable
*sub_var
= NULL
;
625 *function_name
= array
->primary_expression
.identifier
;
627 match_subroutine_by_name(*function_name
, actual_parameters
,
630 ir_rvalue
*outer_array_idx
= idx
->hir(instructions
, state
);
631 return new(mem_ctx
) ir_dereference_array(sub_var
, outer_array_idx
);
636 print_function_prototypes(_mesa_glsl_parse_state
*state
, YYLTYPE
*loc
,
642 foreach_in_list(ir_function_signature
, sig
, &f
->signatures
) {
643 if (sig
->is_builtin() && !sig
->is_builtin_available(state
))
646 char *str
= prototype_string(sig
->return_type
, f
->name
, &sig
->parameters
);
647 _mesa_glsl_error(loc
, state
, " %s", str
);
653 * Raise a "no matching function" error, listing all possible overloads the
654 * compiler considered so developers can figure out what went wrong.
657 no_matching_function_error(const char *name
,
659 exec_list
*actual_parameters
,
660 _mesa_glsl_parse_state
*state
)
662 gl_shader
*sh
= _mesa_glsl_get_builtin_function_shader();
664 if (state
->symbols
->get_function(name
) == NULL
665 && (!state
->uses_builtin_functions
666 || sh
->symbols
->get_function(name
) == NULL
)) {
667 _mesa_glsl_error(loc
, state
, "no function with name '%s'", name
);
669 char *str
= prototype_string(NULL
, name
, actual_parameters
);
670 _mesa_glsl_error(loc
, state
,
671 "no matching function for call to `%s'; candidates are:",
675 print_function_prototypes(state
, loc
, state
->symbols
->get_function(name
));
677 if (state
->uses_builtin_functions
) {
678 print_function_prototypes(state
, loc
, sh
->symbols
->get_function(name
));
684 * Perform automatic type conversion of constructor parameters
686 * This implements the rules in the "Conversion and Scalar Constructors"
687 * section (GLSL 1.10 section 5.4.1), not the "Implicit Conversions" rules.
690 convert_component(ir_rvalue
*src
, const glsl_type
*desired_type
)
692 void *ctx
= ralloc_parent(src
);
693 const unsigned a
= desired_type
->base_type
;
694 const unsigned b
= src
->type
->base_type
;
695 ir_expression
*result
= NULL
;
697 if (src
->type
->is_error())
700 assert(a
<= GLSL_TYPE_BOOL
);
701 assert(b
<= GLSL_TYPE_BOOL
);
710 result
= new(ctx
) ir_expression(ir_unop_i2u
, src
);
712 case GLSL_TYPE_FLOAT
:
713 result
= new(ctx
) ir_expression(ir_unop_f2u
, src
);
716 result
= new(ctx
) ir_expression(ir_unop_i2u
,
717 new(ctx
) ir_expression(ir_unop_b2i
, src
));
719 case GLSL_TYPE_DOUBLE
:
720 result
= new(ctx
) ir_expression(ir_unop_d2u
, src
);
727 result
= new(ctx
) ir_expression(ir_unop_u2i
, src
);
729 case GLSL_TYPE_FLOAT
:
730 result
= new(ctx
) ir_expression(ir_unop_f2i
, src
);
733 result
= new(ctx
) ir_expression(ir_unop_b2i
, src
);
735 case GLSL_TYPE_DOUBLE
:
736 result
= new(ctx
) ir_expression(ir_unop_d2i
, src
);
740 case GLSL_TYPE_FLOAT
:
743 result
= new(ctx
) ir_expression(ir_unop_u2f
, desired_type
, src
, NULL
);
746 result
= new(ctx
) ir_expression(ir_unop_i2f
, desired_type
, src
, NULL
);
749 result
= new(ctx
) ir_expression(ir_unop_b2f
, desired_type
, src
, NULL
);
751 case GLSL_TYPE_DOUBLE
:
752 result
= new(ctx
) ir_expression(ir_unop_d2f
, desired_type
, src
, NULL
);
759 result
= new(ctx
) ir_expression(ir_unop_i2b
,
760 new(ctx
) ir_expression(ir_unop_u2i
, src
));
763 result
= new(ctx
) ir_expression(ir_unop_i2b
, desired_type
, src
, NULL
);
765 case GLSL_TYPE_FLOAT
:
766 result
= new(ctx
) ir_expression(ir_unop_f2b
, desired_type
, src
, NULL
);
768 case GLSL_TYPE_DOUBLE
:
769 result
= new(ctx
) ir_expression(ir_unop_d2b
, desired_type
, src
, NULL
);
773 case GLSL_TYPE_DOUBLE
:
776 result
= new(ctx
) ir_expression(ir_unop_i2d
, src
);
779 result
= new(ctx
) ir_expression(ir_unop_u2d
, src
);
782 result
= new(ctx
) ir_expression(ir_unop_f2d
,
783 new(ctx
) ir_expression(ir_unop_b2f
, src
));
785 case GLSL_TYPE_FLOAT
:
786 result
= new(ctx
) ir_expression(ir_unop_f2d
, desired_type
, src
, NULL
);
791 assert(result
!= NULL
);
792 assert(result
->type
== desired_type
);
794 /* Try constant folding; it may fold in the conversion we just added. */
795 ir_constant
*const constant
= result
->constant_expression_value();
796 return (constant
!= NULL
) ? (ir_rvalue
*) constant
: (ir_rvalue
*) result
;
800 * Dereference a specific component from a scalar, vector, or matrix
803 dereference_component(ir_rvalue
*src
, unsigned component
)
805 void *ctx
= ralloc_parent(src
);
806 assert(component
< src
->type
->components());
808 /* If the source is a constant, just create a new constant instead of a
809 * dereference of the existing constant.
811 ir_constant
*constant
= src
->as_constant();
813 return new(ctx
) ir_constant(constant
, component
);
815 if (src
->type
->is_scalar()) {
817 } else if (src
->type
->is_vector()) {
818 return new(ctx
) ir_swizzle(src
, component
, 0, 0, 0, 1);
820 assert(src
->type
->is_matrix());
822 /* Dereference a row of the matrix, then call this function again to get
823 * a specific element from that row.
825 const int c
= component
/ src
->type
->column_type()->vector_elements
;
826 const int r
= component
% src
->type
->column_type()->vector_elements
;
827 ir_constant
*const col_index
= new(ctx
) ir_constant(c
);
828 ir_dereference
*const col
= new(ctx
) ir_dereference_array(src
, col_index
);
830 col
->type
= src
->type
->column_type();
832 return dereference_component(col
, r
);
835 assert(!"Should not get here.");
841 process_vec_mat_constructor(exec_list
*instructions
,
842 const glsl_type
*constructor_type
,
843 YYLTYPE
*loc
, exec_list
*parameters
,
844 struct _mesa_glsl_parse_state
*state
)
848 /* The ARB_shading_language_420pack spec says:
850 * "If an initializer is a list of initializers enclosed in curly braces,
851 * the variable being declared must be a vector, a matrix, an array, or a
854 * int i = { 1 }; // illegal, i is not an aggregate"
856 if (constructor_type
->vector_elements
<= 1) {
857 _mesa_glsl_error(loc
, state
, "aggregates can only initialize vectors, "
858 "matrices, arrays, and structs");
859 return ir_rvalue::error_value(ctx
);
862 exec_list actual_parameters
;
863 const unsigned parameter_count
=
864 process_parameters(instructions
, &actual_parameters
, parameters
, state
);
866 if (parameter_count
== 0
867 || (constructor_type
->is_vector() &&
868 constructor_type
->vector_elements
!= parameter_count
)
869 || (constructor_type
->is_matrix() &&
870 constructor_type
->matrix_columns
!= parameter_count
)) {
871 _mesa_glsl_error(loc
, state
, "%s constructor must have %u parameters",
872 constructor_type
->is_vector() ? "vector" : "matrix",
873 constructor_type
->vector_elements
);
874 return ir_rvalue::error_value(ctx
);
877 bool all_parameters_are_constant
= true;
879 /* Type cast each parameter and, if possible, fold constants. */
880 foreach_in_list_safe(ir_rvalue
, ir
, &actual_parameters
) {
881 ir_rvalue
*result
= ir
;
883 /* Apply implicit conversions (not the scalar constructor rules!). See
884 * the spec quote above. */
885 if (constructor_type
->base_type
!= result
->type
->base_type
) {
886 const glsl_type
*desired_type
=
887 glsl_type::get_instance(constructor_type
->base_type
,
888 ir
->type
->vector_elements
,
889 ir
->type
->matrix_columns
);
890 if (result
->type
->can_implicitly_convert_to(desired_type
, state
)) {
891 /* Even though convert_component() implements the constructor
892 * conversion rules (not the implicit conversion rules), its safe
893 * to use it here because we already checked that the implicit
894 * conversion is legal.
896 result
= convert_component(ir
, desired_type
);
900 if (constructor_type
->is_matrix()) {
901 if (result
->type
!= constructor_type
->column_type()) {
902 _mesa_glsl_error(loc
, state
, "type error in matrix constructor: "
903 "expected: %s, found %s",
904 constructor_type
->column_type()->name
,
906 return ir_rvalue::error_value(ctx
);
908 } else if (result
->type
!= constructor_type
->get_scalar_type()) {
909 _mesa_glsl_error(loc
, state
, "type error in vector constructor: "
910 "expected: %s, found %s",
911 constructor_type
->get_scalar_type()->name
,
913 return ir_rvalue::error_value(ctx
);
916 /* Attempt to convert the parameter to a constant valued expression.
917 * After doing so, track whether or not all the parameters to the
918 * constructor are trivially constant valued expressions.
920 ir_rvalue
*const constant
= result
->constant_expression_value();
922 if (constant
!= NULL
)
925 all_parameters_are_constant
= false;
927 ir
->replace_with(result
);
930 if (all_parameters_are_constant
)
931 return new(ctx
) ir_constant(constructor_type
, &actual_parameters
);
933 ir_variable
*var
= new(ctx
) ir_variable(constructor_type
, "vec_mat_ctor",
935 instructions
->push_tail(var
);
939 foreach_in_list(ir_rvalue
, rhs
, &actual_parameters
) {
940 ir_instruction
*assignment
= NULL
;
942 if (var
->type
->is_matrix()) {
943 ir_rvalue
*lhs
= new(ctx
) ir_dereference_array(var
,
944 new(ctx
) ir_constant(i
));
945 assignment
= new(ctx
) ir_assignment(lhs
, rhs
, NULL
);
947 /* use writemask rather than index for vector */
948 assert(var
->type
->is_vector());
950 ir_dereference
*lhs
= new(ctx
) ir_dereference_variable(var
);
951 assignment
= new(ctx
) ir_assignment(lhs
, rhs
, NULL
, (unsigned)(1 << i
));
954 instructions
->push_tail(assignment
);
959 return new(ctx
) ir_dereference_variable(var
);
964 process_array_constructor(exec_list
*instructions
,
965 const glsl_type
*constructor_type
,
966 YYLTYPE
*loc
, exec_list
*parameters
,
967 struct _mesa_glsl_parse_state
*state
)
970 /* Array constructors come in two forms: sized and unsized. Sized array
971 * constructors look like 'vec4[2](a, b)', where 'a' and 'b' are vec4
972 * variables. In this case the number of parameters must exactly match the
973 * specified size of the array.
975 * Unsized array constructors look like 'vec4[](a, b)', where 'a' and 'b'
976 * are vec4 variables. In this case the size of the array being constructed
977 * is determined by the number of parameters.
979 * From page 52 (page 58 of the PDF) of the GLSL 1.50 spec:
981 * "There must be exactly the same number of arguments as the size of
982 * the array being constructed. If no size is present in the
983 * constructor, then the array is explicitly sized to the number of
984 * arguments provided. The arguments are assigned in order, starting at
985 * element 0, to the elements of the constructed array. Each argument
986 * must be the same type as the element type of the array, or be a type
987 * that can be converted to the element type of the array according to
988 * Section 4.1.10 "Implicit Conversions.""
990 exec_list actual_parameters
;
991 const unsigned parameter_count
=
992 process_parameters(instructions
, &actual_parameters
, parameters
, state
);
993 bool is_unsized_array
= constructor_type
->is_unsized_array();
995 if ((parameter_count
== 0) ||
996 (!is_unsized_array
&& (constructor_type
->length
!= parameter_count
))) {
997 const unsigned min_param
= is_unsized_array
998 ? 1 : constructor_type
->length
;
1000 _mesa_glsl_error(loc
, state
, "array constructor must have %s %u "
1002 is_unsized_array
? "at least" : "exactly",
1003 min_param
, (min_param
<= 1) ? "" : "s");
1004 return ir_rvalue::error_value(ctx
);
1007 if (is_unsized_array
) {
1009 glsl_type::get_array_instance(constructor_type
->fields
.array
,
1011 assert(constructor_type
!= NULL
);
1012 assert(constructor_type
->length
== parameter_count
);
1015 bool all_parameters_are_constant
= true;
1016 const glsl_type
*element_type
= constructor_type
->fields
.array
;
1018 /* Type cast each parameter and, if possible, fold constants. */
1019 foreach_in_list_safe(ir_rvalue
, ir
, &actual_parameters
) {
1020 ir_rvalue
*result
= ir
;
1022 const glsl_base_type element_base_type
=
1023 constructor_type
->fields
.array
->base_type
;
1025 /* Apply implicit conversions (not the scalar constructor rules!). See
1026 * the spec quote above. */
1027 if (element_base_type
!= result
->type
->base_type
) {
1028 const glsl_type
*desired_type
=
1029 glsl_type::get_instance(element_base_type
,
1030 ir
->type
->vector_elements
,
1031 ir
->type
->matrix_columns
);
1033 if (result
->type
->can_implicitly_convert_to(desired_type
, state
)) {
1034 /* Even though convert_component() implements the constructor
1035 * conversion rules (not the implicit conversion rules), its safe
1036 * to use it here because we already checked that the implicit
1037 * conversion is legal.
1039 result
= convert_component(ir
, desired_type
);
1043 if (constructor_type
->fields
.array
->is_unsized_array()) {
1044 /* As the inner parameters of the constructor are created without
1045 * knowledge of each other we need to check to make sure unsized
1046 * parameters of unsized constructors all end up with the same size.
1048 * e.g we make sure to fail for a constructor like this:
1049 * vec4[][] a = vec4[][](vec4[](vec4(0.0), vec4(1.0)),
1050 * vec4[](vec4(0.0), vec4(1.0), vec4(1.0)),
1051 * vec4[](vec4(0.0), vec4(1.0)));
1053 if (element_type
->is_unsized_array()) {
1054 /* This is the first parameter so just get the type */
1055 element_type
= result
->type
;
1056 } else if (element_type
!= result
->type
) {
1057 _mesa_glsl_error(loc
, state
, "type error in array constructor: "
1058 "expected: %s, found %s",
1060 result
->type
->name
);
1061 return ir_rvalue::error_value(ctx
);
1063 } else if (result
->type
!= constructor_type
->fields
.array
) {
1064 _mesa_glsl_error(loc
, state
, "type error in array constructor: "
1065 "expected: %s, found %s",
1066 constructor_type
->fields
.array
->name
,
1067 result
->type
->name
);
1068 return ir_rvalue::error_value(ctx
);
1070 element_type
= result
->type
;
1073 /* Attempt to convert the parameter to a constant valued expression.
1074 * After doing so, track whether or not all the parameters to the
1075 * constructor are trivially constant valued expressions.
1077 ir_rvalue
*const constant
= result
->constant_expression_value();
1079 if (constant
!= NULL
)
1082 all_parameters_are_constant
= false;
1084 ir
->replace_with(result
);
1087 if (constructor_type
->fields
.array
->is_unsized_array()) {
1089 glsl_type::get_array_instance(element_type
,
1091 assert(constructor_type
!= NULL
);
1092 assert(constructor_type
->length
== parameter_count
);
1095 if (all_parameters_are_constant
)
1096 return new(ctx
) ir_constant(constructor_type
, &actual_parameters
);
1098 ir_variable
*var
= new(ctx
) ir_variable(constructor_type
, "array_ctor",
1100 instructions
->push_tail(var
);
1103 foreach_in_list(ir_rvalue
, rhs
, &actual_parameters
) {
1104 ir_rvalue
*lhs
= new(ctx
) ir_dereference_array(var
,
1105 new(ctx
) ir_constant(i
));
1107 ir_instruction
*assignment
= new(ctx
) ir_assignment(lhs
, rhs
, NULL
);
1108 instructions
->push_tail(assignment
);
1113 return new(ctx
) ir_dereference_variable(var
);
1118 * Try to convert a record constructor to a constant expression
1120 static ir_constant
*
1121 constant_record_constructor(const glsl_type
*constructor_type
,
1122 exec_list
*parameters
, void *mem_ctx
)
1124 foreach_in_list(ir_instruction
, node
, parameters
) {
1125 ir_constant
*constant
= node
->as_constant();
1126 if (constant
== NULL
)
1128 node
->replace_with(constant
);
1131 return new(mem_ctx
) ir_constant(constructor_type
, parameters
);
1136 * Determine if a list consists of a single scalar r-value
1139 single_scalar_parameter(exec_list
*parameters
)
1141 const ir_rvalue
*const p
= (ir_rvalue
*) parameters
->head
;
1142 assert(((ir_rvalue
*)p
)->as_rvalue() != NULL
);
1144 return (p
->type
->is_scalar() && p
->next
->is_tail_sentinel());
1149 * Generate inline code for a vector constructor
1151 * The generated constructor code will consist of a temporary variable
1152 * declaration of the same type as the constructor. A sequence of assignments
1153 * from constructor parameters to the temporary will follow.
1156 * An \c ir_dereference_variable of the temprorary generated in the constructor
1160 emit_inline_vector_constructor(const glsl_type
*type
,
1161 exec_list
*instructions
,
1162 exec_list
*parameters
,
1165 assert(!parameters
->is_empty());
1167 ir_variable
*var
= new(ctx
) ir_variable(type
, "vec_ctor", ir_var_temporary
);
1168 instructions
->push_tail(var
);
1170 /* There are three kinds of vector constructors.
1172 * - Construct a vector from a single scalar by replicating that scalar to
1173 * all components of the vector.
1175 * - Construct a vector from at least a matrix. This case should already
1176 * have been taken care of in ast_function_expression::hir by breaking
1177 * down the matrix into a series of column vectors.
1179 * - Construct a vector from an arbirary combination of vectors and
1180 * scalars. The components of the constructor parameters are assigned
1181 * to the vector in order until the vector is full.
1183 const unsigned lhs_components
= type
->components();
1184 if (single_scalar_parameter(parameters
)) {
1185 ir_rvalue
*first_param
= (ir_rvalue
*)parameters
->head
;
1186 ir_rvalue
*rhs
= new(ctx
) ir_swizzle(first_param
, 0, 0, 0, 0,
1188 ir_dereference_variable
*lhs
= new(ctx
) ir_dereference_variable(var
);
1189 const unsigned mask
= (1U << lhs_components
) - 1;
1191 assert(rhs
->type
== lhs
->type
);
1193 ir_instruction
*inst
= new(ctx
) ir_assignment(lhs
, rhs
, NULL
, mask
);
1194 instructions
->push_tail(inst
);
1196 unsigned base_component
= 0;
1197 unsigned base_lhs_component
= 0;
1198 ir_constant_data data
;
1199 unsigned constant_mask
= 0, constant_components
= 0;
1201 memset(&data
, 0, sizeof(data
));
1203 foreach_in_list(ir_rvalue
, param
, parameters
) {
1204 unsigned rhs_components
= param
->type
->components();
1206 /* Do not try to assign more components to the vector than it has!
1208 if ((rhs_components
+ base_lhs_component
) > lhs_components
) {
1209 rhs_components
= lhs_components
- base_lhs_component
;
1212 const ir_constant
*const c
= param
->as_constant();
1214 for (unsigned i
= 0; i
< rhs_components
; i
++) {
1215 switch (c
->type
->base_type
) {
1216 case GLSL_TYPE_UINT
:
1217 data
.u
[i
+ base_component
] = c
->get_uint_component(i
);
1220 data
.i
[i
+ base_component
] = c
->get_int_component(i
);
1222 case GLSL_TYPE_FLOAT
:
1223 data
.f
[i
+ base_component
] = c
->get_float_component(i
);
1225 case GLSL_TYPE_DOUBLE
:
1226 data
.d
[i
+ base_component
] = c
->get_double_component(i
);
1228 case GLSL_TYPE_BOOL
:
1229 data
.b
[i
+ base_component
] = c
->get_bool_component(i
);
1232 assert(!"Should not get here.");
1237 /* Mask of fields to be written in the assignment.
1239 constant_mask
|= ((1U << rhs_components
) - 1) << base_lhs_component
;
1240 constant_components
+= rhs_components
;
1242 base_component
+= rhs_components
;
1244 /* Advance the component index by the number of components
1245 * that were just assigned.
1247 base_lhs_component
+= rhs_components
;
1250 if (constant_mask
!= 0) {
1251 ir_dereference
*lhs
= new(ctx
) ir_dereference_variable(var
);
1252 const glsl_type
*rhs_type
= glsl_type::get_instance(var
->type
->base_type
,
1253 constant_components
,
1255 ir_rvalue
*rhs
= new(ctx
) ir_constant(rhs_type
, &data
);
1257 ir_instruction
*inst
=
1258 new(ctx
) ir_assignment(lhs
, rhs
, NULL
, constant_mask
);
1259 instructions
->push_tail(inst
);
1263 foreach_in_list(ir_rvalue
, param
, parameters
) {
1264 unsigned rhs_components
= param
->type
->components();
1266 /* Do not try to assign more components to the vector than it has!
1268 if ((rhs_components
+ base_component
) > lhs_components
) {
1269 rhs_components
= lhs_components
- base_component
;
1272 /* If we do not have any components left to copy, break out of the
1273 * loop. This can happen when initializing a vec4 with a mat3 as the
1274 * mat3 would have been broken into a series of column vectors.
1276 if (rhs_components
== 0) {
1280 const ir_constant
*const c
= param
->as_constant();
1282 /* Mask of fields to be written in the assignment.
1284 const unsigned write_mask
= ((1U << rhs_components
) - 1)
1287 ir_dereference
*lhs
= new(ctx
) ir_dereference_variable(var
);
1289 /* Generate a swizzle so that LHS and RHS sizes match.
1292 new(ctx
) ir_swizzle(param
, 0, 1, 2, 3, rhs_components
);
1294 ir_instruction
*inst
=
1295 new(ctx
) ir_assignment(lhs
, rhs
, NULL
, write_mask
);
1296 instructions
->push_tail(inst
);
1299 /* Advance the component index by the number of components that were
1302 base_component
+= rhs_components
;
1305 return new(ctx
) ir_dereference_variable(var
);
1310 * Generate assignment of a portion of a vector to a portion of a matrix column
1312 * \param src_base First component of the source to be used in assignment
1313 * \param column Column of destination to be assiged
1314 * \param row_base First component of the destination column to be assigned
1315 * \param count Number of components to be assigned
1318 * \c src_base + \c count must be less than or equal to the number of components
1319 * in the source vector.
1322 assign_to_matrix_column(ir_variable
*var
, unsigned column
, unsigned row_base
,
1323 ir_rvalue
*src
, unsigned src_base
, unsigned count
,
1326 ir_constant
*col_idx
= new(mem_ctx
) ir_constant(column
);
1327 ir_dereference
*column_ref
= new(mem_ctx
) ir_dereference_array(var
, col_idx
);
1329 assert(column_ref
->type
->components() >= (row_base
+ count
));
1330 assert(src
->type
->components() >= (src_base
+ count
));
1332 /* Generate a swizzle that extracts the number of components from the source
1333 * that are to be assigned to the column of the matrix.
1335 if (count
< src
->type
->vector_elements
) {
1336 src
= new(mem_ctx
) ir_swizzle(src
,
1337 src_base
+ 0, src_base
+ 1,
1338 src_base
+ 2, src_base
+ 3,
1342 /* Mask of fields to be written in the assignment.
1344 const unsigned write_mask
= ((1U << count
) - 1) << row_base
;
1346 return new(mem_ctx
) ir_assignment(column_ref
, src
, NULL
, write_mask
);
1351 * Generate inline code for a matrix constructor
1353 * The generated constructor code will consist of a temporary variable
1354 * declaration of the same type as the constructor. A sequence of assignments
1355 * from constructor parameters to the temporary will follow.
1358 * An \c ir_dereference_variable of the temprorary generated in the constructor
1362 emit_inline_matrix_constructor(const glsl_type
*type
,
1363 exec_list
*instructions
,
1364 exec_list
*parameters
,
1367 assert(!parameters
->is_empty());
1369 ir_variable
*var
= new(ctx
) ir_variable(type
, "mat_ctor", ir_var_temporary
);
1370 instructions
->push_tail(var
);
1372 /* There are three kinds of matrix constructors.
1374 * - Construct a matrix from a single scalar by replicating that scalar to
1375 * along the diagonal of the matrix and setting all other components to
1378 * - Construct a matrix from an arbirary combination of vectors and
1379 * scalars. The components of the constructor parameters are assigned
1380 * to the matrix in column-major order until the matrix is full.
1382 * - Construct a matrix from a single matrix. The source matrix is copied
1383 * to the upper left portion of the constructed matrix, and the remaining
1384 * elements take values from the identity matrix.
1386 ir_rvalue
*const first_param
= (ir_rvalue
*) parameters
->head
;
1387 if (single_scalar_parameter(parameters
)) {
1388 /* Assign the scalar to the X component of a vec4, and fill the remaining
1389 * components with zero.
1391 glsl_base_type param_base_type
= first_param
->type
->base_type
;
1392 assert(param_base_type
== GLSL_TYPE_FLOAT
||
1393 param_base_type
== GLSL_TYPE_DOUBLE
);
1394 ir_variable
*rhs_var
=
1395 new(ctx
) ir_variable(glsl_type::get_instance(param_base_type
, 4, 1),
1398 instructions
->push_tail(rhs_var
);
1400 ir_constant_data zero
;
1401 for (unsigned i
= 0; i
< 4; i
++)
1402 if (param_base_type
== GLSL_TYPE_FLOAT
)
1407 ir_instruction
*inst
=
1408 new(ctx
) ir_assignment(new(ctx
) ir_dereference_variable(rhs_var
),
1409 new(ctx
) ir_constant(rhs_var
->type
, &zero
),
1411 instructions
->push_tail(inst
);
1413 ir_dereference
*const rhs_ref
= new(ctx
) ir_dereference_variable(rhs_var
);
1415 inst
= new(ctx
) ir_assignment(rhs_ref
, first_param
, NULL
, 0x01);
1416 instructions
->push_tail(inst
);
1418 /* Assign the temporary vector to each column of the destination matrix
1419 * with a swizzle that puts the X component on the diagonal of the
1420 * matrix. In some cases this may mean that the X component does not
1421 * get assigned into the column at all (i.e., when the matrix has more
1422 * columns than rows).
1424 static const unsigned rhs_swiz
[4][4] = {
1431 const unsigned cols_to_init
= MIN2(type
->matrix_columns
,
1432 type
->vector_elements
);
1433 for (unsigned i
= 0; i
< cols_to_init
; i
++) {
1434 ir_constant
*const col_idx
= new(ctx
) ir_constant(i
);
1435 ir_rvalue
*const col_ref
= new(ctx
) ir_dereference_array(var
, col_idx
);
1437 ir_rvalue
*const rhs_ref
= new(ctx
) ir_dereference_variable(rhs_var
);
1438 ir_rvalue
*const rhs
= new(ctx
) ir_swizzle(rhs_ref
, rhs_swiz
[i
],
1439 type
->vector_elements
);
1441 inst
= new(ctx
) ir_assignment(col_ref
, rhs
, NULL
);
1442 instructions
->push_tail(inst
);
1445 for (unsigned i
= cols_to_init
; i
< type
->matrix_columns
; i
++) {
1446 ir_constant
*const col_idx
= new(ctx
) ir_constant(i
);
1447 ir_rvalue
*const col_ref
= new(ctx
) ir_dereference_array(var
, col_idx
);
1449 ir_rvalue
*const rhs_ref
= new(ctx
) ir_dereference_variable(rhs_var
);
1450 ir_rvalue
*const rhs
= new(ctx
) ir_swizzle(rhs_ref
, 1, 1, 1, 1,
1451 type
->vector_elements
);
1453 inst
= new(ctx
) ir_assignment(col_ref
, rhs
, NULL
);
1454 instructions
->push_tail(inst
);
1456 } else if (first_param
->type
->is_matrix()) {
1457 /* From page 50 (56 of the PDF) of the GLSL 1.50 spec:
1459 * "If a matrix is constructed from a matrix, then each component
1460 * (column i, row j) in the result that has a corresponding
1461 * component (column i, row j) in the argument will be initialized
1462 * from there. All other components will be initialized to the
1463 * identity matrix. If a matrix argument is given to a matrix
1464 * constructor, it is an error to have any other arguments."
1466 assert(first_param
->next
->is_tail_sentinel());
1467 ir_rvalue
*const src_matrix
= first_param
;
1469 /* If the source matrix is smaller, pre-initialize the relavent parts of
1470 * the destination matrix to the identity matrix.
1472 if ((src_matrix
->type
->matrix_columns
< var
->type
->matrix_columns
) ||
1473 (src_matrix
->type
->vector_elements
< var
->type
->vector_elements
)) {
1475 /* If the source matrix has fewer rows, every column of the destination
1476 * must be initialized. Otherwise only the columns in the destination
1477 * that do not exist in the source must be initialized.
1480 (src_matrix
->type
->vector_elements
< var
->type
->vector_elements
)
1481 ? 0 : src_matrix
->type
->matrix_columns
;
1483 const glsl_type
*const col_type
= var
->type
->column_type();
1484 for (/* empty */; col
< var
->type
->matrix_columns
; col
++) {
1485 ir_constant_data ident
;
1487 if (!col_type
->is_double()) {
1492 ident
.f
[col
] = 1.0f
;
1501 ir_rvalue
*const rhs
= new(ctx
) ir_constant(col_type
, &ident
);
1503 ir_rvalue
*const lhs
=
1504 new(ctx
) ir_dereference_array(var
, new(ctx
) ir_constant(col
));
1506 ir_instruction
*inst
= new(ctx
) ir_assignment(lhs
, rhs
, NULL
);
1507 instructions
->push_tail(inst
);
1511 /* Assign columns from the source matrix to the destination matrix.
1513 * Since the parameter will be used in the RHS of multiple assignments,
1514 * generate a temporary and copy the paramter there.
1516 ir_variable
*const rhs_var
=
1517 new(ctx
) ir_variable(first_param
->type
, "mat_ctor_mat",
1519 instructions
->push_tail(rhs_var
);
1521 ir_dereference
*const rhs_var_ref
=
1522 new(ctx
) ir_dereference_variable(rhs_var
);
1523 ir_instruction
*const inst
=
1524 new(ctx
) ir_assignment(rhs_var_ref
, first_param
, NULL
);
1525 instructions
->push_tail(inst
);
1527 const unsigned last_row
= MIN2(src_matrix
->type
->vector_elements
,
1528 var
->type
->vector_elements
);
1529 const unsigned last_col
= MIN2(src_matrix
->type
->matrix_columns
,
1530 var
->type
->matrix_columns
);
1532 unsigned swiz
[4] = { 0, 0, 0, 0 };
1533 for (unsigned i
= 1; i
< last_row
; i
++)
1536 const unsigned write_mask
= (1U << last_row
) - 1;
1538 for (unsigned i
= 0; i
< last_col
; i
++) {
1539 ir_dereference
*const lhs
=
1540 new(ctx
) ir_dereference_array(var
, new(ctx
) ir_constant(i
));
1541 ir_rvalue
*const rhs_col
=
1542 new(ctx
) ir_dereference_array(rhs_var
, new(ctx
) ir_constant(i
));
1544 /* If one matrix has columns that are smaller than the columns of the
1545 * other matrix, wrap the column access of the larger with a swizzle
1546 * so that the LHS and RHS of the assignment have the same size (and
1547 * therefore have the same type).
1549 * It would be perfectly valid to unconditionally generate the
1550 * swizzles, this this will typically result in a more compact IR tree.
1553 if (lhs
->type
->vector_elements
!= rhs_col
->type
->vector_elements
) {
1554 rhs
= new(ctx
) ir_swizzle(rhs_col
, swiz
, last_row
);
1559 ir_instruction
*inst
=
1560 new(ctx
) ir_assignment(lhs
, rhs
, NULL
, write_mask
);
1561 instructions
->push_tail(inst
);
1564 const unsigned cols
= type
->matrix_columns
;
1565 const unsigned rows
= type
->vector_elements
;
1566 unsigned remaining_slots
= rows
* cols
;
1567 unsigned col_idx
= 0;
1568 unsigned row_idx
= 0;
1570 foreach_in_list(ir_rvalue
, rhs
, parameters
) {
1571 unsigned rhs_components
= rhs
->type
->components();
1572 unsigned rhs_base
= 0;
1574 if (remaining_slots
== 0)
1577 /* Since the parameter might be used in the RHS of two assignments,
1578 * generate a temporary and copy the paramter there.
1580 ir_variable
*rhs_var
=
1581 new(ctx
) ir_variable(rhs
->type
, "mat_ctor_vec", ir_var_temporary
);
1582 instructions
->push_tail(rhs_var
);
1584 ir_dereference
*rhs_var_ref
=
1585 new(ctx
) ir_dereference_variable(rhs_var
);
1586 ir_instruction
*inst
= new(ctx
) ir_assignment(rhs_var_ref
, rhs
, NULL
);
1587 instructions
->push_tail(inst
);
1590 /* Assign the current parameter to as many components of the matrix
1593 * NOTE: A single vector parameter can span two matrix columns. A
1594 * single vec4, for example, can completely fill a mat2.
1596 unsigned count
= MIN2(rows
- row_idx
,
1597 rhs_components
- rhs_base
);
1599 rhs_var_ref
= new(ctx
) ir_dereference_variable(rhs_var
);
1600 ir_instruction
*inst
= assign_to_matrix_column(var
, col_idx
,
1605 instructions
->push_tail(inst
);
1608 remaining_slots
-= count
;
1610 /* Sometimes, there is still data left in the parameters and
1611 * components left to be set in the destination but in other
1614 if (row_idx
>= rows
) {
1618 } while(remaining_slots
> 0 && rhs_base
< rhs_components
);
1622 return new(ctx
) ir_dereference_variable(var
);
1627 emit_inline_record_constructor(const glsl_type
*type
,
1628 exec_list
*instructions
,
1629 exec_list
*parameters
,
1632 ir_variable
*const var
=
1633 new(mem_ctx
) ir_variable(type
, "record_ctor", ir_var_temporary
);
1634 ir_dereference_variable
*const d
= new(mem_ctx
) ir_dereference_variable(var
);
1636 instructions
->push_tail(var
);
1638 exec_node
*node
= parameters
->head
;
1639 for (unsigned i
= 0; i
< type
->length
; i
++) {
1640 assert(!node
->is_tail_sentinel());
1642 ir_dereference
*const lhs
=
1643 new(mem_ctx
) ir_dereference_record(d
->clone(mem_ctx
, NULL
),
1644 type
->fields
.structure
[i
].name
);
1646 ir_rvalue
*const rhs
= ((ir_instruction
*) node
)->as_rvalue();
1647 assert(rhs
!= NULL
);
1649 ir_instruction
*const assign
= new(mem_ctx
) ir_assignment(lhs
, rhs
, NULL
);
1651 instructions
->push_tail(assign
);
1660 process_record_constructor(exec_list
*instructions
,
1661 const glsl_type
*constructor_type
,
1662 YYLTYPE
*loc
, exec_list
*parameters
,
1663 struct _mesa_glsl_parse_state
*state
)
1666 exec_list actual_parameters
;
1668 process_parameters(instructions
, &actual_parameters
,
1671 exec_node
*node
= actual_parameters
.head
;
1672 for (unsigned i
= 0; i
< constructor_type
->length
; i
++) {
1673 ir_rvalue
*ir
= (ir_rvalue
*) node
;
1675 if (node
->is_tail_sentinel()) {
1676 _mesa_glsl_error(loc
, state
,
1677 "insufficient parameters to constructor for `%s'",
1678 constructor_type
->name
);
1679 return ir_rvalue::error_value(ctx
);
1682 if (apply_implicit_conversion(constructor_type
->fields
.structure
[i
].type
,
1684 node
->replace_with(ir
);
1686 _mesa_glsl_error(loc
, state
,
1687 "parameter type mismatch in constructor for `%s.%s' "
1689 constructor_type
->name
,
1690 constructor_type
->fields
.structure
[i
].name
,
1692 constructor_type
->fields
.structure
[i
].type
->name
);
1693 return ir_rvalue::error_value(ctx
);
1699 if (!node
->is_tail_sentinel()) {
1700 _mesa_glsl_error(loc
, state
, "too many parameters in constructor "
1701 "for `%s'", constructor_type
->name
);
1702 return ir_rvalue::error_value(ctx
);
1705 ir_rvalue
*const constant
=
1706 constant_record_constructor(constructor_type
, &actual_parameters
,
1709 return (constant
!= NULL
)
1711 : emit_inline_record_constructor(constructor_type
, instructions
,
1712 &actual_parameters
, state
);
1716 ast_function_expression::handle_method(exec_list
*instructions
,
1717 struct _mesa_glsl_parse_state
*state
)
1719 const ast_expression
*field
= subexpressions
[0];
1723 /* Handle "method calls" in GLSL 1.20 - namely, array.length() */
1724 YYLTYPE loc
= get_location();
1725 state
->check_version(120, 300, &loc
, "methods not supported");
1728 method
= field
->primary_expression
.identifier
;
1730 /* This would prevent to raise "uninitialized variable" warnings when
1731 * calling array.length.
1733 field
->subexpressions
[0]->set_is_lhs(true);
1734 op
= field
->subexpressions
[0]->hir(instructions
, state
);
1735 if (strcmp(method
, "length") == 0) {
1736 if (!this->expressions
.is_empty()) {
1737 _mesa_glsl_error(&loc
, state
, "length method takes no arguments");
1741 if (op
->type
->is_array()) {
1742 if (op
->type
->is_unsized_array()) {
1743 if (!state
->has_shader_storage_buffer_objects()) {
1744 _mesa_glsl_error(&loc
, state
, "length called on unsized array"
1745 " only available with "
1746 "ARB_shader_storage_buffer_object");
1748 /* Calculate length of an unsized array in run-time */
1749 result
= new(ctx
) ir_expression(ir_unop_ssbo_unsized_array_length
, op
);
1751 result
= new(ctx
) ir_constant(op
->type
->array_size());
1753 } else if (op
->type
->is_vector()) {
1754 if (state
->has_420pack()) {
1755 /* .length() returns int. */
1756 result
= new(ctx
) ir_constant((int) op
->type
->vector_elements
);
1758 _mesa_glsl_error(&loc
, state
, "length method on matrix only available"
1759 "with ARB_shading_language_420pack");
1762 } else if (op
->type
->is_matrix()) {
1763 if (state
->has_420pack()) {
1764 /* .length() returns int. */
1765 result
= new(ctx
) ir_constant((int) op
->type
->matrix_columns
);
1767 _mesa_glsl_error(&loc
, state
, "length method on matrix only available"
1768 "with ARB_shading_language_420pack");
1772 _mesa_glsl_error(&loc
, state
, "length called on scalar.");
1776 _mesa_glsl_error(&loc
, state
, "unknown method: `%s'", method
);
1781 return ir_rvalue::error_value(ctx
);
1785 ast_function_expression::hir(exec_list
*instructions
,
1786 struct _mesa_glsl_parse_state
*state
)
1789 /* There are three sorts of function calls.
1791 * 1. constructors - The first subexpression is an ast_type_specifier.
1792 * 2. methods - Only the .length() method of array types.
1793 * 3. functions - Calls to regular old functions.
1796 if (is_constructor()) {
1797 const ast_type_specifier
*type
= (ast_type_specifier
*) subexpressions
[0];
1798 YYLTYPE loc
= type
->get_location();
1801 const glsl_type
*const constructor_type
= type
->glsl_type(& name
, state
);
1803 /* constructor_type can be NULL if a variable with the same name as the
1804 * structure has come into scope.
1806 if (constructor_type
== NULL
) {
1807 _mesa_glsl_error(& loc
, state
, "unknown type `%s' (structure name "
1808 "may be shadowed by a variable with the same name)",
1810 return ir_rvalue::error_value(ctx
);
1814 /* Constructors for opaque types are illegal.
1816 if (constructor_type
->contains_opaque()) {
1817 _mesa_glsl_error(& loc
, state
, "cannot construct opaque type `%s'",
1818 constructor_type
->name
);
1819 return ir_rvalue::error_value(ctx
);
1822 if (constructor_type
->is_array()) {
1823 if (!state
->check_version(120, 300, &loc
,
1824 "array constructors forbidden")) {
1825 return ir_rvalue::error_value(ctx
);
1828 return process_array_constructor(instructions
, constructor_type
,
1829 & loc
, &this->expressions
, state
);
1833 /* There are two kinds of constructor calls. Constructors for arrays and
1834 * structures must have the exact number of arguments with matching types
1835 * in the correct order. These constructors follow essentially the same
1836 * type matching rules as functions.
1838 * Constructors for built-in language types, such as mat4 and vec2, are
1839 * free form. The only requirements are that the parameters must provide
1840 * enough values of the correct scalar type and that no arguments are
1841 * given past the last used argument.
1843 * When using the C-style initializer syntax from GLSL 4.20, constructors
1844 * must have the exact number of arguments with matching types in the
1847 if (constructor_type
->is_record()) {
1848 return process_record_constructor(instructions
, constructor_type
,
1849 &loc
, &this->expressions
,
1853 if (!constructor_type
->is_numeric() && !constructor_type
->is_boolean())
1854 return ir_rvalue::error_value(ctx
);
1856 /* Total number of components of the type being constructed. */
1857 const unsigned type_components
= constructor_type
->components();
1859 /* Number of components from parameters that have actually been
1860 * consumed. This is used to perform several kinds of error checking.
1862 unsigned components_used
= 0;
1864 unsigned matrix_parameters
= 0;
1865 unsigned nonmatrix_parameters
= 0;
1866 exec_list actual_parameters
;
1868 foreach_list_typed(ast_node
, ast
, link
, &this->expressions
) {
1869 ir_rvalue
*result
= ast
->hir(instructions
, state
);
1871 /* From page 50 (page 56 of the PDF) of the GLSL 1.50 spec:
1873 * "It is an error to provide extra arguments beyond this
1874 * last used argument."
1876 if (components_used
>= type_components
) {
1877 _mesa_glsl_error(& loc
, state
, "too many parameters to `%s' "
1879 constructor_type
->name
);
1880 return ir_rvalue::error_value(ctx
);
1883 if (!result
->type
->is_numeric() && !result
->type
->is_boolean()) {
1884 _mesa_glsl_error(& loc
, state
, "cannot construct `%s' from a "
1885 "non-numeric data type",
1886 constructor_type
->name
);
1887 return ir_rvalue::error_value(ctx
);
1890 /* Count the number of matrix and nonmatrix parameters. This
1891 * is used below to enforce some of the constructor rules.
1893 if (result
->type
->is_matrix())
1894 matrix_parameters
++;
1896 nonmatrix_parameters
++;
1898 actual_parameters
.push_tail(result
);
1899 components_used
+= result
->type
->components();
1902 /* From page 28 (page 34 of the PDF) of the GLSL 1.10 spec:
1904 * "It is an error to construct matrices from other matrices. This
1905 * is reserved for future use."
1907 if (matrix_parameters
> 0
1908 && constructor_type
->is_matrix()
1909 && !state
->check_version(120, 100, &loc
,
1910 "cannot construct `%s' from a matrix",
1911 constructor_type
->name
)) {
1912 return ir_rvalue::error_value(ctx
);
1915 /* From page 50 (page 56 of the PDF) of the GLSL 1.50 spec:
1917 * "If a matrix argument is given to a matrix constructor, it is
1918 * an error to have any other arguments."
1920 if ((matrix_parameters
> 0)
1921 && ((matrix_parameters
+ nonmatrix_parameters
) > 1)
1922 && constructor_type
->is_matrix()) {
1923 _mesa_glsl_error(& loc
, state
, "for matrix `%s' constructor, "
1924 "matrix must be only parameter",
1925 constructor_type
->name
);
1926 return ir_rvalue::error_value(ctx
);
1929 /* From page 28 (page 34 of the PDF) of the GLSL 1.10 spec:
1931 * "In these cases, there must be enough components provided in the
1932 * arguments to provide an initializer for every component in the
1933 * constructed value."
1935 if (components_used
< type_components
&& components_used
!= 1
1936 && matrix_parameters
== 0) {
1937 _mesa_glsl_error(& loc
, state
, "too few components to construct "
1939 constructor_type
->name
);
1940 return ir_rvalue::error_value(ctx
);
1943 /* Matrices can never be consumed as is by any constructor but matrix
1944 * constructors. If the constructor type is not matrix, always break the
1945 * matrix up into a series of column vectors.
1947 if (!constructor_type
->is_matrix()) {
1948 foreach_in_list_safe(ir_rvalue
, matrix
, &actual_parameters
) {
1949 if (!matrix
->type
->is_matrix())
1952 /* Create a temporary containing the matrix. */
1953 ir_variable
*var
= new(ctx
) ir_variable(matrix
->type
, "matrix_tmp",
1955 instructions
->push_tail(var
);
1956 instructions
->push_tail(new(ctx
) ir_assignment(new(ctx
)
1957 ir_dereference_variable(var
), matrix
, NULL
));
1958 var
->constant_value
= matrix
->constant_expression_value();
1960 /* Replace the matrix with dereferences of its columns. */
1961 for (int i
= 0; i
< matrix
->type
->matrix_columns
; i
++) {
1962 matrix
->insert_before(new (ctx
) ir_dereference_array(var
,
1963 new(ctx
) ir_constant(i
)));
1969 bool all_parameters_are_constant
= true;
1971 /* Type cast each parameter and, if possible, fold constants.*/
1972 foreach_in_list_safe(ir_rvalue
, ir
, &actual_parameters
) {
1973 const glsl_type
*desired_type
=
1974 glsl_type::get_instance(constructor_type
->base_type
,
1975 ir
->type
->vector_elements
,
1976 ir
->type
->matrix_columns
);
1977 ir_rvalue
*result
= convert_component(ir
, desired_type
);
1979 /* Attempt to convert the parameter to a constant valued expression.
1980 * After doing so, track whether or not all the parameters to the
1981 * constructor are trivially constant valued expressions.
1983 ir_rvalue
*const constant
= result
->constant_expression_value();
1985 if (constant
!= NULL
)
1988 all_parameters_are_constant
= false;
1991 ir
->replace_with(result
);
1995 /* If all of the parameters are trivially constant, create a
1996 * constant representing the complete collection of parameters.
1998 if (all_parameters_are_constant
) {
1999 return new(ctx
) ir_constant(constructor_type
, &actual_parameters
);
2000 } else if (constructor_type
->is_scalar()) {
2001 return dereference_component((ir_rvalue
*) actual_parameters
.head
,
2003 } else if (constructor_type
->is_vector()) {
2004 return emit_inline_vector_constructor(constructor_type
,
2009 assert(constructor_type
->is_matrix());
2010 return emit_inline_matrix_constructor(constructor_type
,
2015 } else if (subexpressions
[0]->oper
== ast_field_selection
) {
2016 return handle_method(instructions
, state
);
2018 const ast_expression
*id
= subexpressions
[0];
2019 const char *func_name
;
2020 YYLTYPE loc
= get_location();
2021 exec_list actual_parameters
;
2022 ir_variable
*sub_var
= NULL
;
2023 ir_rvalue
*array_idx
= NULL
;
2025 process_parameters(instructions
, &actual_parameters
, &this->expressions
,
2028 if (id
->oper
== ast_array_index
) {
2029 array_idx
= generate_array_index(ctx
, instructions
, state
, loc
,
2030 id
->subexpressions
[0],
2031 id
->subexpressions
[1], &func_name
,
2032 &actual_parameters
);
2034 func_name
= id
->primary_expression
.identifier
;
2037 ir_function_signature
*sig
=
2038 match_function_by_name(func_name
, &actual_parameters
, state
);
2040 ir_rvalue
*value
= NULL
;
2042 sig
= match_subroutine_by_name(func_name
, &actual_parameters
, state
, &sub_var
);
2046 no_matching_function_error(func_name
, &loc
, &actual_parameters
, state
);
2047 value
= ir_rvalue::error_value(ctx
);
2048 } else if (!verify_parameter_modes(state
, sig
, actual_parameters
, this->expressions
)) {
2049 /* an error has already been emitted */
2050 value
= ir_rvalue::error_value(ctx
);
2052 value
= generate_call(instructions
, sig
, &actual_parameters
, sub_var
, array_idx
, state
);
2054 ir_variable
*const tmp
= new(ctx
) ir_variable(glsl_type::void_type
,
2057 instructions
->push_tail(tmp
);
2058 value
= new(ctx
) ir_dereference_variable(tmp
);
2065 unreachable("not reached");
2069 ast_function_expression::has_sequence_subexpression() const
2071 foreach_list_typed(const ast_node
, ast
, link
, &this->expressions
) {
2072 if (ast
->has_sequence_subexpression())
2080 ast_aggregate_initializer::hir(exec_list
*instructions
,
2081 struct _mesa_glsl_parse_state
*state
)
2084 YYLTYPE loc
= this->get_location();
2086 if (!this->constructor_type
) {
2087 _mesa_glsl_error(&loc
, state
, "type of C-style initializer unknown");
2088 return ir_rvalue::error_value(ctx
);
2090 const glsl_type
*const constructor_type
= this->constructor_type
;
2092 if (!state
->has_420pack()) {
2093 _mesa_glsl_error(&loc
, state
, "C-style initialization requires the "
2094 "GL_ARB_shading_language_420pack extension");
2095 return ir_rvalue::error_value(ctx
);
2098 if (constructor_type
->is_array()) {
2099 return process_array_constructor(instructions
, constructor_type
, &loc
,
2100 &this->expressions
, state
);
2103 if (constructor_type
->is_record()) {
2104 return process_record_constructor(instructions
, constructor_type
, &loc
,
2105 &this->expressions
, state
);
2108 return process_vec_mat_constructor(instructions
, constructor_type
, &loc
,
2109 &this->expressions
, state
);