Merge remote branch 'origin/master' into pipe-video
[mesa.git] / src / glsl / ast_function.cpp
1 /*
2 * Copyright © 2010 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
22 */
23
24 #include "glsl_symbol_table.h"
25 #include "ast.h"
26 #include "glsl_types.h"
27 #include "ir.h"
28 #include "main/core.h" /* for MIN2 */
29
30 static ir_rvalue *
31 convert_component(ir_rvalue *src, const glsl_type *desired_type);
32
33 bool
34 apply_implicit_conversion(const glsl_type *to, ir_rvalue * &from,
35 struct _mesa_glsl_parse_state *state);
36
37 static unsigned
38 process_parameters(exec_list *instructions, exec_list *actual_parameters,
39 exec_list *parameters,
40 struct _mesa_glsl_parse_state *state)
41 {
42 unsigned count = 0;
43
44 foreach_list (n, parameters) {
45 ast_node *const ast = exec_node_data(ast_node, n, link);
46 ir_rvalue *result = ast->hir(instructions, state);
47
48 ir_constant *const constant = result->constant_expression_value();
49 if (constant != NULL)
50 result = constant;
51
52 actual_parameters->push_tail(result);
53 count++;
54 }
55
56 return count;
57 }
58
59
60 /**
61 * Generate a source prototype for a function signature
62 *
63 * \param return_type Return type of the function. May be \c NULL.
64 * \param name Name of the function.
65 * \param parameters Parameter list for the function. This may be either a
66 * formal or actual parameter list. Only the type is used.
67 *
68 * \return
69 * A talloced string representing the prototype of the function.
70 */
71 char *
72 prototype_string(const glsl_type *return_type, const char *name,
73 exec_list *parameters)
74 {
75 char *str = NULL;
76
77 if (return_type != NULL)
78 str = talloc_asprintf(str, "%s ", return_type->name);
79
80 str = talloc_asprintf_append(str, "%s(", name);
81
82 const char *comma = "";
83 foreach_list(node, parameters) {
84 const ir_instruction *const param = (ir_instruction *) node;
85
86 str = talloc_asprintf_append(str, "%s%s", comma, param->type->name);
87 comma = ", ";
88 }
89
90 str = talloc_strdup_append(str, ")");
91 return str;
92 }
93
94
95 static ir_rvalue *
96 process_call(exec_list *instructions, ir_function *f,
97 YYLTYPE *loc, exec_list *actual_parameters,
98 struct _mesa_glsl_parse_state *state)
99 {
100 void *ctx = state;
101
102 ir_function_signature *sig = f->matching_signature(actual_parameters);
103
104 if (sig != NULL) {
105 /* Verify that 'out' and 'inout' actual parameters are lvalues. This
106 * isn't done in ir_function::matching_signature because that function
107 * cannot generate the necessary diagnostics.
108 */
109 exec_list_iterator actual_iter = actual_parameters->iterator();
110 exec_list_iterator formal_iter = sig->parameters.iterator();
111
112 while (actual_iter.has_next()) {
113 ir_rvalue *actual = (ir_rvalue *) actual_iter.get();
114 ir_variable *formal = (ir_variable *) formal_iter.get();
115
116 assert(actual != NULL);
117 assert(formal != NULL);
118
119 if ((formal->mode == ir_var_out)
120 || (formal->mode == ir_var_inout)) {
121 if (! actual->is_lvalue()) {
122 /* FINISHME: Log a better diagnostic here. There is no way
123 * FINISHME: to tell the user which parameter is invalid.
124 */
125 _mesa_glsl_error(loc, state, "`%s' parameter is not lvalue",
126 (formal->mode == ir_var_out) ? "out" : "inout");
127 }
128 }
129
130 if (formal->type->is_numeric() || formal->type->is_boolean()) {
131 ir_rvalue *converted = convert_component(actual, formal->type);
132 actual->replace_with(converted);
133 }
134
135 actual_iter.next();
136 formal_iter.next();
137 }
138
139 /* Always insert the call in the instruction stream, and return a deref
140 * of its return val if it returns a value, since we don't know if
141 * the rvalue is going to be assigned to anything or not.
142 */
143 ir_call *call = new(ctx) ir_call(sig, actual_parameters);
144 if (!sig->return_type->is_void()) {
145 ir_variable *var;
146 ir_dereference_variable *deref;
147
148 var = new(ctx) ir_variable(sig->return_type,
149 talloc_asprintf(ctx, "%s_retval",
150 sig->function_name()),
151 ir_var_temporary);
152 instructions->push_tail(var);
153
154 deref = new(ctx) ir_dereference_variable(var);
155 ir_assignment *assign = new(ctx) ir_assignment(deref, call, NULL);
156 instructions->push_tail(assign);
157 if (state->language_version >= 120)
158 var->constant_value = call->constant_expression_value();
159
160 deref = new(ctx) ir_dereference_variable(var);
161 return deref;
162 } else {
163 instructions->push_tail(call);
164 return NULL;
165 }
166 } else {
167 char *str = prototype_string(NULL, f->name, actual_parameters);
168
169 _mesa_glsl_error(loc, state, "no matching function for call to `%s'",
170 str);
171 talloc_free(str);
172
173 const char *prefix = "candidates are: ";
174 foreach_list (node, &f->signatures) {
175 ir_function_signature *sig = (ir_function_signature *) node;
176
177 str = prototype_string(sig->return_type, f->name, &sig->parameters);
178 _mesa_glsl_error(loc, state, "%s%s\n", prefix, str);
179 talloc_free(str);
180
181 prefix = " ";
182 }
183
184 return ir_call::get_error_instruction(ctx);
185 }
186 }
187
188
189 static ir_rvalue *
190 match_function_by_name(exec_list *instructions, const char *name,
191 YYLTYPE *loc, exec_list *actual_parameters,
192 struct _mesa_glsl_parse_state *state)
193 {
194 void *ctx = state;
195 ir_function *f = state->symbols->get_function(name);
196
197 if (f == NULL) {
198 _mesa_glsl_error(loc, state, "function `%s' undeclared", name);
199 return ir_call::get_error_instruction(ctx);
200 }
201
202 /* Once we've determined that the function being called might exist, try
203 * to find an overload of the function that matches the parameters.
204 */
205 return process_call(instructions, f, loc, actual_parameters, state);
206 }
207
208
209 /**
210 * Perform automatic type conversion of constructor parameters
211 *
212 * This implements the rules in the "Conversion and Scalar Constructors"
213 * section (GLSL 1.10 section 5.4.1), not the "Implicit Conversions" rules.
214 */
215 static ir_rvalue *
216 convert_component(ir_rvalue *src, const glsl_type *desired_type)
217 {
218 void *ctx = talloc_parent(src);
219 const unsigned a = desired_type->base_type;
220 const unsigned b = src->type->base_type;
221 ir_expression *result = NULL;
222
223 if (src->type->is_error())
224 return src;
225
226 assert(a <= GLSL_TYPE_BOOL);
227 assert(b <= GLSL_TYPE_BOOL);
228
229 if ((a == b) || (src->type->is_integer() && desired_type->is_integer()))
230 return src;
231
232 switch (a) {
233 case GLSL_TYPE_UINT:
234 case GLSL_TYPE_INT:
235 if (b == GLSL_TYPE_FLOAT)
236 result = new(ctx) ir_expression(ir_unop_f2i, desired_type, src, NULL);
237 else {
238 assert(b == GLSL_TYPE_BOOL);
239 result = new(ctx) ir_expression(ir_unop_b2i, desired_type, src, NULL);
240 }
241 break;
242 case GLSL_TYPE_FLOAT:
243 switch (b) {
244 case GLSL_TYPE_UINT:
245 result = new(ctx) ir_expression(ir_unop_u2f, desired_type, src, NULL);
246 break;
247 case GLSL_TYPE_INT:
248 result = new(ctx) ir_expression(ir_unop_i2f, desired_type, src, NULL);
249 break;
250 case GLSL_TYPE_BOOL:
251 result = new(ctx) ir_expression(ir_unop_b2f, desired_type, src, NULL);
252 break;
253 }
254 break;
255 case GLSL_TYPE_BOOL:
256 switch (b) {
257 case GLSL_TYPE_UINT:
258 case GLSL_TYPE_INT:
259 result = new(ctx) ir_expression(ir_unop_i2b, desired_type, src, NULL);
260 break;
261 case GLSL_TYPE_FLOAT:
262 result = new(ctx) ir_expression(ir_unop_f2b, desired_type, src, NULL);
263 break;
264 }
265 break;
266 }
267
268 assert(result != NULL);
269
270 /* Try constant folding; it may fold in the conversion we just added. */
271 ir_constant *const constant = result->constant_expression_value();
272 return (constant != NULL) ? (ir_rvalue *) constant : (ir_rvalue *) result;
273 }
274
275 /**
276 * Dereference a specific component from a scalar, vector, or matrix
277 */
278 static ir_rvalue *
279 dereference_component(ir_rvalue *src, unsigned component)
280 {
281 void *ctx = talloc_parent(src);
282 assert(component < src->type->components());
283
284 /* If the source is a constant, just create a new constant instead of a
285 * dereference of the existing constant.
286 */
287 ir_constant *constant = src->as_constant();
288 if (constant)
289 return new(ctx) ir_constant(constant, component);
290
291 if (src->type->is_scalar()) {
292 return src;
293 } else if (src->type->is_vector()) {
294 return new(ctx) ir_swizzle(src, component, 0, 0, 0, 1);
295 } else {
296 assert(src->type->is_matrix());
297
298 /* Dereference a row of the matrix, then call this function again to get
299 * a specific element from that row.
300 */
301 const int c = component / src->type->column_type()->vector_elements;
302 const int r = component % src->type->column_type()->vector_elements;
303 ir_constant *const col_index = new(ctx) ir_constant(c);
304 ir_dereference *const col = new(ctx) ir_dereference_array(src, col_index);
305
306 col->type = src->type->column_type();
307
308 return dereference_component(col, r);
309 }
310
311 assert(!"Should not get here.");
312 return NULL;
313 }
314
315
316 static ir_rvalue *
317 process_array_constructor(exec_list *instructions,
318 const glsl_type *constructor_type,
319 YYLTYPE *loc, exec_list *parameters,
320 struct _mesa_glsl_parse_state *state)
321 {
322 void *ctx = state;
323 /* Array constructors come in two forms: sized and unsized. Sized array
324 * constructors look like 'vec4[2](a, b)', where 'a' and 'b' are vec4
325 * variables. In this case the number of parameters must exactly match the
326 * specified size of the array.
327 *
328 * Unsized array constructors look like 'vec4[](a, b)', where 'a' and 'b'
329 * are vec4 variables. In this case the size of the array being constructed
330 * is determined by the number of parameters.
331 *
332 * From page 52 (page 58 of the PDF) of the GLSL 1.50 spec:
333 *
334 * "There must be exactly the same number of arguments as the size of
335 * the array being constructed. If no size is present in the
336 * constructor, then the array is explicitly sized to the number of
337 * arguments provided. The arguments are assigned in order, starting at
338 * element 0, to the elements of the constructed array. Each argument
339 * must be the same type as the element type of the array, or be a type
340 * that can be converted to the element type of the array according to
341 * Section 4.1.10 "Implicit Conversions.""
342 */
343 exec_list actual_parameters;
344 const unsigned parameter_count =
345 process_parameters(instructions, &actual_parameters, parameters, state);
346
347 if ((parameter_count == 0)
348 || ((constructor_type->length != 0)
349 && (constructor_type->length != parameter_count))) {
350 const unsigned min_param = (constructor_type->length == 0)
351 ? 1 : constructor_type->length;
352
353 _mesa_glsl_error(loc, state, "array constructor must have %s %u "
354 "parameter%s",
355 (constructor_type->length != 0) ? "at least" : "exactly",
356 min_param, (min_param <= 1) ? "" : "s");
357 return ir_call::get_error_instruction(ctx);
358 }
359
360 if (constructor_type->length == 0) {
361 constructor_type =
362 glsl_type::get_array_instance(constructor_type->element_type(),
363 parameter_count);
364 assert(constructor_type != NULL);
365 assert(constructor_type->length == parameter_count);
366 }
367
368 bool all_parameters_are_constant = true;
369
370 /* Type cast each parameter and, if possible, fold constants. */
371 foreach_list_safe(n, &actual_parameters) {
372 ir_rvalue *ir = (ir_rvalue *) n;
373 ir_rvalue *result = ir;
374
375 /* Apply implicit conversions (not the scalar constructor rules!) */
376 if (constructor_type->element_type()->is_float()) {
377 const glsl_type *desired_type =
378 glsl_type::get_instance(GLSL_TYPE_FLOAT,
379 ir->type->vector_elements,
380 ir->type->matrix_columns);
381 result = convert_component(ir, desired_type);
382 }
383
384 if (result->type != constructor_type->element_type()) {
385 _mesa_glsl_error(loc, state, "type error in array constructor: "
386 "expected: %s, found %s",
387 constructor_type->element_type()->name,
388 result->type->name);
389 }
390
391 /* Attempt to convert the parameter to a constant valued expression.
392 * After doing so, track whether or not all the parameters to the
393 * constructor are trivially constant valued expressions.
394 */
395 ir_rvalue *const constant = result->constant_expression_value();
396
397 if (constant != NULL)
398 result = constant;
399 else
400 all_parameters_are_constant = false;
401
402 ir->replace_with(result);
403 }
404
405 if (all_parameters_are_constant)
406 return new(ctx) ir_constant(constructor_type, &actual_parameters);
407
408 ir_variable *var = new(ctx) ir_variable(constructor_type, "array_ctor",
409 ir_var_temporary);
410 instructions->push_tail(var);
411
412 int i = 0;
413 foreach_list(node, &actual_parameters) {
414 ir_rvalue *rhs = (ir_rvalue *) node;
415 ir_rvalue *lhs = new(ctx) ir_dereference_array(var,
416 new(ctx) ir_constant(i));
417
418 ir_instruction *assignment = new(ctx) ir_assignment(lhs, rhs, NULL);
419 instructions->push_tail(assignment);
420
421 i++;
422 }
423
424 return new(ctx) ir_dereference_variable(var);
425 }
426
427
428 /**
429 * Try to convert a record constructor to a constant expression
430 */
431 static ir_constant *
432 constant_record_constructor(const glsl_type *constructor_type,
433 exec_list *parameters, void *mem_ctx)
434 {
435 foreach_list(node, parameters) {
436 ir_constant *constant = ((ir_instruction *) node)->as_constant();
437 if (constant == NULL)
438 return NULL;
439 node->replace_with(constant);
440 }
441
442 return new(mem_ctx) ir_constant(constructor_type, parameters);
443 }
444
445
446 /**
447 * Determine if a list consists of a single scalar r-value
448 */
449 bool
450 single_scalar_parameter(exec_list *parameters)
451 {
452 const ir_rvalue *const p = (ir_rvalue *) parameters->head;
453 assert(((ir_rvalue *)p)->as_rvalue() != NULL);
454
455 return (p->type->is_scalar() && p->next->is_tail_sentinel());
456 }
457
458
459 /**
460 * Generate inline code for a vector constructor
461 *
462 * The generated constructor code will consist of a temporary variable
463 * declaration of the same type as the constructor. A sequence of assignments
464 * from constructor parameters to the temporary will follow.
465 *
466 * \return
467 * An \c ir_dereference_variable of the temprorary generated in the constructor
468 * body.
469 */
470 ir_rvalue *
471 emit_inline_vector_constructor(const glsl_type *type,
472 exec_list *instructions,
473 exec_list *parameters,
474 void *ctx)
475 {
476 assert(!parameters->is_empty());
477
478 ir_variable *var = new(ctx) ir_variable(type, "vec_ctor", ir_var_temporary);
479 instructions->push_tail(var);
480
481 /* There are two kinds of vector constructors.
482 *
483 * - Construct a vector from a single scalar by replicating that scalar to
484 * all components of the vector.
485 *
486 * - Construct a vector from an arbirary combination of vectors and
487 * scalars. The components of the constructor parameters are assigned
488 * to the vector in order until the vector is full.
489 */
490 const unsigned lhs_components = type->components();
491 if (single_scalar_parameter(parameters)) {
492 ir_rvalue *first_param = (ir_rvalue *)parameters->head;
493 ir_rvalue *rhs = new(ctx) ir_swizzle(first_param, 0, 0, 0, 0,
494 lhs_components);
495 ir_dereference_variable *lhs = new(ctx) ir_dereference_variable(var);
496 const unsigned mask = (1U << lhs_components) - 1;
497
498 assert(rhs->type == lhs->type);
499
500 ir_instruction *inst = new(ctx) ir_assignment(lhs, rhs, NULL, mask);
501 instructions->push_tail(inst);
502 } else {
503 unsigned base_component = 0;
504 unsigned base_lhs_component = 0;
505 ir_constant_data data;
506 unsigned constant_mask = 0, constant_components = 0;
507
508 memset(&data, 0, sizeof(data));
509
510 foreach_list(node, parameters) {
511 ir_rvalue *param = (ir_rvalue *) node;
512 unsigned rhs_components = param->type->components();
513
514 /* Do not try to assign more components to the vector than it has!
515 */
516 if ((rhs_components + base_lhs_component) > lhs_components) {
517 rhs_components = lhs_components - base_lhs_component;
518 }
519
520 const ir_constant *const c = param->as_constant();
521 if (c != NULL) {
522 for (unsigned i = 0; i < rhs_components; i++) {
523 switch (c->type->base_type) {
524 case GLSL_TYPE_UINT:
525 data.u[i + base_component] = c->get_uint_component(i);
526 break;
527 case GLSL_TYPE_INT:
528 data.i[i + base_component] = c->get_int_component(i);
529 break;
530 case GLSL_TYPE_FLOAT:
531 data.f[i + base_component] = c->get_float_component(i);
532 break;
533 case GLSL_TYPE_BOOL:
534 data.b[i + base_component] = c->get_bool_component(i);
535 break;
536 default:
537 assert(!"Should not get here.");
538 break;
539 }
540 }
541
542 /* Mask of fields to be written in the assignment.
543 */
544 constant_mask |= ((1U << rhs_components) - 1) << base_lhs_component;
545 constant_components += rhs_components;
546
547 base_component += rhs_components;
548 }
549 /* Advance the component index by the number of components
550 * that were just assigned.
551 */
552 base_lhs_component += rhs_components;
553 }
554
555 if (constant_mask != 0) {
556 ir_dereference *lhs = new(ctx) ir_dereference_variable(var);
557 const glsl_type *rhs_type = glsl_type::get_instance(var->type->base_type,
558 constant_components,
559 1);
560 ir_rvalue *rhs = new(ctx) ir_constant(rhs_type, &data);
561
562 ir_instruction *inst =
563 new(ctx) ir_assignment(lhs, rhs, NULL, constant_mask);
564 instructions->push_tail(inst);
565 }
566
567 base_component = 0;
568 foreach_list(node, parameters) {
569 ir_rvalue *param = (ir_rvalue *) node;
570 unsigned rhs_components = param->type->components();
571
572 /* Do not try to assign more components to the vector than it has!
573 */
574 if ((rhs_components + base_component) > lhs_components) {
575 rhs_components = lhs_components - base_component;
576 }
577
578 const ir_constant *const c = param->as_constant();
579 if (c == NULL) {
580 /* Generate a swizzle in case rhs_components != rhs->type->vector_elements. */
581 unsigned swiz[4] = { 0, 0, 0, 0 };
582 for (unsigned i = 0; i < rhs_components; i++)
583 swiz[i] = i;
584
585 /* Mask of fields to be written in the assignment.
586 */
587 const unsigned write_mask = ((1U << rhs_components) - 1)
588 << base_component;
589
590 ir_dereference *lhs = new(ctx) ir_dereference_variable(var);
591 ir_rvalue *rhs = new(ctx) ir_swizzle(param, swiz, rhs_components);
592
593 ir_instruction *inst =
594 new(ctx) ir_assignment(lhs, rhs, NULL, write_mask);
595 instructions->push_tail(inst);
596 }
597
598 /* Advance the component index by the number of components that were
599 * just assigned.
600 */
601 base_component += rhs_components;
602 }
603 }
604 return new(ctx) ir_dereference_variable(var);
605 }
606
607
608 /**
609 * Generate assignment of a portion of a vector to a portion of a matrix column
610 *
611 * \param src_base First component of the source to be used in assignment
612 * \param column Column of destination to be assiged
613 * \param row_base First component of the destination column to be assigned
614 * \param count Number of components to be assigned
615 *
616 * \note
617 * \c src_base + \c count must be less than or equal to the number of components
618 * in the source vector.
619 */
620 ir_instruction *
621 assign_to_matrix_column(ir_variable *var, unsigned column, unsigned row_base,
622 ir_rvalue *src, unsigned src_base, unsigned count,
623 void *mem_ctx)
624 {
625 ir_constant *col_idx = new(mem_ctx) ir_constant(column);
626 ir_dereference *column_ref = new(mem_ctx) ir_dereference_array(var, col_idx);
627
628 assert(column_ref->type->components() >= (row_base + count));
629 assert(src->type->components() >= (src_base + count));
630
631 /* Generate a swizzle that puts the first element of the source at the
632 * location of the first element of the destination.
633 */
634 unsigned swiz[4] = { src_base, src_base, src_base, src_base };
635 for (unsigned i = 0; i < count; i++)
636 swiz[i + row_base] = i;
637
638 ir_rvalue *const rhs =
639 new(mem_ctx) ir_swizzle(src, swiz, count);
640
641 /* Mask of fields to be written in the assignment.
642 */
643 const unsigned write_mask = ((1U << count) - 1) << row_base;
644
645 return new(mem_ctx) ir_assignment(column_ref, rhs, NULL, write_mask);
646 }
647
648
649 /**
650 * Generate inline code for a matrix constructor
651 *
652 * The generated constructor code will consist of a temporary variable
653 * declaration of the same type as the constructor. A sequence of assignments
654 * from constructor parameters to the temporary will follow.
655 *
656 * \return
657 * An \c ir_dereference_variable of the temprorary generated in the constructor
658 * body.
659 */
660 ir_rvalue *
661 emit_inline_matrix_constructor(const glsl_type *type,
662 exec_list *instructions,
663 exec_list *parameters,
664 void *ctx)
665 {
666 assert(!parameters->is_empty());
667
668 ir_variable *var = new(ctx) ir_variable(type, "mat_ctor", ir_var_temporary);
669 instructions->push_tail(var);
670
671 /* There are three kinds of matrix constructors.
672 *
673 * - Construct a matrix from a single scalar by replicating that scalar to
674 * along the diagonal of the matrix and setting all other components to
675 * zero.
676 *
677 * - Construct a matrix from an arbirary combination of vectors and
678 * scalars. The components of the constructor parameters are assigned
679 * to the matrix in colum-major order until the matrix is full.
680 *
681 * - Construct a matrix from a single matrix. The source matrix is copied
682 * to the upper left portion of the constructed matrix, and the remaining
683 * elements take values from the identity matrix.
684 */
685 ir_rvalue *const first_param = (ir_rvalue *) parameters->head;
686 if (single_scalar_parameter(parameters)) {
687 /* Assign the scalar to the X component of a vec4, and fill the remaining
688 * components with zero.
689 */
690 ir_variable *rhs_var =
691 new(ctx) ir_variable(glsl_type::vec4_type, "mat_ctor_vec",
692 ir_var_temporary);
693 instructions->push_tail(rhs_var);
694
695 ir_constant_data zero;
696 zero.f[0] = 0.0;
697 zero.f[1] = 0.0;
698 zero.f[2] = 0.0;
699 zero.f[3] = 0.0;
700
701 ir_instruction *inst =
702 new(ctx) ir_assignment(new(ctx) ir_dereference_variable(rhs_var),
703 new(ctx) ir_constant(rhs_var->type, &zero),
704 NULL);
705 instructions->push_tail(inst);
706
707 ir_dereference *const rhs_ref = new(ctx) ir_dereference_variable(rhs_var);
708
709 inst = new(ctx) ir_assignment(rhs_ref, first_param, NULL, 0x01);
710 instructions->push_tail(inst);
711
712 /* Assign the temporary vector to each column of the destination matrix
713 * with a swizzle that puts the X component on the diagonal of the
714 * matrix. In some cases this may mean that the X component does not
715 * get assigned into the column at all (i.e., when the matrix has more
716 * columns than rows).
717 */
718 static const unsigned rhs_swiz[4][4] = {
719 { 0, 1, 1, 1 },
720 { 1, 0, 1, 1 },
721 { 1, 1, 0, 1 },
722 { 1, 1, 1, 0 }
723 };
724
725 const unsigned cols_to_init = MIN2(type->matrix_columns,
726 type->vector_elements);
727 for (unsigned i = 0; i < cols_to_init; i++) {
728 ir_constant *const col_idx = new(ctx) ir_constant(i);
729 ir_rvalue *const col_ref = new(ctx) ir_dereference_array(var, col_idx);
730
731 ir_rvalue *const rhs_ref = new(ctx) ir_dereference_variable(rhs_var);
732 ir_rvalue *const rhs = new(ctx) ir_swizzle(rhs_ref, rhs_swiz[i],
733 type->vector_elements);
734
735 inst = new(ctx) ir_assignment(col_ref, rhs, NULL);
736 instructions->push_tail(inst);
737 }
738
739 for (unsigned i = cols_to_init; i < type->matrix_columns; i++) {
740 ir_constant *const col_idx = new(ctx) ir_constant(i);
741 ir_rvalue *const col_ref = new(ctx) ir_dereference_array(var, col_idx);
742
743 ir_rvalue *const rhs_ref = new(ctx) ir_dereference_variable(rhs_var);
744 ir_rvalue *const rhs = new(ctx) ir_swizzle(rhs_ref, 1, 1, 1, 1,
745 type->vector_elements);
746
747 inst = new(ctx) ir_assignment(col_ref, rhs, NULL);
748 instructions->push_tail(inst);
749 }
750 } else if (first_param->type->is_matrix()) {
751 /* From page 50 (56 of the PDF) of the GLSL 1.50 spec:
752 *
753 * "If a matrix is constructed from a matrix, then each component
754 * (column i, row j) in the result that has a corresponding
755 * component (column i, row j) in the argument will be initialized
756 * from there. All other components will be initialized to the
757 * identity matrix. If a matrix argument is given to a matrix
758 * constructor, it is an error to have any other arguments."
759 */
760 assert(first_param->next->is_tail_sentinel());
761 ir_rvalue *const src_matrix = first_param;
762
763 /* If the source matrix is smaller, pre-initialize the relavent parts of
764 * the destination matrix to the identity matrix.
765 */
766 if ((src_matrix->type->matrix_columns < var->type->matrix_columns)
767 || (src_matrix->type->vector_elements < var->type->vector_elements)) {
768
769 /* If the source matrix has fewer rows, every column of the destination
770 * must be initialized. Otherwise only the columns in the destination
771 * that do not exist in the source must be initialized.
772 */
773 unsigned col =
774 (src_matrix->type->vector_elements < var->type->vector_elements)
775 ? 0 : src_matrix->type->matrix_columns;
776
777 const glsl_type *const col_type = var->type->column_type();
778 for (/* empty */; col < var->type->matrix_columns; col++) {
779 ir_constant_data ident;
780
781 ident.f[0] = 0.0;
782 ident.f[1] = 0.0;
783 ident.f[2] = 0.0;
784 ident.f[3] = 0.0;
785
786 ident.f[col] = 1.0;
787
788 ir_rvalue *const rhs = new(ctx) ir_constant(col_type, &ident);
789
790 ir_rvalue *const lhs =
791 new(ctx) ir_dereference_array(var, new(ctx) ir_constant(col));
792
793 ir_instruction *inst = new(ctx) ir_assignment(lhs, rhs, NULL);
794 instructions->push_tail(inst);
795 }
796 }
797
798 /* Assign columns from the source matrix to the destination matrix.
799 *
800 * Since the parameter will be used in the RHS of multiple assignments,
801 * generate a temporary and copy the paramter there.
802 */
803 ir_variable *const rhs_var =
804 new(ctx) ir_variable(first_param->type, "mat_ctor_mat",
805 ir_var_temporary);
806 instructions->push_tail(rhs_var);
807
808 ir_dereference *const rhs_var_ref =
809 new(ctx) ir_dereference_variable(rhs_var);
810 ir_instruction *const inst =
811 new(ctx) ir_assignment(rhs_var_ref, first_param, NULL);
812 instructions->push_tail(inst);
813
814 const unsigned last_row = MIN2(src_matrix->type->vector_elements,
815 var->type->vector_elements);
816 const unsigned last_col = MIN2(src_matrix->type->matrix_columns,
817 var->type->matrix_columns);
818
819 unsigned swiz[4] = { 0, 0, 0, 0 };
820 for (unsigned i = 1; i < last_row; i++)
821 swiz[i] = i;
822
823 const unsigned write_mask = (1U << last_row) - 1;
824
825 for (unsigned i = 0; i < last_col; i++) {
826 ir_dereference *const lhs =
827 new(ctx) ir_dereference_array(var, new(ctx) ir_constant(i));
828 ir_rvalue *const rhs_col =
829 new(ctx) ir_dereference_array(rhs_var, new(ctx) ir_constant(i));
830
831 /* If one matrix has columns that are smaller than the columns of the
832 * other matrix, wrap the column access of the larger with a swizzle
833 * so that the LHS and RHS of the assignment have the same size (and
834 * therefore have the same type).
835 *
836 * It would be perfectly valid to unconditionally generate the
837 * swizzles, this this will typically result in a more compact IR tree.
838 */
839 ir_rvalue *rhs;
840 if (lhs->type->vector_elements != rhs_col->type->vector_elements) {
841 rhs = new(ctx) ir_swizzle(rhs_col, swiz, last_row);
842 } else {
843 rhs = rhs_col;
844 }
845
846 ir_instruction *inst =
847 new(ctx) ir_assignment(lhs, rhs, NULL, write_mask);
848 instructions->push_tail(inst);
849 }
850 } else {
851 const unsigned cols = type->matrix_columns;
852 const unsigned rows = type->vector_elements;
853 unsigned col_idx = 0;
854 unsigned row_idx = 0;
855
856 foreach_list (node, parameters) {
857 ir_rvalue *const rhs = (ir_rvalue *) node;
858 const unsigned components_remaining_this_column = rows - row_idx;
859 unsigned rhs_components = rhs->type->components();
860 unsigned rhs_base = 0;
861
862 /* Since the parameter might be used in the RHS of two assignments,
863 * generate a temporary and copy the paramter there.
864 */
865 ir_variable *rhs_var =
866 new(ctx) ir_variable(rhs->type, "mat_ctor_vec", ir_var_temporary);
867 instructions->push_tail(rhs_var);
868
869 ir_dereference *rhs_var_ref =
870 new(ctx) ir_dereference_variable(rhs_var);
871 ir_instruction *inst = new(ctx) ir_assignment(rhs_var_ref, rhs, NULL);
872 instructions->push_tail(inst);
873
874 /* Assign the current parameter to as many components of the matrix
875 * as it will fill.
876 *
877 * NOTE: A single vector parameter can span two matrix columns. A
878 * single vec4, for example, can completely fill a mat2.
879 */
880 if (rhs_components >= components_remaining_this_column) {
881 const unsigned count = MIN2(rhs_components,
882 components_remaining_this_column);
883
884 rhs_var_ref = new(ctx) ir_dereference_variable(rhs_var);
885
886 ir_instruction *inst = assign_to_matrix_column(var, col_idx,
887 row_idx,
888 rhs_var_ref, 0,
889 count, ctx);
890 instructions->push_tail(inst);
891
892 rhs_base = count;
893
894 col_idx++;
895 row_idx = 0;
896 }
897
898 /* If there is data left in the parameter and components left to be
899 * set in the destination, emit another assignment. It is possible
900 * that the assignment could be of a vec4 to the last element of the
901 * matrix. In this case col_idx==cols, but there is still data
902 * left in the source parameter. Obviously, don't emit an assignment
903 * to data outside the destination matrix.
904 */
905 if ((col_idx < cols) && (rhs_base < rhs_components)) {
906 const unsigned count = rhs_components - rhs_base;
907
908 rhs_var_ref = new(ctx) ir_dereference_variable(rhs_var);
909
910 ir_instruction *inst = assign_to_matrix_column(var, col_idx,
911 row_idx,
912 rhs_var_ref,
913 rhs_base,
914 count, ctx);
915 instructions->push_tail(inst);
916
917 row_idx += count;
918 }
919 }
920 }
921
922 return new(ctx) ir_dereference_variable(var);
923 }
924
925
926 ir_rvalue *
927 emit_inline_record_constructor(const glsl_type *type,
928 exec_list *instructions,
929 exec_list *parameters,
930 void *mem_ctx)
931 {
932 ir_variable *const var =
933 new(mem_ctx) ir_variable(type, "record_ctor", ir_var_temporary);
934 ir_dereference_variable *const d = new(mem_ctx) ir_dereference_variable(var);
935
936 instructions->push_tail(var);
937
938 exec_node *node = parameters->head;
939 for (unsigned i = 0; i < type->length; i++) {
940 assert(!node->is_tail_sentinel());
941
942 ir_dereference *const lhs =
943 new(mem_ctx) ir_dereference_record(d->clone(mem_ctx, NULL),
944 type->fields.structure[i].name);
945
946 ir_rvalue *const rhs = ((ir_instruction *) node)->as_rvalue();
947 assert(rhs != NULL);
948
949 ir_instruction *const assign = new(mem_ctx) ir_assignment(lhs, rhs, NULL);
950
951 instructions->push_tail(assign);
952 node = node->next;
953 }
954
955 return d;
956 }
957
958
959 ir_rvalue *
960 ast_function_expression::hir(exec_list *instructions,
961 struct _mesa_glsl_parse_state *state)
962 {
963 void *ctx = state;
964 /* There are three sorts of function calls.
965 *
966 * 1. constructors - The first subexpression is an ast_type_specifier.
967 * 2. methods - Only the .length() method of array types.
968 * 3. functions - Calls to regular old functions.
969 *
970 * Method calls are actually detected when the ast_field_selection
971 * expression is handled.
972 */
973 if (is_constructor()) {
974 const ast_type_specifier *type = (ast_type_specifier *) subexpressions[0];
975 YYLTYPE loc = type->get_location();
976 const char *name;
977
978 const glsl_type *const constructor_type = type->glsl_type(& name, state);
979
980
981 /* Constructors for samplers are illegal.
982 */
983 if (constructor_type->is_sampler()) {
984 _mesa_glsl_error(& loc, state, "cannot construct sampler type `%s'",
985 constructor_type->name);
986 return ir_call::get_error_instruction(ctx);
987 }
988
989 if (constructor_type->is_array()) {
990 if (state->language_version <= 110) {
991 _mesa_glsl_error(& loc, state,
992 "array constructors forbidden in GLSL 1.10");
993 return ir_call::get_error_instruction(ctx);
994 }
995
996 return process_array_constructor(instructions, constructor_type,
997 & loc, &this->expressions, state);
998 }
999
1000
1001 /* There are two kinds of constructor call. Constructors for built-in
1002 * language types, such as mat4 and vec2, are free form. The only
1003 * requirement is that the parameters must provide enough values of the
1004 * correct scalar type. Constructors for arrays and structures must
1005 * have the exact number of parameters with matching types in the
1006 * correct order. These constructors follow essentially the same type
1007 * matching rules as functions.
1008 */
1009 if (!constructor_type->is_numeric() && !constructor_type->is_boolean())
1010 return ir_call::get_error_instruction(ctx);
1011
1012 /* Total number of components of the type being constructed. */
1013 const unsigned type_components = constructor_type->components();
1014
1015 /* Number of components from parameters that have actually been
1016 * consumed. This is used to perform several kinds of error checking.
1017 */
1018 unsigned components_used = 0;
1019
1020 unsigned matrix_parameters = 0;
1021 unsigned nonmatrix_parameters = 0;
1022 exec_list actual_parameters;
1023
1024 foreach_list (n, &this->expressions) {
1025 ast_node *ast = exec_node_data(ast_node, n, link);
1026 ir_rvalue *result = ast->hir(instructions, state)->as_rvalue();
1027
1028 /* From page 50 (page 56 of the PDF) of the GLSL 1.50 spec:
1029 *
1030 * "It is an error to provide extra arguments beyond this
1031 * last used argument."
1032 */
1033 if (components_used >= type_components) {
1034 _mesa_glsl_error(& loc, state, "too many parameters to `%s' "
1035 "constructor",
1036 constructor_type->name);
1037 return ir_call::get_error_instruction(ctx);
1038 }
1039
1040 if (!result->type->is_numeric() && !result->type->is_boolean()) {
1041 _mesa_glsl_error(& loc, state, "cannot construct `%s' from a "
1042 "non-numeric data type",
1043 constructor_type->name);
1044 return ir_call::get_error_instruction(ctx);
1045 }
1046
1047 /* Count the number of matrix and nonmatrix parameters. This
1048 * is used below to enforce some of the constructor rules.
1049 */
1050 if (result->type->is_matrix())
1051 matrix_parameters++;
1052 else
1053 nonmatrix_parameters++;
1054
1055 actual_parameters.push_tail(result);
1056 components_used += result->type->components();
1057 }
1058
1059 /* From page 28 (page 34 of the PDF) of the GLSL 1.10 spec:
1060 *
1061 * "It is an error to construct matrices from other matrices. This
1062 * is reserved for future use."
1063 */
1064 if (state->language_version == 110 && matrix_parameters > 0
1065 && constructor_type->is_matrix()) {
1066 _mesa_glsl_error(& loc, state, "cannot construct `%s' from a "
1067 "matrix in GLSL 1.10",
1068 constructor_type->name);
1069 return ir_call::get_error_instruction(ctx);
1070 }
1071
1072 /* From page 50 (page 56 of the PDF) of the GLSL 1.50 spec:
1073 *
1074 * "If a matrix argument is given to a matrix constructor, it is
1075 * an error to have any other arguments."
1076 */
1077 if ((matrix_parameters > 0)
1078 && ((matrix_parameters + nonmatrix_parameters) > 1)
1079 && constructor_type->is_matrix()) {
1080 _mesa_glsl_error(& loc, state, "for matrix `%s' constructor, "
1081 "matrix must be only parameter",
1082 constructor_type->name);
1083 return ir_call::get_error_instruction(ctx);
1084 }
1085
1086 /* From page 28 (page 34 of the PDF) of the GLSL 1.10 spec:
1087 *
1088 * "In these cases, there must be enough components provided in the
1089 * arguments to provide an initializer for every component in the
1090 * constructed value."
1091 */
1092 if (components_used < type_components && components_used != 1
1093 && matrix_parameters == 0) {
1094 _mesa_glsl_error(& loc, state, "too few components to construct "
1095 "`%s'",
1096 constructor_type->name);
1097 return ir_call::get_error_instruction(ctx);
1098 }
1099
1100 /* Later, we cast each parameter to the same base type as the
1101 * constructor. Since there are no non-floating point matrices, we
1102 * need to break them up into a series of column vectors.
1103 */
1104 if (constructor_type->base_type != GLSL_TYPE_FLOAT) {
1105 foreach_list_safe(n, &actual_parameters) {
1106 ir_rvalue *matrix = (ir_rvalue *) n;
1107
1108 if (!matrix->type->is_matrix())
1109 continue;
1110
1111 /* Create a temporary containing the matrix. */
1112 ir_variable *var = new(ctx) ir_variable(matrix->type, "matrix_tmp",
1113 ir_var_temporary);
1114 instructions->push_tail(var);
1115 instructions->push_tail(new(ctx) ir_assignment(new(ctx)
1116 ir_dereference_variable(var), matrix, NULL));
1117 var->constant_value = matrix->constant_expression_value();
1118
1119 /* Replace the matrix with dereferences of its columns. */
1120 for (int i = 0; i < matrix->type->matrix_columns; i++) {
1121 matrix->insert_before(new (ctx) ir_dereference_array(var,
1122 new(ctx) ir_constant(i)));
1123 }
1124 matrix->remove();
1125 }
1126 }
1127
1128 bool all_parameters_are_constant = true;
1129
1130 /* Type cast each parameter and, if possible, fold constants.*/
1131 foreach_list_safe(n, &actual_parameters) {
1132 ir_rvalue *ir = (ir_rvalue *) n;
1133
1134 const glsl_type *desired_type =
1135 glsl_type::get_instance(constructor_type->base_type,
1136 ir->type->vector_elements,
1137 ir->type->matrix_columns);
1138 ir_rvalue *result = convert_component(ir, desired_type);
1139
1140 /* Attempt to convert the parameter to a constant valued expression.
1141 * After doing so, track whether or not all the parameters to the
1142 * constructor are trivially constant valued expressions.
1143 */
1144 ir_rvalue *const constant = result->constant_expression_value();
1145
1146 if (constant != NULL)
1147 result = constant;
1148 else
1149 all_parameters_are_constant = false;
1150
1151 if (result != ir) {
1152 ir->replace_with(result);
1153 }
1154 }
1155
1156 /* If all of the parameters are trivially constant, create a
1157 * constant representing the complete collection of parameters.
1158 */
1159 if (all_parameters_are_constant) {
1160 return new(ctx) ir_constant(constructor_type, &actual_parameters);
1161 } else if (constructor_type->is_scalar()) {
1162 return dereference_component((ir_rvalue *) actual_parameters.head,
1163 0);
1164 } else if (constructor_type->is_vector()) {
1165 return emit_inline_vector_constructor(constructor_type,
1166 instructions,
1167 &actual_parameters,
1168 ctx);
1169 } else {
1170 assert(constructor_type->is_matrix());
1171 return emit_inline_matrix_constructor(constructor_type,
1172 instructions,
1173 &actual_parameters,
1174 ctx);
1175 }
1176 } else {
1177 const ast_expression *id = subexpressions[0];
1178 YYLTYPE loc = id->get_location();
1179 exec_list actual_parameters;
1180
1181 process_parameters(instructions, &actual_parameters, &this->expressions,
1182 state);
1183
1184 const glsl_type *const type =
1185 state->symbols->get_type(id->primary_expression.identifier);
1186
1187 if ((type != NULL) && type->is_record()) {
1188 exec_node *node = actual_parameters.head;
1189 for (unsigned i = 0; i < type->length; i++) {
1190 ir_rvalue *ir = (ir_rvalue *) node;
1191
1192 if (node->is_tail_sentinel()) {
1193 _mesa_glsl_error(&loc, state,
1194 "insufficient parameters to constructor "
1195 "for `%s'",
1196 type->name);
1197 return ir_call::get_error_instruction(ctx);
1198 }
1199
1200 if (apply_implicit_conversion(type->fields.structure[i].type, ir,
1201 state)) {
1202 node->replace_with(ir);
1203 } else {
1204 _mesa_glsl_error(&loc, state,
1205 "parameter type mismatch in constructor "
1206 "for `%s.%s' (%s vs %s)",
1207 type->name,
1208 type->fields.structure[i].name,
1209 ir->type->name,
1210 type->fields.structure[i].type->name);
1211 return ir_call::get_error_instruction(ctx);;
1212 }
1213
1214 node = node->next;
1215 }
1216
1217 if (!node->is_tail_sentinel()) {
1218 _mesa_glsl_error(&loc, state, "too many parameters in constructor "
1219 "for `%s'", type->name);
1220 return ir_call::get_error_instruction(ctx);
1221 }
1222
1223 ir_rvalue *const constant =
1224 constant_record_constructor(type, &actual_parameters, state);
1225
1226 return (constant != NULL)
1227 ? constant
1228 : emit_inline_record_constructor(type, instructions,
1229 &actual_parameters, state);
1230 }
1231
1232 return match_function_by_name(instructions,
1233 id->primary_expression.identifier, & loc,
1234 &actual_parameters, state);
1235 }
1236
1237 return ir_call::get_error_instruction(ctx);
1238 }