glsl/ast/ir: Add 64-bit integer constant support
[mesa.git] / src / compiler / glsl / ir.cpp
1 /*
2 * Copyright © 2010 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
22 */
23 #include <string.h>
24 #include "main/core.h" /* for MAX2 */
25 #include "ir.h"
26 #include "compiler/glsl_types.h"
27
28 ir_rvalue::ir_rvalue(enum ir_node_type t)
29 : ir_instruction(t)
30 {
31 this->type = glsl_type::error_type;
32 }
33
34 bool ir_rvalue::is_zero() const
35 {
36 return false;
37 }
38
39 bool ir_rvalue::is_one() const
40 {
41 return false;
42 }
43
44 bool ir_rvalue::is_negative_one() const
45 {
46 return false;
47 }
48
49 /**
50 * Modify the swizzle make to move one component to another
51 *
52 * \param m IR swizzle to be modified
53 * \param from Component in the RHS that is to be swizzled
54 * \param to Desired swizzle location of \c from
55 */
56 static void
57 update_rhs_swizzle(ir_swizzle_mask &m, unsigned from, unsigned to)
58 {
59 switch (to) {
60 case 0: m.x = from; break;
61 case 1: m.y = from; break;
62 case 2: m.z = from; break;
63 case 3: m.w = from; break;
64 default: assert(!"Should not get here.");
65 }
66 }
67
68 void
69 ir_assignment::set_lhs(ir_rvalue *lhs)
70 {
71 void *mem_ctx = this;
72 bool swizzled = false;
73
74 while (lhs != NULL) {
75 ir_swizzle *swiz = lhs->as_swizzle();
76
77 if (swiz == NULL)
78 break;
79
80 unsigned write_mask = 0;
81 ir_swizzle_mask rhs_swiz = { 0, 0, 0, 0, 0, 0 };
82
83 for (unsigned i = 0; i < swiz->mask.num_components; i++) {
84 unsigned c = 0;
85
86 switch (i) {
87 case 0: c = swiz->mask.x; break;
88 case 1: c = swiz->mask.y; break;
89 case 2: c = swiz->mask.z; break;
90 case 3: c = swiz->mask.w; break;
91 default: assert(!"Should not get here.");
92 }
93
94 write_mask |= (((this->write_mask >> i) & 1) << c);
95 update_rhs_swizzle(rhs_swiz, i, c);
96 rhs_swiz.num_components = swiz->val->type->vector_elements;
97 }
98
99 this->write_mask = write_mask;
100 lhs = swiz->val;
101
102 this->rhs = new(mem_ctx) ir_swizzle(this->rhs, rhs_swiz);
103 swizzled = true;
104 }
105
106 if (swizzled) {
107 /* Now, RHS channels line up with the LHS writemask. Collapse it
108 * to just the channels that will be written.
109 */
110 ir_swizzle_mask rhs_swiz = { 0, 0, 0, 0, 0, 0 };
111 int rhs_chan = 0;
112 for (int i = 0; i < 4; i++) {
113 if (write_mask & (1 << i))
114 update_rhs_swizzle(rhs_swiz, i, rhs_chan++);
115 }
116 rhs_swiz.num_components = rhs_chan;
117 this->rhs = new(mem_ctx) ir_swizzle(this->rhs, rhs_swiz);
118 }
119
120 assert((lhs == NULL) || lhs->as_dereference());
121
122 this->lhs = (ir_dereference *) lhs;
123 }
124
125 ir_variable *
126 ir_assignment::whole_variable_written()
127 {
128 ir_variable *v = this->lhs->whole_variable_referenced();
129
130 if (v == NULL)
131 return NULL;
132
133 if (v->type->is_scalar())
134 return v;
135
136 if (v->type->is_vector()) {
137 const unsigned mask = (1U << v->type->vector_elements) - 1;
138
139 if (mask != this->write_mask)
140 return NULL;
141 }
142
143 /* Either all the vector components are assigned or the variable is some
144 * composite type (and the whole thing is assigned.
145 */
146 return v;
147 }
148
149 ir_assignment::ir_assignment(ir_dereference *lhs, ir_rvalue *rhs,
150 ir_rvalue *condition, unsigned write_mask)
151 : ir_instruction(ir_type_assignment)
152 {
153 this->condition = condition;
154 this->rhs = rhs;
155 this->lhs = lhs;
156 this->write_mask = write_mask;
157
158 if (lhs->type->is_scalar() || lhs->type->is_vector()) {
159 int lhs_components = 0;
160 for (int i = 0; i < 4; i++) {
161 if (write_mask & (1 << i))
162 lhs_components++;
163 }
164
165 assert(lhs_components == this->rhs->type->vector_elements);
166 }
167 }
168
169 ir_assignment::ir_assignment(ir_rvalue *lhs, ir_rvalue *rhs,
170 ir_rvalue *condition)
171 : ir_instruction(ir_type_assignment)
172 {
173 this->condition = condition;
174 this->rhs = rhs;
175
176 /* If the RHS is a vector type, assume that all components of the vector
177 * type are being written to the LHS. The write mask comes from the RHS
178 * because we can have a case where the LHS is a vec4 and the RHS is a
179 * vec3. In that case, the assignment is:
180 *
181 * (assign (...) (xyz) (var_ref lhs) (var_ref rhs))
182 */
183 if (rhs->type->is_vector())
184 this->write_mask = (1U << rhs->type->vector_elements) - 1;
185 else if (rhs->type->is_scalar())
186 this->write_mask = 1;
187 else
188 this->write_mask = 0;
189
190 this->set_lhs(lhs);
191 }
192
193 ir_expression::ir_expression(int op, const struct glsl_type *type,
194 ir_rvalue *op0, ir_rvalue *op1,
195 ir_rvalue *op2, ir_rvalue *op3)
196 : ir_rvalue(ir_type_expression)
197 {
198 this->type = type;
199 this->operation = ir_expression_operation(op);
200 this->operands[0] = op0;
201 this->operands[1] = op1;
202 this->operands[2] = op2;
203 this->operands[3] = op3;
204 #ifndef NDEBUG
205 int num_operands = get_num_operands(this->operation);
206 for (int i = num_operands; i < 4; i++) {
207 assert(this->operands[i] == NULL);
208 }
209 #endif
210 }
211
212 ir_expression::ir_expression(int op, ir_rvalue *op0)
213 : ir_rvalue(ir_type_expression)
214 {
215 this->operation = ir_expression_operation(op);
216 this->operands[0] = op0;
217 this->operands[1] = NULL;
218 this->operands[2] = NULL;
219 this->operands[3] = NULL;
220
221 assert(op <= ir_last_unop);
222
223 switch (this->operation) {
224 case ir_unop_bit_not:
225 case ir_unop_logic_not:
226 case ir_unop_neg:
227 case ir_unop_abs:
228 case ir_unop_sign:
229 case ir_unop_rcp:
230 case ir_unop_rsq:
231 case ir_unop_sqrt:
232 case ir_unop_exp:
233 case ir_unop_log:
234 case ir_unop_exp2:
235 case ir_unop_log2:
236 case ir_unop_trunc:
237 case ir_unop_ceil:
238 case ir_unop_floor:
239 case ir_unop_fract:
240 case ir_unop_round_even:
241 case ir_unop_sin:
242 case ir_unop_cos:
243 case ir_unop_dFdx:
244 case ir_unop_dFdx_coarse:
245 case ir_unop_dFdx_fine:
246 case ir_unop_dFdy:
247 case ir_unop_dFdy_coarse:
248 case ir_unop_dFdy_fine:
249 case ir_unop_bitfield_reverse:
250 case ir_unop_interpolate_at_centroid:
251 case ir_unop_saturate:
252 this->type = op0->type;
253 break;
254
255 case ir_unop_f2i:
256 case ir_unop_b2i:
257 case ir_unop_u2i:
258 case ir_unop_d2i:
259 case ir_unop_bitcast_f2i:
260 case ir_unop_bit_count:
261 case ir_unop_find_msb:
262 case ir_unop_find_lsb:
263 case ir_unop_subroutine_to_int:
264 this->type = glsl_type::get_instance(GLSL_TYPE_INT,
265 op0->type->vector_elements, 1);
266 break;
267
268 case ir_unop_b2f:
269 case ir_unop_i2f:
270 case ir_unop_u2f:
271 case ir_unop_d2f:
272 case ir_unop_bitcast_i2f:
273 case ir_unop_bitcast_u2f:
274 this->type = glsl_type::get_instance(GLSL_TYPE_FLOAT,
275 op0->type->vector_elements, 1);
276 break;
277
278 case ir_unop_f2b:
279 case ir_unop_i2b:
280 case ir_unop_d2b:
281 this->type = glsl_type::get_instance(GLSL_TYPE_BOOL,
282 op0->type->vector_elements, 1);
283 break;
284
285 case ir_unop_f2d:
286 case ir_unop_i2d:
287 case ir_unop_u2d:
288 this->type = glsl_type::get_instance(GLSL_TYPE_DOUBLE,
289 op0->type->vector_elements, 1);
290 break;
291
292 case ir_unop_i2u:
293 case ir_unop_f2u:
294 case ir_unop_d2u:
295 case ir_unop_bitcast_f2u:
296 this->type = glsl_type::get_instance(GLSL_TYPE_UINT,
297 op0->type->vector_elements, 1);
298 break;
299
300 case ir_unop_noise:
301 this->type = glsl_type::float_type;
302 break;
303
304 case ir_unop_unpack_double_2x32:
305 this->type = glsl_type::uvec2_type;
306 break;
307
308 case ir_unop_pack_snorm_2x16:
309 case ir_unop_pack_snorm_4x8:
310 case ir_unop_pack_unorm_2x16:
311 case ir_unop_pack_unorm_4x8:
312 case ir_unop_pack_half_2x16:
313 this->type = glsl_type::uint_type;
314 break;
315
316 case ir_unop_pack_double_2x32:
317 this->type = glsl_type::double_type;
318 break;
319
320 case ir_unop_unpack_snorm_2x16:
321 case ir_unop_unpack_unorm_2x16:
322 case ir_unop_unpack_half_2x16:
323 this->type = glsl_type::vec2_type;
324 break;
325
326 case ir_unop_unpack_snorm_4x8:
327 case ir_unop_unpack_unorm_4x8:
328 this->type = glsl_type::vec4_type;
329 break;
330
331 case ir_unop_frexp_sig:
332 this->type = op0->type;
333 break;
334 case ir_unop_frexp_exp:
335 this->type = glsl_type::get_instance(GLSL_TYPE_INT,
336 op0->type->vector_elements, 1);
337 break;
338
339 case ir_unop_get_buffer_size:
340 case ir_unop_ssbo_unsized_array_length:
341 this->type = glsl_type::int_type;
342 break;
343
344 case ir_unop_vote_any:
345 case ir_unop_vote_all:
346 case ir_unop_vote_eq:
347 this->type = glsl_type::bool_type;
348 break;
349
350 default:
351 assert(!"not reached: missing automatic type setup for ir_expression");
352 this->type = op0->type;
353 break;
354 }
355 }
356
357 ir_expression::ir_expression(int op, ir_rvalue *op0, ir_rvalue *op1)
358 : ir_rvalue(ir_type_expression)
359 {
360 this->operation = ir_expression_operation(op);
361 this->operands[0] = op0;
362 this->operands[1] = op1;
363 this->operands[2] = NULL;
364 this->operands[3] = NULL;
365
366 assert(op > ir_last_unop);
367
368 switch (this->operation) {
369 case ir_binop_all_equal:
370 case ir_binop_any_nequal:
371 this->type = glsl_type::bool_type;
372 break;
373
374 case ir_binop_add:
375 case ir_binop_sub:
376 case ir_binop_min:
377 case ir_binop_max:
378 case ir_binop_pow:
379 case ir_binop_mul:
380 case ir_binop_div:
381 case ir_binop_mod:
382 if (op0->type->is_scalar()) {
383 this->type = op1->type;
384 } else if (op1->type->is_scalar()) {
385 this->type = op0->type;
386 } else {
387 if (this->operation == ir_binop_mul) {
388 this->type = glsl_type::get_mul_type(op0->type, op1->type);
389 } else {
390 assert(op0->type == op1->type);
391 this->type = op0->type;
392 }
393 }
394 break;
395
396 case ir_binop_logic_and:
397 case ir_binop_logic_xor:
398 case ir_binop_logic_or:
399 case ir_binop_bit_and:
400 case ir_binop_bit_xor:
401 case ir_binop_bit_or:
402 assert(!op0->type->is_matrix());
403 assert(!op1->type->is_matrix());
404 if (op0->type->is_scalar()) {
405 this->type = op1->type;
406 } else if (op1->type->is_scalar()) {
407 this->type = op0->type;
408 } else {
409 assert(op0->type->vector_elements == op1->type->vector_elements);
410 this->type = op0->type;
411 }
412 break;
413
414 case ir_binop_equal:
415 case ir_binop_nequal:
416 case ir_binop_lequal:
417 case ir_binop_gequal:
418 case ir_binop_less:
419 case ir_binop_greater:
420 assert(op0->type == op1->type);
421 this->type = glsl_type::get_instance(GLSL_TYPE_BOOL,
422 op0->type->vector_elements, 1);
423 break;
424
425 case ir_binop_dot:
426 this->type = op0->type->get_base_type();
427 break;
428
429 case ir_binop_imul_high:
430 case ir_binop_carry:
431 case ir_binop_borrow:
432 case ir_binop_lshift:
433 case ir_binop_rshift:
434 case ir_binop_ldexp:
435 case ir_binop_interpolate_at_offset:
436 case ir_binop_interpolate_at_sample:
437 this->type = op0->type;
438 break;
439
440 case ir_binop_vector_extract:
441 this->type = op0->type->get_scalar_type();
442 break;
443
444 default:
445 assert(!"not reached: missing automatic type setup for ir_expression");
446 this->type = glsl_type::float_type;
447 }
448 }
449
450 ir_expression::ir_expression(int op, ir_rvalue *op0, ir_rvalue *op1,
451 ir_rvalue *op2)
452 : ir_rvalue(ir_type_expression)
453 {
454 this->operation = ir_expression_operation(op);
455 this->operands[0] = op0;
456 this->operands[1] = op1;
457 this->operands[2] = op2;
458 this->operands[3] = NULL;
459
460 assert(op > ir_last_binop && op <= ir_last_triop);
461
462 switch (this->operation) {
463 case ir_triop_fma:
464 case ir_triop_lrp:
465 case ir_triop_bitfield_extract:
466 case ir_triop_vector_insert:
467 this->type = op0->type;
468 break;
469
470 case ir_triop_csel:
471 this->type = op1->type;
472 break;
473
474 default:
475 assert(!"not reached: missing automatic type setup for ir_expression");
476 this->type = glsl_type::float_type;
477 }
478 }
479
480 unsigned int
481 ir_expression::get_num_operands(ir_expression_operation op)
482 {
483 assert(op <= ir_last_opcode);
484
485 if (op <= ir_last_unop)
486 return 1;
487
488 if (op <= ir_last_binop)
489 return 2;
490
491 if (op <= ir_last_triop)
492 return 3;
493
494 if (op <= ir_last_quadop)
495 return 4;
496
497 assert(false);
498 return 0;
499 }
500
501 #include "ir_expression_operation_strings.h"
502
503 const char*
504 depth_layout_string(ir_depth_layout layout)
505 {
506 switch(layout) {
507 case ir_depth_layout_none: return "";
508 case ir_depth_layout_any: return "depth_any";
509 case ir_depth_layout_greater: return "depth_greater";
510 case ir_depth_layout_less: return "depth_less";
511 case ir_depth_layout_unchanged: return "depth_unchanged";
512
513 default:
514 assert(0);
515 return "";
516 }
517 }
518
519 ir_expression_operation
520 ir_expression::get_operator(const char *str)
521 {
522 for (int op = 0; op <= int(ir_last_opcode); op++) {
523 if (strcmp(str, ir_expression_operation_strings[op]) == 0)
524 return (ir_expression_operation) op;
525 }
526 return (ir_expression_operation) -1;
527 }
528
529 ir_variable *
530 ir_expression::variable_referenced() const
531 {
532 switch (operation) {
533 case ir_binop_vector_extract:
534 case ir_triop_vector_insert:
535 /* We get these for things like a[0] where a is a vector type. In these
536 * cases we want variable_referenced() to return the actual vector
537 * variable this is wrapping.
538 */
539 return operands[0]->variable_referenced();
540 default:
541 return ir_rvalue::variable_referenced();
542 }
543 }
544
545 ir_constant::ir_constant()
546 : ir_rvalue(ir_type_constant)
547 {
548 this->array_elements = NULL;
549 }
550
551 ir_constant::ir_constant(const struct glsl_type *type,
552 const ir_constant_data *data)
553 : ir_rvalue(ir_type_constant)
554 {
555 this->array_elements = NULL;
556
557 assert((type->base_type >= GLSL_TYPE_UINT)
558 && (type->base_type <= GLSL_TYPE_BOOL));
559
560 this->type = type;
561 memcpy(& this->value, data, sizeof(this->value));
562 }
563
564 ir_constant::ir_constant(float f, unsigned vector_elements)
565 : ir_rvalue(ir_type_constant)
566 {
567 assert(vector_elements <= 4);
568 this->type = glsl_type::get_instance(GLSL_TYPE_FLOAT, vector_elements, 1);
569 for (unsigned i = 0; i < vector_elements; i++) {
570 this->value.f[i] = f;
571 }
572 for (unsigned i = vector_elements; i < 16; i++) {
573 this->value.f[i] = 0;
574 }
575 }
576
577 ir_constant::ir_constant(double d, unsigned vector_elements)
578 : ir_rvalue(ir_type_constant)
579 {
580 assert(vector_elements <= 4);
581 this->type = glsl_type::get_instance(GLSL_TYPE_DOUBLE, vector_elements, 1);
582 for (unsigned i = 0; i < vector_elements; i++) {
583 this->value.d[i] = d;
584 }
585 for (unsigned i = vector_elements; i < 16; i++) {
586 this->value.d[i] = 0.0;
587 }
588 }
589
590 ir_constant::ir_constant(unsigned int u, unsigned vector_elements)
591 : ir_rvalue(ir_type_constant)
592 {
593 assert(vector_elements <= 4);
594 this->type = glsl_type::get_instance(GLSL_TYPE_UINT, vector_elements, 1);
595 for (unsigned i = 0; i < vector_elements; i++) {
596 this->value.u[i] = u;
597 }
598 for (unsigned i = vector_elements; i < 16; i++) {
599 this->value.u[i] = 0;
600 }
601 }
602
603 ir_constant::ir_constant(int integer, unsigned vector_elements)
604 : ir_rvalue(ir_type_constant)
605 {
606 assert(vector_elements <= 4);
607 this->type = glsl_type::get_instance(GLSL_TYPE_INT, vector_elements, 1);
608 for (unsigned i = 0; i < vector_elements; i++) {
609 this->value.i[i] = integer;
610 }
611 for (unsigned i = vector_elements; i < 16; i++) {
612 this->value.i[i] = 0;
613 }
614 }
615
616 ir_constant::ir_constant(uint64_t u64, unsigned vector_elements)
617 : ir_rvalue(ir_type_constant)
618 {
619 assert(vector_elements <= 4);
620 this->type = glsl_type::get_instance(GLSL_TYPE_UINT64, vector_elements, 1);
621 for (unsigned i = 0; i < vector_elements; i++) {
622 this->value.u64[i] = u64;
623 }
624 for (unsigned i = vector_elements; i < 16; i++) {
625 this->value.u64[i] = 0;
626 }
627 }
628
629 ir_constant::ir_constant(int64_t int64, unsigned vector_elements)
630 : ir_rvalue(ir_type_constant)
631 {
632 assert(vector_elements <= 4);
633 this->type = glsl_type::get_instance(GLSL_TYPE_INT64, vector_elements, 1);
634 for (unsigned i = 0; i < vector_elements; i++) {
635 this->value.i64[i] = int64;
636 }
637 for (unsigned i = vector_elements; i < 16; i++) {
638 this->value.i64[i] = 0;
639 }
640 }
641
642 ir_constant::ir_constant(bool b, unsigned vector_elements)
643 : ir_rvalue(ir_type_constant)
644 {
645 assert(vector_elements <= 4);
646 this->type = glsl_type::get_instance(GLSL_TYPE_BOOL, vector_elements, 1);
647 for (unsigned i = 0; i < vector_elements; i++) {
648 this->value.b[i] = b;
649 }
650 for (unsigned i = vector_elements; i < 16; i++) {
651 this->value.b[i] = false;
652 }
653 }
654
655 ir_constant::ir_constant(const ir_constant *c, unsigned i)
656 : ir_rvalue(ir_type_constant)
657 {
658 this->array_elements = NULL;
659 this->type = c->type->get_base_type();
660
661 switch (this->type->base_type) {
662 case GLSL_TYPE_UINT: this->value.u[0] = c->value.u[i]; break;
663 case GLSL_TYPE_INT: this->value.i[0] = c->value.i[i]; break;
664 case GLSL_TYPE_FLOAT: this->value.f[0] = c->value.f[i]; break;
665 case GLSL_TYPE_BOOL: this->value.b[0] = c->value.b[i]; break;
666 case GLSL_TYPE_DOUBLE: this->value.d[0] = c->value.d[i]; break;
667 default: assert(!"Should not get here."); break;
668 }
669 }
670
671 ir_constant::ir_constant(const struct glsl_type *type, exec_list *value_list)
672 : ir_rvalue(ir_type_constant)
673 {
674 this->array_elements = NULL;
675 this->type = type;
676
677 assert(type->is_scalar() || type->is_vector() || type->is_matrix()
678 || type->is_record() || type->is_array());
679
680 if (type->is_array()) {
681 this->array_elements = ralloc_array(this, ir_constant *, type->length);
682 unsigned i = 0;
683 foreach_in_list(ir_constant, value, value_list) {
684 assert(value->as_constant() != NULL);
685
686 this->array_elements[i++] = value;
687 }
688 return;
689 }
690
691 /* If the constant is a record, the types of each of the entries in
692 * value_list must be a 1-for-1 match with the structure components. Each
693 * entry must also be a constant. Just move the nodes from the value_list
694 * to the list in the ir_constant.
695 */
696 /* FINISHME: Should there be some type checking and / or assertions here? */
697 /* FINISHME: Should the new constant take ownership of the nodes from
698 * FINISHME: value_list, or should it make copies?
699 */
700 if (type->is_record()) {
701 value_list->move_nodes_to(& this->components);
702 return;
703 }
704
705 for (unsigned i = 0; i < 16; i++) {
706 this->value.u[i] = 0;
707 }
708
709 ir_constant *value = (ir_constant *) (value_list->get_head_raw());
710
711 /* Constructors with exactly one scalar argument are special for vectors
712 * and matrices. For vectors, the scalar value is replicated to fill all
713 * the components. For matrices, the scalar fills the components of the
714 * diagonal while the rest is filled with 0.
715 */
716 if (value->type->is_scalar() && value->next->is_tail_sentinel()) {
717 if (type->is_matrix()) {
718 /* Matrix - fill diagonal (rest is already set to 0) */
719 assert(type->base_type == GLSL_TYPE_FLOAT ||
720 type->base_type == GLSL_TYPE_DOUBLE);
721 for (unsigned i = 0; i < type->matrix_columns; i++) {
722 if (type->base_type == GLSL_TYPE_FLOAT)
723 this->value.f[i * type->vector_elements + i] =
724 value->value.f[0];
725 else
726 this->value.d[i * type->vector_elements + i] =
727 value->value.d[0];
728 }
729 } else {
730 /* Vector or scalar - fill all components */
731 switch (type->base_type) {
732 case GLSL_TYPE_UINT:
733 case GLSL_TYPE_INT:
734 for (unsigned i = 0; i < type->components(); i++)
735 this->value.u[i] = value->value.u[0];
736 break;
737 case GLSL_TYPE_FLOAT:
738 for (unsigned i = 0; i < type->components(); i++)
739 this->value.f[i] = value->value.f[0];
740 break;
741 case GLSL_TYPE_DOUBLE:
742 for (unsigned i = 0; i < type->components(); i++)
743 this->value.d[i] = value->value.d[0];
744 break;
745 case GLSL_TYPE_UINT64:
746 case GLSL_TYPE_INT64:
747 for (unsigned i = 0; i < type->components(); i++)
748 this->value.u64[i] = value->value.u64[0];
749 break;
750 case GLSL_TYPE_BOOL:
751 for (unsigned i = 0; i < type->components(); i++)
752 this->value.b[i] = value->value.b[0];
753 break;
754 default:
755 assert(!"Should not get here.");
756 break;
757 }
758 }
759 return;
760 }
761
762 if (type->is_matrix() && value->type->is_matrix()) {
763 assert(value->next->is_tail_sentinel());
764
765 /* From section 5.4.2 of the GLSL 1.20 spec:
766 * "If a matrix is constructed from a matrix, then each component
767 * (column i, row j) in the result that has a corresponding component
768 * (column i, row j) in the argument will be initialized from there."
769 */
770 unsigned cols = MIN2(type->matrix_columns, value->type->matrix_columns);
771 unsigned rows = MIN2(type->vector_elements, value->type->vector_elements);
772 for (unsigned i = 0; i < cols; i++) {
773 for (unsigned j = 0; j < rows; j++) {
774 const unsigned src = i * value->type->vector_elements + j;
775 const unsigned dst = i * type->vector_elements + j;
776 this->value.f[dst] = value->value.f[src];
777 }
778 }
779
780 /* "All other components will be initialized to the identity matrix." */
781 for (unsigned i = cols; i < type->matrix_columns; i++)
782 this->value.f[i * type->vector_elements + i] = 1.0;
783
784 return;
785 }
786
787 /* Use each component from each entry in the value_list to initialize one
788 * component of the constant being constructed.
789 */
790 unsigned i = 0;
791 for (;;) {
792 assert(value->as_constant() != NULL);
793 assert(!value->is_tail_sentinel());
794
795 for (unsigned j = 0; j < value->type->components(); j++) {
796 switch (type->base_type) {
797 case GLSL_TYPE_UINT:
798 this->value.u[i] = value->get_uint_component(j);
799 break;
800 case GLSL_TYPE_INT:
801 this->value.i[i] = value->get_int_component(j);
802 break;
803 case GLSL_TYPE_FLOAT:
804 this->value.f[i] = value->get_float_component(j);
805 break;
806 case GLSL_TYPE_BOOL:
807 this->value.b[i] = value->get_bool_component(j);
808 break;
809 case GLSL_TYPE_DOUBLE:
810 this->value.d[i] = value->get_double_component(j);
811 break;
812 case GLSL_TYPE_UINT64:
813 this->value.u64[i] = value->get_uint64_component(j);
814 break;
815 case GLSL_TYPE_INT64:
816 this->value.i64[i] = value->get_int64_component(j);
817 break;
818 default:
819 /* FINISHME: What to do? Exceptions are not the answer.
820 */
821 break;
822 }
823
824 i++;
825 if (i >= type->components())
826 break;
827 }
828
829 if (i >= type->components())
830 break; /* avoid downcasting a list sentinel */
831 value = (ir_constant *) value->next;
832 }
833 }
834
835 ir_constant *
836 ir_constant::zero(void *mem_ctx, const glsl_type *type)
837 {
838 assert(type->is_scalar() || type->is_vector() || type->is_matrix()
839 || type->is_record() || type->is_array());
840
841 ir_constant *c = new(mem_ctx) ir_constant;
842 c->type = type;
843 memset(&c->value, 0, sizeof(c->value));
844
845 if (type->is_array()) {
846 c->array_elements = ralloc_array(c, ir_constant *, type->length);
847
848 for (unsigned i = 0; i < type->length; i++)
849 c->array_elements[i] = ir_constant::zero(c, type->fields.array);
850 }
851
852 if (type->is_record()) {
853 for (unsigned i = 0; i < type->length; i++) {
854 ir_constant *comp = ir_constant::zero(mem_ctx, type->fields.structure[i].type);
855 c->components.push_tail(comp);
856 }
857 }
858
859 return c;
860 }
861
862 bool
863 ir_constant::get_bool_component(unsigned i) const
864 {
865 switch (this->type->base_type) {
866 case GLSL_TYPE_UINT: return this->value.u[i] != 0;
867 case GLSL_TYPE_INT: return this->value.i[i] != 0;
868 case GLSL_TYPE_FLOAT: return ((int)this->value.f[i]) != 0;
869 case GLSL_TYPE_BOOL: return this->value.b[i];
870 case GLSL_TYPE_DOUBLE: return this->value.d[i] != 0.0;
871 case GLSL_TYPE_UINT64: return this->value.u64[i] != 0;
872 case GLSL_TYPE_INT64: return this->value.i64[i] != 0;
873 default: assert(!"Should not get here."); break;
874 }
875
876 /* Must return something to make the compiler happy. This is clearly an
877 * error case.
878 */
879 return false;
880 }
881
882 float
883 ir_constant::get_float_component(unsigned i) const
884 {
885 switch (this->type->base_type) {
886 case GLSL_TYPE_UINT: return (float) this->value.u[i];
887 case GLSL_TYPE_INT: return (float) this->value.i[i];
888 case GLSL_TYPE_FLOAT: return this->value.f[i];
889 case GLSL_TYPE_BOOL: return this->value.b[i] ? 1.0f : 0.0f;
890 case GLSL_TYPE_DOUBLE: return (float) this->value.d[i];
891 case GLSL_TYPE_UINT64: return (float) this->value.u64[i];
892 case GLSL_TYPE_INT64: return (float) this->value.i64[i];
893 default: assert(!"Should not get here."); break;
894 }
895
896 /* Must return something to make the compiler happy. This is clearly an
897 * error case.
898 */
899 return 0.0;
900 }
901
902 double
903 ir_constant::get_double_component(unsigned i) const
904 {
905 switch (this->type->base_type) {
906 case GLSL_TYPE_UINT: return (double) this->value.u[i];
907 case GLSL_TYPE_INT: return (double) this->value.i[i];
908 case GLSL_TYPE_FLOAT: return (double) this->value.f[i];
909 case GLSL_TYPE_BOOL: return this->value.b[i] ? 1.0 : 0.0;
910 case GLSL_TYPE_DOUBLE: return this->value.d[i];
911 case GLSL_TYPE_UINT64: return (double) this->value.u64[i];
912 case GLSL_TYPE_INT64: return (double) this->value.i64[i];
913 default: assert(!"Should not get here."); break;
914 }
915
916 /* Must return something to make the compiler happy. This is clearly an
917 * error case.
918 */
919 return 0.0;
920 }
921
922 int
923 ir_constant::get_int_component(unsigned i) const
924 {
925 switch (this->type->base_type) {
926 case GLSL_TYPE_UINT: return this->value.u[i];
927 case GLSL_TYPE_INT: return this->value.i[i];
928 case GLSL_TYPE_FLOAT: return (int) this->value.f[i];
929 case GLSL_TYPE_BOOL: return this->value.b[i] ? 1 : 0;
930 case GLSL_TYPE_DOUBLE: return (int) this->value.d[i];
931 case GLSL_TYPE_UINT64: return (int) this->value.u64[i];
932 case GLSL_TYPE_INT64: return (int) this->value.i64[i];
933 default: assert(!"Should not get here."); break;
934 }
935
936 /* Must return something to make the compiler happy. This is clearly an
937 * error case.
938 */
939 return 0;
940 }
941
942 unsigned
943 ir_constant::get_uint_component(unsigned i) const
944 {
945 switch (this->type->base_type) {
946 case GLSL_TYPE_UINT: return this->value.u[i];
947 case GLSL_TYPE_INT: return this->value.i[i];
948 case GLSL_TYPE_FLOAT: return (unsigned) this->value.f[i];
949 case GLSL_TYPE_BOOL: return this->value.b[i] ? 1 : 0;
950 case GLSL_TYPE_DOUBLE: return (unsigned) this->value.d[i];
951 case GLSL_TYPE_UINT64: return (unsigned) this->value.u64[i];
952 case GLSL_TYPE_INT64: return (unsigned) this->value.i64[i];
953 default: assert(!"Should not get here."); break;
954 }
955
956 /* Must return something to make the compiler happy. This is clearly an
957 * error case.
958 */
959 return 0;
960 }
961
962 int64_t
963 ir_constant::get_int64_component(unsigned i) const
964 {
965 switch (this->type->base_type) {
966 case GLSL_TYPE_UINT: return this->value.u[i];
967 case GLSL_TYPE_INT: return this->value.i[i];
968 case GLSL_TYPE_FLOAT: return (int64_t) this->value.f[i];
969 case GLSL_TYPE_BOOL: return this->value.b[i] ? 1 : 0;
970 case GLSL_TYPE_DOUBLE: return (int64_t) this->value.d[i];
971 case GLSL_TYPE_UINT64: return (int64_t) this->value.u64[i];
972 case GLSL_TYPE_INT64: return this->value.i64[i];
973 default: assert(!"Should not get here."); break;
974 }
975
976 /* Must return something to make the compiler happy. This is clearly an
977 * error case.
978 */
979 return 0;
980 }
981
982 uint64_t
983 ir_constant::get_uint64_component(unsigned i) const
984 {
985 switch (this->type->base_type) {
986 case GLSL_TYPE_UINT: return this->value.u[i];
987 case GLSL_TYPE_INT: return this->value.i[i];
988 case GLSL_TYPE_FLOAT: return (uint64_t) this->value.f[i];
989 case GLSL_TYPE_BOOL: return this->value.b[i] ? 1 : 0;
990 case GLSL_TYPE_DOUBLE: return (uint64_t) this->value.d[i];
991 case GLSL_TYPE_UINT64: return this->value.u64[i];
992 case GLSL_TYPE_INT64: return (uint64_t) this->value.i64[i];
993 default: assert(!"Should not get here."); break;
994 }
995
996 /* Must return something to make the compiler happy. This is clearly an
997 * error case.
998 */
999 return 0;
1000 }
1001
1002 ir_constant *
1003 ir_constant::get_array_element(unsigned i) const
1004 {
1005 assert(this->type->is_array());
1006
1007 /* From page 35 (page 41 of the PDF) of the GLSL 1.20 spec:
1008 *
1009 * "Behavior is undefined if a shader subscripts an array with an index
1010 * less than 0 or greater than or equal to the size the array was
1011 * declared with."
1012 *
1013 * Most out-of-bounds accesses are removed before things could get this far.
1014 * There are cases where non-constant array index values can get constant
1015 * folded.
1016 */
1017 if (int(i) < 0)
1018 i = 0;
1019 else if (i >= this->type->length)
1020 i = this->type->length - 1;
1021
1022 return array_elements[i];
1023 }
1024
1025 ir_constant *
1026 ir_constant::get_record_field(const char *name)
1027 {
1028 int idx = this->type->field_index(name);
1029
1030 if (idx < 0)
1031 return NULL;
1032
1033 if (this->components.is_empty())
1034 return NULL;
1035
1036 exec_node *node = this->components.get_head_raw();
1037 for (int i = 0; i < idx; i++) {
1038 node = node->next;
1039
1040 /* If the end of the list is encountered before the element matching the
1041 * requested field is found, return NULL.
1042 */
1043 if (node->is_tail_sentinel())
1044 return NULL;
1045 }
1046
1047 return (ir_constant *) node;
1048 }
1049
1050 void
1051 ir_constant::copy_offset(ir_constant *src, int offset)
1052 {
1053 switch (this->type->base_type) {
1054 case GLSL_TYPE_UINT:
1055 case GLSL_TYPE_INT:
1056 case GLSL_TYPE_FLOAT:
1057 case GLSL_TYPE_DOUBLE:
1058 case GLSL_TYPE_UINT64:
1059 case GLSL_TYPE_INT64:
1060 case GLSL_TYPE_BOOL: {
1061 unsigned int size = src->type->components();
1062 assert (size <= this->type->components() - offset);
1063 for (unsigned int i=0; i<size; i++) {
1064 switch (this->type->base_type) {
1065 case GLSL_TYPE_UINT:
1066 value.u[i+offset] = src->get_uint_component(i);
1067 break;
1068 case GLSL_TYPE_INT:
1069 value.i[i+offset] = src->get_int_component(i);
1070 break;
1071 case GLSL_TYPE_FLOAT:
1072 value.f[i+offset] = src->get_float_component(i);
1073 break;
1074 case GLSL_TYPE_BOOL:
1075 value.b[i+offset] = src->get_bool_component(i);
1076 break;
1077 case GLSL_TYPE_DOUBLE:
1078 value.d[i+offset] = src->get_double_component(i);
1079 break;
1080 case GLSL_TYPE_UINT64:
1081 value.u64[i+offset] = src->get_uint64_component(i);
1082 break;
1083 case GLSL_TYPE_INT64:
1084 value.i64[i+offset] = src->get_int64_component(i);
1085 break;
1086 default: // Shut up the compiler
1087 break;
1088 }
1089 }
1090 break;
1091 }
1092
1093 case GLSL_TYPE_STRUCT: {
1094 assert (src->type == this->type);
1095 this->components.make_empty();
1096 foreach_in_list(ir_constant, orig, &src->components) {
1097 this->components.push_tail(orig->clone(this, NULL));
1098 }
1099 break;
1100 }
1101
1102 case GLSL_TYPE_ARRAY: {
1103 assert (src->type == this->type);
1104 for (unsigned i = 0; i < this->type->length; i++) {
1105 this->array_elements[i] = src->array_elements[i]->clone(this, NULL);
1106 }
1107 break;
1108 }
1109
1110 default:
1111 assert(!"Should not get here.");
1112 break;
1113 }
1114 }
1115
1116 void
1117 ir_constant::copy_masked_offset(ir_constant *src, int offset, unsigned int mask)
1118 {
1119 assert (!type->is_array() && !type->is_record());
1120
1121 if (!type->is_vector() && !type->is_matrix()) {
1122 offset = 0;
1123 mask = 1;
1124 }
1125
1126 int id = 0;
1127 for (int i=0; i<4; i++) {
1128 if (mask & (1 << i)) {
1129 switch (this->type->base_type) {
1130 case GLSL_TYPE_UINT:
1131 value.u[i+offset] = src->get_uint_component(id++);
1132 break;
1133 case GLSL_TYPE_INT:
1134 value.i[i+offset] = src->get_int_component(id++);
1135 break;
1136 case GLSL_TYPE_FLOAT:
1137 value.f[i+offset] = src->get_float_component(id++);
1138 break;
1139 case GLSL_TYPE_BOOL:
1140 value.b[i+offset] = src->get_bool_component(id++);
1141 break;
1142 case GLSL_TYPE_DOUBLE:
1143 value.d[i+offset] = src->get_double_component(id++);
1144 break;
1145 case GLSL_TYPE_UINT64:
1146 value.u64[i+offset] = src->get_uint64_component(id++);
1147 break;
1148 case GLSL_TYPE_INT64:
1149 value.i64[i+offset] = src->get_int64_component(id++);
1150 break;
1151 default:
1152 assert(!"Should not get here.");
1153 return;
1154 }
1155 }
1156 }
1157 }
1158
1159 bool
1160 ir_constant::has_value(const ir_constant *c) const
1161 {
1162 if (this->type != c->type)
1163 return false;
1164
1165 if (this->type->is_array()) {
1166 for (unsigned i = 0; i < this->type->length; i++) {
1167 if (!this->array_elements[i]->has_value(c->array_elements[i]))
1168 return false;
1169 }
1170 return true;
1171 }
1172
1173 if (this->type->base_type == GLSL_TYPE_STRUCT) {
1174 const exec_node *a_node = this->components.get_head_raw();
1175 const exec_node *b_node = c->components.get_head_raw();
1176
1177 while (!a_node->is_tail_sentinel()) {
1178 assert(!b_node->is_tail_sentinel());
1179
1180 const ir_constant *const a_field = (ir_constant *) a_node;
1181 const ir_constant *const b_field = (ir_constant *) b_node;
1182
1183 if (!a_field->has_value(b_field))
1184 return false;
1185
1186 a_node = a_node->next;
1187 b_node = b_node->next;
1188 }
1189
1190 return true;
1191 }
1192
1193 for (unsigned i = 0; i < this->type->components(); i++) {
1194 switch (this->type->base_type) {
1195 case GLSL_TYPE_UINT:
1196 if (this->value.u[i] != c->value.u[i])
1197 return false;
1198 break;
1199 case GLSL_TYPE_INT:
1200 if (this->value.i[i] != c->value.i[i])
1201 return false;
1202 break;
1203 case GLSL_TYPE_FLOAT:
1204 if (this->value.f[i] != c->value.f[i])
1205 return false;
1206 break;
1207 case GLSL_TYPE_BOOL:
1208 if (this->value.b[i] != c->value.b[i])
1209 return false;
1210 break;
1211 case GLSL_TYPE_DOUBLE:
1212 if (this->value.d[i] != c->value.d[i])
1213 return false;
1214 break;
1215 case GLSL_TYPE_UINT64:
1216 if (this->value.u64[i] != c->value.u64[i])
1217 return false;
1218 break;
1219 case GLSL_TYPE_INT64:
1220 if (this->value.i64[i] != c->value.i64[i])
1221 return false;
1222 break;
1223 default:
1224 assert(!"Should not get here.");
1225 return false;
1226 }
1227 }
1228
1229 return true;
1230 }
1231
1232 bool
1233 ir_constant::is_value(float f, int i) const
1234 {
1235 if (!this->type->is_scalar() && !this->type->is_vector())
1236 return false;
1237
1238 /* Only accept boolean values for 0/1. */
1239 if (int(bool(i)) != i && this->type->is_boolean())
1240 return false;
1241
1242 for (unsigned c = 0; c < this->type->vector_elements; c++) {
1243 switch (this->type->base_type) {
1244 case GLSL_TYPE_FLOAT:
1245 if (this->value.f[c] != f)
1246 return false;
1247 break;
1248 case GLSL_TYPE_INT:
1249 if (this->value.i[c] != i)
1250 return false;
1251 break;
1252 case GLSL_TYPE_UINT:
1253 if (this->value.u[c] != unsigned(i))
1254 return false;
1255 break;
1256 case GLSL_TYPE_BOOL:
1257 if (this->value.b[c] != bool(i))
1258 return false;
1259 break;
1260 case GLSL_TYPE_DOUBLE:
1261 if (this->value.d[c] != double(f))
1262 return false;
1263 break;
1264 case GLSL_TYPE_UINT64:
1265 if (this->value.u64[c] != uint64_t(i))
1266 return false;
1267 break;
1268 case GLSL_TYPE_INT64:
1269 if (this->value.i64[c] != i)
1270 return false;
1271 break;
1272 default:
1273 /* The only other base types are structures, arrays, and samplers.
1274 * Samplers cannot be constants, and the others should have been
1275 * filtered out above.
1276 */
1277 assert(!"Should not get here.");
1278 return false;
1279 }
1280 }
1281
1282 return true;
1283 }
1284
1285 bool
1286 ir_constant::is_zero() const
1287 {
1288 return is_value(0.0, 0);
1289 }
1290
1291 bool
1292 ir_constant::is_one() const
1293 {
1294 return is_value(1.0, 1);
1295 }
1296
1297 bool
1298 ir_constant::is_negative_one() const
1299 {
1300 return is_value(-1.0, -1);
1301 }
1302
1303 bool
1304 ir_constant::is_uint16_constant() const
1305 {
1306 if (!type->is_integer())
1307 return false;
1308
1309 return value.u[0] < (1 << 16);
1310 }
1311
1312 ir_loop::ir_loop()
1313 : ir_instruction(ir_type_loop)
1314 {
1315 }
1316
1317
1318 ir_dereference_variable::ir_dereference_variable(ir_variable *var)
1319 : ir_dereference(ir_type_dereference_variable)
1320 {
1321 assert(var != NULL);
1322
1323 this->var = var;
1324 this->type = var->type;
1325 }
1326
1327
1328 ir_dereference_array::ir_dereference_array(ir_rvalue *value,
1329 ir_rvalue *array_index)
1330 : ir_dereference(ir_type_dereference_array)
1331 {
1332 this->array_index = array_index;
1333 this->set_array(value);
1334 }
1335
1336
1337 ir_dereference_array::ir_dereference_array(ir_variable *var,
1338 ir_rvalue *array_index)
1339 : ir_dereference(ir_type_dereference_array)
1340 {
1341 void *ctx = ralloc_parent(var);
1342
1343 this->array_index = array_index;
1344 this->set_array(new(ctx) ir_dereference_variable(var));
1345 }
1346
1347
1348 void
1349 ir_dereference_array::set_array(ir_rvalue *value)
1350 {
1351 assert(value != NULL);
1352
1353 this->array = value;
1354
1355 const glsl_type *const vt = this->array->type;
1356
1357 if (vt->is_array()) {
1358 type = vt->fields.array;
1359 } else if (vt->is_matrix()) {
1360 type = vt->column_type();
1361 } else if (vt->is_vector()) {
1362 type = vt->get_base_type();
1363 }
1364 }
1365
1366
1367 ir_dereference_record::ir_dereference_record(ir_rvalue *value,
1368 const char *field)
1369 : ir_dereference(ir_type_dereference_record)
1370 {
1371 assert(value != NULL);
1372
1373 this->record = value;
1374 this->field = ralloc_strdup(this, field);
1375 this->type = this->record->type->field_type(field);
1376 }
1377
1378
1379 ir_dereference_record::ir_dereference_record(ir_variable *var,
1380 const char *field)
1381 : ir_dereference(ir_type_dereference_record)
1382 {
1383 void *ctx = ralloc_parent(var);
1384
1385 this->record = new(ctx) ir_dereference_variable(var);
1386 this->field = ralloc_strdup(this, field);
1387 this->type = this->record->type->field_type(field);
1388 }
1389
1390 bool
1391 ir_dereference::is_lvalue() const
1392 {
1393 ir_variable *var = this->variable_referenced();
1394
1395 /* Every l-value derference chain eventually ends in a variable.
1396 */
1397 if ((var == NULL) || var->data.read_only)
1398 return false;
1399
1400 /* From section 4.1.7 of the GLSL 4.40 spec:
1401 *
1402 * "Opaque variables cannot be treated as l-values; hence cannot
1403 * be used as out or inout function parameters, nor can they be
1404 * assigned into."
1405 */
1406 if (this->type->contains_opaque())
1407 return false;
1408
1409 return true;
1410 }
1411
1412
1413 static const char * const tex_opcode_strs[] = { "tex", "txb", "txl", "txd", "txf", "txf_ms", "txs", "lod", "tg4", "query_levels", "texture_samples", "samples_identical" };
1414
1415 const char *ir_texture::opcode_string()
1416 {
1417 assert((unsigned int) op < ARRAY_SIZE(tex_opcode_strs));
1418 return tex_opcode_strs[op];
1419 }
1420
1421 ir_texture_opcode
1422 ir_texture::get_opcode(const char *str)
1423 {
1424 const int count = sizeof(tex_opcode_strs) / sizeof(tex_opcode_strs[0]);
1425 for (int op = 0; op < count; op++) {
1426 if (strcmp(str, tex_opcode_strs[op]) == 0)
1427 return (ir_texture_opcode) op;
1428 }
1429 return (ir_texture_opcode) -1;
1430 }
1431
1432
1433 void
1434 ir_texture::set_sampler(ir_dereference *sampler, const glsl_type *type)
1435 {
1436 assert(sampler != NULL);
1437 assert(type != NULL);
1438 this->sampler = sampler;
1439 this->type = type;
1440
1441 if (this->op == ir_txs || this->op == ir_query_levels ||
1442 this->op == ir_texture_samples) {
1443 assert(type->base_type == GLSL_TYPE_INT);
1444 } else if (this->op == ir_lod) {
1445 assert(type->vector_elements == 2);
1446 assert(type->base_type == GLSL_TYPE_FLOAT);
1447 } else if (this->op == ir_samples_identical) {
1448 assert(type == glsl_type::bool_type);
1449 assert(sampler->type->base_type == GLSL_TYPE_SAMPLER);
1450 assert(sampler->type->sampler_dimensionality == GLSL_SAMPLER_DIM_MS);
1451 } else {
1452 assert(sampler->type->sampled_type == (int) type->base_type);
1453 if (sampler->type->sampler_shadow)
1454 assert(type->vector_elements == 4 || type->vector_elements == 1);
1455 else
1456 assert(type->vector_elements == 4);
1457 }
1458 }
1459
1460
1461 void
1462 ir_swizzle::init_mask(const unsigned *comp, unsigned count)
1463 {
1464 assert((count >= 1) && (count <= 4));
1465
1466 memset(&this->mask, 0, sizeof(this->mask));
1467 this->mask.num_components = count;
1468
1469 unsigned dup_mask = 0;
1470 switch (count) {
1471 case 4:
1472 assert(comp[3] <= 3);
1473 dup_mask |= (1U << comp[3])
1474 & ((1U << comp[0]) | (1U << comp[1]) | (1U << comp[2]));
1475 this->mask.w = comp[3];
1476
1477 case 3:
1478 assert(comp[2] <= 3);
1479 dup_mask |= (1U << comp[2])
1480 & ((1U << comp[0]) | (1U << comp[1]));
1481 this->mask.z = comp[2];
1482
1483 case 2:
1484 assert(comp[1] <= 3);
1485 dup_mask |= (1U << comp[1])
1486 & ((1U << comp[0]));
1487 this->mask.y = comp[1];
1488
1489 case 1:
1490 assert(comp[0] <= 3);
1491 this->mask.x = comp[0];
1492 }
1493
1494 this->mask.has_duplicates = dup_mask != 0;
1495
1496 /* Based on the number of elements in the swizzle and the base type
1497 * (i.e., float, int, unsigned, or bool) of the vector being swizzled,
1498 * generate the type of the resulting value.
1499 */
1500 type = glsl_type::get_instance(val->type->base_type, mask.num_components, 1);
1501 }
1502
1503 ir_swizzle::ir_swizzle(ir_rvalue *val, unsigned x, unsigned y, unsigned z,
1504 unsigned w, unsigned count)
1505 : ir_rvalue(ir_type_swizzle), val(val)
1506 {
1507 const unsigned components[4] = { x, y, z, w };
1508 this->init_mask(components, count);
1509 }
1510
1511 ir_swizzle::ir_swizzle(ir_rvalue *val, const unsigned *comp,
1512 unsigned count)
1513 : ir_rvalue(ir_type_swizzle), val(val)
1514 {
1515 this->init_mask(comp, count);
1516 }
1517
1518 ir_swizzle::ir_swizzle(ir_rvalue *val, ir_swizzle_mask mask)
1519 : ir_rvalue(ir_type_swizzle)
1520 {
1521 this->val = val;
1522 this->mask = mask;
1523 this->type = glsl_type::get_instance(val->type->base_type,
1524 mask.num_components, 1);
1525 }
1526
1527 #define X 1
1528 #define R 5
1529 #define S 9
1530 #define I 13
1531
1532 ir_swizzle *
1533 ir_swizzle::create(ir_rvalue *val, const char *str, unsigned vector_length)
1534 {
1535 void *ctx = ralloc_parent(val);
1536
1537 /* For each possible swizzle character, this table encodes the value in
1538 * \c idx_map that represents the 0th element of the vector. For invalid
1539 * swizzle characters (e.g., 'k'), a special value is used that will allow
1540 * detection of errors.
1541 */
1542 static const unsigned char base_idx[26] = {
1543 /* a b c d e f g h i j k l m */
1544 R, R, I, I, I, I, R, I, I, I, I, I, I,
1545 /* n o p q r s t u v w x y z */
1546 I, I, S, S, R, S, S, I, I, X, X, X, X
1547 };
1548
1549 /* Each valid swizzle character has an entry in the previous table. This
1550 * table encodes the base index encoded in the previous table plus the actual
1551 * index of the swizzle character. When processing swizzles, the first
1552 * character in the string is indexed in the previous table. Each character
1553 * in the string is indexed in this table, and the value found there has the
1554 * value form the first table subtracted. The result must be on the range
1555 * [0,3].
1556 *
1557 * For example, the string "wzyx" will get X from the first table. Each of
1558 * the charcaters will get X+3, X+2, X+1, and X+0 from this table. After
1559 * subtraction, the swizzle values are { 3, 2, 1, 0 }.
1560 *
1561 * The string "wzrg" will get X from the first table. Each of the characters
1562 * will get X+3, X+2, R+0, and R+1 from this table. After subtraction, the
1563 * swizzle values are { 3, 2, 4, 5 }. Since 4 and 5 are outside the range
1564 * [0,3], the error is detected.
1565 */
1566 static const unsigned char idx_map[26] = {
1567 /* a b c d e f g h i j k l m */
1568 R+3, R+2, 0, 0, 0, 0, R+1, 0, 0, 0, 0, 0, 0,
1569 /* n o p q r s t u v w x y z */
1570 0, 0, S+2, S+3, R+0, S+0, S+1, 0, 0, X+3, X+0, X+1, X+2
1571 };
1572
1573 int swiz_idx[4] = { 0, 0, 0, 0 };
1574 unsigned i;
1575
1576
1577 /* Validate the first character in the swizzle string and look up the base
1578 * index value as described above.
1579 */
1580 if ((str[0] < 'a') || (str[0] > 'z'))
1581 return NULL;
1582
1583 const unsigned base = base_idx[str[0] - 'a'];
1584
1585
1586 for (i = 0; (i < 4) && (str[i] != '\0'); i++) {
1587 /* Validate the next character, and, as described above, convert it to a
1588 * swizzle index.
1589 */
1590 if ((str[i] < 'a') || (str[i] > 'z'))
1591 return NULL;
1592
1593 swiz_idx[i] = idx_map[str[i] - 'a'] - base;
1594 if ((swiz_idx[i] < 0) || (swiz_idx[i] >= (int) vector_length))
1595 return NULL;
1596 }
1597
1598 if (str[i] != '\0')
1599 return NULL;
1600
1601 return new(ctx) ir_swizzle(val, swiz_idx[0], swiz_idx[1], swiz_idx[2],
1602 swiz_idx[3], i);
1603 }
1604
1605 #undef X
1606 #undef R
1607 #undef S
1608 #undef I
1609
1610 ir_variable *
1611 ir_swizzle::variable_referenced() const
1612 {
1613 return this->val->variable_referenced();
1614 }
1615
1616
1617 bool ir_variable::temporaries_allocate_names = false;
1618
1619 const char ir_variable::tmp_name[] = "compiler_temp";
1620
1621 ir_variable::ir_variable(const struct glsl_type *type, const char *name,
1622 ir_variable_mode mode)
1623 : ir_instruction(ir_type_variable)
1624 {
1625 this->type = type;
1626
1627 if (mode == ir_var_temporary && !ir_variable::temporaries_allocate_names)
1628 name = NULL;
1629
1630 /* The ir_variable clone method may call this constructor with name set to
1631 * tmp_name.
1632 */
1633 assert(name != NULL
1634 || mode == ir_var_temporary
1635 || mode == ir_var_function_in
1636 || mode == ir_var_function_out
1637 || mode == ir_var_function_inout);
1638 assert(name != ir_variable::tmp_name
1639 || mode == ir_var_temporary);
1640 if (mode == ir_var_temporary
1641 && (name == NULL || name == ir_variable::tmp_name)) {
1642 this->name = ir_variable::tmp_name;
1643 } else if (name == NULL ||
1644 strlen(name) < ARRAY_SIZE(this->name_storage)) {
1645 strcpy(this->name_storage, name ? name : "");
1646 this->name = this->name_storage;
1647 } else {
1648 this->name = ralloc_strdup(this, name);
1649 }
1650
1651 this->u.max_ifc_array_access = NULL;
1652
1653 this->data.explicit_location = false;
1654 this->data.has_initializer = false;
1655 this->data.location = -1;
1656 this->data.location_frac = 0;
1657 this->data.binding = 0;
1658 this->data.warn_extension_index = 0;
1659 this->constant_value = NULL;
1660 this->constant_initializer = NULL;
1661 this->data.origin_upper_left = false;
1662 this->data.pixel_center_integer = false;
1663 this->data.depth_layout = ir_depth_layout_none;
1664 this->data.used = false;
1665 this->data.always_active_io = false;
1666 this->data.read_only = false;
1667 this->data.centroid = false;
1668 this->data.sample = false;
1669 this->data.patch = false;
1670 this->data.invariant = false;
1671 this->data.how_declared = ir_var_declared_normally;
1672 this->data.mode = mode;
1673 this->data.interpolation = INTERP_MODE_NONE;
1674 this->data.max_array_access = -1;
1675 this->data.offset = 0;
1676 this->data.precision = GLSL_PRECISION_NONE;
1677 this->data.image_read_only = false;
1678 this->data.image_write_only = false;
1679 this->data.image_coherent = false;
1680 this->data.image_volatile = false;
1681 this->data.image_restrict = false;
1682 this->data.from_ssbo_unsized_array = false;
1683 this->data.fb_fetch_output = false;
1684
1685 if (type != NULL) {
1686 if (type->base_type == GLSL_TYPE_SAMPLER)
1687 this->data.read_only = true;
1688
1689 if (type->is_interface())
1690 this->init_interface_type(type);
1691 else if (type->without_array()->is_interface())
1692 this->init_interface_type(type->without_array());
1693 }
1694 }
1695
1696
1697 const char *
1698 interpolation_string(unsigned interpolation)
1699 {
1700 switch (interpolation) {
1701 case INTERP_MODE_NONE: return "no";
1702 case INTERP_MODE_SMOOTH: return "smooth";
1703 case INTERP_MODE_FLAT: return "flat";
1704 case INTERP_MODE_NOPERSPECTIVE: return "noperspective";
1705 }
1706
1707 assert(!"Should not get here.");
1708 return "";
1709 }
1710
1711 const char *const ir_variable::warn_extension_table[] = {
1712 "",
1713 "GL_ARB_shader_stencil_export",
1714 "GL_AMD_shader_stencil_export",
1715 };
1716
1717 void
1718 ir_variable::enable_extension_warning(const char *extension)
1719 {
1720 for (unsigned i = 0; i < ARRAY_SIZE(warn_extension_table); i++) {
1721 if (strcmp(warn_extension_table[i], extension) == 0) {
1722 this->data.warn_extension_index = i;
1723 return;
1724 }
1725 }
1726
1727 assert(!"Should not get here.");
1728 this->data.warn_extension_index = 0;
1729 }
1730
1731 const char *
1732 ir_variable::get_extension_warning() const
1733 {
1734 return this->data.warn_extension_index == 0
1735 ? NULL : warn_extension_table[this->data.warn_extension_index];
1736 }
1737
1738 ir_function_signature::ir_function_signature(const glsl_type *return_type,
1739 builtin_available_predicate b)
1740 : ir_instruction(ir_type_function_signature),
1741 return_type(return_type), is_defined(false),
1742 intrinsic_id(ir_intrinsic_invalid), builtin_avail(b), _function(NULL)
1743 {
1744 this->origin = NULL;
1745 }
1746
1747
1748 bool
1749 ir_function_signature::is_builtin() const
1750 {
1751 return builtin_avail != NULL;
1752 }
1753
1754
1755 bool
1756 ir_function_signature::is_builtin_available(const _mesa_glsl_parse_state *state) const
1757 {
1758 /* We can't call the predicate without a state pointer, so just say that
1759 * the signature is available. At compile time, we need the filtering,
1760 * but also receive a valid state pointer. At link time, we're resolving
1761 * imported built-in prototypes to their definitions, which will always
1762 * be an exact match. So we can skip the filtering.
1763 */
1764 if (state == NULL)
1765 return true;
1766
1767 assert(builtin_avail != NULL);
1768 return builtin_avail(state);
1769 }
1770
1771
1772 static bool
1773 modes_match(unsigned a, unsigned b)
1774 {
1775 if (a == b)
1776 return true;
1777
1778 /* Accept "in" vs. "const in" */
1779 if ((a == ir_var_const_in && b == ir_var_function_in) ||
1780 (b == ir_var_const_in && a == ir_var_function_in))
1781 return true;
1782
1783 return false;
1784 }
1785
1786
1787 const char *
1788 ir_function_signature::qualifiers_match(exec_list *params)
1789 {
1790 /* check that the qualifiers match. */
1791 foreach_two_lists(a_node, &this->parameters, b_node, params) {
1792 ir_variable *a = (ir_variable *) a_node;
1793 ir_variable *b = (ir_variable *) b_node;
1794
1795 if (a->data.read_only != b->data.read_only ||
1796 !modes_match(a->data.mode, b->data.mode) ||
1797 a->data.interpolation != b->data.interpolation ||
1798 a->data.centroid != b->data.centroid ||
1799 a->data.sample != b->data.sample ||
1800 a->data.patch != b->data.patch ||
1801 a->data.image_read_only != b->data.image_read_only ||
1802 a->data.image_write_only != b->data.image_write_only ||
1803 a->data.image_coherent != b->data.image_coherent ||
1804 a->data.image_volatile != b->data.image_volatile ||
1805 a->data.image_restrict != b->data.image_restrict) {
1806
1807 /* parameter a's qualifiers don't match */
1808 return a->name;
1809 }
1810 }
1811 return NULL;
1812 }
1813
1814
1815 void
1816 ir_function_signature::replace_parameters(exec_list *new_params)
1817 {
1818 /* Destroy all of the previous parameter information. If the previous
1819 * parameter information comes from the function prototype, it may either
1820 * specify incorrect parameter names or not have names at all.
1821 */
1822 new_params->move_nodes_to(&parameters);
1823 }
1824
1825
1826 ir_function::ir_function(const char *name)
1827 : ir_instruction(ir_type_function)
1828 {
1829 this->subroutine_index = -1;
1830 this->name = ralloc_strdup(this, name);
1831 }
1832
1833
1834 bool
1835 ir_function::has_user_signature()
1836 {
1837 foreach_in_list(ir_function_signature, sig, &this->signatures) {
1838 if (!sig->is_builtin())
1839 return true;
1840 }
1841 return false;
1842 }
1843
1844
1845 ir_rvalue *
1846 ir_rvalue::error_value(void *mem_ctx)
1847 {
1848 ir_rvalue *v = new(mem_ctx) ir_rvalue(ir_type_unset);
1849
1850 v->type = glsl_type::error_type;
1851 return v;
1852 }
1853
1854
1855 void
1856 visit_exec_list(exec_list *list, ir_visitor *visitor)
1857 {
1858 foreach_in_list_safe(ir_instruction, node, list) {
1859 node->accept(visitor);
1860 }
1861 }
1862
1863
1864 static void
1865 steal_memory(ir_instruction *ir, void *new_ctx)
1866 {
1867 ir_variable *var = ir->as_variable();
1868 ir_function *fn = ir->as_function();
1869 ir_constant *constant = ir->as_constant();
1870 if (var != NULL && var->constant_value != NULL)
1871 steal_memory(var->constant_value, ir);
1872
1873 if (var != NULL && var->constant_initializer != NULL)
1874 steal_memory(var->constant_initializer, ir);
1875
1876 if (fn != NULL && fn->subroutine_types)
1877 ralloc_steal(new_ctx, fn->subroutine_types);
1878
1879 /* The components of aggregate constants are not visited by the normal
1880 * visitor, so steal their values by hand.
1881 */
1882 if (constant != NULL) {
1883 if (constant->type->is_record()) {
1884 foreach_in_list(ir_constant, field, &constant->components) {
1885 steal_memory(field, ir);
1886 }
1887 } else if (constant->type->is_array()) {
1888 for (unsigned int i = 0; i < constant->type->length; i++) {
1889 steal_memory(constant->array_elements[i], ir);
1890 }
1891 }
1892 }
1893
1894 ralloc_steal(new_ctx, ir);
1895 }
1896
1897
1898 void
1899 reparent_ir(exec_list *list, void *mem_ctx)
1900 {
1901 foreach_in_list(ir_instruction, node, list) {
1902 visit_tree(node, steal_memory, mem_ctx);
1903 }
1904 }
1905
1906
1907 static ir_rvalue *
1908 try_min_one(ir_rvalue *ir)
1909 {
1910 ir_expression *expr = ir->as_expression();
1911
1912 if (!expr || expr->operation != ir_binop_min)
1913 return NULL;
1914
1915 if (expr->operands[0]->is_one())
1916 return expr->operands[1];
1917
1918 if (expr->operands[1]->is_one())
1919 return expr->operands[0];
1920
1921 return NULL;
1922 }
1923
1924 static ir_rvalue *
1925 try_max_zero(ir_rvalue *ir)
1926 {
1927 ir_expression *expr = ir->as_expression();
1928
1929 if (!expr || expr->operation != ir_binop_max)
1930 return NULL;
1931
1932 if (expr->operands[0]->is_zero())
1933 return expr->operands[1];
1934
1935 if (expr->operands[1]->is_zero())
1936 return expr->operands[0];
1937
1938 return NULL;
1939 }
1940
1941 ir_rvalue *
1942 ir_rvalue::as_rvalue_to_saturate()
1943 {
1944 ir_expression *expr = this->as_expression();
1945
1946 if (!expr)
1947 return NULL;
1948
1949 ir_rvalue *max_zero = try_max_zero(expr);
1950 if (max_zero) {
1951 return try_min_one(max_zero);
1952 } else {
1953 ir_rvalue *min_one = try_min_one(expr);
1954 if (min_one) {
1955 return try_max_zero(min_one);
1956 }
1957 }
1958
1959 return NULL;
1960 }
1961
1962
1963 unsigned
1964 vertices_per_prim(GLenum prim)
1965 {
1966 switch (prim) {
1967 case GL_POINTS:
1968 return 1;
1969 case GL_LINES:
1970 return 2;
1971 case GL_TRIANGLES:
1972 return 3;
1973 case GL_LINES_ADJACENCY:
1974 return 4;
1975 case GL_TRIANGLES_ADJACENCY:
1976 return 6;
1977 default:
1978 assert(!"Bad primitive");
1979 return 3;
1980 }
1981 }
1982
1983 /**
1984 * Generate a string describing the mode of a variable
1985 */
1986 const char *
1987 mode_string(const ir_variable *var)
1988 {
1989 switch (var->data.mode) {
1990 case ir_var_auto:
1991 return (var->data.read_only) ? "global constant" : "global variable";
1992
1993 case ir_var_uniform:
1994 return "uniform";
1995
1996 case ir_var_shader_storage:
1997 return "buffer";
1998
1999 case ir_var_shader_in:
2000 return "shader input";
2001
2002 case ir_var_shader_out:
2003 return "shader output";
2004
2005 case ir_var_function_in:
2006 case ir_var_const_in:
2007 return "function input";
2008
2009 case ir_var_function_out:
2010 return "function output";
2011
2012 case ir_var_function_inout:
2013 return "function inout";
2014
2015 case ir_var_system_value:
2016 return "shader input";
2017
2018 case ir_var_temporary:
2019 return "compiler temporary";
2020
2021 case ir_var_mode_count:
2022 break;
2023 }
2024
2025 assert(!"Should not get here.");
2026 return "invalid variable";
2027 }