2 * Copyright © 2010 Intel Corporation
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
24 #include "main/core.h" /* for MAX2 */
26 #include "ir_visitor.h"
27 #include "glsl_types.h"
29 ir_rvalue::ir_rvalue()
31 this->type
= glsl_type::error_type
;
34 bool ir_rvalue::is_zero() const
39 bool ir_rvalue::is_one() const
44 bool ir_rvalue::is_negative_one() const
49 bool ir_rvalue::is_basis() const
55 * Modify the swizzle make to move one component to another
57 * \param m IR swizzle to be modified
58 * \param from Component in the RHS that is to be swizzled
59 * \param to Desired swizzle location of \c from
62 update_rhs_swizzle(ir_swizzle_mask
&m
, unsigned from
, unsigned to
)
65 case 0: m
.x
= from
; break;
66 case 1: m
.y
= from
; break;
67 case 2: m
.z
= from
; break;
68 case 3: m
.w
= from
; break;
69 default: assert(!"Should not get here.");
72 m
.num_components
= MAX2(m
.num_components
, (to
+ 1));
76 ir_assignment::set_lhs(ir_rvalue
*lhs
)
79 bool swizzled
= false;
82 ir_swizzle
*swiz
= lhs
->as_swizzle();
87 unsigned write_mask
= 0;
88 ir_swizzle_mask rhs_swiz
= { 0, 0, 0, 0, 0, 0 };
90 for (unsigned i
= 0; i
< swiz
->mask
.num_components
; i
++) {
94 case 0: c
= swiz
->mask
.x
; break;
95 case 1: c
= swiz
->mask
.y
; break;
96 case 2: c
= swiz
->mask
.z
; break;
97 case 3: c
= swiz
->mask
.w
; break;
98 default: assert(!"Should not get here.");
101 write_mask
|= (((this->write_mask
>> i
) & 1) << c
);
102 update_rhs_swizzle(rhs_swiz
, i
, c
);
105 this->write_mask
= write_mask
;
108 this->rhs
= new(mem_ctx
) ir_swizzle(this->rhs
, rhs_swiz
);
113 /* Now, RHS channels line up with the LHS writemask. Collapse it
114 * to just the channels that will be written.
116 ir_swizzle_mask rhs_swiz
= { 0, 0, 0, 0, 0, 0 };
118 for (int i
= 0; i
< 4; i
++) {
119 if (write_mask
& (1 << i
))
120 update_rhs_swizzle(rhs_swiz
, i
, rhs_chan
++);
122 this->rhs
= new(mem_ctx
) ir_swizzle(this->rhs
, rhs_swiz
);
125 assert((lhs
== NULL
) || lhs
->as_dereference());
127 this->lhs
= (ir_dereference
*) lhs
;
131 ir_assignment::whole_variable_written()
133 ir_variable
*v
= this->lhs
->whole_variable_referenced();
138 if (v
->type
->is_scalar())
141 if (v
->type
->is_vector()) {
142 const unsigned mask
= (1U << v
->type
->vector_elements
) - 1;
144 if (mask
!= this->write_mask
)
148 /* Either all the vector components are assigned or the variable is some
149 * composite type (and the whole thing is assigned.
154 ir_assignment::ir_assignment(ir_dereference
*lhs
, ir_rvalue
*rhs
,
155 ir_rvalue
*condition
, unsigned write_mask
)
157 this->ir_type
= ir_type_assignment
;
158 this->condition
= condition
;
161 this->write_mask
= write_mask
;
163 if (lhs
->type
->is_scalar() || lhs
->type
->is_vector()) {
164 int lhs_components
= 0;
165 for (int i
= 0; i
< 4; i
++) {
166 if (write_mask
& (1 << i
))
170 assert(lhs_components
== this->rhs
->type
->vector_elements
);
174 ir_assignment::ir_assignment(ir_rvalue
*lhs
, ir_rvalue
*rhs
,
175 ir_rvalue
*condition
)
177 this->ir_type
= ir_type_assignment
;
178 this->condition
= condition
;
181 /* If the RHS is a vector type, assume that all components of the vector
182 * type are being written to the LHS. The write mask comes from the RHS
183 * because we can have a case where the LHS is a vec4 and the RHS is a
184 * vec3. In that case, the assignment is:
186 * (assign (...) (xyz) (var_ref lhs) (var_ref rhs))
188 if (rhs
->type
->is_vector())
189 this->write_mask
= (1U << rhs
->type
->vector_elements
) - 1;
190 else if (rhs
->type
->is_scalar())
191 this->write_mask
= 1;
193 this->write_mask
= 0;
198 ir_expression::ir_expression(int op
, const struct glsl_type
*type
,
199 ir_rvalue
*op0
, ir_rvalue
*op1
,
200 ir_rvalue
*op2
, ir_rvalue
*op3
)
202 this->ir_type
= ir_type_expression
;
204 this->operation
= ir_expression_operation(op
);
205 this->operands
[0] = op0
;
206 this->operands
[1] = op1
;
207 this->operands
[2] = op2
;
208 this->operands
[3] = op3
;
210 int num_operands
= get_num_operands(this->operation
);
211 for (int i
= num_operands
; i
< 4; i
++) {
212 assert(this->operands
[i
] == NULL
);
217 ir_expression::ir_expression(int op
, ir_rvalue
*op0
)
219 this->ir_type
= ir_type_expression
;
221 this->operation
= ir_expression_operation(op
);
222 this->operands
[0] = op0
;
223 this->operands
[1] = NULL
;
224 this->operands
[2] = NULL
;
225 this->operands
[3] = NULL
;
227 assert(op
<= ir_last_unop
);
229 switch (this->operation
) {
230 case ir_unop_bit_not
:
231 case ir_unop_logic_not
:
246 case ir_unop_round_even
:
249 case ir_unop_sin_reduced
:
250 case ir_unop_cos_reduced
:
253 case ir_unop_bitfield_reverse
:
254 this->type
= op0
->type
;
260 case ir_unop_bitcast_f2i
:
261 case ir_unop_bit_count
:
262 case ir_unop_find_msb
:
263 case ir_unop_find_lsb
:
264 this->type
= glsl_type::get_instance(GLSL_TYPE_INT
,
265 op0
->type
->vector_elements
, 1);
271 case ir_unop_bitcast_i2f
:
272 case ir_unop_bitcast_u2f
:
273 this->type
= glsl_type::get_instance(GLSL_TYPE_FLOAT
,
274 op0
->type
->vector_elements
, 1);
279 this->type
= glsl_type::get_instance(GLSL_TYPE_BOOL
,
280 op0
->type
->vector_elements
, 1);
285 case ir_unop_bitcast_f2u
:
286 this->type
= glsl_type::get_instance(GLSL_TYPE_UINT
,
287 op0
->type
->vector_elements
, 1);
291 case ir_unop_unpack_half_2x16_split_x
:
292 case ir_unop_unpack_half_2x16_split_y
:
293 this->type
= glsl_type::float_type
;
297 this->type
= glsl_type::bool_type
;
300 case ir_unop_pack_snorm_2x16
:
301 case ir_unop_pack_snorm_4x8
:
302 case ir_unop_pack_unorm_2x16
:
303 case ir_unop_pack_unorm_4x8
:
304 case ir_unop_pack_half_2x16
:
305 this->type
= glsl_type::uint_type
;
308 case ir_unop_unpack_snorm_2x16
:
309 case ir_unop_unpack_unorm_2x16
:
310 case ir_unop_unpack_half_2x16
:
311 this->type
= glsl_type::vec2_type
;
314 case ir_unop_unpack_snorm_4x8
:
315 case ir_unop_unpack_unorm_4x8
:
316 this->type
= glsl_type::vec4_type
;
320 assert(!"not reached: missing automatic type setup for ir_expression");
321 this->type
= op0
->type
;
326 ir_expression::ir_expression(int op
, ir_rvalue
*op0
, ir_rvalue
*op1
)
328 this->ir_type
= ir_type_expression
;
330 this->operation
= ir_expression_operation(op
);
331 this->operands
[0] = op0
;
332 this->operands
[1] = op1
;
333 this->operands
[2] = NULL
;
334 this->operands
[3] = NULL
;
336 assert(op
> ir_last_unop
);
338 switch (this->operation
) {
339 case ir_binop_all_equal
:
340 case ir_binop_any_nequal
:
341 this->type
= glsl_type::bool_type
;
352 if (op0
->type
->is_scalar()) {
353 this->type
= op1
->type
;
354 } else if (op1
->type
->is_scalar()) {
355 this->type
= op0
->type
;
357 /* FINISHME: matrix types */
358 assert(!op0
->type
->is_matrix() && !op1
->type
->is_matrix());
359 assert(op0
->type
== op1
->type
);
360 this->type
= op0
->type
;
364 case ir_binop_logic_and
:
365 case ir_binop_logic_xor
:
366 case ir_binop_logic_or
:
367 case ir_binop_bit_and
:
368 case ir_binop_bit_xor
:
369 case ir_binop_bit_or
:
370 assert(!op0
->type
->is_matrix());
371 assert(!op1
->type
->is_matrix());
372 if (op0
->type
->is_scalar()) {
373 this->type
= op1
->type
;
374 } else if (op1
->type
->is_scalar()) {
375 this->type
= op0
->type
;
377 assert(op0
->type
->vector_elements
== op1
->type
->vector_elements
);
378 this->type
= op0
->type
;
383 case ir_binop_nequal
:
384 case ir_binop_lequal
:
385 case ir_binop_gequal
:
387 case ir_binop_greater
:
388 assert(op0
->type
== op1
->type
);
389 this->type
= glsl_type::get_instance(GLSL_TYPE_BOOL
,
390 op0
->type
->vector_elements
, 1);
394 this->type
= glsl_type::float_type
;
397 case ir_binop_pack_half_2x16_split
:
398 this->type
= glsl_type::uint_type
;
401 case ir_binop_imul_high
:
403 case ir_binop_borrow
:
404 case ir_binop_lshift
:
405 case ir_binop_rshift
:
408 this->type
= op0
->type
;
411 case ir_binop_vector_extract
:
412 this->type
= op0
->type
->get_scalar_type();
416 assert(!"not reached: missing automatic type setup for ir_expression");
417 this->type
= glsl_type::float_type
;
421 ir_expression::ir_expression(int op
, ir_rvalue
*op0
, ir_rvalue
*op1
,
424 this->ir_type
= ir_type_expression
;
426 this->operation
= ir_expression_operation(op
);
427 this->operands
[0] = op0
;
428 this->operands
[1] = op1
;
429 this->operands
[2] = op2
;
430 this->operands
[3] = NULL
;
432 assert(op
> ir_last_binop
&& op
<= ir_last_triop
);
434 switch (this->operation
) {
437 case ir_triop_bitfield_extract
:
438 case ir_triop_vector_insert
:
439 this->type
= op0
->type
;
444 this->type
= op1
->type
;
448 assert(!"not reached: missing automatic type setup for ir_expression");
449 this->type
= glsl_type::float_type
;
454 ir_expression::get_num_operands(ir_expression_operation op
)
456 assert(op
<= ir_last_opcode
);
458 if (op
<= ir_last_unop
)
461 if (op
<= ir_last_binop
)
464 if (op
<= ir_last_triop
)
467 if (op
<= ir_last_quadop
)
474 static const char *const operator_strs
[] = {
523 "unpackHalf2x16_split_x",
524 "unpackHalf2x16_split_y",
558 "packHalf2x16_split",
573 const char *ir_expression::operator_string(ir_expression_operation op
)
575 assert((unsigned int) op
< Elements(operator_strs
));
576 assert(Elements(operator_strs
) == (ir_quadop_vector
+ 1));
577 return operator_strs
[op
];
580 const char *ir_expression::operator_string()
582 return operator_string(this->operation
);
586 depth_layout_string(ir_depth_layout layout
)
589 case ir_depth_layout_none
: return "";
590 case ir_depth_layout_any
: return "depth_any";
591 case ir_depth_layout_greater
: return "depth_greater";
592 case ir_depth_layout_less
: return "depth_less";
593 case ir_depth_layout_unchanged
: return "depth_unchanged";
601 ir_expression_operation
602 ir_expression::get_operator(const char *str
)
604 const int operator_count
= sizeof(operator_strs
) / sizeof(operator_strs
[0]);
605 for (int op
= 0; op
< operator_count
; op
++) {
606 if (strcmp(str
, operator_strs
[op
]) == 0)
607 return (ir_expression_operation
) op
;
609 return (ir_expression_operation
) -1;
612 ir_constant::ir_constant()
614 this->ir_type
= ir_type_constant
;
617 ir_constant::ir_constant(const struct glsl_type
*type
,
618 const ir_constant_data
*data
)
620 assert((type
->base_type
>= GLSL_TYPE_UINT
)
621 && (type
->base_type
<= GLSL_TYPE_BOOL
));
623 this->ir_type
= ir_type_constant
;
625 memcpy(& this->value
, data
, sizeof(this->value
));
628 ir_constant::ir_constant(float f
, unsigned vector_elements
)
630 assert(vector_elements
<= 4);
631 this->ir_type
= ir_type_constant
;
632 this->type
= glsl_type::get_instance(GLSL_TYPE_FLOAT
, vector_elements
, 1);
633 for (unsigned i
= 0; i
< vector_elements
; i
++) {
634 this->value
.f
[i
] = f
;
636 for (unsigned i
= vector_elements
; i
< 16; i
++) {
637 this->value
.f
[i
] = 0;
641 ir_constant::ir_constant(unsigned int u
, unsigned vector_elements
)
643 assert(vector_elements
<= 4);
644 this->ir_type
= ir_type_constant
;
645 this->type
= glsl_type::get_instance(GLSL_TYPE_UINT
, vector_elements
, 1);
646 for (unsigned i
= 0; i
< vector_elements
; i
++) {
647 this->value
.u
[i
] = u
;
649 for (unsigned i
= vector_elements
; i
< 16; i
++) {
650 this->value
.u
[i
] = 0;
654 ir_constant::ir_constant(int integer
, unsigned vector_elements
)
656 assert(vector_elements
<= 4);
657 this->ir_type
= ir_type_constant
;
658 this->type
= glsl_type::get_instance(GLSL_TYPE_INT
, vector_elements
, 1);
659 for (unsigned i
= 0; i
< vector_elements
; i
++) {
660 this->value
.i
[i
] = integer
;
662 for (unsigned i
= vector_elements
; i
< 16; i
++) {
663 this->value
.i
[i
] = 0;
667 ir_constant::ir_constant(bool b
, unsigned vector_elements
)
669 assert(vector_elements
<= 4);
670 this->ir_type
= ir_type_constant
;
671 this->type
= glsl_type::get_instance(GLSL_TYPE_BOOL
, vector_elements
, 1);
672 for (unsigned i
= 0; i
< vector_elements
; i
++) {
673 this->value
.b
[i
] = b
;
675 for (unsigned i
= vector_elements
; i
< 16; i
++) {
676 this->value
.b
[i
] = false;
680 ir_constant::ir_constant(const ir_constant
*c
, unsigned i
)
682 this->ir_type
= ir_type_constant
;
683 this->type
= c
->type
->get_base_type();
685 switch (this->type
->base_type
) {
686 case GLSL_TYPE_UINT
: this->value
.u
[0] = c
->value
.u
[i
]; break;
687 case GLSL_TYPE_INT
: this->value
.i
[0] = c
->value
.i
[i
]; break;
688 case GLSL_TYPE_FLOAT
: this->value
.f
[0] = c
->value
.f
[i
]; break;
689 case GLSL_TYPE_BOOL
: this->value
.b
[0] = c
->value
.b
[i
]; break;
690 default: assert(!"Should not get here."); break;
694 ir_constant::ir_constant(const struct glsl_type
*type
, exec_list
*value_list
)
696 this->ir_type
= ir_type_constant
;
699 assert(type
->is_scalar() || type
->is_vector() || type
->is_matrix()
700 || type
->is_record() || type
->is_array());
702 if (type
->is_array()) {
703 this->array_elements
= ralloc_array(this, ir_constant
*, type
->length
);
705 foreach_list(node
, value_list
) {
706 ir_constant
*value
= (ir_constant
*) node
;
707 assert(value
->as_constant() != NULL
);
709 this->array_elements
[i
++] = value
;
714 /* If the constant is a record, the types of each of the entries in
715 * value_list must be a 1-for-1 match with the structure components. Each
716 * entry must also be a constant. Just move the nodes from the value_list
717 * to the list in the ir_constant.
719 /* FINISHME: Should there be some type checking and / or assertions here? */
720 /* FINISHME: Should the new constant take ownership of the nodes from
721 * FINISHME: value_list, or should it make copies?
723 if (type
->is_record()) {
724 value_list
->move_nodes_to(& this->components
);
728 for (unsigned i
= 0; i
< 16; i
++) {
729 this->value
.u
[i
] = 0;
732 ir_constant
*value
= (ir_constant
*) (value_list
->head
);
734 /* Constructors with exactly one scalar argument are special for vectors
735 * and matrices. For vectors, the scalar value is replicated to fill all
736 * the components. For matrices, the scalar fills the components of the
737 * diagonal while the rest is filled with 0.
739 if (value
->type
->is_scalar() && value
->next
->is_tail_sentinel()) {
740 if (type
->is_matrix()) {
741 /* Matrix - fill diagonal (rest is already set to 0) */
742 assert(type
->base_type
== GLSL_TYPE_FLOAT
);
743 for (unsigned i
= 0; i
< type
->matrix_columns
; i
++)
744 this->value
.f
[i
* type
->vector_elements
+ i
] = value
->value
.f
[0];
746 /* Vector or scalar - fill all components */
747 switch (type
->base_type
) {
750 for (unsigned i
= 0; i
< type
->components(); i
++)
751 this->value
.u
[i
] = value
->value
.u
[0];
753 case GLSL_TYPE_FLOAT
:
754 for (unsigned i
= 0; i
< type
->components(); i
++)
755 this->value
.f
[i
] = value
->value
.f
[0];
758 for (unsigned i
= 0; i
< type
->components(); i
++)
759 this->value
.b
[i
] = value
->value
.b
[0];
762 assert(!"Should not get here.");
769 if (type
->is_matrix() && value
->type
->is_matrix()) {
770 assert(value
->next
->is_tail_sentinel());
772 /* From section 5.4.2 of the GLSL 1.20 spec:
773 * "If a matrix is constructed from a matrix, then each component
774 * (column i, row j) in the result that has a corresponding component
775 * (column i, row j) in the argument will be initialized from there."
777 unsigned cols
= MIN2(type
->matrix_columns
, value
->type
->matrix_columns
);
778 unsigned rows
= MIN2(type
->vector_elements
, value
->type
->vector_elements
);
779 for (unsigned i
= 0; i
< cols
; i
++) {
780 for (unsigned j
= 0; j
< rows
; j
++) {
781 const unsigned src
= i
* value
->type
->vector_elements
+ j
;
782 const unsigned dst
= i
* type
->vector_elements
+ j
;
783 this->value
.f
[dst
] = value
->value
.f
[src
];
787 /* "All other components will be initialized to the identity matrix." */
788 for (unsigned i
= cols
; i
< type
->matrix_columns
; i
++)
789 this->value
.f
[i
* type
->vector_elements
+ i
] = 1.0;
794 /* Use each component from each entry in the value_list to initialize one
795 * component of the constant being constructed.
797 for (unsigned i
= 0; i
< type
->components(); /* empty */) {
798 assert(value
->as_constant() != NULL
);
799 assert(!value
->is_tail_sentinel());
801 for (unsigned j
= 0; j
< value
->type
->components(); j
++) {
802 switch (type
->base_type
) {
804 this->value
.u
[i
] = value
->get_uint_component(j
);
807 this->value
.i
[i
] = value
->get_int_component(j
);
809 case GLSL_TYPE_FLOAT
:
810 this->value
.f
[i
] = value
->get_float_component(j
);
813 this->value
.b
[i
] = value
->get_bool_component(j
);
816 /* FINISHME: What to do? Exceptions are not the answer.
822 if (i
>= type
->components())
826 value
= (ir_constant
*) value
->next
;
831 ir_constant::zero(void *mem_ctx
, const glsl_type
*type
)
833 assert(type
->is_scalar() || type
->is_vector() || type
->is_matrix()
834 || type
->is_record() || type
->is_array());
836 ir_constant
*c
= new(mem_ctx
) ir_constant
;
838 memset(&c
->value
, 0, sizeof(c
->value
));
840 if (type
->is_array()) {
841 c
->array_elements
= ralloc_array(c
, ir_constant
*, type
->length
);
843 for (unsigned i
= 0; i
< type
->length
; i
++)
844 c
->array_elements
[i
] = ir_constant::zero(c
, type
->element_type());
847 if (type
->is_record()) {
848 for (unsigned i
= 0; i
< type
->length
; i
++) {
849 ir_constant
*comp
= ir_constant::zero(mem_ctx
, type
->fields
.structure
[i
].type
);
850 c
->components
.push_tail(comp
);
858 ir_constant::get_bool_component(unsigned i
) const
860 switch (this->type
->base_type
) {
861 case GLSL_TYPE_UINT
: return this->value
.u
[i
] != 0;
862 case GLSL_TYPE_INT
: return this->value
.i
[i
] != 0;
863 case GLSL_TYPE_FLOAT
: return ((int)this->value
.f
[i
]) != 0;
864 case GLSL_TYPE_BOOL
: return this->value
.b
[i
];
865 default: assert(!"Should not get here."); break;
868 /* Must return something to make the compiler happy. This is clearly an
875 ir_constant::get_float_component(unsigned i
) const
877 switch (this->type
->base_type
) {
878 case GLSL_TYPE_UINT
: return (float) this->value
.u
[i
];
879 case GLSL_TYPE_INT
: return (float) this->value
.i
[i
];
880 case GLSL_TYPE_FLOAT
: return this->value
.f
[i
];
881 case GLSL_TYPE_BOOL
: return this->value
.b
[i
] ? 1.0f
: 0.0f
;
882 default: assert(!"Should not get here."); break;
885 /* Must return something to make the compiler happy. This is clearly an
892 ir_constant::get_int_component(unsigned i
) const
894 switch (this->type
->base_type
) {
895 case GLSL_TYPE_UINT
: return this->value
.u
[i
];
896 case GLSL_TYPE_INT
: return this->value
.i
[i
];
897 case GLSL_TYPE_FLOAT
: return (int) this->value
.f
[i
];
898 case GLSL_TYPE_BOOL
: return this->value
.b
[i
] ? 1 : 0;
899 default: assert(!"Should not get here."); break;
902 /* Must return something to make the compiler happy. This is clearly an
909 ir_constant::get_uint_component(unsigned i
) const
911 switch (this->type
->base_type
) {
912 case GLSL_TYPE_UINT
: return this->value
.u
[i
];
913 case GLSL_TYPE_INT
: return this->value
.i
[i
];
914 case GLSL_TYPE_FLOAT
: return (unsigned) this->value
.f
[i
];
915 case GLSL_TYPE_BOOL
: return this->value
.b
[i
] ? 1 : 0;
916 default: assert(!"Should not get here."); break;
919 /* Must return something to make the compiler happy. This is clearly an
926 ir_constant::get_array_element(unsigned i
) const
928 assert(this->type
->is_array());
930 /* From page 35 (page 41 of the PDF) of the GLSL 1.20 spec:
932 * "Behavior is undefined if a shader subscripts an array with an index
933 * less than 0 or greater than or equal to the size the array was
936 * Most out-of-bounds accesses are removed before things could get this far.
937 * There are cases where non-constant array index values can get constant
942 else if (i
>= this->type
->length
)
943 i
= this->type
->length
- 1;
945 return array_elements
[i
];
949 ir_constant::get_record_field(const char *name
)
951 int idx
= this->type
->field_index(name
);
956 if (this->components
.is_empty())
959 exec_node
*node
= this->components
.head
;
960 for (int i
= 0; i
< idx
; i
++) {
963 /* If the end of the list is encountered before the element matching the
964 * requested field is found, return NULL.
966 if (node
->is_tail_sentinel())
970 return (ir_constant
*) node
;
974 ir_constant::copy_offset(ir_constant
*src
, int offset
)
976 switch (this->type
->base_type
) {
979 case GLSL_TYPE_FLOAT
:
980 case GLSL_TYPE_BOOL
: {
981 unsigned int size
= src
->type
->components();
982 assert (size
<= this->type
->components() - offset
);
983 for (unsigned int i
=0; i
<size
; i
++) {
984 switch (this->type
->base_type
) {
986 value
.u
[i
+offset
] = src
->get_uint_component(i
);
989 value
.i
[i
+offset
] = src
->get_int_component(i
);
991 case GLSL_TYPE_FLOAT
:
992 value
.f
[i
+offset
] = src
->get_float_component(i
);
995 value
.b
[i
+offset
] = src
->get_bool_component(i
);
997 default: // Shut up the compiler
1004 case GLSL_TYPE_STRUCT
: {
1005 assert (src
->type
== this->type
);
1006 this->components
.make_empty();
1007 foreach_list(node
, &src
->components
) {
1008 ir_constant
*const orig
= (ir_constant
*) node
;
1010 this->components
.push_tail(orig
->clone(this, NULL
));
1015 case GLSL_TYPE_ARRAY
: {
1016 assert (src
->type
== this->type
);
1017 for (unsigned i
= 0; i
< this->type
->length
; i
++) {
1018 this->array_elements
[i
] = src
->array_elements
[i
]->clone(this, NULL
);
1024 assert(!"Should not get here.");
1030 ir_constant::copy_masked_offset(ir_constant
*src
, int offset
, unsigned int mask
)
1032 assert (!type
->is_array() && !type
->is_record());
1034 if (!type
->is_vector() && !type
->is_matrix()) {
1040 for (int i
=0; i
<4; i
++) {
1041 if (mask
& (1 << i
)) {
1042 switch (this->type
->base_type
) {
1043 case GLSL_TYPE_UINT
:
1044 value
.u
[i
+offset
] = src
->get_uint_component(id
++);
1047 value
.i
[i
+offset
] = src
->get_int_component(id
++);
1049 case GLSL_TYPE_FLOAT
:
1050 value
.f
[i
+offset
] = src
->get_float_component(id
++);
1052 case GLSL_TYPE_BOOL
:
1053 value
.b
[i
+offset
] = src
->get_bool_component(id
++);
1056 assert(!"Should not get here.");
1064 ir_constant::has_value(const ir_constant
*c
) const
1066 if (this->type
!= c
->type
)
1069 if (this->type
->is_array()) {
1070 for (unsigned i
= 0; i
< this->type
->length
; i
++) {
1071 if (!this->array_elements
[i
]->has_value(c
->array_elements
[i
]))
1077 if (this->type
->base_type
== GLSL_TYPE_STRUCT
) {
1078 const exec_node
*a_node
= this->components
.head
;
1079 const exec_node
*b_node
= c
->components
.head
;
1081 while (!a_node
->is_tail_sentinel()) {
1082 assert(!b_node
->is_tail_sentinel());
1084 const ir_constant
*const a_field
= (ir_constant
*) a_node
;
1085 const ir_constant
*const b_field
= (ir_constant
*) b_node
;
1087 if (!a_field
->has_value(b_field
))
1090 a_node
= a_node
->next
;
1091 b_node
= b_node
->next
;
1097 for (unsigned i
= 0; i
< this->type
->components(); i
++) {
1098 switch (this->type
->base_type
) {
1099 case GLSL_TYPE_UINT
:
1100 if (this->value
.u
[i
] != c
->value
.u
[i
])
1104 if (this->value
.i
[i
] != c
->value
.i
[i
])
1107 case GLSL_TYPE_FLOAT
:
1108 if (this->value
.f
[i
] != c
->value
.f
[i
])
1111 case GLSL_TYPE_BOOL
:
1112 if (this->value
.b
[i
] != c
->value
.b
[i
])
1116 assert(!"Should not get here.");
1125 ir_constant::is_value(float f
, int i
) const
1127 if (!this->type
->is_scalar() && !this->type
->is_vector())
1130 /* Only accept boolean values for 0/1. */
1131 if (int(bool(i
)) != i
&& this->type
->is_boolean())
1134 for (unsigned c
= 0; c
< this->type
->vector_elements
; c
++) {
1135 switch (this->type
->base_type
) {
1136 case GLSL_TYPE_FLOAT
:
1137 if (this->value
.f
[c
] != f
)
1141 if (this->value
.i
[c
] != i
)
1144 case GLSL_TYPE_UINT
:
1145 if (this->value
.u
[c
] != unsigned(i
))
1148 case GLSL_TYPE_BOOL
:
1149 if (this->value
.b
[c
] != bool(i
))
1153 /* The only other base types are structures, arrays, and samplers.
1154 * Samplers cannot be constants, and the others should have been
1155 * filtered out above.
1157 assert(!"Should not get here.");
1166 ir_constant::is_zero() const
1168 return is_value(0.0, 0);
1172 ir_constant::is_one() const
1174 return is_value(1.0, 1);
1178 ir_constant::is_negative_one() const
1180 return is_value(-1.0, -1);
1184 ir_constant::is_basis() const
1186 if (!this->type
->is_scalar() && !this->type
->is_vector())
1189 if (this->type
->is_boolean())
1193 for (unsigned c
= 0; c
< this->type
->vector_elements
; c
++) {
1194 switch (this->type
->base_type
) {
1195 case GLSL_TYPE_FLOAT
:
1196 if (this->value
.f
[c
] == 1.0)
1198 else if (this->value
.f
[c
] != 0.0)
1202 if (this->value
.i
[c
] == 1)
1204 else if (this->value
.i
[c
] != 0)
1207 case GLSL_TYPE_UINT
:
1208 if (int(this->value
.u
[c
]) == 1)
1210 else if (int(this->value
.u
[c
]) != 0)
1214 /* The only other base types are structures, arrays, samplers, and
1215 * booleans. Samplers cannot be constants, and the others should
1216 * have been filtered out above.
1218 assert(!"Should not get here.");
1228 this->ir_type
= ir_type_loop
;
1232 ir_dereference_variable::ir_dereference_variable(ir_variable
*var
)
1234 assert(var
!= NULL
);
1236 this->ir_type
= ir_type_dereference_variable
;
1238 this->type
= var
->type
;
1242 ir_dereference_array::ir_dereference_array(ir_rvalue
*value
,
1243 ir_rvalue
*array_index
)
1245 this->ir_type
= ir_type_dereference_array
;
1246 this->array_index
= array_index
;
1247 this->set_array(value
);
1251 ir_dereference_array::ir_dereference_array(ir_variable
*var
,
1252 ir_rvalue
*array_index
)
1254 void *ctx
= ralloc_parent(var
);
1256 this->ir_type
= ir_type_dereference_array
;
1257 this->array_index
= array_index
;
1258 this->set_array(new(ctx
) ir_dereference_variable(var
));
1263 ir_dereference_array::set_array(ir_rvalue
*value
)
1265 assert(value
!= NULL
);
1267 this->array
= value
;
1269 const glsl_type
*const vt
= this->array
->type
;
1271 if (vt
->is_array()) {
1272 type
= vt
->element_type();
1273 } else if (vt
->is_matrix()) {
1274 type
= vt
->column_type();
1275 } else if (vt
->is_vector()) {
1276 type
= vt
->get_base_type();
1281 ir_dereference_record::ir_dereference_record(ir_rvalue
*value
,
1284 assert(value
!= NULL
);
1286 this->ir_type
= ir_type_dereference_record
;
1287 this->record
= value
;
1288 this->field
= ralloc_strdup(this, field
);
1289 this->type
= this->record
->type
->field_type(field
);
1293 ir_dereference_record::ir_dereference_record(ir_variable
*var
,
1296 void *ctx
= ralloc_parent(var
);
1298 this->ir_type
= ir_type_dereference_record
;
1299 this->record
= new(ctx
) ir_dereference_variable(var
);
1300 this->field
= ralloc_strdup(this, field
);
1301 this->type
= this->record
->type
->field_type(field
);
1305 ir_dereference::is_lvalue() const
1307 ir_variable
*var
= this->variable_referenced();
1309 /* Every l-value derference chain eventually ends in a variable.
1311 if ((var
== NULL
) || var
->data
.read_only
)
1314 /* From page 17 (page 23 of the PDF) of the GLSL 1.20 spec:
1316 * "Samplers cannot be treated as l-values; hence cannot be used
1317 * as out or inout function parameters, nor can they be
1320 if (this->type
->contains_sampler())
1327 static const char *tex_opcode_strs
[] = { "tex", "txb", "txl", "txd", "txf", "txf_ms", "txs", "lod", "tg4", "query_levels" };
1329 const char *ir_texture::opcode_string()
1331 assert((unsigned int) op
<=
1332 sizeof(tex_opcode_strs
) / sizeof(tex_opcode_strs
[0]));
1333 return tex_opcode_strs
[op
];
1337 ir_texture::get_opcode(const char *str
)
1339 const int count
= sizeof(tex_opcode_strs
) / sizeof(tex_opcode_strs
[0]);
1340 for (int op
= 0; op
< count
; op
++) {
1341 if (strcmp(str
, tex_opcode_strs
[op
]) == 0)
1342 return (ir_texture_opcode
) op
;
1344 return (ir_texture_opcode
) -1;
1349 ir_texture::set_sampler(ir_dereference
*sampler
, const glsl_type
*type
)
1351 assert(sampler
!= NULL
);
1352 assert(type
!= NULL
);
1353 this->sampler
= sampler
;
1356 if (this->op
== ir_txs
|| this->op
== ir_query_levels
) {
1357 assert(type
->base_type
== GLSL_TYPE_INT
);
1358 } else if (this->op
== ir_lod
) {
1359 assert(type
->vector_elements
== 2);
1360 assert(type
->base_type
== GLSL_TYPE_FLOAT
);
1362 assert(sampler
->type
->sampler_type
== (int) type
->base_type
);
1363 if (sampler
->type
->sampler_shadow
)
1364 assert(type
->vector_elements
== 4 || type
->vector_elements
== 1);
1366 assert(type
->vector_elements
== 4);
1372 ir_swizzle::init_mask(const unsigned *comp
, unsigned count
)
1374 assert((count
>= 1) && (count
<= 4));
1376 memset(&this->mask
, 0, sizeof(this->mask
));
1377 this->mask
.num_components
= count
;
1379 unsigned dup_mask
= 0;
1382 assert(comp
[3] <= 3);
1383 dup_mask
|= (1U << comp
[3])
1384 & ((1U << comp
[0]) | (1U << comp
[1]) | (1U << comp
[2]));
1385 this->mask
.w
= comp
[3];
1388 assert(comp
[2] <= 3);
1389 dup_mask
|= (1U << comp
[2])
1390 & ((1U << comp
[0]) | (1U << comp
[1]));
1391 this->mask
.z
= comp
[2];
1394 assert(comp
[1] <= 3);
1395 dup_mask
|= (1U << comp
[1])
1396 & ((1U << comp
[0]));
1397 this->mask
.y
= comp
[1];
1400 assert(comp
[0] <= 3);
1401 this->mask
.x
= comp
[0];
1404 this->mask
.has_duplicates
= dup_mask
!= 0;
1406 /* Based on the number of elements in the swizzle and the base type
1407 * (i.e., float, int, unsigned, or bool) of the vector being swizzled,
1408 * generate the type of the resulting value.
1410 type
= glsl_type::get_instance(val
->type
->base_type
, mask
.num_components
, 1);
1413 ir_swizzle::ir_swizzle(ir_rvalue
*val
, unsigned x
, unsigned y
, unsigned z
,
1414 unsigned w
, unsigned count
)
1417 const unsigned components
[4] = { x
, y
, z
, w
};
1418 this->ir_type
= ir_type_swizzle
;
1419 this->init_mask(components
, count
);
1422 ir_swizzle::ir_swizzle(ir_rvalue
*val
, const unsigned *comp
,
1426 this->ir_type
= ir_type_swizzle
;
1427 this->init_mask(comp
, count
);
1430 ir_swizzle::ir_swizzle(ir_rvalue
*val
, ir_swizzle_mask mask
)
1432 this->ir_type
= ir_type_swizzle
;
1435 this->type
= glsl_type::get_instance(val
->type
->base_type
,
1436 mask
.num_components
, 1);
1445 ir_swizzle::create(ir_rvalue
*val
, const char *str
, unsigned vector_length
)
1447 void *ctx
= ralloc_parent(val
);
1449 /* For each possible swizzle character, this table encodes the value in
1450 * \c idx_map that represents the 0th element of the vector. For invalid
1451 * swizzle characters (e.g., 'k'), a special value is used that will allow
1452 * detection of errors.
1454 static const unsigned char base_idx
[26] = {
1455 /* a b c d e f g h i j k l m */
1456 R
, R
, I
, I
, I
, I
, R
, I
, I
, I
, I
, I
, I
,
1457 /* n o p q r s t u v w x y z */
1458 I
, I
, S
, S
, R
, S
, S
, I
, I
, X
, X
, X
, X
1461 /* Each valid swizzle character has an entry in the previous table. This
1462 * table encodes the base index encoded in the previous table plus the actual
1463 * index of the swizzle character. When processing swizzles, the first
1464 * character in the string is indexed in the previous table. Each character
1465 * in the string is indexed in this table, and the value found there has the
1466 * value form the first table subtracted. The result must be on the range
1469 * For example, the string "wzyx" will get X from the first table. Each of
1470 * the charcaters will get X+3, X+2, X+1, and X+0 from this table. After
1471 * subtraction, the swizzle values are { 3, 2, 1, 0 }.
1473 * The string "wzrg" will get X from the first table. Each of the characters
1474 * will get X+3, X+2, R+0, and R+1 from this table. After subtraction, the
1475 * swizzle values are { 3, 2, 4, 5 }. Since 4 and 5 are outside the range
1476 * [0,3], the error is detected.
1478 static const unsigned char idx_map
[26] = {
1479 /* a b c d e f g h i j k l m */
1480 R
+3, R
+2, 0, 0, 0, 0, R
+1, 0, 0, 0, 0, 0, 0,
1481 /* n o p q r s t u v w x y z */
1482 0, 0, S
+2, S
+3, R
+0, S
+0, S
+1, 0, 0, X
+3, X
+0, X
+1, X
+2
1485 int swiz_idx
[4] = { 0, 0, 0, 0 };
1489 /* Validate the first character in the swizzle string and look up the base
1490 * index value as described above.
1492 if ((str
[0] < 'a') || (str
[0] > 'z'))
1495 const unsigned base
= base_idx
[str
[0] - 'a'];
1498 for (i
= 0; (i
< 4) && (str
[i
] != '\0'); i
++) {
1499 /* Validate the next character, and, as described above, convert it to a
1502 if ((str
[i
] < 'a') || (str
[i
] > 'z'))
1505 swiz_idx
[i
] = idx_map
[str
[i
] - 'a'] - base
;
1506 if ((swiz_idx
[i
] < 0) || (swiz_idx
[i
] >= (int) vector_length
))
1513 return new(ctx
) ir_swizzle(val
, swiz_idx
[0], swiz_idx
[1], swiz_idx
[2],
1523 ir_swizzle::variable_referenced() const
1525 return this->val
->variable_referenced();
1529 ir_variable::ir_variable(const struct glsl_type
*type
, const char *name
,
1530 ir_variable_mode mode
)
1531 : max_ifc_array_access(NULL
)
1533 this->ir_type
= ir_type_variable
;
1535 this->name
= ralloc_strdup(this, name
);
1536 this->data
.explicit_location
= false;
1537 this->data
.has_initializer
= false;
1538 this->data
.location
= -1;
1539 this->data
.location_frac
= 0;
1540 this->warn_extension
= NULL
;
1541 this->constant_value
= NULL
;
1542 this->constant_initializer
= NULL
;
1543 this->data
.origin_upper_left
= false;
1544 this->data
.pixel_center_integer
= false;
1545 this->data
.depth_layout
= ir_depth_layout_none
;
1546 this->data
.used
= false;
1547 this->data
.read_only
= false;
1548 this->data
.centroid
= false;
1549 this->data
.sample
= false;
1550 this->data
.invariant
= false;
1551 this->data
.how_declared
= ir_var_declared_normally
;
1552 this->data
.mode
= mode
;
1553 this->data
.interpolation
= INTERP_QUALIFIER_NONE
;
1554 this->data
.max_array_access
= 0;
1555 this->data
.atomic
.buffer_index
= 0;
1556 this->data
.atomic
.offset
= 0;
1559 if (type
->base_type
== GLSL_TYPE_SAMPLER
)
1560 this->data
.read_only
= true;
1562 if (type
->is_interface())
1563 this->init_interface_type(type
);
1564 else if (type
->is_array() && type
->fields
.array
->is_interface())
1565 this->init_interface_type(type
->fields
.array
);
1571 interpolation_string(unsigned interpolation
)
1573 switch (interpolation
) {
1574 case INTERP_QUALIFIER_NONE
: return "no";
1575 case INTERP_QUALIFIER_SMOOTH
: return "smooth";
1576 case INTERP_QUALIFIER_FLAT
: return "flat";
1577 case INTERP_QUALIFIER_NOPERSPECTIVE
: return "noperspective";
1580 assert(!"Should not get here.");
1585 glsl_interp_qualifier
1586 ir_variable::determine_interpolation_mode(bool flat_shade
)
1588 if (this->data
.interpolation
!= INTERP_QUALIFIER_NONE
)
1589 return (glsl_interp_qualifier
) this->data
.interpolation
;
1590 int location
= this->data
.location
;
1592 location
== VARYING_SLOT_COL0
|| location
== VARYING_SLOT_COL1
;
1593 if (flat_shade
&& is_gl_Color
)
1594 return INTERP_QUALIFIER_FLAT
;
1596 return INTERP_QUALIFIER_SMOOTH
;
1600 ir_function_signature::ir_function_signature(const glsl_type
*return_type
,
1601 builtin_available_predicate b
)
1602 : return_type(return_type
), is_defined(false), is_intrinsic(false),
1603 builtin_avail(b
), _function(NULL
)
1605 this->ir_type
= ir_type_function_signature
;
1606 this->origin
= NULL
;
1611 ir_function_signature::is_builtin() const
1613 return builtin_avail
!= NULL
;
1618 ir_function_signature::is_builtin_available(const _mesa_glsl_parse_state
*state
) const
1620 /* We can't call the predicate without a state pointer, so just say that
1621 * the signature is available. At compile time, we need the filtering,
1622 * but also receive a valid state pointer. At link time, we're resolving
1623 * imported built-in prototypes to their definitions, which will always
1624 * be an exact match. So we can skip the filtering.
1629 assert(builtin_avail
!= NULL
);
1630 return builtin_avail(state
);
1635 modes_match(unsigned a
, unsigned b
)
1640 /* Accept "in" vs. "const in" */
1641 if ((a
== ir_var_const_in
&& b
== ir_var_function_in
) ||
1642 (b
== ir_var_const_in
&& a
== ir_var_function_in
))
1650 ir_function_signature::qualifiers_match(exec_list
*params
)
1652 /* check that the qualifiers match. */
1653 foreach_two_lists(a_node
, &this->parameters
, b_node
, params
) {
1654 ir_variable
*a
= (ir_variable
*) a_node
;
1655 ir_variable
*b
= (ir_variable
*) b_node
;
1657 if (a
->data
.read_only
!= b
->data
.read_only
||
1658 !modes_match(a
->data
.mode
, b
->data
.mode
) ||
1659 a
->data
.interpolation
!= b
->data
.interpolation
||
1660 a
->data
.centroid
!= b
->data
.centroid
||
1661 a
->data
.sample
!= b
->data
.sample
) {
1663 /* parameter a's qualifiers don't match */
1672 ir_function_signature::replace_parameters(exec_list
*new_params
)
1674 /* Destroy all of the previous parameter information. If the previous
1675 * parameter information comes from the function prototype, it may either
1676 * specify incorrect parameter names or not have names at all.
1678 new_params
->move_nodes_to(¶meters
);
1682 ir_function::ir_function(const char *name
)
1684 this->ir_type
= ir_type_function
;
1685 this->name
= ralloc_strdup(this, name
);
1690 ir_function::has_user_signature()
1692 foreach_list(n
, &this->signatures
) {
1693 ir_function_signature
*const sig
= (ir_function_signature
*) n
;
1694 if (!sig
->is_builtin())
1702 ir_rvalue::error_value(void *mem_ctx
)
1704 ir_rvalue
*v
= new(mem_ctx
) ir_rvalue
;
1706 v
->type
= glsl_type::error_type
;
1712 visit_exec_list(exec_list
*list
, ir_visitor
*visitor
)
1714 foreach_list_safe(n
, list
) {
1715 ((ir_instruction
*) n
)->accept(visitor
);
1721 steal_memory(ir_instruction
*ir
, void *new_ctx
)
1723 ir_variable
*var
= ir
->as_variable();
1724 ir_constant
*constant
= ir
->as_constant();
1725 if (var
!= NULL
&& var
->constant_value
!= NULL
)
1726 steal_memory(var
->constant_value
, ir
);
1728 if (var
!= NULL
&& var
->constant_initializer
!= NULL
)
1729 steal_memory(var
->constant_initializer
, ir
);
1731 /* The components of aggregate constants are not visited by the normal
1732 * visitor, so steal their values by hand.
1734 if (constant
!= NULL
) {
1735 if (constant
->type
->is_record()) {
1736 foreach_list(n
, &constant
->components
) {
1737 ir_constant
*field
= (ir_constant
*) n
;
1738 steal_memory(field
, ir
);
1740 } else if (constant
->type
->is_array()) {
1741 for (unsigned int i
= 0; i
< constant
->type
->length
; i
++) {
1742 steal_memory(constant
->array_elements
[i
], ir
);
1747 ralloc_steal(new_ctx
, ir
);
1752 reparent_ir(exec_list
*list
, void *mem_ctx
)
1754 foreach_list(node
, list
) {
1755 visit_tree((ir_instruction
*) node
, steal_memory
, mem_ctx
);
1761 try_min_one(ir_rvalue
*ir
)
1763 ir_expression
*expr
= ir
->as_expression();
1765 if (!expr
|| expr
->operation
!= ir_binop_min
)
1768 if (expr
->operands
[0]->is_one())
1769 return expr
->operands
[1];
1771 if (expr
->operands
[1]->is_one())
1772 return expr
->operands
[0];
1778 try_max_zero(ir_rvalue
*ir
)
1780 ir_expression
*expr
= ir
->as_expression();
1782 if (!expr
|| expr
->operation
!= ir_binop_max
)
1785 if (expr
->operands
[0]->is_zero())
1786 return expr
->operands
[1];
1788 if (expr
->operands
[1]->is_zero())
1789 return expr
->operands
[0];
1795 ir_rvalue::as_rvalue_to_saturate()
1797 ir_expression
*expr
= this->as_expression();
1802 ir_rvalue
*max_zero
= try_max_zero(expr
);
1804 return try_min_one(max_zero
);
1806 ir_rvalue
*min_one
= try_min_one(expr
);
1808 return try_max_zero(min_one
);
1817 vertices_per_prim(GLenum prim
)
1826 case GL_LINES_ADJACENCY
:
1828 case GL_TRIANGLES_ADJACENCY
:
1831 assert(!"Bad primitive");
1837 * Generate a string describing the mode of a variable
1840 mode_string(const ir_variable
*var
)
1842 switch (var
->data
.mode
) {
1844 return (var
->data
.read_only
) ? "global constant" : "global variable";
1846 case ir_var_uniform
:
1849 case ir_var_shader_in
:
1850 return "shader input";
1852 case ir_var_shader_out
:
1853 return "shader output";
1855 case ir_var_function_in
:
1856 case ir_var_const_in
:
1857 return "function input";
1859 case ir_var_function_out
:
1860 return "function output";
1862 case ir_var_function_inout
:
1863 return "function inout";
1865 case ir_var_system_value
:
1866 return "shader input";
1868 case ir_var_temporary
:
1869 return "compiler temporary";
1871 case ir_var_mode_count
:
1875 assert(!"Should not get here.");
1876 return "invalid variable";