2 * Copyright © 2010 Intel Corporation
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
25 * \file ir_constant_expression.cpp
26 * Evaluate and process constant valued expressions
28 * In GLSL, constant valued expressions are used in several places. These
29 * must be processed and evaluated very early in the compilation process.
32 * * Initializers for uniforms
33 * * Initializers for \c const variables
37 #include "main/core.h" /* for MAX2, MIN2, CLAMP */
38 #include "util/rounding.h" /* for _mesa_roundeven */
39 #include "util/half_float.h"
41 #include "glsl_types.h"
42 #include "program/hash_table.h"
45 dot_f(ir_constant
*op0
, ir_constant
*op1
)
47 assert(op0
->type
->is_float() && op1
->type
->is_float());
50 for (unsigned c
= 0; c
< op0
->type
->components(); c
++)
51 result
+= op0
->value
.f
[c
] * op1
->value
.f
[c
];
57 dot_d(ir_constant
*op0
, ir_constant
*op1
)
59 assert(op0
->type
->is_double() && op1
->type
->is_double());
62 for (unsigned c
= 0; c
< op0
->type
->components(); c
++)
63 result
+= op0
->value
.d
[c
] * op1
->value
.d
[c
];
68 /* This method is the only one supported by gcc. Unions in particular
69 * are iffy, and read-through-converted-pointer is killed by strict
70 * aliasing. OTOH, the compiler sees through the memcpy, so the
71 * resulting asm is reasonable.
74 bitcast_u2f(unsigned int u
)
76 assert(sizeof(float) == sizeof(unsigned int));
78 memcpy(&f
, &u
, sizeof(f
));
85 assert(sizeof(float) == sizeof(unsigned int));
87 memcpy(&u
, &f
, sizeof(f
));
92 * Evaluate one component of a floating-point 4x8 unpacking function.
95 (*pack_1x8_func_t
)(float);
98 * Evaluate one component of a floating-point 2x16 unpacking function.
101 (*pack_1x16_func_t
)(float);
104 * Evaluate one component of a floating-point 4x8 unpacking function.
107 (*unpack_1x8_func_t
)(uint8_t);
110 * Evaluate one component of a floating-point 2x16 unpacking function.
113 (*unpack_1x16_func_t
)(uint16_t);
116 * Evaluate a 2x16 floating-point packing function.
119 pack_2x16(pack_1x16_func_t pack_1x16
,
122 /* From section 8.4 of the GLSL ES 3.00 spec:
126 * The first component of the vector will be written to the least
127 * significant bits of the output; the last component will be written to
128 * the most significant bits.
130 * The specifications for the other packing functions contain similar
134 u
|= ((uint32_t) pack_1x16(x
) << 0);
135 u
|= ((uint32_t) pack_1x16(y
) << 16);
140 * Evaluate a 4x8 floating-point packing function.
143 pack_4x8(pack_1x8_func_t pack_1x8
,
144 float x
, float y
, float z
, float w
)
146 /* From section 8.4 of the GLSL 4.30 spec:
150 * The first component of the vector will be written to the least
151 * significant bits of the output; the last component will be written to
152 * the most significant bits.
154 * The specifications for the other packing functions contain similar
158 u
|= ((uint32_t) pack_1x8(x
) << 0);
159 u
|= ((uint32_t) pack_1x8(y
) << 8);
160 u
|= ((uint32_t) pack_1x8(z
) << 16);
161 u
|= ((uint32_t) pack_1x8(w
) << 24);
166 * Evaluate a 2x16 floating-point unpacking function.
169 unpack_2x16(unpack_1x16_func_t unpack_1x16
,
173 /* From section 8.4 of the GLSL ES 3.00 spec:
177 * The first component of the returned vector will be extracted from
178 * the least significant bits of the input; the last component will be
179 * extracted from the most significant bits.
181 * The specifications for the other unpacking functions contain similar
184 *x
= unpack_1x16((uint16_t) (u
& 0xffff));
185 *y
= unpack_1x16((uint16_t) (u
>> 16));
189 * Evaluate a 4x8 floating-point unpacking function.
192 unpack_4x8(unpack_1x8_func_t unpack_1x8
, uint32_t u
,
193 float *x
, float *y
, float *z
, float *w
)
195 /* From section 8.4 of the GLSL 4.30 spec:
199 * The first component of the returned vector will be extracted from
200 * the least significant bits of the input; the last component will be
201 * extracted from the most significant bits.
203 * The specifications for the other unpacking functions contain similar
206 *x
= unpack_1x8((uint8_t) (u
& 0xff));
207 *y
= unpack_1x8((uint8_t) (u
>> 8));
208 *z
= unpack_1x8((uint8_t) (u
>> 16));
209 *w
= unpack_1x8((uint8_t) (u
>> 24));
213 * Evaluate one component of packSnorm4x8.
216 pack_snorm_1x8(float x
)
218 /* From section 8.4 of the GLSL 4.30 spec:
222 * The conversion for component c of v to fixed point is done as
225 * packSnorm4x8: round(clamp(c, -1, +1) * 127.0)
228 _mesa_lroundevenf(CLAMP(x
, -1.0f
, +1.0f
) * 127.0f
);
232 * Evaluate one component of packSnorm2x16.
235 pack_snorm_1x16(float x
)
237 /* From section 8.4 of the GLSL ES 3.00 spec:
241 * The conversion for component c of v to fixed point is done as
244 * packSnorm2x16: round(clamp(c, -1, +1) * 32767.0)
247 _mesa_lroundevenf(CLAMP(x
, -1.0f
, +1.0f
) * 32767.0f
);
251 * Evaluate one component of unpackSnorm4x8.
254 unpack_snorm_1x8(uint8_t u
)
256 /* From section 8.4 of the GLSL 4.30 spec:
260 * The conversion for unpacked fixed-point value f to floating point is
263 * unpackSnorm4x8: clamp(f / 127.0, -1, +1)
265 return CLAMP((int8_t) u
/ 127.0f
, -1.0f
, +1.0f
);
269 * Evaluate one component of unpackSnorm2x16.
272 unpack_snorm_1x16(uint16_t u
)
274 /* From section 8.4 of the GLSL ES 3.00 spec:
278 * The conversion for unpacked fixed-point value f to floating point is
281 * unpackSnorm2x16: clamp(f / 32767.0, -1, +1)
283 return CLAMP((int16_t) u
/ 32767.0f
, -1.0f
, +1.0f
);
287 * Evaluate one component packUnorm4x8.
290 pack_unorm_1x8(float x
)
292 /* From section 8.4 of the GLSL 4.30 spec:
296 * The conversion for component c of v to fixed point is done as
299 * packUnorm4x8: round(clamp(c, 0, +1) * 255.0)
301 return (uint8_t) (int) _mesa_roundevenf(CLAMP(x
, 0.0f
, 1.0f
) * 255.0f
);
305 * Evaluate one component packUnorm2x16.
308 pack_unorm_1x16(float x
)
310 /* From section 8.4 of the GLSL ES 3.00 spec:
314 * The conversion for component c of v to fixed point is done as
317 * packUnorm2x16: round(clamp(c, 0, +1) * 65535.0)
319 return (uint16_t) (int)
320 _mesa_roundevenf(CLAMP(x
, 0.0f
, 1.0f
) * 65535.0f
);
324 * Evaluate one component of unpackUnorm4x8.
327 unpack_unorm_1x8(uint8_t u
)
329 /* From section 8.4 of the GLSL 4.30 spec:
333 * The conversion for unpacked fixed-point value f to floating point is
336 * unpackUnorm4x8: f / 255.0
338 return (float) u
/ 255.0f
;
342 * Evaluate one component of unpackUnorm2x16.
345 unpack_unorm_1x16(uint16_t u
)
347 /* From section 8.4 of the GLSL ES 3.00 spec:
351 * The conversion for unpacked fixed-point value f to floating point is
354 * unpackUnorm2x16: f / 65535.0
356 return (float) u
/ 65535.0f
;
360 * Evaluate one component of packHalf2x16.
363 pack_half_1x16(float x
)
365 return _mesa_float_to_half(x
);
369 * Evaluate one component of unpackHalf2x16.
372 unpack_half_1x16(uint16_t u
)
374 return _mesa_half_to_float(u
);
378 * Get the constant that is ultimately referenced by an r-value, in a constant
379 * expression evaluation context.
381 * The offset is used when the reference is to a specific column of a matrix.
384 constant_referenced(const ir_dereference
*deref
,
385 struct hash_table
*variable_context
,
386 ir_constant
*&store
, int &offset
)
391 if (variable_context
== NULL
)
394 switch (deref
->ir_type
) {
395 case ir_type_dereference_array
: {
396 const ir_dereference_array
*const da
=
397 (const ir_dereference_array
*) deref
;
399 ir_constant
*const index_c
=
400 da
->array_index
->constant_expression_value(variable_context
);
402 if (!index_c
|| !index_c
->type
->is_scalar() || !index_c
->type
->is_integer())
405 const int index
= index_c
->type
->base_type
== GLSL_TYPE_INT
?
406 index_c
->get_int_component(0) :
407 index_c
->get_uint_component(0);
409 ir_constant
*substore
;
412 const ir_dereference
*const deref
= da
->array
->as_dereference();
416 if (!constant_referenced(deref
, variable_context
, substore
, suboffset
))
419 const glsl_type
*const vt
= da
->array
->type
;
420 if (vt
->is_array()) {
421 store
= substore
->get_array_element(index
);
423 } else if (vt
->is_matrix()) {
425 offset
= index
* vt
->vector_elements
;
426 } else if (vt
->is_vector()) {
428 offset
= suboffset
+ index
;
434 case ir_type_dereference_record
: {
435 const ir_dereference_record
*const dr
=
436 (const ir_dereference_record
*) deref
;
438 const ir_dereference
*const deref
= dr
->record
->as_dereference();
442 ir_constant
*substore
;
445 if (!constant_referenced(deref
, variable_context
, substore
, suboffset
))
448 /* Since we're dropping it on the floor...
450 assert(suboffset
== 0);
452 store
= substore
->get_record_field(dr
->field
);
456 case ir_type_dereference_variable
: {
457 const ir_dereference_variable
*const dv
=
458 (const ir_dereference_variable
*) deref
;
460 store
= (ir_constant
*) hash_table_find(variable_context
, dv
->var
);
465 assert(!"Should not get here.");
469 return store
!= NULL
;
474 ir_rvalue::constant_expression_value(struct hash_table
*)
476 assert(this->type
->is_error());
481 ir_expression::constant_expression_value(struct hash_table
*variable_context
)
483 if (this->type
->is_error())
486 ir_constant
*op
[ARRAY_SIZE(this->operands
)] = { NULL
, };
487 ir_constant_data data
;
489 memset(&data
, 0, sizeof(data
));
491 for (unsigned operand
= 0; operand
< this->get_num_operands(); operand
++) {
492 op
[operand
] = this->operands
[operand
]->constant_expression_value(variable_context
);
498 switch (this->operation
) {
499 case ir_binop_lshift
:
500 case ir_binop_rshift
:
502 case ir_binop_interpolate_at_offset
:
503 case ir_binop_interpolate_at_sample
:
504 case ir_binop_vector_extract
:
506 case ir_triop_bitfield_extract
:
510 assert(op
[0]->type
->base_type
== op
[1]->type
->base_type
);
514 bool op0_scalar
= op
[0]->type
->is_scalar();
515 bool op1_scalar
= op
[1] != NULL
&& op
[1]->type
->is_scalar();
517 /* When iterating over a vector or matrix's components, we want to increase
518 * the loop counter. However, for scalars, we want to stay at 0.
520 unsigned c0_inc
= op0_scalar
? 0 : 1;
521 unsigned c1_inc
= op1_scalar
? 0 : 1;
523 if (op1_scalar
|| !op
[1]) {
524 components
= op
[0]->type
->components();
526 components
= op
[1]->type
->components();
529 void *ctx
= ralloc_parent(this);
531 /* Handle array operations here, rather than below. */
532 if (op
[0]->type
->is_array()) {
533 assert(op
[1] != NULL
&& op
[1]->type
->is_array());
534 switch (this->operation
) {
535 case ir_binop_all_equal
:
536 return new(ctx
) ir_constant(op
[0]->has_value(op
[1]));
537 case ir_binop_any_nequal
:
538 return new(ctx
) ir_constant(!op
[0]->has_value(op
[1]));
545 switch (this->operation
) {
546 case ir_unop_bit_not
:
547 switch (op
[0]->type
->base_type
) {
549 for (unsigned c
= 0; c
< components
; c
++)
550 data
.i
[c
] = ~ op
[0]->value
.i
[c
];
553 for (unsigned c
= 0; c
< components
; c
++)
554 data
.u
[c
] = ~ op
[0]->value
.u
[c
];
561 case ir_unop_logic_not
:
562 assert(op
[0]->type
->base_type
== GLSL_TYPE_BOOL
);
563 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++)
564 data
.b
[c
] = !op
[0]->value
.b
[c
];
568 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
569 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
570 data
.i
[c
] = (int) op
[0]->value
.f
[c
];
574 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
575 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
576 data
.i
[c
] = (unsigned) op
[0]->value
.f
[c
];
580 assert(op
[0]->type
->base_type
== GLSL_TYPE_INT
);
581 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
582 data
.f
[c
] = (float) op
[0]->value
.i
[c
];
586 assert(op
[0]->type
->base_type
== GLSL_TYPE_UINT
);
587 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
588 data
.f
[c
] = (float) op
[0]->value
.u
[c
];
592 assert(op
[0]->type
->base_type
== GLSL_TYPE_BOOL
);
593 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
594 data
.f
[c
] = op
[0]->value
.b
[c
] ? 1.0F
: 0.0F
;
598 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
599 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
600 data
.b
[c
] = op
[0]->value
.f
[c
] != 0.0F
? true : false;
604 assert(op
[0]->type
->base_type
== GLSL_TYPE_BOOL
);
605 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
606 data
.u
[c
] = op
[0]->value
.b
[c
] ? 1 : 0;
610 assert(op
[0]->type
->is_integer());
611 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
612 data
.b
[c
] = op
[0]->value
.u
[c
] ? true : false;
616 assert(op
[0]->type
->base_type
== GLSL_TYPE_UINT
);
617 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
618 data
.i
[c
] = op
[0]->value
.u
[c
];
622 assert(op
[0]->type
->base_type
== GLSL_TYPE_INT
);
623 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
624 data
.u
[c
] = op
[0]->value
.i
[c
];
627 case ir_unop_bitcast_i2f
:
628 assert(op
[0]->type
->base_type
== GLSL_TYPE_INT
);
629 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
630 data
.f
[c
] = bitcast_u2f(op
[0]->value
.i
[c
]);
633 case ir_unop_bitcast_f2i
:
634 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
635 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
636 data
.i
[c
] = bitcast_f2u(op
[0]->value
.f
[c
]);
639 case ir_unop_bitcast_u2f
:
640 assert(op
[0]->type
->base_type
== GLSL_TYPE_UINT
);
641 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
642 data
.f
[c
] = bitcast_u2f(op
[0]->value
.u
[c
]);
645 case ir_unop_bitcast_f2u
:
646 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
647 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
648 data
.u
[c
] = bitcast_f2u(op
[0]->value
.f
[c
]);
652 assert(op
[0]->type
->is_boolean());
654 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
655 if (op
[0]->value
.b
[c
])
660 assert(op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
);
661 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
662 data
.f
[c
] = op
[0]->value
.d
[c
];
666 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
667 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
668 data
.d
[c
] = op
[0]->value
.f
[c
];
672 assert(op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
);
673 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
674 data
.i
[c
] = op
[0]->value
.d
[c
];
678 assert(op
[0]->type
->base_type
== GLSL_TYPE_INT
);
679 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
680 data
.d
[c
] = op
[0]->value
.i
[c
];
684 assert(op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
);
685 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
686 data
.u
[c
] = op
[0]->value
.d
[c
];
690 assert(op
[0]->type
->base_type
== GLSL_TYPE_UINT
);
691 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
692 data
.d
[c
] = op
[0]->value
.u
[c
];
696 assert(op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
);
697 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
698 data
.b
[c
] = op
[0]->value
.d
[c
] != 0.0;
702 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
703 if (op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
)
704 data
.d
[c
] = trunc(op
[0]->value
.d
[c
]);
706 data
.f
[c
] = truncf(op
[0]->value
.f
[c
]);
710 case ir_unop_round_even
:
711 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
712 if (op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
)
713 data
.d
[c
] = _mesa_roundeven(op
[0]->value
.d
[c
]);
715 data
.f
[c
] = _mesa_roundevenf(op
[0]->value
.f
[c
]);
720 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
721 if (op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
)
722 data
.d
[c
] = ceil(op
[0]->value
.d
[c
]);
724 data
.f
[c
] = ceilf(op
[0]->value
.f
[c
]);
729 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
730 if (op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
)
731 data
.d
[c
] = floor(op
[0]->value
.d
[c
]);
733 data
.f
[c
] = floorf(op
[0]->value
.f
[c
]);
738 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
739 switch (this->type
->base_type
) {
746 case GLSL_TYPE_FLOAT
:
747 data
.f
[c
] = op
[0]->value
.f
[c
] - floor(op
[0]->value
.f
[c
]);
749 case GLSL_TYPE_DOUBLE
:
750 data
.d
[c
] = op
[0]->value
.d
[c
] - floor(op
[0]->value
.d
[c
]);
759 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
760 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
761 data
.f
[c
] = sinf(op
[0]->value
.f
[c
]);
766 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
767 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
768 data
.f
[c
] = cosf(op
[0]->value
.f
[c
]);
773 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
774 switch (this->type
->base_type
) {
776 data
.u
[c
] = -((int) op
[0]->value
.u
[c
]);
779 data
.i
[c
] = -op
[0]->value
.i
[c
];
781 case GLSL_TYPE_FLOAT
:
782 data
.f
[c
] = -op
[0]->value
.f
[c
];
784 case GLSL_TYPE_DOUBLE
:
785 data
.d
[c
] = -op
[0]->value
.d
[c
];
794 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
795 switch (this->type
->base_type
) {
797 data
.u
[c
] = op
[0]->value
.u
[c
];
800 data
.i
[c
] = op
[0]->value
.i
[c
];
802 data
.i
[c
] = -data
.i
[c
];
804 case GLSL_TYPE_FLOAT
:
805 data
.f
[c
] = fabs(op
[0]->value
.f
[c
]);
807 case GLSL_TYPE_DOUBLE
:
808 data
.d
[c
] = fabs(op
[0]->value
.d
[c
]);
817 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
818 switch (this->type
->base_type
) {
820 data
.u
[c
] = op
[0]->value
.i
[c
] > 0;
823 data
.i
[c
] = (op
[0]->value
.i
[c
] > 0) - (op
[0]->value
.i
[c
] < 0);
825 case GLSL_TYPE_FLOAT
:
826 data
.f
[c
] = float((op
[0]->value
.f
[c
] > 0)-(op
[0]->value
.f
[c
] < 0));
828 case GLSL_TYPE_DOUBLE
:
829 data
.d
[c
] = double((op
[0]->value
.d
[c
] > 0)-(op
[0]->value
.d
[c
] < 0));
838 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
839 switch (this->type
->base_type
) {
841 if (op
[0]->value
.u
[c
] != 0.0)
842 data
.u
[c
] = 1 / op
[0]->value
.u
[c
];
845 if (op
[0]->value
.i
[c
] != 0.0)
846 data
.i
[c
] = 1 / op
[0]->value
.i
[c
];
848 case GLSL_TYPE_FLOAT
:
849 if (op
[0]->value
.f
[c
] != 0.0)
850 data
.f
[c
] = 1.0F
/ op
[0]->value
.f
[c
];
852 case GLSL_TYPE_DOUBLE
:
853 if (op
[0]->value
.d
[c
] != 0.0)
854 data
.d
[c
] = 1.0 / op
[0]->value
.d
[c
];
863 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
864 if (op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
)
865 data
.d
[c
] = 1.0 / sqrt(op
[0]->value
.d
[c
]);
867 data
.f
[c
] = 1.0F
/ sqrtf(op
[0]->value
.f
[c
]);
872 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
873 if (op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
)
874 data
.d
[c
] = sqrt(op
[0]->value
.d
[c
]);
876 data
.f
[c
] = sqrtf(op
[0]->value
.f
[c
]);
881 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
882 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
883 data
.f
[c
] = expf(op
[0]->value
.f
[c
]);
888 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
889 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
890 data
.f
[c
] = exp2f(op
[0]->value
.f
[c
]);
895 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
896 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
897 data
.f
[c
] = logf(op
[0]->value
.f
[c
]);
902 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
903 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
904 data
.f
[c
] = log2f(op
[0]->value
.f
[c
]);
909 case ir_unop_dFdx_coarse
:
910 case ir_unop_dFdx_fine
:
912 case ir_unop_dFdy_coarse
:
913 case ir_unop_dFdy_fine
:
914 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
915 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
920 case ir_unop_pack_snorm_2x16
:
921 assert(op
[0]->type
== glsl_type::vec2_type
);
922 data
.u
[0] = pack_2x16(pack_snorm_1x16
,
926 case ir_unop_pack_snorm_4x8
:
927 assert(op
[0]->type
== glsl_type::vec4_type
);
928 data
.u
[0] = pack_4x8(pack_snorm_1x8
,
934 case ir_unop_unpack_snorm_2x16
:
935 assert(op
[0]->type
== glsl_type::uint_type
);
936 unpack_2x16(unpack_snorm_1x16
,
938 &data
.f
[0], &data
.f
[1]);
940 case ir_unop_unpack_snorm_4x8
:
941 assert(op
[0]->type
== glsl_type::uint_type
);
942 unpack_4x8(unpack_snorm_1x8
,
944 &data
.f
[0], &data
.f
[1], &data
.f
[2], &data
.f
[3]);
946 case ir_unop_pack_unorm_2x16
:
947 assert(op
[0]->type
== glsl_type::vec2_type
);
948 data
.u
[0] = pack_2x16(pack_unorm_1x16
,
952 case ir_unop_pack_unorm_4x8
:
953 assert(op
[0]->type
== glsl_type::vec4_type
);
954 data
.u
[0] = pack_4x8(pack_unorm_1x8
,
960 case ir_unop_unpack_unorm_2x16
:
961 assert(op
[0]->type
== glsl_type::uint_type
);
962 unpack_2x16(unpack_unorm_1x16
,
964 &data
.f
[0], &data
.f
[1]);
966 case ir_unop_unpack_unorm_4x8
:
967 assert(op
[0]->type
== glsl_type::uint_type
);
968 unpack_4x8(unpack_unorm_1x8
,
970 &data
.f
[0], &data
.f
[1], &data
.f
[2], &data
.f
[3]);
972 case ir_unop_pack_half_2x16
:
973 assert(op
[0]->type
== glsl_type::vec2_type
);
974 data
.u
[0] = pack_2x16(pack_half_1x16
,
978 case ir_unop_unpack_half_2x16
:
979 assert(op
[0]->type
== glsl_type::uint_type
);
980 unpack_2x16(unpack_half_1x16
,
982 &data
.f
[0], &data
.f
[1]);
985 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
);
986 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
987 data
.f
[c
] = powf(op
[0]->value
.f
[c
], op
[1]->value
.f
[c
]);
992 if (op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
)
993 data
.d
[0] = dot_d(op
[0], op
[1]);
995 data
.f
[0] = dot_f(op
[0], op
[1]);
999 assert(op
[0]->type
== op
[1]->type
|| op0_scalar
|| op1_scalar
);
1000 for (unsigned c
= 0, c0
= 0, c1
= 0;
1002 c0
+= c0_inc
, c1
+= c1_inc
, c
++) {
1004 switch (op
[0]->type
->base_type
) {
1005 case GLSL_TYPE_UINT
:
1006 data
.u
[c
] = MIN2(op
[0]->value
.u
[c0
], op
[1]->value
.u
[c1
]);
1009 data
.i
[c
] = MIN2(op
[0]->value
.i
[c0
], op
[1]->value
.i
[c1
]);
1011 case GLSL_TYPE_FLOAT
:
1012 data
.f
[c
] = MIN2(op
[0]->value
.f
[c0
], op
[1]->value
.f
[c1
]);
1014 case GLSL_TYPE_DOUBLE
:
1015 data
.d
[c
] = MIN2(op
[0]->value
.d
[c0
], op
[1]->value
.d
[c1
]);
1024 assert(op
[0]->type
== op
[1]->type
|| op0_scalar
|| op1_scalar
);
1025 for (unsigned c
= 0, c0
= 0, c1
= 0;
1027 c0
+= c0_inc
, c1
+= c1_inc
, c
++) {
1029 switch (op
[0]->type
->base_type
) {
1030 case GLSL_TYPE_UINT
:
1031 data
.u
[c
] = MAX2(op
[0]->value
.u
[c0
], op
[1]->value
.u
[c1
]);
1034 data
.i
[c
] = MAX2(op
[0]->value
.i
[c0
], op
[1]->value
.i
[c1
]);
1036 case GLSL_TYPE_FLOAT
:
1037 data
.f
[c
] = MAX2(op
[0]->value
.f
[c0
], op
[1]->value
.f
[c1
]);
1039 case GLSL_TYPE_DOUBLE
:
1040 data
.d
[c
] = MAX2(op
[0]->value
.d
[c0
], op
[1]->value
.d
[c1
]);
1049 assert(op
[0]->type
== op
[1]->type
|| op0_scalar
|| op1_scalar
);
1050 for (unsigned c
= 0, c0
= 0, c1
= 0;
1052 c0
+= c0_inc
, c1
+= c1_inc
, c
++) {
1054 switch (op
[0]->type
->base_type
) {
1055 case GLSL_TYPE_UINT
:
1056 data
.u
[c
] = op
[0]->value
.u
[c0
] + op
[1]->value
.u
[c1
];
1059 data
.i
[c
] = op
[0]->value
.i
[c0
] + op
[1]->value
.i
[c1
];
1061 case GLSL_TYPE_FLOAT
:
1062 data
.f
[c
] = op
[0]->value
.f
[c0
] + op
[1]->value
.f
[c1
];
1064 case GLSL_TYPE_DOUBLE
:
1065 data
.d
[c
] = op
[0]->value
.d
[c0
] + op
[1]->value
.d
[c1
];
1074 assert(op
[0]->type
== op
[1]->type
|| op0_scalar
|| op1_scalar
);
1075 for (unsigned c
= 0, c0
= 0, c1
= 0;
1077 c0
+= c0_inc
, c1
+= c1_inc
, c
++) {
1079 switch (op
[0]->type
->base_type
) {
1080 case GLSL_TYPE_UINT
:
1081 data
.u
[c
] = op
[0]->value
.u
[c0
] - op
[1]->value
.u
[c1
];
1084 data
.i
[c
] = op
[0]->value
.i
[c0
] - op
[1]->value
.i
[c1
];
1086 case GLSL_TYPE_FLOAT
:
1087 data
.f
[c
] = op
[0]->value
.f
[c0
] - op
[1]->value
.f
[c1
];
1089 case GLSL_TYPE_DOUBLE
:
1090 data
.d
[c
] = op
[0]->value
.d
[c0
] - op
[1]->value
.d
[c1
];
1099 /* Check for equal types, or unequal types involving scalars */
1100 if ((op
[0]->type
== op
[1]->type
&& !op
[0]->type
->is_matrix())
1101 || op0_scalar
|| op1_scalar
) {
1102 for (unsigned c
= 0, c0
= 0, c1
= 0;
1104 c0
+= c0_inc
, c1
+= c1_inc
, c
++) {
1106 switch (op
[0]->type
->base_type
) {
1107 case GLSL_TYPE_UINT
:
1108 data
.u
[c
] = op
[0]->value
.u
[c0
] * op
[1]->value
.u
[c1
];
1111 data
.i
[c
] = op
[0]->value
.i
[c0
] * op
[1]->value
.i
[c1
];
1113 case GLSL_TYPE_FLOAT
:
1114 data
.f
[c
] = op
[0]->value
.f
[c0
] * op
[1]->value
.f
[c1
];
1116 case GLSL_TYPE_DOUBLE
:
1117 data
.d
[c
] = op
[0]->value
.d
[c0
] * op
[1]->value
.d
[c1
];
1124 assert(op
[0]->type
->is_matrix() || op
[1]->type
->is_matrix());
1126 /* Multiply an N-by-M matrix with an M-by-P matrix. Since either
1127 * matrix can be a GLSL vector, either N or P can be 1.
1129 * For vec*mat, the vector is treated as a row vector. This
1130 * means the vector is a 1-row x M-column matrix.
1132 * For mat*vec, the vector is treated as a column vector. Since
1133 * matrix_columns is 1 for vectors, this just works.
1135 const unsigned n
= op
[0]->type
->is_vector()
1136 ? 1 : op
[0]->type
->vector_elements
;
1137 const unsigned m
= op
[1]->type
->vector_elements
;
1138 const unsigned p
= op
[1]->type
->matrix_columns
;
1139 for (unsigned j
= 0; j
< p
; j
++) {
1140 for (unsigned i
= 0; i
< n
; i
++) {
1141 for (unsigned k
= 0; k
< m
; k
++) {
1142 if (op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
)
1143 data
.d
[i
+n
*j
] += op
[0]->value
.d
[i
+n
*k
]*op
[1]->value
.d
[k
+m
*j
];
1145 data
.f
[i
+n
*j
] += op
[0]->value
.f
[i
+n
*k
]*op
[1]->value
.f
[k
+m
*j
];
1153 /* FINISHME: Emit warning when division-by-zero is detected. */
1154 assert(op
[0]->type
== op
[1]->type
|| op0_scalar
|| op1_scalar
);
1155 for (unsigned c
= 0, c0
= 0, c1
= 0;
1157 c0
+= c0_inc
, c1
+= c1_inc
, c
++) {
1159 switch (op
[0]->type
->base_type
) {
1160 case GLSL_TYPE_UINT
:
1161 if (op
[1]->value
.u
[c1
] == 0) {
1164 data
.u
[c
] = op
[0]->value
.u
[c0
] / op
[1]->value
.u
[c1
];
1168 if (op
[1]->value
.i
[c1
] == 0) {
1171 data
.i
[c
] = op
[0]->value
.i
[c0
] / op
[1]->value
.i
[c1
];
1174 case GLSL_TYPE_FLOAT
:
1175 data
.f
[c
] = op
[0]->value
.f
[c0
] / op
[1]->value
.f
[c1
];
1177 case GLSL_TYPE_DOUBLE
:
1178 data
.d
[c
] = op
[0]->value
.d
[c0
] / op
[1]->value
.d
[c1
];
1187 /* FINISHME: Emit warning when division-by-zero is detected. */
1188 assert(op
[0]->type
== op
[1]->type
|| op0_scalar
|| op1_scalar
);
1189 for (unsigned c
= 0, c0
= 0, c1
= 0;
1191 c0
+= c0_inc
, c1
+= c1_inc
, c
++) {
1193 switch (op
[0]->type
->base_type
) {
1194 case GLSL_TYPE_UINT
:
1195 if (op
[1]->value
.u
[c1
] == 0) {
1198 data
.u
[c
] = op
[0]->value
.u
[c0
] % op
[1]->value
.u
[c1
];
1202 if (op
[1]->value
.i
[c1
] == 0) {
1205 data
.i
[c
] = op
[0]->value
.i
[c0
] % op
[1]->value
.i
[c1
];
1208 case GLSL_TYPE_FLOAT
:
1209 /* We don't use fmod because it rounds toward zero; GLSL specifies
1212 data
.f
[c
] = op
[0]->value
.f
[c0
] - op
[1]->value
.f
[c1
]
1213 * floorf(op
[0]->value
.f
[c0
] / op
[1]->value
.f
[c1
]);
1215 case GLSL_TYPE_DOUBLE
:
1216 /* We don't use fmod because it rounds toward zero; GLSL specifies
1219 data
.d
[c
] = op
[0]->value
.d
[c0
] - op
[1]->value
.d
[c1
]
1220 * floor(op
[0]->value
.d
[c0
] / op
[1]->value
.d
[c1
]);
1229 case ir_binop_logic_and
:
1230 assert(op
[0]->type
->base_type
== GLSL_TYPE_BOOL
);
1231 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++)
1232 data
.b
[c
] = op
[0]->value
.b
[c
] && op
[1]->value
.b
[c
];
1234 case ir_binop_logic_xor
:
1235 assert(op
[0]->type
->base_type
== GLSL_TYPE_BOOL
);
1236 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++)
1237 data
.b
[c
] = op
[0]->value
.b
[c
] ^ op
[1]->value
.b
[c
];
1239 case ir_binop_logic_or
:
1240 assert(op
[0]->type
->base_type
== GLSL_TYPE_BOOL
);
1241 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++)
1242 data
.b
[c
] = op
[0]->value
.b
[c
] || op
[1]->value
.b
[c
];
1246 assert(op
[0]->type
== op
[1]->type
);
1247 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
1248 switch (op
[0]->type
->base_type
) {
1249 case GLSL_TYPE_UINT
:
1250 data
.b
[c
] = op
[0]->value
.u
[c
] < op
[1]->value
.u
[c
];
1253 data
.b
[c
] = op
[0]->value
.i
[c
] < op
[1]->value
.i
[c
];
1255 case GLSL_TYPE_FLOAT
:
1256 data
.b
[c
] = op
[0]->value
.f
[c
] < op
[1]->value
.f
[c
];
1258 case GLSL_TYPE_DOUBLE
:
1259 data
.b
[c
] = op
[0]->value
.d
[c
] < op
[1]->value
.d
[c
];
1266 case ir_binop_greater
:
1267 assert(op
[0]->type
== op
[1]->type
);
1268 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
1269 switch (op
[0]->type
->base_type
) {
1270 case GLSL_TYPE_UINT
:
1271 data
.b
[c
] = op
[0]->value
.u
[c
] > op
[1]->value
.u
[c
];
1274 data
.b
[c
] = op
[0]->value
.i
[c
] > op
[1]->value
.i
[c
];
1276 case GLSL_TYPE_FLOAT
:
1277 data
.b
[c
] = op
[0]->value
.f
[c
] > op
[1]->value
.f
[c
];
1279 case GLSL_TYPE_DOUBLE
:
1280 data
.b
[c
] = op
[0]->value
.d
[c
] > op
[1]->value
.d
[c
];
1287 case ir_binop_lequal
:
1288 assert(op
[0]->type
== op
[1]->type
);
1289 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
1290 switch (op
[0]->type
->base_type
) {
1291 case GLSL_TYPE_UINT
:
1292 data
.b
[c
] = op
[0]->value
.u
[c
] <= op
[1]->value
.u
[c
];
1295 data
.b
[c
] = op
[0]->value
.i
[c
] <= op
[1]->value
.i
[c
];
1297 case GLSL_TYPE_FLOAT
:
1298 data
.b
[c
] = op
[0]->value
.f
[c
] <= op
[1]->value
.f
[c
];
1300 case GLSL_TYPE_DOUBLE
:
1301 data
.b
[c
] = op
[0]->value
.d
[c
] <= op
[1]->value
.d
[c
];
1308 case ir_binop_gequal
:
1309 assert(op
[0]->type
== op
[1]->type
);
1310 for (unsigned c
= 0; c
< op
[0]->type
->components(); c
++) {
1311 switch (op
[0]->type
->base_type
) {
1312 case GLSL_TYPE_UINT
:
1313 data
.b
[c
] = op
[0]->value
.u
[c
] >= op
[1]->value
.u
[c
];
1316 data
.b
[c
] = op
[0]->value
.i
[c
] >= op
[1]->value
.i
[c
];
1318 case GLSL_TYPE_FLOAT
:
1319 data
.b
[c
] = op
[0]->value
.f
[c
] >= op
[1]->value
.f
[c
];
1321 case GLSL_TYPE_DOUBLE
:
1322 data
.b
[c
] = op
[0]->value
.d
[c
] >= op
[1]->value
.d
[c
];
1329 case ir_binop_equal
:
1330 assert(op
[0]->type
== op
[1]->type
);
1331 for (unsigned c
= 0; c
< components
; c
++) {
1332 switch (op
[0]->type
->base_type
) {
1333 case GLSL_TYPE_UINT
:
1334 data
.b
[c
] = op
[0]->value
.u
[c
] == op
[1]->value
.u
[c
];
1337 data
.b
[c
] = op
[0]->value
.i
[c
] == op
[1]->value
.i
[c
];
1339 case GLSL_TYPE_FLOAT
:
1340 data
.b
[c
] = op
[0]->value
.f
[c
] == op
[1]->value
.f
[c
];
1342 case GLSL_TYPE_BOOL
:
1343 data
.b
[c
] = op
[0]->value
.b
[c
] == op
[1]->value
.b
[c
];
1345 case GLSL_TYPE_DOUBLE
:
1346 data
.b
[c
] = op
[0]->value
.d
[c
] == op
[1]->value
.d
[c
];
1353 case ir_binop_nequal
:
1354 assert(op
[0]->type
== op
[1]->type
);
1355 for (unsigned c
= 0; c
< components
; c
++) {
1356 switch (op
[0]->type
->base_type
) {
1357 case GLSL_TYPE_UINT
:
1358 data
.b
[c
] = op
[0]->value
.u
[c
] != op
[1]->value
.u
[c
];
1361 data
.b
[c
] = op
[0]->value
.i
[c
] != op
[1]->value
.i
[c
];
1363 case GLSL_TYPE_FLOAT
:
1364 data
.b
[c
] = op
[0]->value
.f
[c
] != op
[1]->value
.f
[c
];
1366 case GLSL_TYPE_BOOL
:
1367 data
.b
[c
] = op
[0]->value
.b
[c
] != op
[1]->value
.b
[c
];
1369 case GLSL_TYPE_DOUBLE
:
1370 data
.b
[c
] = op
[0]->value
.d
[c
] != op
[1]->value
.d
[c
];
1377 case ir_binop_all_equal
:
1378 data
.b
[0] = op
[0]->has_value(op
[1]);
1380 case ir_binop_any_nequal
:
1381 data
.b
[0] = !op
[0]->has_value(op
[1]);
1384 case ir_binop_lshift
:
1385 for (unsigned c
= 0, c0
= 0, c1
= 0;
1387 c0
+= c0_inc
, c1
+= c1_inc
, c
++) {
1389 if (op
[0]->type
->base_type
== GLSL_TYPE_INT
&&
1390 op
[1]->type
->base_type
== GLSL_TYPE_INT
) {
1391 data
.i
[c
] = op
[0]->value
.i
[c0
] << op
[1]->value
.i
[c1
];
1393 } else if (op
[0]->type
->base_type
== GLSL_TYPE_INT
&&
1394 op
[1]->type
->base_type
== GLSL_TYPE_UINT
) {
1395 data
.i
[c
] = op
[0]->value
.i
[c0
] << op
[1]->value
.u
[c1
];
1397 } else if (op
[0]->type
->base_type
== GLSL_TYPE_UINT
&&
1398 op
[1]->type
->base_type
== GLSL_TYPE_INT
) {
1399 data
.u
[c
] = op
[0]->value
.u
[c0
] << op
[1]->value
.i
[c1
];
1401 } else if (op
[0]->type
->base_type
== GLSL_TYPE_UINT
&&
1402 op
[1]->type
->base_type
== GLSL_TYPE_UINT
) {
1403 data
.u
[c
] = op
[0]->value
.u
[c0
] << op
[1]->value
.u
[c1
];
1408 case ir_binop_rshift
:
1409 for (unsigned c
= 0, c0
= 0, c1
= 0;
1411 c0
+= c0_inc
, c1
+= c1_inc
, c
++) {
1413 if (op
[0]->type
->base_type
== GLSL_TYPE_INT
&&
1414 op
[1]->type
->base_type
== GLSL_TYPE_INT
) {
1415 data
.i
[c
] = op
[0]->value
.i
[c0
] >> op
[1]->value
.i
[c1
];
1417 } else if (op
[0]->type
->base_type
== GLSL_TYPE_INT
&&
1418 op
[1]->type
->base_type
== GLSL_TYPE_UINT
) {
1419 data
.i
[c
] = op
[0]->value
.i
[c0
] >> op
[1]->value
.u
[c1
];
1421 } else if (op
[0]->type
->base_type
== GLSL_TYPE_UINT
&&
1422 op
[1]->type
->base_type
== GLSL_TYPE_INT
) {
1423 data
.u
[c
] = op
[0]->value
.u
[c0
] >> op
[1]->value
.i
[c1
];
1425 } else if (op
[0]->type
->base_type
== GLSL_TYPE_UINT
&&
1426 op
[1]->type
->base_type
== GLSL_TYPE_UINT
) {
1427 data
.u
[c
] = op
[0]->value
.u
[c0
] >> op
[1]->value
.u
[c1
];
1432 case ir_binop_bit_and
:
1433 for (unsigned c
= 0, c0
= 0, c1
= 0;
1435 c0
+= c0_inc
, c1
+= c1_inc
, c
++) {
1437 switch (op
[0]->type
->base_type
) {
1439 data
.i
[c
] = op
[0]->value
.i
[c0
] & op
[1]->value
.i
[c1
];
1441 case GLSL_TYPE_UINT
:
1442 data
.u
[c
] = op
[0]->value
.u
[c0
] & op
[1]->value
.u
[c1
];
1450 case ir_binop_bit_or
:
1451 for (unsigned c
= 0, c0
= 0, c1
= 0;
1453 c0
+= c0_inc
, c1
+= c1_inc
, c
++) {
1455 switch (op
[0]->type
->base_type
) {
1457 data
.i
[c
] = op
[0]->value
.i
[c0
] | op
[1]->value
.i
[c1
];
1459 case GLSL_TYPE_UINT
:
1460 data
.u
[c
] = op
[0]->value
.u
[c0
] | op
[1]->value
.u
[c1
];
1468 case ir_binop_vector_extract
: {
1469 const int c
= CLAMP(op
[1]->value
.i
[0], 0,
1470 (int) op
[0]->type
->vector_elements
- 1);
1472 switch (op
[0]->type
->base_type
) {
1473 case GLSL_TYPE_UINT
:
1474 data
.u
[0] = op
[0]->value
.u
[c
];
1477 data
.i
[0] = op
[0]->value
.i
[c
];
1479 case GLSL_TYPE_FLOAT
:
1480 data
.f
[0] = op
[0]->value
.f
[c
];
1482 case GLSL_TYPE_DOUBLE
:
1483 data
.d
[0] = op
[0]->value
.d
[c
];
1485 case GLSL_TYPE_BOOL
:
1486 data
.b
[0] = op
[0]->value
.b
[c
];
1494 case ir_binop_bit_xor
:
1495 for (unsigned c
= 0, c0
= 0, c1
= 0;
1497 c0
+= c0_inc
, c1
+= c1_inc
, c
++) {
1499 switch (op
[0]->type
->base_type
) {
1501 data
.i
[c
] = op
[0]->value
.i
[c0
] ^ op
[1]->value
.i
[c1
];
1503 case GLSL_TYPE_UINT
:
1504 data
.u
[c
] = op
[0]->value
.u
[c0
] ^ op
[1]->value
.u
[c1
];
1512 case ir_unop_bitfield_reverse
:
1513 /* http://graphics.stanford.edu/~seander/bithacks.html#BitReverseObvious */
1514 for (unsigned c
= 0; c
< components
; c
++) {
1515 unsigned int v
= op
[0]->value
.u
[c
]; // input bits to be reversed
1516 unsigned int r
= v
; // r will be reversed bits of v; first get LSB of v
1517 int s
= sizeof(v
) * CHAR_BIT
- 1; // extra shift needed at end
1519 for (v
>>= 1; v
; v
>>= 1) {
1524 r
<<= s
; // shift when v's highest bits are zero
1530 case ir_unop_bit_count
:
1531 for (unsigned c
= 0; c
< components
; c
++) {
1533 unsigned v
= op
[0]->value
.u
[c
];
1535 for (; v
; count
++) {
1542 case ir_unop_find_msb
:
1543 for (unsigned c
= 0; c
< components
; c
++) {
1544 int v
= op
[0]->value
.i
[c
];
1546 if (v
== 0 || (op
[0]->type
->base_type
== GLSL_TYPE_INT
&& v
== -1))
1550 int top_bit
= op
[0]->type
->base_type
== GLSL_TYPE_UINT
1551 ? 0 : v
& (1 << 31);
1553 while (((v
& (1 << 31)) == top_bit
) && count
!= 32) {
1558 data
.i
[c
] = 31 - count
;
1563 case ir_unop_find_lsb
:
1564 for (unsigned c
= 0; c
< components
; c
++) {
1565 if (op
[0]->value
.i
[c
] == 0)
1569 unsigned v
= op
[0]->value
.u
[c
];
1571 for (; !(v
& 1); v
>>= 1) {
1579 case ir_unop_saturate
:
1580 for (unsigned c
= 0; c
< components
; c
++) {
1581 data
.f
[c
] = CLAMP(op
[0]->value
.f
[c
], 0.0f
, 1.0f
);
1584 case ir_unop_pack_double_2x32
: {
1585 /* XXX needs to be checked on big-endian */
1587 temp
= (uint64_t)op
[0]->value
.u
[0] | ((uint64_t)op
[0]->value
.u
[1] << 32);
1588 data
.d
[0] = *(double *)&temp
;
1592 case ir_unop_unpack_double_2x32
:
1593 /* XXX needs to be checked on big-endian */
1594 data
.u
[0] = *(uint32_t *)&op
[0]->value
.d
[0];
1595 data
.u
[1] = *((uint32_t *)&op
[0]->value
.d
[0] + 1);
1598 case ir_triop_bitfield_extract
: {
1599 int offset
= op
[1]->value
.i
[0];
1600 int bits
= op
[2]->value
.i
[0];
1602 for (unsigned c
= 0; c
< components
; c
++) {
1605 else if (offset
< 0 || bits
< 0)
1606 data
.u
[c
] = 0; /* Undefined, per spec. */
1607 else if (offset
+ bits
> 32)
1608 data
.u
[c
] = 0; /* Undefined, per spec. */
1610 if (op
[0]->type
->base_type
== GLSL_TYPE_INT
) {
1611 /* int so that the right shift will sign-extend. */
1612 int value
= op
[0]->value
.i
[c
];
1613 value
<<= 32 - bits
- offset
;
1614 value
>>= 32 - bits
;
1617 unsigned value
= op
[0]->value
.u
[c
];
1618 value
<<= 32 - bits
- offset
;
1619 value
>>= 32 - bits
;
1627 case ir_binop_bfm
: {
1628 int bits
= op
[0]->value
.i
[0];
1629 int offset
= op
[1]->value
.i
[0];
1631 for (unsigned c
= 0; c
< components
; c
++) {
1633 data
.u
[c
] = op
[0]->value
.u
[c
];
1634 else if (offset
< 0 || bits
< 0)
1635 data
.u
[c
] = 0; /* Undefined for bitfieldInsert, per spec. */
1636 else if (offset
+ bits
> 32)
1637 data
.u
[c
] = 0; /* Undefined for bitfieldInsert, per spec. */
1639 data
.u
[c
] = ((1 << bits
) - 1) << offset
;
1644 case ir_binop_ldexp
:
1645 for (unsigned c
= 0; c
< components
; c
++) {
1646 if (op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
) {
1647 data
.d
[c
] = ldexp(op
[0]->value
.d
[c
], op
[1]->value
.i
[c
]);
1648 /* Flush subnormal values to zero. */
1649 if (!isnormal(data
.d
[c
]))
1650 data
.d
[c
] = copysign(0.0, op
[0]->value
.d
[c
]);
1652 data
.f
[c
] = ldexpf(op
[0]->value
.f
[c
], op
[1]->value
.i
[c
]);
1653 /* Flush subnormal values to zero. */
1654 if (!isnormal(data
.f
[c
]))
1655 data
.f
[c
] = copysignf(0.0f
, op
[0]->value
.f
[c
]);
1661 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
||
1662 op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
);
1663 assert(op
[1]->type
->base_type
== GLSL_TYPE_FLOAT
||
1664 op
[1]->type
->base_type
== GLSL_TYPE_DOUBLE
);
1665 assert(op
[2]->type
->base_type
== GLSL_TYPE_FLOAT
||
1666 op
[2]->type
->base_type
== GLSL_TYPE_DOUBLE
);
1668 for (unsigned c
= 0; c
< components
; c
++) {
1669 if (op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
)
1670 data
.d
[c
] = op
[0]->value
.d
[c
] * op
[1]->value
.d
[c
]
1671 + op
[2]->value
.d
[c
];
1673 data
.f
[c
] = op
[0]->value
.f
[c
] * op
[1]->value
.f
[c
]
1674 + op
[2]->value
.f
[c
];
1678 case ir_triop_lrp
: {
1679 assert(op
[0]->type
->base_type
== GLSL_TYPE_FLOAT
||
1680 op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
);
1681 assert(op
[1]->type
->base_type
== GLSL_TYPE_FLOAT
||
1682 op
[1]->type
->base_type
== GLSL_TYPE_DOUBLE
);
1683 assert(op
[2]->type
->base_type
== GLSL_TYPE_FLOAT
||
1684 op
[2]->type
->base_type
== GLSL_TYPE_DOUBLE
);
1686 unsigned c2_inc
= op
[2]->type
->is_scalar() ? 0 : 1;
1687 for (unsigned c
= 0, c2
= 0; c
< components
; c2
+= c2_inc
, c
++) {
1688 if (op
[0]->type
->base_type
== GLSL_TYPE_DOUBLE
)
1689 data
.d
[c
] = op
[0]->value
.d
[c
] * (1.0 - op
[2]->value
.d
[c2
]) +
1690 (op
[1]->value
.d
[c
] * op
[2]->value
.d
[c2
]);
1692 data
.f
[c
] = op
[0]->value
.f
[c
] * (1.0f
- op
[2]->value
.f
[c2
]) +
1693 (op
[1]->value
.f
[c
] * op
[2]->value
.f
[c2
]);
1699 for (unsigned c
= 0; c
< components
; c
++) {
1700 if (op
[1]->type
->base_type
== GLSL_TYPE_DOUBLE
)
1701 data
.d
[c
] = op
[0]->value
.b
[c
] ? op
[1]->value
.d
[c
]
1702 : op
[2]->value
.d
[c
];
1704 data
.u
[c
] = op
[0]->value
.b
[c
] ? op
[1]->value
.u
[c
]
1705 : op
[2]->value
.u
[c
];
1709 case ir_triop_vector_insert
: {
1710 const unsigned idx
= op
[2]->value
.u
[0];
1712 memcpy(&data
, &op
[0]->value
, sizeof(data
));
1714 switch (this->type
->base_type
) {
1716 data
.i
[idx
] = op
[1]->value
.i
[0];
1718 case GLSL_TYPE_UINT
:
1719 data
.u
[idx
] = op
[1]->value
.u
[0];
1721 case GLSL_TYPE_FLOAT
:
1722 data
.f
[idx
] = op
[1]->value
.f
[0];
1724 case GLSL_TYPE_BOOL
:
1725 data
.b
[idx
] = op
[1]->value
.b
[0];
1727 case GLSL_TYPE_DOUBLE
:
1728 data
.d
[idx
] = op
[1]->value
.d
[0];
1731 assert(!"Should not get here.");
1737 case ir_quadop_bitfield_insert
: {
1738 int offset
= op
[2]->value
.i
[0];
1739 int bits
= op
[3]->value
.i
[0];
1741 for (unsigned c
= 0; c
< components
; c
++) {
1743 data
.u
[c
] = op
[0]->value
.u
[c
];
1744 else if (offset
< 0 || bits
< 0)
1745 data
.u
[c
] = 0; /* Undefined, per spec. */
1746 else if (offset
+ bits
> 32)
1747 data
.u
[c
] = 0; /* Undefined, per spec. */
1749 unsigned insert_mask
= ((1 << bits
) - 1) << offset
;
1751 unsigned insert
= op
[1]->value
.u
[c
];
1753 insert
&= insert_mask
;
1755 unsigned base
= op
[0]->value
.u
[c
];
1756 base
&= ~insert_mask
;
1758 data
.u
[c
] = base
| insert
;
1764 case ir_quadop_vector
:
1765 for (unsigned c
= 0; c
< this->type
->vector_elements
; c
++) {
1766 switch (this->type
->base_type
) {
1768 data
.i
[c
] = op
[c
]->value
.i
[0];
1770 case GLSL_TYPE_UINT
:
1771 data
.u
[c
] = op
[c
]->value
.u
[0];
1773 case GLSL_TYPE_FLOAT
:
1774 data
.f
[c
] = op
[c
]->value
.f
[0];
1776 case GLSL_TYPE_DOUBLE
:
1777 data
.d
[c
] = op
[c
]->value
.d
[0];
1786 /* FINISHME: Should handle all expression types. */
1790 return new(ctx
) ir_constant(this->type
, &data
);
1795 ir_texture::constant_expression_value(struct hash_table
*)
1797 /* texture lookups aren't constant expressions */
1803 ir_swizzle::constant_expression_value(struct hash_table
*variable_context
)
1805 ir_constant
*v
= this->val
->constant_expression_value(variable_context
);
1808 ir_constant_data data
= { { 0 } };
1810 const unsigned swiz_idx
[4] = {
1811 this->mask
.x
, this->mask
.y
, this->mask
.z
, this->mask
.w
1814 for (unsigned i
= 0; i
< this->mask
.num_components
; i
++) {
1815 switch (v
->type
->base_type
) {
1816 case GLSL_TYPE_UINT
:
1817 case GLSL_TYPE_INT
: data
.u
[i
] = v
->value
.u
[swiz_idx
[i
]]; break;
1818 case GLSL_TYPE_FLOAT
: data
.f
[i
] = v
->value
.f
[swiz_idx
[i
]]; break;
1819 case GLSL_TYPE_BOOL
: data
.b
[i
] = v
->value
.b
[swiz_idx
[i
]]; break;
1820 case GLSL_TYPE_DOUBLE
:data
.d
[i
] = v
->value
.d
[swiz_idx
[i
]]; break;
1821 default: assert(!"Should not get here."); break;
1825 void *ctx
= ralloc_parent(this);
1826 return new(ctx
) ir_constant(this->type
, &data
);
1833 ir_dereference_variable::constant_expression_value(struct hash_table
*variable_context
)
1835 /* This may occur during compile and var->type is glsl_type::error_type */
1839 /* Give priority to the context hashtable, if it exists */
1840 if (variable_context
) {
1841 ir_constant
*value
= (ir_constant
*)hash_table_find(variable_context
, var
);
1846 /* The constant_value of a uniform variable is its initializer,
1847 * not the lifetime constant value of the uniform.
1849 if (var
->data
.mode
== ir_var_uniform
)
1852 if (!var
->constant_value
)
1855 return var
->constant_value
->clone(ralloc_parent(var
), NULL
);
1860 ir_dereference_array::constant_expression_value(struct hash_table
*variable_context
)
1862 ir_constant
*array
= this->array
->constant_expression_value(variable_context
);
1863 ir_constant
*idx
= this->array_index
->constant_expression_value(variable_context
);
1865 if ((array
!= NULL
) && (idx
!= NULL
)) {
1866 void *ctx
= ralloc_parent(this);
1867 if (array
->type
->is_matrix()) {
1868 /* Array access of a matrix results in a vector.
1870 const unsigned column
= idx
->value
.u
[0];
1872 const glsl_type
*const column_type
= array
->type
->column_type();
1874 /* Offset in the constant matrix to the first element of the column
1877 const unsigned mat_idx
= column
* column_type
->vector_elements
;
1879 ir_constant_data data
= { { 0 } };
1881 switch (column_type
->base_type
) {
1882 case GLSL_TYPE_UINT
:
1884 for (unsigned i
= 0; i
< column_type
->vector_elements
; i
++)
1885 data
.u
[i
] = array
->value
.u
[mat_idx
+ i
];
1889 case GLSL_TYPE_FLOAT
:
1890 for (unsigned i
= 0; i
< column_type
->vector_elements
; i
++)
1891 data
.f
[i
] = array
->value
.f
[mat_idx
+ i
];
1895 case GLSL_TYPE_DOUBLE
:
1896 for (unsigned i
= 0; i
< column_type
->vector_elements
; i
++)
1897 data
.d
[i
] = array
->value
.d
[mat_idx
+ i
];
1902 assert(!"Should not get here.");
1906 return new(ctx
) ir_constant(column_type
, &data
);
1907 } else if (array
->type
->is_vector()) {
1908 const unsigned component
= idx
->value
.u
[0];
1910 return new(ctx
) ir_constant(array
, component
);
1912 const unsigned index
= idx
->value
.u
[0];
1913 return array
->get_array_element(index
)->clone(ctx
, NULL
);
1921 ir_dereference_record::constant_expression_value(struct hash_table
*)
1923 ir_constant
*v
= this->record
->constant_expression_value();
1925 return (v
!= NULL
) ? v
->get_record_field(this->field
) : NULL
;
1930 ir_assignment::constant_expression_value(struct hash_table
*)
1932 /* FINISHME: Handle CEs involving assignment (return RHS) */
1938 ir_constant::constant_expression_value(struct hash_table
*)
1945 ir_call::constant_expression_value(struct hash_table
*variable_context
)
1947 return this->callee
->constant_expression_value(&this->actual_parameters
, variable_context
);
1951 bool ir_function_signature::constant_expression_evaluate_expression_list(const struct exec_list
&body
,
1952 struct hash_table
*variable_context
,
1953 ir_constant
**result
)
1955 foreach_in_list(ir_instruction
, inst
, &body
) {
1956 switch(inst
->ir_type
) {
1958 /* (declare () type symbol) */
1959 case ir_type_variable
: {
1960 ir_variable
*var
= inst
->as_variable();
1961 hash_table_insert(variable_context
, ir_constant::zero(this, var
->type
), var
);
1965 /* (assign [condition] (write-mask) (ref) (value)) */
1966 case ir_type_assignment
: {
1967 ir_assignment
*asg
= inst
->as_assignment();
1968 if (asg
->condition
) {
1969 ir_constant
*cond
= asg
->condition
->constant_expression_value(variable_context
);
1972 if (!cond
->get_bool_component(0))
1976 ir_constant
*store
= NULL
;
1979 if (!constant_referenced(asg
->lhs
, variable_context
, store
, offset
))
1982 ir_constant
*value
= asg
->rhs
->constant_expression_value(variable_context
);
1987 store
->copy_masked_offset(value
, offset
, asg
->write_mask
);
1991 /* (return (expression)) */
1992 case ir_type_return
:
1994 *result
= inst
->as_return()->value
->constant_expression_value(variable_context
);
1995 return *result
!= NULL
;
1997 /* (call name (ref) (params))*/
1998 case ir_type_call
: {
1999 ir_call
*call
= inst
->as_call();
2001 /* Just say no to void functions in constant expressions. We
2002 * don't need them at that point.
2005 if (!call
->return_deref
)
2008 ir_constant
*store
= NULL
;
2011 if (!constant_referenced(call
->return_deref
, variable_context
,
2015 ir_constant
*value
= call
->constant_expression_value(variable_context
);
2020 store
->copy_offset(value
, offset
);
2024 /* (if condition (then-instructions) (else-instructions)) */
2026 ir_if
*iif
= inst
->as_if();
2028 ir_constant
*cond
= iif
->condition
->constant_expression_value(variable_context
);
2029 if (!cond
|| !cond
->type
->is_boolean())
2032 exec_list
&branch
= cond
->get_bool_component(0) ? iif
->then_instructions
: iif
->else_instructions
;
2035 if (!constant_expression_evaluate_expression_list(branch
, variable_context
, result
))
2038 /* If there was a return in the branch chosen, drop out now. */
2045 /* Every other expression type, we drop out. */
2051 /* Reaching the end of the block is not an error condition */
2059 ir_function_signature::constant_expression_value(exec_list
*actual_parameters
, struct hash_table
*variable_context
)
2061 const glsl_type
*type
= this->return_type
;
2062 if (type
== glsl_type::void_type
)
2065 /* From the GLSL 1.20 spec, page 23:
2066 * "Function calls to user-defined functions (non-built-in functions)
2067 * cannot be used to form constant expressions."
2069 if (!this->is_builtin())
2073 * Of the builtin functions, only the texture lookups and the noise
2074 * ones must not be used in constant expressions. They all include
2075 * specific opcodes so they don't need to be special-cased at this
2079 /* Initialize the table of dereferencable names with the function
2080 * parameters. Verify their const-ness on the way.
2082 * We expect the correctness of the number of parameters to have
2083 * been checked earlier.
2085 hash_table
*deref_hash
= hash_table_ctor(8, hash_table_pointer_hash
,
2086 hash_table_pointer_compare
);
2088 /* If "origin" is non-NULL, then the function body is there. So we
2089 * have to use the variable objects from the object with the body,
2090 * but the parameter instanciation on the current object.
2092 const exec_node
*parameter_info
= origin
? origin
->parameters
.head
: parameters
.head
;
2094 foreach_in_list(ir_rvalue
, n
, actual_parameters
) {
2095 ir_constant
*constant
= n
->constant_expression_value(variable_context
);
2096 if (constant
== NULL
) {
2097 hash_table_dtor(deref_hash
);
2102 ir_variable
*var
= (ir_variable
*)parameter_info
;
2103 hash_table_insert(deref_hash
, constant
, var
);
2105 parameter_info
= parameter_info
->next
;
2108 ir_constant
*result
= NULL
;
2110 /* Now run the builtin function until something non-constant
2111 * happens or we get the result.
2113 if (constant_expression_evaluate_expression_list(origin
? origin
->body
: body
, deref_hash
, &result
) && result
)
2114 result
= result
->clone(ralloc_parent(this), NULL
);
2116 hash_table_dtor(deref_hash
);