src/compiler/glsl/ir.cpp

   1 /*
   2  * Copyright © 2010 Intel Corporation
   3  *
   4  * Permission is hereby granted, free of charge, to any person obtaining a
   5  * copy of this software and associated documentation files (the "Software"),
   6  * to deal in the Software without restriction, including without limitation
   7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
   8  * and/or sell copies of the Software, and to permit persons to whom the
   9  * Software is furnished to do so, subject to the following conditions:
  10  *
  11  * The above copyright notice and this permission notice (including the next
  12  * paragraph) shall be included in all copies or substantial portions of the
  13  * Software.
  14  *
  15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  21  * DEALINGS IN THE SOFTWARE.
  22  */
  23 #include <string.h>
  24 #include "ir.h"
  25 #include "util/half_float.h"
  26 #include "compiler/glsl_types.h"
  27 #include "glsl_parser_extras.h"
  28
  29
  30 ir_rvalue::ir_rvalue(enum ir_node_type t)
  31    : ir_instruction(t)
  32 {
  33    this->type = glsl_type::error_type;
  34 }
  35
  36 bool ir_rvalue::is_zero() const
  37 {
  38    return false;
  39 }
  40
  41 bool ir_rvalue::is_one() const
  42 {
  43    return false;
  44 }
  45
  46 bool ir_rvalue::is_negative_one() const
  47 {
  48    return false;
  49 }
  50
  51 /**
  52  * Modify the swizzle make to move one component to another
  53  *
  54  * \param m    IR swizzle to be modified
  55  * \param from Component in the RHS that is to be swizzled
  56  * \param to   Desired swizzle location of \c from
  57  */
  58 static void
  59 update_rhs_swizzle(ir_swizzle_mask &m, unsigned from, unsigned to)
  60 {
  61    switch (to) {
  62    case 0: m.x = from; break;
  63    case 1: m.y = from; break;
  64    case 2: m.z = from; break;
  65    case 3: m.w = from; break;
  66    default: assert(!"Should not get here.");
  67    }
  68 }
  69
  70 void
  71 ir_assignment::set_lhs(ir_rvalue *lhs)
  72 {
  73    void *mem_ctx = this;
  74    bool swizzled = false;
  75
  76    while (lhs != NULL) {
  77       ir_swizzle *swiz = lhs->as_swizzle();
  78
  79       if (swiz == NULL)
  80          break;
  81
  82       unsigned write_mask = 0;
  83       ir_swizzle_mask rhs_swiz = { 0, 0, 0, 0, 0, 0 };
  84
  85       for (unsigned i = 0; i < swiz->mask.num_components; i++) {
  86          unsigned c = 0;
  87
  88          switch (i) {
  89          case 0: c = swiz->mask.x; break;
  90          case 1: c = swiz->mask.y; break;
  91          case 2: c = swiz->mask.z; break;
  92          case 3: c = swiz->mask.w; break;
  93          default: assert(!"Should not get here.");
  94          }
  95
  96          write_mask |= (((this->write_mask >> i) & 1) << c);
  97          update_rhs_swizzle(rhs_swiz, i, c);
  98          rhs_swiz.num_components = swiz->val->type->vector_elements;
  99       }
 100
 101       this->write_mask = write_mask;
 102       lhs = swiz->val;
 103
 104       this->rhs = new(mem_ctx) ir_swizzle(this->rhs, rhs_swiz);
 105       swizzled = true;
 106    }
 107
 108    if (swizzled) {
 109       /* Now, RHS channels line up with the LHS writemask.  Collapse it
 110        * to just the channels that will be written.
 111        */
 112       ir_swizzle_mask rhs_swiz = { 0, 0, 0, 0, 0, 0 };
 113       int rhs_chan = 0;
 114       for (int i = 0; i < 4; i++) {
 115          if (write_mask & (1 << i))
 116             update_rhs_swizzle(rhs_swiz, i, rhs_chan++);
 117       }
 118       rhs_swiz.num_components = rhs_chan;
 119       this->rhs = new(mem_ctx) ir_swizzle(this->rhs, rhs_swiz);
 120    }
 121
 122    assert((lhs == NULL) || lhs->as_dereference());
 123
 124    this->lhs = (ir_dereference *) lhs;
 125 }
 126
 127 ir_variable *
 128 ir_assignment::whole_variable_written()
 129 {
 130    ir_variable *v = this->lhs->whole_variable_referenced();
 131
 132    if (v == NULL)
 133       return NULL;
 134
 135    if (v->type->is_scalar())
 136       return v;
 137
 138    if (v->type->is_vector()) {
 139       const unsigned mask = (1U << v->type->vector_elements) - 1;
 140
 141       if (mask != this->write_mask)
 142          return NULL;
 143    }
 144
 145    /* Either all the vector components are assigned or the variable is some
 146     * composite type (and the whole thing is assigned.
 147     */
 148    return v;
 149 }
 150
 151 ir_assignment::ir_assignment(ir_dereference *lhs, ir_rvalue *rhs,
 152                              ir_rvalue *condition, unsigned write_mask)
 153    : ir_instruction(ir_type_assignment)
 154 {
 155    this->condition = condition;
 156    this->rhs = rhs;
 157    this->lhs = lhs;
 158    this->write_mask = write_mask;
 159
 160    if (lhs->type->is_scalar() || lhs->type->is_vector()) {
 161       int lhs_components = 0;
 162       for (int i = 0; i < 4; i++) {
 163          if (write_mask & (1 << i))
 164             lhs_components++;
 165       }
 166
 167       assert(lhs_components == this->rhs->type->vector_elements);
 168    }
 169 }
 170
 171 ir_assignment::ir_assignment(ir_rvalue *lhs, ir_rvalue *rhs,
 172                              ir_rvalue *condition)
 173    : ir_instruction(ir_type_assignment)
 174 {
 175    this->condition = condition;
 176    this->rhs = rhs;
 177
 178    /* If the RHS is a vector type, assume that all components of the vector
 179     * type are being written to the LHS.  The write mask comes from the RHS
 180     * because we can have a case where the LHS is a vec4 and the RHS is a
 181     * vec3.  In that case, the assignment is:
 182     *
 183     *     (assign (...) (xyz) (var_ref lhs) (var_ref rhs))
 184     */
 185    if (rhs->type->is_vector())
 186       this->write_mask = (1U << rhs->type->vector_elements) - 1;
 187    else if (rhs->type->is_scalar())
 188       this->write_mask = 1;
 189    else
 190       this->write_mask = 0;
 191
 192    this->set_lhs(lhs);
 193 }
 194
 195 ir_expression::ir_expression(int op, const struct glsl_type *type,
 196                              ir_rvalue *op0, ir_rvalue *op1,
 197                              ir_rvalue *op2, ir_rvalue *op3)
 198    : ir_rvalue(ir_type_expression)
 199 {
 200    this->type = type;
 201    this->operation = ir_expression_operation(op);
 202    this->operands[0] = op0;
 203    this->operands[1] = op1;
 204    this->operands[2] = op2;
 205    this->operands[3] = op3;
 206    init_num_operands();
 207
 208 #ifndef NDEBUG
 209    for (unsigned i = num_operands; i < 4; i++) {
 210       assert(this->operands[i] == NULL);
 211    }
 212
 213    for (unsigned i = 0; i < num_operands; i++) {
 214       assert(this->operands[i] != NULL);
 215    }
 216 #endif
 217 }
 218
 219 ir_expression::ir_expression(int op, ir_rvalue *op0)
 220    : ir_rvalue(ir_type_expression)
 221 {
 222    this->operation = ir_expression_operation(op);
 223    this->operands[0] = op0;
 224    this->operands[1] = NULL;
 225    this->operands[2] = NULL;
 226    this->operands[3] = NULL;
 227
 228    assert(op <= ir_last_unop);
 229    init_num_operands();
 230    assert(num_operands == 1);
 231    assert(this->operands[0]);
 232
 233    switch (this->operation) {
 234    case ir_unop_bit_not:
 235    case ir_unop_logic_not:
 236    case ir_unop_neg:
 237    case ir_unop_abs:
 238    case ir_unop_sign:
 239    case ir_unop_rcp:
 240    case ir_unop_rsq:
 241    case ir_unop_sqrt:
 242    case ir_unop_exp:
 243    case ir_unop_log:
 244    case ir_unop_exp2:
 245    case ir_unop_log2:
 246    case ir_unop_trunc:
 247    case ir_unop_ceil:
 248    case ir_unop_floor:
 249    case ir_unop_fract:
 250    case ir_unop_round_even:
 251    case ir_unop_sin:
 252    case ir_unop_cos:
 253    case ir_unop_dFdx:
 254    case ir_unop_dFdx_coarse:
 255    case ir_unop_dFdx_fine:
 256    case ir_unop_dFdy:
 257    case ir_unop_dFdy_coarse:
 258    case ir_unop_dFdy_fine:
 259    case ir_unop_bitfield_reverse:
 260    case ir_unop_interpolate_at_centroid:
 261    case ir_unop_clz:
 262    case ir_unop_saturate:
 263    case ir_unop_atan:
 264       this->type = op0->type;
 265       break;
 266
 267    case ir_unop_f2i:
 268    case ir_unop_b2i:
 269    case ir_unop_u2i:
 270    case ir_unop_d2i:
 271    case ir_unop_bitcast_f2i:
 272    case ir_unop_bit_count:
 273    case ir_unop_find_msb:
 274    case ir_unop_find_lsb:
 275    case ir_unop_subroutine_to_int:
 276    case ir_unop_i642i:
 277    case ir_unop_u642i:
 278       this->type = glsl_type::get_instance(GLSL_TYPE_INT,
 279                                            op0->type->vector_elements, 1);
 280       break;
 281
 282    case ir_unop_b2f:
 283    case ir_unop_i2f:
 284    case ir_unop_u2f:
 285    case ir_unop_d2f:
 286    case ir_unop_f162f:
 287    case ir_unop_bitcast_i2f:
 288    case ir_unop_bitcast_u2f:
 289    case ir_unop_i642f:
 290    case ir_unop_u642f:
 291       this->type = glsl_type::get_instance(GLSL_TYPE_FLOAT,
 292                                            op0->type->vector_elements, 1);
 293       break;
 294
 295    case ir_unop_f2f16:
 296    case ir_unop_f2fmp:
 297    case ir_unop_b2f16:
 298       this->type = glsl_type::get_instance(GLSL_TYPE_FLOAT16,
 299                                            op0->type->vector_elements, 1);
 300       break;
 301
 302    case ir_unop_i2imp:
 303       this->type = glsl_type::get_instance(GLSL_TYPE_INT16,
 304                                            op0->type->vector_elements, 1);
 305       break;
 306
 307    case ir_unop_i2i:
 308       if (op0->type->base_type == GLSL_TYPE_INT) {
 309          this->type = glsl_type::get_instance(GLSL_TYPE_INT16,
 310                                               op0->type->vector_elements, 1);
 311       } else {
 312          assert(op0->type->base_type == GLSL_TYPE_INT16);
 313          this->type = glsl_type::get_instance(GLSL_TYPE_INT,
 314                                               op0->type->vector_elements, 1);
 315       }
 316       break;
 317
 318    case ir_unop_u2u:
 319       if (op0->type->base_type == GLSL_TYPE_UINT) {
 320          this->type = glsl_type::get_instance(GLSL_TYPE_UINT16,
 321                                               op0->type->vector_elements, 1);
 322       } else {
 323          assert(op0->type->base_type == GLSL_TYPE_UINT16);
 324          this->type = glsl_type::get_instance(GLSL_TYPE_UINT,
 325                                               op0->type->vector_elements, 1);
 326       }
 327       break;
 328
 329    case ir_unop_u2ump:
 330       this->type = glsl_type::get_instance(GLSL_TYPE_UINT16,
 331                                            op0->type->vector_elements, 1);
 332       break;
 333
 334    case ir_unop_f2b:
 335    case ir_unop_i2b:
 336    case ir_unop_d2b:
 337    case ir_unop_f162b:
 338    case ir_unop_i642b:
 339       this->type = glsl_type::get_instance(GLSL_TYPE_BOOL,
 340                                            op0->type->vector_elements, 1);
 341       break;
 342
 343    case ir_unop_f2d:
 344    case ir_unop_i2d:
 345    case ir_unop_u2d:
 346    case ir_unop_i642d:
 347    case ir_unop_u642d:
 348       this->type = glsl_type::get_instance(GLSL_TYPE_DOUBLE,
 349                                            op0->type->vector_elements, 1);
 350       break;
 351
 352    case ir_unop_i2u:
 353    case ir_unop_f2u:
 354    case ir_unop_d2u:
 355    case ir_unop_bitcast_f2u:
 356    case ir_unop_i642u:
 357    case ir_unop_u642u:
 358       this->type = glsl_type::get_instance(GLSL_TYPE_UINT,
 359                                            op0->type->vector_elements, 1);
 360       break;
 361
 362    case ir_unop_i2i64:
 363    case ir_unop_u2i64:
 364    case ir_unop_b2i64:
 365    case ir_unop_f2i64:
 366    case ir_unop_d2i64:
 367    case ir_unop_u642i64:
 368       this->type = glsl_type::get_instance(GLSL_TYPE_INT64,
 369                                            op0->type->vector_elements, 1);
 370       break;
 371
 372    case ir_unop_i2u64:
 373    case ir_unop_u2u64:
 374    case ir_unop_f2u64:
 375    case ir_unop_d2u64:
 376    case ir_unop_i642u64:
 377       this->type = glsl_type::get_instance(GLSL_TYPE_UINT64,
 378                                            op0->type->vector_elements, 1);
 379       break;
 380
 381    case ir_unop_unpack_double_2x32:
 382    case ir_unop_unpack_uint_2x32:
 383       this->type = glsl_type::uvec2_type;
 384       break;
 385
 386    case ir_unop_unpack_int_2x32:
 387       this->type = glsl_type::ivec2_type;
 388       break;
 389
 390    case ir_unop_pack_snorm_2x16:
 391    case ir_unop_pack_snorm_4x8:
 392    case ir_unop_pack_unorm_2x16:
 393    case ir_unop_pack_unorm_4x8:
 394    case ir_unop_pack_half_2x16:
 395       this->type = glsl_type::uint_type;
 396       break;
 397
 398    case ir_unop_pack_double_2x32:
 399       this->type = glsl_type::double_type;
 400       break;
 401
 402    case ir_unop_pack_int_2x32:
 403       this->type = glsl_type::int64_t_type;
 404       break;
 405
 406    case ir_unop_pack_uint_2x32:
 407       this->type = glsl_type::uint64_t_type;
 408       break;
 409
 410    case ir_unop_unpack_snorm_2x16:
 411    case ir_unop_unpack_unorm_2x16:
 412    case ir_unop_unpack_half_2x16:
 413       this->type = glsl_type::vec2_type;
 414       break;
 415
 416    case ir_unop_unpack_snorm_4x8:
 417    case ir_unop_unpack_unorm_4x8:
 418       this->type = glsl_type::vec4_type;
 419       break;
 420
 421    case ir_unop_unpack_sampler_2x32:
 422    case ir_unop_unpack_image_2x32:
 423       this->type = glsl_type::uvec2_type;
 424       break;
 425
 426    case ir_unop_pack_sampler_2x32:
 427    case ir_unop_pack_image_2x32:
 428       this->type = op0->type;
 429       break;
 430
 431    case ir_unop_frexp_sig:
 432       this->type = op0->type;
 433       break;
 434    case ir_unop_frexp_exp:
 435       this->type = glsl_type::get_instance(GLSL_TYPE_INT,
 436                                            op0->type->vector_elements, 1);
 437       break;
 438
 439    case ir_unop_get_buffer_size:
 440    case ir_unop_ssbo_unsized_array_length:
 441       this->type = glsl_type::int_type;
 442       break;
 443
 444    case ir_unop_bitcast_i642d:
 445    case ir_unop_bitcast_u642d:
 446       this->type = glsl_type::get_instance(GLSL_TYPE_DOUBLE,
 447                                            op0->type->vector_elements, 1);
 448       break;
 449
 450    case ir_unop_bitcast_d2i64:
 451       this->type = glsl_type::get_instance(GLSL_TYPE_INT64,
 452                                            op0->type->vector_elements, 1);
 453       break;
 454    case ir_unop_bitcast_d2u64:
 455       this->type = glsl_type::get_instance(GLSL_TYPE_UINT64,
 456                                            op0->type->vector_elements, 1);
 457       break;
 458
 459    default:
 460       assert(!"not reached: missing automatic type setup for ir_expression");
 461       this->type = op0->type;
 462       break;
 463    }
 464 }
 465
 466 ir_expression::ir_expression(int op, ir_rvalue *op0, ir_rvalue *op1)
 467    : ir_rvalue(ir_type_expression)
 468 {
 469    this->operation = ir_expression_operation(op);
 470    this->operands[0] = op0;
 471    this->operands[1] = op1;
 472    this->operands[2] = NULL;
 473    this->operands[3] = NULL;
 474
 475    assert(op > ir_last_unop);
 476    init_num_operands();
 477    assert(num_operands == 2);
 478    for (unsigned i = 0; i < num_operands; i++) {
 479       assert(this->operands[i] != NULL);
 480    }
 481
 482    switch (this->operation) {
 483    case ir_binop_all_equal:
 484    case ir_binop_any_nequal:
 485       this->type = glsl_type::bool_type;
 486       break;
 487
 488    case ir_binop_add:
 489    case ir_binop_sub:
 490    case ir_binop_min:
 491    case ir_binop_max:
 492    case ir_binop_pow:
 493    case ir_binop_mul:
 494    case ir_binop_div:
 495    case ir_binop_mod:
 496    case ir_binop_atan2:
 497       if (op0->type->is_scalar()) {
 498          this->type = op1->type;
 499       } else if (op1->type->is_scalar()) {
 500          this->type = op0->type;
 501       } else {
 502          if (this->operation == ir_binop_mul) {
 503             this->type = glsl_type::get_mul_type(op0->type, op1->type);
 504          } else {
 505             assert(op0->type == op1->type);
 506             this->type = op0->type;
 507          }
 508       }
 509       break;
 510
 511    case ir_binop_logic_and:
 512    case ir_binop_logic_xor:
 513    case ir_binop_logic_or:
 514    case ir_binop_bit_and:
 515    case ir_binop_bit_xor:
 516    case ir_binop_bit_or:
 517        assert(!op0->type->is_matrix());
 518        assert(!op1->type->is_matrix());
 519       if (op0->type->is_scalar()) {
 520          this->type = op1->type;
 521       } else if (op1->type->is_scalar()) {
 522          this->type = op0->type;
 523       } else {
 524           assert(op0->type->vector_elements == op1->type->vector_elements);
 525           this->type = op0->type;
 526       }
 527       break;
 528
 529    case ir_binop_equal:
 530    case ir_binop_nequal:
 531    case ir_binop_gequal:
 532    case ir_binop_less:
 533       assert(op0->type == op1->type);
 534       this->type = glsl_type::get_instance(GLSL_TYPE_BOOL,
 535                                            op0->type->vector_elements, 1);
 536       break;
 537
 538    case ir_binop_dot:
 539       this->type = op0->type->get_base_type();
 540       break;
 541
 542    case ir_binop_imul_high:
 543    case ir_binop_mul_32x16:
 544    case ir_binop_carry:
 545    case ir_binop_borrow:
 546    case ir_binop_lshift:
 547    case ir_binop_rshift:
 548    case ir_binop_ldexp:
 549    case ir_binop_interpolate_at_offset:
 550    case ir_binop_interpolate_at_sample:
 551       this->type = op0->type;
 552       break;
 553
 554    case ir_binop_add_sat:
 555    case ir_binop_sub_sat:
 556    case ir_binop_avg:
 557    case ir_binop_avg_round:
 558       assert(op0->type == op1->type);
 559       this->type = op0->type;
 560       break;
 561
 562    case ir_binop_abs_sub: {
 563       enum glsl_base_type base;
 564
 565       assert(op0->type == op1->type);
 566
 567       switch (op0->type->base_type) {
 568       case GLSL_TYPE_UINT:
 569       case GLSL_TYPE_INT:
 570          base = GLSL_TYPE_UINT;
 571          break;
 572       case GLSL_TYPE_UINT8:
 573       case GLSL_TYPE_INT8:
 574          base = GLSL_TYPE_UINT8;
 575          break;
 576       case GLSL_TYPE_UINT16:
 577       case GLSL_TYPE_INT16:
 578          base = GLSL_TYPE_UINT16;
 579          break;
 580       case GLSL_TYPE_UINT64:
 581       case GLSL_TYPE_INT64:
 582          base = GLSL_TYPE_UINT64;
 583          break;
 584       default:
 585          unreachable(!"Invalid base type.");
 586       }
 587
 588       this->type = glsl_type::get_instance(base, op0->type->vector_elements, 1);
 589       break;
 590    }
 591
 592    case ir_binop_vector_extract:
 593       this->type = op0->type->get_scalar_type();
 594       break;
 595
 596    default:
 597       assert(!"not reached: missing automatic type setup for ir_expression");
 598       this->type = glsl_type::float_type;
 599    }
 600 }
 601
 602 ir_expression::ir_expression(int op, ir_rvalue *op0, ir_rvalue *op1,
 603                              ir_rvalue *op2)
 604    : ir_rvalue(ir_type_expression)
 605 {
 606    this->operation = ir_expression_operation(op);
 607    this->operands[0] = op0;
 608    this->operands[1] = op1;
 609    this->operands[2] = op2;
 610    this->operands[3] = NULL;
 611
 612    assert(op > ir_last_binop && op <= ir_last_triop);
 613    init_num_operands();
 614    assert(num_operands == 3);
 615    for (unsigned i = 0; i < num_operands; i++) {
 616       assert(this->operands[i] != NULL);
 617    }
 618
 619    switch (this->operation) {
 620    case ir_triop_fma:
 621    case ir_triop_lrp:
 622    case ir_triop_bitfield_extract:
 623    case ir_triop_vector_insert:
 624       this->type = op0->type;
 625       break;
 626
 627    case ir_triop_csel:
 628       this->type = op1->type;
 629       break;
 630
 631    default:
 632       assert(!"not reached: missing automatic type setup for ir_expression");
 633       this->type = glsl_type::float_type;
 634    }
 635 }
 636
 637 /**
 638  * This is only here for ir_reader to used for testing purposes. Please use
 639  * the precomputed num_operands field if you need the number of operands.
 640  */
 641 unsigned
 642 ir_expression::get_num_operands(ir_expression_operation op)
 643 {
 644    assert(op <= ir_last_opcode);
 645
 646    if (op <= ir_last_unop)
 647       return 1;
 648
 649    if (op <= ir_last_binop)
 650       return 2;
 651
 652    if (op <= ir_last_triop)
 653       return 3;
 654
 655    if (op <= ir_last_quadop)
 656       return 4;
 657
 658    unreachable("Could not calculate number of operands");
 659 }
 660
 661 #include "ir_expression_operation_strings.h"
 662
 663 const char*
 664 depth_layout_string(ir_depth_layout layout)
 665 {
 666    switch(layout) {
 667    case ir_depth_layout_none:      return "";
 668    case ir_depth_layout_any:       return "depth_any";
 669    case ir_depth_layout_greater:   return "depth_greater";
 670    case ir_depth_layout_less:      return "depth_less";
 671    case ir_depth_layout_unchanged: return "depth_unchanged";
 672
 673    default:
 674       assert(0);
 675       return "";
 676    }
 677 }
 678
 679 ir_expression_operation
 680 ir_expression::get_operator(const char *str)
 681 {
 682    for (int op = 0; op <= int(ir_last_opcode); op++) {
 683       if (strcmp(str, ir_expression_operation_strings[op]) == 0)
 684          return (ir_expression_operation) op;
 685    }
 686    return (ir_expression_operation) -1;
 687 }
 688
 689 ir_variable *
 690 ir_expression::variable_referenced() const
 691 {
 692    switch (operation) {
 693       case ir_binop_vector_extract:
 694       case ir_triop_vector_insert:
 695          /* We get these for things like a[0] where a is a vector type. In these
 696           * cases we want variable_referenced() to return the actual vector
 697           * variable this is wrapping.
 698           */
 699          return operands[0]->variable_referenced();
 700       default:
 701          return ir_rvalue::variable_referenced();
 702    }
 703 }
 704
 705 ir_constant::ir_constant()
 706    : ir_rvalue(ir_type_constant)
 707 {
 708    this->const_elements = NULL;
 709 }
 710
 711 ir_constant::ir_constant(const struct glsl_type *type,
 712                          const ir_constant_data *data)
 713    : ir_rvalue(ir_type_constant)
 714 {
 715    this->const_elements = NULL;
 716
 717    assert((type->base_type >= GLSL_TYPE_UINT)
 718           && (type->base_type <= GLSL_TYPE_IMAGE));
 719
 720    this->type = type;
 721    memcpy(& this->value, data, sizeof(this->value));
 722 }
 723
 724 ir_constant::ir_constant(float16_t f16, unsigned vector_elements)
 725    : ir_rvalue(ir_type_constant)
 726 {
 727    assert(vector_elements <= 4);
 728    this->type = glsl_type::get_instance(GLSL_TYPE_FLOAT16, vector_elements, 1);
 729    for (unsigned i = 0; i < vector_elements; i++) {
 730       this->value.f16[i] = f16.bits;
 731    }
 732    for (unsigned i = vector_elements; i < 16; i++)  {
 733       this->value.f[i] = 0;
 734    }
 735 }
 736
 737 ir_constant::ir_constant(float f, unsigned vector_elements)
 738    : ir_rvalue(ir_type_constant)
 739 {
 740    assert(vector_elements <= 4);
 741    this->type = glsl_type::get_instance(GLSL_TYPE_FLOAT, vector_elements, 1);
 742    for (unsigned i = 0; i < vector_elements; i++) {
 743       this->value.f[i] = f;
 744    }
 745    for (unsigned i = vector_elements; i < 16; i++)  {
 746       this->value.f[i] = 0;
 747    }
 748 }
 749
 750 ir_constant::ir_constant(double d, unsigned vector_elements)
 751    : ir_rvalue(ir_type_constant)
 752 {
 753    assert(vector_elements <= 4);
 754    this->type = glsl_type::get_instance(GLSL_TYPE_DOUBLE, vector_elements, 1);
 755    for (unsigned i = 0; i < vector_elements; i++) {
 756       this->value.d[i] = d;
 757    }
 758    for (unsigned i = vector_elements; i < 16; i++)  {
 759       this->value.d[i] = 0.0;
 760    }
 761 }
 762
 763 ir_constant::ir_constant(int16_t i16, unsigned vector_elements)
 764    : ir_rvalue(ir_type_constant)
 765 {
 766    assert(vector_elements <= 4);
 767    this->type = glsl_type::get_instance(GLSL_TYPE_INT16, vector_elements, 1);
 768    for (unsigned i = 0; i < vector_elements; i++) {
 769       this->value.i16[i] = i16;
 770    }
 771    for (unsigned i = vector_elements; i < 16; i++) {
 772       this->value.i16[i] = 0;
 773    }
 774 }
 775
 776 ir_constant::ir_constant(uint16_t u16, unsigned vector_elements)
 777    : ir_rvalue(ir_type_constant)
 778 {
 779    assert(vector_elements <= 4);
 780    this->type = glsl_type::get_instance(GLSL_TYPE_UINT16, vector_elements, 1);
 781    for (unsigned i = 0; i < vector_elements; i++) {
 782       this->value.u16[i] = u16;
 783    }
 784    for (unsigned i = vector_elements; i < 16; i++) {
 785       this->value.u16[i] = 0;
 786    }
 787 }
 788
 789 ir_constant::ir_constant(unsigned int u, unsigned vector_elements)
 790    : ir_rvalue(ir_type_constant)
 791 {
 792    assert(vector_elements <= 4);
 793    this->type = glsl_type::get_instance(GLSL_TYPE_UINT, vector_elements, 1);
 794    for (unsigned i = 0; i < vector_elements; i++) {
 795       this->value.u[i] = u;
 796    }
 797    for (unsigned i = vector_elements; i < 16; i++) {
 798       this->value.u[i] = 0;
 799    }
 800 }
 801
 802 ir_constant::ir_constant(int integer, unsigned vector_elements)
 803    : ir_rvalue(ir_type_constant)
 804 {
 805    assert(vector_elements <= 4);
 806    this->type = glsl_type::get_instance(GLSL_TYPE_INT, vector_elements, 1);
 807    for (unsigned i = 0; i < vector_elements; i++) {
 808       this->value.i[i] = integer;
 809    }
 810    for (unsigned i = vector_elements; i < 16; i++) {
 811       this->value.i[i] = 0;
 812    }
 813 }
 814
 815 ir_constant::ir_constant(uint64_t u64, unsigned vector_elements)
 816    : ir_rvalue(ir_type_constant)
 817 {
 818    assert(vector_elements <= 4);
 819    this->type = glsl_type::get_instance(GLSL_TYPE_UINT64, vector_elements, 1);
 820    for (unsigned i = 0; i < vector_elements; i++) {
 821       this->value.u64[i] = u64;
 822    }
 823    for (unsigned i = vector_elements; i < 16; i++) {
 824       this->value.u64[i] = 0;
 825    }
 826 }
 827
 828 ir_constant::ir_constant(int64_t int64, unsigned vector_elements)
 829    : ir_rvalue(ir_type_constant)
 830 {
 831    assert(vector_elements <= 4);
 832    this->type = glsl_type::get_instance(GLSL_TYPE_INT64, vector_elements, 1);
 833    for (unsigned i = 0; i < vector_elements; i++) {
 834       this->value.i64[i] = int64;
 835    }
 836    for (unsigned i = vector_elements; i < 16; i++) {
 837       this->value.i64[i] = 0;
 838    }
 839 }
 840
 841 ir_constant::ir_constant(bool b, unsigned vector_elements)
 842    : ir_rvalue(ir_type_constant)
 843 {
 844    assert(vector_elements <= 4);
 845    this->type = glsl_type::get_instance(GLSL_TYPE_BOOL, vector_elements, 1);
 846    for (unsigned i = 0; i < vector_elements; i++) {
 847       this->value.b[i] = b;
 848    }
 849    for (unsigned i = vector_elements; i < 16; i++) {
 850       this->value.b[i] = false;
 851    }
 852 }
 853
 854 ir_constant::ir_constant(const ir_constant *c, unsigned i)
 855    : ir_rvalue(ir_type_constant)
 856 {
 857    this->const_elements = NULL;
 858    this->type = c->type->get_base_type();
 859
 860    switch (this->type->base_type) {
 861    case GLSL_TYPE_UINT16:  this->value.u16[0] = c->value.u16[i]; break;
 862    case GLSL_TYPE_INT16:  this->value.i16[0] = c->value.i16[i]; break;
 863    case GLSL_TYPE_UINT:  this->value.u[0] = c->value.u[i]; break;
 864    case GLSL_TYPE_INT:   this->value.i[0] = c->value.i[i]; break;
 865    case GLSL_TYPE_FLOAT: this->value.f[0] = c->value.f[i]; break;
 866    case GLSL_TYPE_FLOAT16: this->value.f16[0] = c->value.f16[i]; break;
 867    case GLSL_TYPE_BOOL:  this->value.b[0] = c->value.b[i]; break;
 868    case GLSL_TYPE_DOUBLE: this->value.d[0] = c->value.d[i]; break;
 869    default:              assert(!"Should not get here."); break;
 870    }
 871 }
 872
 873 ir_constant::ir_constant(const struct glsl_type *type, exec_list *value_list)
 874    : ir_rvalue(ir_type_constant)
 875 {
 876    this->const_elements = NULL;
 877    this->type = type;
 878
 879    assert(type->is_scalar() || type->is_vector() || type->is_matrix()
 880           || type->is_struct() || type->is_array());
 881
 882    /* If the constant is a record, the types of each of the entries in
 883     * value_list must be a 1-for-1 match with the structure components.  Each
 884     * entry must also be a constant.  Just move the nodes from the value_list
 885     * to the list in the ir_constant.
 886     */
 887    if (type->is_array() || type->is_struct()) {
 888       this->const_elements = ralloc_array(this, ir_constant *, type->length);
 889       unsigned i = 0;
 890       foreach_in_list(ir_constant, value, value_list) {
 891          assert(value->as_constant() != NULL);
 892
 893          this->const_elements[i++] = value;
 894       }
 895       return;
 896    }
 897
 898    for (unsigned i = 0; i < 16; i++) {
 899       this->value.u[i] = 0;
 900    }
 901
 902    ir_constant *value = (ir_constant *) (value_list->get_head_raw());
 903
 904    /* Constructors with exactly one scalar argument are special for vectors
 905     * and matrices.  For vectors, the scalar value is replicated to fill all
 906     * the components.  For matrices, the scalar fills the components of the
 907     * diagonal while the rest is filled with 0.
 908     */
 909    if (value->type->is_scalar() && value->next->is_tail_sentinel()) {
 910       if (type->is_matrix()) {
 911          /* Matrix - fill diagonal (rest is already set to 0) */
 912          for (unsigned i = 0; i < type->matrix_columns; i++) {
 913             switch (type->base_type) {
 914             case GLSL_TYPE_FLOAT:
 915                this->value.f[i * type->vector_elements + i] =
 916                   value->value.f[0];
 917                break;
 918             case GLSL_TYPE_DOUBLE:
 919                this->value.d[i * type->vector_elements + i] =
 920                   value->value.d[0];
 921                break;
 922             case GLSL_TYPE_FLOAT16:
 923                this->value.f16[i * type->vector_elements + i] =
 924                   value->value.f16[0];
 925                break;
 926             default:
 927                assert(!"unexpected matrix base type");
 928             }
 929          }
 930       } else {
 931          /* Vector or scalar - fill all components */
 932          switch (type->base_type) {
 933          case GLSL_TYPE_UINT16:
 934          case GLSL_TYPE_INT16:
 935             for (unsigned i = 0; i < type->components(); i++)
 936                this->value.u16[i] = value->value.u16[0];
 937             break;
 938          case GLSL_TYPE_UINT:
 939          case GLSL_TYPE_INT:
 940             for (unsigned i = 0; i < type->components(); i++)
 941                this->value.u[i] = value->value.u[0];
 942             break;
 943          case GLSL_TYPE_FLOAT:
 944             for (unsigned i = 0; i < type->components(); i++)
 945                this->value.f[i] = value->value.f[0];
 946             break;
 947          case GLSL_TYPE_FLOAT16:
 948             for (unsigned i = 0; i < type->components(); i++)
 949                this->value.f16[i] = value->value.f16[0];
 950             break;
 951          case GLSL_TYPE_DOUBLE:
 952             for (unsigned i = 0; i < type->components(); i++)
 953                this->value.d[i] = value->value.d[0];
 954             break;
 955          case GLSL_TYPE_UINT64:
 956          case GLSL_TYPE_INT64:
 957             for (unsigned i = 0; i < type->components(); i++)
 958                this->value.u64[i] = value->value.u64[0];
 959             break;
 960          case GLSL_TYPE_BOOL:
 961             for (unsigned i = 0; i < type->components(); i++)
 962                this->value.b[i] = value->value.b[0];
 963             break;
 964          case GLSL_TYPE_SAMPLER:
 965          case GLSL_TYPE_IMAGE:
 966             this->value.u64[0] = value->value.u64[0];
 967             break;
 968          default:
 969             assert(!"Should not get here.");
 970             break;
 971          }
 972       }
 973       return;
 974    }
 975
 976    if (type->is_matrix() && value->type->is_matrix()) {
 977       assert(value->next->is_tail_sentinel());
 978
 979       /* From section 5.4.2 of the GLSL 1.20 spec:
 980        * "If a matrix is constructed from a matrix, then each component
 981        *  (column i, row j) in the result that has a corresponding component
 982        *  (column i, row j) in the argument will be initialized from there."
 983        */
 984       unsigned cols = MIN2(type->matrix_columns, value->type->matrix_columns);
 985       unsigned rows = MIN2(type->vector_elements, value->type->vector_elements);
 986       for (unsigned i = 0; i < cols; i++) {
 987          for (unsigned j = 0; j < rows; j++) {
 988             const unsigned src = i * value->type->vector_elements + j;
 989             const unsigned dst = i * type->vector_elements + j;
 990             this->value.f[dst] = value->value.f[src];
 991          }
 992       }
 993
 994       /* "All other components will be initialized to the identity matrix." */
 995       for (unsigned i = cols; i < type->matrix_columns; i++)
 996          this->value.f[i * type->vector_elements + i] = 1.0;
 997
 998       return;
 999    }
1000
1001    /* Use each component from each entry in the value_list to initialize one
1002     * component of the constant being constructed.
1003     */
1004    unsigned i = 0;
1005    for (;;) {
1006       assert(value->as_constant() != NULL);
1007       assert(!value->is_tail_sentinel());
1008
1009       for (unsigned j = 0; j < value->type->components(); j++) {
1010          switch (type->base_type) {
1011          case GLSL_TYPE_UINT16:
1012             this->value.u16[i] = value->get_uint16_component(j);
1013             break;
1014          case GLSL_TYPE_INT16:
1015             this->value.i16[i] = value->get_int16_component(j);
1016             break;
1017          case GLSL_TYPE_UINT:
1018             this->value.u[i] = value->get_uint_component(j);
1019             break;
1020          case GLSL_TYPE_INT:
1021             this->value.i[i] = value->get_int_component(j);
1022             break;
1023          case GLSL_TYPE_FLOAT:
1024             this->value.f[i] = value->get_float_component(j);
1025             break;
1026          case GLSL_TYPE_FLOAT16:
1027             this->value.f16[i] = value->get_float16_component(j);
1028             break;
1029          case GLSL_TYPE_BOOL:
1030             this->value.b[i] = value->get_bool_component(j);
1031             break;
1032          case GLSL_TYPE_DOUBLE:
1033             this->value.d[i] = value->get_double_component(j);
1034             break;
1035          case GLSL_TYPE_UINT64:
1036             this->value.u64[i] = value->get_uint64_component(j);
1037             break;
1038          case GLSL_TYPE_INT64:
1039             this->value.i64[i] = value->get_int64_component(j);
1040             break;
1041          default:
1042             /* FINISHME: What to do?  Exceptions are not the answer.
1043              */
1044             break;
1045          }
1046
1047          i++;
1048          if (i >= type->components())
1049             break;
1050       }
1051
1052       if (i >= type->components())
1053          break; /* avoid downcasting a list sentinel */
1054       value = (ir_constant *) value->next;
1055    }
1056 }
1057
1058 ir_constant *
1059 ir_constant::zero(void *mem_ctx, const glsl_type *type)
1060 {
1061    assert(type->is_scalar() || type->is_vector() || type->is_matrix()
1062           || type->is_struct() || type->is_array());
1063
1064    ir_constant *c = new(mem_ctx) ir_constant;
1065    c->type = type;
1066    memset(&c->value, 0, sizeof(c->value));
1067
1068    if (type->is_array()) {
1069       c->const_elements = ralloc_array(c, ir_constant *, type->length);
1070
1071       for (unsigned i = 0; i < type->length; i++)
1072          c->const_elements[i] = ir_constant::zero(c, type->fields.array);
1073    }
1074
1075    if (type->is_struct()) {
1076       c->const_elements = ralloc_array(c, ir_constant *, type->length);
1077
1078       for (unsigned i = 0; i < type->length; i++) {
1079          c->const_elements[i] =
1080             ir_constant::zero(mem_ctx, type->fields.structure[i].type);
1081       }
1082    }
1083
1084    return c;
1085 }
1086
1087 bool
1088 ir_constant::get_bool_component(unsigned i) const
1089 {
1090    switch (this->type->base_type) {
1091    case GLSL_TYPE_UINT16:return this->value.u16[i] != 0;
1092    case GLSL_TYPE_INT16: return this->value.i16[i] != 0;
1093    case GLSL_TYPE_UINT:  return this->value.u[i] != 0;
1094    case GLSL_TYPE_INT:   return this->value.i[i] != 0;
1095    case GLSL_TYPE_FLOAT: return ((int)this->value.f[i]) != 0;
1096    case GLSL_TYPE_FLOAT16: return ((int)_mesa_half_to_float(this->value.f16[i])) != 0;
1097    case GLSL_TYPE_BOOL:  return this->value.b[i];
1098    case GLSL_TYPE_DOUBLE: return this->value.d[i] != 0.0;
1099    case GLSL_TYPE_SAMPLER:
1100    case GLSL_TYPE_IMAGE:
1101    case GLSL_TYPE_UINT64: return this->value.u64[i] != 0;
1102    case GLSL_TYPE_INT64:  return this->value.i64[i] != 0;
1103    default:              assert(!"Should not get here."); break;
1104    }
1105
1106    /* Must return something to make the compiler happy.  This is clearly an
1107     * error case.
1108     */
1109    return false;
1110 }
1111
1112 float
1113 ir_constant::get_float_component(unsigned i) const
1114 {
1115    switch (this->type->base_type) {
1116    case GLSL_TYPE_UINT16:return (float) this->value.u16[i];
1117    case GLSL_TYPE_INT16: return (float) this->value.i16[i];
1118    case GLSL_TYPE_UINT:  return (float) this->value.u[i];
1119    case GLSL_TYPE_INT:   return (float) this->value.i[i];
1120    case GLSL_TYPE_FLOAT: return this->value.f[i];
1121    case GLSL_TYPE_FLOAT16: return _mesa_half_to_float(this->value.f16[i]);
1122    case GLSL_TYPE_BOOL:  return this->value.b[i] ? 1.0f : 0.0f;
1123    case GLSL_TYPE_DOUBLE: return (float) this->value.d[i];
1124    case GLSL_TYPE_SAMPLER:
1125    case GLSL_TYPE_IMAGE:
1126    case GLSL_TYPE_UINT64: return (float) this->value.u64[i];
1127    case GLSL_TYPE_INT64:  return (float) this->value.i64[i];
1128    default:              assert(!"Should not get here."); break;
1129    }
1130
1131    /* Must return something to make the compiler happy.  This is clearly an
1132     * error case.
1133     */
1134    return 0.0;
1135 }
1136
1137 uint16_t
1138 ir_constant::get_float16_component(unsigned i) const
1139 {
1140    if (this->type->base_type == GLSL_TYPE_FLOAT16)
1141       return this->value.f16[i];
1142    else
1143       return _mesa_float_to_half(get_float_component(i));
1144 }
1145
1146 double
1147 ir_constant::get_double_component(unsigned i) const
1148 {
1149    switch (this->type->base_type) {
1150    case GLSL_TYPE_UINT16:return (double) this->value.u16[i];
1151    case GLSL_TYPE_INT16: return (double) this->value.i16[i];
1152    case GLSL_TYPE_UINT:  return (double) this->value.u[i];
1153    case GLSL_TYPE_INT:   return (double) this->value.i[i];
1154    case GLSL_TYPE_FLOAT: return (double) this->value.f[i];
1155    case GLSL_TYPE_FLOAT16: return (double) _mesa_half_to_float(this->value.f16[i]);
1156    case GLSL_TYPE_BOOL:  return this->value.b[i] ? 1.0 : 0.0;
1157    case GLSL_TYPE_DOUBLE: return this->value.d[i];
1158    case GLSL_TYPE_SAMPLER:
1159    case GLSL_TYPE_IMAGE:
1160    case GLSL_TYPE_UINT64: return (double) this->value.u64[i];
1161    case GLSL_TYPE_INT64:  return (double) this->value.i64[i];
1162    default:              assert(!"Should not get here."); break;
1163    }
1164
1165    /* Must return something to make the compiler happy.  This is clearly an
1166     * error case.
1167     */
1168    return 0.0;
1169 }
1170
1171 int16_t
1172 ir_constant::get_int16_component(unsigned i) const
1173 {
1174    switch (this->type->base_type) {
1175    case GLSL_TYPE_UINT16:return this->value.u16[i];
1176    case GLSL_TYPE_INT16: return this->value.i16[i];
1177    case GLSL_TYPE_UINT:  return this->value.u[i];
1178    case GLSL_TYPE_INT:   return this->value.i[i];
1179    case GLSL_TYPE_FLOAT: return (int16_t) this->value.f[i];
1180    case GLSL_TYPE_FLOAT16: return (int16_t) _mesa_half_to_float(this->value.f16[i]);
1181    case GLSL_TYPE_BOOL:  return this->value.b[i] ? 1 : 0;
1182    case GLSL_TYPE_DOUBLE: return (int16_t) this->value.d[i];
1183    case GLSL_TYPE_SAMPLER:
1184    case GLSL_TYPE_IMAGE:
1185    case GLSL_TYPE_UINT64: return (int16_t) this->value.u64[i];
1186    case GLSL_TYPE_INT64:  return (int16_t) this->value.i64[i];
1187    default:              assert(!"Should not get here."); break;
1188    }
1189
1190    /* Must return something to make the compiler happy.  This is clearly an
1191     * error case.
1192     */
1193    return 0;
1194 }
1195
1196 uint16_t
1197 ir_constant::get_uint16_component(unsigned i) const
1198 {
1199    switch (this->type->base_type) {
1200    case GLSL_TYPE_UINT16:return this->value.u16[i];
1201    case GLSL_TYPE_INT16: return this->value.i16[i];
1202    case GLSL_TYPE_UINT:  return this->value.u[i];
1203    case GLSL_TYPE_INT:   return this->value.i[i];
1204    case GLSL_TYPE_FLOAT: return (uint16_t) this->value.f[i];
1205    case GLSL_TYPE_FLOAT16: return (uint16_t) _mesa_half_to_float(this->value.f16[i]);
1206    case GLSL_TYPE_BOOL:  return this->value.b[i] ? 1 : 0;
1207    case GLSL_TYPE_DOUBLE: return (uint16_t) this->value.d[i];
1208    case GLSL_TYPE_SAMPLER:
1209    case GLSL_TYPE_IMAGE:
1210    case GLSL_TYPE_UINT64: return (uint16_t) this->value.u64[i];
1211    case GLSL_TYPE_INT64:  return (uint16_t) this->value.i64[i];
1212    default:              assert(!"Should not get here."); break;
1213    }
1214
1215    /* Must return something to make the compiler happy.  This is clearly an
1216     * error case.
1217     */
1218    return 0;
1219 }
1220
1221 int
1222 ir_constant::get_int_component(unsigned i) const
1223 {
1224    switch (this->type->base_type) {
1225    case GLSL_TYPE_UINT16:return this->value.u16[i];
1226    case GLSL_TYPE_INT16: return this->value.i16[i];
1227    case GLSL_TYPE_UINT:  return this->value.u[i];
1228    case GLSL_TYPE_INT:   return this->value.i[i];
1229    case GLSL_TYPE_FLOAT: return (int) this->value.f[i];
1230    case GLSL_TYPE_FLOAT16: return (int) _mesa_half_to_float(this->value.f16[i]);
1231    case GLSL_TYPE_BOOL:  return this->value.b[i] ? 1 : 0;
1232    case GLSL_TYPE_DOUBLE: return (int) this->value.d[i];
1233    case GLSL_TYPE_SAMPLER:
1234    case GLSL_TYPE_IMAGE:
1235    case GLSL_TYPE_UINT64: return (int) this->value.u64[i];
1236    case GLSL_TYPE_INT64:  return (int) this->value.i64[i];
1237    default:              assert(!"Should not get here."); break;
1238    }
1239
1240    /* Must return something to make the compiler happy.  This is clearly an
1241     * error case.
1242     */
1243    return 0;
1244 }
1245
1246 unsigned
1247 ir_constant::get_uint_component(unsigned i) const
1248 {
1249    switch (this->type->base_type) {
1250    case GLSL_TYPE_UINT16:return this->value.u16[i];
1251    case GLSL_TYPE_INT16: return this->value.i16[i];
1252    case GLSL_TYPE_UINT:  return this->value.u[i];
1253    case GLSL_TYPE_INT:   return this->value.i[i];
1254    case GLSL_TYPE_FLOAT: return (unsigned) this->value.f[i];
1255    case GLSL_TYPE_FLOAT16: return (unsigned) _mesa_half_to_float(this->value.f16[i]);
1256    case GLSL_TYPE_BOOL:  return this->value.b[i] ? 1 : 0;
1257    case GLSL_TYPE_DOUBLE: return (unsigned) this->value.d[i];
1258    case GLSL_TYPE_SAMPLER:
1259    case GLSL_TYPE_IMAGE:
1260    case GLSL_TYPE_UINT64: return (unsigned) this->value.u64[i];
1261    case GLSL_TYPE_INT64:  return (unsigned) this->value.i64[i];
1262    default:              assert(!"Should not get here."); break;
1263    }
1264
1265    /* Must return something to make the compiler happy.  This is clearly an
1266     * error case.
1267     */
1268    return 0;
1269 }
1270
1271 int64_t
1272 ir_constant::get_int64_component(unsigned i) const
1273 {
1274    switch (this->type->base_type) {
1275    case GLSL_TYPE_UINT16:return this->value.u16[i];
1276    case GLSL_TYPE_INT16: return this->value.i16[i];
1277    case GLSL_TYPE_UINT:  return this->value.u[i];
1278    case GLSL_TYPE_INT:   return this->value.i[i];
1279    case GLSL_TYPE_FLOAT: return (int64_t) this->value.f[i];
1280    case GLSL_TYPE_FLOAT16: return (int64_t) _mesa_half_to_float(this->value.f16[i]);
1281    case GLSL_TYPE_BOOL:  return this->value.b[i] ? 1 : 0;
1282    case GLSL_TYPE_DOUBLE: return (int64_t) this->value.d[i];
1283    case GLSL_TYPE_SAMPLER:
1284    case GLSL_TYPE_IMAGE:
1285    case GLSL_TYPE_UINT64: return (int64_t) this->value.u64[i];
1286    case GLSL_TYPE_INT64:  return this->value.i64[i];
1287    default:              assert(!"Should not get here."); break;
1288    }
1289
1290    /* Must return something to make the compiler happy.  This is clearly an
1291     * error case.
1292     */
1293    return 0;
1294 }
1295
1296 uint64_t
1297 ir_constant::get_uint64_component(unsigned i) const
1298 {
1299    switch (this->type->base_type) {
1300    case GLSL_TYPE_UINT16:return this->value.u16[i];
1301    case GLSL_TYPE_INT16: return this->value.i16[i];
1302    case GLSL_TYPE_UINT:  return this->value.u[i];
1303    case GLSL_TYPE_INT:   return this->value.i[i];
1304    case GLSL_TYPE_FLOAT: return (uint64_t) this->value.f[i];
1305    case GLSL_TYPE_FLOAT16: return (uint64_t) _mesa_half_to_float(this->value.f16[i]);
1306    case GLSL_TYPE_BOOL:  return this->value.b[i] ? 1 : 0;
1307    case GLSL_TYPE_DOUBLE: return (uint64_t) this->value.d[i];
1308    case GLSL_TYPE_SAMPLER:
1309    case GLSL_TYPE_IMAGE:
1310    case GLSL_TYPE_UINT64: return this->value.u64[i];
1311    case GLSL_TYPE_INT64:  return (uint64_t) this->value.i64[i];
1312    default:              assert(!"Should not get here."); break;
1313    }
1314
1315    /* Must return something to make the compiler happy.  This is clearly an
1316     * error case.
1317     */
1318    return 0;
1319 }
1320
1321 ir_constant *
1322 ir_constant::get_array_element(unsigned i) const
1323 {
1324    assert(this->type->is_array());
1325
1326    /* From page 35 (page 41 of the PDF) of the GLSL 1.20 spec:
1327     *
1328     *     "Behavior is undefined if a shader subscripts an array with an index
1329     *     less than 0 or greater than or equal to the size the array was
1330     *     declared with."
1331     *
1332     * Most out-of-bounds accesses are removed before things could get this far.
1333     * There are cases where non-constant array index values can get constant
1334     * folded.
1335     */
1336    if (int(i) < 0)
1337       i = 0;
1338    else if (i >= this->type->length)
1339       i = this->type->length - 1;
1340
1341    return const_elements[i];
1342 }
1343
1344 ir_constant *
1345 ir_constant::get_record_field(int idx)
1346 {
1347    assert(this->type->is_struct());
1348    assert(idx >= 0 && (unsigned) idx < this->type->length);
1349
1350    return const_elements[idx];
1351 }
1352
1353 void
1354 ir_constant::copy_offset(ir_constant *src, int offset)
1355 {
1356    switch (this->type->base_type) {
1357    case GLSL_TYPE_UINT16:
1358    case GLSL_TYPE_INT16:
1359    case GLSL_TYPE_UINT:
1360    case GLSL_TYPE_INT:
1361    case GLSL_TYPE_FLOAT:
1362    case GLSL_TYPE_FLOAT16:
1363    case GLSL_TYPE_DOUBLE:
1364    case GLSL_TYPE_SAMPLER:
1365    case GLSL_TYPE_IMAGE:
1366    case GLSL_TYPE_UINT64:
1367    case GLSL_TYPE_INT64:
1368    case GLSL_TYPE_BOOL: {
1369       unsigned int size = src->type->components();
1370       assert (size <= this->type->components() - offset);
1371       for (unsigned int i=0; i<size; i++) {
1372          switch (this->type->base_type) {
1373          case GLSL_TYPE_UINT16:
1374             value.u16[i+offset] = src->get_uint16_component(i);
1375             break;
1376          case GLSL_TYPE_INT16:
1377             value.i16[i+offset] = src->get_int16_component(i);
1378             break;
1379          case GLSL_TYPE_UINT:
1380             value.u[i+offset] = src->get_uint_component(i);
1381             break;
1382          case GLSL_TYPE_INT:
1383             value.i[i+offset] = src->get_int_component(i);
1384             break;
1385          case GLSL_TYPE_FLOAT:
1386             value.f[i+offset] = src->get_float_component(i);
1387             break;
1388          case GLSL_TYPE_FLOAT16:
1389             value.f16[i+offset] = src->get_float16_component(i);
1390             break;
1391          case GLSL_TYPE_BOOL:
1392             value.b[i+offset] = src->get_bool_component(i);
1393             break;
1394          case GLSL_TYPE_DOUBLE:
1395             value.d[i+offset] = src->get_double_component(i);
1396             break;
1397          case GLSL_TYPE_SAMPLER:
1398          case GLSL_TYPE_IMAGE:
1399          case GLSL_TYPE_UINT64:
1400             value.u64[i+offset] = src->get_uint64_component(i);
1401             break;
1402          case GLSL_TYPE_INT64:
1403             value.i64[i+offset] = src->get_int64_component(i);
1404             break;
1405          default: // Shut up the compiler
1406             break;
1407          }
1408       }
1409       break;
1410    }
1411
1412    case GLSL_TYPE_STRUCT:
1413    case GLSL_TYPE_ARRAY: {
1414       assert (src->type == this->type);
1415       for (unsigned i = 0; i < this->type->length; i++) {
1416          this->const_elements[i] = src->const_elements[i]->clone(this, NULL);
1417       }
1418       break;
1419    }
1420
1421    default:
1422       assert(!"Should not get here.");
1423       break;
1424    }
1425 }
1426
1427 void
1428 ir_constant::copy_masked_offset(ir_constant *src, int offset, unsigned int mask)
1429 {
1430    assert (!type->is_array() && !type->is_struct());
1431
1432    if (!type->is_vector() && !type->is_matrix()) {
1433       offset = 0;
1434       mask = 1;
1435    }
1436
1437    int id = 0;
1438    for (int i=0; i<4; i++) {
1439       if (mask & (1 << i)) {
1440          switch (this->type->base_type) {
1441          case GLSL_TYPE_UINT16:
1442             value.u16[i+offset] = src->get_uint16_component(id++);
1443             break;
1444          case GLSL_TYPE_INT16:
1445             value.i16[i+offset] = src->get_int16_component(id++);
1446             break;
1447          case GLSL_TYPE_UINT:
1448             value.u[i+offset] = src->get_uint_component(id++);
1449             break;
1450          case GLSL_TYPE_INT:
1451             value.i[i+offset] = src->get_int_component(id++);
1452             break;
1453          case GLSL_TYPE_FLOAT:
1454             value.f[i+offset] = src->get_float_component(id++);
1455             break;
1456          case GLSL_TYPE_FLOAT16:
1457             value.f16[i+offset] = src->get_float16_component(id++);
1458             break;
1459          case GLSL_TYPE_BOOL:
1460             value.b[i+offset] = src->get_bool_component(id++);
1461             break;
1462          case GLSL_TYPE_DOUBLE:
1463             value.d[i+offset] = src->get_double_component(id++);
1464             break;
1465          case GLSL_TYPE_SAMPLER:
1466          case GLSL_TYPE_IMAGE:
1467          case GLSL_TYPE_UINT64:
1468             value.u64[i+offset] = src->get_uint64_component(id++);
1469             break;
1470          case GLSL_TYPE_INT64:
1471             value.i64[i+offset] = src->get_int64_component(id++);
1472             break;
1473          default:
1474             assert(!"Should not get here.");
1475             return;
1476          }
1477       }
1478    }
1479 }
1480
1481 bool
1482 ir_constant::has_value(const ir_constant *c) const
1483 {
1484    if (this->type != c->type)
1485       return false;
1486
1487    if (this->type->is_array() || this->type->is_struct()) {
1488       for (unsigned i = 0; i < this->type->length; i++) {
1489          if (!this->const_elements[i]->has_value(c->const_elements[i]))
1490             return false;
1491       }
1492       return true;
1493    }
1494
1495    for (unsigned i = 0; i < this->type->components(); i++) {
1496       switch (this->type->base_type) {
1497       case GLSL_TYPE_UINT16:
1498          if (this->value.u16[i] != c->value.u16[i])
1499             return false;
1500          break;
1501       case GLSL_TYPE_INT16:
1502          if (this->value.i16[i] != c->value.i16[i])
1503             return false;
1504          break;
1505       case GLSL_TYPE_UINT:
1506          if (this->value.u[i] != c->value.u[i])
1507             return false;
1508          break;
1509       case GLSL_TYPE_INT:
1510          if (this->value.i[i] != c->value.i[i])
1511             return false;
1512          break;
1513       case GLSL_TYPE_FLOAT:
1514          if (this->value.f[i] != c->value.f[i])
1515             return false;
1516          break;
1517       case GLSL_TYPE_FLOAT16:
1518         /* Convert to float to make sure NaN and ±0.0 compares correctly */
1519          if (_mesa_half_to_float(this->value.f16[i]) !=
1520              _mesa_half_to_float(c->value.f16[i]))
1521             return false;
1522          break;
1523       case GLSL_TYPE_BOOL:
1524          if (this->value.b[i] != c->value.b[i])
1525             return false;
1526          break;
1527       case GLSL_TYPE_DOUBLE:
1528          if (this->value.d[i] != c->value.d[i])
1529             return false;
1530          break;
1531       case GLSL_TYPE_SAMPLER:
1532       case GLSL_TYPE_IMAGE:
1533       case GLSL_TYPE_UINT64:
1534          if (this->value.u64[i] != c->value.u64[i])
1535             return false;
1536          break;
1537       case GLSL_TYPE_INT64:
1538          if (this->value.i64[i] != c->value.i64[i])
1539             return false;
1540          break;
1541       default:
1542          assert(!"Should not get here.");
1543          return false;
1544       }
1545    }
1546
1547    return true;
1548 }
1549
1550 bool
1551 ir_constant::is_value(float f, int i) const
1552 {
1553    if (!this->type->is_scalar() && !this->type->is_vector())
1554       return false;
1555
1556    /* Only accept boolean values for 0/1. */
1557    if (int(bool(i)) != i && this->type->is_boolean())
1558       return false;
1559
1560    for (unsigned c = 0; c < this->type->vector_elements; c++) {
1561       switch (this->type->base_type) {
1562       case GLSL_TYPE_FLOAT:
1563          if (this->value.f[c] != f)
1564             return false;
1565          break;
1566       case GLSL_TYPE_FLOAT16:
1567          if (_mesa_half_to_float(this->value.f16[c]) != f)
1568             return false;
1569          break;
1570       case GLSL_TYPE_INT16:
1571          if (this->value.i16[c] != int16_t(i))
1572             return false;
1573          break;
1574       case GLSL_TYPE_UINT16:
1575          if (this->value.u16[c] != uint16_t(i))
1576             return false;
1577          break;
1578       case GLSL_TYPE_INT:
1579          if (this->value.i[c] != i)
1580             return false;
1581          break;
1582       case GLSL_TYPE_UINT:
1583          if (this->value.u[c] != unsigned(i))
1584             return false;
1585          break;
1586       case GLSL_TYPE_BOOL:
1587          if (this->value.b[c] != bool(i))
1588             return false;
1589          break;
1590       case GLSL_TYPE_DOUBLE:
1591          if (this->value.d[c] != double(f))
1592             return false;
1593          break;
1594       case GLSL_TYPE_SAMPLER:
1595       case GLSL_TYPE_IMAGE:
1596       case GLSL_TYPE_UINT64:
1597          if (this->value.u64[c] != uint64_t(i))
1598             return false;
1599          break;
1600       case GLSL_TYPE_INT64:
1601          if (this->value.i64[c] != i)
1602             return false;
1603          break;
1604       default:
1605          /* The only other base types are structures, arrays, and samplers.
1606           * Samplers cannot be constants, and the others should have been
1607           * filtered out above.
1608           */
1609          assert(!"Should not get here.");
1610          return false;
1611       }
1612    }
1613
1614    return true;
1615 }
1616
1617 bool
1618 ir_constant::is_zero() const
1619 {
1620    return is_value(0.0, 0);
1621 }
1622
1623 bool
1624 ir_constant::is_one() const
1625 {
1626    return is_value(1.0, 1);
1627 }
1628
1629 bool
1630 ir_constant::is_negative_one() const
1631 {
1632    return is_value(-1.0, -1);
1633 }
1634
1635 bool
1636 ir_constant::is_uint16_constant() const
1637 {
1638    if (!type->is_integer_32())
1639       return false;
1640
1641    return value.u[0] < (1 << 16);
1642 }
1643
1644 ir_loop::ir_loop()
1645    : ir_instruction(ir_type_loop)
1646 {
1647 }
1648
1649
1650 ir_dereference_variable::ir_dereference_variable(ir_variable *var)
1651    : ir_dereference(ir_type_dereference_variable)
1652 {
1653    assert(var != NULL);
1654
1655    this->var = var;
1656    this->type = var->type;
1657 }
1658
1659
1660 ir_dereference_array::ir_dereference_array(ir_rvalue *value,
1661                                            ir_rvalue *array_index)
1662    : ir_dereference(ir_type_dereference_array)
1663 {
1664    this->array_index = array_index;
1665    this->set_array(value);
1666 }
1667
1668
1669 ir_dereference_array::ir_dereference_array(ir_variable *var,
1670                                            ir_rvalue *array_index)
1671    : ir_dereference(ir_type_dereference_array)
1672 {
1673    void *ctx = ralloc_parent(var);
1674
1675    this->array_index = array_index;
1676    this->set_array(new(ctx) ir_dereference_variable(var));
1677 }
1678
1679
1680 void
1681 ir_dereference_array::set_array(ir_rvalue *value)
1682 {
1683    assert(value != NULL);
1684
1685    this->array = value;
1686
1687    const glsl_type *const vt = this->array->type;
1688
1689    if (vt->is_array()) {
1690       type = vt->fields.array;
1691    } else if (vt->is_matrix()) {
1692       type = vt->column_type();
1693    } else if (vt->is_vector()) {
1694       type = vt->get_base_type();
1695    }
1696 }
1697
1698
1699 ir_dereference_record::ir_dereference_record(ir_rvalue *value,
1700                                              const char *field)
1701    : ir_dereference(ir_type_dereference_record)
1702 {
1703    assert(value != NULL);
1704
1705    this->record = value;
1706    this->type = this->record->type->field_type(field);
1707    this->field_idx = this->record->type->field_index(field);
1708 }
1709
1710
1711 ir_dereference_record::ir_dereference_record(ir_variable *var,
1712                                              const char *field)
1713    : ir_dereference(ir_type_dereference_record)
1714 {
1715    void *ctx = ralloc_parent(var);
1716
1717    this->record = new(ctx) ir_dereference_variable(var);
1718    this->type = this->record->type->field_type(field);
1719    this->field_idx = this->record->type->field_index(field);
1720 }
1721
1722 bool
1723 ir_dereference::is_lvalue(const struct _mesa_glsl_parse_state *state) const
1724 {
1725    ir_variable *var = this->variable_referenced();
1726
1727    /* Every l-value derference chain eventually ends in a variable.
1728     */
1729    if ((var == NULL) || var->data.read_only)
1730       return false;
1731
1732    /* From section 4.1.7 of the ARB_bindless_texture spec:
1733     *
1734     * "Samplers can be used as l-values, so can be assigned into and used as
1735     *  "out" and "inout" function parameters."
1736     *
1737     * From section 4.1.X of the ARB_bindless_texture spec:
1738     *
1739     * "Images can be used as l-values, so can be assigned into and used as
1740     *  "out" and "inout" function parameters."
1741     */
1742    if ((!state || state->has_bindless()) &&
1743        (this->type->contains_sampler() || this->type->contains_image()))
1744       return true;
1745
1746    /* From section 4.1.7 of the GLSL 4.40 spec:
1747     *
1748     *   "Opaque variables cannot be treated as l-values; hence cannot
1749     *    be used as out or inout function parameters, nor can they be
1750     *    assigned into."
1751     */
1752    if (this->type->contains_opaque())
1753       return false;
1754
1755    return true;
1756 }
1757
1758
1759 static const char * const tex_opcode_strs[] = { "tex", "txb", "txl", "txd", "txf", "txf_ms", "txs", "lod", "tg4", "query_levels", "texture_samples", "samples_identical" };
1760
1761 const char *ir_texture::opcode_string()
1762 {
1763    assert((unsigned int) op < ARRAY_SIZE(tex_opcode_strs));
1764    return tex_opcode_strs[op];
1765 }
1766
1767 ir_texture_opcode
1768 ir_texture::get_opcode(const char *str)
1769 {
1770    const int count = sizeof(tex_opcode_strs) / sizeof(tex_opcode_strs[0]);
1771    for (int op = 0; op < count; op++) {
1772       if (strcmp(str, tex_opcode_strs[op]) == 0)
1773          return (ir_texture_opcode) op;
1774    }
1775    return (ir_texture_opcode) -1;
1776 }
1777
1778
1779 void
1780 ir_texture::set_sampler(ir_dereference *sampler, const glsl_type *type)
1781 {
1782    assert(sampler != NULL);
1783    assert(type != NULL);
1784    this->sampler = sampler;
1785    this->type = type;
1786
1787    if (this->op == ir_txs || this->op == ir_query_levels ||
1788        this->op == ir_texture_samples) {
1789       assert(type->base_type == GLSL_TYPE_INT);
1790    } else if (this->op == ir_lod) {
1791       assert(type->vector_elements == 2);
1792       assert(type->is_float());
1793    } else if (this->op == ir_samples_identical) {
1794       assert(type == glsl_type::bool_type);
1795       assert(sampler->type->is_sampler());
1796       assert(sampler->type->sampler_dimensionality == GLSL_SAMPLER_DIM_MS);
1797    } else {
1798       assert(sampler->type->sampled_type == (int) type->base_type);
1799       if (sampler->type->sampler_shadow)
1800          assert(type->vector_elements == 4 || type->vector_elements == 1);
1801       else
1802          assert(type->vector_elements == 4);
1803    }
1804 }
1805
1806
1807 void
1808 ir_swizzle::init_mask(const unsigned *comp, unsigned count)
1809 {
1810    assert((count >= 1) && (count <= 4));
1811
1812    memset(&this->mask, 0, sizeof(this->mask));
1813    this->mask.num_components = count;
1814
1815    unsigned dup_mask = 0;
1816    switch (count) {
1817    case 4:
1818       assert(comp[3] <= 3);
1819       dup_mask |= (1U << comp[3])
1820          & ((1U << comp[0]) | (1U << comp[1]) | (1U << comp[2]));
1821       this->mask.w = comp[3];
1822
1823    case 3:
1824       assert(comp[2] <= 3);
1825       dup_mask |= (1U << comp[2])
1826          & ((1U << comp[0]) | (1U << comp[1]));
1827       this->mask.z = comp[2];
1828
1829    case 2:
1830       assert(comp[1] <= 3);
1831       dup_mask |= (1U << comp[1])
1832          & ((1U << comp[0]));
1833       this->mask.y = comp[1];
1834
1835    case 1:
1836       assert(comp[0] <= 3);
1837       this->mask.x = comp[0];
1838    }
1839
1840    this->mask.has_duplicates = dup_mask != 0;
1841
1842    /* Based on the number of elements in the swizzle and the base type
1843     * (i.e., float, int, unsigned, or bool) of the vector being swizzled,
1844     * generate the type of the resulting value.
1845     */
1846    type = glsl_type::get_instance(val->type->base_type, mask.num_components, 1);
1847 }
1848
1849 ir_swizzle::ir_swizzle(ir_rvalue *val, unsigned x, unsigned y, unsigned z,
1850                        unsigned w, unsigned count)
1851    : ir_rvalue(ir_type_swizzle), val(val)
1852 {
1853    const unsigned components[4] = { x, y, z, w };
1854    this->init_mask(components, count);
1855 }
1856
1857 ir_swizzle::ir_swizzle(ir_rvalue *val, const unsigned *comp,
1858                        unsigned count)
1859    : ir_rvalue(ir_type_swizzle), val(val)
1860 {
1861    this->init_mask(comp, count);
1862 }
1863
1864 ir_swizzle::ir_swizzle(ir_rvalue *val, ir_swizzle_mask mask)
1865    : ir_rvalue(ir_type_swizzle), val(val), mask(mask)
1866 {
1867    this->type = glsl_type::get_instance(val->type->base_type,
1868                                         mask.num_components, 1);
1869 }
1870
1871 #define X 1
1872 #define R 5
1873 #define S 9
1874 #define I 13
1875
1876 ir_swizzle *
1877 ir_swizzle::create(ir_rvalue *val, const char *str, unsigned vector_length)
1878 {
1879    void *ctx = ralloc_parent(val);
1880
1881    /* For each possible swizzle character, this table encodes the value in
1882     * \c idx_map that represents the 0th element of the vector.  For invalid
1883     * swizzle characters (e.g., 'k'), a special value is used that will allow
1884     * detection of errors.
1885     */
1886    static const unsigned char base_idx[26] = {
1887    /* a  b  c  d  e  f  g  h  i  j  k  l  m */
1888       R, R, I, I, I, I, R, I, I, I, I, I, I,
1889    /* n  o  p  q  r  s  t  u  v  w  x  y  z */
1890       I, I, S, S, R, S, S, I, I, X, X, X, X
1891    };
1892
1893    /* Each valid swizzle character has an entry in the previous table.  This
1894     * table encodes the base index encoded in the previous table plus the actual
1895     * index of the swizzle character.  When processing swizzles, the first
1896     * character in the string is indexed in the previous table.  Each character
1897     * in the string is indexed in this table, and the value found there has the
1898     * value form the first table subtracted.  The result must be on the range
1899     * [0,3].
1900     *
1901     * For example, the string "wzyx" will get X from the first table.  Each of
1902     * the charcaters will get X+3, X+2, X+1, and X+0 from this table.  After
1903     * subtraction, the swizzle values are { 3, 2, 1, 0 }.
1904     *
1905     * The string "wzrg" will get X from the first table.  Each of the characters
1906     * will get X+3, X+2, R+0, and R+1 from this table.  After subtraction, the
1907     * swizzle values are { 3, 2, 4, 5 }.  Since 4 and 5 are outside the range
1908     * [0,3], the error is detected.
1909     */
1910    static const unsigned char idx_map[26] = {
1911    /* a    b    c    d    e    f    g    h    i    j    k    l    m */
1912       R+3, R+2, 0,   0,   0,   0,   R+1, 0,   0,   0,   0,   0,   0,
1913    /* n    o    p    q    r    s    t    u    v    w    x    y    z */
1914       0,   0,   S+2, S+3, R+0, S+0, S+1, 0,   0,   X+3, X+0, X+1, X+2
1915    };
1916
1917    int swiz_idx[4] = { 0, 0, 0, 0 };
1918    unsigned i;
1919
1920
1921    /* Validate the first character in the swizzle string and look up the base
1922     * index value as described above.
1923     */
1924    if ((str[0] < 'a') || (str[0] > 'z'))
1925       return NULL;
1926
1927    const unsigned base = base_idx[str[0] - 'a'];
1928
1929
1930    for (i = 0; (i < 4) && (str[i] != '\0'); i++) {
1931       /* Validate the next character, and, as described above, convert it to a
1932        * swizzle index.
1933        */
1934       if ((str[i] < 'a') || (str[i] > 'z'))
1935          return NULL;
1936
1937       swiz_idx[i] = idx_map[str[i] - 'a'] - base;
1938       if ((swiz_idx[i] < 0) || (swiz_idx[i] >= (int) vector_length))
1939          return NULL;
1940    }
1941
1942    if (str[i] != '\0')
1943          return NULL;
1944
1945    return new(ctx) ir_swizzle(val, swiz_idx[0], swiz_idx[1], swiz_idx[2],
1946                               swiz_idx[3], i);
1947 }
1948
1949 #undef X
1950 #undef R
1951 #undef S
1952 #undef I
1953
1954 ir_variable *
1955 ir_swizzle::variable_referenced() const
1956 {
1957    return this->val->variable_referenced();
1958 }
1959
1960
1961 bool ir_variable::temporaries_allocate_names = false;
1962
1963 const char ir_variable::tmp_name[] = "compiler_temp";
1964
1965 ir_variable::ir_variable(const struct glsl_type *type, const char *name,
1966                          ir_variable_mode mode)
1967    : ir_instruction(ir_type_variable)
1968 {
1969    this->type = type;
1970
1971    if (mode == ir_var_temporary && !ir_variable::temporaries_allocate_names)
1972       name = NULL;
1973
1974    /* The ir_variable clone method may call this constructor with name set to
1975     * tmp_name.
1976     */
1977    assert(name != NULL
1978           || mode == ir_var_temporary
1979           || mode == ir_var_function_in
1980           || mode == ir_var_function_out
1981           || mode == ir_var_function_inout);
1982    assert(name != ir_variable::tmp_name
1983           || mode == ir_var_temporary);
1984    if (mode == ir_var_temporary
1985        && (name == NULL || name == ir_variable::tmp_name)) {
1986       this->name = ir_variable::tmp_name;
1987    } else if (name == NULL ||
1988               strlen(name) < ARRAY_SIZE(this->name_storage)) {
1989       strcpy(this->name_storage, name ? name : "");
1990       this->name = this->name_storage;
1991    } else {
1992       this->name = ralloc_strdup(this, name);
1993    }
1994
1995    this->u.max_ifc_array_access = NULL;
1996
1997    this->data.explicit_location = false;
1998    this->data.explicit_index = false;
1999    this->data.explicit_binding = false;
2000    this->data.explicit_component = false;
2001    this->data.has_initializer = false;
2002    this->data.is_implicit_initializer = false;
2003    this->data.is_unmatched_generic_inout = false;
2004    this->data.is_xfb_only = false;
2005    this->data.explicit_xfb_buffer = false;
2006    this->data.explicit_xfb_offset = false;
2007    this->data.explicit_xfb_stride = false;
2008    this->data.location = -1;
2009    this->data.location_frac = 0;
2010    this->data.matrix_layout = GLSL_MATRIX_LAYOUT_INHERITED;
2011    this->data.from_named_ifc_block = false;
2012    this->data.must_be_shader_input = false;
2013    this->data.index = 0;
2014    this->data.binding = 0;
2015    this->data.warn_extension_index = 0;
2016    this->constant_value = NULL;
2017    this->constant_initializer = NULL;
2018    this->data.depth_layout = ir_depth_layout_none;
2019    this->data.used = false;
2020    this->data.assigned = false;
2021    this->data.always_active_io = false;
2022    this->data.read_only = false;
2023    this->data.centroid = false;
2024    this->data.sample = false;
2025    this->data.patch = false;
2026    this->data.explicit_invariant = false;
2027    this->data.invariant = false;
2028    this->data.precise = false;
2029    this->data.how_declared = ir_var_declared_normally;
2030    this->data.mode = mode;
2031    this->data.interpolation = INTERP_MODE_NONE;
2032    this->data.max_array_access = -1;
2033    this->data.offset = 0;
2034    this->data.precision = GLSL_PRECISION_NONE;
2035    this->data.memory_read_only = false;
2036    this->data.memory_write_only = false;
2037    this->data.memory_coherent = false;
2038    this->data.memory_volatile = false;
2039    this->data.memory_restrict = false;
2040    this->data.from_ssbo_unsized_array = false;
2041    this->data.implicit_sized_array = false;
2042    this->data.fb_fetch_output = false;
2043    this->data.bindless = false;
2044    this->data.bound = false;
2045    this->data.image_format = PIPE_FORMAT_NONE;
2046    this->data._num_state_slots = 0;
2047    this->data.param_index = 0;
2048    this->data.stream = 0;
2049    this->data.xfb_buffer = -1;
2050    this->data.xfb_stride = -1;
2051
2052    this->interface_type = NULL;
2053
2054    if (type != NULL) {
2055       if (type->is_interface())
2056          this->init_interface_type(type);
2057       else if (type->without_array()->is_interface())
2058          this->init_interface_type(type->without_array());
2059    }
2060 }
2061
2062
2063 const char *
2064 interpolation_string(unsigned interpolation)
2065 {
2066    switch (interpolation) {
2067    case INTERP_MODE_NONE:          return "no";
2068    case INTERP_MODE_SMOOTH:        return "smooth";
2069    case INTERP_MODE_FLAT:          return "flat";
2070    case INTERP_MODE_NOPERSPECTIVE: return "noperspective";
2071    }
2072
2073    assert(!"Should not get here.");
2074    return "";
2075 }
2076
2077 const char *const ir_variable::warn_extension_table[] = {
2078    "",
2079    "GL_ARB_shader_stencil_export",
2080    "GL_AMD_shader_stencil_export",
2081 };
2082
2083 void
2084 ir_variable::enable_extension_warning(const char *extension)
2085 {
2086    for (unsigned i = 0; i < ARRAY_SIZE(warn_extension_table); i++) {
2087       if (strcmp(warn_extension_table[i], extension) == 0) {
2088          this->data.warn_extension_index = i;
2089          return;
2090       }
2091    }
2092
2093    assert(!"Should not get here.");
2094    this->data.warn_extension_index = 0;
2095 }
2096
2097 const char *
2098 ir_variable::get_extension_warning() const
2099 {
2100    return this->data.warn_extension_index == 0
2101       ? NULL : warn_extension_table[this->data.warn_extension_index];
2102 }
2103
2104 ir_function_signature::ir_function_signature(const glsl_type *return_type,
2105                                              builtin_available_predicate b)
2106    : ir_instruction(ir_type_function_signature),
2107      return_type(return_type), is_defined(false),
2108      return_precision(GLSL_PRECISION_NONE),
2109      intrinsic_id(ir_intrinsic_invalid), builtin_avail(b), _function(NULL)
2110 {
2111    this->origin = NULL;
2112 }
2113
2114
2115 bool
2116 ir_function_signature::is_builtin() const
2117 {
2118    return builtin_avail != NULL;
2119 }
2120
2121
2122 bool
2123 ir_function_signature::is_builtin_available(const _mesa_glsl_parse_state *state) const
2124 {
2125    /* We can't call the predicate without a state pointer, so just say that
2126     * the signature is available.  At compile time, we need the filtering,
2127     * but also receive a valid state pointer.  At link time, we're resolving
2128     * imported built-in prototypes to their definitions, which will always
2129     * be an exact match.  So we can skip the filtering.
2130     */
2131    if (state == NULL)
2132       return true;
2133
2134    assert(builtin_avail != NULL);
2135    return builtin_avail(state);
2136 }
2137
2138
2139 static bool
2140 modes_match(unsigned a, unsigned b)
2141 {
2142    if (a == b)
2143       return true;
2144
2145    /* Accept "in" vs. "const in" */
2146    if ((a == ir_var_const_in && b == ir_var_function_in) ||
2147        (b == ir_var_const_in && a == ir_var_function_in))
2148       return true;
2149
2150    return false;
2151 }
2152
2153
2154 const char *
2155 ir_function_signature::qualifiers_match(exec_list *params)
2156 {
2157    /* check that the qualifiers match. */
2158    foreach_two_lists(a_node, &this->parameters, b_node, params) {
2159       ir_variable *a = (ir_variable *) a_node;
2160       ir_variable *b = (ir_variable *) b_node;
2161
2162       if (a->data.read_only != b->data.read_only ||
2163           !modes_match(a->data.mode, b->data.mode) ||
2164           a->data.interpolation != b->data.interpolation ||
2165           a->data.centroid != b->data.centroid ||
2166           a->data.sample != b->data.sample ||
2167           a->data.patch != b->data.patch ||
2168           a->data.memory_read_only != b->data.memory_read_only ||
2169           a->data.memory_write_only != b->data.memory_write_only ||
2170           a->data.memory_coherent != b->data.memory_coherent ||
2171           a->data.memory_volatile != b->data.memory_volatile ||
2172           a->data.memory_restrict != b->data.memory_restrict) {
2173
2174          /* parameter a's qualifiers don't match */
2175          return a->name;
2176       }
2177    }
2178    return NULL;
2179 }
2180
2181
2182 void
2183 ir_function_signature::replace_parameters(exec_list *new_params)
2184 {
2185    /* Destroy all of the previous parameter information.  If the previous
2186     * parameter information comes from the function prototype, it may either
2187     * specify incorrect parameter names or not have names at all.
2188     */
2189    new_params->move_nodes_to(&parameters);
2190 }
2191
2192
2193 ir_function::ir_function(const char *name)
2194    : ir_instruction(ir_type_function)
2195 {
2196    this->subroutine_index = -1;
2197    this->name = ralloc_strdup(this, name);
2198 }
2199
2200
2201 bool
2202 ir_function::has_user_signature()
2203 {
2204    foreach_in_list(ir_function_signature, sig, &this->signatures) {
2205       if (!sig->is_builtin())
2206          return true;
2207    }
2208    return false;
2209 }
2210
2211
2212 ir_rvalue *
2213 ir_rvalue::error_value(void *mem_ctx)
2214 {
2215    ir_rvalue *v = new(mem_ctx) ir_rvalue(ir_type_unset);
2216
2217    v->type = glsl_type::error_type;
2218    return v;
2219 }
2220
2221
2222 void
2223 visit_exec_list(exec_list *list, ir_visitor *visitor)
2224 {
2225    foreach_in_list_safe(ir_instruction, node, list) {
2226       node->accept(visitor);
2227    }
2228 }
2229
2230
2231 static void
2232 steal_memory(ir_instruction *ir, void *new_ctx)
2233 {
2234    ir_variable *var = ir->as_variable();
2235    ir_function *fn = ir->as_function();
2236    ir_constant *constant = ir->as_constant();
2237    if (var != NULL && var->constant_value != NULL)
2238       steal_memory(var->constant_value, ir);
2239
2240    if (var != NULL && var->constant_initializer != NULL)
2241       steal_memory(var->constant_initializer, ir);
2242
2243    if (fn != NULL && fn->subroutine_types)
2244       ralloc_steal(new_ctx, fn->subroutine_types);
2245
2246    /* The components of aggregate constants are not visited by the normal
2247     * visitor, so steal their values by hand.
2248     */
2249    if (constant != NULL &&
2250        (constant->type->is_array() || constant->type->is_struct())) {
2251       for (unsigned int i = 0; i < constant->type->length; i++) {
2252          steal_memory(constant->const_elements[i], ir);
2253       }
2254    }
2255
2256    ralloc_steal(new_ctx, ir);
2257 }
2258
2259
2260 void
2261 reparent_ir(exec_list *list, void *mem_ctx)
2262 {
2263    foreach_in_list(ir_instruction, node, list) {
2264       visit_tree(node, steal_memory, mem_ctx);
2265    }
2266 }
2267
2268
2269 static ir_rvalue *
2270 try_min_one(ir_rvalue *ir)
2271 {
2272    ir_expression *expr = ir->as_expression();
2273
2274    if (!expr || expr->operation != ir_binop_min)
2275       return NULL;
2276
2277    if (expr->operands[0]->is_one())
2278       return expr->operands[1];
2279
2280    if (expr->operands[1]->is_one())
2281       return expr->operands[0];
2282
2283    return NULL;
2284 }
2285
2286 static ir_rvalue *
2287 try_max_zero(ir_rvalue *ir)
2288 {
2289    ir_expression *expr = ir->as_expression();
2290
2291    if (!expr || expr->operation != ir_binop_max)
2292       return NULL;
2293
2294    if (expr->operands[0]->is_zero())
2295       return expr->operands[1];
2296
2297    if (expr->operands[1]->is_zero())
2298       return expr->operands[0];
2299
2300    return NULL;
2301 }
2302
2303 ir_rvalue *
2304 ir_rvalue::as_rvalue_to_saturate()
2305 {
2306    ir_expression *expr = this->as_expression();
2307
2308    if (!expr)
2309       return NULL;
2310
2311    ir_rvalue *max_zero = try_max_zero(expr);
2312    if (max_zero) {
2313       return try_min_one(max_zero);
2314    } else {
2315       ir_rvalue *min_one = try_min_one(expr);
2316       if (min_one) {
2317          return try_max_zero(min_one);
2318       }
2319    }
2320
2321    return NULL;
2322 }
2323
2324
2325 unsigned
2326 vertices_per_prim(GLenum prim)
2327 {
2328    switch (prim) {
2329    case GL_POINTS:
2330       return 1;
2331    case GL_LINES:
2332       return 2;
2333    case GL_TRIANGLES:
2334       return 3;
2335    case GL_LINES_ADJACENCY:
2336       return 4;
2337    case GL_TRIANGLES_ADJACENCY:
2338       return 6;
2339    default:
2340       assert(!"Bad primitive");
2341       return 3;
2342    }
2343 }
2344
2345 /**
2346  * Generate a string describing the mode of a variable
2347  */
2348 const char *
2349 mode_string(const ir_variable *var)
2350 {
2351    switch (var->data.mode) {
2352    case ir_var_auto:
2353       return (var->data.read_only) ? "global constant" : "global variable";
2354
2355    case ir_var_uniform:
2356       return "uniform";
2357
2358    case ir_var_shader_storage:
2359       return "buffer";
2360
2361    case ir_var_shader_in:
2362       return "shader input";
2363
2364    case ir_var_shader_out:
2365       return "shader output";
2366
2367    case ir_var_function_in:
2368    case ir_var_const_in:
2369       return "function input";
2370
2371    case ir_var_function_out:
2372       return "function output";
2373
2374    case ir_var_function_inout:
2375       return "function inout";
2376
2377    case ir_var_system_value:
2378       return "shader input";
2379
2380    case ir_var_temporary:
2381       return "compiler temporary";
2382
2383    case ir_var_mode_count:
2384       break;
2385    }
2386
2387    assert(!"Should not get here.");
2388    return "invalid variable";
2389 }