src/glsl/ir_constant_expression.cpp

   1 /*
   2  * Copyright © 2010 Intel Corporation
   3  *
   4  * Permission is hereby granted, free of charge, to any person obtaining a
   5  * copy of this software and associated documentation files (the "Software"),
   6  * to deal in the Software without restriction, including without limitation
   7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
   8  * and/or sell copies of the Software, and to permit persons to whom the
   9  * Software is furnished to do so, subject to the following conditions:
  10  *
  11  * The above copyright notice and this permission notice (including the next
  12  * paragraph) shall be included in all copies or substantial portions of the
  13  * Software.
  14  *
  15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  21  * DEALINGS IN THE SOFTWARE.
  22  */
  23
  24 /**
  25  * \file ir_constant_expression.cpp
  26  * Evaluate and process constant valued expressions
  27  *
  28  * In GLSL, constant valued expressions are used in several places.  These
  29  * must be processed and evaluated very early in the compilation process.
  30  *
  31  *    * Sizes of arrays
  32  *    * Initializers for uniforms
  33  *    * Initializers for \c const variables
  34  */
  35
  36 #include <math.h>
  37 #include "main/core.h" /* for MAX2, MIN2, CLAMP */
  38 #include "ir.h"
  39 #include "ir_visitor.h"
  40 #include "glsl_types.h"
  41 #include "program/hash_table.h"
  42
  43 static float
  44 dot(ir_constant *op0, ir_constant *op1)
  45 {
  46    assert(op0->type->is_float() && op1->type->is_float());
  47
  48    float result = 0;
  49    for (unsigned c = 0; c < op0->type->components(); c++)
  50       result += op0->value.f[c] * op1->value.f[c];
  51
  52    return result;
  53 }
  54
  55 /* This method is the only one supported by gcc.  Unions in particular
  56  * are iffy, and read-through-converted-pointer is killed by strict
  57  * aliasing.  OTOH, the compiler sees through the memcpy, so the
  58  * resulting asm is reasonable.
  59  */
  60 static float
  61 bitcast_u2f(unsigned int u)
  62 {
  63    assert(sizeof(float) == sizeof(unsigned int));
  64    float f;
  65    memcpy(&f, &u, sizeof(f));
  66    return f;
  67 }
  68
  69 static unsigned int
  70 bitcast_f2u(float f)
  71 {
  72    assert(sizeof(float) == sizeof(unsigned int));
  73    unsigned int u;
  74    memcpy(&u, &f, sizeof(f));
  75    return u;
  76 }
  77
  78 /**
  79  * Evaluate one component of a floating-point 4x8 unpacking function.
  80  */
  81 typedef uint8_t
  82 (*pack_1x8_func_t)(float);
  83
  84 /**
  85  * Evaluate one component of a floating-point 2x16 unpacking function.
  86  */
  87 typedef uint16_t
  88 (*pack_1x16_func_t)(float);
  89
  90 /**
  91  * Evaluate one component of a floating-point 4x8 unpacking function.
  92  */
  93 typedef float
  94 (*unpack_1x8_func_t)(uint8_t);
  95
  96 /**
  97  * Evaluate one component of a floating-point 2x16 unpacking function.
  98  */
  99 typedef float
 100 (*unpack_1x16_func_t)(uint16_t);
 101
 102 /**
 103  * Evaluate a 2x16 floating-point packing function.
 104  */
 105 static uint32_t
 106 pack_2x16(pack_1x16_func_t pack_1x16,
 107           float x, float y)
 108 {
 109    /* From section 8.4 of the GLSL ES 3.00 spec:
 110     *
 111     *    packSnorm2x16
 112     *    -------------
 113     *    The first component of the vector will be written to the least
 114     *    significant bits of the output; the last component will be written to
 115     *    the most significant bits.
 116     *
 117     * The specifications for the other packing functions contain similar
 118     * language.
 119     */
 120    uint32_t u = 0;
 121    u |= ((uint32_t) pack_1x16(x) << 0);
 122    u |= ((uint32_t) pack_1x16(y) << 16);
 123    return u;
 124 }
 125
 126 /**
 127  * Evaluate a 4x8 floating-point packing function.
 128  */
 129 static uint32_t
 130 pack_4x8(pack_1x8_func_t pack_1x8,
 131          float x, float y, float z, float w)
 132 {
 133    /* From section 8.4 of the GLSL 4.30 spec:
 134     *
 135     *    packSnorm4x8
 136     *    ------------
 137     *    The first component of the vector will be written to the least
 138     *    significant bits of the output; the last component will be written to
 139     *    the most significant bits.
 140     *
 141     * The specifications for the other packing functions contain similar
 142     * language.
 143     */
 144    uint32_t u = 0;
 145    u |= ((uint32_t) pack_1x8(x) << 0);
 146    u |= ((uint32_t) pack_1x8(y) << 8);
 147    u |= ((uint32_t) pack_1x8(z) << 16);
 148    u |= ((uint32_t) pack_1x8(w) << 24);
 149    return u;
 150 }
 151
 152 /**
 153  * Evaluate a 2x16 floating-point unpacking function.
 154  */
 155 static void
 156 unpack_2x16(unpack_1x16_func_t unpack_1x16,
 157             uint32_t u,
 158             float *x, float *y)
 159 {
 160     /* From section 8.4 of the GLSL ES 3.00 spec:
 161      *
 162      *    unpackSnorm2x16
 163      *    ---------------
 164      *    The first component of the returned vector will be extracted from
 165      *    the least significant bits of the input; the last component will be
 166      *    extracted from the most significant bits.
 167      *
 168      * The specifications for the other unpacking functions contain similar
 169      * language.
 170      */
 171    *x = unpack_1x16((uint16_t) (u & 0xffff));
 172    *y = unpack_1x16((uint16_t) (u >> 16));
 173 }
 174
 175 /**
 176  * Evaluate a 4x8 floating-point unpacking function.
 177  */
 178 static void
 179 unpack_4x8(unpack_1x8_func_t unpack_1x8, uint32_t u,
 180            float *x, float *y, float *z, float *w)
 181 {
 182     /* From section 8.4 of the GLSL 4.30 spec:
 183      *
 184      *    unpackSnorm4x8
 185      *    --------------
 186      *    The first component of the returned vector will be extracted from
 187      *    the least significant bits of the input; the last component will be
 188      *    extracted from the most significant bits.
 189      *
 190      * The specifications for the other unpacking functions contain similar
 191      * language.
 192      */
 193    *x = unpack_1x8((uint8_t) (u & 0xff));
 194    *y = unpack_1x8((uint8_t) (u >> 8));
 195    *z = unpack_1x8((uint8_t) (u >> 16));
 196    *w = unpack_1x8((uint8_t) (u >> 24));
 197 }
 198
 199 /**
 200  * Evaluate one component of packSnorm4x8.
 201  */
 202 static uint8_t
 203 pack_snorm_1x8(float x)
 204 {
 205     /* From section 8.4 of the GLSL 4.30 spec:
 206      *
 207      *    packSnorm4x8
 208      *    ------------
 209      *    The conversion for component c of v to fixed point is done as
 210      *    follows:
 211      *
 212      *      packSnorm4x8: round(clamp(c, -1, +1) * 127.0)
 213      *
 214      * We must first cast the float to an int, because casting a negative
 215      * float to a uint is undefined.
 216      */
 217    return (uint8_t) (int8_t)
 218           _mesa_round_to_even(CLAMP(x, -1.0f, +1.0f) * 127.0f);
 219 }
 220
 221 /**
 222  * Evaluate one component of packSnorm2x16.
 223  */
 224 static uint16_t
 225 pack_snorm_1x16(float x)
 226 {
 227     /* From section 8.4 of the GLSL ES 3.00 spec:
 228      *
 229      *    packSnorm2x16
 230      *    -------------
 231      *    The conversion for component c of v to fixed point is done as
 232      *    follows:
 233      *
 234      *      packSnorm2x16: round(clamp(c, -1, +1) * 32767.0)
 235      *
 236      * We must first cast the float to an int, because casting a negative
 237      * float to a uint is undefined.
 238      */
 239    return (uint16_t) (int16_t)
 240           _mesa_round_to_even(CLAMP(x, -1.0f, +1.0f) * 32767.0f);
 241 }
 242
 243 /**
 244  * Evaluate one component of unpackSnorm4x8.
 245  */
 246 static float
 247 unpack_snorm_1x8(uint8_t u)
 248 {
 249     /* From section 8.4 of the GLSL 4.30 spec:
 250      *
 251      *    unpackSnorm4x8
 252      *    --------------
 253      *    The conversion for unpacked fixed-point value f to floating point is
 254      *    done as follows:
 255      *
 256      *       unpackSnorm4x8: clamp(f / 127.0, -1, +1)
 257      */
 258    return CLAMP((int8_t) u / 127.0f, -1.0f, +1.0f);
 259 }
 260
 261 /**
 262  * Evaluate one component of unpackSnorm2x16.
 263  */
 264 static float
 265 unpack_snorm_1x16(uint16_t u)
 266 {
 267     /* From section 8.4 of the GLSL ES 3.00 spec:
 268      *
 269      *    unpackSnorm2x16
 270      *    ---------------
 271      *    The conversion for unpacked fixed-point value f to floating point is
 272      *    done as follows:
 273      *
 274      *       unpackSnorm2x16: clamp(f / 32767.0, -1, +1)
 275      */
 276    return CLAMP((int16_t) u / 32767.0f, -1.0f, +1.0f);
 277 }
 278
 279 /**
 280  * Evaluate one component packUnorm4x8.
 281  */
 282 static uint8_t
 283 pack_unorm_1x8(float x)
 284 {
 285     /* From section 8.4 of the GLSL 4.30 spec:
 286      *
 287      *    packUnorm4x8
 288      *    ------------
 289      *    The conversion for component c of v to fixed point is done as
 290      *    follows:
 291      *
 292      *       packUnorm4x8: round(clamp(c, 0, +1) * 255.0)
 293      */
 294    return (uint8_t) _mesa_round_to_even(CLAMP(x, 0.0f, 1.0f) * 255.0f);
 295 }
 296
 297 /**
 298  * Evaluate one component packUnorm2x16.
 299  */
 300 static uint16_t
 301 pack_unorm_1x16(float x)
 302 {
 303     /* From section 8.4 of the GLSL ES 3.00 spec:
 304      *
 305      *    packUnorm2x16
 306      *    -------------
 307      *    The conversion for component c of v to fixed point is done as
 308      *    follows:
 309      *
 310      *       packUnorm2x16: round(clamp(c, 0, +1) * 65535.0)
 311      */
 312    return (uint16_t) _mesa_round_to_even(CLAMP(x, 0.0f, 1.0f) * 65535.0f);
 313 }
 314
 315 /**
 316  * Evaluate one component of unpackUnorm4x8.
 317  */
 318 static float
 319 unpack_unorm_1x8(uint8_t u)
 320 {
 321     /* From section 8.4 of the GLSL 4.30 spec:
 322      *
 323      *    unpackUnorm4x8
 324      *    --------------
 325      *    The conversion for unpacked fixed-point value f to floating point is
 326      *    done as follows:
 327      *
 328      *       unpackUnorm4x8: f / 255.0
 329      */
 330    return (float) u / 255.0f;
 331 }
 332
 333 /**
 334  * Evaluate one component of unpackUnorm2x16.
 335  */
 336 static float
 337 unpack_unorm_1x16(uint16_t u)
 338 {
 339     /* From section 8.4 of the GLSL ES 3.00 spec:
 340      *
 341      *    unpackUnorm2x16
 342      *    ---------------
 343      *    The conversion for unpacked fixed-point value f to floating point is
 344      *    done as follows:
 345      *
 346      *       unpackUnorm2x16: f / 65535.0
 347      */
 348    return (float) u / 65535.0f;
 349 }
 350
 351 /**
 352  * Evaluate one component of packHalf2x16.
 353  */
 354 static uint16_t
 355 pack_half_1x16(float x)
 356 {
 357    return _mesa_float_to_half(x);
 358 }
 359
 360 /**
 361  * Evaluate one component of unpackHalf2x16.
 362  */
 363 static float
 364 unpack_half_1x16(uint16_t u)
 365 {
 366    return _mesa_half_to_float(u);
 367 }
 368
 369 ir_constant *
 370 ir_rvalue::constant_expression_value(struct hash_table *variable_context)
 371 {
 372    assert(this->type->is_error());
 373    return NULL;
 374 }
 375
 376 ir_constant *
 377 ir_expression::constant_expression_value(struct hash_table *variable_context)
 378 {
 379    if (this->type->is_error())
 380       return NULL;
 381
 382    ir_constant *op[Elements(this->operands)] = { NULL, };
 383    ir_constant_data data;
 384
 385    memset(&data, 0, sizeof(data));
 386
 387    for (unsigned operand = 0; operand < this->get_num_operands(); operand++) {
 388       op[operand] = this->operands[operand]->constant_expression_value(variable_context);
 389       if (!op[operand])
 390          return NULL;
 391    }
 392
 393    if (op[1] != NULL)
 394       switch (this->operation) {
 395       case ir_binop_lshift:
 396       case ir_binop_rshift:
 397       case ir_binop_vector_extract:
 398       case ir_triop_bitfield_extract:
 399          break;
 400
 401       default:
 402          assert(op[0]->type->base_type == op[1]->type->base_type);
 403          break;
 404       }
 405
 406    bool op0_scalar = op[0]->type->is_scalar();
 407    bool op1_scalar = op[1] != NULL && op[1]->type->is_scalar();
 408
 409    /* When iterating over a vector or matrix's components, we want to increase
 410     * the loop counter.  However, for scalars, we want to stay at 0.
 411     */
 412    unsigned c0_inc = op0_scalar ? 0 : 1;
 413    unsigned c1_inc = op1_scalar ? 0 : 1;
 414    unsigned components;
 415    if (op1_scalar || !op[1]) {
 416       components = op[0]->type->components();
 417    } else {
 418       components = op[1]->type->components();
 419    }
 420
 421    void *ctx = ralloc_parent(this);
 422
 423    /* Handle array operations here, rather than below. */
 424    if (op[0]->type->is_array()) {
 425       assert(op[1] != NULL && op[1]->type->is_array());
 426       switch (this->operation) {
 427       case ir_binop_all_equal:
 428          return new(ctx) ir_constant(op[0]->has_value(op[1]));
 429       case ir_binop_any_nequal:
 430          return new(ctx) ir_constant(!op[0]->has_value(op[1]));
 431       default:
 432          break;
 433       }
 434       return NULL;
 435    }
 436
 437    switch (this->operation) {
 438    case ir_unop_bit_not:
 439        switch (op[0]->type->base_type) {
 440        case GLSL_TYPE_INT:
 441            for (unsigned c = 0; c < components; c++)
 442                data.i[c] = ~ op[0]->value.i[c];
 443            break;
 444        case GLSL_TYPE_UINT:
 445            for (unsigned c = 0; c < components; c++)
 446                data.u[c] = ~ op[0]->value.u[c];
 447            break;
 448        default:
 449            assert(0);
 450        }
 451        break;
 452
 453    case ir_unop_logic_not:
 454       assert(op[0]->type->base_type == GLSL_TYPE_BOOL);
 455       for (unsigned c = 0; c < op[0]->type->components(); c++)
 456          data.b[c] = !op[0]->value.b[c];
 457       break;
 458
 459    case ir_unop_f2i:
 460       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 461       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 462          data.i[c] = (int) op[0]->value.f[c];
 463       }
 464       break;
 465    case ir_unop_f2u:
 466       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 467       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 468          data.i[c] = (unsigned) op[0]->value.f[c];
 469       }
 470       break;
 471    case ir_unop_i2f:
 472       assert(op[0]->type->base_type == GLSL_TYPE_INT);
 473       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 474          data.f[c] = (float) op[0]->value.i[c];
 475       }
 476       break;
 477    case ir_unop_u2f:
 478       assert(op[0]->type->base_type == GLSL_TYPE_UINT);
 479       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 480          data.f[c] = (float) op[0]->value.u[c];
 481       }
 482       break;
 483    case ir_unop_b2f:
 484       assert(op[0]->type->base_type == GLSL_TYPE_BOOL);
 485       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 486          data.f[c] = op[0]->value.b[c] ? 1.0F : 0.0F;
 487       }
 488       break;
 489    case ir_unop_f2b:
 490       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 491       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 492          data.b[c] = op[0]->value.f[c] != 0.0F ? true : false;
 493       }
 494       break;
 495    case ir_unop_b2i:
 496       assert(op[0]->type->base_type == GLSL_TYPE_BOOL);
 497       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 498          data.u[c] = op[0]->value.b[c] ? 1 : 0;
 499       }
 500       break;
 501    case ir_unop_i2b:
 502       assert(op[0]->type->is_integer());
 503       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 504          data.b[c] = op[0]->value.u[c] ? true : false;
 505       }
 506       break;
 507    case ir_unop_u2i:
 508       assert(op[0]->type->base_type == GLSL_TYPE_UINT);
 509       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 510          data.i[c] = op[0]->value.u[c];
 511       }
 512       break;
 513    case ir_unop_i2u:
 514       assert(op[0]->type->base_type == GLSL_TYPE_INT);
 515       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 516          data.u[c] = op[0]->value.i[c];
 517       }
 518       break;
 519    case ir_unop_bitcast_i2f:
 520       assert(op[0]->type->base_type == GLSL_TYPE_INT);
 521       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 522          data.f[c] = bitcast_u2f(op[0]->value.i[c]);
 523       }
 524       break;
 525    case ir_unop_bitcast_f2i:
 526       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 527       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 528          data.i[c] = bitcast_f2u(op[0]->value.f[c]);
 529       }
 530       break;
 531    case ir_unop_bitcast_u2f:
 532       assert(op[0]->type->base_type == GLSL_TYPE_UINT);
 533       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 534          data.f[c] = bitcast_u2f(op[0]->value.u[c]);
 535       }
 536       break;
 537    case ir_unop_bitcast_f2u:
 538       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 539       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 540          data.u[c] = bitcast_f2u(op[0]->value.f[c]);
 541       }
 542       break;
 543    case ir_unop_any:
 544       assert(op[0]->type->is_boolean());
 545       data.b[0] = false;
 546       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 547          if (op[0]->value.b[c])
 548             data.b[0] = true;
 549       }
 550       break;
 551
 552    case ir_unop_trunc:
 553       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 554       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 555          data.f[c] = truncf(op[0]->value.f[c]);
 556       }
 557       break;
 558
 559    case ir_unop_round_even:
 560       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 561       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 562          data.f[c] = _mesa_round_to_even(op[0]->value.f[c]);
 563       }
 564       break;
 565
 566    case ir_unop_ceil:
 567       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 568       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 569          data.f[c] = ceilf(op[0]->value.f[c]);
 570       }
 571       break;
 572
 573    case ir_unop_floor:
 574       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 575       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 576          data.f[c] = floorf(op[0]->value.f[c]);
 577       }
 578       break;
 579
 580    case ir_unop_fract:
 581       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 582          switch (this->type->base_type) {
 583          case GLSL_TYPE_UINT:
 584             data.u[c] = 0;
 585             break;
 586          case GLSL_TYPE_INT:
 587             data.i[c] = 0;
 588             break;
 589          case GLSL_TYPE_FLOAT:
 590             data.f[c] = op[0]->value.f[c] - floor(op[0]->value.f[c]);
 591             break;
 592          default:
 593             assert(0);
 594          }
 595       }
 596       break;
 597
 598    case ir_unop_sin:
 599    case ir_unop_sin_reduced:
 600       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 601       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 602          data.f[c] = sinf(op[0]->value.f[c]);
 603       }
 604       break;
 605
 606    case ir_unop_cos:
 607    case ir_unop_cos_reduced:
 608       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 609       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 610          data.f[c] = cosf(op[0]->value.f[c]);
 611       }
 612       break;
 613
 614    case ir_unop_neg:
 615       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 616          switch (this->type->base_type) {
 617          case GLSL_TYPE_UINT:
 618             data.u[c] = -((int) op[0]->value.u[c]);
 619             break;
 620          case GLSL_TYPE_INT:
 621             data.i[c] = -op[0]->value.i[c];
 622             break;
 623          case GLSL_TYPE_FLOAT:
 624             data.f[c] = -op[0]->value.f[c];
 625             break;
 626          default:
 627             assert(0);
 628          }
 629       }
 630       break;
 631
 632    case ir_unop_abs:
 633       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 634          switch (this->type->base_type) {
 635          case GLSL_TYPE_UINT:
 636             data.u[c] = op[0]->value.u[c];
 637             break;
 638          case GLSL_TYPE_INT:
 639             data.i[c] = op[0]->value.i[c];
 640             if (data.i[c] < 0)
 641                data.i[c] = -data.i[c];
 642             break;
 643          case GLSL_TYPE_FLOAT:
 644             data.f[c] = fabs(op[0]->value.f[c]);
 645             break;
 646          default:
 647             assert(0);
 648          }
 649       }
 650       break;
 651
 652    case ir_unop_sign:
 653       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 654          switch (this->type->base_type) {
 655          case GLSL_TYPE_UINT:
 656             data.u[c] = op[0]->value.i[c] > 0;
 657             break;
 658          case GLSL_TYPE_INT:
 659             data.i[c] = (op[0]->value.i[c] > 0) - (op[0]->value.i[c] < 0);
 660             break;
 661          case GLSL_TYPE_FLOAT:
 662             data.f[c] = float((op[0]->value.f[c] > 0)-(op[0]->value.f[c] < 0));
 663             break;
 664          default:
 665             assert(0);
 666          }
 667       }
 668       break;
 669
 670    case ir_unop_rcp:
 671       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 672       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 673          switch (this->type->base_type) {
 674          case GLSL_TYPE_UINT:
 675             if (op[0]->value.u[c] != 0.0)
 676                data.u[c] = 1 / op[0]->value.u[c];
 677             break;
 678          case GLSL_TYPE_INT:
 679             if (op[0]->value.i[c] != 0.0)
 680                data.i[c] = 1 / op[0]->value.i[c];
 681             break;
 682          case GLSL_TYPE_FLOAT:
 683             if (op[0]->value.f[c] != 0.0)
 684                data.f[c] = 1.0F / op[0]->value.f[c];
 685             break;
 686          default:
 687             assert(0);
 688          }
 689       }
 690       break;
 691
 692    case ir_unop_rsq:
 693       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 694       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 695          data.f[c] = 1.0F / sqrtf(op[0]->value.f[c]);
 696       }
 697       break;
 698
 699    case ir_unop_sqrt:
 700       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 701       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 702          data.f[c] = sqrtf(op[0]->value.f[c]);
 703       }
 704       break;
 705
 706    case ir_unop_exp:
 707       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 708       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 709          data.f[c] = expf(op[0]->value.f[c]);
 710       }
 711       break;
 712
 713    case ir_unop_exp2:
 714       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 715       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 716          data.f[c] = exp2f(op[0]->value.f[c]);
 717       }
 718       break;
 719
 720    case ir_unop_log:
 721       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 722       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 723          data.f[c] = logf(op[0]->value.f[c]);
 724       }
 725       break;
 726
 727    case ir_unop_log2:
 728       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 729       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 730          data.f[c] = log2f(op[0]->value.f[c]);
 731       }
 732       break;
 733
 734    case ir_unop_dFdx:
 735    case ir_unop_dFdy:
 736       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 737       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 738          data.f[c] = 0.0;
 739       }
 740       break;
 741
 742    case ir_unop_pack_snorm_2x16:
 743       assert(op[0]->type == glsl_type::vec2_type);
 744       data.u[0] = pack_2x16(pack_snorm_1x16,
 745                             op[0]->value.f[0],
 746                             op[0]->value.f[1]);
 747       break;
 748    case ir_unop_pack_snorm_4x8:
 749       assert(op[0]->type == glsl_type::vec4_type);
 750       data.u[0] = pack_4x8(pack_snorm_1x8,
 751                            op[0]->value.f[0],
 752                            op[0]->value.f[1],
 753                            op[0]->value.f[2],
 754                            op[0]->value.f[3]);
 755       break;
 756    case ir_unop_unpack_snorm_2x16:
 757       assert(op[0]->type == glsl_type::uint_type);
 758       unpack_2x16(unpack_snorm_1x16,
 759                   op[0]->value.u[0],
 760                   &data.f[0], &data.f[1]);
 761       break;
 762    case ir_unop_unpack_snorm_4x8:
 763       assert(op[0]->type == glsl_type::uint_type);
 764       unpack_4x8(unpack_snorm_1x8,
 765                  op[0]->value.u[0],
 766                  &data.f[0], &data.f[1], &data.f[2], &data.f[3]);
 767       break;
 768    case ir_unop_pack_unorm_2x16:
 769       assert(op[0]->type == glsl_type::vec2_type);
 770       data.u[0] = pack_2x16(pack_unorm_1x16,
 771                             op[0]->value.f[0],
 772                             op[0]->value.f[1]);
 773       break;
 774    case ir_unop_pack_unorm_4x8:
 775       assert(op[0]->type == glsl_type::vec4_type);
 776       data.u[0] = pack_4x8(pack_unorm_1x8,
 777                            op[0]->value.f[0],
 778                            op[0]->value.f[1],
 779                            op[0]->value.f[2],
 780                            op[0]->value.f[3]);
 781       break;
 782    case ir_unop_unpack_unorm_2x16:
 783       assert(op[0]->type == glsl_type::uint_type);
 784       unpack_2x16(unpack_unorm_1x16,
 785                   op[0]->value.u[0],
 786                   &data.f[0], &data.f[1]);
 787       break;
 788    case ir_unop_unpack_unorm_4x8:
 789       assert(op[0]->type == glsl_type::uint_type);
 790       unpack_4x8(unpack_unorm_1x8,
 791                  op[0]->value.u[0],
 792                  &data.f[0], &data.f[1], &data.f[2], &data.f[3]);
 793       break;
 794    case ir_unop_pack_half_2x16:
 795       assert(op[0]->type == glsl_type::vec2_type);
 796       data.u[0] = pack_2x16(pack_half_1x16,
 797                             op[0]->value.f[0],
 798                             op[0]->value.f[1]);
 799       break;
 800    case ir_unop_unpack_half_2x16:
 801       assert(op[0]->type == glsl_type::uint_type);
 802       unpack_2x16(unpack_half_1x16,
 803                   op[0]->value.u[0],
 804                   &data.f[0], &data.f[1]);
 805       break;
 806    case ir_binop_pow:
 807       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
 808       for (unsigned c = 0; c < op[0]->type->components(); c++) {
 809          data.f[c] = powf(op[0]->value.f[c], op[1]->value.f[c]);
 810       }
 811       break;
 812
 813    case ir_binop_dot:
 814       data.f[0] = dot(op[0], op[1]);
 815       break;
 816
 817    case ir_binop_min:
 818       assert(op[0]->type == op[1]->type || op0_scalar || op1_scalar);
 819       for (unsigned c = 0, c0 = 0, c1 = 0;
 820            c < components;
 821            c0 += c0_inc, c1 += c1_inc, c++) {
 822
 823          switch (op[0]->type->base_type) {
 824          case GLSL_TYPE_UINT:
 825             data.u[c] = MIN2(op[0]->value.u[c0], op[1]->value.u[c1]);
 826             break;
 827          case GLSL_TYPE_INT:
 828             data.i[c] = MIN2(op[0]->value.i[c0], op[1]->value.i[c1]);
 829             break;
 830          case GLSL_TYPE_FLOAT:
 831             data.f[c] = MIN2(op[0]->value.f[c0], op[1]->value.f[c1]);
 832             break;
 833          default:
 834             assert(0);
 835          }
 836       }
 837
 838       break;
 839    case ir_binop_max:
 840       assert(op[0]->type == op[1]->type || op0_scalar || op1_scalar);
 841       for (unsigned c = 0, c0 = 0, c1 = 0;
 842            c < components;
 843            c0 += c0_inc, c1 += c1_inc, c++) {
 844
 845          switch (op[0]->type->base_type) {
 846          case GLSL_TYPE_UINT:
 847             data.u[c] = MAX2(op[0]->value.u[c0], op[1]->value.u[c1]);
 848             break;
 849          case GLSL_TYPE_INT:
 850             data.i[c] = MAX2(op[0]->value.i[c0], op[1]->value.i[c1]);
 851             break;
 852          case GLSL_TYPE_FLOAT:
 853             data.f[c] = MAX2(op[0]->value.f[c0], op[1]->value.f[c1]);
 854             break;
 855          default:
 856             assert(0);
 857          }
 858       }
 859       break;
 860
 861    case ir_binop_add:
 862       assert(op[0]->type == op[1]->type || op0_scalar || op1_scalar);
 863       for (unsigned c = 0, c0 = 0, c1 = 0;
 864            c < components;
 865            c0 += c0_inc, c1 += c1_inc, c++) {
 866
 867          switch (op[0]->type->base_type) {
 868          case GLSL_TYPE_UINT:
 869             data.u[c] = op[0]->value.u[c0] + op[1]->value.u[c1];
 870             break;
 871          case GLSL_TYPE_INT:
 872             data.i[c] = op[0]->value.i[c0] + op[1]->value.i[c1];
 873             break;
 874          case GLSL_TYPE_FLOAT:
 875             data.f[c] = op[0]->value.f[c0] + op[1]->value.f[c1];
 876             break;
 877          default:
 878             assert(0);
 879          }
 880       }
 881
 882       break;
 883    case ir_binop_sub:
 884       assert(op[0]->type == op[1]->type || op0_scalar || op1_scalar);
 885       for (unsigned c = 0, c0 = 0, c1 = 0;
 886            c < components;
 887            c0 += c0_inc, c1 += c1_inc, c++) {
 888
 889          switch (op[0]->type->base_type) {
 890          case GLSL_TYPE_UINT:
 891             data.u[c] = op[0]->value.u[c0] - op[1]->value.u[c1];
 892             break;
 893          case GLSL_TYPE_INT:
 894             data.i[c] = op[0]->value.i[c0] - op[1]->value.i[c1];
 895             break;
 896          case GLSL_TYPE_FLOAT:
 897             data.f[c] = op[0]->value.f[c0] - op[1]->value.f[c1];
 898             break;
 899          default:
 900             assert(0);
 901          }
 902       }
 903
 904       break;
 905    case ir_binop_mul:
 906       /* Check for equal types, or unequal types involving scalars */
 907       if ((op[0]->type == op[1]->type && !op[0]->type->is_matrix())
 908           || op0_scalar || op1_scalar) {
 909          for (unsigned c = 0, c0 = 0, c1 = 0;
 910               c < components;
 911               c0 += c0_inc, c1 += c1_inc, c++) {
 912
 913             switch (op[0]->type->base_type) {
 914             case GLSL_TYPE_UINT:
 915                data.u[c] = op[0]->value.u[c0] * op[1]->value.u[c1];
 916                break;
 917             case GLSL_TYPE_INT:
 918                data.i[c] = op[0]->value.i[c0] * op[1]->value.i[c1];
 919                break;
 920             case GLSL_TYPE_FLOAT:
 921                data.f[c] = op[0]->value.f[c0] * op[1]->value.f[c1];
 922                break;
 923             default:
 924                assert(0);
 925             }
 926          }
 927       } else {
 928          assert(op[0]->type->is_matrix() || op[1]->type->is_matrix());
 929
 930          /* Multiply an N-by-M matrix with an M-by-P matrix.  Since either
 931           * matrix can be a GLSL vector, either N or P can be 1.
 932           *
 933           * For vec*mat, the vector is treated as a row vector.  This
 934           * means the vector is a 1-row x M-column matrix.
 935           *
 936           * For mat*vec, the vector is treated as a column vector.  Since
 937           * matrix_columns is 1 for vectors, this just works.
 938           */
 939          const unsigned n = op[0]->type->is_vector()
 940             ? 1 : op[0]->type->vector_elements;
 941          const unsigned m = op[1]->type->vector_elements;
 942          const unsigned p = op[1]->type->matrix_columns;
 943          for (unsigned j = 0; j < p; j++) {
 944             for (unsigned i = 0; i < n; i++) {
 945                for (unsigned k = 0; k < m; k++) {
 946                   data.f[i+n*j] += op[0]->value.f[i+n*k]*op[1]->value.f[k+m*j];
 947                }
 948             }
 949          }
 950       }
 951
 952       break;
 953    case ir_binop_div:
 954       /* FINISHME: Emit warning when division-by-zero is detected. */
 955       assert(op[0]->type == op[1]->type || op0_scalar || op1_scalar);
 956       for (unsigned c = 0, c0 = 0, c1 = 0;
 957            c < components;
 958            c0 += c0_inc, c1 += c1_inc, c++) {
 959
 960          switch (op[0]->type->base_type) {
 961          case GLSL_TYPE_UINT:
 962             if (op[1]->value.u[c1] == 0) {
 963                data.u[c] = 0;
 964             } else {
 965                data.u[c] = op[0]->value.u[c0] / op[1]->value.u[c1];
 966             }
 967             break;
 968          case GLSL_TYPE_INT:
 969             if (op[1]->value.i[c1] == 0) {
 970                data.i[c] = 0;
 971             } else {
 972                data.i[c] = op[0]->value.i[c0] / op[1]->value.i[c1];
 973             }
 974             break;
 975          case GLSL_TYPE_FLOAT:
 976             data.f[c] = op[0]->value.f[c0] / op[1]->value.f[c1];
 977             break;
 978          default:
 979             assert(0);
 980          }
 981       }
 982
 983       break;
 984    case ir_binop_mod:
 985       /* FINISHME: Emit warning when division-by-zero is detected. */
 986       assert(op[0]->type == op[1]->type || op0_scalar || op1_scalar);
 987       for (unsigned c = 0, c0 = 0, c1 = 0;
 988            c < components;
 989            c0 += c0_inc, c1 += c1_inc, c++) {
 990
 991          switch (op[0]->type->base_type) {
 992          case GLSL_TYPE_UINT:
 993             if (op[1]->value.u[c1] == 0) {
 994                data.u[c] = 0;
 995             } else {
 996                data.u[c] = op[0]->value.u[c0] % op[1]->value.u[c1];
 997             }
 998             break;
 999          case GLSL_TYPE_INT:
1000             if (op[1]->value.i[c1] == 0) {
1001                data.i[c] = 0;
1002             } else {
1003                data.i[c] = op[0]->value.i[c0] % op[1]->value.i[c1];
1004             }
1005             break;
1006          case GLSL_TYPE_FLOAT:
1007             /* We don't use fmod because it rounds toward zero; GLSL specifies
1008              * the use of floor.
1009              */
1010             data.f[c] = op[0]->value.f[c0] - op[1]->value.f[c1]
1011                * floorf(op[0]->value.f[c0] / op[1]->value.f[c1]);
1012             break;
1013          default:
1014             assert(0);
1015          }
1016       }
1017
1018       break;
1019
1020    case ir_binop_logic_and:
1021       assert(op[0]->type->base_type == GLSL_TYPE_BOOL);
1022       for (unsigned c = 0; c < op[0]->type->components(); c++)
1023          data.b[c] = op[0]->value.b[c] && op[1]->value.b[c];
1024       break;
1025    case ir_binop_logic_xor:
1026       assert(op[0]->type->base_type == GLSL_TYPE_BOOL);
1027       for (unsigned c = 0; c < op[0]->type->components(); c++)
1028          data.b[c] = op[0]->value.b[c] ^ op[1]->value.b[c];
1029       break;
1030    case ir_binop_logic_or:
1031       assert(op[0]->type->base_type == GLSL_TYPE_BOOL);
1032       for (unsigned c = 0; c < op[0]->type->components(); c++)
1033          data.b[c] = op[0]->value.b[c] || op[1]->value.b[c];
1034       break;
1035
1036    case ir_binop_less:
1037       assert(op[0]->type == op[1]->type);
1038       for (unsigned c = 0; c < op[0]->type->components(); c++) {
1039          switch (op[0]->type->base_type) {
1040          case GLSL_TYPE_UINT:
1041             data.b[c] = op[0]->value.u[c] < op[1]->value.u[c];
1042             break;
1043          case GLSL_TYPE_INT:
1044             data.b[c] = op[0]->value.i[c] < op[1]->value.i[c];
1045             break;
1046          case GLSL_TYPE_FLOAT:
1047             data.b[c] = op[0]->value.f[c] < op[1]->value.f[c];
1048             break;
1049          default:
1050             assert(0);
1051          }
1052       }
1053       break;
1054    case ir_binop_greater:
1055       assert(op[0]->type == op[1]->type);
1056       for (unsigned c = 0; c < op[0]->type->components(); c++) {
1057          switch (op[0]->type->base_type) {
1058          case GLSL_TYPE_UINT:
1059             data.b[c] = op[0]->value.u[c] > op[1]->value.u[c];
1060             break;
1061          case GLSL_TYPE_INT:
1062             data.b[c] = op[0]->value.i[c] > op[1]->value.i[c];
1063             break;
1064          case GLSL_TYPE_FLOAT:
1065             data.b[c] = op[0]->value.f[c] > op[1]->value.f[c];
1066             break;
1067          default:
1068             assert(0);
1069          }
1070       }
1071       break;
1072    case ir_binop_lequal:
1073       assert(op[0]->type == op[1]->type);
1074       for (unsigned c = 0; c < op[0]->type->components(); c++) {
1075          switch (op[0]->type->base_type) {
1076          case GLSL_TYPE_UINT:
1077             data.b[c] = op[0]->value.u[c] <= op[1]->value.u[c];
1078             break;
1079          case GLSL_TYPE_INT:
1080             data.b[c] = op[0]->value.i[c] <= op[1]->value.i[c];
1081             break;
1082          case GLSL_TYPE_FLOAT:
1083             data.b[c] = op[0]->value.f[c] <= op[1]->value.f[c];
1084             break;
1085          default:
1086             assert(0);
1087          }
1088       }
1089       break;
1090    case ir_binop_gequal:
1091       assert(op[0]->type == op[1]->type);
1092       for (unsigned c = 0; c < op[0]->type->components(); c++) {
1093          switch (op[0]->type->base_type) {
1094          case GLSL_TYPE_UINT:
1095             data.b[c] = op[0]->value.u[c] >= op[1]->value.u[c];
1096             break;
1097          case GLSL_TYPE_INT:
1098             data.b[c] = op[0]->value.i[c] >= op[1]->value.i[c];
1099             break;
1100          case GLSL_TYPE_FLOAT:
1101             data.b[c] = op[0]->value.f[c] >= op[1]->value.f[c];
1102             break;
1103          default:
1104             assert(0);
1105          }
1106       }
1107       break;
1108    case ir_binop_equal:
1109       assert(op[0]->type == op[1]->type);
1110       for (unsigned c = 0; c < components; c++) {
1111          switch (op[0]->type->base_type) {
1112          case GLSL_TYPE_UINT:
1113             data.b[c] = op[0]->value.u[c] == op[1]->value.u[c];
1114             break;
1115          case GLSL_TYPE_INT:
1116             data.b[c] = op[0]->value.i[c] == op[1]->value.i[c];
1117             break;
1118          case GLSL_TYPE_FLOAT:
1119             data.b[c] = op[0]->value.f[c] == op[1]->value.f[c];
1120             break;
1121          case GLSL_TYPE_BOOL:
1122             data.b[c] = op[0]->value.b[c] == op[1]->value.b[c];
1123             break;
1124          default:
1125             assert(0);
1126          }
1127       }
1128       break;
1129    case ir_binop_nequal:
1130       assert(op[0]->type == op[1]->type);
1131       for (unsigned c = 0; c < components; c++) {
1132          switch (op[0]->type->base_type) {
1133          case GLSL_TYPE_UINT:
1134             data.b[c] = op[0]->value.u[c] != op[1]->value.u[c];
1135             break;
1136          case GLSL_TYPE_INT:
1137             data.b[c] = op[0]->value.i[c] != op[1]->value.i[c];
1138             break;
1139          case GLSL_TYPE_FLOAT:
1140             data.b[c] = op[0]->value.f[c] != op[1]->value.f[c];
1141             break;
1142          case GLSL_TYPE_BOOL:
1143             data.b[c] = op[0]->value.b[c] != op[1]->value.b[c];
1144             break;
1145          default:
1146             assert(0);
1147          }
1148       }
1149       break;
1150    case ir_binop_all_equal:
1151       data.b[0] = op[0]->has_value(op[1]);
1152       break;
1153    case ir_binop_any_nequal:
1154       data.b[0] = !op[0]->has_value(op[1]);
1155       break;
1156
1157    case ir_binop_lshift:
1158       for (unsigned c = 0, c0 = 0, c1 = 0;
1159            c < components;
1160            c0 += c0_inc, c1 += c1_inc, c++) {
1161
1162           if (op[0]->type->base_type == GLSL_TYPE_INT &&
1163               op[1]->type->base_type == GLSL_TYPE_INT) {
1164               data.i[c] = op[0]->value.i[c0] << op[1]->value.i[c1];
1165
1166           } else if (op[0]->type->base_type == GLSL_TYPE_INT &&
1167                      op[1]->type->base_type == GLSL_TYPE_UINT) {
1168               data.i[c] = op[0]->value.i[c0] << op[1]->value.u[c1];
1169
1170           } else if (op[0]->type->base_type == GLSL_TYPE_UINT &&
1171                      op[1]->type->base_type == GLSL_TYPE_INT) {
1172               data.u[c] = op[0]->value.u[c0] << op[1]->value.i[c1];
1173
1174           } else if (op[0]->type->base_type == GLSL_TYPE_UINT &&
1175                      op[1]->type->base_type == GLSL_TYPE_UINT) {
1176               data.u[c] = op[0]->value.u[c0] << op[1]->value.u[c1];
1177           }
1178       }
1179       break;
1180
1181    case ir_binop_rshift:
1182        for (unsigned c = 0, c0 = 0, c1 = 0;
1183             c < components;
1184             c0 += c0_inc, c1 += c1_inc, c++) {
1185
1186            if (op[0]->type->base_type == GLSL_TYPE_INT &&
1187                op[1]->type->base_type == GLSL_TYPE_INT) {
1188                data.i[c] = op[0]->value.i[c0] >> op[1]->value.i[c1];
1189
1190            } else if (op[0]->type->base_type == GLSL_TYPE_INT &&
1191                       op[1]->type->base_type == GLSL_TYPE_UINT) {
1192                data.i[c] = op[0]->value.i[c0] >> op[1]->value.u[c1];
1193
1194            } else if (op[0]->type->base_type == GLSL_TYPE_UINT &&
1195                       op[1]->type->base_type == GLSL_TYPE_INT) {
1196                data.u[c] = op[0]->value.u[c0] >> op[1]->value.i[c1];
1197
1198            } else if (op[0]->type->base_type == GLSL_TYPE_UINT &&
1199                       op[1]->type->base_type == GLSL_TYPE_UINT) {
1200                data.u[c] = op[0]->value.u[c0] >> op[1]->value.u[c1];
1201            }
1202        }
1203        break;
1204
1205    case ir_binop_bit_and:
1206       for (unsigned c = 0, c0 = 0, c1 = 0;
1207            c < components;
1208            c0 += c0_inc, c1 += c1_inc, c++) {
1209
1210           switch (op[0]->type->base_type) {
1211           case GLSL_TYPE_INT:
1212               data.i[c] = op[0]->value.i[c0] & op[1]->value.i[c1];
1213               break;
1214           case GLSL_TYPE_UINT:
1215               data.u[c] = op[0]->value.u[c0] & op[1]->value.u[c1];
1216               break;
1217           default:
1218               assert(0);
1219           }
1220       }
1221       break;
1222
1223    case ir_binop_bit_or:
1224       for (unsigned c = 0, c0 = 0, c1 = 0;
1225            c < components;
1226            c0 += c0_inc, c1 += c1_inc, c++) {
1227
1228           switch (op[0]->type->base_type) {
1229           case GLSL_TYPE_INT:
1230               data.i[c] = op[0]->value.i[c0] | op[1]->value.i[c1];
1231               break;
1232           case GLSL_TYPE_UINT:
1233               data.u[c] = op[0]->value.u[c0] | op[1]->value.u[c1];
1234               break;
1235           default:
1236               assert(0);
1237           }
1238       }
1239       break;
1240
1241    case ir_binop_vector_extract: {
1242       const int c = CLAMP(op[1]->value.i[0], 0,
1243                           (int) op[0]->type->vector_elements - 1);
1244
1245       switch (op[0]->type->base_type) {
1246       case GLSL_TYPE_UINT:
1247          data.u[0] = op[0]->value.u[c];
1248          break;
1249       case GLSL_TYPE_INT:
1250          data.i[0] = op[0]->value.i[c];
1251          break;
1252       case GLSL_TYPE_FLOAT:
1253          data.f[0] = op[0]->value.f[c];
1254          break;
1255       case GLSL_TYPE_BOOL:
1256          data.b[0] = op[0]->value.b[c];
1257          break;
1258       default:
1259          assert(0);
1260       }
1261       break;
1262    }
1263
1264    case ir_binop_bit_xor:
1265       for (unsigned c = 0, c0 = 0, c1 = 0;
1266            c < components;
1267            c0 += c0_inc, c1 += c1_inc, c++) {
1268
1269           switch (op[0]->type->base_type) {
1270           case GLSL_TYPE_INT:
1271               data.i[c] = op[0]->value.i[c0] ^ op[1]->value.i[c1];
1272               break;
1273           case GLSL_TYPE_UINT:
1274               data.u[c] = op[0]->value.u[c0] ^ op[1]->value.u[c1];
1275               break;
1276           default:
1277               assert(0);
1278           }
1279       }
1280       break;
1281
1282    case ir_unop_bitfield_reverse:
1283       /* http://graphics.stanford.edu/~seander/bithacks.html#BitReverseObvious */
1284       for (unsigned c = 0; c < components; c++) {
1285          unsigned int v = op[0]->value.u[c]; // input bits to be reversed
1286          unsigned int r = v; // r will be reversed bits of v; first get LSB of v
1287          int s = sizeof(v) * CHAR_BIT - 1; // extra shift needed at end
1288
1289          for (v >>= 1; v; v >>= 1) {
1290             r <<= 1;
1291             r |= v & 1;
1292             s--;
1293          }
1294          r <<= s; // shift when v's highest bits are zero
1295
1296          data.u[c] = r;
1297       }
1298       break;
1299
1300    case ir_unop_bit_count:
1301       for (unsigned c = 0; c < components; c++) {
1302          unsigned count = 0;
1303          unsigned v = op[0]->value.u[c];
1304
1305          for (; v; count++) {
1306             v &= v - 1;
1307          }
1308          data.u[c] = count;
1309       }
1310       break;
1311
1312    case ir_unop_find_msb:
1313       for (unsigned c = 0; c < components; c++) {
1314          int v = op[0]->value.i[c];
1315
1316          if (v == 0 || (op[0]->type->base_type == GLSL_TYPE_INT && v == -1))
1317             data.i[c] = -1;
1318          else {
1319             int count = 0;
1320             int top_bit = op[0]->type->base_type == GLSL_TYPE_UINT
1321                           ? 0 : v & (1 << 31);
1322
1323             while (((v & (1 << 31)) == top_bit) && count != 32) {
1324                count++;
1325                v <<= 1;
1326             }
1327
1328             data.i[c] = 31 - count;
1329          }
1330       }
1331       break;
1332
1333    case ir_unop_find_lsb:
1334       for (unsigned c = 0; c < components; c++) {
1335          if (op[0]->value.i[c] == 0)
1336             data.i[c] = -1;
1337          else {
1338             unsigned pos = 0;
1339             unsigned v = op[0]->value.u[c];
1340
1341             for (; !(v & 1); v >>= 1) {
1342                pos++;
1343             }
1344             data.u[c] = pos;
1345          }
1346       }
1347       break;
1348
1349    case ir_triop_bitfield_extract: {
1350       int offset = op[1]->value.i[0];
1351       int bits = op[2]->value.i[0];
1352
1353       for (unsigned c = 0; c < components; c++) {
1354          if (bits == 0)
1355             data.u[c] = 0;
1356          else if (offset < 0 || bits < 0)
1357             data.u[c] = 0; /* Undefined, per spec. */
1358          else if (offset + bits > 32)
1359             data.u[c] = 0; /* Undefined, per spec. */
1360          else {
1361             if (op[0]->type->base_type == GLSL_TYPE_INT) {
1362                /* int so that the right shift will sign-extend. */
1363                int value = op[0]->value.i[c];
1364                value <<= 32 - bits - offset;
1365                value >>= 32 - bits;
1366                data.i[c] = value;
1367             } else {
1368                unsigned value = op[0]->value.u[c];
1369                value <<= 32 - bits - offset;
1370                value >>= 32 - bits;
1371                data.u[c] = value;
1372             }
1373          }
1374       }
1375       break;
1376    }
1377
1378    case ir_triop_lrp: {
1379       assert(op[0]->type->base_type == GLSL_TYPE_FLOAT);
1380       assert(op[1]->type->base_type == GLSL_TYPE_FLOAT);
1381       assert(op[2]->type->base_type == GLSL_TYPE_FLOAT);
1382
1383       unsigned c2_inc = op[2]->type->is_scalar() ? 0 : 1;
1384       for (unsigned c = 0, c2 = 0; c < components; c2 += c2_inc, c++) {
1385          data.f[c] = op[0]->value.f[c] * (1.0f - op[2]->value.f[c2]) +
1386                      (op[1]->value.f[c] * op[2]->value.f[c2]);
1387       }
1388       break;
1389    }
1390
1391    case ir_triop_vector_insert: {
1392       const unsigned idx = op[2]->value.u[0];
1393
1394       memcpy(&data, &op[0]->value, sizeof(data));
1395
1396       switch (this->type->base_type) {
1397       case GLSL_TYPE_INT:
1398          data.i[idx] = op[1]->value.i[0];
1399          break;
1400       case GLSL_TYPE_UINT:
1401          data.u[idx] = op[1]->value.u[0];
1402          break;
1403       case GLSL_TYPE_FLOAT:
1404          data.f[idx] = op[1]->value.f[0];
1405          break;
1406       case GLSL_TYPE_BOOL:
1407          data.b[idx] = op[1]->value.b[0];
1408          break;
1409       default:
1410          assert(!"Should not get here.");
1411          break;
1412       }
1413       break;
1414    }
1415
1416    case ir_quadop_bitfield_insert: {
1417       int offset = op[2]->value.i[0];
1418       int bits = op[3]->value.i[0];
1419
1420       for (unsigned c = 0; c < components; c++) {
1421          if (bits == 0)
1422             data.u[c] = op[0]->value.u[c];
1423          else if (offset < 0 || bits < 0)
1424             data.u[c] = 0; /* Undefined, per spec. */
1425          else if (offset + bits > 32)
1426             data.u[c] = 0; /* Undefined, per spec. */
1427          else {
1428             unsigned insert_mask = ((1 << bits) - 1) << offset;
1429
1430             unsigned insert = op[1]->value.u[c];
1431             insert <<= offset;
1432             insert &= insert_mask;
1433
1434             unsigned base = op[0]->value.u[c];
1435             base &= ~insert_mask;
1436
1437             data.u[c] = base | insert;
1438          }
1439       }
1440       break;
1441    }
1442
1443    case ir_quadop_vector:
1444       for (unsigned c = 0; c < this->type->vector_elements; c++) {
1445          switch (this->type->base_type) {
1446          case GLSL_TYPE_INT:
1447             data.i[c] = op[c]->value.i[0];
1448             break;
1449          case GLSL_TYPE_UINT:
1450             data.u[c] = op[c]->value.u[0];
1451             break;
1452          case GLSL_TYPE_FLOAT:
1453             data.f[c] = op[c]->value.f[0];
1454             break;
1455          default:
1456             assert(0);
1457          }
1458       }
1459       break;
1460
1461    default:
1462       /* FINISHME: Should handle all expression types. */
1463       return NULL;
1464    }
1465
1466    return new(ctx) ir_constant(this->type, &data);
1467 }
1468
1469
1470 ir_constant *
1471 ir_texture::constant_expression_value(struct hash_table *variable_context)
1472 {
1473    /* texture lookups aren't constant expressions */
1474    return NULL;
1475 }
1476
1477
1478 ir_constant *
1479 ir_swizzle::constant_expression_value(struct hash_table *variable_context)
1480 {
1481    ir_constant *v = this->val->constant_expression_value(variable_context);
1482
1483    if (v != NULL) {
1484       ir_constant_data data = { { 0 } };
1485
1486       const unsigned swiz_idx[4] = {
1487          this->mask.x, this->mask.y, this->mask.z, this->mask.w
1488       };
1489
1490       for (unsigned i = 0; i < this->mask.num_components; i++) {
1491          switch (v->type->base_type) {
1492          case GLSL_TYPE_UINT:
1493          case GLSL_TYPE_INT:   data.u[i] = v->value.u[swiz_idx[i]]; break;
1494          case GLSL_TYPE_FLOAT: data.f[i] = v->value.f[swiz_idx[i]]; break;
1495          case GLSL_TYPE_BOOL:  data.b[i] = v->value.b[swiz_idx[i]]; break;
1496          default:              assert(!"Should not get here."); break;
1497          }
1498       }
1499
1500       void *ctx = ralloc_parent(this);
1501       return new(ctx) ir_constant(this->type, &data);
1502    }
1503    return NULL;
1504 }
1505
1506
1507 void
1508 ir_dereference_variable::constant_referenced(struct hash_table *variable_context,
1509                                              ir_constant *&store, int &offset) const
1510 {
1511    if (variable_context) {
1512       store = (ir_constant *)hash_table_find(variable_context, var);
1513       offset = 0;
1514    } else {
1515       store = NULL;
1516       offset = 0;
1517    }
1518 }
1519
1520 ir_constant *
1521 ir_dereference_variable::constant_expression_value(struct hash_table *variable_context)
1522 {
1523    /* This may occur during compile and var->type is glsl_type::error_type */
1524    if (!var)
1525       return NULL;
1526
1527    /* Give priority to the context hashtable, if it exists */
1528    if (variable_context) {
1529       ir_constant *value = (ir_constant *)hash_table_find(variable_context, var);
1530       if(value)
1531          return value;
1532    }
1533
1534    /* The constant_value of a uniform variable is its initializer,
1535     * not the lifetime constant value of the uniform.
1536     */
1537    if (var->mode == ir_var_uniform)
1538       return NULL;
1539
1540    if (!var->constant_value)
1541       return NULL;
1542
1543    return var->constant_value->clone(ralloc_parent(var), NULL);
1544 }
1545
1546
1547 void
1548 ir_dereference_array::constant_referenced(struct hash_table *variable_context,
1549                                           ir_constant *&store, int &offset) const
1550 {
1551    ir_constant *index_c = array_index->constant_expression_value(variable_context);
1552
1553    if (!index_c || !index_c->type->is_scalar() || !index_c->type->is_integer()) {
1554       store = 0;
1555       offset = 0;
1556       return;
1557    }
1558
1559    int index = index_c->type->base_type == GLSL_TYPE_INT ?
1560       index_c->get_int_component(0) :
1561       index_c->get_uint_component(0);
1562
1563    ir_constant *substore;
1564    int suboffset;
1565    const ir_dereference *deref = array->as_dereference();
1566    if (!deref) {
1567       store = 0;
1568       offset = 0;
1569       return;
1570    }
1571
1572    deref->constant_referenced(variable_context, substore, suboffset);
1573
1574    if (!substore) {
1575       store = 0;
1576       offset = 0;
1577       return;
1578    }
1579
1580    const glsl_type *vt = array->type;
1581    if (vt->is_array()) {
1582       store = substore->get_array_element(index);
1583       offset = 0;
1584       return;
1585    }
1586    if (vt->is_matrix()) {
1587       store = substore;
1588       offset = index * vt->vector_elements;
1589       return;
1590    }
1591    if (vt->is_vector()) {
1592       store = substore;
1593       offset = suboffset + index;
1594       return;
1595    }
1596
1597    store = 0;
1598    offset = 0;
1599 }
1600
1601 ir_constant *
1602 ir_dereference_array::constant_expression_value(struct hash_table *variable_context)
1603 {
1604    ir_constant *array = this->array->constant_expression_value(variable_context);
1605    ir_constant *idx = this->array_index->constant_expression_value(variable_context);
1606
1607    if ((array != NULL) && (idx != NULL)) {
1608       void *ctx = ralloc_parent(this);
1609       if (array->type->is_matrix()) {
1610          /* Array access of a matrix results in a vector.
1611           */
1612          const unsigned column = idx->value.u[0];
1613
1614          const glsl_type *const column_type = array->type->column_type();
1615
1616          /* Offset in the constant matrix to the first element of the column
1617           * to be extracted.
1618           */
1619          const unsigned mat_idx = column * column_type->vector_elements;
1620
1621          ir_constant_data data = { { 0 } };
1622
1623          switch (column_type->base_type) {
1624          case GLSL_TYPE_UINT:
1625          case GLSL_TYPE_INT:
1626             for (unsigned i = 0; i < column_type->vector_elements; i++)
1627                data.u[i] = array->value.u[mat_idx + i];
1628
1629             break;
1630
1631          case GLSL_TYPE_FLOAT:
1632             for (unsigned i = 0; i < column_type->vector_elements; i++)
1633                data.f[i] = array->value.f[mat_idx + i];
1634
1635             break;
1636
1637          default:
1638             assert(!"Should not get here.");
1639             break;
1640          }
1641
1642          return new(ctx) ir_constant(column_type, &data);
1643       } else if (array->type->is_vector()) {
1644          const unsigned component = idx->value.u[0];
1645
1646          return new(ctx) ir_constant(array, component);
1647       } else {
1648          const unsigned index = idx->value.u[0];
1649          return array->get_array_element(index)->clone(ctx, NULL);
1650       }
1651    }
1652    return NULL;
1653 }
1654
1655
1656 void
1657 ir_dereference_record::constant_referenced(struct hash_table *variable_context,
1658                                            ir_constant *&store, int &offset) const
1659 {
1660    ir_constant *substore;
1661    int suboffset;
1662    const ir_dereference *deref = record->as_dereference();
1663    if (!deref) {
1664       store = 0;
1665       offset = 0;
1666       return;
1667    }
1668
1669    deref->constant_referenced(variable_context, substore, suboffset);
1670
1671    if (!substore) {
1672       store = 0;
1673       offset = 0;
1674       return;
1675    }
1676
1677    store = substore->get_record_field(field);
1678    offset = 0;
1679 }
1680
1681 ir_constant *
1682 ir_dereference_record::constant_expression_value(struct hash_table *variable_context)
1683 {
1684    ir_constant *v = this->record->constant_expression_value();
1685
1686    return (v != NULL) ? v->get_record_field(this->field) : NULL;
1687 }
1688
1689
1690 ir_constant *
1691 ir_assignment::constant_expression_value(struct hash_table *variable_context)
1692 {
1693    /* FINISHME: Handle CEs involving assignment (return RHS) */
1694    return NULL;
1695 }
1696
1697
1698 ir_constant *
1699 ir_constant::constant_expression_value(struct hash_table *variable_context)
1700 {
1701    return this;
1702 }
1703
1704
1705 ir_constant *
1706 ir_call::constant_expression_value(struct hash_table *variable_context)
1707 {
1708    return this->callee->constant_expression_value(&this->actual_parameters, variable_context);
1709 }
1710
1711
1712 bool ir_function_signature::constant_expression_evaluate_expression_list(const struct exec_list &body,
1713                                                                          struct hash_table *variable_context,
1714                                                                          ir_constant **result)
1715 {
1716    foreach_list(n, &body) {
1717       ir_instruction *inst = (ir_instruction *)n;
1718       switch(inst->ir_type) {
1719
1720          /* (declare () type symbol) */
1721       case ir_type_variable: {
1722          ir_variable *var = inst->as_variable();
1723          hash_table_insert(variable_context, ir_constant::zero(this, var->type), var);
1724          break;
1725       }
1726
1727          /* (assign [condition] (write-mask) (ref) (value)) */
1728       case ir_type_assignment: {
1729          ir_assignment *asg = inst->as_assignment();
1730          if (asg->condition) {
1731             ir_constant *cond = asg->condition->constant_expression_value(variable_context);
1732             if (!cond)
1733                return false;
1734             if (!cond->get_bool_component(0))
1735                break;
1736          }
1737
1738          ir_constant *store = NULL;
1739          int offset = 0;
1740          asg->lhs->constant_referenced(variable_context, store, offset);
1741
1742          if (!store)
1743             return false;
1744
1745          ir_constant *value = asg->rhs->constant_expression_value(variable_context);
1746
1747          if (!value)
1748             return false;
1749
1750          store->copy_masked_offset(value, offset, asg->write_mask);
1751          break;
1752       }
1753
1754          /* (return (expression)) */
1755       case ir_type_return:
1756          assert (result);
1757          *result = inst->as_return()->value->constant_expression_value(variable_context);
1758          return *result != NULL;
1759
1760          /* (call name (ref) (params))*/
1761       case ir_type_call: {
1762          ir_call *call = inst->as_call();
1763
1764          /* Just say no to void functions in constant expressions.  We
1765           * don't need them at that point.
1766           */
1767
1768          if (!call->return_deref)
1769             return false;
1770
1771          ir_constant *store = NULL;
1772          int offset = 0;
1773          call->return_deref->constant_referenced(variable_context, store, offset);
1774
1775          if (!store)
1776             return false;
1777
1778          ir_constant *value = call->constant_expression_value(variable_context);
1779
1780          if(!value)
1781             return false;
1782
1783          store->copy_offset(value, offset);
1784          break;
1785       }
1786
1787          /* (if condition (then-instructions) (else-instructions)) */
1788       case ir_type_if: {
1789          ir_if *iif = inst->as_if();
1790
1791          ir_constant *cond = iif->condition->constant_expression_value(variable_context);
1792          if (!cond || !cond->type->is_boolean())
1793             return false;
1794
1795          exec_list &branch = cond->get_bool_component(0) ? iif->then_instructions : iif->else_instructions;
1796
1797          *result = NULL;
1798          if (!constant_expression_evaluate_expression_list(branch, variable_context, result))
1799             return false;
1800
1801          /* If there was a return in the branch chosen, drop out now. */
1802          if (*result)
1803             return true;
1804
1805          break;
1806       }
1807
1808          /* Every other expression type, we drop out. */
1809       default:
1810          return false;
1811       }
1812    }
1813
1814    /* Reaching the end of the block is not an error condition */
1815    if (result)
1816       *result = NULL;
1817
1818    return true;
1819 }
1820
1821 ir_constant *
1822 ir_function_signature::constant_expression_value(exec_list *actual_parameters, struct hash_table *variable_context)
1823 {
1824    const glsl_type *type = this->return_type;
1825    if (type == glsl_type::void_type)
1826       return NULL;
1827
1828    /* From the GLSL 1.20 spec, page 23:
1829     * "Function calls to user-defined functions (non-built-in functions)
1830     *  cannot be used to form constant expressions."
1831     */
1832    if (!this->is_builtin)
1833       return NULL;
1834
1835    /*
1836     * Of the builtin functions, only the texture lookups and the noise
1837     * ones must not be used in constant expressions.  They all include
1838     * specific opcodes so they don't need to be special-cased at this
1839     * point.
1840     */
1841
1842    /* Initialize the table of dereferencable names with the function
1843     * parameters.  Verify their const-ness on the way.
1844     *
1845     * We expect the correctness of the number of parameters to have
1846     * been checked earlier.
1847     */
1848    hash_table *deref_hash = hash_table_ctor(8, hash_table_pointer_hash,
1849                                             hash_table_pointer_compare);
1850
1851    /* If "origin" is non-NULL, then the function body is there.  So we
1852     * have to use the variable objects from the object with the body,
1853     * but the parameter instanciation on the current object.
1854     */
1855    const exec_node *parameter_info = origin ? origin->parameters.head : parameters.head;
1856
1857    foreach_list(n, actual_parameters) {
1858       ir_constant *constant = ((ir_rvalue *) n)->constant_expression_value(variable_context);
1859       if (constant == NULL) {
1860          hash_table_dtor(deref_hash);
1861          return NULL;
1862       }
1863
1864
1865       ir_variable *var = (ir_variable *)parameter_info;
1866       hash_table_insert(deref_hash, constant, var);
1867
1868       parameter_info = parameter_info->next;
1869    }
1870
1871    ir_constant *result = NULL;
1872
1873    /* Now run the builtin function until something non-constant
1874     * happens or we get the result.
1875     */
1876    if (constant_expression_evaluate_expression_list(origin ? origin->body : body, deref_hash, &result) && result)
1877       result = result->clone(ralloc_parent(this), NULL);
1878
1879    hash_table_dtor(deref_hash);
1880
1881    return result;
1882 }