src/mesa/main/pack.c

   1 /*
   2  * Mesa 3-D graphics library
   3  *
   4  * Copyright (C) 1999-2008  Brian Paul   All Rights Reserved.
   5  * Copyright (C) 2009-2010  VMware, Inc.  All Rights Reserved.
   6  *
   7  * Permission is hereby granted, free of charge, to any person obtaining a
   8  * copy of this software and associated documentation files (the "Software"),
   9  * to deal in the Software without restriction, including without limitation
  10  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  11  * and/or sell copies of the Software, and to permit persons to whom the
  12  * Software is furnished to do so, subject to the following conditions:
  13  *
  14  * The above copyright notice and this permission notice shall be included
  15  * in all copies or substantial portions of the Software.
  16  *
  17  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
  18  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  19  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  20  * THEA AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
  21  * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  22  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
  23  */
  24
  25
  26 /**
  27  * \file pack.c
  28  * Image and pixel span packing and unpacking.
  29  */
  30
  31
  32 /*
  33  * XXX: MSVC takes forever to compile this module for x86_64 unless we disable
  34  * this global optimization.
  35  *
  36  * See also:
  37  * - http://msdn.microsoft.com/en-us/library/1yk3ydd7.aspx
  38  * - http://msdn.microsoft.com/en-us/library/chh3fb0k.aspx
  39  */
  40 #if defined(_MSC_VER) && defined(_M_X64)
  41 #  pragma optimize( "g", off )
  42 #endif
  43
  44
  45 #include "glheader.h"
  46 #include "enums.h"
  47 #include "image.h"
  48 #include "imports.h"
  49 #include "macros.h"
  50 #include "mtypes.h"
  51 #include "pack.h"
  52 #include "pixeltransfer.h"
  53 #include "imports.h"
  54 #include "glformats.h"
  55 #include "format_utils.h"
  56 #include "format_pack.h"
  57
  58
  59 /**
  60  * Flip the 8 bits in each byte of the given array.
  61  *
  62  * \param p array.
  63  * \param n number of bytes.
  64  *
  65  * \todo try this trick to flip bytes someday:
  66  * \code
  67  *  v = ((v & 0x55555555) << 1) | ((v >> 1) & 0x55555555);
  68  *  v = ((v & 0x33333333) << 2) | ((v >> 2) & 0x33333333);
  69  *  v = ((v & 0x0f0f0f0f) << 4) | ((v >> 4) & 0x0f0f0f0f);
  70  * \endcode
  71  */
  72 static void
  73 flip_bytes( GLubyte *p, GLuint n )
  74 {
  75    GLuint i, a, b;
  76    for (i = 0; i < n; i++) {
  77       b = (GLuint) p[i];        /* words are often faster than bytes */
  78       a = ((b & 0x01) << 7) |
  79           ((b & 0x02) << 5) |
  80           ((b & 0x04) << 3) |
  81           ((b & 0x08) << 1) |
  82           ((b & 0x10) >> 1) |
  83           ((b & 0x20) >> 3) |
  84           ((b & 0x40) >> 5) |
  85           ((b & 0x80) >> 7);
  86       p[i] = (GLubyte) a;
  87    }
  88 }
  89
  90
  91
  92 /*
  93  * Unpack a 32x32 pixel polygon stipple from user memory using the
  94  * current pixel unpack settings.
  95  */
  96 void
  97 _mesa_unpack_polygon_stipple( const GLubyte *pattern, GLuint dest[32],
  98                               const struct gl_pixelstore_attrib *unpacking )
  99 {
 100    GLubyte *ptrn = (GLubyte *) _mesa_unpack_image(2, 32, 32, 1, GL_COLOR_INDEX,
 101                                                   GL_BITMAP, pattern, unpacking);
 102    if (ptrn) {
 103       /* Convert pattern from GLubytes to GLuints and handle big/little
 104        * endian differences
 105        */
 106       GLubyte *p = ptrn;
 107       GLint i;
 108       for (i = 0; i < 32; i++) {
 109          dest[i] = (p[0] << 24)
 110                  | (p[1] << 16)
 111                  | (p[2] <<  8)
 112                  | (p[3]      );
 113          p += 4;
 114       }
 115       free(ptrn);
 116    }
 117 }
 118
 119
 120 /*
 121  * Pack polygon stipple into user memory given current pixel packing
 122  * settings.
 123  */
 124 void
 125 _mesa_pack_polygon_stipple( const GLuint pattern[32], GLubyte *dest,
 126                             const struct gl_pixelstore_attrib *packing )
 127 {
 128    /* Convert pattern from GLuints to GLubytes to handle big/little
 129     * endian differences.
 130     */
 131    GLubyte ptrn[32*4];
 132    GLint i;
 133    for (i = 0; i < 32; i++) {
 134       ptrn[i * 4 + 0] = (GLubyte) ((pattern[i] >> 24) & 0xff);
 135       ptrn[i * 4 + 1] = (GLubyte) ((pattern[i] >> 16) & 0xff);
 136       ptrn[i * 4 + 2] = (GLubyte) ((pattern[i] >> 8 ) & 0xff);
 137       ptrn[i * 4 + 3] = (GLubyte) ((pattern[i]      ) & 0xff);
 138    }
 139
 140    _mesa_pack_bitmap(32, 32, ptrn, dest, packing);
 141 }
 142
 143
 144 /*
 145  * Pack bitmap data.
 146  */
 147 void
 148 _mesa_pack_bitmap( GLint width, GLint height, const GLubyte *source,
 149                    GLubyte *dest, const struct gl_pixelstore_attrib *packing )
 150 {
 151    GLint row, width_in_bytes;
 152    const GLubyte *src;
 153
 154    if (!source)
 155       return;
 156
 157    width_in_bytes = DIV_ROUND_UP( width, 8 );
 158    src = source;
 159    for (row = 0; row < height; row++) {
 160       GLubyte *dst = (GLubyte *) _mesa_image_address2d(packing, dest,
 161                        width, height, GL_COLOR_INDEX, GL_BITMAP, row, 0);
 162       if (!dst)
 163          return;
 164
 165       if ((packing->SkipPixels & 7) == 0) {
 166          memcpy( dst, src, width_in_bytes );
 167          if (packing->LsbFirst) {
 168             flip_bytes( dst, width_in_bytes );
 169          }
 170       }
 171       else {
 172          /* handling SkipPixels is a bit tricky (no pun intended!) */
 173          GLint i;
 174          if (packing->LsbFirst) {
 175             GLubyte srcMask = 128;
 176             GLubyte dstMask = 1 << (packing->SkipPixels & 0x7);
 177             const GLubyte *s = src;
 178             GLubyte *d = dst;
 179             *d = 0;
 180             for (i = 0; i < width; i++) {
 181                if (*s & srcMask) {
 182                   *d |= dstMask;
 183                }
 184                if (srcMask == 1) {
 185                   srcMask = 128;
 186                   s++;
 187                }
 188                else {
 189                   srcMask = srcMask >> 1;
 190                }
 191                if (dstMask == 128) {
 192                   dstMask = 1;
 193                   d++;
 194                   *d = 0;
 195                }
 196                else {
 197                   dstMask = dstMask << 1;
 198                }
 199             }
 200          }
 201          else {
 202             GLubyte srcMask = 128;
 203             GLubyte dstMask = 128 >> (packing->SkipPixels & 0x7);
 204             const GLubyte *s = src;
 205             GLubyte *d = dst;
 206             *d = 0;
 207             for (i = 0; i < width; i++) {
 208                if (*s & srcMask) {
 209                   *d |= dstMask;
 210                }
 211                if (srcMask == 1) {
 212                   srcMask = 128;
 213                   s++;
 214                }
 215                else {
 216                   srcMask = srcMask >> 1;
 217                }
 218                if (dstMask == 1) {
 219                   dstMask = 128;
 220                   d++;
 221                   *d = 0;
 222                }
 223                else {
 224                   dstMask = dstMask >> 1;
 225                }
 226             }
 227          }
 228       }
 229       src += width_in_bytes;
 230    }
 231 }
 232
 233
 234 #define SWAP2BYTE(VALUE)                        \
 235    {                                            \
 236       GLubyte *bytes = (GLubyte *) &(VALUE);    \
 237       GLubyte tmp = bytes[0];                   \
 238       bytes[0] = bytes[1];                      \
 239       bytes[1] = tmp;                           \
 240    }
 241
 242 #define SWAP4BYTE(VALUE)                        \
 243    {                                            \
 244       GLubyte *bytes = (GLubyte *) &(VALUE);    \
 245       GLubyte tmp = bytes[0];                   \
 246       bytes[0] = bytes[3];                      \
 247       bytes[3] = tmp;                           \
 248       tmp = bytes[1];                           \
 249       bytes[1] = bytes[2];                      \
 250       bytes[2] = tmp;                           \
 251    }
 252
 253
 254 static void
 255 extract_uint_indexes(GLuint n, GLuint indexes[],
 256                      GLenum srcFormat, GLenum srcType, const GLvoid *src,
 257                      const struct gl_pixelstore_attrib *unpack )
 258 {
 259    assert(srcFormat == GL_COLOR_INDEX || srcFormat == GL_STENCIL_INDEX);
 260
 261    assert(srcType == GL_BITMAP ||
 262           srcType == GL_UNSIGNED_BYTE ||
 263           srcType == GL_BYTE ||
 264           srcType == GL_UNSIGNED_SHORT ||
 265           srcType == GL_SHORT ||
 266           srcType == GL_UNSIGNED_INT ||
 267           srcType == GL_INT ||
 268           srcType == GL_UNSIGNED_INT_24_8_EXT ||
 269           srcType == GL_HALF_FLOAT_ARB ||
 270           srcType == GL_HALF_FLOAT_OES ||
 271           srcType == GL_FLOAT ||
 272           srcType == GL_FLOAT_32_UNSIGNED_INT_24_8_REV);
 273
 274    switch (srcType) {
 275       case GL_BITMAP:
 276          {
 277             GLubyte *ubsrc = (GLubyte *) src;
 278             if (unpack->LsbFirst) {
 279                GLubyte mask = 1 << (unpack->SkipPixels & 0x7);
 280                GLuint i;
 281                for (i = 0; i < n; i++) {
 282                   indexes[i] = (*ubsrc & mask) ? 1 : 0;
 283                   if (mask == 128) {
 284                      mask = 1;
 285                      ubsrc++;
 286                   }
 287                   else {
 288                      mask = mask << 1;
 289                   }
 290                }
 291             }
 292             else {
 293                GLubyte mask = 128 >> (unpack->SkipPixels & 0x7);
 294                GLuint i;
 295                for (i = 0; i < n; i++) {
 296                   indexes[i] = (*ubsrc & mask) ? 1 : 0;
 297                   if (mask == 1) {
 298                      mask = 128;
 299                      ubsrc++;
 300                   }
 301                   else {
 302                      mask = mask >> 1;
 303                   }
 304                }
 305             }
 306          }
 307          break;
 308       case GL_UNSIGNED_BYTE:
 309          {
 310             GLuint i;
 311             const GLubyte *s = (const GLubyte *) src;
 312             for (i = 0; i < n; i++)
 313                indexes[i] = s[i];
 314          }
 315          break;
 316       case GL_BYTE:
 317          {
 318             GLuint i;
 319             const GLbyte *s = (const GLbyte *) src;
 320             for (i = 0; i < n; i++)
 321                indexes[i] = s[i];
 322          }
 323          break;
 324       case GL_UNSIGNED_SHORT:
 325          {
 326             GLuint i;
 327             const GLushort *s = (const GLushort *) src;
 328             if (unpack->SwapBytes) {
 329                for (i = 0; i < n; i++) {
 330                   GLushort value = s[i];
 331                   SWAP2BYTE(value);
 332                   indexes[i] = value;
 333                }
 334             }
 335             else {
 336                for (i = 0; i < n; i++)
 337                   indexes[i] = s[i];
 338             }
 339          }
 340          break;
 341       case GL_SHORT:
 342          {
 343             GLuint i;
 344             const GLshort *s = (const GLshort *) src;
 345             if (unpack->SwapBytes) {
 346                for (i = 0; i < n; i++) {
 347                   GLshort value = s[i];
 348                   SWAP2BYTE(value);
 349                   indexes[i] = value;
 350                }
 351             }
 352             else {
 353                for (i = 0; i < n; i++)
 354                   indexes[i] = s[i];
 355             }
 356          }
 357          break;
 358       case GL_UNSIGNED_INT:
 359          {
 360             GLuint i;
 361             const GLuint *s = (const GLuint *) src;
 362             if (unpack->SwapBytes) {
 363                for (i = 0; i < n; i++) {
 364                   GLuint value = s[i];
 365                   SWAP4BYTE(value);
 366                   indexes[i] = value;
 367                }
 368             }
 369             else {
 370                for (i = 0; i < n; i++)
 371                   indexes[i] = s[i];
 372             }
 373          }
 374          break;
 375       case GL_INT:
 376          {
 377             GLuint i;
 378             const GLint *s = (const GLint *) src;
 379             if (unpack->SwapBytes) {
 380                for (i = 0; i < n; i++) {
 381                   GLint value = s[i];
 382                   SWAP4BYTE(value);
 383                   indexes[i] = value;
 384                }
 385             }
 386             else {
 387                for (i = 0; i < n; i++)
 388                   indexes[i] = s[i];
 389             }
 390          }
 391          break;
 392       case GL_FLOAT:
 393          {
 394             GLuint i;
 395             const GLfloat *s = (const GLfloat *) src;
 396             if (unpack->SwapBytes) {
 397                for (i = 0; i < n; i++) {
 398                   GLfloat value = s[i];
 399                   SWAP4BYTE(value);
 400                   indexes[i] = (GLuint) value;
 401                }
 402             }
 403             else {
 404                for (i = 0; i < n; i++)
 405                   indexes[i] = (GLuint) s[i];
 406             }
 407          }
 408          break;
 409       case GL_HALF_FLOAT_ARB:
 410       case GL_HALF_FLOAT_OES:
 411          {
 412             GLuint i;
 413             const GLhalfARB *s = (const GLhalfARB *) src;
 414             if (unpack->SwapBytes) {
 415                for (i = 0; i < n; i++) {
 416                   GLhalfARB value = s[i];
 417                   SWAP2BYTE(value);
 418                   indexes[i] = (GLuint) _mesa_half_to_float(value);
 419                }
 420             }
 421             else {
 422                for (i = 0; i < n; i++)
 423                   indexes[i] = (GLuint) _mesa_half_to_float(s[i]);
 424             }
 425          }
 426          break;
 427       case GL_UNSIGNED_INT_24_8_EXT:
 428          {
 429             GLuint i;
 430             const GLuint *s = (const GLuint *) src;
 431             if (unpack->SwapBytes) {
 432                for (i = 0; i < n; i++) {
 433                   GLuint value = s[i];
 434                   SWAP4BYTE(value);
 435                   indexes[i] = value & 0xff;  /* lower 8 bits */
 436                }
 437             }
 438             else {
 439                for (i = 0; i < n; i++)
 440                   indexes[i] = s[i] & 0xff;  /* lower 8 bits */
 441             }
 442          }
 443          break;
 444       case GL_FLOAT_32_UNSIGNED_INT_24_8_REV:
 445          {
 446             GLuint i;
 447             const GLuint *s = (const GLuint *) src;
 448             if (unpack->SwapBytes) {
 449                for (i = 0; i < n; i++) {
 450                   GLuint value = s[i*2+1];
 451                   SWAP4BYTE(value);
 452                   indexes[i] = value & 0xff;  /* lower 8 bits */
 453                }
 454             }
 455             else {
 456                for (i = 0; i < n; i++)
 457                   indexes[i] = s[i*2+1] & 0xff;  /* lower 8 bits */
 458             }
 459          }
 460          break;
 461
 462       default:
 463          _mesa_problem(NULL, "bad srcType in extract_uint_indexes");
 464          return;
 465    }
 466 }
 467
 468
 469 static inline GLuint
 470 clamp_float_to_uint(GLfloat f)
 471 {
 472    return f < 0.0F ? 0 : _mesa_lroundevenf(f);
 473 }
 474
 475
 476 static inline GLuint
 477 clamp_half_to_uint(GLhalfARB h)
 478 {
 479    GLfloat f = _mesa_half_to_float(h);
 480    return f < 0.0F ? 0 : _mesa_lroundevenf(f);
 481 }
 482
 483
 484 /*
 485  * Unpack a row of stencil data from a client buffer according to
 486  * the pixel unpacking parameters.
 487  * This is (or will be) used by glDrawPixels
 488  *
 489  * Args:  ctx - the context
 490  *        n - number of pixels
 491  *        dstType - destination data type
 492  *        dest - destination array
 493  *        srcType - source pixel type
 494  *        source - source data pointer
 495  *        srcPacking - pixel unpacking parameters
 496  *        transferOps - apply offset/bias/lookup ops?
 497  */
 498 void
 499 _mesa_unpack_stencil_span( struct gl_context *ctx, GLuint n,
 500                            GLenum dstType, GLvoid *dest,
 501                            GLenum srcType, const GLvoid *source,
 502                            const struct gl_pixelstore_attrib *srcPacking,
 503                            GLbitfield transferOps )
 504 {
 505    assert(srcType == GL_BITMAP ||
 506           srcType == GL_UNSIGNED_BYTE ||
 507           srcType == GL_BYTE ||
 508           srcType == GL_UNSIGNED_SHORT ||
 509           srcType == GL_SHORT ||
 510           srcType == GL_UNSIGNED_INT ||
 511           srcType == GL_INT ||
 512           srcType == GL_UNSIGNED_INT_24_8_EXT ||
 513           srcType == GL_HALF_FLOAT_ARB ||
 514           srcType == GL_HALF_FLOAT_OES ||
 515           srcType == GL_FLOAT ||
 516           srcType == GL_FLOAT_32_UNSIGNED_INT_24_8_REV);
 517
 518    assert(dstType == GL_UNSIGNED_BYTE ||
 519           dstType == GL_UNSIGNED_SHORT ||
 520           dstType == GL_UNSIGNED_INT ||
 521           dstType == GL_FLOAT_32_UNSIGNED_INT_24_8_REV);
 522
 523    /* only shift and offset apply to stencil */
 524    transferOps &= IMAGE_SHIFT_OFFSET_BIT;
 525
 526    /*
 527     * Try simple cases first
 528     */
 529    if (transferOps == 0 &&
 530        !ctx->Pixel.MapStencilFlag &&
 531        srcType == GL_UNSIGNED_BYTE &&
 532        dstType == GL_UNSIGNED_BYTE) {
 533       memcpy(dest, source, n * sizeof(GLubyte));
 534    }
 535    else if (transferOps == 0 &&
 536             !ctx->Pixel.MapStencilFlag &&
 537             srcType == GL_UNSIGNED_INT &&
 538             dstType == GL_UNSIGNED_INT &&
 539             !srcPacking->SwapBytes) {
 540       memcpy(dest, source, n * sizeof(GLuint));
 541    }
 542    else {
 543       /*
 544        * general solution
 545        */
 546       GLuint *indexes = malloc(n * sizeof(GLuint));
 547
 548       if (!indexes) {
 549          _mesa_error(ctx, GL_OUT_OF_MEMORY, "stencil unpacking");
 550          return;
 551       }
 552
 553       extract_uint_indexes(n, indexes, GL_STENCIL_INDEX, srcType, source,
 554                            srcPacking);
 555
 556       if (transferOps & IMAGE_SHIFT_OFFSET_BIT) {
 557          /* shift and offset indexes */
 558          _mesa_shift_and_offset_ci(ctx, n, indexes);
 559       }
 560
 561       if (ctx->Pixel.MapStencilFlag) {
 562          /* Apply stencil lookup table */
 563          const GLuint mask = ctx->PixelMaps.StoS.Size - 1;
 564          GLuint i;
 565          for (i = 0; i < n; i++) {
 566             indexes[i] = (GLuint)ctx->PixelMaps.StoS.Map[ indexes[i] & mask ];
 567          }
 568       }
 569
 570       /* convert to dest type */
 571       switch (dstType) {
 572          case GL_UNSIGNED_BYTE:
 573             {
 574                GLubyte *dst = (GLubyte *) dest;
 575                GLuint i;
 576                for (i = 0; i < n; i++) {
 577                   dst[i] = (GLubyte) (indexes[i] & 0xff);
 578                }
 579             }
 580             break;
 581          case GL_UNSIGNED_SHORT:
 582             {
 583                GLuint *dst = (GLuint *) dest;
 584                GLuint i;
 585                for (i = 0; i < n; i++) {
 586                   dst[i] = (GLushort) (indexes[i] & 0xffff);
 587                }
 588             }
 589             break;
 590          case GL_UNSIGNED_INT:
 591             memcpy(dest, indexes, n * sizeof(GLuint));
 592             break;
 593          case GL_FLOAT_32_UNSIGNED_INT_24_8_REV:
 594             {
 595                GLuint *dst = (GLuint *) dest;
 596                GLuint i;
 597                for (i = 0; i < n; i++) {
 598                   dst[i*2+1] = indexes[i] & 0xff; /* lower 8 bits */
 599                }
 600             }
 601             break;
 602          default:
 603             _mesa_problem(ctx, "bad dstType in _mesa_unpack_stencil_span");
 604       }
 605
 606       free(indexes);
 607    }
 608 }
 609
 610
 611 void
 612 _mesa_pack_stencil_span( struct gl_context *ctx, GLuint n,
 613                          GLenum dstType, GLvoid *dest, const GLubyte *source,
 614                          const struct gl_pixelstore_attrib *dstPacking )
 615 {
 616    GLubyte *stencil = malloc(n * sizeof(GLubyte));
 617
 618    if (!stencil) {
 619       _mesa_error(ctx, GL_OUT_OF_MEMORY, "stencil packing");
 620       return;
 621    }
 622
 623    if (ctx->Pixel.IndexShift || ctx->Pixel.IndexOffset ||
 624        ctx->Pixel.MapStencilFlag) {
 625       /* make a copy of input */
 626       memcpy(stencil, source, n * sizeof(GLubyte));
 627       _mesa_apply_stencil_transfer_ops(ctx, n, stencil);
 628       source = stencil;
 629    }
 630
 631    switch (dstType) {
 632    case GL_UNSIGNED_BYTE:
 633       memcpy(dest, source, n);
 634       break;
 635    case GL_BYTE:
 636       {
 637          GLbyte *dst = (GLbyte *) dest;
 638          GLuint i;
 639          for (i=0;i<n;i++) {
 640             dst[i] = (GLbyte) (source[i] & 0x7f);
 641          }
 642       }
 643       break;
 644    case GL_UNSIGNED_SHORT:
 645       {
 646          GLushort *dst = (GLushort *) dest;
 647          GLuint i;
 648          for (i=0;i<n;i++) {
 649             dst[i] = (GLushort) source[i];
 650          }
 651          if (dstPacking->SwapBytes) {
 652             _mesa_swap2( (GLushort *) dst, n );
 653          }
 654       }
 655       break;
 656    case GL_SHORT:
 657       {
 658          GLshort *dst = (GLshort *) dest;
 659          GLuint i;
 660          for (i=0;i<n;i++) {
 661             dst[i] = (GLshort) source[i];
 662          }
 663          if (dstPacking->SwapBytes) {
 664             _mesa_swap2( (GLushort *) dst, n );
 665          }
 666       }
 667       break;
 668    case GL_UNSIGNED_INT:
 669       {
 670          GLuint *dst = (GLuint *) dest;
 671          GLuint i;
 672          for (i=0;i<n;i++) {
 673             dst[i] = (GLuint) source[i];
 674          }
 675          if (dstPacking->SwapBytes) {
 676             _mesa_swap4( (GLuint *) dst, n );
 677          }
 678       }
 679       break;
 680    case GL_INT:
 681       {
 682          GLint *dst = (GLint *) dest;
 683          GLuint i;
 684          for (i=0;i<n;i++) {
 685             dst[i] = (GLint) source[i];
 686          }
 687          if (dstPacking->SwapBytes) {
 688             _mesa_swap4( (GLuint *) dst, n );
 689          }
 690       }
 691       break;
 692    case GL_FLOAT:
 693       {
 694          GLfloat *dst = (GLfloat *) dest;
 695          GLuint i;
 696          for (i=0;i<n;i++) {
 697             dst[i] = (GLfloat) source[i];
 698          }
 699          if (dstPacking->SwapBytes) {
 700             _mesa_swap4( (GLuint *) dst, n );
 701          }
 702       }
 703       break;
 704    case GL_HALF_FLOAT_ARB:
 705    case GL_HALF_FLOAT_OES:
 706       {
 707          GLhalfARB *dst = (GLhalfARB *) dest;
 708          GLuint i;
 709          for (i=0;i<n;i++) {
 710             dst[i] = _mesa_float_to_half( (float) source[i] );
 711          }
 712          if (dstPacking->SwapBytes) {
 713             _mesa_swap2( (GLushort *) dst, n );
 714          }
 715       }
 716       break;
 717    case GL_BITMAP:
 718       if (dstPacking->LsbFirst) {
 719          GLubyte *dst = (GLubyte *) dest;
 720          GLint shift = 0;
 721          GLuint i;
 722          for (i = 0; i < n; i++) {
 723             if (shift == 0)
 724                *dst = 0;
 725             *dst |= ((source[i] != 0) << shift);
 726             shift++;
 727             if (shift == 8) {
 728                shift = 0;
 729                dst++;
 730             }
 731          }
 732       }
 733       else {
 734          GLubyte *dst = (GLubyte *) dest;
 735          GLint shift = 7;
 736          GLuint i;
 737          for (i = 0; i < n; i++) {
 738             if (shift == 7)
 739                *dst = 0;
 740             *dst |= ((source[i] != 0) << shift);
 741             shift--;
 742             if (shift < 0) {
 743                shift = 7;
 744                dst++;
 745             }
 746          }
 747       }
 748       break;
 749    default:
 750       _mesa_problem(ctx, "bad type in _mesa_pack_index_span");
 751    }
 752
 753    free(stencil);
 754 }
 755
 756 #define DEPTH_VALUES(GLTYPE, GLTYPE2FLOAT)                              \
 757     do {                                                                \
 758         GLuint i;                                                       \
 759         const GLTYPE *src = (const GLTYPE *)source;                     \
 760         for (i = 0; i < n; i++) {                                       \
 761             GLTYPE value = src[i];                                      \
 762             if (srcPacking->SwapBytes) {                                \
 763                 if (sizeof(GLTYPE) == 2) {                              \
 764                     SWAP2BYTE(value);                                   \
 765                 } else if (sizeof(GLTYPE) == 4) {                       \
 766                     SWAP4BYTE(value);                                   \
 767                 }                                                       \
 768             }                                                           \
 769             depthValues[i] = GLTYPE2FLOAT(value);                       \
 770         }                                                               \
 771     } while (0)
 772
 773
 774 /**
 775  * Unpack a row of depth/z values from memory, returning GLushort, GLuint
 776  * or GLfloat values.
 777  * The glPixelTransfer (scale/bias) params will be applied.
 778  *
 779  * \param dstType  one of GL_UNSIGNED_SHORT, GL_UNSIGNED_INT, GL_FLOAT
 780  * \param depthMax  max value for returned GLushort or GLuint values
 781  *                  (ignored for GLfloat).
 782  */
 783 void
 784 _mesa_unpack_depth_span( struct gl_context *ctx, GLuint n,
 785                          GLenum dstType, GLvoid *dest, GLuint depthMax,
 786                          GLenum srcType, const GLvoid *source,
 787                          const struct gl_pixelstore_attrib *srcPacking )
 788 {
 789    GLfloat *depthTemp = NULL, *depthValues;
 790    GLboolean needClamp = GL_FALSE;
 791
 792    /* Look for special cases first.
 793     * Not only are these faster, they're less prone to numeric conversion
 794     * problems.  Otherwise, converting from an int type to a float then
 795     * back to an int type can introduce errors that will show up as
 796     * artifacts in things like depth peeling which uses glCopyTexImage.
 797     */
 798    if (ctx->Pixel.DepthScale == 1.0F && ctx->Pixel.DepthBias == 0.0F) {
 799       if (srcType == GL_UNSIGNED_INT && dstType == GL_UNSIGNED_SHORT) {
 800          const GLuint *src = (const GLuint *) source;
 801          GLushort *dst = (GLushort *) dest;
 802          GLuint i;
 803          for (i = 0; i < n; i++) {
 804             dst[i] = src[i] >> 16;
 805          }
 806          return;
 807       }
 808       if (srcType == GL_UNSIGNED_SHORT
 809           && dstType == GL_UNSIGNED_INT
 810           && depthMax == 0xffffffff) {
 811          const GLushort *src = (const GLushort *) source;
 812          GLuint *dst = (GLuint *) dest;
 813          GLuint i;
 814          for (i = 0; i < n; i++) {
 815             dst[i] = src[i] | (src[i] << 16);
 816          }
 817          return;
 818       }
 819       if (srcType == GL_UNSIGNED_INT_24_8
 820           && dstType == GL_UNSIGNED_INT
 821           && depthMax == 0xffffff) {
 822          const GLuint *src = (const GLuint *) source;
 823          GLuint *dst = (GLuint *) dest;
 824          GLuint i;
 825          for (i = 0; i < n; i++) {
 826             dst[i] = src[i] >> 8;
 827          }
 828          return;
 829       }
 830       /* XXX may want to add additional cases here someday */
 831    }
 832
 833    /* general case path follows */
 834
 835    if (dstType == GL_FLOAT) {
 836       depthValues = (GLfloat *) dest;
 837    }
 838    else {
 839       depthTemp = malloc(n * sizeof(GLfloat));
 840       if (!depthTemp) {
 841          _mesa_error(ctx, GL_OUT_OF_MEMORY, "pixel unpacking");
 842          return;
 843       }
 844
 845       depthValues = depthTemp;
 846    }
 847
 848    /* Convert incoming values to GLfloat.  Some conversions will require
 849     * clamping, below.
 850     */
 851    switch (srcType) {
 852       case GL_BYTE:
 853          DEPTH_VALUES(GLbyte, BYTE_TO_FLOATZ);
 854          needClamp = GL_TRUE;
 855          break;
 856       case GL_UNSIGNED_BYTE:
 857          DEPTH_VALUES(GLubyte, UBYTE_TO_FLOAT);
 858          break;
 859       case GL_SHORT:
 860          DEPTH_VALUES(GLshort, SHORT_TO_FLOATZ);
 861          needClamp = GL_TRUE;
 862          break;
 863       case GL_UNSIGNED_SHORT:
 864          DEPTH_VALUES(GLushort, USHORT_TO_FLOAT);
 865          break;
 866       case GL_INT:
 867          DEPTH_VALUES(GLint, INT_TO_FLOAT);
 868          needClamp = GL_TRUE;
 869          break;
 870       case GL_UNSIGNED_INT:
 871          DEPTH_VALUES(GLuint, UINT_TO_FLOAT);
 872          break;
 873       case GL_UNSIGNED_INT_24_8_EXT: /* GL_EXT_packed_depth_stencil */
 874          if (dstType == GL_UNSIGNED_INT_24_8_EXT &&
 875              depthMax == 0xffffff &&
 876              ctx->Pixel.DepthScale == 1.0F &&
 877              ctx->Pixel.DepthBias == 0.0F) {
 878             const GLuint *src = (const GLuint *) source;
 879             GLuint *zValues = (GLuint *) dest;
 880             GLuint i;
 881             for (i = 0; i < n; i++) {
 882                 GLuint value = src[i];
 883                 if (srcPacking->SwapBytes) {
 884                     SWAP4BYTE(value);
 885                 }
 886                 zValues[i] = value & 0xffffff00;
 887             }
 888             free(depthTemp);
 889             return;
 890          }
 891          else {
 892             const GLuint *src = (const GLuint *) source;
 893             const GLfloat scale = 1.0f / 0xffffff;
 894             GLuint i;
 895             for (i = 0; i < n; i++) {
 896                 GLuint value = src[i];
 897                 if (srcPacking->SwapBytes) {
 898                     SWAP4BYTE(value);
 899                 }
 900                 depthValues[i] = (value >> 8) * scale;
 901             }
 902          }
 903          break;
 904       case GL_FLOAT_32_UNSIGNED_INT_24_8_REV:
 905          {
 906             GLuint i;
 907             const GLfloat *src = (const GLfloat *)source;
 908             for (i = 0; i < n; i++) {
 909                GLfloat value = src[i * 2];
 910                if (srcPacking->SwapBytes) {
 911                   SWAP4BYTE(value);
 912                }
 913                depthValues[i] = value;
 914             }
 915             needClamp = GL_TRUE;
 916          }
 917          break;
 918       case GL_FLOAT:
 919          DEPTH_VALUES(GLfloat, 1*);
 920          needClamp = GL_TRUE;
 921          break;
 922       case GL_HALF_FLOAT_ARB:
 923       case GL_HALF_FLOAT_OES:
 924          {
 925             GLuint i;
 926             const GLhalfARB *src = (const GLhalfARB *) source;
 927             for (i = 0; i < n; i++) {
 928                GLhalfARB value = src[i];
 929                if (srcPacking->SwapBytes) {
 930                   SWAP2BYTE(value);
 931                }
 932                depthValues[i] = _mesa_half_to_float(value);
 933             }
 934             needClamp = GL_TRUE;
 935          }
 936          break;
 937       default:
 938          _mesa_problem(NULL, "bad type in _mesa_unpack_depth_span()");
 939          free(depthTemp);
 940          return;
 941    }
 942
 943    /* apply depth scale and bias */
 944    {
 945       const GLfloat scale = ctx->Pixel.DepthScale;
 946       const GLfloat bias = ctx->Pixel.DepthBias;
 947       if (scale != 1.0F || bias != 0.0F) {
 948          GLuint i;
 949          for (i = 0; i < n; i++) {
 950             depthValues[i] = depthValues[i] * scale + bias;
 951          }
 952          needClamp = GL_TRUE;
 953       }
 954    }
 955
 956    /* clamp to [0, 1] */
 957    if (needClamp) {
 958       GLuint i;
 959       for (i = 0; i < n; i++) {
 960          depthValues[i] = CLAMP(depthValues[i], 0.0F, 1.0F);
 961       }
 962    }
 963
 964    /*
 965     * Convert values to dstType
 966     */
 967    if (dstType == GL_UNSIGNED_INT) {
 968       GLuint *zValues = (GLuint *) dest;
 969       GLuint i;
 970       if (depthMax <= 0xffffff) {
 971          /* no overflow worries */
 972          for (i = 0; i < n; i++) {
 973             zValues[i] = (GLuint) (depthValues[i] * (GLfloat) depthMax);
 974          }
 975       }
 976       else {
 977          /* need to use double precision to prevent overflow problems */
 978          for (i = 0; i < n; i++) {
 979             GLdouble z = depthValues[i] * (GLdouble) depthMax;
 980             if (z >= (GLdouble) 0xffffffff)
 981                zValues[i] = 0xffffffff;
 982             else
 983                zValues[i] = (GLuint) z;
 984          }
 985       }
 986    }
 987    else if (dstType == GL_UNSIGNED_SHORT) {
 988       GLushort *zValues = (GLushort *) dest;
 989       GLuint i;
 990       assert(depthMax <= 0xffff);
 991       for (i = 0; i < n; i++) {
 992          zValues[i] = (GLushort) (depthValues[i] * (GLfloat) depthMax);
 993       }
 994    }
 995    else if (dstType == GL_FLOAT) {
 996       /* Nothing to do. depthValues is pointing to dest. */
 997    }
 998    else if (dstType == GL_FLOAT_32_UNSIGNED_INT_24_8_REV) {
 999       GLfloat *zValues = (GLfloat*) dest;
1000       GLuint i;
1001       for (i = 0; i < n; i++) {
1002          zValues[i*2] = depthValues[i];
1003       }
1004    }
1005    else {
1006       assert(0);
1007    }
1008
1009    free(depthTemp);
1010 }
1011
1012
1013 /*
1014  * Pack an array of depth values.  The values are floats in [0,1].
1015  */
1016 void
1017 _mesa_pack_depth_span( struct gl_context *ctx, GLuint n, GLvoid *dest,
1018                        GLenum dstType, const GLfloat *depthSpan,
1019                        const struct gl_pixelstore_attrib *dstPacking )
1020 {
1021    GLfloat *depthCopy = malloc(n * sizeof(GLfloat));
1022    if (!depthCopy) {
1023       _mesa_error(ctx, GL_OUT_OF_MEMORY, "pixel packing");
1024       return;
1025    }
1026
1027    if (ctx->Pixel.DepthScale != 1.0F || ctx->Pixel.DepthBias != 0.0F) {
1028       memcpy(depthCopy, depthSpan, n * sizeof(GLfloat));
1029       _mesa_scale_and_bias_depth(ctx, n, depthCopy);
1030       depthSpan = depthCopy;
1031    }
1032
1033    switch (dstType) {
1034    case GL_UNSIGNED_BYTE:
1035       {
1036          GLubyte *dst = (GLubyte *) dest;
1037          GLuint i;
1038          for (i = 0; i < n; i++) {
1039             dst[i] = FLOAT_TO_UBYTE( depthSpan[i] );
1040          }
1041       }
1042       break;
1043    case GL_BYTE:
1044       {
1045          GLbyte *dst = (GLbyte *) dest;
1046          GLuint i;
1047          for (i = 0; i < n; i++) {
1048             dst[i] = FLOAT_TO_BYTE( depthSpan[i] );
1049          }
1050       }
1051       break;
1052    case GL_UNSIGNED_SHORT:
1053       {
1054          GLushort *dst = (GLushort *) dest;
1055          GLuint i;
1056          for (i = 0; i < n; i++) {
1057             CLAMPED_FLOAT_TO_USHORT(dst[i], depthSpan[i]);
1058          }
1059          if (dstPacking->SwapBytes) {
1060             _mesa_swap2( (GLushort *) dst, n );
1061          }
1062       }
1063       break;
1064    case GL_SHORT:
1065       {
1066          GLshort *dst = (GLshort *) dest;
1067          GLuint i;
1068          for (i = 0; i < n; i++) {
1069             dst[i] = FLOAT_TO_SHORT( depthSpan[i] );
1070          }
1071          if (dstPacking->SwapBytes) {
1072             _mesa_swap2( (GLushort *) dst, n );
1073          }
1074       }
1075       break;
1076    case GL_UNSIGNED_INT_24_8:
1077       {
1078          const GLdouble scale = (GLdouble) 0xffffff;
1079          GLuint *dst = (GLuint *) dest;
1080          GLuint i;
1081          for (i = 0; i < n; i++) {
1082             GLuint z = (GLuint) (depthSpan[i] * scale);
1083             assert(z <= 0xffffff);
1084             dst[i] = (z << 8);
1085          }
1086          if (dstPacking->SwapBytes) {
1087             _mesa_swap4( (GLuint *) dst, n );
1088          }
1089          break;
1090       }
1091    case GL_UNSIGNED_INT:
1092       {
1093          GLuint *dst = (GLuint *) dest;
1094          GLuint i;
1095          for (i = 0; i < n; i++) {
1096             dst[i] = FLOAT_TO_UINT( depthSpan[i] );
1097          }
1098          if (dstPacking->SwapBytes) {
1099             _mesa_swap4( (GLuint *) dst, n );
1100          }
1101       }
1102       break;
1103    case GL_INT:
1104       {
1105          GLint *dst = (GLint *) dest;
1106          GLuint i;
1107          for (i = 0; i < n; i++) {
1108             dst[i] = FLOAT_TO_INT( depthSpan[i] );
1109          }
1110          if (dstPacking->SwapBytes) {
1111             _mesa_swap4( (GLuint *) dst, n );
1112          }
1113       }
1114       break;
1115    case GL_FLOAT:
1116       {
1117          GLfloat *dst = (GLfloat *) dest;
1118          GLuint i;
1119          for (i = 0; i < n; i++) {
1120             dst[i] = depthSpan[i];
1121          }
1122          if (dstPacking->SwapBytes) {
1123             _mesa_swap4( (GLuint *) dst, n );
1124          }
1125       }
1126       break;
1127    case GL_HALF_FLOAT_ARB:
1128    case GL_HALF_FLOAT_OES:
1129       {
1130          GLhalfARB *dst = (GLhalfARB *) dest;
1131          GLuint i;
1132          for (i = 0; i < n; i++) {
1133             dst[i] = _mesa_float_to_half(depthSpan[i]);
1134          }
1135          if (dstPacking->SwapBytes) {
1136             _mesa_swap2( (GLushort *) dst, n );
1137          }
1138       }
1139       break;
1140    default:
1141       _mesa_problem(ctx, "bad type in _mesa_pack_depth_span (%s)",
1142                     _mesa_enum_to_string(dstType));
1143    }
1144
1145    free(depthCopy);
1146 }
1147
1148
1149
1150 /**
1151  * Pack depth and stencil values as GL_DEPTH_STENCIL (GL_UNSIGNED_INT_24_8 etc)
1152  */
1153 void
1154 _mesa_pack_depth_stencil_span(struct gl_context *ctx,GLuint n,
1155                               GLenum dstType, GLuint *dest,
1156                               const GLfloat *depthVals,
1157                               const GLubyte *stencilVals,
1158                               const struct gl_pixelstore_attrib *dstPacking)
1159 {
1160    GLfloat *depthCopy = malloc(n * sizeof(GLfloat));
1161    GLubyte *stencilCopy = malloc(n * sizeof(GLubyte));
1162    GLuint i;
1163
1164    if (!depthCopy || !stencilCopy) {
1165       _mesa_error(ctx, GL_OUT_OF_MEMORY, "pixel packing");
1166       free(depthCopy);
1167       free(stencilCopy);
1168       return;
1169    }
1170
1171    if (ctx->Pixel.DepthScale != 1.0F || ctx->Pixel.DepthBias != 0.0F) {
1172       memcpy(depthCopy, depthVals, n * sizeof(GLfloat));
1173       _mesa_scale_and_bias_depth(ctx, n, depthCopy);
1174       depthVals = depthCopy;
1175    }
1176
1177    if (ctx->Pixel.IndexShift ||
1178        ctx->Pixel.IndexOffset ||
1179        ctx->Pixel.MapStencilFlag) {
1180       memcpy(stencilCopy, stencilVals, n * sizeof(GLubyte));
1181       _mesa_apply_stencil_transfer_ops(ctx, n, stencilCopy);
1182       stencilVals = stencilCopy;
1183    }
1184
1185    switch (dstType) {
1186    case GL_UNSIGNED_INT_24_8:
1187       for (i = 0; i < n; i++) {
1188          GLuint z = (GLuint) (depthVals[i] * 0xffffff);
1189          dest[i] = (z << 8) | (stencilVals[i] & 0xff);
1190       }
1191       break;
1192    case GL_FLOAT_32_UNSIGNED_INT_24_8_REV:
1193       for (i = 0; i < n; i++) {
1194          ((GLfloat*)dest)[i*2] = depthVals[i];
1195          dest[i*2+1] = stencilVals[i] & 0xff;
1196       }
1197       break;
1198    }
1199
1200    if (dstPacking->SwapBytes) {
1201       _mesa_swap4(dest, n);
1202    }
1203
1204    free(depthCopy);
1205    free(stencilCopy);
1206 }
1207
1208
1209
1210 /**
1211  * Unpack image data.  Apply byte swapping, byte flipping (bitmap).
1212  * Return all image data in a contiguous block.  This is used when we
1213  * compile glDrawPixels, glTexImage, etc into a display list.  We
1214  * need a copy of the data in a standard format.
1215  */
1216 void *
1217 _mesa_unpack_image( GLuint dimensions,
1218                     GLsizei width, GLsizei height, GLsizei depth,
1219                     GLenum format, GLenum type, const GLvoid *pixels,
1220                     const struct gl_pixelstore_attrib *unpack )
1221 {
1222    GLint bytesPerRow, compsPerRow;
1223    GLboolean flipBytes, swap2, swap4;
1224
1225    if (!pixels)
1226       return NULL;  /* not necessarily an error */
1227
1228    if (width <= 0 || height <= 0 || depth <= 0)
1229       return NULL;  /* generate error later */
1230
1231    if (type == GL_BITMAP) {
1232       bytesPerRow = (width + 7) >> 3;
1233       flipBytes = unpack->LsbFirst;
1234       swap2 = swap4 = GL_FALSE;
1235       compsPerRow = 0;
1236    }
1237    else {
1238       const GLint bytesPerPixel = _mesa_bytes_per_pixel(format, type);
1239       GLint components = _mesa_components_in_format(format);
1240       GLint bytesPerComp;
1241
1242       if (_mesa_type_is_packed(type))
1243           components = 1;
1244
1245       if (bytesPerPixel <= 0 || components <= 0)
1246          return NULL;   /* bad format or type.  generate error later */
1247       bytesPerRow = bytesPerPixel * width;
1248       bytesPerComp = bytesPerPixel / components;
1249       flipBytes = GL_FALSE;
1250       swap2 = (bytesPerComp == 2) && unpack->SwapBytes;
1251       swap4 = (bytesPerComp == 4) && unpack->SwapBytes;
1252       compsPerRow = components * width;
1253       assert(compsPerRow >= width);
1254    }
1255
1256    {
1257       GLubyte *destBuffer
1258          = malloc(bytesPerRow * height * depth);
1259       GLubyte *dst;
1260       GLint img, row;
1261       if (!destBuffer)
1262          return NULL;   /* generate GL_OUT_OF_MEMORY later */
1263
1264       dst = destBuffer;
1265       for (img = 0; img < depth; img++) {
1266          for (row = 0; row < height; row++) {
1267             const GLvoid *src = _mesa_image_address(dimensions, unpack, pixels,
1268                                width, height, format, type, img, row, 0);
1269
1270             if ((type == GL_BITMAP) && (unpack->SkipPixels & 0x7)) {
1271                GLint i;
1272                flipBytes = GL_FALSE;
1273                if (unpack->LsbFirst) {
1274                   GLubyte srcMask = 1 << (unpack->SkipPixels & 0x7);
1275                   GLubyte dstMask = 128;
1276                   const GLubyte *s = src;
1277                   GLubyte *d = dst;
1278                   *d = 0;
1279                   for (i = 0; i < width; i++) {
1280                      if (*s & srcMask) {
1281                         *d |= dstMask;
1282                      }
1283                      if (srcMask == 128) {
1284                         srcMask = 1;
1285                         s++;
1286                      }
1287                      else {
1288                         srcMask = srcMask << 1;
1289                      }
1290                      if (dstMask == 1) {
1291                         dstMask = 128;
1292                         d++;
1293                         *d = 0;
1294                      }
1295                      else {
1296                         dstMask = dstMask >> 1;
1297                      }
1298                   }
1299                }
1300                else {
1301                   GLubyte srcMask = 128 >> (unpack->SkipPixels & 0x7);
1302                   GLubyte dstMask = 128;
1303                   const GLubyte *s = src;
1304                   GLubyte *d = dst;
1305                   *d = 0;
1306                   for (i = 0; i < width; i++) {
1307                      if (*s & srcMask) {
1308                         *d |= dstMask;
1309                      }
1310                      if (srcMask == 1) {
1311                         srcMask = 128;
1312                         s++;
1313                      }
1314                      else {
1315                         srcMask = srcMask >> 1;
1316                      }
1317                      if (dstMask == 1) {
1318                         dstMask = 128;
1319                         d++;
1320                         *d = 0;
1321                      }
1322                      else {
1323                         dstMask = dstMask >> 1;
1324                      }
1325                   }
1326                }
1327             }
1328             else {
1329                memcpy(dst, src, bytesPerRow);
1330             }
1331
1332             /* byte flipping/swapping */
1333             if (flipBytes) {
1334                flip_bytes((GLubyte *) dst, bytesPerRow);
1335             }
1336             else if (swap2) {
1337                _mesa_swap2((GLushort*) dst, compsPerRow);
1338             }
1339             else if (swap4) {
1340                _mesa_swap4((GLuint*) dst, compsPerRow);
1341             }
1342             dst += bytesPerRow;
1343          }
1344       }
1345       return destBuffer;
1346    }
1347 }
1348
1349 void
1350 _mesa_pack_luminance_from_rgba_float(GLuint n, GLfloat rgba[][4],
1351                                      GLvoid *dstAddr, GLenum dst_format,
1352                                      GLbitfield transferOps)
1353 {
1354    int i;
1355    GLfloat *dst = (GLfloat *) dstAddr;
1356
1357    switch (dst_format) {
1358    case GL_LUMINANCE:
1359       if (transferOps & IMAGE_CLAMP_BIT) {
1360          for (i = 0; i < n; i++) {
1361             GLfloat sum = rgba[i][RCOMP] + rgba[i][GCOMP] + rgba[i][BCOMP];
1362             dst[i] = CLAMP(sum, 0.0F, 1.0F);
1363          }
1364       } else {
1365          for (i = 0; i < n; i++) {
1366             dst[i] = rgba[i][RCOMP] + rgba[i][GCOMP] + rgba[i][BCOMP];
1367          }
1368       }
1369       return;
1370    case GL_LUMINANCE_ALPHA:
1371       if (transferOps & IMAGE_CLAMP_BIT) {
1372          for (i = 0; i < n; i++) {
1373             GLfloat sum = rgba[i][RCOMP] + rgba[i][GCOMP] + rgba[i][BCOMP];
1374             dst[2*i] = CLAMP(sum, 0.0F, 1.0F);
1375             dst[2*i+1] = rgba[i][ACOMP];
1376          }
1377       } else {
1378          for (i = 0; i < n; i++) {
1379             dst[2*i] = rgba[i][RCOMP] + rgba[i][GCOMP] + rgba[i][BCOMP];
1380             dst[2*i+1] = rgba[i][ACOMP];
1381          }
1382       }
1383       return;
1384    default:
1385       assert(!"Unsupported format");
1386    }
1387 }
1388
1389 static int32_t
1390 clamp_sint64_to_sint32(int64_t src)
1391 {
1392    return CLAMP(src, INT32_MIN, INT32_MAX);
1393 }
1394
1395 static int32_t
1396 clamp_sint64_to_uint32(int64_t src)
1397 {
1398    return CLAMP(src, 0, UINT32_MAX);
1399 }
1400
1401 static int32_t
1402 clamp_uint64_to_uint32(uint64_t src)
1403 {
1404    return MIN2(src, UINT32_MAX);
1405 }
1406
1407 static int32_t
1408 clamp_uint64_to_sint32(uint64_t src)
1409 {
1410    return MIN2(src, INT32_MAX);
1411 }
1412
1413 static int32_t
1414 convert_integer_luminance64(int64_t src64, int bits,
1415                             bool dst_is_signed, bool src_is_signed)
1416 {
1417    int32_t src32;
1418
1419    /* Clamp Luminance value from 64-bit to 32-bit. Consider if we need
1420     * any signed<->unsigned conversion too.
1421     */
1422    if (src_is_signed && dst_is_signed)
1423       src32 = clamp_sint64_to_sint32(src64);
1424    else if (src_is_signed && !dst_is_signed)
1425       src32 = clamp_sint64_to_uint32(src64);
1426    else if (!src_is_signed && dst_is_signed)
1427       src32 = clamp_uint64_to_sint32(src64);
1428    else
1429       src32 = clamp_uint64_to_uint32(src64);
1430
1431    /* If the dst type is < 32-bit, we need an extra clamp */
1432    if (bits == 32) {
1433       return src32;
1434    } else {
1435       if (dst_is_signed)
1436          return _mesa_signed_to_signed(src32, bits);
1437       else
1438          return _mesa_unsigned_to_unsigned(src32, bits);
1439    }
1440 }
1441
1442 static int32_t
1443 convert_integer(int32_t src, int bits, bool dst_is_signed, bool src_is_signed)
1444 {
1445    if (src_is_signed && dst_is_signed)
1446       return _mesa_signed_to_signed(src, bits);
1447    else if (src_is_signed && !dst_is_signed)
1448       return _mesa_signed_to_unsigned(src, bits);
1449    else if (!src_is_signed && dst_is_signed)
1450       return _mesa_unsigned_to_signed(src, bits);
1451    else
1452       return _mesa_unsigned_to_unsigned(src, bits);
1453 }
1454
1455 void
1456 _mesa_pack_luminance_from_rgba_integer(GLuint n,
1457                                        GLuint rgba[][4], bool rgba_is_signed,
1458                                        GLvoid *dstAddr,
1459                                        GLenum dst_format,
1460                                        GLenum dst_type)
1461 {
1462    int i;
1463    int64_t lum64;
1464    int32_t lum32, alpha;
1465    bool dst_is_signed;
1466    int dst_bits;
1467
1468    assert(dst_format == GL_LUMINANCE_INTEGER_EXT ||
1469           dst_format == GL_LUMINANCE_ALPHA_INTEGER_EXT);
1470
1471    /* We first compute luminance values as a 64-bit addition of the
1472     * 32-bit R,G,B components, then we clamp the result to the dst type size.
1473     *
1474     * Notice that this operation involves casting the 32-bit R,G,B components
1475     * to 64-bit before the addition. Since rgba is defined as a GLuint array
1476     * we need to be careful when rgba packs signed data and make sure
1477     * that we cast to a 32-bit signed integer values before casting them to
1478     * 64-bit signed integers.
1479     */
1480    dst_is_signed = (dst_type == GL_BYTE || dst_type == GL_SHORT ||
1481                     dst_type == GL_INT);
1482
1483    dst_bits = _mesa_sizeof_type(dst_type) * 8;
1484    assert(dst_bits > 0);
1485
1486    switch (dst_format) {
1487    case GL_LUMINANCE_INTEGER_EXT:
1488       for (i = 0; i < n; i++) {
1489          if (!rgba_is_signed) {
1490             lum64 = (uint64_t) rgba[i][RCOMP] +
1491                     (uint64_t) rgba[i][GCOMP] +
1492                     (uint64_t) rgba[i][BCOMP];
1493          } else {
1494             lum64 = (int64_t) ((int32_t) rgba[i][RCOMP]) +
1495                     (int64_t) ((int32_t) rgba[i][GCOMP]) +
1496                     (int64_t) ((int32_t) rgba[i][BCOMP]);
1497          }
1498          lum32 = convert_integer_luminance64(lum64, dst_bits,
1499                                              dst_is_signed, rgba_is_signed);
1500          switch (dst_type) {
1501          case GL_BYTE:
1502          case GL_UNSIGNED_BYTE: {
1503             GLbyte *dst = (GLbyte *) dstAddr;
1504             dst[i] = lum32;
1505             break;
1506          }
1507          case GL_SHORT:
1508          case GL_UNSIGNED_SHORT: {
1509             GLshort *dst = (GLshort *) dstAddr;
1510             dst[i] = lum32;
1511             break;
1512          }
1513          case GL_INT:
1514          case GL_UNSIGNED_INT: {
1515             GLint *dst = (GLint *) dstAddr;
1516             dst[i] = lum32;
1517             break;
1518          }
1519          }
1520       }
1521       return;
1522    case GL_LUMINANCE_ALPHA_INTEGER_EXT:
1523       for (i = 0; i < n; i++) {
1524          if (!rgba_is_signed) {
1525             lum64 = (uint64_t) rgba[i][RCOMP] +
1526                     (uint64_t) rgba[i][GCOMP] +
1527                     (uint64_t) rgba[i][BCOMP];
1528          } else {
1529             lum64 = (int64_t) ((int32_t) rgba[i][RCOMP]) +
1530                     (int64_t) ((int32_t) rgba[i][GCOMP]) +
1531                     (int64_t) ((int32_t) rgba[i][BCOMP]);
1532          }
1533          lum32 = convert_integer_luminance64(lum64, dst_bits,
1534                                              dst_is_signed, rgba_is_signed);
1535          alpha = convert_integer(rgba[i][ACOMP], dst_bits,
1536                                  dst_is_signed, rgba_is_signed);
1537          switch (dst_type) {
1538          case GL_BYTE:
1539          case GL_UNSIGNED_BYTE: {
1540             GLbyte *dst = (GLbyte *) dstAddr;
1541             dst[2*i] = lum32;
1542             dst[2*i+1] = alpha;
1543             break;
1544          }
1545          case GL_SHORT:
1546          case GL_UNSIGNED_SHORT: {
1547             GLshort *dst = (GLshort *) dstAddr;
1548             dst[i] = lum32;
1549             dst[2*i+1] = alpha;
1550             break;
1551          }
1552          case GL_INT:
1553          case GL_UNSIGNED_INT: {
1554             GLint *dst = (GLint *) dstAddr;
1555             dst[i] = lum32;
1556             dst[2*i+1] = alpha;
1557             break;
1558          }
1559          }
1560       }
1561       return;
1562    }
1563 }
1564
1565 GLfloat *
1566 _mesa_unpack_color_index_to_rgba_float(struct gl_context *ctx, GLuint dims,
1567                                        const void *src, GLenum srcFormat, GLenum srcType,
1568                                        int srcWidth, int srcHeight, int srcDepth,
1569                                        const struct gl_pixelstore_attrib *srcPacking,
1570                                        GLbitfield transferOps)
1571 {
1572    int count, img;
1573    GLuint *indexes;
1574    GLfloat *rgba, *dstPtr;
1575
1576    count = srcWidth * srcHeight;
1577    indexes = malloc(count * sizeof(GLuint));
1578    if (!indexes) {
1579       _mesa_error(ctx, GL_OUT_OF_MEMORY, "pixel unpacking");
1580       return NULL;
1581    }
1582
1583    rgba = malloc(4 * count * srcDepth * sizeof(GLfloat));
1584    if (!rgba) {
1585       free(indexes);
1586       _mesa_error(ctx, GL_OUT_OF_MEMORY, "pixel unpacking");
1587       return NULL;
1588    }
1589
1590    /* Convert indexes to RGBA float */
1591    dstPtr = rgba;
1592    for (img = 0; img < srcDepth; img++) {
1593       const GLubyte *srcPtr =
1594          (const GLubyte *) _mesa_image_address(dims, srcPacking, src,
1595                                                srcWidth, srcHeight,
1596                                                srcFormat, srcType,
1597                                                img, 0, 0);
1598
1599       extract_uint_indexes(count, indexes, srcFormat, srcType, srcPtr, srcPacking);
1600
1601       if (transferOps & IMAGE_SHIFT_OFFSET_BIT)
1602          _mesa_shift_and_offset_ci(ctx, count, indexes);
1603
1604       _mesa_map_ci_to_rgba(ctx, count, indexes, (float (*)[4])dstPtr);
1605
1606       /* Don't do RGBA scale/bias or RGBA->RGBA mapping if starting
1607        * with color indexes.
1608        */
1609       transferOps &= ~(IMAGE_SCALE_BIAS_BIT | IMAGE_MAP_COLOR_BIT);
1610       _mesa_apply_rgba_transfer_ops(ctx, transferOps, count, (float (*)[4])dstPtr);
1611
1612       dstPtr += srcHeight * srcWidth * 4;
1613    }
1614
1615    free(indexes);
1616
1617    return rgba;
1618 }
1619
1620 GLubyte *
1621 _mesa_unpack_color_index_to_rgba_ubyte(struct gl_context *ctx, GLuint dims,
1622                                        const void *src, GLenum srcFormat, GLenum srcType,
1623                                        int srcWidth, int srcHeight, int srcDepth,
1624                                        const struct gl_pixelstore_attrib *srcPacking,
1625                                        GLbitfield transferOps)
1626 {
1627    GLfloat *rgba;
1628    GLubyte *dst;
1629    int count, i;
1630
1631    transferOps |= IMAGE_CLAMP_BIT;
1632    rgba = _mesa_unpack_color_index_to_rgba_float(ctx, dims,
1633                                                  src, srcFormat, srcType,
1634                                                  srcWidth, srcHeight, srcDepth,
1635                                                  srcPacking, transferOps);
1636
1637    count = srcWidth * srcHeight * srcDepth;
1638    dst = malloc(count * 4 * sizeof(GLubyte));
1639    for (i = 0; i < count; i++) {
1640       CLAMPED_FLOAT_TO_UBYTE(dst[i * 4 + 0], rgba[i * 4 + 0]);
1641       CLAMPED_FLOAT_TO_UBYTE(dst[i * 4 + 1], rgba[i * 4 + 1]);
1642       CLAMPED_FLOAT_TO_UBYTE(dst[i * 4 + 2], rgba[i * 4 + 2]);
1643       CLAMPED_FLOAT_TO_UBYTE(dst[i * 4 + 3], rgba[i * 4 + 3]);
1644    }
1645
1646    free(rgba);
1647
1648    return dst;
1649 }