2 * Mesa 3-D graphics library
4 * Copyright (C) 1999-2008 Brian Paul All Rights Reserved.
5 * Copyright (C) 2009-2010 VMware, Inc. All Rights Reserved.
7 * Permission is hereby granted, free of charge, to any person obtaining a
8 * copy of this software and associated documentation files (the "Software"),
9 * to deal in the Software without restriction, including without limitation
10 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
11 * and/or sell copies of the Software, and to permit persons to whom the
12 * Software is furnished to do so, subject to the following conditions:
14 * The above copyright notice and this permission notice shall be included
15 * in all copies or substantial portions of the Software.
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
18 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
21 * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
22 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
28 * Image and pixel span packing and unpacking.
33 * XXX: MSVC takes forever to compile this module for x86_64 unless we disable
34 * this global optimization.
37 * - http://msdn.microsoft.com/en-us/library/1yk3ydd7.aspx
38 * - http://msdn.microsoft.com/en-us/library/chh3fb0k.aspx
40 #if defined(_MSC_VER) && defined(_M_X64)
41 # pragma optimize( "g", off )
53 #include "pixeltransfer.h"
55 #include "glformats.h"
56 #include "format_utils.h"
57 #include "format_pack.h"
61 * Flip the 8 bits in each byte of the given array.
64 * \param n number of bytes.
66 * \todo try this trick to flip bytes someday:
68 * v = ((v & 0x55555555) << 1) | ((v >> 1) & 0x55555555);
69 * v = ((v & 0x33333333) << 2) | ((v >> 2) & 0x33333333);
70 * v = ((v & 0x0f0f0f0f) << 4) | ((v >> 4) & 0x0f0f0f0f);
74 flip_bytes( GLubyte
*p
, GLuint n
)
77 for (i
= 0; i
< n
; i
++) {
78 b
= (GLuint
) p
[i
]; /* words are often faster than bytes */
79 a
= ((b
& 0x01) << 7) |
94 * Unpack a 32x32 pixel polygon stipple from user memory using the
95 * current pixel unpack settings.
98 _mesa_unpack_polygon_stipple( const GLubyte
*pattern
, GLuint dest
[32],
99 const struct gl_pixelstore_attrib
*unpacking
)
101 GLubyte
*ptrn
= (GLubyte
*) _mesa_unpack_image(2, 32, 32, 1, GL_COLOR_INDEX
,
102 GL_BITMAP
, pattern
, unpacking
);
104 /* Convert pattern from GLubytes to GLuints and handle big/little
109 for (i
= 0; i
< 32; i
++) {
110 dest
[i
] = (p
[0] << 24)
122 * Pack polygon stipple into user memory given current pixel packing settings.
126 _mesa_pack_polygon_stipple( const GLuint pattern
[32], GLubyte
*dest
,
127 const struct gl_pixelstore_attrib
*packing
)
129 /* Convert pattern from GLuints to GLubytes to handle big/little
130 * endian differences.
134 for (i
= 0; i
< 32; i
++) {
135 ptrn
[i
* 4 + 0] = (GLubyte
) ((pattern
[i
] >> 24) & 0xff);
136 ptrn
[i
* 4 + 1] = (GLubyte
) ((pattern
[i
] >> 16) & 0xff);
137 ptrn
[i
* 4 + 2] = (GLubyte
) ((pattern
[i
] >> 8 ) & 0xff);
138 ptrn
[i
* 4 + 3] = (GLubyte
) ((pattern
[i
] ) & 0xff);
141 _mesa_pack_bitmap(32, 32, ptrn
, dest
, packing
);
149 _mesa_pack_bitmap( GLint width
, GLint height
, const GLubyte
*source
,
150 GLubyte
*dest
, const struct gl_pixelstore_attrib
*packing
)
152 GLint row
, width_in_bytes
;
158 width_in_bytes
= DIV_ROUND_UP( width
, 8 );
160 for (row
= 0; row
< height
; row
++) {
161 GLubyte
*dst
= (GLubyte
*) _mesa_image_address2d(packing
, dest
,
162 width
, height
, GL_COLOR_INDEX
, GL_BITMAP
, row
, 0);
166 if ((packing
->SkipPixels
& 7) == 0) {
167 memcpy( dst
, src
, width_in_bytes
);
168 if (packing
->LsbFirst
) {
169 flip_bytes( dst
, width_in_bytes
);
173 /* handling SkipPixels is a bit tricky (no pun intended!) */
175 if (packing
->LsbFirst
) {
176 GLubyte srcMask
= 128;
177 GLubyte dstMask
= 1 << (packing
->SkipPixels
& 0x7);
178 const GLubyte
*s
= src
;
181 for (i
= 0; i
< width
; i
++) {
190 srcMask
= srcMask
>> 1;
192 if (dstMask
== 128) {
198 dstMask
= dstMask
<< 1;
203 GLubyte srcMask
= 128;
204 GLubyte dstMask
= 128 >> (packing
->SkipPixels
& 0x7);
205 const GLubyte
*s
= src
;
208 for (i
= 0; i
< width
; i
++) {
217 srcMask
= srcMask
>> 1;
225 dstMask
= dstMask
>> 1;
230 src
+= width_in_bytes
;
235 #define SWAP2BYTE(VALUE) \
237 GLubyte *bytes = (GLubyte *) &(VALUE); \
238 GLubyte tmp = bytes[0]; \
239 bytes[0] = bytes[1]; \
243 #define SWAP4BYTE(VALUE) \
245 GLubyte *bytes = (GLubyte *) &(VALUE); \
246 GLubyte tmp = bytes[0]; \
247 bytes[0] = bytes[3]; \
250 bytes[1] = bytes[2]; \
256 extract_uint_indexes(GLuint n
, GLuint indexes
[],
257 GLenum srcFormat
, GLenum srcType
, const GLvoid
*src
,
258 const struct gl_pixelstore_attrib
*unpack
)
260 assert(srcFormat
== GL_COLOR_INDEX
|| srcFormat
== GL_STENCIL_INDEX
);
262 assert(srcType
== GL_BITMAP
||
263 srcType
== GL_UNSIGNED_BYTE
||
264 srcType
== GL_BYTE
||
265 srcType
== GL_UNSIGNED_SHORT
||
266 srcType
== GL_SHORT
||
267 srcType
== GL_UNSIGNED_INT
||
269 srcType
== GL_UNSIGNED_INT_24_8_EXT
||
270 srcType
== GL_HALF_FLOAT_ARB
||
271 srcType
== GL_HALF_FLOAT_OES
||
272 srcType
== GL_FLOAT
||
273 srcType
== GL_FLOAT_32_UNSIGNED_INT_24_8_REV
);
278 GLubyte
*ubsrc
= (GLubyte
*) src
;
279 if (unpack
->LsbFirst
) {
280 GLubyte mask
= 1 << (unpack
->SkipPixels
& 0x7);
282 for (i
= 0; i
< n
; i
++) {
283 indexes
[i
] = (*ubsrc
& mask
) ? 1 : 0;
294 GLubyte mask
= 128 >> (unpack
->SkipPixels
& 0x7);
296 for (i
= 0; i
< n
; i
++) {
297 indexes
[i
] = (*ubsrc
& mask
) ? 1 : 0;
309 case GL_UNSIGNED_BYTE
:
312 const GLubyte
*s
= (const GLubyte
*) src
;
313 for (i
= 0; i
< n
; i
++)
320 const GLbyte
*s
= (const GLbyte
*) src
;
321 for (i
= 0; i
< n
; i
++)
325 case GL_UNSIGNED_SHORT
:
328 const GLushort
*s
= (const GLushort
*) src
;
329 if (unpack
->SwapBytes
) {
330 for (i
= 0; i
< n
; i
++) {
331 GLushort value
= s
[i
];
337 for (i
= 0; i
< n
; i
++)
345 const GLshort
*s
= (const GLshort
*) src
;
346 if (unpack
->SwapBytes
) {
347 for (i
= 0; i
< n
; i
++) {
348 GLshort value
= s
[i
];
354 for (i
= 0; i
< n
; i
++)
359 case GL_UNSIGNED_INT
:
362 const GLuint
*s
= (const GLuint
*) src
;
363 if (unpack
->SwapBytes
) {
364 for (i
= 0; i
< n
; i
++) {
371 for (i
= 0; i
< n
; i
++)
379 const GLint
*s
= (const GLint
*) src
;
380 if (unpack
->SwapBytes
) {
381 for (i
= 0; i
< n
; i
++) {
388 for (i
= 0; i
< n
; i
++)
396 const GLfloat
*s
= (const GLfloat
*) src
;
397 if (unpack
->SwapBytes
) {
398 for (i
= 0; i
< n
; i
++) {
399 GLfloat value
= s
[i
];
401 indexes
[i
] = (GLuint
) value
;
405 for (i
= 0; i
< n
; i
++)
406 indexes
[i
] = (GLuint
) s
[i
];
410 case GL_HALF_FLOAT_ARB
:
411 case GL_HALF_FLOAT_OES
:
414 const GLhalfARB
*s
= (const GLhalfARB
*) src
;
415 if (unpack
->SwapBytes
) {
416 for (i
= 0; i
< n
; i
++) {
417 GLhalfARB value
= s
[i
];
419 indexes
[i
] = (GLuint
) _mesa_half_to_float(value
);
423 for (i
= 0; i
< n
; i
++)
424 indexes
[i
] = (GLuint
) _mesa_half_to_float(s
[i
]);
428 case GL_UNSIGNED_INT_24_8_EXT
:
431 const GLuint
*s
= (const GLuint
*) src
;
432 if (unpack
->SwapBytes
) {
433 for (i
= 0; i
< n
; i
++) {
436 indexes
[i
] = value
& 0xff; /* lower 8 bits */
440 for (i
= 0; i
< n
; i
++)
441 indexes
[i
] = s
[i
] & 0xff; /* lower 8 bits */
445 case GL_FLOAT_32_UNSIGNED_INT_24_8_REV
:
448 const GLuint
*s
= (const GLuint
*) src
;
449 if (unpack
->SwapBytes
) {
450 for (i
= 0; i
< n
; i
++) {
451 GLuint value
= s
[i
*2+1];
453 indexes
[i
] = value
& 0xff; /* lower 8 bits */
457 for (i
= 0; i
< n
; i
++)
458 indexes
[i
] = s
[i
*2+1] & 0xff; /* lower 8 bits */
464 _mesa_problem(NULL
, "bad srcType in extract_uint_indexes");
471 clamp_float_to_uint(GLfloat f
)
473 return f
< 0.0F
? 0 : _mesa_lroundevenf(f
);
478 clamp_half_to_uint(GLhalfARB h
)
480 GLfloat f
= _mesa_half_to_float(h
);
481 return f
< 0.0F
? 0 : _mesa_lroundevenf(f
);
486 * Unpack a row of stencil data from a client buffer according to
487 * the pixel unpacking parameters.
488 * This is (or will be) used by glDrawPixels
490 * Args: ctx - the context
491 * n - number of pixels
492 * dstType - destination data type
493 * dest - destination array
494 * srcType - source pixel type
495 * source - source data pointer
496 * srcPacking - pixel unpacking parameters
497 * transferOps - apply offset/bias/lookup ops?
500 _mesa_unpack_stencil_span( struct gl_context
*ctx
, GLuint n
,
501 GLenum dstType
, GLvoid
*dest
,
502 GLenum srcType
, const GLvoid
*source
,
503 const struct gl_pixelstore_attrib
*srcPacking
,
504 GLbitfield transferOps
)
506 assert(srcType
== GL_BITMAP
||
507 srcType
== GL_UNSIGNED_BYTE
||
508 srcType
== GL_BYTE
||
509 srcType
== GL_UNSIGNED_SHORT
||
510 srcType
== GL_SHORT
||
511 srcType
== GL_UNSIGNED_INT
||
513 srcType
== GL_UNSIGNED_INT_24_8_EXT
||
514 srcType
== GL_HALF_FLOAT_ARB
||
515 srcType
== GL_HALF_FLOAT_OES
||
516 srcType
== GL_FLOAT
||
517 srcType
== GL_FLOAT_32_UNSIGNED_INT_24_8_REV
);
519 assert(dstType
== GL_UNSIGNED_BYTE
||
520 dstType
== GL_UNSIGNED_SHORT
||
521 dstType
== GL_UNSIGNED_INT
||
522 dstType
== GL_FLOAT_32_UNSIGNED_INT_24_8_REV
);
524 /* only shift and offset apply to stencil */
525 transferOps
&= IMAGE_SHIFT_OFFSET_BIT
;
528 * Try simple cases first
530 if (transferOps
== 0 &&
531 !ctx
->Pixel
.MapStencilFlag
&&
532 srcType
== GL_UNSIGNED_BYTE
&&
533 dstType
== GL_UNSIGNED_BYTE
) {
534 memcpy(dest
, source
, n
* sizeof(GLubyte
));
536 else if (transferOps
== 0 &&
537 !ctx
->Pixel
.MapStencilFlag
&&
538 srcType
== GL_UNSIGNED_INT
&&
539 dstType
== GL_UNSIGNED_INT
&&
540 !srcPacking
->SwapBytes
) {
541 memcpy(dest
, source
, n
* sizeof(GLuint
));
547 GLuint
*indexes
= malloc(n
* sizeof(GLuint
));
550 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "stencil unpacking");
554 extract_uint_indexes(n
, indexes
, GL_STENCIL_INDEX
, srcType
, source
,
557 if (transferOps
& IMAGE_SHIFT_OFFSET_BIT
) {
558 /* shift and offset indexes */
559 _mesa_shift_and_offset_ci(ctx
, n
, indexes
);
562 if (ctx
->Pixel
.MapStencilFlag
) {
563 /* Apply stencil lookup table */
564 const GLuint mask
= ctx
->PixelMaps
.StoS
.Size
- 1;
566 for (i
= 0; i
< n
; i
++) {
567 indexes
[i
] = (GLuint
)ctx
->PixelMaps
.StoS
.Map
[ indexes
[i
] & mask
];
571 /* convert to dest type */
573 case GL_UNSIGNED_BYTE
:
575 GLubyte
*dst
= (GLubyte
*) dest
;
577 for (i
= 0; i
< n
; i
++) {
578 dst
[i
] = (GLubyte
) (indexes
[i
] & 0xff);
582 case GL_UNSIGNED_SHORT
:
584 GLuint
*dst
= (GLuint
*) dest
;
586 for (i
= 0; i
< n
; i
++) {
587 dst
[i
] = (GLushort
) (indexes
[i
] & 0xffff);
591 case GL_UNSIGNED_INT
:
592 memcpy(dest
, indexes
, n
* sizeof(GLuint
));
594 case GL_FLOAT_32_UNSIGNED_INT_24_8_REV
:
596 GLuint
*dst
= (GLuint
*) dest
;
598 for (i
= 0; i
< n
; i
++) {
599 dst
[i
*2+1] = indexes
[i
] & 0xff; /* lower 8 bits */
604 _mesa_problem(ctx
, "bad dstType in _mesa_unpack_stencil_span");
613 _mesa_pack_stencil_span( struct gl_context
*ctx
, GLuint n
,
614 GLenum dstType
, GLvoid
*dest
, const GLubyte
*source
,
615 const struct gl_pixelstore_attrib
*dstPacking
)
617 GLubyte
*stencil
= malloc(n
* sizeof(GLubyte
));
620 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "stencil packing");
624 if (ctx
->Pixel
.IndexShift
|| ctx
->Pixel
.IndexOffset
||
625 ctx
->Pixel
.MapStencilFlag
) {
626 /* make a copy of input */
627 memcpy(stencil
, source
, n
* sizeof(GLubyte
));
628 _mesa_apply_stencil_transfer_ops(ctx
, n
, stencil
);
633 case GL_UNSIGNED_BYTE
:
634 memcpy(dest
, source
, n
);
638 GLbyte
*dst
= (GLbyte
*) dest
;
641 dst
[i
] = (GLbyte
) (source
[i
] & 0x7f);
645 case GL_UNSIGNED_SHORT
:
647 GLushort
*dst
= (GLushort
*) dest
;
650 dst
[i
] = (GLushort
) source
[i
];
652 if (dstPacking
->SwapBytes
) {
653 _mesa_swap2( (GLushort
*) dst
, n
);
659 GLshort
*dst
= (GLshort
*) dest
;
662 dst
[i
] = (GLshort
) source
[i
];
664 if (dstPacking
->SwapBytes
) {
665 _mesa_swap2( (GLushort
*) dst
, n
);
669 case GL_UNSIGNED_INT
:
671 GLuint
*dst
= (GLuint
*) dest
;
674 dst
[i
] = (GLuint
) source
[i
];
676 if (dstPacking
->SwapBytes
) {
677 _mesa_swap4( (GLuint
*) dst
, n
);
683 GLint
*dst
= (GLint
*) dest
;
686 dst
[i
] = (GLint
) source
[i
];
688 if (dstPacking
->SwapBytes
) {
689 _mesa_swap4( (GLuint
*) dst
, n
);
695 GLfloat
*dst
= (GLfloat
*) dest
;
698 dst
[i
] = (GLfloat
) source
[i
];
700 if (dstPacking
->SwapBytes
) {
701 _mesa_swap4( (GLuint
*) dst
, n
);
705 case GL_HALF_FLOAT_ARB
:
706 case GL_HALF_FLOAT_OES
:
708 GLhalfARB
*dst
= (GLhalfARB
*) dest
;
711 dst
[i
] = _mesa_float_to_half( (float) source
[i
] );
713 if (dstPacking
->SwapBytes
) {
714 _mesa_swap2( (GLushort
*) dst
, n
);
719 if (dstPacking
->LsbFirst
) {
720 GLubyte
*dst
= (GLubyte
*) dest
;
723 for (i
= 0; i
< n
; i
++) {
726 *dst
|= ((source
[i
] != 0) << shift
);
735 GLubyte
*dst
= (GLubyte
*) dest
;
738 for (i
= 0; i
< n
; i
++) {
741 *dst
|= ((source
[i
] != 0) << shift
);
751 _mesa_problem(ctx
, "bad type in _mesa_pack_index_span");
757 #define DEPTH_VALUES(GLTYPE, GLTYPE2FLOAT) \
760 const GLTYPE *src = (const GLTYPE *)source; \
761 for (i = 0; i < n; i++) { \
762 GLTYPE value = src[i]; \
763 if (srcPacking->SwapBytes) { \
764 if (sizeof(GLTYPE) == 2) { \
766 } else if (sizeof(GLTYPE) == 4) { \
770 depthValues[i] = GLTYPE2FLOAT(value); \
776 * Unpack a row of depth/z values from memory, returning GLushort, GLuint or GLfloat values.
778 * The glPixelTransfer (scale/bias) params will be applied.
780 * \param dstType one of GL_UNSIGNED_SHORT, GL_UNSIGNED_INT, GL_FLOAT
781 * \param depthMax max value for returned GLushort or GLuint values
782 * (ignored for GLfloat).
785 _mesa_unpack_depth_span( struct gl_context
*ctx
, GLuint n
,
786 GLenum dstType
, GLvoid
*dest
, GLuint depthMax
,
787 GLenum srcType
, const GLvoid
*source
,
788 const struct gl_pixelstore_attrib
*srcPacking
)
790 GLfloat
*depthTemp
= NULL
, *depthValues
;
791 GLboolean needClamp
= GL_FALSE
;
793 /* Look for special cases first.
794 * Not only are these faster, they're less prone to numeric conversion
795 * problems. Otherwise, converting from an int type to a float then
796 * back to an int type can introduce errors that will show up as
797 * artifacts in things like depth peeling which uses glCopyTexImage.
799 if (ctx
->Pixel
.DepthScale
== 1.0F
&& ctx
->Pixel
.DepthBias
== 0.0F
) {
800 if (srcType
== GL_UNSIGNED_INT
&& dstType
== GL_UNSIGNED_SHORT
) {
801 const GLuint
*src
= (const GLuint
*) source
;
802 GLushort
*dst
= (GLushort
*) dest
;
804 for (i
= 0; i
< n
; i
++) {
805 dst
[i
] = src
[i
] >> 16;
809 if (srcType
== GL_UNSIGNED_SHORT
810 && dstType
== GL_UNSIGNED_INT
811 && depthMax
== 0xffffffff) {
812 const GLushort
*src
= (const GLushort
*) source
;
813 GLuint
*dst
= (GLuint
*) dest
;
815 for (i
= 0; i
< n
; i
++) {
816 dst
[i
] = src
[i
] | (src
[i
] << 16);
820 if (srcType
== GL_UNSIGNED_INT_24_8
821 && dstType
== GL_UNSIGNED_INT
822 && depthMax
== 0xffffff) {
823 const GLuint
*src
= (const GLuint
*) source
;
824 GLuint
*dst
= (GLuint
*) dest
;
826 for (i
= 0; i
< n
; i
++) {
827 dst
[i
] = src
[i
] >> 8;
831 /* XXX may want to add additional cases here someday */
834 /* general case path follows */
836 if (dstType
== GL_FLOAT
) {
837 depthValues
= (GLfloat
*) dest
;
840 depthTemp
= malloc(n
* sizeof(GLfloat
));
842 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "pixel unpacking");
846 depthValues
= depthTemp
;
849 /* Convert incoming values to GLfloat. Some conversions will require clamping to [0, 1] afterwards.
854 DEPTH_VALUES(GLbyte
, BYTE_TO_FLOATZ
);
857 case GL_UNSIGNED_BYTE
:
858 DEPTH_VALUES(GLubyte
, UBYTE_TO_FLOAT
);
861 DEPTH_VALUES(GLshort
, SHORT_TO_FLOATZ
);
864 case GL_UNSIGNED_SHORT
:
865 DEPTH_VALUES(GLushort
, USHORT_TO_FLOAT
);
868 DEPTH_VALUES(GLint
, INT_TO_FLOAT
);
871 case GL_UNSIGNED_INT
:
872 DEPTH_VALUES(GLuint
, UINT_TO_FLOAT
);
874 case GL_UNSIGNED_INT_24_8_EXT
: /* GL_EXT_packed_depth_stencil */
875 if (dstType
== GL_UNSIGNED_INT_24_8_EXT
&&
876 depthMax
== 0xffffff &&
877 ctx
->Pixel
.DepthScale
== 1.0F
&&
878 ctx
->Pixel
.DepthBias
== 0.0F
) {
879 const GLuint
*src
= (const GLuint
*) source
;
880 GLuint
*zValues
= (GLuint
*) dest
;
882 for (i
= 0; i
< n
; i
++) {
883 GLuint value
= src
[i
];
884 if (srcPacking
->SwapBytes
) {
887 zValues
[i
] = value
& 0xffffff00;
893 const GLuint
*src
= (const GLuint
*) source
;
894 const GLfloat scale
= 1.0f
/ 0xffffff;
896 for (i
= 0; i
< n
; i
++) {
897 GLuint value
= src
[i
];
898 if (srcPacking
->SwapBytes
) {
901 depthValues
[i
] = (value
>> 8) * scale
;
905 case GL_FLOAT_32_UNSIGNED_INT_24_8_REV
:
908 const GLfloat
*src
= (const GLfloat
*)source
;
909 for (i
= 0; i
< n
; i
++) {
910 GLfloat value
= src
[i
* 2];
911 if (srcPacking
->SwapBytes
) {
914 depthValues
[i
] = value
;
920 DEPTH_VALUES(GLfloat
, 1*);
923 case GL_HALF_FLOAT_ARB
:
924 case GL_HALF_FLOAT_OES
:
927 const GLhalfARB
*src
= (const GLhalfARB
*) source
;
928 for (i
= 0; i
< n
; i
++) {
929 GLhalfARB value
= src
[i
];
930 if (srcPacking
->SwapBytes
) {
933 depthValues
[i
] = _mesa_half_to_float(value
);
939 _mesa_problem(NULL
, "bad type in _mesa_unpack_depth_span()");
944 /* apply depth scale and bias */
946 const GLfloat scale
= ctx
->Pixel
.DepthScale
;
947 const GLfloat bias
= ctx
->Pixel
.DepthBias
;
948 if (scale
!= 1.0F
|| bias
!= 0.0F
) {
950 for (i
= 0; i
< n
; i
++) {
951 depthValues
[i
] = depthValues
[i
] * scale
+ bias
;
957 /* clamp to [0, 1] */
960 for (i
= 0; i
< n
; i
++) {
961 depthValues
[i
] = CLAMP(depthValues
[i
], 0.0F
, 1.0F
);
966 * Convert values to dstType
968 if (dstType
== GL_UNSIGNED_INT
) {
969 GLuint
*zValues
= (GLuint
*) dest
;
971 if (depthMax
<= 0xffffff) {
972 /* no overflow worries */
973 for (i
= 0; i
< n
; i
++) {
974 zValues
[i
] = (GLuint
) (depthValues
[i
] * (GLfloat
) depthMax
);
978 /* need to use double precision to prevent overflow problems */
979 for (i
= 0; i
< n
; i
++) {
980 GLdouble z
= depthValues
[i
] * (GLdouble
) depthMax
;
981 if (z
>= (GLdouble
) 0xffffffff)
982 zValues
[i
] = 0xffffffff;
984 zValues
[i
] = (GLuint
) z
;
988 else if (dstType
== GL_UNSIGNED_SHORT
) {
989 GLushort
*zValues
= (GLushort
*) dest
;
991 assert(depthMax
<= 0xffff);
992 for (i
= 0; i
< n
; i
++) {
993 zValues
[i
] = (GLushort
) (depthValues
[i
] * (GLfloat
) depthMax
);
996 else if (dstType
== GL_FLOAT
) {
997 /* Nothing to do. depthValues is pointing to dest. */
999 else if (dstType
== GL_FLOAT_32_UNSIGNED_INT_24_8_REV
) {
1000 GLfloat
*zValues
= (GLfloat
*) dest
;
1002 for (i
= 0; i
< n
; i
++) {
1003 zValues
[i
*2] = depthValues
[i
];
1015 * Pack an array of depth values. The values are floats in [0,1].
1018 _mesa_pack_depth_span( struct gl_context
*ctx
, GLuint n
, GLvoid
*dest
,
1019 GLenum dstType
, const GLfloat
*depthSpan
,
1020 const struct gl_pixelstore_attrib
*dstPacking
)
1022 GLfloat
*depthCopy
= malloc(n
* sizeof(GLfloat
));
1024 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "pixel packing");
1028 if (ctx
->Pixel
.DepthScale
!= 1.0F
|| ctx
->Pixel
.DepthBias
!= 0.0F
) {
1029 memcpy(depthCopy
, depthSpan
, n
* sizeof(GLfloat
));
1030 _mesa_scale_and_bias_depth(ctx
, n
, depthCopy
);
1031 depthSpan
= depthCopy
;
1035 case GL_UNSIGNED_BYTE
:
1037 GLubyte
*dst
= (GLubyte
*) dest
;
1039 for (i
= 0; i
< n
; i
++) {
1040 dst
[i
] = FLOAT_TO_UBYTE( depthSpan
[i
] );
1046 GLbyte
*dst
= (GLbyte
*) dest
;
1048 for (i
= 0; i
< n
; i
++) {
1049 dst
[i
] = FLOAT_TO_BYTE( depthSpan
[i
] );
1053 case GL_UNSIGNED_SHORT
:
1055 GLushort
*dst
= (GLushort
*) dest
;
1057 for (i
= 0; i
< n
; i
++) {
1058 CLAMPED_FLOAT_TO_USHORT(dst
[i
], depthSpan
[i
]);
1060 if (dstPacking
->SwapBytes
) {
1061 _mesa_swap2( (GLushort
*) dst
, n
);
1067 GLshort
*dst
= (GLshort
*) dest
;
1069 for (i
= 0; i
< n
; i
++) {
1070 dst
[i
] = FLOAT_TO_SHORT( depthSpan
[i
] );
1072 if (dstPacking
->SwapBytes
) {
1073 _mesa_swap2( (GLushort
*) dst
, n
);
1077 case GL_UNSIGNED_INT
:
1079 GLuint
*dst
= (GLuint
*) dest
;
1081 for (i
= 0; i
< n
; i
++) {
1082 dst
[i
] = FLOAT_TO_UINT( depthSpan
[i
] );
1084 if (dstPacking
->SwapBytes
) {
1085 _mesa_swap4( (GLuint
*) dst
, n
);
1091 GLint
*dst
= (GLint
*) dest
;
1093 for (i
= 0; i
< n
; i
++) {
1094 dst
[i
] = FLOAT_TO_INT( depthSpan
[i
] );
1096 if (dstPacking
->SwapBytes
) {
1097 _mesa_swap4( (GLuint
*) dst
, n
);
1103 GLfloat
*dst
= (GLfloat
*) dest
;
1105 for (i
= 0; i
< n
; i
++) {
1106 dst
[i
] = depthSpan
[i
];
1108 if (dstPacking
->SwapBytes
) {
1109 _mesa_swap4( (GLuint
*) dst
, n
);
1113 case GL_HALF_FLOAT_ARB
:
1114 case GL_HALF_FLOAT_OES
:
1116 GLhalfARB
*dst
= (GLhalfARB
*) dest
;
1118 for (i
= 0; i
< n
; i
++) {
1119 dst
[i
] = _mesa_float_to_half(depthSpan
[i
]);
1121 if (dstPacking
->SwapBytes
) {
1122 _mesa_swap2( (GLushort
*) dst
, n
);
1127 _mesa_problem(ctx
, "bad type in _mesa_pack_depth_span");
1136 * Pack depth and stencil values as GL_DEPTH_STENCIL (GL_UNSIGNED_INT_24_8 etc)
1139 _mesa_pack_depth_stencil_span(struct gl_context
*ctx
,GLuint n
,
1140 GLenum dstType
, GLuint
*dest
,
1141 const GLfloat
*depthVals
,
1142 const GLubyte
*stencilVals
,
1143 const struct gl_pixelstore_attrib
*dstPacking
)
1145 GLfloat
*depthCopy
= malloc(n
* sizeof(GLfloat
));
1146 GLubyte
*stencilCopy
= malloc(n
* sizeof(GLubyte
));
1149 if (!depthCopy
|| !stencilCopy
) {
1150 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "pixel packing");
1156 if (ctx
->Pixel
.DepthScale
!= 1.0F
|| ctx
->Pixel
.DepthBias
!= 0.0F
) {
1157 memcpy(depthCopy
, depthVals
, n
* sizeof(GLfloat
));
1158 _mesa_scale_and_bias_depth(ctx
, n
, depthCopy
);
1159 depthVals
= depthCopy
;
1162 if (ctx
->Pixel
.IndexShift
||
1163 ctx
->Pixel
.IndexOffset
||
1164 ctx
->Pixel
.MapStencilFlag
) {
1165 memcpy(stencilCopy
, stencilVals
, n
* sizeof(GLubyte
));
1166 _mesa_apply_stencil_transfer_ops(ctx
, n
, stencilCopy
);
1167 stencilVals
= stencilCopy
;
1171 case GL_UNSIGNED_INT_24_8
:
1172 for (i
= 0; i
< n
; i
++) {
1173 GLuint z
= (GLuint
) (depthVals
[i
] * 0xffffff);
1174 dest
[i
] = (z
<< 8) | (stencilVals
[i
] & 0xff);
1177 case GL_FLOAT_32_UNSIGNED_INT_24_8_REV
:
1178 for (i
= 0; i
< n
; i
++) {
1179 ((GLfloat
*)dest
)[i
*2] = depthVals
[i
];
1180 dest
[i
*2+1] = stencilVals
[i
] & 0xff;
1185 if (dstPacking
->SwapBytes
) {
1186 _mesa_swap4(dest
, n
);
1196 * Unpack image data. Apply byte swapping, byte flipping (bitmap).
1197 * Return all image data in a contiguous block. This is used when we
1198 * compile glDrawPixels, glTexImage, etc into a display list. We
1199 * need a copy of the data in a standard format.
1202 _mesa_unpack_image( GLuint dimensions
,
1203 GLsizei width
, GLsizei height
, GLsizei depth
,
1204 GLenum format
, GLenum type
, const GLvoid
*pixels
,
1205 const struct gl_pixelstore_attrib
*unpack
)
1207 GLint bytesPerRow
, compsPerRow
;
1208 GLboolean flipBytes
, swap2
, swap4
;
1211 return NULL
; /* not necessarily an error */
1213 if (width
<= 0 || height
<= 0 || depth
<= 0)
1214 return NULL
; /* generate error later */
1216 if (type
== GL_BITMAP
) {
1217 bytesPerRow
= (width
+ 7) >> 3;
1218 flipBytes
= unpack
->LsbFirst
;
1219 swap2
= swap4
= GL_FALSE
;
1223 const GLint bytesPerPixel
= _mesa_bytes_per_pixel(format
, type
);
1224 GLint components
= _mesa_components_in_format(format
);
1227 if (_mesa_type_is_packed(type
))
1230 if (bytesPerPixel
<= 0 || components
<= 0)
1231 return NULL
; /* bad format or type. generate error later */
1232 bytesPerRow
= bytesPerPixel
* width
;
1233 bytesPerComp
= bytesPerPixel
/ components
;
1234 flipBytes
= GL_FALSE
;
1235 swap2
= (bytesPerComp
== 2) && unpack
->SwapBytes
;
1236 swap4
= (bytesPerComp
== 4) && unpack
->SwapBytes
;
1237 compsPerRow
= components
* width
;
1238 assert(compsPerRow
>= width
);
1243 = malloc(bytesPerRow
* height
* depth
);
1247 return NULL
; /* generate GL_OUT_OF_MEMORY later */
1250 for (img
= 0; img
< depth
; img
++) {
1251 for (row
= 0; row
< height
; row
++) {
1252 const GLvoid
*src
= _mesa_image_address(dimensions
, unpack
, pixels
,
1253 width
, height
, format
, type
, img
, row
, 0);
1255 if ((type
== GL_BITMAP
) && (unpack
->SkipPixels
& 0x7)) {
1257 flipBytes
= GL_FALSE
;
1258 if (unpack
->LsbFirst
) {
1259 GLubyte srcMask
= 1 << (unpack
->SkipPixels
& 0x7);
1260 GLubyte dstMask
= 128;
1261 const GLubyte
*s
= src
;
1264 for (i
= 0; i
< width
; i
++) {
1268 if (srcMask
== 128) {
1273 srcMask
= srcMask
<< 1;
1281 dstMask
= dstMask
>> 1;
1286 GLubyte srcMask
= 128 >> (unpack
->SkipPixels
& 0x7);
1287 GLubyte dstMask
= 128;
1288 const GLubyte
*s
= src
;
1291 for (i
= 0; i
< width
; i
++) {
1300 srcMask
= srcMask
>> 1;
1308 dstMask
= dstMask
>> 1;
1314 memcpy(dst
, src
, bytesPerRow
);
1317 /* byte flipping/swapping */
1319 flip_bytes((GLubyte
*) dst
, bytesPerRow
);
1322 _mesa_swap2((GLushort
*) dst
, compsPerRow
);
1325 _mesa_swap4((GLuint
*) dst
, compsPerRow
);
1335 _mesa_pack_luminance_from_rgba_float(GLuint n
, GLfloat rgba
[][4],
1336 GLvoid
*dstAddr
, GLenum dst_format
,
1337 GLbitfield transferOps
)
1340 GLfloat
*dst
= (GLfloat
*) dstAddr
;
1342 switch (dst_format
) {
1344 if (transferOps
& IMAGE_CLAMP_BIT
) {
1345 for (i
= 0; i
< n
; i
++) {
1346 GLfloat sum
= rgba
[i
][RCOMP
] + rgba
[i
][GCOMP
] + rgba
[i
][BCOMP
];
1347 dst
[i
] = CLAMP(sum
, 0.0F
, 1.0F
);
1350 for (i
= 0; i
< n
; i
++) {
1351 dst
[i
] = rgba
[i
][RCOMP
] + rgba
[i
][GCOMP
] + rgba
[i
][BCOMP
];
1355 case GL_LUMINANCE_ALPHA
:
1356 if (transferOps
& IMAGE_CLAMP_BIT
) {
1357 for (i
= 0; i
< n
; i
++) {
1358 GLfloat sum
= rgba
[i
][RCOMP
] + rgba
[i
][GCOMP
] + rgba
[i
][BCOMP
];
1359 dst
[2*i
] = CLAMP(sum
, 0.0F
, 1.0F
);
1360 dst
[2*i
+1] = rgba
[i
][ACOMP
];
1363 for (i
= 0; i
< n
; i
++) {
1364 dst
[2*i
] = rgba
[i
][RCOMP
] + rgba
[i
][GCOMP
] + rgba
[i
][BCOMP
];
1365 dst
[2*i
+1] = rgba
[i
][ACOMP
];
1370 assert(!"Unsupported format");
1375 clamp_sint64_to_sint32(int64_t src
)
1377 return CLAMP(src
, INT32_MIN
, INT32_MAX
);
1381 clamp_sint64_to_uint32(int64_t src
)
1383 return CLAMP(src
, 0, UINT32_MAX
);
1387 clamp_uint64_to_uint32(uint64_t src
)
1389 return MIN2(src
, UINT32_MAX
);
1393 clamp_uint64_to_sint32(uint64_t src
)
1395 return MIN2(src
, INT32_MAX
);
1399 convert_integer_luminance64(int64_t src64
, int bits
,
1400 bool dst_is_signed
, bool src_is_signed
)
1404 /* Clamp Luminance value from 64-bit to 32-bit. Consider if we need
1405 * any signed<->unsigned conversion too.
1407 if (src_is_signed
&& dst_is_signed
)
1408 src32
= clamp_sint64_to_sint32(src64
);
1409 else if (src_is_signed
&& !dst_is_signed
)
1410 src32
= clamp_sint64_to_uint32(src64
);
1411 else if (!src_is_signed
&& dst_is_signed
)
1412 src32
= clamp_uint64_to_sint32(src64
);
1414 src32
= clamp_uint64_to_uint32(src64
);
1416 /* If the dst type is < 32-bit, we need an extra clamp */
1421 return _mesa_signed_to_signed(src32
, bits
);
1423 return _mesa_unsigned_to_unsigned(src32
, bits
);
1428 convert_integer(int32_t src
, int bits
, bool dst_is_signed
, bool src_is_signed
)
1430 if (src_is_signed
&& dst_is_signed
)
1431 return _mesa_signed_to_signed(src
, bits
);
1432 else if (src_is_signed
&& !dst_is_signed
)
1433 return _mesa_signed_to_unsigned(src
, bits
);
1434 else if (!src_is_signed
&& dst_is_signed
)
1435 return _mesa_unsigned_to_signed(src
, bits
);
1437 return _mesa_unsigned_to_unsigned(src
, bits
);
1441 _mesa_pack_luminance_from_rgba_integer(GLuint n
,
1442 GLuint rgba
[][4], bool rgba_is_signed
,
1449 int32_t lum32
, alpha
;
1453 assert(dst_format
== GL_LUMINANCE_INTEGER_EXT
||
1454 dst_format
== GL_LUMINANCE_ALPHA_INTEGER_EXT
);
1456 /* We first compute luminance values as a 64-bit addition of the
1457 * 32-bit R,G,B components, then we clamp the result to the dst type size.
1459 * Notice that this operation involves casting the 32-bit R,G,B components
1460 * to 64-bit before the addition. Since rgba is defined as a GLuint array
1461 * we need to be careful when rgba packs signed data and make sure
1462 * that we cast them to 32-bit signed integer values before casting them to
1463 * 64-bit signed integers.
1465 dst_is_signed
= (dst_type
== GL_BYTE
|| dst_type
== GL_SHORT
||
1466 dst_type
== GL_INT
);
1468 dst_bits
= _mesa_sizeof_type(dst_type
) * 8;
1469 assert(dst_bits
> 0);
1471 switch (dst_format
) {
1472 case GL_LUMINANCE_INTEGER_EXT
:
1473 for (i
= 0; i
< n
; i
++) {
1474 if (!rgba_is_signed
) {
1475 lum64
= (uint64_t) rgba
[i
][RCOMP
] +
1476 (uint64_t) rgba
[i
][GCOMP
] +
1477 (uint64_t) rgba
[i
][BCOMP
];
1479 lum64
= (int64_t) ((int32_t) rgba
[i
][RCOMP
]) +
1480 (int64_t) ((int32_t) rgba
[i
][GCOMP
]) +
1481 (int64_t) ((int32_t) rgba
[i
][BCOMP
]);
1483 lum32
= convert_integer_luminance64(lum64
, dst_bits
,
1484 dst_is_signed
, rgba_is_signed
);
1487 case GL_UNSIGNED_BYTE
: {
1488 GLbyte
*dst
= (GLbyte
*) dstAddr
;
1493 case GL_UNSIGNED_SHORT
: {
1494 GLshort
*dst
= (GLshort
*) dstAddr
;
1499 case GL_UNSIGNED_INT
: {
1500 GLint
*dst
= (GLint
*) dstAddr
;
1507 case GL_LUMINANCE_ALPHA_INTEGER_EXT
:
1508 for (i
= 0; i
< n
; i
++) {
1509 if (!rgba_is_signed
) {
1510 lum64
= (uint64_t) rgba
[i
][RCOMP
] +
1511 (uint64_t) rgba
[i
][GCOMP
] +
1512 (uint64_t) rgba
[i
][BCOMP
];
1514 lum64
= (int64_t) ((int32_t) rgba
[i
][RCOMP
]) +
1515 (int64_t) ((int32_t) rgba
[i
][GCOMP
]) +
1516 (int64_t) ((int32_t) rgba
[i
][BCOMP
]);
1518 lum32
= convert_integer_luminance64(lum64
, dst_bits
,
1519 dst_is_signed
, rgba_is_signed
);
1520 alpha
= convert_integer(rgba
[i
][ACOMP
], dst_bits
,
1521 dst_is_signed
, rgba_is_signed
);
1524 case GL_UNSIGNED_BYTE
: {
1525 GLbyte
*dst
= (GLbyte
*) dstAddr
;
1531 case GL_UNSIGNED_SHORT
: {
1532 GLshort
*dst
= (GLshort
*) dstAddr
;
1538 case GL_UNSIGNED_INT
: {
1539 GLint
*dst
= (GLint
*) dstAddr
;
1551 _mesa_unpack_color_index_to_rgba_float(struct gl_context
*ctx
, GLuint dims
,
1552 const void *src
, GLenum srcFormat
, GLenum srcType
,
1553 int srcWidth
, int srcHeight
, int srcDepth
,
1554 const struct gl_pixelstore_attrib
*srcPacking
,
1555 GLbitfield transferOps
)
1559 GLfloat
*rgba
, *dstPtr
;
1561 count
= srcWidth
* srcHeight
;
1562 indexes
= malloc(count
* sizeof(GLuint
));
1564 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "pixel unpacking");
1568 rgba
= malloc(4 * count
* srcDepth
* sizeof(GLfloat
));
1571 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "pixel unpacking");
1575 /* Convert indexes to RGBA float */
1577 for (img
= 0; img
< srcDepth
; img
++) {
1578 const GLubyte
*srcPtr
=
1579 (const GLubyte
*) _mesa_image_address(dims
, srcPacking
, src
,
1580 srcWidth
, srcHeight
,
1584 extract_uint_indexes(count
, indexes
, srcFormat
, srcType
, srcPtr
, srcPacking
);
1586 if (transferOps
& IMAGE_SHIFT_OFFSET_BIT
)
1587 _mesa_shift_and_offset_ci(ctx
, count
, indexes
);
1589 _mesa_map_ci_to_rgba(ctx
, count
, indexes
, (float (*)[4])dstPtr
);
1591 /* Don't do RGBA scale/bias or RGBA->RGBA mapping if starting
1592 * with color indexes.
1594 transferOps
&= ~(IMAGE_SCALE_BIAS_BIT
| IMAGE_MAP_COLOR_BIT
);
1595 _mesa_apply_rgba_transfer_ops(ctx
, transferOps
, count
, (float (*)[4])dstPtr
);
1597 dstPtr
+= srcHeight
* srcWidth
* 4;
1606 _mesa_unpack_color_index_to_rgba_ubyte(struct gl_context
*ctx
, GLuint dims
,
1607 const void *src
, GLenum srcFormat
, GLenum srcType
,
1608 int srcWidth
, int srcHeight
, int srcDepth
,
1609 const struct gl_pixelstore_attrib
*srcPacking
,
1610 GLbitfield transferOps
)
1616 transferOps
|= IMAGE_CLAMP_BIT
;
1617 rgba
= _mesa_unpack_color_index_to_rgba_float(ctx
, dims
,
1618 src
, srcFormat
, srcType
,
1619 srcWidth
, srcHeight
, srcDepth
,
1620 srcPacking
, transferOps
);
1622 count
= srcWidth
* srcHeight
* srcDepth
;
1623 dst
= malloc(count
* 4 * sizeof(GLubyte
));
1624 for (i
= 0; i
< count
; i
++) {
1625 CLAMPED_FLOAT_TO_UBYTE(dst
[i
* 4 + 0], rgba
[i
* 4 + 0]);
1626 CLAMPED_FLOAT_TO_UBYTE(dst
[i
* 4 + 1], rgba
[i
* 4 + 1]);
1627 CLAMPED_FLOAT_TO_UBYTE(dst
[i
* 4 + 2], rgba
[i
* 4 + 2]);
1628 CLAMPED_FLOAT_TO_UBYTE(dst
[i
* 4 + 3], rgba
[i
* 4 + 3]);