3 * Standard C library function wrappers.
5 * Imports are services which the device driver or window system or
6 * operating system provides to the core renderer. The core renderer (Mesa)
7 * will call these functions in order to do memory allocation, simple I/O,
10 * Some drivers will want to override/replace this file with something
11 * specialized, but that'll be rare.
 * Eventually, I want to roll the glheader.h file into this.
15 * \todo Functions still needed:
22 * Mesa 3-D graphics library
25 * Copyright (C) 1999-2007 Brian Paul All Rights Reserved.
27 * Permission is hereby granted, free of charge, to any person obtaining a
28 * copy of this software and associated documentation files (the "Software"),
29 * to deal in the Software without restriction, including without limitation
30 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
31 * and/or sell copies of the Software, and to permit persons to whom the
32 * Software is furnished to do so, subject to the following conditions:
34 * The above copyright notice and this permission notice shall be included
35 * in all copies or substantial portions of the Software.
37 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
38 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
39 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
40 * BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
41 * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
42 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
61 #define vsnprintf _vsnprintf
62 #elif defined(__IBMC__) || defined(__IBMCPP__) || ( defined(__VMS) && __CRTL_VER < 70312000 )
63 extern int vsnprintf(char *str
, size_t count
, const char *fmt
, va_list arg
);
65 #include "vsnprintf.c"
69 /**********************************************************************/
/**
 * Allocate aligned memory.
 *
 * \param bytes number of bytes to allocate.
 * \param alignment alignment (must be greater than zero; the address
 *        rounding in the generic path assumes a power of two).
 *
 * \return pointer to the aligned memory, or NULL if the allocation fails
 *         or the padded request size would overflow.
 *
 * The generic path allocates extra memory to accommodate rounding up the
 * address for alignment and to record the real malloc address in the word
 * immediately before the address handed to the caller.
 *
 * \sa _mesa_align_free().
 */
void *
_mesa_align_malloc(size_t bytes, unsigned long alignment)
{
#if defined(HAVE_POSIX_MEMALIGN)
   void *mem;
   int err = posix_memalign(& mem, alignment, bytes);
   if (err)
      return NULL;
   return mem;
#elif defined(_WIN32) && defined(_MSC_VER)
   return _aligned_malloc(bytes, alignment);
#else
   const size_t overhead = (size_t) alignment + sizeof(void *);
   void *realAddr;
   uintptr_t ptr, buf;

   ASSERT( alignment > 0 );

   /* Refuse requests whose padded size would wrap around size_t. */
   if (overhead < sizeof(void *) || bytes > ~(size_t) 0 - overhead)
      return NULL;

   realAddr = malloc(bytes + overhead);
   if (!realAddr)
      return NULL;

   ptr = (uintptr_t) realAddr;
   buf = (ptr + alignment + sizeof(void *)) & ~(uintptr_t)(alignment - 1);

   /* Record the real malloc address just below the aligned block.  The
    * slot is only as aligned as 'alignment', so store it bytewise instead
    * of through a pointer-typed lvalue.
    */
   memcpy((void *) (buf - sizeof(void *)), &realAddr, sizeof(realAddr));

#ifdef DEBUG
   /* mark the non-aligned area; a byte fill cannot spill into the slot
    * that holds the real address, whatever the alignment is.
    */
   memset(realAddr, 0xcd, (size_t) (buf - sizeof(void *) - ptr));
#endif

   return (void *) buf;
#endif /* defined(HAVE_POSIX_MEMALIGN) */
}
/**
 * Same as _mesa_align_malloc(), but using calloc(1, ) instead of
 * malloc(), so the memory handed back to the caller is zero-filled.
 *
 * \param bytes number of bytes to allocate.
 * \param alignment alignment (must be greater than zero; the address
 *        rounding in the generic path assumes a power of two).
 *
 * \return pointer to the aligned, zeroed memory, or NULL if the allocation
 *         fails or the padded request size would overflow.
 */
void *
_mesa_align_calloc(size_t bytes, unsigned long alignment)
{
#if defined(HAVE_POSIX_MEMALIGN)
   void *mem;

   mem = _mesa_align_malloc(bytes, alignment);
   if (mem != NULL) {
      (void) memset(mem, 0, bytes);
   }

   return mem;
#elif defined(_WIN32) && defined(_MSC_VER)
   void *mem;

   mem = _aligned_malloc(bytes, alignment);
   if (mem != NULL) {
      (void) memset(mem, 0, bytes);
   }

   return mem;
#else
   const size_t overhead = (size_t) alignment + sizeof(void *);
   void *realAddr;
   uintptr_t ptr, buf;

   ASSERT( alignment > 0 );

   /* Refuse requests whose padded size would wrap around size_t. */
   if (overhead < sizeof(void *) || bytes > ~(size_t) 0 - overhead)
      return NULL;

   realAddr = calloc(1, bytes + overhead);
   if (!realAddr)
      return NULL;

   ptr = (uintptr_t) realAddr;
   buf = (ptr + alignment + sizeof(void *)) & ~(uintptr_t)(alignment - 1);

   /* Record the real calloc address just below the aligned block.  The
    * slot is only as aligned as 'alignment', so store it bytewise instead
    * of through a pointer-typed lvalue.
    */
   memcpy((void *) (buf - sizeof(void *)), &realAddr, sizeof(realAddr));

#ifdef DEBUG
   /* mark the non-aligned area; a byte fill cannot spill into the slot
    * that holds the real address, whatever the alignment is.
    */
   memset(realAddr, 0xcd, (size_t) (buf - sizeof(void *) - ptr));
#endif

   return (void *)buf;
#endif /* defined(HAVE_POSIX_MEMALIGN) */
}
/**
 * Free memory which was allocated with either _mesa_align_malloc()
 * or _mesa_align_calloc().
 * \param ptr pointer to the memory to be freed.  NULL is accepted and
 * ignored, as with free().
 * In the generic path the actual address to free is stored in the word
 * immediately before the address the client sees.
 */
void
_mesa_align_free(void *ptr)
{
#if defined(HAVE_POSIX_MEMALIGN)
   free(ptr);
#elif defined(_WIN32) && defined(_MSC_VER)
   _aligned_free(ptr);
#else
   void *realAddr;

   /* There is no bookkeeping word in front of a NULL pointer. */
   if (!ptr)
      return;

   /* The bookkeeping word may not be pointer-aligned when the block was
    * allocated with a small alignment, so fetch it bytewise.
    */
   memcpy(&realAddr, (const char *) ptr - sizeof(void *), sizeof(realAddr));
   free(realAddr);
#endif /* defined(HAVE_POSIX_MEMALIGN) */
}
/**
 * Reallocate memory, with alignment.
 *
 * \param oldBuffer block obtained from _mesa_align_malloc() or
 *        _mesa_align_calloc(), or NULL.
 * \param oldSize size in bytes of the old block.
 * \param newSize requested size in bytes of the new block.
 * \param alignment alignment of the new block.
 *
 * \return the new block, or NULL if it could not be allocated.  Outside of
 *         the MSVC path the old block is released in either case.
 */
void *
_mesa_align_realloc(void *oldBuffer, size_t oldSize, size_t newSize,
                    unsigned long alignment)
{
#if defined(_WIN32) && defined(_MSC_VER)
   (void) oldSize;
   return _aligned_realloc(oldBuffer, newSize, alignment);
#else
   void *fresh = _mesa_align_malloc(newSize, alignment);

   if (fresh != NULL && oldBuffer != NULL) {
      /* carry over as much of the old contents as fits in the new block */
      size_t keep = newSize;
      if (oldSize < keep)
         keep = oldSize;
      if (keep > 0)
         memcpy(fresh, oldBuffer, keep);
   }

   if (oldBuffer != NULL)
      _mesa_align_free(oldBuffer);

   return fresh;
#endif
}
/**
 * Reallocate memory.
 *
 * A new block of \p newSize bytes is obtained with malloc(), the leading
 * min(oldSize, newSize) bytes of the old block are copied into it, and the
 * old block is freed.
 *
 * \return the new block, or NULL if malloc() failed (the old block is
 *         still freed in that case).
 */
void *
_mesa_realloc(void *oldBuffer, size_t oldSize, size_t newSize)
{
   void *fresh = malloc(newSize);

   if (fresh != NULL && oldBuffer != NULL) {
      size_t keep = newSize;
      if (oldSize < keep)
         keep = oldSize;
      if (keep > 0)
         memcpy(fresh, oldBuffer, keep);
   }

   if (oldBuffer != NULL)
      free(oldBuffer);

   return fresh;
}
/**
 * Fill memory with a constant 16bit word.
 * \param dst destination pointer.
 * \param val value to store in each word.
 * \param n number of words.
 */
void
_mesa_memset16( unsigned short *dst, unsigned short val, size_t n )
{
   size_t k;

   for (k = 0; k < n; k++) {
      dst[k] = val;
   }
}
242 /**********************************************************************/
248 inv_sqrt - A single precision 1/sqrt routine for IEEE format floats.
249 written by Josh Vanderhoof, based on newsgroup posts by James Van Buskirk
253 _mesa_inv_sqrtf(float n
)
255 #if defined(USE_IEEE) && !defined(DEBUG)
259 #if 0 /* not used, see below -BP */
266 Exponent part of the magic number -
269 1. subtract the bias from the exponent,
271 3. divide by two (rounding towards -inf)
274 Which is the same as subtracting the exponent from 381 and dividing
277 floor(-(x - 127) / 2) + 127 = floor((381 - x) / 2)
283 Significand part of magic number -
285 With the current magic number, "(magic - u.i) >> 1" will give you:
287 for 1 <= u.f <= 2: 1.25 - u.f / 4
288 for 2 <= u.f <= 4: 1.00 - u.f / 8
290 This isn't a bad approximation of 1/sqrt. The maximum difference from
291 1/sqrt will be around .06. After three Newton-Raphson iterations, the
292 maximum difference is less than 4.5e-8. (Which is actually close
293 enough to make the following bias academic...)
295 To get a better approximation you can add a bias to the magic
296 number. For example, if you subtract 1/2 of the maximum difference in
297 the first approximation (.03), you will get the following function:
299 for 1 <= u.f <= 2: 1.22 - u.f / 4
300 for 2 <= u.f <= 3.76: 0.97 - u.f / 8
301 for 3.76 <= u.f <= 4: 0.72 - u.f / 16
302 (The 3.76 to 4 range is where the result is < .5.)
304 This is the closest possible initial approximation, but with a maximum
305 error of 8e-11 after three NR iterations, it is still not perfect. If
306 you subtract 0.0332281 instead of .03, the maximum error will be
307 2.5e-11 after three NR iterations, which should be about as close as
310 for 1 <= u.f <= 2: 1.2167719 - u.f / 4
311 for 2 <= u.f <= 3.73: 0.9667719 - u.f / 8
312 for 3.73 <= u.f <= 4: 0.7167719 - u.f / 16
316 magic
-= (int)(0.0332281 * (1 << 25));
319 u
.i
= (magic
- u
.i
) >> 1;
322 Instead of Newton-Raphson, we use Goldschmidt's algorithm, which
323 allows more parallelism. From what I understand, the parallelism
324 comes at the cost of less precision, because it lets error
325 accumulate across iterations.
340 return x2
* r2
; /* we can stop here, and be conformant -BP */
349 return (float) (1.0 / sqrt(n
));
355 * Find the first bit set in a word.
360 register int bit
= 0;
362 if ((i
& 0xffff) == 0) {
366 if ((i
& 0xff) == 0) {
370 if ((i
& 0xf) == 0) {
374 while ((i
& 1) == 0) {
/**
 * Find position of first bit set in given value.
 * XXX Warning: this function can only be used on 64-bit systems!
 * \return position of least-significant bit set, starting at 1, return zero
 * if no bits set.
 */
int
ffsll(long long int val)
{
   int pos;

   assert(sizeof(val) == 8);

   /* look in the low 32 bits first, then in the high 32 bits */
   pos = ffs((int) val);
   if (pos == 0) {
      pos = ffs((int) (val >> 32));
      if (pos != 0)
         pos += 32;
   }

   return pos;
}
407 #endif /* __GNUC__ */
410 #if !defined(__GNUC__) ||\
411 ((__GNUC__ * 100 + __GNUC_MINOR__) < 304) /* Not gcc 3.4 or later */
/**
 * Return number of bits set in given GLuint.
 */
unsigned int
_mesa_bitcount(unsigned int n)
{
   unsigned int count = 0;

   /* each pass clears the lowest set bit, so the loop runs once per 1-bit */
   while (n != 0) {
      n &= n - 1;
      count++;
   }

   return count;
}
/**
 * Return number of bits set in given 64-bit uint.
 */
unsigned int
_mesa_bitcount_64(uint64_t n)
{
   unsigned int count = 0;

   /* each pass clears the lowest set bit, so the loop runs once per 1-bit */
   while (n != 0) {
      n &= n - 1;
      count++;
   }

   return count;
}
441 * Convert a 4-byte float to a 2-byte half float.
442 * Based on code from:
443 * http://www.opengl.org/discussion_boards/ubb/Forum3/HTML/008786.html
446 _mesa_float_to_half(float val
)
448 const fi_type fi
= {val
};
449 const int flt_m
= fi
.i
& 0x7fffff;
450 const int flt_e
= (fi
.i
>> 23) & 0xff;
451 const int flt_s
= (fi
.i
>> 31) & 0x1;
458 /* handle special cases */
459 if ((flt_e
== 0) && (flt_m
== 0)) {
461 /* m = 0; - already set */
464 else if ((flt_e
== 0) && (flt_m
!= 0)) {
465 /* denorm -- denorm float maps to 0 half */
466 /* m = 0; - already set */
469 else if ((flt_e
== 0xff) && (flt_m
== 0)) {
471 /* m = 0; - already set */
474 else if ((flt_e
== 0xff) && (flt_m
!= 0)) {
481 const int new_exp
= flt_e
- 127;
484 /* m = 0; - already set */
487 else if (new_exp
< -14) {
488 /* this maps to a denorm */
489 unsigned int exp_val
= (unsigned int) (-14 - new_exp
); /* 2^-exp_val*/
494 "float_to_half: logical error in denorm creation!\n");
495 /* m = 0; - already set */
497 case 1: m
= 512 + (flt_m
>> 14); break;
498 case 2: m
= 256 + (flt_m
>> 15); break;
499 case 3: m
= 128 + (flt_m
>> 16); break;
500 case 4: m
= 64 + (flt_m
>> 17); break;
501 case 5: m
= 32 + (flt_m
>> 18); break;
502 case 6: m
= 16 + (flt_m
>> 19); break;
503 case 7: m
= 8 + (flt_m
>> 20); break;
504 case 8: m
= 4 + (flt_m
>> 21); break;
505 case 9: m
= 2 + (flt_m
>> 22); break;
506 case 10: m
= 1; break;
509 else if (new_exp
> 15) {
510 /* map this value to infinity */
511 /* m = 0; - already set */
521 result
= (s
<< 15) | (e
<< 10) | m
;
527 * Convert a 2-byte half float to a 4-byte float.
528 * Based on code from:
529 * http://www.opengl.org/discussion_boards/ubb/Forum3/HTML/008786.html
532 _mesa_half_to_float(GLhalfARB val
)
534 /* XXX could also use a 64K-entry lookup table */
535 const int m
= val
& 0x3ff;
536 const int e
= (val
>> 10) & 0x1f;
537 const int s
= (val
>> 15) & 0x1;
538 int flt_m
, flt_e
, flt_s
;
545 /* handle special cases */
546 if ((e
== 0) && (m
== 0)) {
551 else if ((e
== 0) && (m
!= 0)) {
552 /* denorm -- denorm half will fit in non-denorm single */
553 const float half_denorm
= 1.0f
/ 16384.0f
; /* 2^-14 */
554 float mantissa
= ((float) (m
)) / 1024.0f
;
555 float sign
= s
? -1.0f
: 1.0f
;
556 return sign
* mantissa
* half_denorm
;
558 else if ((e
== 31) && (m
== 0)) {
563 else if ((e
== 31) && (m
!= 0)) {
574 fi
.i
= (flt_s
<< 31) | (flt_e
<< 23) | flt_m
;
582 /**********************************************************************/
583 /** \name Sort & Search */
/**
 * Wrapper for bsearch().
 *
 * \param key pointer to the value being looked for.
 * \param base start of the array, sorted consistently with \p compar.
 * \param nmemb number of elements in the array.
 * \param size size in bytes of one element.
 * \param compar comparison callback, called as compar(key, element).
 *
 * \return pointer to a matching element, or NULL if there is none.
 */
void *
_mesa_bsearch( const void *key, const void *base, size_t nmemb, size_t size,
               int (*compar)(const void *, const void *) )
{
#if defined(_WIN32_WCE)
   /* No bsearch() on this platform: do the binary search by hand. */
   const char *lo = (const char *) base;
   size_t remaining;

   for (remaining = nmemb; remaining != 0; remaining >>= 1) {
      const char *mid = lo + (remaining >> 1) * size;
      const int cmp = (*compar)(key, mid);

      if (cmp == 0)
         return (void *) mid;

      if (cmp > 0) {
         /* Continue in the part above 'mid'.  Dropping one element here
          * (the probe itself) before the halving keeps the top element of
          * an odd-sized range reachable.
          */
         lo = mid + size;
         --remaining;
      }
      /* cmp < 0: keep 'lo', the halving alone selects the lower part */
   }
   return NULL;
#else
   return bsearch(key, base, nmemb, size, compar);
#endif
}
616 /**********************************************************************/
617 /** \name Environment vars */
/**
 * Wrapper for getenv().
 *
 * \param var name of the environment variable.
 * \return the variable's value, or NULL if it is not set.  Always NULL on
 *         the platforms excluded below.
 */
char *
_mesa_getenv( const char *var )
{
   char *value = NULL;

#if !(defined(_XBOX) || defined(_WIN32_WCE))
   value = getenv(var);
#endif

   return value;
}
636 /**********************************************************************/
/**
 * Duplicate a string.
 *
 * Implemented using malloc() and a copy of the string including its
 * terminator.  A NULL argument yields NULL.
 *
 * \return newly allocated copy of \p s, or NULL if \p s is NULL or the
 *         allocation fails.
 */
char *
_mesa_strdup( const char *s )
{
   size_t size;
   char *copy;

   if (!s)
      return NULL;

   size = strlen(s) + 1;   /* room for the terminating NUL */
   copy = (char *) malloc(size);
   if (copy)
      memcpy(copy, s, size);

   return copy;
}
/**
 * Wrapper around strtof().
 *
 * Where strtof_l() is available the string is parsed with a "C" locale
 * object that is created on first use and then kept.  Otherwise strtof()
 * or strtod() is used with the current locale.
 *
 * \param s string to convert.
 * \param end if not NULL, receives a pointer to the first unparsed char.
 * \return the converted value.
 */
float
_mesa_strtof( const char *s, char **end )
{
#if defined(_GNU_SOURCE) && !defined(__CYGWIN__) && !defined(__FreeBSD__) && \
    !defined(ANDROID) && !defined(__HAIKU__)
   static locale_t loc = NULL;
   if (!loc) {
      loc = newlocale(LC_CTYPE_MASK, "C", NULL);
   }
   if (!loc) {
      /* newlocale() failed.  Handing a null locale object to strtof_l()
       * is undefined, so parse with the current locale instead.
       */
      return strtof(s, end);
   }
   return strtof_l(s, end, loc);
#elif defined(_ISOC99_SOURCE) || (defined(_XOPEN_SOURCE) && _XOPEN_SOURCE >= 600)
   return strtof(s, end);
#else
   return (float)strtod(s, end);
#endif
}
677 /** Compute simple checksum/hash for a string */
679 _mesa_str_checksum(const char *str
)
681 /* This could probably be much better */
685 for (c
= str
; *c
; c
++, i
++)
686 sum
+= *c
* (i
% 100);
/**
 * Wrapper around vsnprintf().
 *
 * Needed due to #ifdef's, above: this file may remap or supply
 * vsnprintf, and this wrapper forwards to whichever one is in effect.
 *
 * \return whatever the underlying vsnprintf() returns.
 */
int
_mesa_vsnprintf(char *str, size_t size, const char *fmt, va_list args)
{
   const int written = vsnprintf( str, size, fmt, args );

   return written;
}
701 /** Wrapper around vsnprintf() */
703 _mesa_snprintf( char *str
, size_t size
, const char *fmt
, ... )
707 va_start( args
, fmt
);
708 r
= vsnprintf( str
, size
, fmt
, args
);