Merge remote branch 'origin/master' into nv50-compiler
[mesa.git] / src / mesa / main / compiler.h
1 /*
2 * Mesa 3-D graphics library
3 * Version: 7.5
4 *
5 * Copyright (C) 1999-2008 Brian Paul All Rights Reserved.
6 * Copyright (C) 2009 VMware, Inc. All Rights Reserved.
7 *
8 * Permission is hereby granted, free of charge, to any person obtaining a
9 * copy of this software and associated documentation files (the "Software"),
10 * to deal in the Software without restriction, including without limitation
11 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
12 * and/or sell copies of the Software, and to permit persons to whom the
13 * Software is furnished to do so, subject to the following conditions:
14 *
15 * The above copyright notice and this permission notice shall be included
16 * in all copies or substantial portions of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
21 * BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
22 * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
23 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
24 */
25
26
27 /**
28 * \file compiler.h
29 * Compiler-related stuff.
30 */
31
32
33 #ifndef COMPILER_H
34 #define COMPILER_H
35
36
37 #include <assert.h>
38 #include <ctype.h>
39 #if defined(__alpha__) && defined(CCPML)
40 #include <cpml.h> /* use Compaq's Fast Math Library on Alpha */
41 #else
42 #include <math.h>
43 #endif
44 #include <limits.h>
45 #include <stdlib.h>
46 #include <stdio.h>
47 #include <string.h>
48 #if defined(__linux__) && defined(__i386__)
49 #include <fpu_control.h>
50 #endif
51 #include <float.h>
52 #include <stdarg.h>
53
54
55 #ifdef __cplusplus
56 extern "C" {
57 #endif
58
59
60 /**
61 * Get standard integer types
62 */
63 #if defined(_MSC_VER)
64 typedef __int8 int8_t;
65 typedef unsigned __int8 uint8_t;
66 typedef __int16 int16_t;
67 typedef unsigned __int16 uint16_t;
68 typedef __int32 int32_t;
69 typedef unsigned __int32 uint32_t;
70 typedef __int64 int64_t;
71 typedef unsigned __int64 uint64_t;
72
73 # if defined(_WIN64)
74 typedef __int64 intptr_t;
75 typedef unsigned __int64 uintptr_t;
76 # else
77 typedef __int32 intptr_t;
78 typedef unsigned __int32 uintptr_t;
79 # endif
80
81 # define INT64_C(__val) __val##i64
82 # define UINT64_C(__val) __val##ui64
83 #else
84 # include <stdint.h>
85 #endif
86
87
88 /**
89 * Sun compilers define __i386 instead of the gcc-style __i386__
90 */
91 #ifdef __SUNPRO_C
92 # if !defined(__i386__) && defined(__i386)
93 # define __i386__
94 # elif !defined(__amd64__) && defined(__amd64)
95 # define __amd64__
96 # elif !defined(__sparc__) && defined(__sparc)
97 # define __sparc__
98 # endif
99 # if !defined(__volatile)
100 # define __volatile volatile
101 # endif
102 #endif
103
104
105 /**
106 * finite macro.
107 */
108 #if defined(_MSC_VER)
109 # define finite _finite
110 #elif defined(__WATCOMC__)
111 # define finite _finite
112 #endif
113
114
115 /**
116 * Disable assorted warnings
117 */
118 #if !defined(OPENSTEP) && (defined(__WIN32__) && !defined(__CYGWIN__)) && !defined(BUILD_FOR_SNAP)
119 # if !defined(__GNUC__) /* mingw environment */
120 # pragma warning( disable : 4068 ) /* unknown pragma */
121 # pragma warning( disable : 4710 ) /* function 'foo' not inlined */
122 # pragma warning( disable : 4711 ) /* function 'foo' selected for automatic inline expansion */
123 # pragma warning( disable : 4127 ) /* conditional expression is constant */
124 # if defined(MESA_MINWARN)
125 # pragma warning( disable : 4244 ) /* '=' : conversion from 'const double ' to 'float ', possible loss of data */
126 # pragma warning( disable : 4018 ) /* '<' : signed/unsigned mismatch */
127 # pragma warning( disable : 4305 ) /* '=' : truncation from 'const double ' to 'float ' */
128 # pragma warning( disable : 4550 ) /* 'function' undefined; assuming extern returning int */
129 # pragma warning( disable : 4761 ) /* integral size mismatch in argument; conversion supplied */
130 # endif
131 # endif
132 #endif
133 #if defined(__WATCOMC__)
134 # pragma disable_message(201) /* Disable unreachable code warnings */
135 #endif
136
137
138
139 /**
140 * Function inlining
141 */
142 #if defined(__GNUC__)
143 # define INLINE __inline__
144 #elif defined(__MSC__)
145 # define INLINE __inline
146 #elif defined(_MSC_VER)
147 # define INLINE __inline
148 #elif defined(__ICL)
149 # define INLINE __inline
150 #elif defined(__INTEL_COMPILER)
151 # define INLINE inline
152 #elif defined(__WATCOMC__) && (__WATCOMC__ >= 1100)
153 # define INLINE __inline
154 #elif defined(__SUNPRO_C) && defined(__C99FEATURES__)
155 # define INLINE inline
156 # define __inline inline
157 # define __inline__ inline
158 #elif (__STDC_VERSION__ >= 199901L) /* C99 */
159 # define INLINE inline
160 #else
161 # define INLINE
162 #endif
163
164
165 /**
166 * PUBLIC/USED macros
167 *
168 * If we build the library with gcc's -fvisibility=hidden flag, we'll
169 * use the PUBLIC macro to mark functions that are to be exported.
170 *
171 * We also need to define a USED attribute, so the optimizer doesn't
172 * inline a static function that we later use in an alias. - ajax
173 */
174 #if defined(__GNUC__) || (defined(__SUNPRO_C) && (__SUNPRO_C >= 0x590))
175 # define PUBLIC __attribute__((visibility("default")))
176 # define USED __attribute__((used))
177 #else
178 # define PUBLIC
179 # define USED
180 #endif
181
182
183 /**
184 * Some compilers don't like some of Mesa's const usage. In those places use
185 * CONST instead of const. Pass -DNO_CONST to compilers where this matters.
186 */
187 #ifdef NO_CONST
188 # define CONST
189 #else
190 # define CONST const
191 #endif
192
193
194 /**
195 * __builtin_expect macros
196 */
197 #if !defined(__GNUC__)
198 # define __builtin_expect(x, y) x
199 #endif
200
201 #ifdef __GNUC__
202 #define likely(x) __builtin_expect(!!(x), 1)
203 #define unlikely(x) __builtin_expect(!!(x), 0)
204 #else
205 #define likely(x) !!(x)
206 #define unlikely(x) !!(x)
207 #endif
208
209 /**
210 * The __FUNCTION__ gcc variable is generally only used for debugging.
211 * If we're not using gcc, define __FUNCTION__ as a cpp symbol here.
212 * Don't define it if using a newer Windows compiler.
213 */
214 #ifndef __FUNCTION__
215 # if defined(__VMS)
216 # define __FUNCTION__ "VMS$NL:"
217 # elif !defined(__GNUC__) && !defined(__xlC__) && \
218 (!defined(_MSC_VER) || _MSC_VER < 1300)
219 # if (__STDC_VERSION__ >= 199901L) /* C99 */ || \
220 (defined(__SUNPRO_C) && defined(__C99FEATURES__))
221 # define __FUNCTION__ __func__
222 # else
223 # define __FUNCTION__ "<unknown>"
224 # endif
225 # endif
226 #endif
227
228
229 /**
230 * Either define MESA_BIG_ENDIAN or MESA_LITTLE_ENDIAN, and CPU_TO_LE32.
231 * Do not use these unless absolutely necessary!
232 * Try to use a runtime test instead.
233 * For now, only used by some DRI hardware drivers for color/texel packing.
234 */
235 #if defined(BYTE_ORDER) && defined(BIG_ENDIAN) && BYTE_ORDER == BIG_ENDIAN
236 #if defined(__linux__)
237 #include <byteswap.h>
238 #define CPU_TO_LE32( x ) bswap_32( x )
239 #elif defined(__APPLE__)
240 #include <CoreFoundation/CFByteOrder.h>
241 #define CPU_TO_LE32( x ) CFSwapInt32HostToLittle( x )
242 #elif (defined(_AIX) || defined(__blrts))
243 static INLINE GLuint CPU_TO_LE32(GLuint x)
244 {
245 return (((x & 0x000000ff) << 24) |
246 ((x & 0x0000ff00) << 8) |
247 ((x & 0x00ff0000) >> 8) |
248 ((x & 0xff000000) >> 24));
249 }
250 #else /*__linux__ */
251 #include <sys/endian.h>
252 #define CPU_TO_LE32( x ) bswap32( x )
253 #endif /*__linux__*/
254 #define MESA_BIG_ENDIAN 1
255 #else
256 #define CPU_TO_LE32( x ) ( x )
257 #define MESA_LITTLE_ENDIAN 1
258 #endif
259 #define LE32_TO_CPU( x ) CPU_TO_LE32( x )
260
261
262
263 #if !defined(CAPI) && defined(WIN32) && !defined(BUILD_FOR_SNAP)
264 #define CAPI _cdecl
265 #endif
266
267
268 /**
269 * Create a macro so that asm functions can be linked into compilers other
270 * than GNU C
271 */
272 #ifndef _ASMAPI
273 #if defined(WIN32) && !defined(BUILD_FOR_SNAP)/* was: !defined( __GNUC__ ) && !defined( VMS ) && !defined( __INTEL_COMPILER )*/
274 #define _ASMAPI __cdecl
275 #else
276 #define _ASMAPI
277 #endif
278 #ifdef PTR_DECL_IN_FRONT
279 #define _ASMAPIP * _ASMAPI
280 #else
281 #define _ASMAPIP _ASMAPI *
282 #endif
283 #endif
284
285 #ifdef USE_X86_ASM
286 #define _NORMAPI _ASMAPI
287 #define _NORMAPIP _ASMAPIP
288 #else
289 #define _NORMAPI
290 #define _NORMAPIP *
291 #endif
292
293
294 /* This is a macro on IRIX */
295 #ifdef _P
296 #undef _P
297 #endif
298
299
300 /* Turn off macro checking systems used by other libraries */
301 #ifdef CHECK
302 #undef CHECK
303 #endif
304
305
306 /**
307 * ASSERT macro
308 */
309 #if !defined(_WIN32_WCE)
310 #if defined(BUILD_FOR_SNAP) && defined(CHECKED)
311 # define ASSERT(X) _CHECK(X)
312 #elif defined(DEBUG)
313 # define ASSERT(X) assert(X)
314 #else
315 # define ASSERT(X)
316 #endif
317 #endif
318
319 #if (__GNUC__ >= 3)
320 #define PRINTFLIKE(f, a) __attribute__ ((format(__printf__, f, a)))
321 #else
322 #define PRINTFLIKE(f, a)
323 #endif
324
325 #ifndef NULL
326 #define NULL 0
327 #endif
328
329
330 /**
331 * LONGSTRING macro
332 * gcc -pedantic warns about long string literals, LONGSTRING silences that.
333 */
334 #if !defined(__GNUC__)
335 # define LONGSTRING
336 #else
337 # define LONGSTRING __extension__
338 #endif
339
340
341 #ifndef M_PI
342 #define M_PI (3.1415926536)
343 #endif
344
345 #ifndef M_E
346 #define M_E (2.7182818284590452354)
347 #endif
348
349 #ifndef ONE_DIV_LN2
350 #define ONE_DIV_LN2 (1.442695040888963456)
351 #endif
352
353 #ifndef ONE_DIV_SQRT_LN2
354 #define ONE_DIV_SQRT_LN2 (1.201122408786449815)
355 #endif
356
357 #ifndef FLT_MAX_EXP
358 #define FLT_MAX_EXP 128
359 #endif
360
361
362 /**
363 * USE_IEEE: Determine if we're using IEEE floating point
364 */
365 #if defined(__i386__) || defined(__386__) || defined(__sparc__) || \
366 defined(__s390x__) || defined(__powerpc__) || \
367 defined(__x86_64__) || \
368 defined(ia64) || defined(__ia64__) || \
369 defined(__hppa__) || defined(hpux) || \
370 defined(__mips) || defined(_MIPS_ARCH) || \
371 defined(__arm__) || \
372 defined(__sh__) || defined(__m32r__) || \
373 (defined(__sun) && defined(_IEEE_754)) || \
374 (defined(__alpha__) && (defined(__IEEE_FLOAT) || !defined(VMS)))
375 #define USE_IEEE
376 #define IEEE_ONE 0x3f800000
377 #endif
378
379
380 /**
381 * START/END_FAST_MATH macros:
382 *
383 * START_FAST_MATH: Set x86 FPU to faster, 32-bit precision mode (and save
384 * original mode to a temporary).
385 * END_FAST_MATH: Restore x86 FPU to original mode.
386 */
387 #if defined(__GNUC__) && defined(__i386__)
388 /*
389 * Set the x86 FPU control word to guarentee only 32 bits of precision
390 * are stored in registers. Allowing the FPU to store more introduces
391 * differences between situations where numbers are pulled out of memory
392 * vs. situations where the compiler is able to optimize register usage.
393 *
394 * In the worst case, we force the compiler to use a memory access to
395 * truncate the float, by specifying the 'volatile' keyword.
396 */
397 /* Hardware default: All exceptions masked, extended double precision,
398 * round to nearest (IEEE compliant):
399 */
400 #define DEFAULT_X86_FPU 0x037f
401 /* All exceptions masked, single precision, round to nearest:
402 */
403 #define FAST_X86_FPU 0x003f
404 /* The fldcw instruction will cause any pending FP exceptions to be
405 * raised prior to entering the block, and we clear any pending
406 * exceptions before exiting the block. Hence, asm code has free
407 * reign over the FPU while in the fast math block.
408 */
409 #if defined(NO_FAST_MATH)
410 #define START_FAST_MATH(x) \
411 do { \
412 static GLuint mask = DEFAULT_X86_FPU; \
413 __asm__ ( "fnstcw %0" : "=m" (*&(x)) ); \
414 __asm__ ( "fldcw %0" : : "m" (mask) ); \
415 } while (0)
416 #else
417 #define START_FAST_MATH(x) \
418 do { \
419 static GLuint mask = FAST_X86_FPU; \
420 __asm__ ( "fnstcw %0" : "=m" (*&(x)) ); \
421 __asm__ ( "fldcw %0" : : "m" (mask) ); \
422 } while (0)
423 #endif
424 /* Restore original FPU mode, and clear any exceptions that may have
425 * occurred in the FAST_MATH block.
426 */
427 #define END_FAST_MATH(x) \
428 do { \
429 __asm__ ( "fnclex ; fldcw %0" : : "m" (*&(x)) ); \
430 } while (0)
431
432 #elif defined(__WATCOMC__) && defined(__386__)
433 #define DEFAULT_X86_FPU 0x037f /* See GCC comments above */
434 #define FAST_X86_FPU 0x003f /* See GCC comments above */
435 void _watcom_start_fast_math(unsigned short *x,unsigned short *mask);
436 #pragma aux _watcom_start_fast_math = \
437 "fnstcw word ptr [eax]" \
438 "fldcw word ptr [ecx]" \
439 parm [eax] [ecx] \
440 modify exact [];
441 void _watcom_end_fast_math(unsigned short *x);
442 #pragma aux _watcom_end_fast_math = \
443 "fnclex" \
444 "fldcw word ptr [eax]" \
445 parm [eax] \
446 modify exact [];
447 #if defined(NO_FAST_MATH)
448 #define START_FAST_MATH(x) \
449 do { \
450 static GLushort mask = DEFAULT_X86_FPU; \
451 _watcom_start_fast_math(&x,&mask); \
452 } while (0)
453 #else
454 #define START_FAST_MATH(x) \
455 do { \
456 static GLushort mask = FAST_X86_FPU; \
457 _watcom_start_fast_math(&x,&mask); \
458 } while (0)
459 #endif
460 #define END_FAST_MATH(x) _watcom_end_fast_math(&x)
461
462 #elif defined(_MSC_VER) && defined(_M_IX86)
463 #define DEFAULT_X86_FPU 0x037f /* See GCC comments above */
464 #define FAST_X86_FPU 0x003f /* See GCC comments above */
465 #if defined(NO_FAST_MATH)
466 #define START_FAST_MATH(x) do {\
467 static GLuint mask = DEFAULT_X86_FPU;\
468 __asm fnstcw word ptr [x]\
469 __asm fldcw word ptr [mask]\
470 } while(0)
471 #else
472 #define START_FAST_MATH(x) do {\
473 static GLuint mask = FAST_X86_FPU;\
474 __asm fnstcw word ptr [x]\
475 __asm fldcw word ptr [mask]\
476 } while(0)
477 #endif
478 #define END_FAST_MATH(x) do {\
479 __asm fnclex\
480 __asm fldcw word ptr [x]\
481 } while(0)
482
483 #else
484 #define START_FAST_MATH(x) x = 0
485 #define END_FAST_MATH(x) (void)(x)
486 #endif
487
488
489 #ifndef Elements
490 #define Elements(x) (sizeof(x)/sizeof(*(x)))
491 #endif
492
493
494
495 #ifdef __cplusplus
496 }
497 #endif
498
499
500 #endif /* COMPILER_H */