1 /* $Id: common_x86_asm.S,v 1.16 2003/01/09 23:43:02 brianp Exp $ */
4 * Mesa 3-D graphics library
7 * Copyright (C) 1999-2003 Brian Paul All Rights Reserved.
9 * Permission is hereby granted, free of charge, to any person obtaining a
10 * copy of this software and associated documentation files (the "Software"),
11 * to deal in the Software without restriction, including without limitation
12 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
13 * and/or sell copies of the Software, and to permit persons to whom the
14 * Software is furnished to do so, subject to the following conditions:
16 * The above copyright notice and this permission notice shall be included
17 * in all copies or substantial portions of the Software.
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
20 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
21 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
22 * BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
23 * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
24 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
28 * Check extended CPU capabilities. Now just returns the raw CPUID
29 * feature information, allowing the higher level code to interpret the
32 * Written by Holger Waechtler <holger@akaflieg.extern.tu-berlin.de>
34 * Cleaned up and simplified by Gareth Hughes <gareth@valinux.com>
38 * NOTE: Avoid using spaces in between '(' ')' and arguments, especially
39 * with macros like CONST, LLBL that expand to CONCAT(...). Putting spaces
40 * in there will break the build on some platforms.
44 #include "common_x86_features.h"
47 /* Intel vendor string
49 #define GENU 0x756e6547 /* "Genu" */
50 #define INEI 0x49656e69 /* "ineI" */
51 #define NTEL 0x6c65746e /* "ntel" */
55 #define AUTH 0x68747541 /* "Auth" */
56 #define ENTI 0x69746e65 /* "enti" */
57 #define CAMD 0x444d4163 /* "cAMD" */
62 /* We might want to print out some useful messages.
64 GLNAME( found_intel ): STRING( "Genuine Intel processor found\n\0" )
65 GLNAME( found_amd ): STRING( "Authentic AMD processor found\n\0" )
71 GLOBL GLNAME( _mesa_identify_x86_cpu_features )
72 GLNAME( _mesa_identify_x86_cpu_features ):
77 /* Test for the CPUID command. If the ID Flag bit in EFLAGS
78 * (bit 21) is writable, the CPUID command is present.
83 XOR_L ( CONST(0x00200000), EAX )
89 /* Verify the ID Flag bit has been written.
92 JZ ( LLBL (cpuid_done) )
94 /* Get the CPU vendor info.
99 /* Test for Intel processors. We must look for the
100 * "GenuineIntel" string in EBX, ECX and EDX.
102 CMP_L ( CONST(GENU), EBX )
103 JNE ( LLBL(cpuid_amd) )
104 CMP_L ( CONST(INEI), EDX )
105 JNE ( LLBL(cpuid_amd) )
106 CMP_L ( CONST(NTEL), ECX )
107 JNE ( LLBL(cpuid_amd) )
109 /* We have an Intel processor, so we can get the feature
110 * information with a CPUID input value of 1.
112 MOV_L ( CONST(0x1), EAX )
116 /* Mask out the highest bit, which is used by AMD for 3DNow!.
117 * Newer Intel processors have this bit set, but do not support 3DNow!.
119 AND_L ( CONST(0X7FFFFFFF), EAX)
120 JMP ( LLBL(cpuid_done) )
124 /* Test for AMD processors. We must look for the
125 * "AuthenticAMD" string in EBX, ECX and EDX.
127 CMP_L ( CONST(AUTH), EBX )
128 JNE ( LLBL(cpuid_other) )
129 CMP_L ( CONST(ENTI), EDX )
130 JNE ( LLBL(cpuid_other) )
131 CMP_L ( CONST(CAMD), ECX )
132 JNE ( LLBL(cpuid_other) )
134 /* We have an AMD processor, so we can get the feature
135 * information after we verify that the extended functions are
138 /* The features we need are almost all in the extended set. The
139 * exception is SSE enable, which is in the standard set (0x1).
141 MOV_L ( CONST(0x1), EAX )
144 JZ ( LLBL (cpuid_failed) )
147 MOV_L ( CONST(0x80000000), EAX )
150 JZ ( LLBL (cpuid_failed) )
152 MOV_L ( CONST(0x80000001), EAX )
156 AND_L ( CONST(0x02000000), ESI ) /* OR in the SSE bit */
159 JMP ( LLBL (cpuid_done) )
163 /* Test for other processors here when required.
168 /* If we can't determine the feature information, we must
169 * return zero to indicate that no platform-specific
170 * optimizations can be used.
172 MOV_L ( CONST(0), EAX )
182 /* Execute an SSE instruction to see if the operating system correctly
183 * supports SSE. A signal handler for SIGILL should have been set
184 * before calling this function, otherwise this could kill the client
188 GLOBL GLNAME( _mesa_test_os_sse_support )
189 GLNAME( _mesa_test_os_sse_support ):
196 /* Perform an SSE divide-by-zero to see if the operating system
197 * correctly supports unmasked SIMD FPU exceptions. Signal handlers for
198 * SIGILL and SIGFPE should have been set before calling this function,
199 * otherwise this could kill the client application.
202 GLOBL GLNAME( _mesa_test_os_sse_exception_support )
203 GLNAME( _mesa_test_os_sse_exception_support ):
207 SUB_L ( CONST( 8 ), ESP )
209 /* Save the original MXCSR register value.
211 STMXCSR ( REGOFF( -4, EBP ) )
213 /* Unmask the divide-by-zero exception and perform one.
215 STMXCSR ( REGOFF( -8, EBP ) )
216 AND_L ( CONST( 0xfffffdff ), REGOFF( -8, EBP ) )
217 LDMXCSR ( REGOFF( -8, EBP ) )
221 PUSH_L ( CONST( 0x3f800000 ) )
222 PUSH_L ( CONST( 0x3f800000 ) )
223 PUSH_L ( CONST( 0x3f800000 ) )
224 PUSH_L ( CONST( 0x3f800000 ) )
226 MOVUPS ( REGIND( ESP ), XMM1 )
230 /* Restore the original MXCSR register value.
232 LDMXCSR ( REGOFF( -4, EBP ) )