3 # (C) Copyright IBM Corporation 2005
6 # Permission is hereby granted, free of charge, to any person obtaining a
7 # copy of this software and associated documentation files (the "Software"),
8 # to deal in the Software without restriction, including without limitation
9 # on the rights to use, copy, modify, merge, publish, distribute, sub
10 # license, and/or sell copies of the Software, and to permit persons to whom
11 # the Software is furnished to do so, subject to the following conditions:
13 # The above copyright notice and this permission notice (including the next
14 # paragraph) shall be included in all copies or substantial portions of the
17 # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 # FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
20 # IBM AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
22 # FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
26 # Ian Romanick <idr@us.ibm.com>
29 import gl_XML
, glX_XML
30 import sys
, getopt
, copy
32 def should_use_push(registers
):
33 for [reg
, offset
] in registers
:
41 def local_size(registers
):
42 # The x86-64 ABI says "the value (%rsp - 8) is always a multiple of
43 # 16 when control is transferred to the function entry point." This
44 # means that the local stack usage must be (16*N)+8 for some value
45 # of N. (16*N)+8 = (8*(2N))+8 = 8*(2N+1), i.e. an odd multiple of 8.
46 # The N computed below is forced odd (| 1) to meet this requirement.
48 N
= (len(registers
) |
1)
52 def save_all_regs(registers
):
54 if not should_use_push(registers
):
55 adjust_stack
= local_size(registers
)
56 print '\tsubq\t$%u, %%rsp' % (adjust_stack
)
58 for [reg
, stack_offset
] in registers
:
59 save_reg( reg
, stack_offset
, adjust_stack
)
63 def restore_all_regs(registers
):
65 if not should_use_push(registers
):
66 adjust_stack
= local_size(registers
)
68 temp
= copy
.deepcopy(registers
)
70 [reg
, stack_offset
] = temp
.pop()
71 restore_reg(reg
, stack_offset
, adjust_stack
)
74 print '\taddq\t$%u, %%rsp' % (adjust_stack
)
78 def save_reg(reg
, offset
, use_move
):
81 print '\tmovq\t%s, (%%rsp)' % (reg
)
83 print '\tmovq\t%s, %u(%%rsp)' % (reg
, offset
)
85 print '\tpushq\t%s' % (reg
)
90 def restore_reg(reg
, offset
, use_move
):
93 print '\tmovq\t(%%rsp), %s' % (reg
)
95 print '\tmovq\t%u(%%rsp), %s' % (offset
, reg
)
97 print '\tpopq\t%s' % (reg
)
102 class PrintGenericStubs(gl_XML
.gl_print_base
):
105 gl_XML
.gl_print_base
.__init
__(self
)
107 self
.name
= "gl_x86-64_asm.py (from Mesa)"
108 self
.license
= license
.bsd_license_template
% ("(C) Copyright IBM Corporation 2005", "IBM")
112 def get_stack_size(self
, f
):
114 for p
in f
.parameterIterator():
115 size
+= p
.get_stack_size()
120 def printRealHeader(self
):
121 print "/* If we build with gcc's -fvisibility=hidden flag, we'll need to change"
122 print " * the symbol visibility mode to 'default'."
125 print '#include "../x86/assyntax.h"'
127 print '#if defined(__GNUC__) && (__GNUC__ * 100 + __GNUC_MINOR__) >= 303'
128 print '# pragma GCC visibility push(default)'
129 print '# define HIDDEN(x) .hidden x'
131 print '# define HIDDEN(x)'
134 print '# if defined(USE_MGL_NAMESPACE)'
135 print '# define GL_PREFIX(n) GLNAME(CONCAT(mgl,n))'
137 print '# define GL_PREFIX(n) GLNAME(CONCAT(gl,n))'
140 print '#if defined(PTHREADS) || defined(USE_XTHREADS) || defined(SOLARIS_THREADS) || defined(WIN32_THREADS) || defined(BEOS_THREADS)'
141 print '# define THREADS'
144 print '#ifdef USE_MGL_NAMESPACE'
145 print '#define _glapi_Dispatch _mglapi_Dispatch'
150 print '#ifdef GLX_USE_TLS'
152 print '\t.globl _x86_64_get_get_dispatch; HIDDEN(_x86_64_get_get_dispatch)'
153 print '_x86_64_get_get_dispatch:'
154 print '\tlea\t_x86_64_get_dispatch(%rip), %rax'
157 print '\t.p2align\t4,,15'
158 print '_x86_64_get_dispatch:'
159 print '\tmovq\t_glapi_tls_Dispatch@GOTTPOFF(%rip), %rax'
160 print '\tmovq\t%fs:(%rax), %rax'
162 print '\t.size\t_x86_64_get_dispatch, .-_x86_64_get_dispatch'
164 print '#elif defined(PTHREADS)'
166 print '\t.extern\t_glapi_Dispatch'
167 print '\t.extern\t_gl_DispatchTSD'
168 print '\t.extern\tpthread_getspecific'
170 print '\t.p2align\t4,,15'
171 print '_x86_64_get_dispatch:'
172 print '\tmovq\t_gl_DispatchTSD(%rip), %rdi'
173 print '\tjmp\tpthread_getspecific@PLT'
175 print '#elif defined(THREADS)'
177 print '\t.extern\t_glapi_get_dispatch'
184 def printRealFooter(self
):
186 print '#if defined(GLX_USE_TLS) && defined(__linux__)'
187 print ' .section ".note.ABI-tag", "a"'
189 print ' .long 1f - 0f /* name length */'
190 print ' .long 3f - 2f /* data length */'
191 print ' .long 1 /* note length */'
192 print '0: .asciz "GNU" /* vendor name */'
193 print '1: .p2align 2'
194 print '2: .long 0 /* note data: the ABI tag */'
195 print ' .long 2,4,20 /* Minimum kernel version w/TLS */'
196 print '3: .p2align 2 /* pad out section */'
197 print '#endif /* GLX_USE_TLS */'
199 print '#if defined (__ELF__) && defined (__linux__)'
200 print ' .section .note.GNU-stack,"",%progbits'
205 def printFunction(self
, f
):
207 # The x86-64 ABI divides function parameters into a couple
208 # classes. For the OpenGL interface, the only ones that are
209 # relevant are INTEGER and SSE. Basically, the first 8
210 # GLfloat or GLdouble parameters are placed in %xmm0 - %xmm7,
211 # the first 6 non-GLfloat / non-GLdouble parameters are placed
212 # in registers listed in int_parameters.
214 # If more parameters than that are required, they are passed
215 # on the stack. Therefore, we just have to make sure that
216 # %rsp hasn't changed when we jump to the actual function.
217 # Since we're jumping to the function (and not calling it), we
218 # have to make sure of that anyway!
220 int_parameters
= ["%rdi", "%rsi", "%rdx", "%rcx", "%r8", "%r9"]
226 for p
in f
.parameterIterator():
227 type_name
= p
.get_base_type_string()
229 if p
.is_pointer() or (type_name
!= "GLfloat" and type_name
!= "GLdouble"):
231 registers
.append( [int_parameters
[int_class
], stack_offset
] )
236 registers
.append( ["%%xmm%u" % (sse_class
), stack_offset
] )
240 if ((int_class
& 1) == 0) and (sse_class
== 0):
241 registers
.append( ["%rbp", 0] )
244 name
= f
.dispatch_name()
246 print '\t.p2align\t4,,15'
247 print '\t.globl\tGL_PREFIX(%s)' % (name
)
248 print '\t.type\tGL_PREFIX(%s), @function' % (name
)
249 if not f
.is_static_entry_point(f
.name
):
250 print '\tHIDDEN(GL_PREFIX(%s))' % (name
)
251 print 'GL_PREFIX(%s):' % (name
)
252 print '#if defined(GLX_USE_TLS)'
253 print '\tcall\t_x86_64_get_dispatch@PLT'
254 print '\tmovq\t%u(%%rax), %%r11' % (f
.offset
* 8)
256 print '#elif defined(PTHREADS)'
258 save_all_regs(registers
)
259 print '\tcall\t_x86_64_get_dispatch@PLT'
260 restore_all_regs(registers
)
263 print '\tmovq\t(%rax), %r11'
265 print '\tmovq\t%u(%%rax), %%r11' % (f
.offset
* 8)
270 print '\tmovq\t_glapi_Dispatch(%rip), %rax'
271 print '\ttestq\t%rax, %rax'
273 print '\tmovq\t%u(%%rax), %%r11' % (f
.offset
* 8)
277 save_all_regs(registers
)
278 print '\tcall\t_glapi_get_dispatch'
279 restore_all_regs(registers
)
281 print '\tmovq\t%u(%%rax), %%r11' % (f
.offset
* 8)
283 print '#endif /* defined(GLX_USE_TLS) */'
285 print '\t.size\tGL_PREFIX(%s), .-GL_PREFIX(%s)' % (name
, name
)
290 def printBody(self
, api
):
291 for f
in api
.functionIterateByOffset():
292 self
.printFunction(f
)
295 for f
in api
.functionIterateByOffset():
296 dispatch
= f
.dispatch_name()
297 for n
in f
.entry_points
:
299 if f
.is_static_entry_point(n
):
300 text
= '\t.globl GL_PREFIX(%s) ; .set GL_PREFIX(%s), GL_PREFIX(%s)' % (n
, n
, dispatch
)
302 if f
.has_different_protocol(n
):
303 print '#ifndef GLX_INDIRECT_RENDERING'
312 print "Usage: %s [-f input_file_name] [-m output_mode]" % sys
.argv
[0]
315 if __name__
== '__main__':
316 file_name
= "gl_API.xml"
320 (args
, trail
) = getopt
.getopt(sys
.argv
[1:], "m:f:")
324 for (arg
,val
) in args
:
330 if mode
== "generic":
331 printer
= PrintGenericStubs()
333 print "ERROR: Invalid mode \"%s\" specified." % mode
336 api
= gl_XML
.parse_GL_API(file_name
, glX_XML
.glx_item_factory())