# (C) Copyright IBM Corporation 2005 # All Rights Reserved. # # Permission is hereby granted, free of charge, to any person obtaining a # copy of this software and associated documentation files (the "Software"), # to deal in the Software without restriction, including without limitation # on the rights to use, copy, modify, merge, publish, distribute, sub # license, and/or sell copies of the Software, and to permit persons to whom # the Software is furnished to do so, subject to the following conditions: # # The above copyright notice and this permission notice (including the next # paragraph) shall be included in all copies or substantial portions of the # Software. # # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, # FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL # IBM AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING # FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS # IN THE SOFTWARE. # # Authors: # Ian Romanick <idr@us.ibm.com> import argparse import copy import license import gl_XML, glX_XML def should_use_push(registers): for [reg, offset] in registers: if reg[1:4] == "xmm": return 0 N = len(registers) return (N & 1) != 0 def local_size(registers): # The x86-64 ABI says "the value (%rsp - 8) is always a multiple of # 16 when control is transfered to the function entry point." This # means that the local stack usage must be (16*N)+8 for some value # of N. (16*N)+8 = (8*(2N))+8 = 8*(2N+1). As long as N is odd, we # meet this requirement. N = (len(registers) | 1) return 8*N def save_all_regs(registers): adjust_stack = 0 if not should_use_push(registers): adjust_stack = local_size(registers) print '\tsubq\t$%u, %%rsp' % (adjust_stack) for [reg, stack_offset] in registers: save_reg( reg, stack_offset, adjust_stack ) return def restore_all_regs(registers): adjust_stack = 0 if not should_use_push(registers): adjust_stack = local_size(registers) temp = copy.deepcopy(registers) while len(temp): [reg, stack_offset] = temp.pop() restore_reg(reg, stack_offset, adjust_stack) if adjust_stack: print '\taddq\t$%u, %%rsp' % (adjust_stack) return def save_reg(reg, offset, use_move): if use_move: if offset == 0: print '\tmovq\t%s, (%%rsp)' % (reg) else: print '\tmovq\t%s, %u(%%rsp)' % (reg, offset) else: print '\tpushq\t%s' % (reg) return def restore_reg(reg, offset, use_move): if use_move: if offset == 0: print '\tmovq\t(%%rsp), %s' % (reg) else: print '\tmovq\t%u(%%rsp), %s' % (offset, reg) else: print '\tpopq\t%s' % (reg) return class PrintGenericStubs(gl_XML.gl_print_base): def __init__(self): gl_XML.gl_print_base.__init__(self) self.name = "gl_x86-64_asm.py (from Mesa)" self.license = license.bsd_license_template % ("(C) Copyright IBM Corporation 2005", "IBM") return def get_stack_size(self, f): size = 0 for p in f.parameterIterator(): size += p.get_stack_size() return size def printRealHeader(self): print "/* If we build with gcc's -fvisibility=hidden flag, we'll need to change" print " * the symbol visibility mode to 'default'." print ' */' print '' print '#include "x86/assyntax.h"' print '' print '#ifdef __GNUC__' print '# pragma GCC visibility push(default)' print '# define HIDDEN(x) .hidden x' print '#else' print '# define HIDDEN(x)' print '#endif' print '' print '# if defined(USE_MGL_NAMESPACE)' print '# define GL_PREFIX(n) GLNAME(CONCAT(mgl,n))' print '# define _glapi_Dispatch _mglapi_Dispatch' print '# else' print '# define GL_PREFIX(n) GLNAME(CONCAT(gl,n))' print '# endif' print '' print '\t.text' print '' print '#ifdef GLX_USE_TLS' print '' print '_x86_64_get_dispatch:' print '\tmovq\t_glapi_tls_Dispatch@GOTTPOFF(%rip), %rax' print '\tmovq\t%fs:(%rax), %rax' print '\tret' print '\t.size\t_x86_64_get_dispatch, .-_x86_64_get_dispatch' print '' print '#elif defined(HAVE_PTHREAD)' print '' print '\t.extern\t_glapi_Dispatch' print '\t.extern\t_gl_DispatchTSD' print '\t.extern\tpthread_getspecific' print '' print '\t.p2align\t4,,15' print '_x86_64_get_dispatch:' print '\tmovq\t_gl_DispatchTSD@GOTPCREL(%rip), %rax' print '\tmovl\t(%rax), %edi' print '\tjmp\tpthread_getspecific@PLT' print '' print '#else' print '' print '\t.extern\t_glapi_get_dispatch' print '' print '#endif' print '' return def printRealFooter(self): print '' print '#if defined (__ELF__) && defined (__linux__)' print ' .section .note.GNU-stack,"",%progbits' print '#endif' return def printFunction(self, f): # The x86-64 ABI divides function parameters into a couple # classes. For the OpenGL interface, the only ones that are # relevant are INTEGER and SSE. Basically, the first 8 # GLfloat or GLdouble parameters are placed in %xmm0 - %xmm7, # the first 6 non-GLfloat / non-GLdouble parameters are placed # in registers listed in int_parameters. # # If more parameters than that are required, they are passed # on the stack. Therefore, we just have to make sure that # %esp hasn't changed when we jump to the actual function. # Since we're jumping to the function (and not calling it), we # have to make sure of that anyway! int_parameters = ["%rdi", "%rsi", "%rdx", "%rcx", "%r8", "%r9"] int_class = 0 sse_class = 0 stack_offset = 0 registers = [] for p in f.parameterIterator(): type_name = p.get_base_type_string() if p.is_pointer() or (type_name != "GLfloat" and type_name != "GLdouble"): if int_class < 6: registers.append( [int_parameters[int_class], stack_offset] ) int_class += 1 stack_offset += 8 else: if sse_class < 8: registers.append( ["%%xmm%u" % (sse_class), stack_offset] ) sse_class += 1 stack_offset += 8 if ((int_class & 1) == 0) and (sse_class == 0): registers.append( ["%rbp", 0] ) name = f.dispatch_name() print '\t.p2align\t4,,15' print '\t.globl\tGL_PREFIX(%s)' % (name) print '\t.type\tGL_PREFIX(%s), @function' % (name) if not f.is_static_entry_point(f.name): print '\tHIDDEN(GL_PREFIX(%s))' % (name) print 'GL_PREFIX(%s):' % (name) print '#if defined(GLX_USE_TLS)' print '\tcall\t_x86_64_get_dispatch@PLT' print '\tmovq\t%u(%%rax), %%r11' % (f.offset * 8) print '\tjmp\t*%r11' print '#elif defined(HAVE_PTHREAD)' save_all_regs(registers) print '\tcall\t_x86_64_get_dispatch@PLT' restore_all_regs(registers) if f.offset == 0: print '\tmovq\t(%rax), %r11' else: print '\tmovq\t%u(%%rax), %%r11' % (f.offset * 8) print '\tjmp\t*%r11' print '#else' print '\tmovq\t_glapi_Dispatch(%rip), %rax' print '\ttestq\t%rax, %rax' print '\tje\t1f' print '\tmovq\t%u(%%rax), %%r11' % (f.offset * 8) print '\tjmp\t*%r11' print '1:' save_all_regs(registers) print '\tcall\t_glapi_get_dispatch' restore_all_regs(registers) print '\tmovq\t%u(%%rax), %%r11' % (f.offset * 8) print '\tjmp\t*%r11' print '#endif /* defined(GLX_USE_TLS) */' print '\t.size\tGL_PREFIX(%s), .-GL_PREFIX(%s)' % (name, name) print '' return def printBody(self, api): for f in api.functionIterateByOffset(): self.printFunction(f) for f in api.functionIterateByOffset(): dispatch = f.dispatch_name() for n in f.entry_points: if n != f.name: if f.is_static_entry_point(n): text = '\t.globl GL_PREFIX(%s) ; .set GL_PREFIX(%s), GL_PREFIX(%s)' % (n, n, dispatch) if f.has_different_protocol(n): print '#ifndef GLX_INDIRECT_RENDERING' print text print '#endif' else: print text return def _parser(): """Parse arguments and return a namespace.""" parser = argparse.ArgumentParser() parser.add_argument('-f', default='gl_API.xml', dest='filename', help='An XML file describing an API') return parser.parse_args() def main(): """Main file.""" args = _parser() printer = PrintGenericStubs() api = gl_XML.parse_GL_API(args.filename, glX_XML.glx_item_factory()) printer.Print(api) if __name__ == '__main__': main()