/* * Mesa 3-D graphics library * * Copyright (C) 1999-2008 Brian Paul All Rights Reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included * in all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR * OTHER DEALINGS IN THE SOFTWARE. */ /** * \file glapi_entrypoint.c * * Arch-specific code for manipulating GL API entrypoints (dispatch stubs). */ #include <string.h> #include "c11/threads.h" #include "glapi/glapi_priv.h" #include "u_execmem.h" #ifdef USE_X86_ASM #if defined( GLX_USE_TLS ) extern GLubyte gl_dispatch_functions_start[]; extern GLubyte gl_dispatch_functions_end[]; #else extern const GLubyte gl_dispatch_functions_start[]; #endif #endif /* USE_X86_ASM */ #if defined(DISPATCH_FUNCTION_SIZE) _glapi_proc get_entrypoint_address(unsigned int functionOffset) { return (_glapi_proc) (gl_dispatch_functions_start + (DISPATCH_FUNCTION_SIZE * functionOffset)); } #endif #if defined(USE_X86_ASM) /** * Perform platform-specific GL API entry-point fixups. */ static void init_glapi_relocs( void ) { #if defined(GLX_USE_TLS) && !defined(GLX_X86_READONLY_TEXT) extern unsigned long _x86_get_dispatch(void); char run_time_patch[] = { 0x65, 0xa1, 0, 0, 0, 0 /* movl %gs:0,%eax */ }; GLuint *offset = (GLuint *) &run_time_patch[2]; /* 32-bits for x86/32 */ const GLubyte * const get_disp = (const GLubyte *) run_time_patch; GLubyte * curr_func = (GLubyte *) gl_dispatch_functions_start; *offset = _x86_get_dispatch(); while ( curr_func != (GLubyte *) gl_dispatch_functions_end ) { (void) memcpy( curr_func, get_disp, sizeof(run_time_patch)); curr_func += DISPATCH_FUNCTION_SIZE; } #endif } /** * Generate a dispatch function (entrypoint) which jumps through * the given slot number (offset) in the current dispatch table. * We need assembly language in order to accomplish this. */ _glapi_proc generate_entrypoint(unsigned int functionOffset) { /* 32 is chosen as something of a magic offset. For x86, the dispatch * at offset 32 is the first one where the offset in the * "jmp OFFSET*4(%eax)" can't be encoded in a single byte. */ const GLubyte * const template_func = gl_dispatch_functions_start + (DISPATCH_FUNCTION_SIZE * 32); GLubyte * const code = (GLubyte *) u_execmem_alloc(DISPATCH_FUNCTION_SIZE); if ( code != NULL ) { (void) memcpy(code, template_func, DISPATCH_FUNCTION_SIZE); fill_in_entrypoint_offset( (_glapi_proc) code, functionOffset ); } return (_glapi_proc) code; } /** * This function inserts a new dispatch offset into the assembly language * stub that was generated with the preceeding function. */ void fill_in_entrypoint_offset(_glapi_proc entrypoint, unsigned int offset) { GLubyte * const code = (GLubyte *) entrypoint; #if defined(GLX_USE_TLS) *((unsigned int *)(code + 8)) = 4 * offset; #else *((unsigned int *)(code + 11)) = 4 * offset; *((unsigned int *)(code + 22)) = 4 * offset; #endif } #elif defined(USE_SPARC_ASM) extern void __glapi_sparc_icache_flush(unsigned int *); static void init_glapi_relocs( void ) { #if defined(HAVE_PTHREAD) || defined(GLX_USE_TLS) static const unsigned int template[] = { #ifdef GLX_USE_TLS 0x05000000, /* sethi %hi(_glapi_tls_Dispatch), %g2 */ 0x8730e00a, /* srl %g3, 10, %g3 */ 0x8410a000, /* or %g2, %lo(_glapi_tls_Dispatch), %g2 */ #ifdef __arch64__ 0xc259c002, /* ldx [%g7 + %g2], %g1 */ 0xc2584003, /* ldx [%g1 + %g3], %g1 */ #else 0xc201c002, /* ld [%g7 + %g2], %g1 */ 0xc2004003, /* ld [%g1 + %g3], %g1 */ #endif 0x81c04000, /* jmp %g1 */ 0x01000000, /* nop */ #else #ifdef __arch64__ 0x03000000, /* 64-bit 0x00 --> sethi %hh(_glapi_Dispatch), %g1 */ 0x05000000, /* 64-bit 0x04 --> sethi %lm(_glapi_Dispatch), %g2 */ 0x82106000, /* 64-bit 0x08 --> or %g1, %hm(_glapi_Dispatch), %g1 */ 0x8730e00a, /* 64-bit 0x0c --> srl %g3, 10, %g3 */ 0x83287020, /* 64-bit 0x10 --> sllx %g1, 32, %g1 */ 0x82004002, /* 64-bit 0x14 --> add %g1, %g2, %g1 */ 0xc2586000, /* 64-bit 0x18 --> ldx [%g1 + %lo(_glapi_Dispatch)], %g1 */ #else 0x03000000, /* 32-bit 0x00 --> sethi %hi(_glapi_Dispatch), %g1 */ 0x8730e00a, /* 32-bit 0x04 --> srl %g3, 10, %g3 */ 0xc2006000, /* 32-bit 0x08 --> ld [%g1 + %lo(_glapi_Dispatch)], %g1 */ #endif 0x80a06000, /* --> cmp %g1, 0 */ 0x02800005, /* --> be +4*5 */ 0x01000000, /* --> nop */ #ifdef __arch64__ 0xc2584003, /* 64-bit --> ldx [%g1 + %g3], %g1 */ #else 0xc2004003, /* 32-bit --> ld [%g1 + %g3], %g1 */ #endif 0x81c04000, /* --> jmp %g1 */ 0x01000000, /* --> nop */ #ifdef __arch64__ 0x9de3bf80, /* 64-bit --> save %sp, -128, %sp */ #else 0x9de3bfc0, /* 32-bit --> save %sp, -64, %sp */ #endif 0xa0100003, /* --> mov %g3, %l0 */ 0x40000000, /* --> call _glapi_get_dispatch */ 0x01000000, /* --> nop */ 0x82100008, /* --> mov %o0, %g1 */ 0x86100010, /* --> mov %l0, %g3 */ 0x10bffff7, /* --> ba -4*9 */ 0x81e80000, /* --> restore */ #endif }; #ifdef GLX_USE_TLS extern unsigned int __glapi_sparc_tls_stub; extern unsigned long __glapi_sparc_get_dispatch(void); unsigned int *code = &__glapi_sparc_tls_stub; unsigned long dispatch = __glapi_sparc_get_dispatch(); #else extern unsigned int __glapi_sparc_pthread_stub; unsigned int *code = &__glapi_sparc_pthread_stub; unsigned long dispatch = (unsigned long) &_glapi_Dispatch; unsigned long call_dest = (unsigned long ) &_glapi_get_dispatch; int idx; #endif #ifdef GLX_USE_TLS code[0] = template[0] | (dispatch >> 10); code[1] = template[1]; __glapi_sparc_icache_flush(&code[0]); code[2] = template[2] | (dispatch & 0x3ff); code[3] = template[3]; __glapi_sparc_icache_flush(&code[2]); code[4] = template[4]; code[5] = template[5]; __glapi_sparc_icache_flush(&code[4]); code[6] = template[6]; __glapi_sparc_icache_flush(&code[6]); #else #if defined(__arch64__) code[0] = template[0] | (dispatch >> (32 + 10)); code[1] = template[1] | ((dispatch & 0xffffffff) >> 10); __glapi_sparc_icache_flush(&code[0]); code[2] = template[2] | ((dispatch >> 32) & 0x3ff); code[3] = template[3]; __glapi_sparc_icache_flush(&code[2]); code[4] = template[4]; code[5] = template[5]; __glapi_sparc_icache_flush(&code[4]); code[6] = template[6] | (dispatch & 0x3ff); idx = 7; #else code[0] = template[0] | (dispatch >> 10); code[1] = template[1]; __glapi_sparc_icache_flush(&code[0]); code[2] = template[2] | (dispatch & 0x3ff); idx = 3; #endif code[idx + 0] = template[idx + 0]; __glapi_sparc_icache_flush(&code[idx - 1]); code[idx + 1] = template[idx + 1]; code[idx + 2] = template[idx + 2]; __glapi_sparc_icache_flush(&code[idx + 1]); code[idx + 3] = template[idx + 3]; code[idx + 4] = template[idx + 4]; __glapi_sparc_icache_flush(&code[idx + 3]); code[idx + 5] = template[idx + 5]; code[idx + 6] = template[idx + 6]; __glapi_sparc_icache_flush(&code[idx + 5]); code[idx + 7] = template[idx + 7]; code[idx + 8] = template[idx + 8] | (((call_dest - ((unsigned long) &code[idx + 8])) >> 2) & 0x3fffffff); __glapi_sparc_icache_flush(&code[idx + 7]); code[idx + 9] = template[idx + 9]; code[idx + 10] = template[idx + 10]; __glapi_sparc_icache_flush(&code[idx + 9]); code[idx + 11] = template[idx + 11]; code[idx + 12] = template[idx + 12]; __glapi_sparc_icache_flush(&code[idx + 11]); code[idx + 13] = template[idx + 13]; __glapi_sparc_icache_flush(&code[idx + 13]); #endif #endif } _glapi_proc generate_entrypoint(GLuint functionOffset) { #if defined(HAVE_PTHREAD) || defined(GLX_USE_TLS) static const unsigned int template[] = { 0x07000000, /* sethi %hi(0), %g3 */ 0x8210000f, /* mov %o7, %g1 */ 0x40000000, /* call */ 0x9e100001, /* mov %g1, %o7 */ }; #ifdef GLX_USE_TLS extern unsigned int __glapi_sparc_tls_stub; unsigned long call_dest = (unsigned long ) &__glapi_sparc_tls_stub; #else extern unsigned int __glapi_sparc_pthread_stub; unsigned long call_dest = (unsigned long ) &__glapi_sparc_pthread_stub; #endif unsigned int *code = (unsigned int *) u_execmem_alloc(sizeof(template)); if (code) { code[0] = template[0] | (functionOffset & 0x3fffff); code[1] = template[1]; __glapi_sparc_icache_flush(&code[0]); code[2] = template[2] | (((call_dest - ((unsigned long) &code[2])) >> 2) & 0x3fffffff); code[3] = template[3]; __glapi_sparc_icache_flush(&code[2]); } return (_glapi_proc) code; #endif } void fill_in_entrypoint_offset(_glapi_proc entrypoint, GLuint offset) { unsigned int *code = (unsigned int *) entrypoint; code[0] &= ~0x3fffff; code[0] |= (offset * sizeof(void *)) & 0x3fffff; __glapi_sparc_icache_flush(&code[0]); } #else /* USE_*_ASM */ static void init_glapi_relocs( void ) { } _glapi_proc generate_entrypoint(GLuint functionOffset) { (void) functionOffset; return NULL; } void fill_in_entrypoint_offset(_glapi_proc entrypoint, GLuint offset) { /* an unimplemented architecture */ (void) entrypoint; (void) offset; } #endif /* USE_*_ASM */ void init_glapi_relocs_once( void ) { #if defined(HAVE_PTHREAD) || defined(GLX_USE_TLS) static once_flag flag = ONCE_FLAG_INIT; call_once(&flag, init_glapi_relocs); #endif }