// Copyright 2009 The Go Authors. All rights reserved. // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. #include "go_asm.h" #include "go_tls.h" #include "textflag.h" // void runtime·asmstdcall(void *c); TEXT runtime·asmstdcall(SB),NOSPLIT,$0 MOVL fn+0(FP), BX // SetLastError(0). MOVL $0, 0x34(FS) // Copy args to the stack. MOVL SP, BP MOVL libcall_n(BX), CX // words MOVL CX, AX SALL $2, AX SUBL AX, SP // room for args MOVL SP, DI MOVL libcall_args(BX), SI CLD REP; MOVSL // Call stdcall or cdecl function. // DI SI BP BX are preserved, SP is not CALL libcall_fn(BX) MOVL BP, SP // Return result. MOVL fn+0(FP), BX MOVL AX, libcall_r1(BX) MOVL DX, libcall_r2(BX) // GetLastError(). MOVL 0x34(FS), AX MOVL AX, libcall_err(BX) RET TEXT runtime·badsignal2(SB),NOSPLIT,$24 // stderr MOVL $-12, 0(SP) MOVL SP, BP CALL *runtime·_GetStdHandle(SB) MOVL BP, SP MOVL AX, 0(SP) // handle MOVL $runtime·badsignalmsg(SB), DX // pointer MOVL DX, 4(SP) MOVL runtime·badsignallen(SB), DX // count MOVL DX, 8(SP) LEAL 20(SP), DX // written count MOVL $0, 0(DX) MOVL DX, 12(SP) MOVL $0, 16(SP) // overlapped CALL *runtime·_WriteFile(SB) MOVL BP, SI RET // faster get/set last error TEXT runtime·getlasterror(SB),NOSPLIT,$0 MOVL 0x34(FS), AX MOVL AX, ret+0(FP) RET TEXT runtime·setlasterror(SB),NOSPLIT,$0 MOVL err+0(FP), AX MOVL AX, 0x34(FS) RET // Called by Windows as a Vectored Exception Handler (VEH). // First argument is pointer to struct containing // exception record and context pointers. // Handler function is stored in AX. // Return 0 for 'not handled', -1 for handled. TEXT runtime·sigtramp(SB),NOSPLIT,$0-0 MOVL ptrs+0(FP), CX SUBL $40, SP // save callee-saved registers MOVL BX, 28(SP) MOVL BP, 16(SP) MOVL SI, 20(SP) MOVL DI, 24(SP) MOVL AX, SI // save handler address // find g get_tls(DX) CMPL DX, $0 JNE 3(PC) MOVL $0, AX // continue JMP done MOVL g(DX), DX CMPL DX, $0 JNE 2(PC) CALL runtime·badsignal2(SB) // save g and SP in case of stack switch MOVL DX, 32(SP) // g MOVL SP, 36(SP) // do we need to switch to the g0 stack? MOVL g_m(DX), BX MOVL m_g0(BX), BX CMPL DX, BX JEQ g0 // switch to the g0 stack get_tls(BP) MOVL BX, g(BP) MOVL (g_sched+gobuf_sp)(BX), DI // make it look like mstart called us on g0, to stop traceback SUBL $4, DI MOVL $runtime·mstart(SB), 0(DI) // traceback will think that we've done SUBL // on this stack, so subtract them here to match. // (we need room for sighandler arguments anyway). // and re-save old SP for restoring later. SUBL $40, DI MOVL SP, 36(DI) MOVL DI, SP g0: MOVL 0(CX), BX // ExceptionRecord* MOVL 4(CX), CX // Context* MOVL BX, 0(SP) MOVL CX, 4(SP) MOVL DX, 8(SP) CALL SI // call handler // AX is set to report result back to Windows MOVL 12(SP), AX // switch back to original stack and g // no-op if we never left. MOVL 36(SP), SP MOVL 32(SP), DX get_tls(BP) MOVL DX, g(BP) done: // restore callee-saved registers MOVL 24(SP), DI MOVL 20(SP), SI MOVL 16(SP), BP MOVL 28(SP), BX ADDL $40, SP // RET 4 (return and pop 4 bytes parameters) BYTE $0xC2; WORD $4 RET // unreached; make assembler happy TEXT runtime·exceptiontramp(SB),NOSPLIT,$0 MOVL $runtime·exceptionhandler(SB), AX JMP runtime·sigtramp(SB) TEXT runtime·firstcontinuetramp(SB),NOSPLIT,$0-0 // is never called INT $3 TEXT runtime·lastcontinuetramp(SB),NOSPLIT,$0-0 MOVL $runtime·lastcontinuehandler(SB), AX JMP runtime·sigtramp(SB) TEXT runtime·ctrlhandler(SB),NOSPLIT,$0 PUSHL $runtime·ctrlhandler1(SB) CALL runtime·externalthreadhandler(SB) MOVL 4(SP), CX ADDL $12, SP JMP CX TEXT runtime·profileloop(SB),NOSPLIT,$0 PUSHL $runtime·profileloop1(SB) CALL runtime·externalthreadhandler(SB) MOVL 4(SP), CX ADDL $12, SP JMP CX TEXT runtime·externalthreadhandler(SB),NOSPLIT,$0 PUSHL BP MOVL SP, BP PUSHL BX PUSHL SI PUSHL DI PUSHL 0x14(FS) MOVL SP, DX // setup dummy m, g SUBL $m__size, SP // space for M MOVL SP, 0(SP) MOVL $m__size, 4(SP) CALL runtime·memclrNoHeapPointers(SB) // smashes AX,BX,CX LEAL m_tls(SP), CX MOVL CX, 0x14(FS) MOVL SP, BX SUBL $g__size, SP // space for G MOVL SP, g(CX) MOVL SP, m_g0(BX) MOVL SP, 0(SP) MOVL $g__size, 4(SP) CALL runtime·memclrNoHeapPointers(SB) // smashes AX,BX,CX LEAL g__size(SP), BX MOVL BX, g_m(SP) LEAL -32768(SP), CX // must be less than SizeOfStackReserve set by linker MOVL CX, (g_stack+stack_lo)(SP) ADDL $const__StackGuard, CX MOVL CX, g_stackguard0(SP) MOVL CX, g_stackguard1(SP) MOVL DX, (g_stack+stack_hi)(SP) PUSHL AX // room for return value PUSHL 16(BP) // arg for handler CALL 8(BP) POPL CX POPL AX // pass return value to Windows in AX get_tls(CX) MOVL g(CX), CX MOVL (g_stack+stack_hi)(CX), SP POPL 0x14(FS) POPL DI POPL SI POPL BX POPL BP RET GLOBL runtime·cbctxts(SB), NOPTR, $4 TEXT runtime·callbackasm1+0(SB),NOSPLIT,$0 MOVL 0(SP), AX // will use to find our callback context // remove return address from stack, we are not returning there ADDL $4, SP // address to callback parameters into CX LEAL 4(SP), CX // save registers as required for windows callback PUSHL DI PUSHL SI PUSHL BP PUSHL BX // determine index into runtime·cbctxts table SUBL $runtime·callbackasm(SB), AX MOVL $0, DX MOVL $5, BX // divide by 5 because each call instruction in runtime·callbacks is 5 bytes long DIVL BX // find correspondent runtime·cbctxts table entry MOVL runtime·cbctxts(SB), BX MOVL -4(BX)(AX*4), BX // extract callback context MOVL wincallbackcontext_gobody(BX), AX MOVL wincallbackcontext_argsize(BX), DX // preserve whatever's at the memory location that // the callback will use to store the return value PUSHL 0(CX)(DX*1) // extend argsize by size of return value ADDL $4, DX // remember how to restore stack on return MOVL wincallbackcontext_restorestack(BX), BX PUSHL BX // call target Go function PUSHL DX // argsize (including return value) PUSHL CX // callback parameters PUSHL AX // address of target Go function CLD CALL runtime·cgocallback_gofunc(SB) POPL AX POPL CX POPL DX // how to restore stack on return POPL BX // return value into AX (as per Windows spec) // and restore previously preserved value MOVL -4(CX)(DX*1), AX POPL -4(CX)(DX*1) MOVL BX, CX // cannot use BX anymore // restore registers as required for windows callback POPL BX POPL BP POPL SI POPL DI // remove callback parameters before return (as per Windows spec) POPL DX ADDL CX, SP PUSHL DX CLD RET // void tstart(M *newm); TEXT runtime·tstart(SB),NOSPLIT,$0 MOVL newm+0(FP), CX // m MOVL m_g0(CX), DX // g // Layout new m scheduler stack on os stack. MOVL SP, AX MOVL AX, (g_stack+stack_hi)(DX) SUBL $(64*1024), AX // initial stack size (adjusted later) MOVL AX, (g_stack+stack_lo)(DX) ADDL $const__StackGuard, AX MOVL AX, g_stackguard0(DX) MOVL AX, g_stackguard1(DX) // Set up tls. LEAL m_tls(CX), SI MOVL SI, 0x14(FS) MOVL CX, g_m(DX) MOVL DX, g(SI) // Someday the convention will be D is always cleared. CLD CALL runtime·stackcheck(SB) // clobbers AX,CX CALL runtime·mstart(SB) RET // uint32 tstart_stdcall(M *newm); TEXT runtime·tstart_stdcall(SB),NOSPLIT,$0 MOVL newm+0(FP), BX PUSHL BX CALL runtime·tstart(SB) POPL BX // Adjust stack for stdcall to return properly. MOVL (SP), AX // save return address ADDL $4, SP // remove single parameter MOVL AX, (SP) // restore return address XORL AX, AX // return 0 == success RET // setldt(int entry, int address, int limit) TEXT runtime·setldt(SB),NOSPLIT,$0 MOVL address+4(FP), CX MOVL CX, 0x14(FS) RET // onosstack calls fn on OS stack. // func onosstack(fn unsafe.Pointer, arg uint32) TEXT runtime·onosstack(SB),NOSPLIT,$0 MOVL fn+0(FP), AX // to hide from 8l MOVL arg+4(FP), BX // Execute call on m->g0 stack, in case we are not actually // calling a system call wrapper, like when running under WINE. get_tls(CX) CMPL CX, $0 JNE 3(PC) // Not a Go-managed thread. Do not switch stack. CALL AX RET MOVL g(CX), BP MOVL g_m(BP), BP // leave pc/sp for cpu profiler MOVL (SP), SI MOVL SI, m_libcallpc(BP) MOVL g(CX), SI MOVL SI, m_libcallg(BP) // sp must be the last, because once async cpu profiler finds // all three values to be non-zero, it will use them LEAL usec+0(FP), SI MOVL SI, m_libcallsp(BP) MOVL m_g0(BP), SI CMPL g(CX), SI JNE switch // executing on m->g0 already CALL AX JMP ret switch: // Switch to m->g0 stack and back. MOVL (g_sched+gobuf_sp)(SI), SI MOVL SP, -4(SI) LEAL -4(SI), SP CALL AX MOVL 0(SP), SP ret: get_tls(CX) MOVL g(CX), BP MOVL g_m(BP), BP MOVL $0, m_libcallsp(BP) RET // Runs on OS stack. duration (in 100ns units) is in BX. TEXT runtime·usleep2(SB),NOSPLIT,$20 // Want negative 100ns units. NEGL BX MOVL $-1, hi-4(SP) MOVL BX, lo-8(SP) LEAL lo-8(SP), BX MOVL BX, ptime-12(SP) MOVL $0, alertable-16(SP) MOVL $-1, handle-20(SP) MOVL SP, BP MOVL runtime·_NtWaitForSingleObject(SB), AX CALL AX MOVL BP, SP RET // Runs on OS stack. TEXT runtime·switchtothread(SB),NOSPLIT,$0 MOVL SP, BP MOVL runtime·_SwitchToThread(SB), AX CALL AX MOVL BP, SP RET // See https://www.dcl.hpi.uni-potsdam.de/research/WRK/2007/08/getting-os-information-the-kuser_shared_data-structure/ // Must read hi1, then lo, then hi2. The snapshot is valid if hi1 == hi2. #define _INTERRUPT_TIME 0x7ffe0008 #define _SYSTEM_TIME 0x7ffe0014 #define time_lo 0 #define time_hi1 4 #define time_hi2 8 TEXT runtime·nanotime(SB),NOSPLIT,$0-8 CMPB runtime·useQPCTime(SB), $0 JNE useQPC loop: MOVL (_INTERRUPT_TIME+time_hi1), AX MOVL (_INTERRUPT_TIME+time_lo), CX MOVL (_INTERRUPT_TIME+time_hi2), DI CMPL AX, DI JNE loop // wintime = DI:CX, multiply by 100 MOVL $100, AX MULL CX IMULL $100, DI ADDL DI, DX // wintime*100 = DX:AX MOVL AX, ret_lo+0(FP) MOVL DX, ret_hi+4(FP) RET useQPC: JMP runtime·nanotimeQPC(SB) RET TEXT time·now(SB),NOSPLIT,$0-20 CMPB runtime·useQPCTime(SB), $0 JNE useQPC loop: MOVL (_INTERRUPT_TIME+time_hi1), AX MOVL (_INTERRUPT_TIME+time_lo), CX MOVL (_INTERRUPT_TIME+time_hi2), DI CMPL AX, DI JNE loop // w = DI:CX // multiply by 100 MOVL $100, AX MULL CX IMULL $100, DI ADDL DI, DX // w*100 = DX:AX MOVL AX, mono+12(FP) MOVL DX, mono+16(FP) wall: MOVL (_SYSTEM_TIME+time_hi1), CX MOVL (_SYSTEM_TIME+time_lo), AX MOVL (_SYSTEM_TIME+time_hi2), DX CMPL CX, DX JNE wall // w = DX:AX // convert to Unix epoch (but still 100ns units) #define delta 116444736000000000 SUBL $(delta & 0xFFFFFFFF), AX SBBL $(delta >> 32), DX // nano/100 = DX:AX // split into two decimal halves by div 1e9. // (decimal point is two spots over from correct place, // but we avoid overflow in the high word.) MOVL $1000000000, CX DIVL CX MOVL AX, DI MOVL DX, SI // DI = nano/100/1e9 = nano/1e11 = sec/100, DX = SI = nano/100%1e9 // split DX into seconds and nanoseconds by div 1e7 magic multiply. MOVL DX, AX MOVL $1801439851, CX MULL CX SHRL $22, DX MOVL DX, BX IMULL $10000000, DX MOVL SI, CX SUBL DX, CX // DI = sec/100 (still) // BX = (nano/100%1e9)/1e7 = (nano/1e9)%100 = sec%100 // CX = (nano/100%1e9)%1e7 = (nano%1e9)/100 = nsec/100 // store nsec for return IMULL $100, CX MOVL CX, nsec+8(FP) // DI = sec/100 (still) // BX = sec%100 // construct DX:AX = 64-bit sec and store for return MOVL $0, DX MOVL $100, AX MULL DI ADDL BX, AX ADCL $0, DX MOVL AX, sec+0(FP) MOVL DX, sec+4(FP) RET useQPC: JMP runtime·nowQPC(SB) RET