|  | // Copyright 2009 The Go Authors. All rights reserved. | 
|  | // Use of this source code is governed by a BSD-style | 
|  | // license that can be found in the LICENSE file. | 
|  |  | 
|  | #include "go_asm.h" | 
|  | #include "go_tls.h" | 
|  | #include "textflag.h" | 
|  |  | 
|  | // void runtime·asmstdcall(void *c); | 
|  | TEXT runtime·asmstdcall(SB),NOSPLIT,$0 | 
|  | MOVL	fn+0(FP), BX | 
|  |  | 
|  | // SetLastError(0). | 
|  | MOVL	$0, 0x34(FS) | 
|  |  | 
|  | // Copy args to the stack. | 
|  | MOVL	SP, BP | 
|  | MOVL	libcall_n(BX), CX	// words | 
|  | MOVL	CX, AX | 
|  | SALL	$2, AX | 
|  | SUBL	AX, SP			// room for args | 
|  | MOVL	SP, DI | 
|  | MOVL	libcall_args(BX), SI | 
|  | CLD | 
|  | REP; MOVSL | 
|  |  | 
|  | // Call stdcall or cdecl function. | 
|  | // DI SI BP BX are preserved, SP is not | 
|  | CALL	libcall_fn(BX) | 
|  | MOVL	BP, SP | 
|  |  | 
|  | // Return result. | 
|  | MOVL	fn+0(FP), BX | 
|  | MOVL	AX, libcall_r1(BX) | 
|  | MOVL	DX, libcall_r2(BX) | 
|  |  | 
|  | // GetLastError(). | 
|  | MOVL	0x34(FS), AX | 
|  | MOVL	AX, libcall_err(BX) | 
|  |  | 
|  | RET | 
|  |  | 
|  | TEXT	runtime·badsignal2(SB),NOSPLIT,$24 | 
|  | // stderr | 
|  | MOVL	$-12, 0(SP) | 
|  | MOVL	SP, BP | 
|  | CALL	*runtime·_GetStdHandle(SB) | 
|  | MOVL	BP, SP | 
|  |  | 
|  | MOVL	AX, 0(SP)	// handle | 
|  | MOVL	$runtime·badsignalmsg(SB), DX // pointer | 
|  | MOVL	DX, 4(SP) | 
|  | MOVL	runtime·badsignallen(SB), DX // count | 
|  | MOVL	DX, 8(SP) | 
|  | LEAL	20(SP), DX  // written count | 
|  | MOVL	$0, 0(DX) | 
|  | MOVL	DX, 12(SP) | 
|  | MOVL	$0, 16(SP) // overlapped | 
|  | CALL	*runtime·_WriteFile(SB) | 
|  | MOVL	BP, SI | 
|  | RET | 
|  |  | 
|  | // faster get/set last error | 
|  | TEXT runtime·getlasterror(SB),NOSPLIT,$0 | 
|  | MOVL	0x34(FS), AX | 
|  | MOVL	AX, ret+0(FP) | 
|  | RET | 
|  |  | 
|  | TEXT runtime·setlasterror(SB),NOSPLIT,$0 | 
|  | MOVL	err+0(FP), AX | 
|  | MOVL	AX, 0x34(FS) | 
|  | RET | 
|  |  | 
|  | // Called by Windows as a Vectored Exception Handler (VEH). | 
|  | // First argument is pointer to struct containing | 
|  | // exception record and context pointers. | 
|  | // Handler function is stored in AX. | 
|  | // Return 0 for 'not handled', -1 for handled. | 
|  | TEXT sigtramp<>(SB),NOSPLIT,$0-0 | 
|  | MOVL	ptrs+0(FP), CX | 
|  | SUBL	$40, SP | 
|  |  | 
|  | // save callee-saved registers | 
|  | MOVL	BX, 28(SP) | 
|  | MOVL	BP, 16(SP) | 
|  | MOVL	SI, 20(SP) | 
|  | MOVL	DI, 24(SP) | 
|  |  | 
|  | MOVL	AX, SI	// save handler address | 
|  |  | 
|  | // find g | 
|  | get_tls(DX) | 
|  | CMPL	DX, $0 | 
|  | JNE	3(PC) | 
|  | MOVL	$0, AX // continue | 
|  | JMP	done | 
|  | MOVL	g(DX), DX | 
|  | CMPL	DX, $0 | 
|  | JNE	2(PC) | 
|  | CALL	runtime·badsignal2(SB) | 
|  |  | 
|  | // save g and SP in case of stack switch | 
|  | MOVL	DX, 32(SP)	// g | 
|  | MOVL	SP, 36(SP) | 
|  |  | 
|  | // do we need to switch to the g0 stack? | 
|  | MOVL	g_m(DX), BX | 
|  | MOVL	m_g0(BX), BX | 
|  | CMPL	DX, BX | 
|  | JEQ	g0 | 
|  |  | 
|  | // switch to the g0 stack | 
|  | get_tls(BP) | 
|  | MOVL	BX, g(BP) | 
|  | MOVL	(g_sched+gobuf_sp)(BX), DI | 
|  | // make it look like mstart called us on g0, to stop traceback | 
|  | SUBL	$4, DI | 
|  | MOVL	$runtime·mstart(SB), 0(DI) | 
|  | // traceback will think that we've done SUBL | 
|  | // on this stack, so subtract them here to match. | 
|  | // (we need room for sighandler arguments anyway). | 
|  | // and re-save old SP for restoring later. | 
|  | SUBL	$40, DI | 
|  | MOVL	SP, 36(DI) | 
|  | MOVL	DI, SP | 
|  |  | 
|  | g0: | 
|  | MOVL	0(CX), BX // ExceptionRecord* | 
|  | MOVL	4(CX), CX // Context* | 
|  | MOVL	BX, 0(SP) | 
|  | MOVL	CX, 4(SP) | 
|  | MOVL	DX, 8(SP) | 
|  | CALL	SI	// call handler | 
|  | // AX is set to report result back to Windows | 
|  | MOVL	12(SP), AX | 
|  |  | 
|  | // switch back to original stack and g | 
|  | // no-op if we never left. | 
|  | MOVL	36(SP), SP | 
|  | MOVL	32(SP), DX | 
|  | get_tls(BP) | 
|  | MOVL	DX, g(BP) | 
|  |  | 
|  | done: | 
|  | // restore callee-saved registers | 
|  | MOVL	24(SP), DI | 
|  | MOVL	20(SP), SI | 
|  | MOVL	16(SP), BP | 
|  | MOVL	28(SP), BX | 
|  |  | 
|  | ADDL	$40, SP | 
|  | // RET 4 (return and pop 4 bytes parameters) | 
|  | BYTE $0xC2; WORD $4 | 
|  | RET // unreached; make assembler happy | 
|  |  | 
|  | TEXT runtime·exceptiontramp(SB),NOSPLIT,$0 | 
|  | MOVL	$runtime·exceptionhandler(SB), AX | 
|  | JMP	sigtramp<>(SB) | 
|  |  | 
|  | TEXT runtime·firstcontinuetramp(SB),NOSPLIT,$0-0 | 
|  | // is never called | 
|  | INT	$3 | 
|  |  | 
|  | TEXT runtime·lastcontinuetramp(SB),NOSPLIT,$0-0 | 
|  | MOVL	$runtime·lastcontinuehandler(SB), AX | 
|  | JMP	sigtramp<>(SB) | 
|  |  | 
|  | // Called by OS using stdcall ABI: bool ctrlhandler(uint32). | 
|  | TEXT runtime·ctrlhandler(SB),NOSPLIT,$0 | 
|  | PUSHL	$runtime·ctrlhandler1(SB) | 
|  | NOP	SP	// tell vet SP changed - stop checking offsets | 
|  | CALL	runtime·externalthreadhandler(SB) | 
|  | MOVL	4(SP), CX | 
|  | ADDL	$12, SP | 
|  | JMP	CX | 
|  |  | 
|  | // Called by OS using stdcall ABI: uint32 profileloop(void*). | 
|  | TEXT runtime·profileloop(SB),NOSPLIT,$0 | 
|  | PUSHL	$runtime·profileloop1(SB) | 
|  | NOP	SP	// tell vet SP changed - stop checking offsets | 
|  | CALL	runtime·externalthreadhandler(SB) | 
|  | MOVL	4(SP), CX | 
|  | ADDL	$12, SP | 
|  | JMP	CX | 
|  |  | 
|  | TEXT runtime·externalthreadhandler(SB),NOSPLIT,$0 | 
|  | PUSHL	BP | 
|  | MOVL	SP, BP | 
|  | PUSHL	BX | 
|  | PUSHL	SI | 
|  | PUSHL	DI | 
|  | PUSHL	0x14(FS) | 
|  | MOVL	SP, DX | 
|  |  | 
|  | // setup dummy m, g | 
|  | SUBL	$m__size, SP		// space for M | 
|  | MOVL	SP, 0(SP) | 
|  | MOVL	$m__size, 4(SP) | 
|  | CALL	runtime·memclrNoHeapPointers(SB)	// smashes AX,BX,CX | 
|  |  | 
|  | LEAL	m_tls(SP), CX | 
|  | MOVL	CX, 0x14(FS) | 
|  | MOVL	SP, BX | 
|  | SUBL	$g__size, SP		// space for G | 
|  | MOVL	SP, g(CX) | 
|  | MOVL	SP, m_g0(BX) | 
|  |  | 
|  | MOVL	SP, 0(SP) | 
|  | MOVL	$g__size, 4(SP) | 
|  | CALL	runtime·memclrNoHeapPointers(SB)	// smashes AX,BX,CX | 
|  | LEAL	g__size(SP), BX | 
|  | MOVL	BX, g_m(SP) | 
|  |  | 
|  | LEAL	-32768(SP), CX		// must be less than SizeOfStackReserve set by linker | 
|  | MOVL	CX, (g_stack+stack_lo)(SP) | 
|  | ADDL	$const__StackGuard, CX | 
|  | MOVL	CX, g_stackguard0(SP) | 
|  | MOVL	CX, g_stackguard1(SP) | 
|  | MOVL	DX, (g_stack+stack_hi)(SP) | 
|  |  | 
|  | PUSHL	AX			// room for return value | 
|  | PUSHL	16(BP)			// arg for handler | 
|  | CALL	8(BP) | 
|  | POPL	CX | 
|  | POPL	AX			// pass return value to Windows in AX | 
|  |  | 
|  | get_tls(CX) | 
|  | MOVL	g(CX), CX | 
|  | MOVL	(g_stack+stack_hi)(CX), SP | 
|  | POPL	0x14(FS) | 
|  | POPL	DI | 
|  | POPL	SI | 
|  | POPL	BX | 
|  | POPL	BP | 
|  | RET | 
|  |  | 
|  | GLOBL runtime·cbctxts(SB), NOPTR, $4 | 
|  |  | 
|  | TEXT runtime·callbackasm1(SB),NOSPLIT,$0 | 
|  | MOVL	0(SP), AX	// will use to find our callback context | 
|  |  | 
|  | // remove return address from stack, we are not returning there | 
|  | ADDL	$4, SP | 
|  |  | 
|  | // address to callback parameters into CX | 
|  | LEAL	4(SP), CX | 
|  |  | 
|  | // save registers as required for windows callback | 
|  | PUSHL	DI | 
|  | PUSHL	SI | 
|  | PUSHL	BP | 
|  | PUSHL	BX | 
|  |  | 
|  | // determine index into runtime·cbctxts table | 
|  | SUBL	$runtime·callbackasm(SB), AX | 
|  | MOVL	$0, DX | 
|  | MOVL	$5, BX	// divide by 5 because each call instruction in runtime·callbacks is 5 bytes long | 
|  | DIVL	BX | 
|  |  | 
|  | // find correspondent runtime·cbctxts table entry | 
|  | MOVL	runtime·cbctxts(SB), BX | 
|  | MOVL	-4(BX)(AX*4), BX | 
|  |  | 
|  | // extract callback context | 
|  | MOVL	wincallbackcontext_gobody(BX), AX | 
|  | MOVL	wincallbackcontext_argsize(BX), DX | 
|  |  | 
|  | // preserve whatever's at the memory location that | 
|  | // the callback will use to store the return value | 
|  | PUSHL	0(CX)(DX*1) | 
|  |  | 
|  | // extend argsize by size of return value | 
|  | ADDL	$4, DX | 
|  |  | 
|  | // remember how to restore stack on return | 
|  | MOVL	wincallbackcontext_restorestack(BX), BX | 
|  | PUSHL	BX | 
|  |  | 
|  | // call target Go function | 
|  | PUSHL	DX			// argsize (including return value) | 
|  | PUSHL	CX			// callback parameters | 
|  | PUSHL	AX			// address of target Go function | 
|  | CLD | 
|  | CALL	runtime·cgocallback_gofunc(SB) | 
|  | POPL	AX | 
|  | POPL	CX | 
|  | POPL	DX | 
|  |  | 
|  | // how to restore stack on return | 
|  | POPL	BX | 
|  |  | 
|  | // return value into AX (as per Windows spec) | 
|  | // and restore previously preserved value | 
|  | MOVL	-4(CX)(DX*1), AX | 
|  | POPL	-4(CX)(DX*1) | 
|  |  | 
|  | MOVL	BX, CX			// cannot use BX anymore | 
|  |  | 
|  | // restore registers as required for windows callback | 
|  | POPL	BX | 
|  | POPL	BP | 
|  | POPL	SI | 
|  | POPL	DI | 
|  |  | 
|  | // remove callback parameters before return (as per Windows spec) | 
|  | POPL	DX | 
|  | ADDL	CX, SP | 
|  | PUSHL	DX | 
|  |  | 
|  | CLD | 
|  |  | 
|  | RET | 
|  |  | 
|  | // void tstart(M *newm); | 
|  | TEXT tstart<>(SB),NOSPLIT,$0 | 
|  | MOVL	newm+0(FP), CX		// m | 
|  | MOVL	m_g0(CX), DX		// g | 
|  |  | 
|  | // Layout new m scheduler stack on os stack. | 
|  | MOVL	SP, AX | 
|  | MOVL	AX, (g_stack+stack_hi)(DX) | 
|  | SUBL	$(64*1024), AX		// initial stack size (adjusted later) | 
|  | MOVL	AX, (g_stack+stack_lo)(DX) | 
|  | ADDL	$const__StackGuard, AX | 
|  | MOVL	AX, g_stackguard0(DX) | 
|  | MOVL	AX, g_stackguard1(DX) | 
|  |  | 
|  | // Set up tls. | 
|  | LEAL	m_tls(CX), SI | 
|  | MOVL	SI, 0x14(FS) | 
|  | MOVL	CX, g_m(DX) | 
|  | MOVL	DX, g(SI) | 
|  |  | 
|  | // Someday the convention will be D is always cleared. | 
|  | CLD | 
|  |  | 
|  | CALL	runtime·stackcheck(SB)	// clobbers AX,CX | 
|  | CALL	runtime·mstart(SB) | 
|  |  | 
|  | RET | 
|  |  | 
|  | // uint32 tstart_stdcall(M *newm); | 
|  | TEXT runtime·tstart_stdcall(SB),NOSPLIT,$0 | 
|  | MOVL	newm+0(FP), BX | 
|  |  | 
|  | PUSHL	BX | 
|  | CALL	tstart<>(SB) | 
|  | POPL	BX | 
|  |  | 
|  | // Adjust stack for stdcall to return properly. | 
|  | MOVL	(SP), AX		// save return address | 
|  | ADDL	$4, SP			// remove single parameter | 
|  | MOVL	AX, (SP)		// restore return address | 
|  |  | 
|  | XORL	AX, AX			// return 0 == success | 
|  |  | 
|  | RET | 
|  |  | 
|  | // setldt(int entry, int address, int limit) | 
|  | TEXT runtime·setldt(SB),NOSPLIT,$0 | 
|  | MOVL	base+4(FP), CX | 
|  | MOVL	CX, 0x14(FS) | 
|  | RET | 
|  |  | 
|  | // onosstack calls fn on OS stack. | 
|  | // func onosstack(fn unsafe.Pointer, arg uint32) | 
|  | TEXT runtime·onosstack(SB),NOSPLIT,$0 | 
|  | MOVL	fn+0(FP), AX		// to hide from 8l | 
|  | MOVL	arg+4(FP), BX | 
|  |  | 
|  | // Execute call on m->g0 stack, in case we are not actually | 
|  | // calling a system call wrapper, like when running under WINE. | 
|  | get_tls(CX) | 
|  | CMPL	CX, $0 | 
|  | JNE	3(PC) | 
|  | // Not a Go-managed thread. Do not switch stack. | 
|  | CALL	AX | 
|  | RET | 
|  |  | 
|  | MOVL	g(CX), BP | 
|  | MOVL	g_m(BP), BP | 
|  |  | 
|  | // leave pc/sp for cpu profiler | 
|  | MOVL	(SP), SI | 
|  | MOVL	SI, m_libcallpc(BP) | 
|  | MOVL	g(CX), SI | 
|  | MOVL	SI, m_libcallg(BP) | 
|  | // sp must be the last, because once async cpu profiler finds | 
|  | // all three values to be non-zero, it will use them | 
|  | LEAL	fn+0(FP), SI | 
|  | MOVL	SI, m_libcallsp(BP) | 
|  |  | 
|  | MOVL	m_g0(BP), SI | 
|  | CMPL	g(CX), SI | 
|  | JNE	switch | 
|  | // executing on m->g0 already | 
|  | CALL	AX | 
|  | JMP	ret | 
|  |  | 
|  | switch: | 
|  | // Switch to m->g0 stack and back. | 
|  | MOVL	(g_sched+gobuf_sp)(SI), SI | 
|  | MOVL	SP, -4(SI) | 
|  | LEAL	-4(SI), SP | 
|  | CALL	AX | 
|  | MOVL	0(SP), SP | 
|  |  | 
|  | ret: | 
|  | get_tls(CX) | 
|  | MOVL	g(CX), BP | 
|  | MOVL	g_m(BP), BP | 
|  | MOVL	$0, m_libcallsp(BP) | 
|  | RET | 
|  |  | 
|  | // Runs on OS stack. duration (in 100ns units) is in BX. | 
|  | TEXT runtime·usleep2(SB),NOSPLIT,$20 | 
|  | // Want negative 100ns units. | 
|  | NEGL	BX | 
|  | MOVL	$-1, hi-4(SP) | 
|  | MOVL	BX, lo-8(SP) | 
|  | LEAL	lo-8(SP), BX | 
|  | MOVL	BX, ptime-12(SP) | 
|  | MOVL	$0, alertable-16(SP) | 
|  | MOVL	$-1, handle-20(SP) | 
|  | MOVL	SP, BP | 
|  | MOVL	runtime·_NtWaitForSingleObject(SB), AX | 
|  | CALL	AX | 
|  | MOVL	BP, SP | 
|  | RET | 
|  |  | 
|  | // Runs on OS stack. | 
|  | TEXT runtime·switchtothread(SB),NOSPLIT,$0 | 
|  | MOVL	SP, BP | 
|  | MOVL	runtime·_SwitchToThread(SB), AX | 
|  | CALL	AX | 
|  | MOVL	BP, SP | 
|  | RET | 
|  |  | 
|  | // See https://www.dcl.hpi.uni-potsdam.de/research/WRK/2007/08/getting-os-information-the-kuser_shared_data-structure/ | 
|  | // Must read hi1, then lo, then hi2. The snapshot is valid if hi1 == hi2. | 
|  | #define _INTERRUPT_TIME 0x7ffe0008 | 
|  | #define _SYSTEM_TIME 0x7ffe0014 | 
|  | #define time_lo 0 | 
|  | #define time_hi1 4 | 
|  | #define time_hi2 8 | 
|  |  | 
|  | TEXT runtime·nanotime(SB),NOSPLIT,$0-8 | 
|  | CMPB	runtime·useQPCTime(SB), $0 | 
|  | JNE	useQPC | 
|  | loop: | 
|  | MOVL	(_INTERRUPT_TIME+time_hi1), AX | 
|  | MOVL	(_INTERRUPT_TIME+time_lo), CX | 
|  | MOVL	(_INTERRUPT_TIME+time_hi2), DI | 
|  | CMPL	AX, DI | 
|  | JNE	loop | 
|  |  | 
|  | // wintime = DI:CX, multiply by 100 | 
|  | MOVL	$100, AX | 
|  | MULL	CX | 
|  | IMULL	$100, DI | 
|  | ADDL	DI, DX | 
|  | // wintime*100 = DX:AX | 
|  | MOVL	AX, ret_lo+0(FP) | 
|  | MOVL	DX, ret_hi+4(FP) | 
|  | RET | 
|  | useQPC: | 
|  | JMP	runtime·nanotimeQPC(SB) | 
|  | RET | 
|  |  | 
|  | TEXT time·now(SB),NOSPLIT,$0-20 | 
|  | CMPB	runtime·useQPCTime(SB), $0 | 
|  | JNE	useQPC | 
|  | loop: | 
|  | MOVL	(_INTERRUPT_TIME+time_hi1), AX | 
|  | MOVL	(_INTERRUPT_TIME+time_lo), CX | 
|  | MOVL	(_INTERRUPT_TIME+time_hi2), DI | 
|  | CMPL	AX, DI | 
|  | JNE	loop | 
|  |  | 
|  | // w = DI:CX | 
|  | // multiply by 100 | 
|  | MOVL	$100, AX | 
|  | MULL	CX | 
|  | IMULL	$100, DI | 
|  | ADDL	DI, DX | 
|  | // w*100 = DX:AX | 
|  | MOVL	AX, mono+12(FP) | 
|  | MOVL	DX, mono+16(FP) | 
|  |  | 
|  | wall: | 
|  | MOVL	(_SYSTEM_TIME+time_hi1), CX | 
|  | MOVL	(_SYSTEM_TIME+time_lo), AX | 
|  | MOVL	(_SYSTEM_TIME+time_hi2), DX | 
|  | CMPL	CX, DX | 
|  | JNE	wall | 
|  |  | 
|  | // w = DX:AX | 
|  | // convert to Unix epoch (but still 100ns units) | 
|  | #define delta 116444736000000000 | 
|  | SUBL	$(delta & 0xFFFFFFFF), AX | 
|  | SBBL $(delta >> 32), DX | 
|  |  | 
|  | // nano/100 = DX:AX | 
|  | // split into two decimal halves by div 1e9. | 
|  | // (decimal point is two spots over from correct place, | 
|  | // but we avoid overflow in the high word.) | 
|  | MOVL	$1000000000, CX | 
|  | DIVL	CX | 
|  | MOVL	AX, DI | 
|  | MOVL	DX, SI | 
|  |  | 
|  | // DI = nano/100/1e9 = nano/1e11 = sec/100, DX = SI = nano/100%1e9 | 
|  | // split DX into seconds and nanoseconds by div 1e7 magic multiply. | 
|  | MOVL	DX, AX | 
|  | MOVL	$1801439851, CX | 
|  | MULL	CX | 
|  | SHRL	$22, DX | 
|  | MOVL	DX, BX | 
|  | IMULL	$10000000, DX | 
|  | MOVL	SI, CX | 
|  | SUBL	DX, CX | 
|  |  | 
|  | // DI = sec/100 (still) | 
|  | // BX = (nano/100%1e9)/1e7 = (nano/1e9)%100 = sec%100 | 
|  | // CX = (nano/100%1e9)%1e7 = (nano%1e9)/100 = nsec/100 | 
|  | // store nsec for return | 
|  | IMULL	$100, CX | 
|  | MOVL	CX, nsec+8(FP) | 
|  |  | 
|  | // DI = sec/100 (still) | 
|  | // BX = sec%100 | 
|  | // construct DX:AX = 64-bit sec and store for return | 
|  | MOVL	$0, DX | 
|  | MOVL	$100, AX | 
|  | MULL	DI | 
|  | ADDL	BX, AX | 
|  | ADCL	$0, DX | 
|  | MOVL	AX, sec+0(FP) | 
|  | MOVL	DX, sec+4(FP) | 
|  | RET | 
|  | useQPC: | 
|  | JMP	runtime·nowQPC(SB) | 
|  | RET |