Text file
src/runtime/sys_windows_arm64.s
1 // Copyright 2018 The Go Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style
3 // license that can be found in the LICENSE file.
4
5 #include "go_asm.h"
6 #include "go_tls.h"
7 #include "textflag.h"
8 #include "funcdata.h"
9 #include "time_windows.h"
10
11 // Offsets into Thread Environment Block (pointer in R18)
12 #define TEB_error 0x68
13 #define TEB_TlsSlots 0x1480
14
15 // Note: R0-R7 are args, R8 is indirect return value address,
16 // R9-R15 are caller-save, R19-R29 are callee-save.
17 //
18 // load_g and save_g (in tls_arm64.s) clobber R27 (REGTMP) and R0.
19
20 // void runtime·asmstdcall(void *c);
21 TEXT runtime·asmstdcall(SB),NOSPLIT|NOFRAME,$0
22 STP.W (R29, R30), -32(RSP) // allocate C ABI stack frame
23 STP (R19, R20), 16(RSP) // save old R19, R20
24 MOVD R0, R19 // save libcall pointer
25 MOVD RSP, R20 // save stack pointer
26
27 // SetLastError(0)
28 MOVD $0, TEB_error(R18_PLATFORM)
29 MOVD libcall_args(R19), R12 // libcall->args
30
31 // Do we have more than 8 arguments?
32 MOVD libcall_n(R19), R0
33 CMP $0, R0; BEQ _0args
34 CMP $1, R0; BEQ _1args
35 CMP $2, R0; BEQ _2args
36 CMP $3, R0; BEQ _3args
37 CMP $4, R0; BEQ _4args
38 CMP $5, R0; BEQ _5args
39 CMP $6, R0; BEQ _6args
40 CMP $7, R0; BEQ _7args
41 CMP $8, R0; BEQ _8args
42
43 // Reserve stack space for remaining args
44 SUB $8, R0, R2
45 ADD $1, R2, R3 // make even number of words for stack alignment
46 AND $~1, R3
47 LSL $3, R3
48 SUB R3, RSP
49
50 // R4: size of stack arguments (n-8)*8
51 // R5: &args[8]
52 // R6: loop counter, from 0 to (n-8)*8
53 // R7: scratch
54 // R8: copy of RSP - (R2)(RSP) assembles as (R2)(ZR)
55 SUB $8, R0, R4
56 LSL $3, R4
57 ADD $(8*8), R12, R5
58 MOVD $0, R6
59 MOVD RSP, R8
60 stackargs:
61 MOVD (R6)(R5), R7
62 MOVD R7, (R6)(R8)
63 ADD $8, R6
64 CMP R6, R4
65 BNE stackargs
66
67 _8args:
68 MOVD (7*8)(R12), R7
69 _7args:
70 MOVD (6*8)(R12), R6
71 _6args:
72 MOVD (5*8)(R12), R5
73 _5args:
74 MOVD (4*8)(R12), R4
75 _4args:
76 MOVD (3*8)(R12), R3
77 _3args:
78 MOVD (2*8)(R12), R2
79 _2args:
80 MOVD (1*8)(R12), R1
81 _1args:
82 MOVD (0*8)(R12), R0
83 _0args:
84
85 MOVD libcall_fn(R19), R12 // branch to libcall->fn
86 BL (R12)
87
88 MOVD R20, RSP // free stack space
89 MOVD R0, libcall_r1(R19) // save return value to libcall->r1
90 // TODO(rsc) floating point like amd64 in libcall->r2?
91
92 // GetLastError
93 MOVD TEB_error(R18_PLATFORM), R0
94 MOVD R0, libcall_err(R19)
95
96 // Restore callee-saved registers.
97 LDP 16(RSP), (R19, R20)
98 LDP.P 32(RSP), (R29, R30)
99 RET
100
101 TEXT runtime·badsignal2(SB),NOSPLIT,$16-0
102 NO_LOCAL_POINTERS
103
104 // stderr
105 MOVD runtime·_GetStdHandle(SB), R1
106 MOVD $-12, R0
107 SUB $16, RSP // skip over saved frame pointer below RSP
108 BL (R1)
109 ADD $16, RSP
110
111 // handle in R0 already
112 MOVD $runtime·badsignalmsg(SB), R1 // lpBuffer
113 MOVD $runtime·badsignallen(SB), R2 // lpNumberOfBytesToWrite
114 MOVD (R2), R2
115 MOVD R13, R3 // lpNumberOfBytesWritten
116 MOVD $0, R4 // lpOverlapped
117 MOVD runtime·_WriteFile(SB), R12
118 SUB $16, RSP // skip over saved frame pointer below RSP
119 BL (R12)
120
121 // Does not return.
122 B runtime·abort(SB)
123
124 RET
125
126 TEXT runtime·getlasterror(SB),NOSPLIT|NOFRAME,$0
127 MOVD TEB_error(R18_PLATFORM), R0
128 MOVD R0, ret+0(FP)
129 RET
130
131 #define SAVE_R19_TO_R28(offset) \
132 MOVD R19, savedR19+((offset)+0*8)(SP); \
133 MOVD R20, savedR20+((offset)+1*8)(SP); \
134 MOVD R21, savedR21+((offset)+2*8)(SP); \
135 MOVD R22, savedR22+((offset)+3*8)(SP); \
136 MOVD R23, savedR23+((offset)+4*8)(SP); \
137 MOVD R24, savedR24+((offset)+5*8)(SP); \
138 MOVD R25, savedR25+((offset)+6*8)(SP); \
139 MOVD R26, savedR26+((offset)+7*8)(SP); \
140 MOVD R27, savedR27+((offset)+8*8)(SP); \
141 MOVD g, savedR28+((offset)+9*8)(SP);
142
143 #define RESTORE_R19_TO_R28(offset) \
144 MOVD savedR19+((offset)+0*8)(SP), R19; \
145 MOVD savedR20+((offset)+1*8)(SP), R20; \
146 MOVD savedR21+((offset)+2*8)(SP), R21; \
147 MOVD savedR22+((offset)+3*8)(SP), R22; \
148 MOVD savedR23+((offset)+4*8)(SP), R23; \
149 MOVD savedR24+((offset)+5*8)(SP), R24; \
150 MOVD savedR25+((offset)+6*8)(SP), R25; \
151 MOVD savedR26+((offset)+7*8)(SP), R26; \
152 MOVD savedR27+((offset)+8*8)(SP), R27; \
153 MOVD savedR28+((offset)+9*8)(SP), g; /* R28 */
154
155 // Called by Windows as a Vectored Exception Handler (VEH).
156 // First argument is pointer to struct containing
157 // exception record and context pointers.
158 // Handler function is stored in R1
159 // Return 0 for 'not handled', -1 for handled.
160 // int32_t sigtramp(
161 // PEXCEPTION_POINTERS ExceptionInfo,
162 // func *GoExceptionHandler);
163 TEXT sigtramp<>(SB),NOSPLIT|NOFRAME,$0
164 // Save R0, R1 (args) as well as LR, R27, R28 (callee-save).
165 MOVD R0, R5
166 MOVD R1, R6
167 MOVD LR, R7
168 MOVD R27, R16 // saved R27 (callee-save)
169 MOVD g, R17 // saved R28 (callee-save from Windows, not really g)
170
171 BL runtime·load_g(SB) // smashes R0, R27, R28 (g)
172 CMP $0, g // is there a current g?
173 BNE 2(PC)
174 BL runtime·badsignal2(SB)
175
176 // Do we need to switch to the g0 stack?
177 MOVD g, R3 // R3 = oldg (for sigtramp_g0)
178 MOVD g_m(g), R2 // R2 = m
179 MOVD m_g0(R2), R2 // R2 = g0
180 CMP g, R2 // if curg == g0
181 BNE switch
182
183 // No: on g0 stack already, tail call to sigtramp_g0.
184 // Restore all the callee-saves so sigtramp_g0 can return to our caller.
185 // We also pass R2 = g0, R3 = oldg, both set above.
186 MOVD R5, R0
187 MOVD R6, R1
188 MOVD R7, LR
189 MOVD R16, R27 // restore R27
190 MOVD R17, g // restore R28
191 B sigtramp_g0<>(SB)
192
193 switch:
194 // switch to g0 stack (but do not update g - that's sigtramp_g0's job)
195 MOVD RSP, R8
196 MOVD (g_sched+gobuf_sp)(R2), R4 // R4 = g->gobuf.sp
197 SUB $(6*8), R4 // alloc space for saves - 2 words below SP for frame pointer, 3 for us to use, 1 for alignment
198 MOVD R4, RSP // switch to g0 stack
199
200 MOVD $0, (0*8)(RSP) // fake saved LR
201 MOVD R7, (1*8)(RSP) // saved LR
202 MOVD R8, (2*8)(RSP) // saved SP
203
204 MOVD R5, R0 // original args
205 MOVD R6, R1 // original args
206 MOVD R16, R27
207 MOVD R17, g // R28
208 BL sigtramp_g0<>(SB)
209
210 // switch back to original stack; g already updated
211 MOVD (1*8)(RSP), R7 // saved LR
212 MOVD (2*8)(RSP), R8 // saved SP
213 MOVD R7, LR
214 MOVD R8, RSP
215 RET
216
217 // sigtramp_g0 is running on the g0 stack, with R2 = g0, R3 = oldg.
218 // But g itself is not set - that's R28, a callee-save register,
219 // and it still holds the value from the Windows DLL caller.
220 TEXT sigtramp_g0<>(SB),NOSPLIT,$128
221 NO_LOCAL_POINTERS
222
223 // Push C callee-save registers R19-R28. LR, FP already saved.
224 SAVE_R19_TO_R28(-10*8)
225
226 MOVD 0(R0), R5 // R5 = ExceptionPointers->ExceptionRecord
227 MOVD 8(R0), R6 // R6 = ExceptionPointers->ContextRecord
228 MOVD R6, context-(11*8)(SP)
229
230 MOVD R2, g // g0
231 BL runtime·save_g(SB) // smashes R0
232
233 MOVD R5, (1*8)(RSP) // arg0 (ExceptionRecord)
234 MOVD R6, (2*8)(RSP) // arg1 (ContextRecord)
235 MOVD R3, (3*8)(RSP) // arg2 (original g)
236 MOVD R3, oldg-(12*8)(SP)
237 BL (R1)
238 MOVD oldg-(12*8)(SP), g
239 BL runtime·save_g(SB) // smashes R0
240 MOVW (4*8)(RSP), R0 // return value (0 or -1)
241
242 // if return value is CONTINUE_SEARCH, do not set up control
243 // flow guard workaround
244 CMP $0, R0
245 BEQ return
246
247 // Check if we need to set up the control flow guard workaround.
248 // On Windows, the stack pointer in the context must lie within
249 // system stack limits when we resume from exception.
250 // Store the resume SP and PC in alternate registers
251 // and return to sigresume on the g0 stack.
252 // sigresume makes no use of the stack at all,
253 // loading SP from R0 and jumping to R1.
254 // Note that smashing R0 and R1 is only safe because we know sigpanic
255 // will not actually return to the original frame, so the registers
256 // are effectively dead. But this does mean we can't use the
257 // same mechanism for async preemption.
258 MOVD context-(11*8)(SP), R6
259 MOVD context_pc(R6), R2 // load PC from context record
260 MOVD $sigresume<>(SB), R1
261
262 CMP R1, R2
263 BEQ return // do not clobber saved SP/PC
264
265 // Save resume SP and PC into R0, R1.
266 MOVD context_xsp(R6), R2
267 MOVD R2, (context_x+0*8)(R6)
268 MOVD context_pc(R6), R2
269 MOVD R2, (context_x+1*8)(R6)
270
271 // Set up context record to return to sigresume on g0 stack
272 MOVD RSP, R2
273 MOVD R2, context_xsp(R6)
274 MOVD $sigresume<>(SB), R2
275 MOVD R2, context_pc(R6)
276
277 return:
278 RESTORE_R19_TO_R28(-10*8) // smashes g
279 RET
280
281 // Trampoline to resume execution from exception handler.
282 // This is part of the control flow guard workaround.
283 // It switches stacks and jumps to the continuation address.
284 // R0 and R1 are set above at the end of sigtramp<>
285 // in the context that starts executing at sigresume<>.
286 TEXT sigresume<>(SB),NOSPLIT|NOFRAME,$0
287 // Important: do not smash LR,
288 // which is set to a live value when handling
289 // a signal by pushing a call to sigpanic onto the stack.
290 MOVD R0, RSP
291 B (R1)
292
293 TEXT runtime·exceptiontramp(SB),NOSPLIT|NOFRAME,$0
294 MOVD $runtime·exceptionhandler(SB), R1
295 B sigtramp<>(SB)
296
297 TEXT runtime·firstcontinuetramp(SB),NOSPLIT|NOFRAME,$0
298 MOVD $runtime·firstcontinuehandler(SB), R1
299 B sigtramp<>(SB)
300
301 TEXT runtime·lastcontinuetramp(SB),NOSPLIT|NOFRAME,$0
302 MOVD $runtime·lastcontinuehandler(SB), R1
303 B sigtramp<>(SB)
304
305 GLOBL runtime·cbctxts(SB), NOPTR, $4
306
307 TEXT runtime·callbackasm1(SB),NOSPLIT,$208-0
308 NO_LOCAL_POINTERS
309
310 // On entry, the trampoline in zcallback_windows_arm64.s left
311 // the callback index in R12 (which is volatile in the C ABI).
312
313 // Save callback register arguments R0-R7.
314 // We do this at the top of the frame so they're contiguous with stack arguments.
315 // The 7*8 setting up R14 looks like a bug but is not: the eighth word
316 // is the space the assembler reserved for our caller's frame pointer,
317 // but we are not called from Go so that space is ours to use,
318 // and we must to be contiguous with the stack arguments.
319 MOVD $arg0-(7*8)(SP), R14
320 MOVD R0, (0*8)(R14)
321 MOVD R1, (1*8)(R14)
322 MOVD R2, (2*8)(R14)
323 MOVD R3, (3*8)(R14)
324 MOVD R4, (4*8)(R14)
325 MOVD R5, (5*8)(R14)
326 MOVD R6, (6*8)(R14)
327 MOVD R7, (7*8)(R14)
328
329 // Push C callee-save registers R19-R28.
330 // LR, FP already saved.
331 SAVE_R19_TO_R28(-18*8)
332
333 // Create a struct callbackArgs on our stack.
334 MOVD $cbargs-(18*8+callbackArgs__size)(SP), R13
335 MOVD R12, callbackArgs_index(R13) // callback index
336 MOVD R14, R0
337 MOVD R0, callbackArgs_args(R13) // address of args vector
338 MOVD $0, R0
339 MOVD R0, callbackArgs_result(R13) // result
340
341 // Call cgocallback, which will call callbackWrap(frame).
342 MOVD $·callbackWrap<ABIInternal>(SB), R0 // PC of function to call, cgocallback takes an ABIInternal entry-point
343 MOVD R13, R1 // frame (&callbackArgs{...})
344 MOVD $0, R2 // context
345 MOVD R0, (1*8)(RSP)
346 MOVD R1, (2*8)(RSP)
347 MOVD R2, (3*8)(RSP)
348 BL runtime·cgocallback(SB)
349
350 // Get callback result.
351 MOVD $cbargs-(18*8+callbackArgs__size)(SP), R13
352 MOVD callbackArgs_result(R13), R0
353
354 RESTORE_R19_TO_R28(-18*8)
355
356 RET
357
358 // uint32 tstart_stdcall(M *newm);
359 TEXT runtime·tstart_stdcall(SB),NOSPLIT,$96-0
360 SAVE_R19_TO_R28(-10*8)
361
362 MOVD m_g0(R0), g
363 MOVD R0, g_m(g)
364 BL runtime·save_g(SB)
365
366 // Set up stack guards for OS stack.
367 MOVD RSP, R0
368 MOVD R0, g_stack+stack_hi(g)
369 SUB $(64*1024), R0
370 MOVD R0, (g_stack+stack_lo)(g)
371 MOVD R0, g_stackguard0(g)
372 MOVD R0, g_stackguard1(g)
373
374 BL runtime·emptyfunc(SB) // fault if stack check is wrong
375 BL runtime·mstart(SB)
376
377 RESTORE_R19_TO_R28(-10*8)
378
379 // Exit the thread.
380 MOVD $0, R0
381 RET
382
383 // Runs on OS stack.
384 // duration (in -100ns units) is in dt+0(FP).
385 // g may be nil.
386 TEXT runtime·usleep2(SB),NOSPLIT,$32-4
387 MOVW dt+0(FP), R0
388 MOVD $16(RSP), R2 // R2 = pTime
389 MOVD R0, 0(R2) // *pTime = -dt
390 MOVD $-1, R0 // R0 = handle
391 MOVD $0, R1 // R1 = FALSE (alertable)
392 MOVD runtime·_NtWaitForSingleObject(SB), R3
393 SUB $16, RSP // skip over saved frame pointer below RSP
394 BL (R3)
395 ADD $16, RSP
396 RET
397
398 // Runs on OS stack.
399 // duration (in -100ns units) is in dt+0(FP).
400 // g is valid.
401 // TODO: neeeds to be implemented properly.
402 TEXT runtime·usleep2HighRes(SB),NOSPLIT,$0-4
403 B runtime·abort(SB)
404
405 // Runs on OS stack.
406 TEXT runtime·switchtothread(SB),NOSPLIT,$16-0
407 MOVD runtime·_SwitchToThread(SB), R0
408 SUB $16, RSP // skip over saved frame pointer below RSP
409 BL (R0)
410 ADD $16, RSP
411 RET
412
413 TEXT runtime·nanotime1(SB),NOSPLIT|NOFRAME,$0-8
414 MOVB runtime·useQPCTime(SB), R0
415 CMP $0, R0
416 BNE useQPC
417 MOVD $_INTERRUPT_TIME, R3
418 MOVD time_lo(R3), R0
419 MOVD $100, R1
420 MUL R1, R0
421 MOVD R0, ret+0(FP)
422 RET
423 useQPC:
424 B runtime·nanotimeQPC(SB) // tail call
425
426 // This is called from rt0_go, which runs on the system stack
427 // using the initial stack allocated by the OS.
428 // It calls back into standard C using the BL below.
429 TEXT runtime·wintls(SB),NOSPLIT,$0
430 // Allocate a TLS slot to hold g across calls to external code
431 MOVD runtime·_TlsAlloc(SB), R0
432 SUB $16, RSP // skip over saved frame pointer below RSP
433 BL (R0)
434 ADD $16, RSP
435
436 // Assert that slot is less than 64 so we can use _TEB->TlsSlots
437 CMP $64, R0
438 BLT ok
439 MOVD $runtime·abort(SB), R1
440 BL (R1)
441 ok:
442
443 // Save offset from R18 into tls_g.
444 LSL $3, R0
445 ADD $TEB_TlsSlots, R0
446 MOVD R0, runtime·tls_g(SB)
447 RET
448
View as plain text