|
| 1 | +; Based on the code by Samuel Williams. Created by Sergey Fedorov on 04/06/2022. |
| 2 | +; Credits to Samuel Williams, Rei Odaira and Iain Sandoe. Errors, if any, are mine. |
| 3 | +; Some relevant examples: https://github.com/gcc-mirror/gcc/blob/master/libphobos/libdruntime/config/powerpc/switchcontext.S |
| 4 | +; https://github.com/gcc-mirror/gcc/blob/master/libgcc/config/rs6000/darwin-gpsave.S |
| 5 | +; https://www.ibm.com/docs/en/aix/7.2?topic=epilogs-saving-gprs-only |
| 6 | +; ppc32 version may be re-written compactly with stmw/lwm, but the code wonʼt be faster, see: https://github.com/ruby/ruby/pull/5927#issuecomment-1139730541 |
| 7 | + |
| 8 | +; Notice that this code is only for Darwin (macOS). Darwin ABI differs from AIX and ELF. |
| 9 | +; To add support for AIX, *BSD or *Linux, please make separate implementations. |
| 10 | + |
1 | 11 | #define TOKEN_PASTE(x,y) x##y
|
2 | 12 | #define PREFIXED_SYMBOL(prefix,name) TOKEN_PASTE(prefix,name)
|
3 | 13 |
|
| 14 | +.machine ppc7400 ; = G4, Rosetta |
4 | 15 | .text
|
5 |
| -.align 2 |
6 | 16 |
|
7 | 17 | .globl PREFIXED_SYMBOL(SYMBOL_PREFIX,coroutine_transfer)
|
| 18 | +.align 2 |
| 19 | + |
8 | 20 | PREFIXED_SYMBOL(SYMBOL_PREFIX,coroutine_transfer):
|
9 |
| - # Make space on the stack for caller registers |
10 |
| - addi r1,r1,-80 |
| 21 | + ; Make space on the stack for caller registers |
| 22 | + ; (Should we rather use red zone? See libphobos example.) |
| 23 | + subi r1,r1,80 |
| 24 | + |
| 25 | + ; Get LR |
| 26 | + mflr r0 |
11 | 27 |
|
12 |
| - # Save caller registers |
13 |
| - stw r13,0(r1) |
14 |
| - stw r14,4(r1) |
15 |
| - stw r15,8(r1) |
16 |
| - stw r16,12(r1) |
17 |
| - stw r17,16(r1) |
18 |
| - stw r18,20(r1) |
19 |
| - stw r19,24(r1) |
20 |
| - stw r20,28(r1) |
21 |
| - stw r21,32(r1) |
| 28 | + ; Save caller registers |
| 29 | + stw r31,0(r1) |
| 30 | + stw r30,4(r1) |
| 31 | + stw r29,8(r1) |
| 32 | + stw r28,12(r1) |
| 33 | + stw r27,16(r1) |
| 34 | + stw r26,20(r1) |
| 35 | + stw r25,24(r1) |
| 36 | + stw r24,28(r1) |
| 37 | + stw r23,32(r1) |
22 | 38 | stw r22,36(r1)
|
23 |
| - stw r23,40(r1) |
24 |
| - stw r24,44(r1) |
25 |
| - stw r25,48(r1) |
26 |
| - stw r26,52(r1) |
27 |
| - stw r27,56(r1) |
28 |
| - stw r28,60(r1) |
29 |
| - stw r29,64(r1) |
30 |
| - stw r30,68(r1) |
31 |
| - stw r31,72(r1) |
| 39 | + stw r21,40(r1) |
| 40 | + stw r20,44(r1) |
| 41 | + stw r19,48(r1) |
| 42 | + stw r18,52(r1) |
| 43 | + stw r17,56(r1) |
| 44 | + stw r16,60(r1) |
| 45 | + stw r15,64(r1) |
| 46 | + stw r14,68(r1) |
| 47 | + stw r13,72(r1) |
32 | 48 |
|
33 |
| - # Save return address |
34 |
| - mflr r0 |
| 49 | + ; Save return address |
| 50 | + ; Possibly should rather be saved into linkage area, see libphobos and IBM docs |
35 | 51 | stw r0,76(r1)
|
36 | 52 |
|
37 |
| - # Save stack pointer to first argument |
| 53 | + ; Save stack pointer to first argument |
38 | 54 | stw r1,0(r3)
|
39 | 55 |
|
40 |
| - # Load stack pointer from second argument |
| 56 | + ; Load stack pointer from second argument |
41 | 57 | lwz r1,0(r4)
|
42 | 58 |
|
43 |
| - # Restore caller registers |
44 |
| - lwz r13,0(r1) |
45 |
| - lwz r14,4(r1) |
46 |
| - lwz r15,8(r1) |
47 |
| - lwz r16,12(r1) |
48 |
| - lwz r17,16(r1) |
49 |
| - lwz r18,20(r1) |
50 |
| - lwz r19,24(r1) |
51 |
| - lwz r20,28(r1) |
52 |
| - lwz r21,32(r1) |
| 59 | + ; Load return address |
| 60 | + lwz r0,76(r1) |
| 61 | + |
| 62 | + ; Restore caller registers |
| 63 | + lwz r13,72(r1) |
| 64 | + lwz r14,68(r1) |
| 65 | + lwz r15,64(r1) |
| 66 | + lwz r16,60(r1) |
| 67 | + lwz r17,56(r1) |
| 68 | + lwz r18,52(r1) |
| 69 | + lwz r19,48(r1) |
| 70 | + lwz r20,44(r1) |
| 71 | + lwz r21,40(r1) |
53 | 72 | lwz r22,36(r1)
|
54 |
| - lwz r23,40(r1) |
55 |
| - lwz r24,44(r1) |
56 |
| - lwz r25,48(r1) |
57 |
| - lwz r26,52(r1) |
58 |
| - lwz r27,56(r1) |
59 |
| - lwz r28,60(r1) |
60 |
| - lwz r29,64(r1) |
61 |
| - lwz r30,68(r1) |
62 |
| - lwz r31,72(r1) |
| 73 | + lwz r23,32(r1) |
| 74 | + lwz r24,28(r1) |
| 75 | + lwz r25,24(r1) |
| 76 | + lwz r26,20(r1) |
| 77 | + lwz r27,16(r1) |
| 78 | + lwz r28,12(r1) |
| 79 | + lwz r29,8(r1) |
| 80 | + lwz r30,4(r1) |
| 81 | + lwz r31,0(r1) |
63 | 82 |
|
64 |
| - # Load return address |
65 |
| - lwz r0,76(r1) |
| 83 | + ; Set LR |
66 | 84 | mtlr r0
|
67 | 85 |
|
68 |
| - # Pop stack frame |
| 86 | + ; Pop stack frame |
69 | 87 | addi r1,r1,80
|
70 | 88 |
|
71 |
| - # Jump to return address |
| 89 | + ; Jump to return address |
72 | 90 | blr
|
73 |
| - |
|
0 commit comments