Skip to content

Commit

Permalink
Merge pull request #262 from Liryna/develop
Browse files Browse the repository at this point in the history
Convert ARM64 armasm to armclang
  • Loading branch information
olk authored Aug 28, 2024
2 parents 1bde50e + e878e8e commit f7c27e2
Show file tree
Hide file tree
Showing 4 changed files with 411 additions and 0 deletions.
12 changes: 12 additions & 0 deletions build/Jamfile.v2
Original file line number Diff line number Diff line change
Expand Up @@ -253,6 +253,18 @@ alias asm_sources
<toolset>msvc
;

# ARM64/AAPCS/PE
alias asm_sources
: asm/make_arm64_aapcs_pe_armclang.asm
asm/jump_arm64_aapcs_pe_armclang.asm
asm/ontop_arm64_aapcs_pe_armclang.asm
: <abi>aapcs
<address-model>64
<architecture>arm
<binary-format>pe
<toolset>clang
;

# LOONGARCH64
# LOONGARCH64/SYSV/ELF
alias asm_sources
Expand Down
141 changes: 141 additions & 0 deletions src/asm/jump_arm64_aapcs_pe_armclang.S
Original file line number Diff line number Diff line change
@@ -0,0 +1,141 @@
/*
Copyright Edward Nevill + Oliver Kowalke 2015
Distributed under the Boost Software License, Version 1.0.
(See accompanying file LICENSE_1_0.txt or copy at
http://www.boost.org/LICENSE_1_0.txt)
*/

/******************************************************
* *
* ------------------------------------------------- *
* | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | *
* ------------------------------------------------- *
* | 0x0 | 0x4 | 0x8 | 0xc | 0x10| 0x14| 0x18| 0x1c| *
* ------------------------------------------------- *
* | d8 | d9 | d10 | d11 | *
* ------------------------------------------------- *
* ------------------------------------------------- *
* | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15 | *
* ------------------------------------------------- *
* | 0x20| 0x24| 0x28| 0x2c| 0x30| 0x34| 0x38| 0x3c| *
* ------------------------------------------------- *
* | d12 | d13 | d14 | d15 | *
* ------------------------------------------------- *
* ------------------------------------------------- *
* | 16 | 17 | 18 | 19 | 20 | 21 | 22 | 23 | *
* ------------------------------------------------- *
* | 0x40| 0x44| 0x48| 0x4c| 0x50| 0x54| 0x58| 0x5c| *
* ------------------------------------------------- *
* | x19 | x20 | x21 | x22 | *
* ------------------------------------------------- *
* ------------------------------------------------- *
* | 24 | 25 | 26 | 27 | 28 | 29 | 30 | 31 | *
* ------------------------------------------------- *
* | 0x60| 0x64| 0x68| 0x6c| 0x70| 0x74| 0x78| 0x7c| *
* ------------------------------------------------- *
* | x23 | x24 | x25 | x26 | *
* ------------------------------------------------- *
* ------------------------------------------------- *
* | 32 | 33 | 34 | 35 | 36 | 37 | 38 | 39 | *
* ------------------------------------------------- *
* | 0x80| 0x84| 0x88| 0x8c| 0x90| 0x94| 0x98| 0x9c| *
* ------------------------------------------------- *
* | x27 | x28 | FP | LR | *
* ------------------------------------------------- *
* ------------------------------------------------- *
* | 40 | 41 | 42 | 43 | 44 | 45 | 46 | 47 | *
* ------------------------------------------------- *
* | 0xa0| 0xa4| 0xa8| 0xac| 0xb0| 0xb4| 0xb8| 0xbc| *
* ------------------------------------------------- *
* | fiber data| base | limit | dealloc | *
* ------------------------------------------------- *
* ------------------------------------------------- *
* | 48 | 49 | 50 | 51 | | | *
* ------------------------------------------------- *
* | 0xc0| 0xc4| 0xc8| 0xcc| | | *
* ------------------------------------------------- *
* | PC | align | | | *
* ------------------------------------------------- *
* *
*******************************************************/

.file "jump_arm64_aapcs_pe_armclang.S"
.text
.balign 4

.def jump_fcontext; .scl 2; .type 32; .endef
.seh_proc jump_fcontext
jump_fcontext:
.seh_endprologue
// prepare stack for GP + FPU
sub sp, sp, #0xd0

// save d8 - d15
stp d8, d9, [sp, #0x00]
stp d10, d11, [sp, #0x10]
stp d12, d13, [sp, #0x20]
stp d14, d15, [sp, #0x30]

// save x19-x30
stp x19, x20, [sp, #0x40]
stp x21, x22, [sp, #0x50]
stp x23, x24, [sp, #0x60]
stp x25, x26, [sp, #0x70]
stp x27, x28, [sp, #0x80]
stp x29, x30, [sp, #0x90]

// save LR as PC
str x30, [sp, #0xc0]

// save current stack base and limit
ldp x5, x6, [x18, #0x08] // TeStackBase and TeStackLimit at ksarm64.h
stp x5, x6, [sp, #0xa0]
// save current fiber data and deallocation stack
ldr x5, [x18, #0x1478] // TeDeallocationStack at ksarm64.h
ldr x6, [x18, #0x20] // TeFiberData at ksarm64.h
stp x5, x6, [sp, #0xb0]

// store RSP (pointing to context-data) in X0
mov x4, sp

// restore RSP (pointing to context-data) from X1
mov sp, x0

// restore stack base and limit
ldp x5, x6, [sp, #0xa0]
stp x5, x6, [x18, #0x08] // TeStackBase and TeStackLimit at ksarm64.h
// restore fiber data and deallocation stack
ldp x5, x6, [sp, #0xb0]
str x5, [x18, #0x1478] // TeDeallocationStack at ksarm64.h
str x6, [x18, #0x20] // TeFiberData at ksarm64.h

// load d8 - d15
ldp d8, d9, [sp, #0x00]
ldp d10, d11, [sp, #0x10]
ldp d12, d13, [sp, #0x20]
ldp d14, d15, [sp, #0x30]

// load x19-x30
ldp x19, x20, [sp, #0x40]
ldp x21, x22, [sp, #0x50]
ldp x23, x24, [sp, #0x60]
ldp x25, x26, [sp, #0x70]
ldp x27, x28, [sp, #0x80]
ldp x29, x30, [sp, #0x90]

// return transfer_t from jump
// pass transfer_t as first arg in context function
// X0 == FCTX, X1 == DATA
mov x0, x4

// load pc
ldr x4, [sp, #0xc0]

// restore stack from GP + FPU
add sp, sp, #0xd0

ret x4
.seh_endproc

.section .drectve
.ascii " -export:\"jump_fcontext\""
118 changes: 118 additions & 0 deletions src/asm/make_arm64_aapcs_pe_armclang.S
Original file line number Diff line number Diff line change
@@ -0,0 +1,118 @@
/*
Copyright Edward Nevill + Oliver Kowalke 2015
Distributed under the Boost Software License, Version 1.0.
(See accompanying file LICENSE_1_0.txt or copy at
http://www.boost.org/LICENSE_1_0.txt)
*/

/******************************************************
* *
* ------------------------------------------------- *
* | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | *
* ------------------------------------------------- *
* | 0x0 | 0x4 | 0x8 | 0xc | 0x10| 0x14| 0x18| 0x1c| *
* ------------------------------------------------- *
* | d8 | d9 | d10 | d11 | *
* ------------------------------------------------- *
* ------------------------------------------------- *
* | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15 | *
* ------------------------------------------------- *
* | 0x20| 0x24| 0x28| 0x2c| 0x30| 0x34| 0x38| 0x3c| *
* ------------------------------------------------- *
* | d12 | d13 | d14 | d15 | *
* ------------------------------------------------- *
* ------------------------------------------------- *
* | 16 | 17 | 18 | 19 | 20 | 21 | 22 | 23 | *
* ------------------------------------------------- *
* | 0x40| 0x44| 0x48| 0x4c| 0x50| 0x54| 0x58| 0x5c| *
* ------------------------------------------------- *
* | x19 | x20 | x21 | x22 | *
* ------------------------------------------------- *
* ------------------------------------------------- *
* | 24 | 25 | 26 | 27 | 28 | 29 | 30 | 31 | *
* ------------------------------------------------- *
* | 0x60| 0x64| 0x68| 0x6c| 0x70| 0x74| 0x78| 0x7c| *
* ------------------------------------------------- *
* | x23 | x24 | x25 | x26 | *
* ------------------------------------------------- *
* ------------------------------------------------- *
* | 32 | 33 | 34 | 35 | 36 | 37 | 38 | 39 | *
* ------------------------------------------------- *
* | 0x80| 0x84| 0x88| 0x8c| 0x90| 0x94| 0x98| 0x9c| *
* ------------------------------------------------- *
* | x27 | x28 | FP | LR | *
* ------------------------------------------------- *
* ------------------------------------------------- *
* | 40 | 41 | 42 | 43 | 44 | 45 | 46 | 47 | *
* ------------------------------------------------- *
* | 0xa0| 0xa4| 0xa8| 0xac| 0xb0| 0xb4| 0xb8| 0xbc| *
* ------------------------------------------------- *
* | base | limit | dealloc | fiber data| *
* ------------------------------------------------- *
* ------------------------------------------------- *
* | 48 | 49 | 50 | 51 | | | *
* ------------------------------------------------- *
* | 0xc0| 0xc4| 0xc8| 0xcc| | | *
* ------------------------------------------------- *
* | PC | align | | | *
* ------------------------------------------------- *
* *
*******************************************************/

.file "make_arm64_aapcs_pe_armclang.S"
.text
.balign 4

.globl make_fcontext
.def make_fcontext; .scl 2; .type 32; .endef
.seh_proc make_fcontext
make_fcontext:
.seh_endprologue
// save stack top address to x3
mov x3, x0

// shift address in x0 (allocated stack) to lower 16 byte boundary
and x0, x0, ~0xF

// reserve space for context-data on context-stack
sub x0, x0, #0xd0

// save top address of context_stack as 'base'
str x3, [x0, #0xa0]
// save bottom address of context-stack as 'limit' and 'dealloction stack'
sub x3, x3, x1
stp x3, x3, [x0, #0xa8]
// save 0 as 'fiber data'
str xzr, [x0, #0xb8]

// third arg of make_fcontext() == address of context-function
// store address as x19 for trampoline
str x2, [x0, #0x40]
// store trampoline address as pc
adr x2, trampoline
str x2, [x0, #0xc0]

// save address of finish as return-address for context-function
// will be entered after context-function returns (LR register)
adr x1, finish
str x1, [x0, #0x98]

ret x30 // return pointer to context-data (x0)

trampoline:
stp fp, lr, [sp, #-0x10]!
mov fp, sp
blr x19

finish:
// exit code is zero
mov x0, #0
// exit application
bl _exit

.seh_endproc

.def _exit; .scl 2; .type 32; .endef /* standard C library function */

.section .drectve
.ascii " -export:\"make_fcontext\""
Loading

0 comments on commit f7c27e2

Please sign in to comment.