123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512 |
- /* SPDX-License-Identifier: MIT */
- /* Copyright (c) 2021-2022 The SRS Authors */
/* If the user disables the ASM (for example, to avoid bugs in it), do not compile it. */
- #if !defined(MD_ST_NO_ASM)
- #if defined(__aarch64__)
- /****************************************************************/
- /* See https://developer.arm.com/documentation/102374/0100/Function-calls */
- /* See https://developer.arm.com/documentation/102374/0100/Procedure-Call-Standard */
- /* See https://github.com/ARM-software/abi-aa/blob/main/aapcs64/aapcs64.rst#machine-registers */
- /* See https://wiki.cdot.senecacollege.ca/wiki/AArch64_Register_and_Instruction_Quick_Start */
- /* See https://chromium.googlesource.com/native_client/nacl-glibc/+/glibc-2.21/sysdeps/aarch64/__longjmp.S */
- /* See https://chromium.googlesource.com/native_client/nacl-glibc/+/glibc-2.21/sysdeps/aarch64/setjmp.S */
/*
 * Layout of the saved context, given as indices of 8-byte slots in env
 * (the code scales every index with "<<3").
 *
 * x19-x28 are the general-purpose registers a called routine is expected
 * to preserve. The save/restore code uses stp/ldp pairs and therefore only
 * names the first constant of each pair; the second constant documents the
 * slot that the pair's second register lands in.
 */
#define JB_X19   0
#define JB_X20   1
#define JB_X21   2
#define JB_X22   3
#define JB_X23   4
#define JB_X24   5
#define JB_X25   6
#define JB_X26   7
#define JB_X27   8
#define JB_X28   9
/* x29 is the frame register and x30 the link register. */
#define JB_X29  10
#define JB_LR   11
/* Index 12 is not assigned to any register by this file. */
/* Register 31 is the stack pointer when used by stack-related instructions. */
#define JB_SP   13
/* FP registers d8-d15. */
#define JB_D8   14
#define JB_D9   15
#define JB_D10  16
#define JB_D11  17
#define JB_D12  18
#define JB_D13  19
#define JB_D14  20
#define JB_D15  21
    .file   "md.S"
    .text
/*
 * _st_md_cxt_save(__jmp_buf env)
 *
 * Records the current context in env and returns 0.
 *   In:      x0 = env
 *   Saved:   x19-x28, x29, x30, d8-d15, sp (slots given by the JB_* indices)
 *   Out:     x0 = 0
 *   Scratch: x2
 */
    .globl  _st_md_cxt_save
    .type   _st_md_cxt_save, %function
    .align  4
_st_md_cxt_save:
    /* sp is copied through x2 before being stored. */
    mov     x2, sp
    str     x2, [x0, #JB_SP<<3]

    /* General-purpose registers, two per store. */
    stp     x19, x20, [x0, #JB_X19<<3]
    stp     x21, x22, [x0, #JB_X21<<3]
    stp     x23, x24, [x0, #JB_X23<<3]
    stp     x25, x26, [x0, #JB_X25<<3]
    stp     x27, x28, [x0, #JB_X27<<3]
    stp     x29, x30, [x0, #JB_X29<<3]     /* frame register + link register */

    /* FP registers d8-d15. */
    stp     d8,  d9,  [x0, #JB_D8<<3]
    stp     d10, d11, [x0, #JB_D10<<3]
    stp     d12, d13, [x0, #JB_D12<<3]
    stp     d14, d15, [x0, #JB_D14<<3]

    mov     x0, #0                          /* direct call returns 0 */
    ret
    .size   _st_md_cxt_save, .-_st_md_cxt_save
- /****************************************************************/
/*
 * _st_md_cxt_restore(__jmp_buf env, int val)
 *
 * Reloads the context stored in env and resumes at the saved link register,
 * so execution continues as if the matching _st_md_cxt_save had returned.
 *   In:      x0 = env, w1 = val
 *   Loaded:  x19-x28, x29, x30, d8-d15, sp
 *   Out:     w0 = val, or 1 when val is 0 (the resumed save never sees 0)
 *   Scratch: x5
 */
    .globl  _st_md_cxt_restore
    .type   _st_md_cxt_restore, %function
    .align  4
_st_md_cxt_restore:
    ldp     x19, x20, [x0, #JB_X19<<3]
    ldp     x21, x22, [x0, #JB_X21<<3]
    ldp     x23, x24, [x0, #JB_X23<<3]
    ldp     x25, x26, [x0, #JB_X25<<3]
    ldp     x27, x28, [x0, #JB_X27<<3]
    ldp     x29, x30, [x0, #JB_X29<<3]     /* frame register + resume address */
    ldp     d8,  d9,  [x0, #JB_D8<<3]
    ldp     d10, d11, [x0, #JB_D10<<3]
    ldp     d12, d13, [x0, #JB_D12<<3]
    ldp     d14, d15, [x0, #JB_D14<<3]
    ldr     x5, [x0, #JB_SP<<3]
    mov     sp, x5
    /*
     * val is a 32-bit int, so only w1 is meaningful; the upper half of x1
     * is not defined by the procedure call standard. Test and return the
     * 32-bit view so that val == 0 is always turned into 1.
     */
    cmp     w1, #0
    csinc   w0, w1, wzr, ne                 /* w0 = (val != 0) ? val : 0 + 1 */
    /* Use br instead of ret because ret is guaranteed to mispredict */
    br      x30
    .size   _st_md_cxt_restore, .-_st_md_cxt_restore
- /****************************************************************/
- #elif defined(__arm__)
- /****************************************************************/
/* https://github.com/ossrs/srs/issues/1282#issuecomment-445539513 */
/*
 * Register list shared by the stm/ldm instructions that store/load the
 * general registers to/from a __jmp_buf: ten registers, including sp and lr.
 */
#define JMP_BUF_REGLIST {v1-v6, sl, fp, sp, lr}
    .file   "md.S"
    .text
/*
 * _st_md_cxt_save(__jmp_buf env)
 *
 * Writes the registers in JMP_BUF_REGLIST to env, followed by the VFP and
 * iWMMXt registers when the corresponding macros are defined, then returns 0.
 *   In:      r0 = env
 *   Out:     r0 = 0
 *   Scratch: ip (r12), used as the advancing write cursor
 */
    .globl  _st_md_cxt_save
    .type   _st_md_cxt_save, %function
    .align  2
_st_md_cxt_save:
    mov     ip, r0                          /* ip walks through env */

    /* General registers. */
    stmia   ip!, JMP_BUF_REGLIST

#ifdef __VFP_FP__
    /* VFP registers: this is vstmia ip!, {d8-d15} in coprocessor form. */
    stc     p11, cr8, [ip], #64
#endif

#ifdef __IWMMXT__
    /* Call-preserved iWMMXt registers: wstrd wrN, [ip], #8 for wr10-wr15. */
    stcl    p1, cr10, [ip], #8
    stcl    p1, cr11, [ip], #8
    stcl    p1, cr12, [ip], #8
    stcl    p1, cr13, [ip], #8
    stcl    p1, cr14, [ip], #8
    stcl    p1, cr15, [ip], #8
#endif

    mov     r0, #0                          /* direct call returns 0 */
    bx      lr
    .size   _st_md_cxt_save, .-_st_md_cxt_save
- /****************************************************************/
/*
 * _st_md_cxt_restore(__jmp_buf env, int val)
 *
 * Reads back what _st_md_cxt_save wrote to env (including sp and lr) and
 * returns through the reloaded lr.
 *   In:      r0 = env, r1 = val
 *   Out:     r0 = val, or 1 when val is 0
 *   Scratch: ip (r12), used as the advancing read cursor; flags
 */
    .globl  _st_md_cxt_restore
    .type   _st_md_cxt_restore, %function
    .align  2
_st_md_cxt_restore:
    mov     ip, r0                          /* ip walks through env */

    /* General registers; this also switches sp and lr. */
    ldmia   ip!, JMP_BUF_REGLIST

#ifdef __VFP_FP__
    /* VFP registers: this is vldmia ip!, {d8-d15} in coprocessor form. */
    ldc     p11, cr8, [ip], #64
#endif

#ifdef __IWMMXT__
    /* Call-preserved iWMMXt registers: wldrd wrN, [ip], #8 for wr10-wr15. */
    ldcl    p1, cr10, [ip], #8
    ldcl    p1, cr11, [ip], #8
    ldcl    p1, cr12, [ip], #8
    ldcl    p1, cr13, [ip], #8
    ldcl    p1, cr14, [ip], #8
    ldcl    p1, cr15, [ip], #8
#endif

    movs    r0, r1                          /* return value = val, sets Z if 0 */
    moveq   r0, #1                          /* the resumed save must not see 0 */
    bx      lr
    .size   _st_md_cxt_restore, .-_st_md_cxt_restore
- /****************************************************************/
- #elif defined(__riscv)
- /****************************************************************/
/*
 * Internal __jmp_buf layout: index of each register's 8-byte slot in env
 * (the code multiplies the index by 8 and addresses it relative to a0).
 * riscv-asm: https://github.com/riscv/riscv-asm-manual/blob/master/riscv-asm.md
 */
#define JB_SP    0  /* sp, stack pointer (slot 0, at the address in a0) */
#define JB_RA    1  /* ra, return address */
#define JB_FP    2  /* fp/s0, frame pointer */
#define JB_S1    3  /* s1, saved register */
#define JB_S2    4  /* s2-s11, saved registers */
#define JB_S3    5
#define JB_S4    6
#define JB_S5    7
#define JB_S6    8
#define JB_S7    9
#define JB_S8   10
#define JB_S9   11
#define JB_S10  12
#define JB_S11  13
    .file   "md_linux.S"
    .text
/*
 * _st_md_cxt_save(__jmp_buf env)
 * The env is $a0, https://en.wikipedia.org/wiki/RISC-V#Register_sets
 *
 * Stores sp, ra and s0-s11 into env with 64-bit stores and returns 0.
 *   In:  a0 = env
 *   Out: a0 = 0
 * NOTE(review): no floating-point registers are stored here; confirm that
 * is acceptable for the floating-point ABI in use.
 */
    .globl  _st_md_cxt_save
    .type   _st_md_cxt_save, %function
    .align  2
_st_md_cxt_save:
    sd      sp,  JB_SP * 8(a0)
    sd      ra,  JB_RA * 8(a0)
    sd      s0,  JB_FP * 8(a0)              /* s0 doubles as the frame pointer */
    sd      s1,  JB_S1 * 8(a0)
    sd      s2,  JB_S2 * 8(a0)
    sd      s3,  JB_S3 * 8(a0)
    sd      s4,  JB_S4 * 8(a0)
    sd      s5,  JB_S5 * 8(a0)
    sd      s6,  JB_S6 * 8(a0)
    sd      s7,  JB_S7 * 8(a0)
    sd      s8,  JB_S8 * 8(a0)
    sd      s9,  JB_S9 * 8(a0)
    sd      s10, JB_S10 * 8(a0)
    sd      s11, JB_S11 * 8(a0)
    li      a0, 0                           /* direct call returns 0 */
    ret
    .size   _st_md_cxt_save, .-_st_md_cxt_save
- /****************************************************************/
/*
 * _st_md_cxt_restore(__jmp_buf env, int val)
 *
 * Reloads sp, ra and s0-s11 from env and returns through the reloaded ra,
 * so execution continues as if the matching _st_md_cxt_save had returned.
 *   In:  a0 = env, a1 = val
 *   Out: a0 = val, or 1 when val is 0 (the resumed save never sees 0)
 */
    .globl  _st_md_cxt_restore
    .type   _st_md_cxt_restore, %function
    .align  2
_st_md_cxt_restore:
    ld      sp,  JB_SP * 8(a0)
    ld      ra,  JB_RA * 8(a0)
    ld      s0,  JB_FP * 8(a0)
    ld      s1,  JB_S1 * 8(a0)
    ld      s2,  JB_S2 * 8(a0)
    ld      s3,  JB_S3 * 8(a0)
    ld      s4,  JB_S4 * 8(a0)
    ld      s5,  JB_S5 * 8(a0)
    ld      s6,  JB_S6 * 8(a0)
    ld      s7,  JB_S7 * 8(a0)
    ld      s8,  JB_S8 * 8(a0)
    ld      s9,  JB_S9 * 8(a0)
    ld      s10, JB_S10 * 8(a0)
    ld      s11, JB_S11 * 8(a0)
    /* a0 is the env base, so it is overwritten only after the last load. */
    seqz    a0, a1                          /* a0 = (val == 0) */
    add     a0, a0, a1                      /* a0 = val ? val : 1 */
    ret
    .size   _st_md_cxt_restore, .-_st_md_cxt_restore
- /****************************************************************/
- #elif defined(__mips64)
- /****************************************************************/
/* For MIPS64, see https://s3-eu-west-1.amazonaws.com/downloads-mips/documents/MIPS_Architecture_MIPS64_InstructionSet_%20AFP_P_MD00087_06.05.pdf */
/*
 * Internal __jmp_buf layout: index of each register's 8-byte slot in env.
 * The indices match the byte offsets (index * 8) that the save/restore
 * routines in this section use: sp at 0, ra at 8, gp at 16, s0-s7 at
 * 24..80 and fp at 88.
 */
#define JB_SP    0  /* Stack pointer */
#define JB_RA    1  /* Return address */
#define JB_GP    2  /* Global pointer */
#define JB_S0    3  /* S0-S7, Saved temporaries */
#define JB_S1    4
#define JB_S2    5
#define JB_S3    6
#define JB_S4    7
#define JB_S5    8
#define JB_S6    9
#define JB_S7   10
#define JB_FP   11  /* FP/S8 Frame pointer */
    .file   "md_linux.S"
    .text
/*
 * _st_md_cxt_save(__jmp_buf env)
 * The env is $a0, https://en.wikipedia.org/wiki/MIPS_architecture#Calling_conventions
 *
 * Stores sp, ra, gp, s0-s7 and fp into env[0..11] as 64-bit values and
 * returns 0.
 *   In:  $a0 = env
 *   Out: $v0 = 0
 * NOTE(review): relies on the assembler filling the jr delay slot; no
 * ".set noreorder" is visible in this file.
 */
    .globl  _st_md_cxt_save
    .type   _st_md_cxt_save, %function
    .align  2
_st_md_cxt_save:
    sd      $sp,  0($a0)                    /* env[0]  = sp */
    /* ra is the return address, see https://chortle.ccsu.edu/AssemblyTutorial/Chapter-26/ass26_4.html */
    sd      $ra,  8($a0)                    /* env[1]  = ra */
    sd      $gp, 16($a0)                    /* env[2]  = gp */
    sd      $s0, 24($a0)                    /* env[3]  = s0 */
    sd      $s1, 32($a0)                    /* env[4]  = s1 */
    sd      $s2, 40($a0)                    /* env[5]  = s2 */
    sd      $s3, 48($a0)                    /* env[6]  = s3 */
    sd      $s4, 56($a0)                    /* env[7]  = s4 */
    sd      $s5, 64($a0)                    /* env[8]  = s5 */
    sd      $s6, 72($a0)                    /* env[9]  = s6 */
    sd      $s7, 80($a0)                    /* env[10] = s7 */
    sd      $fp, 88($a0)                    /* env[11] = fp */
    li      $v0, 0                          /* direct call returns 0 */
    jr      $ra
    .size   _st_md_cxt_save, .-_st_md_cxt_save
- /****************************************************************/
/*
 * _st_md_cxt_restore(__jmp_buf env, int val)
 *
 * Reloads sp, ra, gp, s0-s7 and fp from env[0..11] and returns through the
 * reloaded ra, so execution continues as if the matching _st_md_cxt_save
 * had returned.
 *   In:  $a0 = env, $a1 = val
 *   Out: $v0 = val, or 1 when val is 0 (the resumed save never sees 0)
 * NOTE(review): relies on the assembler filling the jr delay slot; no
 * ".set noreorder" is visible in this file.
 */
    .globl  _st_md_cxt_restore
    .type   _st_md_cxt_restore, %function
    .align  2
_st_md_cxt_restore:
    ld      $sp,  0($a0)                    /* sp = env[0] */
    ld      $ra,  8($a0)                    /* ra = env[1], the saved return address */
    ld      $gp, 16($a0)                    /* gp = env[2] */
    ld      $s0, 24($a0)                    /* s0 = env[3] */
    ld      $s1, 32($a0)                    /* s1 = env[4] */
    ld      $s2, 40($a0)                    /* s2 = env[5] */
    ld      $s3, 48($a0)                    /* s3 = env[6] */
    ld      $s4, 56($a0)                    /* s4 = env[7] */
    ld      $s5, 64($a0)                    /* s5 = env[8] */
    ld      $s6, 72($a0)                    /* s6 = env[9] */
    ld      $s7, 80($a0)                    /* s7 = env[10] */
    ld      $fp, 88($a0)                    /* fp = env[11] */
    sltiu   $v0, $a1, 1                     /* v0 = (val == 0) */
    daddu   $v0, $v0, $a1                   /* v0 = val ? val : 1 */
    jr      $ra                             /* return to the saved return address */
    .size   _st_md_cxt_restore, .-_st_md_cxt_restore
- /****************************************************************/
- #elif defined(__mips__)
- /****************************************************************/
/* For MIPS32, see https://s3-eu-west-1.amazonaws.com/downloads-mips/documents/MD00565-2B-MIPS32-QRC-01.01.pdf */
/*
 * Internal __jmp_buf layout: index of each register's 4-byte slot in env.
 * The indices match the byte offsets (index * 4) that the save/restore
 * routines in this section use: sp at 0, ra at 4, gp at 8, s0-s7 at
 * 12..40 and fp at 44.
 */
#define JB_SP    0  /* Stack pointer */
#define JB_RA    1  /* Return address */
#define JB_GP    2  /* Global pointer */
#define JB_S0    3  /* S0-S7, Saved temporaries */
#define JB_S1    4
#define JB_S2    5
#define JB_S3    6
#define JB_S4    7
#define JB_S5    8
#define JB_S6    9
#define JB_S7   10
#define JB_FP   11  /* FP/S8 Frame pointer */
    .file   "md_linux.S"
    .text
/*
 * _st_md_cxt_save(__jmp_buf env)
 * The env is $a0, https://en.wikipedia.org/wiki/MIPS_architecture#Calling_conventions
 *
 * Stores sp, ra, gp, s0-s7 and fp into env[0..11] as 32-bit words and
 * returns 0.
 *   In:  $a0 = env
 *   Out: $v0 = 0
 * NOTE(review): relies on the assembler filling the jr delay slot; no
 * ".set noreorder" is visible in this file.
 */
    .globl  _st_md_cxt_save
    .type   _st_md_cxt_save, %function
    .align  2
_st_md_cxt_save:
    sw      $sp,  0($a0)                    /* env[0]  = sp */
    /* ra is the return address, see https://chortle.ccsu.edu/AssemblyTutorial/Chapter-26/ass26_4.html */
    sw      $ra,  4($a0)                    /* env[1]  = ra */
    sw      $gp,  8($a0)                    /* env[2]  = gp */
    sw      $s0, 12($a0)                    /* env[3]  = s0 */
    sw      $s1, 16($a0)                    /* env[4]  = s1 */
    sw      $s2, 20($a0)                    /* env[5]  = s2 */
    sw      $s3, 24($a0)                    /* env[6]  = s3 */
    sw      $s4, 28($a0)                    /* env[7]  = s4 */
    sw      $s5, 32($a0)                    /* env[8]  = s5 */
    sw      $s6, 36($a0)                    /* env[9]  = s6 */
    sw      $s7, 40($a0)                    /* env[10] = s7 */
    sw      $fp, 44($a0)                    /* env[11] = fp */
    li      $v0, 0                          /* direct call returns 0 */
    jr      $ra
    .size   _st_md_cxt_save, .-_st_md_cxt_save
- /****************************************************************/
/*
 * _st_md_cxt_restore(__jmp_buf env, int val)
 *
 * Reloads sp, ra, gp, s0-s7 and fp from env[0..11] and returns through the
 * reloaded ra, so execution continues as if the matching _st_md_cxt_save
 * had returned.
 *   In:  $a0 = env, $a1 = val
 *   Out: $v0 = val, or 1 when val is 0 (the resumed save never sees 0)
 * NOTE(review): relies on the assembler filling the jr delay slot; no
 * ".set noreorder" is visible in this file.
 */
    .globl  _st_md_cxt_restore
    .type   _st_md_cxt_restore, %function
    .align  2
_st_md_cxt_restore:
    lw      $sp,  0($a0)                    /* sp = env[0] */
    lw      $ra,  4($a0)                    /* ra = env[1], the saved return address */
    lw      $gp,  8($a0)                    /* gp = env[2] */
    lw      $s0, 12($a0)                    /* s0 = env[3] */
    lw      $s1, 16($a0)                    /* s1 = env[4] */
    lw      $s2, 20($a0)                    /* s2 = env[5] */
    lw      $s3, 24($a0)                    /* s3 = env[6] */
    lw      $s4, 28($a0)                    /* s4 = env[7] */
    lw      $s5, 32($a0)                    /* s5 = env[8] */
    lw      $s6, 36($a0)                    /* s6 = env[9] */
    lw      $s7, 40($a0)                    /* s7 = env[10] */
    lw      $fp, 44($a0)                    /* fp = env[11] */
    sltiu   $v0, $a1, 1                     /* v0 = (val == 0) */
    addu    $v0, $v0, $a1                   /* v0 = val ? val : 1 */
    jr      $ra                             /* return to the saved return address */
    .size   _st_md_cxt_restore, .-_st_md_cxt_restore
- /****************************************************************/
- #elif defined(__loongarch64)
- /****************************************************************/
/*
 * Internal __jmp_buf layout: index of each register's 8-byte slot in env.
 * The save/restore routines in this section use the matching byte offsets
 * (index * 8) directly.
 */
#define JB_SP    0  /* R3, SP, stack pointer */
#define JB_RA    1  /* R1, RA, return address */
#define JB_FP    2  /* R22, FP, frame pointer */
#define JB_S0    3  /* R23-R31 are S0-S8, subroutine register variables */
#define JB_S1    4
#define JB_S2    5
#define JB_S3    6
#define JB_S4    7
#define JB_S5    8
#define JB_S6    9
#define JB_S7   10
#define JB_S8   11
    .file   "md_linux.S"
    .text
/*
 * _st_md_cxt_save(__jmp_buf env)
 * The env is $r4, https://github.com/ossrs/state-threads/issues/24#porting
 *
 * Stores sp ($r3), ra ($r1), fp ($r22) and $r23-$r31 into env[0..11] as
 * 64-bit values and returns 0.
 *   In:      $r4 = env
 *   Out:     $r4 = 0
 *   Scratch: $r12
 * NOTE(review): no floating-point registers are stored here; confirm that
 * is acceptable for the floating-point ABI in use.
 */
    .globl  _st_md_cxt_save
    .type   _st_md_cxt_save, %function
    .align  2
_st_md_cxt_save:
    st.d    $r3,  $r4, 0                    /* env[0]  = sp */
    st.d    $r1,  $r4, 8                    /* env[1]  = ra */
    st.d    $r22, $r4, 16                   /* env[2]  = fp */
    st.d    $r23, $r4, 24                   /* env[3]  = r23 */
    st.d    $r24, $r4, 32                   /* env[4]  = r24 */
    st.d    $r25, $r4, 40                   /* env[5]  = r25 */
    st.d    $r26, $r4, 48                   /* env[6]  = r26 */
    st.d    $r27, $r4, 56                   /* env[7]  = r27 */
    st.d    $r28, $r4, 64                   /* env[8]  = r28 */
    st.d    $r29, $r4, 72                   /* env[9]  = r29 */
    st.d    $r30, $r4, 80                   /* env[10] = r30 */
    st.d    $r31, $r4, 88                   /* env[11] = r31 */
    addi.w  $r12, $r0, 0                    /* r12 = 0 */
    move    $r4, $r12                       /* direct call returns 0 */
    jirl    $r0, $r1, 0                     /* return via ra */
    .size   _st_md_cxt_save, .-_st_md_cxt_save
- /****************************************************************/
/*
 * _st_md_cxt_restore(__jmp_buf env, int val)
 *
 * Reloads sp ($r3), ra ($r1), fp ($r22) and $r23-$r31 from env[0..11] and
 * returns through the reloaded ra, so execution continues as if the
 * matching _st_md_cxt_save had returned.
 *   In:      $r4 = env, $r5 = val
 *   Out:     $r4 = val, or 1 when val is 0 (the resumed save never sees 0)
 *   Scratch: $r12
 */
    .globl  _st_md_cxt_restore
    .type   _st_md_cxt_restore, %function
    .align  2
_st_md_cxt_restore:
    ld.d    $r3,  $r4, 0                    /* sp  = env[0] */
    ld.d    $r1,  $r4, 8                    /* ra  = env[1] */
    ld.d    $r22, $r4, 16                   /* fp  = env[2] */
    ld.d    $r23, $r4, 24                   /* r23 = env[3] */
    ld.d    $r24, $r4, 32                   /* r24 = env[4] */
    ld.d    $r25, $r4, 40                   /* r25 = env[5] */
    ld.d    $r26, $r4, 48                   /* r26 = env[6] */
    ld.d    $r27, $r4, 56                   /* r27 = env[7] */
    ld.d    $r28, $r4, 64                   /* r28 = env[8] */
    ld.d    $r29, $r4, 72                   /* r29 = env[9] */
    ld.d    $r30, $r4, 80                   /* r30 = env[10] */
    ld.d    $r31, $r4, 88                   /* r31 = env[11] */
    /* $r4 is the env base, so it is overwritten only after the last load. */
    sltui   $r12, $r5, 1                    /* r12 = (val == 0) */
    add.w   $r4, $r12, $r5                  /* r4  = val ? val : 1 */
    jirl    $r0, $r1, 0                     /* return to the saved return address */
    .size   _st_md_cxt_restore, .-_st_md_cxt_restore
- /****************************************************************/
- #endif
- #endif
|