123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197 |
- /****************************************************************************
- * Assembly testing and benchmarking tool
- * Copyright (c) 2015 Martin Storsjo
- * Copyright (c) 2015 Janne Grunau
- *
- * This file is part of FFmpeg.
- *
- * FFmpeg is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 2 of the License, or
- * (at your option) any later version.
- *
- * FFmpeg is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this program; if not, write to the Free Software
- * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02111, USA.
- *****************************************************************************/
- #include "libavutil/arm/asm.S"
- /* Override the FPU selection so that NEON instructions are rejected by the
- * assembler in this file. Only done when HAVE_VFP is set. The FPU and ELF
- * line prefixes come from the included asm.S; presumably they emit the
- * directive only where the toolchain/object format supports it (TODO confirm). */
- #if HAVE_VFP
- FPU .fpu vfp
- ELF .eabi_attribute 10, 0 @ suppress Tag_FP_arch
- #endif
- @ Reference bit patterns for the callee-saved registers: 8 x 64 bits.
- @ checkasm_checked_call_* loads all 64 bytes into d8-d15 (vfp variant only)
- @ and the first 32 bytes into r4-r11 before calling the function under test,
- @ then compares the registers against this same table after the call.
- const register_init, align=3
- .quad 0x21f86d66c8ca00ce, 0x75b6ba21077c48ad @ d8, d9 / r4-r7
- .quad 0xed56bb2dcb3c7736, 0x8bda43d3fd1a7e06 @ d10, d11 / r8-r11
- .quad 0xb64a9c9e5d318408, 0xdf9a54b303f1d3a3 @ d12, d13
- .quad 0x4a75479abd64e097, 0x249214109d5d1c88 @ d14, d15
- endconst
- @ NUL-terminated format strings handed to checkasm_fail_func in r0 when one
- @ of the checks in checkasm_checked_call_* fails. For the messages with a
- @ conversion, the value to print is left in r1 by the failing check: the
- @ changed FPSCR bits for %x, the register number for %d.
- const error_message_fpscr
- .asciz "failed to preserve register FPSCR, changed bits: %x"
- error_message_gpr:
- .asciz "failed to preserve register r%d"
- error_message_vfp:
- .asciz "failed to preserve register d%d"
- error_message_stack:
- .asciz "failed to preserve stack"
- endconst
- @ Maximum number of arguments taken by any asm function under test.
- #define MAX_ARGS 15
- @ Bytes of stack arguments copied for the callee: one 32-bit word for every
- @ argument beyond the four that are passed in r0-r3. Parenthesized so that
- @ the expansion cannot mis-bind inside a larger expression.
- #define ARG_STACK (4*(MAX_ARGS - 4))
- @ Stack space reserved below the saved registers. The argument area is
- @ rounded up so that it plus the bytes already pushed is a multiple of 8,
- @ which preserves the stack alignment.
- @ +8 for stack canary reference (stored in the topmost word of the area).
- #define ARG_STACK_A (((ARG_STACK + pushed + 7) & ~7) - pushed + 8)
- @ clobbercheck variant
- @
- @ Emits the exported function checkasm_checked_call_<variant>: a trampoline
- @ that calls an asm function and verifies that it preserved the callee-saved
- @ state. With variant = vfp, d8-d15 and FPSCR are checked in addition to
- @ r4-r11 and the stack canary; any other variant checks GPRs and stack only.
- @
- @ Inputs of the generated function, as read by the code below:
- @   r0      address of the function under test
- @   r1      ignored (overwritten without being read)
- @   r2, r3  first two arguments for the function under test
- @   stack   the next two arguments (8 bytes), then the remaining stack
- @           arguments, then one word giving the number of parameters the
- @           function really takes on the stack
- @ The r0/r1 returned by the function under test are passed through.
- @ On a failed check checkasm_fail_func is called with the message in r0 and,
- @ for register checks, the register number or the changed FPSCR bits in r1.
- .macro clobbercheck variant
- @ Bytes pushed by the prologue so far: r4-r11 and lr.
- .equ pushed, 4*9
- function checkasm_checked_call_\variant, export=1
- push {r4-r11, lr}
- .ifc \variant, vfp
- @ Also save d8-d15 and the FPSCR value seen on entry.
- vpush {d8-d15}
- fmrx r4, FPSCR
- push {r4}
- .equ pushed, pushed + 16*4 + 4
- .endif
- @ Fill the callee-saved registers with the reference pattern.
- movrel r12, register_init
- .ifc \variant, vfp
- vldm r12, {d8-d15}
- .endif
- ldm r12, {r4-r11}
- @ Reserve the outgoing argument area and copy the stack arguments into it.
- @ The first 8 bytes of the incoming stack area are skipped here since they
- @ are loaded into r2/r3 further down.
- sub sp, sp, #ARG_STACK_A
- .equ pos, 0
- .rept MAX_ARGS-4
- ldr r12, [sp, #ARG_STACK_A + pushed + 8 + pos]
- str r12, [sp, #pos]
- .equ pos, pos + 4
- .endr
- @ For stack overflows, the callee is free to overwrite the parameters
- @ that were passed on the stack (if any), so we can only check after
- @ that point. First figure out how many parameters the function
- @ really took on the stack:
- ldr r12, [sp, #ARG_STACK_A + pushed + 8 + 4*(MAX_ARGS-4)]
- @ Load the first non-parameter value from the stack, that should be
- @ left untouched by the function. Store a copy of it inverted, so that
- @ e.g. overwriting everything with zero would be noticed.
- ldr r12, [sp, r12, lsl #2]
- mvn r12, r12
- str r12, [sp, #ARG_STACK_A - 4]
- @ Shift everything into place: target address to r12, arguments to r0-r3.
- mov r12, r0
- mov r0, r2
- mov r1, r3
- ldrd r2, r3, [sp, #ARG_STACK_A + pushed]
- @ Call the target function
- blx r12
- @ Load the number of stack parameters, stack canary and its reference
- ldr r12, [sp, #ARG_STACK_A + pushed + 8 + 4*(MAX_ARGS-4)]
- ldr r2, [sp, r12, lsl #2]
- ldr r3, [sp, #ARG_STACK_A - 4]
- add sp, sp, #ARG_STACK_A
- @ Keep the return value safe while r0-r3 and lr are used as scratch.
- push {r0, r1}
- @ Undo the inversion of the reference and compare it with the canary.
- mvn r3, r3
- cmp r2, r3
- bne 5f
- movrel r12, register_init
- .ifc \variant, vfp
- @ Compare one d register against the reference quad at the given index.
- @ Clobbers r0, r2, r3 and lr. Branches to 4 on mismatch.
- .macro check_reg_vfp, dreg, offset
- ldrd r2, r3, [r12, #8 * (\offset)]
- vmov r0, lr, \dreg
- eor r2, r2, r0
- eor r3, r3, lr
- orrs r2, r2, r3
- bne 4f
- .endm
- .irp n, 8, 9, 10, 11, 12, 13, 14, 15
- @ keep track of the checked double/SIMD register
- mov r1, #\n
- check_reg_vfp d\n, \n-8
- .endr
- .purgem check_reg_vfp
- @ Compare FPSCR with the value saved on entry, which sits just above the
- @ two words pushed for the return value. r1 ends up holding changed bits.
- fmrx r1, FPSCR
- ldr r3, [sp, #8]
- eor r1, r1, r3
- @ Ignore changes in bits 0-4 and 7
- bic r1, r1, #0x9f
- @ Ignore changes in the topmost 5 bits
- bics r1, r1, #0xf8000000
- bne 3f
- .endif
- @ keep track of the checked GPR
- mov r1, #4
- @ Compare one or two GPRs against the next two reference words, advancing
- @ r12 by 8. r1 is bumped once per register slot, also when reg2 is left
- @ blank, so that it keeps matching the register number being checked.
- .macro check_reg reg1, reg2=
- ldrd r2, r3, [r12], #8
- eors r2, r2, \reg1
- bne 2f
- add r1, r1, #1
- .ifnb \reg2
- eors r3, r3, \reg2
- bne 2f
- .endif
- add r1, r1, #1
- .endm
- check_reg r4, r5
- check_reg r6, r7
- @ r9 is a volatile register in the ios ABI
- #ifdef __APPLE__
- check_reg r8
- #else
- check_reg r8, r9
- #endif
- check_reg r10, r11
- .purgem check_reg
- @ All checks passed, skip the failure reporting.
- b 0f
- 5:
- movrel r0, error_message_stack
- b 1f
- 4:
- movrel r0, error_message_vfp
- b 1f
- 3:
- movrel r0, error_message_fpscr
- b 1f
- 2:
- movrel r0, error_message_gpr
- 1:
- @ The stack has to be 8-byte aligned when calling into C. At this point
- @ pushed + 8 bytes are on the stack, which is a multiple of 8 only in the
- @ vfp variant (104 + 8), not otherwise (36 + 8), so pad by one word there.
- .ifnc \variant, vfp
- sub sp, sp, #4
- .endif
- bl X(checkasm_fail_func)
- .ifnc \variant, vfp
- add sp, sp, #4
- .endif
- 0:
- @ Restore the return value of the function under test.
- pop {r0, r1}
- .ifc \variant, vfp
- @ Restore the FPSCR value seen on entry and the caller d8-d15.
- pop {r2}
- fmxr FPSCR, r2
- vpop {d8-d15}
- .endif
- pop {r4-r11, pc}
- endfunc
- .endm
- @ Instantiate the checkers: checkasm_checked_call_vfp only when VFP or NEON
- @ support is configured, checkasm_checked_call_novfp unconditionally.
- #if HAVE_VFP || HAVE_NEON
- clobbercheck vfp
- #endif
- clobbercheck novfp
|