mirror of https://github.com/FFmpeg/FFmpeg.git
197 lines
6.0 KiB
197 lines
6.0 KiB
/**************************************************************************** |
|
* Assembly testing and benchmarking tool |
|
* Copyright (c) 2015 Martin Storsjo |
|
* Copyright (c) 2015 Janne Grunau |
|
* |
|
* This file is part of FFmpeg. |
|
* |
|
* FFmpeg is free software; you can redistribute it and/or modify |
|
* it under the terms of the GNU General Public License as published by |
|
* the Free Software Foundation; either version 2 of the License, or |
|
* (at your option) any later version. |
|
* |
|
* FFmpeg is distributed in the hope that it will be useful, |
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
|
* GNU General Public License for more details. |
|
* |
|
* You should have received a copy of the GNU General Public License |
|
* along with this program; if not, write to the Free Software |
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02111, USA. |
|
*****************************************************************************/ |
|
|
|
#include "libavutil/arm/asm.S" |
|
|
|
/* override fpu so that NEON instructions are rejected */ |
|
#if HAVE_VFP |
|
FPU .fpu vfp |
|
ELF .eabi_attribute 10, 0 @ suppress Tag_FP_arch |
|
#endif |
|
|
|
const register_init, align=3 |
|
.quad 0x21f86d66c8ca00ce |
|
.quad 0x75b6ba21077c48ad |
|
.quad 0xed56bb2dcb3c7736 |
|
.quad 0x8bda43d3fd1a7e06 |
|
.quad 0xb64a9c9e5d318408 |
|
.quad 0xdf9a54b303f1d3a3 |
|
.quad 0x4a75479abd64e097 |
|
.quad 0x249214109d5d1c88 |
|
endconst |
|
|
|
const error_message_fpscr |
|
.asciz "failed to preserve register FPSCR, changed bits: %x" |
|
error_message_gpr: |
|
.asciz "failed to preserve register r%d" |
|
error_message_vfp: |
|
.asciz "failed to preserve register d%d" |
|
error_message_stack: |
|
.asciz "failed to preserve stack" |
|
endconst |
|
|
|
@ max number of args used by any asm function. |
|
#define MAX_ARGS 15 |
|
|
|
#define ARG_STACK 4*(MAX_ARGS - 4) |
|
|
|
@ Align the used stack space to 8 to preserve the stack alignment. |
|
@ +8 for stack canary reference. |
|
#define ARG_STACK_A (((ARG_STACK + pushed + 7) & ~7) - pushed + 8) |
|
|
|
.macro clobbercheck variant |
|
.equ pushed, 4*9 |
|
function checkasm_checked_call_\variant, export=1 |
|
push {r4-r11, lr} |
|
.ifc \variant, vfp |
|
vpush {d8-d15} |
|
fmrx r4, FPSCR |
|
push {r4} |
|
.equ pushed, pushed + 16*4 + 4 |
|
.endif |
|
|
|
movrel r12, register_init |
|
.ifc \variant, vfp |
|
vldm r12, {d8-d15} |
|
.endif |
|
ldm r12, {r4-r11} |
|
|
|
sub sp, sp, #ARG_STACK_A |
|
.equ pos, 0 |
|
.rept MAX_ARGS-4 |
|
ldr r12, [sp, #ARG_STACK_A + pushed + 8 + pos] |
|
str r12, [sp, #pos] |
|
.equ pos, pos + 4 |
|
.endr |
|
|
|
@ For stack overflows, the callee is free to overwrite the parameters |
|
@ that were passed on the stack (if any), so we can only check after |
|
@ that point. First figure out how many parameters the function |
|
@ really took on the stack: |
|
ldr r12, [sp, #ARG_STACK_A + pushed + 8 + 4*(MAX_ARGS-4)] |
|
@ Load the first non-parameter value from the stack, that should be |
|
@ left untouched by the function. Store a copy of it inverted, so that |
|
@ e.g. overwriting everything with zero would be noticed. |
|
ldr r12, [sp, r12, lsl #2] |
|
mvn r12, r12 |
|
str r12, [sp, #ARG_STACK_A - 4] |
|
|
|
mov r12, r0 |
|
mov r0, r2 |
|
mov r1, r3 |
|
ldrd r2, r3, [sp, #ARG_STACK_A + pushed] |
|
@ Call the target function |
|
blx r12 |
|
|
|
@ Load the number of stack parameters, stack canary and its reference |
|
ldr r12, [sp, #ARG_STACK_A + pushed + 8 + 4*(MAX_ARGS-4)] |
|
ldr r2, [sp, r12, lsl #2] |
|
ldr r3, [sp, #ARG_STACK_A - 4] |
|
|
|
add sp, sp, #ARG_STACK_A |
|
push {r0, r1} |
|
|
|
mvn r3, r3 |
|
cmp r2, r3 |
|
bne 5f |
|
|
|
movrel r12, register_init |
|
.ifc \variant, vfp |
|
.macro check_reg_vfp, dreg, offset |
|
ldrd r2, r3, [r12, #8 * (\offset)] |
|
vmov r0, lr, \dreg |
|
eor r2, r2, r0 |
|
eor r3, r3, lr |
|
orrs r2, r2, r3 |
|
bne 4f |
|
.endm |
|
|
|
.irp n, 8, 9, 10, 11, 12, 13, 14, 15 |
|
@ keep track of the checked double/SIMD register |
|
mov r1, #\n |
|
check_reg_vfp d\n, \n-8 |
|
.endr |
|
.purgem check_reg_vfp |
|
|
|
fmrx r1, FPSCR |
|
ldr r3, [sp, #8] |
|
eor r1, r1, r3 |
|
@ Ignore changes in bits 0-4 and 7 |
|
bic r1, r1, #0x9f |
|
@ Ignore changes in the topmost 5 bits |
|
bics r1, r1, #0xf8000000 |
|
bne 3f |
|
.endif |
|
|
|
@ keep track of the checked GPR |
|
mov r1, #4 |
|
.macro check_reg reg1, reg2= |
|
ldrd r2, r3, [r12], #8 |
|
eors r2, r2, \reg1 |
|
bne 2f |
|
add r1, r1, #1 |
|
.ifnb \reg2 |
|
eors r3, r3, \reg2 |
|
bne 2f |
|
.endif |
|
add r1, r1, #1 |
|
.endm |
|
check_reg r4, r5 |
|
check_reg r6, r7 |
|
@ r9 is a volatile register in the ios ABI |
|
#ifdef __APPLE__ |
|
check_reg r8 |
|
#else |
|
check_reg r8, r9 |
|
#endif |
|
check_reg r10, r11 |
|
.purgem check_reg |
|
|
|
b 0f |
|
5: |
|
movrel r0, error_message_stack |
|
b 1f |
|
4: |
|
movrel r0, error_message_vfp |
|
b 1f |
|
3: |
|
movrel r0, error_message_fpscr |
|
b 1f |
|
2: |
|
movrel r0, error_message_gpr |
|
1: |
|
bl X(checkasm_fail_func) |
|
0: |
|
pop {r0, r1} |
|
.ifc \variant, vfp |
|
pop {r2} |
|
fmxr FPSCR, r2 |
|
vpop {d8-d15} |
|
.endif |
|
pop {r4-r11, pc} |
|
endfunc |
|
.endm |
|
|
|
#if HAVE_VFP || HAVE_NEON |
|
clobbercheck vfp |
|
#endif |
|
clobbercheck novfp
|
|
|