| ;***************************************************************************** |
| ;* Assembly testing and benchmarking tool |
| ;* Copyright (c) 2008 Loren Merritt |
| ;* Copyright (c) 2012 Henrik Gramner |
| ;* |
| ;* This file is part of FFmpeg. |
| ;* |
| ;* FFmpeg is free software; you can redistribute it and/or modify |
| ;* it under the terms of the GNU General Public License as published by |
| ;* the Free Software Foundation; either version 2 of the License, or |
| ;* (at your option) any later version. |
| ;* |
| ;* FFmpeg is distributed in the hope that it will be useful, |
| ;* but WITHOUT ANY WARRANTY; without even the implied warranty of |
| ;* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| ;* GNU General Public License for more details. |
| ;* |
| ;* You should have received a copy of the GNU General Public License |
| ;* along with this program; if not, write to the Free Software |
| ;* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02111, USA. |
| ;***************************************************************************** |
| |
| %define private_prefix checkasm |
| %include "libavutil/x86/x86inc.asm" |
| |
| SECTION_RODATA |
| |
| error_message: db "failed to preserve register", 0 |
| error_message_emms: db "failed to issue emms", 0 |
| |
| %if ARCH_X86_64 |
| ; just random numbers to reduce the chance of incidental match |
| ALIGN 16 |
| x6: dq 0x1a1b2550a612b48c,0x79445c159ce79064 |
| x7: dq 0x2eed899d5a28ddcd,0x86b2536fcd8cf636 |
| x8: dq 0xb0856806085e7943,0x3f2bf84fc0fcca4e |
| x9: dq 0xacbd382dcf5b8de2,0xd229e1f5b281303f |
| x10: dq 0x71aeaff20b095fd9,0xab63e2e11fa38ed9 |
| x11: dq 0x89b0c0765892729a,0x77d410d5c42c882d |
| x12: dq 0xc45ea11a955d8dd5,0x24b3c1d2a024048b |
| x13: dq 0x2e8ec680de14b47c,0xdd7b8919edd42786 |
| x14: dq 0x135ce6888fa02cbf,0x11e53e2b2ac655ef |
| x15: dq 0x011ff554472a7a10,0x6de8f4c914c334d5 |
| n7: dq 0x21f86d66c8ca00ce |
| n8: dq 0x75b6ba21077c48ad |
| n9: dq 0xed56bb2dcb3c7736 |
| n10: dq 0x8bda43d3fd1a7e06 |
| n11: dq 0xb64a9c9e5d318408 |
| n12: dq 0xdf9a54b303f1d3a3 |
| n13: dq 0x4a75479abd64e097 |
| n14: dq 0x249214109d5d1c88 |
| %endif |
| |
| SECTION .text |
| |
| cextern fail_func |
| |
| ; max number of args used by any asm function. |
| ; (max_args % 4) must equal 3 for stack alignment |
| %define max_args 15 |
| |
| %if ARCH_X86_64 |
| |
| ;----------------------------------------------------------------------------- |
| ; int checkasm_stack_clobber(uint64_t clobber, ...) |
| ;----------------------------------------------------------------------------- |
| cglobal stack_clobber, 1,2 |
| ; Clobber the stack with junk below the stack pointer |
| %define argsize (max_args+6)*8 |
| SUB rsp, argsize |
| mov r1, argsize-8 |
| .loop: |
| mov [rsp+r1], r0 |
| sub r1, 8 |
| jge .loop |
| ADD rsp, argsize |
| RET |
| |
| %if WIN64 |
| %assign free_regs 7 |
| DECLARE_REG_TMP 4 |
| %else |
| %assign free_regs 9 |
| DECLARE_REG_TMP 7 |
| %endif |
| |
| %macro report_fail 1 |
| mov r9, rax |
| mov r10, rdx |
| lea r0, [%1] |
| xor eax, eax |
| call fail_func |
| mov rdx, r10 |
| mov rax, r9 |
| %endmacro |
| |
| ;----------------------------------------------------------------------------- |
| ; void checkasm_checked_call(void *func, ...) |
| ;----------------------------------------------------------------------------- |
| INIT_XMM |
| %macro CHECKED_CALL 0-1 |
| cglobal checked_call%1, 2,15,16,max_args*8+8 |
| mov t0, r0 |
| |
| ; All arguments have been pushed on the stack instead of registers in order to |
| ; test for incorrect assumptions that 32-bit ints are zero-extended to 64-bit. |
| mov r0, r6mp |
| mov r1, r7mp |
| mov r2, r8mp |
| mov r3, r9mp |
| %if UNIX64 |
| mov r4, r10mp |
| mov r5, r11mp |
| %assign i 6 |
| %rep max_args-6 |
| mov r9, [rsp+stack_offset+(i+1)*8] |
| mov [rsp+(i-6)*8], r9 |
| %assign i i+1 |
| %endrep |
| %else ; WIN64 |
| %assign i 4 |
| %rep max_args-4 |
| mov r9, [rsp+stack_offset+(i+7)*8] |
| mov [rsp+i*8], r9 |
| %assign i i+1 |
| %endrep |
| |
| ; Move possible floating-point arguments to the correct registers |
| movq m0, r0 |
| movq m1, r1 |
| movq m2, r2 |
| movq m3, r3 |
| |
| %assign i 6 |
| %rep 16-6 |
| mova m %+ i, [x %+ i] |
| %assign i i+1 |
| %endrep |
| %endif |
| |
| %assign i 14 |
| %rep 15-free_regs |
| mov r %+ i, [n %+ i] |
| %assign i i-1 |
| %endrep |
| call t0 |
| %assign i 14 |
| %rep 15-free_regs |
| xor r %+ i, [n %+ i] |
| or r14, r %+ i |
| %assign i i-1 |
| %endrep |
| |
| %if WIN64 |
| %assign i 6 |
| %rep 16-6 |
| pxor m %+ i, [x %+ i] |
| por m6, m %+ i |
| %assign i i+1 |
| %endrep |
| packsswb m6, m6 |
| movq r5, m6 |
| or r14, r5 |
| %endif |
| |
| ; Call fail_func() with a descriptive message to mark it as a failure |
| ; if the called function didn't preserve all callee-saved registers. |
| ; Save the return value located in rdx:rax first to prevent clobbering. |
| jz .clobber_ok |
| report_fail error_message |
| .clobber_ok: |
| %ifnid %1, _emms |
| fstenv [rsp] |
| cmp word [rsp + 8], 0xffff |
| je .emms_ok |
| report_fail error_message_emms |
| emms |
| .emms_ok: |
| %else |
| emms |
| %endif |
| RET |
| %endmacro |
| |
| %else |
| |
| ; just random numbers to reduce the chance of incidental match |
| %define n3 dword 0x6549315c |
| %define n4 dword 0xe02f3e23 |
| %define n5 dword 0xb78d0d1d |
| %define n6 dword 0x33627ba7 |
| |
| %macro report_fail 1 |
| mov r3, eax |
| mov r4, edx |
| lea r0, [%1] |
| mov [esp], r0 |
| call fail_func |
| mov edx, r4 |
| mov eax, r3 |
| %endmacro |
| |
| %macro CHECKED_CALL 0-1 |
| ;----------------------------------------------------------------------------- |
| ; void checkasm_checked_call(void *func, ...) |
| ;----------------------------------------------------------------------------- |
| cglobal checked_call%1, 1,7 |
| mov r3, n3 |
| mov r4, n4 |
| mov r5, n5 |
| mov r6, n6 |
| %rep max_args |
| PUSH dword [esp+20+max_args*4] |
| %endrep |
| call r0 |
| xor r3, n3 |
| xor r4, n4 |
| xor r5, n5 |
| xor r6, n6 |
| or r3, r4 |
| or r5, r6 |
| or r3, r5 |
| jz .clobber_ok |
| report_fail error_message |
| .clobber_ok: |
| %ifnid %1, _emms |
| fstenv [esp] |
| cmp word [esp + 8], 0xffff |
| je .emms_ok |
| report_fail error_message_emms |
| emms |
| .emms_ok: |
| %else |
| emms |
| %endif |
| add esp, max_args*4 |
| REP_RET |
| %endmacro |
| |
| %endif ; ARCH_X86_64 |
| |
| CHECKED_CALL |
| CHECKED_CALL _emms |