forked from mirror/libbpg
198 lines
4.6 KiB
NASM
198 lines
4.6 KiB
NASM
|
;*****************************************************************************
|
||
|
;* cpu-a.asm: x86 cpu utilities
|
||
|
;*****************************************************************************
|
||
|
;* Copyright (C) 2003-2013 x264 project
|
||
|
;*
|
||
|
;* Authors: Laurent Aimar <fenrir@via.ecp.fr>
|
||
|
;* Loren Merritt <lorenm@u.washington.edu>
|
||
|
;* Fiona Glaser <fiona@x264.com>
|
||
|
;*
|
||
|
;* This program is free software; you can redistribute it and/or modify
|
||
|
;* it under the terms of the GNU General Public License as published by
|
||
|
;* the Free Software Foundation; either version 2 of the License, or
|
||
|
;* (at your option) any later version.
|
||
|
;*
|
||
|
;* This program is distributed in the hope that it will be useful,
|
||
|
;* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
;* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
|
;* GNU General Public License for more details.
|
||
|
;*
|
||
|
;* You should have received a copy of the GNU General Public License
|
||
|
;* along with this program; if not, write to the Free Software
|
||
|
;* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02111, USA.
|
||
|
;*
|
||
|
;* This program is also available under a commercial proprietary license.
|
||
|
;* For more information, contact us at license @ x265.com.
|
||
|
;*****************************************************************************
|
||
|
|
||
|
%include "x86inc.asm"
|
||
|
|
||
|
SECTION .text
|
||
|
|
||
|
;-----------------------------------------------------------------------------
|
||
|
; void cpu_cpuid( int op, int *eax, int *ebx, int *ecx, int *edx )
|
||
|
;-----------------------------------------------------------------------------
|
||
|
cglobal cpu_cpuid, 5,7
|
||
|
push rbx
|
||
|
push r4
|
||
|
push r3
|
||
|
push r2
|
||
|
push r1
|
||
|
mov eax, r0d
|
||
|
xor ecx, ecx
|
||
|
cpuid
|
||
|
pop r4
|
||
|
mov [r4], eax
|
||
|
pop r4
|
||
|
mov [r4], ebx
|
||
|
pop r4
|
||
|
mov [r4], ecx
|
||
|
pop r4
|
||
|
mov [r4], edx
|
||
|
pop rbx
|
||
|
RET
|
||
|
|
||
|
;-----------------------------------------------------------------------------
|
||
|
; void cpu_xgetbv( int op, int *eax, int *edx )
|
||
|
;-----------------------------------------------------------------------------
|
||
|
cglobal cpu_xgetbv, 3,7
|
||
|
push r2
|
||
|
push r1
|
||
|
mov ecx, r0d
|
||
|
xgetbv
|
||
|
pop r4
|
||
|
mov [r4], eax
|
||
|
pop r4
|
||
|
mov [r4], edx
|
||
|
RET
|
||
|
|
||
|
%if ARCH_X86_64
|
||
|
|
||
|
;-----------------------------------------------------------------------------
|
||
|
; void stack_align( void (*func)(void*), void *arg );
|
||
|
;-----------------------------------------------------------------------------
|
||
|
cglobal stack_align
|
||
|
push rbp
|
||
|
mov rbp, rsp
|
||
|
%if WIN64
|
||
|
sub rsp, 32 ; shadow space
|
||
|
%endif
|
||
|
and rsp, ~31
|
||
|
mov rax, r0
|
||
|
mov r0, r1
|
||
|
mov r1, r2
|
||
|
mov r2, r3
|
||
|
call rax
|
||
|
leave
|
||
|
ret
|
||
|
|
||
|
%else
|
||
|
|
||
|
;-----------------------------------------------------------------------------
|
||
|
; int cpu_cpuid_test( void )
|
||
|
; return 0 if unsupported
|
||
|
;-----------------------------------------------------------------------------
|
||
|
cglobal cpu_cpuid_test
|
||
|
pushfd
|
||
|
push ebx
|
||
|
push ebp
|
||
|
push esi
|
||
|
push edi
|
||
|
pushfd
|
||
|
pop eax
|
||
|
mov ebx, eax
|
||
|
xor eax, 0x200000
|
||
|
push eax
|
||
|
popfd
|
||
|
pushfd
|
||
|
pop eax
|
||
|
xor eax, ebx
|
||
|
pop edi
|
||
|
pop esi
|
||
|
pop ebp
|
||
|
pop ebx
|
||
|
popfd
|
||
|
ret
|
||
|
|
||
|
cglobal stack_align
|
||
|
push ebp
|
||
|
mov ebp, esp
|
||
|
sub esp, 12
|
||
|
and esp, ~31
|
||
|
mov ecx, [ebp+8]
|
||
|
mov edx, [ebp+12]
|
||
|
mov [esp], edx
|
||
|
mov edx, [ebp+16]
|
||
|
mov [esp+4], edx
|
||
|
mov edx, [ebp+20]
|
||
|
mov [esp+8], edx
|
||
|
call ecx
|
||
|
leave
|
||
|
ret
|
||
|
|
||
|
%endif
|
||
|
|
||
|
;-----------------------------------------------------------------------------
|
||
|
; void cpu_emms( void )
|
||
|
;-----------------------------------------------------------------------------
|
||
|
cglobal cpu_emms
|
||
|
emms
|
||
|
ret
|
||
|
|
||
|
;-----------------------------------------------------------------------------
|
||
|
; void cpu_sfence( void )
|
||
|
;-----------------------------------------------------------------------------
|
||
|
cglobal cpu_sfence
|
||
|
sfence
|
||
|
ret
|
||
|
|
||
|
cextern intel_cpu_indicator_init
|
||
|
|
||
|
;-----------------------------------------------------------------------------
|
||
|
; void safe_intel_cpu_indicator_init( void );
|
||
|
;-----------------------------------------------------------------------------
|
||
|
cglobal safe_intel_cpu_indicator_init
|
||
|
push r0
|
||
|
push r1
|
||
|
push r2
|
||
|
push r3
|
||
|
push r4
|
||
|
push r5
|
||
|
push r6
|
||
|
%if ARCH_X86_64
|
||
|
push r7
|
||
|
push r8
|
||
|
push r9
|
||
|
push r10
|
||
|
push r11
|
||
|
push r12
|
||
|
push r13
|
||
|
push r14
|
||
|
%endif
|
||
|
push rbp
|
||
|
mov rbp, rsp
|
||
|
%if WIN64
|
||
|
sub rsp, 32 ; shadow space
|
||
|
%endif
|
||
|
and rsp, ~31
|
||
|
call intel_cpu_indicator_init
|
||
|
leave
|
||
|
%if ARCH_X86_64
|
||
|
pop r14
|
||
|
pop r13
|
||
|
pop r12
|
||
|
pop r11
|
||
|
pop r10
|
||
|
pop r9
|
||
|
pop r8
|
||
|
pop r7
|
||
|
%endif
|
||
|
pop r6
|
||
|
pop r5
|
||
|
pop r4
|
||
|
pop r3
|
||
|
pop r2
|
||
|
pop r1
|
||
|
pop r0
|
||
|
ret
|