;------------------------------------------------------------------------------ ; ; Copyright (c) 2015, Intel Corporation. All rights reserved.
; This program and the accompanying materials ; are licensed and made available under the terms and conditions of the BSD License ; which accompanies this distribution. The full text of the license may be found at ; http://opensource.org/licenses/bsd-license.php. ; ; THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS" BASIS, ; WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED. ; ; Abstract: ; ; Provide macro for register save/restore using SSE registers ; ;------------------------------------------------------------------------------ ; ; Define SSE instruction set ; %ifdef USE_SSE41_FLAG ; ; Define SSE macros using SSE 4.1 instructions ; args 1:XMM, 2:IDX, 3:REG %macro SXMMN 3 pinsrd %1, %3, (%2 & 3) %endmacro ; ;args 1:XMM, 2:REG, 3:IDX ; %macro LXMMN 3 pextrd %2, %1, (%3 & 3) %endmacro %else ; ; Define SSE macros using SSE 2 instructions ; args 1:XMM, 2:IDX, 3:REG %macro SXMMN 3 pinsrw %1, %3, (%2 & 3) * 2 ror %3, 16 pinsrw %1, %3, (%2 & 3) * 2 + 1 rol %3, 16 %endmacro ; ;args 1:XMM, 2:REG, 3:IDX ; %macro LXMMN 3 pshufd %1, %1, ((0E4E4E4h >> (%3 * 2)) & 0FFh) movd %2, %1 pshufd %1, %1, ((0E4E4E4h >> (%3 * 2 + (%3 & 1) * 4)) & 0FFh) %endmacro %endif ; ; XMM7 to save/restore EBP, EBX, ESI, EDI ; %macro SAVE_REGS 0 SXMMN xmm7, 0, ebp SXMMN xmm7, 1, ebx SXMMN xmm7, 2, esi SXMMN xmm7, 3, edi SAVE_ESP %endmacro %macro LOAD_REGS 0 LXMMN xmm7, ebp, 0 LXMMN xmm7, ebx, 1 LXMMN xmm7, esi, 2 LXMMN xmm7, edi, 3 LOAD_ESP %endmacro ; ; XMM6 to save/restore EAX, EDX, ECX, ESP ; %macro LOAD_EAX 0 LXMMN xmm6, eax, 1 %endmacro %macro SAVE_EAX 0 SXMMN xmm6, 1, eax %endmacro %macro LOAD_EDX 0 LXMMN xmm6, edx, 2 %endmacro %macro SAVE_EDX 0 SXMMN xmm6, 2, edx %endmacro %macro SAVE_ECX 0 SXMMN xmm6, 3, ecx %endmacro %macro LOAD_ECX 0 LXMMN xmm6, ecx, 3 %endmacro %macro SAVE_ESP 0 SXMMN xmm6, 0, esp %endmacro %macro LOAD_ESP 0 movd esp, xmm6 %endmacro ; ; XMM5 for calling stack ; arg 1:Entry %macro CALL_XMM 1 mov esi, %%ReturnAddress pslldq xmm5, 4 %ifdef USE_SSE41_FLAG pinsrd xmm5, esi, 0 %else pinsrw xmm5, esi, 0 ror esi, 16 pinsrw xmm5, esi, 1 %endif mov esi, %1 jmp esi %%ReturnAddress: %endmacro %macro RET_XMM 0 movd esi, xmm5 psrldq xmm5, 4 jmp esi %endmacro %macro ENABLE_SSE 0 ; ; Initialize floating point units ; jmp NextAddress align 4 ; ; Float control word initial value: ; all exceptions masked, double-precision, round-to-nearest ; FpuControlWord DW 027Fh ; ; Multimedia-extensions control word: ; all exceptions masked, round-to-nearest, flush to zero for masked underflow ; MmxControlWord DD 01F80h SseError: ; ; Processor has to support SSE ; jmp SseError NextAddress: finit fldcw [FpuControlWord] ; ; Use CpuId instructuion (CPUID.01H:EDX.SSE[bit 25] = 1) to test ; whether the processor supports SSE instruction. ; mov eax, 1 cpuid bt edx, 25 jnc SseError %ifdef USE_SSE41_FLAG ; ; SSE 4.1 support ; bt ecx, 19 jnc SseError %endif ; ; Set OSFXSR bit (bit #9) & OSXMMEXCPT bit (bit #10) ; mov eax, cr4 or eax, 00000600h mov cr4, eax ; ; The processor should support SSE instruction and we can use ; ldmxcsr instruction ; ldmxcsr [MmxControlWord] %endmacro