]> git.proxmox.com Git - mirror_edk2.git/blob - MdePkg/Library/BaseMemoryLibOptDxe/Ia32/CopyMem.nasm
ArmPkg/ArmDisassemblerLib: fix check for MSR instruction
[mirror_edk2.git] / MdePkg / Library / BaseMemoryLibOptDxe / Ia32 / CopyMem.nasm
1 ;------------------------------------------------------------------------------
2 ;
3 ; Copyright (c) 2006, Intel Corporation. All rights reserved.<BR>
4 ; This program and the accompanying materials
5 ; are licensed and made available under the terms and conditions of the BSD License
6 ; which accompanies this distribution. The full text of the license may be found at
7 ; http://opensource.org/licenses/bsd-license.php.
8 ;
9 ; THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS" BASIS,
10 ; WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED.
11 ;
12 ; Module Name:
13 ;
14 ; CopyMem.nasm
15 ;
16 ; Abstract:
17 ;
18 ; CopyMem function
19 ;
20 ; Notes:
21 ;
22 ;------------------------------------------------------------------------------
23
24 SECTION .text
25
26 ;------------------------------------------------------------------------------
27 ; VOID *
28 ; InternalMemCopyMem (
29 ; IN VOID *Destination,
30 ; IN VOID *Source,
31 ; IN UINTN Count
32 ; );
33 ;------------------------------------------------------------------------------
34 global ASM_PFX(InternalMemCopyMem)
35 ASM_PFX(InternalMemCopyMem):
36 push esi
37 push edi
38 mov esi, [esp + 16] ; esi <- Source
39 mov edi, [esp + 12] ; edi <- Destination
40 mov edx, [esp + 20] ; edx <- Count
41 lea eax, [esi + edx - 1] ; eax <- End of Source
42 cmp esi, edi
43 jae .0
44 cmp eax, edi ; Overlapped?
45 jae @CopyBackward ; Copy backward if overlapped
46 .0:
47 xor ecx, ecx
48 sub ecx, edi
49 and ecx, 15 ; ecx + edi aligns on 16-byte boundary
50 jz .1
51 cmp ecx, edx
52 cmova ecx, edx
53 sub edx, ecx ; edx <- remaining bytes to copy
54 rep movsb
55 .1:
56 mov ecx, edx
57 and edx, 15
58 shr ecx, 4 ; ecx <- # of DQwords to copy
59 jz @CopyBytes
60 add esp, -16
61 movdqu [esp], xmm0 ; save xmm0
62 .2:
63 movdqu xmm0, [esi] ; esi may not be 16-bytes aligned
64 movntdq [edi], xmm0 ; edi should be 16-bytes aligned
65 add esi, 16
66 add edi, 16
67 loop .2
68 mfence
69 movdqu xmm0, [esp] ; restore xmm0
70 add esp, 16 ; stack cleanup
71 jmp @CopyBytes
72 @CopyBackward:
73 mov esi, eax ; esi <- Last byte in Source
74 lea edi, [edi + edx - 1] ; edi <- Last byte in Destination
75 std
76 @CopyBytes:
77 mov ecx, edx
78 rep movsb
79 cld
80 mov eax, [esp + 12] ; eax <- Destination as return value
81 pop edi
82 pop esi
83 ret
84