3 ;Copyright (c) 2006, Intel Corporation. All rights reserved.<BR>
4 ;This program and the accompanying materials
5 ;are licensed and made available under the terms and conditions of the BSD License
6 ;which accompanies this distribution. The full text of the license may be found at
7 ;http://opensource.org/licenses/bsd-license.php
9 ;THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS" BASIS,
10 ;WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED.
18 ; This is the code that supports IA32-optimized CopyMem service
22 ;---------------------------------------------------------------------------
28 ;---------------------------------------------------------------------------
31 ;EfiCommonLibCopyMem (
32 ; IN VOID *Destination,
40 ; Copy Length bytes from Source to Destination.
44 ; Destination - Target of copy
46 ; Source - Place to copy from
48 ; Length - Number of bytes to copy
; EfiCommonLibCopyMem: copies Count bytes from Source to Destination. The
; three arguments are read from the stack frame at [ebp + 8] (Destination),
; [ebp + 0Ch] (Source) and [ebp + 10h] (Count).
;
; Register roles, as set up below:
;   ecx      = Count (bytes still to copy)
;   esi      = Source pointer
;   edi      = Destination pointer
;   eax / al = scratch for address arithmetic and for data in flight
;   mm0      = scratch for the 64-byte block copy
;
; NOTE(review): this listing appears to be an excerpt. The frame setup,
; several compares, most label definitions, the pointer/count updates of the
; byte loops and the epilogue are not visible here -- confirm every note
; marked "presumably" against the complete file.
55 EfiCommonLibCopyMem PROC
59 push ecx ; reserve space for Scratch Local variable UINT64 MmxSave
; NOTE(review): one 32-bit push reserves 4 bytes; the other half of the
; 8-byte MmxSave slot is presumably reserved by a line not visible here.
; Load the three stack arguments into their working registers.
64 mov ecx, [ebp + 10h] ; Count
65 mov esi, [ebp + 0Ch] ; Source
66 mov edi, [ebp + 8] ; Destination
68 ; First off, make sure we have no overlap. That is to say,
69 ; if (Source == Destination) => do nothing
70 ; if (Source + Count <= Destination) => regular copy
71 ; if (Destination + Count <= Source) => regular copy
72 ; otherwise, do a reverse copy
; NOTE(review): the loads of eax and the compares that consume these sums
; are not visible in this excerpt.
74 add eax, ecx ; Source + Count
79 add eax, ecx ; Dest + Count
; jb is the unsigned "below" test; the compare that sets the flags for it is
; not visible in this excerpt.
85 jb _CopyOverlapped ; too bad -- overlaps
87 ; Pick up misaligned start bytes to get destination pointer 4-byte aligned
90 je _CopyMemDone ; Count == 0, all done
; Only the low two address bits are kept: zero means 4-byte aligned.
92 and dl, 3 ; check lower 2 bits of address
94 je SHORT _CopyBlocks ; already aligned?
; Not aligned yet: move a single byte, then re-test from _StartByteCopy.
97 mov al, BYTE PTR [esi] ; get byte from Source
98 mov BYTE PTR [edi], al ; write byte to Destination
102 jmp _StartByteCopy ; back to top of loop
105 ; Compute how many 64-byte blocks we can copy
; After this sequence eax = ecx / 64 (number of whole 64-byte blocks) and
; ecx = ecx mod 64 (bytes left over for the dword and byte loops).
106 mov eax, ecx ; get Count in eax
107 shr eax, 6 ; convert to 64-byte count
108 shl eax, 6 ; convert back to bytes
109 sub ecx, eax ; subtract from the original count
110 shr eax, 6 ; and this is how many 64-byte blocks
112 ; If no 64-byte blocks, then skip
114 je _CopyRemainingDWords
116 ; Save mm0 to UINT64 MmxSave
; Copy one 64-byte block as eight 8-byte moves through mm0
; (offsets 0, 8, ..., 56 from esi to the same offsets from edi).
121 movq mm0, QWORD PTR ds:[esi]
122 movq QWORD PTR ds:[edi], mm0
123 movq mm0, QWORD PTR ds:[esi+8]
124 movq QWORD PTR ds:[edi+8], mm0
125 movq mm0, QWORD PTR ds:[esi+16]
126 movq QWORD PTR ds:[edi+16], mm0
127 movq mm0, QWORD PTR ds:[esi+24]
128 movq QWORD PTR ds:[edi+24], mm0
129 movq mm0, QWORD PTR ds:[esi+32]
130 movq QWORD PTR ds:[edi+32], mm0
131 movq mm0, QWORD PTR ds:[esi+40]
132 movq QWORD PTR ds:[edi+40], mm0
133 movq mm0, QWORD PTR ds:[esi+48]
134 movq QWORD PTR ds:[edi+48], mm0
135 movq mm0, QWORD PTR ds:[esi+56]
136 movq QWORD PTR ds:[edi+56], mm0
; NOTE(review): the pointer advance and block-count loop control for the
; MMX copy are not visible in this excerpt.
143 ; Restore mm0 from MmxSave
145 emms ; empty the MMX state before returning to non-MMX code
147 ; Copy as many DWORDS as possible
148 _CopyRemainingDWords:
; NOTE(review): presumably preceded by a compare of ecx against 4, so that
; jb leaves the loop once fewer than 4 bytes remain -- that line is not
; visible here.
150 jb _CopyRemainingBytes
; Move 4 bytes, then step the count down and both pointers up by 4.
152 mov eax, DWORD PTR [esi] ; get data from Source
153 mov DWORD PTR [edi], eax ; write dword to Destination
154 sub ecx, 4 ; decrement Count
155 add esi, 4 ; advance Source pointer
156 add edi, 4 ; advance Destination pointer
157 jmp _CopyRemainingDWords ; back to top
; Tail of the forward copy: the bytes left after the dword loop are moved
; one at a time.
162 mov al, BYTE PTR [esi] ; get byte from Source
163 mov BYTE PTR [edi], al ; write byte to Destination
166 inc edi ; advance Destination pointer
167 jmp SHORT _CopyRemainingBytes ; back to top of loop
170 ; We do this block if the source and destination buffers overlap. To
171 ; handle it, copy starting at the end of the source buffer and work
172 ; your way back. Since this is the atypical case, this code has not
173 ; been optimized, and thus simply copies bytes.
177 ; Move the source and destination pointers to the end of the range
178 add esi, ecx ; Source + Count
180 add edi, ecx ; Dest + Count
; Reverse byte copy; the pointer/count decrements and the loop exit test are
; not visible in this excerpt.
186 mov al, BYTE PTR [esi] ; get byte from Source
187 mov BYTE PTR [edi], al ; write byte to Destination
191 jmp _CopyOverlappedLoop ; back to top of loop
199 EfiCommonLibCopyMem ENDP