]>
Commit | Line | Data |
---|---|---|
3eb9473e | 1 | ;------------------------------------------------------------------------------\r |
2 | ;\r | |
4ea9375a HT |
3 | ; Copyright (c) 2007, Intel Corporation. All rights reserved.<BR>\r |
4 | ; This program and the accompanying materials\r | |
3eb9473e | 5 | ; are licensed and made available under the terms and conditions of the BSD License\r |
6 | ; which accompanies this distribution. The full text of the license may be found at\r | |
7 | ; http://opensource.org/licenses/bsd-license.php\r | |
8 | ;\r | |
9 | ; THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS" BASIS,\r | |
10 | ; WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED.\r | |
11 | ;\r | |
12 | ; Module Name:\r | |
13 | ;\r | |
14 | ; SetMem.asm\r | |
15 | ;\r | |
16 | ; Abstract:\r | |
17 | ;\r | |
18 | ; memset function\r | |
19 | ;\r | |
20 | ; Notes:\r | |
21 | ;\r | |
22 | ;------------------------------------------------------------------------------\r | |
23 | \r | |
24 | .code\r | |
25 | \r | |
;------------------------------------------------------------------------------
;  VOID *
;  memset (
;    OUT VOID   *Buffer,          --> rcx
;    IN  UINT8  Value,            --> dl  (bits 8..63 of rdx are ignored)
;    IN  UINTN  Length            --> r8
;    );
;
;  Stores Value into Length consecutive bytes starting at Buffer and returns
;  Buffer in rax. A Length of 0 writes nothing and still returns Buffer.
;
;  Strategy:
;    1. byte stores (rep stosb) until the cursor is 16-byte aligned,
;    2. aligned 16-byte SSE2 stores (movdqa) for the bulk,
;    3. byte stores (rep stosb) for the remaining 0..15 bytes.
;
;  Registers: arguments arrive in rcx / rdx / r8 as annotated above.
;  Preserves: rdi (saved/restored by the USES clause).
;  Clobbers:  rcx, r8, r9, xmm0, flags.
;  Assumes:   DF is clear on entry; no cld is issued, so rep stosb relies on
;             the caller for forward direction.
;------------------------------------------------------------------------------
memset  PROC    USES rdi
    mov     rax, rcx                ; rax <- Buffer (return value if Length == 0)
    test    r8, r8                  ; Length == 0 ?
    jz      @SetDone                ; nothing to store
    mov     r9, rcx                 ; r9  <- Buffer, kept for the return value
    mov     rdi, rcx                ; rdi <- store cursor
    movzx   eax, dl                 ; eax <- Value, zero-extended (al feeds stosb)

    ; Head: bytes needed to reach the next 16-byte boundary.
    neg     rcx                     ; rcx still holds Buffer here: rcx <- -Buffer
    and     rcx, 15                 ; rcx <- (-Buffer) mod 16; rcx + rdi is aligned
    jz      @F                      ; already aligned, skip the head
    cmp     rcx, r8
    cmova   rcx, r8                 ; never store more than Length bytes
    sub     r8, rcx                 ; r8  <- bytes left after the head
    rep     stosb
@@:
    ; Body: split what is left into 16-byte blocks and a 0..15 byte tail.
    mov     rcx, r8
    and     r8, 15                  ; r8  <- tail byte count
    shr     rcx, 4                  ; rcx <- number of 16-byte blocks
    jz      @SetBytes               ; no full block, go straight to the tail
    imul    eax, eax, 01010101h     ; eax <- Value in all 4 bytes (al unchanged)
    movd    xmm0, eax               ; xmm0[0..31] <- Value repeats 4 times
    pshufd  xmm0, xmm0, 0           ; xmm0 <- Value repeats 16 times
@@:
    movdqa  [rdi], xmm0             ; rdi is 16-byte aligned here
    add     rdi, 16
    dec     rcx                     ; rcx >= 1 on loop entry (jz above)
    jnz     @B
@SetBytes:
    ; Tail: remaining 0..15 bytes; al still holds Value.
    mov     ecx, r8d                ; 32-bit write zero-extends into rcx
    rep     stosb
    mov     rax, r9                 ; rax <- Buffer (return value)
@SetDone:
    ret
memset  ENDP
73 | \r | |
74 | END\r |