]> git.proxmox.com Git - mirror_edk2.git/blob - UefiCpuPkg/Library/MpInitLib/X64/MpFuncs.nasm
e7e7d8086dd01e989ab6114c983b9abd37d04513
[mirror_edk2.git] / UefiCpuPkg / Library / MpInitLib / X64 / MpFuncs.nasm
1 ;------------------------------------------------------------------------------ ;
2 ; Copyright (c) 2015 - 2016, Intel Corporation. All rights reserved.<BR>
3 ; This program and the accompanying materials
4 ; are licensed and made available under the terms and conditions of the BSD License
5 ; which accompanies this distribution. The full text of the license may be found at
6 ; http://opensource.org/licenses/bsd-license.php.
7 ;
8 ; THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS" BASIS,
9 ; WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER EXPRESS OR IMPLIED.
10 ;
11 ; Module Name:
12 ;
13 ; MpFuncs.nasm
14 ;
15 ; Abstract:
16 ;
17 ; This is the assembly code for MP support
18 ;
19 ;-------------------------------------------------------------------------------
20
21 %include "MpEqu.inc"
22 extern ASM_PFX(InitializeFloatingPointUnits)
23
24 DEFAULT REL
25
26 SECTION .text
27
28 ;-------------------------------------------------------------------------------------
29 ;RendezvousFunnelProc procedure follows. All APs execute their procedure. This
30 ;procedure serializes all the AP processors through an Init sequence. It must be
31 ;noted that APs arrive here very raw...ie: real mode, no stack.
32 ;ALSO THIS PROCEDURE IS EXECUTED BY APs ONLY ON 16 BIT MODE. HENCE THIS PROC
33 ;IS IN MACHINE CODE.
34 ;-------------------------------------------------------------------------------------
35 global ASM_PFX(RendezvousFunnelProc)
36 ASM_PFX(RendezvousFunnelProc):
37 RendezvousFunnelProcStart:
38 ; At this point CS = 0x(vv00) and ip= 0x0.
39 ; Save BIST information to ebp firstly
40
41 BITS 16
42 mov ebp, eax ; Save BIST information
43
44 mov ax, cs
45 mov ds, ax
46 mov es, ax
47 mov ss, ax
48 xor ax, ax
49 mov fs, ax
50 mov gs, ax
51
52 mov si, BufferStartLocation
53 mov ebx, [si]
54
55 mov di, ModeOffsetLocation
56 mov eax, [di]
57 mov di, CodeSegmentLocation
58 mov edx, [di]
59 mov di, ax
60 sub di, 02h
61 mov [di],dx ; Patch long mode CS
62 sub di, 04h
63 add eax, ebx
64 mov [di],eax ; Patch address
65
66 mov si, GdtrLocation
67 o32 lgdt [cs:si]
68
69 mov si, IdtrLocation
70 o32 lidt [cs:si]
71
72 mov si, EnableExecuteDisableLocation
73 cmp byte [si], 0
74 jz SkipEnableExecuteDisableBit
75
76 ;
77 ; Enable execute disable bit
78 ;
79 mov ecx, 0c0000080h ; EFER MSR number
80 rdmsr ; Read EFER
81 bts eax, 11 ; Enable Execute Disable Bit
82 wrmsr ; Write EFER
83
84 SkipEnableExecuteDisableBit:
85
86 mov di, DataSegmentLocation
87 mov edi, [di] ; Save long mode DS in edi
88
89 mov si, Cr3Location ; Save CR3 in ecx
90 mov ecx, [si]
91
92 xor ax, ax
93 mov ds, ax ; Clear data segment
94
95 mov eax, cr0 ; Get control register 0
96 or eax, 000000003h ; Set PE bit (bit #0) & MP
97 mov cr0, eax
98
99 mov eax, cr4
100 bts eax, 5
101 mov cr4, eax
102
103 mov cr3, ecx ; Load CR3
104
105 mov ecx, 0c0000080h ; EFER MSR number
106 rdmsr ; Read EFER
107 bts eax, 8 ; Set LME=1
108 wrmsr ; Write EFER
109
110 mov eax, cr0 ; Read CR0
111 bts eax, 31 ; Set PG=1
112 mov cr0, eax ; Write CR0
113
114 jmp 0:strict dword 0 ; far jump to long mode
115 BITS 64
116 LongModeStart:
117 mov eax, edi
118 mov ds, ax
119 mov es, ax
120 mov ss, ax
121
122 mov esi, ebx
123 lea edi, [esi + InitFlagLocation]
124 cmp qword [edi], 1 ; ApInitConfig
125 jnz GetApicId
126
127 ; AP init
128 mov edi, esi
129 add edi, LockLocation
130 mov rax, NotVacantFlag
131
132 TestLock:
133 xchg qword [edi], rax
134 cmp rax, NotVacantFlag
135 jz TestLock
136
137 lea ecx, [esi + NumApsExecutingLocation]
138 inc dword [ecx]
139 mov ebx, [ecx]
140
141 Releaselock:
142 mov rax, VacantFlag
143 xchg qword [edi], rax
144 ; program stack
145 mov edi, esi
146 add edi, StackSizeLocation
147 mov eax, dword [edi]
148 mov ecx, ebx
149 inc ecx
150 mul ecx ; EAX = StackSize * (CpuNumber + 1)
151 mov edi, esi
152 add edi, StackStartAddressLocation
153 add rax, qword [edi]
154 mov rsp, rax
155 jmp CProcedureInvoke
156
157 GetApicId:
158 mov eax, 0
159 cpuid
160 cmp eax, 0bh
161 jb NoX2Apic ; CPUID level below CPUID_EXTENDED_TOPOLOGY
162
163 mov eax, 0bh
164 xor ecx, ecx
165 cpuid
166 test ebx, 0ffffh
167 jz NoX2Apic ; CPUID.0BH:EBX[15:0] is zero
168
169 ; Processor is x2APIC capable; 32-bit x2APIC ID is already in EDX
170 jmp GetProcessorNumber
171
172 NoX2Apic:
173 ; Processor is not x2APIC capable, so get 8-bit APIC ID
174 mov eax, 1
175 cpuid
176 shr ebx, 24
177 mov edx, ebx
178
179 GetProcessorNumber:
180 ;
181 ; Get processor number for this AP
182 ; Note that BSP may become an AP due to SwitchBsp()
183 ;
184 xor ebx, ebx
185 lea eax, [esi + CpuInfoLocation]
186 mov edi, [eax]
187
188 GetNextProcNumber:
189 cmp dword [edi], edx ; APIC ID match?
190 jz ProgramStack
191 add edi, 20
192 inc ebx
193 jmp GetNextProcNumber
194
195 ProgramStack:
196 mov rsp, qword [edi + 12]
197
198 CProcedureInvoke:
199 push rbp ; Push BIST data at top of AP stack
200 xor rbp, rbp ; Clear ebp for call stack trace
201 push rbp
202 mov rbp, rsp
203
204 mov rax, ASM_PFX(InitializeFloatingPointUnits)
205 sub rsp, 20h
206 call rax ; Call assembly function to initialize FPU per UEFI spec
207 add rsp, 20h
208
209 mov edx, ebx ; edx is NumApsExecuting
210 mov ecx, esi
211 add ecx, LockLocation ; rcx is address of exchange info data buffer
212
213 mov edi, esi
214 add edi, ApProcedureLocation
215 mov rax, qword [edi]
216
217 sub rsp, 20h
218 call rax ; Invoke C function
219 add rsp, 20h
220 jmp $ ; Should never reach here
221
222 RendezvousFunnelProcEnd:
223
224 ;-------------------------------------------------------------------------------------
225 ; AsmRelocateApLoop (MwaitSupport, ApTargetCState, PmCodeSegment);
226 ;-------------------------------------------------------------------------------------
227 global ASM_PFX(AsmRelocateApLoop)
228 ASM_PFX(AsmRelocateApLoop):
229 AsmRelocateApLoopStart:
230 push rcx
231 push rdx
232
233 lea rsi, [PmEntry] ; rsi <- The start address of transition code
234
235 push r8
236 push rsi
237 DB 0x48
238 retf
239 BITS 32
240 PmEntry:
241 mov eax, cr0
242 btr eax, 31 ; Clear CR0.PG
243 mov cr0, eax ; Disable paging and caches
244
245 mov ebx, edx ; Save EntryPoint to rbx, for rdmsr will overwrite rdx
246 mov ecx, 0xc0000080
247 rdmsr
248 and ah, ~ 1 ; Clear LME
249 wrmsr
250 mov eax, cr4
251 and al, ~ (1 << 5) ; Clear PAE
252 mov cr4, eax
253
254 pop edx
255 add esp, 4
256 pop ecx,
257 add esp, 4
258 cmp cl, 1 ; Check mwait-monitor support
259 jnz HltLoop
260 mov ebx, edx ; Save C-State to ebx
261 MwaitLoop:
262 mov eax, esp ; Set Monitor Address
263 xor ecx, ecx ; ecx = 0
264 xor edx, edx ; edx = 0
265 monitor
266 shl ebx, 4
267 mov eax, ebx ; Mwait Cx, Target C-State per eax[7:4]
268 mwait
269 jmp MwaitLoop
270 HltLoop:
271 cli
272 hlt
273 jmp HltLoop
274 ret
275 BITS 64
276 AsmRelocateApLoopEnd:
277
278 ;-------------------------------------------------------------------------------------
279 ; AsmGetAddressMap (&AddressMap);
280 ;-------------------------------------------------------------------------------------
281 global ASM_PFX(AsmGetAddressMap)
282 ASM_PFX(AsmGetAddressMap):
283 mov rax, ASM_PFX(RendezvousFunnelProc)
284 mov qword [rcx], rax
285 mov qword [rcx + 8h], LongModeStart - RendezvousFunnelProcStart
286 mov qword [rcx + 10h], RendezvousFunnelProcEnd - RendezvousFunnelProcStart
287 mov rax, ASM_PFX(AsmRelocateApLoop)
288 mov qword [rcx + 18h], rax
289 mov qword [rcx + 20h], AsmRelocateApLoopEnd - AsmRelocateApLoopStart
290 ret
291
292 ;-------------------------------------------------------------------------------------
293 ;AsmExchangeRole procedure follows. This procedure executed by current BSP, that is
294 ;about to become an AP. It switches its stack with the current AP.
295 ;AsmExchangeRole (IN CPU_EXCHANGE_INFO *MyInfo, IN CPU_EXCHANGE_INFO *OthersInfo);
296 ;-------------------------------------------------------------------------------------
297 global ASM_PFX(AsmExchangeRole)
298 ASM_PFX(AsmExchangeRole):
299 ; DO NOT call other functions in this function, since 2 CPU may use 1 stack
300 ; at the same time. If 1 CPU try to call a function, stack will be corrupted.
301
302 push rax
303 push rbx
304 push rcx
305 push rdx
306 push rsi
307 push rdi
308 push rbp
309 push r8
310 push r9
311 push r10
312 push r11
313 push r12
314 push r13
315 push r14
316 push r15
317
318 mov rax, cr0
319 push rax
320
321 mov rax, cr4
322 push rax
323
324 ; rsi contains MyInfo pointer
325 mov rsi, rcx
326
327 ; rdi contains OthersInfo pointer
328 mov rdi, rdx
329
330 ;Store EFLAGS, GDTR and IDTR regiter to stack
331 pushfq
332 sgdt [rsi + 16]
333 sidt [rsi + 26]
334
335 ; Store the its StackPointer
336 mov [rsi + 8], rsp
337
338 ; update its switch state to STORED
339 mov byte [rsi], CPU_SWITCH_STATE_STORED
340
341 WaitForOtherStored:
342 ; wait until the other CPU finish storing its state
343 cmp byte [rdi], CPU_SWITCH_STATE_STORED
344 jz OtherStored
345 pause
346 jmp WaitForOtherStored
347
348 OtherStored:
349 ; Since another CPU already stored its state, load them
350 ; load GDTR value
351 lgdt [rdi + 16]
352
353 ; load IDTR value
354 lidt [rdi + 26]
355
356 ; load its future StackPointer
357 mov rsp, [rdi + 8]
358
359 ; update the other CPU's switch state to LOADED
360 mov byte [rdi], CPU_SWITCH_STATE_LOADED
361
362 WaitForOtherLoaded:
363 ; wait until the other CPU finish loading new state,
364 ; otherwise the data in stack may corrupt
365 cmp byte [rsi], CPU_SWITCH_STATE_LOADED
366 jz OtherLoaded
367 pause
368 jmp WaitForOtherLoaded
369
370 OtherLoaded:
371 ; since the other CPU already get the data it want, leave this procedure
372 popfq
373
374 pop rax
375 mov cr4, rax
376
377 pop rax
378 mov cr0, rax
379
380 pop r15
381 pop r14
382 pop r13
383 pop r12
384 pop r11
385 pop r10
386 pop r9
387 pop r8
388 pop rbp
389 pop rdi
390 pop rsi
391 pop rdx
392 pop rcx
393 pop rbx
394 pop rax
395
396 ret