]> git.proxmox.com Git - mirror_ubuntu-bionic-kernel.git/blame - arch/arm64/include/asm/kvm_host.h
arm64: KVM: Add ARCH_WORKAROUND_2 support for guests
[mirror_ubuntu-bionic-kernel.git] / arch / arm64 / include / asm / kvm_host.h
CommitLineData
4f8d6632
MZ
1/*
2 * Copyright (C) 2012,2013 - ARM Ltd
3 * Author: Marc Zyngier <marc.zyngier@arm.com>
4 *
5 * Derived from arch/arm/include/asm/kvm_host.h:
6 * Copyright (C) 2012 - Virtual Open Systems and Columbia University
7 * Author: Christoffer Dall <c.dall@virtualopensystems.com>
8 *
9 * This program is free software; you can redistribute it and/or modify
10 * it under the terms of the GNU General Public License version 2 as
11 * published by the Free Software Foundation.
12 *
13 * This program is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
17 *
18 * You should have received a copy of the GNU General Public License
19 * along with this program. If not, see <http://www.gnu.org/licenses/>.
20 */
21
22#ifndef __ARM64_KVM_HOST_H__
23#define __ARM64_KVM_HOST_H__
24
65647300
PB
25#include <linux/types.h>
26#include <linux/kvm_types.h>
63a1e1c9 27#include <asm/cpufeature.h>
bb5e4e0c 28#include <asm/daifflags.h>
17eed27b 29#include <asm/fpsimd.h>
4f8d6632 30#include <asm/kvm.h>
3a3604bc 31#include <asm/kvm_asm.h>
4f8d6632
MZ
32#include <asm/kvm_mmio.h>
33
c1426e4c
EA
34#define __KVM_HAVE_ARCH_INTC_INITIALIZED
35
955a3fc6 36#define KVM_USER_MEM_SLOTS 512
920552b2 37#define KVM_HALT_POLL_NS_DEFAULT 500000
4f8d6632
MZ
38
39#include <kvm/arm_vgic.h>
40#include <kvm/arm_arch_timer.h>
04fe4726 41#include <kvm/arm_pmu.h>
4f8d6632 42
ef748917
ML
43#define KVM_MAX_VCPUS VGIC_V3_MAX_CPUS
44
808e7381 45#define KVM_VCPU_MAX_FEATURES 4
4f8d6632 46
7b244e2b 47#define KVM_REQ_SLEEP \
2387149e 48 KVM_ARCH_REQ_FLAGS(0, KVM_REQUEST_WAIT | KVM_REQUEST_NO_WAKEUP)
325f9c64 49#define KVM_REQ_IRQ_PENDING KVM_ARCH_REQ(1)
b13216cf 50
6951e48b 51int __attribute_const__ kvm_target_cpu(void);
4f8d6632 52int kvm_reset_vcpu(struct kvm_vcpu *vcpu);
b46f01ce 53int kvm_arch_dev_ioctl_check_extension(struct kvm *kvm, long ext);
c612505f 54void __extended_idmap_trampoline(phys_addr_t boot_pgd, phys_addr_t idmap_start);
4f8d6632
MZ
55
56struct kvm_arch {
57 /* The VMID generation used for the virt. memory system */
58 u64 vmid_gen;
59 u32 vmid;
60
61 /* 1-level 2nd stage table and lock */
62 spinlock_t pgd_lock;
63 pgd_t *pgd;
64
65 /* VTTBR value associated with above pgd and vmid */
66 u64 vttbr;
67
94d0e598
MZ
68 /* The last vcpu id that ran on each physical CPU */
69 int __percpu *last_vcpu_ran;
70
3caa2d8c
AP
71 /* The maximum number of vCPUs depends on the used GIC model */
72 int max_vcpus;
73
4f8d6632
MZ
74 /* Interrupt controller */
75 struct vgic_dist vgic;
9c98a823
MZ
76
77 /* Mandated version of PSCI */
78 u32 psci_version;
4f8d6632
MZ
79};
80
81#define KVM_NR_MEM_OBJS 40
82
83/*
84 * We don't want allocation failures within the mmu code, so we preallocate
85 * enough memory for a single page fault in a cache.
86 */
87struct kvm_mmu_memory_cache {
88 int nobjs;
89 void *objects[KVM_NR_MEM_OBJS];
90};
91
92struct kvm_vcpu_fault_info {
93 u32 esr_el2; /* Hyp Syndrom Register */
94 u64 far_el2; /* Hyp Fault Address Register */
95 u64 hpfar_el2; /* Hyp IPA Fault Address Register */
2e66e3af 96 u64 disr_el1; /* Deferred [SError] Status Register */
4f8d6632
MZ
97};
98
9d8415d6
MZ
99/*
100 * 0 is reserved as an invalid value.
101 * Order should be kept in sync with the save/restore code.
102 */
103enum vcpu_sysreg {
104 __INVALID_SYSREG__,
105 MPIDR_EL1, /* MultiProcessor Affinity Register */
106 CSSELR_EL1, /* Cache Size Selection Register */
107 SCTLR_EL1, /* System Control Register */
108 ACTLR_EL1, /* Auxiliary Control Register */
109 CPACR_EL1, /* Coprocessor Access Control */
110 TTBR0_EL1, /* Translation Table Base Register 0 */
111 TTBR1_EL1, /* Translation Table Base Register 1 */
112 TCR_EL1, /* Translation Control Register */
113 ESR_EL1, /* Exception Syndrome Register */
ef769e32
AB
114 AFSR0_EL1, /* Auxiliary Fault Status Register 0 */
115 AFSR1_EL1, /* Auxiliary Fault Status Register 1 */
9d8415d6
MZ
116 FAR_EL1, /* Fault Address Register */
117 MAIR_EL1, /* Memory Attribute Indirection Register */
118 VBAR_EL1, /* Vector Base Address Register */
119 CONTEXTIDR_EL1, /* Context ID Register */
120 TPIDR_EL0, /* Thread ID, User R/W */
121 TPIDRRO_EL0, /* Thread ID, User R/O */
122 TPIDR_EL1, /* Thread ID, Privileged */
123 AMAIR_EL1, /* Aux Memory Attribute Indirection Register */
124 CNTKCTL_EL1, /* Timer Control Register (EL1) */
125 PAR_EL1, /* Physical Address Register */
126 MDSCR_EL1, /* Monitor Debug System Control Register */
127 MDCCINT_EL1, /* Monitor Debug Comms Channel Interrupt Enable Reg */
dd627dd4 128 DISR_EL1, /* Deferred Interrupt Status Register */
9d8415d6 129
ab946834
SZ
130 /* Performance Monitors Registers */
131 PMCR_EL0, /* Control Register */
3965c3ce 132 PMSELR_EL0, /* Event Counter Selection Register */
051ff581
SZ
133 PMEVCNTR0_EL0, /* Event Counter Register (0-30) */
134 PMEVCNTR30_EL0 = PMEVCNTR0_EL0 + 30,
135 PMCCNTR_EL0, /* Cycle Counter Register */
9feb21ac
SZ
136 PMEVTYPER0_EL0, /* Event Type Register (0-30) */
137 PMEVTYPER30_EL0 = PMEVTYPER0_EL0 + 30,
138 PMCCFILTR_EL0, /* Cycle Count Filter Register */
96b0eebc 139 PMCNTENSET_EL0, /* Count Enable Set Register */
9db52c78 140 PMINTENSET_EL1, /* Interrupt Enable Set Register */
76d883c4 141 PMOVSSET_EL0, /* Overflow Flag Status Set Register */
7a0adc70 142 PMSWINC_EL0, /* Software Increment Register */
d692b8ad 143 PMUSERENR_EL0, /* User Enable Register */
ab946834 144
9d8415d6
MZ
145 /* 32bit specific registers. Keep them at the end of the range */
146 DACR32_EL2, /* Domain Access Control Register */
147 IFSR32_EL2, /* Instruction Fault Status Register */
148 FPEXC32_EL2, /* Floating-Point Exception Control Register */
149 DBGVCR32_EL2, /* Debug Vector Catch Register */
150
151 NR_SYS_REGS /* Nothing after this line! */
152};
153
154/* 32bit mapping */
155#define c0_MPIDR (MPIDR_EL1 * 2) /* MultiProcessor ID Register */
156#define c0_CSSELR (CSSELR_EL1 * 2)/* Cache Size Selection Register */
157#define c1_SCTLR (SCTLR_EL1 * 2) /* System Control Register */
158#define c1_ACTLR (ACTLR_EL1 * 2) /* Auxiliary Control Register */
159#define c1_CPACR (CPACR_EL1 * 2) /* Coprocessor Access Control */
160#define c2_TTBR0 (TTBR0_EL1 * 2) /* Translation Table Base Register 0 */
161#define c2_TTBR0_high (c2_TTBR0 + 1) /* TTBR0 top 32 bits */
162#define c2_TTBR1 (TTBR1_EL1 * 2) /* Translation Table Base Register 1 */
163#define c2_TTBR1_high (c2_TTBR1 + 1) /* TTBR1 top 32 bits */
164#define c2_TTBCR (TCR_EL1 * 2) /* Translation Table Base Control R. */
165#define c3_DACR (DACR32_EL2 * 2)/* Domain Access Control Register */
166#define c5_DFSR (ESR_EL1 * 2) /* Data Fault Status Register */
167#define c5_IFSR (IFSR32_EL2 * 2)/* Instruction Fault Status Register */
168#define c5_ADFSR (AFSR0_EL1 * 2) /* Auxiliary Data Fault Status R */
169#define c5_AIFSR (AFSR1_EL1 * 2) /* Auxiliary Instr Fault Status R */
170#define c6_DFAR (FAR_EL1 * 2) /* Data Fault Address Register */
171#define c6_IFAR (c6_DFAR + 1) /* Instruction Fault Address Register */
172#define c7_PAR (PAR_EL1 * 2) /* Physical Address Register */
173#define c7_PAR_high (c7_PAR + 1) /* PAR top 32 bits */
174#define c10_PRRR (MAIR_EL1 * 2) /* Primary Region Remap Register */
175#define c10_NMRR (c10_PRRR + 1) /* Normal Memory Remap Register */
176#define c12_VBAR (VBAR_EL1 * 2) /* Vector Base Address Register */
177#define c13_CID (CONTEXTIDR_EL1 * 2) /* Context ID Register */
178#define c13_TID_URW (TPIDR_EL0 * 2) /* Thread ID, User R/W */
179#define c13_TID_URO (TPIDRRO_EL0 * 2)/* Thread ID, User R/O */
180#define c13_TID_PRIV (TPIDR_EL1 * 2) /* Thread ID, Privileged */
181#define c10_AMAIR0 (AMAIR_EL1 * 2) /* Aux Memory Attr Indirection Reg */
182#define c10_AMAIR1 (c10_AMAIR0 + 1)/* Aux Memory Attr Indirection Reg */
183#define c14_CNTKCTL (CNTKCTL_EL1 * 2) /* Timer Control Register (PL1) */
184
185#define cp14_DBGDSCRext (MDSCR_EL1 * 2)
186#define cp14_DBGBCR0 (DBGBCR0_EL1 * 2)
187#define cp14_DBGBVR0 (DBGBVR0_EL1 * 2)
188#define cp14_DBGBXVR0 (cp14_DBGBVR0 + 1)
189#define cp14_DBGWCR0 (DBGWCR0_EL1 * 2)
190#define cp14_DBGWVR0 (DBGWVR0_EL1 * 2)
191#define cp14_DBGDCCINT (MDCCINT_EL1 * 2)
192
193#define NR_COPRO_REGS (NR_SYS_REGS * 2)
194
4f8d6632
MZ
195struct kvm_cpu_context {
196 struct kvm_regs gp_regs;
40033a61
MZ
197 union {
198 u64 sys_regs[NR_SYS_REGS];
72564016 199 u32 copro[NR_COPRO_REGS];
40033a61 200 };
303c68ce
JM
201
202 struct kvm_vcpu *__hyp_running_vcpu;
4f8d6632
MZ
203};
204
205typedef struct kvm_cpu_context kvm_cpu_context_t;
206
207struct kvm_vcpu_arch {
208 struct kvm_cpu_context ctxt;
209
210 /* HYP configuration */
211 u64 hcr_el2;
56c7f5e7 212 u32 mdcr_el2;
4f8d6632
MZ
213
214 /* Exception Information */
215 struct kvm_vcpu_fault_info fault;
216
9ae6a587
MZ
217 /* State of various workarounds, see kvm_asm.h for bit assignment */
218 u64 workaround_flags;
219
84e690bf 220 /* Guest debug state */
0c557ed4
MZ
221 u64 debug_flags;
222
84e690bf
AB
223 /*
224 * We maintain more than a single set of debug registers to support
225 * debugging the guest from the host and to maintain separate host and
226 * guest state during world switches. vcpu_debug_state are the debug
227 * registers of the vcpu as the guest sees them. host_debug_state are
834bf887
AB
228 * the host registers which are saved and restored during
229 * world switches. external_debug_state contains the debug
230 * values we want to debug the guest. This is set via the
231 * KVM_SET_GUEST_DEBUG ioctl.
84e690bf
AB
232 *
233 * debug_ptr points to the set of debug registers that should be loaded
234 * onto the hardware when running the guest.
235 */
236 struct kvm_guest_debug_arch *debug_ptr;
237 struct kvm_guest_debug_arch vcpu_debug_state;
834bf887 238 struct kvm_guest_debug_arch external_debug_state;
84e690bf 239
4f8d6632
MZ
240 /* Pointer to host CPU context */
241 kvm_cpu_context_t *host_cpu_context;
f85279b4
WD
242 struct {
243 /* {Break,watch}point registers */
244 struct kvm_guest_debug_arch regs;
245 /* Statistical profiling extension */
246 u64 pmscr_el1;
247 } host_debug_state;
4f8d6632
MZ
248
249 /* VGIC state */
250 struct vgic_cpu vgic_cpu;
251 struct arch_timer_cpu timer_cpu;
04fe4726 252 struct kvm_pmu pmu;
4f8d6632
MZ
253
254 /*
255 * Anything that is not used directly from assembly code goes
256 * here.
257 */
4f8d6632 258
337b99bf
AB
259 /*
260 * Guest registers we preserve during guest debugging.
261 *
262 * These shadow registers are updated by the kvm_handle_sys_reg
263 * trap handler if the guest accesses or updates them while we
264 * are using guest debug.
265 */
266 struct {
267 u32 mdscr_el1;
268 } guest_debug_preserved;
269
3781528e
EA
270 /* vcpu power-off state */
271 bool power_off;
4f8d6632 272
3b92830a
EA
273 /* Don't run the guest (internal implementation need) */
274 bool pause;
275
4f8d6632
MZ
276 /* IO related fields */
277 struct kvm_decode mmio_decode;
278
279 /* Interrupt related fields */
280 u64 irq_lines; /* IRQ and FIQ levels */
281
282 /* Cache some mmu pages needed inside spinlock regions */
283 struct kvm_mmu_memory_cache mmu_page_cache;
284
285 /* Target CPU and feature flags */
6c8c0c4d 286 int target;
4f8d6632
MZ
287 DECLARE_BITMAP(features, KVM_VCPU_MAX_FEATURES);
288
289 /* Detect first run of a vcpu */
290 bool has_run_once;
b9da0f1a
JM
291
292 /* Virtual SError ESR to restore when HCR_EL2.VSE is set */
293 u64 vsesr_el2;
4f8d6632
MZ
294};
295
296#define vcpu_gp_regs(v) (&(v)->arch.ctxt.gp_regs)
297#define vcpu_sys_reg(v,r) ((v)->arch.ctxt.sys_regs[(r)])
72564016
MZ
298/*
299 * CP14 and CP15 live in the same array, as they are backed by the
300 * same system registers.
301 */
302#define vcpu_cp14(v,r) ((v)->arch.ctxt.copro[(r)])
303#define vcpu_cp15(v,r) ((v)->arch.ctxt.copro[(r)])
4f8d6632 304
f0a3eaff 305#ifdef CONFIG_CPU_BIG_ENDIAN
dedf97e8
MZ
306#define vcpu_cp15_64_high(v,r) vcpu_cp15((v),(r))
307#define vcpu_cp15_64_low(v,r) vcpu_cp15((v),(r) + 1)
f0a3eaff 308#else
dedf97e8
MZ
309#define vcpu_cp15_64_high(v,r) vcpu_cp15((v),(r) + 1)
310#define vcpu_cp15_64_low(v,r) vcpu_cp15((v),(r))
f0a3eaff
VK
311#endif
312
4f8d6632 313struct kvm_vm_stat {
8a7e75d4 314 ulong remote_tlb_flush;
4f8d6632
MZ
315};
316
317struct kvm_vcpu_stat {
8a7e75d4
SJS
318 u64 halt_successful_poll;
319 u64 halt_attempted_poll;
320 u64 halt_poll_invalid;
321 u64 halt_wakeup;
322 u64 hvc_exit_stat;
b19e6892
AT
323 u64 wfe_exit_stat;
324 u64 wfi_exit_stat;
325 u64 mmio_exit_user;
326 u64 mmio_exit_kernel;
327 u64 exits;
4f8d6632
MZ
328};
329
473bdc0e 330int kvm_vcpu_preferred_target(struct kvm_vcpu_init *init);
4f8d6632
MZ
331unsigned long kvm_arm_num_regs(struct kvm_vcpu *vcpu);
332int kvm_arm_copy_reg_indices(struct kvm_vcpu *vcpu, u64 __user *indices);
4f8d6632
MZ
333int kvm_arm_get_reg(struct kvm_vcpu *vcpu, const struct kvm_one_reg *reg);
334int kvm_arm_set_reg(struct kvm_vcpu *vcpu, const struct kvm_one_reg *reg);
335
336#define KVM_ARCH_WANT_MMU_NOTIFIER
4f8d6632
MZ
337int kvm_unmap_hva(struct kvm *kvm, unsigned long hva);
338int kvm_unmap_hva_range(struct kvm *kvm,
339 unsigned long start, unsigned long end);
340void kvm_set_spte_hva(struct kvm *kvm, unsigned long hva, pte_t pte);
35307b9a
MZ
341int kvm_age_hva(struct kvm *kvm, unsigned long start, unsigned long end);
342int kvm_test_age_hva(struct kvm *kvm, unsigned long hva);
4f8d6632 343
4f8d6632 344struct kvm_vcpu *kvm_arm_get_running_vcpu(void);
4000be42 345struct kvm_vcpu * __percpu *kvm_get_running_vcpus(void);
b13216cf
CD
346void kvm_arm_halt_guest(struct kvm *kvm);
347void kvm_arm_resume_guest(struct kvm *kvm);
4f8d6632 348
a0bf9776 349u64 __kvm_call_hyp(void *hypfn, ...);
22b39ca3
MZ
350#define kvm_call_hyp(f, ...) __kvm_call_hyp(kvm_ksym_ref(f), ##__VA_ARGS__)
351
cf5d3188 352void force_vm_exit(const cpumask_t *mask);
8199ed0e 353void kvm_mmu_wp_memory_region(struct kvm *kvm, int slot);
4f8d6632
MZ
354
355int handle_exit(struct kvm_vcpu *vcpu, struct kvm_run *run,
356 int exception_index);
56394072
JM
357void handle_exit_early(struct kvm_vcpu *vcpu, struct kvm_run *run,
358 int exception_index);
4f8d6632
MZ
359
360int kvm_perf_init(void);
361int kvm_perf_teardown(void);
362
4429fc64
AP
363struct kvm_vcpu *kvm_mpidr_to_vcpu(struct kvm *kvm, unsigned long mpidr);
364
47e02f07
CD
365void __kvm_set_tpidr_el2(u64 tpidr_el2);
366DECLARE_PER_CPU(kvm_cpu_context_t, kvm_host_cpu_state);
367
12fda812 368static inline void __cpu_init_hyp_mode(phys_addr_t pgd_ptr,
092bd143
MZ
369 unsigned long hyp_stack_ptr,
370 unsigned long vector_ptr)
371{
47e02f07
CD
372 u64 tpidr_el2;
373
092bd143 374 /*
63a1e1c9
MR
375 * Call initialization code, and switch to the full blown HYP code.
376 * If the cpucaps haven't been finalized yet, something has gone very
377 * wrong, and hyp will crash and burn when it uses any
378 * cpus_have_const_cap() wrapper.
092bd143 379 */
63a1e1c9 380 BUG_ON(!static_branch_likely(&arm64_const_caps_ready));
3421e9d8 381 __kvm_call_hyp((void *)pgd_ptr, hyp_stack_ptr, vector_ptr);
47e02f07
CD
382
383 /*
384 * Calculate the raw per-cpu offset without a translation from the
385 * kernel's mapping to the linear mapping, and store it in tpidr_el2
386 * so that we can use adr_l to access per-cpu variables in EL2.
387 */
388 tpidr_el2 = (u64)this_cpu_ptr(&kvm_host_cpu_state)
389 - (u64)kvm_ksym_ref(kvm_host_cpu_state);
390
391 kvm_call_hyp(__kvm_set_tpidr_el2, tpidr_el2);
092bd143 392}
67f69197 393
0865e636
RK
394static inline void kvm_arch_hardware_unsetup(void) {}
395static inline void kvm_arch_sync_events(struct kvm *kvm) {}
396static inline void kvm_arch_vcpu_uninit(struct kvm_vcpu *vcpu) {}
397static inline void kvm_arch_sched_in(struct kvm_vcpu *vcpu, int cpu) {}
3491caf2 398static inline void kvm_arch_vcpu_block_finish(struct kvm_vcpu *vcpu) {}
0865e636 399
56c7f5e7
AB
400void kvm_arm_init_debug(void);
401void kvm_arm_setup_debug(struct kvm_vcpu *vcpu);
402void kvm_arm_clear_debug(struct kvm_vcpu *vcpu);
84e690bf 403void kvm_arm_reset_debug_ptr(struct kvm_vcpu *vcpu);
696673d1 404bool kvm_arm_handle_step_debug(struct kvm_vcpu *vcpu, struct kvm_run *run);
bb0c70bc
SZ
405int kvm_arm_vcpu_arch_set_attr(struct kvm_vcpu *vcpu,
406 struct kvm_device_attr *attr);
407int kvm_arm_vcpu_arch_get_attr(struct kvm_vcpu *vcpu,
408 struct kvm_device_attr *attr);
409int kvm_arm_vcpu_arch_has_attr(struct kvm_vcpu *vcpu,
410 struct kvm_device_attr *attr);
56c7f5e7 411
21a4179c
MZ
412static inline void __cpu_init_stage2(void)
413{
6141570c
MZ
414 u32 parange = kvm_call_hyp(__init_stage2_translation);
415
416 WARN_ONCE(parange < 40,
417 "PARange is %d bits, unsupported configuration!", parange);
21a4179c
MZ
418}
419
17eed27b
DM
420/*
421 * All host FP/SIMD state is restored on guest exit, so nothing needs
422 * doing here except in the SVE case:
423*/
424static inline void kvm_fpsimd_flush_cpu_state(void)
425{
426 if (system_supports_sve())
427 sve_flush_cpu_state();
428}
429
bb5e4e0c
JM
430static inline void kvm_arm_vhe_guest_enter(void)
431{
432 local_daif_mask();
433}
434
435static inline void kvm_arm_vhe_guest_exit(void)
436{
437 local_daif_restore(DAIF_PROCCTX_NOIRQ);
438}
439
d5a70971
MZ
440static inline bool kvm_arm_harden_branch_predictor(void)
441{
442 return cpus_have_const_cap(ARM64_HARDEN_BRANCH_PREDICTOR);
443}
444
4f8d6632 445#endif /* __ARM64_KVM_HOST_H__ */