#ifndef __KVM_HOST_H
#define __KVM_HOST_H

/*
 * This work is licensed under the terms of the GNU GPL, version 2. See
 * the COPYING file in the top-level directory.
 */

#include <linux/types.h>
#include <linux/hardirq.h>
#include <linux/list.h>
#include <linux/mutex.h>
#include <linux/spinlock.h>
#include <linux/signal.h>
#include <linux/sched.h>
#include <linux/bug.h>
#include <linux/mm.h>
#include <linux/mmu_notifier.h>
#include <linux/preempt.h>
#include <linux/msi.h>
#include <linux/slab.h>
#include <linux/rcupdate.h>
#include <linux/ratelimit.h>
#include <linux/err.h>
#include <asm/signal.h>

#include <linux/kvm.h>
#include <linux/kvm_para.h>

#include <linux/kvm_types.h>

#include <asm/kvm_host.h>

#ifndef KVM_MMIO_SIZE
#define KVM_MMIO_SIZE 8
#endif

/*
 * Bits 16 ~ 31 of kvm_memory_region::flags are used internally by kvm;
 * the other bits are visible to userspace and are defined in
 * include/linux/kvm.h.
 */
#define KVM_MEMSLOT_INVALID	(1UL << 16)

/* Two fragments for cross MMIO pages. */
#define KVM_MAX_MMIO_FRAGMENTS	2

/*
 * For a normal pfn, the highest 12 bits should be zero,
 * so we can reuse these bits to indicate an error.
 */
#define KVM_PFN_ERR_MASK	(0xfffULL << 52)

#define KVM_PFN_ERR_FAULT	(KVM_PFN_ERR_MASK)
#define KVM_PFN_ERR_HWPOISON	(KVM_PFN_ERR_MASK + 1)
#define KVM_PFN_ERR_BAD		(KVM_PFN_ERR_MASK + 2)
#define KVM_PFN_ERR_RO_FAULT	(KVM_PFN_ERR_MASK + 3)

static inline bool is_error_pfn(pfn_t pfn)
{
	return !!(pfn & KVM_PFN_ERR_MASK);
}

static inline bool is_noslot_pfn(pfn_t pfn)
{
	return pfn == KVM_PFN_ERR_BAD;
}

static inline bool is_invalid_pfn(pfn_t pfn)
{
	return !is_noslot_pfn(pfn) && is_error_pfn(pfn);
}

#define KVM_HVA_ERR_BAD		(PAGE_OFFSET)
#define KVM_HVA_ERR_RO_BAD	(PAGE_OFFSET + PAGE_SIZE)

static inline bool kvm_is_error_hva(unsigned long addr)
{
	return addr >= PAGE_OFFSET;
}

#define KVM_ERR_PTR_BAD_PAGE	(ERR_PTR(-ENOENT))

static inline bool is_error_page(struct page *page)
{
	return IS_ERR(page);
}

/*
 * vcpu->requests bit members
 */
#define KVM_REQ_TLB_FLUSH          0
#define KVM_REQ_MIGRATE_TIMER      1
#define KVM_REQ_REPORT_TPR_ACCESS  2
#define KVM_REQ_MMU_RELOAD         3
#define KVM_REQ_TRIPLE_FAULT       4
#define KVM_REQ_PENDING_TIMER      5
#define KVM_REQ_UNHALT             6
#define KVM_REQ_MMU_SYNC           7
#define KVM_REQ_CLOCK_UPDATE       8
#define KVM_REQ_KICK               9
#define KVM_REQ_DEACTIVATE_FPU    10
#define KVM_REQ_EVENT             11
#define KVM_REQ_APF_HALT          12
#define KVM_REQ_STEAL_UPDATE      13
#define KVM_REQ_NMI               14
#define KVM_REQ_IMMEDIATE_EXIT    15
#define KVM_REQ_PMU               16
#define KVM_REQ_PMI               17

#define KVM_USERSPACE_IRQ_SOURCE_ID		0
#define KVM_IRQFD_RESAMPLE_IRQ_SOURCE_ID	1

struct kvm;
struct kvm_vcpu;
extern struct kmem_cache *kvm_vcpu_cache;

struct kvm_io_range {
	gpa_t addr;
	int len;
	struct kvm_io_device *dev;
};

#define NR_IOBUS_DEVS 1000

struct kvm_io_bus {
	int dev_count;
	struct kvm_io_range range[];
};

enum kvm_bus {
	KVM_MMIO_BUS,
	KVM_PIO_BUS,
	KVM_NR_BUSES
};

int kvm_io_bus_write(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr,
		     int len, const void *val);
int kvm_io_bus_read(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr, int len,
		    void *val);
int kvm_io_bus_register_dev(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr,
			    int len, struct kvm_io_device *dev);
int kvm_io_bus_unregister_dev(struct kvm *kvm, enum kvm_bus bus_idx,
			      struct kvm_io_device *dev);

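/*
 * Illustrative sketch, not part of the original header: registering a
 * device on the MMIO bus with the kvm_io_bus API above. The helper
 * name, address, and length are hypothetical values chosen for the
 * example only.
 */
static inline int kvm_example_register_mmio(struct kvm *kvm,
					    struct kvm_io_device *dev)
{
	/* hypothetical: claim a 4K MMIO window at 0xfee00000 */
	return kvm_io_bus_register_dev(kvm, KVM_MMIO_BUS, 0xfee00000, 0x1000,
				       dev);
}
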
#ifdef CONFIG_KVM_ASYNC_PF
struct kvm_async_pf {
	struct work_struct work;
	struct list_head link;
	struct list_head queue;
	struct kvm_vcpu *vcpu;
	struct mm_struct *mm;
	gva_t gva;
	unsigned long addr;
	struct kvm_arch_async_pf arch;
	struct page *page;
	bool done;
};

void kvm_clear_async_pf_completion_queue(struct kvm_vcpu *vcpu);
void kvm_check_async_pf_completion(struct kvm_vcpu *vcpu);
int kvm_setup_async_pf(struct kvm_vcpu *vcpu, gva_t gva, gfn_t gfn,
		       struct kvm_arch_async_pf *arch);
int kvm_async_pf_wakeup_all(struct kvm_vcpu *vcpu);
#endif

enum {
	OUTSIDE_GUEST_MODE,
	IN_GUEST_MODE,
	EXITING_GUEST_MODE,
	READING_SHADOW_PAGE_TABLES,
};

/*
 * Sometimes a large or cross-page mmio needs to be broken up into separate
 * exits for userspace servicing.
 */
struct kvm_mmio_fragment {
	gpa_t gpa;
	void *data;
	unsigned len;
};

struct kvm_vcpu {
	struct kvm *kvm;
#ifdef CONFIG_PREEMPT_NOTIFIERS
	struct preempt_notifier preempt_notifier;
#endif
	int cpu;
	int vcpu_id;
	int srcu_idx;
	int mode;
	unsigned long requests;
	unsigned long guest_debug;

	struct mutex mutex;
	struct kvm_run *run;

	int fpu_active;
	int guest_fpu_loaded, guest_xcr0_loaded;
	wait_queue_head_t wq;
	struct pid *pid;
	int sigset_active;
	sigset_t sigset;
	struct kvm_vcpu_stat stat;

#ifdef CONFIG_HAS_IOMEM
	int mmio_needed;
	int mmio_read_completed;
	int mmio_is_write;
	int mmio_cur_fragment;
	int mmio_nr_fragments;
	struct kvm_mmio_fragment mmio_fragments[KVM_MAX_MMIO_FRAGMENTS];
#endif

#ifdef CONFIG_KVM_ASYNC_PF
	struct {
		u32 queued;
		struct list_head queue;
		struct list_head done;
		spinlock_t lock;
	} async_pf;
#endif

#ifdef CONFIG_HAVE_KVM_CPU_RELAX_INTERCEPT
	/*
	 * Cpu-relax intercept / pause-loop-exit optimization.
	 * in_spin_loop: set when a vcpu does a pause-loop exit or its
	 *	cpu-relax instruction is intercepted.
	 * dy_eligible: indicates whether the vcpu is eligible for
	 *	directed yield.
	 */
	struct {
		bool in_spin_loop;
		bool dy_eligible;
	} spin_loop;
#endif
	struct kvm_vcpu_arch arch;
};

static inline int kvm_vcpu_exiting_guest_mode(struct kvm_vcpu *vcpu)
{
	return cmpxchg(&vcpu->mode, IN_GUEST_MODE, EXITING_GUEST_MODE);
}

/*
 * Some of the bitops functions do not support arbitrarily long bitmaps.
 * This number must be kept small enough not to exceed those limits.
 */
#define KVM_MEM_MAX_NR_PAGES ((1UL << 31) - 1)

struct kvm_memory_slot {
	gfn_t base_gfn;
	unsigned long npages;
	unsigned long flags;
	unsigned long *dirty_bitmap;
	struct kvm_arch_memory_slot arch;
	unsigned long userspace_addr;
	int user_alloc;
	int id;
};

static inline unsigned long kvm_dirty_bitmap_bytes(struct kvm_memory_slot *memslot)
{
	return ALIGN(memslot->npages, BITS_PER_LONG) / 8;
}

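/*
 * Editorial worked example: the dirty bitmap stores one bit per guest
 * page, rounded up to a whole long. Assuming BITS_PER_LONG == 64, a
 * slot with npages = 65 needs ALIGN(65, 64) = 128 bits, i.e. 16 bytes.
 */
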
struct kvm_kernel_irq_routing_entry {
	u32 gsi;
	u32 type;
	int (*set)(struct kvm_kernel_irq_routing_entry *e,
		   struct kvm *kvm, int irq_source_id, int level);
	union {
		struct {
			unsigned irqchip;
			unsigned pin;
		} irqchip;
		struct msi_msg msi;
	};
	struct hlist_node link;
};

#ifdef __KVM_HAVE_IOAPIC

struct kvm_irq_routing_table {
	int chip[KVM_NR_IRQCHIPS][KVM_IOAPIC_NUM_PINS];
	struct kvm_kernel_irq_routing_entry *rt_entries;
	u32 nr_rt_entries;
	/*
	 * Array indexed by gsi. Each entry contains the list of irq chips
	 * the gsi is connected to.
	 */
	struct hlist_head map[0];
};

#else

struct kvm_irq_routing_table {};

#endif

#ifndef KVM_MEM_SLOTS_NUM
#define KVM_MEM_SLOTS_NUM (KVM_MEMORY_SLOTS + KVM_PRIVATE_MEM_SLOTS)
#endif

/*
 * Note:
 * memslots are not sorted by id anymore; please use id_to_memslot()
 * to get a memslot by its id.
 */
struct kvm_memslots {
	u64 generation;
	struct kvm_memory_slot memslots[KVM_MEM_SLOTS_NUM];
	/* The mapping table from slot id to the index in memslots[]. */
	int id_to_index[KVM_MEM_SLOTS_NUM];
};

struct kvm {
	spinlock_t mmu_lock;
	struct mutex slots_lock;
	struct mm_struct *mm; /* userspace tied to this vm */
	struct kvm_memslots *memslots;
	struct srcu_struct srcu;
#ifdef CONFIG_KVM_APIC_ARCHITECTURE
	u32 bsp_vcpu_id;
#endif
	struct kvm_vcpu *vcpus[KVM_MAX_VCPUS];
	atomic_t online_vcpus;
	int last_boosted_vcpu;
	struct list_head vm_list;
	struct mutex lock;
	struct kvm_io_bus *buses[KVM_NR_BUSES];
#ifdef CONFIG_HAVE_KVM_EVENTFD
	struct {
		spinlock_t lock;
		struct list_head items;
		struct list_head resampler_list;
		struct mutex resampler_lock;
	} irqfds;
	struct list_head ioeventfds;
#endif
	struct kvm_vm_stat stat;
	struct kvm_arch arch;
	atomic_t users_count;
#ifdef KVM_COALESCED_MMIO_PAGE_OFFSET
	struct kvm_coalesced_mmio_ring *coalesced_mmio_ring;
	spinlock_t ring_lock;
	struct list_head coalesced_zones;
#endif

	struct mutex irq_lock;
#ifdef CONFIG_HAVE_KVM_IRQCHIP
	/*
	 * Update side is protected by irq_lock and,
	 * if configured, irqfds.lock.
	 */
	struct kvm_irq_routing_table __rcu *irq_routing;
	struct hlist_head mask_notifier_list;
	struct hlist_head irq_ack_notifier_list;
#endif

#if defined(CONFIG_MMU_NOTIFIER) && defined(KVM_ARCH_WANT_MMU_NOTIFIER)
	struct mmu_notifier mmu_notifier;
	unsigned long mmu_notifier_seq;
	long mmu_notifier_count;
#endif
	long tlbs_dirty;
};

#define kvm_err(fmt, ...) \
	pr_err("kvm [%i]: " fmt, task_pid_nr(current), ## __VA_ARGS__)
#define kvm_info(fmt, ...) \
	pr_info("kvm [%i]: " fmt, task_pid_nr(current), ## __VA_ARGS__)
#define kvm_debug(fmt, ...) \
	pr_debug("kvm [%i]: " fmt, task_pid_nr(current), ## __VA_ARGS__)
#define kvm_pr_unimpl(fmt, ...) \
	pr_err_ratelimited("kvm [%i]: " fmt, \
			   task_tgid_nr(current), ## __VA_ARGS__)

/* The guest did something we don't support. */
#define vcpu_unimpl(vcpu, fmt, ...) \
	kvm_pr_unimpl("vcpu%i " fmt, (vcpu)->vcpu_id, ## __VA_ARGS__)

static inline struct kvm_vcpu *kvm_get_vcpu(struct kvm *kvm, int i)
{
	smp_rmb();
	return kvm->vcpus[i];
}

#define kvm_for_each_vcpu(idx, vcpup, kvm) \
	for (idx = 0; \
	     idx < atomic_read(&kvm->online_vcpus) && \
	     (vcpup = kvm_get_vcpu(kvm, idx)) != NULL; \
	     idx++)

#define kvm_for_each_memslot(memslot, slots) \
	for (memslot = &slots->memslots[0]; \
	     memslot < slots->memslots + KVM_MEM_SLOTS_NUM && memslot->npages;\
	     memslot++)

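/*
 * Illustrative sketch, not part of the original header: a hypothetical
 * lookup helper showing how kvm_for_each_vcpu() is meant to be used.
 * The iteration stops at the first NULL entry below online_vcpus.
 */
static inline struct kvm_vcpu *kvm_example_find_vcpu(struct kvm *kvm, int id)
{
	struct kvm_vcpu *vcpu;
	int idx;

	kvm_for_each_vcpu(idx, vcpu, kvm)
		if (vcpu->vcpu_id == id)
			return vcpu;
	return NULL;
}
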
int kvm_vcpu_init(struct kvm_vcpu *vcpu, struct kvm *kvm, unsigned id);
void kvm_vcpu_uninit(struct kvm_vcpu *vcpu);

int __must_check vcpu_load(struct kvm_vcpu *vcpu);
void vcpu_put(struct kvm_vcpu *vcpu);

int kvm_init(void *opaque, unsigned vcpu_size, unsigned vcpu_align,
	     struct module *module);
void kvm_exit(void);

void kvm_get_kvm(struct kvm *kvm);
void kvm_put_kvm(struct kvm *kvm);
void update_memslots(struct kvm_memslots *slots, struct kvm_memory_slot *new);

static inline struct kvm_memslots *kvm_memslots(struct kvm *kvm)
{
	return rcu_dereference_check(kvm->memslots,
			srcu_read_lock_held(&kvm->srcu)
			|| lockdep_is_held(&kvm->slots_lock));
}

static inline struct kvm_memory_slot *
id_to_memslot(struct kvm_memslots *slots, int id)
{
	int index = slots->id_to_index[id];
	struct kvm_memory_slot *slot;

	slot = &slots->memslots[index];

	WARN_ON(slot->id != id);
	return slot;
}

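/*
 * Illustrative sketch, not part of the original header: typical
 * read-side access to a memslot, taking kvm->srcu as the lockdep
 * annotation in kvm_memslots() expects (assumes <linux/srcu.h> is
 * available). kvm_example_slot_npages() is a hypothetical helper.
 */
static inline unsigned long kvm_example_slot_npages(struct kvm *kvm, int id)
{
	struct kvm_memory_slot *slot;
	unsigned long npages;
	int idx;

	idx = srcu_read_lock(&kvm->srcu);
	slot = id_to_memslot(kvm_memslots(kvm), id);
	npages = slot->npages;
	srcu_read_unlock(&kvm->srcu, idx);

	return npages;
}
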
int kvm_set_memory_region(struct kvm *kvm,
			  struct kvm_userspace_memory_region *mem,
			  int user_alloc);
int __kvm_set_memory_region(struct kvm *kvm,
			    struct kvm_userspace_memory_region *mem,
			    int user_alloc);
void kvm_arch_free_memslot(struct kvm_memory_slot *free,
			   struct kvm_memory_slot *dont);
int kvm_arch_create_memslot(struct kvm_memory_slot *slot, unsigned long npages);
int kvm_arch_prepare_memory_region(struct kvm *kvm,
				   struct kvm_memory_slot *memslot,
				   struct kvm_memory_slot old,
				   struct kvm_userspace_memory_region *mem,
				   int user_alloc);
void kvm_arch_commit_memory_region(struct kvm *kvm,
				   struct kvm_userspace_memory_region *mem,
				   struct kvm_memory_slot old,
				   int user_alloc);
bool kvm_largepages_enabled(void);
void kvm_disable_largepages(void);
/* flush all memory translations */
void kvm_arch_flush_shadow_all(struct kvm *kvm);
/* flush memory translations pointing to 'slot' */
void kvm_arch_flush_shadow_memslot(struct kvm *kvm,
				   struct kvm_memory_slot *slot);

int gfn_to_page_many_atomic(struct kvm *kvm, gfn_t gfn, struct page **pages,
			    int nr_pages);

struct page *gfn_to_page(struct kvm *kvm, gfn_t gfn);
unsigned long gfn_to_hva(struct kvm *kvm, gfn_t gfn);
unsigned long gfn_to_hva_memslot(struct kvm_memory_slot *slot, gfn_t gfn);
void kvm_release_page_clean(struct page *page);
void kvm_release_page_dirty(struct page *page);
void kvm_set_page_dirty(struct page *page);
void kvm_set_page_accessed(struct page *page);

pfn_t gfn_to_pfn_atomic(struct kvm *kvm, gfn_t gfn);
pfn_t gfn_to_pfn_async(struct kvm *kvm, gfn_t gfn, bool *async,
		       bool write_fault, bool *writable);
pfn_t gfn_to_pfn(struct kvm *kvm, gfn_t gfn);
pfn_t gfn_to_pfn_prot(struct kvm *kvm, gfn_t gfn, bool write_fault,
		      bool *writable);
pfn_t gfn_to_pfn_memslot(struct kvm_memory_slot *slot, gfn_t gfn);
pfn_t gfn_to_pfn_memslot_atomic(struct kvm_memory_slot *slot, gfn_t gfn);

void kvm_release_pfn_dirty(pfn_t pfn);
void kvm_release_pfn_clean(pfn_t pfn);
void kvm_set_pfn_dirty(pfn_t pfn);
void kvm_set_pfn_accessed(pfn_t pfn);
void kvm_get_pfn(pfn_t pfn);

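/*
 * Illustrative sketch, not part of the original header: combining
 * gfn_to_pfn() with the error-pfn predicates defined near the top of
 * this file. kvm_example_map_gfn() and its error codes are editorial
 * assumptions, shown only to demonstrate the encoding.
 */
static inline int kvm_example_map_gfn(struct kvm *kvm, gfn_t gfn, pfn_t *pfn)
{
	*pfn = gfn_to_pfn(kvm, gfn);	/* may return a KVM_PFN_ERR_* value */
	if (is_noslot_pfn(*pfn))
		return -ENOENT;		/* gfn not backed by any memslot */
	if (is_error_pfn(*pfn))
		return -EFAULT;		/* fault, hwpoison or ro violation */
	return 0;			/* caller must kvm_release_pfn_*() */
}
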
int kvm_read_guest_page(struct kvm *kvm, gfn_t gfn, void *data, int offset,
			int len);
int kvm_read_guest_atomic(struct kvm *kvm, gpa_t gpa, void *data,
			  unsigned long len);
int kvm_read_guest(struct kvm *kvm, gpa_t gpa, void *data, unsigned long len);
int kvm_read_guest_cached(struct kvm *kvm, struct gfn_to_hva_cache *ghc,
			  void *data, unsigned long len);
int kvm_write_guest_page(struct kvm *kvm, gfn_t gfn, const void *data,
			 int offset, int len);
int kvm_write_guest(struct kvm *kvm, gpa_t gpa, const void *data,
		    unsigned long len);
int kvm_write_guest_cached(struct kvm *kvm, struct gfn_to_hva_cache *ghc,
			   void *data, unsigned long len);
int kvm_gfn_to_hva_cache_init(struct kvm *kvm, struct gfn_to_hva_cache *ghc,
			      gpa_t gpa);
int kvm_clear_guest_page(struct kvm *kvm, gfn_t gfn, int offset, int len);
int kvm_clear_guest(struct kvm *kvm, gpa_t gpa, unsigned long len);
struct kvm_memory_slot *gfn_to_memslot(struct kvm *kvm, gfn_t gfn);
int kvm_is_visible_gfn(struct kvm *kvm, gfn_t gfn);
unsigned long kvm_host_page_size(struct kvm *kvm, gfn_t gfn);
void mark_page_dirty(struct kvm *kvm, gfn_t gfn);
void mark_page_dirty_in_slot(struct kvm *kvm, struct kvm_memory_slot *memslot,
			     gfn_t gfn);

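/*
 * Illustrative sketch, not part of the original header: a hypothetical
 * accessor built on kvm_read_guest(), which returns 0 on success and a
 * negative value when the range is not fully backed by memslots.
 */
static inline int kvm_example_read_u64(struct kvm *kvm, gpa_t gpa, u64 *val)
{
	int ret = kvm_read_guest(kvm, gpa, val, sizeof(*val));

	if (ret < 0)
		*val = 0;	/* hypothetical policy: zero on failure */
	return ret;
}
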
void kvm_vcpu_block(struct kvm_vcpu *vcpu);
void kvm_vcpu_kick(struct kvm_vcpu *vcpu);
bool kvm_vcpu_yield_to(struct kvm_vcpu *target);
void kvm_vcpu_on_spin(struct kvm_vcpu *vcpu);
void kvm_resched(struct kvm_vcpu *vcpu);
void kvm_load_guest_fpu(struct kvm_vcpu *vcpu);
void kvm_put_guest_fpu(struct kvm_vcpu *vcpu);

void kvm_flush_remote_tlbs(struct kvm *kvm);
void kvm_reload_remote_mmus(struct kvm *kvm);

long kvm_arch_dev_ioctl(struct file *filp,
			unsigned int ioctl, unsigned long arg);
long kvm_arch_vcpu_ioctl(struct file *filp,
			 unsigned int ioctl, unsigned long arg);
int kvm_arch_vcpu_fault(struct kvm_vcpu *vcpu, struct vm_fault *vmf);

int kvm_dev_ioctl_check_extension(long ext);

int kvm_get_dirty_log(struct kvm *kvm,
		      struct kvm_dirty_log *log, int *is_dirty);
int kvm_vm_ioctl_get_dirty_log(struct kvm *kvm,
			       struct kvm_dirty_log *log);

int kvm_vm_ioctl_set_memory_region(struct kvm *kvm,
				   struct kvm_userspace_memory_region *mem,
				   int user_alloc);
int kvm_vm_ioctl_irq_line(struct kvm *kvm, struct kvm_irq_level *irq_level);
long kvm_arch_vm_ioctl(struct file *filp,
		       unsigned int ioctl, unsigned long arg);

int kvm_arch_vcpu_ioctl_get_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu);
int kvm_arch_vcpu_ioctl_set_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu);

int kvm_arch_vcpu_ioctl_translate(struct kvm_vcpu *vcpu,
				  struct kvm_translation *tr);

int kvm_arch_vcpu_ioctl_get_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs);
int kvm_arch_vcpu_ioctl_set_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs);
int kvm_arch_vcpu_ioctl_get_sregs(struct kvm_vcpu *vcpu,
				  struct kvm_sregs *sregs);
int kvm_arch_vcpu_ioctl_set_sregs(struct kvm_vcpu *vcpu,
				  struct kvm_sregs *sregs);
int kvm_arch_vcpu_ioctl_get_mpstate(struct kvm_vcpu *vcpu,
				    struct kvm_mp_state *mp_state);
int kvm_arch_vcpu_ioctl_set_mpstate(struct kvm_vcpu *vcpu,
				    struct kvm_mp_state *mp_state);
int kvm_arch_vcpu_ioctl_set_guest_debug(struct kvm_vcpu *vcpu,
					struct kvm_guest_debug *dbg);
int kvm_arch_vcpu_ioctl_run(struct kvm_vcpu *vcpu, struct kvm_run *kvm_run);

int kvm_arch_init(void *opaque);
void kvm_arch_exit(void);

int kvm_arch_vcpu_init(struct kvm_vcpu *vcpu);
void kvm_arch_vcpu_uninit(struct kvm_vcpu *vcpu);

void kvm_arch_vcpu_free(struct kvm_vcpu *vcpu);
void kvm_arch_vcpu_load(struct kvm_vcpu *vcpu, int cpu);
void kvm_arch_vcpu_put(struct kvm_vcpu *vcpu);
struct kvm_vcpu *kvm_arch_vcpu_create(struct kvm *kvm, unsigned int id);
int kvm_arch_vcpu_setup(struct kvm_vcpu *vcpu);
void kvm_arch_vcpu_destroy(struct kvm_vcpu *vcpu);

int kvm_arch_vcpu_reset(struct kvm_vcpu *vcpu);
int kvm_arch_hardware_enable(void *garbage);
void kvm_arch_hardware_disable(void *garbage);
int kvm_arch_hardware_setup(void);
void kvm_arch_hardware_unsetup(void);
void kvm_arch_check_processor_compat(void *rtn);
int kvm_arch_vcpu_runnable(struct kvm_vcpu *vcpu);
int kvm_arch_vcpu_should_kick(struct kvm_vcpu *vcpu);

void kvm_free_physmem(struct kvm *kvm);

void *kvm_kvzalloc(unsigned long size);
void kvm_kvfree(const void *addr);

#ifndef __KVM_HAVE_ARCH_VM_ALLOC
static inline struct kvm *kvm_arch_alloc_vm(void)
{
	return kzalloc(sizeof(struct kvm), GFP_KERNEL);
}

static inline void kvm_arch_free_vm(struct kvm *kvm)
{
	kfree(kvm);
}
#endif

static inline wait_queue_head_t *kvm_arch_vcpu_wq(struct kvm_vcpu *vcpu)
{
#ifdef __KVM_HAVE_ARCH_WQP
	return vcpu->arch.wqp;
#else
	return &vcpu->wq;
#endif
}

int kvm_arch_init_vm(struct kvm *kvm, unsigned long type);
void kvm_arch_destroy_vm(struct kvm *kvm);
void kvm_free_all_assigned_devices(struct kvm *kvm);
void kvm_arch_sync_events(struct kvm *kvm);

int kvm_cpu_has_pending_timer(struct kvm_vcpu *vcpu);
void kvm_vcpu_kick(struct kvm_vcpu *vcpu);

bool kvm_is_mmio_pfn(pfn_t pfn);

struct kvm_irq_ack_notifier {
	struct hlist_node link;
	unsigned gsi;
	void (*irq_acked)(struct kvm_irq_ack_notifier *kian);
};

struct kvm_assigned_dev_kernel {
	struct kvm_irq_ack_notifier ack_notifier;
	struct list_head list;
	int assigned_dev_id;
	int host_segnr;
	int host_busnr;
	int host_devfn;
	unsigned int entries_nr;
	int host_irq;
	bool host_irq_disabled;
	bool pci_2_3;
	struct msix_entry *host_msix_entries;
	int guest_irq;
	struct msix_entry *guest_msix_entries;
	unsigned long irq_requested_type;
	int irq_source_id;
	int flags;
	struct pci_dev *dev;
	struct kvm *kvm;
	spinlock_t intx_lock;
	spinlock_t intx_mask_lock;
	char irq_name[32];
	struct pci_saved_state *pci_saved_state;
};

struct kvm_irq_mask_notifier {
	void (*func)(struct kvm_irq_mask_notifier *kimn, bool masked);
	int irq;
	struct hlist_node link;
};

void kvm_register_irq_mask_notifier(struct kvm *kvm, int irq,
				    struct kvm_irq_mask_notifier *kimn);
void kvm_unregister_irq_mask_notifier(struct kvm *kvm, int irq,
				      struct kvm_irq_mask_notifier *kimn);
void kvm_fire_mask_notifiers(struct kvm *kvm, unsigned irqchip, unsigned pin,
			     bool mask);

#ifdef __KVM_HAVE_IOAPIC
void kvm_get_intr_delivery_bitmask(struct kvm_ioapic *ioapic,
				   union kvm_ioapic_redirect_entry *entry,
				   unsigned long *deliver_bitmask);
#endif
int kvm_set_irq(struct kvm *kvm, int irq_source_id, u32 irq, int level);
int kvm_set_msi(struct kvm_kernel_irq_routing_entry *irq_entry, struct kvm *kvm,
		int irq_source_id, int level);
void kvm_notify_acked_irq(struct kvm *kvm, unsigned irqchip, unsigned pin);
void kvm_register_irq_ack_notifier(struct kvm *kvm,
				   struct kvm_irq_ack_notifier *kian);
void kvm_unregister_irq_ack_notifier(struct kvm *kvm,
				     struct kvm_irq_ack_notifier *kian);
int kvm_request_irq_source_id(struct kvm *kvm);
void kvm_free_irq_source_id(struct kvm *kvm, int irq_source_id);

/* For vcpu->arch.iommu_flags */
#define KVM_IOMMU_CACHE_COHERENCY	0x1

#ifdef CONFIG_IOMMU_API
int kvm_iommu_map_pages(struct kvm *kvm, struct kvm_memory_slot *slot);
void kvm_iommu_unmap_pages(struct kvm *kvm, struct kvm_memory_slot *slot);
int kvm_iommu_map_guest(struct kvm *kvm);
int kvm_iommu_unmap_guest(struct kvm *kvm);
int kvm_assign_device(struct kvm *kvm,
		      struct kvm_assigned_dev_kernel *assigned_dev);
int kvm_deassign_device(struct kvm *kvm,
			struct kvm_assigned_dev_kernel *assigned_dev);
#else /* CONFIG_IOMMU_API */
static inline int kvm_iommu_map_pages(struct kvm *kvm,
				      struct kvm_memory_slot *slot)
{
	return 0;
}

static inline void kvm_iommu_unmap_pages(struct kvm *kvm,
					 struct kvm_memory_slot *slot)
{
}

static inline int kvm_iommu_map_guest(struct kvm *kvm)
{
	return -ENODEV;
}

static inline int kvm_iommu_unmap_guest(struct kvm *kvm)
{
	return 0;
}

static inline int kvm_assign_device(struct kvm *kvm,
				    struct kvm_assigned_dev_kernel *assigned_dev)
{
	return 0;
}

static inline int kvm_deassign_device(struct kvm *kvm,
				      struct kvm_assigned_dev_kernel *assigned_dev)
{
	return 0;
}
#endif /* CONFIG_IOMMU_API */

static inline void kvm_guest_enter(void)
{
	BUG_ON(preemptible());
	vtime_account(current);
	current->flags |= PF_VCPU;
	/* KVM does not hold any references to rcu protected data when it
	 * switches CPU into a guest mode. In fact switching to a guest mode
	 * is very similar to exiting to userspace from rcu point of view. In
	 * addition CPU may stay in a guest mode for quite a long time (up to
	 * one time slice). Let's treat guest mode as quiescent state, just like
	 * we do with user-mode execution.
	 */
	rcu_virt_note_context_switch(smp_processor_id());
}

static inline void kvm_guest_exit(void)
{
	vtime_account(current);
	current->flags &= ~PF_VCPU;
}

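/*
 * Illustrative sketch, not part of the original header: the pairing an
 * arch vcpu run loop is expected to follow around actual guest entry.
 * kvm_example_enter_guest() is a hypothetical outline; the real entry
 * sequence is arch-specific and considerably more involved.
 */
static inline void kvm_example_enter_guest(struct kvm_vcpu *vcpu)
{
	preempt_disable();	/* kvm_guest_enter() BUG_ON()s if preemptible */
	vcpu->mode = IN_GUEST_MODE;
	kvm_guest_enter();
	/* ...hardware guest entry and exit would happen here... */
	kvm_guest_exit();
	vcpu->mode = OUTSIDE_GUEST_MODE;
	preempt_enable();
}
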
/*
 * search_memslots() and __gfn_to_memslot() are here because they are
 * used in non-modular code in arch/powerpc/kvm/book3s_hv_rm_mmu.c.
 * gfn_to_memslot() itself isn't here as an inline because that would
 * bloat other code too much.
 */
static inline struct kvm_memory_slot *
search_memslots(struct kvm_memslots *slots, gfn_t gfn)
{
	struct kvm_memory_slot *memslot;

	kvm_for_each_memslot(memslot, slots)
		if (gfn >= memslot->base_gfn &&
		    gfn < memslot->base_gfn + memslot->npages)
			return memslot;

	return NULL;
}

static inline struct kvm_memory_slot *
__gfn_to_memslot(struct kvm_memslots *slots, gfn_t gfn)
{
	return search_memslots(slots, gfn);
}

static inline unsigned long
__gfn_to_hva_memslot(struct kvm_memory_slot *slot, gfn_t gfn)
{
	return slot->userspace_addr + (gfn - slot->base_gfn) * PAGE_SIZE;
}

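/*
 * Illustrative sketch, not part of the original header: resolving a gfn
 * to a host virtual address with the inlines above. This hypothetical
 * helper returns KVM_HVA_ERR_BAD when no memslot backs the gfn, so the
 * result can be tested with kvm_is_error_hva().
 */
static inline unsigned long
kvm_example_gfn_to_hva(struct kvm_memslots *slots, gfn_t gfn)
{
	struct kvm_memory_slot *slot = __gfn_to_memslot(slots, gfn);

	if (!slot)
		return KVM_HVA_ERR_BAD;
	return __gfn_to_hva_memslot(slot, gfn);
}
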
static inline int memslot_id(struct kvm *kvm, gfn_t gfn)
{
	return gfn_to_memslot(kvm, gfn)->id;
}

static inline gfn_t gfn_to_index(gfn_t gfn, gfn_t base_gfn, int level)
{
	/* KVM_HPAGE_GFN_SHIFT(PT_PAGE_TABLE_LEVEL) must be 0. */
	return (gfn >> KVM_HPAGE_GFN_SHIFT(level)) -
		(base_gfn >> KVM_HPAGE_GFN_SHIFT(level));
}

static inline gfn_t
hva_to_gfn_memslot(unsigned long hva, struct kvm_memory_slot *slot)
{
	gfn_t gfn_offset = (hva - slot->userspace_addr) >> PAGE_SHIFT;

	return slot->base_gfn + gfn_offset;
}

static inline gpa_t gfn_to_gpa(gfn_t gfn)
{
	return (gpa_t)gfn << PAGE_SHIFT;
}

static inline gfn_t gpa_to_gfn(gpa_t gpa)
{
	return (gfn_t)(gpa >> PAGE_SHIFT);
}

static inline hpa_t pfn_to_hpa(pfn_t pfn)
{
	return (hpa_t)pfn << PAGE_SHIFT;
}

static inline void kvm_migrate_timers(struct kvm_vcpu *vcpu)
{
	set_bit(KVM_REQ_MIGRATE_TIMER, &vcpu->requests);
}

enum kvm_stat_kind {
	KVM_STAT_VM,
	KVM_STAT_VCPU,
};

struct kvm_stats_debugfs_item {
	const char *name;
	int offset;
	enum kvm_stat_kind kind;
	struct dentry *dentry;
};
extern struct kvm_stats_debugfs_item debugfs_entries[];
extern struct dentry *kvm_debugfs_dir;

#if defined(CONFIG_MMU_NOTIFIER) && defined(KVM_ARCH_WANT_MMU_NOTIFIER)
static inline int mmu_notifier_retry(struct kvm_vcpu *vcpu, unsigned long mmu_seq)
{
	if (unlikely(vcpu->kvm->mmu_notifier_count))
		return 1;
	/*
	 * Ensure the read of mmu_notifier_count happens before the read
	 * of mmu_notifier_seq. This interacts with the smp_wmb() in
	 * mmu_notifier_invalidate_range_end to make sure that the caller
	 * either sees the old (non-zero) value of mmu_notifier_count or
	 * the new (incremented) value of mmu_notifier_seq.
	 * PowerPC Book3s HV KVM calls this under a per-page lock
	 * rather than under kvm->mmu_lock, for scalability, so
	 * can't rely on kvm->mmu_lock to keep things ordered.
	 */
	smp_rmb();
	if (vcpu->kvm->mmu_notifier_seq != mmu_seq)
		return 1;
	return 0;
}
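
/*
 * Illustrative sketch, not part of the original header: the pattern a
 * page-fault path is expected to follow around mmu_notifier_retry().
 * kvm_example_fault() is a hypothetical outline; real users sample
 * mmu_notifier_seq, do the sleepable work, then recheck under
 * kvm->mmu_lock before installing the mapping.
 */
static inline int kvm_example_fault(struct kvm_vcpu *vcpu, gfn_t gfn)
{
	unsigned long mmu_seq = vcpu->kvm->mmu_notifier_seq;
	pfn_t pfn;

	smp_rmb();		/* read the seq before doing the fault work */
	pfn = gfn_to_pfn(vcpu->kvm, gfn);	/* may sleep */
	if (is_error_pfn(pfn))
		return -EFAULT;

	spin_lock(&vcpu->kvm->mmu_lock);
	if (mmu_notifier_retry(vcpu, mmu_seq)) {
		/* an invalidation raced us: drop the pfn and try again */
		spin_unlock(&vcpu->kvm->mmu_lock);
		kvm_release_pfn_clean(pfn);
		return -EAGAIN;	/* hypothetical retry code */
	}
	/* ...install the mapping here... */
	spin_unlock(&vcpu->kvm->mmu_lock);
	return 0;
}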
#endif

#ifdef KVM_CAP_IRQ_ROUTING

#define KVM_MAX_IRQ_ROUTES 1024

int kvm_setup_default_irq_routing(struct kvm *kvm);
int kvm_set_irq_routing(struct kvm *kvm,
			const struct kvm_irq_routing_entry *entries,
			unsigned nr,
			unsigned flags);
void kvm_free_irq_routing(struct kvm *kvm);

int kvm_send_userspace_msi(struct kvm *kvm, struct kvm_msi *msi);

#else

static inline void kvm_free_irq_routing(struct kvm *kvm) {}

#endif

#ifdef CONFIG_HAVE_KVM_EVENTFD

void kvm_eventfd_init(struct kvm *kvm);
int kvm_irqfd(struct kvm *kvm, struct kvm_irqfd *args);
void kvm_irqfd_release(struct kvm *kvm);
void kvm_irq_routing_update(struct kvm *, struct kvm_irq_routing_table *);
int kvm_ioeventfd(struct kvm *kvm, struct kvm_ioeventfd *args);

#else

static inline void kvm_eventfd_init(struct kvm *kvm) {}

static inline int kvm_irqfd(struct kvm *kvm, struct kvm_irqfd *args)
{
	return -EINVAL;
}

static inline void kvm_irqfd_release(struct kvm *kvm) {}

#ifdef CONFIG_HAVE_KVM_IRQCHIP
static inline void kvm_irq_routing_update(struct kvm *kvm,
					  struct kvm_irq_routing_table *irq_rt)
{
	rcu_assign_pointer(kvm->irq_routing, irq_rt);
}
#endif

static inline int kvm_ioeventfd(struct kvm *kvm, struct kvm_ioeventfd *args)
{
	return -ENOSYS;
}

#endif /* CONFIG_HAVE_KVM_EVENTFD */

#ifdef CONFIG_KVM_APIC_ARCHITECTURE
static inline bool kvm_vcpu_is_bsp(struct kvm_vcpu *vcpu)
{
	return vcpu->kvm->bsp_vcpu_id == vcpu->vcpu_id;
}

bool kvm_vcpu_compatible(struct kvm_vcpu *vcpu);

#else

static inline bool kvm_vcpu_compatible(struct kvm_vcpu *vcpu) { return true; }

#endif

#ifdef __KVM_HAVE_DEVICE_ASSIGNMENT

long kvm_vm_ioctl_assigned_device(struct kvm *kvm, unsigned ioctl,
				  unsigned long arg);

#else

static inline long kvm_vm_ioctl_assigned_device(struct kvm *kvm, unsigned ioctl,
						unsigned long arg)
{
	return -ENOTTY;
}

#endif

static inline void kvm_make_request(int req, struct kvm_vcpu *vcpu)
{
	set_bit(req, &vcpu->requests);
}

static inline bool kvm_check_request(int req, struct kvm_vcpu *vcpu)
{
	if (test_bit(req, &vcpu->requests)) {
		clear_bit(req, &vcpu->requests);
		return true;
	} else {
		return false;
	}
}

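/*
 * Illustrative sketch, not part of the original header: the producer
 * side of vcpu->requests. Another context posts a request with
 * kvm_make_request() and kicks the vcpu; the vcpu's run loop later
 * consumes it with kvm_check_request(). The helper is hypothetical.
 */
static inline void kvm_example_request_tlb_flush(struct kvm_vcpu *vcpu)
{
	kvm_make_request(KVM_REQ_TLB_FLUSH, vcpu);
	kvm_vcpu_kick(vcpu);	/* force an exit so the request is noticed */
}
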
#ifdef CONFIG_HAVE_KVM_CPU_RELAX_INTERCEPT

static inline void kvm_vcpu_set_in_spin_loop(struct kvm_vcpu *vcpu, bool val)
{
	vcpu->spin_loop.in_spin_loop = val;
}

static inline void kvm_vcpu_set_dy_eligible(struct kvm_vcpu *vcpu, bool val)
{
	vcpu->spin_loop.dy_eligible = val;
}

#else /* !CONFIG_HAVE_KVM_CPU_RELAX_INTERCEPT */

static inline void kvm_vcpu_set_in_spin_loop(struct kvm_vcpu *vcpu, bool val)
{
}

static inline void kvm_vcpu_set_dy_eligible(struct kvm_vcpu *vcpu, bool val)
{
}

static inline bool kvm_vcpu_eligible_for_directed_yield(struct kvm_vcpu *vcpu)
{
	return true;
}

#endif /* CONFIG_HAVE_KVM_CPU_RELAX_INTERCEPT */
#endif