#ifndef __KVM_HOST_H
#define __KVM_HOST_H

/*
 * This work is licensed under the terms of the GNU GPL, version 2. See
 * the COPYING file in the top-level directory.
 */

#include <linux/types.h>
#include <linux/hardirq.h>
#include <linux/list.h>
#include <linux/mutex.h>
#include <linux/spinlock.h>
#include <linux/signal.h>
#include <linux/sched.h>
#include <linux/bug.h>
#include <linux/mm.h>
#include <linux/mmu_notifier.h>
#include <linux/preempt.h>
#include <linux/msi.h>
#include <linux/slab.h>
#include <linux/rcupdate.h>
#include <linux/ratelimit.h>
#include <linux/err.h>
#include <asm/signal.h>

#include <linux/kvm.h>
#include <linux/kvm_para.h>

#include <linux/kvm_types.h>

#include <asm/kvm_host.h>

#ifndef KVM_MMIO_SIZE
#define KVM_MMIO_SIZE 8
#endif

/*
 * Bits 16 ~ 31 of kvm_memory_region::flags are used internally by kvm;
 * the other bits are visible to userspace and are defined in
 * include/linux/kvm.h.
 */
#define KVM_MEMSLOT_INVALID	(1UL << 16)

/*
 * If we support unaligned MMIO, at most one fragment will be split into two:
 */
#ifdef KVM_UNALIGNED_MMIO
# define KVM_EXTRA_MMIO_FRAGMENTS 1
#else
# define KVM_EXTRA_MMIO_FRAGMENTS 0
#endif

#define KVM_USER_MMIO_SIZE 8

#define KVM_MAX_MMIO_FRAGMENTS \
	(KVM_MMIO_SIZE / KVM_USER_MMIO_SIZE + KVM_EXTRA_MMIO_FRAGMENTS)

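/*
 * Worked example (illustrative, not from the original source): with the
 * default KVM_MMIO_SIZE of 8 and KVM_UNALIGNED_MMIO undefined,
 * KVM_MAX_MMIO_FRAGMENTS = 8/8 + 0 = 1.  An arch defining KVM_MMIO_SIZE
 * as 16 with unaligned MMIO enabled would get 16/8 + 1 = 3.
 */
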
/*
 * For a normal pfn, the highest 12 bits should be zero,
 * so we can mask these bits to indicate the error.
 */
#define KVM_PFN_ERR_MASK	(0xfffULL << 52)

#define KVM_PFN_ERR_FAULT	(KVM_PFN_ERR_MASK)
#define KVM_PFN_ERR_HWPOISON	(KVM_PFN_ERR_MASK + 1)
#define KVM_PFN_ERR_BAD		(KVM_PFN_ERR_MASK + 2)
#define KVM_PFN_ERR_RO_FAULT	(KVM_PFN_ERR_MASK + 3)

static inline bool is_error_pfn(pfn_t pfn)
{
	return !!(pfn & KVM_PFN_ERR_MASK);
}

static inline bool is_noslot_pfn(pfn_t pfn)
{
	return pfn == KVM_PFN_ERR_BAD;
}

static inline bool is_invalid_pfn(pfn_t pfn)
{
	return !is_noslot_pfn(pfn) && is_error_pfn(pfn);
}

#define KVM_HVA_ERR_BAD		(PAGE_OFFSET)
#define KVM_HVA_ERR_RO_BAD	(PAGE_OFFSET + PAGE_SIZE)

static inline bool kvm_is_error_hva(unsigned long addr)
{
	return addr >= PAGE_OFFSET;
}

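/*
 * Illustrative sketch (not part of the original header): callers are
 * expected to test a looked-up hva before using it, along these lines:
 *
 *	unsigned long hva = gfn_to_hva(kvm, gfn);
 *	if (kvm_is_error_hva(hva))
 *		return -EFAULT;
 */
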
#define KVM_ERR_PTR_BAD_PAGE	(ERR_PTR(-ENOENT))

static inline bool is_error_page(struct page *page)
{
	return IS_ERR(page);
}

/*
 * vcpu->requests bit members
 */
#define KVM_REQ_TLB_FLUSH          0
#define KVM_REQ_MIGRATE_TIMER      1
#define KVM_REQ_REPORT_TPR_ACCESS  2
#define KVM_REQ_MMU_RELOAD         3
#define KVM_REQ_TRIPLE_FAULT       4
#define KVM_REQ_PENDING_TIMER      5
#define KVM_REQ_UNHALT             6
#define KVM_REQ_MMU_SYNC           7
#define KVM_REQ_CLOCK_UPDATE       8
#define KVM_REQ_KICK               9
#define KVM_REQ_DEACTIVATE_FPU    10
#define KVM_REQ_EVENT             11
#define KVM_REQ_APF_HALT          12
#define KVM_REQ_STEAL_UPDATE      13
#define KVM_REQ_NMI               14
#define KVM_REQ_IMMEDIATE_EXIT    15
#define KVM_REQ_PMU               16
#define KVM_REQ_PMI               17

#define KVM_USERSPACE_IRQ_SOURCE_ID		0
#define KVM_IRQFD_RESAMPLE_IRQ_SOURCE_ID	1

struct kvm;
struct kvm_vcpu;
extern struct kmem_cache *kvm_vcpu_cache;

struct kvm_io_range {
	gpa_t addr;
	int len;
	struct kvm_io_device *dev;
};

#define NR_IOBUS_DEVS 1000

struct kvm_io_bus {
	int dev_count;
	struct kvm_io_range range[];
};

enum kvm_bus {
	KVM_MMIO_BUS,
	KVM_PIO_BUS,
	KVM_NR_BUSES
};

int kvm_io_bus_write(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr,
		     int len, const void *val);
int kvm_io_bus_read(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr, int len,
		    void *val);
int kvm_io_bus_register_dev(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr,
			    int len, struct kvm_io_device *dev);
int kvm_io_bus_unregister_dev(struct kvm *kvm, enum kvm_bus bus_idx,
			      struct kvm_io_device *dev);

#ifdef CONFIG_KVM_ASYNC_PF
struct kvm_async_pf {
	struct work_struct work;
	struct list_head link;
	struct list_head queue;
	struct kvm_vcpu *vcpu;
	struct mm_struct *mm;
	gva_t gva;
	unsigned long addr;
	struct kvm_arch_async_pf arch;
	struct page *page;
	bool done;
};

void kvm_clear_async_pf_completion_queue(struct kvm_vcpu *vcpu);
void kvm_check_async_pf_completion(struct kvm_vcpu *vcpu);
int kvm_setup_async_pf(struct kvm_vcpu *vcpu, gva_t gva, gfn_t gfn,
		       struct kvm_arch_async_pf *arch);
int kvm_async_pf_wakeup_all(struct kvm_vcpu *vcpu);
#endif

enum {
	OUTSIDE_GUEST_MODE,
	IN_GUEST_MODE,
	EXITING_GUEST_MODE,
	READING_SHADOW_PAGE_TABLES,
};

/*
 * Sometimes a large or cross-page mmio needs to be broken up into separate
 * exits for userspace servicing.
 */
struct kvm_mmio_fragment {
	gpa_t gpa;
	void *data;
	unsigned len;
};

struct kvm_vcpu {
	struct kvm *kvm;
#ifdef CONFIG_PREEMPT_NOTIFIERS
	struct preempt_notifier preempt_notifier;
#endif
	int cpu;
	int vcpu_id;
	int srcu_idx;
	int mode;
	unsigned long requests;
	unsigned long guest_debug;

	struct mutex mutex;
	struct kvm_run *run;

	int fpu_active;
	int guest_fpu_loaded, guest_xcr0_loaded;
	wait_queue_head_t wq;
	struct pid *pid;
	int sigset_active;
	sigset_t sigset;
	struct kvm_vcpu_stat stat;

#ifdef CONFIG_HAS_IOMEM
	int mmio_needed;
	int mmio_read_completed;
	int mmio_is_write;
	int mmio_cur_fragment;
	int mmio_nr_fragments;
	struct kvm_mmio_fragment mmio_fragments[KVM_MAX_MMIO_FRAGMENTS];
#endif

#ifdef CONFIG_KVM_ASYNC_PF
	struct {
		u32 queued;
		struct list_head queue;
		struct list_head done;
		spinlock_t lock;
	} async_pf;
#endif

#ifdef CONFIG_HAVE_KVM_CPU_RELAX_INTERCEPT
	/*
	 * Cpu relax intercept or pause loop exit optimization.
	 * in_spin_loop: set when a vcpu does a pause loop exit
	 *  or has its cpu relax intercepted.
	 * dy_eligible: indicates whether the vcpu is eligible for directed yield.
	 */
	struct {
		bool in_spin_loop;
		bool dy_eligible;
	} spin_loop;
#endif
	struct kvm_vcpu_arch arch;
};

static inline int kvm_vcpu_exiting_guest_mode(struct kvm_vcpu *vcpu)
{
	return cmpxchg(&vcpu->mode, IN_GUEST_MODE, EXITING_GUEST_MODE);
}

/*
 * Some of the bitops functions do not support overly long bitmaps;
 * this number must be chosen so as not to exceed those limits.
 */
#define KVM_MEM_MAX_NR_PAGES ((1UL << 31) - 1)

struct kvm_memory_slot {
	gfn_t base_gfn;
	unsigned long npages;
	unsigned long flags;
	unsigned long *dirty_bitmap;
	struct kvm_arch_memory_slot arch;
	unsigned long userspace_addr;
	int user_alloc;
	int id;
};

static inline unsigned long kvm_dirty_bitmap_bytes(struct kvm_memory_slot *memslot)
{
	return ALIGN(memslot->npages, BITS_PER_LONG) / 8;
}

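/*
 * Worked example (illustrative): on a 64-bit host (BITS_PER_LONG == 64),
 * a slot with npages == 100 gets ALIGN(100, 64) / 8 = 128 / 8 = 16 bytes,
 * i.e. the bitmap is rounded up to a whole number of longs.
 */
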
struct kvm_kernel_irq_routing_entry {
	u32 gsi;
	u32 type;
	int (*set)(struct kvm_kernel_irq_routing_entry *e,
		   struct kvm *kvm, int irq_source_id, int level);
	union {
		struct {
			unsigned irqchip;
			unsigned pin;
		} irqchip;
		struct msi_msg msi;
	};
	struct hlist_node link;
};

#ifdef __KVM_HAVE_IOAPIC

struct kvm_irq_routing_table {
	int chip[KVM_NR_IRQCHIPS][KVM_IOAPIC_NUM_PINS];
	struct kvm_kernel_irq_routing_entry *rt_entries;
	u32 nr_rt_entries;
	/*
	 * Array indexed by gsi. Each entry contains a list of irq chips
	 * the gsi is connected to.
	 */
	struct hlist_head map[0];
};

#else

struct kvm_irq_routing_table {};

#endif

#ifndef KVM_MEM_SLOTS_NUM
#define KVM_MEM_SLOTS_NUM (KVM_MEMORY_SLOTS + KVM_PRIVATE_MEM_SLOTS)
#endif

/*
 * Note:
 * memslots are no longer sorted by id; please use id_to_memslot()
 * to look up a memslot by its id.
 */
struct kvm_memslots {
	u64 generation;
	struct kvm_memory_slot memslots[KVM_MEM_SLOTS_NUM];
	/* The mapping table from slot id to the index in memslots[]. */
	int id_to_index[KVM_MEM_SLOTS_NUM];
};

struct kvm {
	spinlock_t mmu_lock;
	struct mutex slots_lock;
	struct mm_struct *mm; /* userspace tied to this vm */
	struct kvm_memslots *memslots;
	struct srcu_struct srcu;
#ifdef CONFIG_KVM_APIC_ARCHITECTURE
	u32 bsp_vcpu_id;
#endif
	struct kvm_vcpu *vcpus[KVM_MAX_VCPUS];
	atomic_t online_vcpus;
	int last_boosted_vcpu;
	struct list_head vm_list;
	struct mutex lock;
	struct kvm_io_bus *buses[KVM_NR_BUSES];
#ifdef CONFIG_HAVE_KVM_EVENTFD
	struct {
		spinlock_t lock;
		struct list_head items;
		struct list_head resampler_list;
		struct mutex resampler_lock;
	} irqfds;
	struct list_head ioeventfds;
#endif
	struct kvm_vm_stat stat;
	struct kvm_arch arch;
	atomic_t users_count;
#ifdef KVM_COALESCED_MMIO_PAGE_OFFSET
	struct kvm_coalesced_mmio_ring *coalesced_mmio_ring;
	spinlock_t ring_lock;
	struct list_head coalesced_zones;
#endif

	struct mutex irq_lock;
#ifdef CONFIG_HAVE_KVM_IRQCHIP
	/*
	 * Update side is protected by irq_lock and,
	 * if configured, irqfds.lock.
	 */
	struct kvm_irq_routing_table __rcu *irq_routing;
	struct hlist_head mask_notifier_list;
	struct hlist_head irq_ack_notifier_list;
#endif

#if defined(CONFIG_MMU_NOTIFIER) && defined(KVM_ARCH_WANT_MMU_NOTIFIER)
	struct mmu_notifier mmu_notifier;
	unsigned long mmu_notifier_seq;
	long mmu_notifier_count;
#endif
	long tlbs_dirty;
};

#define kvm_err(fmt, ...) \
	pr_err("kvm [%i]: " fmt, task_pid_nr(current), ## __VA_ARGS__)
#define kvm_info(fmt, ...) \
	pr_info("kvm [%i]: " fmt, task_pid_nr(current), ## __VA_ARGS__)
#define kvm_debug(fmt, ...) \
	pr_debug("kvm [%i]: " fmt, task_pid_nr(current), ## __VA_ARGS__)
#define kvm_pr_unimpl(fmt, ...) \
	pr_err_ratelimited("kvm [%i]: " fmt, \
			   task_tgid_nr(current), ## __VA_ARGS__)

/* The guest did something we don't support. */
#define vcpu_unimpl(vcpu, fmt, ...) \
	kvm_pr_unimpl("vcpu%i " fmt, (vcpu)->vcpu_id, ## __VA_ARGS__)

static inline struct kvm_vcpu *kvm_get_vcpu(struct kvm *kvm, int i)
{
	smp_rmb();
	return kvm->vcpus[i];
}

#define kvm_for_each_vcpu(idx, vcpup, kvm) \
	for (idx = 0; \
	     idx < atomic_read(&kvm->online_vcpus) && \
	     (vcpup = kvm_get_vcpu(kvm, idx)) != NULL; \
	     idx++)

#define kvm_for_each_memslot(memslot, slots)	\
	for (memslot = &slots->memslots[0];	\
	     memslot < slots->memslots + KVM_MEM_SLOTS_NUM && memslot->npages;\
		memslot++)

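/*
 * Illustrative sketch (not part of the original header): iterating over
 * all online vcpus to kick each one might look like:
 *
 *	int i;
 *	struct kvm_vcpu *vcpu;
 *
 *	kvm_for_each_vcpu(i, vcpu, kvm)
 *		kvm_vcpu_kick(vcpu);
 */
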
int kvm_vcpu_init(struct kvm_vcpu *vcpu, struct kvm *kvm, unsigned id);
void kvm_vcpu_uninit(struct kvm_vcpu *vcpu);

int __must_check vcpu_load(struct kvm_vcpu *vcpu);
void vcpu_put(struct kvm_vcpu *vcpu);

int kvm_init(void *opaque, unsigned vcpu_size, unsigned vcpu_align,
	     struct module *module);
void kvm_exit(void);

void kvm_get_kvm(struct kvm *kvm);
void kvm_put_kvm(struct kvm *kvm);
void update_memslots(struct kvm_memslots *slots, struct kvm_memory_slot *new);

static inline struct kvm_memslots *kvm_memslots(struct kvm *kvm)
{
	return rcu_dereference_check(kvm->memslots,
			srcu_read_lock_held(&kvm->srcu)
			|| lockdep_is_held(&kvm->slots_lock));
}

static inline struct kvm_memory_slot *
id_to_memslot(struct kvm_memslots *slots, int id)
{
	int index = slots->id_to_index[id];
	struct kvm_memory_slot *slot;

	slot = &slots->memslots[index];

	WARN_ON(slot->id != id);
	return slot;
}

int kvm_set_memory_region(struct kvm *kvm,
			  struct kvm_userspace_memory_region *mem,
			  int user_alloc);
int __kvm_set_memory_region(struct kvm *kvm,
			    struct kvm_userspace_memory_region *mem,
			    int user_alloc);
void kvm_arch_free_memslot(struct kvm_memory_slot *free,
			   struct kvm_memory_slot *dont);
int kvm_arch_create_memslot(struct kvm_memory_slot *slot, unsigned long npages);
int kvm_arch_prepare_memory_region(struct kvm *kvm,
				struct kvm_memory_slot *memslot,
				struct kvm_memory_slot old,
				struct kvm_userspace_memory_region *mem,
				int user_alloc);
void kvm_arch_commit_memory_region(struct kvm *kvm,
				struct kvm_userspace_memory_region *mem,
				struct kvm_memory_slot old,
				int user_alloc);
bool kvm_largepages_enabled(void);
void kvm_disable_largepages(void);
/* flush all memory translations */
void kvm_arch_flush_shadow_all(struct kvm *kvm);
/* flush memory translations pointing to 'slot' */
void kvm_arch_flush_shadow_memslot(struct kvm *kvm,
				   struct kvm_memory_slot *slot);

int gfn_to_page_many_atomic(struct kvm *kvm, gfn_t gfn, struct page **pages,
			    int nr_pages);

struct page *gfn_to_page(struct kvm *kvm, gfn_t gfn);
unsigned long gfn_to_hva(struct kvm *kvm, gfn_t gfn);
unsigned long gfn_to_hva_memslot(struct kvm_memory_slot *slot, gfn_t gfn);
void kvm_release_page_clean(struct page *page);
void kvm_release_page_dirty(struct page *page);
void kvm_set_page_dirty(struct page *page);
void kvm_set_page_accessed(struct page *page);

pfn_t gfn_to_pfn_atomic(struct kvm *kvm, gfn_t gfn);
pfn_t gfn_to_pfn_async(struct kvm *kvm, gfn_t gfn, bool *async,
		       bool write_fault, bool *writable);
pfn_t gfn_to_pfn(struct kvm *kvm, gfn_t gfn);
pfn_t gfn_to_pfn_prot(struct kvm *kvm, gfn_t gfn, bool write_fault,
		      bool *writable);
pfn_t gfn_to_pfn_memslot(struct kvm_memory_slot *slot, gfn_t gfn);
pfn_t gfn_to_pfn_memslot_atomic(struct kvm_memory_slot *slot, gfn_t gfn);

void kvm_release_pfn_dirty(pfn_t pfn);
void kvm_release_pfn_clean(pfn_t pfn);
void kvm_set_pfn_dirty(pfn_t pfn);
void kvm_set_pfn_accessed(pfn_t pfn);
void kvm_get_pfn(pfn_t pfn);

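/*
 * Illustrative sketch (not part of the original header): a typical
 * translation checks for the error encodings defined above and drops
 * its reference when done, along these lines:
 *
 *	pfn_t pfn = gfn_to_pfn(kvm, gfn);
 *	if (is_error_pfn(pfn))
 *		return -EFAULT;
 *	...
 *	kvm_release_pfn_clean(pfn);
 */
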
int kvm_read_guest_page(struct kvm *kvm, gfn_t gfn, void *data, int offset,
			int len);
int kvm_read_guest_atomic(struct kvm *kvm, gpa_t gpa, void *data,
			  unsigned long len);
int kvm_read_guest(struct kvm *kvm, gpa_t gpa, void *data, unsigned long len);
int kvm_read_guest_cached(struct kvm *kvm, struct gfn_to_hva_cache *ghc,
			  void *data, unsigned long len);
int kvm_write_guest_page(struct kvm *kvm, gfn_t gfn, const void *data,
			 int offset, int len);
int kvm_write_guest(struct kvm *kvm, gpa_t gpa, const void *data,
		    unsigned long len);
int kvm_write_guest_cached(struct kvm *kvm, struct gfn_to_hva_cache *ghc,
			   void *data, unsigned long len);
int kvm_gfn_to_hva_cache_init(struct kvm *kvm, struct gfn_to_hva_cache *ghc,
			      gpa_t gpa);
int kvm_clear_guest_page(struct kvm *kvm, gfn_t gfn, int offset, int len);
int kvm_clear_guest(struct kvm *kvm, gpa_t gpa, unsigned long len);
struct kvm_memory_slot *gfn_to_memslot(struct kvm *kvm, gfn_t gfn);
int kvm_is_visible_gfn(struct kvm *kvm, gfn_t gfn);
unsigned long kvm_host_page_size(struct kvm *kvm, gfn_t gfn);
void mark_page_dirty(struct kvm *kvm, gfn_t gfn);
void mark_page_dirty_in_slot(struct kvm *kvm, struct kvm_memory_slot *memslot,
			     gfn_t gfn);

void kvm_vcpu_block(struct kvm_vcpu *vcpu);
void kvm_vcpu_kick(struct kvm_vcpu *vcpu);
bool kvm_vcpu_yield_to(struct kvm_vcpu *target);
void kvm_vcpu_on_spin(struct kvm_vcpu *vcpu);
void kvm_resched(struct kvm_vcpu *vcpu);
void kvm_load_guest_fpu(struct kvm_vcpu *vcpu);
void kvm_put_guest_fpu(struct kvm_vcpu *vcpu);

void kvm_flush_remote_tlbs(struct kvm *kvm);
void kvm_reload_remote_mmus(struct kvm *kvm);

long kvm_arch_dev_ioctl(struct file *filp,
			unsigned int ioctl, unsigned long arg);
long kvm_arch_vcpu_ioctl(struct file *filp,
			 unsigned int ioctl, unsigned long arg);
int kvm_arch_vcpu_fault(struct kvm_vcpu *vcpu, struct vm_fault *vmf);

int kvm_dev_ioctl_check_extension(long ext);

int kvm_get_dirty_log(struct kvm *kvm,
			struct kvm_dirty_log *log, int *is_dirty);
int kvm_vm_ioctl_get_dirty_log(struct kvm *kvm,
				struct kvm_dirty_log *log);

int kvm_vm_ioctl_set_memory_region(struct kvm *kvm,
				   struct kvm_userspace_memory_region *mem,
				   int user_alloc);
int kvm_vm_ioctl_irq_line(struct kvm *kvm, struct kvm_irq_level *irq_level);
long kvm_arch_vm_ioctl(struct file *filp,
		       unsigned int ioctl, unsigned long arg);

int kvm_arch_vcpu_ioctl_get_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu);
int kvm_arch_vcpu_ioctl_set_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu);

int kvm_arch_vcpu_ioctl_translate(struct kvm_vcpu *vcpu,
				    struct kvm_translation *tr);

int kvm_arch_vcpu_ioctl_get_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs);
int kvm_arch_vcpu_ioctl_set_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs);
int kvm_arch_vcpu_ioctl_get_sregs(struct kvm_vcpu *vcpu,
				  struct kvm_sregs *sregs);
int kvm_arch_vcpu_ioctl_set_sregs(struct kvm_vcpu *vcpu,
				  struct kvm_sregs *sregs);
int kvm_arch_vcpu_ioctl_get_mpstate(struct kvm_vcpu *vcpu,
				    struct kvm_mp_state *mp_state);
int kvm_arch_vcpu_ioctl_set_mpstate(struct kvm_vcpu *vcpu,
				    struct kvm_mp_state *mp_state);
int kvm_arch_vcpu_ioctl_set_guest_debug(struct kvm_vcpu *vcpu,
					struct kvm_guest_debug *dbg);
int kvm_arch_vcpu_ioctl_run(struct kvm_vcpu *vcpu, struct kvm_run *kvm_run);

int kvm_arch_init(void *opaque);
void kvm_arch_exit(void);

int kvm_arch_vcpu_init(struct kvm_vcpu *vcpu);
void kvm_arch_vcpu_uninit(struct kvm_vcpu *vcpu);

void kvm_arch_vcpu_free(struct kvm_vcpu *vcpu);
void kvm_arch_vcpu_load(struct kvm_vcpu *vcpu, int cpu);
void kvm_arch_vcpu_put(struct kvm_vcpu *vcpu);
struct kvm_vcpu *kvm_arch_vcpu_create(struct kvm *kvm, unsigned int id);
int kvm_arch_vcpu_setup(struct kvm_vcpu *vcpu);
void kvm_arch_vcpu_destroy(struct kvm_vcpu *vcpu);

int kvm_arch_vcpu_reset(struct kvm_vcpu *vcpu);
int kvm_arch_hardware_enable(void *garbage);
void kvm_arch_hardware_disable(void *garbage);
int kvm_arch_hardware_setup(void);
void kvm_arch_hardware_unsetup(void);
void kvm_arch_check_processor_compat(void *rtn);
int kvm_arch_vcpu_runnable(struct kvm_vcpu *vcpu);
int kvm_arch_vcpu_should_kick(struct kvm_vcpu *vcpu);

void kvm_free_physmem(struct kvm *kvm);

void *kvm_kvzalloc(unsigned long size);
void kvm_kvfree(const void *addr);

#ifndef __KVM_HAVE_ARCH_VM_ALLOC
static inline struct kvm *kvm_arch_alloc_vm(void)
{
	return kzalloc(sizeof(struct kvm), GFP_KERNEL);
}

static inline void kvm_arch_free_vm(struct kvm *kvm)
{
	kfree(kvm);
}
#endif

static inline wait_queue_head_t *kvm_arch_vcpu_wq(struct kvm_vcpu *vcpu)
{
#ifdef __KVM_HAVE_ARCH_WQP
	return vcpu->arch.wqp;
#else
	return &vcpu->wq;
#endif
}

int kvm_arch_init_vm(struct kvm *kvm, unsigned long type);
void kvm_arch_destroy_vm(struct kvm *kvm);
void kvm_free_all_assigned_devices(struct kvm *kvm);
void kvm_arch_sync_events(struct kvm *kvm);

int kvm_cpu_has_pending_timer(struct kvm_vcpu *vcpu);
void kvm_vcpu_kick(struct kvm_vcpu *vcpu);

bool kvm_is_mmio_pfn(pfn_t pfn);

struct kvm_irq_ack_notifier {
	struct hlist_node link;
	unsigned gsi;
	void (*irq_acked)(struct kvm_irq_ack_notifier *kian);
};

struct kvm_assigned_dev_kernel {
	struct kvm_irq_ack_notifier ack_notifier;
	struct list_head list;
	int assigned_dev_id;
	int host_segnr;
	int host_busnr;
	int host_devfn;
	unsigned int entries_nr;
	int host_irq;
	bool host_irq_disabled;
	bool pci_2_3;
	struct msix_entry *host_msix_entries;
	int guest_irq;
	struct msix_entry *guest_msix_entries;
	unsigned long irq_requested_type;
	int irq_source_id;
	int flags;
	struct pci_dev *dev;
	struct kvm *kvm;
	spinlock_t intx_lock;
	spinlock_t intx_mask_lock;
	char irq_name[32];
	struct pci_saved_state *pci_saved_state;
};

struct kvm_irq_mask_notifier {
	void (*func)(struct kvm_irq_mask_notifier *kimn, bool masked);
	int irq;
	struct hlist_node link;
};

void kvm_register_irq_mask_notifier(struct kvm *kvm, int irq,
				    struct kvm_irq_mask_notifier *kimn);
void kvm_unregister_irq_mask_notifier(struct kvm *kvm, int irq,
				      struct kvm_irq_mask_notifier *kimn);
void kvm_fire_mask_notifiers(struct kvm *kvm, unsigned irqchip, unsigned pin,
			     bool mask);

#ifdef __KVM_HAVE_IOAPIC
void kvm_get_intr_delivery_bitmask(struct kvm_ioapic *ioapic,
				   union kvm_ioapic_redirect_entry *entry,
				   unsigned long *deliver_bitmask);
#endif
int kvm_set_irq(struct kvm *kvm, int irq_source_id, u32 irq, int level);
int kvm_set_msi(struct kvm_kernel_irq_routing_entry *irq_entry, struct kvm *kvm,
		int irq_source_id, int level);
void kvm_notify_acked_irq(struct kvm *kvm, unsigned irqchip, unsigned pin);
void kvm_register_irq_ack_notifier(struct kvm *kvm,
				   struct kvm_irq_ack_notifier *kian);
void kvm_unregister_irq_ack_notifier(struct kvm *kvm,
				     struct kvm_irq_ack_notifier *kian);
int kvm_request_irq_source_id(struct kvm *kvm);
void kvm_free_irq_source_id(struct kvm *kvm, int irq_source_id);

/* For vcpu->arch.iommu_flags */
#define KVM_IOMMU_CACHE_COHERENCY	0x1

#ifdef CONFIG_IOMMU_API
int kvm_iommu_map_pages(struct kvm *kvm, struct kvm_memory_slot *slot);
void kvm_iommu_unmap_pages(struct kvm *kvm, struct kvm_memory_slot *slot);
int kvm_iommu_map_guest(struct kvm *kvm);
int kvm_iommu_unmap_guest(struct kvm *kvm);
int kvm_assign_device(struct kvm *kvm,
		      struct kvm_assigned_dev_kernel *assigned_dev);
int kvm_deassign_device(struct kvm *kvm,
			struct kvm_assigned_dev_kernel *assigned_dev);
#else /* CONFIG_IOMMU_API */
static inline int kvm_iommu_map_pages(struct kvm *kvm,
				      struct kvm_memory_slot *slot)
{
	return 0;
}

static inline void kvm_iommu_unmap_pages(struct kvm *kvm,
					 struct kvm_memory_slot *slot)
{
}

static inline int kvm_iommu_map_guest(struct kvm *kvm)
{
	return -ENODEV;
}

static inline int kvm_iommu_unmap_guest(struct kvm *kvm)
{
	return 0;
}

static inline int kvm_assign_device(struct kvm *kvm,
				    struct kvm_assigned_dev_kernel *assigned_dev)
{
	return 0;
}

static inline int kvm_deassign_device(struct kvm *kvm,
				      struct kvm_assigned_dev_kernel *assigned_dev)
{
	return 0;
}
#endif /* CONFIG_IOMMU_API */

static inline void kvm_guest_enter(void)
{
	BUG_ON(preemptible());
	vtime_account(current);
	current->flags |= PF_VCPU;
	/* KVM does not hold any references to rcu protected data when it
	 * switches CPU into a guest mode. In fact switching to a guest mode
	 * is very similar to exiting to userspace from the rcu point of view.
	 * In addition a CPU may stay in guest mode for quite a long time (up
	 * to one time slice). Let's treat guest mode as a quiescent state,
	 * just like we do with user-mode execution.
	 */
	rcu_virt_note_context_switch(smp_processor_id());
}

static inline void kvm_guest_exit(void)
{
	vtime_account(current);
	current->flags &= ~PF_VCPU;
}

/*
 * search_memslots() and __gfn_to_memslot() are here because they are
 * used in non-modular code in arch/powerpc/kvm/book3s_hv_rm_mmu.c.
 * gfn_to_memslot() itself isn't here as an inline because that would
 * bloat other code too much.
 */
static inline struct kvm_memory_slot *
search_memslots(struct kvm_memslots *slots, gfn_t gfn)
{
	struct kvm_memory_slot *memslot;

	kvm_for_each_memslot(memslot, slots)
		if (gfn >= memslot->base_gfn &&
		    gfn < memslot->base_gfn + memslot->npages)
			return memslot;

	return NULL;
}

static inline struct kvm_memory_slot *
__gfn_to_memslot(struct kvm_memslots *slots, gfn_t gfn)
{
	return search_memslots(slots, gfn);
}

static inline unsigned long
__gfn_to_hva_memslot(struct kvm_memory_slot *slot, gfn_t gfn)
{
	return slot->userspace_addr + (gfn - slot->base_gfn) * PAGE_SIZE;
}

static inline int memslot_id(struct kvm *kvm, gfn_t gfn)
{
	return gfn_to_memslot(kvm, gfn)->id;
}

static inline gfn_t gfn_to_index(gfn_t gfn, gfn_t base_gfn, int level)
{
	/* KVM_HPAGE_GFN_SHIFT(PT_PAGE_TABLE_LEVEL) must be 0. */
	return (gfn >> KVM_HPAGE_GFN_SHIFT(level)) -
		(base_gfn >> KVM_HPAGE_GFN_SHIFT(level));
}

static inline gfn_t
hva_to_gfn_memslot(unsigned long hva, struct kvm_memory_slot *slot)
{
	gfn_t gfn_offset = (hva - slot->userspace_addr) >> PAGE_SHIFT;

	return slot->base_gfn + gfn_offset;
}

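/*
 * Worked example (illustrative; the shift value assumes x86, where
 * KVM_HPAGE_GFN_SHIFT() for the 2MB large-page level is 9): in a slot
 * with base_gfn 0x400, gfn 0x600 maps to index
 * (0x600 >> 9) - (0x400 >> 9) = 3 - 2 = 1 in that level's per-slot array.
 */
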
static inline gpa_t gfn_to_gpa(gfn_t gfn)
{
	return (gpa_t)gfn << PAGE_SHIFT;
}

static inline gfn_t gpa_to_gfn(gpa_t gpa)
{
	return (gfn_t)(gpa >> PAGE_SHIFT);
}

static inline hpa_t pfn_to_hpa(pfn_t pfn)
{
	return (hpa_t)pfn << PAGE_SHIFT;
}

static inline void kvm_migrate_timers(struct kvm_vcpu *vcpu)
{
	set_bit(KVM_REQ_MIGRATE_TIMER, &vcpu->requests);
}

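/*
 * Worked example (illustrative): with 4K pages (PAGE_SHIFT == 12),
 * gpa_to_gfn(0x12345678) == 0x12345 and gfn_to_gpa(0x12345) == 0x12345000;
 * the low 12 bits (0x678) are the offset within the page.
 */
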
enum kvm_stat_kind {
	KVM_STAT_VM,
	KVM_STAT_VCPU,
};

struct kvm_stats_debugfs_item {
	const char *name;
	int offset;
	enum kvm_stat_kind kind;
	struct dentry *dentry;
};
extern struct kvm_stats_debugfs_item debugfs_entries[];
extern struct dentry *kvm_debugfs_dir;

#if defined(CONFIG_MMU_NOTIFIER) && defined(KVM_ARCH_WANT_MMU_NOTIFIER)
static inline int mmu_notifier_retry(struct kvm_vcpu *vcpu, unsigned long mmu_seq)
{
	if (unlikely(vcpu->kvm->mmu_notifier_count))
		return 1;
	/*
	 * Ensure the read of mmu_notifier_count happens before the read
	 * of mmu_notifier_seq. This interacts with the smp_wmb() in
	 * mmu_notifier_invalidate_range_end to make sure that the caller
	 * either sees the old (non-zero) value of mmu_notifier_count or
	 * the new (incremented) value of mmu_notifier_seq.
	 * PowerPC Book3s HV KVM calls this under a per-page lock
	 * rather than under kvm->mmu_lock, for scalability, so
	 * can't rely on kvm->mmu_lock to keep things ordered.
	 */
	smp_rmb();
	if (vcpu->kvm->mmu_notifier_seq != mmu_seq)
		return 1;
	return 0;
}
#endif

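/*
 * Illustrative sketch (not part of the original header): page-fault paths
 * sample mmu_notifier_seq before translating a gfn, then recheck under
 * mmu_lock and bail out if an invalidation raced with them:
 *
 *	mmu_seq = kvm->mmu_notifier_seq;
 *	smp_rmb();
 *	pfn = gfn_to_pfn(kvm, gfn);
 *	spin_lock(&kvm->mmu_lock);
 *	if (mmu_notifier_retry(vcpu, mmu_seq))
 *		goto out_unlock;	(and retry the fault)
 */
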
#ifdef KVM_CAP_IRQ_ROUTING

#define KVM_MAX_IRQ_ROUTES 1024

int kvm_setup_default_irq_routing(struct kvm *kvm);
int kvm_set_irq_routing(struct kvm *kvm,
			const struct kvm_irq_routing_entry *entries,
			unsigned nr,
			unsigned flags);
void kvm_free_irq_routing(struct kvm *kvm);

int kvm_send_userspace_msi(struct kvm *kvm, struct kvm_msi *msi);

#else

static inline void kvm_free_irq_routing(struct kvm *kvm) {}

#endif

#ifdef CONFIG_HAVE_KVM_EVENTFD

void kvm_eventfd_init(struct kvm *kvm);
int kvm_irqfd(struct kvm *kvm, struct kvm_irqfd *args);
void kvm_irqfd_release(struct kvm *kvm);
void kvm_irq_routing_update(struct kvm *, struct kvm_irq_routing_table *);
int kvm_ioeventfd(struct kvm *kvm, struct kvm_ioeventfd *args);

#else

static inline void kvm_eventfd_init(struct kvm *kvm) {}

static inline int kvm_irqfd(struct kvm *kvm, struct kvm_irqfd *args)
{
	return -EINVAL;
}

static inline void kvm_irqfd_release(struct kvm *kvm) {}

#ifdef CONFIG_HAVE_KVM_IRQCHIP
static inline void kvm_irq_routing_update(struct kvm *kvm,
					  struct kvm_irq_routing_table *irq_rt)
{
	rcu_assign_pointer(kvm->irq_routing, irq_rt);
}
#endif

static inline int kvm_ioeventfd(struct kvm *kvm, struct kvm_ioeventfd *args)
{
	return -ENOSYS;
}

#endif /* CONFIG_HAVE_KVM_EVENTFD */

917
73880c80 918#ifdef CONFIG_KVM_APIC_ARCHITECTURE
c5af89b6
GN
919static inline bool kvm_vcpu_is_bsp(struct kvm_vcpu *vcpu)
920{
d3efc8ef 921 return vcpu->kvm->bsp_vcpu_id == vcpu->vcpu_id;
c5af89b6 922}
3e515705
AK
923
924bool kvm_vcpu_compatible(struct kvm_vcpu *vcpu);
925
926#else
927
928static inline bool kvm_vcpu_compatible(struct kvm_vcpu *vcpu) { return true; }
929
6aa8b732 930#endif

#ifdef __KVM_HAVE_DEVICE_ASSIGNMENT

long kvm_vm_ioctl_assigned_device(struct kvm *kvm, unsigned ioctl,
				  unsigned long arg);

#else

static inline long kvm_vm_ioctl_assigned_device(struct kvm *kvm, unsigned ioctl,
						unsigned long arg)
{
	return -ENOTTY;
}

#endif

static inline void kvm_make_request(int req, struct kvm_vcpu *vcpu)
{
	set_bit(req, &vcpu->requests);
}

static inline bool kvm_check_request(int req, struct kvm_vcpu *vcpu)
{
	if (test_bit(req, &vcpu->requests)) {
		clear_bit(req, &vcpu->requests);
		return true;
	} else {
		return false;
	}
}

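/*
 * Illustrative sketch (not part of the original header): requests are
 * raised from any context and consumed in the vcpu run loop, e.g.:
 *
 *	kvm_make_request(KVM_REQ_TLB_FLUSH, vcpu);
 *	kvm_vcpu_kick(vcpu);
 *
 * and on the consuming side:
 *
 *	if (kvm_check_request(KVM_REQ_TLB_FLUSH, vcpu))
 *		(perform the arch-specific TLB flush)
 */
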
#ifdef CONFIG_HAVE_KVM_CPU_RELAX_INTERCEPT

static inline void kvm_vcpu_set_in_spin_loop(struct kvm_vcpu *vcpu, bool val)
{
	vcpu->spin_loop.in_spin_loop = val;
}

static inline void kvm_vcpu_set_dy_eligible(struct kvm_vcpu *vcpu, bool val)
{
	vcpu->spin_loop.dy_eligible = val;
}

#else /* !CONFIG_HAVE_KVM_CPU_RELAX_INTERCEPT */

static inline void kvm_vcpu_set_in_spin_loop(struct kvm_vcpu *vcpu, bool val)
{
}

static inline void kvm_vcpu_set_dy_eligible(struct kvm_vcpu *vcpu, bool val)
{
}

static inline bool kvm_vcpu_eligible_for_directed_yield(struct kvm_vcpu *vcpu)
{
	return true;
}

#endif /* CONFIG_HAVE_KVM_CPU_RELAX_INTERCEPT */
#endif