Linux kernel mirror (for testing): git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
include/linux/kvm_host.h, at v3.10-rc5
#ifndef __KVM_HOST_H
#define __KVM_HOST_H

/*
 * This work is licensed under the terms of the GNU GPL, version 2. See
 * the COPYING file in the top-level directory.
 */

#include <linux/types.h>
#include <linux/hardirq.h>
#include <linux/list.h>
#include <linux/mutex.h>
#include <linux/spinlock.h>
#include <linux/signal.h>
#include <linux/sched.h>
#include <linux/bug.h>
#include <linux/mm.h>
#include <linux/mmu_notifier.h>
#include <linux/preempt.h>
#include <linux/msi.h>
#include <linux/slab.h>
#include <linux/rcupdate.h>
#include <linux/ratelimit.h>
#include <linux/err.h>
#include <linux/irqflags.h>
#include <asm/signal.h>

#include <linux/kvm.h>
#include <linux/kvm_para.h>

#include <linux/kvm_types.h>

#include <asm/kvm_host.h>

#ifndef KVM_MMIO_SIZE
#define KVM_MMIO_SIZE 8
#endif

/*
 * Bits 16 ~ 31 of kvm_memory_region::flags are used internally by kvm;
 * the other bits are visible to userspace and are defined in
 * include/linux/kvm.h.
 */
#define KVM_MEMSLOT_INVALID	(1UL << 16)

/* Two fragments for cross MMIO pages. */
#define KVM_MAX_MMIO_FRAGMENTS	2

/*
 * For a normal pfn, the highest 12 bits should be zero,
 * so we can mask bit 62 ~ bit 52 to indicate an error pfn,
 * and mask bit 63 to indicate a noslot pfn.
 */
#define KVM_PFN_ERR_MASK	(0x7ffULL << 52)
#define KVM_PFN_ERR_NOSLOT_MASK	(0xfffULL << 52)
#define KVM_PFN_NOSLOT		(0x1ULL << 63)

#define KVM_PFN_ERR_FAULT	(KVM_PFN_ERR_MASK)
#define KVM_PFN_ERR_HWPOISON	(KVM_PFN_ERR_MASK + 1)
#define KVM_PFN_ERR_RO_FAULT	(KVM_PFN_ERR_MASK + 2)

/*
 * Error pfns indicate that the gfn is in a slot but the translation
 * to a host pfn failed.
 */
static inline bool is_error_pfn(pfn_t pfn)
{
	return !!(pfn & KVM_PFN_ERR_MASK);
}

/*
 * Error_noslot pfns indicate that the gfn cannot be translated to a
 * pfn - either it is not in a slot or the translation failed.
 */
static inline bool is_error_noslot_pfn(pfn_t pfn)
{
	return !!(pfn & KVM_PFN_ERR_NOSLOT_MASK);
}

/* noslot pfns indicate that the gfn is not in any slot. */
static inline bool is_noslot_pfn(pfn_t pfn)
{
	return pfn == KVM_PFN_NOSLOT;
}
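/*
 * Illustrative sketch (not part of the original header): the intended
 * caller-side decoding of the error encodings above. The helper name
 * and the errno mapping are assumptions for the example, not kernel API.
 */
static inline int example_pfn_to_errno(pfn_t pfn)
{
	if (!is_error_noslot_pfn(pfn))
		return 0;		/* a real, usable host pfn */
	if (is_noslot_pfn(pfn))
		return -ENOENT;		/* gfn is not backed by any memslot */
	if (pfn == KVM_PFN_ERR_HWPOISON)
		return -EHWPOISON;	/* backing page is hardware-poisoned */
	return -EFAULT;			/* in a slot, but translation failed */
}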
#define KVM_HVA_ERR_BAD		(PAGE_OFFSET)
#define KVM_HVA_ERR_RO_BAD	(PAGE_OFFSET + PAGE_SIZE)

static inline bool kvm_is_error_hva(unsigned long addr)
{
	return addr >= PAGE_OFFSET;
}

#define KVM_ERR_PTR_BAD_PAGE	(ERR_PTR(-ENOENT))

static inline bool is_error_page(struct page *page)
{
	return IS_ERR(page);
}

/*
 * vcpu->requests bit members
 */
#define KVM_REQ_TLB_FLUSH          0
#define KVM_REQ_MIGRATE_TIMER      1
#define KVM_REQ_REPORT_TPR_ACCESS  2
#define KVM_REQ_MMU_RELOAD         3
#define KVM_REQ_TRIPLE_FAULT       4
#define KVM_REQ_PENDING_TIMER      5
#define KVM_REQ_UNHALT             6
#define KVM_REQ_MMU_SYNC           7
#define KVM_REQ_CLOCK_UPDATE       8
#define KVM_REQ_KICK               9
#define KVM_REQ_DEACTIVATE_FPU    10
#define KVM_REQ_EVENT             11
#define KVM_REQ_APF_HALT          12
#define KVM_REQ_STEAL_UPDATE      13
#define KVM_REQ_NMI               14
#define KVM_REQ_PMU               15
#define KVM_REQ_PMI               16
#define KVM_REQ_WATCHDOG          17
#define KVM_REQ_MASTERCLOCK_UPDATE 18
#define KVM_REQ_MCLOCK_INPROGRESS 19
#define KVM_REQ_EPR_EXIT          20
#define KVM_REQ_SCAN_IOAPIC       21

#define KVM_USERSPACE_IRQ_SOURCE_ID		0
#define KVM_IRQFD_RESAMPLE_IRQ_SOURCE_ID	1

struct kvm;
struct kvm_vcpu;
extern struct kmem_cache *kvm_vcpu_cache;

extern raw_spinlock_t kvm_lock;
extern struct list_head vm_list;

struct kvm_io_range {
	gpa_t addr;
	int len;
	struct kvm_io_device *dev;
};

#define NR_IOBUS_DEVS 1000

struct kvm_io_bus {
	int dev_count;
	struct kvm_io_range range[];
};

enum kvm_bus {
	KVM_MMIO_BUS,
	KVM_PIO_BUS,
	KVM_VIRTIO_CCW_NOTIFY_BUS,
	KVM_NR_BUSES
};

int kvm_io_bus_write(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr,
		     int len, const void *val);
int kvm_io_bus_read(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr, int len,
		    void *val);
int kvm_io_bus_register_dev(struct kvm *kvm, enum kvm_bus bus_idx, gpa_t addr,
			    int len, struct kvm_io_device *dev);
int kvm_io_bus_unregister_dev(struct kvm *kvm, enum kvm_bus bus_idx,
			      struct kvm_io_device *dev);
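/*
 * Illustrative sketch (not kernel API): dispatching a 32-bit guest store
 * through the MMIO bus declared above. kvm_io_bus_write() routes the
 * access to whichever kvm_io_device claimed the range. The helper name
 * is an assumption for the example.
 */
static inline int example_mmio_store32(struct kvm *kvm, gpa_t addr, u32 value)
{
	/* the bus walks its ranges and calls the owning device's write op */
	return kvm_io_bus_write(kvm, KVM_MMIO_BUS, addr, sizeof(value), &value);
}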
#ifdef CONFIG_KVM_ASYNC_PF
struct kvm_async_pf {
	struct work_struct work;
	struct list_head link;
	struct list_head queue;
	struct kvm_vcpu *vcpu;
	struct mm_struct *mm;
	gva_t gva;
	unsigned long addr;
	struct kvm_arch_async_pf arch;
	struct page *page;
	bool done;
};

void kvm_clear_async_pf_completion_queue(struct kvm_vcpu *vcpu);
void kvm_check_async_pf_completion(struct kvm_vcpu *vcpu);
int kvm_setup_async_pf(struct kvm_vcpu *vcpu, gva_t gva, gfn_t gfn,
		       struct kvm_arch_async_pf *arch);
int kvm_async_pf_wakeup_all(struct kvm_vcpu *vcpu);
#endif

enum {
	OUTSIDE_GUEST_MODE,
	IN_GUEST_MODE,
	EXITING_GUEST_MODE,
	READING_SHADOW_PAGE_TABLES,
};

/*
 * Sometimes a large or cross-page mmio needs to be broken up into separate
 * exits for userspace servicing.
 */
struct kvm_mmio_fragment {
	gpa_t gpa;
	void *data;
	unsigned len;
};

struct kvm_vcpu {
	struct kvm *kvm;
#ifdef CONFIG_PREEMPT_NOTIFIERS
	struct preempt_notifier preempt_notifier;
#endif
	int cpu;
	int vcpu_id;
	int srcu_idx;
	int mode;
	unsigned long requests;
	unsigned long guest_debug;

	struct mutex mutex;
	struct kvm_run *run;

	int fpu_active;
	int guest_fpu_loaded, guest_xcr0_loaded;
	wait_queue_head_t wq;
	struct pid *pid;
	int sigset_active;
	sigset_t sigset;
	struct kvm_vcpu_stat stat;

#ifdef CONFIG_HAS_IOMEM
	int mmio_needed;
	int mmio_read_completed;
	int mmio_is_write;
	int mmio_cur_fragment;
	int mmio_nr_fragments;
	struct kvm_mmio_fragment mmio_fragments[KVM_MAX_MMIO_FRAGMENTS];
#endif

#ifdef CONFIG_KVM_ASYNC_PF
	struct {
		u32 queued;
		struct list_head queue;
		struct list_head done;
		spinlock_t lock;
	} async_pf;
#endif

#ifdef CONFIG_HAVE_KVM_CPU_RELAX_INTERCEPT
	/*
	 * CPU-relax intercept / pause-loop-exit optimization:
	 * in_spin_loop: set when a vcpu takes a pause-loop exit or has
	 * its cpu-relax intercepted.
	 * dy_eligible: indicates whether the vcpu is eligible for directed yield.
	 */
	struct {
		bool in_spin_loop;
		bool dy_eligible;
	} spin_loop;
#endif
	bool preempted;
	struct kvm_vcpu_arch arch;
};

static inline int kvm_vcpu_exiting_guest_mode(struct kvm_vcpu *vcpu)
{
	return cmpxchg(&vcpu->mode, IN_GUEST_MODE, EXITING_GUEST_MODE);
}

/*
 * Some of the bitops functions do not support too long bitmaps.
 * This number must be determined not to exceed such limits.
 */
#define KVM_MEM_MAX_NR_PAGES ((1UL << 31) - 1)

struct kvm_memory_slot {
	gfn_t base_gfn;
	unsigned long npages;
	unsigned long *dirty_bitmap;
	struct kvm_arch_memory_slot arch;
	unsigned long userspace_addr;
	u32 flags;
	short id;
};

static inline unsigned long kvm_dirty_bitmap_bytes(struct kvm_memory_slot *memslot)
{
	return ALIGN(memslot->npages, BITS_PER_LONG) / 8;
}
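/*
 * Illustrative arithmetic for the helper above (not kernel API): a 1 GiB
 * slot holds 262144 4 KiB pages, so its dirty bitmap occupies
 * ALIGN(262144, BITS_PER_LONG) / 8 = 32768 bytes (32 KiB) on a 64-bit
 * host, one bit per gfn. The helper name is an assumption for the example.
 */
static inline unsigned long example_dirty_bytes_for_size(u64 slot_bytes)
{
	unsigned long npages = slot_bytes >> PAGE_SHIFT;

	return ALIGN(npages, BITS_PER_LONG) / 8;
}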
struct kvm_kernel_irq_routing_entry {
	u32 gsi;
	u32 type;
	int (*set)(struct kvm_kernel_irq_routing_entry *e,
		   struct kvm *kvm, int irq_source_id, int level,
		   bool line_status);
	union {
		struct {
			unsigned irqchip;
			unsigned pin;
		} irqchip;
		struct msi_msg msi;
	};
	struct hlist_node link;
};

#ifdef CONFIG_HAVE_KVM_IRQ_ROUTING

struct kvm_irq_routing_table {
	int chip[KVM_NR_IRQCHIPS][KVM_IRQCHIP_NUM_PINS];
	struct kvm_kernel_irq_routing_entry *rt_entries;
	u32 nr_rt_entries;
	/*
	 * Array indexed by gsi. Each entry contains list of irq chips
	 * the gsi is connected to.
	 */
	struct hlist_head map[0];
};

#else

struct kvm_irq_routing_table {};

#endif

#ifndef KVM_PRIVATE_MEM_SLOTS
#define KVM_PRIVATE_MEM_SLOTS 0
#endif

#ifndef KVM_MEM_SLOTS_NUM
#define KVM_MEM_SLOTS_NUM (KVM_USER_MEM_SLOTS + KVM_PRIVATE_MEM_SLOTS)
#endif

/*
 * Note:
 * memslots are not sorted by id anymore, please use id_to_memslot()
 * to get the memslot by its id.
 */
struct kvm_memslots {
	u64 generation;
	struct kvm_memory_slot memslots[KVM_MEM_SLOTS_NUM];
	/* The mapping table from slot id to the index in memslots[]. */
	short id_to_index[KVM_MEM_SLOTS_NUM];
};

struct kvm {
	spinlock_t mmu_lock;
	struct mutex slots_lock;
	struct mm_struct *mm; /* userspace tied to this vm */
	struct kvm_memslots *memslots;
	struct srcu_struct srcu;
#ifdef CONFIG_KVM_APIC_ARCHITECTURE
	u32 bsp_vcpu_id;
#endif
	struct kvm_vcpu *vcpus[KVM_MAX_VCPUS];
	atomic_t online_vcpus;
	int last_boosted_vcpu;
	struct list_head vm_list;
	struct mutex lock;
	struct kvm_io_bus *buses[KVM_NR_BUSES];
#ifdef CONFIG_HAVE_KVM_EVENTFD
	struct {
		spinlock_t lock;
		struct list_head items;
		struct list_head resampler_list;
		struct mutex resampler_lock;
	} irqfds;
	struct list_head ioeventfds;
#endif
	struct kvm_vm_stat stat;
	struct kvm_arch arch;
	atomic_t users_count;
#ifdef KVM_COALESCED_MMIO_PAGE_OFFSET
	struct kvm_coalesced_mmio_ring *coalesced_mmio_ring;
	spinlock_t ring_lock;
	struct list_head coalesced_zones;
#endif

	struct mutex irq_lock;
#ifdef CONFIG_HAVE_KVM_IRQCHIP
	/*
	 * Update side is protected by irq_lock and,
	 * if configured, irqfds.lock.
	 */
	struct kvm_irq_routing_table __rcu *irq_routing;
	struct hlist_head mask_notifier_list;
	struct hlist_head irq_ack_notifier_list;
#endif

#if defined(CONFIG_MMU_NOTIFIER) && defined(KVM_ARCH_WANT_MMU_NOTIFIER)
	struct mmu_notifier mmu_notifier;
	unsigned long mmu_notifier_seq;
	long mmu_notifier_count;
#endif
	long tlbs_dirty;
	struct list_head devices;
};

#define kvm_err(fmt, ...) \
	pr_err("kvm [%i]: " fmt, task_pid_nr(current), ## __VA_ARGS__)
#define kvm_info(fmt, ...) \
	pr_info("kvm [%i]: " fmt, task_pid_nr(current), ## __VA_ARGS__)
#define kvm_debug(fmt, ...) \
	pr_debug("kvm [%i]: " fmt, task_pid_nr(current), ## __VA_ARGS__)
#define kvm_pr_unimpl(fmt, ...) \
	pr_err_ratelimited("kvm [%i]: " fmt, \
			   task_tgid_nr(current), ## __VA_ARGS__)

/* The guest did something we don't support. */
#define vcpu_unimpl(vcpu, fmt, ...)					\
	kvm_pr_unimpl("vcpu%i " fmt, (vcpu)->vcpu_id, ## __VA_ARGS__)

static inline struct kvm_vcpu *kvm_get_vcpu(struct kvm *kvm, int i)
{
	smp_rmb();
	return kvm->vcpus[i];
}

#define kvm_for_each_vcpu(idx, vcpup, kvm) \
	for (idx = 0; \
	     idx < atomic_read(&kvm->online_vcpus) && \
	     (vcpup = kvm_get_vcpu(kvm, idx)) != NULL; \
	     idx++)

#define kvm_for_each_memslot(memslot, slots)	\
	for (memslot = &slots->memslots[0];	\
	     memslot < slots->memslots + KVM_MEM_SLOTS_NUM && memslot->npages;\
	     memslot++)
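/*
 * Illustrative sketch (not kernel API): iterating online vcpus with the
 * macro above. The helper name is an assumption for the example.
 */
static inline int example_max_vcpu_id(struct kvm *kvm)
{
	struct kvm_vcpu *vcpu;
	int idx, max = -1;

	kvm_for_each_vcpu(idx, vcpu, kvm)
		if (vcpu->vcpu_id > max)
			max = vcpu->vcpu_id;
	return max;
}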
int kvm_vcpu_init(struct kvm_vcpu *vcpu, struct kvm *kvm, unsigned id);
void kvm_vcpu_uninit(struct kvm_vcpu *vcpu);

int __must_check vcpu_load(struct kvm_vcpu *vcpu);
void vcpu_put(struct kvm_vcpu *vcpu);

#ifdef CONFIG_HAVE_KVM_IRQ_ROUTING
int kvm_irqfd_init(void);
void kvm_irqfd_exit(void);
#else
static inline int kvm_irqfd_init(void)
{
	return 0;
}

static inline void kvm_irqfd_exit(void)
{
}
#endif
int kvm_init(void *opaque, unsigned vcpu_size, unsigned vcpu_align,
	     struct module *module);
void kvm_exit(void);

void kvm_get_kvm(struct kvm *kvm);
void kvm_put_kvm(struct kvm *kvm);
void update_memslots(struct kvm_memslots *slots, struct kvm_memory_slot *new,
		     u64 last_generation);

static inline struct kvm_memslots *kvm_memslots(struct kvm *kvm)
{
	return rcu_dereference_check(kvm->memslots,
			srcu_read_lock_held(&kvm->srcu)
			|| lockdep_is_held(&kvm->slots_lock));
}

static inline struct kvm_memory_slot *
id_to_memslot(struct kvm_memslots *slots, int id)
{
	int index = slots->id_to_index[id];
	struct kvm_memory_slot *slot;

	slot = &slots->memslots[index];

	WARN_ON(slot->id != id);
	return slot;
}

/*
 * The KVM_SET_USER_MEMORY_REGION ioctl allows the following operations:
 * - create a new memory slot
 * - delete an existing memory slot
 * - modify an existing memory slot
 *   -- move it in the guest physical memory space
 *   -- just change its flags
 *
 * Since flags can be changed by some of these operations, the following
 * differentiation is the best we can do for __kvm_set_memory_region():
 */
enum kvm_mr_change {
	KVM_MR_CREATE,
	KVM_MR_DELETE,
	KVM_MR_MOVE,
	KVM_MR_FLAGS_ONLY,
};

int kvm_set_memory_region(struct kvm *kvm,
			  struct kvm_userspace_memory_region *mem);
int __kvm_set_memory_region(struct kvm *kvm,
			    struct kvm_userspace_memory_region *mem);
void kvm_arch_free_memslot(struct kvm_memory_slot *free,
			   struct kvm_memory_slot *dont);
int kvm_arch_create_memslot(struct kvm_memory_slot *slot, unsigned long npages);
int kvm_arch_prepare_memory_region(struct kvm *kvm,
				   struct kvm_memory_slot *memslot,
				   struct kvm_userspace_memory_region *mem,
				   enum kvm_mr_change change);
void kvm_arch_commit_memory_region(struct kvm *kvm,
				   struct kvm_userspace_memory_region *mem,
				   const struct kvm_memory_slot *old,
				   enum kvm_mr_change change);
bool kvm_largepages_enabled(void);
void kvm_disable_largepages(void);
/* flush all memory translations */
void kvm_arch_flush_shadow_all(struct kvm *kvm);
/* flush memory translations pointing to 'slot' */
void kvm_arch_flush_shadow_memslot(struct kvm *kvm,
				   struct kvm_memory_slot *slot);

int gfn_to_page_many_atomic(struct kvm *kvm, gfn_t gfn, struct page **pages,
			    int nr_pages);

struct page *gfn_to_page(struct kvm *kvm, gfn_t gfn);
unsigned long gfn_to_hva(struct kvm *kvm, gfn_t gfn);
unsigned long gfn_to_hva_memslot(struct kvm_memory_slot *slot, gfn_t gfn);
void kvm_release_page_clean(struct page *page);
void kvm_release_page_dirty(struct page *page);
void kvm_set_page_dirty(struct page *page);
void kvm_set_page_accessed(struct page *page);

pfn_t gfn_to_pfn_atomic(struct kvm *kvm, gfn_t gfn);
pfn_t gfn_to_pfn_async(struct kvm *kvm, gfn_t gfn, bool *async,
		       bool write_fault, bool *writable);
pfn_t gfn_to_pfn(struct kvm *kvm, gfn_t gfn);
pfn_t gfn_to_pfn_prot(struct kvm *kvm, gfn_t gfn, bool write_fault,
		      bool *writable);
pfn_t gfn_to_pfn_memslot(struct kvm_memory_slot *slot, gfn_t gfn);
pfn_t gfn_to_pfn_memslot_atomic(struct kvm_memory_slot *slot, gfn_t gfn);

void kvm_release_pfn_dirty(pfn_t pfn);
void kvm_release_pfn_clean(pfn_t pfn);
void kvm_set_pfn_dirty(pfn_t pfn);
void kvm_set_pfn_accessed(pfn_t pfn);
void kvm_get_pfn(pfn_t pfn);

int kvm_read_guest_page(struct kvm *kvm, gfn_t gfn, void *data, int offset,
			int len);
int kvm_read_guest_atomic(struct kvm *kvm, gpa_t gpa, void *data,
			  unsigned long len);
int kvm_read_guest(struct kvm *kvm, gpa_t gpa, void *data, unsigned long len);
int kvm_read_guest_cached(struct kvm *kvm, struct gfn_to_hva_cache *ghc,
			  void *data, unsigned long len);
int kvm_write_guest_page(struct kvm *kvm, gfn_t gfn, const void *data,
			 int offset, int len);
int kvm_write_guest(struct kvm *kvm, gpa_t gpa, const void *data,
		    unsigned long len);
int kvm_write_guest_cached(struct kvm *kvm, struct gfn_to_hva_cache *ghc,
			   void *data, unsigned long len);
int kvm_gfn_to_hva_cache_init(struct kvm *kvm, struct gfn_to_hva_cache *ghc,
			      gpa_t gpa, unsigned long len);
int kvm_clear_guest_page(struct kvm *kvm, gfn_t gfn, int offset, int len);
int kvm_clear_guest(struct kvm *kvm, gpa_t gpa, unsigned long len);
struct kvm_memory_slot *gfn_to_memslot(struct kvm *kvm, gfn_t gfn);
int kvm_is_visible_gfn(struct kvm *kvm, gfn_t gfn);
unsigned long kvm_host_page_size(struct kvm *kvm, gfn_t gfn);
void mark_page_dirty(struct kvm *kvm, gfn_t gfn);
void mark_page_dirty_in_slot(struct kvm *kvm, struct kvm_memory_slot *memslot,
			     gfn_t gfn);
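/*
 * Illustrative sketch (not kernel API): reading a 32-bit value from
 * guest physical memory with the accessors above. Returns 0 on success
 * or a negative errno from kvm_read_guest(). The helper name is an
 * assumption for the example.
 */
static inline int example_read_guest_u32(struct kvm *kvm, gpa_t gpa, u32 *val)
{
	/* copies sizeof(*val) bytes from guest physical address 'gpa' */
	return kvm_read_guest(kvm, gpa, val, sizeof(*val));
}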
void kvm_vcpu_block(struct kvm_vcpu *vcpu);
void kvm_vcpu_kick(struct kvm_vcpu *vcpu);
bool kvm_vcpu_yield_to(struct kvm_vcpu *target);
void kvm_vcpu_on_spin(struct kvm_vcpu *vcpu);
void kvm_resched(struct kvm_vcpu *vcpu);
void kvm_load_guest_fpu(struct kvm_vcpu *vcpu);
void kvm_put_guest_fpu(struct kvm_vcpu *vcpu);

void kvm_flush_remote_tlbs(struct kvm *kvm);
void kvm_reload_remote_mmus(struct kvm *kvm);
void kvm_make_mclock_inprogress_request(struct kvm *kvm);
void kvm_make_scan_ioapic_request(struct kvm *kvm);

long kvm_arch_dev_ioctl(struct file *filp,
			unsigned int ioctl, unsigned long arg);
long kvm_arch_vcpu_ioctl(struct file *filp,
			 unsigned int ioctl, unsigned long arg);
int kvm_arch_vcpu_fault(struct kvm_vcpu *vcpu, struct vm_fault *vmf);

int kvm_dev_ioctl_check_extension(long ext);

int kvm_get_dirty_log(struct kvm *kvm,
		      struct kvm_dirty_log *log, int *is_dirty);
int kvm_vm_ioctl_get_dirty_log(struct kvm *kvm,
			       struct kvm_dirty_log *log);

int kvm_vm_ioctl_set_memory_region(struct kvm *kvm,
				   struct kvm_userspace_memory_region *mem);
int kvm_vm_ioctl_irq_line(struct kvm *kvm, struct kvm_irq_level *irq_level,
			  bool line_status);
long kvm_arch_vm_ioctl(struct file *filp,
		       unsigned int ioctl, unsigned long arg);

int kvm_arch_vcpu_ioctl_get_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu);
int kvm_arch_vcpu_ioctl_set_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu);

int kvm_arch_vcpu_ioctl_translate(struct kvm_vcpu *vcpu,
				  struct kvm_translation *tr);

int kvm_arch_vcpu_ioctl_get_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs);
int kvm_arch_vcpu_ioctl_set_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs);
int kvm_arch_vcpu_ioctl_get_sregs(struct kvm_vcpu *vcpu,
				  struct kvm_sregs *sregs);
int kvm_arch_vcpu_ioctl_set_sregs(struct kvm_vcpu *vcpu,
				  struct kvm_sregs *sregs);
int kvm_arch_vcpu_ioctl_get_mpstate(struct kvm_vcpu *vcpu,
				    struct kvm_mp_state *mp_state);
int kvm_arch_vcpu_ioctl_set_mpstate(struct kvm_vcpu *vcpu,
				    struct kvm_mp_state *mp_state);
int kvm_arch_vcpu_ioctl_set_guest_debug(struct kvm_vcpu *vcpu,
					struct kvm_guest_debug *dbg);
int kvm_arch_vcpu_ioctl_run(struct kvm_vcpu *vcpu, struct kvm_run *kvm_run);

int kvm_arch_init(void *opaque);
void kvm_arch_exit(void);

int kvm_arch_vcpu_init(struct kvm_vcpu *vcpu);
void kvm_arch_vcpu_uninit(struct kvm_vcpu *vcpu);

void kvm_arch_vcpu_free(struct kvm_vcpu *vcpu);
void kvm_arch_vcpu_load(struct kvm_vcpu *vcpu, int cpu);
void kvm_arch_vcpu_put(struct kvm_vcpu *vcpu);
struct kvm_vcpu *kvm_arch_vcpu_create(struct kvm *kvm, unsigned int id);
int kvm_arch_vcpu_setup(struct kvm_vcpu *vcpu);
int kvm_arch_vcpu_postcreate(struct kvm_vcpu *vcpu);
void kvm_arch_vcpu_destroy(struct kvm_vcpu *vcpu);

int kvm_arch_hardware_enable(void *garbage);
void kvm_arch_hardware_disable(void *garbage);
int kvm_arch_hardware_setup(void);
void kvm_arch_hardware_unsetup(void);
void kvm_arch_check_processor_compat(void *rtn);
int kvm_arch_vcpu_runnable(struct kvm_vcpu *vcpu);
int kvm_arch_vcpu_should_kick(struct kvm_vcpu *vcpu);

void kvm_free_physmem(struct kvm *kvm);

void *kvm_kvzalloc(unsigned long size);
void kvm_kvfree(const void *addr);

#ifndef __KVM_HAVE_ARCH_VM_ALLOC
static inline struct kvm *kvm_arch_alloc_vm(void)
{
	return kzalloc(sizeof(struct kvm), GFP_KERNEL);
}

static inline void kvm_arch_free_vm(struct kvm *kvm)
{
	kfree(kvm);
}
#endif

static inline wait_queue_head_t *kvm_arch_vcpu_wq(struct kvm_vcpu *vcpu)
{
#ifdef __KVM_HAVE_ARCH_WQP
	return vcpu->arch.wqp;
#else
	return &vcpu->wq;
#endif
}
int kvm_arch_init_vm(struct kvm *kvm, unsigned long type);
void kvm_arch_destroy_vm(struct kvm *kvm);
void kvm_arch_sync_events(struct kvm *kvm);

int kvm_cpu_has_pending_timer(struct kvm_vcpu *vcpu);
void kvm_vcpu_kick(struct kvm_vcpu *vcpu);

bool kvm_is_mmio_pfn(pfn_t pfn);

struct kvm_irq_ack_notifier {
	struct hlist_node link;
	unsigned gsi;
	void (*irq_acked)(struct kvm_irq_ack_notifier *kian);
};

struct kvm_assigned_dev_kernel {
	struct kvm_irq_ack_notifier ack_notifier;
	struct list_head list;
	int assigned_dev_id;
	int host_segnr;
	int host_busnr;
	int host_devfn;
	unsigned int entries_nr;
	int host_irq;
	bool host_irq_disabled;
	bool pci_2_3;
	struct msix_entry *host_msix_entries;
	int guest_irq;
	struct msix_entry *guest_msix_entries;
	unsigned long irq_requested_type;
	int irq_source_id;
	int flags;
	struct pci_dev *dev;
	struct kvm *kvm;
	spinlock_t intx_lock;
	spinlock_t intx_mask_lock;
	char irq_name[32];
	struct pci_saved_state *pci_saved_state;
};

struct kvm_irq_mask_notifier {
	void (*func)(struct kvm_irq_mask_notifier *kimn, bool masked);
	int irq;
	struct hlist_node link;
};

void kvm_register_irq_mask_notifier(struct kvm *kvm, int irq,
				    struct kvm_irq_mask_notifier *kimn);
void kvm_unregister_irq_mask_notifier(struct kvm *kvm, int irq,
				      struct kvm_irq_mask_notifier *kimn);
void kvm_fire_mask_notifiers(struct kvm *kvm, unsigned irqchip, unsigned pin,
			     bool mask);

int kvm_set_irq(struct kvm *kvm, int irq_source_id, u32 irq, int level,
		bool line_status);
int kvm_set_irq_inatomic(struct kvm *kvm, int irq_source_id, u32 irq, int level);
int kvm_set_msi(struct kvm_kernel_irq_routing_entry *irq_entry, struct kvm *kvm,
		int irq_source_id, int level, bool line_status);
bool kvm_irq_has_notifier(struct kvm *kvm, unsigned irqchip, unsigned pin);
void kvm_notify_acked_irq(struct kvm *kvm, unsigned irqchip, unsigned pin);
void kvm_register_irq_ack_notifier(struct kvm *kvm,
				   struct kvm_irq_ack_notifier *kian);
void kvm_unregister_irq_ack_notifier(struct kvm *kvm,
				     struct kvm_irq_ack_notifier *kian);
int kvm_request_irq_source_id(struct kvm *kvm);
void kvm_free_irq_source_id(struct kvm *kvm, int irq_source_id);
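/*
 * Illustrative sketch (not kernel API): how an in-kernel consumer hooks
 * guest EOI/ack of a GSI with the notifier above. The callback, helper
 * name, and GSI number are hypothetical.
 */
static void example_irq_acked(struct kvm_irq_ack_notifier *kian)
{
	/* runs when the guest acknowledges the interrupt on kian->gsi */
}

static inline void example_register_ack(struct kvm *kvm,
					struct kvm_irq_ack_notifier *kian)
{
	kian->gsi = 10;				/* hypothetical GSI */
	kian->irq_acked = example_irq_acked;
	kvm_register_irq_ack_notifier(kvm, kian);
}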
/* For vcpu->arch.iommu_flags */
#define KVM_IOMMU_CACHE_COHERENCY	0x1

#ifdef CONFIG_KVM_DEVICE_ASSIGNMENT
int kvm_iommu_map_pages(struct kvm *kvm, struct kvm_memory_slot *slot);
void kvm_iommu_unmap_pages(struct kvm *kvm, struct kvm_memory_slot *slot);
int kvm_iommu_map_guest(struct kvm *kvm);
int kvm_iommu_unmap_guest(struct kvm *kvm);
int kvm_assign_device(struct kvm *kvm,
		      struct kvm_assigned_dev_kernel *assigned_dev);
int kvm_deassign_device(struct kvm *kvm,
			struct kvm_assigned_dev_kernel *assigned_dev);
#else
static inline int kvm_iommu_map_pages(struct kvm *kvm,
				      struct kvm_memory_slot *slot)
{
	return 0;
}

static inline void kvm_iommu_unmap_pages(struct kvm *kvm,
					 struct kvm_memory_slot *slot)
{
}

static inline int kvm_iommu_unmap_guest(struct kvm *kvm)
{
	return 0;
}
#endif

static inline void __guest_enter(void)
{
	/*
	 * This is running in ioctl context so we can avoid
	 * the call to vtime_account() with its unnecessary idle check.
	 */
	vtime_account_system(current);
	current->flags |= PF_VCPU;
}

static inline void __guest_exit(void)
{
	/*
	 * This is running in ioctl context so we can avoid
	 * the call to vtime_account() with its unnecessary idle check.
	 */
	vtime_account_system(current);
	current->flags &= ~PF_VCPU;
}

#ifdef CONFIG_CONTEXT_TRACKING
extern void guest_enter(void);
extern void guest_exit(void);

#else /* !CONFIG_CONTEXT_TRACKING */
static inline void guest_enter(void)
{
	__guest_enter();
}

static inline void guest_exit(void)
{
	__guest_exit();
}
#endif /* !CONFIG_CONTEXT_TRACKING */

static inline void kvm_guest_enter(void)
{
	unsigned long flags;

	BUG_ON(preemptible());

	local_irq_save(flags);
	guest_enter();
	local_irq_restore(flags);

	/* KVM does not hold any references to rcu-protected data when it
	 * switches the CPU into guest mode. In fact, switching to guest
	 * mode is very similar to exiting to userspace from the RCU point
	 * of view. In addition, the CPU may stay in guest mode for quite
	 * a long time (up to one time slice). Let's treat guest mode as
	 * a quiescent state, just like we do with user-mode execution.
	 */
	rcu_virt_note_context_switch(smp_processor_id());
}

static inline void kvm_guest_exit(void)
{
	unsigned long flags;

	local_irq_save(flags);
	guest_exit();
	local_irq_restore(flags);
}

/*
 * search_memslots() and __gfn_to_memslot() are here because they are
 * used in non-modular code in arch/powerpc/kvm/book3s_hv_rm_mmu.c.
 * gfn_to_memslot() itself isn't here as an inline because that would
 * bloat other code too much.
 */
static inline struct kvm_memory_slot *
search_memslots(struct kvm_memslots *slots, gfn_t gfn)
{
	struct kvm_memory_slot *memslot;

	kvm_for_each_memslot(memslot, slots)
		if (gfn >= memslot->base_gfn &&
		    gfn < memslot->base_gfn + memslot->npages)
			return memslot;

	return NULL;
}

static inline struct kvm_memory_slot *
__gfn_to_memslot(struct kvm_memslots *slots, gfn_t gfn)
{
	return search_memslots(slots, gfn);
}

static inline unsigned long
__gfn_to_hva_memslot(struct kvm_memory_slot *slot, gfn_t gfn)
{
	return slot->userspace_addr + (gfn - slot->base_gfn) * PAGE_SIZE;
}

static inline int memslot_id(struct kvm *kvm, gfn_t gfn)
{
	return gfn_to_memslot(kvm, gfn)->id;
}

static inline gfn_t gfn_to_index(gfn_t gfn, gfn_t base_gfn, int level)
{
	/* KVM_HPAGE_GFN_SHIFT(PT_PAGE_TABLE_LEVEL) must be 0. */
	return (gfn >> KVM_HPAGE_GFN_SHIFT(level)) -
		(base_gfn >> KVM_HPAGE_GFN_SHIFT(level));
}

static inline gfn_t
hva_to_gfn_memslot(unsigned long hva, struct kvm_memory_slot *slot)
{
	gfn_t gfn_offset = (hva - slot->userspace_addr) >> PAGE_SHIFT;

	return slot->base_gfn + gfn_offset;
}

static inline gpa_t gfn_to_gpa(gfn_t gfn)
{
	return (gpa_t)gfn << PAGE_SHIFT;
}

static inline gfn_t gpa_to_gfn(gpa_t gpa)
{
	return (gfn_t)(gpa >> PAGE_SHIFT);
}

static inline hpa_t pfn_to_hpa(pfn_t pfn)
{
	return (hpa_t)pfn << PAGE_SHIFT;
}
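/*
 * Illustrative arithmetic for the converters above (assuming 4 KiB
 * pages): gpa 0x12345678 splits into gfn 0x12345 and page offset 0x678,
 * and gfn_to_gpa(0x12345) == 0x12345000. The helper below recombines
 * the two; its name is an assumption for the example, not kernel API.
 */
static inline gpa_t example_gfn_offset_to_gpa(gfn_t gfn, unsigned int offset)
{
	return gfn_to_gpa(gfn) | (offset & ~PAGE_MASK);
}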
static inline void kvm_migrate_timers(struct kvm_vcpu *vcpu)
{
	set_bit(KVM_REQ_MIGRATE_TIMER, &vcpu->requests);
}

enum kvm_stat_kind {
	KVM_STAT_VM,
	KVM_STAT_VCPU,
};

struct kvm_stats_debugfs_item {
	const char *name;
	int offset;
	enum kvm_stat_kind kind;
	struct dentry *dentry;
};
extern struct kvm_stats_debugfs_item debugfs_entries[];
extern struct dentry *kvm_debugfs_dir;

#if defined(CONFIG_MMU_NOTIFIER) && defined(KVM_ARCH_WANT_MMU_NOTIFIER)
static inline int mmu_notifier_retry(struct kvm *kvm, unsigned long mmu_seq)
{
	if (unlikely(kvm->mmu_notifier_count))
		return 1;
	/*
	 * Ensure the read of mmu_notifier_count happens before the read
	 * of mmu_notifier_seq. This interacts with the smp_wmb() in
	 * mmu_notifier_invalidate_range_end to make sure that the caller
	 * either sees the old (non-zero) value of mmu_notifier_count or
	 * the new (incremented) value of mmu_notifier_seq.
	 * PowerPC Book3s HV KVM calls this under a per-page lock
	 * rather than under kvm->mmu_lock, for scalability, so
	 * can't rely on kvm->mmu_lock to keep things ordered.
	 */
	smp_rmb();
	if (kvm->mmu_notifier_seq != mmu_seq)
		return 1;
	return 0;
}
#endif
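#if defined(CONFIG_MMU_NOTIFIER) && defined(KVM_ARCH_WANT_MMU_NOTIFIER)
/*
 * Illustrative sketch (not kernel API) of the canonical retry pattern
 * around mmu_notifier_retry(): sample mmu_notifier_seq before translating
 * the gfn, then recheck it under mmu_lock before installing anything.
 * The helper name and errno values are assumptions for the example.
 */
static inline int example_map_gfn(struct kvm *kvm, gfn_t gfn)
{
	unsigned long mmu_seq = kvm->mmu_notifier_seq;
	pfn_t pfn;

	smp_rmb();		/* read mmu_notifier_seq before the pfn */
	pfn = gfn_to_pfn(kvm, gfn);
	if (is_error_noslot_pfn(pfn))
		return -EFAULT;

	spin_lock(&kvm->mmu_lock);
	if (mmu_notifier_retry(kvm, mmu_seq)) {
		/* an invalidation raced with us; drop the pfn and retry */
		spin_unlock(&kvm->mmu_lock);
		kvm_release_pfn_clean(pfn);
		return -EAGAIN;
	}
	/* ... install the gfn->pfn translation in the page tables ... */
	spin_unlock(&kvm->mmu_lock);
	kvm_release_pfn_clean(pfn);
	return 0;
}
#endif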
#ifdef CONFIG_HAVE_KVM_IRQ_ROUTING

#define KVM_MAX_IRQ_ROUTES 1024

int kvm_setup_default_irq_routing(struct kvm *kvm);
int kvm_set_irq_routing(struct kvm *kvm,
			const struct kvm_irq_routing_entry *entries,
			unsigned nr,
			unsigned flags);
int kvm_set_routing_entry(struct kvm_irq_routing_table *rt,
			  struct kvm_kernel_irq_routing_entry *e,
			  const struct kvm_irq_routing_entry *ue);
void kvm_free_irq_routing(struct kvm *kvm);

int kvm_send_userspace_msi(struct kvm *kvm, struct kvm_msi *msi);

#else

static inline void kvm_free_irq_routing(struct kvm *kvm) {}

#endif

#ifdef CONFIG_HAVE_KVM_EVENTFD

void kvm_eventfd_init(struct kvm *kvm);
int kvm_ioeventfd(struct kvm *kvm, struct kvm_ioeventfd *args);

#ifdef CONFIG_HAVE_KVM_IRQCHIP
int kvm_irqfd(struct kvm *kvm, struct kvm_irqfd *args);
void kvm_irqfd_release(struct kvm *kvm);
void kvm_irq_routing_update(struct kvm *, struct kvm_irq_routing_table *);
#else
static inline int kvm_irqfd(struct kvm *kvm, struct kvm_irqfd *args)
{
	return -EINVAL;
}

static inline void kvm_irqfd_release(struct kvm *kvm) {}
#endif

#else

static inline void kvm_eventfd_init(struct kvm *kvm) {}

static inline int kvm_irqfd(struct kvm *kvm, struct kvm_irqfd *args)
{
	return -EINVAL;
}

static inline void kvm_irqfd_release(struct kvm *kvm) {}

#ifdef CONFIG_HAVE_KVM_IRQCHIP
static inline void kvm_irq_routing_update(struct kvm *kvm,
					  struct kvm_irq_routing_table *irq_rt)
{
	rcu_assign_pointer(kvm->irq_routing, irq_rt);
}
#endif

static inline int kvm_ioeventfd(struct kvm *kvm, struct kvm_ioeventfd *args)
{
	return -ENOSYS;
}

#endif /* CONFIG_HAVE_KVM_EVENTFD */

#ifdef CONFIG_KVM_APIC_ARCHITECTURE
static inline bool kvm_vcpu_is_bsp(struct kvm_vcpu *vcpu)
{
	return vcpu->kvm->bsp_vcpu_id == vcpu->vcpu_id;
}

bool kvm_vcpu_compatible(struct kvm_vcpu *vcpu);

#else

static inline bool kvm_vcpu_compatible(struct kvm_vcpu *vcpu) { return true; }

#endif

#ifdef CONFIG_KVM_DEVICE_ASSIGNMENT

long kvm_vm_ioctl_assigned_device(struct kvm *kvm, unsigned ioctl,
				  unsigned long arg);

void kvm_free_all_assigned_devices(struct kvm *kvm);

#else

static inline long kvm_vm_ioctl_assigned_device(struct kvm *kvm, unsigned ioctl,
						unsigned long arg)
{
	return -ENOTTY;
}

static inline void kvm_free_all_assigned_devices(struct kvm *kvm) {}

#endif

static inline void kvm_make_request(int req, struct kvm_vcpu *vcpu)
{
	set_bit(req, &vcpu->requests);
}

static inline bool kvm_check_request(int req, struct kvm_vcpu *vcpu)
{
	if (test_bit(req, &vcpu->requests)) {
		clear_bit(req, &vcpu->requests);
		return true;
	} else {
		return false;
	}
}
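/*
 * Illustrative sketch (not kernel API): the producer side of the
 * vcpu->requests protocol built on the helpers above. Another thread
 * sets a request bit and kicks the vcpu; the vcpu loop later consumes
 * it with kvm_check_request(KVM_REQ_TLB_FLUSH, vcpu) and performs the
 * flush. The helper name is an assumption for the example.
 */
static inline void example_request_tlb_flush(struct kvm_vcpu *vcpu)
{
	kvm_make_request(KVM_REQ_TLB_FLUSH, vcpu);
	kvm_vcpu_kick(vcpu);	/* force the vcpu out of guest mode */
}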
extern bool kvm_rebooting;

struct kvm_device_ops;

struct kvm_device {
	struct kvm_device_ops *ops;
	struct kvm *kvm;
	void *private;
	struct list_head vm_node;
};

/* create, destroy, and name are mandatory */
struct kvm_device_ops {
	const char *name;
	int (*create)(struct kvm_device *dev, u32 type);

	/*
	 * Destroy is responsible for freeing dev.
	 *
	 * Destroy may be called before or after destructors are called
	 * on emulated I/O regions, depending on whether a reference is
	 * held by a vcpu or other kvm component that gets destroyed
	 * after the emulated I/O.
	 */
	void (*destroy)(struct kvm_device *dev);

	int (*set_attr)(struct kvm_device *dev, struct kvm_device_attr *attr);
	int (*get_attr)(struct kvm_device *dev, struct kvm_device_attr *attr);
	int (*has_attr)(struct kvm_device *dev, struct kvm_device_attr *attr);
	long (*ioctl)(struct kvm_device *dev, unsigned int ioctl,
		      unsigned long arg);
};

void kvm_device_get(struct kvm_device *dev);
void kvm_device_put(struct kvm_device *dev);
struct kvm_device *kvm_device_from_filp(struct file *filp);

extern struct kvm_device_ops kvm_mpic_ops;
extern struct kvm_device_ops kvm_xics_ops;

#ifdef CONFIG_HAVE_KVM_CPU_RELAX_INTERCEPT

static inline void kvm_vcpu_set_in_spin_loop(struct kvm_vcpu *vcpu, bool val)
{
	vcpu->spin_loop.in_spin_loop = val;
}

static inline void kvm_vcpu_set_dy_eligible(struct kvm_vcpu *vcpu, bool val)
{
	vcpu->spin_loop.dy_eligible = val;
}

#else /* !CONFIG_HAVE_KVM_CPU_RELAX_INTERCEPT */

static inline void kvm_vcpu_set_in_spin_loop(struct kvm_vcpu *vcpu, bool val)
{
}

static inline void kvm_vcpu_set_dy_eligible(struct kvm_vcpu *vcpu, bool val)
{
}

static inline bool kvm_vcpu_eligible_for_directed_yield(struct kvm_vcpu *vcpu)
{
	return true;
}

#endif /* CONFIG_HAVE_KVM_CPU_RELAX_INTERCEPT */
#endif