kvm.h 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516
  1. #ifndef __KVM_H
  2. #define __KVM_H
  3. /*
  4. * This work is licensed under the terms of the GNU GPL, version 2. See
  5. * the COPYING file in the top-level directory.
  6. */
  7. #include <linux/types.h>
  8. #include <linux/hardirq.h>
  9. #include <linux/list.h>
  10. #include <linux/mutex.h>
  11. #include <linux/spinlock.h>
  12. #include <linux/signal.h>
  13. #include <linux/sched.h>
  14. #include <linux/mm.h>
  15. #include <linux/preempt.h>
  16. #include <asm/signal.h>
  17. #include <linux/kvm.h>
  18. #include <linux/kvm_para.h>
  /*
   * Compile-time limits and tunables.  Within this header KVM_MAX_VCPUS,
   * KVM_ALIAS_SLOTS and KVM_NUM_MMU_PAGES size the vcpus[], aliases[] and
   * mmu_page_hash[] arrays of struct kvm, and memslots[] holds
   * KVM_MEMORY_SLOTS + KVM_PRIVATE_MEM_SLOTS entries.  The other constants
   * are not referenced in the part of the header shown here.
   */
  19. #define KVM_MAX_VCPUS 4
  20. #define KVM_ALIAS_SLOTS 4
  21. #define KVM_MEMORY_SLOTS 8
  22. /* memory slots that are not exposed to userspace */
  23. #define KVM_PRIVATE_MEM_SLOTS 4
  24. #define KVM_PERMILLE_MMU_PAGES 20
  25. #define KVM_MIN_ALLOC_MMU_PAGES 64
  26. #define KVM_NUM_MMU_PAGES 1024
  27. #define KVM_MIN_FREE_MMU_PAGES 5
  28. #define KVM_REFILL_PAGES 25
  29. #define KVM_MAX_CPUID_ENTRIES 40
  30. #define KVM_PIO_PAGE_OFFSET 1
  31. /*
  32. * vcpu->requests bit members
  33. */
  /*
   * NOTE(review): this is a bit number, not a mask -- presumably used with
   * the bitops on the unsigned long `requests` member declared in
   * KVM_VCPU_COMM; confirm against the callers.
   */
  34. #define KVM_REQ_TLB_FLUSH 0
  35. /*
  36. * Address types:
  37. *
  38. * gva - guest virtual address
  39. * gpa - guest physical address
  40. * gfn - guest frame number
  41. * hva - host virtual address
  42. * hpa - host physical address
  43. * hfn - host frame number
  44. */
  /*
   * Physical addresses (gpa_t, hpa_t) are always u64; virtual addresses and
   * frame numbers are unsigned long and therefore follow the host word size.
   */
  45. typedef unsigned long gva_t;
  46. typedef u64 gpa_t;
  47. typedef unsigned long gfn_t;
  48. typedef unsigned long hva_t;
  49. typedef u64 hpa_t;
  50. typedef unsigned long hfn_t;
  /*
   * One node of a chain of parent-pte pointers: NR_PTE_CHAIN_ENTRIES u64
   * pointer slots plus the hlist linkage.  struct kvm_mmu_page.parent_ptes
   * is annotated as the head of such a chain when the page is multimapped.
   */
  51. #define NR_PTE_CHAIN_ENTRIES 5
  52. struct kvm_pte_chain {
  53. u64 *parent_ptes[NR_PTE_CHAIN_ENTRIES];
  54. struct hlist_node link;
  55. };
  56. /*
  57. * kvm_mmu_page_role, below, is defined as:
  58. *
  59. * bits 0:3 - total guest paging levels (2-4, or zero for real mode)
  60. * bits 4:7 - page table level for this shadow (1-4)
  61. * bits 8:9 - page table quadrant for 2-level guests
  62. * bit 16 - "metaphysical" - gfn is not a real page (huge page/real mode)
  63. * bits 17:19 - "access" - the user, writable, and nx bits of a huge page pde
  64. */
  /*
   * Bits 10:15 are the pad_for_nice_hex_output filler, which pushes
   * `metaphysical` up to bit 16.  `word` overlays all bitfields so a role
   * can be read or compared as a single unsigned value.  The bit positions
   * listed above assume the compiler allocates bitfields starting at the
   * least significant bit.
   */
  65. union kvm_mmu_page_role {
  66. unsigned word;
  67. struct {
  68. unsigned glevels : 4;
  69. unsigned level : 4;
  70. unsigned quadrant : 2;
  71. unsigned pad_for_nice_hex_output : 6;
  72. unsigned metaphysical : 1;
  73. unsigned hugepage_access : 3;
  74. };
  75. };
  /*
   * Bookkeeping for one shadow page.  The page is keyed by (gfn, role) in a
   * hash table and tracks which sptes point at it, either through a single
   * parent_pte or through a chain when `multimapped` is set.
   */
  76. struct kvm_mmu_page {
  /* NOTE(review): presumably linked on kvm->active_mmu_pages -- confirm. */
  77. struct list_head link;
  /* NOTE(review): presumably chained into kvm->mmu_page_hash[] -- confirm. */
  78. struct hlist_node hash_link;
  79. /*
  80. * The following two entries are used to key the shadow page in the
  81. * hash table.
  82. */
  83. gfn_t gfn;
  84. union kvm_mmu_page_role role;
  85. u64 *spt;
  86. /* hold the gfn of each spte inside spt */
  87. gfn_t *gfns;
  88. unsigned long slot_bitmap; /* One bit set per slot which has memory
  89. * in this shadow page.
  90. */
  91. int multimapped; /* More than one parent_pte? */
  92. int root_count; /* Currently serving as active root */
  /* Which union member is valid is selected by `multimapped` above. */
  93. union {
  94. u64 *parent_pte; /* !multimapped */
  95. struct hlist_head parent_ptes; /* multimapped, kvm_pte_chain */
  96. };
  97. };
  /*
   * Forward declaration only: struct kvm_vcpu is not defined in this header,
   * which passes it around by pointer.
   */
  98. struct kvm_vcpu;
  /* Defined elsewhere; NOTE(review): presumably the slab cache vcpus are allocated from. */
  99. extern struct kmem_cache *kvm_vcpu_cache;
  100. /*
  101. * x86 supports 3 paging modes (4-level 64-bit, 3-level 64-bit, and 2-level
  102. * 32-bit). The kvm_mmu structure abstracts the details of the current mmu
  103. * mode.
  104. */
  105. struct kvm_mmu {
  /* Mode-specific operations; every callback receives the vcpu it acts on. */
  106. void (*new_cr3)(struct kvm_vcpu *vcpu);
  107. int (*page_fault)(struct kvm_vcpu *vcpu, gva_t gva, u32 err);
  108. void (*free)(struct kvm_vcpu *vcpu);
  /* Maps a guest virtual address to a guest physical address. */
  109. gpa_t (*gva_to_gpa)(struct kvm_vcpu *vcpu, gva_t gva);
  110. void (*prefetch_page)(struct kvm_vcpu *vcpu,
  111. struct kvm_mmu_page *page);
  /* Host physical address of the current root table. */
  112. hpa_t root_hpa;
  /* NOTE(review): presumably guest vs. shadow paging depth -- confirm. */
  113. int root_level;
  114. int shadow_root_level;
  115. u64 *pae_root;
  116. };
  /* Capacity of objects[] in struct kvm_mmu_memory_cache. */
  117. #define KVM_NR_MEM_OBJS 40
  118. /*
  119. * We don't want allocation failures within the mmu code, so we preallocate
  120. * enough memory for a single page fault in a cache.
  121. */
  122. struct kvm_mmu_memory_cache {
  /* NOTE(review): presumably the number of objects[] slots currently filled. */
  123. int nobjs;
  124. void *objects[KVM_NR_MEM_OBJS];
  125. };
  /*
   * Guest debugging state; embedded in every vcpu as the `guest_debug`
   * member of KVM_VCPU_COMM.
   * NOTE(review): bp[] presumably holds four breakpoint addresses and
   * `enabled` / `singlestep` act as booleans -- confirm against the users.
   */
  126. struct kvm_guest_debug {
  127. int enabled;
  128. unsigned long bp[4];
  129. int singlestep;
  130. };
  /*
   * Bookkeeping for a port I/O request.
   * NOTE(review): the field meanings are not established by this header.
   * From the names, `in` looks like the direction, `port` / `size` the
   * access itself, and `string` / `rep` / `down` attributes of a string
   * instruction; `guest_pages` holds at most two page pointers.  Confirm
   * against the PIO emulation code before relying on any of this.
   */
  131. struct kvm_pio_request {
  132. unsigned long count;
  133. int cur_count;
  134. struct page *guest_pages[2];
  135. unsigned guest_page_offset;
  136. int in;
  137. int port;
  138. int size;
  139. int string;
  140. int down;
  141. int rep;
  142. };
  /*
   * Per-vcpu event counters (all u32); embedded in every vcpu as the `stat`
   * member of KVM_VCPU_COMM.
   * NOTE(review): presumably exported through the debugfs_entries[] table
   * (kind KVM_STAT_VCPU, located by byte offset) -- confirm.
   */
  143. struct kvm_vcpu_stat {
  144. u32 pf_fixed;
  145. u32 pf_guest;
  146. u32 tlb_flush;
  147. u32 invlpg;
  148. u32 exits;
  149. u32 io_exits;
  150. u32 mmio_exits;
  151. u32 signal_exits;
  152. u32 irq_window_exits;
  153. u32 halt_exits;
  154. u32 halt_wakeup;
  155. u32 request_irq_exits;
  156. u32 irq_exits;
  157. u32 host_state_reload;
  158. u32 efer_reload;
  159. u32 fpu_reload;
  160. u32 insn_emulation;
  161. u32 insn_emulation_fail;
  162. };
  /*
   * Callback table describing one I/O device.  The kvm_iodevice_*() inline
   * wrappers in this header call read, write and in_range unconditionally,
   * so those three must be non-NULL; destructor may be NULL (its wrapper
   * checks before calling).  Every callback receives the device itself as
   * `this`.
   */
  163. struct kvm_io_device {
  164. void (*read)(struct kvm_io_device *this,
  165. gpa_t addr,
  166. int len,
  167. void *val);
  168. void (*write)(struct kvm_io_device *this,
  169. gpa_t addr,
  170. int len,
  171. const void *val);
  /* Returns an int; NOTE(review): presumably non-zero when addr belongs to the device. */
  172. int (*in_range)(struct kvm_io_device *this, gpa_t addr);
  173. void (*destructor)(struct kvm_io_device *this);
  /* Opaque pointer for the device implementation; not interpreted in this header. */
  174. void *private;
  175. };
  176. static inline void kvm_iodevice_read(struct kvm_io_device *dev,
  177. gpa_t addr,
  178. int len,
  179. void *val)
  180. {
  181. dev->read(dev, addr, len, val);
  182. }
  183. static inline void kvm_iodevice_write(struct kvm_io_device *dev,
  184. gpa_t addr,
  185. int len,
  186. const void *val)
  187. {
  188. dev->write(dev, addr, len, val);
  189. }
  190. static inline int kvm_iodevice_inrange(struct kvm_io_device *dev, gpa_t addr)
  191. {
  192. return dev->in_range(dev, addr);
  193. }
  194. static inline void kvm_iodevice_destructor(struct kvm_io_device *dev)
  195. {
  196. if (dev->destructor)
  197. dev->destructor(dev);
  198. }
  199. /*
  200. * It would be nice to use something smarter than a linear search, TBD...
  201. * Thankfully we don't expect many devices to register (famous last words :),
  202. * so until then it will suffice. At least it's abstracted so we can change
  203. * it in one place.
  204. */
  /*
   * A fixed-capacity table of I/O device pointers (at most NR_IOBUS_DEVS).
   * NOTE(review): dev_count is presumably the number of devs[] slots in
   * use -- confirm in the bus implementation.
   */
  205. struct kvm_io_bus {
  206. int dev_count;
  207. #define NR_IOBUS_DEVS 6
  208. struct kvm_io_device *devs[NR_IOBUS_DEVS];
  209. };
  /* Bus operations; implemented outside this header. */
  210. void kvm_io_bus_init(struct kvm_io_bus *bus);
  211. void kvm_io_bus_destroy(struct kvm_io_bus *bus);
  212. struct kvm_io_device *kvm_io_bus_find_dev(struct kvm_io_bus *bus, gpa_t addr);
  213. void kvm_io_bus_register_dev(struct kvm_io_bus *bus,
  214. struct kvm_io_device *dev);
  /*
   * Member declarations for MMIO state, spliced into KVM_VCPU_COMM.  Each
   * entry carries its own terminating ';'.  The macro expands to nothing
   * when CONFIG_HAS_IOMEM is not defined, so these members only exist on
   * configurations that define it.
   */
  215. #ifdef CONFIG_HAS_IOMEM
  216. #define KVM_VCPU_MMIO \
  217. int mmio_needed; \
  218. int mmio_read_completed; \
  219. int mmio_is_write; \
  220. int mmio_size; \
  221. unsigned char mmio_data[8]; \
  222. gpa_t mmio_phys_addr;
  223. #else
  224. #define KVM_VCPU_MMIO
  225. #endif
  /*
   * Common vcpu members, written as a list of member declarations so the
   * macro can be expanded inside a struct body.  struct kvm_vcpu itself is
   * not defined in this header (NOTE(review): presumably each architecture
   * defines it and expands this macro there).  Ends with KVM_VCPU_MMIO, so
   * the MMIO members follow `stat` when CONFIG_HAS_IOMEM is set.
   */
  226. #define KVM_VCPU_COMM \
  227. struct kvm *kvm; \
  228. struct preempt_notifier preempt_notifier; \
  229. int vcpu_id; \
  230. struct mutex mutex; \
  231. int cpu; \
  232. struct kvm_run *run; \
  233. int guest_mode; \
  234. unsigned long requests; \
  235. struct kvm_guest_debug guest_debug; \
  236. int fpu_active; \
  237. int guest_fpu_loaded; \
  238. wait_queue_head_t wq; \
  239. int sigset_active; \
  240. sigset_t sigset; \
  241. struct kvm_vcpu_stat stat; \
  242. KVM_VCPU_MMIO
  /*
   * One entry of kvm->aliases[]: a run of `npages` guest frames starting at
   * base_gfn, paired with target_gfn.
   * NOTE(review): presumably unalias_gfn() redirects gfns in
   * [base_gfn, base_gfn + npages) to target_gfn + offset -- confirm.
   */
  243. struct kvm_mem_alias {
  244. gfn_t base_gfn;
  245. unsigned long npages;
  246. gfn_t target_gfn;
  247. };
  /*
   * One entry of kvm->memslots[]: `npages` guest frames starting at
   * base_gfn.
   * NOTE(review): rmap and dirty_bitmap are pointers to unsigned long
   * arrays whose sizing is not visible here; userspace_addr / user_alloc
   * presumably describe where the backing memory comes from -- confirm.
   */
  248. struct kvm_memory_slot {
  249. gfn_t base_gfn;
  250. unsigned long npages;
  251. unsigned long flags;
  252. unsigned long *rmap;
  253. unsigned long *dirty_bitmap;
  254. unsigned long userspace_addr;
  255. int user_alloc;
  256. };
  /*
   * Per-VM event counters (all u32); embedded in struct kvm as `stat`.
   * NOTE(review): presumably exported through the debugfs_entries[] table
   * (kind KVM_STAT_VM, located by byte offset) -- confirm.
   */
  257. struct kvm_vm_stat {
  258. u32 mmu_shadow_zapped;
  259. u32 mmu_pte_write;
  260. u32 mmu_pte_updated;
  261. u32 mmu_pde_zapped;
  262. u32 mmu_flooded;
  263. u32 mmu_recycled;
  264. u32 remote_tlb_flush;
  265. };
  /*
   * Per-VM state: memory aliases and slots, shadow-MMU page bookkeeping,
   * the vcpu pointer table, the MMIO and PIO device buses, and pointers to
   * the PIC / IOAPIC objects (vpic is what irqchip_in_kernel() NULL-tests).
   */
  266. struct kvm {
  267. struct mutex lock; /* protects everything except vcpus */
  /* NOTE(review): presumably the number of aliases[] entries in use. */
  268. int naliases;
  269. struct kvm_mem_alias aliases[KVM_ALIAS_SLOTS];
  /* NOTE(review): presumably the number of memslots[] entries in use. */
  270. int nmemslots;
  /* Userspace-visible slots plus the private ones share a single array. */
  271. struct kvm_memory_slot memslots[KVM_MEMORY_SLOTS +
  272. KVM_PRIVATE_MEM_SLOTS];
  273. /*
  274. * Hash table of struct kvm_mmu_page.
  275. */
  /* The hash buckets themselves are mmu_page_hash[], a few members below. */
  276. struct list_head active_mmu_pages;
  277. unsigned int n_free_mmu_pages;
  278. unsigned int n_requested_mmu_pages;
  279. unsigned int n_alloc_mmu_pages;
  280. struct hlist_head mmu_page_hash[KVM_NUM_MMU_PAGES];
  /* Not covered by `lock`, per the comment on that member. */
  281. struct kvm_vcpu *vcpus[KVM_MAX_VCPUS];
  282. struct list_head vm_list;
  283. struct file *filp;
  284. struct kvm_io_bus mmio_bus;
  285. struct kvm_io_bus pio_bus;
  /* Returned by pic_irqchip() / ioapic_irqchip() respectively. */
  286. struct kvm_pic *vpic;
  287. struct kvm_ioapic *vioapic;
  288. int round_robin_prev_vcpu;
  289. unsigned int tss_addr;
  290. struct page *apic_access_page;
  291. struct kvm_vm_stat stat;
  292. };
  293. static inline struct kvm_pic *pic_irqchip(struct kvm *kvm)
  294. {
  295. return kvm->vpic;
  296. }
  297. static inline struct kvm_ioapic *ioapic_irqchip(struct kvm *kvm)
  298. {
  299. return kvm->vioapic;
  300. }
  /*
   * Report whether the VM has a PIC object attached: 1 when pic_irqchip()
   * returns a non-NULL pointer, 0 otherwise.  Only the PIC pointer is
   * examined; the IOAPIC pointer is not consulted.
   */
  static inline int irqchip_in_kernel(struct kvm *kvm)
  {
      return pic_irqchip(kvm) ? 1 : 0;
  }
  /*
   * A 16-bit limit immediately followed by a base address.  The packed
   * attribute removes the padding the compiler would otherwise insert
   * after `limit`.
   * NOTE(review): presumably mirrors the memory operand of the x86
   * descriptor-table load/store instructions -- confirm.
   */
  305. struct descriptor_table {
  306. u16 limit;
  307. unsigned long base;
  308. } __attribute__((packed));
  /*
   * Report that the guest did something we don't support.
   *
   * Emits a KERN_ERR message prefixed with the current task's tgid and the
   * vcpu id, but only when printk_ratelimit() allows it.  `fmt` must be a
   * string literal because it is pasted onto the prefix; any further
   * arguments are forwarded to printk().
   */
  #define pr_unimpl(vcpu, fmt, ...)                                          \
      do {                                                                   \
          if (!printk_ratelimit())                                           \
              break;                                                         \
          printk(KERN_ERR "kvm: %i: cpu%i " fmt,                             \
                 current->tgid, (vcpu)->vcpu_id , ## __VA_ARGS__);           \
      } while (0)
  /*
   * Debug-level printk wrappers.  The kvm argument of kvm_printf() is
   * accepted for call-site symmetry but is discarded by the expansion:
   * only the format and its arguments reach printk(KERN_DEBUG ...).
   */
  #define kvm_printf(kvm, fmt ...) printk(KERN_DEBUG fmt)
  /*
   * Same as kvm_printf(), taking a vcpu pointer.  The argument is
   * parenthesized before ->kvm is applied so that expressions such as
   * `&v` or `p + 1` keep their meaning if kvm_printf() ever starts using
   * its first argument.
   */
  #define vcpu_printf(vcpu, fmt...) kvm_printf((vcpu)->kvm, fmt)
  /*
   * Core entry points declared here and implemented outside this header.
   * Functions returning int: NOTE(review) presumably 0 on success and a
   * negative errno on failure -- confirm in the implementation.
   */
  318. int kvm_vcpu_init(struct kvm_vcpu *vcpu, struct kvm *kvm, unsigned id);
  319. void kvm_vcpu_uninit(struct kvm_vcpu *vcpu);
  320. void vcpu_load(struct kvm_vcpu *vcpu);
  321. void vcpu_put(struct kvm_vcpu *vcpu);
  322. void decache_vcpus_on_cpu(int cpu);
  /* vcpu_size is an unsigned byte count; `opaque` is passed through untyped. */
  323. int kvm_init(void *opaque, unsigned int vcpu_size,
  324. struct module *module);
  325. void kvm_exit(void);
  /* The hpa_t result can be checked with is_error_hpa(). */
  326. hpa_t gpa_to_hpa(struct kvm *kvm, gpa_t gpa);
  327. #define HPA_MSB ((sizeof(hpa_t) * 8) - 1)
  328. #define HPA_ERR_MASK ((hpa_t)1 << HPA_MSB)
  329. static inline int is_error_hpa(hpa_t hpa) { return hpa >> HPA_MSB; }
  /*
   * Address translation and guest-memory helpers; all are implemented
   * outside this header.
   */
  330. hpa_t gva_to_hpa(struct kvm_vcpu *vcpu, gva_t gva);
  331. struct page *gva_to_page(struct kvm_vcpu *vcpu, gva_t gva);
  /* NOTE(review): presumably the sentinel page that is_error_page() tests against. */
  332. extern struct page *bad_page;
  333. int is_error_page(struct page *page);
  334. int kvm_is_error_hva(unsigned long addr);
  /*
   * Memory-region setup.  NOTE(review): the double-underscore variant is
   * presumably the version for callers that already hold the lock -- confirm.
   */
  335. int kvm_set_memory_region(struct kvm *kvm,
  336. struct kvm_userspace_memory_region *mem,
  337. int user_alloc);
  338. int __kvm_set_memory_region(struct kvm *kvm,
  339. struct kvm_userspace_memory_region *mem,
  340. int user_alloc);
  /* Note that `old` is passed by value, i.e. as a copy of the slot. */
  341. int kvm_arch_set_memory_region(struct kvm *kvm,
  342. struct kvm_userspace_memory_region *mem,
  343. struct kvm_memory_slot old,
  344. int user_alloc);
  345. gfn_t unalias_gfn(struct kvm *kvm, gfn_t gfn);
  346. struct page *gfn_to_page(struct kvm *kvm, gfn_t gfn);
  347. void kvm_release_page_clean(struct page *page);
  348. void kvm_release_page_dirty(struct page *page);
  /*
   * Guest memory accessors.  The *_page variants take a gfn plus an int
   * offset/len; the others take a gpa and an unsigned long length.
   */
  349. int kvm_read_guest_page(struct kvm *kvm, gfn_t gfn, void *data, int offset,
  350. int len);
  351. int kvm_read_guest(struct kvm *kvm, gpa_t gpa, void *data, unsigned long len);
  352. int kvm_write_guest_page(struct kvm *kvm, gfn_t gfn, const void *data,
  353. int offset, int len);
  354. int kvm_write_guest(struct kvm *kvm, gpa_t gpa, const void *data,
  355. unsigned long len);
  356. int kvm_clear_guest_page(struct kvm *kvm, gfn_t gfn, int offset, int len);
  357. int kvm_clear_guest(struct kvm *kvm, gpa_t gpa, unsigned long len);
  358. struct kvm_memory_slot *gfn_to_memslot(struct kvm *kvm, gfn_t gfn);
  359. int kvm_is_visible_gfn(struct kvm *kvm, gfn_t gfn);
  360. void mark_page_dirty(struct kvm *kvm, gfn_t gfn);
  /* vcpu scheduling, FPU and TLB helpers. */
  361. void kvm_vcpu_block(struct kvm_vcpu *vcpu);
  362. void kvm_resched(struct kvm_vcpu *vcpu);
  363. void kvm_load_guest_fpu(struct kvm_vcpu *vcpu);
  364. void kvm_put_guest_fpu(struct kvm_vcpu *vcpu);
  365. void kvm_flush_remote_tlbs(struct kvm *kvm);
  /*
   * Architecture hooks and ioctl back ends.  Everything in this group is
   * only declared here; the definitions live outside this header.  Each
   * function is declared exactly once: the original listing repeated
   * kvm_arch_vcpu_load(), kvm_arch_vcpu_put() and kvm_arch_destroy_vm().
   */

  /* ioctl dispatch: device, vcpu and VM level. */
  long kvm_arch_dev_ioctl(struct file *filp,
                          unsigned int ioctl, unsigned long arg);
  long kvm_arch_vcpu_ioctl(struct file *filp,
                           unsigned int ioctl, unsigned long arg);
  long kvm_arch_vm_ioctl(struct file *filp,
                         unsigned int ioctl, unsigned long arg);
  int kvm_dev_ioctl_check_extension(long ext);

  /* Dirty logging and memory-region ioctls. */
  int kvm_get_dirty_log(struct kvm *kvm,
                        struct kvm_dirty_log *log, int *is_dirty);
  int kvm_vm_ioctl_get_dirty_log(struct kvm *kvm,
                                 struct kvm_dirty_log *log);
  int kvm_vm_ioctl_set_memory_region(struct kvm *kvm,
                                     struct kvm_userspace_memory_region *mem,
                                     int user_alloc);

  /* Per-vcpu ioctl back ends. */
  int kvm_arch_vcpu_ioctl_get_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu);
  int kvm_arch_vcpu_ioctl_set_fpu(struct kvm_vcpu *vcpu, struct kvm_fpu *fpu);
  int kvm_arch_vcpu_ioctl_translate(struct kvm_vcpu *vcpu,
                                    struct kvm_translation *tr);
  int kvm_arch_vcpu_ioctl_get_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs);
  int kvm_arch_vcpu_ioctl_set_regs(struct kvm_vcpu *vcpu, struct kvm_regs *regs);
  int kvm_arch_vcpu_ioctl_get_sregs(struct kvm_vcpu *vcpu,
                                    struct kvm_sregs *sregs);
  int kvm_arch_vcpu_ioctl_set_sregs(struct kvm_vcpu *vcpu,
                                    struct kvm_sregs *sregs);
  int kvm_arch_vcpu_ioctl_debug_guest(struct kvm_vcpu *vcpu,
                                      struct kvm_debug_guest *dbg);
  int kvm_arch_vcpu_ioctl_run(struct kvm_vcpu *vcpu, struct kvm_run *kvm_run);

  /* Module-level init/exit of the architecture code. */
  int kvm_arch_init(void *opaque);
  void kvm_arch_exit(void);

  /* vcpu lifecycle and scheduling hooks. */
  int kvm_arch_vcpu_init(struct kvm_vcpu *vcpu);
  void kvm_arch_vcpu_uninit(struct kvm_vcpu *vcpu);
  void kvm_arch_vcpu_free(struct kvm_vcpu *vcpu);
  void kvm_arch_vcpu_load(struct kvm_vcpu *vcpu, int cpu);
  void kvm_arch_vcpu_put(struct kvm_vcpu *vcpu);
  struct kvm_vcpu *kvm_arch_vcpu_create(struct kvm *kvm, unsigned int id);
  int kvm_arch_vcpu_setup(struct kvm_vcpu *vcpu);
  void kvm_arch_vcpu_destroy(struct kvm_vcpu *vcpu);
  int kvm_arch_vcpu_reset(struct kvm_vcpu *vcpu);

  /* Hardware virtualization enable/disable and setup hooks. */
  void kvm_arch_hardware_enable(void *garbage);
  void kvm_arch_hardware_disable(void *garbage);
  int kvm_arch_hardware_setup(void);
  void kvm_arch_hardware_unsetup(void);
  void kvm_arch_check_processor_compat(void *rtn);

  /* VM lifecycle. */
  void kvm_free_physmem(struct kvm *kvm);
  struct kvm *kvm_arch_create_vm(void);
  void kvm_arch_destroy_vm(struct kvm *kvm);
  /*
   * Called on the way into guest execution: calls account_system_vtime()
   * for the current task and then sets PF_VCPU in its flags.  The
   * accounting call comes before the flag change; keep that order.
   * NOTE(review): presumably so time up to this point is charged before
   * the task is marked as running a vcpu -- confirm.
   */
  416. static inline void kvm_guest_enter(void)
  417. {
  418. account_system_vtime(current);
  419. current->flags |= PF_VCPU;
  420. }
  /*
   * Counterpart of kvm_guest_enter(): calls account_system_vtime() for the
   * current task and then clears PF_VCPU from its flags.  As on entry, the
   * accounting call runs while the flag still has its previous value; keep
   * that order.
   */
  421. static inline void kvm_guest_exit(void)
  422. {
  423. account_system_vtime(current);
  424. current->flags &= ~PF_VCPU;
  425. }
  426. static inline int memslot_id(struct kvm *kvm, struct kvm_memory_slot *slot)
  427. {
  428. return slot - kvm->memslots;
  429. }
  /* Selects whether a statistic belongs to a VM or to a vcpu. */
  430. enum kvm_stat_kind {
  431. KVM_STAT_VM,
  432. KVM_STAT_VCPU,
  433. };
  /*
   * Describes one exported statistic: its name, an int offset, its kind and
   * the dentry associated with it.
   * NOTE(review): `offset` is presumably a byte offset into the per-VM or
   * per-vcpu structure selected by `kind` -- confirm where
   * debugfs_entries[] is defined.
   */
  434. struct kvm_stats_debugfs_item {
  435. const char *name;
  436. int offset;
  437. enum kvm_stat_kind kind;
  438. struct dentry *dentry;
  439. };
  /* Table of statistics; defined outside this header, length not visible here. */
  440. extern struct kvm_stats_debugfs_item debugfs_entries[];
  441. #endif