kvm_host.h

/*
 * Kernel-based Virtual Machine driver for Linux
 *
 * This header defines architecture specific interfaces, x86 version
 *
 * This work is licensed under the terms of the GNU GPL, version 2. See
 * the COPYING file in the top-level directory.
 *
 */

#ifndef _ASM_X86_KVM_HOST_H
#define _ASM_X86_KVM_HOST_H

#include <linux/types.h>
#include <linux/mm.h>
#include <linux/mmu_notifier.h>
#include <linux/tracepoint.h>
#include <linux/cpumask.h>

#include <linux/kvm.h>
#include <linux/kvm_para.h>
#include <linux/kvm_types.h>

#include <asm/pvclock-abi.h>
#include <asm/desc.h>
#include <asm/mtrr.h>
#include <asm/msr-index.h>

#define KVM_MAX_VCPUS 254
#define KVM_SOFT_MAX_VCPUS 64
#define KVM_MEMORY_SLOTS 32
/* memory slots that are not exposed to userspace */
#define KVM_PRIVATE_MEM_SLOTS 4

#define KVM_MMIO_SIZE 16

#define KVM_PIO_PAGE_OFFSET 1
#define KVM_COALESCED_MMIO_PAGE_OFFSET 2

#define CR0_RESERVED_BITS                                               \
        (~(unsigned long)(X86_CR0_PE | X86_CR0_MP | X86_CR0_EM | X86_CR0_TS \
                          | X86_CR0_ET | X86_CR0_NE | X86_CR0_WP | X86_CR0_AM \
                          | X86_CR0_NW | X86_CR0_CD | X86_CR0_PG))

#define CR3_PAE_RESERVED_BITS ((X86_CR3_PWT | X86_CR3_PCD) - 1)
#define CR3_NONPAE_RESERVED_BITS ((PAGE_SIZE-1) & ~(X86_CR3_PWT | X86_CR3_PCD))
#define CR3_L_MODE_RESERVED_BITS (CR3_NONPAE_RESERVED_BITS |   \
                                  0xFFFFFF0000000000ULL)

#define CR4_RESERVED_BITS                                               \
        (~(unsigned long)(X86_CR4_VME | X86_CR4_PVI | X86_CR4_TSD | X86_CR4_DE\
                          | X86_CR4_PSE | X86_CR4_PAE | X86_CR4_MCE     \
                          | X86_CR4_PGE | X86_CR4_PCE | X86_CR4_OSFXSR  \
                          | X86_CR4_OSXSAVE | X86_CR4_SMEP | X86_CR4_RDWRGSFS \
                          | X86_CR4_OSXMMEXCPT | X86_CR4_VMXE))

#define CR8_RESERVED_BITS (~(unsigned long)X86_CR8_TPR)
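
/*
 * Editor's illustration (not part of the original header): the
 * *_RESERVED_BITS masks are ANDed against a value the guest tries to
 * load; any nonzero result means the write must fail. A hypothetical
 * checker:
 *
 *        static inline bool cr4_reserved_bits_set(unsigned long cr4)
 *        {
 *                return (cr4 & CR4_RESERVED_BITS) != 0;
 *        }
 *
 * kvm_set_cr4(), declared later in this header, rejects the write in
 * that case so the caller can inject #GP.
 */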

#define INVALID_PAGE (~(hpa_t)0)
#define VALID_PAGE(x) ((x) != INVALID_PAGE)

#define UNMAPPED_GVA (~(gpa_t)0)

/* KVM Hugepage definitions for x86 */
#define KVM_NR_PAGE_SIZES 3
#define KVM_HPAGE_GFN_SHIFT(x) (((x) - 1) * 9)
#define KVM_HPAGE_SHIFT(x) (PAGE_SHIFT + KVM_HPAGE_GFN_SHIFT(x))
#define KVM_HPAGE_SIZE(x) (1UL << KVM_HPAGE_SHIFT(x))
#define KVM_HPAGE_MASK(x) (~(KVM_HPAGE_SIZE(x) - 1))
#define KVM_PAGES_PER_HPAGE(x) (KVM_HPAGE_SIZE(x) / PAGE_SIZE)
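
/*
 * Worked example (editor's note, assuming PAGE_SHIFT == 12): each paging
 * level adds 9 bits of gfn, so
 *
 *        KVM_HPAGE_SIZE(1) == 1UL << 12   -> 4 KiB (normal page)
 *        KVM_HPAGE_SIZE(2) == 1UL << 21   -> 2 MiB (large page)
 *        KVM_HPAGE_SIZE(3) == 1UL << 30   -> 1 GiB (huge page)
 *
 * and KVM_PAGES_PER_HPAGE(2) == 512, matching the 512 entries per table.
 */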

#define DE_VECTOR 0
#define DB_VECTOR 1
#define BP_VECTOR 3
#define OF_VECTOR 4
#define BR_VECTOR 5
#define UD_VECTOR 6
#define NM_VECTOR 7
#define DF_VECTOR 8
#define TS_VECTOR 10
#define NP_VECTOR 11
#define SS_VECTOR 12
#define GP_VECTOR 13
#define PF_VECTOR 14
#define MF_VECTOR 16
#define MC_VECTOR 18

#define SELECTOR_TI_MASK (1 << 2)
#define SELECTOR_RPL_MASK 0x03

#define IOPL_SHIFT 12

#define KVM_PERMILLE_MMU_PAGES 20
#define KVM_MIN_ALLOC_MMU_PAGES 64
#define KVM_MMU_HASH_SHIFT 10
#define KVM_NUM_MMU_PAGES (1 << KVM_MMU_HASH_SHIFT)
#define KVM_MIN_FREE_MMU_PAGES 5
#define KVM_REFILL_PAGES 25
#define KVM_MAX_CPUID_ENTRIES 80
#define KVM_NR_FIXED_MTRR_REGION 88
#define KVM_NR_VAR_MTRR 8

#define ASYNC_PF_PER_VCPU 64

extern raw_spinlock_t kvm_lock;
extern struct list_head vm_list;

struct kvm_vcpu;
struct kvm;
struct kvm_async_pf;

enum kvm_reg {
        VCPU_REGS_RAX = 0,
        VCPU_REGS_RCX = 1,
        VCPU_REGS_RDX = 2,
        VCPU_REGS_RBX = 3,
        VCPU_REGS_RSP = 4,
        VCPU_REGS_RBP = 5,
        VCPU_REGS_RSI = 6,
        VCPU_REGS_RDI = 7,
#ifdef CONFIG_X86_64
        VCPU_REGS_R8 = 8,
        VCPU_REGS_R9 = 9,
        VCPU_REGS_R10 = 10,
        VCPU_REGS_R11 = 11,
        VCPU_REGS_R12 = 12,
        VCPU_REGS_R13 = 13,
        VCPU_REGS_R14 = 14,
        VCPU_REGS_R15 = 15,
#endif
        VCPU_REGS_RIP,
        NR_VCPU_REGS
};

enum kvm_reg_ex {
        VCPU_EXREG_PDPTR = NR_VCPU_REGS,
        VCPU_EXREG_CR3,
        VCPU_EXREG_RFLAGS,
        VCPU_EXREG_CPL,
        VCPU_EXREG_SEGMENTS,
};

enum {
        VCPU_SREG_ES,
        VCPU_SREG_CS,
        VCPU_SREG_SS,
        VCPU_SREG_DS,
        VCPU_SREG_FS,
        VCPU_SREG_GS,
        VCPU_SREG_TR,
        VCPU_SREG_LDTR,
};

#include <asm/kvm_emulate.h>

#define KVM_NR_MEM_OBJS 40

#define KVM_NR_DB_REGS 4

#define DR6_BD (1 << 13)
#define DR6_BS (1 << 14)
#define DR6_FIXED_1 0xffff0ff0
#define DR6_VOLATILE 0x0000e00f

#define DR7_BP_EN_MASK 0x000000ff
#define DR7_GE (1 << 9)
#define DR7_GD (1 << 13)
#define DR7_FIXED_1 0x00000400
#define DR7_VOLATILE 0xffff23ff
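
/*
 * Editor's illustration: DR6_FIXED_1/DR7_FIXED_1 hold bits that always
 * read as 1, and the VOLATILE masks hold the guest-writable bits, so a
 * guest write is normalized as
 *
 *        vcpu->arch.dr6 = (val & DR6_VOLATILE) | DR6_FIXED_1;
 *        vcpu->arch.dr7 = (val & DR7_VOLATILE) | DR7_FIXED_1;
 *
 * mirroring what kvm_set_dr(), declared later in this header, does.
 */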

/*
 * We don't want allocation failures within the mmu code, so we preallocate
 * enough memory for a single page fault in a cache.
 */
struct kvm_mmu_memory_cache {
        int nobjs;
        void *objects[KVM_NR_MEM_OBJS];
};
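
/*
 * Usage sketch (editor's illustration, simplified from the mmu code;
 * 'some_cache' is a hypothetical kmem cache): the cache is topped up
 * while sleeping is still legal, then objects are taken with no chance
 * of failure inside the fault path:
 *
 *        while (cache->nobjs < KVM_NR_MEM_OBJS) {
 *                void *obj = kmem_cache_zalloc(some_cache, GFP_KERNEL);
 *                if (!obj)
 *                        return -ENOMEM;
 *                cache->objects[cache->nobjs++] = obj;
 *        }
 *        ...
 *        obj = cache->objects[--cache->nobjs];   // cannot fail
 */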

#define NR_PTE_CHAIN_ENTRIES 5

struct kvm_pte_chain {
        u64 *parent_ptes[NR_PTE_CHAIN_ENTRIES];
        struct hlist_node link;
};

/*
 * kvm_mmu_page_role, below, is defined as:
 *
 *   bits 0:3 - page table level for this shadow (1-4)
 *   bit 4 - whether the guest uses PAE paging (cr4_pae)
 *   bits 5:6 - page table quadrant for 2-level guests
 *   bits 7:12 - padding, kept only for nice hex output
 *   bit 13 - direct mapping of virtual to physical mapping at gfn
 *            used for real mode and two-dimensional paging
 *   bits 14:16 - common access permissions for all ptes in this shadow page
 */
union kvm_mmu_page_role {
        unsigned word;
        struct {
                unsigned level:4;
                unsigned cr4_pae:1;
                unsigned quadrant:2;
                unsigned pad_for_nice_hex_output:6;
                unsigned direct:1;
                unsigned access:3;
                unsigned invalid:1;
                unsigned nxe:1;
                unsigned cr0_wp:1;
                unsigned smep_andnot_wp:1;
        };
};
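
/*
 * Editor's illustration: because the bitfields are overlaid on 'word',
 * two roles can be compared in a single operation, which is how the mmu
 * decides whether an existing shadow page can be reused:
 *
 *        if (sp->role.word == role.word)
 *                ; // same level/quadrant/access/..., page is compatible
 */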

struct kvm_mmu_page {
        struct list_head link;
        struct hlist_node hash_link;

        /*
         * The following two entries are used to key the shadow page in the
         * hash table.
         */
        gfn_t gfn;
        union kvm_mmu_page_role role;

        u64 *spt;
        /* hold the gfn of each spte inside spt */
        gfn_t *gfns;
        /*
         * One bit set per slot which has memory
         * in this shadow page.
         */
        DECLARE_BITMAP(slot_bitmap, KVM_MEMORY_SLOTS + KVM_PRIVATE_MEM_SLOTS);
        bool unsync;
        int root_count;          /* Currently serving as active root */
        unsigned int unsync_children;
        unsigned long parent_ptes;      /* Reverse mapping for parent_pte */
        DECLARE_BITMAP(unsync_child_bitmap, 512);

#ifdef CONFIG_X86_32
        int clear_spte_count;
#endif

        struct rcu_head rcu;
};

struct kvm_pv_mmu_op_buffer {
        void *ptr;
        unsigned len;
        unsigned processed;
        char buf[512] __aligned(sizeof(long));
};

struct kvm_pio_request {
        unsigned long count;
        int in;
        int port;
        int size;
};

/*
 * x86 supports 3 paging modes (4-level 64-bit, 3-level 64-bit, and 2-level
 * 32-bit). The kvm_mmu structure abstracts the details of the current mmu
 * mode.
 */
struct kvm_mmu {
        void (*new_cr3)(struct kvm_vcpu *vcpu);
        void (*set_cr3)(struct kvm_vcpu *vcpu, unsigned long root);
        unsigned long (*get_cr3)(struct kvm_vcpu *vcpu);
        u64 (*get_pdptr)(struct kvm_vcpu *vcpu, int index);
        int (*page_fault)(struct kvm_vcpu *vcpu, gva_t gva, u32 err,
                          bool prefault);
        void (*inject_page_fault)(struct kvm_vcpu *vcpu,
                                  struct x86_exception *fault);
        void (*free)(struct kvm_vcpu *vcpu);
        gpa_t (*gva_to_gpa)(struct kvm_vcpu *vcpu, gva_t gva, u32 access,
                            struct x86_exception *exception);
        gpa_t (*translate_gpa)(struct kvm_vcpu *vcpu, gpa_t gpa, u32 access);
        int (*sync_page)(struct kvm_vcpu *vcpu,
                         struct kvm_mmu_page *sp);
        void (*invlpg)(struct kvm_vcpu *vcpu, gva_t gva);
        void (*update_pte)(struct kvm_vcpu *vcpu, struct kvm_mmu_page *sp,
                           u64 *spte, const void *pte);
        hpa_t root_hpa;
        int root_level;
        int shadow_root_level;
        union kvm_mmu_page_role base_role;
        bool direct_map;

        u64 *pae_root;
        u64 *lm_root;
        u64 rsvd_bits_mask[2][4];

        bool nx;

        u64 pdptrs[4]; /* pae */
};
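
/*
 * Editor's illustration (a sketch, not part of the original header):
 * callers never test the paging mode by hand; they go through the
 * function pointers. Translating a guest virtual address looks roughly
 * like this (PFERR_USER_MASK comes from KVM's mmu code):
 *
 *        struct x86_exception exception;
 *        gpa_t gpa = vcpu->arch.walk_mmu->gva_to_gpa(vcpu, gva,
 *                                                    PFERR_USER_MASK,
 *                                                    &exception);
 *        if (gpa == UNMAPPED_GVA)
 *                ; // failed; 'exception' describes the fault to inject
 *
 * This is essentially what kvm_mmu_gva_to_gpa_read(), declared further
 * down, wraps.
 */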

struct kvm_vcpu_arch {
        /*
         * rip and regs accesses must go through
         * kvm_{register,rip}_{read,write} functions.
         */
        unsigned long regs[NR_VCPU_REGS];
        u32 regs_avail;
        u32 regs_dirty;

        unsigned long cr0;
        unsigned long cr0_guest_owned_bits;
        unsigned long cr2;
        unsigned long cr3;
        unsigned long cr4;
        unsigned long cr4_guest_owned_bits;
        unsigned long cr8;
        u32 hflags;
        u64 efer;
        u64 apic_base;
        struct kvm_lapic *apic;    /* kernel irqchip context */
        int32_t apic_arb_prio;
        int mp_state;
        int sipi_vector;
        u64 ia32_misc_enable_msr;
        bool tpr_access_reporting;

        /*
         * Paging state of the vcpu
         *
         * If the vcpu runs in guest mode with two-level paging, this still
         * saves the paging mode of the L1 guest. This context is always
         * used to handle faults.
         */
        struct kvm_mmu mmu;

        /*
         * Paging state of an L2 guest (used for nested npt)
         *
         * This context will save all necessary information to walk page
         * tables of an L2 guest. This context is only initialized for page
         * table walking and not for faulting since we never handle L2 page
         * faults on the host.
         */
        struct kvm_mmu nested_mmu;

        /*
         * Pointer to the mmu context currently used for
         * gva_to_gpa translations.
         */
        struct kvm_mmu *walk_mmu;

        /* only needed in kvm_pv_mmu_op() path, but it's hot so
         * put it here to avoid allocation */
        struct kvm_pv_mmu_op_buffer mmu_op_buffer;

        struct kvm_mmu_memory_cache mmu_pte_list_desc_cache;
        struct kvm_mmu_memory_cache mmu_page_cache;
        struct kvm_mmu_memory_cache mmu_page_header_cache;

        gfn_t last_pt_write_gfn;
        int last_pt_write_count;
        u64 *last_pte_updated;

        struct fpu guest_fpu;
        u64 xcr0;

        struct kvm_pio_request pio;
        void *pio_data;

        u8 event_exit_inst_len;

        struct kvm_queued_exception {
                bool pending;
                bool has_error_code;
                bool reinject;
                u8 nr;
                u32 error_code;
        } exception;

        struct kvm_queued_interrupt {
                bool pending;
                bool soft;
                u8 nr;
        } interrupt;

        int halt_request; /* real mode on Intel only */

        int cpuid_nent;
        struct kvm_cpuid_entry2 cpuid_entries[KVM_MAX_CPUID_ENTRIES];

        /* emulate context */
        struct x86_emulate_ctxt emulate_ctxt;
        bool emulate_regs_need_sync_to_vcpu;
        bool emulate_regs_need_sync_from_vcpu;

        gpa_t time;
        struct pvclock_vcpu_time_info hv_clock;
        unsigned int hw_tsc_khz;
        unsigned int time_offset;
        struct page *time_page;

        struct {
                u64 msr_val;
                u64 last_steal;
                u64 accum_steal;
                struct gfn_to_hva_cache stime;
                struct kvm_steal_time steal;
        } st;

        u64 last_guest_tsc;
        u64 last_kernel_ns;
        u64 last_tsc_nsec;
        u64 last_tsc_write;
        u32 virtual_tsc_khz;
        bool tsc_catchup;
        u32 tsc_catchup_mult;
        s8 tsc_catchup_shift;

        atomic_t nmi_queued;  /* unprocessed asynchronous NMIs */
        unsigned nmi_pending; /* NMI queued after currently running handler */
        bool nmi_injected;    /* Trying to inject an NMI this entry */

        struct mtrr_state_type mtrr_state;
        u32 pat;

        int switch_db_regs;
        unsigned long db[KVM_NR_DB_REGS];
        unsigned long dr6;
        unsigned long dr7;
        unsigned long eff_db[KVM_NR_DB_REGS];

        u64 mcg_cap;
        u64 mcg_status;
        u64 mcg_ctl;
        u64 *mce_banks;

        /* Cache MMIO info */
        u64 mmio_gva;
        unsigned access;
        gfn_t mmio_gfn;

        /* used for guest single stepping over the given code position */
        unsigned long singlestep_rip;

        /* fields used by HYPER-V emulation */
        u64 hv_vapic;

        cpumask_var_t wbinvd_dirty_mask;

        unsigned long last_retry_eip;
        unsigned long last_retry_addr;

        struct {
                bool halted;
                gfn_t gfns[roundup_pow_of_two(ASYNC_PF_PER_VCPU)];
                struct gfn_to_hva_cache data;
                u64 msr_val;
                u32 id;
                bool send_user_only;
        } apf;
};
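
/*
 * Editor's illustration: regs_avail and regs_dirty above are bitmasks
 * indexed by enum kvm_reg, letting vendor code cache guest registers
 * lazily. The read accessor is built on them roughly as follows, which
 * is why the comment at the top of the struct insists on going through
 * the kvm_{register,rip}_{read,write} helpers:
 *
 *        static inline unsigned long kvm_register_read(struct kvm_vcpu *vcpu,
 *                                                      enum kvm_reg reg)
 *        {
 *                if (!test_bit(reg, (unsigned long *)&vcpu->arch.regs_avail))
 *                        kvm_x86_ops->cache_reg(vcpu, reg);
 *                return vcpu->arch.regs[reg];
 *        }
 */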

struct kvm_arch {
        unsigned int n_used_mmu_pages;
        unsigned int n_requested_mmu_pages;
        unsigned int n_max_mmu_pages;
        unsigned int indirect_shadow_pages;
        atomic_t invlpg_counter;
        /*
         * Hash table of struct kvm_mmu_page.
         */
        struct hlist_head mmu_page_hash[KVM_NUM_MMU_PAGES];
        struct list_head active_mmu_pages;
        struct list_head assigned_dev_head;
        struct iommu_domain *iommu_domain;
        int iommu_flags;
        struct kvm_pic *vpic;
        struct kvm_ioapic *vioapic;
        struct kvm_pit *vpit;
        int vapics_in_nmi_mode;

        unsigned int tss_addr;
        struct page *apic_access_page;

        gpa_t wall_clock;

        struct page *ept_identity_pagetable;
        bool ept_identity_pagetable_done;
        gpa_t ept_identity_map_addr;

        unsigned long irq_sources_bitmap;
        s64 kvmclock_offset;
        raw_spinlock_t tsc_write_lock;
        u64 last_tsc_nsec;
        u64 last_tsc_offset;
        u64 last_tsc_write;

        struct kvm_xen_hvm_config xen_hvm_config;

        /* fields used by HYPER-V emulation */
        u64 hv_guest_os_id;
        u64 hv_hypercall;

        atomic_t reader_counter;

#ifdef CONFIG_KVM_MMU_AUDIT
        int audit_point;
#endif
};

struct kvm_vm_stat {
        u32 mmu_shadow_zapped;
        u32 mmu_pte_write;
        u32 mmu_pte_updated;
        u32 mmu_pde_zapped;
        u32 mmu_flooded;
        u32 mmu_recycled;
        u32 mmu_cache_miss;
        u32 mmu_unsync;
        u32 remote_tlb_flush;
        u32 lpages;
};

struct kvm_vcpu_stat {
        u32 pf_fixed;
        u32 pf_guest;
        u32 tlb_flush;
        u32 invlpg;

        u32 exits;
        u32 io_exits;
        u32 mmio_exits;
        u32 signal_exits;
        u32 irq_window_exits;
        u32 nmi_window_exits;
        u32 halt_exits;
        u32 halt_wakeup;
        u32 request_irq_exits;
        u32 irq_exits;
        u32 host_state_reload;
        u32 efer_reload;
        u32 fpu_reload;
        u32 insn_emulation;
        u32 insn_emulation_fail;
        u32 hypercalls;
        u32 irq_injections;
        u32 nmi_injections;
};

struct x86_instruction_info;

struct kvm_x86_ops {
        int (*cpu_has_kvm_support)(void);          /* __init */
        int (*disabled_by_bios)(void);             /* __init */
        int (*hardware_enable)(void *dummy);
        void (*hardware_disable)(void *dummy);
        void (*check_processor_compatibility)(void *rtn);
        int (*hardware_setup)(void);               /* __init */
        void (*hardware_unsetup)(void);            /* __exit */
        bool (*cpu_has_accelerated_tpr)(void);
        void (*cpuid_update)(struct kvm_vcpu *vcpu);

        /* Create, but do not attach this VCPU */
        struct kvm_vcpu *(*vcpu_create)(struct kvm *kvm, unsigned id);
        void (*vcpu_free)(struct kvm_vcpu *vcpu);
        int (*vcpu_reset)(struct kvm_vcpu *vcpu);

        void (*prepare_guest_switch)(struct kvm_vcpu *vcpu);
        void (*vcpu_load)(struct kvm_vcpu *vcpu, int cpu);
        void (*vcpu_put)(struct kvm_vcpu *vcpu);

        void (*set_guest_debug)(struct kvm_vcpu *vcpu,
                                struct kvm_guest_debug *dbg);
        int (*get_msr)(struct kvm_vcpu *vcpu, u32 msr_index, u64 *pdata);
        int (*set_msr)(struct kvm_vcpu *vcpu, u32 msr_index, u64 data);
        u64 (*get_segment_base)(struct kvm_vcpu *vcpu, int seg);
        void (*get_segment)(struct kvm_vcpu *vcpu,
                            struct kvm_segment *var, int seg);
        int (*get_cpl)(struct kvm_vcpu *vcpu);
        void (*set_segment)(struct kvm_vcpu *vcpu,
                            struct kvm_segment *var, int seg);
        void (*get_cs_db_l_bits)(struct kvm_vcpu *vcpu, int *db, int *l);
        void (*decache_cr0_guest_bits)(struct kvm_vcpu *vcpu);
        void (*decache_cr3)(struct kvm_vcpu *vcpu);
        void (*decache_cr4_guest_bits)(struct kvm_vcpu *vcpu);
        void (*set_cr0)(struct kvm_vcpu *vcpu, unsigned long cr0);
        void (*set_cr3)(struct kvm_vcpu *vcpu, unsigned long cr3);
        int (*set_cr4)(struct kvm_vcpu *vcpu, unsigned long cr4);
        void (*set_efer)(struct kvm_vcpu *vcpu, u64 efer);
        void (*get_idt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
        void (*set_idt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
        void (*get_gdt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
        void (*set_gdt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
        void (*set_dr7)(struct kvm_vcpu *vcpu, unsigned long value);
        void (*cache_reg)(struct kvm_vcpu *vcpu, enum kvm_reg reg);
        unsigned long (*get_rflags)(struct kvm_vcpu *vcpu);
        void (*set_rflags)(struct kvm_vcpu *vcpu, unsigned long rflags);
        void (*fpu_activate)(struct kvm_vcpu *vcpu);
        void (*fpu_deactivate)(struct kvm_vcpu *vcpu);

        void (*tlb_flush)(struct kvm_vcpu *vcpu);

        void (*run)(struct kvm_vcpu *vcpu);
        int (*handle_exit)(struct kvm_vcpu *vcpu);
        void (*skip_emulated_instruction)(struct kvm_vcpu *vcpu);
        void (*set_interrupt_shadow)(struct kvm_vcpu *vcpu, int mask);
        u32 (*get_interrupt_shadow)(struct kvm_vcpu *vcpu, int mask);
        void (*patch_hypercall)(struct kvm_vcpu *vcpu,
                                unsigned char *hypercall_addr);
        void (*set_irq)(struct kvm_vcpu *vcpu);
        void (*set_nmi)(struct kvm_vcpu *vcpu);
        void (*queue_exception)(struct kvm_vcpu *vcpu, unsigned nr,
                                bool has_error_code, u32 error_code,
                                bool reinject);
        void (*cancel_injection)(struct kvm_vcpu *vcpu);
        int (*interrupt_allowed)(struct kvm_vcpu *vcpu);
        int (*nmi_allowed)(struct kvm_vcpu *vcpu);
        bool (*get_nmi_mask)(struct kvm_vcpu *vcpu);
        void (*set_nmi_mask)(struct kvm_vcpu *vcpu, bool masked);
        void (*enable_nmi_window)(struct kvm_vcpu *vcpu);
        void (*enable_irq_window)(struct kvm_vcpu *vcpu);
        void (*update_cr8_intercept)(struct kvm_vcpu *vcpu, int tpr, int irr);
        int (*set_tss_addr)(struct kvm *kvm, unsigned int addr);
        int (*get_tdp_level)(void);
        u64 (*get_mt_mask)(struct kvm_vcpu *vcpu, gfn_t gfn, bool is_mmio);
        int (*get_lpage_level)(void);
        bool (*rdtscp_supported)(void);
        void (*adjust_tsc_offset)(struct kvm_vcpu *vcpu, s64 adjustment);

        void (*set_tdp_cr3)(struct kvm_vcpu *vcpu, unsigned long cr3);

        void (*set_supported_cpuid)(u32 func, struct kvm_cpuid_entry2 *entry);

        bool (*has_wbinvd_exit)(void);

        void (*set_tsc_khz)(struct kvm_vcpu *vcpu, u32 user_tsc_khz);
        void (*write_tsc_offset)(struct kvm_vcpu *vcpu, u64 offset);
        u64 (*compute_tsc_offset)(struct kvm_vcpu *vcpu, u64 target_tsc);
        u64 (*read_l1_tsc)(struct kvm_vcpu *vcpu);

        void (*get_exit_info)(struct kvm_vcpu *vcpu, u64 *info1, u64 *info2);

        int (*check_intercept)(struct kvm_vcpu *vcpu,
                               struct x86_instruction_info *info,
                               enum x86_intercept_stage stage);
};
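
/*
 * Editor's illustration: kvm_x86_ops is the vendor dispatch table;
 * kvm-intel.ko and kvm-amd.ko each fill one in and register it, roughly
 * (the handler names on the right are hypothetical VMX functions):
 *
 *        static struct kvm_x86_ops vmx_x86_ops = {
 *                .cpu_has_kvm_support = cpu_has_kvm_support,
 *                .hardware_enable = hardware_enable,
 *                .vcpu_create = vmx_create_vcpu,
 *                .run = vmx_vcpu_run,
 *                // ...one entry per hook...
 *        };
 *
 * Common code then calls kvm_x86_ops->run(vcpu) and friends without
 * knowing whether VMX or SVM is underneath.
 */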

struct kvm_arch_async_pf {
        u32 token;
        gfn_t gfn;
        unsigned long cr3;
        bool direct_map;
};

extern struct kvm_x86_ops *kvm_x86_ops;

int kvm_mmu_module_init(void);
void kvm_mmu_module_exit(void);

void kvm_mmu_destroy(struct kvm_vcpu *vcpu);
int kvm_mmu_create(struct kvm_vcpu *vcpu);
int kvm_mmu_setup(struct kvm_vcpu *vcpu);
void kvm_mmu_set_mask_ptes(u64 user_mask, u64 accessed_mask,
                u64 dirty_mask, u64 nx_mask, u64 x_mask);

int kvm_mmu_reset_context(struct kvm_vcpu *vcpu);
void kvm_mmu_slot_remove_write_access(struct kvm *kvm, int slot);
void kvm_mmu_zap_all(struct kvm *kvm);
unsigned int kvm_mmu_calculate_mmu_pages(struct kvm *kvm);
void kvm_mmu_change_mmu_pages(struct kvm *kvm, unsigned int kvm_nr_mmu_pages);

int load_pdptrs(struct kvm_vcpu *vcpu, struct kvm_mmu *mmu, unsigned long cr3);

int emulator_write_phys(struct kvm_vcpu *vcpu, gpa_t gpa,
                        const void *val, int bytes);
int kvm_pv_mmu_op(struct kvm_vcpu *vcpu, unsigned long bytes,
                  gpa_t addr, unsigned long *ret);
u8 kvm_get_guest_memory_type(struct kvm_vcpu *vcpu, gfn_t gfn);

extern bool tdp_enabled;

u64 vcpu_tsc_khz(struct kvm_vcpu *vcpu);

/* control of guest tsc rate supported? */
extern bool kvm_has_tsc_control;
/* minimum supported tsc_khz for guests */
extern u32 kvm_min_guest_tsc_khz;
/* maximum supported tsc_khz for guests */
extern u32 kvm_max_guest_tsc_khz;

enum emulation_result {
        EMULATE_DONE,         /* no further processing */
        EMULATE_DO_MMIO,      /* kvm_run filled with mmio request */
        EMULATE_FAIL,         /* can't emulate this instruction */
};

#define EMULTYPE_NO_DECODE          (1 << 0)
#define EMULTYPE_TRAP_UD            (1 << 1)
#define EMULTYPE_SKIP               (1 << 2)
#define EMULTYPE_RETRY              (1 << 3)
int x86_emulate_instruction(struct kvm_vcpu *vcpu, unsigned long cr2,
                            int emulation_type, void *insn, int insn_len);

static inline int emulate_instruction(struct kvm_vcpu *vcpu,
                        int emulation_type)
{
        return x86_emulate_instruction(vcpu, 0, emulation_type, NULL, 0);
}
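
/*
 * Usage sketch (editor's illustration): a vendor exit handler that meets
 * an instruction it cannot handle natively typically does:
 *
 *        switch (emulate_instruction(vcpu, 0)) {
 *        case EMULATE_DONE:
 *                return 1;        // handled; re-enter the guest
 *        case EMULATE_DO_MMIO:
 *                return 0;        // exit to userspace, kvm_run holds mmio
 *        case EMULATE_FAIL:
 *        default:
 *                return 0;        // report emulation failure to userspace
 *        }
 */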

void kvm_enable_efer_bits(u64);
int kvm_get_msr(struct kvm_vcpu *vcpu, u32 msr_index, u64 *data);
int kvm_set_msr(struct kvm_vcpu *vcpu, u32 msr_index, u64 data);

struct x86_emulate_ctxt;

int kvm_fast_pio_out(struct kvm_vcpu *vcpu, int size, unsigned short port);
void kvm_emulate_cpuid(struct kvm_vcpu *vcpu);
int kvm_emulate_halt(struct kvm_vcpu *vcpu);
int kvm_emulate_wbinvd(struct kvm_vcpu *vcpu);

void kvm_get_segment(struct kvm_vcpu *vcpu, struct kvm_segment *var, int seg);
int kvm_load_segment_descriptor(struct kvm_vcpu *vcpu, u16 selector, int seg);

int kvm_task_switch(struct kvm_vcpu *vcpu, u16 tss_selector, int reason,
                    bool has_error_code, u32 error_code);

int kvm_set_cr0(struct kvm_vcpu *vcpu, unsigned long cr0);
int kvm_set_cr3(struct kvm_vcpu *vcpu, unsigned long cr3);
int kvm_set_cr4(struct kvm_vcpu *vcpu, unsigned long cr4);
int kvm_set_cr8(struct kvm_vcpu *vcpu, unsigned long cr8);
int kvm_set_dr(struct kvm_vcpu *vcpu, int dr, unsigned long val);
int kvm_get_dr(struct kvm_vcpu *vcpu, int dr, unsigned long *val);
unsigned long kvm_get_cr8(struct kvm_vcpu *vcpu);
void kvm_lmsw(struct kvm_vcpu *vcpu, unsigned long msw);
void kvm_get_cs_db_l_bits(struct kvm_vcpu *vcpu, int *db, int *l);
int kvm_set_xcr(struct kvm_vcpu *vcpu, u32 index, u64 xcr);

int kvm_get_msr_common(struct kvm_vcpu *vcpu, u32 msr, u64 *pdata);
int kvm_set_msr_common(struct kvm_vcpu *vcpu, u32 msr, u64 data);

unsigned long kvm_get_rflags(struct kvm_vcpu *vcpu);
void kvm_set_rflags(struct kvm_vcpu *vcpu, unsigned long rflags);

void kvm_queue_exception(struct kvm_vcpu *vcpu, unsigned nr);
void kvm_queue_exception_e(struct kvm_vcpu *vcpu, unsigned nr, u32 error_code);
void kvm_requeue_exception(struct kvm_vcpu *vcpu, unsigned nr);
void kvm_requeue_exception_e(struct kvm_vcpu *vcpu, unsigned nr, u32 error_code);
void kvm_inject_page_fault(struct kvm_vcpu *vcpu, struct x86_exception *fault);
int kvm_read_guest_page_mmu(struct kvm_vcpu *vcpu, struct kvm_mmu *mmu,
                            gfn_t gfn, void *data, int offset, int len,
                            u32 access);
void kvm_propagate_fault(struct kvm_vcpu *vcpu, struct x86_exception *fault);
bool kvm_require_cpl(struct kvm_vcpu *vcpu, int required_cpl);

int kvm_pic_set_irq(void *opaque, int irq, int level);

void kvm_inject_nmi(struct kvm_vcpu *vcpu);

int fx_init(struct kvm_vcpu *vcpu);

void kvm_mmu_flush_tlb(struct kvm_vcpu *vcpu);
void kvm_mmu_pte_write(struct kvm_vcpu *vcpu, gpa_t gpa,
                       const u8 *new, int bytes,
                       bool guest_initiated);
int kvm_mmu_unprotect_page(struct kvm *kvm, gfn_t gfn);
int kvm_mmu_unprotect_page_virt(struct kvm_vcpu *vcpu, gva_t gva);
void __kvm_mmu_free_some_pages(struct kvm_vcpu *vcpu);
int kvm_mmu_load(struct kvm_vcpu *vcpu);
void kvm_mmu_unload(struct kvm_vcpu *vcpu);
void kvm_mmu_sync_roots(struct kvm_vcpu *vcpu);
gpa_t kvm_mmu_gva_to_gpa_read(struct kvm_vcpu *vcpu, gva_t gva,
                              struct x86_exception *exception);
gpa_t kvm_mmu_gva_to_gpa_fetch(struct kvm_vcpu *vcpu, gva_t gva,
                               struct x86_exception *exception);
gpa_t kvm_mmu_gva_to_gpa_write(struct kvm_vcpu *vcpu, gva_t gva,
                               struct x86_exception *exception);
gpa_t kvm_mmu_gva_to_gpa_system(struct kvm_vcpu *vcpu, gva_t gva,
                                struct x86_exception *exception);

int kvm_emulate_hypercall(struct kvm_vcpu *vcpu);

int kvm_mmu_page_fault(struct kvm_vcpu *vcpu, gva_t gva, u32 error_code,
                       void *insn, int insn_len);
void kvm_mmu_invlpg(struct kvm_vcpu *vcpu, gva_t gva);

void kvm_enable_tdp(void);
void kvm_disable_tdp(void);

int complete_pio(struct kvm_vcpu *vcpu);
bool kvm_check_iopl(struct kvm_vcpu *vcpu);

static inline struct kvm_mmu_page *page_header(hpa_t shadow_page)
{
        struct page *page = pfn_to_page(shadow_page >> PAGE_SHIFT);

        return (struct kvm_mmu_page *)page_private(page);
}
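
/*
 * Editor's illustration: page_header() recovers the shadow-page
 * descriptor from the physical address of a shadow page table. It relies
 * on the mmu having stashed the descriptor pointer in page->private when
 * the table page was allocated:
 *
 *        set_page_private(virt_to_page(sp->spt), (unsigned long)sp);
 *        ...
 *        struct kvm_mmu_page *sp = page_header(__pa(sptep));
 */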

static inline u16 kvm_read_ldt(void)
{
        u16 ldt;
        asm("sldt %0" : "=g"(ldt));
        return ldt;
}

static inline void kvm_load_ldt(u16 sel)
{
        asm("lldt %0" : : "rm"(sel));
}

#ifdef CONFIG_X86_64
static inline unsigned long read_msr(unsigned long msr)
{
        u64 value;

        rdmsrl(msr, value);
        return value;
}
#endif

static inline u32 get_rdx_init_val(void)
{
        return 0x600; /* P6 family */
}

static inline void kvm_inject_gp(struct kvm_vcpu *vcpu, u32 error_code)
{
        kvm_queue_exception_e(vcpu, GP_VECTOR, error_code);
}

#define TSS_IOPB_BASE_OFFSET 0x66
#define TSS_BASE_SIZE 0x68
#define TSS_IOPB_SIZE (65536 / 8)
#define TSS_REDIRECTION_SIZE (256 / 8)
#define RMODE_TSS_SIZE \
        (TSS_BASE_SIZE + TSS_REDIRECTION_SIZE + TSS_IOPB_SIZE + 1)
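
/*
 * Arithmetic check (editor's note): RMODE_TSS_SIZE works out to
 * 0x68 + 256/8 + 65536/8 + 1 = 104 + 32 + 8192 + 1 = 8329 bytes: the base
 * TSS, the VM86 interrupt-redirection bitmap, one bit per I/O port, and a
 * trailing terminator byte (conventionally 0xff) required by the IOPB
 * format.
 */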

enum {
        TASK_SWITCH_CALL = 0,
        TASK_SWITCH_IRET = 1,
        TASK_SWITCH_JMP = 2,
        TASK_SWITCH_GATE = 3,
};

#define HF_GIF_MASK             (1 << 0)
#define HF_HIF_MASK             (1 << 1)
#define HF_VINTR_MASK           (1 << 2)
#define HF_NMI_MASK             (1 << 3)
#define HF_IRET_MASK            (1 << 4)
#define HF_GUEST_MASK           (1 << 5) /* VCPU is in guest-mode */

/*
 * Hardware virtualization extension instructions may fault if a
 * reboot turns off virtualization while processes are running.
 * Trap the fault and ignore the instruction if that happens.
 */
asmlinkage void kvm_spurious_fault(void);
extern bool kvm_rebooting;

#define ____kvm_handle_fault_on_reboot(insn, cleanup_insn)      \
        "666: " insn "\n\t" \
        "668: \n\t"                           \
        ".pushsection .fixup, \"ax\" \n" \
        "667: \n\t" \
        cleanup_insn "\n\t"                   \
        "cmpb $0, kvm_rebooting \n\t"         \
        "jne 668b \n\t"                       \
        __ASM_SIZE(push) " $666b \n\t"        \
        "call kvm_spurious_fault \n\t"        \
        ".popsection \n\t" \
        ".pushsection __ex_table, \"a\" \n\t" \
        _ASM_PTR " 666b, 667b \n\t" \
        ".popsection"

#define __kvm_handle_fault_on_reboot(insn) \
        ____kvm_handle_fault_on_reboot(insn, "")
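
/*
 * Usage sketch (editor's illustration): the wrapper is spliced into
 * inline assembly around a virtualization instruction, so that an opcode
 * faulting because a reboot disabled VMX/SVM is skipped instead of
 * oopsing:
 *
 *        static inline void example_vmxoff(void)   // hypothetical helper
 *        {
 *                asm volatile(__kvm_handle_fault_on_reboot("vmxoff"));
 *        }
 *
 * If kvm_rebooting is set when the instruction faults, the fixup at 667
 * jumps past it (to label 668); otherwise kvm_spurious_fault() is called.
 */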

#define KVM_ARCH_WANT_MMU_NOTIFIER
int kvm_unmap_hva(struct kvm *kvm, unsigned long hva);
int kvm_age_hva(struct kvm *kvm, unsigned long hva);
int kvm_test_age_hva(struct kvm *kvm, unsigned long hva);
void kvm_set_spte_hva(struct kvm *kvm, unsigned long hva, pte_t pte);
int cpuid_maxphyaddr(struct kvm_vcpu *vcpu);
int kvm_cpu_has_interrupt(struct kvm_vcpu *vcpu);
int kvm_arch_interrupt_allowed(struct kvm_vcpu *vcpu);
int kvm_cpu_get_interrupt(struct kvm_vcpu *v);

void kvm_define_shared_msr(unsigned index, u32 msr);
void kvm_set_shared_msr(unsigned index, u64 val, u64 mask);

bool kvm_is_linear_rip(struct kvm_vcpu *vcpu, unsigned long linear_rip);

void kvm_arch_async_page_not_present(struct kvm_vcpu *vcpu,
                                     struct kvm_async_pf *work);
void kvm_arch_async_page_present(struct kvm_vcpu *vcpu,
                                 struct kvm_async_pf *work);
void kvm_arch_async_page_ready(struct kvm_vcpu *vcpu,
                               struct kvm_async_pf *work);
bool kvm_arch_can_inject_async_page_present(struct kvm_vcpu *vcpu);
extern bool kvm_find_async_pf_gfn(struct kvm_vcpu *vcpu, gfn_t gfn);

void kvm_complete_insn_gp(struct kvm_vcpu *vcpu, int err);

#endif /* _ASM_X86_KVM_HOST_H */