/* kvm_host.h */
  /*
   * Kernel-based Virtual Machine driver for Linux
   *
   * This header defines architecture specific interfaces, x86 version
   *
   * This work is licensed under the terms of the GNU GPL, version 2.  See
   * the COPYING file in the top-level directory.
   *
   */
  10. #ifndef _ASM_X86_KVM_HOST_H
  11. #define _ASM_X86_KVM_HOST_H
  12. #include <linux/types.h>
  13. #include <linux/mm.h>
  14. #include <linux/mmu_notifier.h>
  15. #include <linux/tracepoint.h>
  16. #include <linux/cpumask.h>
  17. #include <linux/irq_work.h>
  18. #include <linux/kvm.h>
  19. #include <linux/kvm_para.h>
  20. #include <linux/kvm_types.h>
  21. #include <linux/perf_event.h>
  22. #include <asm/pvclock-abi.h>
  23. #include <asm/desc.h>
  24. #include <asm/mtrr.h>
  25. #include <asm/msr-index.h>
  26. #include <asm/asm.h>
  /* Limits on the number of vCPUs and memory slots. */
  #define KVM_MAX_VCPUS 254
  #define KVM_SOFT_MAX_VCPUS 160
  #define KVM_MEMORY_SLOTS 32
  /* memory slots that are not exposed to userspace */
  #define KVM_PRIVATE_MEM_SLOTS 4
  /* total slot count: userspace-visible slots plus the private ones */
  #define KVM_MEM_SLOTS_NUM (KVM_MEMORY_SLOTS + KVM_PRIVATE_MEM_SLOTS)

  #define KVM_MMIO_SIZE 16

  #define KVM_PIO_PAGE_OFFSET 1
  #define KVM_COALESCED_MMIO_PAGE_OFFSET 2
  /*
   * Reserved-bit masks for the control registers.
   *
   * CR0/CR4/CR8: every bit that is NOT one of the listed X86_CRn_* flags.
   */
  #define CR0_RESERVED_BITS                                               \
      (~(unsigned long)(X86_CR0_PE | X86_CR0_MP | X86_CR0_EM | X86_CR0_TS \
                        | X86_CR0_ET | X86_CR0_NE | X86_CR0_WP | X86_CR0_AM \
                        | X86_CR0_NW | X86_CR0_CD | X86_CR0_PG))

  /*
   * NOTE(review): this is (PWT | PCD) - 1 rather than a complement-style
   * mask like the others; kept exactly as in the original - confirm intent.
   */
  #define CR3_PAE_RESERVED_BITS ((X86_CR3_PWT | X86_CR3_PCD) - 1)
  /* low (sub-page) bits of CR3 other than PWT and PCD */
  #define CR3_NONPAE_RESERVED_BITS ((PAGE_SIZE-1) & ~(X86_CR3_PWT | X86_CR3_PCD))
  #define CR3_PCID_ENABLED_RESERVED_BITS 0xFFFFFF0000000000ULL
  /* the non-PAE low bits plus the same high bits as the PCID-enabled mask */
  #define CR3_L_MODE_RESERVED_BITS (CR3_NONPAE_RESERVED_BITS | \
                                    0xFFFFFF0000000000ULL)

  #define CR4_RESERVED_BITS                                               \
      (~(unsigned long)(X86_CR4_VME | X86_CR4_PVI | X86_CR4_TSD | X86_CR4_DE\
                        | X86_CR4_PSE | X86_CR4_PAE | X86_CR4_MCE \
                        | X86_CR4_PGE | X86_CR4_PCE | X86_CR4_OSFXSR | X86_CR4_PCIDE \
                        | X86_CR4_OSXSAVE | X86_CR4_SMEP | X86_CR4_RDWRGSFS \
                        | X86_CR4_OSXMMEXCPT | X86_CR4_VMXE))

  #define CR8_RESERVED_BITS (~(unsigned long)X86_CR8_TPR)
  /* Sentinel values: the all-ones value of the respective address type. */
  #define INVALID_PAGE (~(hpa_t)0)
  /* true when x differs from the INVALID_PAGE sentinel */
  #define VALID_PAGE(x) ((x) != INVALID_PAGE)

  #define UNMAPPED_GVA (~(gpa_t)0)
  /*
   * KVM Hugepage definitions for x86
   *
   * The argument x of the macros below is a page-size level starting at 1;
   * each additional level adds 9 bits to the shift.
   */
  #define KVM_NR_PAGE_SIZES 3
  /* shift, in units of guest frame numbers, for level x */
  #define KVM_HPAGE_GFN_SHIFT(x) (((x) - 1) * 9)
  /* byte-address shift for level x */
  #define KVM_HPAGE_SHIFT(x) (PAGE_SHIFT + KVM_HPAGE_GFN_SHIFT(x))
  #define KVM_HPAGE_SIZE(x) (1UL << KVM_HPAGE_SHIFT(x))
  #define KVM_HPAGE_MASK(x) (~(KVM_HPAGE_SIZE(x) - 1))
  /* number of PAGE_SIZE pages covered by one page of level x */
  #define KVM_PAGES_PER_HPAGE(x) (KVM_HPAGE_SIZE(x) / PAGE_SIZE)
  /* x86 exception vector numbers */
  #define DE_VECTOR 0
  #define DB_VECTOR 1
  #define BP_VECTOR 3
  #define OF_VECTOR 4
  #define BR_VECTOR 5
  #define UD_VECTOR 6
  #define NM_VECTOR 7
  #define DF_VECTOR 8
  #define TS_VECTOR 10
  #define NP_VECTOR 11
  #define SS_VECTOR 12
  #define GP_VECTOR 13
  #define PF_VECTOR 14
  #define MF_VECTOR 16
  #define MC_VECTOR 18
  /* Bit masks applied to a segment selector value. */
  #define SELECTOR_TI_MASK (1 << 2)
  #define SELECTOR_RPL_MASK 0x03

  #define IOPL_SHIFT 12
  /* MMU sizing constants. */
  #define KVM_PERMILLE_MMU_PAGES 20
  #define KVM_MIN_ALLOC_MMU_PAGES 64
  #define KVM_MMU_HASH_SHIFT 10
  /* 2^KVM_MMU_HASH_SHIFT; used as the size of kvm_arch.mmu_page_hash[] */
  #define KVM_NUM_MMU_PAGES (1 << KVM_MMU_HASH_SHIFT)
  #define KVM_MIN_FREE_MMU_PAGES 5
  #define KVM_REFILL_PAGES 25

  /* capacity of kvm_vcpu_arch.cpuid_entries[] */
  #define KVM_MAX_CPUID_ENTRIES 80

  #define KVM_NR_FIXED_MTRR_REGION 88
  #define KVM_NR_VAR_MTRR 8

  /* rounded up to a power of two to size kvm_vcpu_arch.apf.gfns[] */
  #define ASYNC_PF_PER_VCPU 64
  90. extern raw_spinlock_t kvm_lock;
  91. extern struct list_head vm_list;
  92. struct kvm_vcpu;
  93. struct kvm;
  94. struct kvm_async_pf;
  /*
   * Indices of the general purpose registers and RIP; used as index into
   * kvm_vcpu_arch.regs[].  R8-R15 exist only when CONFIG_X86_64 is defined,
   * so VCPU_REGS_RIP and NR_VCPU_REGS take different values per build.
   */
  enum kvm_reg {
      VCPU_REGS_RAX = 0,
      VCPU_REGS_RCX = 1,
      VCPU_REGS_RDX = 2,
      VCPU_REGS_RBX = 3,
      VCPU_REGS_RSP = 4,
      VCPU_REGS_RBP = 5,
      VCPU_REGS_RSI = 6,
      VCPU_REGS_RDI = 7,
  #ifdef CONFIG_X86_64
      VCPU_REGS_R8 = 8,
      VCPU_REGS_R9 = 9,
      VCPU_REGS_R10 = 10,
      VCPU_REGS_R11 = 11,
      VCPU_REGS_R12 = 12,
      VCPU_REGS_R13 = 13,
      VCPU_REGS_R14 = 14,
      VCPU_REGS_R15 = 15,
  #endif
      VCPU_REGS_RIP,
      NR_VCPU_REGS    /* number of entries above; not a register */
  };
  117. enum kvm_reg_ex {
  118. VCPU_EXREG_PDPTR = NR_VCPU_REGS,
  119. VCPU_EXREG_CR3,
  120. VCPU_EXREG_RFLAGS,
  121. VCPU_EXREG_CPL,
  122. VCPU_EXREG_SEGMENTS,
  123. };
  /* Segment register identifiers, numbered from 0. */
  enum {
      VCPU_SREG_ES,
      VCPU_SREG_CS,
      VCPU_SREG_SS,
      VCPU_SREG_DS,
      VCPU_SREG_FS,
      VCPU_SREG_GS,
      VCPU_SREG_TR,
      VCPU_SREG_LDTR,
  };
  134. #include <asm/kvm_emulate.h>
  /* capacity of kvm_mmu_memory_cache.objects[] */
  #define KVM_NR_MEM_OBJS 40

  /* number of entries in kvm_vcpu_arch.db[] and eff_db[] */
  #define KVM_NR_DB_REGS 4

  /* DR6 bits and masks */
  #define DR6_BD (1 << 13)
  #define DR6_BS (1 << 14)
  #define DR6_FIXED_1 0xffff0ff0
  #define DR6_VOLATILE 0x0000e00f

  /* DR7 bits and masks */
  #define DR7_BP_EN_MASK 0x000000ff
  #define DR7_GE (1 << 9)
  #define DR7_GD (1 << 13)
  #define DR7_FIXED_1 0x00000400
  #define DR7_VOLATILE 0xffff23ff
  /* apic attention bits */
  #define KVM_APIC_CHECK_VAPIC 0
  /*
   * The following bit is set with PV-EOI, unset on EOI.
   * We detect PV-EOI changes by guest by comparing
   * this bit with PV-EOI in guest memory.
   * See the implementation in apic_update_pv_eoi.
   */
  #define KVM_APIC_PV_EOI_PENDING 1
  155. /*
  156. * We don't want allocation failures within the mmu code, so we preallocate
  157. * enough memory for a single page fault in a cache.
  158. */
  159. struct kvm_mmu_memory_cache {
  160. int nobjs;
  161. void *objects[KVM_NR_MEM_OBJS];
  162. };
  /*
   * kvm_mmu_page_role, below, packs the following bit-fields into one word.
   * Fields are listed in declaration order; the bit positions assume the
   * compiler allocates bit-fields starting at the least significant bit.
   *
   * bits 0:3   - level: page table level for this shadow (1-4)
   * bit  4     - cr4_pae (presumably the guest's CR4.PAE setting - confirm)
   * bits 5:6   - quadrant: page table quadrant for 2-level guests
   * bits 7:12  - pad_for_nice_hex_output: unused padding
   * bit  13    - direct: direct mapping of virtual to physical mapping at gfn
   *              used for real mode and two-dimensional paging
   * bits 14:16 - access: common access permissions for all ptes in this
   *              shadow page
   * bit  17    - invalid
   * bit  18    - nxe
   * bit  19    - cr0_wp
   * bit  20    - smep_andnot_wp
   *
   * 'word' aliases all of the fields so that a role can be handled as a
   * single unsigned value.
   */
  union kvm_mmu_page_role {
      unsigned word;
      struct {
          unsigned level:4;
          unsigned cr4_pae:1;
          unsigned quadrant:2;
          unsigned pad_for_nice_hex_output:6;
          unsigned direct:1;
          unsigned access:3;
          unsigned invalid:1;
          unsigned nxe:1;
          unsigned cr0_wp:1;
          unsigned smep_andnot_wp:1;
      };
  };
  188. struct kvm_mmu_page {
  189. struct list_head link;
  190. struct hlist_node hash_link;
  191. /*
  192. * The following two entries are used to key the shadow page in the
  193. * hash table.
  194. */
  195. gfn_t gfn;
  196. union kvm_mmu_page_role role;
  197. u64 *spt;
  198. /* hold the gfn of each spte inside spt */
  199. gfn_t *gfns;
  200. /*
  201. * One bit set per slot which has memory
  202. * in this shadow page.
  203. */
  204. DECLARE_BITMAP(slot_bitmap, KVM_MEM_SLOTS_NUM);
  205. bool unsync;
  206. int root_count; /* Currently serving as active root */
  207. unsigned int unsync_children;
  208. unsigned long parent_ptes; /* Reverse mapping for parent_pte */
  209. DECLARE_BITMAP(unsync_child_bitmap, 512);
  210. #ifdef CONFIG_X86_32
  211. int clear_spte_count;
  212. #endif
  213. int write_flooding_count;
  214. };
  /* Parameters of one port I/O request (stored in kvm_vcpu_arch.pio). */
  struct kvm_pio_request {
      unsigned long count;
      int in;      /* presumably non-zero for IN, zero for OUT - confirm */
      int port;
      int size;
  };
  221. /*
  222. * x86 supports 3 paging modes (4-level 64-bit, 3-level 64-bit, and 2-level
  223. * 32-bit). The kvm_mmu structure abstracts the details of the current mmu
  224. * mode.
  225. */
  226. struct kvm_mmu {
  227. void (*new_cr3)(struct kvm_vcpu *vcpu);
  228. void (*set_cr3)(struct kvm_vcpu *vcpu, unsigned long root);
  229. unsigned long (*get_cr3)(struct kvm_vcpu *vcpu);
  230. u64 (*get_pdptr)(struct kvm_vcpu *vcpu, int index);
  231. int (*page_fault)(struct kvm_vcpu *vcpu, gva_t gva, u32 err,
  232. bool prefault);
  233. void (*inject_page_fault)(struct kvm_vcpu *vcpu,
  234. struct x86_exception *fault);
  235. void (*free)(struct kvm_vcpu *vcpu);
  236. gpa_t (*gva_to_gpa)(struct kvm_vcpu *vcpu, gva_t gva, u32 access,
  237. struct x86_exception *exception);
  238. gpa_t (*translate_gpa)(struct kvm_vcpu *vcpu, gpa_t gpa, u32 access);
  239. int (*sync_page)(struct kvm_vcpu *vcpu,
  240. struct kvm_mmu_page *sp);
  241. void (*invlpg)(struct kvm_vcpu *vcpu, gva_t gva);
  242. void (*update_pte)(struct kvm_vcpu *vcpu, struct kvm_mmu_page *sp,
  243. u64 *spte, const void *pte);
  244. hpa_t root_hpa;
  245. int root_level;
  246. int shadow_root_level;
  247. union kvm_mmu_page_role base_role;
  248. bool direct_map;
  249. u64 *pae_root;
  250. u64 *lm_root;
  251. u64 rsvd_bits_mask[2][4];
  252. bool nx;
  253. u64 pdptrs[4]; /* pae */
  254. };
  /* Kind of performance counter described by a struct kvm_pmc. */
  enum pmc_type {
      KVM_PMC_GP = 0,    /* used for kvm_pmu.gp_counters[] (presumably "general purpose") */
      KVM_PMC_FIXED,     /* used for kvm_pmu.fixed_counters[] */
  };
  259. struct kvm_pmc {
  260. enum pmc_type type;
  261. u8 idx;
  262. u64 counter;
  263. u64 eventsel;
  264. struct perf_event *perf_event;
  265. struct kvm_vcpu *vcpu;
  266. };
  267. struct kvm_pmu {
  268. unsigned nr_arch_gp_counters;
  269. unsigned nr_arch_fixed_counters;
  270. unsigned available_event_types;
  271. u64 fixed_ctr_ctrl;
  272. u64 global_ctrl;
  273. u64 global_status;
  274. u64 global_ovf_ctrl;
  275. u64 counter_bitmask[2];
  276. u64 global_ctrl_mask;
  277. u8 version;
  278. struct kvm_pmc gp_counters[INTEL_PMC_MAX_GENERIC];
  279. struct kvm_pmc fixed_counters[INTEL_PMC_MAX_FIXED];
  280. struct irq_work irq_work;
  281. u64 reprogram_pmi;
  282. };
  283. struct kvm_vcpu_arch {
  284. /*
  285. * rip and regs accesses must go through
  286. * kvm_{register,rip}_{read,write} functions.
  287. */
  288. unsigned long regs[NR_VCPU_REGS];
  289. u32 regs_avail;
  290. u32 regs_dirty;
  291. unsigned long cr0;
  292. unsigned long cr0_guest_owned_bits;
  293. unsigned long cr2;
  294. unsigned long cr3;
  295. unsigned long cr4;
  296. unsigned long cr4_guest_owned_bits;
  297. unsigned long cr8;
  298. u32 hflags;
  299. u64 efer;
  300. u64 apic_base;
  301. struct kvm_lapic *apic; /* kernel irqchip context */
  302. unsigned long apic_attention;
  303. int32_t apic_arb_prio;
  304. int mp_state;
  305. int sipi_vector;
  306. u64 ia32_misc_enable_msr;
  307. bool tpr_access_reporting;
  308. /*
  309. * Paging state of the vcpu
  310. *
  311. * If the vcpu runs in guest mode with two level paging this still saves
  312. * the paging mode of the l1 guest. This context is always used to
  313. * handle faults.
  314. */
  315. struct kvm_mmu mmu;
  316. /*
  317. * Paging state of an L2 guest (used for nested npt)
  318. *
  319. * This context will save all necessary information to walk page tables
  320. * of the an L2 guest. This context is only initialized for page table
  321. * walking and not for faulting since we never handle l2 page faults on
  322. * the host.
  323. */
  324. struct kvm_mmu nested_mmu;
  325. /*
  326. * Pointer to the mmu context currently used for
  327. * gva_to_gpa translations.
  328. */
  329. struct kvm_mmu *walk_mmu;
  330. struct kvm_mmu_memory_cache mmu_pte_list_desc_cache;
  331. struct kvm_mmu_memory_cache mmu_page_cache;
  332. struct kvm_mmu_memory_cache mmu_page_header_cache;
  333. struct fpu guest_fpu;
  334. u64 xcr0;
  335. struct kvm_pio_request pio;
  336. void *pio_data;
  337. u8 event_exit_inst_len;
  338. struct kvm_queued_exception {
  339. bool pending;
  340. bool has_error_code;
  341. bool reinject;
  342. u8 nr;
  343. u32 error_code;
  344. } exception;
  345. struct kvm_queued_interrupt {
  346. bool pending;
  347. bool soft;
  348. u8 nr;
  349. } interrupt;
  350. int halt_request; /* real mode on Intel only */
  351. int cpuid_nent;
  352. struct kvm_cpuid_entry2 cpuid_entries[KVM_MAX_CPUID_ENTRIES];
  353. /* emulate context */
  354. struct x86_emulate_ctxt emulate_ctxt;
  355. bool emulate_regs_need_sync_to_vcpu;
  356. bool emulate_regs_need_sync_from_vcpu;
  357. int (*complete_userspace_io)(struct kvm_vcpu *vcpu);
  358. gpa_t time;
  359. struct pvclock_vcpu_time_info hv_clock;
  360. unsigned int hw_tsc_khz;
  361. unsigned int time_offset;
  362. struct page *time_page;
  363. /* set guest stopped flag in pvclock flags field */
  364. bool pvclock_set_guest_stopped_request;
  365. struct {
  366. u64 msr_val;
  367. u64 last_steal;
  368. u64 accum_steal;
  369. struct gfn_to_hva_cache stime;
  370. struct kvm_steal_time steal;
  371. } st;
  372. u64 last_guest_tsc;
  373. u64 last_kernel_ns;
  374. u64 last_host_tsc;
  375. u64 tsc_offset_adjustment;
  376. u64 this_tsc_nsec;
  377. u64 this_tsc_write;
  378. u8 this_tsc_generation;
  379. bool tsc_catchup;
  380. bool tsc_always_catchup;
  381. s8 virtual_tsc_shift;
  382. u32 virtual_tsc_mult;
  383. u32 virtual_tsc_khz;
  384. atomic_t nmi_queued; /* unprocessed asynchronous NMIs */
  385. unsigned nmi_pending; /* NMI queued after currently running handler */
  386. bool nmi_injected; /* Trying to inject an NMI this entry */
  387. struct mtrr_state_type mtrr_state;
  388. u32 pat;
  389. int switch_db_regs;
  390. unsigned long db[KVM_NR_DB_REGS];
  391. unsigned long dr6;
  392. unsigned long dr7;
  393. unsigned long eff_db[KVM_NR_DB_REGS];
  394. u64 mcg_cap;
  395. u64 mcg_status;
  396. u64 mcg_ctl;
  397. u64 *mce_banks;
  398. /* Cache MMIO info */
  399. u64 mmio_gva;
  400. unsigned access;
  401. gfn_t mmio_gfn;
  402. struct kvm_pmu pmu;
  403. /* used for guest single stepping over the given code position */
  404. unsigned long singlestep_rip;
  405. /* fields used by HYPER-V emulation */
  406. u64 hv_vapic;
  407. cpumask_var_t wbinvd_dirty_mask;
  408. unsigned long last_retry_eip;
  409. unsigned long last_retry_addr;
  410. struct {
  411. bool halted;
  412. gfn_t gfns[roundup_pow_of_two(ASYNC_PF_PER_VCPU)];
  413. struct gfn_to_hva_cache data;
  414. u64 msr_val;
  415. u32 id;
  416. bool send_user_only;
  417. } apf;
  418. /* OSVW MSRs (AMD only) */
  419. struct {
  420. u64 length;
  421. u64 status;
  422. } osvw;
  423. struct {
  424. u64 msr_val;
  425. struct gfn_to_hva_cache data;
  426. } pv_eoi;
  427. };
  /* Per-entry record used by kvm_arch_memory_slot.lpage_info[]. */
  struct kvm_lpage_info {
      int write_count;
  };
  431. struct kvm_arch_memory_slot {
  432. unsigned long *rmap[KVM_NR_PAGE_SIZES];
  433. struct kvm_lpage_info *lpage_info[KVM_NR_PAGE_SIZES - 1];
  434. };
  435. struct kvm_arch {
  436. unsigned int n_used_mmu_pages;
  437. unsigned int n_requested_mmu_pages;
  438. unsigned int n_max_mmu_pages;
  439. unsigned int indirect_shadow_pages;
  440. struct hlist_head mmu_page_hash[KVM_NUM_MMU_PAGES];
  441. /*
  442. * Hash table of struct kvm_mmu_page.
  443. */
  444. struct list_head active_mmu_pages;
  445. struct list_head assigned_dev_head;
  446. struct iommu_domain *iommu_domain;
  447. int iommu_flags;
  448. struct kvm_pic *vpic;
  449. struct kvm_ioapic *vioapic;
  450. struct kvm_pit *vpit;
  451. int vapics_in_nmi_mode;
  452. unsigned int tss_addr;
  453. struct page *apic_access_page;
  454. gpa_t wall_clock;
  455. struct page *ept_identity_pagetable;
  456. bool ept_identity_pagetable_done;
  457. gpa_t ept_identity_map_addr;
  458. unsigned long irq_sources_bitmap;
  459. s64 kvmclock_offset;
  460. raw_spinlock_t tsc_write_lock;
  461. u64 last_tsc_nsec;
  462. u64 last_tsc_write;
  463. u32 last_tsc_khz;
  464. u64 cur_tsc_nsec;
  465. u64 cur_tsc_write;
  466. u64 cur_tsc_offset;
  467. u8 cur_tsc_generation;
  468. struct kvm_xen_hvm_config xen_hvm_config;
  469. /* fields used by HYPER-V emulation */
  470. u64 hv_guest_os_id;
  471. u64 hv_hypercall;
  472. #ifdef CONFIG_KVM_MMU_AUDIT
  473. int audit_point;
  474. #endif
  475. };
  476. struct kvm_vm_stat {
  477. u32 mmu_shadow_zapped;
  478. u32 mmu_pte_write;
  479. u32 mmu_pte_updated;
  480. u32 mmu_pde_zapped;
  481. u32 mmu_flooded;
  482. u32 mmu_recycled;
  483. u32 mmu_cache_miss;
  484. u32 mmu_unsync;
  485. u32 remote_tlb_flush;
  486. u32 lpages;
  487. };
  488. struct kvm_vcpu_stat {
  489. u32 pf_fixed;
  490. u32 pf_guest;
  491. u32 tlb_flush;
  492. u32 invlpg;
  493. u32 exits;
  494. u32 io_exits;
  495. u32 mmio_exits;
  496. u32 signal_exits;
  497. u32 irq_window_exits;
  498. u32 nmi_window_exits;
  499. u32 halt_exits;
  500. u32 halt_wakeup;
  501. u32 request_irq_exits;
  502. u32 irq_exits;
  503. u32 host_state_reload;
  504. u32 efer_reload;
  505. u32 fpu_reload;
  506. u32 insn_emulation;
  507. u32 insn_emulation_fail;
  508. u32 hypercalls;
  509. u32 irq_injections;
  510. u32 nmi_injections;
  511. };
  512. struct x86_instruction_info;
  513. struct kvm_x86_ops {
  514. int (*cpu_has_kvm_support)(void); /* __init */
  515. int (*disabled_by_bios)(void); /* __init */
  516. int (*hardware_enable)(void *dummy);
  517. void (*hardware_disable)(void *dummy);
  518. void (*check_processor_compatibility)(void *rtn);
  519. int (*hardware_setup)(void); /* __init */
  520. void (*hardware_unsetup)(void); /* __exit */
  521. bool (*cpu_has_accelerated_tpr)(void);
  522. void (*cpuid_update)(struct kvm_vcpu *vcpu);
  523. /* Create, but do not attach this VCPU */
  524. struct kvm_vcpu *(*vcpu_create)(struct kvm *kvm, unsigned id);
  525. void (*vcpu_free)(struct kvm_vcpu *vcpu);
  526. int (*vcpu_reset)(struct kvm_vcpu *vcpu);
  527. void (*prepare_guest_switch)(struct kvm_vcpu *vcpu);
  528. void (*vcpu_load)(struct kvm_vcpu *vcpu, int cpu);
  529. void (*vcpu_put)(struct kvm_vcpu *vcpu);
  530. void (*set_guest_debug)(struct kvm_vcpu *vcpu,
  531. struct kvm_guest_debug *dbg);
  532. int (*get_msr)(struct kvm_vcpu *vcpu, u32 msr_index, u64 *pdata);
  533. int (*set_msr)(struct kvm_vcpu *vcpu, u32 msr_index, u64 data);
  534. u64 (*get_segment_base)(struct kvm_vcpu *vcpu, int seg);
  535. void (*get_segment)(struct kvm_vcpu *vcpu,
  536. struct kvm_segment *var, int seg);
  537. int (*get_cpl)(struct kvm_vcpu *vcpu);
  538. void (*set_segment)(struct kvm_vcpu *vcpu,
  539. struct kvm_segment *var, int seg);
  540. void (*get_cs_db_l_bits)(struct kvm_vcpu *vcpu, int *db, int *l);
  541. void (*decache_cr0_guest_bits)(struct kvm_vcpu *vcpu);
  542. void (*decache_cr3)(struct kvm_vcpu *vcpu);
  543. void (*decache_cr4_guest_bits)(struct kvm_vcpu *vcpu);
  544. void (*set_cr0)(struct kvm_vcpu *vcpu, unsigned long cr0);
  545. void (*set_cr3)(struct kvm_vcpu *vcpu, unsigned long cr3);
  546. int (*set_cr4)(struct kvm_vcpu *vcpu, unsigned long cr4);
  547. void (*set_efer)(struct kvm_vcpu *vcpu, u64 efer);
  548. void (*get_idt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
  549. void (*set_idt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
  550. void (*get_gdt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
  551. void (*set_gdt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
  552. void (*set_dr7)(struct kvm_vcpu *vcpu, unsigned long value);
  553. void (*cache_reg)(struct kvm_vcpu *vcpu, enum kvm_reg reg);
  554. unsigned long (*get_rflags)(struct kvm_vcpu *vcpu);
  555. void (*set_rflags)(struct kvm_vcpu *vcpu, unsigned long rflags);
  556. void (*fpu_activate)(struct kvm_vcpu *vcpu);
  557. void (*fpu_deactivate)(struct kvm_vcpu *vcpu);
  558. void (*tlb_flush)(struct kvm_vcpu *vcpu);
  559. void (*run)(struct kvm_vcpu *vcpu);
  560. int (*handle_exit)(struct kvm_vcpu *vcpu);
  561. void (*skip_emulated_instruction)(struct kvm_vcpu *vcpu);
  562. void (*set_interrupt_shadow)(struct kvm_vcpu *vcpu, int mask);
  563. u32 (*get_interrupt_shadow)(struct kvm_vcpu *vcpu, int mask);
  564. void (*patch_hypercall)(struct kvm_vcpu *vcpu,
  565. unsigned char *hypercall_addr);
  566. void (*set_irq)(struct kvm_vcpu *vcpu);
  567. void (*set_nmi)(struct kvm_vcpu *vcpu);
  568. void (*queue_exception)(struct kvm_vcpu *vcpu, unsigned nr,
  569. bool has_error_code, u32 error_code,
  570. bool reinject);
  571. void (*cancel_injection)(struct kvm_vcpu *vcpu);
  572. int (*interrupt_allowed)(struct kvm_vcpu *vcpu);
  573. int (*nmi_allowed)(struct kvm_vcpu *vcpu);
  574. bool (*get_nmi_mask)(struct kvm_vcpu *vcpu);
  575. void (*set_nmi_mask)(struct kvm_vcpu *vcpu, bool masked);
  576. void (*enable_nmi_window)(struct kvm_vcpu *vcpu);
  577. void (*enable_irq_window)(struct kvm_vcpu *vcpu);
  578. void (*update_cr8_intercept)(struct kvm_vcpu *vcpu, int tpr, int irr);
  579. int (*set_tss_addr)(struct kvm *kvm, unsigned int addr);
  580. int (*get_tdp_level)(void);
  581. u64 (*get_mt_mask)(struct kvm_vcpu *vcpu, gfn_t gfn, bool is_mmio);
  582. int (*get_lpage_level)(void);
  583. bool (*rdtscp_supported)(void);
  584. bool (*invpcid_supported)(void);
  585. void (*adjust_tsc_offset)(struct kvm_vcpu *vcpu, s64 adjustment, bool host);
  586. void (*set_tdp_cr3)(struct kvm_vcpu *vcpu, unsigned long cr3);
  587. void (*set_supported_cpuid)(u32 func, struct kvm_cpuid_entry2 *entry);
  588. bool (*has_wbinvd_exit)(void);
  589. void (*set_tsc_khz)(struct kvm_vcpu *vcpu, u32 user_tsc_khz, bool scale);
  590. void (*write_tsc_offset)(struct kvm_vcpu *vcpu, u64 offset);
  591. u64 (*compute_tsc_offset)(struct kvm_vcpu *vcpu, u64 target_tsc);
  592. u64 (*read_l1_tsc)(struct kvm_vcpu *vcpu);
  593. void (*get_exit_info)(struct kvm_vcpu *vcpu, u64 *info1, u64 *info2);
  594. int (*check_intercept)(struct kvm_vcpu *vcpu,
  595. struct x86_instruction_info *info,
  596. enum x86_intercept_stage stage);
  597. };
  598. struct kvm_arch_async_pf {
  599. u32 token;
  600. gfn_t gfn;
  601. unsigned long cr3;
  602. bool direct_map;
  603. };
  604. extern struct kvm_x86_ops *kvm_x86_ops;
  605. static inline void adjust_tsc_offset_guest(struct kvm_vcpu *vcpu,
  606. s64 adjustment)
  607. {
  608. kvm_x86_ops->adjust_tsc_offset(vcpu, adjustment, false);
  609. }
  610. static inline void adjust_tsc_offset_host(struct kvm_vcpu *vcpu, s64 adjustment)
  611. {
  612. kvm_x86_ops->adjust_tsc_offset(vcpu, adjustment, true);
  613. }
  614. int kvm_mmu_module_init(void);
  615. void kvm_mmu_module_exit(void);
  616. void kvm_mmu_destroy(struct kvm_vcpu *vcpu);
  617. int kvm_mmu_create(struct kvm_vcpu *vcpu);
  618. int kvm_mmu_setup(struct kvm_vcpu *vcpu);
  619. void kvm_mmu_set_mask_ptes(u64 user_mask, u64 accessed_mask,
  620. u64 dirty_mask, u64 nx_mask, u64 x_mask);
  621. int kvm_mmu_reset_context(struct kvm_vcpu *vcpu);
  622. void kvm_mmu_slot_remove_write_access(struct kvm *kvm, int slot);
  623. void kvm_mmu_write_protect_pt_masked(struct kvm *kvm,
  624. struct kvm_memory_slot *slot,
  625. gfn_t gfn_offset, unsigned long mask);
  626. void kvm_mmu_zap_all(struct kvm *kvm);
  627. unsigned int kvm_mmu_calculate_mmu_pages(struct kvm *kvm);
  628. void kvm_mmu_change_mmu_pages(struct kvm *kvm, unsigned int kvm_nr_mmu_pages);
  629. int load_pdptrs(struct kvm_vcpu *vcpu, struct kvm_mmu *mmu, unsigned long cr3);
  630. int emulator_write_phys(struct kvm_vcpu *vcpu, gpa_t gpa,
  631. const void *val, int bytes);
  632. u8 kvm_get_guest_memory_type(struct kvm_vcpu *vcpu, gfn_t gfn);
  633. extern bool tdp_enabled;
  634. u64 vcpu_tsc_khz(struct kvm_vcpu *vcpu);
  635. /* control of guest tsc rate supported? */
  636. extern bool kvm_has_tsc_control;
  637. /* minimum supported tsc_khz for guests */
  638. extern u32 kvm_min_guest_tsc_khz;
  639. /* maximum supported tsc_khz for guests */
  640. extern u32 kvm_max_guest_tsc_khz;
  /* Outcome of an instruction emulation attempt. */
  enum emulation_result {
      EMULATE_DONE,       /* no further processing */
      EMULATE_DO_MMIO,    /* kvm_run filled with mmio request */
      EMULATE_FAIL,       /* can't emulate this instruction */
  };

  /* Bit flags for the 'emulation_type' argument of the emulation entry points. */
  #define EMULTYPE_NO_DECODE (1 << 0)
  #define EMULTYPE_TRAP_UD (1 << 1)
  #define EMULTYPE_SKIP (1 << 2)
  #define EMULTYPE_RETRY (1 << 3)
  650. int x86_emulate_instruction(struct kvm_vcpu *vcpu, unsigned long cr2,
  651. int emulation_type, void *insn, int insn_len);
  652. static inline int emulate_instruction(struct kvm_vcpu *vcpu,
  653. int emulation_type)
  654. {
  655. return x86_emulate_instruction(vcpu, 0, emulation_type, NULL, 0);
  656. }
  657. void kvm_enable_efer_bits(u64);
  658. int kvm_get_msr(struct kvm_vcpu *vcpu, u32 msr_index, u64 *data);
  659. int kvm_set_msr(struct kvm_vcpu *vcpu, u32 msr_index, u64 data);
  660. struct x86_emulate_ctxt;
  661. int kvm_fast_pio_out(struct kvm_vcpu *vcpu, int size, unsigned short port);
  662. void kvm_emulate_cpuid(struct kvm_vcpu *vcpu);
  663. int kvm_emulate_halt(struct kvm_vcpu *vcpu);
  664. int kvm_emulate_wbinvd(struct kvm_vcpu *vcpu);
  665. void kvm_get_segment(struct kvm_vcpu *vcpu, struct kvm_segment *var, int seg);
  666. int kvm_load_segment_descriptor(struct kvm_vcpu *vcpu, u16 selector, int seg);
  667. int kvm_task_switch(struct kvm_vcpu *vcpu, u16 tss_selector, int idt_index,
  668. int reason, bool has_error_code, u32 error_code);
  669. int kvm_set_cr0(struct kvm_vcpu *vcpu, unsigned long cr0);
  670. int kvm_set_cr3(struct kvm_vcpu *vcpu, unsigned long cr3);
  671. int kvm_set_cr4(struct kvm_vcpu *vcpu, unsigned long cr4);
  672. int kvm_set_cr8(struct kvm_vcpu *vcpu, unsigned long cr8);
  673. int kvm_set_dr(struct kvm_vcpu *vcpu, int dr, unsigned long val);
  674. int kvm_get_dr(struct kvm_vcpu *vcpu, int dr, unsigned long *val);
  675. unsigned long kvm_get_cr8(struct kvm_vcpu *vcpu);
  676. void kvm_lmsw(struct kvm_vcpu *vcpu, unsigned long msw);
  677. void kvm_get_cs_db_l_bits(struct kvm_vcpu *vcpu, int *db, int *l);
  678. int kvm_set_xcr(struct kvm_vcpu *vcpu, u32 index, u64 xcr);
  679. int kvm_get_msr_common(struct kvm_vcpu *vcpu, u32 msr, u64 *pdata);
  680. int kvm_set_msr_common(struct kvm_vcpu *vcpu, u32 msr, u64 data);
  681. unsigned long kvm_get_rflags(struct kvm_vcpu *vcpu);
  682. void kvm_set_rflags(struct kvm_vcpu *vcpu, unsigned long rflags);
  683. bool kvm_rdpmc(struct kvm_vcpu *vcpu);
  684. void kvm_queue_exception(struct kvm_vcpu *vcpu, unsigned nr);
  685. void kvm_queue_exception_e(struct kvm_vcpu *vcpu, unsigned nr, u32 error_code);
  686. void kvm_requeue_exception(struct kvm_vcpu *vcpu, unsigned nr);
  687. void kvm_requeue_exception_e(struct kvm_vcpu *vcpu, unsigned nr, u32 error_code);
  688. void kvm_inject_page_fault(struct kvm_vcpu *vcpu, struct x86_exception *fault);
  689. int kvm_read_guest_page_mmu(struct kvm_vcpu *vcpu, struct kvm_mmu *mmu,
  690. gfn_t gfn, void *data, int offset, int len,
  691. u32 access);
  692. void kvm_propagate_fault(struct kvm_vcpu *vcpu, struct x86_exception *fault);
  693. bool kvm_require_cpl(struct kvm_vcpu *vcpu, int required_cpl);
  /*
   * Record the level driven by one interrupt source and report the
   * combined line state.
   *
   * @irq_state:     bitmap with one bit per source; updated in place
   * @irq_source_id: bit number of the source whose level changed
   * @level:         non-zero sets the source's bit, zero clears it
   *
   * Returns 1 if any bit in *irq_state is set after the update, else 0.
   */
  static inline int __kvm_irq_line_state(unsigned long *irq_state,
                                         int irq_source_id, int level)
  {
      /* Logical OR for level trig interrupt */
      if (level)
          __set_bit(irq_source_id, irq_state);
      else
          __clear_bit(irq_source_id, irq_state);

      return !!(*irq_state);
  }
  704. int kvm_pic_set_irq(struct kvm_pic *pic, int irq, int irq_source_id, int level);
  705. void kvm_pic_clear_all(struct kvm_pic *pic, int irq_source_id);
  706. void kvm_inject_nmi(struct kvm_vcpu *vcpu);
  707. int fx_init(struct kvm_vcpu *vcpu);
  708. void kvm_mmu_flush_tlb(struct kvm_vcpu *vcpu);
  709. void kvm_mmu_pte_write(struct kvm_vcpu *vcpu, gpa_t gpa,
  710. const u8 *new, int bytes);
  711. int kvm_mmu_unprotect_page(struct kvm *kvm, gfn_t gfn);
  712. int kvm_mmu_unprotect_page_virt(struct kvm_vcpu *vcpu, gva_t gva);
  713. void __kvm_mmu_free_some_pages(struct kvm_vcpu *vcpu);
  714. int kvm_mmu_load(struct kvm_vcpu *vcpu);
  715. void kvm_mmu_unload(struct kvm_vcpu *vcpu);
  716. void kvm_mmu_sync_roots(struct kvm_vcpu *vcpu);
  717. gpa_t translate_nested_gpa(struct kvm_vcpu *vcpu, gpa_t gpa, u32 access);
  718. gpa_t kvm_mmu_gva_to_gpa_read(struct kvm_vcpu *vcpu, gva_t gva,
  719. struct x86_exception *exception);
  720. gpa_t kvm_mmu_gva_to_gpa_fetch(struct kvm_vcpu *vcpu, gva_t gva,
  721. struct x86_exception *exception);
  722. gpa_t kvm_mmu_gva_to_gpa_write(struct kvm_vcpu *vcpu, gva_t gva,
  723. struct x86_exception *exception);
  724. gpa_t kvm_mmu_gva_to_gpa_system(struct kvm_vcpu *vcpu, gva_t gva,
  725. struct x86_exception *exception);
  726. int kvm_emulate_hypercall(struct kvm_vcpu *vcpu);
  727. int kvm_mmu_page_fault(struct kvm_vcpu *vcpu, gva_t gva, u32 error_code,
  728. void *insn, int insn_len);
  729. void kvm_mmu_invlpg(struct kvm_vcpu *vcpu, gva_t gva);
  730. void kvm_enable_tdp(void);
  731. void kvm_disable_tdp(void);
  732. int complete_pio(struct kvm_vcpu *vcpu);
  733. bool kvm_check_iopl(struct kvm_vcpu *vcpu);
  734. static inline gpa_t translate_gpa(struct kvm_vcpu *vcpu, gpa_t gpa, u32 access)
  735. {
  736. return gpa;
  737. }
  738. static inline struct kvm_mmu_page *page_header(hpa_t shadow_page)
  739. {
  740. struct page *page = pfn_to_page(shadow_page >> PAGE_SHIFT);
  741. return (struct kvm_mmu_page *)page_private(page);
  742. }
  743. static inline u16 kvm_read_ldt(void)
  744. {
  745. u16 ldt;
  746. asm("sldt %0" : "=g"(ldt));
  747. return ldt;
  748. }
  749. static inline void kvm_load_ldt(u16 sel)
  750. {
  751. asm("lldt %0" : : "rm"(sel));
  752. }
  #ifdef CONFIG_X86_64
  /*
   * Read the model-specific register numbered @msr.
   *
   * rdmsrl() stores the result in a local u64, which is then returned as
   * unsigned long.  Only compiled when CONFIG_X86_64 is defined.
   */
  static inline unsigned long read_msr(unsigned long msr)
  {
      u64 msr_val;

      rdmsrl(msr, msr_val);

      return msr_val;
  }
  #endif /* CONFIG_X86_64 */
  761. static inline u32 get_rdx_init_val(void)
  762. {
  763. return 0x600; /* P6 family */
  764. }
  765. static inline void kvm_inject_gp(struct kvm_vcpu *vcpu, u32 error_code)
  766. {
  767. kvm_queue_exception_e(vcpu, GP_VECTOR, error_code);
  768. }
  /*
   * TSS layout constants, in bytes.
   *
   * TSS_IOPB_SIZE is 65536 / 8 and TSS_REDIRECTION_SIZE is 256 / 8, i.e. one
   * bit per entry for 65536 and 256 entries respectively.
   * NOTE(review): presumably one bit per I/O port and per interrupt
   * vector -- confirm.
   *
   * RMODE_TSS_SIZE is the sum of the base, redirection and IOPB sizes plus
   * one extra byte.
   */
  #define TSS_IOPB_BASE_OFFSET    0x66
  #define TSS_BASE_SIZE           0x68
  #define TSS_IOPB_SIZE           (65536 / 8)
  #define TSS_REDIRECTION_SIZE    (256 / 8)
  #define RMODE_TSS_SIZE \
      (TSS_BASE_SIZE + TSS_REDIRECTION_SIZE + TSS_IOPB_SIZE + 1)
  /*
   * Anonymous enumeration of TASK_SWITCH_* codes, numbered 0 through 3.
   * The values are spelled out explicitly so they stay fixed if entries
   * are ever reordered.
   * NOTE(review): presumably these identify what triggered a task
   * switch -- confirm against the users of these constants.
   */
  enum {
      TASK_SWITCH_CALL    = 0,
      TASK_SWITCH_IRET    = 1,
      TASK_SWITCH_JMP     = 2,
      TASK_SWITCH_GATE    = 3,
  };
  /*
   * HF_* single-bit flag masks occupying bits 0 through 5.
   * NOTE(review): the flags word these apply to is not visible in this
   * part of the header -- confirm where they are stored.
   */
  #define HF_GIF_MASK     (1 << 0)
  #define HF_HIF_MASK     (1 << 1)
  #define HF_VINTR_MASK   (1 << 2)
  #define HF_NMI_MASK     (1 << 3)
  #define HF_IRET_MASK    (1 << 4)
  #define HF_GUEST_MASK   (1 << 5)    /* VCPU is in guest-mode */
  787. /*
  788. * Hardware virtualization extension instructions may fault if a
  789. * reboot turns off virtualization while processes are running.
  790. * Trap the fault and ignore the instruction if that happens.
  791. */
  792. asmlinkage void kvm_spurious_fault(void);
  793. extern bool kvm_rebooting;
  /*
   * ____kvm_handle_fault_on_reboot(insn, cleanup_insn)
   *
   * Expands to an asm string that places @insn at local label 666 and
   * continues at label 668.  _ASM_EXTABLE(666b, 667b) pairs label 666 with
   * the code at label 667, which is emitted into the .fixup section and:
   *   - runs @cleanup_insn,
   *   - jumps back to 668 if the byte kvm_rebooting is non-zero,
   *   - otherwise pushes the address of label 666 and calls
   *     kvm_spurious_fault.
   *
   * Both arguments must be string literals, since they are concatenated
   * with the surrounding literals.
   */
  #define ____kvm_handle_fault_on_reboot(insn, cleanup_insn)  \
      "666: " insn "\n\t"                                     \
      "668: \n\t"                                             \
      ".pushsection .fixup, \"ax\" \n"                        \
      "667: \n\t"                                             \
      cleanup_insn "\n\t"                                     \
      "cmpb $0, kvm_rebooting \n\t"                           \
      "jne 668b \n\t"                                         \
      __ASM_SIZE(push) " $666b \n\t"                          \
      "call kvm_spurious_fault \n\t"                          \
      ".popsection \n\t"                                      \
      _ASM_EXTABLE(666b, 667b)

  /* Same as above, with an empty cleanup instruction. */
  #define __kvm_handle_fault_on_reboot(insn)                  \
      ____kvm_handle_fault_on_reboot(insn, "")
  808. #define KVM_ARCH_WANT_MMU_NOTIFIER
  809. int kvm_unmap_hva(struct kvm *kvm, unsigned long hva);
  810. int kvm_unmap_hva_range(struct kvm *kvm, unsigned long start, unsigned long end);
  811. int kvm_age_hva(struct kvm *kvm, unsigned long hva);
  812. int kvm_test_age_hva(struct kvm *kvm, unsigned long hva);
  813. void kvm_set_spte_hva(struct kvm *kvm, unsigned long hva, pte_t pte);
  814. int cpuid_maxphyaddr(struct kvm_vcpu *vcpu);
  815. int kvm_cpu_has_interrupt(struct kvm_vcpu *vcpu);
  816. int kvm_arch_interrupt_allowed(struct kvm_vcpu *vcpu);
  817. int kvm_cpu_get_interrupt(struct kvm_vcpu *v);
  818. void kvm_define_shared_msr(unsigned index, u32 msr);
  819. void kvm_set_shared_msr(unsigned index, u64 val, u64 mask);
  820. bool kvm_is_linear_rip(struct kvm_vcpu *vcpu, unsigned long linear_rip);
  821. void kvm_arch_async_page_not_present(struct kvm_vcpu *vcpu,
  822. struct kvm_async_pf *work);
  823. void kvm_arch_async_page_present(struct kvm_vcpu *vcpu,
  824. struct kvm_async_pf *work);
  825. void kvm_arch_async_page_ready(struct kvm_vcpu *vcpu,
  826. struct kvm_async_pf *work);
  827. bool kvm_arch_can_inject_async_page_present(struct kvm_vcpu *vcpu);
  828. extern bool kvm_find_async_pf_gfn(struct kvm_vcpu *vcpu, gfn_t gfn);
  829. void kvm_complete_insn_gp(struct kvm_vcpu *vcpu, int err);
  830. int kvm_is_in_guest(void);
  831. void kvm_pmu_init(struct kvm_vcpu *vcpu);
  832. void kvm_pmu_destroy(struct kvm_vcpu *vcpu);
  833. void kvm_pmu_reset(struct kvm_vcpu *vcpu);
  834. void kvm_pmu_cpuid_update(struct kvm_vcpu *vcpu);
  835. bool kvm_pmu_msr(struct kvm_vcpu *vcpu, u32 msr);
  836. int kvm_pmu_get_msr(struct kvm_vcpu *vcpu, u32 msr, u64 *data);
  837. int kvm_pmu_set_msr(struct kvm_vcpu *vcpu, u32 msr, u64 data);
  838. int kvm_pmu_read_pmc(struct kvm_vcpu *vcpu, unsigned pmc, u64 *data);
  839. void kvm_handle_pmu_event(struct kvm_vcpu *vcpu);
  840. void kvm_deliver_pmi(struct kvm_vcpu *vcpu);
  841. #endif /* _ASM_X86_KVM_HOST_H */