paravirt.h 25 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033
  1. #ifndef _ASM_X86_PARAVIRT_H
  2. #define _ASM_X86_PARAVIRT_H
  3. /* Various instructions on x86 need to be replaced for
  4. * para-virtualization: those hooks are defined here. */
  5. #ifdef CONFIG_PARAVIRT
  6. #include <asm/pgtable_types.h>
  7. #include <asm/asm.h>
  8. #include <asm/paravirt_types.h>
  9. #ifndef __ASSEMBLY__
  10. #include <linux/types.h>
  11. #include <linux/cpumask.h>
  12. static inline int paravirt_enabled(void)
  13. {
  14. return pv_info.paravirt_enabled;
  15. }
  16. static inline void load_sp0(struct tss_struct *tss,
  17. struct thread_struct *thread)
  18. {
  19. PVOP_VCALL2(pv_cpu_ops.load_sp0, tss, thread);
  20. }
  21. static inline unsigned long get_wallclock(void)
  22. {
  23. return PVOP_CALL0(unsigned long, pv_time_ops.get_wallclock);
  24. }
  25. static inline int set_wallclock(unsigned long nowtime)
  26. {
  27. return PVOP_CALL1(int, pv_time_ops.set_wallclock, nowtime);
  28. }
  29. /* The paravirtualized CPUID instruction. */
  30. static inline void __cpuid(unsigned int *eax, unsigned int *ebx,
  31. unsigned int *ecx, unsigned int *edx)
  32. {
  33. PVOP_VCALL4(pv_cpu_ops.cpuid, eax, ebx, ecx, edx);
  34. }
  35. /*
  36. * These special macros can be used to get or set a debugging register
  37. */
  38. static inline unsigned long paravirt_get_debugreg(int reg)
  39. {
  40. return PVOP_CALL1(unsigned long, pv_cpu_ops.get_debugreg, reg);
  41. }
  42. #define get_debugreg(var, reg) var = paravirt_get_debugreg(reg)
  43. static inline void set_debugreg(unsigned long val, int reg)
  44. {
  45. PVOP_VCALL2(pv_cpu_ops.set_debugreg, reg, val);
  46. }
  47. static inline void clts(void)
  48. {
  49. PVOP_VCALL0(pv_cpu_ops.clts);
  50. }
  51. static inline unsigned long read_cr0(void)
  52. {
  53. return PVOP_CALL0(unsigned long, pv_cpu_ops.read_cr0);
  54. }
  55. static inline void write_cr0(unsigned long x)
  56. {
  57. PVOP_VCALL1(pv_cpu_ops.write_cr0, x);
  58. }
  59. static inline unsigned long read_cr2(void)
  60. {
  61. return PVOP_CALL0(unsigned long, pv_mmu_ops.read_cr2);
  62. }
  63. static inline void write_cr2(unsigned long x)
  64. {
  65. PVOP_VCALL1(pv_mmu_ops.write_cr2, x);
  66. }
  67. static inline unsigned long read_cr3(void)
  68. {
  69. return PVOP_CALL0(unsigned long, pv_mmu_ops.read_cr3);
  70. }
  71. static inline void write_cr3(unsigned long x)
  72. {
  73. PVOP_VCALL1(pv_mmu_ops.write_cr3, x);
  74. }
  75. static inline unsigned long read_cr4(void)
  76. {
  77. return PVOP_CALL0(unsigned long, pv_cpu_ops.read_cr4);
  78. }
  79. static inline unsigned long read_cr4_safe(void)
  80. {
  81. return PVOP_CALL0(unsigned long, pv_cpu_ops.read_cr4_safe);
  82. }
  83. static inline void write_cr4(unsigned long x)
  84. {
  85. PVOP_VCALL1(pv_cpu_ops.write_cr4, x);
  86. }
  87. #ifdef CONFIG_X86_64
  88. static inline unsigned long read_cr8(void)
  89. {
  90. return PVOP_CALL0(unsigned long, pv_cpu_ops.read_cr8);
  91. }
  92. static inline void write_cr8(unsigned long x)
  93. {
  94. PVOP_VCALL1(pv_cpu_ops.write_cr8, x);
  95. }
  96. #endif
  97. static inline void raw_safe_halt(void)
  98. {
  99. PVOP_VCALL0(pv_irq_ops.safe_halt);
  100. }
  101. static inline void halt(void)
  102. {
  103. PVOP_VCALL0(pv_irq_ops.safe_halt);
  104. }
  105. static inline void wbinvd(void)
  106. {
  107. PVOP_VCALL0(pv_cpu_ops.wbinvd);
  108. }
  109. #define get_kernel_rpl() (pv_info.kernel_rpl)
  110. static inline u64 paravirt_read_msr(unsigned msr, int *err)
  111. {
  112. return PVOP_CALL2(u64, pv_cpu_ops.read_msr, msr, err);
  113. }
  114. static inline u64 paravirt_read_msr_amd(unsigned msr, int *err)
  115. {
  116. return PVOP_CALL2(u64, pv_cpu_ops.read_msr_amd, msr, err);
  117. }
  118. static inline int paravirt_write_msr(unsigned msr, unsigned low, unsigned high)
  119. {
  120. return PVOP_CALL3(int, pv_cpu_ops.write_msr, msr, low, high);
  121. }
  122. /* These should all do BUG_ON(_err), but our headers are too tangled. */
  123. #define rdmsr(msr, val1, val2) \
  124. do { \
  125. int _err; \
  126. u64 _l = paravirt_read_msr(msr, &_err); \
  127. val1 = (u32)_l; \
  128. val2 = _l >> 32; \
  129. } while (0)
  130. #define wrmsr(msr, val1, val2) \
  131. do { \
  132. paravirt_write_msr(msr, val1, val2); \
  133. } while (0)
  134. #define rdmsrl(msr, val) \
  135. do { \
  136. int _err; \
  137. val = paravirt_read_msr(msr, &_err); \
  138. } while (0)
  139. #define wrmsrl(msr, val) wrmsr(msr, (u32)((u64)(val)), ((u64)(val))>>32)
  140. #define wrmsr_safe(msr, a, b) paravirt_write_msr(msr, a, b)
  141. /* rdmsr with exception handling */
  142. #define rdmsr_safe(msr, a, b) \
  143. ({ \
  144. int _err; \
  145. u64 _l = paravirt_read_msr(msr, &_err); \
  146. (*a) = (u32)_l; \
  147. (*b) = _l >> 32; \
  148. _err; \
  149. })
  150. static inline int rdmsrl_safe(unsigned msr, unsigned long long *p)
  151. {
  152. int err;
  153. *p = paravirt_read_msr(msr, &err);
  154. return err;
  155. }
  156. static inline int rdmsrl_amd_safe(unsigned msr, unsigned long long *p)
  157. {
  158. int err;
  159. *p = paravirt_read_msr_amd(msr, &err);
  160. return err;
  161. }
  162. static inline u64 paravirt_read_tsc(void)
  163. {
  164. return PVOP_CALL0(u64, pv_cpu_ops.read_tsc);
  165. }
  166. #define rdtscl(low) \
  167. do { \
  168. u64 _l = paravirt_read_tsc(); \
  169. low = (int)_l; \
  170. } while (0)
  171. #define rdtscll(val) (val = paravirt_read_tsc())
  172. static inline unsigned long long paravirt_sched_clock(void)
  173. {
  174. return PVOP_CALL0(unsigned long long, pv_time_ops.sched_clock);
  175. }
  176. #define calibrate_tsc() (pv_time_ops.get_tsc_khz())
  177. static inline unsigned long long paravirt_read_pmc(int counter)
  178. {
  179. return PVOP_CALL1(u64, pv_cpu_ops.read_pmc, counter);
  180. }
  181. #define rdpmc(counter, low, high) \
  182. do { \
  183. u64 _l = paravirt_read_pmc(counter); \
  184. low = (u32)_l; \
  185. high = _l >> 32; \
  186. } while (0)
  187. static inline unsigned long long paravirt_rdtscp(unsigned int *aux)
  188. {
  189. return PVOP_CALL1(u64, pv_cpu_ops.read_tscp, aux);
  190. }
  191. #define rdtscp(low, high, aux) \
  192. do { \
  193. int __aux; \
  194. unsigned long __val = paravirt_rdtscp(&__aux); \
  195. (low) = (u32)__val; \
  196. (high) = (u32)(__val >> 32); \
  197. (aux) = __aux; \
  198. } while (0)
  199. #define rdtscpll(val, aux) \
  200. do { \
  201. unsigned long __aux; \
  202. val = paravirt_rdtscp(&__aux); \
  203. (aux) = __aux; \
  204. } while (0)
  205. static inline void paravirt_alloc_ldt(struct desc_struct *ldt, unsigned entries)
  206. {
  207. PVOP_VCALL2(pv_cpu_ops.alloc_ldt, ldt, entries);
  208. }
  209. static inline void paravirt_free_ldt(struct desc_struct *ldt, unsigned entries)
  210. {
  211. PVOP_VCALL2(pv_cpu_ops.free_ldt, ldt, entries);
  212. }
  213. static inline void load_TR_desc(void)
  214. {
  215. PVOP_VCALL0(pv_cpu_ops.load_tr_desc);
  216. }
  217. static inline void load_gdt(const struct desc_ptr *dtr)
  218. {
  219. PVOP_VCALL1(pv_cpu_ops.load_gdt, dtr);
  220. }
  221. static inline void load_idt(const struct desc_ptr *dtr)
  222. {
  223. PVOP_VCALL1(pv_cpu_ops.load_idt, dtr);
  224. }
  225. static inline void set_ldt(const void *addr, unsigned entries)
  226. {
  227. PVOP_VCALL2(pv_cpu_ops.set_ldt, addr, entries);
  228. }
  229. static inline void store_gdt(struct desc_ptr *dtr)
  230. {
  231. PVOP_VCALL1(pv_cpu_ops.store_gdt, dtr);
  232. }
  233. static inline void store_idt(struct desc_ptr *dtr)
  234. {
  235. PVOP_VCALL1(pv_cpu_ops.store_idt, dtr);
  236. }
  237. static inline unsigned long paravirt_store_tr(void)
  238. {
  239. return PVOP_CALL0(unsigned long, pv_cpu_ops.store_tr);
  240. }
  241. #define store_tr(tr) ((tr) = paravirt_store_tr())
  242. static inline void load_TLS(struct thread_struct *t, unsigned cpu)
  243. {
  244. PVOP_VCALL2(pv_cpu_ops.load_tls, t, cpu);
  245. }
  246. #ifdef CONFIG_X86_64
  247. static inline void load_gs_index(unsigned int gs)
  248. {
  249. PVOP_VCALL1(pv_cpu_ops.load_gs_index, gs);
  250. }
  251. #endif
  252. static inline void write_ldt_entry(struct desc_struct *dt, int entry,
  253. const void *desc)
  254. {
  255. PVOP_VCALL3(pv_cpu_ops.write_ldt_entry, dt, entry, desc);
  256. }
  257. static inline void write_gdt_entry(struct desc_struct *dt, int entry,
  258. void *desc, int type)
  259. {
  260. PVOP_VCALL4(pv_cpu_ops.write_gdt_entry, dt, entry, desc, type);
  261. }
  262. static inline void write_idt_entry(gate_desc *dt, int entry, const gate_desc *g)
  263. {
  264. PVOP_VCALL3(pv_cpu_ops.write_idt_entry, dt, entry, g);
  265. }
  266. static inline void set_iopl_mask(unsigned mask)
  267. {
  268. PVOP_VCALL1(pv_cpu_ops.set_iopl_mask, mask);
  269. }
  270. /* The paravirtualized I/O functions */
  271. static inline void slow_down_io(void)
  272. {
  273. pv_cpu_ops.io_delay();
  274. #ifdef REALLY_SLOW_IO
  275. pv_cpu_ops.io_delay();
  276. pv_cpu_ops.io_delay();
  277. pv_cpu_ops.io_delay();
  278. #endif
  279. }
  280. #ifdef CONFIG_SMP
  281. static inline void startup_ipi_hook(int phys_apicid, unsigned long start_eip,
  282. unsigned long start_esp)
  283. {
  284. PVOP_VCALL3(pv_apic_ops.startup_ipi_hook,
  285. phys_apicid, start_eip, start_esp);
  286. }
  287. #endif
  288. static inline void paravirt_activate_mm(struct mm_struct *prev,
  289. struct mm_struct *next)
  290. {
  291. PVOP_VCALL2(pv_mmu_ops.activate_mm, prev, next);
  292. }
  293. static inline void arch_dup_mmap(struct mm_struct *oldmm,
  294. struct mm_struct *mm)
  295. {
  296. PVOP_VCALL2(pv_mmu_ops.dup_mmap, oldmm, mm);
  297. }
  298. static inline void arch_exit_mmap(struct mm_struct *mm)
  299. {
  300. PVOP_VCALL1(pv_mmu_ops.exit_mmap, mm);
  301. }
  302. static inline void __flush_tlb(void)
  303. {
  304. PVOP_VCALL0(pv_mmu_ops.flush_tlb_user);
  305. }
  306. static inline void __flush_tlb_global(void)
  307. {
  308. PVOP_VCALL0(pv_mmu_ops.flush_tlb_kernel);
  309. }
  310. static inline void __flush_tlb_single(unsigned long addr)
  311. {
  312. PVOP_VCALL1(pv_mmu_ops.flush_tlb_single, addr);
  313. }
  314. static inline void flush_tlb_others(const struct cpumask *cpumask,
  315. struct mm_struct *mm,
  316. unsigned long va)
  317. {
  318. PVOP_VCALL3(pv_mmu_ops.flush_tlb_others, cpumask, mm, va);
  319. }
  320. static inline int paravirt_pgd_alloc(struct mm_struct *mm)
  321. {
  322. return PVOP_CALL1(int, pv_mmu_ops.pgd_alloc, mm);
  323. }
  324. static inline void paravirt_pgd_free(struct mm_struct *mm, pgd_t *pgd)
  325. {
  326. PVOP_VCALL2(pv_mmu_ops.pgd_free, mm, pgd);
  327. }
  328. static inline void paravirt_alloc_pte(struct mm_struct *mm, unsigned long pfn)
  329. {
  330. PVOP_VCALL2(pv_mmu_ops.alloc_pte, mm, pfn);
  331. }
  332. static inline void paravirt_release_pte(unsigned long pfn)
  333. {
  334. PVOP_VCALL1(pv_mmu_ops.release_pte, pfn);
  335. }
  336. static inline void paravirt_alloc_pmd(struct mm_struct *mm, unsigned long pfn)
  337. {
  338. PVOP_VCALL2(pv_mmu_ops.alloc_pmd, mm, pfn);
  339. }
  340. static inline void paravirt_alloc_pmd_clone(unsigned long pfn, unsigned long clonepfn,
  341. unsigned long start, unsigned long count)
  342. {
  343. PVOP_VCALL4(pv_mmu_ops.alloc_pmd_clone, pfn, clonepfn, start, count);
  344. }
  345. static inline void paravirt_release_pmd(unsigned long pfn)
  346. {
  347. PVOP_VCALL1(pv_mmu_ops.release_pmd, pfn);
  348. }
  349. static inline void paravirt_alloc_pud(struct mm_struct *mm, unsigned long pfn)
  350. {
  351. PVOP_VCALL2(pv_mmu_ops.alloc_pud, mm, pfn);
  352. }
  353. static inline void paravirt_release_pud(unsigned long pfn)
  354. {
  355. PVOP_VCALL1(pv_mmu_ops.release_pud, pfn);
  356. }
  357. #ifdef CONFIG_HIGHPTE
  358. static inline void *kmap_atomic_pte(struct page *page, enum km_type type)
  359. {
  360. unsigned long ret;
  361. ret = PVOP_CALL2(unsigned long, pv_mmu_ops.kmap_atomic_pte, page, type);
  362. return (void *)ret;
  363. }
  364. #endif
  365. static inline void pte_update(struct mm_struct *mm, unsigned long addr,
  366. pte_t *ptep)
  367. {
  368. PVOP_VCALL3(pv_mmu_ops.pte_update, mm, addr, ptep);
  369. }
  370. static inline void pte_update_defer(struct mm_struct *mm, unsigned long addr,
  371. pte_t *ptep)
  372. {
  373. PVOP_VCALL3(pv_mmu_ops.pte_update_defer, mm, addr, ptep);
  374. }
  375. static inline pte_t __pte(pteval_t val)
  376. {
  377. pteval_t ret;
  378. if (sizeof(pteval_t) > sizeof(long))
  379. ret = PVOP_CALLEE2(pteval_t,
  380. pv_mmu_ops.make_pte,
  381. val, (u64)val >> 32);
  382. else
  383. ret = PVOP_CALLEE1(pteval_t,
  384. pv_mmu_ops.make_pte,
  385. val);
  386. return (pte_t) { .pte = ret };
  387. }
  388. static inline pteval_t pte_val(pte_t pte)
  389. {
  390. pteval_t ret;
  391. if (sizeof(pteval_t) > sizeof(long))
  392. ret = PVOP_CALLEE2(pteval_t, pv_mmu_ops.pte_val,
  393. pte.pte, (u64)pte.pte >> 32);
  394. else
  395. ret = PVOP_CALLEE1(pteval_t, pv_mmu_ops.pte_val,
  396. pte.pte);
  397. return ret;
  398. }
  399. static inline pgd_t __pgd(pgdval_t val)
  400. {
  401. pgdval_t ret;
  402. if (sizeof(pgdval_t) > sizeof(long))
  403. ret = PVOP_CALLEE2(pgdval_t, pv_mmu_ops.make_pgd,
  404. val, (u64)val >> 32);
  405. else
  406. ret = PVOP_CALLEE1(pgdval_t, pv_mmu_ops.make_pgd,
  407. val);
  408. return (pgd_t) { ret };
  409. }
  410. static inline pgdval_t pgd_val(pgd_t pgd)
  411. {
  412. pgdval_t ret;
  413. if (sizeof(pgdval_t) > sizeof(long))
  414. ret = PVOP_CALLEE2(pgdval_t, pv_mmu_ops.pgd_val,
  415. pgd.pgd, (u64)pgd.pgd >> 32);
  416. else
  417. ret = PVOP_CALLEE1(pgdval_t, pv_mmu_ops.pgd_val,
  418. pgd.pgd);
  419. return ret;
  420. }
  421. #define __HAVE_ARCH_PTEP_MODIFY_PROT_TRANSACTION
  422. static inline pte_t ptep_modify_prot_start(struct mm_struct *mm, unsigned long addr,
  423. pte_t *ptep)
  424. {
  425. pteval_t ret;
  426. ret = PVOP_CALL3(pteval_t, pv_mmu_ops.ptep_modify_prot_start,
  427. mm, addr, ptep);
  428. return (pte_t) { .pte = ret };
  429. }
  430. static inline void ptep_modify_prot_commit(struct mm_struct *mm, unsigned long addr,
  431. pte_t *ptep, pte_t pte)
  432. {
  433. if (sizeof(pteval_t) > sizeof(long))
  434. /* 5 arg words */
  435. pv_mmu_ops.ptep_modify_prot_commit(mm, addr, ptep, pte);
  436. else
  437. PVOP_VCALL4(pv_mmu_ops.ptep_modify_prot_commit,
  438. mm, addr, ptep, pte.pte);
  439. }
  440. static inline void set_pte(pte_t *ptep, pte_t pte)
  441. {
  442. if (sizeof(pteval_t) > sizeof(long))
  443. PVOP_VCALL3(pv_mmu_ops.set_pte, ptep,
  444. pte.pte, (u64)pte.pte >> 32);
  445. else
  446. PVOP_VCALL2(pv_mmu_ops.set_pte, ptep,
  447. pte.pte);
  448. }
  449. static inline void set_pte_at(struct mm_struct *mm, unsigned long addr,
  450. pte_t *ptep, pte_t pte)
  451. {
  452. if (sizeof(pteval_t) > sizeof(long))
  453. /* 5 arg words */
  454. pv_mmu_ops.set_pte_at(mm, addr, ptep, pte);
  455. else
  456. PVOP_VCALL4(pv_mmu_ops.set_pte_at, mm, addr, ptep, pte.pte);
  457. }
  458. static inline void set_pmd(pmd_t *pmdp, pmd_t pmd)
  459. {
  460. pmdval_t val = native_pmd_val(pmd);
  461. if (sizeof(pmdval_t) > sizeof(long))
  462. PVOP_VCALL3(pv_mmu_ops.set_pmd, pmdp, val, (u64)val >> 32);
  463. else
  464. PVOP_VCALL2(pv_mmu_ops.set_pmd, pmdp, val);
  465. }
  466. #if PAGETABLE_LEVELS >= 3
  467. static inline pmd_t __pmd(pmdval_t val)
  468. {
  469. pmdval_t ret;
  470. if (sizeof(pmdval_t) > sizeof(long))
  471. ret = PVOP_CALLEE2(pmdval_t, pv_mmu_ops.make_pmd,
  472. val, (u64)val >> 32);
  473. else
  474. ret = PVOP_CALLEE1(pmdval_t, pv_mmu_ops.make_pmd,
  475. val);
  476. return (pmd_t) { ret };
  477. }
  478. static inline pmdval_t pmd_val(pmd_t pmd)
  479. {
  480. pmdval_t ret;
  481. if (sizeof(pmdval_t) > sizeof(long))
  482. ret = PVOP_CALLEE2(pmdval_t, pv_mmu_ops.pmd_val,
  483. pmd.pmd, (u64)pmd.pmd >> 32);
  484. else
  485. ret = PVOP_CALLEE1(pmdval_t, pv_mmu_ops.pmd_val,
  486. pmd.pmd);
  487. return ret;
  488. }
  489. static inline void set_pud(pud_t *pudp, pud_t pud)
  490. {
  491. pudval_t val = native_pud_val(pud);
  492. if (sizeof(pudval_t) > sizeof(long))
  493. PVOP_VCALL3(pv_mmu_ops.set_pud, pudp,
  494. val, (u64)val >> 32);
  495. else
  496. PVOP_VCALL2(pv_mmu_ops.set_pud, pudp,
  497. val);
  498. }
  499. #if PAGETABLE_LEVELS == 4
  500. static inline pud_t __pud(pudval_t val)
  501. {
  502. pudval_t ret;
  503. if (sizeof(pudval_t) > sizeof(long))
  504. ret = PVOP_CALLEE2(pudval_t, pv_mmu_ops.make_pud,
  505. val, (u64)val >> 32);
  506. else
  507. ret = PVOP_CALLEE1(pudval_t, pv_mmu_ops.make_pud,
  508. val);
  509. return (pud_t) { ret };
  510. }
  511. static inline pudval_t pud_val(pud_t pud)
  512. {
  513. pudval_t ret;
  514. if (sizeof(pudval_t) > sizeof(long))
  515. ret = PVOP_CALLEE2(pudval_t, pv_mmu_ops.pud_val,
  516. pud.pud, (u64)pud.pud >> 32);
  517. else
  518. ret = PVOP_CALLEE1(pudval_t, pv_mmu_ops.pud_val,
  519. pud.pud);
  520. return ret;
  521. }
  522. static inline void set_pgd(pgd_t *pgdp, pgd_t pgd)
  523. {
  524. pgdval_t val = native_pgd_val(pgd);
  525. if (sizeof(pgdval_t) > sizeof(long))
  526. PVOP_VCALL3(pv_mmu_ops.set_pgd, pgdp,
  527. val, (u64)val >> 32);
  528. else
  529. PVOP_VCALL2(pv_mmu_ops.set_pgd, pgdp,
  530. val);
  531. }
  532. static inline void pgd_clear(pgd_t *pgdp)
  533. {
  534. set_pgd(pgdp, __pgd(0));
  535. }
  536. static inline void pud_clear(pud_t *pudp)
  537. {
  538. set_pud(pudp, __pud(0));
  539. }
  540. #endif /* PAGETABLE_LEVELS == 4 */
  541. #endif /* PAGETABLE_LEVELS >= 3 */
  542. #ifdef CONFIG_X86_PAE
  543. /* Special-case pte-setting operations for PAE, which can't update a
  544. 64-bit pte atomically */
  545. static inline void set_pte_atomic(pte_t *ptep, pte_t pte)
  546. {
  547. PVOP_VCALL3(pv_mmu_ops.set_pte_atomic, ptep,
  548. pte.pte, pte.pte >> 32);
  549. }
  550. static inline void pte_clear(struct mm_struct *mm, unsigned long addr,
  551. pte_t *ptep)
  552. {
  553. PVOP_VCALL3(pv_mmu_ops.pte_clear, mm, addr, ptep);
  554. }
  555. static inline void pmd_clear(pmd_t *pmdp)
  556. {
  557. PVOP_VCALL1(pv_mmu_ops.pmd_clear, pmdp);
  558. }
  559. #else /* !CONFIG_X86_PAE */
  560. static inline void set_pte_atomic(pte_t *ptep, pte_t pte)
  561. {
  562. set_pte(ptep, pte);
  563. }
  564. static inline void pte_clear(struct mm_struct *mm, unsigned long addr,
  565. pte_t *ptep)
  566. {
  567. set_pte_at(mm, addr, ptep, __pte(0));
  568. }
  569. static inline void pmd_clear(pmd_t *pmdp)
  570. {
  571. set_pmd(pmdp, __pmd(0));
  572. }
  573. #endif /* CONFIG_X86_PAE */
  574. #define __HAVE_ARCH_START_CONTEXT_SWITCH
  575. static inline void arch_start_context_switch(struct task_struct *prev)
  576. {
  577. PVOP_VCALL1(pv_cpu_ops.start_context_switch, prev);
  578. }
  579. static inline void arch_end_context_switch(struct task_struct *next)
  580. {
  581. PVOP_VCALL1(pv_cpu_ops.end_context_switch, next);
  582. }
  583. #define __HAVE_ARCH_ENTER_LAZY_MMU_MODE
  584. static inline void arch_enter_lazy_mmu_mode(void)
  585. {
  586. PVOP_VCALL0(pv_mmu_ops.lazy_mode.enter);
  587. }
  588. static inline void arch_leave_lazy_mmu_mode(void)
  589. {
  590. PVOP_VCALL0(pv_mmu_ops.lazy_mode.leave);
  591. }
  592. void arch_flush_lazy_mmu_mode(void);
  593. static inline void __set_fixmap(unsigned /* enum fixed_addresses */ idx,
  594. phys_addr_t phys, pgprot_t flags)
  595. {
  596. pv_mmu_ops.set_fixmap(idx, phys, flags);
  597. }
  598. #if defined(CONFIG_SMP) && defined(CONFIG_PARAVIRT_SPINLOCKS)
  599. static inline int __raw_spin_is_locked(struct raw_spinlock *lock)
  600. {
  601. return PVOP_CALL1(int, pv_lock_ops.spin_is_locked, lock);
  602. }
  603. static inline int __raw_spin_is_contended(struct raw_spinlock *lock)
  604. {
  605. return PVOP_CALL1(int, pv_lock_ops.spin_is_contended, lock);
  606. }
  607. #define __raw_spin_is_contended __raw_spin_is_contended
  608. static __always_inline void __raw_spin_lock(struct raw_spinlock *lock)
  609. {
  610. PVOP_VCALL1(pv_lock_ops.spin_lock, lock);
  611. }
  612. static __always_inline void __raw_spin_lock_flags(struct raw_spinlock *lock,
  613. unsigned long flags)
  614. {
  615. PVOP_VCALL2(pv_lock_ops.spin_lock_flags, lock, flags);
  616. }
  617. static __always_inline int __raw_spin_trylock(struct raw_spinlock *lock)
  618. {
  619. return PVOP_CALL1(int, pv_lock_ops.spin_trylock, lock);
  620. }
  621. static __always_inline void __raw_spin_unlock(struct raw_spinlock *lock)
  622. {
  623. PVOP_VCALL1(pv_lock_ops.spin_unlock, lock);
  624. }
  625. #endif
  626. #ifdef CONFIG_X86_32
  627. #define PV_SAVE_REGS "pushl %ecx; pushl %edx;"
  628. #define PV_RESTORE_REGS "popl %edx; popl %ecx;"
  629. /* save and restore all caller-save registers, except return value */
  630. #define PV_SAVE_ALL_CALLER_REGS "pushl %ecx;"
  631. #define PV_RESTORE_ALL_CALLER_REGS "popl %ecx;"
  632. #define PV_FLAGS_ARG "0"
  633. #define PV_EXTRA_CLOBBERS
  634. #define PV_VEXTRA_CLOBBERS
  635. #else
  636. /* save and restore all caller-save registers, except return value */
  637. #define PV_SAVE_ALL_CALLER_REGS \
  638. "push %rcx;" \
  639. "push %rdx;" \
  640. "push %rsi;" \
  641. "push %rdi;" \
  642. "push %r8;" \
  643. "push %r9;" \
  644. "push %r10;" \
  645. "push %r11;"
  646. #define PV_RESTORE_ALL_CALLER_REGS \
  647. "pop %r11;" \
  648. "pop %r10;" \
  649. "pop %r9;" \
  650. "pop %r8;" \
  651. "pop %rdi;" \
  652. "pop %rsi;" \
  653. "pop %rdx;" \
  654. "pop %rcx;"
  655. /* We save some registers, but all of them, that's too much. We clobber all
  656. * caller saved registers but the argument parameter */
  657. #define PV_SAVE_REGS "pushq %%rdi;"
  658. #define PV_RESTORE_REGS "popq %%rdi;"
  659. #define PV_EXTRA_CLOBBERS EXTRA_CLOBBERS, "rcx" , "rdx", "rsi"
  660. #define PV_VEXTRA_CLOBBERS EXTRA_CLOBBERS, "rdi", "rcx" , "rdx", "rsi"
  661. #define PV_FLAGS_ARG "D"
  662. #endif
  663. /*
  664. * Generate a thunk around a function which saves all caller-save
  665. * registers except for the return value. This allows C functions to
  666. * be called from assembler code where fewer than normal registers are
  667. * available. It may also help code generation around calls from C
  668. * code if the common case doesn't use many registers.
  669. *
  670. * When a callee is wrapped in a thunk, the caller can assume that all
  671. * arg regs and all scratch registers are preserved across the
  672. * call. The return value in rax/eax will not be saved, even for void
  673. * functions.
  674. */
  675. #define PV_CALLEE_SAVE_REGS_THUNK(func) \
  676. extern typeof(func) __raw_callee_save_##func; \
  677. static void *__##func##__ __used = func; \
  678. \
  679. asm(".pushsection .text;" \
  680. "__raw_callee_save_" #func ": " \
  681. PV_SAVE_ALL_CALLER_REGS \
  682. "call " #func ";" \
  683. PV_RESTORE_ALL_CALLER_REGS \
  684. "ret;" \
  685. ".popsection")
  686. /* Get a reference to a callee-save function */
  687. #define PV_CALLEE_SAVE(func) \
  688. ((struct paravirt_callee_save) { __raw_callee_save_##func })
  689. /* Promise that "func" already uses the right calling convention */
  690. #define __PV_IS_CALLEE_SAVE(func) \
  691. ((struct paravirt_callee_save) { func })
  692. static inline unsigned long __raw_local_save_flags(void)
  693. {
  694. unsigned long f;
  695. asm volatile(paravirt_alt(PARAVIRT_CALL)
  696. : "=a"(f)
  697. : paravirt_type(pv_irq_ops.save_fl),
  698. paravirt_clobber(CLBR_EAX)
  699. : "memory", "cc");
  700. return f;
  701. }
  702. static inline void raw_local_irq_restore(unsigned long f)
  703. {
  704. asm volatile(paravirt_alt(PARAVIRT_CALL)
  705. : "=a"(f)
  706. : PV_FLAGS_ARG(f),
  707. paravirt_type(pv_irq_ops.restore_fl),
  708. paravirt_clobber(CLBR_EAX)
  709. : "memory", "cc");
  710. }
  711. static inline void raw_local_irq_disable(void)
  712. {
  713. asm volatile(paravirt_alt(PARAVIRT_CALL)
  714. :
  715. : paravirt_type(pv_irq_ops.irq_disable),
  716. paravirt_clobber(CLBR_EAX)
  717. : "memory", "eax", "cc");
  718. }
  719. static inline void raw_local_irq_enable(void)
  720. {
  721. asm volatile(paravirt_alt(PARAVIRT_CALL)
  722. :
  723. : paravirt_type(pv_irq_ops.irq_enable),
  724. paravirt_clobber(CLBR_EAX)
  725. : "memory", "eax", "cc");
  726. }
  727. static inline unsigned long __raw_local_irq_save(void)
  728. {
  729. unsigned long f;
  730. f = __raw_local_save_flags();
  731. raw_local_irq_disable();
  732. return f;
  733. }
  734. /* Make sure as little as possible of this mess escapes. */
  735. #undef PARAVIRT_CALL
  736. #undef __PVOP_CALL
  737. #undef __PVOP_VCALL
  738. #undef PVOP_VCALL0
  739. #undef PVOP_CALL0
  740. #undef PVOP_VCALL1
  741. #undef PVOP_CALL1
  742. #undef PVOP_VCALL2
  743. #undef PVOP_CALL2
  744. #undef PVOP_VCALL3
  745. #undef PVOP_CALL3
  746. #undef PVOP_VCALL4
  747. #undef PVOP_CALL4
  748. extern void default_banner(void);
  749. #else /* __ASSEMBLY__ */
  750. #define _PVSITE(ptype, clobbers, ops, word, algn) \
  751. 771:; \
  752. ops; \
  753. 772:; \
  754. .pushsection .parainstructions,"a"; \
  755. .align algn; \
  756. word 771b; \
  757. .byte ptype; \
  758. .byte 772b-771b; \
  759. .short clobbers; \
  760. .popsection
  761. #define COND_PUSH(set, mask, reg) \
  762. .if ((~(set)) & mask); push %reg; .endif
  763. #define COND_POP(set, mask, reg) \
  764. .if ((~(set)) & mask); pop %reg; .endif
  765. #ifdef CONFIG_X86_64
  766. #define PV_SAVE_REGS(set) \
  767. COND_PUSH(set, CLBR_RAX, rax); \
  768. COND_PUSH(set, CLBR_RCX, rcx); \
  769. COND_PUSH(set, CLBR_RDX, rdx); \
  770. COND_PUSH(set, CLBR_RSI, rsi); \
  771. COND_PUSH(set, CLBR_RDI, rdi); \
  772. COND_PUSH(set, CLBR_R8, r8); \
  773. COND_PUSH(set, CLBR_R9, r9); \
  774. COND_PUSH(set, CLBR_R10, r10); \
  775. COND_PUSH(set, CLBR_R11, r11)
  776. #define PV_RESTORE_REGS(set) \
  777. COND_POP(set, CLBR_R11, r11); \
  778. COND_POP(set, CLBR_R10, r10); \
  779. COND_POP(set, CLBR_R9, r9); \
  780. COND_POP(set, CLBR_R8, r8); \
  781. COND_POP(set, CLBR_RDI, rdi); \
  782. COND_POP(set, CLBR_RSI, rsi); \
  783. COND_POP(set, CLBR_RDX, rdx); \
  784. COND_POP(set, CLBR_RCX, rcx); \
  785. COND_POP(set, CLBR_RAX, rax)
  786. #define PARA_PATCH(struct, off) ((PARAVIRT_PATCH_##struct + (off)) / 8)
  787. #define PARA_SITE(ptype, clobbers, ops) _PVSITE(ptype, clobbers, ops, .quad, 8)
  788. #define PARA_INDIRECT(addr) *addr(%rip)
  789. #else
  790. #define PV_SAVE_REGS(set) \
  791. COND_PUSH(set, CLBR_EAX, eax); \
  792. COND_PUSH(set, CLBR_EDI, edi); \
  793. COND_PUSH(set, CLBR_ECX, ecx); \
  794. COND_PUSH(set, CLBR_EDX, edx)
  795. #define PV_RESTORE_REGS(set) \
  796. COND_POP(set, CLBR_EDX, edx); \
  797. COND_POP(set, CLBR_ECX, ecx); \
  798. COND_POP(set, CLBR_EDI, edi); \
  799. COND_POP(set, CLBR_EAX, eax)
  800. #define PARA_PATCH(struct, off) ((PARAVIRT_PATCH_##struct + (off)) / 4)
  801. #define PARA_SITE(ptype, clobbers, ops) _PVSITE(ptype, clobbers, ops, .long, 4)
  802. #define PARA_INDIRECT(addr) *%cs:addr
  803. #endif
  804. #define INTERRUPT_RETURN \
  805. PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_iret), CLBR_NONE, \
  806. jmp PARA_INDIRECT(pv_cpu_ops+PV_CPU_iret))
  807. #define DISABLE_INTERRUPTS(clobbers) \
  808. PARA_SITE(PARA_PATCH(pv_irq_ops, PV_IRQ_irq_disable), clobbers, \
  809. PV_SAVE_REGS(clobbers | CLBR_CALLEE_SAVE); \
  810. call PARA_INDIRECT(pv_irq_ops+PV_IRQ_irq_disable); \
  811. PV_RESTORE_REGS(clobbers | CLBR_CALLEE_SAVE);)
  812. #define ENABLE_INTERRUPTS(clobbers) \
  813. PARA_SITE(PARA_PATCH(pv_irq_ops, PV_IRQ_irq_enable), clobbers, \
  814. PV_SAVE_REGS(clobbers | CLBR_CALLEE_SAVE); \
  815. call PARA_INDIRECT(pv_irq_ops+PV_IRQ_irq_enable); \
  816. PV_RESTORE_REGS(clobbers | CLBR_CALLEE_SAVE);)
  817. #define USERGS_SYSRET32 \
  818. PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_usergs_sysret32), \
  819. CLBR_NONE, \
  820. jmp PARA_INDIRECT(pv_cpu_ops+PV_CPU_usergs_sysret32))
  821. #ifdef CONFIG_X86_32
  822. #define GET_CR0_INTO_EAX \
  823. push %ecx; push %edx; \
  824. call PARA_INDIRECT(pv_cpu_ops+PV_CPU_read_cr0); \
  825. pop %edx; pop %ecx
  826. #define ENABLE_INTERRUPTS_SYSEXIT \
  827. PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_irq_enable_sysexit), \
  828. CLBR_NONE, \
  829. jmp PARA_INDIRECT(pv_cpu_ops+PV_CPU_irq_enable_sysexit))
  830. #else /* !CONFIG_X86_32 */
  831. /*
  832. * If swapgs is used while the userspace stack is still current,
  833. * there's no way to call a pvop. The PV replacement *must* be
  834. * inlined, or the swapgs instruction must be trapped and emulated.
  835. */
  836. #define SWAPGS_UNSAFE_STACK \
  837. PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_swapgs), CLBR_NONE, \
  838. swapgs)
  839. /*
  840. * Note: swapgs is very special, and in practise is either going to be
  841. * implemented with a single "swapgs" instruction or something very
  842. * special. Either way, we don't need to save any registers for
  843. * it.
  844. */
  845. #define SWAPGS \
  846. PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_swapgs), CLBR_NONE, \
  847. call PARA_INDIRECT(pv_cpu_ops+PV_CPU_swapgs) \
  848. )
  849. #define GET_CR2_INTO_RCX \
  850. call PARA_INDIRECT(pv_mmu_ops+PV_MMU_read_cr2); \
  851. movq %rax, %rcx; \
  852. xorq %rax, %rax;
  853. #define PARAVIRT_ADJUST_EXCEPTION_FRAME \
  854. PARA_SITE(PARA_PATCH(pv_irq_ops, PV_IRQ_adjust_exception_frame), \
  855. CLBR_NONE, \
  856. call PARA_INDIRECT(pv_irq_ops+PV_IRQ_adjust_exception_frame))
  857. #define USERGS_SYSRET64 \
  858. PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_usergs_sysret64), \
  859. CLBR_NONE, \
  860. jmp PARA_INDIRECT(pv_cpu_ops+PV_CPU_usergs_sysret64))
  861. #define ENABLE_INTERRUPTS_SYSEXIT32 \
  862. PARA_SITE(PARA_PATCH(pv_cpu_ops, PV_CPU_irq_enable_sysexit), \
  863. CLBR_NONE, \
  864. jmp PARA_INDIRECT(pv_cpu_ops+PV_CPU_irq_enable_sysexit))
  865. #endif /* CONFIG_X86_32 */
  866. #endif /* __ASSEMBLY__ */
  867. #else /* CONFIG_PARAVIRT */
  868. # define default_banner x86_init_noop
  869. #endif /* !CONFIG_PARAVIRT */
  870. #endif /* _ASM_X86_PARAVIRT_H */