/* pgtable-3level.h */
  1. #ifndef _ASM_X86_PGTABLE_3LEVEL_H
  2. #define _ASM_X86_PGTABLE_3LEVEL_H
  3. /*
  4. * Intel Physical Address Extension (PAE) Mode - three-level page
  5. * tables on PPro+ CPUs.
  6. *
  7. * Copyright (C) 1999 Ingo Molnar <mingo@redhat.com>
  8. */
  9. #define pte_ERROR(e) \
  10. printk("%s:%d: bad pte %p(%08lx%08lx).\n", \
  11. __FILE__, __LINE__, &(e), (e).pte_high, (e).pte_low)
  12. #define pmd_ERROR(e) \
  13. printk("%s:%d: bad pmd %p(%016Lx).\n", \
  14. __FILE__, __LINE__, &(e), pmd_val(e))
  15. #define pgd_ERROR(e) \
  16. printk("%s:%d: bad pgd %p(%016Lx).\n", \
  17. __FILE__, __LINE__, &(e), pgd_val(e))
  18. /* Rules for using set_pte: the pte being assigned *must* be
  19. * either not present or in a state where the hardware will
  20. * not attempt to update the pte. In places where this is
  21. * not possible, use pte_get_and_clear to obtain the old pte
  22. * value and then use set_pte to update it. -ben
  23. */
  24. static inline void native_set_pte(pte_t *ptep, pte_t pte)
  25. {
  26. ptep->pte_high = pte.pte_high;
  27. smp_wmb();
  28. ptep->pte_low = pte.pte_low;
  29. }
  30. /*
  31. * Since this is only called on user PTEs, and the page fault handler
  32. * must handle the already racy situation of simultaneous page faults,
  33. * we are justified in merely clearing the PTE present bit, followed
  34. * by a set. The ordering here is important.
  35. */
  36. static inline void native_set_pte_present(struct mm_struct *mm,
  37. unsigned long addr,
  38. pte_t *ptep, pte_t pte)
  39. {
  40. ptep->pte_low = 0;
  41. smp_wmb();
  42. ptep->pte_high = pte.pte_high;
  43. smp_wmb();
  44. ptep->pte_low = pte.pte_low;
  45. }
  46. static inline void native_set_pte_atomic(pte_t *ptep, pte_t pte)
  47. {
  48. set_64bit((unsigned long long *)(ptep), native_pte_val(pte));
  49. }
  50. static inline void native_set_pmd(pmd_t *pmdp, pmd_t pmd)
  51. {
  52. set_64bit((unsigned long long *)(pmdp), native_pmd_val(pmd));
  53. }
  54. static inline void native_set_pud(pud_t *pudp, pud_t pud)
  55. {
  56. set_64bit((unsigned long long *)(pudp), native_pud_val(pud));
  57. }
  58. /*
  59. * For PTEs and PDEs, we must clear the P-bit first when clearing a page table
  60. * entry, so clear the bottom half first and enforce ordering with a compiler
  61. * barrier.
  62. */
  63. static inline void native_pte_clear(struct mm_struct *mm, unsigned long addr,
  64. pte_t *ptep)
  65. {
  66. ptep->pte_low = 0;
  67. smp_wmb();
  68. ptep->pte_high = 0;
  69. }
  70. static inline void native_pmd_clear(pmd_t *pmd)
  71. {
  72. u32 *tmp = (u32 *)pmd;
  73. *tmp = 0;
  74. smp_wmb();
  75. *(tmp + 1) = 0;
  76. }
  77. static inline void pud_clear(pud_t *pudp)
  78. {
  79. unsigned long pgd;
  80. set_pud(pudp, __pud(0));
  81. /*
  82. * According to Intel App note "TLBs, Paging-Structure Caches,
  83. * and Their Invalidation", April 2007, document 317080-001,
  84. * section 8.1: in PAE mode we explicitly have to flush the
  85. * TLB via cr3 if the top-level pgd is changed...
  86. *
  87. * Make sure the pud entry we're updating is within the
  88. * current pgd to avoid unnecessary TLB flushes.
  89. */
  90. pgd = read_cr3();
  91. if (__pa(pudp) >= pgd && __pa(pudp) <
  92. (pgd + sizeof(pgd_t)*PTRS_PER_PGD))
  93. write_cr3(pgd);
  94. }
  95. #ifdef CONFIG_SMP
  96. static inline pte_t native_ptep_get_and_clear(pte_t *ptep)
  97. {
  98. pte_t res;
  99. /* xchg acts as a barrier before the setting of the high bits */
  100. res.pte_low = xchg(&ptep->pte_low, 0);
  101. res.pte_high = ptep->pte_high;
  102. ptep->pte_high = 0;
  103. return res;
  104. }
  105. #else
  106. #define native_ptep_get_and_clear(xp) native_local_ptep_get_and_clear(xp)
  107. #endif
  108. /*
  109. * Bits 0, 6 and 7 are taken in the low part of the pte,
  110. * put the 32 bits of offset into the high part.
  111. */
  112. #define pte_to_pgoff(pte) ((pte).pte_high)
  113. #define pgoff_to_pte(off) \
  114. ((pte_t) { { .pte_low = _PAGE_FILE, .pte_high = (off) } })
  115. #define PTE_FILE_MAX_BITS 32
  116. /* Encode and de-code a swap entry */
  117. #define MAX_SWAPFILES_CHECK() BUILD_BUG_ON(MAX_SWAPFILES_SHIFT > 5)
  118. #define __swp_type(x) (((x).val) & 0x1f)
  119. #define __swp_offset(x) ((x).val >> 5)
  120. #define __swp_entry(type, offset) ((swp_entry_t){(type) | (offset) << 5})
  121. #define __pte_to_swp_entry(pte) ((swp_entry_t){ (pte).pte_high })
  122. #define __swp_entry_to_pte(x) ((pte_t){ { .pte_high = (x).val } })
  123. #endif /* _ASM_X86_PGTABLE_3LEVEL_H */