/*
 * pgtable_64.h - functions and defines for the x86-64 page table tree.
 */
  1. #ifndef _X86_64_PGTABLE_H
  2. #define _X86_64_PGTABLE_H
  3. #include <linux/const.h>
  4. #ifndef __ASSEMBLY__
  5. /*
  6. * This file contains the functions and defines necessary to modify and use
  7. * the x86-64 page table tree.
  8. */
  9. #include <asm/processor.h>
  10. #include <asm/bitops.h>
  11. #include <linux/threads.h>
  12. #include <asm/pda.h>
  13. extern pud_t level3_kernel_pgt[512];
  14. extern pud_t level3_ident_pgt[512];
  15. extern pmd_t level2_kernel_pgt[512];
  16. extern pgd_t init_level4_pgt[];
  17. extern unsigned long __supported_pte_mask;
  18. #define swapper_pg_dir init_level4_pgt
  19. extern void paging_init(void);
  20. extern void clear_kernel_mapping(unsigned long addr, unsigned long size);
  21. /*
  22. * ZERO_PAGE is a global shared page that is always zero: used
  23. * for zero-mapped memory areas etc..
  24. */
  25. extern unsigned long empty_zero_page[PAGE_SIZE/sizeof(unsigned long)];
  26. #define ZERO_PAGE(vaddr) (virt_to_page(empty_zero_page))
  27. #endif /* !__ASSEMBLY__ */
  /*
   * Geometry of the page table tree.  Each *_SHIFT is the log2 of the
   * number of bytes one entry at that level maps; each PTRS_PER_* is the
   * number of entries in one table of that level.
   */

  /* Top level: one PGD entry maps 2^39 bytes. */
  #define PGDIR_SHIFT     39
  #define PTRS_PER_PGD    512

  /* 3rd level: one PUD entry maps 2^30 bytes. */
  #define PUD_SHIFT       30
  #define PTRS_PER_PUD    512

  /* Middle level: one PMD entry maps 2^21 bytes. */
  #define PMD_SHIFT       21
  #define PTRS_PER_PMD    512

  /* Lowest level: number of PTEs in one page table. */
  #define PTRS_PER_PTE    512
  48. #ifndef __ASSEMBLY__
  /*
   * Report a bad entry at each page-table level.  The message carries the
   * reporting file and line, the address of the entry expression @e and its
   * raw value.  @e must be an lvalue because its address is taken.
   *
   * The messages are logged at KERN_ERR so they do not silently inherit the
   * default console log level.
   */
  #define pte_ERROR(e) \
      printk(KERN_ERR "%s:%d: bad pte %p(%016lx).\n", \
             __FILE__, __LINE__, &(e), pte_val(e))
  #define pmd_ERROR(e) \
      printk(KERN_ERR "%s:%d: bad pmd %p(%016lx).\n", \
             __FILE__, __LINE__, &(e), pmd_val(e))
  #define pud_ERROR(e) \
      printk(KERN_ERR "%s:%d: bad pud %p(%016lx).\n", \
             __FILE__, __LINE__, &(e), pud_val(e))
  #define pgd_ERROR(e) \
      printk(KERN_ERR "%s:%d: bad pgd %p(%016lx).\n", \
             __FILE__, __LINE__, &(e), pgd_val(e))
  /* An upper-level entry counts as "none" when its raw value is zero. */
  #define pgd_none(x)     (pgd_val(x) == 0)
  #define pud_none(x)     (pud_val(x) == 0)
  59. static inline void set_pte(pte_t *dst, pte_t val)
  60. {
  61. pte_val(*dst) = pte_val(val);
  62. }
  63. #define set_pte_at(mm,addr,ptep,pteval) set_pte(ptep,pteval)
  64. static inline void set_pmd(pmd_t *dst, pmd_t val)
  65. {
  66. pmd_val(*dst) = pmd_val(val);
  67. }
  68. static inline void set_pud(pud_t *dst, pud_t val)
  69. {
  70. pud_val(*dst) = pud_val(val);
  71. }
  72. static inline void pud_clear (pud_t *pud)
  73. {
  74. set_pud(pud, __pud(0));
  75. }
  76. static inline void set_pgd(pgd_t *dst, pgd_t val)
  77. {
  78. pgd_val(*dst) = pgd_val(val);
  79. }
  80. static inline void pgd_clear (pgd_t * pgd)
  81. {
  82. set_pgd(pgd, __pgd(0));
  83. }
  /*
   * Exchange the stored PTE value with 0 through xchg() and hand back the
   * previous value wrapped as a pte_t.  The mm and addr arguments are unused.
   */
  #define ptep_get_and_clear(mm, addr, xp)    __pte(xchg(&(xp)->pte, 0))
  85. struct mm_struct;
  86. static inline pte_t ptep_get_and_clear_full(struct mm_struct *mm, unsigned long addr, pte_t *ptep, int full)
  87. {
  88. pte_t pte;
  89. if (full) {
  90. pte = *ptep;
  91. *ptep = __pte(0);
  92. } else {
  93. pte = ptep_get_and_clear(mm, addr, ptep);
  94. }
  95. return pte;
  96. }
  /* Two PTEs are the same when their raw values compare equal. */
  #define pte_same(a, b)      ((a).pte == (b).pte)

  /* Protection part of a PTE: everything outside PHYSICAL_PAGE_MASK. */
  #define pte_pgprot(a)       (__pgprot((a).pte & ~PHYSICAL_PAGE_MASK))
  99. #endif /* !__ASSEMBLY__ */
  /*
   * Bytes mapped by one entry at each level, and the mask that rounds an
   * address down to that boundary.  _AC() keeps the constants usable from
   * both C and assembly.
   */
  #define PMD_SIZE            (_AC(1,UL) << PMD_SHIFT)
  #define PMD_MASK            (~(PMD_SIZE-1))
  #define PUD_SIZE            (_AC(1,UL) << PUD_SHIFT)
  #define PUD_MASK            (~(PUD_SIZE-1))
  #define PGDIR_SIZE          (_AC(1,UL) << PGDIR_SHIFT)
  #define PGDIR_MASK          (~(PGDIR_SIZE-1))

  /* Number of PGD slots needed to cover addresses below TASK_SIZE. */
  #define USER_PTRS_PER_PGD   ((TASK_SIZE-1)/PGDIR_SIZE+1)
  #define FIRST_USER_ADDRESS  0

  /* Address-space layout constants. */
  #define MAXMEM              _AC(0x3fffffffffff, UL)
  #define VMALLOC_START       _AC(0xffffc20000000000, UL)
  #define VMALLOC_END         _AC(0xffffe1ffffffffff, UL)
  #define MODULES_VADDR       _AC(0xffffffff88000000, UL)
  #define MODULES_END         _AC(0xfffffffffff00000, UL)
  #define MODULES_LEN         (MODULES_END - MODULES_VADDR)
  /* Bit positions of the flags inside a page-table entry. */
  #define _PAGE_BIT_PRESENT   0
  #define _PAGE_BIT_RW        1
  #define _PAGE_BIT_USER      2
  #define _PAGE_BIT_PWT       3
  #define _PAGE_BIT_PCD       4
  #define _PAGE_BIT_ACCESSED  5
  #define _PAGE_BIT_DIRTY     6
  #define _PAGE_BIT_PSE       7   /* 4 MB (or 2MB) page */
  #define _PAGE_BIT_GLOBAL    8   /* Global TLB entry PPro+ */
  #define _PAGE_BIT_NX        63  /* No execute: only valid after cpuid check */
  /* Flag masks for a page-table entry. */
  #define _PAGE_PRESENT   0x001
  #define _PAGE_RW        0x002
  #define _PAGE_USER      0x004
  #define _PAGE_PWT       0x008
  #define _PAGE_PCD       0x010
  #define _PAGE_ACCESSED  0x020
  #define _PAGE_DIRTY     0x040
  #define _PAGE_PSE       0x080   /* 2MB page */
  #define _PAGE_GLOBAL    0x100   /* Global TLB entry */
  #define _PAGE_NX        (_AC(1,UL)<<_PAGE_BIT_NX)

  /*
   * Two masks reuse the numeric value of another flag: _PAGE_FILE has the
   * same value as _PAGE_DIRTY and _PAGE_PROTNONE the same value as _PAGE_PSE.
   */
  #define _PAGE_FILE      0x040   /* nonlinear file mapping, saved PTE; unset:swap */
  #define _PAGE_PROTNONE  0x080   /* If not present */

  /* Flag sets for entries that point at a lower-level table. */
  #define _KERNPG_TABLE   (_PAGE_PRESENT | _PAGE_RW | _PAGE_ACCESSED | _PAGE_DIRTY)
  #define _PAGE_TABLE     (_PAGE_PRESENT | _PAGE_RW | _PAGE_USER | _PAGE_ACCESSED | _PAGE_DIRTY)

  /* Bits pte_modify() carries over from the old entry. */
  #define _PAGE_CHG_MASK  (PTE_MASK | _PAGE_ACCESSED | _PAGE_DIRTY)
  /*
   * Protection values for user mappings.  The plain variants carry
   * _PAGE_NX; the *_EXEC variants are the same flag set without it.
   */
  #define PAGE_NONE \
      __pgprot(_PAGE_PROTNONE | _PAGE_ACCESSED)
  #define PAGE_SHARED \
      __pgprot(_PAGE_PRESENT | _PAGE_RW | _PAGE_USER | _PAGE_ACCESSED | _PAGE_NX)
  #define PAGE_SHARED_EXEC \
      __pgprot(_PAGE_PRESENT | _PAGE_RW | _PAGE_USER | _PAGE_ACCESSED)
  #define PAGE_COPY_NOEXEC \
      __pgprot(_PAGE_PRESENT | _PAGE_USER | _PAGE_ACCESSED | _PAGE_NX)
  #define PAGE_COPY PAGE_COPY_NOEXEC
  #define PAGE_COPY_EXEC \
      __pgprot(_PAGE_PRESENT | _PAGE_USER | _PAGE_ACCESSED)
  #define PAGE_READONLY \
      __pgprot(_PAGE_PRESENT | _PAGE_USER | _PAGE_ACCESSED | _PAGE_NX)
  #define PAGE_READONLY_EXEC \
      __pgprot(_PAGE_PRESENT | _PAGE_USER | _PAGE_ACCESSED)
  /*
   * Raw flag sets for kernel mappings (not yet wrapped in __pgprot() and
   * without _PAGE_GLOBAL; see MAKE_GLOBAL()).
   */
  #define __PAGE_KERNEL       (_PAGE_PRESENT | _PAGE_RW | _PAGE_DIRTY | _PAGE_ACCESSED | _PAGE_NX)
  #define __PAGE_KERNEL_EXEC  (_PAGE_PRESENT | _PAGE_RW | _PAGE_DIRTY | _PAGE_ACCESSED)
  #define __PAGE_KERNEL_NOCACHE \
      (_PAGE_PRESENT | _PAGE_RW | _PAGE_DIRTY | _PAGE_PCD | _PAGE_ACCESSED | _PAGE_NX)
  #define __PAGE_KERNEL_RO    (_PAGE_PRESENT | _PAGE_DIRTY | _PAGE_ACCESSED | _PAGE_NX)

  /* vsyscall flag sets: present, user-accessible, no _PAGE_RW and no _PAGE_NX. */
  #define __PAGE_KERNEL_VSYSCALL          (_PAGE_PRESENT | _PAGE_USER | _PAGE_ACCESSED)
  #define __PAGE_KERNEL_VSYSCALL_NOCACHE  (_PAGE_PRESENT | _PAGE_USER | _PAGE_ACCESSED | _PAGE_PCD)

  /* Large-page flavours add _PAGE_PSE to the base set. */
  #define __PAGE_KERNEL_LARGE         (__PAGE_KERNEL | _PAGE_PSE)
  #define __PAGE_KERNEL_LARGE_EXEC    (__PAGE_KERNEL_EXEC | _PAGE_PSE)
  /* Wrap a raw flag set in a pgprot_t and add _PAGE_GLOBAL. */
  #define MAKE_GLOBAL(x)      __pgprot((x) | _PAGE_GLOBAL)

  /* Kernel protections; all are global except PAGE_KERNEL_VSYSCALL32. */
  #define PAGE_KERNEL                     MAKE_GLOBAL(__PAGE_KERNEL)
  #define PAGE_KERNEL_EXEC                MAKE_GLOBAL(__PAGE_KERNEL_EXEC)
  #define PAGE_KERNEL_RO                  MAKE_GLOBAL(__PAGE_KERNEL_RO)
  #define PAGE_KERNEL_NOCACHE             MAKE_GLOBAL(__PAGE_KERNEL_NOCACHE)
  #define PAGE_KERNEL_VSYSCALL32          __pgprot(__PAGE_KERNEL_VSYSCALL)
  #define PAGE_KERNEL_VSYSCALL            MAKE_GLOBAL(__PAGE_KERNEL_VSYSCALL)
  #define PAGE_KERNEL_LARGE               MAKE_GLOBAL(__PAGE_KERNEL_LARGE)
  #define PAGE_KERNEL_VSYSCALL_NOCACHE    MAKE_GLOBAL(__PAGE_KERNEL_VSYSCALL_NOCACHE)
  /*
   * Protection tables.  The three digits in each name are the x, w and r
   * permission bits, in that order.  The __P and __S rows differ only where
   * w is set: __P rows use PAGE_COPY*, __S rows use PAGE_SHARED*
   * (presumably private vs. shared mappings; confirm against the users).
   */
  /*               xwr */
  #define __P000  PAGE_NONE
  #define __P001  PAGE_READONLY
  #define __P010  PAGE_COPY
  #define __P011  PAGE_COPY
  #define __P100  PAGE_READONLY_EXEC
  #define __P101  PAGE_READONLY_EXEC
  #define __P110  PAGE_COPY_EXEC
  #define __P111  PAGE_COPY_EXEC

  #define __S000  PAGE_NONE
  #define __S001  PAGE_READONLY
  #define __S010  PAGE_SHARED
  #define __S011  PAGE_SHARED
  #define __S100  PAGE_READONLY_EXEC
  #define __S101  PAGE_READONLY_EXEC
  #define __S110  PAGE_SHARED_EXEC
  #define __S111  PAGE_SHARED_EXEC
  189. #ifndef __ASSEMBLY__
  190. static inline unsigned long pgd_bad(pgd_t pgd)
  191. {
  192. return pgd_val(pgd) & ~(PTE_MASK | _KERNPG_TABLE | _PAGE_USER);
  193. }
  194. static inline unsigned long pud_bad(pud_t pud)
  195. {
  196. return pud_val(pud) & ~(PTE_MASK | _KERNPG_TABLE | _PAGE_USER);
  197. }
  198. static inline unsigned long pmd_bad(pmd_t pmd)
  199. {
  200. return pmd_val(pmd) & ~(PTE_MASK | _KERNPG_TABLE | _PAGE_USER);
  201. }
  /* A PTE is "none" when its raw value is zero. */
  #define pte_none(x)     (!pte_val(x))

  /* Present means either _PAGE_PRESENT or _PAGE_PROTNONE is set. */
  #define pte_present(x)  (pte_val(x) & (_PAGE_PRESENT | _PAGE_PROTNONE))

  /* Store an all-zero entry through set_pte_at(). */
  #define pte_clear(mm,addr,xp)   do { set_pte_at(mm, addr, xp, __pte(0)); } while (0)

  /*
   * Page count to megabytes, rounding down: x pages are x << PAGE_SHIFT
   * bytes and a megabyte is 1 << 20 bytes, so the net shift is
   * 20 - PAGE_SHIFT to the right.
   */
  #define pages_to_mb(x)  ((x) >> (20-PAGE_SHIFT))

  /* Page frame number held in a PTE, and the struct page for that frame. */
  #define pte_page(x)     pfn_to_page(pte_pfn(x))
  #define pte_pfn(x)      ((pte_val(x) & __PHYSICAL_MASK) >> PAGE_SHIFT)
  209. static inline pte_t pfn_pte(unsigned long page_nr, pgprot_t pgprot)
  210. {
  211. pte_t pte;
  212. pte_val(pte) = (page_nr << PAGE_SHIFT);
  213. pte_val(pte) |= pgprot_val(pgprot);
  214. pte_val(pte) &= __supported_pte_mask;
  215. return pte;
  216. }
  217. /*
  218. * The following only work if pte_present() is true.
  219. * Undefined behaviour if not..
  220. */
  221. #define __LARGE_PTE (_PAGE_PSE|_PAGE_PRESENT)
  222. static inline int pte_dirty(pte_t pte) { return pte_val(pte) & _PAGE_DIRTY; }
  223. static inline int pte_young(pte_t pte) { return pte_val(pte) & _PAGE_ACCESSED; }
  224. static inline int pte_write(pte_t pte) { return pte_val(pte) & _PAGE_RW; }
  225. static inline int pte_file(pte_t pte) { return pte_val(pte) & _PAGE_FILE; }
  226. static inline int pte_huge(pte_t pte) { return pte_val(pte) & _PAGE_PSE; }
  227. static inline pte_t pte_mkclean(pte_t pte) { set_pte(&pte, __pte(pte_val(pte) & ~_PAGE_DIRTY)); return pte; }
  228. static inline pte_t pte_mkold(pte_t pte) { set_pte(&pte, __pte(pte_val(pte) & ~_PAGE_ACCESSED)); return pte; }
  229. static inline pte_t pte_wrprotect(pte_t pte) { set_pte(&pte, __pte(pte_val(pte) & ~_PAGE_RW)); return pte; }
  230. static inline pte_t pte_mkexec(pte_t pte) { set_pte(&pte, __pte(pte_val(pte) & ~_PAGE_NX)); return pte; }
  231. static inline pte_t pte_mkdirty(pte_t pte) { set_pte(&pte, __pte(pte_val(pte) | _PAGE_DIRTY)); return pte; }
  232. static inline pte_t pte_mkyoung(pte_t pte) { set_pte(&pte, __pte(pte_val(pte) | _PAGE_ACCESSED)); return pte; }
  233. static inline pte_t pte_mkwrite(pte_t pte) { set_pte(&pte, __pte(pte_val(pte) | _PAGE_RW)); return pte; }
  234. static inline pte_t pte_mkhuge(pte_t pte) { set_pte(&pte, __pte(pte_val(pte) | _PAGE_PSE)); return pte; }
  235. static inline pte_t pte_clrhuge(pte_t pte) { set_pte(&pte, __pte(pte_val(pte) & ~_PAGE_PSE)); return pte; }
  236. struct vm_area_struct;
  237. static inline int ptep_test_and_clear_young(struct vm_area_struct *vma, unsigned long addr, pte_t *ptep)
  238. {
  239. if (!pte_young(*ptep))
  240. return 0;
  241. return test_and_clear_bit(_PAGE_BIT_ACCESSED, &ptep->pte);
  242. }
  243. static inline void ptep_set_wrprotect(struct mm_struct *mm, unsigned long addr, pte_t *ptep)
  244. {
  245. clear_bit(_PAGE_BIT_RW, &ptep->pte);
  246. }
  /*
   * Mark a page protection value as "uncacheable" by adding both
   * _PAGE_PCD and _PAGE_PWT to it.
   */
  #define pgprot_noncached(prot) \
      (__pgprot(pgprot_val(prot) | _PAGE_PCD | _PAGE_PWT))
  251. static inline int pmd_large(pmd_t pte) {
  252. return (pmd_val(pte) & __LARGE_PTE) == __LARGE_PTE;
  253. }
  254. /*
  255. * Conversion functions: convert a page and protection to a page entry,
  256. * and a page entry and page directory to the page they refer to.
  257. */
  /*
   * Level 4 access.
   *
   * pgd_page_vaddr() - __va() of the entry's value masked with PTE_MASK
   * pgd_page()       - struct page for the frame the entry refers to
   * pgd_index()      - slot number of an address within a PGD
   * pgd_offset()     - pointer to the slot for addr in mm's PGD
   * pgd_offset_k()   - same, but in init_level4_pgt
   * pgd_present()    - the _PAGE_PRESENT bit of the entry
   * mk_kernel_pgd()  - pgd_t made of an address plus _KERNPG_TABLE
   *
   * pgd_page() masks the entry with __PHYSICAL_MASK before shifting, the
   * same way pte_pfn() and pmd_pfn() do, so that flag bits above the
   * address field (such as _PAGE_NX in bit 63) cannot leak into the frame
   * number.
   */
  #define pgd_page_vaddr(pgd) ((unsigned long) __va((unsigned long)pgd_val(pgd) & PTE_MASK))
  #define pgd_page(pgd)       (pfn_to_page((pgd_val(pgd) & __PHYSICAL_MASK) >> PAGE_SHIFT))
  #define pgd_index(address)  (((address) >> PGDIR_SHIFT) & (PTRS_PER_PGD-1))
  #define pgd_offset(mm, addr)    ((mm)->pgd + pgd_index(addr))
  #define pgd_offset_k(address)   (init_level4_pgt + pgd_index(address))
  #define pgd_present(pgd)    (pgd_val(pgd) & _PAGE_PRESENT)
  #define mk_kernel_pgd(address)  ((pgd_t){ (address) | _KERNPG_TABLE })
  /*
   * PUD - Level3 access
   *
   * pud_page_vaddr() - __va() of the entry's value masked with
   *                    PHYSICAL_PAGE_MASK
   * pud_page()       - struct page for the frame the entry refers to
   * pud_index()      - slot number of an address within a PUD table
   * pud_offset()     - pointer to the PUD slot for address below *pgd
   * pud_present()    - the _PAGE_PRESENT bit of the entry
   *
   * pud_page() masks the entry with __PHYSICAL_MASK before shifting, the
   * same way pte_pfn() and pmd_pfn() do, so that flag bits above the
   * address field (such as _PAGE_NX in bit 63) cannot leak into the frame
   * number.
   */
  #define pud_page_vaddr(pud) ((unsigned long) __va(pud_val(pud) & PHYSICAL_PAGE_MASK))
  #define pud_page(pud)       (pfn_to_page((pud_val(pud) & __PHYSICAL_MASK) >> PAGE_SHIFT))
  #define pud_index(address)  (((address) >> PUD_SHIFT) & (PTRS_PER_PUD-1))
  #define pud_offset(pgd, address)    ((pud_t *) pgd_page_vaddr(*(pgd)) + pud_index(address))
  #define pud_present(pud)    (pud_val(pud) & _PAGE_PRESENT)
  /*
   * PMD - Level 2 access
   *
   * pmd_page_vaddr() - __va() of the entry's value masked with PTE_MASK
   * pmd_page()       - struct page for the frame the entry refers to
   * pmd_index()      - slot number of an address within a PMD table
   * pmd_offset()     - pointer to the PMD slot for address below *dir
   * pmd_none()       - raw value is zero
   * pmd_present()    - the _PAGE_PRESENT bit of the entry
   * pmd_clear()      - store an all-zero entry
   * pfn_pmd()        - build an entry from a frame number and protection
   * pmd_pfn()        - frame number held in the entry
   *
   * pmd_page() goes through pmd_pfn() so both agree on the frame number:
   * the entry is masked with __PHYSICAL_MASK before the shift, which keeps
   * flag bits above the address field (such as _PAGE_NX in bit 63, which
   * __PAGE_KERNEL_LARGE carries) out of the result.
   */
  #define pmd_page_vaddr(pmd) ((unsigned long) __va(pmd_val(pmd) & PTE_MASK))
  #define pmd_page(pmd)       (pfn_to_page(pmd_pfn(pmd)))
  #define pmd_index(address)  (((address) >> PMD_SHIFT) & (PTRS_PER_PMD-1))
  #define pmd_offset(dir, address) ((pmd_t *) pud_page_vaddr(*(dir)) + \
                                    pmd_index(address))
  #define pmd_none(x)         (!pmd_val(x))
  #define pmd_present(x)      (pmd_val(x) & _PAGE_PRESENT)
  #define pmd_clear(xp)       do { set_pmd(xp, __pmd(0)); } while (0)
  #define pfn_pmd(nr,prot)    (__pmd(((nr) << PAGE_SHIFT) | pgprot_val(prot)))
  #define pmd_pfn(x)          ((pmd_val(x) & __PHYSICAL_MASK) >> PAGE_SHIFT)
  /*
   * Nonlinear file PTEs: the file offset is stored shifted left by
   * PAGE_SHIFT with _PAGE_FILE set; decoding masks the value with
   * PHYSICAL_PAGE_MASK and shifts it back down.
   */
  #define pte_to_pgoff(pte)   ((pte_val(pte) & PHYSICAL_PAGE_MASK) >> PAGE_SHIFT)
  #define pgoff_to_pte(off)   ((pte_t) { ((off) << PAGE_SHIFT) | _PAGE_FILE })
  #define PTE_FILE_MAX_BITS   __PHYSICAL_MASK_SHIFT
  /* PTE - Level 1 access. */

  /* page, protection -> pte: convert the page to its pfn, then pfn_pte(). */
  #define mk_pte(page, pgprot)    pfn_pte(page_to_pfn(page), (pgprot))

  /* Set _PAGE_PRESENT and _PAGE_PSE in place; entry must be an lvalue. */
  #define mk_pte_huge(entry)      (pte_val(entry) |= _PAGE_PRESENT | _PAGE_PSE)
  293. /* Change flags of a PTE */
  294. static inline pte_t pte_modify(pte_t pte, pgprot_t newprot)
  295. {
  296. pte_val(pte) &= _PAGE_CHG_MASK;
  297. pte_val(pte) |= pgprot_val(newprot);
  298. pte_val(pte) &= __supported_pte_mask;
  299. return pte;
  300. }
  /* Slot number of an address within a page table. */
  #define pte_index(address)  (((address) >> PAGE_SHIFT) & (PTRS_PER_PTE - 1))

  /* Pointer to the PTE slot for address in the table that *dir points to. */
  #define pte_offset_kernel(dir, address) \
      ((pte_t *) pmd_page_vaddr(*(dir)) + pte_index(address))

  /*
   * x86-64 always has all page tables mapped, so the map variants are
   * plain lookups and the unmap variants expand to nothing.
   */
  #define pte_offset_map(dir,address)         pte_offset_kernel(dir,address)
  #define pte_offset_map_nested(dir,address)  pte_offset_kernel(dir,address)
  #define pte_unmap(pte)          /* NOP */
  #define pte_unmap_nested(pte)   /* NOP */

  /* Nothing to do here after a PTE update. */
  #define update_mmu_cache(vma,address,pte)   do { } while (0)
  /*
   * We only update the dirty/accessed state if we set
   * the dirty bit by hand in the kernel, since the hardware
   * will do the accessed bit for us, and we don't want to
   * race with other CPU's that might be updating the dirty
   * bit at the same time.
   *
   * Evaluates to non-zero when *__ptep differs from __entry.  The entry is
   * written and the TLB entry for __address flushed only when it differs
   * AND __dirty is non-zero.
   *
   * __ptep and __entry are captured once in locals so that arguments with
   * side effects are evaluated a single time, and __dirty is parenthesised
   * so that an argument such as "a ? b : c" cannot re-associate with the
   * "&&".  As before, __dirty is evaluated only when the entry changed, and
   * __vma / __address only when the entry is actually written.
   */
  #define __HAVE_ARCH_PTEP_SET_ACCESS_FLAGS
  #define ptep_set_access_flags(__vma, __address, __ptep, __entry, __dirty) \
  ({ \
      pte_t *__psaf_ptep = (__ptep); \
      pte_t __psaf_entry = (__entry); \
      int __psaf_changed = !pte_same(*__psaf_ptep, __psaf_entry); \
      if (__psaf_changed && (__dirty)) { \
          set_pte(__psaf_ptep, __psaf_entry); \
          flush_tlb_page((__vma), (__address)); \
      } \
      __psaf_changed; \
  })
  /*
   * Encode and de-code a swap entry.
   *
   * Layout of the value: the type sits in bits 1-6 and the offset starts
   * at bit 8.  Bits 0 and 7 are never written by the encoder; those are
   * the positions of _PAGE_PRESENT and _PAGE_PROTNONE, the two bits
   * pte_present() tests.
   *
   * NOTE(review): the topmost type bit lands on bit 6, which is also
   * _PAGE_FILE (0x040).  A type of 32 or more would therefore set
   * _PAGE_FILE; confirm that callers never use such types.
   */
  #define __swp_type(x)               (((x).val & 0x7e) >> 1)
  #define __swp_offset(x)             ((x).val >> 8)
  #define __swp_entry(type, offset)   ((swp_entry_t) { ((type) << 1) | ((offset) << 8) })

  /* A swap entry and a PTE share the same raw value. */
  #define __pte_to_swp_entry(pte)     ((swp_entry_t) { pte_val(pte) })
  #define __swp_entry_to_pte(x)       ((pte_t) { (x).val })
  332. extern spinlock_t pgd_lock;
  333. extern struct list_head pgd_list;
  334. extern int kern_addr_valid(unsigned long addr);
  335. pte_t *lookup_address(unsigned long addr);
  336. #define io_remap_pfn_range(vma, vaddr, pfn, size, prot) \
  337. remap_pfn_range(vma, vaddr, pfn, size, prot)
  338. #define HAVE_ARCH_UNMAPPED_AREA
  339. #define pgtable_cache_init() do { } while (0)
  340. #define check_pgt_cache() do { } while (0)
  341. #define PAGE_AGP PAGE_KERNEL_NOCACHE
  342. #define HAVE_PAGE_AGP 1
  /*
   * fs/proc/kcore.c
   *
   * kc_vaddr_to_offset() keeps only the bits inside __VIRTUAL_MASK.
   * kc_offset_to_vaddr() undoes that: when the highest bit inside the mask
   * (bit __VIRTUAL_MASK_SHIFT - 1) is set, every bit above the mask is set
   * as well; otherwise the offset is returned unchanged.
   */
  #define kc_vaddr_to_offset(v)   ((v) & __VIRTUAL_MASK)
  #define kc_offset_to_vaddr(o) \
      (((o) & (1UL << (__VIRTUAL_MASK_SHIFT-1))) \
          ? ((o) | (~__VIRTUAL_MASK)) \
          : (o))
  /*
   * Markers for the helpers this header provides itself; presumably
   * consumed by <asm-generic/pgtable.h>, which is included right after
   * them, so they must stay ahead of that include.
   */
  #define __HAVE_ARCH_PTEP_TEST_AND_CLEAR_YOUNG
  #define __HAVE_ARCH_PTEP_GET_AND_CLEAR
  #define __HAVE_ARCH_PTEP_GET_AND_CLEAR_FULL
  #define __HAVE_ARCH_PTEP_SET_WRPROTECT
  #define __HAVE_ARCH_PTE_SAME
  352. #include <asm-generic/pgtable.h>
  353. #endif /* !__ASSEMBLY__ */
  354. #endif /* _X86_64_PGTABLE_H */