
/*
 * pageattr_32.c
 *
 * Copyright 2002 Andi Kleen, SuSE Labs.
 * Thanks to Ben LaHaise for precious feedback.
 */
#include <linux/highmem.h>
#include <linux/module.h>
#include <linux/sched.h>
#include <linux/slab.h>
#include <linux/mm.h>

#include <asm/processor.h>
#include <asm/tlbflush.h>
#include <asm/sections.h>
#include <asm/uaccess.h>
#include <asm/pgalloc.h>
/*
 * Look up the kernel page-table entry for a virtual address and report
 * the level of the mapping: 2 for a large (PSE) pmd, 3 for a 4K pte.
 * Returns NULL if no page table is present for the address.
 */
pte_t *lookup_address(unsigned long address, int *level)
{
	pgd_t *pgd = pgd_offset_k(address);
	pud_t *pud;
	pmd_t *pmd;

	if (pgd_none(*pgd))
		return NULL;
	pud = pud_offset(pgd, address);
	if (pud_none(*pud))
		return NULL;
	pmd = pmd_offset(pud, address);
	if (pmd_none(*pmd))
		return NULL;

	*level = 2;
	if (pmd_large(*pmd))
		return (pte_t *)pmd;

	*level = 3;
	return pte_offset_kernel(pmd, address);
}
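
/*
 * Illustrative sketch, not part of the original file: how a caller
 * interprets the level reported by lookup_address(). Level 2 means the
 * address is covered by a large (PSE) page and the returned pointer is
 * really the pmd entry; level 3 means a normal 4K pte. The helper name
 * is hypothetical.
 */
static int __maybe_unused example_uses_large_page(unsigned long address)
{
	int level;
	pte_t *pte = lookup_address(address, &level);

	return pte && level == 2;
}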
/*
 * Set a pmd-level entry. When the kernel pmd is not shared across pgds,
 * the update must be propagated to every pgd on the system's pgd list.
 */
static void set_pmd_pte(pte_t *kpte, unsigned long address, pte_t pte)
{
	unsigned long flags;
	struct page *page;

	/* change init_mm */
	set_pte_atomic(kpte, pte);
	if (SHARED_KERNEL_PMD)
		return;

	spin_lock_irqsave(&pgd_lock, flags);
	for (page = pgd_list; page; page = (struct page *)page->index) {
		pgd_t *pgd;
		pud_t *pud;
		pmd_t *pmd;

		pgd = (pgd_t *)page_address(page) + pgd_index(address);
		pud = pud_offset(pgd, address);
		pmd = pmd_offset(pud, address);
		set_pte_atomic((pte_t *)pmd, pte);
	}
	spin_unlock_irqrestore(&pgd_lock, flags);
}
static int
split_large_page(pte_t *kpte, unsigned long address, pgprot_t ref_prot)
{
	unsigned long addr, phys;
	int i, level;
	pte_t *pbase, *tmp;
	struct page *base;

	base = alloc_pages(GFP_KERNEL, 0);
	if (!base)
		return -ENOMEM;

	down_write(&init_mm.mmap_sem);
	/*
	 * Check for races, another CPU might have split this page
	 * up for us already:
	 */
	tmp = lookup_address(address, &level);
	if (tmp != kpte)
		goto out_unlock;

	/*
	 * Fill the new page table with 4K entries covering the same
	 * physical range as the large page:
	 */
	phys = __pa(address);
	addr = phys & LARGE_PAGE_MASK;
	pbase = (pte_t *)page_address(base);
	paravirt_alloc_pt(&init_mm, page_to_pfn(base));
	for (i = 0; i < PTRS_PER_PTE; i++, addr += PAGE_SIZE)
		set_pte(&pbase[i], pfn_pte(addr >> PAGE_SHIFT, ref_prot));

	/*
	 * Install the new, split up pagetable. Note that set_pmd_pte()
	 * needs the virtual address, not the physical one.
	 */
	set_pmd_pte(kpte, address, mk_pte(base, ref_prot));
	base = NULL;

out_unlock:
	up_write(&init_mm.mmap_sem);

	if (base)
		__free_pages(base, 0);
	return 0;
}
static int __change_page_attr(struct page *page, pgprot_t prot)
{
	pgprot_t ref_prot = PAGE_KERNEL;
	struct page *kpte_page;
	unsigned long address;
	int level, err = 0;
	pgprot_t oldprot;
	pte_t *kpte;

	BUG_ON(PageHighMem(page));
	address = (unsigned long)page_address(page);

repeat:
	kpte = lookup_address(address, &level);
	if (!kpte)
		return -EINVAL;

	oldprot = pte_pgprot(*kpte);
	kpte_page = virt_to_page(kpte);
	BUG_ON(PageLRU(kpte_page));
	BUG_ON(PageCompound(kpte_page));

	/*
	 * Better fail early if someone sets the kernel text to NX.
	 * Does not cover __inittext.
	 */
	BUG_ON(address >= (unsigned long)&_text &&
	       address < (unsigned long)&_etext &&
	       (pgprot_val(prot) & _PAGE_NX));

	/* Large pages that overlap kernel text must stay executable: */
	if ((address & LARGE_PAGE_MASK) < (unsigned long)&_etext)
		ref_prot = PAGE_KERNEL_EXEC;

	ref_prot = canon_pgprot(ref_prot);
	prot = canon_pgprot(prot);

	if (level == 3) {
		/* 4K pte: just rewrite it atomically. */
		set_pte_atomic(kpte, mk_pte(page, prot));
	} else {
		/* Large page: split it first, then retry the lookup. */
		err = split_large_page(kpte, address, ref_prot);
		if (!err)
			goto repeat;
	}
	return err;
}
/*
 * Change the page attributes of a page in the linear mapping.
 *
 * This should be used when a page is mapped with a different caching policy
 * than write-back somewhere - some CPUs do not like it when mappings with
 * different caching policies exist. This changes the page attributes of the
 * in-kernel linear mapping too.
 *
 * The caller needs to ensure that there are no conflicting mappings elsewhere.
 * This function only deals with the kernel linear map.
 *
 * Caller must call global_flush_tlb() after this.
 */
int change_page_attr(struct page *page, int numpages, pgprot_t prot)
{
	int err = 0, i;

	for (i = 0; i < numpages; i++, page++) {
		err = __change_page_attr(page, prot);
		if (err)
			break;
	}
	return err;
}
EXPORT_SYMBOL(change_page_attr);
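
/*
 * Illustrative sketch, not part of the original file: typical use of the
 * API as documented above. A driver that maps a page uncached elsewhere
 * brings the kernel linear mapping in line, then performs the TLB flush
 * that the contract requires. The helper name is hypothetical.
 */
static int __maybe_unused example_set_page_uncached(struct page *page)
{
	int err = change_page_attr(page, 1, PAGE_KERNEL_NOCACHE);

	if (err)
		return err;

	/* Mandatory after change_page_attr(), see the comment above. */
	global_flush_tlb();
	return 0;
}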
int change_page_attr_addr(unsigned long addr, int numpages, pgprot_t prot)
{
	/* addr is a linear-map virtual address; convert it to a page frame. */
	unsigned long pfn = __pa(addr) >> PAGE_SHIFT;
	int i;

	for (i = 0; i < numpages; i++) {
		if (!pfn_valid(pfn + i)) {
			break;
		} else {
			int level;
			pte_t *pte = lookup_address(addr + i*PAGE_SIZE, &level);
			/* Sanity check: the linear mapping must be present. */
			BUG_ON(!pte || pte_none(*pte));
		}
	}
	/* Only the leading, pfn_valid part of the range is changed. */
	return change_page_attr(virt_to_page(addr), i, prot);
}
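
/*
 * Illustrative sketch, not part of the original file: the address-based
 * variant takes a kernel linear-map virtual address, e.g. memory obtained
 * from __get_free_page(). The helper below write-protects one such page;
 * its name is hypothetical.
 */
static int __maybe_unused example_write_protect_page(unsigned long addr)
{
	int err = change_page_attr_addr(addr, 1, PAGE_KERNEL_RO);

	if (!err)
		global_flush_tlb();
	return err;
}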
static void flush_kernel_map(void *arg)
{
	/*
	 * Flush all to work around errata in early athlons regarding
	 * large page flushing.
	 */
	__flush_tlb_all();

	/* WBINVD exists on family 4 (486) and later. */
	if (boot_cpu_data.x86 >= 4)
		wbinvd();
}
void global_flush_tlb(void)
{
	BUG_ON(irqs_disabled());

	on_each_cpu(flush_kernel_map, NULL, 1, 1);
}
EXPORT_SYMBOL(global_flush_tlb);
#ifdef CONFIG_DEBUG_PAGEALLOC
void kernel_map_pages(struct page *page, int numpages, int enable)
{
	if (PageHighMem(page))
		return;
	if (!enable) {
		debug_check_no_locks_freed(page_address(page),
					   numpages * PAGE_SIZE);
	}

	/*
	 * The return value is ignored - the calls cannot fail,
	 * large pages are disabled at boot time.
	 */
	change_page_attr(page, numpages, enable ? PAGE_KERNEL : __pgprot(0));

	/*
	 * We should perform an IPI and flush all tlbs,
	 * but that can deadlock -> flush only the current cpu.
	 */
	__flush_tlb_all();
}
#endif