hugetlbpage.c 4.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208
  1. /*
  2. * IA-64 Huge TLB Page Support for Kernel.
  3. *
  4. * Copyright (C) 2002-2004 Rohit Seth <rohit.seth@intel.com>
  5. * Copyright (C) 2003-2004 Ken Chen <kenneth.w.chen@intel.com>
  6. *
  7. * Sep, 2003: add numa support
  8. * Feb, 2004: dynamic hugetlb page size via boot parameter
  9. */
  10. #include <linux/init.h>
  11. #include <linux/fs.h>
  12. #include <linux/mm.h>
  13. #include <linux/hugetlb.h>
  14. #include <linux/pagemap.h>
  15. #include <linux/module.h>
  16. #include <linux/slab.h>
  17. #include <linux/sysctl.h>
  18. #include <linux/log2.h>
  19. #include <asm/mman.h>
  20. #include <asm/pgalloc.h>
  21. #include <asm/tlb.h>
  22. #include <asm/tlbflush.h>
  23. unsigned int hpage_shift = HPAGE_SHIFT_DEFAULT;
  24. EXPORT_SYMBOL(hpage_shift);
  25. pte_t *
  26. huge_pte_alloc(struct mm_struct *mm, unsigned long addr, unsigned long sz)
  27. {
  28. unsigned long taddr = htlbpage_to_page(addr);
  29. pgd_t *pgd;
  30. pud_t *pud;
  31. pmd_t *pmd;
  32. pte_t *pte = NULL;
  33. pgd = pgd_offset(mm, taddr);
  34. pud = pud_alloc(mm, pgd, taddr);
  35. if (pud) {
  36. pmd = pmd_alloc(mm, pud, taddr);
  37. if (pmd)
  38. pte = pte_alloc_map(mm, pmd, taddr);
  39. }
  40. return pte;
  41. }
  42. pte_t *
  43. huge_pte_offset (struct mm_struct *mm, unsigned long addr)
  44. {
  45. unsigned long taddr = htlbpage_to_page(addr);
  46. pgd_t *pgd;
  47. pud_t *pud;
  48. pmd_t *pmd;
  49. pte_t *pte = NULL;
  50. pgd = pgd_offset(mm, taddr);
  51. if (pgd_present(*pgd)) {
  52. pud = pud_offset(pgd, taddr);
  53. if (pud_present(*pud)) {
  54. pmd = pmd_offset(pud, taddr);
  55. if (pmd_present(*pmd))
  56. pte = pte_offset_map(pmd, taddr);
  57. }
  58. }
  59. return pte;
  60. }
  61. int huge_pmd_unshare(struct mm_struct *mm, unsigned long *addr, pte_t *ptep)
  62. {
  63. return 0;
  64. }
  /*
   * mk_pte_huge - OR _PAGE_P into the pte value of @entry, in place.
   *
   * Wrapped in do { } while (0) so that "mk_pte_huge(e);" is exactly one
   * statement and can be used as the body of an unbraced if/else.
   */
  #define mk_pte_huge(entry) do { pte_val(entry) |= _PAGE_P; } while (0)
  66. /*
  67. * Don't actually need to do any preparation, but need to make sure
  68. * the address is in the right region.
  69. */
  70. int prepare_hugepage_range(struct file *file,
  71. unsigned long addr, unsigned long len)
  72. {
  73. if (len & ~HPAGE_MASK)
  74. return -EINVAL;
  75. if (addr & ~HPAGE_MASK)
  76. return -EINVAL;
  77. if (REGION_NUMBER(addr) != RGN_HPAGE)
  78. return -EINVAL;
  79. return 0;
  80. }
  81. struct page *follow_huge_addr(struct mm_struct *mm, unsigned long addr, int write)
  82. {
  83. struct page *page;
  84. pte_t *ptep;
  85. if (REGION_NUMBER(addr) != RGN_HPAGE)
  86. return ERR_PTR(-EINVAL);
  87. ptep = huge_pte_offset(mm, addr);
  88. if (!ptep || pte_none(*ptep))
  89. return NULL;
  90. page = pte_page(*ptep);
  91. page += ((addr & ~HPAGE_MASK) >> PAGE_SHIFT);
  92. return page;
  93. }
  94. int pmd_huge(pmd_t pmd)
  95. {
  96. return 0;
  97. }
  98. int pud_huge(pud_t pud)
  99. {
  100. return 0;
  101. }
  102. struct page *
  103. follow_huge_pmd(struct mm_struct *mm, unsigned long address, pmd_t *pmd, int write)
  104. {
  105. return NULL;
  106. }
  107. void hugetlb_free_pgd_range(struct mmu_gather *tlb,
  108. unsigned long addr, unsigned long end,
  109. unsigned long floor, unsigned long ceiling)
  110. {
  111. /*
  112. * This is called to free hugetlb page tables.
  113. *
  114. * The offset of these addresses from the base of the hugetlb
  115. * region must be scaled down by HPAGE_SIZE/PAGE_SIZE so that
  116. * the standard free_pgd_range will free the right page tables.
  117. *
  118. * If floor and ceiling are also in the hugetlb region, they
  119. * must likewise be scaled down; but if outside, left unchanged.
  120. */
  121. addr = htlbpage_to_page(addr);
  122. end = htlbpage_to_page(end);
  123. if (REGION_NUMBER(floor) == RGN_HPAGE)
  124. floor = htlbpage_to_page(floor);
  125. if (REGION_NUMBER(ceiling) == RGN_HPAGE)
  126. ceiling = htlbpage_to_page(ceiling);
  127. free_pgd_range(tlb, addr, end, floor, ceiling);
  128. }
  129. unsigned long hugetlb_get_unmapped_area(struct file *file, unsigned long addr, unsigned long len,
  130. unsigned long pgoff, unsigned long flags)
  131. {
  132. struct vm_area_struct *vmm;
  133. if (len > RGN_MAP_LIMIT)
  134. return -ENOMEM;
  135. if (len & ~HPAGE_MASK)
  136. return -EINVAL;
  137. /* Handle MAP_FIXED */
  138. if (flags & MAP_FIXED) {
  139. if (prepare_hugepage_range(file, addr, len))
  140. return -EINVAL;
  141. return addr;
  142. }
  143. /* This code assumes that RGN_HPAGE != 0. */
  144. if ((REGION_NUMBER(addr) != RGN_HPAGE) || (addr & (HPAGE_SIZE - 1)))
  145. addr = HPAGE_REGION_BASE;
  146. else
  147. addr = ALIGN(addr, HPAGE_SIZE);
  148. for (vmm = find_vma(current->mm, addr); ; vmm = vmm->vm_next) {
  149. /* At this point: (!vmm || addr < vmm->vm_end). */
  150. if (REGION_OFFSET(addr) + len > RGN_MAP_LIMIT)
  151. return -ENOMEM;
  152. if (!vmm || (addr + len) <= vmm->vm_start)
  153. return addr;
  154. addr = ALIGN(vmm->vm_end, HPAGE_SIZE);
  155. }
  156. }
  157. static int __init hugetlb_setup_sz(char *str)
  158. {
  159. u64 tr_pages;
  160. unsigned long long size;
  161. if (ia64_pal_vm_page_size(&tr_pages, NULL) != 0)
  162. /*
  163. * shouldn't happen, but just in case.
  164. */
  165. tr_pages = 0x15557000UL;
  166. size = memparse(str, &str);
  167. if (*str || !is_power_of_2(size) || !(tr_pages & size) ||
  168. size <= PAGE_SIZE ||
  169. size >= (1UL << PAGE_SHIFT << MAX_ORDER)) {
  170. printk(KERN_WARNING "Invalid huge page size specified\n");
  171. return 1;
  172. }
  173. hpage_shift = __ffs(size);
  174. /*
  175. * boot cpu already executed ia64_mmu_init, and has HPAGE_SHIFT_DEFAULT
  176. * override here with new page shift.
  177. */
  178. ia64_set_rr(HPAGE_REGION_BASE, hpage_shift << 2);
  179. return 0;
  180. }
  181. early_param("hugepagesz", hugetlb_setup_sz);