hugetlbpage.c 4.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208
  1. /*
  2. * IA-64 Huge TLB Page Support for Kernel.
  3. *
  4. * Copyright (C) 2002-2004 Rohit Seth <rohit.seth@intel.com>
  5. * Copyright (C) 2003-2004 Ken Chen <kenneth.w.chen@intel.com>
  6. *
  7. * Sep, 2003: add numa support
  8. * Feb, 2004: dynamic hugetlb page size via boot parameter
  9. */
  10. #include <linux/init.h>
  11. #include <linux/fs.h>
  12. #include <linux/mm.h>
  13. #include <linux/hugetlb.h>
  14. #include <linux/pagemap.h>
  15. #include <linux/module.h>
  16. #include <linux/sysctl.h>
  17. #include <linux/log2.h>
  18. #include <asm/mman.h>
  19. #include <asm/pgalloc.h>
  20. #include <asm/tlb.h>
  21. #include <asm/tlbflush.h>
  22. unsigned int hpage_shift = HPAGE_SHIFT_DEFAULT;
  23. EXPORT_SYMBOL(hpage_shift);
  24. pte_t *
  25. huge_pte_alloc(struct mm_struct *mm, unsigned long addr, unsigned long sz)
  26. {
  27. unsigned long taddr = htlbpage_to_page(addr);
  28. pgd_t *pgd;
  29. pud_t *pud;
  30. pmd_t *pmd;
  31. pte_t *pte = NULL;
  32. pgd = pgd_offset(mm, taddr);
  33. pud = pud_alloc(mm, pgd, taddr);
  34. if (pud) {
  35. pmd = pmd_alloc(mm, pud, taddr);
  36. if (pmd)
  37. pte = pte_alloc_map(mm, NULL, pmd, taddr);
  38. }
  39. return pte;
  40. }
  41. pte_t *
  42. huge_pte_offset (struct mm_struct *mm, unsigned long addr)
  43. {
  44. unsigned long taddr = htlbpage_to_page(addr);
  45. pgd_t *pgd;
  46. pud_t *pud;
  47. pmd_t *pmd;
  48. pte_t *pte = NULL;
  49. pgd = pgd_offset(mm, taddr);
  50. if (pgd_present(*pgd)) {
  51. pud = pud_offset(pgd, taddr);
  52. if (pud_present(*pud)) {
  53. pmd = pmd_offset(pud, taddr);
  54. if (pmd_present(*pmd))
  55. pte = pte_offset_map(pmd, taddr);
  56. }
  57. }
  58. return pte;
  59. }
  60. int huge_pmd_unshare(struct mm_struct *mm, unsigned long *addr, pte_t *ptep)
  61. {
  62. return 0;
  63. }
  64. #define mk_pte_huge(entry) { pte_val(entry) |= _PAGE_P; }
  65. /*
  66. * Don't actually need to do any preparation, but need to make sure
  67. * the address is in the right region.
  68. */
  69. int prepare_hugepage_range(struct file *file,
  70. unsigned long addr, unsigned long len)
  71. {
  72. if (len & ~HPAGE_MASK)
  73. return -EINVAL;
  74. if (addr & ~HPAGE_MASK)
  75. return -EINVAL;
  76. if (REGION_NUMBER(addr) != RGN_HPAGE)
  77. return -EINVAL;
  78. return 0;
  79. }
  80. struct page *follow_huge_addr(struct mm_struct *mm, unsigned long addr, int write)
  81. {
  82. struct page *page;
  83. pte_t *ptep;
  84. if (REGION_NUMBER(addr) != RGN_HPAGE)
  85. return ERR_PTR(-EINVAL);
  86. ptep = huge_pte_offset(mm, addr);
  87. if (!ptep || pte_none(*ptep))
  88. return NULL;
  89. page = pte_page(*ptep);
  90. page += ((addr & ~HPAGE_MASK) >> PAGE_SHIFT);
  91. return page;
  92. }
  93. int pmd_huge(pmd_t pmd)
  94. {
  95. return 0;
  96. }
  97. int pud_huge(pud_t pud)
  98. {
  99. return 0;
  100. }
  101. struct page *
  102. follow_huge_pmd(struct mm_struct *mm, unsigned long address, pmd_t *pmd, int write)
  103. {
  104. return NULL;
  105. }
  106. void hugetlb_free_pgd_range(struct mmu_gather *tlb,
  107. unsigned long addr, unsigned long end,
  108. unsigned long floor, unsigned long ceiling)
  109. {
  110. /*
  111. * This is called to free hugetlb page tables.
  112. *
  113. * The offset of these addresses from the base of the hugetlb
  114. * region must be scaled down by HPAGE_SIZE/PAGE_SIZE so that
  115. * the standard free_pgd_range will free the right page tables.
  116. *
  117. * If floor and ceiling are also in the hugetlb region, they
  118. * must likewise be scaled down; but if outside, left unchanged.
  119. */
  120. addr = htlbpage_to_page(addr);
  121. end = htlbpage_to_page(end);
  122. if (REGION_NUMBER(floor) == RGN_HPAGE)
  123. floor = htlbpage_to_page(floor);
  124. if (REGION_NUMBER(ceiling) == RGN_HPAGE)
  125. ceiling = htlbpage_to_page(ceiling);
  126. free_pgd_range(tlb, addr, end, floor, ceiling);
  127. }
  128. unsigned long hugetlb_get_unmapped_area(struct file *file, unsigned long addr, unsigned long len,
  129. unsigned long pgoff, unsigned long flags)
  130. {
  131. struct vm_area_struct *vmm;
  132. if (len > RGN_MAP_LIMIT)
  133. return -ENOMEM;
  134. if (len & ~HPAGE_MASK)
  135. return -EINVAL;
  136. /* Handle MAP_FIXED */
  137. if (flags & MAP_FIXED) {
  138. if (prepare_hugepage_range(file, addr, len))
  139. return -EINVAL;
  140. return addr;
  141. }
  142. /* This code assumes that RGN_HPAGE != 0. */
  143. if ((REGION_NUMBER(addr) != RGN_HPAGE) || (addr & (HPAGE_SIZE - 1)))
  144. addr = HPAGE_REGION_BASE;
  145. else
  146. addr = ALIGN(addr, HPAGE_SIZE);
  147. for (vmm = find_vma(current->mm, addr); ; vmm = vmm->vm_next) {
  148. /* At this point: (!vmm || addr < vmm->vm_end). */
  149. if (REGION_OFFSET(addr) + len > RGN_MAP_LIMIT)
  150. return -ENOMEM;
  151. if (!vmm || (addr + len) <= vmm->vm_start)
  152. return addr;
  153. addr = ALIGN(vmm->vm_end, HPAGE_SIZE);
  154. }
  155. }
  156. static int __init hugetlb_setup_sz(char *str)
  157. {
  158. u64 tr_pages;
  159. unsigned long long size;
  160. if (ia64_pal_vm_page_size(&tr_pages, NULL) != 0)
  161. /*
  162. * shouldn't happen, but just in case.
  163. */
  164. tr_pages = 0x15557000UL;
  165. size = memparse(str, &str);
  166. if (*str || !is_power_of_2(size) || !(tr_pages & size) ||
  167. size <= PAGE_SIZE ||
  168. size >= (1UL << PAGE_SHIFT << MAX_ORDER)) {
  169. printk(KERN_WARNING "Invalid huge page size specified\n");
  170. return 1;
  171. }
  172. hpage_shift = __ffs(size);
  173. /*
  174. * boot cpu already executed ia64_mmu_init, and has HPAGE_SHIFT_DEFAULT
  175. * override here with new page shift.
  176. */
  177. ia64_set_rr(HPAGE_REGION_BASE, hpage_shift << 2);
  178. return 0;
  179. }
  180. early_param("hugepagesz", hugetlb_setup_sz);