contig.c 9.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359
  1. /*
  2. * This file is subject to the terms and conditions of the GNU General Public
  3. * License. See the file "COPYING" in the main directory of this archive
  4. * for more details.
  5. *
  6. * Copyright (C) 1998-2003 Hewlett-Packard Co
  7. * David Mosberger-Tang <davidm@hpl.hp.com>
  8. * Stephane Eranian <eranian@hpl.hp.com>
  9. * Copyright (C) 2000, Rohit Seth <rohit.seth@intel.com>
  10. * Copyright (C) 1999 VA Linux Systems
  11. * Copyright (C) 1999 Walt Drummond <drummond@valinux.com>
  12. * Copyright (C) 2003 Silicon Graphics, Inc. All rights reserved.
  13. *
  14. * Routines used by ia64 machines with contiguous (or virtually contiguous)
  15. * memory.
  16. */
  17. #include <linux/bootmem.h>
  18. #include <linux/efi.h>
  19. #include <linux/memblock.h>
  20. #include <linux/mm.h>
  21. #include <linux/nmi.h>
  22. #include <linux/swap.h>
  23. #include <asm/meminit.h>
  24. #include <asm/pgalloc.h>
  25. #include <asm/pgtable.h>
  26. #include <asm/sections.h>
  27. #include <asm/mca.h>
  28. #ifdef CONFIG_VIRTUAL_MEM_MAP
  29. static unsigned long max_gap;
  30. #endif
  31. /**
  32. * show_mem - give short summary of memory stats
  33. *
  34. * Shows a simple page count of reserved and used pages in the system.
  35. * For discontig machines, it does this on a per-pgdat basis.
  36. */
  37. void show_mem(unsigned int filter)
  38. {
  39. int i, total_reserved = 0;
  40. int total_shared = 0, total_cached = 0;
  41. unsigned long total_present = 0;
  42. pg_data_t *pgdat;
  43. printk(KERN_INFO "Mem-info:\n");
  44. show_free_areas(filter);
  45. printk(KERN_INFO "Node memory in pages:\n");
  46. if (filter & SHOW_MEM_FILTER_PAGE_COUNT)
  47. return;
  48. for_each_online_pgdat(pgdat) {
  49. unsigned long present;
  50. unsigned long flags;
  51. int shared = 0, cached = 0, reserved = 0;
  52. int nid = pgdat->node_id;
  53. if (skip_free_areas_node(filter, nid))
  54. continue;
  55. pgdat_resize_lock(pgdat, &flags);
  56. present = pgdat->node_present_pages;
  57. for(i = 0; i < pgdat->node_spanned_pages; i++) {
  58. struct page *page;
  59. if (unlikely(i % MAX_ORDER_NR_PAGES == 0))
  60. touch_nmi_watchdog();
  61. if (pfn_valid(pgdat->node_start_pfn + i))
  62. page = pfn_to_page(pgdat->node_start_pfn + i);
  63. else {
  64. #ifdef CONFIG_VIRTUAL_MEM_MAP
  65. if (max_gap < LARGE_GAP)
  66. continue;
  67. #endif
  68. i = vmemmap_find_next_valid_pfn(nid, i) - 1;
  69. continue;
  70. }
  71. if (PageReserved(page))
  72. reserved++;
  73. else if (PageSwapCache(page))
  74. cached++;
  75. else if (page_count(page))
  76. shared += page_count(page)-1;
  77. }
  78. pgdat_resize_unlock(pgdat, &flags);
  79. total_present += present;
  80. total_reserved += reserved;
  81. total_cached += cached;
  82. total_shared += shared;
  83. printk(KERN_INFO "Node %4d: RAM: %11ld, rsvd: %8d, "
  84. "shrd: %10d, swpd: %10d\n", nid,
  85. present, reserved, shared, cached);
  86. }
  87. printk(KERN_INFO "%ld pages of RAM\n", total_present);
  88. printk(KERN_INFO "%d reserved pages\n", total_reserved);
  89. printk(KERN_INFO "%d pages shared\n", total_shared);
  90. printk(KERN_INFO "%d pages swap cached\n", total_cached);
  91. printk(KERN_INFO "Total of %ld pages in page table cache\n",
  92. quicklist_total_size());
  93. printk(KERN_INFO "%d free buffer pages\n", nr_free_buffer_pages());
  94. }
  95. /* physical address where the bootmem map is located */
  96. unsigned long bootmap_start;
  97. /**
  98. * find_bootmap_location - callback to find a memory area for the bootmap
  99. * @start: start of region
  100. * @end: end of region
  101. * @arg: unused callback data
  102. *
  103. * Find a place to put the bootmap and return its starting address in
  104. * bootmap_start. This address must be page-aligned.
  105. */
  106. static int __init
  107. find_bootmap_location (u64 start, u64 end, void *arg)
  108. {
  109. u64 needed = *(unsigned long *)arg;
  110. u64 range_start, range_end, free_start;
  111. int i;
  112. #if IGNORE_PFN0
  113. if (start == PAGE_OFFSET) {
  114. start += PAGE_SIZE;
  115. if (start >= end)
  116. return 0;
  117. }
  118. #endif
  119. free_start = PAGE_OFFSET;
  120. for (i = 0; i < num_rsvd_regions; i++) {
  121. range_start = max(start, free_start);
  122. range_end = min(end, rsvd_region[i].start & PAGE_MASK);
  123. free_start = PAGE_ALIGN(rsvd_region[i].end);
  124. if (range_end <= range_start)
  125. continue; /* skip over empty range */
  126. if (range_end - range_start >= needed) {
  127. bootmap_start = __pa(range_start);
  128. return -1; /* done */
  129. }
  130. /* nothing more available in this segment */
  131. if (range_end == end)
  132. return 0;
  133. }
  134. return 0;
  135. }
  136. #ifdef CONFIG_SMP
  137. static void *cpu_data;
  138. /**
  139. * per_cpu_init - setup per-cpu variables
  140. *
  141. * Allocate and setup per-cpu data areas.
  142. */
  143. void * __cpuinit
  144. per_cpu_init (void)
  145. {
  146. static bool first_time = true;
  147. void *cpu0_data = __cpu0_per_cpu;
  148. unsigned int cpu;
  149. if (!first_time)
  150. goto skip;
  151. first_time = false;
  152. /*
  153. * get_free_pages() cannot be used before cpu_init() done.
  154. * BSP allocates PERCPU_PAGE_SIZE bytes for all possible CPUs
  155. * to avoid that AP calls get_zeroed_page().
  156. */
  157. for_each_possible_cpu(cpu) {
  158. void *src = cpu == 0 ? cpu0_data : __phys_per_cpu_start;
  159. memcpy(cpu_data, src, __per_cpu_end - __per_cpu_start);
  160. __per_cpu_offset[cpu] = (char *)cpu_data - __per_cpu_start;
  161. per_cpu(local_per_cpu_offset, cpu) = __per_cpu_offset[cpu];
  162. /*
  163. * percpu area for cpu0 is moved from the __init area
  164. * which is setup by head.S and used till this point.
  165. * Update ar.k3. This move is ensures that percpu
  166. * area for cpu0 is on the correct node and its
  167. * virtual address isn't insanely far from other
  168. * percpu areas which is important for congruent
  169. * percpu allocator.
  170. */
  171. if (cpu == 0)
  172. ia64_set_kr(IA64_KR_PER_CPU_DATA, __pa(cpu_data) -
  173. (unsigned long)__per_cpu_start);
  174. cpu_data += PERCPU_PAGE_SIZE;
  175. }
  176. skip:
  177. return __per_cpu_start + __per_cpu_offset[smp_processor_id()];
  178. }
  179. static inline void
  180. alloc_per_cpu_data(void)
  181. {
  182. cpu_data = __alloc_bootmem(PERCPU_PAGE_SIZE * num_possible_cpus(),
  183. PERCPU_PAGE_SIZE, __pa(MAX_DMA_ADDRESS));
  184. }
  185. /**
  186. * setup_per_cpu_areas - setup percpu areas
  187. *
  188. * Arch code has already allocated and initialized percpu areas. All
  189. * this function has to do is to teach the determined layout to the
  190. * dynamic percpu allocator, which happens to be more complex than
  191. * creating whole new ones using helpers.
  192. */
  193. void __init
  194. setup_per_cpu_areas(void)
  195. {
  196. struct pcpu_alloc_info *ai;
  197. struct pcpu_group_info *gi;
  198. unsigned int cpu;
  199. ssize_t static_size, reserved_size, dyn_size;
  200. int rc;
  201. ai = pcpu_alloc_alloc_info(1, num_possible_cpus());
  202. if (!ai)
  203. panic("failed to allocate pcpu_alloc_info");
  204. gi = &ai->groups[0];
  205. /* units are assigned consecutively to possible cpus */
  206. for_each_possible_cpu(cpu)
  207. gi->cpu_map[gi->nr_units++] = cpu;
  208. /* set parameters */
  209. static_size = __per_cpu_end - __per_cpu_start;
  210. reserved_size = PERCPU_MODULE_RESERVE;
  211. dyn_size = PERCPU_PAGE_SIZE - static_size - reserved_size;
  212. if (dyn_size < 0)
  213. panic("percpu area overflow static=%zd reserved=%zd\n",
  214. static_size, reserved_size);
  215. ai->static_size = static_size;
  216. ai->reserved_size = reserved_size;
  217. ai->dyn_size = dyn_size;
  218. ai->unit_size = PERCPU_PAGE_SIZE;
  219. ai->atom_size = PAGE_SIZE;
  220. ai->alloc_size = PERCPU_PAGE_SIZE;
  221. rc = pcpu_setup_first_chunk(ai, __per_cpu_start + __per_cpu_offset[0]);
  222. if (rc)
  223. panic("failed to setup percpu area (err=%d)", rc);
  224. pcpu_free_alloc_info(ai);
  225. }
  226. #else
  227. #define alloc_per_cpu_data() do { } while (0)
  228. #endif /* CONFIG_SMP */
  229. /**
  230. * find_memory - setup memory map
  231. *
  232. * Walk the EFI memory map and find usable memory for the system, taking
  233. * into account reserved areas.
  234. */
  235. void __init
  236. find_memory (void)
  237. {
  238. unsigned long bootmap_size;
  239. reserve_memory();
  240. /* first find highest page frame number */
  241. min_low_pfn = ~0UL;
  242. max_low_pfn = 0;
  243. efi_memmap_walk(find_max_min_low_pfn, NULL);
  244. max_pfn = max_low_pfn;
  245. /* how many bytes to cover all the pages */
  246. bootmap_size = bootmem_bootmap_pages(max_pfn) << PAGE_SHIFT;
  247. /* look for a location to hold the bootmap */
  248. bootmap_start = ~0UL;
  249. efi_memmap_walk(find_bootmap_location, &bootmap_size);
  250. if (bootmap_start == ~0UL)
  251. panic("Cannot find %ld bytes for bootmap\n", bootmap_size);
  252. bootmap_size = init_bootmem_node(NODE_DATA(0),
  253. (bootmap_start >> PAGE_SHIFT), 0, max_pfn);
  254. /* Free all available memory, then mark bootmem-map as being in use. */
  255. efi_memmap_walk(filter_rsvd_memory, free_bootmem);
  256. reserve_bootmem(bootmap_start, bootmap_size, BOOTMEM_DEFAULT);
  257. find_initrd();
  258. alloc_per_cpu_data();
  259. }
  260. static int count_pages(u64 start, u64 end, void *arg)
  261. {
  262. unsigned long *count = arg;
  263. *count += (end - start) >> PAGE_SHIFT;
  264. return 0;
  265. }
  266. /*
  267. * Set up the page tables.
  268. */
  269. void __init
  270. paging_init (void)
  271. {
  272. unsigned long max_dma;
  273. unsigned long max_zone_pfns[MAX_NR_ZONES];
  274. num_physpages = 0;
  275. efi_memmap_walk(count_pages, &num_physpages);
  276. memset(max_zone_pfns, 0, sizeof(max_zone_pfns));
  277. #ifdef CONFIG_ZONE_DMA
  278. max_dma = virt_to_phys((void *) MAX_DMA_ADDRESS) >> PAGE_SHIFT;
  279. max_zone_pfns[ZONE_DMA] = max_dma;
  280. #endif
  281. max_zone_pfns[ZONE_NORMAL] = max_low_pfn;
  282. #ifdef CONFIG_VIRTUAL_MEM_MAP
  283. efi_memmap_walk(filter_memory, register_active_ranges);
  284. efi_memmap_walk(find_largest_hole, (u64 *)&max_gap);
  285. if (max_gap < LARGE_GAP) {
  286. vmem_map = (struct page *) 0;
  287. free_area_init_nodes(max_zone_pfns);
  288. } else {
  289. unsigned long map_size;
  290. /* allocate virtual_mem_map */
  291. map_size = PAGE_ALIGN(ALIGN(max_low_pfn, MAX_ORDER_NR_PAGES) *
  292. sizeof(struct page));
  293. VMALLOC_END -= map_size;
  294. vmem_map = (struct page *) VMALLOC_END;
  295. efi_memmap_walk(create_mem_map_page_table, NULL);
  296. /*
  297. * alloc_node_mem_map makes an adjustment for mem_map
  298. * which isn't compatible with vmem_map.
  299. */
  300. NODE_DATA(0)->node_mem_map = vmem_map +
  301. find_min_pfn_with_active_regions();
  302. free_area_init_nodes(max_zone_pfns);
  303. printk("Virtual mem_map starts at 0x%p\n", mem_map);
  304. }
  305. #else /* !CONFIG_VIRTUAL_MEM_MAP */
  306. memblock_add_node(0, PFN_PHYS(max_low_pfn), 0);
  307. free_area_init_nodes(max_zone_pfns);
  308. #endif /* !CONFIG_VIRTUAL_MEM_MAP */
  309. zero_page_memmap_ptr = virt_to_page(ia64_imva(empty_zero_page));
  310. }