blob: 351da0a06cd044cefcff49cfaee848ba7b636d5f [file] [log] [blame]
/*
 * This file is subject to the terms and conditions of the GNU General Public
 * License.  See the file "COPYING" in the main directory of this archive
 * for more details.
 *
 * Copyright (C) 1998-2003 Hewlett-Packard Co
 *	David Mosberger-Tang <davidm@hpl.hp.com>
 *	Stephane Eranian <eranian@hpl.hp.com>
 * Copyright (C) 2000, Rohit Seth <rohit.seth@intel.com>
 * Copyright (C) 1999 VA Linux Systems
 * Copyright (C) 1999 Walt Drummond <drummond@valinux.com>
 * Copyright (C) 2003 Silicon Graphics, Inc. All rights reserved.
 *
 * Routines used by ia64 machines with contiguous (or virtually contiguous)
 * memory.
 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/bootmem.h>
18#include <linux/efi.h>
19#include <linux/mm.h>
Prarit Bhargava99a19cf12007-08-22 14:34:38 -040020#include <linux/nmi.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <linux/swap.h>
22
23#include <asm/meminit.h>
24#include <asm/pgalloc.h>
25#include <asm/pgtable.h>
26#include <asm/sections.h>
27#include <asm/mca.h>
28
29#ifdef CONFIG_VIRTUAL_MEM_MAP
Bob Piccoe44e41d2006-06-28 12:55:43 -040030static unsigned long max_gap;
Linus Torvalds1da177e2005-04-16 15:20:36 -070031#endif
32
33/**
George Beshersf1c0afa2007-02-05 16:20:04 -080034 * show_mem - give short summary of memory stats
Linus Torvalds1da177e2005-04-16 15:20:36 -070035 *
George Beshersf1c0afa2007-02-05 16:20:04 -080036 * Shows a simple page count of reserved and used pages in the system.
37 * For discontig machines, it does this on a per-pgdat basis.
Linus Torvalds1da177e2005-04-16 15:20:36 -070038 */
George Beshersf1c0afa2007-02-05 16:20:04 -080039void show_mem(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -070040{
George Beshersf1c0afa2007-02-05 16:20:04 -080041 int i, total_reserved = 0;
42 int total_shared = 0, total_cached = 0;
43 unsigned long total_present = 0;
44 pg_data_t *pgdat;
Linus Torvalds1da177e2005-04-16 15:20:36 -070045
Jes Sorensen709a6c12006-09-13 08:43:42 -040046 printk(KERN_INFO "Mem-info:\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -070047 show_free_areas();
George Beshersf1c0afa2007-02-05 16:20:04 -080048 printk(KERN_INFO "Node memory in pages:\n");
49 for_each_online_pgdat(pgdat) {
50 unsigned long present;
51 unsigned long flags;
52 int shared = 0, cached = 0, reserved = 0;
53
54 pgdat_resize_lock(pgdat, &flags);
55 present = pgdat->node_present_pages;
56 for(i = 0; i < pgdat->node_spanned_pages; i++) {
57 struct page *page;
Prarit Bhargava99a19cf12007-08-22 14:34:38 -040058 if (unlikely(i % MAX_ORDER_NR_PAGES == 0))
59 touch_nmi_watchdog();
George Beshersf1c0afa2007-02-05 16:20:04 -080060 if (pfn_valid(pgdat->node_start_pfn + i))
61 page = pfn_to_page(pgdat->node_start_pfn + i);
62 else {
Bob Piccoe44e41d2006-06-28 12:55:43 -040063#ifdef CONFIG_VIRTUAL_MEM_MAP
George Beshersf1c0afa2007-02-05 16:20:04 -080064 if (max_gap < LARGE_GAP)
65 continue;
Bob Piccoe44e41d2006-06-28 12:55:43 -040066#endif
George Beshersf1c0afa2007-02-05 16:20:04 -080067 i = vmemmap_find_next_valid_pfn(pgdat->node_id,
68 i) - 1;
69 continue;
70 }
71 if (PageReserved(page))
72 reserved++;
73 else if (PageSwapCache(page))
74 cached++;
75 else if (page_count(page))
76 shared += page_count(page)-1;
Bob Piccoe44e41d2006-06-28 12:55:43 -040077 }
George Beshersf1c0afa2007-02-05 16:20:04 -080078 pgdat_resize_unlock(pgdat, &flags);
79 total_present += present;
80 total_reserved += reserved;
81 total_cached += cached;
82 total_shared += shared;
83 printk(KERN_INFO "Node %4d: RAM: %11ld, rsvd: %8d, "
84 "shrd: %10d, swpd: %10d\n", pgdat->node_id,
85 present, reserved, shared, cached);
Linus Torvalds1da177e2005-04-16 15:20:36 -070086 }
George Beshersf1c0afa2007-02-05 16:20:04 -080087 printk(KERN_INFO "%ld pages of RAM\n", total_present);
88 printk(KERN_INFO "%d reserved pages\n", total_reserved);
89 printk(KERN_INFO "%d pages shared\n", total_shared);
90 printk(KERN_INFO "%d pages swap cached\n", total_cached);
91 printk(KERN_INFO "Total of %ld pages in page table cache\n",
Christoph Lameter2bd62a42007-05-10 22:42:53 -070092 quicklist_total_size());
George Beshersf1c0afa2007-02-05 16:20:04 -080093 printk(KERN_INFO "%d free buffer pages\n", nr_free_buffer_pages());
Linus Torvalds1da177e2005-04-16 15:20:36 -070094}
95
George Beshersf1c0afa2007-02-05 16:20:04 -080096
Linus Torvalds1da177e2005-04-16 15:20:36 -070097/* physical address where the bootmem map is located */
98unsigned long bootmap_start;
99
100/**
Linus Torvalds1da177e2005-04-16 15:20:36 -0700101 * find_bootmap_location - callback to find a memory area for the bootmap
102 * @start: start of region
103 * @end: end of region
104 * @arg: unused callback data
105 *
106 * Find a place to put the bootmap and return its starting address in
107 * bootmap_start. This address must be page-aligned.
108 */
Chen, Kenneth Wdae28062006-03-22 16:54:15 -0800109static int __init
Matthew Wilcoxe088a4a2009-05-22 13:49:49 -0700110find_bootmap_location (u64 start, u64 end, void *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700111{
Matthew Wilcoxe088a4a2009-05-22 13:49:49 -0700112 u64 needed = *(unsigned long *)arg;
113 u64 range_start, range_end, free_start;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114 int i;
115
116#if IGNORE_PFN0
117 if (start == PAGE_OFFSET) {
118 start += PAGE_SIZE;
119 if (start >= end)
120 return 0;
121 }
122#endif
123
124 free_start = PAGE_OFFSET;
125
126 for (i = 0; i < num_rsvd_regions; i++) {
127 range_start = max(start, free_start);
128 range_end = min(end, rsvd_region[i].start & PAGE_MASK);
129
130 free_start = PAGE_ALIGN(rsvd_region[i].end);
131
132 if (range_end <= range_start)
133 continue; /* skip over empty range */
134
135 if (range_end - range_start >= needed) {
136 bootmap_start = __pa(range_start);
137 return -1; /* done */
138 }
139
140 /* nothing more available in this segment */
141 if (range_end == end)
142 return 0;
143 }
144 return 0;
145}
146
#ifdef CONFIG_SMP
/* Next unused per-cpu area inside the buffer set up by alloc_per_cpu_data(). */
static void *cpu_data;

/**
 * per_cpu_init - setup per-cpu variables
 *
 * On the first call, fills in one per-cpu area for each of the NR_CPUS
 * possible CPUs out of the cpu_data buffer and records the matching
 * offsets.  Every call returns the address of the calling CPU's area.
 */
void * __cpuinit
per_cpu_init (void)
{
	static bool first_time = true;
	unsigned int cpu;

	if (first_time) {
		first_time = false;

		/*
		 * get_free_pages() cannot be used before cpu_init() done.
		 * BSP sets up the areas for all "NR_CPUS" CPUs here so that
		 * no AP has to call get_zeroed_page().
		 */
		for (cpu = 0; cpu < NR_CPUS; cpu++) {
			void *init_image;

			/* cpu0 continues from the area it has used so far */
			if (cpu == 0)
				init_image = __cpu0_per_cpu;
			else
				init_image = __phys_per_cpu_start;

			memcpy(cpu_data, init_image,
			       __per_cpu_end - __per_cpu_start);
			__per_cpu_offset[cpu] = (char *)cpu_data -
						__per_cpu_start;
			per_cpu(local_per_cpu_offset, cpu) =
						__per_cpu_offset[cpu];

			/*
			 * percpu area for cpu0 is moved from the __init area
			 * which is setup by head.S and used till this point.
			 * Update ar.k3.  This move ensures that percpu
			 * area for cpu0 is on the correct node and its
			 * virtual address isn't insanely far from other
			 * percpu areas which is important for congruent
			 * percpu allocator.
			 */
			if (cpu == 0)
				ia64_set_kr(IA64_KR_PER_CPU_DATA,
					    __pa(cpu_data) -
					    (unsigned long)__per_cpu_start);

			cpu_data += PERCPU_PAGE_SIZE;
		}
	}

	return __per_cpu_start + __per_cpu_offset[smp_processor_id()];
}

/*
 * Reserve one PERCPU_PAGE_SIZE-aligned bootmem buffer large enough to hold
 * a per-cpu area for each of the NR_CPUS possible CPUs.
 */
static inline void
alloc_per_cpu_data(void)
{
	cpu_data = __alloc_bootmem(PERCPU_PAGE_SIZE * NR_CPUS,
				   PERCPU_PAGE_SIZE,
				   __pa(MAX_DMA_ADDRESS));
}
#else
#define alloc_per_cpu_data() do { } while (0)
#endif /* CONFIG_SMP */
205
Linus Torvalds1da177e2005-04-16 15:20:36 -0700206/**
207 * find_memory - setup memory map
208 *
209 * Walk the EFI memory map and find usable memory for the system, taking
210 * into account reserved areas.
211 */
Chen, Kenneth Wdae28062006-03-22 16:54:15 -0800212void __init
Linus Torvalds1da177e2005-04-16 15:20:36 -0700213find_memory (void)
214{
215 unsigned long bootmap_size;
216
217 reserve_memory();
218
219 /* first find highest page frame number */
Zou Nan haia3f5c332007-03-20 13:41:57 -0700220 min_low_pfn = ~0UL;
221 max_low_pfn = 0;
222 efi_memmap_walk(find_max_min_low_pfn, NULL);
223 max_pfn = max_low_pfn;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700224 /* how many bytes to cover all the pages */
225 bootmap_size = bootmem_bootmap_pages(max_pfn) << PAGE_SHIFT;
226
227 /* look for a location to hold the bootmap */
228 bootmap_start = ~0UL;
229 efi_memmap_walk(find_bootmap_location, &bootmap_size);
230 if (bootmap_start == ~0UL)
231 panic("Cannot find %ld bytes for bootmap\n", bootmap_size);
232
Zou Nan haia3f5c332007-03-20 13:41:57 -0700233 bootmap_size = init_bootmem_node(NODE_DATA(0),
234 (bootmap_start >> PAGE_SHIFT), 0, max_pfn);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700235
236 /* Free all available memory, then mark bootmem-map as being in use. */
237 efi_memmap_walk(filter_rsvd_memory, free_bootmem);
Bernhard Walle72a7fe32008-02-07 00:15:17 -0800238 reserve_bootmem(bootmap_start, bootmap_size, BOOTMEM_DEFAULT);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239
240 find_initrd();
Horms45a98fc2006-12-12 17:49:03 +0900241
Tony Luck4b9ddc72007-11-06 15:14:45 -0800242 alloc_per_cpu_data();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700243}
244
Matthew Wilcoxe088a4a2009-05-22 13:49:49 -0700245static int count_pages(u64 start, u64 end, void *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246{
247 unsigned long *count = arg;
248
249 *count += (end - start) >> PAGE_SHIFT;
250 return 0;
251}
252
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253/*
254 * Set up the page tables.
255 */
256
Chen, Kenneth Wdae28062006-03-22 16:54:15 -0800257void __init
Linus Torvalds1da177e2005-04-16 15:20:36 -0700258paging_init (void)
259{
260 unsigned long max_dma;
Mel Gorman05e0caa2006-09-27 01:49:54 -0700261 unsigned long max_zone_pfns[MAX_NR_ZONES];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262
263 num_physpages = 0;
264 efi_memmap_walk(count_pages, &num_physpages);
265
Mel Gorman6391af12006-10-11 01:20:39 -0700266 memset(max_zone_pfns, 0, sizeof(max_zone_pfns));
Christoph Lameter09ae1f52007-02-10 01:43:11 -0800267#ifdef CONFIG_ZONE_DMA
268 max_dma = virt_to_phys((void *) MAX_DMA_ADDRESS) >> PAGE_SHIFT;
Mel Gorman05e0caa2006-09-27 01:49:54 -0700269 max_zone_pfns[ZONE_DMA] = max_dma;
Christoph Lameter09ae1f52007-02-10 01:43:11 -0800270#endif
Mel Gorman05e0caa2006-09-27 01:49:54 -0700271 max_zone_pfns[ZONE_NORMAL] = max_low_pfn;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272
273#ifdef CONFIG_VIRTUAL_MEM_MAP
Zoltan Menyhart98075d22008-04-11 15:21:35 -0700274 efi_memmap_walk(filter_memory, register_active_ranges);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700275 efi_memmap_walk(find_largest_hole, (u64 *)&max_gap);
276 if (max_gap < LARGE_GAP) {
277 vmem_map = (struct page *) 0;
Mel Gorman05e0caa2006-09-27 01:49:54 -0700278 free_area_init_nodes(max_zone_pfns);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700279 } else {
280 unsigned long map_size;
281
282 /* allocate virtual_mem_map */
283
Bob Picco921eea12006-06-28 12:54:55 -0400284 map_size = PAGE_ALIGN(ALIGN(max_low_pfn, MAX_ORDER_NR_PAGES) *
285 sizeof(struct page));
Tejun Heo126b3fc2009-10-02 13:28:55 +0900286 VMALLOC_END -= map_size;
287 vmem_map = (struct page *) VMALLOC_END;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288 efi_memmap_walk(create_mem_map_page_table, NULL);
289
Mel Gorman05e0caa2006-09-27 01:49:54 -0700290 /*
291 * alloc_node_mem_map makes an adjustment for mem_map
292 * which isn't compatible with vmem_map.
293 */
294 NODE_DATA(0)->node_mem_map = vmem_map +
295 find_min_pfn_with_active_regions();
296 free_area_init_nodes(max_zone_pfns);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297
298 printk("Virtual mem_map starts at 0x%p\n", mem_map);
299 }
300#else /* !CONFIG_VIRTUAL_MEM_MAP */
Mel Gorman05e0caa2006-09-27 01:49:54 -0700301 add_active_range(0, 0, max_low_pfn);
302 free_area_init_nodes(max_zone_pfns);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303#endif /* !CONFIG_VIRTUAL_MEM_MAP */
304 zero_page_memmap_ptr = virt_to_page(ia64_imva(empty_zero_page));
305}