blob: 142c3b7859443f18a76df4bb4906f78f592e2b41 [file] [log] [blame]
/*
 * This file is subject to the terms and conditions of the GNU General Public
 * License.  See the file "COPYING" in the main directory of this archive
 * for more details.
 *
 * Copyright (C) 1998-2003 Hewlett-Packard Co
 *	David Mosberger-Tang <davidm@hpl.hp.com>
 *	Stephane Eranian <eranian@hpl.hp.com>
 * Copyright (C) 2000, Rohit Seth <rohit.seth@intel.com>
 * Copyright (C) 1999 VA Linux Systems
 * Copyright (C) 1999 Walt Drummond <drummond@valinux.com>
 * Copyright (C) 2003 Silicon Graphics, Inc. All rights reserved.
 *
 * Routines used by ia64 machines with contiguous (or virtually contiguous)
 * memory.
 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/bootmem.h>
18#include <linux/efi.h>
Tejun Heo98e4ae82011-12-08 10:22:08 -080019#include <linux/memblock.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <linux/mm.h>
Prarit Bhargava99a19cf12007-08-22 14:34:38 -040021#include <linux/nmi.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070022#include <linux/swap.h>
23
24#include <asm/meminit.h>
25#include <asm/pgalloc.h>
26#include <asm/pgtable.h>
27#include <asm/sections.h>
28#include <asm/mca.h>
29
30#ifdef CONFIG_VIRTUAL_MEM_MAP
Bob Piccoe44e41d2006-06-28 12:55:43 -040031static unsigned long max_gap;
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#endif
33
34/**
George Beshersf1c0afa2007-02-05 16:20:04 -080035 * show_mem - give short summary of memory stats
Linus Torvalds1da177e2005-04-16 15:20:36 -070036 *
George Beshersf1c0afa2007-02-05 16:20:04 -080037 * Shows a simple page count of reserved and used pages in the system.
38 * For discontig machines, it does this on a per-pgdat basis.
Linus Torvalds1da177e2005-04-16 15:20:36 -070039 */
David Rientjesb2b755b2011-03-24 15:18:15 -070040void show_mem(unsigned int filter)
Linus Torvalds1da177e2005-04-16 15:20:36 -070041{
George Beshersf1c0afa2007-02-05 16:20:04 -080042 int i, total_reserved = 0;
43 int total_shared = 0, total_cached = 0;
44 unsigned long total_present = 0;
45 pg_data_t *pgdat;
Linus Torvalds1da177e2005-04-16 15:20:36 -070046
Jes Sorensen709a6c12006-09-13 08:43:42 -040047 printk(KERN_INFO "Mem-info:\n");
David Rientjes7bf02ea2011-05-24 17:11:16 -070048 show_free_areas(filter);
George Beshersf1c0afa2007-02-05 16:20:04 -080049 printk(KERN_INFO "Node memory in pages:\n");
David Rientjes4b59e6c2013-04-29 15:06:11 -070050 if (filter & SHOW_MEM_FILTER_PAGE_COUNT)
51 return;
George Beshersf1c0afa2007-02-05 16:20:04 -080052 for_each_online_pgdat(pgdat) {
53 unsigned long present;
54 unsigned long flags;
55 int shared = 0, cached = 0, reserved = 0;
David Rientjes7bf02ea2011-05-24 17:11:16 -070056 int nid = pgdat->node_id;
George Beshersf1c0afa2007-02-05 16:20:04 -080057
David Rientjes7bf02ea2011-05-24 17:11:16 -070058 if (skip_free_areas_node(filter, nid))
59 continue;
George Beshersf1c0afa2007-02-05 16:20:04 -080060 pgdat_resize_lock(pgdat, &flags);
61 present = pgdat->node_present_pages;
62 for(i = 0; i < pgdat->node_spanned_pages; i++) {
63 struct page *page;
Prarit Bhargava99a19cf12007-08-22 14:34:38 -040064 if (unlikely(i % MAX_ORDER_NR_PAGES == 0))
65 touch_nmi_watchdog();
George Beshersf1c0afa2007-02-05 16:20:04 -080066 if (pfn_valid(pgdat->node_start_pfn + i))
67 page = pfn_to_page(pgdat->node_start_pfn + i);
68 else {
Bob Piccoe44e41d2006-06-28 12:55:43 -040069#ifdef CONFIG_VIRTUAL_MEM_MAP
George Beshersf1c0afa2007-02-05 16:20:04 -080070 if (max_gap < LARGE_GAP)
71 continue;
Bob Piccoe44e41d2006-06-28 12:55:43 -040072#endif
David Rientjes7bf02ea2011-05-24 17:11:16 -070073 i = vmemmap_find_next_valid_pfn(nid, i) - 1;
George Beshersf1c0afa2007-02-05 16:20:04 -080074 continue;
75 }
76 if (PageReserved(page))
77 reserved++;
78 else if (PageSwapCache(page))
79 cached++;
80 else if (page_count(page))
81 shared += page_count(page)-1;
Bob Piccoe44e41d2006-06-28 12:55:43 -040082 }
George Beshersf1c0afa2007-02-05 16:20:04 -080083 pgdat_resize_unlock(pgdat, &flags);
84 total_present += present;
85 total_reserved += reserved;
86 total_cached += cached;
87 total_shared += shared;
88 printk(KERN_INFO "Node %4d: RAM: %11ld, rsvd: %8d, "
David Rientjes7bf02ea2011-05-24 17:11:16 -070089 "shrd: %10d, swpd: %10d\n", nid,
George Beshersf1c0afa2007-02-05 16:20:04 -080090 present, reserved, shared, cached);
Linus Torvalds1da177e2005-04-16 15:20:36 -070091 }
George Beshersf1c0afa2007-02-05 16:20:04 -080092 printk(KERN_INFO "%ld pages of RAM\n", total_present);
93 printk(KERN_INFO "%d reserved pages\n", total_reserved);
94 printk(KERN_INFO "%d pages shared\n", total_shared);
95 printk(KERN_INFO "%d pages swap cached\n", total_cached);
96 printk(KERN_INFO "Total of %ld pages in page table cache\n",
Christoph Lameter2bd62a42007-05-10 22:42:53 -070097 quicklist_total_size());
Zhang Yanfei6434b942013-02-22 16:35:45 -080098 printk(KERN_INFO "%ld free buffer pages\n", nr_free_buffer_pages());
Linus Torvalds1da177e2005-04-16 15:20:36 -070099}
100
George Beshersf1c0afa2007-02-05 16:20:04 -0800101
Linus Torvalds1da177e2005-04-16 15:20:36 -0700102/* physical address where the bootmem map is located */
103unsigned long bootmap_start;
104
105/**
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106 * find_bootmap_location - callback to find a memory area for the bootmap
107 * @start: start of region
108 * @end: end of region
109 * @arg: unused callback data
110 *
111 * Find a place to put the bootmap and return its starting address in
112 * bootmap_start. This address must be page-aligned.
113 */
Chen, Kenneth Wdae28062006-03-22 16:54:15 -0800114static int __init
Matthew Wilcoxe088a4a2009-05-22 13:49:49 -0700115find_bootmap_location (u64 start, u64 end, void *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700116{
Matthew Wilcoxe088a4a2009-05-22 13:49:49 -0700117 u64 needed = *(unsigned long *)arg;
118 u64 range_start, range_end, free_start;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119 int i;
120
121#if IGNORE_PFN0
122 if (start == PAGE_OFFSET) {
123 start += PAGE_SIZE;
124 if (start >= end)
125 return 0;
126 }
127#endif
128
129 free_start = PAGE_OFFSET;
130
131 for (i = 0; i < num_rsvd_regions; i++) {
132 range_start = max(start, free_start);
133 range_end = min(end, rsvd_region[i].start & PAGE_MASK);
134
135 free_start = PAGE_ALIGN(rsvd_region[i].end);
136
137 if (range_end <= range_start)
138 continue; /* skip over empty range */
139
140 if (range_end - range_start >= needed) {
141 bootmap_start = __pa(range_start);
142 return -1; /* done */
143 }
144
145 /* nothing more available in this segment */
146 if (range_end == end)
147 return 0;
148 }
149 return 0;
150}
151
Tony Luck4b9ddc72007-11-06 15:14:45 -0800152#ifdef CONFIG_SMP
153static void *cpu_data;
154/**
155 * per_cpu_init - setup per-cpu variables
156 *
157 * Allocate and setup per-cpu data areas.
158 */
Paul Gortmakerccce9bb2013-06-17 15:51:20 -0400159void *per_cpu_init(void)
Tony Luck4b9ddc72007-11-06 15:14:45 -0800160{
Tejun Heo36886472009-10-02 13:28:56 +0900161 static bool first_time = true;
162 void *cpu0_data = __cpu0_per_cpu;
163 unsigned int cpu;
164
165 if (!first_time)
166 goto skip;
167 first_time = false;
Tony Luck4b9ddc72007-11-06 15:14:45 -0800168
169 /*
Tejun Heo525947622009-10-02 13:28:56 +0900170 * get_free_pages() cannot be used before cpu_init() done.
171 * BSP allocates PERCPU_PAGE_SIZE bytes for all possible CPUs
172 * to avoid that AP calls get_zeroed_page().
Tony Luck4b9ddc72007-11-06 15:14:45 -0800173 */
Tejun Heo525947622009-10-02 13:28:56 +0900174 for_each_possible_cpu(cpu) {
Tejun Heo36886472009-10-02 13:28:56 +0900175 void *src = cpu == 0 ? cpu0_data : __phys_per_cpu_start;
Tony Luck10617bb2008-08-12 10:34:20 -0700176
Tejun Heo36886472009-10-02 13:28:56 +0900177 memcpy(cpu_data, src, __per_cpu_end - __per_cpu_start);
178 __per_cpu_offset[cpu] = (char *)cpu_data - __per_cpu_start;
179 per_cpu(local_per_cpu_offset, cpu) = __per_cpu_offset[cpu];
Tony Luck10617bb2008-08-12 10:34:20 -0700180
Tejun Heo36886472009-10-02 13:28:56 +0900181 /*
182 * percpu area for cpu0 is moved from the __init area
183 * which is setup by head.S and used till this point.
184 * Update ar.k3. This move is ensures that percpu
185 * area for cpu0 is on the correct node and its
186 * virtual address isn't insanely far from other
187 * percpu areas which is important for congruent
188 * percpu allocator.
189 */
190 if (cpu == 0)
191 ia64_set_kr(IA64_KR_PER_CPU_DATA, __pa(cpu_data) -
192 (unsigned long)__per_cpu_start);
Tony Luck10617bb2008-08-12 10:34:20 -0700193
Tejun Heo36886472009-10-02 13:28:56 +0900194 cpu_data += PERCPU_PAGE_SIZE;
Tony Luck4b9ddc72007-11-06 15:14:45 -0800195 }
Tejun Heo36886472009-10-02 13:28:56 +0900196skip:
Tony Luck4b9ddc72007-11-06 15:14:45 -0800197 return __per_cpu_start + __per_cpu_offset[smp_processor_id()];
198}
199
200static inline void
201alloc_per_cpu_data(void)
202{
Tejun Heo525947622009-10-02 13:28:56 +0900203 cpu_data = __alloc_bootmem(PERCPU_PAGE_SIZE * num_possible_cpus(),
Tony Luck4b9ddc72007-11-06 15:14:45 -0800204 PERCPU_PAGE_SIZE, __pa(MAX_DMA_ADDRESS));
205}
Tejun Heo525947622009-10-02 13:28:56 +0900206
207/**
208 * setup_per_cpu_areas - setup percpu areas
209 *
210 * Arch code has already allocated and initialized percpu areas. All
211 * this function has to do is to teach the determined layout to the
212 * dynamic percpu allocator, which happens to be more complex than
213 * creating whole new ones using helpers.
214 */
215void __init
216setup_per_cpu_areas(void)
217{
218 struct pcpu_alloc_info *ai;
219 struct pcpu_group_info *gi;
220 unsigned int cpu;
221 ssize_t static_size, reserved_size, dyn_size;
222 int rc;
223
224 ai = pcpu_alloc_alloc_info(1, num_possible_cpus());
225 if (!ai)
226 panic("failed to allocate pcpu_alloc_info");
227 gi = &ai->groups[0];
228
229 /* units are assigned consecutively to possible cpus */
230 for_each_possible_cpu(cpu)
231 gi->cpu_map[gi->nr_units++] = cpu;
232
233 /* set parameters */
234 static_size = __per_cpu_end - __per_cpu_start;
235 reserved_size = PERCPU_MODULE_RESERVE;
236 dyn_size = PERCPU_PAGE_SIZE - static_size - reserved_size;
237 if (dyn_size < 0)
238 panic("percpu area overflow static=%zd reserved=%zd\n",
239 static_size, reserved_size);
240
241 ai->static_size = static_size;
242 ai->reserved_size = reserved_size;
243 ai->dyn_size = dyn_size;
244 ai->unit_size = PERCPU_PAGE_SIZE;
245 ai->atom_size = PAGE_SIZE;
246 ai->alloc_size = PERCPU_PAGE_SIZE;
247
248 rc = pcpu_setup_first_chunk(ai, __per_cpu_start + __per_cpu_offset[0]);
249 if (rc)
250 panic("failed to setup percpu area (err=%d)", rc);
251
252 pcpu_free_alloc_info(ai);
253}
Tony Luck4b9ddc72007-11-06 15:14:45 -0800254#else
255#define alloc_per_cpu_data() do { } while (0)
256#endif /* CONFIG_SMP */
257
Linus Torvalds1da177e2005-04-16 15:20:36 -0700258/**
259 * find_memory - setup memory map
260 *
261 * Walk the EFI memory map and find usable memory for the system, taking
262 * into account reserved areas.
263 */
Chen, Kenneth Wdae28062006-03-22 16:54:15 -0800264void __init
Linus Torvalds1da177e2005-04-16 15:20:36 -0700265find_memory (void)
266{
267 unsigned long bootmap_size;
268
269 reserve_memory();
270
271 /* first find highest page frame number */
Zou Nan haia3f5c332007-03-20 13:41:57 -0700272 min_low_pfn = ~0UL;
273 max_low_pfn = 0;
274 efi_memmap_walk(find_max_min_low_pfn, NULL);
275 max_pfn = max_low_pfn;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276 /* how many bytes to cover all the pages */
277 bootmap_size = bootmem_bootmap_pages(max_pfn) << PAGE_SHIFT;
278
279 /* look for a location to hold the bootmap */
280 bootmap_start = ~0UL;
281 efi_memmap_walk(find_bootmap_location, &bootmap_size);
282 if (bootmap_start == ~0UL)
283 panic("Cannot find %ld bytes for bootmap\n", bootmap_size);
284
Zou Nan haia3f5c332007-03-20 13:41:57 -0700285 bootmap_size = init_bootmem_node(NODE_DATA(0),
286 (bootmap_start >> PAGE_SHIFT), 0, max_pfn);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700287
288 /* Free all available memory, then mark bootmem-map as being in use. */
289 efi_memmap_walk(filter_rsvd_memory, free_bootmem);
Bernhard Walle72a7fe32008-02-07 00:15:17 -0800290 reserve_bootmem(bootmap_start, bootmap_size, BOOTMEM_DEFAULT);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700291
292 find_initrd();
Horms45a98fc2006-12-12 17:49:03 +0900293
Tony Luck4b9ddc72007-11-06 15:14:45 -0800294 alloc_per_cpu_data();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700295}
296
Matthew Wilcoxe088a4a2009-05-22 13:49:49 -0700297static int count_pages(u64 start, u64 end, void *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700298{
299 unsigned long *count = arg;
300
301 *count += (end - start) >> PAGE_SHIFT;
302 return 0;
303}
304
Linus Torvalds1da177e2005-04-16 15:20:36 -0700305/*
306 * Set up the page tables.
307 */
308
Chen, Kenneth Wdae28062006-03-22 16:54:15 -0800309void __init
Linus Torvalds1da177e2005-04-16 15:20:36 -0700310paging_init (void)
311{
312 unsigned long max_dma;
Mel Gorman05e0caa2006-09-27 01:49:54 -0700313 unsigned long max_zone_pfns[MAX_NR_ZONES];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700314
315 num_physpages = 0;
316 efi_memmap_walk(count_pages, &num_physpages);
317
Mel Gorman6391af12006-10-11 01:20:39 -0700318 memset(max_zone_pfns, 0, sizeof(max_zone_pfns));
Christoph Lameter09ae1f52007-02-10 01:43:11 -0800319#ifdef CONFIG_ZONE_DMA
320 max_dma = virt_to_phys((void *) MAX_DMA_ADDRESS) >> PAGE_SHIFT;
Mel Gorman05e0caa2006-09-27 01:49:54 -0700321 max_zone_pfns[ZONE_DMA] = max_dma;
Christoph Lameter09ae1f52007-02-10 01:43:11 -0800322#endif
Mel Gorman05e0caa2006-09-27 01:49:54 -0700323 max_zone_pfns[ZONE_NORMAL] = max_low_pfn;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700324
325#ifdef CONFIG_VIRTUAL_MEM_MAP
Zoltan Menyhart98075d22008-04-11 15:21:35 -0700326 efi_memmap_walk(filter_memory, register_active_ranges);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700327 efi_memmap_walk(find_largest_hole, (u64 *)&max_gap);
328 if (max_gap < LARGE_GAP) {
329 vmem_map = (struct page *) 0;
Mel Gorman05e0caa2006-09-27 01:49:54 -0700330 free_area_init_nodes(max_zone_pfns);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700331 } else {
332 unsigned long map_size;
333
334 /* allocate virtual_mem_map */
335
Bob Picco921eea12006-06-28 12:54:55 -0400336 map_size = PAGE_ALIGN(ALIGN(max_low_pfn, MAX_ORDER_NR_PAGES) *
337 sizeof(struct page));
Tejun Heo126b3fc2009-10-02 13:28:55 +0900338 VMALLOC_END -= map_size;
339 vmem_map = (struct page *) VMALLOC_END;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700340 efi_memmap_walk(create_mem_map_page_table, NULL);
341
Mel Gorman05e0caa2006-09-27 01:49:54 -0700342 /*
343 * alloc_node_mem_map makes an adjustment for mem_map
344 * which isn't compatible with vmem_map.
345 */
346 NODE_DATA(0)->node_mem_map = vmem_map +
347 find_min_pfn_with_active_regions();
348 free_area_init_nodes(max_zone_pfns);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349
350 printk("Virtual mem_map starts at 0x%p\n", mem_map);
351 }
352#else /* !CONFIG_VIRTUAL_MEM_MAP */
Tejun Heo98e4ae82011-12-08 10:22:08 -0800353 memblock_add_node(0, PFN_PHYS(max_low_pfn), 0);
Mel Gorman05e0caa2006-09-27 01:49:54 -0700354 free_area_init_nodes(max_zone_pfns);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700355#endif /* !CONFIG_VIRTUAL_MEM_MAP */
356 zero_page_memmap_ptr = virt_to_page(ia64_imva(empty_zero_page));
357}