blob: bea8ae77d0599831ff17eb22cd35dc4a603b3279 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
Linus Torvalds1da177e2005-04-16 15:20:36 -07002 * Copyright (C) 1995 Linus Torvalds
3 *
4 * Support of BIGMEM added by Gerhard Wichert, Siemens AG, July 1999
5 *
6 * Memory region support
7 * David Parsons <orc@pell.chi.il.us>, July-August 1999
8 *
9 * Added E820 sanitization routine (removes overlapping memory regions);
10 * Brian Moyle <bmoyle@mvista.com>, February 2001
11 *
12 * Moved CPU detection code to cpu/${cpu}.c
13 * Patrick Mochel <mochel@osdl.org>, March 2002
14 *
15 * Provisions for empty E820 memory regions (reported by certain BIOSes).
16 * Alex Achenbach <xela@slit.de>, December 2002.
17 *
18 */
19
20/*
21 * This file handles the architecture-dependent parts of initialization
22 */
23
24#include <linux/sched.h>
25#include <linux/mm.h>
Andy Whitcroft05b79bd2005-06-23 00:07:57 -070026#include <linux/mmzone.h>
Jon Smirl894673e2006-07-10 04:44:13 -070027#include <linux/screen_info.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070028#include <linux/ioport.h>
29#include <linux/acpi.h>
30#include <linux/apm_bios.h>
31#include <linux/initrd.h>
32#include <linux/bootmem.h>
33#include <linux/seq_file.h>
34#include <linux/console.h>
35#include <linux/mca.h>
36#include <linux/root_dev.h>
37#include <linux/highmem.h>
38#include <linux/module.h>
39#include <linux/efi.h>
40#include <linux/init.h>
41#include <linux/edd.h>
Konrad Rzeszutek138fe4e2008-04-09 19:50:41 -070042#include <linux/iscsi_ibft.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070043#include <linux/nodemask.h>
Eric W. Biederman1bc3b912005-06-25 14:58:01 -070044#include <linux/kexec.h>
Andi Kleene9928672006-01-11 22:43:33 +010045#include <linux/dmi.h>
Dave Hansen22a98352006-03-27 01:16:04 -080046#include <linux/pfn.h>
Thomas Gleixner376ff032008-01-30 13:30:16 +010047#include <linux/pci.h>
Yinghai Lu46d671b2008-06-25 17:51:29 -070048#include <asm/pci-direct.h>
Bernhard Kaindlf212ec42008-01-30 13:34:11 +010049#include <linux/init_ohci1394_dma.h>
Glauber de Oliveira Costa790c73f2008-02-15 17:52:48 -020050#include <linux/kvm_para.h>
Eric W. Biederman1bc3b912005-06-25 14:58:01 -070051
Yinghai Lu46d671b2008-06-25 17:51:29 -070052#include <linux/errno.h>
53#include <linux/kernel.h>
54#include <linux/stddef.h>
55#include <linux/unistd.h>
56#include <linux/ptrace.h>
57#include <linux/slab.h>
58#include <linux/user.h>
59#include <linux/delay.h>
60#include <linux/highmem.h>
61
62#include <linux/kallsyms.h>
63#include <linux/edd.h>
64#include <linux/iscsi_ibft.h>
65#include <linux/kexec.h>
66#include <linux/cpufreq.h>
67#include <linux/dma-mapping.h>
68#include <linux/ctype.h>
69#include <linux/uaccess.h>
70
71#include <linux/percpu.h>
72#include <linux/crash_dump.h>
73
Linus Torvalds1da177e2005-04-16 15:20:36 -070074#include <video/edid.h>
Eric W. Biederman1bc3b912005-06-25 14:58:01 -070075
Yinghai Lu093af8d2008-01-30 13:33:32 +010076#include <asm/mtrr.h>
Eric W. Biederman9635b472005-06-25 14:57:41 -070077#include <asm/apic.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070078#include <asm/e820.h>
79#include <asm/mpspec.h>
80#include <asm/setup.h>
81#include <asm/arch_hooks.h>
Yinghai Lu55f26232008-06-25 17:54:23 -070082#include <asm/efi.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070083#include <asm/sections.h>
Yinghai Lu1c6e5502008-06-17 15:41:45 -070084#include <asm/dmi.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070085#include <asm/io_apic.h>
86#include <asm/ist.h>
Zachary Amsden7ce0bcf2007-02-13 13:26:21 +010087#include <asm/vmi.h>
Jeremy Fitzhardingee75eac32006-06-25 05:46:50 -070088#include <setup_arch.h>
Alexey Starikovskiyce3fe6b2008-03-17 22:08:17 +030089#include <asm/bios_ebda.h>
Bernhard Walle00bf4092007-10-21 16:42:01 -070090#include <asm/cacheflush.h>
Alexander van Heukelum2fde61f2008-03-04 19:57:42 +010091#include <asm/processor.h>
Yinghai Lucc9f7a02008-06-16 16:11:08 -070092#include <asm/bugs.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070093
Yinghai Lu46d671b2008-06-25 17:51:29 -070094#include <asm/system.h>
95#include <asm/vsyscall.h>
96#include <asm/smp.h>
97#include <asm/desc.h>
98#include <asm/dma.h>
99#include <asm/gart.h>
100#include <asm/mmu_context.h>
101#include <asm/proto.h>
102
103#include <mach_apic.h>
Yinghai Lu46d671b2008-06-25 17:51:29 -0700104#include <asm/paravirt.h>
Yinghai Lu46d671b2008-06-25 17:51:29 -0700105
106#include <asm/percpu.h>
107#include <asm/sections.h>
108#include <asm/topology.h>
109#include <asm/apicdef.h>
Yinghai Lu55f26232008-06-25 17:54:23 -0700110#ifdef CONFIG_X86_64
111#include <asm/numa_64.h>
112#endif
Yinghai Lu46d671b2008-06-25 17:51:29 -0700113
Yinghai Lu042623b2008-06-25 19:52:15 -0700114#ifndef ARCH_SETUP
115#define ARCH_SETUP
116#endif
117
Yinghai Lu217b8ce2008-06-25 17:55:20 -0700118#ifndef CONFIG_DEBUG_BOOT_PARAMS
119struct boot_params __initdata boot_params;
120#else
121struct boot_params boot_params;
122#endif
123
Linus Torvalds1da177e2005-04-16 15:20:36 -0700124/*
125 * Machine setup..
126 */
Bernhard Wallec9cce832008-01-30 13:30:32 +0100127static struct resource data_resource = {
128 .name = "Kernel data",
129 .start = 0,
130 .end = 0,
131 .flags = IORESOURCE_BUSY | IORESOURCE_MEM
132};
133
134static struct resource code_resource = {
135 .name = "Kernel code",
136 .start = 0,
137 .end = 0,
138 .flags = IORESOURCE_BUSY | IORESOURCE_MEM
139};
140
141static struct resource bss_resource = {
142 .name = "Kernel bss",
143 .start = 0,
144 .end = 0,
145 .flags = IORESOURCE_BUSY | IORESOURCE_MEM
146};
147
Yinghai Lu7dea23e2008-06-25 17:50:06 -0700148
149#ifdef CONFIG_X86_32
Yinghai Lu50923012008-06-25 18:02:06 -0700150/* This value is set up by the early boot code to point to the value
151 immediately after the boot time page tables. It contains a *physical*
152 address, and must not be in the .bss segment! */
153unsigned long init_pg_tables_start __initdata = ~0UL;
154unsigned long init_pg_tables_end __initdata = ~0UL;
155
Bernhard Wallec9cce832008-01-30 13:30:32 +0100156static struct resource video_ram_resource = {
157 .name = "Video RAM area",
158 .start = 0xa0000,
159 .end = 0xbffff,
160 .flags = IORESOURCE_BUSY | IORESOURCE_MEM
161};
162
Linus Torvalds1da177e2005-04-16 15:20:36 -0700163/* cpu data as detected by the assembly code in head.S */
Yinghai Lu7dea23e2008-06-25 17:50:06 -0700164struct cpuinfo_x86 new_cpu_data __cpuinitdata = {0, 0, 0, 0, -1, 1, 0, 0, -1};
Linus Torvalds1da177e2005-04-16 15:20:36 -0700165/* common cpu data for all cpus */
Yinghai Lu7dea23e2008-06-25 17:50:06 -0700166struct cpuinfo_x86 boot_cpu_data __read_mostly = {0, 0, 0, 0, -1, 1, 0, 0, -1};
Alexey Dobriyan129f6942005-06-23 00:08:33 -0700167EXPORT_SYMBOL(boot_cpu_data);
Yinghai Lu7dea23e2008-06-25 17:50:06 -0700168static void set_mca_bus(int x)
169{
170#ifdef CONFIG_MCA
171 MCA_bus = x;
172#endif
173}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700174
Alexey Starikovskiy0c254e32008-03-27 23:55:04 +0300175unsigned int def_to_bigsmp;
176
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177/* for MCA, but anyone else can use it if they want */
178unsigned int machine_id;
179unsigned int machine_submodel_id;
180unsigned int BIOS_revision;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700181
Yinghai Lu7dea23e2008-06-25 17:50:06 -0700182struct apm_info apm_info;
183EXPORT_SYMBOL(apm_info);
184
185#if defined(CONFIG_X86_SPEEDSTEP_SMI) || \
186 defined(CONFIG_X86_SPEEDSTEP_SMI_MODULE)
187struct ist_info ist_info;
188EXPORT_SYMBOL(ist_info);
189#else
190struct ist_info ist_info;
191#endif
192
193#else
194struct cpuinfo_x86 boot_cpu_data __read_mostly;
195EXPORT_SYMBOL(boot_cpu_data);
196#endif
197
198
/* Starts out as X86_CR4_PAE only for PAE builds that are not 64-bit. */
#if defined(CONFIG_X86_PAE) && !defined(CONFIG_X86_64)
unsigned long mmu_cr4_features = X86_CR4_PAE;
#else
unsigned long mmu_cr4_features;
#endif
204
Linus Torvalds1da177e2005-04-16 15:20:36 -0700205/* Boot loader ID as an integer, for the benefit of proc_dointvec */
206int bootloader_type;
207
Linus Torvalds1da177e2005-04-16 15:20:36 -0700208/*
Yinghai Lu1c6e5502008-06-17 15:41:45 -0700209 * Early DMI memory
210 */
211int dmi_alloc_index;
212char dmi_alloc_data[DMI_MAX_DATA];
213
214/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700215 * Setup options
216 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217struct screen_info screen_info;
Alexey Dobriyan129f6942005-06-23 00:08:33 -0700218EXPORT_SYMBOL(screen_info);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700219struct edid_info edid_info;
Antonino A. Daplas5e518d72005-09-09 13:04:34 -0700220EXPORT_SYMBOL_GPL(edid_info);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700221
Linus Torvalds1da177e2005-04-16 15:20:36 -0700222extern int root_mountflags;
223
Pavel Macheke44b7b72008-04-10 23:28:10 +0200224unsigned long saved_video_mode;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700225
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100226#define RAMDISK_IMAGE_START_MASK 0x07FF
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227#define RAMDISK_PROMPT_FLAG 0x8000
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100228#define RAMDISK_LOAD_FLAG 0x4000
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229
Alon Bar-Lev4e498b62007-02-12 00:54:11 -0800230static char __initdata command_line[COMMAND_LINE_SIZE];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700231
#if defined(CONFIG_EDD) || defined(CONFIG_EDD_MODULE)
struct edd edd;
#ifdef CONFIG_EDD_MODULE
EXPORT_SYMBOL(edd);
#endif
/**
 * copy_edd() - Copy the BIOS EDD information
 *              from boot_params into a safe place.
 *
 * Both the entry counts and the raw buffers are copied into the
 * global edd structure.
 */
static inline void copy_edd(void)
{
	edd.mbr_signature_nr = boot_params.edd_mbr_sig_buf_entries;
	edd.edd_info_nr = boot_params.eddbuf_entries;

	memcpy(edd.edd_info, boot_params.eddbuf, sizeof(edd.edd_info));
	memcpy(edd.mbr_signature, boot_params.edd_mbr_sig_buffer,
	       sizeof(edd.mbr_signature));
}
#else
/* No EDD support configured: nothing to copy. */
static inline void copy_edd(void)
{
}
#endif
255
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100256#ifdef CONFIG_BLK_DEV_INITRD
257
Yinghai Lueb1379c2008-06-25 17:49:26 -0700258#ifdef CONFIG_X86_32
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100259
Yinghai Lueb1379c2008-06-25 17:49:26 -0700260#define MAX_MAP_CHUNK (NR_FIX_BTMAPS << PAGE_SHIFT)
261static void __init relocate_initrd(void)
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100262{
Yinghai Lueb1379c2008-06-25 17:49:26 -0700263
Yinghai Luba5b14cc2008-05-21 18:40:18 -0700264 u64 ramdisk_image = boot_params.hdr.ramdisk_image;
265 u64 ramdisk_size = boot_params.hdr.ramdisk_size;
Yinghai Luba5b14cc2008-05-21 18:40:18 -0700266 u64 end_of_lowmem = max_low_pfn << PAGE_SHIFT;
267 u64 ramdisk_here;
Yinghai Lueb1379c2008-06-25 17:49:26 -0700268 unsigned long slop, clen, mapaddr;
269 char *p, *q;
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100270
271 /* We need to move the initrd down into lowmem */
Yinghai Lu4e296842008-06-24 12:18:14 -0700272 ramdisk_here = find_e820_area(0, end_of_lowmem, ramdisk_size,
273 PAGE_SIZE);
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100274
Yinghai Lu3945e2c2008-05-25 10:00:09 -0700275 if (ramdisk_here == -1ULL)
276 panic("Cannot find place for new RAMDISK of size %lld\n",
277 ramdisk_size);
278
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100279 /* Note: this includes all the lowmem currently occupied by
280 the initrd, we rely on that fact to keep the data intact. */
Yinghai Lu3945e2c2008-05-25 10:00:09 -0700281 reserve_early(ramdisk_here, ramdisk_here + ramdisk_size,
Yinghai Luba5b14cc2008-05-21 18:40:18 -0700282 "NEW RAMDISK");
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100283 initrd_start = ramdisk_here + PAGE_OFFSET;
284 initrd_end = initrd_start + ramdisk_size;
Yinghai Luf0d43102008-05-29 12:56:36 -0700285 printk(KERN_INFO "Allocated new RAMDISK: %08llx - %08llx\n",
286 ramdisk_here, ramdisk_here + ramdisk_size);
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100287
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100288 q = (char *)initrd_start;
289
290 /* Copy any lowmem portion of the initrd */
291 if (ramdisk_image < end_of_lowmem) {
292 clen = end_of_lowmem - ramdisk_image;
293 p = (char *)__va(ramdisk_image);
294 memcpy(q, p, clen);
295 q += clen;
296 ramdisk_image += clen;
297 ramdisk_size -= clen;
298 }
299
300 /* Copy the highmem portion of the initrd */
301 while (ramdisk_size) {
302 slop = ramdisk_image & ~PAGE_MASK;
303 clen = ramdisk_size;
304 if (clen > MAX_MAP_CHUNK-slop)
305 clen = MAX_MAP_CHUNK-slop;
306 mapaddr = ramdisk_image & PAGE_MASK;
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100307 p = early_ioremap(mapaddr, clen+slop);
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100308 memcpy(q, p+slop, clen);
Huang, Yingbeacfaa2008-01-30 13:33:44 +0100309 early_iounmap(p, clen+slop);
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100310 q += clen;
311 ramdisk_image += clen;
312 ramdisk_size -= clen;
313 }
Yinghai Lua4c81cf2008-05-18 01:18:57 -0700314 /* high pages is not converted by early_res_to_bootmem */
Yinghai Luba5b14cc2008-05-21 18:40:18 -0700315 ramdisk_image = boot_params.hdr.ramdisk_image;
316 ramdisk_size = boot_params.hdr.ramdisk_size;
Yinghai Lueb1379c2008-06-25 17:49:26 -0700317 printk(KERN_INFO "Move RAMDISK from %016llx - %016llx to"
318 " %08llx - %08llx\n",
Yinghai Luba5b14cc2008-05-21 18:40:18 -0700319 ramdisk_image, ramdisk_image + ramdisk_size - 1,
320 ramdisk_here, ramdisk_here + ramdisk_size - 1);
Yinghai Lueb1379c2008-06-25 17:49:26 -0700321}
322#endif
Yinghai Lu9a27f5c2008-06-13 20:07:03 -0700323
Yinghai Lueb1379c2008-06-25 17:49:26 -0700324static void __init reserve_initrd(void)
325{
326 u64 ramdisk_image = boot_params.hdr.ramdisk_image;
327 u64 ramdisk_size = boot_params.hdr.ramdisk_size;
328 u64 ramdisk_end = ramdisk_image + ramdisk_size;
329 u64 end_of_lowmem = max_low_pfn << PAGE_SHIFT;
330
331 if (!boot_params.hdr.type_of_loader ||
332 !ramdisk_image || !ramdisk_size)
333 return; /* No initrd provided by bootloader */
334
335 initrd_start = 0;
336
337 if (ramdisk_size >= (end_of_lowmem>>1)) {
338 free_early(ramdisk_image, ramdisk_end);
339 printk(KERN_ERR "initrd too large to handle, "
340 "disabling initrd\n");
341 return;
342 }
343
344 printk(KERN_INFO "RAMDISK: %08llx - %08llx\n", ramdisk_image,
345 ramdisk_end);
346
347
348 if (ramdisk_end <= end_of_lowmem) {
349 /* All in lowmem, easy case */
350 /*
351 * don't need to reserve again, already reserved early
352 * in i386_start_kernel
353 */
354 initrd_start = ramdisk_image + PAGE_OFFSET;
355 initrd_end = initrd_start + ramdisk_size;
356 return;
357 }
358
359#ifdef CONFIG_X86_32
360 relocate_initrd();
361#else
362 printk(KERN_ERR "initrd extends beyond end of memory "
363 "(0x%08llx > 0x%08llx)\ndisabling initrd\n",
364 ramdisk_end, end_of_lowmem);
365 initrd_start = 0;
366#endif
367 free_early(ramdisk_image, ramdisk_end);
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100368}
Yinghai Lu225c37d2008-06-22 02:46:58 -0700369#else
Yinghai Lueb1379c2008-06-25 17:49:26 -0700370static void __init reserve_initrd(void)
Yinghai Lu225c37d2008-06-22 02:46:58 -0700371{
372}
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100373#endif /* CONFIG_BLK_DEV_INITRD */
374
Yinghai Lu29f784e2008-06-25 18:00:22 -0700375static void __init parse_setup_data(void)
Yinghai Lu257b0fd2008-06-25 17:56:22 -0700376{
377 struct setup_data *data;
378 u64 pa_data;
379
380 if (boot_params.hdr.version < 0x0209)
381 return;
382 pa_data = boot_params.hdr.setup_data;
383 while (pa_data) {
384 data = early_ioremap(pa_data, PAGE_SIZE);
385 switch (data->type) {
386 case SETUP_E820_EXT:
387 parse_e820_ext(data, pa_data);
388 break;
389 default:
390 break;
391 }
Yinghai Lu257b0fd2008-06-25 17:56:22 -0700392 pa_data = data->next;
393 early_iounmap(data, PAGE_SIZE);
394 }
395}
396
Yinghai Lua0a0bec2008-07-03 11:37:13 -0700397static void __init e820_reserve_setup_data(void)
Yinghai Lu28bb2232008-06-30 16:20:54 -0700398{
399 struct setup_data *data;
400 u64 pa_data;
Yinghai Lud9a81b42008-07-01 20:04:10 -0700401 int found = 0;
Yinghai Lu28bb2232008-06-30 16:20:54 -0700402
403 if (boot_params.hdr.version < 0x0209)
404 return;
405 pa_data = boot_params.hdr.setup_data;
406 while (pa_data) {
407 data = early_ioremap(pa_data, sizeof(*data));
Yinghai Lu28bb2232008-06-30 16:20:54 -0700408 e820_update_range(pa_data, sizeof(*data)+data->len,
409 E820_RAM, E820_RESERVED_KERN);
Yinghai Lud9a81b42008-07-01 20:04:10 -0700410 found = 1;
Yinghai Lu28bb2232008-06-30 16:20:54 -0700411 pa_data = data->next;
412 early_iounmap(data, sizeof(*data));
413 }
Yinghai Lud9a81b42008-07-01 20:04:10 -0700414 if (!found)
415 return;
416
Yinghai Lu28bb2232008-06-30 16:20:54 -0700417 sanitize_e820_map(e820.map, ARRAY_SIZE(e820.map), &e820.nr_map);
Yinghai Lua0a0bec2008-07-03 11:37:13 -0700418 memcpy(&e820_saved, &e820, sizeof(struct e820map));
Yinghai Lu28bb2232008-06-30 16:20:54 -0700419 printk(KERN_INFO "extended physical RAM map:\n");
420 e820_print_map("reserve setup_data");
421}
422
Yinghai Lua0a0bec2008-07-03 11:37:13 -0700423static void __init reserve_early_setup_data(void)
424{
425 struct setup_data *data;
426 u64 pa_data;
427 char buf[32];
428
429 if (boot_params.hdr.version < 0x0209)
430 return;
431 pa_data = boot_params.hdr.setup_data;
432 while (pa_data) {
433 data = early_ioremap(pa_data, sizeof(*data));
434 sprintf(buf, "setup data %x", data->type);
435 reserve_early(pa_data, pa_data+sizeof(*data)+data->len, buf);
436 pa_data = data->next;
437 early_iounmap(data, sizeof(*data));
438 }
439}
440
Linus Torvalds1da177e2005-04-16 15:20:36 -0700441/*
Yinghai Luccb4def2008-06-25 17:57:13 -0700442 * --------- Crashkernel reservation ------------------------------
443 */
444
445#ifdef CONFIG_KEXEC
Bernhard Walle32105f72008-06-26 21:54:08 +0200446
447/**
448 * Reserve @size bytes of crashkernel memory at any suitable offset.
449 *
450 * @size: Size of the crashkernel memory to reserve.
451 * Returns the base address on success, and -1ULL on failure.
452 */
453unsigned long long find_and_reserve_crashkernel(unsigned long long size)
454{
455 const unsigned long long alignment = 16<<20; /* 16M */
456 unsigned long long start = 0LL;
457
458 while (1) {
459 int ret;
460
461 start = find_e820_area(start, ULONG_MAX, size, alignment);
462 if (start == -1ULL)
463 return start;
464
465 /* try to reserve it */
466 ret = reserve_bootmem_generic(start, size, BOOTMEM_EXCLUSIVE);
467 if (ret >= 0)
468 return start;
469
470 start += alignment;
471 }
472}
473
Yinghai Luccb4def2008-06-25 17:57:13 -0700474static inline unsigned long long get_total_mem(void)
475{
476 unsigned long long total;
477
478 total = max_low_pfn - min_low_pfn;
479#ifdef CONFIG_HIGHMEM
480 total += highend_pfn - highstart_pfn;
481#endif
482
483 return total << PAGE_SHIFT;
484}
485
Yinghai Lu29f784e2008-06-25 18:00:22 -0700486static void __init reserve_crashkernel(void)
Yinghai Luccb4def2008-06-25 17:57:13 -0700487{
488 unsigned long long total_mem;
489 unsigned long long crash_size, crash_base;
490 int ret;
491
492 total_mem = get_total_mem();
493
494 ret = parse_crashkernel(boot_command_line, total_mem,
495 &crash_size, &crash_base);
Bernhard Walle32105f72008-06-26 21:54:08 +0200496 if (ret != 0 || crash_size <= 0)
497 return;
498
499 /* 0 means: find the address automatically */
500 if (crash_base <= 0) {
501 crash_base = find_and_reserve_crashkernel(crash_size);
502 if (crash_base == -1ULL) {
503 pr_info("crashkernel reservation failed. "
504 "No suitable area found.\n");
Yinghai Luccb4def2008-06-25 17:57:13 -0700505 return;
506 }
Bernhard Walle32105f72008-06-26 21:54:08 +0200507 } else {
508 ret = reserve_bootmem_generic(crash_base, crash_size,
509 BOOTMEM_EXCLUSIVE);
510 if (ret < 0) {
511 pr_info("crashkernel reservation failed - "
512 "memory is in use\n");
Yinghai Luccb4def2008-06-25 17:57:13 -0700513 return;
514 }
Yinghai Luccb4def2008-06-25 17:57:13 -0700515 }
Bernhard Walle32105f72008-06-26 21:54:08 +0200516
517 printk(KERN_INFO "Reserving %ldMB of memory at %ldMB "
518 "for crashkernel (System RAM: %ldMB)\n",
519 (unsigned long)(crash_size >> 20),
520 (unsigned long)(crash_base >> 20),
521 (unsigned long)(total_mem >> 20));
522
523 crashk_res.start = crash_base;
524 crashk_res.end = crash_base + crash_size - 1;
525 insert_resource(&iomem_resource, &crashk_res);
Yinghai Luccb4def2008-06-25 17:57:13 -0700526}
527#else
Yinghai Lu29f784e2008-06-25 18:00:22 -0700528static void __init reserve_crashkernel(void)
Yinghai Luccb4def2008-06-25 17:57:13 -0700529{
530}
531#endif
532
Yinghai Lubdba0e72008-06-25 17:58:02 -0700533static struct resource standard_io_resources[] = {
534 { .name = "dma1", .start = 0x00, .end = 0x1f,
535 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
536 { .name = "pic1", .start = 0x20, .end = 0x21,
537 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
538 { .name = "timer0", .start = 0x40, .end = 0x43,
539 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
540 { .name = "timer1", .start = 0x50, .end = 0x53,
541 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
542 { .name = "keyboard", .start = 0x60, .end = 0x60,
543 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
544 { .name = "keyboard", .start = 0x64, .end = 0x64,
545 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
546 { .name = "dma page reg", .start = 0x80, .end = 0x8f,
547 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
548 { .name = "pic2", .start = 0xa0, .end = 0xa1,
549 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
550 { .name = "dma2", .start = 0xc0, .end = 0xdf,
551 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
552 { .name = "fpu", .start = 0xf0, .end = 0xff,
553 .flags = IORESOURCE_BUSY | IORESOURCE_IO }
554};
555
Yinghai Lu29f784e2008-06-25 18:00:22 -0700556static void __init reserve_standard_io_resources(void)
Yinghai Lubdba0e72008-06-25 17:58:02 -0700557{
558 int i;
559
560 /* request I/O space for devices used on all i[345]86 PCs */
561 for (i = 0; i < ARRAY_SIZE(standard_io_resources); i++)
562 request_resource(&ioport_resource, &standard_io_resources[i]);
563
564}
565
Yinghai Lu0196bcb2008-06-25 17:58:55 -0700566#ifdef CONFIG_PROC_VMCORE
567/* elfcorehdr= specifies the location of elf core header
568 * stored by the crashed kernel. This option will be passed
569 * by kexec loader to the capture kernel.
570 */
571static int __init setup_elfcorehdr(char *arg)
572{
573 char *end;
574 if (!arg)
575 return -EINVAL;
576 elfcorehdr_addr = memparse(arg, &end);
577 return end > arg ? 0 : -EINVAL;
578}
579early_param("elfcorehdr", setup_elfcorehdr);
580#endif
581
/*
 * Determine if we were loaded by an EFI loader.  If so, then we have also been
 * passed the EFI memmap, systab, etc., so we should use these data structures
 * for initialization.  Note that the EFI init code path is selected by the
 * global efi_enabled.  This allows the same kernel image to be used on existing
 * systems (with a traditional BIOS) as well as on EFI systems.
 */
Yinghai Lu76934ed2008-06-25 17:52:35 -0700589/*
 * setup_arch - architecture-specific boot-time initializations
 *
 * @cmdline_p: on return, *cmdline_p points at this file's private copy
 *             (command_line) of boot_command_line.
 *
 * The steps below are order-dependent; several of the existing comments
 * state what must run before or after what.
 *
 * Note: On x86_64, fixmaps are ready for use even before this is called.
 */
594
Linus Torvalds1da177e2005-04-16 15:20:36 -0700595void __init setup_arch(char **cmdline_p)
596{
Yinghai Lu76934ed2008-06-25 17:52:35 -0700597#ifdef CONFIG_X86_32
 /* 32-bit: seed boot_cpu_data from new_cpu_data before early CPU init */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700598 memcpy(&boot_cpu_data, &new_cpu_data, sizeof(new_cpu_data));
599 pre_setup_arch_hook();
600 early_cpu_init();
Yinghai Lu76934ed2008-06-25 17:52:35 -0700601#else
602 printk(KERN_INFO "Command line: %s\n", boot_command_line);
603#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700604
Jeremy Fitzhardinge1a98fd12008-06-29 20:02:44 -0700605 early_ioremap_init();
606
 /* Copy the fields we need out of boot_params into kernel globals */
H. Peter Anvin30c82642007-10-15 17:13:22 -0700607 ROOT_DEV = old_decode_dev(boot_params.hdr.root_dev);
608 screen_info = boot_params.screen_info;
609 edid_info = boot_params.edid_info;
Yinghai Lu76934ed2008-06-25 17:52:35 -0700610#ifdef CONFIG_X86_32
H. Peter Anvin30c82642007-10-15 17:13:22 -0700611 apm_info.bios = boot_params.apm_bios_info;
612 ist_info = boot_params.ist_info;
Yinghai Lu76934ed2008-06-25 17:52:35 -0700613 if (boot_params.sys_desc_table.length != 0) {
H. Peter Anvin30c82642007-10-15 17:13:22 -0700614 set_mca_bus(boot_params.sys_desc_table.table[3] & 0x2);
615 machine_id = boot_params.sys_desc_table.table[0];
616 machine_submodel_id = boot_params.sys_desc_table.table[1];
617 BIOS_revision = boot_params.sys_desc_table.table[2];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700618 }
Yinghai Lu76934ed2008-06-25 17:52:35 -0700619#endif
620 saved_video_mode = boot_params.hdr.vid_mode;
H. Peter Anvin30c82642007-10-15 17:13:22 -0700621 bootloader_type = boot_params.hdr.type_of_loader;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700622
623#ifdef CONFIG_BLK_DEV_RAM
 /* boot_params.hdr.ram_size packs the image start plus two flag bits */
H. Peter Anvin30c82642007-10-15 17:13:22 -0700624 rd_image_start = boot_params.hdr.ram_size & RAMDISK_IMAGE_START_MASK;
625 rd_prompt = ((boot_params.hdr.ram_size & RAMDISK_PROMPT_FLAG) != 0);
626 rd_doload = ((boot_params.hdr.ram_size & RAMDISK_LOAD_FLAG) != 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700627#endif
Yinghai Lu74652522008-06-23 19:53:33 -0700628#ifdef CONFIG_EFI
 /* An EFI boot is recognised by the 4-byte loader signature "EL32"/"EL64" */
629 if (!strncmp((char *)&boot_params.efi_info.efi_loader_signature,
Yinghai Lu76934ed2008-06-25 17:52:35 -0700630#ifdef CONFIG_X86_32
631 "EL32",
632#else
633 "EL64",
634#endif
635 4)) {
Yinghai Lu74652522008-06-23 19:53:33 -0700636 efi_enabled = 1;
637 efi_reserve_early();
638 }
639#endif
640
Linus Torvalds1da177e2005-04-16 15:20:36 -0700641 ARCH_SETUP
Huang, Ying2215e692008-01-30 13:31:19 +0100642
Alexander van Heukelum0dbfafa2008-04-23 15:09:05 +0200643 setup_memory_map();
Yinghai Lu28bb2232008-06-30 16:20:54 -0700644 parse_setup_data();
Yinghai Lua0a0bec2008-07-03 11:37:13 -0700645 /* update the e820_saved too */
646 e820_reserve_setup_data();
Yinghai Lu28bb2232008-06-30 16:20:54 -0700647
Linus Torvalds1da177e2005-04-16 15:20:36 -0700648 copy_edd();
649
H. Peter Anvin30c82642007-10-15 17:13:22 -0700650 if (!boot_params.hdr.root_flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700651 root_mountflags &= ~MS_RDONLY;
 /* Describe the kernel image in init_mm and in the code/data/bss resources */
652 init_mm.start_code = (unsigned long) _text;
653 init_mm.end_code = (unsigned long) _etext;
654 init_mm.end_data = (unsigned long) _edata;
Yinghai Lu76934ed2008-06-25 17:52:35 -0700655#ifdef CONFIG_X86_32
Linus Torvalds1da177e2005-04-16 15:20:36 -0700656 init_mm.brk = init_pg_tables_end + PAGE_OFFSET;
Yinghai Lu76934ed2008-06-25 17:52:35 -0700657#else
658 init_mm.brk = (unsigned long) &_end;
659#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700660
661 code_resource.start = virt_to_phys(_text);
662 code_resource.end = virt_to_phys(_etext)-1;
663 data_resource.start = virt_to_phys(_etext);
664 data_resource.end = virt_to_phys(_edata)-1;
Bernhard Walle00bf4092007-10-21 16:42:01 -0700665 bss_resource.start = virt_to_phys(&__bss_start);
666 bss_resource.end = virt_to_phys(&__bss_stop)-1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700667
Yinghai Lu76934ed2008-06-25 17:52:35 -0700668#ifdef CONFIG_X86_64
669 early_cpu_init();
670#endif
 /* Hand the caller a private copy of the boot command line */
Yinghai Lu9a2e5932008-06-23 19:54:23 -0700671 strlcpy(command_line, boot_command_line, COMMAND_LINE_SIZE);
672 *cmdline_p = command_line;
673
Rusty Russell1a3f2392006-09-26 10:52:32 +0200674 parse_early_param();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700675
Yinghai Lu28bb2232008-06-30 16:20:54 -0700676 /* after early param, so could get panic from serial */
Yinghai Lua0a0bec2008-07-03 11:37:13 -0700677 reserve_early_setup_data();
Yinghai Lu28bb2232008-06-30 16:20:54 -0700678
 /* When acpi_mps_check() returns non-zero the APIC is turned off */
Yinghai Lu76934ed2008-06-25 17:52:35 -0700679 if (acpi_mps_check()) {
Ingo Molnar3eb11ed2008-06-23 22:19:22 +0200680#ifdef CONFIG_X86_LOCAL_APIC
Yinghai Lu76934ed2008-06-25 17:52:35 -0700681 disable_apic = 1;
682#endif
Yinghai Lu3c999f12008-06-20 16:11:20 -0700683 clear_cpu_cap(&boot_cpu_data, X86_FEATURE_APIC);
684 }
685
Alexander van Heukelum0dbfafa2008-04-23 15:09:05 +0200686 finish_e820_parsing();
Rusty Russell1a3f2392006-09-26 10:52:32 +0200687
Yinghai Lu76934ed2008-06-25 17:52:35 -0700688#ifdef CONFIG_X86_32
Yinghai Lu41c094f2008-06-16 13:03:31 -0700689 probe_roms();
Yinghai Lu76934ed2008-06-25 17:52:35 -0700690#endif
Yinghai Lu41c094f2008-06-16 13:03:31 -0700691
692 /* after parse_early_param, so could debug it */
693 insert_resource(&iomem_resource, &code_resource);
694 insert_resource(&iomem_resource, &data_resource);
695 insert_resource(&iomem_resource, &bss_resource);
696
Huang, Ying8b2cb7a2008-01-30 13:32:11 +0100697 if (efi_enabled)
698 efi_init();
699
Yinghai Lu76934ed2008-06-25 17:52:35 -0700700#ifdef CONFIG_X86_32
 /* On affected CPUs, retype 0x40000 bytes at 0x70000000 from RAM to reserved */
Yinghai Lucc9f7a02008-06-16 16:11:08 -0700701 if (ppro_with_ram_bug()) {
702 e820_update_range(0x70000000ULL, 0x40000ULL, E820_RAM,
703 E820_RESERVED);
704 sanitize_e820_map(e820.map, ARRAY_SIZE(e820.map), &e820.nr_map);
705 printk(KERN_INFO "fixed physical RAM map:\n");
706 e820_print_map("bad_ppro");
707 }
Yinghai Lu76934ed2008-06-25 17:52:35 -0700708#else
709 early_gart_iommu_check();
710#endif
Yinghai Lucc9f7a02008-06-16 16:11:08 -0700711
Yinghai Lu7b2a0a62008-06-03 19:35:04 -0700712 e820_register_active_regions(0, 0, -1UL);
713 /*
714 * partially used pages are not usable - thus
715 * we are rounding upwards:
716 */
717 max_pfn = e820_end_of_ram();
718
Yinghai Lu67807112008-06-08 19:53:26 -0700719 /* preallocate 4k for mptable mpc */
720 early_reserve_e820_mpc_new();
Yinghai Lu093af8d2008-01-30 13:33:32 +0100721 /* update e820 for memory not covered by WB MTRRs */
722 mtrr_bp_init();
 /* If trimming reports a change, redo the active regions and max_pfn */
Yinghai Lu7b2a0a62008-06-03 19:35:04 -0700723 if (mtrr_trim_uncached_memory(max_pfn)) {
724 remove_all_active_ranges();
725 e820_register_active_regions(0, 0, -1UL);
726 max_pfn = e820_end_of_ram();
727 }
Yinghai Lu76c324182008-03-23 00:16:49 -0700728
Yinghai Lu76934ed2008-06-25 17:52:35 -0700729#ifdef CONFIG_X86_32
Yinghai Lu4e296842008-06-24 12:18:14 -0700730 /* max_low_pfn get updated here */
Yinghai Lu2ec65f82008-06-23 03:05:30 -0700731 find_low_pfn_range();
Yinghai Lu76934ed2008-06-25 17:52:35 -0700732#else
733 num_physpages = max_pfn;
734
735 check_efer();
736
737 /* How many end-of-memory variables you have, grandma! */
738 /* need this before calling reserve_initrd */
739 max_low_pfn = max_pfn;
740 high_memory = (void *)__va(max_pfn * PAGE_SIZE - 1) + 1;
741#endif
Yinghai Lu2ec65f82008-06-23 03:05:30 -0700742
Yinghai Lu4e296842008-06-24 12:18:14 -0700743 /* max_pfn_mapped is updated here */
Yinghai Lub9d19f42008-06-26 00:44:56 -0700744 max_pfn_mapped = init_memory_mapping(0, (max_low_pfn << PAGE_SHIFT));
Yinghai Lu4e296842008-06-24 12:18:14 -0700745
Yinghai Lue7b37892008-06-25 21:51:28 -0700746 /*
747 * NOTE: On x86-32, only from this point on, fixmaps are ready for use.
748 */
749
750#ifdef CONFIG_PROVIDE_OHCI1394_DMA_INIT
751 if (init_ohci1394_dma_early)
752 init_ohci1394_dma_on_all_controllers();
753#endif
754
Yinghai Lu2ec65f82008-06-23 03:05:30 -0700755 reserve_initrd();
756
Yinghai Lu76934ed2008-06-25 17:52:35 -0700757#ifdef CONFIG_X86_64
758 vsmp_init();
759#endif
760
Yinghai Lu1c6e5502008-06-17 15:41:45 -0700761 dmi_scan_machine();
762
763 io_delay_init();
764
Yinghai Lu1c6e5502008-06-17 15:41:45 -0700765 /*
766 * Parse the ACPI tables for possible boot-time SMP configuration.
767 */
768 acpi_boot_table_init();
Yinghai Lu1c6e5502008-06-17 15:41:45 -0700769
Yinghai Lu76934ed2008-06-25 17:52:35 -0700770 /* Remove active ranges so rediscovery with NUMA-awareness happens */
771 remove_all_active_ranges();
Yinghai Lu76934ed2008-06-25 17:52:35 -0700772
Yinghai Lu1c6e5502008-06-17 15:41:45 -0700773#ifdef CONFIG_ACPI_NUMA
Yinghai Luf2f865f2008-06-25 17:53:22 -0700774 /*
775 * Parse SRAT to discover nodes.
776 */
777 acpi_numa_init();
Yinghai Lu1c6e5502008-06-17 15:41:45 -0700778#endif
779
Yinghai Lu2ec65f82008-06-23 03:05:30 -0700780 initmem_init(0, max_pfn);
Yinghai Lu093af8d2008-01-30 13:33:32 +0100781
Yinghai Lu76934ed2008-06-25 17:52:35 -0700782#ifdef CONFIG_X86_64
783 dma32_reserve_bootmem();
784#endif
785
Yinghai Lu593a0cc2008-06-17 10:02:45 -0700786#ifdef CONFIG_ACPI_SLEEP
787 /*
788 * Reserve low memory region for sleep support.
789 */
790 acpi_reserve_bootmem();
791#endif
Yinghai Lud1b20af2008-06-25 17:59:41 -0700792#ifdef CONFIG_X86_FIND_SMP_CONFIG
Yinghai Lu593a0cc2008-06-17 10:02:45 -0700793 /*
794 * Find and reserve possible boot-time SMP configuration:
795 */
796 find_smp_config();
797#endif
798 reserve_crashkernel();
799
800 reserve_ibft_region();
801
Glauber de Oliveira Costa790c73f2008-02-15 17:52:48 -0200802#ifdef CONFIG_KVM_CLOCK
803 kvmclock_init();
804#endif
805
Yinghai Lu76934ed2008-06-25 17:52:35 -0700806#if defined(CONFIG_VMI) && defined(CONFIG_X86_32)
Zachary Amsden7ce0bcf2007-02-13 13:26:21 +0100807 /*
808 * Must be after max_low_pfn is determined, and before kernel
809 * pagetables are setup.
810 */
811 vmi_init();
812#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700813
Linus Torvalds1da177e2005-04-16 15:20:36 -0700814 paging_init();
Bernhard Kaindlf212ec42008-01-30 13:34:11 +0100815
Yinghai Lu76934ed2008-06-25 17:52:35 -0700816#ifdef CONFIG_X86_64
817 map_vsyscall();
818#endif
819
Linus Torvalds1da177e2005-04-16 15:20:36 -0700820#ifdef CONFIG_X86_GENERICARCH
Rusty Russell1a3f2392006-09-26 10:52:32 +0200821 generic_apic_probe();
H. Peter Anvincf8fa922008-01-30 13:32:51 +0100822#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700823
Andi Kleen54ef3402007-10-19 20:35:03 +0200824 early_quirks();
Andy Curridd44647b2006-06-08 00:43:38 -0700825
Yinghai Lu295deae2008-06-23 19:55:05 -0700826 /*
827 * Read APIC and some other early information from ACPI tables.
828 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700829 acpi_boot_init();
Yinghai Lu04606612008-06-21 01:38:41 -0700830
Yinghai Lue0da3362008-06-08 18:29:22 -0700831#if defined(CONFIG_X86_MPPARSE) || defined(CONFIG_X86_VISWS)
Yinghai Lu295deae2008-06-23 19:55:05 -0700832 /*
833 * get boot-time SMP configuration:
834 */
Yinghai Lue0da3362008-06-08 18:29:22 -0700835 if (smp_found_config)
836 get_smp_config();
837#endif
Yinghai Lu76934ed2008-06-25 17:52:35 -0700838
Yinghai Lu329513a2008-07-02 18:54:40 -0700839 prefill_possible_map();
Yinghai Lu5f4765f2008-07-02 18:53:44 -0700840#ifdef CONFIG_X86_64
841 init_cpu_to_node();
842#endif
843
Yinghai Lu76934ed2008-06-25 17:52:35 -0700844 init_apic_mappings();
845 ioapic_init_mappings();
Yinghai Luf3294a32008-06-27 01:41:56 -0700846
847#if defined(CONFIG_SMP) && defined(CONFIG_X86_PC) && defined(CONFIG_X86_32)
Venkatesh Pallipadi911a62d2005-09-03 15:56:31 -0700848 if (def_to_bigsmp)
849 printk(KERN_WARNING "More than 8 CPUs detected and "
850 "CONFIG_X86_PC cannot handle it.\nUse "
851 "CONFIG_X86_GENERICARCH or CONFIG_X86_BIGSMP.\n");
852#endif
Yinghai Lu295deae2008-06-23 19:55:05 -0700853 kvm_guest_init();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700854
Yinghai Lu41c094f2008-06-16 13:03:31 -0700855 e820_reserve_resources();
Yinghai Lubf62f392008-05-20 20:10:58 -0700856 e820_mark_nosave_regions(max_low_pfn);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700857
Yinghai Lu76934ed2008-06-25 17:52:35 -0700858#ifdef CONFIG_X86_32
Yinghai Lu41c094f2008-06-16 13:03:31 -0700859 request_resource(&iomem_resource, &video_ram_resource);
Yinghai Lu76934ed2008-06-25 17:52:35 -0700860#endif
Yinghai Luce97c402008-06-21 20:22:09 -0700861 reserve_standard_io_resources();
Yinghai Lu41c094f2008-06-16 13:03:31 -0700862
863 e820_setup_gap();
864
Linus Torvalds1da177e2005-04-16 15:20:36 -0700865#ifdef CONFIG_VT
 /*
  * Default console: with CONFIG_VGA_CONSOLE, vga_con is chosen unless EFI
  * is enabled and reports 0xa0000 as conventional memory; otherwise, with
  * CONFIG_DUMMY_CONSOLE, dummy_con is used.
  */
866#if defined(CONFIG_VGA_CONSOLE)
867 if (!efi_enabled || (efi_mem_type(0xa0000) != EFI_CONVENTIONAL_MEMORY))
868 conswitchp = &vga_con;
869#elif defined(CONFIG_DUMMY_CONSOLE)
870 conswitchp = &dummy_con;
871#endif
872#endif
873}