x86: remove various unused subarch hooks
[linux-block.git] / arch / x86 / kernel / setup.c
CommitLineData
1da177e4 1/*
1da177e4
LT
2 * Copyright (C) 1995 Linus Torvalds
3 *
4 * Support of BIGMEM added by Gerhard Wichert, Siemens AG, July 1999
5 *
6 * Memory region support
7 * David Parsons <orc@pell.chi.il.us>, July-August 1999
8 *
9 * Added E820 sanitization routine (removes overlapping memory regions);
10 * Brian Moyle <bmoyle@mvista.com>, February 2001
11 *
12 * Moved CPU detection code to cpu/${cpu}.c
13 * Patrick Mochel <mochel@osdl.org>, March 2002
14 *
15 * Provisions for empty E820 memory regions (reported by certain BIOSes).
16 * Alex Achenbach <xela@slit.de>, December 2002.
17 *
18 */
19
20/*
21 * This file handles the architecture-dependent parts of initialization
22 */
23
24#include <linux/sched.h>
25#include <linux/mm.h>
05b79bdc 26#include <linux/mmzone.h>
894673ee 27#include <linux/screen_info.h>
1da177e4
LT
28#include <linux/ioport.h>
29#include <linux/acpi.h>
30#include <linux/apm_bios.h>
31#include <linux/initrd.h>
32#include <linux/bootmem.h>
33#include <linux/seq_file.h>
34#include <linux/console.h>
35#include <linux/mca.h>
36#include <linux/root_dev.h>
37#include <linux/highmem.h>
38#include <linux/module.h>
39#include <linux/efi.h>
40#include <linux/init.h>
41#include <linux/edd.h>
138fe4e0 42#include <linux/iscsi_ibft.h>
1da177e4 43#include <linux/nodemask.h>
1bc3b91a 44#include <linux/kexec.h>
e9928674 45#include <linux/dmi.h>
22a9835c 46#include <linux/pfn.h>
376ff035 47#include <linux/pci.h>
46d671b5 48#include <asm/pci-direct.h>
f212ec4b 49#include <linux/init_ohci1394_dma.h>
790c73f6 50#include <linux/kvm_para.h>
1bc3b91a 51
46d671b5
YL
52#include <linux/errno.h>
53#include <linux/kernel.h>
54#include <linux/stddef.h>
55#include <linux/unistd.h>
56#include <linux/ptrace.h>
57#include <linux/slab.h>
58#include <linux/user.h>
59#include <linux/delay.h>
46d671b5
YL
60
61#include <linux/kallsyms.h>
46d671b5
YL
62#include <linux/cpufreq.h>
63#include <linux/dma-mapping.h>
64#include <linux/ctype.h>
65#include <linux/uaccess.h>
66
67#include <linux/percpu.h>
68#include <linux/crash_dump.h>
69
1da177e4 70#include <video/edid.h>
1bc3b91a 71
093af8d7 72#include <asm/mtrr.h>
9635b47d 73#include <asm/apic.h>
1da177e4
LT
74#include <asm/e820.h>
75#include <asm/mpspec.h>
76#include <asm/setup.h>
77#include <asm/arch_hooks.h>
55f26239 78#include <asm/efi.h>
1da177e4 79#include <asm/sections.h>
1c6e5503 80#include <asm/dmi.h>
1da177e4
LT
81#include <asm/io_apic.h>
82#include <asm/ist.h>
7ce0bcfd 83#include <asm/vmi.h>
1164dd00 84#include <asm/setup_arch.h>
ce3fe6b2 85#include <asm/bios_ebda.h>
00bf4098 86#include <asm/cacheflush.h>
2fde61fd 87#include <asm/processor.h>
cc9f7a0c 88#include <asm/bugs.h>
1da177e4 89
46d671b5
YL
90#include <asm/system.h>
91#include <asm/vsyscall.h>
6e5385d4 92#include <asm/cpu.h>
46d671b5
YL
93#include <asm/desc.h>
94#include <asm/dma.h>
46a7fa27 95#include <asm/iommu.h>
1d9b16d1 96#include <asm/gart.h>
46d671b5
YL
97#include <asm/mmu_context.h>
98#include <asm/proto.h>
99
46d671b5 100#include <asm/paravirt.h>
88b094fb 101#include <asm/hypervisor.h>
46d671b5
YL
102
103#include <asm/percpu.h>
46d671b5
YL
104#include <asm/topology.h>
105#include <asm/apicdef.h>
55f26239
YL
106#ifdef CONFIG_X86_64
107#include <asm/numa_64.h>
108#endif
46d671b5 109
042623bb
YL
110#ifndef ARCH_SETUP
111#define ARCH_SETUP
112#endif
113
c0b5842a
IM
114unsigned int boot_cpu_id __read_mostly;
115
116#ifdef CONFIG_X86_64
/*
 * Out-of-line wrapper around __default_cpu_present_to_apicid(): forwards
 * @mps_cpu unchanged and returns the helper's result.
 */
int default_cpu_present_to_apicid(int mps_cpu)
{
	int apicid = __default_cpu_present_to_apicid(mps_cpu);

	return apicid;
}
121
/*
 * Out-of-line wrapper around __default_check_phys_apicid_present(): forwards
 * @boot_cpu_physical_apicid unchanged and returns the helper's result.
 */
int default_check_phys_apicid_present(int boot_cpu_physical_apicid)
{
	int present;

	present = __default_check_phys_apicid_present(boot_cpu_physical_apicid);
	return present;
}
126#endif
127
217b8ce8
YL
128#ifndef CONFIG_DEBUG_BOOT_PARAMS
129struct boot_params __initdata boot_params;
130#else
131struct boot_params boot_params;
132#endif
133
1da177e4
LT
134/*
135 * Machine setup..
136 */
c9cce83d
BW
137static struct resource data_resource = {
138 .name = "Kernel data",
139 .start = 0,
140 .end = 0,
141 .flags = IORESOURCE_BUSY | IORESOURCE_MEM
142};
143
144static struct resource code_resource = {
145 .name = "Kernel code",
146 .start = 0,
147 .end = 0,
148 .flags = IORESOURCE_BUSY | IORESOURCE_MEM
149};
150
151static struct resource bss_resource = {
152 .name = "Kernel bss",
153 .start = 0,
154 .end = 0,
155 .flags = IORESOURCE_BUSY | IORESOURCE_MEM
156};
157
7dea23ec
YL
158
159#ifdef CONFIG_X86_32
5092301c
YL
160/* This value is set up by the early boot code to point to the value
161 immediately after the boot time page tables. It contains a *physical*
162 address, and must not be in the .bss segment! */
163unsigned long init_pg_tables_start __initdata = ~0UL;
164unsigned long init_pg_tables_end __initdata = ~0UL;
165
c9cce83d
BW
166static struct resource video_ram_resource = {
167 .name = "Video RAM area",
168 .start = 0xa0000,
169 .end = 0xbffff,
170 .flags = IORESOURCE_BUSY | IORESOURCE_MEM
171};
172
1da177e4 173/* cpu data as detected by the assembly code in head.S */
7dea23ec 174struct cpuinfo_x86 new_cpu_data __cpuinitdata = {0, 0, 0, 0, -1, 1, 0, 0, -1};
1da177e4 175/* common cpu data for all cpus */
7dea23ec 176struct cpuinfo_x86 boot_cpu_data __read_mostly = {0, 0, 0, 0, -1, 1, 0, 0, -1};
129f6946 177EXPORT_SYMBOL(boot_cpu_data);
7dea23ec
YL
/*
 * Store @x in MCA_bus.  Compiles to an empty function when CONFIG_MCA is
 * not set.
 */
static void set_mca_bus(int x)
{
#ifdef CONFIG_MCA
	MCA_bus = x;
#endif
}
1da177e4 184
0c254e38
AS
185unsigned int def_to_bigsmp;
186
1da177e4
LT
187/* for MCA, but anyone else can use it if they want */
188unsigned int machine_id;
189unsigned int machine_submodel_id;
190unsigned int BIOS_revision;
1da177e4 191
7dea23ec
YL
192struct apm_info apm_info;
193EXPORT_SYMBOL(apm_info);
194
195#if defined(CONFIG_X86_SPEEDSTEP_SMI) || \
196 defined(CONFIG_X86_SPEEDSTEP_SMI_MODULE)
197struct ist_info ist_info;
198EXPORT_SYMBOL(ist_info);
199#else
200struct ist_info ist_info;
201#endif
202
203#else
204struct cpuinfo_x86 boot_cpu_data __read_mostly;
205EXPORT_SYMBOL(boot_cpu_data);
206#endif
207
208
209#if !defined(CONFIG_X86_PAE) || defined(CONFIG_X86_64)
210unsigned long mmu_cr4_features;
211#else
212unsigned long mmu_cr4_features = X86_CR4_PAE;
213#endif
214
1da177e4
LT
215/* Boot loader ID as an integer, for the benefit of proc_dointvec */
216int bootloader_type;
217
1c6e5503
YL
218/*
219 * Early DMI memory
220 */
221int dmi_alloc_index;
222char dmi_alloc_data[DMI_MAX_DATA];
223
1da177e4
LT
224/*
225 * Setup options
226 */
1da177e4 227struct screen_info screen_info;
129f6946 228EXPORT_SYMBOL(screen_info);
1da177e4 229struct edid_info edid_info;
5e518d76 230EXPORT_SYMBOL_GPL(edid_info);
1da177e4 231
1da177e4
LT
232extern int root_mountflags;
233
e44b7b75 234unsigned long saved_video_mode;
1da177e4 235
cf8fa920 236#define RAMDISK_IMAGE_START_MASK 0x07FF
1da177e4 237#define RAMDISK_PROMPT_FLAG 0x8000
cf8fa920 238#define RAMDISK_LOAD_FLAG 0x4000
1da177e4 239
4e498b66 240static char __initdata command_line[COMMAND_LINE_SIZE];
516cbf37
TB
241#ifdef CONFIG_CMDLINE_BOOL
242static char __initdata builtin_cmdline[COMMAND_LINE_SIZE] = CONFIG_CMDLINE;
243#endif
1da177e4 244
1da177e4
LT
#if defined(CONFIG_EDD) || defined(CONFIG_EDD_MODULE)
struct edd edd;
#ifdef CONFIG_EDD_MODULE
EXPORT_SYMBOL(edd);
#endif

/**
 * copy_edd() - Copy the BIOS EDD information
 *              from boot_params into a safe place.
 *
 * Both the MBR signature buffer and the EDD info buffer are copied into
 * the global 'edd', together with their respective entry counts.
 */
static inline void copy_edd(void)
{
	/* MBR signatures and how many of them are valid */
	edd.mbr_signature_nr = boot_params.edd_mbr_sig_buf_entries;
	memcpy(edd.mbr_signature, boot_params.edd_mbr_sig_buffer,
	       sizeof(edd.mbr_signature));

	/* EDD device info records and how many of them are valid */
	edd.edd_info_nr = boot_params.eddbuf_entries;
	memcpy(edd.edd_info, boot_params.eddbuf, sizeof(edd.edd_info));
}
#else
/* EDD support not configured: nothing to copy. */
static inline void copy_edd(void)
{
}
#endif
268
cf8fa920
PA
269#ifdef CONFIG_BLK_DEV_INITRD
270
eb1379cb 271#ifdef CONFIG_X86_32
cf8fa920 272
eb1379cb
YL
273#define MAX_MAP_CHUNK (NR_FIX_BTMAPS << PAGE_SHIFT)
274static void __init relocate_initrd(void)
cf8fa920 275{
eb1379cb 276
ba5b14cc
YL
277 u64 ramdisk_image = boot_params.hdr.ramdisk_image;
278 u64 ramdisk_size = boot_params.hdr.ramdisk_size;
ba5b14cc
YL
279 u64 end_of_lowmem = max_low_pfn << PAGE_SHIFT;
280 u64 ramdisk_here;
eb1379cb
YL
281 unsigned long slop, clen, mapaddr;
282 char *p, *q;
cf8fa920
PA
283
284 /* We need to move the initrd down into lowmem */
4e29684c
YL
285 ramdisk_here = find_e820_area(0, end_of_lowmem, ramdisk_size,
286 PAGE_SIZE);
cf8fa920 287
3945e2c9
YL
288 if (ramdisk_here == -1ULL)
289 panic("Cannot find place for new RAMDISK of size %lld\n",
290 ramdisk_size);
291
cf8fa920
PA
292 /* Note: this includes all the lowmem currently occupied by
293 the initrd, we rely on that fact to keep the data intact. */
3945e2c9 294 reserve_early(ramdisk_here, ramdisk_here + ramdisk_size,
ba5b14cc 295 "NEW RAMDISK");
cf8fa920
PA
296 initrd_start = ramdisk_here + PAGE_OFFSET;
297 initrd_end = initrd_start + ramdisk_size;
f0d43100
YL
298 printk(KERN_INFO "Allocated new RAMDISK: %08llx - %08llx\n",
299 ramdisk_here, ramdisk_here + ramdisk_size);
cf8fa920 300
cf8fa920
PA
301 q = (char *)initrd_start;
302
303 /* Copy any lowmem portion of the initrd */
304 if (ramdisk_image < end_of_lowmem) {
305 clen = end_of_lowmem - ramdisk_image;
306 p = (char *)__va(ramdisk_image);
307 memcpy(q, p, clen);
308 q += clen;
309 ramdisk_image += clen;
310 ramdisk_size -= clen;
311 }
312
313 /* Copy the highmem portion of the initrd */
314 while (ramdisk_size) {
315 slop = ramdisk_image & ~PAGE_MASK;
316 clen = ramdisk_size;
317 if (clen > MAX_MAP_CHUNK-slop)
318 clen = MAX_MAP_CHUNK-slop;
319 mapaddr = ramdisk_image & PAGE_MASK;
88b4c146 320 p = early_memremap(mapaddr, clen+slop);
cf8fa920 321 memcpy(q, p+slop, clen);
beacfaac 322 early_iounmap(p, clen+slop);
cf8fa920
PA
323 q += clen;
324 ramdisk_image += clen;
325 ramdisk_size -= clen;
326 }
a4c81cf6 327 /* high pages is not converted by early_res_to_bootmem */
ba5b14cc
YL
328 ramdisk_image = boot_params.hdr.ramdisk_image;
329 ramdisk_size = boot_params.hdr.ramdisk_size;
eb1379cb
YL
330 printk(KERN_INFO "Move RAMDISK from %016llx - %016llx to"
331 " %08llx - %08llx\n",
ba5b14cc
YL
332 ramdisk_image, ramdisk_image + ramdisk_size - 1,
333 ramdisk_here, ramdisk_here + ramdisk_size - 1);
eb1379cb
YL
334}
335#endif
9a27f5c5 336
eb1379cb
YL
337static void __init reserve_initrd(void)
338{
339 u64 ramdisk_image = boot_params.hdr.ramdisk_image;
340 u64 ramdisk_size = boot_params.hdr.ramdisk_size;
341 u64 ramdisk_end = ramdisk_image + ramdisk_size;
342 u64 end_of_lowmem = max_low_pfn << PAGE_SHIFT;
343
344 if (!boot_params.hdr.type_of_loader ||
345 !ramdisk_image || !ramdisk_size)
346 return; /* No initrd provided by bootloader */
347
348 initrd_start = 0;
349
350 if (ramdisk_size >= (end_of_lowmem>>1)) {
351 free_early(ramdisk_image, ramdisk_end);
352 printk(KERN_ERR "initrd too large to handle, "
353 "disabling initrd\n");
354 return;
355 }
356
357 printk(KERN_INFO "RAMDISK: %08llx - %08llx\n", ramdisk_image,
358 ramdisk_end);
359
360
361 if (ramdisk_end <= end_of_lowmem) {
362 /* All in lowmem, easy case */
363 /*
364 * don't need to reserve again, already reserved early
365 * in i386_start_kernel
366 */
367 initrd_start = ramdisk_image + PAGE_OFFSET;
368 initrd_end = initrd_start + ramdisk_size;
369 return;
370 }
371
372#ifdef CONFIG_X86_32
373 relocate_initrd();
374#else
375 printk(KERN_ERR "initrd extends beyond end of memory "
376 "(0x%08llx > 0x%08llx)\ndisabling initrd\n",
377 ramdisk_end, end_of_lowmem);
378 initrd_start = 0;
379#endif
380 free_early(ramdisk_image, ramdisk_end);
cf8fa920 381}
225c37d7 382#else
eb1379cb 383static void __init reserve_initrd(void)
225c37d7
YL
384{
385}
cf8fa920
PA
386#endif /* CONFIG_BLK_DEV_INITRD */
387
29f784e3 388static void __init parse_setup_data(void)
257b0fde
YL
389{
390 struct setup_data *data;
391 u64 pa_data;
392
393 if (boot_params.hdr.version < 0x0209)
394 return;
395 pa_data = boot_params.hdr.setup_data;
396 while (pa_data) {
88b4c146 397 data = early_memremap(pa_data, PAGE_SIZE);
257b0fde
YL
398 switch (data->type) {
399 case SETUP_E820_EXT:
400 parse_e820_ext(data, pa_data);
401 break;
402 default:
403 break;
404 }
257b0fde
YL
405 pa_data = data->next;
406 early_iounmap(data, PAGE_SIZE);
407 }
408}
409
a0a0becd 410static void __init e820_reserve_setup_data(void)
28bb2237
YL
411{
412 struct setup_data *data;
413 u64 pa_data;
d9a81b44 414 int found = 0;
28bb2237
YL
415
416 if (boot_params.hdr.version < 0x0209)
417 return;
418 pa_data = boot_params.hdr.setup_data;
419 while (pa_data) {
88b4c146 420 data = early_memremap(pa_data, sizeof(*data));
28bb2237
YL
421 e820_update_range(pa_data, sizeof(*data)+data->len,
422 E820_RAM, E820_RESERVED_KERN);
d9a81b44 423 found = 1;
28bb2237
YL
424 pa_data = data->next;
425 early_iounmap(data, sizeof(*data));
426 }
d9a81b44
YL
427 if (!found)
428 return;
429
28bb2237 430 sanitize_e820_map(e820.map, ARRAY_SIZE(e820.map), &e820.nr_map);
a0a0becd 431 memcpy(&e820_saved, &e820, sizeof(struct e820map));
28bb2237
YL
432 printk(KERN_INFO "extended physical RAM map:\n");
433 e820_print_map("reserve setup_data");
434}
435
a0a0becd
YL
436static void __init reserve_early_setup_data(void)
437{
438 struct setup_data *data;
439 u64 pa_data;
440 char buf[32];
441
442 if (boot_params.hdr.version < 0x0209)
443 return;
444 pa_data = boot_params.hdr.setup_data;
445 while (pa_data) {
88b4c146 446 data = early_memremap(pa_data, sizeof(*data));
a0a0becd
YL
447 sprintf(buf, "setup data %x", data->type);
448 reserve_early(pa_data, pa_data+sizeof(*data)+data->len, buf);
449 pa_data = data->next;
450 early_iounmap(data, sizeof(*data));
451 }
452}
453
ccb4defa
YL
454/*
455 * --------- Crashkernel reservation ------------------------------
456 */
457
458#ifdef CONFIG_KEXEC
32105f7f
BW
459
460/**
461 * Reserve @size bytes of crashkernel memory at any suitable offset.
462 *
463 * @size: Size of the crashkernel memory to reserve.
464 * Returns the base address on success, and -1ULL on failure.
465 */
a9b43c7d 466static
6b356022 467unsigned long long __init find_and_reserve_crashkernel(unsigned long long size)
32105f7f
BW
468{
469 const unsigned long long alignment = 16<<20; /* 16M */
470 unsigned long long start = 0LL;
471
472 while (1) {
473 int ret;
474
475 start = find_e820_area(start, ULONG_MAX, size, alignment);
476 if (start == -1ULL)
477 return start;
478
479 /* try to reserve it */
480 ret = reserve_bootmem_generic(start, size, BOOTMEM_EXCLUSIVE);
481 if (ret >= 0)
482 return start;
483
484 start += alignment;
485 }
486}
487
ccb4defa
YL
488static inline unsigned long long get_total_mem(void)
489{
490 unsigned long long total;
491
492 total = max_low_pfn - min_low_pfn;
493#ifdef CONFIG_HIGHMEM
494 total += highend_pfn - highstart_pfn;
495#endif
496
497 return total << PAGE_SHIFT;
498}
499
29f784e3 500static void __init reserve_crashkernel(void)
ccb4defa
YL
501{
502 unsigned long long total_mem;
503 unsigned long long crash_size, crash_base;
504 int ret;
505
506 total_mem = get_total_mem();
507
508 ret = parse_crashkernel(boot_command_line, total_mem,
509 &crash_size, &crash_base);
32105f7f
BW
510 if (ret != 0 || crash_size <= 0)
511 return;
512
513 /* 0 means: find the address automatically */
514 if (crash_base <= 0) {
515 crash_base = find_and_reserve_crashkernel(crash_size);
516 if (crash_base == -1ULL) {
517 pr_info("crashkernel reservation failed. "
518 "No suitable area found.\n");
ccb4defa
YL
519 return;
520 }
32105f7f
BW
521 } else {
522 ret = reserve_bootmem_generic(crash_base, crash_size,
523 BOOTMEM_EXCLUSIVE);
524 if (ret < 0) {
525 pr_info("crashkernel reservation failed - "
526 "memory is in use\n");
ccb4defa
YL
527 return;
528 }
32105f7f 529 }
ccb4defa 530
32105f7f
BW
531 printk(KERN_INFO "Reserving %ldMB of memory at %ldMB "
532 "for crashkernel (System RAM: %ldMB)\n",
533 (unsigned long)(crash_size >> 20),
534 (unsigned long)(crash_base >> 20),
535 (unsigned long)(total_mem >> 20));
ccb4defa 536
32105f7f
BW
537 crashk_res.start = crash_base;
538 crashk_res.end = crash_base + crash_size - 1;
539 insert_resource(&iomem_resource, &crashk_res);
ccb4defa
YL
540}
541#else
29f784e3 542static void __init reserve_crashkernel(void)
ccb4defa
YL
543{
544}
545#endif
546
bdba0e70
YL
547static struct resource standard_io_resources[] = {
548 { .name = "dma1", .start = 0x00, .end = 0x1f,
549 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
550 { .name = "pic1", .start = 0x20, .end = 0x21,
551 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
552 { .name = "timer0", .start = 0x40, .end = 0x43,
553 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
554 { .name = "timer1", .start = 0x50, .end = 0x53,
555 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
556 { .name = "keyboard", .start = 0x60, .end = 0x60,
557 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
558 { .name = "keyboard", .start = 0x64, .end = 0x64,
559 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
560 { .name = "dma page reg", .start = 0x80, .end = 0x8f,
561 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
562 { .name = "pic2", .start = 0xa0, .end = 0xa1,
563 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
564 { .name = "dma2", .start = 0xc0, .end = 0xdf,
565 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
566 { .name = "fpu", .start = 0xf0, .end = 0xff,
567 .flags = IORESOURCE_BUSY | IORESOURCE_IO }
568};
569
29f784e3 570static void __init reserve_standard_io_resources(void)
bdba0e70
YL
571{
572 int i;
573
574 /* request I/O space for devices used on all i[345]86 PCs */
575 for (i = 0; i < ARRAY_SIZE(standard_io_resources); i++)
576 request_resource(&ioport_resource, &standard_io_resources[i]);
577
578}
579
57cac4d1
VG
580/*
581 * Note: elfcorehdr_addr is not just limited to vmcore. It is also used by
582 * is_kdump_kernel() to determine if we are booting after a panic. Hence
583 * ifdef it under CONFIG_CRASH_DUMP and not CONFIG_PROC_VMCORE.
584 */
585
586#ifdef CONFIG_CRASH_DUMP
0196bcbb
YL
587/* elfcorehdr= specifies the location of elf core header
588 * stored by the crashed kernel. This option will be passed
589 * by kexec loader to the capture kernel.
590 */
591static int __init setup_elfcorehdr(char *arg)
592{
593 char *end;
594 if (!arg)
595 return -EINVAL;
596 elfcorehdr_addr = memparse(arg, &end);
597 return end > arg ? 0 : -EINVAL;
598}
599early_param("elfcorehdr", setup_elfcorehdr);
600#endif
601
be163a15 602static int __init default_update_apic(void)
9f077871 603{
3e5095d1 604#ifdef CONFIG_SMP
328386d7
IM
605 if (!apic->wakeup_cpu)
606 apic->wakeup_cpu = wakeup_secondary_cpu_via_init;
c885df50 607#endif
9f077871 608
54ac14a8 609 return 0;
bb577f98
HD
610}
611
54ac14a8 612static struct x86_quirks default_x86_quirks __initdata = {
be163a15 613 .update_apic = default_update_apic,
54ac14a8 614};
9f077871 615
3c9cb6de 616struct x86_quirks *x86_quirks __initdata = &default_x86_quirks;
5394f80f 617
bb557460 618#ifdef CONFIG_X86_RESERVE_LOW_64K
5649b7c3
IM
619static int __init dmi_low_memory_corruption(const struct dmi_system_id *d)
620{
621 printk(KERN_NOTICE
45608399 622 "%s detected: BIOS may corrupt low RAM, working around it.\n",
5649b7c3
IM
623 d->ident);
624
2216d199
YL
625 e820_update_range(0, 0x10000, E820_RAM, E820_RESERVED);
626 sanitize_e820_map(e820.map, ARRAY_SIZE(e820.map), &e820.nr_map);
5649b7c3
IM
627
628 return 0;
629}
bb557460 630#endif
5649b7c3
IM
631
632/* List of systems that have known low memory corruption BIOS problems */
633static struct dmi_system_id __initdata bad_bios_dmi_table[] = {
fc381519 634#ifdef CONFIG_X86_RESERVE_LOW_64K
5649b7c3
IM
635 {
636 .callback = dmi_low_memory_corruption,
637 .ident = "AMI BIOS",
638 .matches = {
639 DMI_MATCH(DMI_BIOS_VENDOR, "American Megatrends Inc."),
640 },
641 },
1e22436e
IM
642 {
643 .callback = dmi_low_memory_corruption,
644 .ident = "Phoenix BIOS",
645 .matches = {
0af40a4b 646 DMI_MATCH(DMI_BIOS_VENDOR, "Phoenix Technologies"),
1e22436e
IM
647 },
648 },
fc381519 649#endif
a8b71a28 650 {}
5649b7c3
IM
651};
652
1da177e4
LT
653/*
654 * Determine if we were loaded by an EFI loader. If so, then we have also been
655 * passed the efi memmap, systab, etc., so we should use these data structures
656 * for initialization. Note, the efi init code path is determined by the
657 * global efi_enabled. This allows the same kernel image to be used on existing
658 * systems (with a traditional BIOS) as well as on EFI systems.
659 */
76934ed4
YL
660/*
661 * setup_arch - architecture-specific boot-time initializations
662 *
663 * Note: On x86_64, fixmaps are ready for use even before this is called.
664 */
665
1da177e4
LT
/* Boot-time setup driven by boot_params; hands the command line back through @cmdline_p. */
666void __init setup_arch(char **cmdline_p)
667{
76934ed4 668#ifdef CONFIG_X86_32
1da177e4 669 memcpy(&boot_cpu_data, &new_cpu_data, sizeof(new_cpu_data));
3b33553b 670 visws_early_detect();
76934ed4
YL
671#else
672 printk(KERN_INFO "Command line: %s\n", boot_command_line);
673#endif
1da177e4 674
ae8d04e2
ZA
675 /* VMI may relocate the fixmap; do this before touching ioremap area */
676 vmi_init();
677
9e882c92 678 early_cpu_init();
1a98fd14
JF
679 early_ioremap_init();
680
 /* Copy values supplied in boot_params into their kernel globals. */
30c82645
PA
681 ROOT_DEV = old_decode_dev(boot_params.hdr.root_dev);
682 screen_info = boot_params.screen_info;
683 edid_info = boot_params.edid_info;
76934ed4 684#ifdef CONFIG_X86_32
30c82645
PA
685 apm_info.bios = boot_params.apm_bios_info;
686 ist_info = boot_params.ist_info;
76934ed4 687 if (boot_params.sys_desc_table.length != 0) {
30c82645
PA
688 set_mca_bus(boot_params.sys_desc_table.table[3] & 0x2);
689 machine_id = boot_params.sys_desc_table.table[0];
690 machine_submodel_id = boot_params.sys_desc_table.table[1];
691 BIOS_revision = boot_params.sys_desc_table.table[2];
1da177e4 692 }
76934ed4
YL
693#endif
694 saved_video_mode = boot_params.hdr.vid_mode;
30c82645 695 bootloader_type = boot_params.hdr.type_of_loader;
1da177e4
LT
696
697#ifdef CONFIG_BLK_DEV_RAM
30c82645
PA
698 rd_image_start = boot_params.hdr.ram_size & RAMDISK_IMAGE_START_MASK;
699 rd_prompt = ((boot_params.hdr.ram_size & RAMDISK_PROMPT_FLAG) != 0);
700 rd_doload = ((boot_params.hdr.ram_size & RAMDISK_LOAD_FLAG) != 0);
1da177e4 701#endif
7465252e
YL
702#ifdef CONFIG_EFI
 /* An "EL32"/"EL64" loader signature in boot_params enables EFI. */
703 if (!strncmp((char *)&boot_params.efi_info.efi_loader_signature,
76934ed4
YL
704#ifdef CONFIG_X86_32
705 "EL32",
706#else
707 "EL64",
708#endif
709 4)) {
7465252e
YL
710 efi_enabled = 1;
711 efi_reserve_early();
712 }
713#endif
714
1da177e4 715 ARCH_SETUP
2215e69d 716
0dbfafa5 717 setup_memory_map();
28bb2237 718 parse_setup_data();
a0a0becd
YL
719 /* update the e820_saved too */
720 e820_reserve_setup_data();
28bb2237 721
1da177e4
LT
722 copy_edd();
723
30c82645 724 if (!boot_params.hdr.root_flags)
1da177e4
LT
725 root_mountflags &= ~MS_RDONLY;
726 init_mm.start_code = (unsigned long) _text;
727 init_mm.end_code = (unsigned long) _etext;
728 init_mm.end_data = (unsigned long) _edata;
76934ed4 729#ifdef CONFIG_X86_32
1da177e4 730 init_mm.brk = init_pg_tables_end + PAGE_OFFSET;
76934ed4
YL
731#else
732 init_mm.brk = (unsigned long) &_end;
733#endif
1da177e4
LT
734
 /* Fill in the physical ranges of the kernel code, data and bss resources. */
735 code_resource.start = virt_to_phys(_text);
736 code_resource.end = virt_to_phys(_etext)-1;
737 data_resource.start = virt_to_phys(_etext);
738 data_resource.end = virt_to_phys(_edata)-1;
00bf4098
BW
739 bss_resource.start = virt_to_phys(&__bss_start);
740 bss_resource.end = virt_to_phys(&__bss_stop)-1;
1da177e4 741
516cbf37
TB
742#ifdef CONFIG_CMDLINE_BOOL
743#ifdef CONFIG_CMDLINE_OVERRIDE
 /* the built-in command line replaces the boot loader's */
744 strlcpy(boot_command_line, builtin_cmdline, COMMAND_LINE_SIZE);
745#else
746 if (builtin_cmdline[0]) {
747 /* append boot loader cmdline to builtin */
748 strlcat(builtin_cmdline, " ", COMMAND_LINE_SIZE);
749 strlcat(builtin_cmdline, boot_command_line, COMMAND_LINE_SIZE);
750 strlcpy(boot_command_line, builtin_cmdline, COMMAND_LINE_SIZE);
751 }
752#endif
753#endif
754
 /* Give the caller a separate copy of the command line. */
9a2e5930
YL
755 strlcpy(command_line, boot_command_line, COMMAND_LINE_SIZE);
756 *cmdline_p = command_line;
757
1a3f239d 758 parse_early_param();
1da177e4 759
0ad5bce7
JF
760#ifdef CONFIG_X86_64
761 check_efer();
762#endif
763
ae8d04e2
ZA
764 /* Must be before kernel pagetables are setup */
765 vmi_activate();
3a6ddd5f 766
28bb2237 767 /* after early param parsing, so that a panic here can be seen on serial */
a0a0becd 768 reserve_early_setup_data();
28bb2237 769
76934ed4 770 if (acpi_mps_check()) {
3eb11edc 771#ifdef CONFIG_X86_LOCAL_APIC
76934ed4 772 disable_apic = 1;
3eb11edc 773#endif
988781dc 774 setup_clear_cpu_cap(X86_FEATURE_APIC);
3c999f14
YL
775 }
776
dc7c65db
LT
777#ifdef CONFIG_PCI
778 if (pci_early_dump_regs)
779 early_dump_pci_devices();
780#endif
781
0dbfafa5 782 finish_e820_parsing();
1a3f239d 783
2216d199
YL
784 dmi_scan_machine();
785
786 dmi_check_system(bad_bios_dmi_table);
787
88b094fb
AK
788 /*
789 * VMware detection requires dmi to be available, so this
790 * needs to be done after dmi_scan_machine, for the BP.
791 */
792 init_hypervisor(&boot_cpu_data);
793
76934ed4 794#ifdef CONFIG_X86_32
41c094fd 795 probe_roms();
76934ed4 796#endif
41c094fd
YL
797
798 /* after parse_early_param(), so that this can be debugged */
799 insert_resource(&iomem_resource, &code_resource);
800 insert_resource(&iomem_resource, &data_resource);
801 insert_resource(&iomem_resource, &bss_resource);
802
8b2cb7a8
HY
803 if (efi_enabled)
804 efi_init();
805
76934ed4 806#ifdef CONFIG_X86_32
cc9f7a0c
YL
807 if (ppro_with_ram_bug()) {
808 e820_update_range(0x70000000ULL, 0x40000ULL, E820_RAM,
809 E820_RESERVED);
810 sanitize_e820_map(e820.map, ARRAY_SIZE(e820.map), &e820.nr_map);
811 printk(KERN_INFO "fixed physical RAM map:\n");
812 e820_print_map("bad_ppro");
813 }
76934ed4
YL
814#else
815 early_gart_iommu_check();
816#endif
cc9f7a0c 817
7b2a0a6c
YL
818 /*
819 * partially used pages are not usable - thus
820 * we are rounding upwards:
821 */
f361a450 822 max_pfn = e820_end_of_ram_pfn();
7b2a0a6c 823
6780711e
YL
824 /* preallocate 4k for mptable mpc */
825 early_reserve_e820_mpc_new();
093af8d7
YL
826 /* update e820 for memory not covered by WB MTRRs */
827 mtrr_bp_init();
2dc807b3 828 if (mtrr_trim_uncached_memory(max_pfn))
f361a450 829 max_pfn = e820_end_of_ram_pfn();
76c32418 830
76934ed4 831#ifdef CONFIG_X86_32
4e29684c 832 /* max_low_pfn gets updated here */
2ec65f8b 833 find_low_pfn_range();
76934ed4
YL
834#else
835 num_physpages = max_pfn;
836
06cd9a7d 837 check_x2apic();
76934ed4
YL
838
839 /* How many end-of-memory variables you have, grandma! */
840 /* need this before calling reserve_initrd */
f361a450
YL
841 if (max_pfn > (1UL<<(32 - PAGE_SHIFT)))
842 max_low_pfn = e820_end_of_low_ram_pfn();
843 else
844 max_low_pfn = max_pfn;
845
76934ed4
YL
846 high_memory = (void *)__va(max_pfn * PAGE_SIZE - 1) + 1;
847#endif
2ec65f8b 848
5394f80f
JF
849#ifdef CONFIG_X86_CHECK_BIOS_CORRUPTION
850 setup_bios_corruption_check();
851#endif
852
4e29684c 853 /* max_pfn_mapped is updated here */
f361a450
YL
854 max_low_pfn_mapped = init_memory_mapping(0, max_low_pfn<<PAGE_SHIFT);
855 max_pfn_mapped = max_low_pfn_mapped;
856
857#ifdef CONFIG_X86_64
858 if (max_pfn > max_low_pfn) {
859 max_pfn_mapped = init_memory_mapping(1UL<<32,
860 max_pfn<<PAGE_SHIFT);
861 /* can we preserve max_low_pfn? */
862 max_low_pfn = max_pfn;
863 }
864#endif
4e29684c 865
e7b37895
YL
866 /*
867 * NOTE: On x86-32, only from this point on, fixmaps are ready for use.
868 */
869
870#ifdef CONFIG_PROVIDE_OHCI1394_DMA_INIT
871 if (init_ohci1394_dma_early)
872 init_ohci1394_dma_on_all_controllers();
873#endif
874
2ec65f8b
YL
875 reserve_initrd();
876
76934ed4
YL
877#ifdef CONFIG_X86_64
878 vsmp_init();
879#endif
880
1c6e5503
YL
881 io_delay_init();
882
1c6e5503
YL
883 /*
884 * Parse the ACPI tables for possible boot-time SMP configuration.
885 */
886 acpi_boot_table_init();
1c6e5503 887
2e42060c
JS
888 early_acpi_boot_init();
889
1c6e5503 890#ifdef CONFIG_ACPI_NUMA
f2f865fe
YL
891 /*
892 * Parse SRAT to discover nodes.
893 */
894 acpi_numa_init();
1c6e5503
YL
895#endif
896
2ec65f8b 897 initmem_init(0, max_pfn);
093af8d7 898
593a0cc3
YL
899#ifdef CONFIG_ACPI_SLEEP
900 /*
901 * Reserve low memory region for sleep support.
902 */
903 acpi_reserve_bootmem();
904#endif
593a0cc3
YL
905 /*
906 * Find and reserve possible boot-time SMP configuration:
907 */
908 find_smp_config();
550fe4f1 909
593a0cc3
YL
910 reserve_crashkernel();
911
91467bdf
BW
912#ifdef CONFIG_X86_64
913 /*
914 * dma32_reserve_bootmem() allocates bootmem which may conflict
915 * with the crashkernel command line, so do that after
916 * reserve_crashkernel()
917 */
918 dma32_reserve_bootmem();
919#endif
920
593a0cc3
YL
921 reserve_ibft_region();
922
790c73f6
GOC
923#ifdef CONFIG_KVM_CLOCK
924 kvmclock_init();
925#endif
926
a312b37b 927 paravirt_pagetable_setup_start(swapper_pg_dir);
1da177e4 928 paging_init();
a312b37b 929 paravirt_pagetable_setup_done(swapper_pg_dir);
c1f2f09e 930 paravirt_post_allocator_init();
f212ec4b 931
76934ed4
YL
932#ifdef CONFIG_X86_64
933 map_vsyscall();
934#endif
935
1a3f239d 936 generic_apic_probe();
1da177e4 937
54ef3400 938 early_quirks();
d44647b0 939
295deae4
YL
940 /*
941 * Read APIC and some other early information from ACPI tables.
942 */
1da177e4 943 acpi_boot_init();
04606618 944
e0da3364 945#if defined(CONFIG_X86_MPPARSE) || defined(CONFIG_X86_VISWS)
295deae4
YL
946 /*
947 * get boot-time SMP configuration:
948 */
e0da3364
YL
949 if (smp_found_config)
950 get_smp_config();
951#endif
76934ed4 952
329513a3 953 prefill_possible_map();
301e6190 954
5f4765f9
YL
955#ifdef CONFIG_X86_64
956 init_cpu_to_node();
957#endif
958
76934ed4
YL
959 init_apic_mappings();
960 ioapic_init_mappings();
f3294a33 961
9d6a4d08 962 /* must wait until the io_apic is mapped */
be5d5350 963 probe_nr_irqs_gsi();
9d6a4d08 964
295deae4 965 kvm_guest_init();
1da177e4 966
41c094fd 967 e820_reserve_resources();
bf62f398 968 e820_mark_nosave_regions(max_low_pfn);
1da177e4 969
76934ed4 970#ifdef CONFIG_X86_32
41c094fd 971 request_resource(&iomem_resource, &video_ram_resource);
76934ed4 972#endif
ce97c40e 973 reserve_standard_io_resources();
41c094fd
YL
974
975 e820_setup_gap();
976
1da177e4
LT
977#ifdef CONFIG_VT
 /* Pick the console switch: VGA if configured, else the dummy console. */
978#if defined(CONFIG_VGA_CONSOLE)
979 if (!efi_enabled || (efi_mem_type(0xa0000) != EFI_CONVENTIONAL_MEMORY))
980 conswitchp = &vga_con;
981#elif defined(CONFIG_DUMMY_CONSOLE)
982 conswitchp = &dummy_con;
983#endif
984#endif
985}
5649b7c3 986
9be1b56a
IM
987#ifdef CONFIG_X86_32
988
989/**
990 * pre_intr_init_hook - initialisation prior to setting up interrupt vectors
991 *
992 * Description:
993 * Perform any necessary interrupt initialisation prior to setting up
994 * the "ordinary" interrupt call gates. For legacy reasons, the ISA
995 * interrupts should be initialised here if the machine emulates a PC
996 * in any way.
997 **/
998void __init pre_intr_init_hook(void)
999{
1000 if (x86_quirks->arch_pre_intr_init) {
1001 if (x86_quirks->arch_pre_intr_init())
1002 return;
1003 }
1004 init_ISA_irqs();
1005}
1006
1007/**
1008 * intr_init_hook - post gate setup interrupt initialisation
1009 *
1010 * Description:
1011 * Fill in any interrupts that may have been left out by the general
1012 * init_IRQ() routine. interrupts having to do with the machine rather
1013 * than the devices on the I/O bus (like APIC interrupts in intel MP
1014 * systems) are started here.
1015 **/
1016void __init intr_init_hook(void)
1017{
1018 if (x86_quirks->arch_intr_init) {
1019 if (x86_quirks->arch_intr_init())
1020 return;
1021 }
1022}
1023
9be1b56a
IM
1024/**
1025 * trap_init_hook - initialise system specific traps
1026 *
1027 * Description:
1028 * Called as the final act of trap_init(). Used in VISWS to initialise
1029 * the various board specific APIC traps.
1030 **/
1031void __init trap_init_hook(void)
1032{
1033 if (x86_quirks->arch_trap_init) {
1034 if (x86_quirks->arch_trap_init())
1035 return;
1036 }
1037}
1038
1039static struct irqaction irq0 = {
1040 .handler = timer_interrupt,
fc6fc7f1 1041 .flags = IRQF_DISABLED | IRQF_NOBALANCING | IRQF_IRQPOLL | IRQF_TIMER,
9be1b56a
IM
1042 .mask = CPU_MASK_NONE,
1043 .name = "timer"
1044};
1045
1046/**
1047 * pre_time_init_hook - do any specific initialisations before.
1048 *
1049 **/
1050void __init pre_time_init_hook(void)
1051{
1052 if (x86_quirks->arch_pre_time_init)
1053 x86_quirks->arch_pre_time_init();
1054}
1055
1056/**
1057 * time_init_hook - do any specific initialisations for the system timer.
1058 *
1059 * Description:
1060 * Must plug the system timer interrupt source at HZ into the IRQ listed
1061 * in irq_vectors.h:TIMER_IRQ
1062 **/
1063void __init time_init_hook(void)
1064{
1065 if (x86_quirks->arch_time_init) {
1066 /*
1067 * A nonzero return code does not mean failure, it means
1068 * that the architecture quirk does not want any
1069 * generic (timer) setup to be performed after this:
1070 */
1071 if (x86_quirks->arch_time_init())
1072 return;
1073 }
1074
1075 irq0.mask = cpumask_of_cpu(0);
1076 setup_irq(0, &irq0);
1077}
9be1b56a 1078#endif /* CONFIG_X86_32 */