blob: 1cb3e21c571ac46dd629222cd7f94b3dad520903 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * linux/arch/x86-64/kernel/setup.c
3 *
4 * Copyright (C) 1995 Linus Torvalds
5 *
6 * Nov 2001 Dave Jones <davej@suse.de>
7 * Forked from i386 setup code.
8 *
9 * $Id$
10 */
11
12/*
13 * This file handles the architecture-dependent parts of initialization
14 */
15
16#include <linux/errno.h>
17#include <linux/sched.h>
18#include <linux/kernel.h>
19#include <linux/mm.h>
20#include <linux/stddef.h>
21#include <linux/unistd.h>
22#include <linux/ptrace.h>
23#include <linux/slab.h>
24#include <linux/user.h>
25#include <linux/a.out.h>
26#include <linux/tty.h>
27#include <linux/ioport.h>
28#include <linux/delay.h>
29#include <linux/config.h>
30#include <linux/init.h>
31#include <linux/initrd.h>
32#include <linux/highmem.h>
33#include <linux/bootmem.h>
34#include <linux/module.h>
35#include <asm/processor.h>
36#include <linux/console.h>
37#include <linux/seq_file.h>
Vivek Goyalaac04b32006-01-09 20:51:47 -080038#include <linux/crash_dump.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070039#include <linux/root_dev.h>
40#include <linux/pci.h>
41#include <linux/acpi.h>
42#include <linux/kallsyms.h>
43#include <linux/edd.h>
Matt Tolentinobbfceef2005-06-23 00:08:07 -070044#include <linux/mmzone.h>
Eric W. Biederman5f5609d2005-06-25 14:58:04 -070045#include <linux/kexec.h>
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -080046#include <linux/cpufreq.h>
Andi Kleene9928672006-01-11 22:43:33 +010047#include <linux/dmi.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010048#include <linux/dma-mapping.h>
Andi Kleen681558f2006-03-25 16:29:46 +010049#include <linux/ctype.h>
Matt Tolentinobbfceef2005-06-23 00:08:07 -070050
Linus Torvalds1da177e2005-04-16 15:20:36 -070051#include <asm/mtrr.h>
52#include <asm/uaccess.h>
53#include <asm/system.h>
54#include <asm/io.h>
55#include <asm/smp.h>
56#include <asm/msr.h>
57#include <asm/desc.h>
58#include <video/edid.h>
59#include <asm/e820.h>
60#include <asm/dma.h>
61#include <asm/mpspec.h>
62#include <asm/mmu_context.h>
63#include <asm/bootsetup.h>
64#include <asm/proto.h>
65#include <asm/setup.h>
66#include <asm/mach_apic.h>
67#include <asm/numa.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010068#include <asm/swiotlb.h>
Andi Kleen2bc04142005-11-05 17:25:53 +010069#include <asm/sections.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010070#include <asm/gart-mapping.h>
Andi Kleenf2d3efe2006-03-25 16:30:22 +010071#include <asm/dmi.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070072
/*
 * Machine setup..
 */

/* Boot CPU description; setup_arch() passes it to early_identify_cpu(). */
struct cpuinfo_x86 boot_cpu_data __read_mostly;

unsigned long mmu_cr4_features;

/* Cleared again by "acpi=force" in parse_cmdline_early(). */
int acpi_disabled;
EXPORT_SYMBOL(acpi_disabled);
#ifdef CONFIG_ACPI
/* Set by "acpi=ht" in parse_cmdline_early(). */
extern int __initdata acpi_ht;
/* Trigger/polarity overrides selected by the "acpi_sci=" options. */
extern acpi_interrupt_flags acpi_sci_flags;
/* Set by "acpi=force"; stops "acpi=ht" from calling disable_acpi(). */
int __initdata acpi_force = 0;
#endif

int acpi_numa __initdata;

/* Boot loader ID as an integer, for the benefit of proc_dointvec */
int bootloader_type;

/* Copied from SAVED_VIDEO_MODE in setup_arch(). */
unsigned long saved_video_mode;

/*
 * Early DMI memory
 */
int dmi_alloc_index;
char dmi_alloc_data[DMI_MAX_DATA];
101
/*
 * Setup options
 */
/* Copied from SCREEN_INFO at the start of setup_arch(). */
struct screen_info screen_info;
/*
 * Variable-length table preceded by a 16-bit length field.
 * NOTE(review): presumably `length` counts the bytes in `table` - confirm
 * against whatever fills this structure in.
 *
 * The trailing member is a C99 flexible array member rather than the GNU
 * zero-length array `table[0]`; size and member offsets are unchanged.
 */
struct sys_desc_table_struct {
	unsigned short length;
	unsigned char table[];
};
110
/* Copied from EDID_INFO in setup_arch(). */
struct edid_info edid_info;
/* Physical memory map; parse_cmdline_early() resets it for "memmap=exactmap". */
struct e820map e820;

extern int root_mountflags;

/* Destination buffer that parse_cmdline_early() copies the boot command line into. */
char command_line[COMMAND_LINE_SIZE];
117
118struct resource standard_io_resources[] = {
119 { .name = "dma1", .start = 0x00, .end = 0x1f,
120 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
121 { .name = "pic1", .start = 0x20, .end = 0x21,
122 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
123 { .name = "timer0", .start = 0x40, .end = 0x43,
124 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
125 { .name = "timer1", .start = 0x50, .end = 0x53,
126 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
127 { .name = "keyboard", .start = 0x60, .end = 0x6f,
128 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
129 { .name = "dma page reg", .start = 0x80, .end = 0x8f,
130 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
131 { .name = "pic2", .start = 0xa0, .end = 0xa1,
132 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
133 { .name = "dma2", .start = 0xc0, .end = 0xdf,
134 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
135 { .name = "fpu", .start = 0xf0, .end = 0xff,
136 .flags = IORESOURCE_BUSY | IORESOURCE_IO }
137};
138
139#define STANDARD_IO_RESOURCES \
140 (sizeof standard_io_resources / sizeof standard_io_resources[0])
141
142#define IORESOURCE_RAM (IORESOURCE_BUSY | IORESOURCE_MEM)
143
144struct resource data_resource = {
145 .name = "Kernel data",
146 .start = 0,
147 .end = 0,
148 .flags = IORESOURCE_RAM,
149};
150struct resource code_resource = {
151 .name = "Kernel code",
152 .start = 0,
153 .end = 0,
154 .flags = IORESOURCE_RAM,
155};
156
157#define IORESOURCE_ROM (IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM)
158
159static struct resource system_rom_resource = {
160 .name = "System ROM",
161 .start = 0xf0000,
162 .end = 0xfffff,
163 .flags = IORESOURCE_ROM,
164};
165
166static struct resource extension_rom_resource = {
167 .name = "Extension ROM",
168 .start = 0xe0000,
169 .end = 0xeffff,
170 .flags = IORESOURCE_ROM,
171};
172
173static struct resource adapter_rom_resources[] = {
174 { .name = "Adapter ROM", .start = 0xc8000, .end = 0,
175 .flags = IORESOURCE_ROM },
176 { .name = "Adapter ROM", .start = 0, .end = 0,
177 .flags = IORESOURCE_ROM },
178 { .name = "Adapter ROM", .start = 0, .end = 0,
179 .flags = IORESOURCE_ROM },
180 { .name = "Adapter ROM", .start = 0, .end = 0,
181 .flags = IORESOURCE_ROM },
182 { .name = "Adapter ROM", .start = 0, .end = 0,
183 .flags = IORESOURCE_ROM },
184 { .name = "Adapter ROM", .start = 0, .end = 0,
185 .flags = IORESOURCE_ROM }
186};
187
188#define ADAPTER_ROM_RESOURCES \
189 (sizeof adapter_rom_resources / sizeof adapter_rom_resources[0])
190
191static struct resource video_rom_resource = {
192 .name = "Video ROM",
193 .start = 0xc0000,
194 .end = 0xc7fff,
195 .flags = IORESOURCE_ROM,
196};
197
198static struct resource video_ram_resource = {
199 .name = "Video RAM area",
200 .start = 0xa0000,
201 .end = 0xbffff,
202 .flags = IORESOURCE_RAM,
203};
204
/* True when the 16-bit word at x equals 0xaa55. */
#define romsignature(x) (*(unsigned short *)(x) == 0xaa55)

/*
 * romchecksum - check the byte sum of a ROM image
 * @rom:    first byte of the image
 * @length: number of bytes to add up
 *
 * Returns 1 when the bytes sum to zero modulo 256 (always the case for
 * @length == 0), otherwise 0.
 */
static int __init romchecksum(unsigned char *rom, unsigned long length)
{
	unsigned char total = 0;
	unsigned long off;

	for (off = 0; off < length; off++)
		total += rom[off];

	return !total;
}
215
/*
 * probe_roms - scan the legacy ROM area and claim what is found
 *
 * Scans for a video ROM, then requests the system ROM, an optional
 * extension ROM and up to ADAPTER_ROM_RESOURCES adapter ROMs from
 * iomem_resource.  `start` and `upper` carry state between phases: each
 * phase narrows the window that the adapter ROM scan finally walks.
 */
static void __init probe_roms(void)
{
	unsigned long start, length, upper;
	unsigned char *rom;
	int i;

	/* video rom */
	upper = adapter_rom_resources[0].start;
	for (start = video_rom_resource.start; start < upper; start += 2048) {
		rom = isa_bus_to_virt(start);
		if (!romsignature(rom))
			continue;

		video_rom_resource.start = start;

		/* 0 < length <= 0x7f * 512, historically */
		length = rom[2] * 512;

		/* if checksum okay, trust length byte */
		if (length && romchecksum(rom, length))
			video_rom_resource.end = start + length - 1;

		request_resource(&iomem_resource, &video_rom_resource);
		break;
	}

	/* Resume on the first 2k boundary after the video ROM, but never
	   below the default adapter ROM start. */
	start = (video_rom_resource.end + 1 + 2047) & ~2047UL;
	if (start < upper)
		start = upper;

	/* system rom */
	request_resource(&iomem_resource, &system_rom_resource);
	upper = system_rom_resource.start;

	/* check for extension rom (ignore length byte!) */
	rom = isa_bus_to_virt(extension_rom_resource.start);
	if (romsignature(rom)) {
		length = extension_rom_resource.end - extension_rom_resource.start + 1;
		if (romchecksum(rom, length)) {
			request_resource(&iomem_resource, &extension_rom_resource);
			/* adapter ROMs must now end below the extension ROM */
			upper = extension_rom_resource.start;
		}
	}

	/* check for adapter roms on 2k boundaries */
	for (i = 0; i < ADAPTER_ROM_RESOURCES && start < upper; start += 2048) {
		rom = isa_bus_to_virt(start);
		if (!romsignature(rom))
			continue;

		/* 0 < length <= 0x7f * 512, historically */
		length = rom[2] * 512;

		/* but accept any length that fits if checksum okay */
		if (!length || start + length > upper || !romchecksum(rom, length))
			continue;

		adapter_rom_resources[i].start = start;
		adapter_rom_resources[i].end = start + length - 1;
		request_resource(&iomem_resource, &adapter_rom_resources[i]);

		/* Move to the 2k block holding the last byte of this ROM; the
		   loop increment then steps past it. */
		start = adapter_rom_resources[i++].end & ~2047UL;
	}
}
280
/*
 * fullarg - check for a full argument with no trailing characters
 * @p:   current position in the command line (NUL-terminated)
 * @arg: option text to look for
 *
 * Returns 1 when @p starts with @arg and the character right after it is
 * either the end of the string or whitespace, otherwise 0.
 */
static int fullarg(const char *p, const char *arg)
{
	size_t l = strlen(arg);

	/*
	 * strncmp() stops at the terminating NUL of @p, so a command line
	 * tail shorter than @arg is never read past its end (memcmp() gives
	 * no such guarantee).
	 */
	if (strncmp(p, arg, l) != 0)
		return 0;

	/* cast keeps isspace() well defined for bytes >= 0x80 */
	return p[l] == '\0' || isspace((unsigned char)p[l]);
}
287
/*
 * parse_cmdline_early - act on early boot options and copy the command line
 * @cmdline_p: receives a pointer to command_line[]
 *
 * Walks COMMAND_LINE one character at a time, copying it into
 * command_line[] (at most COMMAND_LINE_SIZE - 1 characters plus the
 * terminating NUL).  Options are only examined at the very start of the
 * line and right after a ' ' character, because `c` holds the previously
 * copied character and starts out as ' '.
 *
 * Several `else if` branches below sit inside #ifdef blocks and attach to
 * the nearest preceding `if`; keep that in mind before reordering anything.
 */
static __init void parse_cmdline_early (char ** cmdline_p)
{
	char c = ' ', *to = command_line, *from = COMMAND_LINE;
	int len = 0;
	int userdef = 0;

	for (;;) {
		if (c != ' ')
			goto next_char;

#ifdef CONFIG_SMP
		/*
		 * If the BIOS enumerates physical processors before logical,
		 * maxcpus=N at enumeration-time can be used to disable HT.
		 */
		else if (!memcmp(from, "maxcpus=", 8)) {
			extern unsigned int maxcpus;

			maxcpus = simple_strtoul(from + 8, NULL, 0);
		}
#endif
#ifdef CONFIG_ACPI
		/* "acpi=off" disables both ACPI table parsing and interpreter init */
		if (fullarg(from,"acpi=off"))
			disable_acpi();

		if (fullarg(from, "acpi=force")) {
			/* add later when we do DMI horrors: */
			acpi_force = 1;
			acpi_disabled = 0;
		}

		/* acpi=ht just means: do ACPI MADT parsing
		   at bootup, but don't enable the full ACPI interpreter */
		if (fullarg(from, "acpi=ht")) {
			if (!acpi_force)
				disable_acpi();
			acpi_ht = 1;
		}
		else if (fullarg(from, "pci=noacpi"))
			acpi_disable_pci();
		else if (fullarg(from, "acpi=noirq"))
			acpi_noirq_set();

		else if (fullarg(from, "acpi_sci=edge"))
			acpi_sci_flags.trigger = 1;
		else if (fullarg(from, "acpi_sci=level"))
			acpi_sci_flags.trigger = 3;
		else if (fullarg(from, "acpi_sci=high"))
			acpi_sci_flags.polarity = 1;
		else if (fullarg(from, "acpi_sci=low"))
			acpi_sci_flags.polarity = 3;

		/* acpi=strict disables out-of-spec workarounds */
		else if (fullarg(from, "acpi=strict")) {
			acpi_strict = 1;
		}
#ifdef CONFIG_X86_IO_APIC
		else if (fullarg(from, "acpi_skip_timer_override"))
			acpi_skip_timer_override = 1;
#endif
#endif

		if (fullarg(from, "disable_timer_pin_1"))
			disable_timer_pin_1 = 1;
		if (fullarg(from, "enable_timer_pin_1"))
			disable_timer_pin_1 = -1;

		if (fullarg(from, "nolapic") || fullarg(from, "disableapic")) {
			clear_bit(X86_FEATURE_APIC, boot_cpu_data.x86_capability);
			disable_apic = 1;
		}

		if (fullarg(from, "noapic"))
			skip_ioapic_setup = 1;

		if (fullarg(from,"apic")) {
			skip_ioapic_setup = 0;
			ioapic_force = 1;
		}

		/* parse_memopt() receives &from and may move the read position */
		if (!memcmp(from, "mem=", 4))
			parse_memopt(from+4, &from);

		if (!memcmp(from, "memmap=", 7)) {
			/* exactmap option is for user defined memory */
			if (!memcmp(from+7, "exactmap", 8)) {
#ifdef CONFIG_CRASH_DUMP
				/* If we are doing a crash dump, we
				 * still need to know the real mem
				 * size before original memory map is
				 * reset.
				 */
				saved_max_pfn = e820_end_of_ram();
#endif
				/* skip "memmap=" (7) + "exactmap" (8) and
				   start from an empty e820 map */
				from += 8+7;
				end_pfn_map = 0;
				e820.nr_map = 0;
				userdef = 1;
			}
			else {
				parse_memmapopt(from+7, &from);
				userdef = 1;
			}
		}

#ifdef CONFIG_NUMA
		if (!memcmp(from, "numa=", 5))
			numa_setup(from+5);
#endif

		if (!memcmp(from,"iommu=",6)) {
			iommu_setup(from+6);
		}

		if (fullarg(from,"oops=panic"))
			panic_on_oops = 1;

		if (!memcmp(from, "noexec=", 7))
			nonx_setup(from + 7);

#ifdef CONFIG_KEXEC
		/* crashkernel=size@addr specifies the location to reserve for
		 * a crash kernel.  By reserving this memory we guarantee
		 * that linux never sets it up as a DMA target.
		 * Useful for holding code to do something appropriate
		 * after a kernel panic.
		 */
		else if (!memcmp(from, "crashkernel=", 12)) {
			unsigned long size, base;
			size = memparse(from+12, &from);
			if (*from == '@') {
				base = memparse(from+1, &from);
				/* FIXME: Do I want a sanity check
				 * to validate the memory range?
				 */
				crashk_res.start = base;
				crashk_res.end = base + size - 1;
			}
		}
#endif

#ifdef CONFIG_PROC_VMCORE
		/* elfcorehdr= specifies the location of elf core header
		 * stored by the crashed kernel. This option will be passed
		 * by kexec loader to the capture kernel.
		 */
		else if(!memcmp(from, "elfcorehdr=", 11))
			elfcorehdr_addr = memparse(from+11, &from);
#endif

#ifdef CONFIG_HOTPLUG_CPU
		else if (!memcmp(from, "additional_cpus=", 16))
			setup_additional_cpus(from+16);
#endif

	next_char:
		c = *(from++);
		if (!c)
			break;
		/* stop copying once only room for the terminating NUL is left */
		if (COMMAND_LINE_SIZE <= ++len)
			break;
		*(to++) = c;
	}
	if (userdef) {
		printk(KERN_INFO "user-defined physical RAM map:\n");
		e820_print_map("user");
	}
	*to = '\0';
	*cmdline_p = command_line;
}
459
Matt Tolentino2b976902005-06-23 00:08:06 -0700460#ifndef CONFIG_NUMA
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700461static void __init
462contig_initmem_init(unsigned long start_pfn, unsigned long end_pfn)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700463{
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700464 unsigned long bootmap_size, bootmap;
465
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700466 bootmap_size = bootmem_bootmap_pages(end_pfn)<<PAGE_SHIFT;
467 bootmap = find_e820_area(0, end_pfn<<PAGE_SHIFT, bootmap_size);
468 if (bootmap == -1L)
469 panic("Cannot find bootmem map of size %ld\n",bootmap_size);
470 bootmap_size = init_bootmem(bootmap >> PAGE_SHIFT, end_pfn);
471 e820_bootmem_free(NODE_DATA(0), 0, end_pfn << PAGE_SHIFT);
472 reserve_bootmem(bootmap, bootmap_size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700473}
474#endif
475
/* Use inline assembly to define this because the nops are defined
   as inline assembly strings in the include files and we cannot
   get them easily into strings. */
asm("\t.data\nk8nops: "
    K8_NOP1 K8_NOP2 K8_NOP3 K8_NOP4 K8_NOP5 K8_NOP6
    K8_NOP7 K8_NOP8);

extern unsigned char k8nops[];
/*
 * k8_nops[k] is where apply_alternatives() copies k padding bytes from.
 * The offsets assume each K8_NOPn emits exactly n bytes, so entry k starts
 * after the 1 + 2 + ... + (k - 1) bytes of the shorter sequences
 * (NOTE(review): confirm against the K8_NOPn definitions).
 */
static unsigned char *k8_nops[ASM_NOP_MAX+1] = {
     NULL,
     k8nops,
     k8nops + 1,
     k8nops + 1 + 2,
     k8nops + 1 + 2 + 3,
     k8nops + 1 + 2 + 3 + 4,
     k8nops + 1 + 2 + 3 + 4 + 5,
     k8nops + 1 + 2 + 3 + 4 + 5 + 6,
     k8nops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
};
495
extern char __vsyscall_0;

/* Replace instructions with better alternatives for this CPU type.

   This runs before SMP is initialized to avoid SMP problems with
   self modifying code. This implies that asymmetric systems where
   APs have less capabilities than the boot processor are not handled.
   In this case boot with "noreplacement".

   start/end delimit an array of struct alt_instr; end is exclusive. */
void apply_alternatives(void *start, void *end)
{
	struct alt_instr *a;
	int diff, i, k;
	for (a = start; (void *)a < end; a++) {
		u8 *instr;

		/* leave the original code alone when the feature is absent */
		if (!boot_cpu_has(a->cpuid))
			continue;

		/* the replacement must fit into the original instruction slot */
		BUG_ON(a->replacementlen > a->instrlen);
		instr = a->instr;
		/* vsyscall code is not mapped yet. resolve it manually. */
		if (instr >= (u8 *)VSYSCALL_START && instr < (u8*)VSYSCALL_END)
			instr = __va(instr - (u8*)VSYSCALL_START + (u8*)__pa_symbol(&__vsyscall_0));
		__inline_memcpy(instr, a->replacement, a->replacementlen);
		diff = a->instrlen - a->replacementlen;

		/* Pad the rest with nops */
		for (i = a->replacementlen; diff > 0; diff -= k, i += k) {
			/* at most ASM_NOP_MAX bytes of padding per step */
			k = diff;
			if (k > ASM_NOP_MAX)
				k = ASM_NOP_MAX;
			__inline_memcpy(instr + i, k8_nops[k], k);
		}
	}
}
531
532static int no_replacement __initdata = 0;
533
534void __init alternative_instructions(void)
535{
536 extern struct alt_instr __alt_instructions[], __alt_instructions_end[];
537 if (no_replacement)
538 return;
539 apply_alternatives(__alt_instructions, __alt_instructions_end);
540}
541
542static int __init noreplacement_setup(char *s)
543{
544 no_replacement = 1;
OGAWA Hirofumi9b410462006-03-31 02:30:33 -0800545 return 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700546}
547
548__setup("noreplacement", noreplacement_setup);
549
#if defined(CONFIG_EDD) || defined(CONFIG_EDD_MODULE)
struct edd edd;
#ifdef CONFIG_EDD_MODULE
EXPORT_SYMBOL(edd);
#endif
/**
 * copy_edd() - Copy the BIOS EDD information
 *              from boot_params into a safe place.
 *
 * Fills the two entry counts and the two tables of the global edd.
 */
static inline void copy_edd(void)
{
	edd.edd_info_nr = EDD_NR;
	edd.mbr_signature_nr = EDD_MBR_SIG_NR;
	memcpy(edd.edd_info, EDD_BUF, sizeof(edd.edd_info));
	memcpy(edd.mbr_signature, EDD_MBR_SIGNATURE,
	       sizeof(edd.mbr_signature));
}
#else
/* EDD support not configured: nothing to copy. */
static inline void copy_edd(void)
{
}
#endif
572
573#define EBDA_ADDR_POINTER 0x40E
Andi Kleenac71d122006-05-08 15:17:28 +0200574
575unsigned __initdata ebda_addr;
576unsigned __initdata ebda_size;
577
578static void discover_ebda(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700579{
Andi Kleenac71d122006-05-08 15:17:28 +0200580 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700581 * there is a real-mode segmented pointer pointing to the
582 * 4K EBDA area at 0x40E
583 */
Andi Kleenac71d122006-05-08 15:17:28 +0200584 ebda_addr = *(unsigned short *)EBDA_ADDR_POINTER;
585 ebda_addr <<= 4;
586
587 ebda_size = *(unsigned short *)(unsigned long)ebda_addr;
588
589 /* Round EBDA up to pages */
590 if (ebda_size == 0)
591 ebda_size = 1;
592 ebda_size <<= 10;
593 ebda_size = round_up(ebda_size + (ebda_addr & ~PAGE_MASK), PAGE_SIZE);
594 if (ebda_size > 64*1024)
595 ebda_size = 64*1024;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700596}
597
/*
 * setup_arch - architecture-specific boot-time initialisation
 * @cmdline_p: receives a pointer to the parsed kernel command line
 *
 * Runs, in order: copying of boot parameters, early command line parsing,
 * memory sizing and mapping, boot memory reservations, paging, ACPI/APIC
 * discovery and finally resource registration.  The steps depend on each
 * other; do not reorder them without checking every dependency.
 */
void __init setup_arch(char **cmdline_p)
{
	unsigned long kernel_end;

	/* take over the values left behind by the boot loader / setup code */
	ROOT_DEV = old_decode_dev(ORIG_ROOT_DEV);
	screen_info = SCREEN_INFO;
	edid_info = EDID_INFO;
	saved_video_mode = SAVED_VIDEO_MODE;
	bootloader_type = LOADER_TYPE;

#ifdef CONFIG_BLK_DEV_RAM
	rd_image_start = RAMDISK_FLAGS & RAMDISK_IMAGE_START_MASK;
	rd_prompt = ((RAMDISK_FLAGS & RAMDISK_PROMPT_FLAG) != 0);
	rd_doload = ((RAMDISK_FLAGS & RAMDISK_LOAD_FLAG) != 0);
#endif
	setup_memory_region();
	copy_edd();

	if (!MOUNT_ROOT_RDONLY)
		root_mountflags &= ~MS_RDONLY;
	init_mm.start_code = (unsigned long) &_text;
	init_mm.end_code = (unsigned long) &_etext;
	init_mm.end_data = (unsigned long) &_edata;
	init_mm.brk = (unsigned long) &_end;

	/* "Kernel data" starts where "Kernel code" ends (_etext) */
	code_resource.start = virt_to_phys(&_text);
	code_resource.end = virt_to_phys(&_etext)-1;
	data_resource.start = virt_to_phys(&_etext);
	data_resource.end = virt_to_phys(&_edata)-1;

	/* may rewrite the e820 map (mem=, memmap=), so it runs before
	   e820_end_of_ram() below */
	parse_cmdline_early(cmdline_p);

	early_identify_cpu(&boot_cpu_data);

	/*
	 * partially used pages are not usable - thus
	 * we are rounding upwards:
	 */
	end_pfn = e820_end_of_ram();
	num_physpages = end_pfn;		/* for pfn_valid */

	check_efer();

	discover_ebda();

	init_memory_mapping(0, (end_pfn_map << PAGE_SHIFT));

	dmi_scan_machine();

	zap_low_mappings(0);

#ifdef CONFIG_ACPI
	/*
	 * Initialize the ACPI boot-time table parser (gets the RSDP and SDT).
	 * Call this early for SRAT node setup.
	 */
	acpi_boot_table_init();
#endif

#ifdef CONFIG_ACPI_NUMA
	/*
	 * Parse SRAT to discover nodes.
	 */
	acpi_numa_init();
#endif

#ifdef CONFIG_NUMA
	numa_initmem_init(0, end_pfn);
#else
	contig_initmem_init(0, end_pfn);
#endif

	/* Reserve direct mapping */
	reserve_bootmem_generic(table_start << PAGE_SHIFT,
				(table_end - table_start) << PAGE_SHIFT);

	/* reserve kernel */
	kernel_end = round_up(__pa_symbol(&_end),PAGE_SIZE);
	reserve_bootmem_generic(HIGH_MEMORY, kernel_end - HIGH_MEMORY);

	/*
	 * reserve physical page 0 - it's a special BIOS page on many boxes,
	 * enabling clean reboots, SMP operation, laptop functions.
	 */
	reserve_bootmem_generic(0, PAGE_SIZE);

	/* reserve ebda region */
	if (ebda_addr)
		reserve_bootmem_generic(ebda_addr, ebda_size);

#ifdef CONFIG_SMP
	/*
	 * But first pinch a few for the stack/trampoline stuff
	 * FIXME: Don't need the extra page at 4K, but need to fix
	 * trampoline before removing it. (see the GDT stuff)
	 */
	reserve_bootmem_generic(PAGE_SIZE, PAGE_SIZE);

	/* Reserve SMP trampoline */
	reserve_bootmem_generic(SMP_TRAMPOLINE_BASE, PAGE_SIZE);
#endif

#ifdef CONFIG_ACPI_SLEEP
	/*
	 * Reserve low memory region for sleep support.
	 */
	acpi_reserve_bootmem();
#endif
#ifdef CONFIG_X86_LOCAL_APIC
	/*
	 * Find and reserve possible boot-time SMP configuration:
	 */
	find_smp_config();
#endif
#ifdef CONFIG_BLK_DEV_INITRD
	if (LOADER_TYPE && INITRD_START) {
		/* only accept an initrd that lies entirely below end_pfn */
		if (INITRD_START + INITRD_SIZE <= (end_pfn << PAGE_SHIFT)) {
			reserve_bootmem_generic(INITRD_START, INITRD_SIZE);
			initrd_start =
				INITRD_START ? INITRD_START + PAGE_OFFSET : 0;
			initrd_end = initrd_start+INITRD_SIZE;
		}
		else {
			printk(KERN_ERR "initrd extends beyond end of memory "
			    "(0x%08lx > 0x%08lx)\ndisabling initrd\n",
			    (unsigned long)(INITRD_START + INITRD_SIZE),
			    (unsigned long)(end_pfn << PAGE_SHIFT));
			initrd_start = 0;
		}
	}
#endif
#ifdef CONFIG_KEXEC
	/* start != end means crashkernel= supplied a range
	   (see parse_cmdline_early()) */
	if (crashk_res.start != crashk_res.end) {
		reserve_bootmem_generic(crashk_res.start,
			crashk_res.end - crashk_res.start + 1);
	}
#endif

	paging_init();

	check_ioapic();

	/*
	 * set this early, so we don't allocate cpu0
	 * if the MADT list doesn't list the BSP first
	 * mpparse.c/MP_processor_info() allocates logical cpu numbers.
	 */
	cpu_set(0, cpu_present_map);
#ifdef CONFIG_ACPI
	/*
	 * Read APIC and some other early information from ACPI tables.
	 */
	acpi_boot_init();
#endif

	init_cpu_to_node();

#ifdef CONFIG_X86_LOCAL_APIC
	/*
	 * get boot-time SMP configuration:
	 */
	if (smp_found_config)
		get_smp_config();
	init_apic_mappings();
#endif

	/*
	 * Request address space for all standard RAM and ROM resources
	 * and also for regions reported as reserved by the e820.
	 */
	probe_roms();
	e820_reserve_resources();

	request_resource(&iomem_resource, &video_ram_resource);

	{
	unsigned i;
	/* request I/O space for devices used on all i[345]86 PCs */
	for (i = 0; i < STANDARD_IO_RESOURCES; i++)
		request_resource(&ioport_resource, &standard_io_resources[i]);
	}

	e820_setup_gap();

#ifdef CONFIG_GART_IOMMU
	iommu_hole_init();
#endif

#ifdef CONFIG_VT
#if defined(CONFIG_VGA_CONSOLE)
	conswitchp = &vga_con;
#elif defined(CONFIG_DUMMY_CONSOLE)
	conswitchp = &dummy_con;
#endif
#endif
}
794
Ashok Raje6982c62005-06-25 14:54:58 -0700795static int __cpuinit get_model_name(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700796{
797 unsigned int *v;
798
Andi Kleenebfcaa92005-04-16 15:25:18 -0700799 if (c->extended_cpuid_level < 0x80000004)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700800 return 0;
801
802 v = (unsigned int *) c->x86_model_id;
803 cpuid(0x80000002, &v[0], &v[1], &v[2], &v[3]);
804 cpuid(0x80000003, &v[4], &v[5], &v[6], &v[7]);
805 cpuid(0x80000004, &v[8], &v[9], &v[10], &v[11]);
806 c->x86_model_id[48] = 0;
807 return 1;
808}
809
810
Ashok Raje6982c62005-06-25 14:54:58 -0700811static void __cpuinit display_cacheinfo(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700812{
813 unsigned int n, dummy, eax, ebx, ecx, edx;
814
Andi Kleenebfcaa92005-04-16 15:25:18 -0700815 n = c->extended_cpuid_level;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700816
817 if (n >= 0x80000005) {
818 cpuid(0x80000005, &dummy, &ebx, &ecx, &edx);
819 printk(KERN_INFO "CPU: L1 I Cache: %dK (%d bytes/line), D cache %dK (%d bytes/line)\n",
820 edx>>24, edx&0xFF, ecx>>24, ecx&0xFF);
821 c->x86_cache_size=(ecx>>24)+(edx>>24);
822 /* On K8 L1 TLB is inclusive, so don't count it */
823 c->x86_tlbsize = 0;
824 }
825
826 if (n >= 0x80000006) {
827 cpuid(0x80000006, &dummy, &ebx, &ecx, &edx);
828 ecx = cpuid_ecx(0x80000006);
829 c->x86_cache_size = ecx >> 16;
830 c->x86_tlbsize += ((ebx >> 16) & 0xfff) + (ebx & 0xfff);
831
832 printk(KERN_INFO "CPU: L2 Cache: %dK (%d bytes/line)\n",
833 c->x86_cache_size, ecx & 0xFF);
834 }
835
836 if (n >= 0x80000007)
837 cpuid(0x80000007, &dummy, &dummy, &dummy, &c->x86_power);
838 if (n >= 0x80000008) {
839 cpuid(0x80000008, &eax, &dummy, &dummy, &dummy);
840 c->x86_virt_bits = (eax >> 8) & 0xff;
841 c->x86_phys_bits = eax & 0xff;
842 }
843}
844
#ifdef CONFIG_NUMA
/*
 * nearby_node - find an online node belonging to a neighbouring APIC id
 *
 * Looks at the APIC ids below @apicid first (closest one first), then at
 * those above it up to MAX_LOCAL_APIC, and returns the first mapped node
 * that is online.  Falls back to the first online node.
 */
static int nearby_node(int apicid)
{
	int idx, node;

	idx = apicid;
	while (--idx >= 0) {
		node = apicid_to_node[idx];
		if (node != NUMA_NO_NODE && node_online(node))
			return node;
	}

	idx = apicid;
	while (++idx < MAX_LOCAL_APIC) {
		node = apicid_to_node[idx];
		if (node != NUMA_NO_NODE && node_online(node))
			return node;
	}

	return first_node(node_online_map); /* Shouldn't happen */
}
#endif
862
/*
 * On an AMD dual core setup the lower bits of the APIC id distinguish the cores.
 * Assumes number of cores is a power of two.
 *
 * Sets c->x86_max_cores, cpu_core_id[] and phys_proc_id[] for the current
 * CPU and, with CONFIG_NUMA, also picks and records its node.  Does nothing
 * without CONFIG_SMP.
 */
static void __init amd_detect_cmp(struct cpuinfo_x86 *c)
{
#ifdef CONFIG_SMP
	int cpu = smp_processor_id();
	unsigned bits;
#ifdef CONFIG_NUMA
	int node = 0;
	unsigned apicid = hard_smp_processor_id();
#endif
	unsigned ecx = cpuid_ecx(0x80000008);

	/* the low byte of ecx is the core count minus one */
	c->x86_max_cores = (ecx & 0xff) + 1;

	/* CPU telling us the core id bits shift? */
	bits = (ecx >> 12) & 0xF;

	/* Otherwise recompute */
	if (bits == 0) {
		/* smallest bit count that can number all cores */
		while ((1 << bits) < c->x86_max_cores)
			bits++;
	}

	/* Low order bits define the core id (index of core in socket) */
	cpu_core_id[cpu] = phys_proc_id[cpu] & ((1 << bits)-1);
	/* Convert the APIC ID into the socket ID */
	phys_proc_id[cpu] = phys_pkg_id(bits);

#ifdef CONFIG_NUMA
	/* start from the socket id; an explicit APIC id mapping wins */
	node = phys_proc_id[cpu];
	if (apicid_to_node[apicid] != NUMA_NO_NODE)
		node = apicid_to_node[apicid];
	if (!node_online(node)) {
		/* Two possibilities here:
		   - The CPU is missing memory and no node was created.
		   In that case try picking one from a nearby CPU
		   - The APIC IDs differ from the HyperTransport node IDs
		   which the K8 northbridge parsing fills in.
		   Assume they are all increased by a constant offset,
		   but in the same order as the HT nodeids.
		   If that doesn't result in a usable node fall back to the
		   path for the previous case.  */
		int ht_nodeid = apicid - (phys_proc_id[0] << bits);
		if (ht_nodeid >= 0 &&
		    apicid_to_node[ht_nodeid] != NUMA_NO_NODE)
			node = apicid_to_node[ht_nodeid];
		/* Pick a nearby node */
		if (!node_online(node))
			node = nearby_node(apicid);
	}
	numa_set_node(cpu, node);

	printk(KERN_INFO "CPU %d/%x(%d) -> Node %d -> Core %d\n",
			cpu, apicid, c->x86_max_cores, node, cpu_core_id[cpu]);
#endif
#endif
}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700923
924static int __init init_amd(struct cpuinfo_x86 *c)
925{
926 int r;
Andi Kleen7bcd3f32006-02-03 21:51:02 +0100927 unsigned level;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700928
Linus Torvaldsbc5e8fd2005-09-17 15:41:04 -0700929#ifdef CONFIG_SMP
930 unsigned long value;
931
Andi Kleen7d318d72005-09-29 22:05:55 +0200932 /*
933 * Disable TLB flush filter by setting HWCR.FFDIS on K8
934 * bit 6 of msr C001_0015
935 *
936 * Errata 63 for SH-B3 steppings
937 * Errata 122 for all steppings (F+ have it disabled by default)
938 */
939 if (c->x86 == 15) {
940 rdmsrl(MSR_K8_HWCR, value);
941 value |= 1 << 6;
942 wrmsrl(MSR_K8_HWCR, value);
943 }
Linus Torvaldsbc5e8fd2005-09-17 15:41:04 -0700944#endif
945
Linus Torvalds1da177e2005-04-16 15:20:36 -0700946 /* Bit 31 in normal CPUID used for nonstandard 3DNow ID;
947 3DNow is IDd by bit 31 in extended CPUID (1*32+31) anyway */
948 clear_bit(0*32+31, &c->x86_capability);
949
Andi Kleen7bcd3f32006-02-03 21:51:02 +0100950 /* On C+ stepping K8 rep microcode works well for copy/memset */
951 level = cpuid_eax(1);
952 if (c->x86 == 15 && ((level >= 0x0f48 && level < 0x0f50) || level >= 0x0f58))
953 set_bit(X86_FEATURE_REP_GOOD, &c->x86_capability);
954
Andi Kleen18bd0572006-04-20 02:36:45 +0200955 /* Enable workaround for FXSAVE leak */
956 if (c->x86 >= 6)
957 set_bit(X86_FEATURE_FXSAVE_LEAK, &c->x86_capability);
958
Linus Torvalds1da177e2005-04-16 15:20:36 -0700959 r = get_model_name(c);
960 if (!r) {
961 switch (c->x86) {
962 case 15:
963 /* Should distinguish Models here, but this is only
964 a fallback anyways. */
965 strcpy(c->x86_model_id, "Hammer");
966 break;
967 }
968 }
969 display_cacheinfo(c);
970
Andi Kleen130951c2006-01-11 22:42:02 +0100971 /* c->x86_power is 8000_0007 edx. Bit 8 is constant TSC */
972 if (c->x86_power & (1<<8))
973 set_bit(X86_FEATURE_CONSTANT_TSC, &c->x86_capability);
974
Andi Kleenfaee9a52006-06-26 13:56:10 +0200975 /* Multi core CPU? */
976 if (c->extended_cpuid_level >= 0x80000008)
Andi Kleen63518642005-04-16 15:25:16 -0700977 amd_detect_cmp(c);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700978
979 return r;
980}
981
Ashok Raje6982c62005-06-25 14:54:58 -0700982static void __cpuinit detect_ht(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700983{
984#ifdef CONFIG_SMP
985 u32 eax, ebx, ecx, edx;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100986 int index_msb, core_bits;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700987 int cpu = smp_processor_id();
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100988
989 cpuid(1, &eax, &ebx, &ecx, &edx);
990
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100991
Andi Kleen63518642005-04-16 15:25:16 -0700992 if (!cpu_has(c, X86_FEATURE_HT) || cpu_has(c, X86_FEATURE_CMP_LEGACY))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700993 return;
994
Linus Torvalds1da177e2005-04-16 15:20:36 -0700995 smp_num_siblings = (ebx & 0xff0000) >> 16;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100996
Linus Torvalds1da177e2005-04-16 15:20:36 -0700997 if (smp_num_siblings == 1) {
998 printk(KERN_INFO "CPU: Hyper-Threading is disabled\n");
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100999 } else if (smp_num_siblings > 1 ) {
1000
Linus Torvalds1da177e2005-04-16 15:20:36 -07001001 if (smp_num_siblings > NR_CPUS) {
1002 printk(KERN_WARNING "CPU: Unsupported number of the siblings %d", smp_num_siblings);
1003 smp_num_siblings = 1;
1004 return;
1005 }
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001006
1007 index_msb = get_count_order(smp_num_siblings);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001008 phys_proc_id[cpu] = phys_pkg_id(index_msb);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001009
Linus Torvalds1da177e2005-04-16 15:20:36 -07001010 printk(KERN_INFO "CPU: Physical Processor ID: %d\n",
1011 phys_proc_id[cpu]);
Andi Kleen3dd9d512005-04-16 15:25:15 -07001012
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001013 smp_num_siblings = smp_num_siblings / c->x86_max_cores;
Andi Kleen3dd9d512005-04-16 15:25:15 -07001014
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001015 index_msb = get_count_order(smp_num_siblings) ;
Andi Kleen3dd9d512005-04-16 15:25:15 -07001016
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001017 core_bits = get_count_order(c->x86_max_cores);
Andi Kleen3dd9d512005-04-16 15:25:15 -07001018
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001019 cpu_core_id[cpu] = phys_pkg_id(index_msb) &
1020 ((1 << core_bits) - 1);
1021
1022 if (c->x86_max_cores > 1)
Andi Kleen3dd9d512005-04-16 15:25:15 -07001023 printk(KERN_INFO "CPU: Processor Core ID: %d\n",
1024 cpu_core_id[cpu]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001025 }
1026#endif
1027}
1028
Andi Kleen3dd9d512005-04-16 15:25:15 -07001029/*
1030 * find out the number of processor cores on the die
1031 */
Ashok Raje6982c62005-06-25 14:54:58 -07001032static int __cpuinit intel_num_cpu_cores(struct cpuinfo_x86 *c)
Andi Kleen3dd9d512005-04-16 15:25:15 -07001033{
1034 unsigned int eax;
1035
1036 if (c->cpuid_level < 4)
1037 return 1;
1038
1039 __asm__("cpuid"
1040 : "=a" (eax)
1041 : "0" (4), "c" (0)
1042 : "bx", "dx");
1043
1044 if (eax & 0x1f)
1045 return ((eax >> 26) + 1);
1046 else
1047 return 1;
1048}
1049
/*
 * Bind the current CPU to the node recorded for its APIC id in
 * apicid_to_node[], falling back to the first online node when no node is
 * recorded.  No-op without CONFIG_NUMA.
 */
static void srat_detect_node(void)
{
#ifdef CONFIG_NUMA
	int this_cpu = smp_processor_id();
	/*
	 * Don't do the funky fallback heuristics the AMD version employs
	 * for now.
	 */
	unsigned nid = apicid_to_node[hard_smp_processor_id()];

	if (nid == NUMA_NO_NODE)
		nid = first_node(node_online_map);
	numa_set_node(this_cpu, nid);

	if (acpi_numa > 0)
		printk(KERN_INFO "CPU %d -> Node %d\n", this_cpu, nid);
#endif
}
1067
Ashok Raje6982c62005-06-25 14:54:58 -07001068static void __cpuinit init_intel(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001069{
1070 /* Cache sizes */
1071 unsigned n;
1072
1073 init_intel_cacheinfo(c);
Andi Kleenebfcaa92005-04-16 15:25:18 -07001074 n = c->extended_cpuid_level;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001075 if (n >= 0x80000008) {
1076 unsigned eax = cpuid_eax(0x80000008);
1077 c->x86_virt_bits = (eax >> 8) & 0xff;
1078 c->x86_phys_bits = eax & 0xff;
Shaohua Liaf9c1422005-11-05 17:25:54 +01001079 /* CPUID workaround for Intel 0F34 CPU */
1080 if (c->x86_vendor == X86_VENDOR_INTEL &&
1081 c->x86 == 0xF && c->x86_model == 0x3 &&
1082 c->x86_mask == 0x4)
1083 c->x86_phys_bits = 36;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001084 }
1085
1086 if (c->x86 == 15)
1087 c->x86_cache_alignment = c->x86_clflush_size * 2;
Andi Kleen39b3a792006-01-11 22:42:45 +01001088 if ((c->x86 == 0xf && c->x86_model >= 0x03) ||
1089 (c->x86 == 0x6 && c->x86_model >= 0x0e))
Andi Kleenc29601e2005-04-16 15:25:05 -07001090 set_bit(X86_FEATURE_CONSTANT_TSC, &c->x86_capability);
Andi Kleenc818a182006-01-11 22:45:24 +01001091 set_bit(X86_FEATURE_SYNC_RDTSC, &c->x86_capability);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001092 c->x86_max_cores = intel_num_cpu_cores(c);
Andi Kleendf0cc262005-09-12 18:49:24 +02001093
1094 srat_detect_node();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001095}
1096
Adrian Bunk672289e2005-09-10 00:27:21 -07001097static void __cpuinit get_cpu_vendor(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001098{
1099 char *v = c->x86_vendor_id;
1100
1101 if (!strcmp(v, "AuthenticAMD"))
1102 c->x86_vendor = X86_VENDOR_AMD;
1103 else if (!strcmp(v, "GenuineIntel"))
1104 c->x86_vendor = X86_VENDOR_INTEL;
1105 else
1106 c->x86_vendor = X86_VENDOR_UNKNOWN;
1107}
1108
/*
 * Table entry mapping a (vendor, family) pair to per-model names.
 * NOTE(review): no user of this structure is visible in this part of the
 * file; the field meanings below are inferred from the names - confirm.
 */
struct cpu_model_info {
	int vendor;		/* presumably an X86_VENDOR_* value */
	int family;		/* presumably the CPU family number */
	char *model_names[16];	/* presumably indexed by model number */
};
1114
1115/* Do some early cpuid on the boot CPU to get some parameter that are
1116 needed before check_bugs. Everything advanced is in identify_cpu
1117 below. */
Ashok Raje6982c62005-06-25 14:54:58 -07001118void __cpuinit early_identify_cpu(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001119{
1120 u32 tfms;
1121
1122 c->loops_per_jiffy = loops_per_jiffy;
1123 c->x86_cache_size = -1;
1124 c->x86_vendor = X86_VENDOR_UNKNOWN;
1125 c->x86_model = c->x86_mask = 0; /* So far unknown... */
1126 c->x86_vendor_id[0] = '\0'; /* Unset */
1127 c->x86_model_id[0] = '\0'; /* Unset */
1128 c->x86_clflush_size = 64;
1129 c->x86_cache_alignment = c->x86_clflush_size;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001130 c->x86_max_cores = 1;
Andi Kleenebfcaa92005-04-16 15:25:18 -07001131 c->extended_cpuid_level = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001132 memset(&c->x86_capability, 0, sizeof c->x86_capability);
1133
1134 /* Get vendor name */
1135 cpuid(0x00000000, (unsigned int *)&c->cpuid_level,
1136 (unsigned int *)&c->x86_vendor_id[0],
1137 (unsigned int *)&c->x86_vendor_id[8],
1138 (unsigned int *)&c->x86_vendor_id[4]);
1139
1140 get_cpu_vendor(c);
1141
1142 /* Initialize the standard set of capabilities */
1143 /* Note that the vendor-specific code below might override */
1144
1145 /* Intel-defined flags: level 0x00000001 */
1146 if (c->cpuid_level >= 0x00000001) {
1147 __u32 misc;
1148 cpuid(0x00000001, &tfms, &misc, &c->x86_capability[4],
1149 &c->x86_capability[0]);
1150 c->x86 = (tfms >> 8) & 0xf;
1151 c->x86_model = (tfms >> 4) & 0xf;
1152 c->x86_mask = tfms & 0xf;
Suresh Siddhaf5f786d2005-11-05 17:25:53 +01001153 if (c->x86 == 0xf)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001154 c->x86 += (tfms >> 20) & 0xff;
Suresh Siddhaf5f786d2005-11-05 17:25:53 +01001155 if (c->x86 >= 0x6)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001156 c->x86_model += ((tfms >> 16) & 0xF) << 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001157 if (c->x86_capability[0] & (1<<19))
1158 c->x86_clflush_size = ((misc >> 8) & 0xff) * 8;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001159 } else {
1160 /* Have CPUID level 0 only - unheard of */
1161 c->x86 = 4;
1162 }
Andi Kleena1586082005-05-16 21:53:21 -07001163
1164#ifdef CONFIG_SMP
Andi Kleenb41e2932005-05-20 14:27:55 -07001165 phys_proc_id[smp_processor_id()] = (cpuid_ebx(1) >> 24) & 0xff;
Andi Kleena1586082005-05-16 21:53:21 -07001166#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001167}
1168
1169/*
1170 * This does the hard work of actually picking apart the CPU stuff...
1171 */
Ashok Raje6982c62005-06-25 14:54:58 -07001172void __cpuinit identify_cpu(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001173{
1174 int i;
1175 u32 xlvl;
1176
1177 early_identify_cpu(c);
1178
1179 /* AMD-defined flags: level 0x80000001 */
1180 xlvl = cpuid_eax(0x80000000);
Andi Kleenebfcaa92005-04-16 15:25:18 -07001181 c->extended_cpuid_level = xlvl;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001182 if ((xlvl & 0xffff0000) == 0x80000000) {
1183 if (xlvl >= 0x80000001) {
1184 c->x86_capability[1] = cpuid_edx(0x80000001);
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001185 c->x86_capability[6] = cpuid_ecx(0x80000001);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001186 }
1187 if (xlvl >= 0x80000004)
1188 get_model_name(c); /* Default name */
1189 }
1190
1191 /* Transmeta-defined flags: level 0x80860001 */
1192 xlvl = cpuid_eax(0x80860000);
1193 if ((xlvl & 0xffff0000) == 0x80860000) {
1194 /* Don't set x86_cpuid_level here for now to not confuse. */
1195 if (xlvl >= 0x80860001)
1196 c->x86_capability[2] = cpuid_edx(0x80860001);
1197 }
1198
Siddha, Suresh B1e9f28f2006-03-27 01:15:22 -08001199 c->apicid = phys_pkg_id(0);
1200
Linus Torvalds1da177e2005-04-16 15:20:36 -07001201 /*
1202 * Vendor-specific initialization. In this section we
1203 * canonicalize the feature flags, meaning if there are
1204 * features a certain CPU supports which CPUID doesn't
1205 * tell us, CPUID claiming incorrect flags, or other bugs,
1206 * we handle them here.
1207 *
1208 * At the end of this section, c->x86_capability better
1209 * indicate the features this CPU genuinely supports!
1210 */
1211 switch (c->x86_vendor) {
1212 case X86_VENDOR_AMD:
1213 init_amd(c);
1214 break;
1215
1216 case X86_VENDOR_INTEL:
1217 init_intel(c);
1218 break;
1219
1220 case X86_VENDOR_UNKNOWN:
1221 default:
1222 display_cacheinfo(c);
1223 break;
1224 }
1225
1226 select_idle_routine(c);
1227 detect_ht(c);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001228
1229 /*
1230 * On SMP, boot_cpu_data holds the common feature set between
1231 * all CPUs; so make sure that we indicate which features are
1232 * common between the CPUs. The first time this routine gets
1233 * executed, c == &boot_cpu_data.
1234 */
1235 if (c != &boot_cpu_data) {
1236 /* AND the already accumulated flags with these */
1237 for (i = 0 ; i < NCAPINTS ; i++)
1238 boot_cpu_data.x86_capability[i] &= c->x86_capability[i];
1239 }
1240
1241#ifdef CONFIG_X86_MCE
1242 mcheck_init(c);
1243#endif
Shaohua Li3b520b22005-07-07 17:56:38 -07001244 if (c == &boot_cpu_data)
1245 mtrr_bp_init();
1246 else
1247 mtrr_ap_init();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001248#ifdef CONFIG_NUMA
Andi Kleen3019e8e2005-07-28 21:15:28 -07001249 numa_add_cpu(smp_processor_id());
Linus Torvalds1da177e2005-04-16 15:20:36 -07001250#endif
1251}
1252
1253
Ashok Raje6982c62005-06-25 14:54:58 -07001254void __cpuinit print_cpu_info(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001255{
1256 if (c->x86_model_id[0])
1257 printk("%s", c->x86_model_id);
1258
1259 if (c->x86_mask || c->cpuid_level >= 0)
1260 printk(" stepping %02x\n", c->x86_mask);
1261 else
1262 printk("\n");
1263}
1264
1265/*
1266 * Get CPU information for use by the procfs.
1267 */
1268
1269static int show_cpuinfo(struct seq_file *m, void *v)
1270{
1271 struct cpuinfo_x86 *c = v;
1272
1273 /*
1274 * These flag bits must match the definitions in <asm/cpufeature.h>.
1275 * NULL means this bit is undefined or reserved; either way it doesn't
1276 * have meaning as far as Linux is concerned. Note that it's important
1277 * to realize there is a difference between this table and CPUID -- if
1278 * applications want to get the raw CPUID data, they should access
1279 * /dev/cpu/<cpu_nr>/cpuid instead.
1280 */
1281 static char *x86_cap_flags[] = {
1282 /* Intel-defined */
1283 "fpu", "vme", "de", "pse", "tsc", "msr", "pae", "mce",
1284 "cx8", "apic", NULL, "sep", "mtrr", "pge", "mca", "cmov",
1285 "pat", "pse36", "pn", "clflush", NULL, "dts", "acpi", "mmx",
1286 "fxsr", "sse", "sse2", "ss", "ht", "tm", "ia64", NULL,
1287
1288 /* AMD-defined */
Zwane Mwaikambo3c3b73b2005-05-01 08:58:51 -07001289 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001290 NULL, NULL, NULL, "syscall", NULL, NULL, NULL, NULL,
1291 NULL, NULL, NULL, NULL, "nx", NULL, "mmxext", NULL,
Andi Kleen3f98bc42006-01-11 22:42:51 +01001292 NULL, "fxsr_opt", "rdtscp", NULL, NULL, "lm", "3dnowext", "3dnow",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001293
1294 /* Transmeta-defined */
1295 "recovery", "longrun", NULL, "lrti", NULL, NULL, NULL, NULL,
1296 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1297 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1298 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1299
1300 /* Other (Linux-defined) */
Andi Kleen622dcaf2005-05-16 21:53:26 -07001301 "cxmmx", NULL, "cyrix_arr", "centaur_mcr", NULL,
Andi Kleenc29601e2005-04-16 15:25:05 -07001302 "constant_tsc", NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001303 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1304 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1305 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1306
1307 /* Intel-defined (#2) */
Andi Kleen9d95dd82006-03-25 16:31:22 +01001308 "pni", NULL, NULL, "monitor", "ds_cpl", "vmx", "smx", "est",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001309 "tm2", NULL, "cid", NULL, NULL, "cx16", "xtpr", NULL,
1310 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1311 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1312
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001313 /* VIA/Cyrix/Centaur-defined */
1314 NULL, NULL, "rng", "rng_en", NULL, NULL, "ace", "ace_en",
1315 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1316 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1317 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1318
Linus Torvalds1da177e2005-04-16 15:20:36 -07001319 /* AMD-defined (#2) */
Andi Kleen3f98bc42006-01-11 22:42:51 +01001320 "lahf_lm", "cmp_legacy", "svm", NULL, "cr8_legacy", NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001321 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1322 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001323 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001324 };
1325 static char *x86_power_flags[] = {
1326 "ts", /* temperature sensor */
1327 "fid", /* frequency id control */
1328 "vid", /* voltage id control */
1329 "ttp", /* thermal trip */
1330 "tm",
Andi Kleen3f98bc42006-01-11 22:42:51 +01001331 "stc",
1332 NULL,
Andi Kleen39b3a792006-01-11 22:42:45 +01001333 /* nothing */ /* constant_tsc - moved to flags */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001334 };
1335
1336
1337#ifdef CONFIG_SMP
1338 if (!cpu_online(c-cpu_data))
1339 return 0;
1340#endif
1341
1342 seq_printf(m,"processor\t: %u\n"
1343 "vendor_id\t: %s\n"
1344 "cpu family\t: %d\n"
1345 "model\t\t: %d\n"
1346 "model name\t: %s\n",
1347 (unsigned)(c-cpu_data),
1348 c->x86_vendor_id[0] ? c->x86_vendor_id : "unknown",
1349 c->x86,
1350 (int)c->x86_model,
1351 c->x86_model_id[0] ? c->x86_model_id : "unknown");
1352
1353 if (c->x86_mask || c->cpuid_level >= 0)
1354 seq_printf(m, "stepping\t: %d\n", c->x86_mask);
1355 else
1356 seq_printf(m, "stepping\t: unknown\n");
1357
1358 if (cpu_has(c,X86_FEATURE_TSC)) {
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -08001359 unsigned int freq = cpufreq_quick_get((unsigned)(c-cpu_data));
1360 if (!freq)
1361 freq = cpu_khz;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001362 seq_printf(m, "cpu MHz\t\t: %u.%03u\n",
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -08001363 freq / 1000, (freq % 1000));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001364 }
1365
1366 /* Cache size */
1367 if (c->x86_cache_size >= 0)
1368 seq_printf(m, "cache size\t: %d KB\n", c->x86_cache_size);
1369
1370#ifdef CONFIG_SMP
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001371 if (smp_num_siblings * c->x86_max_cores > 1) {
Andi Kleendb468682005-04-16 15:24:51 -07001372 int cpu = c - cpu_data;
1373 seq_printf(m, "physical id\t: %d\n", phys_proc_id[cpu]);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001374 seq_printf(m, "siblings\t: %d\n", cpus_weight(cpu_core_map[cpu]));
Siddha, Suresh Bd31ddaa2005-04-16 15:25:20 -07001375 seq_printf(m, "core id\t\t: %d\n", cpu_core_id[cpu]);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001376 seq_printf(m, "cpu cores\t: %d\n", c->booted_cores);
Andi Kleendb468682005-04-16 15:24:51 -07001377 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001378#endif
1379
1380 seq_printf(m,
1381 "fpu\t\t: yes\n"
1382 "fpu_exception\t: yes\n"
1383 "cpuid level\t: %d\n"
1384 "wp\t\t: yes\n"
1385 "flags\t\t:",
1386 c->cpuid_level);
1387
1388 {
1389 int i;
1390 for ( i = 0 ; i < 32*NCAPINTS ; i++ )
Akinobu Mita3d1712c2006-03-24 03:15:11 -08001391 if (cpu_has(c, i) && x86_cap_flags[i] != NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001392 seq_printf(m, " %s", x86_cap_flags[i]);
1393 }
1394
1395 seq_printf(m, "\nbogomips\t: %lu.%02lu\n",
1396 c->loops_per_jiffy/(500000/HZ),
1397 (c->loops_per_jiffy/(5000/HZ)) % 100);
1398
1399 if (c->x86_tlbsize > 0)
1400 seq_printf(m, "TLB size\t: %d 4K pages\n", c->x86_tlbsize);
1401 seq_printf(m, "clflush size\t: %d\n", c->x86_clflush_size);
1402 seq_printf(m, "cache_alignment\t: %d\n", c->x86_cache_alignment);
1403
1404 seq_printf(m, "address sizes\t: %u bits physical, %u bits virtual\n",
1405 c->x86_phys_bits, c->x86_virt_bits);
1406
1407 seq_printf(m, "power management:");
1408 {
1409 unsigned i;
1410 for (i = 0; i < 32; i++)
1411 if (c->x86_power & (1 << i)) {
Andi Kleen3f98bc42006-01-11 22:42:51 +01001412 if (i < ARRAY_SIZE(x86_power_flags) &&
1413 x86_power_flags[i])
1414 seq_printf(m, "%s%s",
1415 x86_power_flags[i][0]?" ":"",
1416 x86_power_flags[i]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001417 else
1418 seq_printf(m, " [%d]", i);
1419 }
1420 }
Andi Kleen3dd9d512005-04-16 15:25:15 -07001421
Siddha, Suresh Bd31ddaa2005-04-16 15:25:20 -07001422 seq_printf(m, "\n\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001423
Linus Torvalds1da177e2005-04-16 15:20:36 -07001424 return 0;
1425}
1426
1427static void *c_start(struct seq_file *m, loff_t *pos)
1428{
1429 return *pos < NR_CPUS ? cpu_data + *pos : NULL;
1430}
1431
1432static void *c_next(struct seq_file *m, void *v, loff_t *pos)
1433{
1434 ++*pos;
1435 return c_start(m, pos);
1436}
1437
/* seq_file ->stop callback: intentionally empty. */
static void c_stop(struct seq_file *m, void *v)
{
}
1441
1442struct seq_operations cpuinfo_op = {
1443 .start =c_start,
1444 .next = c_next,
1445 .stop = c_stop,
1446 .show = show_cpuinfo,
1447};
Andi Kleene9928672006-01-11 22:43:33 +01001448
#ifdef CONFIG_INPUT_PCSPKR
#include <linux/platform_device.h>
/*
 * Register a "pcspkr" platform device at device_initcall time.
 *
 * Returns 0 on success, -ENOMEM if the device could not be allocated, or
 * the error returned by platform_device_add().
 */
static __init int add_pcspkr(void)
{
	struct platform_device *spkr;
	int err;

	spkr = platform_device_alloc("pcspkr", -1);
	if (spkr == NULL)
		return -ENOMEM;

	err = platform_device_add(spkr);
	if (err != 0) {
		/* Registration failed: drop the reference taken by alloc. */
		platform_device_put(spkr);
	}

	return err;
}
device_initcall(add_pcspkr);
#endif