blob: 4b7e022169701a712cc69ad29184b3f64ba2d850 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * linux/arch/x86-64/kernel/setup.c
3 *
4 * Copyright (C) 1995 Linus Torvalds
5 *
6 * Nov 2001 Dave Jones <davej@suse.de>
7 * Forked from i386 setup code.
8 *
9 * $Id$
10 */
11
12/*
13 * This file handles the architecture-dependent parts of initialization
14 */
15
16#include <linux/errno.h>
17#include <linux/sched.h>
18#include <linux/kernel.h>
19#include <linux/mm.h>
20#include <linux/stddef.h>
21#include <linux/unistd.h>
22#include <linux/ptrace.h>
23#include <linux/slab.h>
24#include <linux/user.h>
25#include <linux/a.out.h>
26#include <linux/tty.h>
27#include <linux/ioport.h>
28#include <linux/delay.h>
29#include <linux/config.h>
30#include <linux/init.h>
31#include <linux/initrd.h>
32#include <linux/highmem.h>
33#include <linux/bootmem.h>
34#include <linux/module.h>
35#include <asm/processor.h>
36#include <linux/console.h>
37#include <linux/seq_file.h>
Vivek Goyalaac04b32006-01-09 20:51:47 -080038#include <linux/crash_dump.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070039#include <linux/root_dev.h>
40#include <linux/pci.h>
41#include <linux/acpi.h>
42#include <linux/kallsyms.h>
43#include <linux/edd.h>
Matt Tolentinobbfceef2005-06-23 00:08:07 -070044#include <linux/mmzone.h>
Eric W. Biederman5f5609d2005-06-25 14:58:04 -070045#include <linux/kexec.h>
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -080046#include <linux/cpufreq.h>
Andi Kleene9928672006-01-11 22:43:33 +010047#include <linux/dmi.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010048#include <linux/dma-mapping.h>
Andi Kleen681558f2006-03-25 16:29:46 +010049#include <linux/ctype.h>
Matt Tolentinobbfceef2005-06-23 00:08:07 -070050
Linus Torvalds1da177e2005-04-16 15:20:36 -070051#include <asm/mtrr.h>
52#include <asm/uaccess.h>
53#include <asm/system.h>
54#include <asm/io.h>
55#include <asm/smp.h>
56#include <asm/msr.h>
57#include <asm/desc.h>
58#include <video/edid.h>
59#include <asm/e820.h>
60#include <asm/dma.h>
61#include <asm/mpspec.h>
62#include <asm/mmu_context.h>
63#include <asm/bootsetup.h>
64#include <asm/proto.h>
65#include <asm/setup.h>
66#include <asm/mach_apic.h>
67#include <asm/numa.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010068#include <asm/swiotlb.h>
Andi Kleen2bc04142005-11-05 17:25:53 +010069#include <asm/sections.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010070#include <asm/gart-mapping.h>
Andi Kleenf2d3efe2006-03-25 16:30:22 +010071#include <asm/dmi.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070072
73/*
74 * Machine setup..
75 */
76
Ravikiran G Thirumalai6c231b72005-09-06 15:17:45 -070077struct cpuinfo_x86 boot_cpu_data __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -070078
79unsigned long mmu_cr4_features;
80
81int acpi_disabled;
82EXPORT_SYMBOL(acpi_disabled);
Len Brown888ba6c2005-08-24 12:07:20 -040083#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -070084extern int __initdata acpi_ht;
85extern acpi_interrupt_flags acpi_sci_flags;
86int __initdata acpi_force = 0;
87#endif
88
89int acpi_numa __initdata;
90
Linus Torvalds1da177e2005-04-16 15:20:36 -070091/* Boot loader ID as an integer, for the benefit of proc_dointvec */
92int bootloader_type;
93
94unsigned long saved_video_mode;
95
Andi Kleenf2d3efe2006-03-25 16:30:22 +010096/*
97 * Early DMI memory
98 */
99int dmi_alloc_index;
100char dmi_alloc_data[DMI_MAX_DATA];
101
Linus Torvalds1da177e2005-04-16 15:20:36 -0700102/*
103 * Setup options
104 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105struct screen_info screen_info;
/*
 * Variable-length descriptor table: a 16-bit length field followed by a
 * zero-length trailing byte array that overlays the table payload.
 * NOTE(review): nothing in this part of the file uses the type - confirm
 * whether it is still needed.
 */
106struct sys_desc_table_struct {
107 unsigned short length;
108 unsigned char table[0];
109};
110
111struct edid_info edid_info;
112struct e820map e820;
113
114extern int root_mountflags;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700115
116char command_line[COMMAND_LINE_SIZE];
117
/*
 * Fixed legacy I/O port ranges.  Every entry is flagged
 * IORESOURCE_BUSY | IORESOURCE_IO; setup_arch() requests each of them
 * from ioport_resource.
 */
118struct resource standard_io_resources[] = {
119 { .name = "dma1", .start = 0x00, .end = 0x1f,
120 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
121 { .name = "pic1", .start = 0x20, .end = 0x21,
122 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
123 { .name = "timer0", .start = 0x40, .end = 0x43,
124 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
125 { .name = "timer1", .start = 0x50, .end = 0x53,
126 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
127 { .name = "keyboard", .start = 0x60, .end = 0x6f,
128 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
129 { .name = "dma page reg", .start = 0x80, .end = 0x8f,
130 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
131 { .name = "pic2", .start = 0xa0, .end = 0xa1,
132 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
133 { .name = "dma2", .start = 0xc0, .end = 0xdf,
134 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
135 { .name = "fpu", .start = 0xf0, .end = 0xff,
136 .flags = IORESOURCE_BUSY | IORESOURCE_IO }
137};
138
139#define STANDARD_IO_RESOURCES \
140 (sizeof standard_io_resources / sizeof standard_io_resources[0])
141
142#define IORESOURCE_RAM (IORESOURCE_BUSY | IORESOURCE_MEM)
143
/*
 * Physical range of the kernel data.  start/end are placeholders here;
 * setup_arch() fills them in from _etext and _edata.
 */
144struct resource data_resource = {
145 .name = "Kernel data",
146 .start = 0,
147 .end = 0,
148 .flags = IORESOURCE_RAM,
149};
/*
 * Physical range of the kernel text.  start/end are placeholders here;
 * setup_arch() fills them in from _text and _etext.
 */
150struct resource code_resource = {
151 .name = "Kernel code",
152 .start = 0,
153 .end = 0,
154 .flags = IORESOURCE_RAM,
155};
156
157#define IORESOURCE_ROM (IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM)
158
/*
 * System ROM window 0xf0000-0xfffff; probe_roms() requests it
 * unconditionally.
 */
159static struct resource system_rom_resource = {
160 .name = "System ROM",
161 .start = 0xf0000,
162 .end = 0xfffff,
163 .flags = IORESOURCE_ROM,
164};
165
/*
 * Extension ROM window 0xe0000-0xeffff; probe_roms() only requests it when
 * a ROM signature is present and the checksum over the whole window is zero.
 */
166static struct resource extension_rom_resource = {
167 .name = "Extension ROM",
168 .start = 0xe0000,
169 .end = 0xeffff,
170 .flags = IORESOURCE_ROM,
171};
172
/*
 * Slots for adapter ROMs discovered by probe_roms(), which fills in
 * start/end of each slot it uses.  The preset start of slot 0 (0xc8000)
 * also serves as the upper bound of the video ROM scan.
 */
173static struct resource adapter_rom_resources[] = {
174 { .name = "Adapter ROM", .start = 0xc8000, .end = 0,
175 .flags = IORESOURCE_ROM },
176 { .name = "Adapter ROM", .start = 0, .end = 0,
177 .flags = IORESOURCE_ROM },
178 { .name = "Adapter ROM", .start = 0, .end = 0,
179 .flags = IORESOURCE_ROM },
180 { .name = "Adapter ROM", .start = 0, .end = 0,
181 .flags = IORESOURCE_ROM },
182 { .name = "Adapter ROM", .start = 0, .end = 0,
183 .flags = IORESOURCE_ROM },
184 { .name = "Adapter ROM", .start = 0, .end = 0,
185 .flags = IORESOURCE_ROM }
186};
187
188#define ADAPTER_ROM_RESOURCES \
189 (sizeof adapter_rom_resources / sizeof adapter_rom_resources[0])
190
/*
 * Default video ROM window 0xc0000-0xc7fff.  probe_roms() moves start to
 * the address where a signature is found and, if the checksum matches,
 * sets end from the ROM's length byte.
 */
191static struct resource video_rom_resource = {
192 .name = "Video ROM",
193 .start = 0xc0000,
194 .end = 0xc7fff,
195 .flags = IORESOURCE_ROM,
196};
197
/*
 * Video RAM window 0xa0000-0xbffff; setup_arch() requests it from
 * iomem_resource.
 */
198static struct resource video_ram_resource = {
199 .name = "Video RAM area",
200 .start = 0xa0000,
201 .end = 0xbffff,
202 .flags = IORESOURCE_RAM,
203};
204
205#define romsignature(x) (*(unsigned short *)(x) == 0xaa55)
206
/*
 * Add up the @length bytes of the ROM image at @rom in 8-bit arithmetic.
 * Returns 1 when the sum wraps to zero (checksum valid), 0 otherwise.
 * A zero @length therefore yields 1.
 */
static int __init romchecksum(unsigned char *rom, unsigned long length)
{
	unsigned char total = 0;
	unsigned long off;

	for (off = 0; off < length; off++)
		total += rom[off];

	return total == 0;
}
215
216static void __init probe_roms(void)
217{
218 unsigned long start, length, upper;
219 unsigned char *rom;
220 int i;
221
222 /* video rom */
223 upper = adapter_rom_resources[0].start;
224 for (start = video_rom_resource.start; start < upper; start += 2048) {
225 rom = isa_bus_to_virt(start);
226 if (!romsignature(rom))
227 continue;
228
229 video_rom_resource.start = start;
230
231 /* 0 < length <= 0x7f * 512, historically */
232 length = rom[2] * 512;
233
234 /* if checksum okay, trust length byte */
235 if (length && romchecksum(rom, length))
236 video_rom_resource.end = start + length - 1;
237
238 request_resource(&iomem_resource, &video_rom_resource);
239 break;
240 }
241
242 start = (video_rom_resource.end + 1 + 2047) & ~2047UL;
243 if (start < upper)
244 start = upper;
245
246 /* system rom */
247 request_resource(&iomem_resource, &system_rom_resource);
248 upper = system_rom_resource.start;
249
250 /* check for extension rom (ignore length byte!) */
251 rom = isa_bus_to_virt(extension_rom_resource.start);
252 if (romsignature(rom)) {
253 length = extension_rom_resource.end - extension_rom_resource.start + 1;
254 if (romchecksum(rom, length)) {
255 request_resource(&iomem_resource, &extension_rom_resource);
256 upper = extension_rom_resource.start;
257 }
258 }
259
260 /* check for adapter roms on 2k boundaries */
261 for (i = 0; i < ADAPTER_ROM_RESOURCES && start < upper; start += 2048) {
262 rom = isa_bus_to_virt(start);
263 if (!romsignature(rom))
264 continue;
265
266 /* 0 < length <= 0x7f * 512, historically */
267 length = rom[2] * 512;
268
269 /* but accept any length that fits if checksum okay */
270 if (!length || start + length > upper || !romchecksum(rom, length))
271 continue;
272
273 adapter_rom_resources[i].start = start;
274 adapter_rom_resources[i].end = start + length - 1;
275 request_resource(&iomem_resource, &adapter_rom_resources[i]);
276
277 start = adapter_rom_resources[i++].end & ~2047UL;
278 }
279}
280
/*
 * Check for a full argument with no trailing characters.
 *
 * @p:   current position in the command line (NUL-terminated)
 * @arg: option text to look for
 *
 * Returns non-zero when the text at @p is exactly @arg followed by either
 * the end of the string or whitespace, zero otherwise.
 */
static int fullarg(const char *p, const char *arg)
{
	size_t l = strlen(arg);

	/*
	 * strncmp() stops at the terminating NUL of @p, so a command line
	 * that ends before @arg does is never read past its end.
	 * The cast keeps isspace() away from negative char values.
	 */
	return !strncmp(p, arg, l) &&
	       (p[l] == '\0' || isspace((unsigned char)p[l]));
}
287
/*
 * Copy the boot command line (COMMAND_LINE) into command_line one character
 * at a time and, at the start of the line and after every space, check the
 * upcoming text for options that must take effect early.
 *
 * At most COMMAND_LINE_SIZE - 1 characters are copied; the copy is then
 * NUL-terminated and *cmdline_p is pointed at command_line.
 *
 * Note on structure: several "else if" branches sit inside #ifdef blocks and
 * attach to whichever "if" precedes them once the preprocessor has run, so
 * the order of the tests below must not be changed casually.
 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288static __init void parse_cmdline_early (char ** cmdline_p)
289{
/* c starts as ' ' so that the option checks also run at the very first character */
290 char c = ' ', *to = command_line, *from = COMMAND_LINE;
291 int len = 0;
/* set when a memmap= option was seen; triggers the map printout after the loop */
akpm@osdl.org69cda7b2006-01-09 20:51:46 -0800292 int userdef = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294 for (;;) {
/* options are only recognised directly after a space */
295 if (c != ' ')
296 goto next_char;
297
298#ifdef CONFIG_SMP
299 /*
300 * If the BIOS enumerates physical processors before logical,
301 * maxcpus=N at enumeration-time can be used to disable HT.
302 */
/* this "else" pairs with the "if (c != ' ')" above */
303 else if (!memcmp(from, "maxcpus=", 8)) {
304 extern unsigned int maxcpus;
305
306 maxcpus = simple_strtoul(from + 8, NULL, 0);
307 }
308#endif
Len Brown888ba6c2005-08-24 12:07:20 -0400309#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -0700310 /* "acpi=off" disables both ACPI table parsing and interpreter init */
Andi Kleen681558f2006-03-25 16:29:46 +0100311 if (fullarg(from,"acpi=off"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312 disable_acpi();
313
Andi Kleen681558f2006-03-25 16:29:46 +0100314 if (fullarg(from, "acpi=force")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315 /* add later when we do DMI horrors: */
316 acpi_force = 1;
317 acpi_disabled = 0;
318 }
319
320 /* acpi=ht just means: do ACPI MADT parsing
321 at bootup, but don't enable the full ACPI interpreter */
Andi Kleen681558f2006-03-25 16:29:46 +0100322 if (fullarg(from, "acpi=ht")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323 if (!acpi_force)
324 disable_acpi();
325 acpi_ht = 1;
326 }
Andi Kleen681558f2006-03-25 16:29:46 +0100327 else if (fullarg(from, "pci=noacpi"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700328 acpi_disable_pci();
Andi Kleen681558f2006-03-25 16:29:46 +0100329 else if (fullarg(from, "acpi=noirq"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700330 acpi_noirq_set();
331
Andi Kleen681558f2006-03-25 16:29:46 +0100332 else if (fullarg(from, "acpi_sci=edge"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700333 acpi_sci_flags.trigger = 1;
Andi Kleen681558f2006-03-25 16:29:46 +0100334 else if (fullarg(from, "acpi_sci=level"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335 acpi_sci_flags.trigger = 3;
Andi Kleen681558f2006-03-25 16:29:46 +0100336 else if (fullarg(from, "acpi_sci=high"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700337 acpi_sci_flags.polarity = 1;
Andi Kleen681558f2006-03-25 16:29:46 +0100338 else if (fullarg(from, "acpi_sci=low"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339 acpi_sci_flags.polarity = 3;
340
341 /* acpi=strict disables out-of-spec workarounds */
Andi Kleen681558f2006-03-25 16:29:46 +0100342 else if (fullarg(from, "acpi=strict")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700343 acpi_strict = 1;
344 }
Andi Kleen22999242005-04-16 15:25:17 -0700345#ifdef CONFIG_X86_IO_APIC
Andi Kleen681558f2006-03-25 16:29:46 +0100346 else if (fullarg(from, "acpi_skip_timer_override"))
Andi Kleen22999242005-04-16 15:25:17 -0700347 acpi_skip_timer_override = 1;
348#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349#endif
350
Andi Kleen681558f2006-03-25 16:29:46 +0100351 if (fullarg(from, "disable_timer_pin_1"))
Chuck Ebbert66759a02005-09-12 18:49:25 +0200352 disable_timer_pin_1 = 1;
Andi Kleen681558f2006-03-25 16:29:46 +0100353 if (fullarg(from, "enable_timer_pin_1"))
Chuck Ebbert66759a02005-09-12 18:49:25 +0200354 disable_timer_pin_1 = -1;
355
/* both spellings clear the APIC feature bit of the boot CPU and set disable_apic */
Andi Kleend1530d82006-04-07 19:49:42 +0200356 if (fullarg(from, "nolapic") || fullarg(from, "disableapic")) {
357 clear_bit(X86_FEATURE_APIC, boot_cpu_data.x86_capability);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700358 disable_apic = 1;
Andi Kleend1530d82006-04-07 19:49:42 +0200359 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700360
Andi Kleen681558f2006-03-25 16:29:46 +0100361 if (fullarg(from, "noapic"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700362 skip_ioapic_setup = 1;
363
Andi Kleen681558f2006-03-25 16:29:46 +0100364 if (fullarg(from,"apic")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700365 skip_ioapic_setup = 0;
366 ioapic_force = 1;
367 }
368
/* &from is handed to the helper; presumably it advances the cursor past the value - confirm in parse_memopt() */
369 if (!memcmp(from, "mem=", 4))
370 parse_memopt(from+4, &from);
371
akpm@osdl.org69cda7b2006-01-09 20:51:46 -0800372 if (!memcmp(from, "memmap=", 7)) {
373 /* exactmap option is for user defined memory */
374 if (!memcmp(from+7, "exactmap", 8)) {
375#ifdef CONFIG_CRASH_DUMP
376 /* If we are doing a crash dump, we
377 * still need to know the real mem
378 * size before original memory map is
379 * reset.
380 */
381 saved_max_pfn = e820_end_of_ram();
382#endif
/* skip "memmap=" (7) plus "exactmap" (8), then drop the existing e820 map */
383 from += 8+7;
384 end_pfn_map = 0;
385 e820.nr_map = 0;
386 userdef = 1;
387 }
388 else {
389 parse_memmapopt(from+7, &from);
390 userdef = 1;
391 }
392 }
393
Matt Tolentino2b976902005-06-23 00:08:06 -0700394#ifdef CONFIG_NUMA
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395 if (!memcmp(from, "numa=", 5))
396 numa_setup(from+5);
397#endif
398
Linus Torvalds1da177e2005-04-16 15:20:36 -0700399 if (!memcmp(from,"iommu=",6)) {
400 iommu_setup(from+6);
401 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700402
Andi Kleen681558f2006-03-25 16:29:46 +0100403 if (fullarg(from,"oops=panic"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700404 panic_on_oops = 1;
405
/* the "else if" branches in the #ifdef blocks below chain onto this "if" */
406 if (!memcmp(from, "noexec=", 7))
407 nonx_setup(from + 7);
408
Eric W. Biederman5f5609d2005-06-25 14:58:04 -0700409#ifdef CONFIG_KEXEC
410 /* crashkernel=size@addr specifies the location to reserve for
411 * a crash kernel. By reserving this memory we guarantee
412 * that linux never sets it up as a DMA target.
413 * Useful for holding code to do something appropriate
414 * after a kernel panic.
415 */
416 else if (!memcmp(from, "crashkernel=", 12)) {
417 unsigned long size, base;
418 size = memparse(from+12, &from);
/* without an "@addr" part the option is ignored: crashk_res stays untouched */
419 if (*from == '@') {
420 base = memparse(from+1, &from);
421 /* FIXME: Do I want a sanity check
422 * to validate the memory range?
423 */
424 crashk_res.start = base;
425 crashk_res.end = base + size - 1;
426 }
427 }
428#endif
429
Vivek Goyalaac04b32006-01-09 20:51:47 -0800430#ifdef CONFIG_PROC_VMCORE
431 /* elfcorehdr= specifies the location of elf core header
432 * stored by the crashed kernel. This option will be passed
433 * by kexec loader to the capture kernel.
434 */
435 else if(!memcmp(from, "elfcorehdr=", 11))
436 elfcorehdr_addr = memparse(from+11, &from);
437#endif
Andi Kleene2c03882006-02-26 04:18:46 +0100438
Brian Magnusond5176122006-02-27 04:02:04 +0100439#ifdef CONFIG_HOTPLUG_CPU
Andi Kleene2c03882006-02-26 04:18:46 +0100440 else if (!memcmp(from, "additional_cpus=", 16))
441 setup_additional_cpus(from+16);
442#endif
443
Linus Torvalds1da177e2005-04-16 15:20:36 -0700444 next_char:
/* copy one character; stop at the NUL or when the destination would overflow */
445 c = *(from++);
446 if (!c)
447 break;
448 if (COMMAND_LINE_SIZE <= ++len)
449 break;
450 *(to++) = c;
451 }
akpm@osdl.org69cda7b2006-01-09 20:51:46 -0800452 if (userdef) {
453 printk(KERN_INFO "user-defined physical RAM map:\n");
454 e820_print_map("user");
455 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700456 *to = '\0';
457 *cmdline_p = command_line;
458}
459
Matt Tolentino2b976902005-06-23 00:08:06 -0700460#ifndef CONFIG_NUMA
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700461static void __init
462contig_initmem_init(unsigned long start_pfn, unsigned long end_pfn)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700463{
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700464 unsigned long bootmap_size, bootmap;
465
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700466 bootmap_size = bootmem_bootmap_pages(end_pfn)<<PAGE_SHIFT;
467 bootmap = find_e820_area(0, end_pfn<<PAGE_SHIFT, bootmap_size);
468 if (bootmap == -1L)
469 panic("Cannot find bootmem map of size %ld\n",bootmap_size);
470 bootmap_size = init_bootmem(bootmap >> PAGE_SHIFT, end_pfn);
471 e820_bootmem_free(NODE_DATA(0), 0, end_pfn << PAGE_SHIFT);
472 reserve_bootmem(bootmap, bootmap_size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700473}
474#endif
475
476/* Use inline assembly to define this because the nops are defined
477 as inline assembly strings in the include files and we cannot
478 get them easily into strings. */
/* k8nops: the K8_NOP1 ... K8_NOP8 sequences emitted back to back into .data */
479asm("\t.data\nk8nops: "
480 K8_NOP1 K8_NOP2 K8_NOP3 K8_NOP4 K8_NOP5 K8_NOP6
481 K8_NOP7 K8_NOP8);
482
483extern unsigned char k8nops[];
/*
 * k8_nops[n] points at the n-byte NOP inside k8nops.  Since the blob holds
 * the 1-, 2-, ..., 8-byte NOPs in that order, the n-byte one starts at
 * offset 1 + 2 + ... + (n - 1).  Index 0 is unused.
 * NOTE(review): the table has nine initialisers, so this layout relies on
 * ASM_NOP_MAX being 8 - confirm against the header that defines it.
 */
484static unsigned char *k8_nops[ASM_NOP_MAX+1] = {
485 NULL,
486 k8nops,
487 k8nops + 1,
488 k8nops + 1 + 2,
489 k8nops + 1 + 2 + 3,
490 k8nops + 1 + 2 + 3 + 4,
491 k8nops + 1 + 2 + 3 + 4 + 5,
492 k8nops + 1 + 2 + 3 + 4 + 5 + 6,
493 k8nops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
494};
495
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100496extern char __vsyscall_0;
497
Linus Torvalds1da177e2005-04-16 15:20:36 -0700498/* Replace instructions with better alternatives for this CPU type.
499
500 This runs before SMP is initialized to avoid SMP problems with
501 self modifying code. This implies that assymetric systems where
502 APs have less capabilities than the boot processor are not handled.
503 In this case boot with "noreplacement". */
504void apply_alternatives(void *start, void *end)
505{
506 struct alt_instr *a;
507 int diff, i, k;
508 for (a = start; (void *)a < end; a++) {
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100509 u8 *instr;
510
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511 if (!boot_cpu_has(a->cpuid))
512 continue;
513
514 BUG_ON(a->replacementlen > a->instrlen);
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100515 instr = a->instr;
516 /* vsyscall code is not mapped yet. resolve it manually. */
517 if (instr >= (u8 *)VSYSCALL_START && instr < (u8*)VSYSCALL_END)
518 instr = __va(instr - (u8*)VSYSCALL_START + (u8*)__pa_symbol(&__vsyscall_0));
519 __inline_memcpy(instr, a->replacement, a->replacementlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700520 diff = a->instrlen - a->replacementlen;
521
522 /* Pad the rest with nops */
523 for (i = a->replacementlen; diff > 0; diff -= k, i += k) {
524 k = diff;
525 if (k > ASM_NOP_MAX)
526 k = ASM_NOP_MAX;
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100527 __inline_memcpy(instr + i, k8_nops[k], k);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700528 }
529 }
530}
531
532static int no_replacement __initdata = 0;
533
534void __init alternative_instructions(void)
535{
536 extern struct alt_instr __alt_instructions[], __alt_instructions_end[];
537 if (no_replacement)
538 return;
539 apply_alternatives(__alt_instructions, __alt_instructions_end);
540}
541
542static int __init noreplacement_setup(char *s)
543{
544 no_replacement = 1;
OGAWA Hirofumi9b410462006-03-31 02:30:33 -0800545 return 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700546}
547
548__setup("noreplacement", noreplacement_setup);
549
550#if defined(CONFIG_EDD) || defined(CONFIG_EDD_MODULE)
551struct edd edd;
552#ifdef CONFIG_EDD_MODULE
553EXPORT_SYMBOL(edd);
554#endif
555/**
556 * copy_edd() - Copy the BIOS EDD information
557 * from boot_params into a safe place.
558 *
559 */
560static inline void copy_edd(void)
561{
562 memcpy(edd.mbr_signature, EDD_MBR_SIGNATURE, sizeof(edd.mbr_signature));
563 memcpy(edd.edd_info, EDD_BUF, sizeof(edd.edd_info));
564 edd.mbr_signature_nr = EDD_MBR_SIG_NR;
565 edd.edd_info_nr = EDD_NR;
566}
567#else
/* EDD support is not configured: there is nothing to copy. */
static inline void copy_edd(void)
{
	/* intentionally empty */
}
571#endif
572
573#define EBDA_ADDR_POINTER 0x40E
Andi Kleenac71d122006-05-08 15:17:28 +0200574
575unsigned __initdata ebda_addr;
576unsigned __initdata ebda_size;
577
578static void discover_ebda(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700579{
Andi Kleenac71d122006-05-08 15:17:28 +0200580 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700581 * there is a real-mode segmented pointer pointing to the
582 * 4K EBDA area at 0x40E
583 */
Andi Kleenac71d122006-05-08 15:17:28 +0200584 ebda_addr = *(unsigned short *)EBDA_ADDR_POINTER;
585 ebda_addr <<= 4;
586
587 ebda_size = *(unsigned short *)(unsigned long)ebda_addr;
588
589 /* Round EBDA up to pages */
590 if (ebda_size == 0)
591 ebda_size = 1;
592 ebda_size <<= 10;
593 ebda_size = round_up(ebda_size + (ebda_addr & ~PAGE_MASK), PAGE_SIZE);
594 if (ebda_size > 64*1024)
595 ebda_size = 64*1024;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700596}
597
/*
 * Architecture-specific part of early boot.
 *
 * As visible from the calls below, this: copies boot parameters into kernel
 * variables, sets up the e820 memory map, records the kernel image layout,
 * parses the early command line, sets up the direct mapping and the bootmem
 * allocator, reserves memory that must not be handed out (kernel image,
 * page 0, EBDA, SMP trampoline, initrd, crash kernel), initialises paging,
 * reads ACPI/MP configuration and registers the standard ROM/RAM/I/O
 * resources.
 *
 * @cmdline_p: set by parse_cmdline_early() to point at the saved command line.
 *
 * The steps depend on each other; keep their order.
 */
598void __init setup_arch(char **cmdline_p)
599{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700600 unsigned long kernel_end;
601
/* take over the values handed in through the boot parameter macros */
602 ROOT_DEV = old_decode_dev(ORIG_ROOT_DEV);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700603 screen_info = SCREEN_INFO;
604 edid_info = EDID_INFO;
605 saved_video_mode = SAVED_VIDEO_MODE;
606 bootloader_type = LOADER_TYPE;
607
608#ifdef CONFIG_BLK_DEV_RAM
609 rd_image_start = RAMDISK_FLAGS & RAMDISK_IMAGE_START_MASK;
610 rd_prompt = ((RAMDISK_FLAGS & RAMDISK_PROMPT_FLAG) != 0);
611 rd_doload = ((RAMDISK_FLAGS & RAMDISK_LOAD_FLAG) != 0);
612#endif
613 setup_memory_region();
614 copy_edd();
615
616 if (!MOUNT_ROOT_RDONLY)
617 root_mountflags &= ~MS_RDONLY;
/* describe the kernel image in init_mm and in the code/data resources */
618 init_mm.start_code = (unsigned long) &_text;
619 init_mm.end_code = (unsigned long) &_etext;
620 init_mm.end_data = (unsigned long) &_edata;
621 init_mm.brk = (unsigned long) &_end;
622
623 code_resource.start = virt_to_phys(&_text);
624 code_resource.end = virt_to_phys(&_etext)-1;
625 data_resource.start = virt_to_phys(&_etext);
626 data_resource.end = virt_to_phys(&_edata)-1;
627
628 parse_cmdline_early(cmdline_p);
629
630 early_identify_cpu(&boot_cpu_data);
631
632 /*
633 * partially used pages are not usable - thus
634 * we are rounding upwards:
635 */
636 end_pfn = e820_end_of_ram();
Andi Kleen1f502492006-03-25 16:29:58 +0100637 num_physpages = end_pfn; /* for pfn_valid */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700638
639 check_efer();
640
/* reads low memory through plain physical addresses, so it runs before zap_low_mappings() */
Andi Kleenac71d122006-05-08 15:17:28 +0200641 discover_ebda();
642
Linus Torvalds1da177e2005-04-16 15:20:36 -0700643 init_memory_mapping(0, (end_pfn_map << PAGE_SHIFT));
644
Andi Kleenf2d3efe2006-03-25 16:30:22 +0100645 dmi_scan_machine();
646
Siddha, Suresh Bf6c2e332005-11-05 17:25:53 +0100647 zap_low_mappings(0);
648
Len Brown888ba6c2005-08-24 12:07:20 -0400649#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -0700650 /*
651 * Initialize the ACPI boot-time table parser (gets the RSDP and SDT).
652 * Call this early for SRAT node setup.
653 */
654 acpi_boot_table_init();
655#endif
656
657#ifdef CONFIG_ACPI_NUMA
658 /*
659 * Parse SRAT to discover nodes.
660 */
661 acpi_numa_init();
662#endif
663
/* bring up the bootmem allocator for pfns 0..end_pfn */
Matt Tolentino2b976902005-06-23 00:08:06 -0700664#ifdef CONFIG_NUMA
Linus Torvalds1da177e2005-04-16 15:20:36 -0700665 numa_initmem_init(0, end_pfn);
666#else
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700667 contig_initmem_init(0, end_pfn);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700668#endif
669
670 /* Reserve direct mapping */
671 reserve_bootmem_generic(table_start << PAGE_SHIFT,
672 (table_end - table_start) << PAGE_SHIFT);
673
674 /* reserve kernel */
675 kernel_end = round_up(__pa_symbol(&_end),PAGE_SIZE);
676 reserve_bootmem_generic(HIGH_MEMORY, kernel_end - HIGH_MEMORY);
677
678 /*
679 * reserve physical page 0 - it's a special BIOS page on many boxes,
680 * enabling clean reboots, SMP operation, laptop functions.
681 */
682 reserve_bootmem_generic(0, PAGE_SIZE);
683
684 /* reserve ebda region */
Andi Kleenac71d122006-05-08 15:17:28 +0200685 if (ebda_addr)
686 reserve_bootmem_generic(ebda_addr, ebda_size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700687
688#ifdef CONFIG_SMP
689 /*
690 * But first pinch a few for the stack/trampoline stuff
691 * FIXME: Don't need the extra page at 4K, but need to fix
692 * trampoline before removing it. (see the GDT stuff)
693 */
694 reserve_bootmem_generic(PAGE_SIZE, PAGE_SIZE);
695
696 /* Reserve SMP trampoline */
697 reserve_bootmem_generic(SMP_TRAMPOLINE_BASE, PAGE_SIZE);
698#endif
699
700#ifdef CONFIG_ACPI_SLEEP
701 /*
702 * Reserve low memory region for sleep support.
703 */
704 acpi_reserve_bootmem();
705#endif
706#ifdef CONFIG_X86_LOCAL_APIC
707 /*
708 * Find and reserve possible boot-time SMP configuration:
709 */
710 find_smp_config();
711#endif
712#ifdef CONFIG_BLK_DEV_INITRD
/* only use an initrd that lies completely below the end of RAM */
713 if (LOADER_TYPE && INITRD_START) {
714 if (INITRD_START + INITRD_SIZE <= (end_pfn << PAGE_SHIFT)) {
715 reserve_bootmem_generic(INITRD_START, INITRD_SIZE);
/* NOTE(review): INITRD_START is already known to be non-zero here, so the ": 0" arm is never taken */
716 initrd_start =
717 INITRD_START ? INITRD_START + PAGE_OFFSET : 0;
718 initrd_end = initrd_start+INITRD_SIZE;
719 }
720 else {
721 printk(KERN_ERR "initrd extends beyond end of memory "
722 "(0x%08lx > 0x%08lx)\ndisabling initrd\n",
723 (unsigned long)(INITRD_START + INITRD_SIZE),
724 (unsigned long)(end_pfn << PAGE_SHIFT));
725 initrd_start = 0;
726 }
727 }
728#endif
Eric W. Biederman5f5609d2005-06-25 14:58:04 -0700729#ifdef CONFIG_KEXEC
/* start != end is used as the sign that crashkernel= set up a region */
730 if (crashk_res.start != crashk_res.end) {
Amul Shah00212fe2006-06-25 05:49:31 -0700731 reserve_bootmem_generic(crashk_res.start,
Eric W. Biederman5f5609d2005-06-25 14:58:04 -0700732 crashk_res.end - crashk_res.start + 1);
733 }
734#endif
Eric W. Biederman0d317fb2005-08-06 13:47:36 -0600735
Linus Torvalds1da177e2005-04-16 15:20:36 -0700736 paging_init();
737
738 check_ioapic();
739
Ashok Raj51f62e12006-03-25 16:29:28 +0100740 /*
741 * set this early, so we don't allocate cpu0
742 * if MADT list doesn't list BSP first
743 * mpparse.c/MP_processor_info() allocates logical cpu numbers.
744 */
745 cpu_set(0, cpu_present_map);
Len Brown888ba6c2005-08-24 12:07:20 -0400746#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -0700747 /*
748 * Read APIC and some other early information from ACPI tables.
749 */
750 acpi_boot_init();
751#endif
752
Ravikiran Thirumalai05b3cbd2006-01-11 22:45:36 +0100753 init_cpu_to_node();
754
Linus Torvalds1da177e2005-04-16 15:20:36 -0700755#ifdef CONFIG_X86_LOCAL_APIC
756 /*
757 * get boot-time SMP configuration:
758 */
759 if (smp_found_config)
760 get_smp_config();
761 init_apic_mappings();
762#endif
763
764 /*
765 * Request address space for all standard RAM and ROM resources
766 * and also for regions reported as reserved by the e820.
767 */
768 probe_roms();
769 e820_reserve_resources();
770
771 request_resource(&iomem_resource, &video_ram_resource);
772
773 {
774 unsigned i;
775 /* request I/O space for devices used on all i[345]86 PCs */
776 for (i = 0; i < STANDARD_IO_RESOURCES; i++)
777 request_resource(&ioport_resource, &standard_io_resources[i]);
778 }
779
Andi Kleena1e97782005-04-16 15:25:12 -0700780 e820_setup_gap();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700781
782#ifdef CONFIG_GART_IOMMU
Jon Mason5b7b6442006-02-03 21:51:59 +0100783 iommu_hole_init();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700784#endif
785
/* select the console driver: VGA if configured, otherwise the dummy console */
786#ifdef CONFIG_VT
787#if defined(CONFIG_VGA_CONSOLE)
788 conswitchp = &vga_con;
789#elif defined(CONFIG_DUMMY_CONSOLE)
790 conswitchp = &dummy_con;
791#endif
792#endif
793}
Ashok Raje6982c62005-06-25 14:54:58 -0700795static int __cpuinit get_model_name(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700796{
797 unsigned int *v;
798
Andi Kleenebfcaa92005-04-16 15:25:18 -0700799 if (c->extended_cpuid_level < 0x80000004)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700800 return 0;
801
802 v = (unsigned int *) c->x86_model_id;
803 cpuid(0x80000002, &v[0], &v[1], &v[2], &v[3]);
804 cpuid(0x80000003, &v[4], &v[5], &v[6], &v[7]);
805 cpuid(0x80000004, &v[8], &v[9], &v[10], &v[11]);
806 c->x86_model_id[48] = 0;
807 return 1;
808}
809
810
Ashok Raje6982c62005-06-25 14:54:58 -0700811static void __cpuinit display_cacheinfo(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700812{
813 unsigned int n, dummy, eax, ebx, ecx, edx;
814
Andi Kleenebfcaa92005-04-16 15:25:18 -0700815 n = c->extended_cpuid_level;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700816
817 if (n >= 0x80000005) {
818 cpuid(0x80000005, &dummy, &ebx, &ecx, &edx);
819 printk(KERN_INFO "CPU: L1 I Cache: %dK (%d bytes/line), D cache %dK (%d bytes/line)\n",
820 edx>>24, edx&0xFF, ecx>>24, ecx&0xFF);
821 c->x86_cache_size=(ecx>>24)+(edx>>24);
822 /* On K8 L1 TLB is inclusive, so don't count it */
823 c->x86_tlbsize = 0;
824 }
825
826 if (n >= 0x80000006) {
827 cpuid(0x80000006, &dummy, &ebx, &ecx, &edx);
828 ecx = cpuid_ecx(0x80000006);
829 c->x86_cache_size = ecx >> 16;
830 c->x86_tlbsize += ((ebx >> 16) & 0xfff) + (ebx & 0xfff);
831
832 printk(KERN_INFO "CPU: L2 Cache: %dK (%d bytes/line)\n",
833 c->x86_cache_size, ecx & 0xFF);
834 }
835
836 if (n >= 0x80000007)
837 cpuid(0x80000007, &dummy, &dummy, &dummy, &c->x86_power);
838 if (n >= 0x80000008) {
839 cpuid(0x80000008, &eax, &dummy, &dummy, &dummy);
840 c->x86_virt_bits = (eax >> 8) & 0xff;
841 c->x86_phys_bits = eax & 0xff;
842 }
843}
844
Andi Kleen3f098c22005-09-12 18:49:24 +0200845#ifdef CONFIG_NUMA
846static int nearby_node(int apicid)
847{
848 int i;
849 for (i = apicid - 1; i >= 0; i--) {
850 int node = apicid_to_node[i];
851 if (node != NUMA_NO_NODE && node_online(node))
852 return node;
853 }
854 for (i = apicid + 1; i < MAX_LOCAL_APIC; i++) {
855 int node = apicid_to_node[i];
856 if (node != NUMA_NO_NODE && node_online(node))
857 return node;
858 }
859 return first_node(node_online_map); /* Shouldn't happen */
860}
861#endif
862
Andi Kleen63518642005-04-16 15:25:16 -0700863/*
864 * On a AMD dual core setup the lower bits of the APIC id distingush the cores.
865 * Assumes number of cores is a power of two.
866 */
867static void __init amd_detect_cmp(struct cpuinfo_x86 *c)
868{
869#ifdef CONFIG_SMP
Andi Kleen29422832005-05-16 21:53:26 -0700870 int cpu = smp_processor_id();
Andi Kleenb41e2932005-05-20 14:27:55 -0700871 unsigned bits;
Andi Kleen3f098c22005-09-12 18:49:24 +0200872#ifdef CONFIG_NUMA
873 int node = 0;
Ravikiran G Thirumalai60c1bc82006-03-25 16:30:04 +0100874 unsigned apicid = hard_smp_processor_id();
Andi Kleen3f098c22005-09-12 18:49:24 +0200875#endif
Andi Kleenfaee9a52006-06-26 13:56:10 +0200876 unsigned ecx = cpuid_ecx(0x80000008);
Andi Kleenb41e2932005-05-20 14:27:55 -0700877
Andi Kleenfaee9a52006-06-26 13:56:10 +0200878 c->x86_max_cores = (ecx & 0xff) + 1;
879
880 /* CPU telling us the core id bits shift? */
881 bits = (ecx >> 12) & 0xF;
882
883 /* Otherwise recompute */
884 if (bits == 0) {
885 while ((1 << bits) < c->x86_max_cores)
886 bits++;
887 }
Andi Kleenb41e2932005-05-20 14:27:55 -0700888
889 /* Low order bits define the core id (index of core in socket) */
890 cpu_core_id[cpu] = phys_proc_id[cpu] & ((1 << bits)-1);
891 /* Convert the APIC ID into the socket ID */
Ravikiran G Thirumalai60c1bc82006-03-25 16:30:04 +0100892 phys_proc_id[cpu] = phys_pkg_id(bits);
Andi Kleen63518642005-04-16 15:25:16 -0700893
894#ifdef CONFIG_NUMA
Andi Kleen3f098c22005-09-12 18:49:24 +0200895 node = phys_proc_id[cpu];
896 if (apicid_to_node[apicid] != NUMA_NO_NODE)
897 node = apicid_to_node[apicid];
898 if (!node_online(node)) {
899 /* Two possibilities here:
900 - The CPU is missing memory and no node was created.
901 In that case try picking one from a nearby CPU
902 - The APIC IDs differ from the HyperTransport node IDs
903 which the K8 northbridge parsing fills in.
904 Assume they are all increased by a constant offset,
905 but in the same order as the HT nodeids.
906 If that doesn't result in a usable node fall back to the
907 path for the previous case. */
908 int ht_nodeid = apicid - (phys_proc_id[0] << bits);
909 if (ht_nodeid >= 0 &&
910 apicid_to_node[ht_nodeid] != NUMA_NO_NODE)
911 node = apicid_to_node[ht_nodeid];
912 /* Pick a nearby node */
913 if (!node_online(node))
914 node = nearby_node(apicid);
915 }
Andi Kleen69d81fc2005-11-05 17:25:53 +0100916 numa_set_node(cpu, node);
Andi Kleena1586082005-05-16 21:53:21 -0700917
Andi Kleen77d910f2006-03-25 16:29:34 +0100918 printk(KERN_INFO "CPU %d/%x(%d) -> Node %d -> Core %d\n",
919 cpu, apicid, c->x86_max_cores, node, cpu_core_id[cpu]);
Andi Kleen3f098c22005-09-12 18:49:24 +0200920#endif
Andi Kleen63518642005-04-16 15:25:16 -0700921#endif
922}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700923
924static int __init init_amd(struct cpuinfo_x86 *c)
925{
926 int r;
Andi Kleen7bcd3f32006-02-03 21:51:02 +0100927 unsigned level;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700928
Linus Torvaldsbc5e8fd2005-09-17 15:41:04 -0700929#ifdef CONFIG_SMP
930 unsigned long value;
931
Andi Kleen7d318d72005-09-29 22:05:55 +0200932 /*
933 * Disable TLB flush filter by setting HWCR.FFDIS on K8
934 * bit 6 of msr C001_0015
935 *
936 * Errata 63 for SH-B3 steppings
937 * Errata 122 for all steppings (F+ have it disabled by default)
938 */
939 if (c->x86 == 15) {
940 rdmsrl(MSR_K8_HWCR, value);
941 value |= 1 << 6;
942 wrmsrl(MSR_K8_HWCR, value);
943 }
Linus Torvaldsbc5e8fd2005-09-17 15:41:04 -0700944#endif
945
Linus Torvalds1da177e2005-04-16 15:20:36 -0700946 /* Bit 31 in normal CPUID used for nonstandard 3DNow ID;
947 3DNow is IDd by bit 31 in extended CPUID (1*32+31) anyway */
948 clear_bit(0*32+31, &c->x86_capability);
949
Andi Kleen7bcd3f32006-02-03 21:51:02 +0100950 /* On C+ stepping K8 rep microcode works well for copy/memset */
951 level = cpuid_eax(1);
952 if (c->x86 == 15 && ((level >= 0x0f48 && level < 0x0f50) || level >= 0x0f58))
953 set_bit(X86_FEATURE_REP_GOOD, &c->x86_capability);
954
Andi Kleen18bd0572006-04-20 02:36:45 +0200955 /* Enable workaround for FXSAVE leak */
956 if (c->x86 >= 6)
957 set_bit(X86_FEATURE_FXSAVE_LEAK, &c->x86_capability);
958
Linus Torvalds1da177e2005-04-16 15:20:36 -0700959 r = get_model_name(c);
960 if (!r) {
961 switch (c->x86) {
962 case 15:
963 /* Should distinguish Models here, but this is only
964 a fallback anyways. */
965 strcpy(c->x86_model_id, "Hammer");
966 break;
967 }
968 }
969 display_cacheinfo(c);
970
Andi Kleen130951c2006-01-11 22:42:02 +0100971 /* c->x86_power is 8000_0007 edx. Bit 8 is constant TSC */
972 if (c->x86_power & (1<<8))
973 set_bit(X86_FEATURE_CONSTANT_TSC, &c->x86_capability);
974
Andi Kleenfaee9a52006-06-26 13:56:10 +0200975 /* Multi core CPU? */
976 if (c->extended_cpuid_level >= 0x80000008)
Andi Kleen63518642005-04-16 15:25:16 -0700977 amd_detect_cmp(c);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700978
Andi Kleen240cd6a2006-06-26 13:56:13 +0200979 /* Fix cpuid4 emulation for more */
980 num_cache_leaves = 3;
981
Linus Torvalds1da177e2005-04-16 15:20:36 -0700982 return r;
983}
984
Ashok Raje6982c62005-06-25 14:54:58 -0700985static void __cpuinit detect_ht(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700986{
987#ifdef CONFIG_SMP
988 u32 eax, ebx, ecx, edx;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100989 int index_msb, core_bits;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700990 int cpu = smp_processor_id();
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100991
992 cpuid(1, &eax, &ebx, &ecx, &edx);
993
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100994
Andi Kleen63518642005-04-16 15:25:16 -0700995 if (!cpu_has(c, X86_FEATURE_HT) || cpu_has(c, X86_FEATURE_CMP_LEGACY))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700996 return;
997
Linus Torvalds1da177e2005-04-16 15:20:36 -0700998 smp_num_siblings = (ebx & 0xff0000) >> 16;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100999
Linus Torvalds1da177e2005-04-16 15:20:36 -07001000 if (smp_num_siblings == 1) {
1001 printk(KERN_INFO "CPU: Hyper-Threading is disabled\n");
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001002 } else if (smp_num_siblings > 1 ) {
1003
Linus Torvalds1da177e2005-04-16 15:20:36 -07001004 if (smp_num_siblings > NR_CPUS) {
1005 printk(KERN_WARNING "CPU: Unsupported number of the siblings %d", smp_num_siblings);
1006 smp_num_siblings = 1;
1007 return;
1008 }
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001009
1010 index_msb = get_count_order(smp_num_siblings);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001011 phys_proc_id[cpu] = phys_pkg_id(index_msb);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001012
Linus Torvalds1da177e2005-04-16 15:20:36 -07001013 printk(KERN_INFO "CPU: Physical Processor ID: %d\n",
1014 phys_proc_id[cpu]);
Andi Kleen3dd9d512005-04-16 15:25:15 -07001015
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001016 smp_num_siblings = smp_num_siblings / c->x86_max_cores;
Andi Kleen3dd9d512005-04-16 15:25:15 -07001017
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001018 index_msb = get_count_order(smp_num_siblings) ;
Andi Kleen3dd9d512005-04-16 15:25:15 -07001019
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001020 core_bits = get_count_order(c->x86_max_cores);
Andi Kleen3dd9d512005-04-16 15:25:15 -07001021
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001022 cpu_core_id[cpu] = phys_pkg_id(index_msb) &
1023 ((1 << core_bits) - 1);
1024
1025 if (c->x86_max_cores > 1)
Andi Kleen3dd9d512005-04-16 15:25:15 -07001026 printk(KERN_INFO "CPU: Processor Core ID: %d\n",
1027 cpu_core_id[cpu]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001028 }
1029#endif
1030}
1031
Andi Kleen3dd9d512005-04-16 15:25:15 -07001032/*
1033 * find out the number of processor cores on the die
1034 */
Ashok Raje6982c62005-06-25 14:54:58 -07001035static int __cpuinit intel_num_cpu_cores(struct cpuinfo_x86 *c)
Andi Kleen3dd9d512005-04-16 15:25:15 -07001036{
1037 unsigned int eax;
1038
1039 if (c->cpuid_level < 4)
1040 return 1;
1041
1042 __asm__("cpuid"
1043 : "=a" (eax)
1044 : "0" (4), "c" (0)
1045 : "bx", "dx");
1046
1047 if (eax & 0x1f)
1048 return ((eax >> 26) + 1);
1049 else
1050 return 1;
1051}
1052
/*
 * Bind the current CPU to a NUMA node using the apicid_to_node[] table,
 * falling back to the first online node when the table has no entry.
 * Compiled to an empty function without CONFIG_NUMA.
 */
static void srat_detect_node(void)
{
#ifdef CONFIG_NUMA
	unsigned nid;
	int this_cpu = smp_processor_id();

	/*
	 * Don't do the funky fallback heuristics the AMD version employs
	 * for now.
	 */
	nid = apicid_to_node[hard_smp_processor_id()];
	if (nid == NUMA_NO_NODE)
		nid = first_node(node_online_map);
	numa_set_node(this_cpu, nid);

	if (acpi_numa <= 0)
		return;
	printk(KERN_INFO "CPU %d -> Node %d\n", this_cpu, nid);
#endif
}
1070
Ashok Raje6982c62005-06-25 14:54:58 -07001071static void __cpuinit init_intel(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001072{
1073 /* Cache sizes */
1074 unsigned n;
1075
1076 init_intel_cacheinfo(c);
Andi Kleenebfcaa92005-04-16 15:25:18 -07001077 n = c->extended_cpuid_level;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001078 if (n >= 0x80000008) {
1079 unsigned eax = cpuid_eax(0x80000008);
1080 c->x86_virt_bits = (eax >> 8) & 0xff;
1081 c->x86_phys_bits = eax & 0xff;
Shaohua Liaf9c1422005-11-05 17:25:54 +01001082 /* CPUID workaround for Intel 0F34 CPU */
1083 if (c->x86_vendor == X86_VENDOR_INTEL &&
1084 c->x86 == 0xF && c->x86_model == 0x3 &&
1085 c->x86_mask == 0x4)
1086 c->x86_phys_bits = 36;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001087 }
1088
1089 if (c->x86 == 15)
1090 c->x86_cache_alignment = c->x86_clflush_size * 2;
Andi Kleen39b3a792006-01-11 22:42:45 +01001091 if ((c->x86 == 0xf && c->x86_model >= 0x03) ||
1092 (c->x86 == 0x6 && c->x86_model >= 0x0e))
Andi Kleenc29601e2005-04-16 15:25:05 -07001093 set_bit(X86_FEATURE_CONSTANT_TSC, &c->x86_capability);
Andi Kleenc818a182006-01-11 22:45:24 +01001094 set_bit(X86_FEATURE_SYNC_RDTSC, &c->x86_capability);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001095 c->x86_max_cores = intel_num_cpu_cores(c);
Andi Kleendf0cc262005-09-12 18:49:24 +02001096
1097 srat_detect_node();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001098}
1099
Adrian Bunk672289e2005-09-10 00:27:21 -07001100static void __cpuinit get_cpu_vendor(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001101{
1102 char *v = c->x86_vendor_id;
1103
1104 if (!strcmp(v, "AuthenticAMD"))
1105 c->x86_vendor = X86_VENDOR_AMD;
1106 else if (!strcmp(v, "GenuineIntel"))
1107 c->x86_vendor = X86_VENDOR_INTEL;
1108 else
1109 c->x86_vendor = X86_VENDOR_UNKNOWN;
1110}
1111
/*
 * Per-vendor, per-family table of model names.
 * NOTE(review): not referenced in the visible part of this file; the
 * 16-entry array is presumably indexed by model number -- confirm.
 */
struct cpu_model_info {
	int vendor;		/* presumably an X86_VENDOR_* value -- confirm */
	int family;		/* CPU family the names belong to */
	char *model_names[16];	/* one name slot per model */
};
1117
1118/* Do some early cpuid on the boot CPU to get some parameter that are
1119 needed before check_bugs. Everything advanced is in identify_cpu
1120 below. */
Ashok Raje6982c62005-06-25 14:54:58 -07001121void __cpuinit early_identify_cpu(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001122{
1123 u32 tfms;
1124
1125 c->loops_per_jiffy = loops_per_jiffy;
1126 c->x86_cache_size = -1;
1127 c->x86_vendor = X86_VENDOR_UNKNOWN;
1128 c->x86_model = c->x86_mask = 0; /* So far unknown... */
1129 c->x86_vendor_id[0] = '\0'; /* Unset */
1130 c->x86_model_id[0] = '\0'; /* Unset */
1131 c->x86_clflush_size = 64;
1132 c->x86_cache_alignment = c->x86_clflush_size;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001133 c->x86_max_cores = 1;
Andi Kleenebfcaa92005-04-16 15:25:18 -07001134 c->extended_cpuid_level = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001135 memset(&c->x86_capability, 0, sizeof c->x86_capability);
1136
1137 /* Get vendor name */
1138 cpuid(0x00000000, (unsigned int *)&c->cpuid_level,
1139 (unsigned int *)&c->x86_vendor_id[0],
1140 (unsigned int *)&c->x86_vendor_id[8],
1141 (unsigned int *)&c->x86_vendor_id[4]);
1142
1143 get_cpu_vendor(c);
1144
1145 /* Initialize the standard set of capabilities */
1146 /* Note that the vendor-specific code below might override */
1147
1148 /* Intel-defined flags: level 0x00000001 */
1149 if (c->cpuid_level >= 0x00000001) {
1150 __u32 misc;
1151 cpuid(0x00000001, &tfms, &misc, &c->x86_capability[4],
1152 &c->x86_capability[0]);
1153 c->x86 = (tfms >> 8) & 0xf;
1154 c->x86_model = (tfms >> 4) & 0xf;
1155 c->x86_mask = tfms & 0xf;
Suresh Siddhaf5f786d2005-11-05 17:25:53 +01001156 if (c->x86 == 0xf)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001157 c->x86 += (tfms >> 20) & 0xff;
Suresh Siddhaf5f786d2005-11-05 17:25:53 +01001158 if (c->x86 >= 0x6)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001159 c->x86_model += ((tfms >> 16) & 0xF) << 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001160 if (c->x86_capability[0] & (1<<19))
1161 c->x86_clflush_size = ((misc >> 8) & 0xff) * 8;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001162 } else {
1163 /* Have CPUID level 0 only - unheard of */
1164 c->x86 = 4;
1165 }
Andi Kleena1586082005-05-16 21:53:21 -07001166
1167#ifdef CONFIG_SMP
Andi Kleenb41e2932005-05-20 14:27:55 -07001168 phys_proc_id[smp_processor_id()] = (cpuid_ebx(1) >> 24) & 0xff;
Andi Kleena1586082005-05-16 21:53:21 -07001169#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001170}
1171
1172/*
1173 * This does the hard work of actually picking apart the CPU stuff...
1174 */
Ashok Raje6982c62005-06-25 14:54:58 -07001175void __cpuinit identify_cpu(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001176{
1177 int i;
1178 u32 xlvl;
1179
1180 early_identify_cpu(c);
1181
1182 /* AMD-defined flags: level 0x80000001 */
1183 xlvl = cpuid_eax(0x80000000);
Andi Kleenebfcaa92005-04-16 15:25:18 -07001184 c->extended_cpuid_level = xlvl;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001185 if ((xlvl & 0xffff0000) == 0x80000000) {
1186 if (xlvl >= 0x80000001) {
1187 c->x86_capability[1] = cpuid_edx(0x80000001);
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001188 c->x86_capability[6] = cpuid_ecx(0x80000001);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001189 }
1190 if (xlvl >= 0x80000004)
1191 get_model_name(c); /* Default name */
1192 }
1193
1194 /* Transmeta-defined flags: level 0x80860001 */
1195 xlvl = cpuid_eax(0x80860000);
1196 if ((xlvl & 0xffff0000) == 0x80860000) {
1197 /* Don't set x86_cpuid_level here for now to not confuse. */
1198 if (xlvl >= 0x80860001)
1199 c->x86_capability[2] = cpuid_edx(0x80860001);
1200 }
1201
Siddha, Suresh B1e9f28f2006-03-27 01:15:22 -08001202 c->apicid = phys_pkg_id(0);
1203
Linus Torvalds1da177e2005-04-16 15:20:36 -07001204 /*
1205 * Vendor-specific initialization. In this section we
1206 * canonicalize the feature flags, meaning if there are
1207 * features a certain CPU supports which CPUID doesn't
1208 * tell us, CPUID claiming incorrect flags, or other bugs,
1209 * we handle them here.
1210 *
1211 * At the end of this section, c->x86_capability better
1212 * indicate the features this CPU genuinely supports!
1213 */
1214 switch (c->x86_vendor) {
1215 case X86_VENDOR_AMD:
1216 init_amd(c);
1217 break;
1218
1219 case X86_VENDOR_INTEL:
1220 init_intel(c);
1221 break;
1222
1223 case X86_VENDOR_UNKNOWN:
1224 default:
1225 display_cacheinfo(c);
1226 break;
1227 }
1228
1229 select_idle_routine(c);
1230 detect_ht(c);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001231
1232 /*
1233 * On SMP, boot_cpu_data holds the common feature set between
1234 * all CPUs; so make sure that we indicate which features are
1235 * common between the CPUs. The first time this routine gets
1236 * executed, c == &boot_cpu_data.
1237 */
1238 if (c != &boot_cpu_data) {
1239 /* AND the already accumulated flags with these */
1240 for (i = 0 ; i < NCAPINTS ; i++)
1241 boot_cpu_data.x86_capability[i] &= c->x86_capability[i];
1242 }
1243
1244#ifdef CONFIG_X86_MCE
1245 mcheck_init(c);
1246#endif
Shaohua Li3b520b22005-07-07 17:56:38 -07001247 if (c == &boot_cpu_data)
1248 mtrr_bp_init();
1249 else
1250 mtrr_ap_init();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001251#ifdef CONFIG_NUMA
Andi Kleen3019e8e2005-07-28 21:15:28 -07001252 numa_add_cpu(smp_processor_id());
Linus Torvalds1da177e2005-04-16 15:20:36 -07001253#endif
1254}
1255
1256
Ashok Raje6982c62005-06-25 14:54:58 -07001257void __cpuinit print_cpu_info(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001258{
1259 if (c->x86_model_id[0])
1260 printk("%s", c->x86_model_id);
1261
1262 if (c->x86_mask || c->cpuid_level >= 0)
1263 printk(" stepping %02x\n", c->x86_mask);
1264 else
1265 printk("\n");
1266}
1267
1268/*
1269 * Get CPU information for use by the procfs.
1270 */
1271
1272static int show_cpuinfo(struct seq_file *m, void *v)
1273{
1274 struct cpuinfo_x86 *c = v;
1275
1276 /*
1277 * These flag bits must match the definitions in <asm/cpufeature.h>.
1278 * NULL means this bit is undefined or reserved; either way it doesn't
1279 * have meaning as far as Linux is concerned. Note that it's important
1280 * to realize there is a difference between this table and CPUID -- if
1281 * applications want to get the raw CPUID data, they should access
1282 * /dev/cpu/<cpu_nr>/cpuid instead.
1283 */
1284 static char *x86_cap_flags[] = {
1285 /* Intel-defined */
1286 "fpu", "vme", "de", "pse", "tsc", "msr", "pae", "mce",
1287 "cx8", "apic", NULL, "sep", "mtrr", "pge", "mca", "cmov",
1288 "pat", "pse36", "pn", "clflush", NULL, "dts", "acpi", "mmx",
1289 "fxsr", "sse", "sse2", "ss", "ht", "tm", "ia64", NULL,
1290
1291 /* AMD-defined */
Zwane Mwaikambo3c3b73b2005-05-01 08:58:51 -07001292 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001293 NULL, NULL, NULL, "syscall", NULL, NULL, NULL, NULL,
1294 NULL, NULL, NULL, NULL, "nx", NULL, "mmxext", NULL,
Andi Kleen3f98bc42006-01-11 22:42:51 +01001295 NULL, "fxsr_opt", "rdtscp", NULL, NULL, "lm", "3dnowext", "3dnow",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001296
1297 /* Transmeta-defined */
1298 "recovery", "longrun", NULL, "lrti", NULL, NULL, NULL, NULL,
1299 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1300 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1301 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1302
1303 /* Other (Linux-defined) */
Andi Kleen622dcaf2005-05-16 21:53:26 -07001304 "cxmmx", NULL, "cyrix_arr", "centaur_mcr", NULL,
Andi Kleenc29601e2005-04-16 15:25:05 -07001305 "constant_tsc", NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001306 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1307 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1308 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1309
1310 /* Intel-defined (#2) */
Andi Kleen9d95dd82006-03-25 16:31:22 +01001311 "pni", NULL, NULL, "monitor", "ds_cpl", "vmx", "smx", "est",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001312 "tm2", NULL, "cid", NULL, NULL, "cx16", "xtpr", NULL,
1313 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1314 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1315
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001316 /* VIA/Cyrix/Centaur-defined */
1317 NULL, NULL, "rng", "rng_en", NULL, NULL, "ace", "ace_en",
1318 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1319 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1320 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1321
Linus Torvalds1da177e2005-04-16 15:20:36 -07001322 /* AMD-defined (#2) */
Andi Kleen3f98bc42006-01-11 22:42:51 +01001323 "lahf_lm", "cmp_legacy", "svm", NULL, "cr8_legacy", NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001324 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1325 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001326 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001327 };
1328 static char *x86_power_flags[] = {
1329 "ts", /* temperature sensor */
1330 "fid", /* frequency id control */
1331 "vid", /* voltage id control */
1332 "ttp", /* thermal trip */
1333 "tm",
Andi Kleen3f98bc42006-01-11 22:42:51 +01001334 "stc",
1335 NULL,
Andi Kleen39b3a792006-01-11 22:42:45 +01001336 /* nothing */ /* constant_tsc - moved to flags */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001337 };
1338
1339
1340#ifdef CONFIG_SMP
1341 if (!cpu_online(c-cpu_data))
1342 return 0;
1343#endif
1344
1345 seq_printf(m,"processor\t: %u\n"
1346 "vendor_id\t: %s\n"
1347 "cpu family\t: %d\n"
1348 "model\t\t: %d\n"
1349 "model name\t: %s\n",
1350 (unsigned)(c-cpu_data),
1351 c->x86_vendor_id[0] ? c->x86_vendor_id : "unknown",
1352 c->x86,
1353 (int)c->x86_model,
1354 c->x86_model_id[0] ? c->x86_model_id : "unknown");
1355
1356 if (c->x86_mask || c->cpuid_level >= 0)
1357 seq_printf(m, "stepping\t: %d\n", c->x86_mask);
1358 else
1359 seq_printf(m, "stepping\t: unknown\n");
1360
1361 if (cpu_has(c,X86_FEATURE_TSC)) {
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -08001362 unsigned int freq = cpufreq_quick_get((unsigned)(c-cpu_data));
1363 if (!freq)
1364 freq = cpu_khz;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001365 seq_printf(m, "cpu MHz\t\t: %u.%03u\n",
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -08001366 freq / 1000, (freq % 1000));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001367 }
1368
1369 /* Cache size */
1370 if (c->x86_cache_size >= 0)
1371 seq_printf(m, "cache size\t: %d KB\n", c->x86_cache_size);
1372
1373#ifdef CONFIG_SMP
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001374 if (smp_num_siblings * c->x86_max_cores > 1) {
Andi Kleendb468682005-04-16 15:24:51 -07001375 int cpu = c - cpu_data;
1376 seq_printf(m, "physical id\t: %d\n", phys_proc_id[cpu]);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001377 seq_printf(m, "siblings\t: %d\n", cpus_weight(cpu_core_map[cpu]));
Siddha, Suresh Bd31ddaa2005-04-16 15:25:20 -07001378 seq_printf(m, "core id\t\t: %d\n", cpu_core_id[cpu]);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001379 seq_printf(m, "cpu cores\t: %d\n", c->booted_cores);
Andi Kleendb468682005-04-16 15:24:51 -07001380 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001381#endif
1382
1383 seq_printf(m,
1384 "fpu\t\t: yes\n"
1385 "fpu_exception\t: yes\n"
1386 "cpuid level\t: %d\n"
1387 "wp\t\t: yes\n"
1388 "flags\t\t:",
1389 c->cpuid_level);
1390
1391 {
1392 int i;
1393 for ( i = 0 ; i < 32*NCAPINTS ; i++ )
Akinobu Mita3d1712c2006-03-24 03:15:11 -08001394 if (cpu_has(c, i) && x86_cap_flags[i] != NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001395 seq_printf(m, " %s", x86_cap_flags[i]);
1396 }
1397
1398 seq_printf(m, "\nbogomips\t: %lu.%02lu\n",
1399 c->loops_per_jiffy/(500000/HZ),
1400 (c->loops_per_jiffy/(5000/HZ)) % 100);
1401
1402 if (c->x86_tlbsize > 0)
1403 seq_printf(m, "TLB size\t: %d 4K pages\n", c->x86_tlbsize);
1404 seq_printf(m, "clflush size\t: %d\n", c->x86_clflush_size);
1405 seq_printf(m, "cache_alignment\t: %d\n", c->x86_cache_alignment);
1406
1407 seq_printf(m, "address sizes\t: %u bits physical, %u bits virtual\n",
1408 c->x86_phys_bits, c->x86_virt_bits);
1409
1410 seq_printf(m, "power management:");
1411 {
1412 unsigned i;
1413 for (i = 0; i < 32; i++)
1414 if (c->x86_power & (1 << i)) {
Andi Kleen3f98bc42006-01-11 22:42:51 +01001415 if (i < ARRAY_SIZE(x86_power_flags) &&
1416 x86_power_flags[i])
1417 seq_printf(m, "%s%s",
1418 x86_power_flags[i][0]?" ":"",
1419 x86_power_flags[i]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001420 else
1421 seq_printf(m, " [%d]", i);
1422 }
1423 }
Andi Kleen3dd9d512005-04-16 15:25:15 -07001424
Siddha, Suresh Bd31ddaa2005-04-16 15:25:20 -07001425 seq_printf(m, "\n\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001426
Linus Torvalds1da177e2005-04-16 15:20:36 -07001427 return 0;
1428}
1429
1430static void *c_start(struct seq_file *m, loff_t *pos)
1431{
1432 return *pos < NR_CPUS ? cpu_data + *pos : NULL;
1433}
1434
1435static void *c_next(struct seq_file *m, void *v, loff_t *pos)
1436{
1437 ++*pos;
1438 return c_start(m, pos);
1439}
1440
/*
 * seq_file ->stop callback.  Empty: c_start()/c_next() only compute a
 * pointer into cpu_data[], so there is nothing to release here.
 */
static void c_stop(struct seq_file *m, void *v)
{
}
1444
/*
 * seq_file iterator that walks cpu_data[] and formats each entry with
 * show_cpuinfo().  Not static, so it is visible to other translation units.
 */
struct seq_operations cpuinfo_op = {
	.start =c_start,
	.next =	c_next,
	.stop =	c_stop,
	.show =	show_cpuinfo,
};
Andi Kleene9928672006-01-11 22:43:33 +01001451
#ifdef CONFIG_INPUT_PCSPKR
#include <linux/platform_device.h>
/*
 * Register the "pcspkr" platform device at device-initcall time.
 *
 * Returns 0 on success, -ENOMEM when the device cannot be allocated, or
 * the error from platform_device_add(), in which case the reference taken
 * by the allocation is dropped again.
 */
static __init int add_pcspkr(void)
{
	struct platform_device *spkr;
	int err;

	spkr = platform_device_alloc("pcspkr", -1);
	if (spkr == NULL)
		return -ENOMEM;

	err = platform_device_add(spkr);
	if (err != 0)
		platform_device_put(spkr);

	return err;
}
device_initcall(add_pcspkr);
#endif