blob: 759070c827511bb482c3b770ff0f35407746936c [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * linux/arch/x86-64/kernel/setup.c
3 *
4 * Copyright (C) 1995 Linus Torvalds
5 *
6 * Nov 2001 Dave Jones <davej@suse.de>
7 * Forked from i386 setup code.
8 *
9 * $Id$
10 */
11
12/*
13 * This file handles the architecture-dependent parts of initialization
14 */
15
16#include <linux/errno.h>
17#include <linux/sched.h>
18#include <linux/kernel.h>
19#include <linux/mm.h>
20#include <linux/stddef.h>
21#include <linux/unistd.h>
22#include <linux/ptrace.h>
23#include <linux/slab.h>
24#include <linux/user.h>
25#include <linux/a.out.h>
26#include <linux/tty.h>
27#include <linux/ioport.h>
28#include <linux/delay.h>
29#include <linux/config.h>
30#include <linux/init.h>
31#include <linux/initrd.h>
32#include <linux/highmem.h>
33#include <linux/bootmem.h>
34#include <linux/module.h>
35#include <asm/processor.h>
36#include <linux/console.h>
37#include <linux/seq_file.h>
Vivek Goyalaac04b32006-01-09 20:51:47 -080038#include <linux/crash_dump.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070039#include <linux/root_dev.h>
40#include <linux/pci.h>
41#include <linux/acpi.h>
42#include <linux/kallsyms.h>
43#include <linux/edd.h>
Matt Tolentinobbfceef2005-06-23 00:08:07 -070044#include <linux/mmzone.h>
Eric W. Biederman5f5609d2005-06-25 14:58:04 -070045#include <linux/kexec.h>
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -080046#include <linux/cpufreq.h>
Andi Kleene9928672006-01-11 22:43:33 +010047#include <linux/dmi.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010048#include <linux/dma-mapping.h>
Andi Kleen681558f2006-03-25 16:29:46 +010049#include <linux/ctype.h>
Matt Tolentinobbfceef2005-06-23 00:08:07 -070050
Linus Torvalds1da177e2005-04-16 15:20:36 -070051#include <asm/mtrr.h>
52#include <asm/uaccess.h>
53#include <asm/system.h>
54#include <asm/io.h>
55#include <asm/smp.h>
56#include <asm/msr.h>
57#include <asm/desc.h>
58#include <video/edid.h>
59#include <asm/e820.h>
60#include <asm/dma.h>
61#include <asm/mpspec.h>
62#include <asm/mmu_context.h>
63#include <asm/bootsetup.h>
64#include <asm/proto.h>
65#include <asm/setup.h>
66#include <asm/mach_apic.h>
67#include <asm/numa.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010068#include <asm/swiotlb.h>
Andi Kleen2bc04142005-11-05 17:25:53 +010069#include <asm/sections.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010070#include <asm/gart-mapping.h>
Andi Kleenf2d3efe2006-03-25 16:30:22 +010071#include <asm/dmi.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070072
73/*
74 * Machine setup..
75 */
76
Ravikiran G Thirumalai6c231b72005-09-06 15:17:45 -070077struct cpuinfo_x86 boot_cpu_data __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -070078
79unsigned long mmu_cr4_features;
80
81int acpi_disabled;
82EXPORT_SYMBOL(acpi_disabled);
Len Brown888ba6c2005-08-24 12:07:20 -040083#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -070084extern int __initdata acpi_ht;
85extern acpi_interrupt_flags acpi_sci_flags;
86int __initdata acpi_force = 0;
87#endif
88
89int acpi_numa __initdata;
90
Linus Torvalds1da177e2005-04-16 15:20:36 -070091/* Boot loader ID as an integer, for the benefit of proc_dointvec */
92int bootloader_type;
93
94unsigned long saved_video_mode;
95
Andi Kleenf2d3efe2006-03-25 16:30:22 +010096/*
97 * Early DMI memory
98 */
99int dmi_alloc_index;
100char dmi_alloc_data[DMI_MAX_DATA];
101
Linus Torvalds1da177e2005-04-16 15:20:36 -0700102/*
103 * Setup options
104 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105struct screen_info screen_info;
106struct sys_desc_table_struct {
107 unsigned short length;
108 unsigned char table[0];
109};
110
111struct edid_info edid_info;
112struct e820map e820;
113
114extern int root_mountflags;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700115
116char command_line[COMMAND_LINE_SIZE];
117
118struct resource standard_io_resources[] = {
119 { .name = "dma1", .start = 0x00, .end = 0x1f,
120 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
121 { .name = "pic1", .start = 0x20, .end = 0x21,
122 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
123 { .name = "timer0", .start = 0x40, .end = 0x43,
124 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
125 { .name = "timer1", .start = 0x50, .end = 0x53,
126 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
127 { .name = "keyboard", .start = 0x60, .end = 0x6f,
128 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
129 { .name = "dma page reg", .start = 0x80, .end = 0x8f,
130 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
131 { .name = "pic2", .start = 0xa0, .end = 0xa1,
132 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
133 { .name = "dma2", .start = 0xc0, .end = 0xdf,
134 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
135 { .name = "fpu", .start = 0xf0, .end = 0xff,
136 .flags = IORESOURCE_BUSY | IORESOURCE_IO }
137};
138
139#define STANDARD_IO_RESOURCES \
140 (sizeof standard_io_resources / sizeof standard_io_resources[0])
141
142#define IORESOURCE_RAM (IORESOURCE_BUSY | IORESOURCE_MEM)
143
144struct resource data_resource = {
145 .name = "Kernel data",
146 .start = 0,
147 .end = 0,
148 .flags = IORESOURCE_RAM,
149};
150struct resource code_resource = {
151 .name = "Kernel code",
152 .start = 0,
153 .end = 0,
154 .flags = IORESOURCE_RAM,
155};
156
157#define IORESOURCE_ROM (IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM)
158
159static struct resource system_rom_resource = {
160 .name = "System ROM",
161 .start = 0xf0000,
162 .end = 0xfffff,
163 .flags = IORESOURCE_ROM,
164};
165
166static struct resource extension_rom_resource = {
167 .name = "Extension ROM",
168 .start = 0xe0000,
169 .end = 0xeffff,
170 .flags = IORESOURCE_ROM,
171};
172
173static struct resource adapter_rom_resources[] = {
174 { .name = "Adapter ROM", .start = 0xc8000, .end = 0,
175 .flags = IORESOURCE_ROM },
176 { .name = "Adapter ROM", .start = 0, .end = 0,
177 .flags = IORESOURCE_ROM },
178 { .name = "Adapter ROM", .start = 0, .end = 0,
179 .flags = IORESOURCE_ROM },
180 { .name = "Adapter ROM", .start = 0, .end = 0,
181 .flags = IORESOURCE_ROM },
182 { .name = "Adapter ROM", .start = 0, .end = 0,
183 .flags = IORESOURCE_ROM },
184 { .name = "Adapter ROM", .start = 0, .end = 0,
185 .flags = IORESOURCE_ROM }
186};
187
188#define ADAPTER_ROM_RESOURCES \
189 (sizeof adapter_rom_resources / sizeof adapter_rom_resources[0])
190
191static struct resource video_rom_resource = {
192 .name = "Video ROM",
193 .start = 0xc0000,
194 .end = 0xc7fff,
195 .flags = IORESOURCE_ROM,
196};
197
198static struct resource video_ram_resource = {
199 .name = "Video RAM area",
200 .start = 0xa0000,
201 .end = 0xbffff,
202 .flags = IORESOURCE_RAM,
203};
204
205#define romsignature(x) (*(unsigned short *)(x) == 0xaa55)
206
207static int __init romchecksum(unsigned char *rom, unsigned long length)
208{
209 unsigned char *p, sum = 0;
210
211 for (p = rom; p < rom + length; p++)
212 sum += *p;
213 return sum == 0;
214}
215
216static void __init probe_roms(void)
217{
218 unsigned long start, length, upper;
219 unsigned char *rom;
220 int i;
221
222 /* video rom */
223 upper = adapter_rom_resources[0].start;
224 for (start = video_rom_resource.start; start < upper; start += 2048) {
225 rom = isa_bus_to_virt(start);
226 if (!romsignature(rom))
227 continue;
228
229 video_rom_resource.start = start;
230
231 /* 0 < length <= 0x7f * 512, historically */
232 length = rom[2] * 512;
233
234 /* if checksum okay, trust length byte */
235 if (length && romchecksum(rom, length))
236 video_rom_resource.end = start + length - 1;
237
238 request_resource(&iomem_resource, &video_rom_resource);
239 break;
240 }
241
242 start = (video_rom_resource.end + 1 + 2047) & ~2047UL;
243 if (start < upper)
244 start = upper;
245
246 /* system rom */
247 request_resource(&iomem_resource, &system_rom_resource);
248 upper = system_rom_resource.start;
249
250 /* check for extension rom (ignore length byte!) */
251 rom = isa_bus_to_virt(extension_rom_resource.start);
252 if (romsignature(rom)) {
253 length = extension_rom_resource.end - extension_rom_resource.start + 1;
254 if (romchecksum(rom, length)) {
255 request_resource(&iomem_resource, &extension_rom_resource);
256 upper = extension_rom_resource.start;
257 }
258 }
259
260 /* check for adapter roms on 2k boundaries */
261 for (i = 0; i < ADAPTER_ROM_RESOURCES && start < upper; start += 2048) {
262 rom = isa_bus_to_virt(start);
263 if (!romsignature(rom))
264 continue;
265
266 /* 0 < length <= 0x7f * 512, historically */
267 length = rom[2] * 512;
268
269 /* but accept any length that fits if checksum okay */
270 if (!length || start + length > upper || !romchecksum(rom, length))
271 continue;
272
273 adapter_rom_resources[i].start = start;
274 adapter_rom_resources[i].end = start + length - 1;
275 request_resource(&iomem_resource, &adapter_rom_resources[i]);
276
277 start = adapter_rom_resources[i++].end & ~2047UL;
278 }
279}
280
/*
 * Check for full argument with no trailing characters.
 *
 * @p:   position in the command line to test
 * @arg: option text to look for
 *
 * Returns non-zero when the text at @p is exactly @arg followed by
 * whitespace or the end of the string, 0 otherwise.
 *
 * strncmp() is used instead of memcmp() so that the comparison stops at
 * the NUL terminator of @p; memcmp() could read past the end of the
 * command line when fewer than strlen(@arg) characters remain.
 */
static int fullarg(const char *p, const char *arg)
{
	size_t l = strlen(arg);

	if (strncmp(p, arg, l) != 0)
		return 0;

	/* p[l] is safe to read: the first l characters of p are non-NUL */
	return p[l] == 0 || isspace((unsigned char)p[l]);
}
287
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288static __init void parse_cmdline_early (char ** cmdline_p)
289{
290 char c = ' ', *to = command_line, *from = COMMAND_LINE;
291 int len = 0;
akpm@osdl.org69cda7b2006-01-09 20:51:46 -0800292 int userdef = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294 for (;;) {
295 if (c != ' ')
296 goto next_char;
297
298#ifdef CONFIG_SMP
299 /*
300 * If the BIOS enumerates physical processors before logical,
301 * maxcpus=N at enumeration-time can be used to disable HT.
302 */
303 else if (!memcmp(from, "maxcpus=", 8)) {
304 extern unsigned int maxcpus;
305
306 maxcpus = simple_strtoul(from + 8, NULL, 0);
307 }
308#endif
Len Brown888ba6c2005-08-24 12:07:20 -0400309#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -0700310 /* "acpi=off" disables both ACPI table parsing and interpreter init */
Andi Kleen681558f2006-03-25 16:29:46 +0100311 if (fullarg(from,"acpi=off"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312 disable_acpi();
313
Andi Kleen681558f2006-03-25 16:29:46 +0100314 if (fullarg(from, "acpi=force")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315 /* add later when we do DMI horrors: */
316 acpi_force = 1;
317 acpi_disabled = 0;
318 }
319
320 /* acpi=ht just means: do ACPI MADT parsing
321 at bootup, but don't enable the full ACPI interpreter */
Andi Kleen681558f2006-03-25 16:29:46 +0100322 if (fullarg(from, "acpi=ht")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323 if (!acpi_force)
324 disable_acpi();
325 acpi_ht = 1;
326 }
Andi Kleen681558f2006-03-25 16:29:46 +0100327 else if (fullarg(from, "pci=noacpi"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700328 acpi_disable_pci();
Andi Kleen681558f2006-03-25 16:29:46 +0100329 else if (fullarg(from, "acpi=noirq"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700330 acpi_noirq_set();
331
Andi Kleen681558f2006-03-25 16:29:46 +0100332 else if (fullarg(from, "acpi_sci=edge"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700333 acpi_sci_flags.trigger = 1;
Andi Kleen681558f2006-03-25 16:29:46 +0100334 else if (fullarg(from, "acpi_sci=level"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335 acpi_sci_flags.trigger = 3;
Andi Kleen681558f2006-03-25 16:29:46 +0100336 else if (fullarg(from, "acpi_sci=high"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700337 acpi_sci_flags.polarity = 1;
Andi Kleen681558f2006-03-25 16:29:46 +0100338 else if (fullarg(from, "acpi_sci=low"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339 acpi_sci_flags.polarity = 3;
340
341 /* acpi=strict disables out-of-spec workarounds */
Andi Kleen681558f2006-03-25 16:29:46 +0100342 else if (fullarg(from, "acpi=strict")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700343 acpi_strict = 1;
344 }
Andi Kleen22999242005-04-16 15:25:17 -0700345#ifdef CONFIG_X86_IO_APIC
Andi Kleen681558f2006-03-25 16:29:46 +0100346 else if (fullarg(from, "acpi_skip_timer_override"))
Andi Kleen22999242005-04-16 15:25:17 -0700347 acpi_skip_timer_override = 1;
348#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349#endif
350
Andi Kleen681558f2006-03-25 16:29:46 +0100351 if (fullarg(from, "disable_timer_pin_1"))
Chuck Ebbert66759a02005-09-12 18:49:25 +0200352 disable_timer_pin_1 = 1;
Andi Kleen681558f2006-03-25 16:29:46 +0100353 if (fullarg(from, "enable_timer_pin_1"))
Chuck Ebbert66759a02005-09-12 18:49:25 +0200354 disable_timer_pin_1 = -1;
355
Andi Kleend1530d82006-04-07 19:49:42 +0200356 if (fullarg(from, "nolapic") || fullarg(from, "disableapic")) {
357 clear_bit(X86_FEATURE_APIC, boot_cpu_data.x86_capability);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700358 disable_apic = 1;
Andi Kleend1530d82006-04-07 19:49:42 +0200359 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700360
Andi Kleen681558f2006-03-25 16:29:46 +0100361 if (fullarg(from, "noapic"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700362 skip_ioapic_setup = 1;
363
Andi Kleen681558f2006-03-25 16:29:46 +0100364 if (fullarg(from,"apic")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700365 skip_ioapic_setup = 0;
366 ioapic_force = 1;
367 }
368
369 if (!memcmp(from, "mem=", 4))
370 parse_memopt(from+4, &from);
371
akpm@osdl.org69cda7b2006-01-09 20:51:46 -0800372 if (!memcmp(from, "memmap=", 7)) {
373 /* exactmap option is for used defined memory */
374 if (!memcmp(from+7, "exactmap", 8)) {
375#ifdef CONFIG_CRASH_DUMP
376 /* If we are doing a crash dump, we
377 * still need to know the real mem
378 * size before original memory map is
379 * reset.
380 */
381 saved_max_pfn = e820_end_of_ram();
382#endif
383 from += 8+7;
384 end_pfn_map = 0;
385 e820.nr_map = 0;
386 userdef = 1;
387 }
388 else {
389 parse_memmapopt(from+7, &from);
390 userdef = 1;
391 }
392 }
393
Matt Tolentino2b976902005-06-23 00:08:06 -0700394#ifdef CONFIG_NUMA
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395 if (!memcmp(from, "numa=", 5))
396 numa_setup(from+5);
397#endif
398
Linus Torvalds1da177e2005-04-16 15:20:36 -0700399 if (!memcmp(from,"iommu=",6)) {
400 iommu_setup(from+6);
401 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700402
Andi Kleen681558f2006-03-25 16:29:46 +0100403 if (fullarg(from,"oops=panic"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700404 panic_on_oops = 1;
405
406 if (!memcmp(from, "noexec=", 7))
407 nonx_setup(from + 7);
408
Eric W. Biederman5f5609d2005-06-25 14:58:04 -0700409#ifdef CONFIG_KEXEC
410 /* crashkernel=size@addr specifies the location to reserve for
411 * a crash kernel. By reserving this memory we guarantee
412 * that linux never set's it up as a DMA target.
413 * Useful for holding code to do something appropriate
414 * after a kernel panic.
415 */
416 else if (!memcmp(from, "crashkernel=", 12)) {
417 unsigned long size, base;
418 size = memparse(from+12, &from);
419 if (*from == '@') {
420 base = memparse(from+1, &from);
421 /* FIXME: Do I want a sanity check
422 * to validate the memory range?
423 */
424 crashk_res.start = base;
425 crashk_res.end = base + size - 1;
426 }
427 }
428#endif
429
Vivek Goyalaac04b32006-01-09 20:51:47 -0800430#ifdef CONFIG_PROC_VMCORE
431 /* elfcorehdr= specifies the location of elf core header
432 * stored by the crashed kernel. This option will be passed
433 * by kexec loader to the capture kernel.
434 */
435 else if(!memcmp(from, "elfcorehdr=", 11))
436 elfcorehdr_addr = memparse(from+11, &from);
437#endif
Andi Kleene2c03882006-02-26 04:18:46 +0100438
Brian Magnusond5176122006-02-27 04:02:04 +0100439#ifdef CONFIG_HOTPLUG_CPU
Andi Kleene2c03882006-02-26 04:18:46 +0100440 else if (!memcmp(from, "additional_cpus=", 16))
441 setup_additional_cpus(from+16);
442#endif
443
Linus Torvalds1da177e2005-04-16 15:20:36 -0700444 next_char:
445 c = *(from++);
446 if (!c)
447 break;
448 if (COMMAND_LINE_SIZE <= ++len)
449 break;
450 *(to++) = c;
451 }
akpm@osdl.org69cda7b2006-01-09 20:51:46 -0800452 if (userdef) {
453 printk(KERN_INFO "user-defined physical RAM map:\n");
454 e820_print_map("user");
455 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700456 *to = '\0';
457 *cmdline_p = command_line;
458}
459
Matt Tolentino2b976902005-06-23 00:08:06 -0700460#ifndef CONFIG_NUMA
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700461static void __init
462contig_initmem_init(unsigned long start_pfn, unsigned long end_pfn)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700463{
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700464 unsigned long bootmap_size, bootmap;
465
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700466 bootmap_size = bootmem_bootmap_pages(end_pfn)<<PAGE_SHIFT;
467 bootmap = find_e820_area(0, end_pfn<<PAGE_SHIFT, bootmap_size);
468 if (bootmap == -1L)
469 panic("Cannot find bootmem map of size %ld\n",bootmap_size);
470 bootmap_size = init_bootmem(bootmap >> PAGE_SHIFT, end_pfn);
471 e820_bootmem_free(NODE_DATA(0), 0, end_pfn << PAGE_SHIFT);
472 reserve_bootmem(bootmap, bootmap_size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700473}
474#endif
475
476/* Use inline assembly to define this because the nops are defined
477 as inline assembly strings in the include files and we cannot
478 get them easily into strings. */
479asm("\t.data\nk8nops: "
480 K8_NOP1 K8_NOP2 K8_NOP3 K8_NOP4 K8_NOP5 K8_NOP6
481 K8_NOP7 K8_NOP8);
482
483extern unsigned char k8nops[];
484static unsigned char *k8_nops[ASM_NOP_MAX+1] = {
485 NULL,
486 k8nops,
487 k8nops + 1,
488 k8nops + 1 + 2,
489 k8nops + 1 + 2 + 3,
490 k8nops + 1 + 2 + 3 + 4,
491 k8nops + 1 + 2 + 3 + 4 + 5,
492 k8nops + 1 + 2 + 3 + 4 + 5 + 6,
493 k8nops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
494};
495
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100496extern char __vsyscall_0;
497
Linus Torvalds1da177e2005-04-16 15:20:36 -0700498/* Replace instructions with better alternatives for this CPU type.
499
500 This runs before SMP is initialized to avoid SMP problems with
501 self modifying code. This implies that assymetric systems where
502 APs have less capabilities than the boot processor are not handled.
503 In this case boot with "noreplacement". */
504void apply_alternatives(void *start, void *end)
505{
506 struct alt_instr *a;
507 int diff, i, k;
508 for (a = start; (void *)a < end; a++) {
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100509 u8 *instr;
510
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511 if (!boot_cpu_has(a->cpuid))
512 continue;
513
514 BUG_ON(a->replacementlen > a->instrlen);
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100515 instr = a->instr;
516 /* vsyscall code is not mapped yet. resolve it manually. */
517 if (instr >= (u8 *)VSYSCALL_START && instr < (u8*)VSYSCALL_END)
518 instr = __va(instr - (u8*)VSYSCALL_START + (u8*)__pa_symbol(&__vsyscall_0));
519 __inline_memcpy(instr, a->replacement, a->replacementlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700520 diff = a->instrlen - a->replacementlen;
521
522 /* Pad the rest with nops */
523 for (i = a->replacementlen; diff > 0; diff -= k, i += k) {
524 k = diff;
525 if (k > ASM_NOP_MAX)
526 k = ASM_NOP_MAX;
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100527 __inline_memcpy(instr + i, k8_nops[k], k);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700528 }
529 }
530}
531
532static int no_replacement __initdata = 0;
533
534void __init alternative_instructions(void)
535{
536 extern struct alt_instr __alt_instructions[], __alt_instructions_end[];
537 if (no_replacement)
538 return;
539 apply_alternatives(__alt_instructions, __alt_instructions_end);
540}
541
542static int __init noreplacement_setup(char *s)
543{
544 no_replacement = 1;
OGAWA Hirofumi9b410462006-03-31 02:30:33 -0800545 return 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700546}
547
548__setup("noreplacement", noreplacement_setup);
549
#if defined(CONFIG_EDD) || defined(CONFIG_EDD_MODULE)
struct edd edd;
#ifdef CONFIG_EDD_MODULE
EXPORT_SYMBOL(edd);
#endif
/**
 * copy_edd() - Copy the BIOS EDD information
 *              from boot_params into a safe place.
 *
 * Fills the global edd structure: the entry counts first, then the MBR
 * signature and EDD info arrays (each copied in full).
 */
static inline void copy_edd(void)
{
	edd.mbr_signature_nr = EDD_MBR_SIG_NR;
	edd.edd_info_nr = EDD_NR;

	memcpy(edd.mbr_signature, EDD_MBR_SIGNATURE, sizeof(edd.mbr_signature));
	memcpy(edd.edd_info, EDD_BUF, sizeof(edd.edd_info));
}
#else
/* EDD support not configured: nothing to copy. */
static inline void copy_edd(void)
{
}
#endif
572
573#define EBDA_ADDR_POINTER 0x40E
574static void __init reserve_ebda_region(void)
575{
576 unsigned int addr;
577 /**
578 * there is a real-mode segmented pointer pointing to the
579 * 4K EBDA area at 0x40E
580 */
581 addr = *(unsigned short *)phys_to_virt(EBDA_ADDR_POINTER);
582 addr <<= 4;
583 if (addr)
584 reserve_bootmem_generic(addr, PAGE_SIZE);
585}
586
587void __init setup_arch(char **cmdline_p)
588{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700589 unsigned long kernel_end;
590
591 ROOT_DEV = old_decode_dev(ORIG_ROOT_DEV);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700592 screen_info = SCREEN_INFO;
593 edid_info = EDID_INFO;
594 saved_video_mode = SAVED_VIDEO_MODE;
595 bootloader_type = LOADER_TYPE;
596
597#ifdef CONFIG_BLK_DEV_RAM
598 rd_image_start = RAMDISK_FLAGS & RAMDISK_IMAGE_START_MASK;
599 rd_prompt = ((RAMDISK_FLAGS & RAMDISK_PROMPT_FLAG) != 0);
600 rd_doload = ((RAMDISK_FLAGS & RAMDISK_LOAD_FLAG) != 0);
601#endif
602 setup_memory_region();
603 copy_edd();
604
605 if (!MOUNT_ROOT_RDONLY)
606 root_mountflags &= ~MS_RDONLY;
607 init_mm.start_code = (unsigned long) &_text;
608 init_mm.end_code = (unsigned long) &_etext;
609 init_mm.end_data = (unsigned long) &_edata;
610 init_mm.brk = (unsigned long) &_end;
611
612 code_resource.start = virt_to_phys(&_text);
613 code_resource.end = virt_to_phys(&_etext)-1;
614 data_resource.start = virt_to_phys(&_etext);
615 data_resource.end = virt_to_phys(&_edata)-1;
616
617 parse_cmdline_early(cmdline_p);
618
619 early_identify_cpu(&boot_cpu_data);
620
621 /*
622 * partially used pages are not usable - thus
623 * we are rounding upwards:
624 */
625 end_pfn = e820_end_of_ram();
Andi Kleen1f502492006-03-25 16:29:58 +0100626 num_physpages = end_pfn; /* for pfn_valid */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700627
628 check_efer();
629
630 init_memory_mapping(0, (end_pfn_map << PAGE_SHIFT));
631
Andi Kleenf2d3efe2006-03-25 16:30:22 +0100632 dmi_scan_machine();
633
Siddha, Suresh Bf6c2e332005-11-05 17:25:53 +0100634 zap_low_mappings(0);
635
Len Brown888ba6c2005-08-24 12:07:20 -0400636#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -0700637 /*
638 * Initialize the ACPI boot-time table parser (gets the RSDP and SDT).
639 * Call this early for SRAT node setup.
640 */
641 acpi_boot_table_init();
642#endif
643
644#ifdef CONFIG_ACPI_NUMA
645 /*
646 * Parse SRAT to discover nodes.
647 */
648 acpi_numa_init();
649#endif
650
Matt Tolentino2b976902005-06-23 00:08:06 -0700651#ifdef CONFIG_NUMA
Linus Torvalds1da177e2005-04-16 15:20:36 -0700652 numa_initmem_init(0, end_pfn);
653#else
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700654 contig_initmem_init(0, end_pfn);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700655#endif
656
657 /* Reserve direct mapping */
658 reserve_bootmem_generic(table_start << PAGE_SHIFT,
659 (table_end - table_start) << PAGE_SHIFT);
660
661 /* reserve kernel */
662 kernel_end = round_up(__pa_symbol(&_end),PAGE_SIZE);
663 reserve_bootmem_generic(HIGH_MEMORY, kernel_end - HIGH_MEMORY);
664
665 /*
666 * reserve physical page 0 - it's a special BIOS page on many boxes,
667 * enabling clean reboots, SMP operation, laptop functions.
668 */
669 reserve_bootmem_generic(0, PAGE_SIZE);
670
671 /* reserve ebda region */
672 reserve_ebda_region();
673
674#ifdef CONFIG_SMP
675 /*
676 * But first pinch a few for the stack/trampoline stuff
677 * FIXME: Don't need the extra page at 4K, but need to fix
678 * trampoline before removing it. (see the GDT stuff)
679 */
680 reserve_bootmem_generic(PAGE_SIZE, PAGE_SIZE);
681
682 /* Reserve SMP trampoline */
683 reserve_bootmem_generic(SMP_TRAMPOLINE_BASE, PAGE_SIZE);
684#endif
685
686#ifdef CONFIG_ACPI_SLEEP
687 /*
688 * Reserve low memory region for sleep support.
689 */
690 acpi_reserve_bootmem();
691#endif
692#ifdef CONFIG_X86_LOCAL_APIC
693 /*
694 * Find and reserve possible boot-time SMP configuration:
695 */
696 find_smp_config();
697#endif
698#ifdef CONFIG_BLK_DEV_INITRD
699 if (LOADER_TYPE && INITRD_START) {
700 if (INITRD_START + INITRD_SIZE <= (end_pfn << PAGE_SHIFT)) {
701 reserve_bootmem_generic(INITRD_START, INITRD_SIZE);
702 initrd_start =
703 INITRD_START ? INITRD_START + PAGE_OFFSET : 0;
704 initrd_end = initrd_start+INITRD_SIZE;
705 }
706 else {
707 printk(KERN_ERR "initrd extends beyond end of memory "
708 "(0x%08lx > 0x%08lx)\ndisabling initrd\n",
709 (unsigned long)(INITRD_START + INITRD_SIZE),
710 (unsigned long)(end_pfn << PAGE_SHIFT));
711 initrd_start = 0;
712 }
713 }
714#endif
Eric W. Biederman5f5609d2005-06-25 14:58:04 -0700715#ifdef CONFIG_KEXEC
716 if (crashk_res.start != crashk_res.end) {
717 reserve_bootmem(crashk_res.start,
718 crashk_res.end - crashk_res.start + 1);
719 }
720#endif
Eric W. Biederman0d317fb2005-08-06 13:47:36 -0600721
Linus Torvalds1da177e2005-04-16 15:20:36 -0700722 paging_init();
723
724 check_ioapic();
725
Ashok Raj51f62e12006-03-25 16:29:28 +0100726 /*
727 * set this early, so we dont allocate cpu0
728 * if MADT list doesnt list BSP first
729 * mpparse.c/MP_processor_info() allocates logical cpu numbers.
730 */
731 cpu_set(0, cpu_present_map);
Len Brown888ba6c2005-08-24 12:07:20 -0400732#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -0700733 /*
734 * Read APIC and some other early information from ACPI tables.
735 */
736 acpi_boot_init();
737#endif
738
Ravikiran Thirumalai05b3cbd2006-01-11 22:45:36 +0100739 init_cpu_to_node();
740
Linus Torvalds1da177e2005-04-16 15:20:36 -0700741#ifdef CONFIG_X86_LOCAL_APIC
742 /*
743 * get boot-time SMP configuration:
744 */
745 if (smp_found_config)
746 get_smp_config();
747 init_apic_mappings();
748#endif
749
750 /*
751 * Request address space for all standard RAM and ROM resources
752 * and also for regions reported as reserved by the e820.
753 */
754 probe_roms();
755 e820_reserve_resources();
756
757 request_resource(&iomem_resource, &video_ram_resource);
758
759 {
760 unsigned i;
761 /* request I/O space for devices used on all i[345]86 PCs */
762 for (i = 0; i < STANDARD_IO_RESOURCES; i++)
763 request_resource(&ioport_resource, &standard_io_resources[i]);
764 }
765
Andi Kleena1e97782005-04-16 15:25:12 -0700766 e820_setup_gap();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700767
768#ifdef CONFIG_GART_IOMMU
Jon Mason5b7b6442006-02-03 21:51:59 +0100769 iommu_hole_init();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700770#endif
771
772#ifdef CONFIG_VT
773#if defined(CONFIG_VGA_CONSOLE)
774 conswitchp = &vga_con;
775#elif defined(CONFIG_DUMMY_CONSOLE)
776 conswitchp = &dummy_con;
777#endif
778#endif
779}
780
Ashok Raje6982c62005-06-25 14:54:58 -0700781static int __cpuinit get_model_name(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700782{
783 unsigned int *v;
784
Andi Kleenebfcaa92005-04-16 15:25:18 -0700785 if (c->extended_cpuid_level < 0x80000004)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700786 return 0;
787
788 v = (unsigned int *) c->x86_model_id;
789 cpuid(0x80000002, &v[0], &v[1], &v[2], &v[3]);
790 cpuid(0x80000003, &v[4], &v[5], &v[6], &v[7]);
791 cpuid(0x80000004, &v[8], &v[9], &v[10], &v[11]);
792 c->x86_model_id[48] = 0;
793 return 1;
794}
795
796
Ashok Raje6982c62005-06-25 14:54:58 -0700797static void __cpuinit display_cacheinfo(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700798{
799 unsigned int n, dummy, eax, ebx, ecx, edx;
800
Andi Kleenebfcaa92005-04-16 15:25:18 -0700801 n = c->extended_cpuid_level;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700802
803 if (n >= 0x80000005) {
804 cpuid(0x80000005, &dummy, &ebx, &ecx, &edx);
805 printk(KERN_INFO "CPU: L1 I Cache: %dK (%d bytes/line), D cache %dK (%d bytes/line)\n",
806 edx>>24, edx&0xFF, ecx>>24, ecx&0xFF);
807 c->x86_cache_size=(ecx>>24)+(edx>>24);
808 /* On K8 L1 TLB is inclusive, so don't count it */
809 c->x86_tlbsize = 0;
810 }
811
812 if (n >= 0x80000006) {
813 cpuid(0x80000006, &dummy, &ebx, &ecx, &edx);
814 ecx = cpuid_ecx(0x80000006);
815 c->x86_cache_size = ecx >> 16;
816 c->x86_tlbsize += ((ebx >> 16) & 0xfff) + (ebx & 0xfff);
817
818 printk(KERN_INFO "CPU: L2 Cache: %dK (%d bytes/line)\n",
819 c->x86_cache_size, ecx & 0xFF);
820 }
821
822 if (n >= 0x80000007)
823 cpuid(0x80000007, &dummy, &dummy, &dummy, &c->x86_power);
824 if (n >= 0x80000008) {
825 cpuid(0x80000008, &eax, &dummy, &dummy, &dummy);
826 c->x86_virt_bits = (eax >> 8) & 0xff;
827 c->x86_phys_bits = eax & 0xff;
828 }
829}
830
#ifdef CONFIG_NUMA
/*
 * Find an online node belonging to a neighbouring APIC id.
 *
 * The ids below @apicid are tried first (closest first), then the ids
 * above it up to MAX_LOCAL_APIC.  Falls back to the first online node
 * when no neighbour maps to an online node.
 */
static int nearby_node(int apicid)
{
	int probe;
	int node;

	probe = apicid - 1;
	while (probe >= 0) {
		node = apicid_to_node[probe];
		if (node != NUMA_NO_NODE && node_online(node))
			return node;
		probe--;
	}

	probe = apicid + 1;
	while (probe < MAX_LOCAL_APIC) {
		node = apicid_to_node[probe];
		if (node != NUMA_NO_NODE && node_online(node))
			return node;
		probe++;
	}

	return first_node(node_online_map); /* Shouldn't happen */
}
#endif
848
Andi Kleen63518642005-04-16 15:25:16 -0700849/*
850 * On a AMD dual core setup the lower bits of the APIC id distingush the cores.
851 * Assumes number of cores is a power of two.
852 */
853static void __init amd_detect_cmp(struct cpuinfo_x86 *c)
854{
855#ifdef CONFIG_SMP
Andi Kleen29422832005-05-16 21:53:26 -0700856 int cpu = smp_processor_id();
Andi Kleenb41e2932005-05-20 14:27:55 -0700857 unsigned bits;
Andi Kleen3f098c22005-09-12 18:49:24 +0200858#ifdef CONFIG_NUMA
859 int node = 0;
Ravikiran G Thirumalai60c1bc82006-03-25 16:30:04 +0100860 unsigned apicid = hard_smp_processor_id();
Andi Kleen3f098c22005-09-12 18:49:24 +0200861#endif
Andi Kleenb41e2932005-05-20 14:27:55 -0700862
863 bits = 0;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100864 while ((1 << bits) < c->x86_max_cores)
Andi Kleenb41e2932005-05-20 14:27:55 -0700865 bits++;
866
867 /* Low order bits define the core id (index of core in socket) */
868 cpu_core_id[cpu] = phys_proc_id[cpu] & ((1 << bits)-1);
869 /* Convert the APIC ID into the socket ID */
Ravikiran G Thirumalai60c1bc82006-03-25 16:30:04 +0100870 phys_proc_id[cpu] = phys_pkg_id(bits);
Andi Kleen63518642005-04-16 15:25:16 -0700871
872#ifdef CONFIG_NUMA
Andi Kleen3f098c22005-09-12 18:49:24 +0200873 node = phys_proc_id[cpu];
874 if (apicid_to_node[apicid] != NUMA_NO_NODE)
875 node = apicid_to_node[apicid];
876 if (!node_online(node)) {
877 /* Two possibilities here:
878 - The CPU is missing memory and no node was created.
879 In that case try picking one from a nearby CPU
880 - The APIC IDs differ from the HyperTransport node IDs
881 which the K8 northbridge parsing fills in.
882 Assume they are all increased by a constant offset,
883 but in the same order as the HT nodeids.
884 If that doesn't result in a usable node fall back to the
885 path for the previous case. */
886 int ht_nodeid = apicid - (phys_proc_id[0] << bits);
887 if (ht_nodeid >= 0 &&
888 apicid_to_node[ht_nodeid] != NUMA_NO_NODE)
889 node = apicid_to_node[ht_nodeid];
890 /* Pick a nearby node */
891 if (!node_online(node))
892 node = nearby_node(apicid);
893 }
Andi Kleen69d81fc2005-11-05 17:25:53 +0100894 numa_set_node(cpu, node);
Andi Kleena1586082005-05-16 21:53:21 -0700895
Andi Kleen77d910f2006-03-25 16:29:34 +0100896 printk(KERN_INFO "CPU %d/%x(%d) -> Node %d -> Core %d\n",
897 cpu, apicid, c->x86_max_cores, node, cpu_core_id[cpu]);
Andi Kleen3f098c22005-09-12 18:49:24 +0200898#endif
Andi Kleen63518642005-04-16 15:25:16 -0700899#endif
900}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700901
902static int __init init_amd(struct cpuinfo_x86 *c)
903{
904 int r;
Andi Kleen7bcd3f32006-02-03 21:51:02 +0100905 unsigned level;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700906
Linus Torvaldsbc5e8fd2005-09-17 15:41:04 -0700907#ifdef CONFIG_SMP
908 unsigned long value;
909
Andi Kleen7d318d72005-09-29 22:05:55 +0200910 /*
911 * Disable TLB flush filter by setting HWCR.FFDIS on K8
912 * bit 6 of msr C001_0015
913 *
914 * Errata 63 for SH-B3 steppings
915 * Errata 122 for all steppings (F+ have it disabled by default)
916 */
917 if (c->x86 == 15) {
918 rdmsrl(MSR_K8_HWCR, value);
919 value |= 1 << 6;
920 wrmsrl(MSR_K8_HWCR, value);
921 }
Linus Torvaldsbc5e8fd2005-09-17 15:41:04 -0700922#endif
923
Linus Torvalds1da177e2005-04-16 15:20:36 -0700924 /* Bit 31 in normal CPUID used for nonstandard 3DNow ID;
925 3DNow is IDd by bit 31 in extended CPUID (1*32+31) anyway */
926 clear_bit(0*32+31, &c->x86_capability);
927
Andi Kleen7bcd3f32006-02-03 21:51:02 +0100928 /* On C+ stepping K8 rep microcode works well for copy/memset */
929 level = cpuid_eax(1);
930 if (c->x86 == 15 && ((level >= 0x0f48 && level < 0x0f50) || level >= 0x0f58))
931 set_bit(X86_FEATURE_REP_GOOD, &c->x86_capability);
932
Andi Kleen18bd0572006-04-20 02:36:45 +0200933 /* Enable workaround for FXSAVE leak */
934 if (c->x86 >= 6)
935 set_bit(X86_FEATURE_FXSAVE_LEAK, &c->x86_capability);
936
Linus Torvalds1da177e2005-04-16 15:20:36 -0700937 r = get_model_name(c);
938 if (!r) {
939 switch (c->x86) {
940 case 15:
941 /* Should distinguish Models here, but this is only
942 a fallback anyways. */
943 strcpy(c->x86_model_id, "Hammer");
944 break;
945 }
946 }
947 display_cacheinfo(c);
948
Andi Kleen130951c2006-01-11 22:42:02 +0100949 /* c->x86_power is 8000_0007 edx. Bit 8 is constant TSC */
950 if (c->x86_power & (1<<8))
951 set_bit(X86_FEATURE_CONSTANT_TSC, &c->x86_capability);
952
Andi Kleenebfcaa92005-04-16 15:25:18 -0700953 if (c->extended_cpuid_level >= 0x80000008) {
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100954 c->x86_max_cores = (cpuid_ecx(0x80000008) & 0xff) + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700955
Andi Kleen63518642005-04-16 15:25:16 -0700956 amd_detect_cmp(c);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700957 }
958
959 return r;
960}
961
Ashok Raje6982c62005-06-25 14:54:58 -0700962static void __cpuinit detect_ht(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700963{
964#ifdef CONFIG_SMP
965 u32 eax, ebx, ecx, edx;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100966 int index_msb, core_bits;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700967 int cpu = smp_processor_id();
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100968
969 cpuid(1, &eax, &ebx, &ecx, &edx);
970
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100971
Andi Kleen63518642005-04-16 15:25:16 -0700972 if (!cpu_has(c, X86_FEATURE_HT) || cpu_has(c, X86_FEATURE_CMP_LEGACY))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700973 return;
974
Linus Torvalds1da177e2005-04-16 15:20:36 -0700975 smp_num_siblings = (ebx & 0xff0000) >> 16;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100976
Linus Torvalds1da177e2005-04-16 15:20:36 -0700977 if (smp_num_siblings == 1) {
978 printk(KERN_INFO "CPU: Hyper-Threading is disabled\n");
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100979 } else if (smp_num_siblings > 1 ) {
980
Linus Torvalds1da177e2005-04-16 15:20:36 -0700981 if (smp_num_siblings > NR_CPUS) {
982 printk(KERN_WARNING "CPU: Unsupported number of the siblings %d", smp_num_siblings);
983 smp_num_siblings = 1;
984 return;
985 }
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100986
987 index_msb = get_count_order(smp_num_siblings);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700988 phys_proc_id[cpu] = phys_pkg_id(index_msb);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100989
Linus Torvalds1da177e2005-04-16 15:20:36 -0700990 printk(KERN_INFO "CPU: Physical Processor ID: %d\n",
991 phys_proc_id[cpu]);
Andi Kleen3dd9d512005-04-16 15:25:15 -0700992
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100993 smp_num_siblings = smp_num_siblings / c->x86_max_cores;
Andi Kleen3dd9d512005-04-16 15:25:15 -0700994
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100995 index_msb = get_count_order(smp_num_siblings) ;
Andi Kleen3dd9d512005-04-16 15:25:15 -0700996
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100997 core_bits = get_count_order(c->x86_max_cores);
Andi Kleen3dd9d512005-04-16 15:25:15 -0700998
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100999 cpu_core_id[cpu] = phys_pkg_id(index_msb) &
1000 ((1 << core_bits) - 1);
1001
1002 if (c->x86_max_cores > 1)
Andi Kleen3dd9d512005-04-16 15:25:15 -07001003 printk(KERN_INFO "CPU: Processor Core ID: %d\n",
1004 cpu_core_id[cpu]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001005 }
1006#endif
1007}
1008
Andi Kleen3dd9d512005-04-16 15:25:15 -07001009/*
1010 * find out the number of processor cores on the die
1011 */
Ashok Raje6982c62005-06-25 14:54:58 -07001012static int __cpuinit intel_num_cpu_cores(struct cpuinfo_x86 *c)
Andi Kleen3dd9d512005-04-16 15:25:15 -07001013{
1014 unsigned int eax;
1015
1016 if (c->cpuid_level < 4)
1017 return 1;
1018
1019 __asm__("cpuid"
1020 : "=a" (eax)
1021 : "0" (4), "c" (0)
1022 : "bx", "dx");
1023
1024 if (eax & 0x1f)
1025 return ((eax >> 26) + 1);
1026 else
1027 return 1;
1028}
1029
/*
 * Bind the current CPU to the NUMA node recorded for its APIC id in
 * apicid_to_node[], defaulting to node 0 when no node is recorded.
 * Compiles to an empty function without CONFIG_NUMA.
 */
static void srat_detect_node(void)
{
#ifdef CONFIG_NUMA
	int this_cpu = smp_processor_id();
	/* Deliberately none of the fallback heuristics the AMD path uses. */
	unsigned nid = apicid_to_node[hard_smp_processor_id()];

	if (node_is_unset(nid))
		nid = 0;

	numa_set_node(this_cpu, nid);

	if (acpi_numa > 0)
		printk(KERN_INFO "CPU %d -> Node %d\n", this_cpu, nid);
#endif
}
1047
Ashok Raje6982c62005-06-25 14:54:58 -07001048static void __cpuinit init_intel(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001049{
1050 /* Cache sizes */
1051 unsigned n;
1052
1053 init_intel_cacheinfo(c);
Andi Kleenebfcaa92005-04-16 15:25:18 -07001054 n = c->extended_cpuid_level;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001055 if (n >= 0x80000008) {
1056 unsigned eax = cpuid_eax(0x80000008);
1057 c->x86_virt_bits = (eax >> 8) & 0xff;
1058 c->x86_phys_bits = eax & 0xff;
Shaohua Liaf9c1422005-11-05 17:25:54 +01001059 /* CPUID workaround for Intel 0F34 CPU */
1060 if (c->x86_vendor == X86_VENDOR_INTEL &&
1061 c->x86 == 0xF && c->x86_model == 0x3 &&
1062 c->x86_mask == 0x4)
1063 c->x86_phys_bits = 36;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001064 }
1065
1066 if (c->x86 == 15)
1067 c->x86_cache_alignment = c->x86_clflush_size * 2;
Andi Kleen39b3a792006-01-11 22:42:45 +01001068 if ((c->x86 == 0xf && c->x86_model >= 0x03) ||
1069 (c->x86 == 0x6 && c->x86_model >= 0x0e))
Andi Kleenc29601e2005-04-16 15:25:05 -07001070 set_bit(X86_FEATURE_CONSTANT_TSC, &c->x86_capability);
Andi Kleenc818a182006-01-11 22:45:24 +01001071 set_bit(X86_FEATURE_SYNC_RDTSC, &c->x86_capability);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001072 c->x86_max_cores = intel_num_cpu_cores(c);
Andi Kleendf0cc262005-09-12 18:49:24 +02001073
1074 srat_detect_node();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001075}
1076
Adrian Bunk672289e2005-09-10 00:27:21 -07001077static void __cpuinit get_cpu_vendor(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001078{
1079 char *v = c->x86_vendor_id;
1080
1081 if (!strcmp(v, "AuthenticAMD"))
1082 c->x86_vendor = X86_VENDOR_AMD;
1083 else if (!strcmp(v, "GenuineIntel"))
1084 c->x86_vendor = X86_VENDOR_INTEL;
1085 else
1086 c->x86_vendor = X86_VENDOR_UNKNOWN;
1087}
1088
/*
 * Table entry associating a vendor/family pair with up to 16 model names.
 * NOTE(review): presumably model_names[] is indexed by model number -
 * no user of this struct is visible here, confirm before relying on it.
 */
struct cpu_model_info {
	int vendor;		/* vendor code */
	int family;		/* CPU family */
	char *model_names[16];	/* model name strings */
};
1094
1095/* Do some early cpuid on the boot CPU to get some parameter that are
1096 needed before check_bugs. Everything advanced is in identify_cpu
1097 below. */
Ashok Raje6982c62005-06-25 14:54:58 -07001098void __cpuinit early_identify_cpu(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001099{
1100 u32 tfms;
1101
1102 c->loops_per_jiffy = loops_per_jiffy;
1103 c->x86_cache_size = -1;
1104 c->x86_vendor = X86_VENDOR_UNKNOWN;
1105 c->x86_model = c->x86_mask = 0; /* So far unknown... */
1106 c->x86_vendor_id[0] = '\0'; /* Unset */
1107 c->x86_model_id[0] = '\0'; /* Unset */
1108 c->x86_clflush_size = 64;
1109 c->x86_cache_alignment = c->x86_clflush_size;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001110 c->x86_max_cores = 1;
Andi Kleenebfcaa92005-04-16 15:25:18 -07001111 c->extended_cpuid_level = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001112 memset(&c->x86_capability, 0, sizeof c->x86_capability);
1113
1114 /* Get vendor name */
1115 cpuid(0x00000000, (unsigned int *)&c->cpuid_level,
1116 (unsigned int *)&c->x86_vendor_id[0],
1117 (unsigned int *)&c->x86_vendor_id[8],
1118 (unsigned int *)&c->x86_vendor_id[4]);
1119
1120 get_cpu_vendor(c);
1121
1122 /* Initialize the standard set of capabilities */
1123 /* Note that the vendor-specific code below might override */
1124
1125 /* Intel-defined flags: level 0x00000001 */
1126 if (c->cpuid_level >= 0x00000001) {
1127 __u32 misc;
1128 cpuid(0x00000001, &tfms, &misc, &c->x86_capability[4],
1129 &c->x86_capability[0]);
1130 c->x86 = (tfms >> 8) & 0xf;
1131 c->x86_model = (tfms >> 4) & 0xf;
1132 c->x86_mask = tfms & 0xf;
Suresh Siddhaf5f786d2005-11-05 17:25:53 +01001133 if (c->x86 == 0xf)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001134 c->x86 += (tfms >> 20) & 0xff;
Suresh Siddhaf5f786d2005-11-05 17:25:53 +01001135 if (c->x86 >= 0x6)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001136 c->x86_model += ((tfms >> 16) & 0xF) << 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001137 if (c->x86_capability[0] & (1<<19))
1138 c->x86_clflush_size = ((misc >> 8) & 0xff) * 8;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001139 } else {
1140 /* Have CPUID level 0 only - unheard of */
1141 c->x86 = 4;
1142 }
Andi Kleena1586082005-05-16 21:53:21 -07001143
1144#ifdef CONFIG_SMP
Andi Kleenb41e2932005-05-20 14:27:55 -07001145 phys_proc_id[smp_processor_id()] = (cpuid_ebx(1) >> 24) & 0xff;
Andi Kleena1586082005-05-16 21:53:21 -07001146#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001147}
1148
1149/*
1150 * This does the hard work of actually picking apart the CPU stuff...
1151 */
Ashok Raje6982c62005-06-25 14:54:58 -07001152void __cpuinit identify_cpu(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001153{
1154 int i;
1155 u32 xlvl;
1156
1157 early_identify_cpu(c);
1158
1159 /* AMD-defined flags: level 0x80000001 */
1160 xlvl = cpuid_eax(0x80000000);
Andi Kleenebfcaa92005-04-16 15:25:18 -07001161 c->extended_cpuid_level = xlvl;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001162 if ((xlvl & 0xffff0000) == 0x80000000) {
1163 if (xlvl >= 0x80000001) {
1164 c->x86_capability[1] = cpuid_edx(0x80000001);
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001165 c->x86_capability[6] = cpuid_ecx(0x80000001);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001166 }
1167 if (xlvl >= 0x80000004)
1168 get_model_name(c); /* Default name */
1169 }
1170
1171 /* Transmeta-defined flags: level 0x80860001 */
1172 xlvl = cpuid_eax(0x80860000);
1173 if ((xlvl & 0xffff0000) == 0x80860000) {
1174 /* Don't set x86_cpuid_level here for now to not confuse. */
1175 if (xlvl >= 0x80860001)
1176 c->x86_capability[2] = cpuid_edx(0x80860001);
1177 }
1178
Siddha, Suresh B1e9f28f2006-03-27 01:15:22 -08001179 c->apicid = phys_pkg_id(0);
1180
Linus Torvalds1da177e2005-04-16 15:20:36 -07001181 /*
1182 * Vendor-specific initialization. In this section we
1183 * canonicalize the feature flags, meaning if there are
1184 * features a certain CPU supports which CPUID doesn't
1185 * tell us, CPUID claiming incorrect flags, or other bugs,
1186 * we handle them here.
1187 *
1188 * At the end of this section, c->x86_capability better
1189 * indicate the features this CPU genuinely supports!
1190 */
1191 switch (c->x86_vendor) {
1192 case X86_VENDOR_AMD:
1193 init_amd(c);
1194 break;
1195
1196 case X86_VENDOR_INTEL:
1197 init_intel(c);
1198 break;
1199
1200 case X86_VENDOR_UNKNOWN:
1201 default:
1202 display_cacheinfo(c);
1203 break;
1204 }
1205
1206 select_idle_routine(c);
1207 detect_ht(c);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001208
1209 /*
1210 * On SMP, boot_cpu_data holds the common feature set between
1211 * all CPUs; so make sure that we indicate which features are
1212 * common between the CPUs. The first time this routine gets
1213 * executed, c == &boot_cpu_data.
1214 */
1215 if (c != &boot_cpu_data) {
1216 /* AND the already accumulated flags with these */
1217 for (i = 0 ; i < NCAPINTS ; i++)
1218 boot_cpu_data.x86_capability[i] &= c->x86_capability[i];
1219 }
1220
1221#ifdef CONFIG_X86_MCE
1222 mcheck_init(c);
1223#endif
Shaohua Li3b520b22005-07-07 17:56:38 -07001224 if (c == &boot_cpu_data)
1225 mtrr_bp_init();
1226 else
1227 mtrr_ap_init();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001228#ifdef CONFIG_NUMA
Andi Kleen3019e8e2005-07-28 21:15:28 -07001229 numa_add_cpu(smp_processor_id());
Linus Torvalds1da177e2005-04-16 15:20:36 -07001230#endif
1231}
1232
1233
Ashok Raje6982c62005-06-25 14:54:58 -07001234void __cpuinit print_cpu_info(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001235{
1236 if (c->x86_model_id[0])
1237 printk("%s", c->x86_model_id);
1238
1239 if (c->x86_mask || c->cpuid_level >= 0)
1240 printk(" stepping %02x\n", c->x86_mask);
1241 else
1242 printk("\n");
1243}
1244
1245/*
1246 * Get CPU information for use by the procfs.
1247 */
1248
1249static int show_cpuinfo(struct seq_file *m, void *v)
1250{
1251 struct cpuinfo_x86 *c = v;
1252
1253 /*
1254 * These flag bits must match the definitions in <asm/cpufeature.h>.
1255 * NULL means this bit is undefined or reserved; either way it doesn't
1256 * have meaning as far as Linux is concerned. Note that it's important
1257 * to realize there is a difference between this table and CPUID -- if
1258 * applications want to get the raw CPUID data, they should access
1259 * /dev/cpu/<cpu_nr>/cpuid instead.
1260 */
1261 static char *x86_cap_flags[] = {
1262 /* Intel-defined */
1263 "fpu", "vme", "de", "pse", "tsc", "msr", "pae", "mce",
1264 "cx8", "apic", NULL, "sep", "mtrr", "pge", "mca", "cmov",
1265 "pat", "pse36", "pn", "clflush", NULL, "dts", "acpi", "mmx",
1266 "fxsr", "sse", "sse2", "ss", "ht", "tm", "ia64", NULL,
1267
1268 /* AMD-defined */
Zwane Mwaikambo3c3b73b2005-05-01 08:58:51 -07001269 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001270 NULL, NULL, NULL, "syscall", NULL, NULL, NULL, NULL,
1271 NULL, NULL, NULL, NULL, "nx", NULL, "mmxext", NULL,
Andi Kleen3f98bc42006-01-11 22:42:51 +01001272 NULL, "fxsr_opt", "rdtscp", NULL, NULL, "lm", "3dnowext", "3dnow",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001273
1274 /* Transmeta-defined */
1275 "recovery", "longrun", NULL, "lrti", NULL, NULL, NULL, NULL,
1276 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1277 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1278 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1279
1280 /* Other (Linux-defined) */
Andi Kleen622dcaf2005-05-16 21:53:26 -07001281 "cxmmx", NULL, "cyrix_arr", "centaur_mcr", NULL,
Andi Kleenc29601e2005-04-16 15:25:05 -07001282 "constant_tsc", NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001283 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1284 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1285 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1286
1287 /* Intel-defined (#2) */
Andi Kleen9d95dd82006-03-25 16:31:22 +01001288 "pni", NULL, NULL, "monitor", "ds_cpl", "vmx", "smx", "est",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001289 "tm2", NULL, "cid", NULL, NULL, "cx16", "xtpr", NULL,
1290 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1291 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1292
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001293 /* VIA/Cyrix/Centaur-defined */
1294 NULL, NULL, "rng", "rng_en", NULL, NULL, "ace", "ace_en",
1295 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1296 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1297 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1298
Linus Torvalds1da177e2005-04-16 15:20:36 -07001299 /* AMD-defined (#2) */
Andi Kleen3f98bc42006-01-11 22:42:51 +01001300 "lahf_lm", "cmp_legacy", "svm", NULL, "cr8_legacy", NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001301 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1302 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001303 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001304 };
1305 static char *x86_power_flags[] = {
1306 "ts", /* temperature sensor */
1307 "fid", /* frequency id control */
1308 "vid", /* voltage id control */
1309 "ttp", /* thermal trip */
1310 "tm",
Andi Kleen3f98bc42006-01-11 22:42:51 +01001311 "stc",
1312 NULL,
Andi Kleen39b3a792006-01-11 22:42:45 +01001313 /* nothing */ /* constant_tsc - moved to flags */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001314 };
1315
1316
1317#ifdef CONFIG_SMP
1318 if (!cpu_online(c-cpu_data))
1319 return 0;
1320#endif
1321
1322 seq_printf(m,"processor\t: %u\n"
1323 "vendor_id\t: %s\n"
1324 "cpu family\t: %d\n"
1325 "model\t\t: %d\n"
1326 "model name\t: %s\n",
1327 (unsigned)(c-cpu_data),
1328 c->x86_vendor_id[0] ? c->x86_vendor_id : "unknown",
1329 c->x86,
1330 (int)c->x86_model,
1331 c->x86_model_id[0] ? c->x86_model_id : "unknown");
1332
1333 if (c->x86_mask || c->cpuid_level >= 0)
1334 seq_printf(m, "stepping\t: %d\n", c->x86_mask);
1335 else
1336 seq_printf(m, "stepping\t: unknown\n");
1337
1338 if (cpu_has(c,X86_FEATURE_TSC)) {
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -08001339 unsigned int freq = cpufreq_quick_get((unsigned)(c-cpu_data));
1340 if (!freq)
1341 freq = cpu_khz;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001342 seq_printf(m, "cpu MHz\t\t: %u.%03u\n",
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -08001343 freq / 1000, (freq % 1000));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001344 }
1345
1346 /* Cache size */
1347 if (c->x86_cache_size >= 0)
1348 seq_printf(m, "cache size\t: %d KB\n", c->x86_cache_size);
1349
1350#ifdef CONFIG_SMP
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001351 if (smp_num_siblings * c->x86_max_cores > 1) {
Andi Kleendb468682005-04-16 15:24:51 -07001352 int cpu = c - cpu_data;
1353 seq_printf(m, "physical id\t: %d\n", phys_proc_id[cpu]);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001354 seq_printf(m, "siblings\t: %d\n", cpus_weight(cpu_core_map[cpu]));
Siddha, Suresh Bd31ddaa2005-04-16 15:25:20 -07001355 seq_printf(m, "core id\t\t: %d\n", cpu_core_id[cpu]);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001356 seq_printf(m, "cpu cores\t: %d\n", c->booted_cores);
Andi Kleendb468682005-04-16 15:24:51 -07001357 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001358#endif
1359
1360 seq_printf(m,
1361 "fpu\t\t: yes\n"
1362 "fpu_exception\t: yes\n"
1363 "cpuid level\t: %d\n"
1364 "wp\t\t: yes\n"
1365 "flags\t\t:",
1366 c->cpuid_level);
1367
1368 {
1369 int i;
1370 for ( i = 0 ; i < 32*NCAPINTS ; i++ )
Akinobu Mita3d1712c2006-03-24 03:15:11 -08001371 if (cpu_has(c, i) && x86_cap_flags[i] != NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001372 seq_printf(m, " %s", x86_cap_flags[i]);
1373 }
1374
1375 seq_printf(m, "\nbogomips\t: %lu.%02lu\n",
1376 c->loops_per_jiffy/(500000/HZ),
1377 (c->loops_per_jiffy/(5000/HZ)) % 100);
1378
1379 if (c->x86_tlbsize > 0)
1380 seq_printf(m, "TLB size\t: %d 4K pages\n", c->x86_tlbsize);
1381 seq_printf(m, "clflush size\t: %d\n", c->x86_clflush_size);
1382 seq_printf(m, "cache_alignment\t: %d\n", c->x86_cache_alignment);
1383
1384 seq_printf(m, "address sizes\t: %u bits physical, %u bits virtual\n",
1385 c->x86_phys_bits, c->x86_virt_bits);
1386
1387 seq_printf(m, "power management:");
1388 {
1389 unsigned i;
1390 for (i = 0; i < 32; i++)
1391 if (c->x86_power & (1 << i)) {
Andi Kleen3f98bc42006-01-11 22:42:51 +01001392 if (i < ARRAY_SIZE(x86_power_flags) &&
1393 x86_power_flags[i])
1394 seq_printf(m, "%s%s",
1395 x86_power_flags[i][0]?" ":"",
1396 x86_power_flags[i]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001397 else
1398 seq_printf(m, " [%d]", i);
1399 }
1400 }
Andi Kleen3dd9d512005-04-16 15:25:15 -07001401
Siddha, Suresh Bd31ddaa2005-04-16 15:25:20 -07001402 seq_printf(m, "\n\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001403
Linus Torvalds1da177e2005-04-16 15:20:36 -07001404 return 0;
1405}
1406
1407static void *c_start(struct seq_file *m, loff_t *pos)
1408{
1409 return *pos < NR_CPUS ? cpu_data + *pos : NULL;
1410}
1411
1412static void *c_next(struct seq_file *m, void *v, loff_t *pos)
1413{
1414 ++*pos;
1415 return c_start(m, pos);
1416}
1417
/* seq_file ->stop: intentionally empty. */
static void c_stop(struct seq_file *m, void *v)
{
	/* nothing to do */
}
1421
1422struct seq_operations cpuinfo_op = {
1423 .start =c_start,
1424 .next = c_next,
1425 .stop = c_stop,
1426 .show = show_cpuinfo,
1427};
Andi Kleene9928672006-01-11 22:43:33 +01001428