blob: c50b06765a80ddc16d0d17a59055a8cd42044cea [file] [log] [blame]
/*
 *  linux/arch/x86-64/kernel/setup.c
 *
 *  Copyright (C) 1995  Linus Torvalds
 *
 *  Nov 2001 Dave Jones <davej@suse.de>
 *  Forked from i386 setup code.
 *
 *  $Id$
 */
11
12/*
13 * This file handles the architecture-dependent parts of initialization
14 */
15
16#include <linux/errno.h>
17#include <linux/sched.h>
18#include <linux/kernel.h>
19#include <linux/mm.h>
20#include <linux/stddef.h>
21#include <linux/unistd.h>
22#include <linux/ptrace.h>
23#include <linux/slab.h>
24#include <linux/user.h>
25#include <linux/a.out.h>
26#include <linux/tty.h>
27#include <linux/ioport.h>
28#include <linux/delay.h>
29#include <linux/config.h>
30#include <linux/init.h>
31#include <linux/initrd.h>
32#include <linux/highmem.h>
33#include <linux/bootmem.h>
34#include <linux/module.h>
35#include <asm/processor.h>
36#include <linux/console.h>
37#include <linux/seq_file.h>
Vivek Goyalaac04b32006-01-09 20:51:47 -080038#include <linux/crash_dump.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070039#include <linux/root_dev.h>
40#include <linux/pci.h>
41#include <linux/acpi.h>
42#include <linux/kallsyms.h>
43#include <linux/edd.h>
Matt Tolentinobbfceef2005-06-23 00:08:07 -070044#include <linux/mmzone.h>
Eric W. Biederman5f5609d2005-06-25 14:58:04 -070045#include <linux/kexec.h>
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -080046#include <linux/cpufreq.h>
Andi Kleene9928672006-01-11 22:43:33 +010047#include <linux/dmi.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010048#include <linux/dma-mapping.h>
Andi Kleen681558f2006-03-25 16:29:46 +010049#include <linux/ctype.h>
Matt Tolentinobbfceef2005-06-23 00:08:07 -070050
Linus Torvalds1da177e2005-04-16 15:20:36 -070051#include <asm/mtrr.h>
52#include <asm/uaccess.h>
53#include <asm/system.h>
54#include <asm/io.h>
55#include <asm/smp.h>
56#include <asm/msr.h>
57#include <asm/desc.h>
58#include <video/edid.h>
59#include <asm/e820.h>
60#include <asm/dma.h>
61#include <asm/mpspec.h>
62#include <asm/mmu_context.h>
63#include <asm/bootsetup.h>
64#include <asm/proto.h>
65#include <asm/setup.h>
66#include <asm/mach_apic.h>
67#include <asm/numa.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010068#include <asm/swiotlb.h>
Andi Kleen2bc04142005-11-05 17:25:53 +010069#include <asm/sections.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010070#include <asm/gart-mapping.h>
Andi Kleenf2d3efe2006-03-25 16:30:22 +010071#include <asm/dmi.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070072
73/*
74 * Machine setup..
75 */
76
Ravikiran G Thirumalai6c231b72005-09-06 15:17:45 -070077struct cpuinfo_x86 boot_cpu_data __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -070078
79unsigned long mmu_cr4_features;
80
81int acpi_disabled;
82EXPORT_SYMBOL(acpi_disabled);
Len Brown888ba6c2005-08-24 12:07:20 -040083#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -070084extern int __initdata acpi_ht;
85extern acpi_interrupt_flags acpi_sci_flags;
86int __initdata acpi_force = 0;
87#endif
88
89int acpi_numa __initdata;
90
Linus Torvalds1da177e2005-04-16 15:20:36 -070091/* Boot loader ID as an integer, for the benefit of proc_dointvec */
92int bootloader_type;
93
94unsigned long saved_video_mode;
95
Andi Kleenf2d3efe2006-03-25 16:30:22 +010096/*
97 * Early DMI memory
98 */
99int dmi_alloc_index;
100char dmi_alloc_data[DMI_MAX_DATA];
101
Linus Torvalds1da177e2005-04-16 15:20:36 -0700102/*
103 * Setup options
104 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105struct screen_info screen_info;
106struct sys_desc_table_struct {
107 unsigned short length;
108 unsigned char table[0];
109};
110
111struct edid_info edid_info;
112struct e820map e820;
113
114extern int root_mountflags;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700115
116char command_line[COMMAND_LINE_SIZE];
117
118struct resource standard_io_resources[] = {
119 { .name = "dma1", .start = 0x00, .end = 0x1f,
120 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
121 { .name = "pic1", .start = 0x20, .end = 0x21,
122 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
123 { .name = "timer0", .start = 0x40, .end = 0x43,
124 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
125 { .name = "timer1", .start = 0x50, .end = 0x53,
126 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
127 { .name = "keyboard", .start = 0x60, .end = 0x6f,
128 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
129 { .name = "dma page reg", .start = 0x80, .end = 0x8f,
130 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
131 { .name = "pic2", .start = 0xa0, .end = 0xa1,
132 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
133 { .name = "dma2", .start = 0xc0, .end = 0xdf,
134 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
135 { .name = "fpu", .start = 0xf0, .end = 0xff,
136 .flags = IORESOURCE_BUSY | IORESOURCE_IO }
137};
138
139#define STANDARD_IO_RESOURCES \
140 (sizeof standard_io_resources / sizeof standard_io_resources[0])
141
142#define IORESOURCE_RAM (IORESOURCE_BUSY | IORESOURCE_MEM)
143
144struct resource data_resource = {
145 .name = "Kernel data",
146 .start = 0,
147 .end = 0,
148 .flags = IORESOURCE_RAM,
149};
150struct resource code_resource = {
151 .name = "Kernel code",
152 .start = 0,
153 .end = 0,
154 .flags = IORESOURCE_RAM,
155};
156
157#define IORESOURCE_ROM (IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM)
158
159static struct resource system_rom_resource = {
160 .name = "System ROM",
161 .start = 0xf0000,
162 .end = 0xfffff,
163 .flags = IORESOURCE_ROM,
164};
165
166static struct resource extension_rom_resource = {
167 .name = "Extension ROM",
168 .start = 0xe0000,
169 .end = 0xeffff,
170 .flags = IORESOURCE_ROM,
171};
172
173static struct resource adapter_rom_resources[] = {
174 { .name = "Adapter ROM", .start = 0xc8000, .end = 0,
175 .flags = IORESOURCE_ROM },
176 { .name = "Adapter ROM", .start = 0, .end = 0,
177 .flags = IORESOURCE_ROM },
178 { .name = "Adapter ROM", .start = 0, .end = 0,
179 .flags = IORESOURCE_ROM },
180 { .name = "Adapter ROM", .start = 0, .end = 0,
181 .flags = IORESOURCE_ROM },
182 { .name = "Adapter ROM", .start = 0, .end = 0,
183 .flags = IORESOURCE_ROM },
184 { .name = "Adapter ROM", .start = 0, .end = 0,
185 .flags = IORESOURCE_ROM }
186};
187
188#define ADAPTER_ROM_RESOURCES \
189 (sizeof adapter_rom_resources / sizeof adapter_rom_resources[0])
190
191static struct resource video_rom_resource = {
192 .name = "Video ROM",
193 .start = 0xc0000,
194 .end = 0xc7fff,
195 .flags = IORESOURCE_ROM,
196};
197
198static struct resource video_ram_resource = {
199 .name = "Video RAM area",
200 .start = 0xa0000,
201 .end = 0xbffff,
202 .flags = IORESOURCE_RAM,
203};
204
/* True when the 16-bit word read at x equals the ROM signature 0xaa55. */
#define romsignature(x) (*(unsigned short *)(x) == 0xaa55)

/*
 * romchecksum - check the byte checksum of a ROM image.
 * @rom:    first byte of the image
 * @length: number of bytes to sum
 *
 * Returns 1 when the 8-bit (wrapping) sum of all @length bytes is zero,
 * 0 otherwise.  A @length of 0 sums nothing and therefore returns 1.
 */
static int __init romchecksum(unsigned char *rom, unsigned long length)
{
	const unsigned char *end = rom + length;
	unsigned char sum = 0;

	while (rom < end)
		sum += *rom++;

	return sum == 0;
}
215
216static void __init probe_roms(void)
217{
218 unsigned long start, length, upper;
219 unsigned char *rom;
220 int i;
221
222 /* video rom */
223 upper = adapter_rom_resources[0].start;
224 for (start = video_rom_resource.start; start < upper; start += 2048) {
225 rom = isa_bus_to_virt(start);
226 if (!romsignature(rom))
227 continue;
228
229 video_rom_resource.start = start;
230
231 /* 0 < length <= 0x7f * 512, historically */
232 length = rom[2] * 512;
233
234 /* if checksum okay, trust length byte */
235 if (length && romchecksum(rom, length))
236 video_rom_resource.end = start + length - 1;
237
238 request_resource(&iomem_resource, &video_rom_resource);
239 break;
240 }
241
242 start = (video_rom_resource.end + 1 + 2047) & ~2047UL;
243 if (start < upper)
244 start = upper;
245
246 /* system rom */
247 request_resource(&iomem_resource, &system_rom_resource);
248 upper = system_rom_resource.start;
249
250 /* check for extension rom (ignore length byte!) */
251 rom = isa_bus_to_virt(extension_rom_resource.start);
252 if (romsignature(rom)) {
253 length = extension_rom_resource.end - extension_rom_resource.start + 1;
254 if (romchecksum(rom, length)) {
255 request_resource(&iomem_resource, &extension_rom_resource);
256 upper = extension_rom_resource.start;
257 }
258 }
259
260 /* check for adapter roms on 2k boundaries */
261 for (i = 0; i < ADAPTER_ROM_RESOURCES && start < upper; start += 2048) {
262 rom = isa_bus_to_virt(start);
263 if (!romsignature(rom))
264 continue;
265
266 /* 0 < length <= 0x7f * 512, historically */
267 length = rom[2] * 512;
268
269 /* but accept any length that fits if checksum okay */
270 if (!length || start + length > upper || !romchecksum(rom, length))
271 continue;
272
273 adapter_rom_resources[i].start = start;
274 adapter_rom_resources[i].end = start + length - 1;
275 request_resource(&iomem_resource, &adapter_rom_resources[i]);
276
277 start = adapter_rom_resources[i++].end & ~2047UL;
278 }
279}
280
/*
 * fullarg - check for a full argument with no trailing characters.
 * @p:   current position in the command line
 * @arg: option text to look for
 *
 * Returns 1 when the text at @p starts with @arg and the character
 * right after it is either the end of the string or whitespace,
 * 0 otherwise.  This keeps e.g. "apic" from matching "apicfoo".
 */
static int fullarg(const char *p, const char *arg)
{
	size_t len = strlen(arg);

	/* strncmp stops at the NUL of a short @p instead of reading past it. */
	if (strncmp(p, arg, len) != 0)
		return 0;

	/* Cast so that a negative char value is never handed to isspace(). */
	return p[len] == '\0' || isspace((unsigned char)p[len]);
}
287
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288static __init void parse_cmdline_early (char ** cmdline_p)
289{
290 char c = ' ', *to = command_line, *from = COMMAND_LINE;
291 int len = 0;
akpm@osdl.org69cda7b2006-01-09 20:51:46 -0800292 int userdef = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294 for (;;) {
295 if (c != ' ')
296 goto next_char;
297
298#ifdef CONFIG_SMP
299 /*
300 * If the BIOS enumerates physical processors before logical,
301 * maxcpus=N at enumeration-time can be used to disable HT.
302 */
303 else if (!memcmp(from, "maxcpus=", 8)) {
304 extern unsigned int maxcpus;
305
306 maxcpus = simple_strtoul(from + 8, NULL, 0);
307 }
308#endif
Len Brown888ba6c2005-08-24 12:07:20 -0400309#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -0700310 /* "acpi=off" disables both ACPI table parsing and interpreter init */
Andi Kleen681558f2006-03-25 16:29:46 +0100311 if (fullarg(from,"acpi=off"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312 disable_acpi();
313
Andi Kleen681558f2006-03-25 16:29:46 +0100314 if (fullarg(from, "acpi=force")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315 /* add later when we do DMI horrors: */
316 acpi_force = 1;
317 acpi_disabled = 0;
318 }
319
320 /* acpi=ht just means: do ACPI MADT parsing
321 at bootup, but don't enable the full ACPI interpreter */
Andi Kleen681558f2006-03-25 16:29:46 +0100322 if (fullarg(from, "acpi=ht")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323 if (!acpi_force)
324 disable_acpi();
325 acpi_ht = 1;
326 }
Andi Kleen681558f2006-03-25 16:29:46 +0100327 else if (fullarg(from, "pci=noacpi"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700328 acpi_disable_pci();
Andi Kleen681558f2006-03-25 16:29:46 +0100329 else if (fullarg(from, "acpi=noirq"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700330 acpi_noirq_set();
331
Andi Kleen681558f2006-03-25 16:29:46 +0100332 else if (fullarg(from, "acpi_sci=edge"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700333 acpi_sci_flags.trigger = 1;
Andi Kleen681558f2006-03-25 16:29:46 +0100334 else if (fullarg(from, "acpi_sci=level"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335 acpi_sci_flags.trigger = 3;
Andi Kleen681558f2006-03-25 16:29:46 +0100336 else if (fullarg(from, "acpi_sci=high"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700337 acpi_sci_flags.polarity = 1;
Andi Kleen681558f2006-03-25 16:29:46 +0100338 else if (fullarg(from, "acpi_sci=low"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339 acpi_sci_flags.polarity = 3;
340
341 /* acpi=strict disables out-of-spec workarounds */
Andi Kleen681558f2006-03-25 16:29:46 +0100342 else if (fullarg(from, "acpi=strict")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700343 acpi_strict = 1;
344 }
Andi Kleen22999242005-04-16 15:25:17 -0700345#ifdef CONFIG_X86_IO_APIC
Andi Kleen681558f2006-03-25 16:29:46 +0100346 else if (fullarg(from, "acpi_skip_timer_override"))
Andi Kleen22999242005-04-16 15:25:17 -0700347 acpi_skip_timer_override = 1;
348#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349#endif
350
Andi Kleen681558f2006-03-25 16:29:46 +0100351 if (fullarg(from, "disable_timer_pin_1"))
Chuck Ebbert66759a02005-09-12 18:49:25 +0200352 disable_timer_pin_1 = 1;
Andi Kleen681558f2006-03-25 16:29:46 +0100353 if (fullarg(from, "enable_timer_pin_1"))
Chuck Ebbert66759a02005-09-12 18:49:25 +0200354 disable_timer_pin_1 = -1;
355
Andi Kleend1530d82006-04-07 19:49:42 +0200356 if (fullarg(from, "nolapic") || fullarg(from, "disableapic")) {
357 clear_bit(X86_FEATURE_APIC, boot_cpu_data.x86_capability);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700358 disable_apic = 1;
Andi Kleend1530d82006-04-07 19:49:42 +0200359 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700360
Andi Kleen681558f2006-03-25 16:29:46 +0100361 if (fullarg(from, "noapic"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700362 skip_ioapic_setup = 1;
363
Andi Kleen681558f2006-03-25 16:29:46 +0100364 if (fullarg(from,"apic")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700365 skip_ioapic_setup = 0;
366 ioapic_force = 1;
367 }
368
369 if (!memcmp(from, "mem=", 4))
370 parse_memopt(from+4, &from);
371
akpm@osdl.org69cda7b2006-01-09 20:51:46 -0800372 if (!memcmp(from, "memmap=", 7)) {
373 /* exactmap option is for used defined memory */
374 if (!memcmp(from+7, "exactmap", 8)) {
375#ifdef CONFIG_CRASH_DUMP
376 /* If we are doing a crash dump, we
377 * still need to know the real mem
378 * size before original memory map is
379 * reset.
380 */
381 saved_max_pfn = e820_end_of_ram();
382#endif
383 from += 8+7;
384 end_pfn_map = 0;
385 e820.nr_map = 0;
386 userdef = 1;
387 }
388 else {
389 parse_memmapopt(from+7, &from);
390 userdef = 1;
391 }
392 }
393
Matt Tolentino2b976902005-06-23 00:08:06 -0700394#ifdef CONFIG_NUMA
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395 if (!memcmp(from, "numa=", 5))
396 numa_setup(from+5);
397#endif
398
Linus Torvalds1da177e2005-04-16 15:20:36 -0700399 if (!memcmp(from,"iommu=",6)) {
400 iommu_setup(from+6);
401 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700402
Andi Kleen681558f2006-03-25 16:29:46 +0100403 if (fullarg(from,"oops=panic"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700404 panic_on_oops = 1;
405
406 if (!memcmp(from, "noexec=", 7))
407 nonx_setup(from + 7);
408
Eric W. Biederman5f5609d2005-06-25 14:58:04 -0700409#ifdef CONFIG_KEXEC
410 /* crashkernel=size@addr specifies the location to reserve for
411 * a crash kernel. By reserving this memory we guarantee
412 * that linux never set's it up as a DMA target.
413 * Useful for holding code to do something appropriate
414 * after a kernel panic.
415 */
416 else if (!memcmp(from, "crashkernel=", 12)) {
417 unsigned long size, base;
418 size = memparse(from+12, &from);
419 if (*from == '@') {
420 base = memparse(from+1, &from);
421 /* FIXME: Do I want a sanity check
422 * to validate the memory range?
423 */
424 crashk_res.start = base;
425 crashk_res.end = base + size - 1;
426 }
427 }
428#endif
429
Vivek Goyalaac04b32006-01-09 20:51:47 -0800430#ifdef CONFIG_PROC_VMCORE
431 /* elfcorehdr= specifies the location of elf core header
432 * stored by the crashed kernel. This option will be passed
433 * by kexec loader to the capture kernel.
434 */
435 else if(!memcmp(from, "elfcorehdr=", 11))
436 elfcorehdr_addr = memparse(from+11, &from);
437#endif
Andi Kleene2c03882006-02-26 04:18:46 +0100438
Brian Magnusond5176122006-02-27 04:02:04 +0100439#ifdef CONFIG_HOTPLUG_CPU
Andi Kleene2c03882006-02-26 04:18:46 +0100440 else if (!memcmp(from, "additional_cpus=", 16))
441 setup_additional_cpus(from+16);
442#endif
443
Linus Torvalds1da177e2005-04-16 15:20:36 -0700444 next_char:
445 c = *(from++);
446 if (!c)
447 break;
448 if (COMMAND_LINE_SIZE <= ++len)
449 break;
450 *(to++) = c;
451 }
akpm@osdl.org69cda7b2006-01-09 20:51:46 -0800452 if (userdef) {
453 printk(KERN_INFO "user-defined physical RAM map:\n");
454 e820_print_map("user");
455 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700456 *to = '\0';
457 *cmdline_p = command_line;
458}
459
Matt Tolentino2b976902005-06-23 00:08:06 -0700460#ifndef CONFIG_NUMA
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700461static void __init
462contig_initmem_init(unsigned long start_pfn, unsigned long end_pfn)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700463{
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700464 unsigned long bootmap_size, bootmap;
465
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700466 bootmap_size = bootmem_bootmap_pages(end_pfn)<<PAGE_SHIFT;
467 bootmap = find_e820_area(0, end_pfn<<PAGE_SHIFT, bootmap_size);
468 if (bootmap == -1L)
469 panic("Cannot find bootmem map of size %ld\n",bootmap_size);
470 bootmap_size = init_bootmem(bootmap >> PAGE_SHIFT, end_pfn);
471 e820_bootmem_free(NODE_DATA(0), 0, end_pfn << PAGE_SHIFT);
472 reserve_bootmem(bootmap, bootmap_size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700473}
474#endif
475
476/* Use inline assembly to define this because the nops are defined
477 as inline assembly strings in the include files and we cannot
478 get them easily into strings. */
479asm("\t.data\nk8nops: "
480 K8_NOP1 K8_NOP2 K8_NOP3 K8_NOP4 K8_NOP5 K8_NOP6
481 K8_NOP7 K8_NOP8);
482
483extern unsigned char k8nops[];
484static unsigned char *k8_nops[ASM_NOP_MAX+1] = {
485 NULL,
486 k8nops,
487 k8nops + 1,
488 k8nops + 1 + 2,
489 k8nops + 1 + 2 + 3,
490 k8nops + 1 + 2 + 3 + 4,
491 k8nops + 1 + 2 + 3 + 4 + 5,
492 k8nops + 1 + 2 + 3 + 4 + 5 + 6,
493 k8nops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
494};
495
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100496extern char __vsyscall_0;
497
Linus Torvalds1da177e2005-04-16 15:20:36 -0700498/* Replace instructions with better alternatives for this CPU type.
499
500 This runs before SMP is initialized to avoid SMP problems with
501 self modifying code. This implies that assymetric systems where
502 APs have less capabilities than the boot processor are not handled.
503 In this case boot with "noreplacement". */
504void apply_alternatives(void *start, void *end)
505{
506 struct alt_instr *a;
507 int diff, i, k;
508 for (a = start; (void *)a < end; a++) {
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100509 u8 *instr;
510
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511 if (!boot_cpu_has(a->cpuid))
512 continue;
513
514 BUG_ON(a->replacementlen > a->instrlen);
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100515 instr = a->instr;
516 /* vsyscall code is not mapped yet. resolve it manually. */
517 if (instr >= (u8 *)VSYSCALL_START && instr < (u8*)VSYSCALL_END)
518 instr = __va(instr - (u8*)VSYSCALL_START + (u8*)__pa_symbol(&__vsyscall_0));
519 __inline_memcpy(instr, a->replacement, a->replacementlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700520 diff = a->instrlen - a->replacementlen;
521
522 /* Pad the rest with nops */
523 for (i = a->replacementlen; diff > 0; diff -= k, i += k) {
524 k = diff;
525 if (k > ASM_NOP_MAX)
526 k = ASM_NOP_MAX;
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100527 __inline_memcpy(instr + i, k8_nops[k], k);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700528 }
529 }
530}
531
532static int no_replacement __initdata = 0;
533
534void __init alternative_instructions(void)
535{
536 extern struct alt_instr __alt_instructions[], __alt_instructions_end[];
537 if (no_replacement)
538 return;
539 apply_alternatives(__alt_instructions, __alt_instructions_end);
540}
541
542static int __init noreplacement_setup(char *s)
543{
544 no_replacement = 1;
OGAWA Hirofumi9b410462006-03-31 02:30:33 -0800545 return 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700546}
547
548__setup("noreplacement", noreplacement_setup);
549
#if defined(CONFIG_EDD) || defined(CONFIG_EDD_MODULE)
struct edd edd;
#ifdef CONFIG_EDD_MODULE
EXPORT_SYMBOL(edd);
#endif
/**
 * copy_edd() - Copy the BIOS EDD information
 *              from boot_params into a safe place.
 *
 * Fills the global edd from EDD_MBR_SIGNATURE, EDD_BUF, EDD_MBR_SIG_NR
 * and EDD_NR.
 */
static inline void copy_edd(void)
{
	memcpy(edd.mbr_signature, EDD_MBR_SIGNATURE, sizeof(edd.mbr_signature));
	memcpy(edd.edd_info, EDD_BUF, sizeof(edd.edd_info));
	edd.mbr_signature_nr = EDD_MBR_SIG_NR;
	edd.edd_info_nr = EDD_NR;
}
#else
/* EDD support is not configured: nothing to copy. */
static inline void copy_edd(void)
{
}
#endif
572
573#define EBDA_ADDR_POINTER 0x40E
574static void __init reserve_ebda_region(void)
575{
576 unsigned int addr;
577 /**
578 * there is a real-mode segmented pointer pointing to the
579 * 4K EBDA area at 0x40E
580 */
581 addr = *(unsigned short *)phys_to_virt(EBDA_ADDR_POINTER);
582 addr <<= 4;
583 if (addr)
584 reserve_bootmem_generic(addr, PAGE_SIZE);
585}
586
587void __init setup_arch(char **cmdline_p)
588{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700589 unsigned long kernel_end;
590
591 ROOT_DEV = old_decode_dev(ORIG_ROOT_DEV);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700592 screen_info = SCREEN_INFO;
593 edid_info = EDID_INFO;
594 saved_video_mode = SAVED_VIDEO_MODE;
595 bootloader_type = LOADER_TYPE;
596
597#ifdef CONFIG_BLK_DEV_RAM
598 rd_image_start = RAMDISK_FLAGS & RAMDISK_IMAGE_START_MASK;
599 rd_prompt = ((RAMDISK_FLAGS & RAMDISK_PROMPT_FLAG) != 0);
600 rd_doload = ((RAMDISK_FLAGS & RAMDISK_LOAD_FLAG) != 0);
601#endif
602 setup_memory_region();
603 copy_edd();
604
605 if (!MOUNT_ROOT_RDONLY)
606 root_mountflags &= ~MS_RDONLY;
607 init_mm.start_code = (unsigned long) &_text;
608 init_mm.end_code = (unsigned long) &_etext;
609 init_mm.end_data = (unsigned long) &_edata;
610 init_mm.brk = (unsigned long) &_end;
611
612 code_resource.start = virt_to_phys(&_text);
613 code_resource.end = virt_to_phys(&_etext)-1;
614 data_resource.start = virt_to_phys(&_etext);
615 data_resource.end = virt_to_phys(&_edata)-1;
616
617 parse_cmdline_early(cmdline_p);
618
619 early_identify_cpu(&boot_cpu_data);
620
621 /*
622 * partially used pages are not usable - thus
623 * we are rounding upwards:
624 */
625 end_pfn = e820_end_of_ram();
Andi Kleen1f502492006-03-25 16:29:58 +0100626 num_physpages = end_pfn; /* for pfn_valid */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700627
628 check_efer();
629
630 init_memory_mapping(0, (end_pfn_map << PAGE_SHIFT));
631
Andi Kleenf2d3efe2006-03-25 16:30:22 +0100632 dmi_scan_machine();
633
Siddha, Suresh Bf6c2e332005-11-05 17:25:53 +0100634 zap_low_mappings(0);
635
Len Brown888ba6c2005-08-24 12:07:20 -0400636#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -0700637 /*
638 * Initialize the ACPI boot-time table parser (gets the RSDP and SDT).
639 * Call this early for SRAT node setup.
640 */
641 acpi_boot_table_init();
642#endif
643
644#ifdef CONFIG_ACPI_NUMA
645 /*
646 * Parse SRAT to discover nodes.
647 */
648 acpi_numa_init();
649#endif
650
Matt Tolentino2b976902005-06-23 00:08:06 -0700651#ifdef CONFIG_NUMA
Linus Torvalds1da177e2005-04-16 15:20:36 -0700652 numa_initmem_init(0, end_pfn);
653#else
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700654 contig_initmem_init(0, end_pfn);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700655#endif
656
657 /* Reserve direct mapping */
658 reserve_bootmem_generic(table_start << PAGE_SHIFT,
659 (table_end - table_start) << PAGE_SHIFT);
660
661 /* reserve kernel */
662 kernel_end = round_up(__pa_symbol(&_end),PAGE_SIZE);
663 reserve_bootmem_generic(HIGH_MEMORY, kernel_end - HIGH_MEMORY);
664
665 /*
666 * reserve physical page 0 - it's a special BIOS page on many boxes,
667 * enabling clean reboots, SMP operation, laptop functions.
668 */
669 reserve_bootmem_generic(0, PAGE_SIZE);
670
671 /* reserve ebda region */
672 reserve_ebda_region();
673
674#ifdef CONFIG_SMP
675 /*
676 * But first pinch a few for the stack/trampoline stuff
677 * FIXME: Don't need the extra page at 4K, but need to fix
678 * trampoline before removing it. (see the GDT stuff)
679 */
680 reserve_bootmem_generic(PAGE_SIZE, PAGE_SIZE);
681
682 /* Reserve SMP trampoline */
683 reserve_bootmem_generic(SMP_TRAMPOLINE_BASE, PAGE_SIZE);
684#endif
685
686#ifdef CONFIG_ACPI_SLEEP
687 /*
688 * Reserve low memory region for sleep support.
689 */
690 acpi_reserve_bootmem();
691#endif
692#ifdef CONFIG_X86_LOCAL_APIC
693 /*
694 * Find and reserve possible boot-time SMP configuration:
695 */
696 find_smp_config();
697#endif
698#ifdef CONFIG_BLK_DEV_INITRD
699 if (LOADER_TYPE && INITRD_START) {
700 if (INITRD_START + INITRD_SIZE <= (end_pfn << PAGE_SHIFT)) {
701 reserve_bootmem_generic(INITRD_START, INITRD_SIZE);
702 initrd_start =
703 INITRD_START ? INITRD_START + PAGE_OFFSET : 0;
704 initrd_end = initrd_start+INITRD_SIZE;
705 }
706 else {
707 printk(KERN_ERR "initrd extends beyond end of memory "
708 "(0x%08lx > 0x%08lx)\ndisabling initrd\n",
709 (unsigned long)(INITRD_START + INITRD_SIZE),
710 (unsigned long)(end_pfn << PAGE_SHIFT));
711 initrd_start = 0;
712 }
713 }
714#endif
Eric W. Biederman5f5609d2005-06-25 14:58:04 -0700715#ifdef CONFIG_KEXEC
716 if (crashk_res.start != crashk_res.end) {
717 reserve_bootmem(crashk_res.start,
718 crashk_res.end - crashk_res.start + 1);
719 }
720#endif
Eric W. Biederman0d317fb2005-08-06 13:47:36 -0600721
Linus Torvalds1da177e2005-04-16 15:20:36 -0700722 paging_init();
723
724 check_ioapic();
725
Ashok Raj51f62e12006-03-25 16:29:28 +0100726 /*
727 * set this early, so we dont allocate cpu0
728 * if MADT list doesnt list BSP first
729 * mpparse.c/MP_processor_info() allocates logical cpu numbers.
730 */
731 cpu_set(0, cpu_present_map);
Len Brown888ba6c2005-08-24 12:07:20 -0400732#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -0700733 /*
734 * Read APIC and some other early information from ACPI tables.
735 */
736 acpi_boot_init();
737#endif
738
Ravikiran Thirumalai05b3cbd2006-01-11 22:45:36 +0100739 init_cpu_to_node();
740
Linus Torvalds1da177e2005-04-16 15:20:36 -0700741#ifdef CONFIG_X86_LOCAL_APIC
742 /*
743 * get boot-time SMP configuration:
744 */
745 if (smp_found_config)
746 get_smp_config();
747 init_apic_mappings();
748#endif
749
750 /*
751 * Request address space for all standard RAM and ROM resources
752 * and also for regions reported as reserved by the e820.
753 */
754 probe_roms();
755 e820_reserve_resources();
756
757 request_resource(&iomem_resource, &video_ram_resource);
758
759 {
760 unsigned i;
761 /* request I/O space for devices used on all i[345]86 PCs */
762 for (i = 0; i < STANDARD_IO_RESOURCES; i++)
763 request_resource(&ioport_resource, &standard_io_resources[i]);
764 }
765
Andi Kleena1e97782005-04-16 15:25:12 -0700766 e820_setup_gap();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700767
768#ifdef CONFIG_GART_IOMMU
Jon Mason5b7b6442006-02-03 21:51:59 +0100769 iommu_hole_init();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700770#endif
771
772#ifdef CONFIG_VT
773#if defined(CONFIG_VGA_CONSOLE)
774 conswitchp = &vga_con;
775#elif defined(CONFIG_DUMMY_CONSOLE)
776 conswitchp = &dummy_con;
777#endif
778#endif
779}
780
Ashok Raje6982c62005-06-25 14:54:58 -0700781static int __cpuinit get_model_name(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700782{
783 unsigned int *v;
784
Andi Kleenebfcaa92005-04-16 15:25:18 -0700785 if (c->extended_cpuid_level < 0x80000004)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700786 return 0;
787
788 v = (unsigned int *) c->x86_model_id;
789 cpuid(0x80000002, &v[0], &v[1], &v[2], &v[3]);
790 cpuid(0x80000003, &v[4], &v[5], &v[6], &v[7]);
791 cpuid(0x80000004, &v[8], &v[9], &v[10], &v[11]);
792 c->x86_model_id[48] = 0;
793 return 1;
794}
795
796
Ashok Raje6982c62005-06-25 14:54:58 -0700797static void __cpuinit display_cacheinfo(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700798{
799 unsigned int n, dummy, eax, ebx, ecx, edx;
800
Andi Kleenebfcaa92005-04-16 15:25:18 -0700801 n = c->extended_cpuid_level;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700802
803 if (n >= 0x80000005) {
804 cpuid(0x80000005, &dummy, &ebx, &ecx, &edx);
805 printk(KERN_INFO "CPU: L1 I Cache: %dK (%d bytes/line), D cache %dK (%d bytes/line)\n",
806 edx>>24, edx&0xFF, ecx>>24, ecx&0xFF);
807 c->x86_cache_size=(ecx>>24)+(edx>>24);
808 /* On K8 L1 TLB is inclusive, so don't count it */
809 c->x86_tlbsize = 0;
810 }
811
812 if (n >= 0x80000006) {
813 cpuid(0x80000006, &dummy, &ebx, &ecx, &edx);
814 ecx = cpuid_ecx(0x80000006);
815 c->x86_cache_size = ecx >> 16;
816 c->x86_tlbsize += ((ebx >> 16) & 0xfff) + (ebx & 0xfff);
817
818 printk(KERN_INFO "CPU: L2 Cache: %dK (%d bytes/line)\n",
819 c->x86_cache_size, ecx & 0xFF);
820 }
821
822 if (n >= 0x80000007)
823 cpuid(0x80000007, &dummy, &dummy, &dummy, &c->x86_power);
824 if (n >= 0x80000008) {
825 cpuid(0x80000008, &eax, &dummy, &dummy, &dummy);
826 c->x86_virt_bits = (eax >> 8) & 0xff;
827 c->x86_phys_bits = eax & 0xff;
828 }
829}
830
#ifdef CONFIG_NUMA
/*
 * nearby_node - find an online node for @apicid by looking at its
 * neighbours in apicid_to_node[].
 *
 * Lower APIC ids are searched first (closest one first), then higher
 * ones up to MAX_LOCAL_APIC.  Falls back to the first online node when
 * no neighbour maps to an online node.
 */
static int nearby_node(int apicid)
{
	int i;
	for (i = apicid - 1; i >= 0; i--) {
		int node = apicid_to_node[i];
		if (node != NUMA_NO_NODE && node_online(node))
			return node;
	}
	for (i = apicid + 1; i < MAX_LOCAL_APIC; i++) {
		int node = apicid_to_node[i];
		if (node != NUMA_NO_NODE && node_online(node))
			return node;
	}
	return first_node(node_online_map); /* Shouldn't happen */
}
#endif
848
Andi Kleen63518642005-04-16 15:25:16 -0700849/*
850 * On a AMD dual core setup the lower bits of the APIC id distingush the cores.
851 * Assumes number of cores is a power of two.
852 */
853static void __init amd_detect_cmp(struct cpuinfo_x86 *c)
854{
855#ifdef CONFIG_SMP
Andi Kleen29422832005-05-16 21:53:26 -0700856 int cpu = smp_processor_id();
Andi Kleenb41e2932005-05-20 14:27:55 -0700857 unsigned bits;
Andi Kleen3f098c22005-09-12 18:49:24 +0200858#ifdef CONFIG_NUMA
859 int node = 0;
Ravikiran G Thirumalai60c1bc82006-03-25 16:30:04 +0100860 unsigned apicid = hard_smp_processor_id();
Andi Kleen3f098c22005-09-12 18:49:24 +0200861#endif
Andi Kleenb41e2932005-05-20 14:27:55 -0700862
863 bits = 0;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100864 while ((1 << bits) < c->x86_max_cores)
Andi Kleenb41e2932005-05-20 14:27:55 -0700865 bits++;
866
867 /* Low order bits define the core id (index of core in socket) */
868 cpu_core_id[cpu] = phys_proc_id[cpu] & ((1 << bits)-1);
869 /* Convert the APIC ID into the socket ID */
Ravikiran G Thirumalai60c1bc82006-03-25 16:30:04 +0100870 phys_proc_id[cpu] = phys_pkg_id(bits);
Andi Kleen63518642005-04-16 15:25:16 -0700871
872#ifdef CONFIG_NUMA
Andi Kleen3f098c22005-09-12 18:49:24 +0200873 node = phys_proc_id[cpu];
874 if (apicid_to_node[apicid] != NUMA_NO_NODE)
875 node = apicid_to_node[apicid];
876 if (!node_online(node)) {
877 /* Two possibilities here:
878 - The CPU is missing memory and no node was created.
879 In that case try picking one from a nearby CPU
880 - The APIC IDs differ from the HyperTransport node IDs
881 which the K8 northbridge parsing fills in.
882 Assume they are all increased by a constant offset,
883 but in the same order as the HT nodeids.
884 If that doesn't result in a usable node fall back to the
885 path for the previous case. */
886 int ht_nodeid = apicid - (phys_proc_id[0] << bits);
887 if (ht_nodeid >= 0 &&
888 apicid_to_node[ht_nodeid] != NUMA_NO_NODE)
889 node = apicid_to_node[ht_nodeid];
890 /* Pick a nearby node */
891 if (!node_online(node))
892 node = nearby_node(apicid);
893 }
Andi Kleen69d81fc2005-11-05 17:25:53 +0100894 numa_set_node(cpu, node);
Andi Kleena1586082005-05-16 21:53:21 -0700895
Andi Kleen77d910f2006-03-25 16:29:34 +0100896 printk(KERN_INFO "CPU %d/%x(%d) -> Node %d -> Core %d\n",
897 cpu, apicid, c->x86_max_cores, node, cpu_core_id[cpu]);
Andi Kleen3f098c22005-09-12 18:49:24 +0200898#endif
Andi Kleen63518642005-04-16 15:25:16 -0700899#endif
900}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700901
902static int __init init_amd(struct cpuinfo_x86 *c)
903{
904 int r;
Andi Kleen7bcd3f32006-02-03 21:51:02 +0100905 unsigned level;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700906
Linus Torvaldsbc5e8fd2005-09-17 15:41:04 -0700907#ifdef CONFIG_SMP
908 unsigned long value;
909
Andi Kleen7d318d72005-09-29 22:05:55 +0200910 /*
911 * Disable TLB flush filter by setting HWCR.FFDIS on K8
912 * bit 6 of msr C001_0015
913 *
914 * Errata 63 for SH-B3 steppings
915 * Errata 122 for all steppings (F+ have it disabled by default)
916 */
917 if (c->x86 == 15) {
918 rdmsrl(MSR_K8_HWCR, value);
919 value |= 1 << 6;
920 wrmsrl(MSR_K8_HWCR, value);
921 }
Linus Torvaldsbc5e8fd2005-09-17 15:41:04 -0700922#endif
923
Linus Torvalds1da177e2005-04-16 15:20:36 -0700924 /* Bit 31 in normal CPUID used for nonstandard 3DNow ID;
925 3DNow is IDd by bit 31 in extended CPUID (1*32+31) anyway */
926 clear_bit(0*32+31, &c->x86_capability);
927
Andi Kleen7bcd3f32006-02-03 21:51:02 +0100928 /* On C+ stepping K8 rep microcode works well for copy/memset */
929 level = cpuid_eax(1);
930 if (c->x86 == 15 && ((level >= 0x0f48 && level < 0x0f50) || level >= 0x0f58))
931 set_bit(X86_FEATURE_REP_GOOD, &c->x86_capability);
932
Linus Torvalds1da177e2005-04-16 15:20:36 -0700933 r = get_model_name(c);
934 if (!r) {
935 switch (c->x86) {
936 case 15:
937 /* Should distinguish Models here, but this is only
938 a fallback anyways. */
939 strcpy(c->x86_model_id, "Hammer");
940 break;
941 }
942 }
943 display_cacheinfo(c);
944
Andi Kleen130951c2006-01-11 22:42:02 +0100945 /* c->x86_power is 8000_0007 edx. Bit 8 is constant TSC */
946 if (c->x86_power & (1<<8))
947 set_bit(X86_FEATURE_CONSTANT_TSC, &c->x86_capability);
948
Andi Kleenebfcaa92005-04-16 15:25:18 -0700949 if (c->extended_cpuid_level >= 0x80000008) {
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100950 c->x86_max_cores = (cpuid_ecx(0x80000008) & 0xff) + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700951
Andi Kleen63518642005-04-16 15:25:16 -0700952 amd_detect_cmp(c);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700953 }
954
955 return r;
956}
957
Ashok Raje6982c62005-06-25 14:54:58 -0700958static void __cpuinit detect_ht(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700959{
960#ifdef CONFIG_SMP
961 u32 eax, ebx, ecx, edx;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100962 int index_msb, core_bits;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700963 int cpu = smp_processor_id();
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100964
965 cpuid(1, &eax, &ebx, &ecx, &edx);
966
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100967
Andi Kleen63518642005-04-16 15:25:16 -0700968 if (!cpu_has(c, X86_FEATURE_HT) || cpu_has(c, X86_FEATURE_CMP_LEGACY))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700969 return;
970
Linus Torvalds1da177e2005-04-16 15:20:36 -0700971 smp_num_siblings = (ebx & 0xff0000) >> 16;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100972
Linus Torvalds1da177e2005-04-16 15:20:36 -0700973 if (smp_num_siblings == 1) {
974 printk(KERN_INFO "CPU: Hyper-Threading is disabled\n");
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100975 } else if (smp_num_siblings > 1 ) {
976
Linus Torvalds1da177e2005-04-16 15:20:36 -0700977 if (smp_num_siblings > NR_CPUS) {
978 printk(KERN_WARNING "CPU: Unsupported number of the siblings %d", smp_num_siblings);
979 smp_num_siblings = 1;
980 return;
981 }
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100982
983 index_msb = get_count_order(smp_num_siblings);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700984 phys_proc_id[cpu] = phys_pkg_id(index_msb);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100985
Linus Torvalds1da177e2005-04-16 15:20:36 -0700986 printk(KERN_INFO "CPU: Physical Processor ID: %d\n",
987 phys_proc_id[cpu]);
Andi Kleen3dd9d512005-04-16 15:25:15 -0700988
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100989 smp_num_siblings = smp_num_siblings / c->x86_max_cores;
Andi Kleen3dd9d512005-04-16 15:25:15 -0700990
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100991 index_msb = get_count_order(smp_num_siblings) ;
Andi Kleen3dd9d512005-04-16 15:25:15 -0700992
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100993 core_bits = get_count_order(c->x86_max_cores);
Andi Kleen3dd9d512005-04-16 15:25:15 -0700994
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100995 cpu_core_id[cpu] = phys_pkg_id(index_msb) &
996 ((1 << core_bits) - 1);
997
998 if (c->x86_max_cores > 1)
Andi Kleen3dd9d512005-04-16 15:25:15 -0700999 printk(KERN_INFO "CPU: Processor Core ID: %d\n",
1000 cpu_core_id[cpu]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001001 }
1002#endif
1003}
1004
Andi Kleen3dd9d512005-04-16 15:25:15 -07001005/*
1006 * find out the number of processor cores on the die
1007 */
Ashok Raje6982c62005-06-25 14:54:58 -07001008static int __cpuinit intel_num_cpu_cores(struct cpuinfo_x86 *c)
Andi Kleen3dd9d512005-04-16 15:25:15 -07001009{
1010 unsigned int eax;
1011
1012 if (c->cpuid_level < 4)
1013 return 1;
1014
1015 __asm__("cpuid"
1016 : "=a" (eax)
1017 : "0" (4), "c" (0)
1018 : "bx", "dx");
1019
1020 if (eax & 0x1f)
1021 return ((eax >> 26) + 1);
1022 else
1023 return 1;
1024}
1025
/*
 * Bind the executing CPU to a NUMA node using the apicid_to_node[] table.
 * A CPU whose APIC id has no node assigned (NUMA_NO_NODE) is put on node 0.
 * Compiles to nothing without CONFIG_NUMA.
 */
static void srat_detect_node(void)
{
#ifdef CONFIG_NUMA
	int this_cpu = smp_processor_id();
	unsigned nid = apicid_to_node[hard_smp_processor_id()];

	/* Don't do the funky fallback heuristics the AMD version employs
	   for now. */
	if (nid == NUMA_NO_NODE)
		nid = 0;
	numa_set_node(this_cpu, nid);

	/* Only report the mapping when acpi_numa is positive. */
	if (acpi_numa <= 0)
		return;
	printk(KERN_INFO "CPU %d -> Node %d\n", this_cpu, nid);
#endif
}
1043
Ashok Raje6982c62005-06-25 14:54:58 -07001044static void __cpuinit init_intel(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001045{
1046 /* Cache sizes */
1047 unsigned n;
1048
1049 init_intel_cacheinfo(c);
Andi Kleenebfcaa92005-04-16 15:25:18 -07001050 n = c->extended_cpuid_level;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001051 if (n >= 0x80000008) {
1052 unsigned eax = cpuid_eax(0x80000008);
1053 c->x86_virt_bits = (eax >> 8) & 0xff;
1054 c->x86_phys_bits = eax & 0xff;
Shaohua Liaf9c1422005-11-05 17:25:54 +01001055 /* CPUID workaround for Intel 0F34 CPU */
1056 if (c->x86_vendor == X86_VENDOR_INTEL &&
1057 c->x86 == 0xF && c->x86_model == 0x3 &&
1058 c->x86_mask == 0x4)
1059 c->x86_phys_bits = 36;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001060 }
1061
1062 if (c->x86 == 15)
1063 c->x86_cache_alignment = c->x86_clflush_size * 2;
Andi Kleen39b3a792006-01-11 22:42:45 +01001064 if ((c->x86 == 0xf && c->x86_model >= 0x03) ||
1065 (c->x86 == 0x6 && c->x86_model >= 0x0e))
Andi Kleenc29601e2005-04-16 15:25:05 -07001066 set_bit(X86_FEATURE_CONSTANT_TSC, &c->x86_capability);
Andi Kleenc818a182006-01-11 22:45:24 +01001067 set_bit(X86_FEATURE_SYNC_RDTSC, &c->x86_capability);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001068 c->x86_max_cores = intel_num_cpu_cores(c);
Andi Kleendf0cc262005-09-12 18:49:24 +02001069
1070 srat_detect_node();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001071}
1072
Adrian Bunk672289e2005-09-10 00:27:21 -07001073static void __cpuinit get_cpu_vendor(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001074{
1075 char *v = c->x86_vendor_id;
1076
1077 if (!strcmp(v, "AuthenticAMD"))
1078 c->x86_vendor = X86_VENDOR_AMD;
1079 else if (!strcmp(v, "GenuineIntel"))
1080 c->x86_vendor = X86_VENDOR_INTEL;
1081 else
1082 c->x86_vendor = X86_VENDOR_UNKNOWN;
1083}
1084
/*
 * Table entry associating a vendor and CPU family with up to 16 model
 * name strings.
 * NOTE(review): no user of this struct is visible in this part of the
 * file; model_names is presumably indexed by model number - confirm
 * against the code that consumes it.
 */
struct cpu_model_info {
	int vendor;		/* vendor identifier */
	int family;		/* CPU family */
	char *model_names[16];	/* model name strings */
};
1090
1091/* Do some early cpuid on the boot CPU to get some parameter that are
1092 needed before check_bugs. Everything advanced is in identify_cpu
1093 below. */
Ashok Raje6982c62005-06-25 14:54:58 -07001094void __cpuinit early_identify_cpu(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001095{
1096 u32 tfms;
1097
1098 c->loops_per_jiffy = loops_per_jiffy;
1099 c->x86_cache_size = -1;
1100 c->x86_vendor = X86_VENDOR_UNKNOWN;
1101 c->x86_model = c->x86_mask = 0; /* So far unknown... */
1102 c->x86_vendor_id[0] = '\0'; /* Unset */
1103 c->x86_model_id[0] = '\0'; /* Unset */
1104 c->x86_clflush_size = 64;
1105 c->x86_cache_alignment = c->x86_clflush_size;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001106 c->x86_max_cores = 1;
Andi Kleenebfcaa92005-04-16 15:25:18 -07001107 c->extended_cpuid_level = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001108 memset(&c->x86_capability, 0, sizeof c->x86_capability);
1109
1110 /* Get vendor name */
1111 cpuid(0x00000000, (unsigned int *)&c->cpuid_level,
1112 (unsigned int *)&c->x86_vendor_id[0],
1113 (unsigned int *)&c->x86_vendor_id[8],
1114 (unsigned int *)&c->x86_vendor_id[4]);
1115
1116 get_cpu_vendor(c);
1117
1118 /* Initialize the standard set of capabilities */
1119 /* Note that the vendor-specific code below might override */
1120
1121 /* Intel-defined flags: level 0x00000001 */
1122 if (c->cpuid_level >= 0x00000001) {
1123 __u32 misc;
1124 cpuid(0x00000001, &tfms, &misc, &c->x86_capability[4],
1125 &c->x86_capability[0]);
1126 c->x86 = (tfms >> 8) & 0xf;
1127 c->x86_model = (tfms >> 4) & 0xf;
1128 c->x86_mask = tfms & 0xf;
Suresh Siddhaf5f786d2005-11-05 17:25:53 +01001129 if (c->x86 == 0xf)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001130 c->x86 += (tfms >> 20) & 0xff;
Suresh Siddhaf5f786d2005-11-05 17:25:53 +01001131 if (c->x86 >= 0x6)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001132 c->x86_model += ((tfms >> 16) & 0xF) << 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001133 if (c->x86_capability[0] & (1<<19))
1134 c->x86_clflush_size = ((misc >> 8) & 0xff) * 8;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001135 } else {
1136 /* Have CPUID level 0 only - unheard of */
1137 c->x86 = 4;
1138 }
Andi Kleena1586082005-05-16 21:53:21 -07001139
1140#ifdef CONFIG_SMP
Andi Kleenb41e2932005-05-20 14:27:55 -07001141 phys_proc_id[smp_processor_id()] = (cpuid_ebx(1) >> 24) & 0xff;
Andi Kleena1586082005-05-16 21:53:21 -07001142#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001143}
1144
1145/*
1146 * This does the hard work of actually picking apart the CPU stuff...
1147 */
Ashok Raje6982c62005-06-25 14:54:58 -07001148void __cpuinit identify_cpu(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001149{
1150 int i;
1151 u32 xlvl;
1152
1153 early_identify_cpu(c);
1154
1155 /* AMD-defined flags: level 0x80000001 */
1156 xlvl = cpuid_eax(0x80000000);
Andi Kleenebfcaa92005-04-16 15:25:18 -07001157 c->extended_cpuid_level = xlvl;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001158 if ((xlvl & 0xffff0000) == 0x80000000) {
1159 if (xlvl >= 0x80000001) {
1160 c->x86_capability[1] = cpuid_edx(0x80000001);
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001161 c->x86_capability[6] = cpuid_ecx(0x80000001);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001162 }
1163 if (xlvl >= 0x80000004)
1164 get_model_name(c); /* Default name */
1165 }
1166
1167 /* Transmeta-defined flags: level 0x80860001 */
1168 xlvl = cpuid_eax(0x80860000);
1169 if ((xlvl & 0xffff0000) == 0x80860000) {
1170 /* Don't set x86_cpuid_level here for now to not confuse. */
1171 if (xlvl >= 0x80860001)
1172 c->x86_capability[2] = cpuid_edx(0x80860001);
1173 }
1174
Siddha, Suresh B1e9f28f2006-03-27 01:15:22 -08001175 c->apicid = phys_pkg_id(0);
1176
Linus Torvalds1da177e2005-04-16 15:20:36 -07001177 /*
1178 * Vendor-specific initialization. In this section we
1179 * canonicalize the feature flags, meaning if there are
1180 * features a certain CPU supports which CPUID doesn't
1181 * tell us, CPUID claiming incorrect flags, or other bugs,
1182 * we handle them here.
1183 *
1184 * At the end of this section, c->x86_capability better
1185 * indicate the features this CPU genuinely supports!
1186 */
1187 switch (c->x86_vendor) {
1188 case X86_VENDOR_AMD:
1189 init_amd(c);
1190 break;
1191
1192 case X86_VENDOR_INTEL:
1193 init_intel(c);
1194 break;
1195
1196 case X86_VENDOR_UNKNOWN:
1197 default:
1198 display_cacheinfo(c);
1199 break;
1200 }
1201
1202 select_idle_routine(c);
1203 detect_ht(c);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001204
1205 /*
1206 * On SMP, boot_cpu_data holds the common feature set between
1207 * all CPUs; so make sure that we indicate which features are
1208 * common between the CPUs. The first time this routine gets
1209 * executed, c == &boot_cpu_data.
1210 */
1211 if (c != &boot_cpu_data) {
1212 /* AND the already accumulated flags with these */
1213 for (i = 0 ; i < NCAPINTS ; i++)
1214 boot_cpu_data.x86_capability[i] &= c->x86_capability[i];
1215 }
1216
1217#ifdef CONFIG_X86_MCE
1218 mcheck_init(c);
1219#endif
Shaohua Li3b520b22005-07-07 17:56:38 -07001220 if (c == &boot_cpu_data)
1221 mtrr_bp_init();
1222 else
1223 mtrr_ap_init();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001224#ifdef CONFIG_NUMA
Andi Kleen3019e8e2005-07-28 21:15:28 -07001225 numa_add_cpu(smp_processor_id());
Linus Torvalds1da177e2005-04-16 15:20:36 -07001226#endif
1227}
1228
1229
Ashok Raje6982c62005-06-25 14:54:58 -07001230void __cpuinit print_cpu_info(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001231{
1232 if (c->x86_model_id[0])
1233 printk("%s", c->x86_model_id);
1234
1235 if (c->x86_mask || c->cpuid_level >= 0)
1236 printk(" stepping %02x\n", c->x86_mask);
1237 else
1238 printk("\n");
1239}
1240
1241/*
1242 * Get CPU information for use by the procfs.
1243 */
1244
1245static int show_cpuinfo(struct seq_file *m, void *v)
1246{
1247 struct cpuinfo_x86 *c = v;
1248
1249 /*
1250 * These flag bits must match the definitions in <asm/cpufeature.h>.
1251 * NULL means this bit is undefined or reserved; either way it doesn't
1252 * have meaning as far as Linux is concerned. Note that it's important
1253 * to realize there is a difference between this table and CPUID -- if
1254 * applications want to get the raw CPUID data, they should access
1255 * /dev/cpu/<cpu_nr>/cpuid instead.
1256 */
1257 static char *x86_cap_flags[] = {
1258 /* Intel-defined */
1259 "fpu", "vme", "de", "pse", "tsc", "msr", "pae", "mce",
1260 "cx8", "apic", NULL, "sep", "mtrr", "pge", "mca", "cmov",
1261 "pat", "pse36", "pn", "clflush", NULL, "dts", "acpi", "mmx",
1262 "fxsr", "sse", "sse2", "ss", "ht", "tm", "ia64", NULL,
1263
1264 /* AMD-defined */
Zwane Mwaikambo3c3b73b2005-05-01 08:58:51 -07001265 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001266 NULL, NULL, NULL, "syscall", NULL, NULL, NULL, NULL,
1267 NULL, NULL, NULL, NULL, "nx", NULL, "mmxext", NULL,
Andi Kleen3f98bc42006-01-11 22:42:51 +01001268 NULL, "fxsr_opt", "rdtscp", NULL, NULL, "lm", "3dnowext", "3dnow",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001269
1270 /* Transmeta-defined */
1271 "recovery", "longrun", NULL, "lrti", NULL, NULL, NULL, NULL,
1272 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1273 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1274 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1275
1276 /* Other (Linux-defined) */
Andi Kleen622dcaf2005-05-16 21:53:26 -07001277 "cxmmx", NULL, "cyrix_arr", "centaur_mcr", NULL,
Andi Kleenc29601e2005-04-16 15:25:05 -07001278 "constant_tsc", NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001279 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1280 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1281 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1282
1283 /* Intel-defined (#2) */
Andi Kleen9d95dd82006-03-25 16:31:22 +01001284 "pni", NULL, NULL, "monitor", "ds_cpl", "vmx", "smx", "est",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001285 "tm2", NULL, "cid", NULL, NULL, "cx16", "xtpr", NULL,
1286 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1287 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1288
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001289 /* VIA/Cyrix/Centaur-defined */
1290 NULL, NULL, "rng", "rng_en", NULL, NULL, "ace", "ace_en",
1291 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1292 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1293 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1294
Linus Torvalds1da177e2005-04-16 15:20:36 -07001295 /* AMD-defined (#2) */
Andi Kleen3f98bc42006-01-11 22:42:51 +01001296 "lahf_lm", "cmp_legacy", "svm", NULL, "cr8_legacy", NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001297 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1298 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001299 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001300 };
1301 static char *x86_power_flags[] = {
1302 "ts", /* temperature sensor */
1303 "fid", /* frequency id control */
1304 "vid", /* voltage id control */
1305 "ttp", /* thermal trip */
1306 "tm",
Andi Kleen3f98bc42006-01-11 22:42:51 +01001307 "stc",
1308 NULL,
Andi Kleen39b3a792006-01-11 22:42:45 +01001309 /* nothing */ /* constant_tsc - moved to flags */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001310 };
1311
1312
1313#ifdef CONFIG_SMP
1314 if (!cpu_online(c-cpu_data))
1315 return 0;
1316#endif
1317
1318 seq_printf(m,"processor\t: %u\n"
1319 "vendor_id\t: %s\n"
1320 "cpu family\t: %d\n"
1321 "model\t\t: %d\n"
1322 "model name\t: %s\n",
1323 (unsigned)(c-cpu_data),
1324 c->x86_vendor_id[0] ? c->x86_vendor_id : "unknown",
1325 c->x86,
1326 (int)c->x86_model,
1327 c->x86_model_id[0] ? c->x86_model_id : "unknown");
1328
1329 if (c->x86_mask || c->cpuid_level >= 0)
1330 seq_printf(m, "stepping\t: %d\n", c->x86_mask);
1331 else
1332 seq_printf(m, "stepping\t: unknown\n");
1333
1334 if (cpu_has(c,X86_FEATURE_TSC)) {
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -08001335 unsigned int freq = cpufreq_quick_get((unsigned)(c-cpu_data));
1336 if (!freq)
1337 freq = cpu_khz;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001338 seq_printf(m, "cpu MHz\t\t: %u.%03u\n",
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -08001339 freq / 1000, (freq % 1000));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001340 }
1341
1342 /* Cache size */
1343 if (c->x86_cache_size >= 0)
1344 seq_printf(m, "cache size\t: %d KB\n", c->x86_cache_size);
1345
1346#ifdef CONFIG_SMP
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001347 if (smp_num_siblings * c->x86_max_cores > 1) {
Andi Kleendb468682005-04-16 15:24:51 -07001348 int cpu = c - cpu_data;
1349 seq_printf(m, "physical id\t: %d\n", phys_proc_id[cpu]);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001350 seq_printf(m, "siblings\t: %d\n", cpus_weight(cpu_core_map[cpu]));
Siddha, Suresh Bd31ddaa2005-04-16 15:25:20 -07001351 seq_printf(m, "core id\t\t: %d\n", cpu_core_id[cpu]);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001352 seq_printf(m, "cpu cores\t: %d\n", c->booted_cores);
Andi Kleendb468682005-04-16 15:24:51 -07001353 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001354#endif
1355
1356 seq_printf(m,
1357 "fpu\t\t: yes\n"
1358 "fpu_exception\t: yes\n"
1359 "cpuid level\t: %d\n"
1360 "wp\t\t: yes\n"
1361 "flags\t\t:",
1362 c->cpuid_level);
1363
1364 {
1365 int i;
1366 for ( i = 0 ; i < 32*NCAPINTS ; i++ )
Akinobu Mita3d1712c2006-03-24 03:15:11 -08001367 if (cpu_has(c, i) && x86_cap_flags[i] != NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001368 seq_printf(m, " %s", x86_cap_flags[i]);
1369 }
1370
1371 seq_printf(m, "\nbogomips\t: %lu.%02lu\n",
1372 c->loops_per_jiffy/(500000/HZ),
1373 (c->loops_per_jiffy/(5000/HZ)) % 100);
1374
1375 if (c->x86_tlbsize > 0)
1376 seq_printf(m, "TLB size\t: %d 4K pages\n", c->x86_tlbsize);
1377 seq_printf(m, "clflush size\t: %d\n", c->x86_clflush_size);
1378 seq_printf(m, "cache_alignment\t: %d\n", c->x86_cache_alignment);
1379
1380 seq_printf(m, "address sizes\t: %u bits physical, %u bits virtual\n",
1381 c->x86_phys_bits, c->x86_virt_bits);
1382
1383 seq_printf(m, "power management:");
1384 {
1385 unsigned i;
1386 for (i = 0; i < 32; i++)
1387 if (c->x86_power & (1 << i)) {
Andi Kleen3f98bc42006-01-11 22:42:51 +01001388 if (i < ARRAY_SIZE(x86_power_flags) &&
1389 x86_power_flags[i])
1390 seq_printf(m, "%s%s",
1391 x86_power_flags[i][0]?" ":"",
1392 x86_power_flags[i]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001393 else
1394 seq_printf(m, " [%d]", i);
1395 }
1396 }
Andi Kleen3dd9d512005-04-16 15:25:15 -07001397
Siddha, Suresh Bd31ddaa2005-04-16 15:25:20 -07001398 seq_printf(m, "\n\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001399
Linus Torvalds1da177e2005-04-16 15:20:36 -07001400 return 0;
1401}
1402
1403static void *c_start(struct seq_file *m, loff_t *pos)
1404{
1405 return *pos < NR_CPUS ? cpu_data + *pos : NULL;
1406}
1407
1408static void *c_next(struct seq_file *m, void *v, loff_t *pos)
1409{
1410 ++*pos;
1411 return c_start(m, pos);
1412}
1413
/*
 * seq_file ->stop callback.  Intentionally empty: c_start()/c_next() only
 * hand out pointers into cpu_data[], so there is nothing to release.
 */
static void c_stop(struct seq_file *m, void *v)
{
}
1417
/*
 * seq_file iterator that walks cpu_data[] and prints one record per CPU
 * through show_cpuinfo().
 */
struct seq_operations cpuinfo_op = {
	.start = c_start,	/* position -> cpu_data[] entry */
	.next = c_next,		/* advance to the following entry */
	.stop = c_stop,		/* nothing to clean up */
	.show = show_cpuinfo,	/* format one entry */
};
1423};
Andi Kleene9928672006-01-11 22:43:33 +01001424