/*
 *
 *  Copyright (C) 1991, 1992  Linus Torvalds
 *
 *  Enhanced CPU detection and feature setting code by Mike Jagdis
 *  and Martin Mares, November 1997.
 */

.text
#include <linux/threads.h>
#include <linux/init.h>
#include <linux/linkage.h>
#include <asm/segment.h>
#include <asm/page_types.h>
#include <asm/pgtable_types.h>
#include <asm/cache.h>
#include <asm/thread_info.h>
#include <asm/asm-offsets.h>
#include <asm/setup.h>
#include <asm/processor-flags.h>
#include <asm/msr-index.h>
#include <asm/cpufeature.h>
#include <asm/percpu.h>

/*
 * Physical address.
 *
 * pa(X) is X minus __PAGE_OFFSET.  The code in this file that runs
 * before paging is enabled uses it for every symbol reference, because
 * at that point it is "not yet offset PAGE_OFFSET".
 */
#define pa(X) ((X) - __PAGE_OFFSET)

/*
 * References to members of the new_cpu_data structure.
 * Each name is the address of one field: the new_cpu_data symbol plus
 * the corresponding CPUINFO_* offset.
 */

#define X86		new_cpu_data+CPUINFO_x86
#define X86_VENDOR	new_cpu_data+CPUINFO_x86_vendor
#define X86_MODEL	new_cpu_data+CPUINFO_x86_model
#define X86_MASK	new_cpu_data+CPUINFO_x86_mask
#define X86_HARD_MATH	new_cpu_data+CPUINFO_hard_math
#define X86_CPUID	new_cpu_data+CPUINFO_cpuid_level
#define X86_CAPABILITY	new_cpu_data+CPUINFO_x86_capability
#define X86_VENDOR_ID	new_cpu_data+CPUINFO_x86_vendor_id

/*
 * This is how much memory in addition to the memory covered up to
 * and including _end we need mapped initially.
 * We need:
 *     (KERNEL_IMAGE_SIZE/4096) / 1024 pages (worst case, non PAE)
 *     (KERNEL_IMAGE_SIZE/4096) / 512 + 4 pages (worst case for PAE)
 *
 * Modulo rounding, each megabyte assigned here requires a kilobyte of
 * memory, which is currently unreclaimed.
 *
 * This should be a multiple of a page.
 *
 * KERNEL_IMAGE_SIZE should be greater than pa(_end)
 * and smaller than max_low_pfn, otherwise some page table entries
 * will be wasted.
 */

/*
 * PAGE_TABLE_SIZE(pages): number of page-table pages reserved to map
 * `pages` pages.  When PTRS_PER_PMD > 1 this is pages / PTRS_PER_PMD
 * plus PTRS_PER_PGD further pages (presumably the PAE case with its
 * PMD pages -- compare the "+ 4" in the comment above); otherwise it is
 * pages / PTRS_PER_PGD.
 */
#if PTRS_PER_PMD > 1
#define PAGE_TABLE_SIZE(pages) (((pages) / PTRS_PER_PMD) + PTRS_PER_PGD)
#else
#define PAGE_TABLE_SIZE(pages) ((pages) / PTRS_PER_PGD)
#endif

/* Number of possible pages in the lowmem region */
LOWMEM_PAGES = (((1<<32) - __PAGE_OFFSET) >> PAGE_SHIFT)

/* Enough space to fit pagetables for the low memory linear map */
MAPPING_BEYOND_END = PAGE_TABLE_SIZE(LOWMEM_PAGES) << PAGE_SHIFT

/*
 * Worst-case size of the kernel mapping we need to make:
 * a relocatable kernel can live anywhere in lowmem, so we need to be able
 * to map all of lowmem.
 */
KERNEL_PAGES = LOWMEM_PAGES

/* Bytes of brk space reserved for the initial page tables. */
INIT_MAP_SIZE = PAGE_TABLE_SIZE(KERNEL_PAGES) * PAGE_SIZE_asm
RESERVE_BRK(pagetables, INIT_MAP_SIZE)

/*
 * 32-bit kernel entrypoint; only used by the boot CPU.  On entry,
 * %esi points to the real-mode code as a 32-bit pointer.
 * CS and DS must be 4 GB flat segments, but we don't depend on
 * any particular GDT layout, because we load our own as soon as we
 * can.
 *
 * Everything here runs before paging is enabled, so every symbol is
 * referenced through pa().  No stack is used.
 *
 * Steps, in order:
 *   1. optionally load boot_gdt and the data segment registers
 *   2. zero [__bss_start, __bss_stop)
 *   3. copy the boot parameters and the command line out of the way
 *   4. build the initial page tables starting at __brk_base
 * Control then falls through into the code that follows this block.
 *
 * Registers in the page-table loops:
 *   %edi  next page-table byte to write (advanced by stosl)
 *   %edx  next PMD (PAE) / PDE (non-PAE) slot to fill
 *   %eax  next PTE value: physical address | PTE_IDENT_ATTR
 *   %ebx  constant zero (PAE only), the upper half of each 64-bit PTE
 *   %ecx  PTE countdown within one page table
 *   %ebp  end-of-mapping limit
 */
__HEAD
ENTRY(startup_32)
	/* test KEEP_SEGMENTS flag to see if the bootloader is asking
		us to not reload segments */
	testb $(1<<6), BP_loadflags(%esi)
	jnz 2f

/*
 * Set segments to known values.
 */
	lgdt pa(boot_gdt_descr)
	movl $(__BOOT_DS),%eax
	movl %eax,%ds
	movl %eax,%es
	movl %eax,%fs
	movl %eax,%gs
2:

/*
 * Clear BSS first so that there are no surprises...
 */
	cld
	xorl %eax,%eax
	movl $pa(__bss_start),%edi
	movl $pa(__bss_stop),%ecx
	subl %edi,%ecx			/* %ecx = BSS size in bytes */
	shrl $2,%ecx			/* ... converted to dwords */
	rep ; stosl
/*
 * Copy bootup parameters out of the way.
 * Note: %esi still has the pointer to the real-mode data.
 * With the kexec as boot loader, parameter segment might be loaded beyond
 * kernel image and might not even be addressable by early boot page tables.
 * (kexec on panic case). Hence copy out the parameters before initializing
 * page tables.
 */
	movl $pa(boot_params),%edi
	movl $(PARAM_SIZE/4),%ecx
	cld
	rep
	movsl
	movl pa(boot_params) + NEW_CL_POINTER,%esi
	testl %esi,%esi
	jz 1f			# No command line
	movl $pa(boot_command_line),%edi
	movl $(COMMAND_LINE_SIZE/4),%ecx
	rep
	movsl
1:

#ifdef CONFIG_OLPC_OPENFIRMWARE
	/* save OFW's pgdir table for later use when calling into OFW */
	movl %cr3, %eax
	movl %eax, pa(olpc_ofw_pgd)
#endif

/*
 * Initialize page tables.  This creates a PDE and a set of page
 * tables, which are located immediately beyond __brk_base.  The variable
 * _brk_end is set up to point to the first "safe" location.
 * Mappings are created both at virtual address 0 (identity mapping)
 * and PAGE_OFFSET for up to _end.
 *
 * Note that the stack is not yet set up!
 */
#ifdef CONFIG_X86_PAE

	/*
	 * In PAE mode initial_page_table is statically defined to contain
	 * enough entries to cover the VMSPLIT option (that is the top 1, 2 or 3
	 * entries). The identity mapping is handled by pointing two PGD entries
	 * to the first kernel PMD.
	 *
	 * Note the upper half of each PMD or PTE are always zero at this stage.
	 */

#define KPMDS (((-__PAGE_OFFSET) >> 30) & 3) /* Number of kernel PMDs */

	xorl %ebx,%ebx				/* %ebx is kept at zero */

	movl $pa(__brk_base), %edi
	movl $pa(initial_pg_pmd), %edx
	movl $PTE_IDENT_ATTR, %eax
10:
	leal PDE_IDENT_ATTR(%edi),%ecx		/* Create PMD entry */
	movl %ecx,(%edx)			/* Store PMD entry */
						/* Upper half already zero */
	addl $8,%edx
	movl $512,%ecx				/* 512 8-byte PTEs per table */
11:
	stosl					/* low half of the PTE */
	xchgl %eax,%ebx
	stosl					/* high half: zero from %ebx */
	xchgl %eax,%ebx
	addl $0x1000,%eax			/* next 4K page */
	loop 11b

	/*
	 * End condition: we must map up to the end + MAPPING_BEYOND_END.
	 */
	movl $pa(_end) + MAPPING_BEYOND_END + PTE_IDENT_ATTR, %ebp
	cmpl %ebp,%eax
	jb 10b
1:
	addl $__PAGE_OFFSET, %edi		/* physical -> virtual */
	movl %edi, pa(_brk_end)
	shrl $12, %eax				/* PTE value -> page frame number */
	movl %eax, pa(max_pfn_mapped)

	/* Do early initialization of the fixmap area */
	movl $pa(initial_pg_fixmap)+PDE_IDENT_ATTR,%eax
	movl %eax,pa(initial_pg_pmd+0x1000*KPMDS-8)
#else	/* Not PAE */

page_pde_offset = (__PAGE_OFFSET >> 20);

	movl $pa(__brk_base), %edi
	movl $pa(initial_page_table), %edx
	movl $PTE_IDENT_ATTR, %eax
10:
	leal PDE_IDENT_ATTR(%edi),%ecx		/* Create PDE entry */
	movl %ecx,(%edx)			/* Store identity PDE entry */
	movl %ecx,page_pde_offset(%edx)		/* Store kernel PDE entry */
	addl $4,%edx
	movl $1024, %ecx			/* 1024 4-byte PTEs per table */
11:
	stosl
	addl $0x1000,%eax			/* next 4K page */
	loop 11b
	/*
	 * End condition: we must map up to the end + MAPPING_BEYOND_END.
	 */
	movl $pa(_end) + MAPPING_BEYOND_END + PTE_IDENT_ATTR, %ebp
	cmpl %ebp,%eax
	jb 10b
	addl $__PAGE_OFFSET, %edi		/* physical -> virtual */
	movl %edi, pa(_brk_end)
	shrl $12, %eax				/* PTE value -> page frame number */
	movl %eax, pa(max_pfn_mapped)

	/* Do early initialization of the fixmap area */
	movl $pa(initial_pg_fixmap)+PDE_IDENT_ATTR,%eax
	movl %eax,pa(initial_page_table+0xffc)
#endif

#ifdef CONFIG_PARAVIRT
	/*
	 * Subarchitecture dispatch, reached by fall-through once the
	 * initial page tables are built.  Paging is still off, so the
	 * table and its entries are converted to physical addresses.
	 */

	/* This can only trip for a broken bootloader... */
	cmpw $0x207, pa(boot_params + BP_version)
	jb default_entry

	/* Paravirt-compatible boot parameters.  Look to see what architecture
		we're booting under. */
	movl pa(boot_params + BP_hardware_subarch), %eax
	cmpl $num_subarch_entries, %eax
	jae bad_subarch			/* unsigned: index out of range */

	movl pa(subarch_entries)(,%eax,4), %eax
	subl $__PAGE_OFFSET, %eax	/* table holds link-time addresses */
	jmp *%eax

bad_subarch:
WEAK(lguest_entry)
WEAK(xen_entry)
	/* Unknown implementation; there's really
	   nothing we can do at this point. */
	ud2a

	__INITDATA

/* Entry points indexed by boot_params hardware_subarch. */
subarch_entries:
	.long default_entry		/* normal x86/PC */
	.long lguest_entry		/* lguest hypervisor */
	.long xen_entry			/* Xen hypervisor */
	.long default_entry		/* Moorestown MID */
num_subarch_entries = (. - subarch_entries) / 4
.previous
#else
	jmp default_entry
#endif /* CONFIG_PARAVIRT */

/*
 * Non-boot CPU entry point; entered from trampoline.S
 * We can't lgdt here, because lgdt itself uses a data segment, but
 * we know the trampoline has already loaded the boot_gdt for us.
 *
 * If cpu hotplug is not supported then this code can go in init section
 * which will be freed later
 *
 * default_entry is the common path for every CPU: set the CR4 feature
 * bits, enable NX when PAE is on and the CPU supports it, turn on
 * paging, load the stack and, on the first pass only, build the IDT.
 */

__CPUINIT

#ifdef CONFIG_SMP
ENTRY(startup_32_smp)
	cld
	movl $(__BOOT_DS),%eax
	movl %eax,%ds
	movl %eax,%es
	movl %eax,%fs
	movl %eax,%gs
#endif /* CONFIG_SMP */
default_entry:

/*
 *	New page tables may be in 4Mbyte page mode and may
 *	be using the global pages.
 *
 *	NOTE! If we are on a 486 we may have no cr4 at all!
 *	So we do not try to touch it unless we really have
 *	some bits in it to set.  This won't work if the BSP
 *	implements cr4 but this AP does not -- very unlikely
 *	but be warned!  The same applies to the pse feature
 *	if not equally supported. --macro
 *
 *	NOTE! We have to correct for the fact that we're
 *	not yet offset PAGE_OFFSET..
 */
#define cr4_bits pa(mmu_cr4_features)
	movl cr4_bits,%edx
	testl %edx,%edx
	jz 6f				/* nothing to set: leave %cr4 alone */
	movl %cr4,%eax		# Turn on paging options (PSE,PAE,..)
	orl %edx,%eax
	movl %eax,%cr4

	testb $X86_CR4_PAE, %al		# check if PAE is enabled
	jz 6f

	/* Check if extended functions are implemented */
	movl $0x80000000, %eax
	cpuid
	/* Value must be in the range 0x80000001 to 0x8000ffff */
	subl $0x80000001, %eax
	cmpl $(0x8000ffff-0x80000001), %eax
	ja 6f
	movl $0x80000001, %eax
	cpuid
	/* Execute Disable bit supported? */
	btl $(X86_FEATURE_NX & 31), %edx
	jnc 6f

	/* Setup EFER (Extended Feature Enable Register) */
	movl $MSR_EFER, %ecx
	rdmsr

	btsl $_EFER_NX, %eax
	/* Make changes effective */
	wrmsr

6:

/*
 * Enable paging
 */
	movl $pa(initial_page_table), %eax
	movl %eax,%cr3		/* set the page table pointer.. */
	movl %cr0,%eax
	orl $X86_CR0_PG,%eax
	movl %eax,%cr0		/* ..and set paging (PG) bit */
	ljmp $__BOOT_CS,$1f	/* Clear prefetch and normalize %eip */
1:
	/* Set up the stack pointer */
	lss stack_start,%esp

/*
 * Initialize eflags.  Some BIOS's leave bits like NT set.  This would
 * confuse the debugger if this code is traced.
 * XXX - best to initialize before switching to protected mode.
 */
	pushl $0
	popfl

#ifdef CONFIG_SMP
	/*
	 * 'ready' is zero only on the first pass through here; it is set
	 * to 1 just before the jump to initial_code.  Later CPUs skip the
	 * IDT setup.
	 */
	cmpb $0, ready
	jnz checkCPUtype
#endif /* CONFIG_SMP */

/*
 * start system 32-bit setup. We need to re-do some of the things done
 * in 16-bit mode for the "real" operations.
 */
	call setup_idt

/*
 * checkCPUtype: identify the CPU and finish per-CPU setup.
 *
 * Fills in the X86, X86_CPUID, X86_VENDOR_ID, X86_MODEL, X86_MASK and
 * X86_CAPABILITY fields, programs %cr0, probes the FPU (check_x87),
 * loads the final GDT/IDT and segment registers, then jumps through
 * initial_code.  Runs with paging enabled and a valid stack.
 */
checkCPUtype:

	movl $-1,X86_CPUID		#  -1 for no CPUID initially

/* check if it is 486 or 386. */
/*
 * XXX - this does a lot of unnecessary setup.  Alignment checks don't
 * apply at our cpl of 0 and the stack ought to be aligned already, and
 * we don't need to preserve eflags.
 */

	movb $3,X86		# at least 386
	pushfl			# push EFLAGS
	popl %eax		# get EFLAGS
	movl %eax,%ecx		# save original EFLAGS
	xorl $(X86_EFLAGS_AC | X86_EFLAGS_ID),%eax	# flip AC and ID bits in EFLAGS
	pushl %eax		# copy to EFLAGS
	popfl			# set EFLAGS
	pushfl			# get new EFLAGS
	popl %eax		# put it in eax
	xorl %ecx,%eax		# change in flags
	pushl %ecx		# restore original EFLAGS
	popfl
	testl $X86_EFLAGS_AC,%eax	# check if AC bit changed
	je is386

	movb $4,X86		# at least 486
	testl $X86_EFLAGS_ID,%eax	# check if ID bit changed
	je is486

	/* get vendor info */
	xorl %eax,%eax			# call CPUID with 0 -> return vendor ID
	cpuid
	movl %eax,X86_CPUID		# save CPUID level
	movl %ebx,X86_VENDOR_ID		# lo 4 chars
	movl %edx,X86_VENDOR_ID+4	# next 4 chars
	movl %ecx,X86_VENDOR_ID+8	# last 4 chars

	testl %eax,%eax			# do we have processor info as well?
	je is486

	movl $1,%eax		# Use the CPUID instruction to get CPU type
	cpuid
	movb %al,%cl		# save reg for future use
	andb $0x0f,%ah		# mask processor family
	movb %ah,X86
	andb $0xf0,%al		# mask model
	shrb $4,%al
	movb %al,X86_MODEL
	andb $0x0f,%cl		# mask revision
	movb %cl,X86_MASK
	movl %edx,X86_CAPABILITY

is486:	movl $(X86_CR0_AM | X86_CR0_WP | X86_CR0_NE | X86_CR0_MP),%ecx	# set AM, WP, NE and MP
	jmp 2f

is386:	movl $X86_CR0_MP,%ecx	# set MP
2:	movl %cr0,%eax
	andl $(X86_CR0_PG | X86_CR0_ET | X86_CR0_PE),%eax	# Save PG,PE,ET
	orl %ecx,%eax
	movl %eax,%cr0

	call check_x87
	lgdt early_gdt_descr
	lidt idt_descr
	ljmp $(__KERNEL_CS),$1f
1:	movl $(__KERNEL_DS),%eax	# reload all the segment registers
	movl %eax,%ss			# after changing gdt.

	movl $(__USER_DS),%eax		# DS/ES contains default USER segment
	movl %eax,%ds
	movl %eax,%es

	movl $(__KERNEL_PERCPU), %eax
	movl %eax,%fs			# set this cpu's percpu

#ifdef CONFIG_CC_STACKPROTECTOR
	/*
	 * The linker can't handle this by relocation.  Manually set
	 * base address in stack canary segment descriptor.
	 * Done only while 'ready' is still zero, i.e. on the first pass.
	 */
	cmpb $0,ready
	jne 1f
	movl $gdt_page,%eax
	movl $stack_canary,%ecx
	movw %cx, 8 * GDT_ENTRY_STACK_CANARY + 2(%eax)	/* base 15..0 */
	shrl $16, %ecx
	movb %cl, 8 * GDT_ENTRY_STACK_CANARY + 4(%eax)	/* base 23..16 */
	movb %ch, 8 * GDT_ENTRY_STACK_CANARY + 7(%eax)	/* base 31..24 */
1:
#endif
	movl $(__KERNEL_STACK_CANARY),%eax
	movl %eax,%gs

	xorl %eax,%eax			# Clear LDT
	lldt %ax

	cld			# gcc2 wants the direction flag cleared at all times
	pushl $0		# fake return address for unwinder
#ifdef CONFIG_SMP
	movb ready, %cl
	movb $1, ready
	cmpb $0,%cl		# the first CPU calls start_kernel
	je 1f
	movl (stack_start), %esp	/* later CPUs: reload %esp, dropping the fake return address */
1:
#endif /* CONFIG_SMP */
	jmp *(initial_code)

/*
 * We depend on ET to be correct. This checks for 287/387.
 *
 * Out:   X86_HARD_MATH = 1 if fninit left a zero low byte in the FPU
 *        status word, else 0 (and CR0.EM is then set).
 * Clobb: %eax, flags, CR0.TS (cleared by clts).
 */
check_x87:
	movb $0,X86_HARD_MATH
	clts
	fninit
	fstsw %ax
	cmpb $0,%al
	je 1f
	movl %cr0,%eax		/* no coprocessor: have to set bits */
	orl $X86_CR0_EM,%eax	/* set EM */
	movl %eax,%cr0
	ret
	ALIGN
1:	movb $1,X86_HARD_MATH
	.byte 0xDB,0xE4		/* fsetpm for 287, ignored by 387 */
	ret

/*
 *  setup_idt
 *
 *  sets up a idt with IDT_ENTRIES (256) entries pointing to
 *  ignore_int, interrupt gates. It doesn't actually load
 *  idt - that can be done only after paging has been enabled
 *  and the kernel moved to PAGE_OFFSET. Interrupts
 *  are enabled elsewhere, when we can be relatively
 *  sure everything is ok.
 *
 *  After the fill, vectors 0, 6, 13 and 14 are pointed at the
 *  early_* handlers instead.
 *
 *  Warning: %esi is live across this function.
 *  Clobbers: %eax, %ecx, %edx, %edi, flags.
 */
setup_idt:
	lea ignore_int,%edx
	movl $(__KERNEL_CS << 16),%eax	/* high word = code segment selector */
	movw %dx,%ax		/* low word = handler offset 15..0 */
	movw $0x8E00,%dx	/* interrupt gate - dpl=0, present */

	lea idt_table,%edi
	movl $IDT_ENTRIES,%ecx
rp_sidt:
	movl %eax,(%edi)
	movl %edx,4(%edi)
	addl $8,%edi
	decl %ecx
	jne rp_sidt

/*
 * set_early_handler handler,trapno
 * Build an interrupt gate for \handler and store it in IDT slot \trapno.
 * Clobbers %eax, %edx, %edi.
 */
.macro	set_early_handler handler,trapno
	lea \handler,%edx
	movl $(__KERNEL_CS << 16),%eax
	movw %dx,%ax
	movw $0x8E00,%dx	/* interrupt gate - dpl=0, present */
	lea idt_table,%edi
	movl %eax,8*\trapno(%edi)
	movl %edx,8*\trapno+4(%edi)
.endm

	set_early_handler handler=early_divide_err,trapno=0
	set_early_handler handler=early_illegal_opcode,trapno=6
	set_early_handler handler=early_protection_fault,trapno=13
	set_early_handler handler=early_page_fault,trapno=14

	ret

/*
 * Early exception stubs installed by setup_idt.  Each one puts its trap
 * number in %edx and joins early_fault.  The stubs for traps 0 and 6
 * push a fake error code first; the stubs for 13 and 14 do not.
 */
early_divide_err:
	xorl %edx,%edx		/* trapno 0 */
	pushl $0		/* fake errcode */
	jmp early_fault

early_illegal_opcode:
	movl $6,%edx
	pushl $0		/* fake errcode */
	jmp early_fault

early_protection_fault:
	movl $13,%edx
	jmp early_fault

early_page_fault:
	movl $14,%edx
	jmp early_fault

/*
 * early_fault: report the fault (when CONFIG_PRINTK is set), dump the
 * stack and halt forever.  Does not return.
 * In: %edx = trap number.
 */
early_fault:
	cld
#ifdef CONFIG_PRINTK
	pusha				/* printed as the "pusha regs" lines of fault_msg */
	movl $(__KERNEL_DS),%eax
	movl %eax,%ds
	movl %eax,%es
	cmpl $2,early_recursion_flag	/* give up once the flag has reached 2 */
	je hlt_loop
	incl early_recursion_flag
	movl %cr2,%eax
	pushl %eax
	pushl %edx		/* trapno */
	pushl $fault_msg
	call printk
#endif
	call dump_stack
hlt_loop:
	hlt
	jmp hlt_loop

/* This is the default interrupt "handler" :-) */
/*
 * Installed in every IDT slot by setup_idt.  With CONFIG_PRINTK it
 * prints int_msg and a stack dump, then returns with iret; without it,
 * it only does cld and iret.  If early_recursion_flag has already
 * reached 2 it halts in hlt_loop instead.
 * %eax, %ecx, %edx, %es and %ds are saved and restored.
 */
	ALIGN
ignore_int:
	cld
#ifdef CONFIG_PRINTK
	pushl %eax
	pushl %ecx
	pushl %edx
	pushl %es
	pushl %ds
	movl $(__KERNEL_DS),%eax
	movl %eax,%ds
	movl %eax,%es
	cmpl $2,early_recursion_flag
	je hlt_loop
	incl early_recursion_flag
	/*
	 * Each push lowers %esp by 4, so these four operands address
	 * offsets 16, 20, 24 and 28 from %esp as it stands here: the
	 * saved %eax followed by the first three dwords of the frame
	 * the CPU pushed.
	 */
	pushl 16(%esp)
	pushl 24(%esp)
	pushl 32(%esp)
	pushl 40(%esp)
	pushl $int_msg
	call printk

	call dump_stack

	addl $(5*4),%esp	/* drop the five printk arguments */
	popl %ds
	popl %es
	popl %edx
	popl %ecx
	popl %eax
#endif
	iret

/*
 * initial_code: address that the end of the CPU setup path jumps
 * through (jmp *(initial_code)).  Initialised to i386_start_kernel.
 */
	__REFDATA
.align 4
ENTRY(initial_code)
	.long i386_start_kernel

/*
 * BSS section
 *
 * Page-aligned, zero-filled tables.  With PAE, initial_pg_pmd holds
 * KPMDS PMD pages and initial_page_table is defined in the data section
 * instead; without PAE, initial_page_table is a single 4K page here.
 */
__PAGE_ALIGNED_BSS
	.align PAGE_SIZE_asm
#ifdef CONFIG_X86_PAE
initial_pg_pmd:
	.fill 1024*KPMDS,4,0
#else
ENTRY(initial_page_table)
	.fill 1024,4,0
#endif
initial_pg_fixmap:
	.fill 1024,4,0
ENTRY(empty_zero_page)
	.fill 4096,1,0
ENTRY(swapper_pg_dir)
	.fill 1024,4,0

/*
 * This starts the data section.
 *
 * PAE only: the statically initialised top-level table.  Entry 0 is the
 * low identity map; the remaining three entries are laid out according
 * to KPMDS (the number of kernel PMDs) and point at consecutive pages
 * of initial_pg_pmd.  The upper dword of every entry is zero.
 */
#ifdef CONFIG_X86_PAE
__PAGE_ALIGNED_DATA
	/* Page-aligned for the benefit of paravirt? */
	.align PAGE_SIZE_asm
ENTRY(initial_page_table)
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR),0	/* low identity map */
# if KPMDS == 3
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR),0
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR+0x1000),0
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR+0x2000),0
# elif KPMDS == 2
	.long	0,0
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR),0
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR+0x1000),0
# elif KPMDS == 1
	.long	0,0
	.long	0,0
	.long	pa(initial_pg_pmd+PGD_IDENT_ATTR),0
# else
#  error "Kernel PMDs should be 1, 2 or 3"
# endif
	.align PAGE_SIZE_asm		/* needs to be page-sized too */
#endif

/*
 * Initialised data used by the boot path.
 */
.data
/* Operand of "lss stack_start,%esp": initial %esp, then the %ss selector. */
ENTRY(stack_start)
	.long init_thread_union+THREAD_SIZE
	.long __BOOT_DS

/* Zero until the first CPU has gone through the setup path, then 1. */
ready:	.byte 0

/* Incremented by the early fault paths; they halt once it reaches 2. */
early_recursion_flag:
	.long 0

int_msg:
	.asciz "Unknown interrupt or fault at: %p %p %p\n"

fault_msg:
/* fault info: */
	.ascii "BUG: Int %d: CR2 %p\n"
/* pusha regs: */
	.ascii " EDI %p ESI %p EBP %p ESP %p\n"
	.ascii " EBX %p EDX %p ECX %p EAX %p\n"
/* fault frame: */
	.ascii " err %p EIP %p CS %p flg %p\n"
	.ascii "Stack: %p %p %p %p %p %p %p %p\n"
	.ascii " %p %p %p %p %p %p %p %p\n"
	.asciz " %p %p %p %p %p %p %p %p\n"

#include "../../x86/xen/xen-head.S"

/*
 * The IDT and GDT 'descriptors' are a strange 48-bit object
 * only used by the lidt and lgdt instructions. They are not
 * like usual segment descriptors - they consist of a 16-bit
 * segment size, and 32-bit linear address value:
 *
 * Each descriptor is preceded by a padding word so that its 32-bit
 * address field ends up 4-byte aligned.
 */

.globl boot_gdt_descr
.globl idt_descr

	ALIGN
/* early boot GDT descriptor (must use 1:1 address mapping) */
	.word 0				# 32 bit align gdt_desc.address
boot_gdt_descr:
	.word __BOOT_DS+7
	.long boot_gdt - __PAGE_OFFSET

	.word 0				# 32-bit align idt_desc.address
idt_descr:
	.word IDT_ENTRIES*8-1		# idt contains 256 entries
	.long idt_table

/* boot GDT descriptor (later on used by CPU#0): */
	.word 0				# 32 bit align gdt_desc.address
ENTRY(early_gdt_descr)
	.word GDT_ENTRIES*8-1
	.long gdt_page			/* Overwritten for secondary CPUs */

/*
 * The boot_gdt must mirror the equivalent in setup.S and is
 * used only for booting.
 *
 * GDT_ENTRY_BOOT_CS zeroed 8-byte slots come first, followed by the
 * flat 4 GB code descriptor and the flat 4 GB data descriptor.
 */
	.align L1_CACHE_BYTES
ENTRY(boot_gdt)
	.fill GDT_ENTRY_BOOT_CS,8,0
	.quad 0x00cf9a000000ffff	/* kernel 4GB code at 0x00000000 */
	.quad 0x00cf92000000ffff	/* kernel 4GB data at 0x00000000 */