Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | /* |
Dave Jones | 835c34a | 2007-10-12 21:10:53 -0400 | [diff] [blame] | 2 | * prepare to run common code |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 3 | * |
| 4 | * Copyright (C) 2000 Andrea Arcangeli <andrea@suse.de> SuSE |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 5 | */ |
| 6 | |
| 7 | #include <linux/init.h> |
| 8 | #include <linux/linkage.h> |
| 9 | #include <linux/types.h> |
| 10 | #include <linux/kernel.h> |
| 11 | #include <linux/string.h> |
| 12 | #include <linux/percpu.h> |
Thomas Gleixner | eaf76e8 | 2008-01-30 13:30:19 +0100 | [diff] [blame] | 13 | #include <linux/start_kernel.h> |
Huang, Ying | 8b664aa | 2008-03-28 10:49:44 +0800 | [diff] [blame] | 14 | #include <linux/io.h> |
Yinghai Lu | 72d7c3b | 2010-08-25 13:39:17 -0700 | [diff] [blame] | 15 | #include <linux/memblock.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 16 | |
| 17 | #include <asm/processor.h> |
| 18 | #include <asm/proto.h> |
| 19 | #include <asm/smp.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 20 | #include <asm/setup.h> |
| 21 | #include <asm/desc.h> |
Siddha, Suresh B | f6c2e33 | 2005-11-05 17:25:53 +0100 | [diff] [blame] | 22 | #include <asm/pgtable.h> |
Vivek Goyal | cfd243d | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 23 | #include <asm/tlbflush.h> |
Andi Kleen | 2bc0414 | 2005-11-05 17:25:53 +0100 | [diff] [blame] | 24 | #include <asm/sections.h> |
Thomas Gleixner | 718fc13 | 2008-01-30 13:30:17 +0100 | [diff] [blame] | 25 | #include <asm/kdebug.h> |
Andi Kleen | 7517527 | 2008-01-30 13:33:17 +0100 | [diff] [blame] | 26 | #include <asm/e820.h> |
Thomas Gleixner | 47a3d5d | 2009-08-29 15:03:59 +0200 | [diff] [blame] | 27 | #include <asm/bios_ebda.h> |
H. Peter Anvin | 5dcd14e | 2013-01-29 01:05:24 -0800 | [diff] [blame] | 28 | #include <asm/bootparam_utils.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 29 | |
/*
 * Manage page tables very early on.
 *
 * early_level4_pgt and early_dynamic_pgts are defined outside this file.
 * next_early_pgt is the index of the next unused table in
 * early_dynamic_pgts; it is advanced by early_make_pgtable() and rewound
 * to 0 by reset_early_page_tables().
 *
 * NOTE(review): the initial value of 2 presumably accounts for tables that
 * the startup code has already consumed before C code runs -- confirm
 * against the assembly entry path.
 */
extern pgd_t early_level4_pgt[PTRS_PER_PGD];
extern pmd_t early_dynamic_pgts[EARLY_DYNAMIC_PAGE_TABLES][PTRS_PER_PMD];
static unsigned int __initdata next_early_pgt = 2;
| 36 | |
| 37 | /* Wipe all early page tables except for the kernel symbol map */ |
| 38 | static void __init reset_early_page_tables(void) |
Vivek Goyal | cfd243d | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 39 | { |
H. Peter Anvin | 8170e6b | 2013-01-24 12:19:52 -0800 | [diff] [blame] | 40 | unsigned long i; |
| 41 | |
| 42 | for (i = 0; i < PTRS_PER_PGD-1; i++) |
| 43 | early_level4_pgt[i].pgd = 0; |
| 44 | |
| 45 | next_early_pgt = 0; |
| 46 | |
| 47 | write_cr3(__pa(early_level4_pgt)); |
| 48 | } |
| 49 | |
| 50 | /* Create a new PMD entry */ |
| 51 | int __init early_make_pgtable(unsigned long address) |
| 52 | { |
| 53 | unsigned long physaddr = address - __PAGE_OFFSET; |
| 54 | unsigned long i; |
| 55 | pgdval_t pgd, *pgd_p; |
Yinghai Lu | 6b9c75a | 2013-01-24 12:19:53 -0800 | [diff] [blame] | 56 | pudval_t pud, *pud_p; |
H. Peter Anvin | 8170e6b | 2013-01-24 12:19:52 -0800 | [diff] [blame] | 57 | pmdval_t pmd, *pmd_p; |
| 58 | |
| 59 | /* Invalid address or early pgt is done ? */ |
| 60 | if (physaddr >= MAXMEM || read_cr3() != __pa(early_level4_pgt)) |
| 61 | return -1; |
| 62 | |
Yinghai Lu | 6b9c75a | 2013-01-24 12:19:53 -0800 | [diff] [blame] | 63 | again: |
| 64 | pgd_p = &early_level4_pgt[pgd_index(address)].pgd; |
H. Peter Anvin | 8170e6b | 2013-01-24 12:19:52 -0800 | [diff] [blame] | 65 | pgd = *pgd_p; |
| 66 | |
| 67 | /* |
| 68 | * The use of __START_KERNEL_map rather than __PAGE_OFFSET here is |
| 69 | * critical -- __PAGE_OFFSET would point us back into the dynamic |
| 70 | * range and we might end up looping forever... |
| 71 | */ |
Yinghai Lu | 6b9c75a | 2013-01-24 12:19:53 -0800 | [diff] [blame] | 72 | if (pgd) |
H. Peter Anvin | 8170e6b | 2013-01-24 12:19:52 -0800 | [diff] [blame] | 73 | pud_p = (pudval_t *)((pgd & PTE_PFN_MASK) + __START_KERNEL_map - phys_base); |
Yinghai Lu | 6b9c75a | 2013-01-24 12:19:53 -0800 | [diff] [blame] | 74 | else { |
| 75 | if (next_early_pgt >= EARLY_DYNAMIC_PAGE_TABLES) { |
H. Peter Anvin | 8170e6b | 2013-01-24 12:19:52 -0800 | [diff] [blame] | 76 | reset_early_page_tables(); |
Yinghai Lu | 6b9c75a | 2013-01-24 12:19:53 -0800 | [diff] [blame] | 77 | goto again; |
| 78 | } |
H. Peter Anvin | 8170e6b | 2013-01-24 12:19:52 -0800 | [diff] [blame] | 79 | |
| 80 | pud_p = (pudval_t *)early_dynamic_pgts[next_early_pgt++]; |
| 81 | for (i = 0; i < PTRS_PER_PUD; i++) |
| 82 | pud_p[i] = 0; |
H. Peter Anvin | 8170e6b | 2013-01-24 12:19:52 -0800 | [diff] [blame] | 83 | *pgd_p = (pgdval_t)pud_p - __START_KERNEL_map + phys_base + _KERNPG_TABLE; |
| 84 | } |
Yinghai Lu | 6b9c75a | 2013-01-24 12:19:53 -0800 | [diff] [blame] | 85 | pud_p += pud_index(address); |
| 86 | pud = *pud_p; |
H. Peter Anvin | 8170e6b | 2013-01-24 12:19:52 -0800 | [diff] [blame] | 87 | |
Yinghai Lu | 6b9c75a | 2013-01-24 12:19:53 -0800 | [diff] [blame] | 88 | if (pud) |
| 89 | pmd_p = (pmdval_t *)((pud & PTE_PFN_MASK) + __START_KERNEL_map - phys_base); |
| 90 | else { |
| 91 | if (next_early_pgt >= EARLY_DYNAMIC_PAGE_TABLES) { |
| 92 | reset_early_page_tables(); |
| 93 | goto again; |
| 94 | } |
| 95 | |
| 96 | pmd_p = (pmdval_t *)early_dynamic_pgts[next_early_pgt++]; |
| 97 | for (i = 0; i < PTRS_PER_PMD; i++) |
| 98 | pmd_p[i] = 0; |
| 99 | *pud_p = (pudval_t)pmd_p - __START_KERNEL_map + phys_base + _KERNPG_TABLE; |
H. Peter Anvin | 8170e6b | 2013-01-24 12:19:52 -0800 | [diff] [blame] | 100 | } |
Yinghai Lu | 6b9c75a | 2013-01-24 12:19:53 -0800 | [diff] [blame] | 101 | pmd = (physaddr & PMD_MASK) + (__PAGE_KERNEL_LARGE & ~_PAGE_GLOBAL); |
| 102 | pmd_p[pmd_index(address)] = pmd; |
H. Peter Anvin | 8170e6b | 2013-01-24 12:19:52 -0800 | [diff] [blame] | 103 | |
| 104 | return 0; |
Vivek Goyal | cfd243d | 2007-05-02 19:27:07 +0200 | [diff] [blame] | 105 | } |
| 106 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 107 | /* Don't add a printk in there. printk relies on the PDA which is not initialized |
| 108 | yet. */ |
| 109 | static void __init clear_bss(void) |
| 110 | { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 111 | memset(__bss_start, 0, |
Andi Kleen | 2bc0414 | 2005-11-05 17:25:53 +0100 | [diff] [blame] | 112 | (unsigned long) __bss_stop - (unsigned long) __bss_start); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 113 | } |
| 114 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 115 | static void __init copy_bootdata(char *real_mode_data) |
| 116 | { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 117 | char * command_line; |
| 118 | |
H. Peter Anvin | 30c8264 | 2007-10-15 17:13:22 -0700 | [diff] [blame] | 119 | memcpy(&boot_params, real_mode_data, sizeof boot_params); |
H. Peter Anvin | 5dcd14e | 2013-01-29 01:05:24 -0800 | [diff] [blame] | 120 | sanitize_boot_params(&boot_params); |
H. Peter Anvin | 30c8264 | 2007-10-15 17:13:22 -0700 | [diff] [blame] | 121 | if (boot_params.hdr.cmd_line_ptr) { |
| 122 | command_line = __va(boot_params.hdr.cmd_line_ptr); |
| 123 | memcpy(boot_command_line, command_line, COMMAND_LINE_SIZE); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 124 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 125 | } |
| 126 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 127 | void __init x86_64_start_kernel(char * real_mode_data) |
| 128 | { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 129 | int i; |
| 130 | |
Ingo Molnar | b4e0409 | 2008-02-21 13:45:16 +0100 | [diff] [blame] | 131 | /* |
| 132 | * Build-time sanity checks on the kernel image and module |
| 133 | * area mappings. (these are purely build-time and produce no code) |
| 134 | */ |
| 135 | BUILD_BUG_ON(MODULES_VADDR < KERNEL_IMAGE_START); |
| 136 | BUILD_BUG_ON(MODULES_VADDR-KERNEL_IMAGE_START < KERNEL_IMAGE_SIZE); |
| 137 | BUILD_BUG_ON(MODULES_LEN + KERNEL_IMAGE_SIZE > 2*PUD_SIZE); |
| 138 | BUILD_BUG_ON((KERNEL_IMAGE_START & ~PMD_MASK) != 0); |
| 139 | BUILD_BUG_ON((MODULES_VADDR & ~PMD_MASK) != 0); |
| 140 | BUILD_BUG_ON(!(MODULES_VADDR > __START_KERNEL)); |
| 141 | BUILD_BUG_ON(!(((MODULES_END - 1) & PGDIR_MASK) == |
| 142 | (__START_KERNEL & PGDIR_MASK))); |
Jan Beulich | 66d4bdf | 2008-07-31 16:48:31 +0100 | [diff] [blame] | 143 | BUILD_BUG_ON(__fix_to_virt(__end_of_fixed_addresses) <= MODULES_END); |
Ingo Molnar | b4e0409 | 2008-02-21 13:45:16 +0100 | [diff] [blame] | 144 | |
H. Peter Anvin | 8170e6b | 2013-01-24 12:19:52 -0800 | [diff] [blame] | 145 | /* Kill off the identity-map trampoline */ |
| 146 | reset_early_page_tables(); |
| 147 | |
Yinghai Lu | 3df0af0 | 2006-12-07 02:14:12 +0100 | [diff] [blame] | 148 | /* clear bss before set_intr_gate with early_idt_handler */ |
| 149 | clear_bss(); |
| 150 | |
Andi Kleen | 5524ea3 | 2008-03-11 02:23:20 +0100 | [diff] [blame] | 151 | for (i = 0; i < NUM_EXCEPTION_VECTORS; i++) { |
Ingo Molnar | 076f977 | 2008-01-30 13:33:06 +0100 | [diff] [blame] | 152 | #ifdef CONFIG_EARLY_PRINTK |
Roland McGrath | 8866cd9 | 2008-01-30 13:33:06 +0100 | [diff] [blame] | 153 | set_intr_gate(i, &early_idt_handlers[i]); |
Ingo Molnar | 076f977 | 2008-01-30 13:33:06 +0100 | [diff] [blame] | 154 | #else |
| 155 | set_intr_gate(i, early_idt_handler); |
| 156 | #endif |
| 157 | } |
Glauber de Oliveira Costa | 9d1c6e7 | 2007-10-19 20:35:03 +0200 | [diff] [blame] | 158 | load_idt((const struct desc_ptr *)&idt_descr); |
Siddha, Suresh B | f6c2e33 | 2005-11-05 17:25:53 +0100 | [diff] [blame] | 159 | |
Yinghai Lu | fa2bbce | 2013-01-24 12:19:49 -0800 | [diff] [blame] | 160 | copy_bootdata(__va(real_mode_data)); |
| 161 | |
dcg | 1254469 | 2008-09-28 18:49:46 +0200 | [diff] [blame] | 162 | if (console_loglevel == 10) |
| 163 | early_printk("Kernel alive\n"); |
Ingo Molnar | 2148270 | 2006-07-03 00:24:57 -0700 | [diff] [blame] | 164 | |
H. Peter Anvin | 8170e6b | 2013-01-24 12:19:52 -0800 | [diff] [blame] | 165 | clear_page(init_level4_pgt); |
| 166 | /* set init_level4_pgt kernel high mapping*/ |
| 167 | init_level4_pgt[511] = early_level4_pgt[511]; |
| 168 | |
Jeremy Fitzhardinge | f97013f | 2008-06-25 00:19:18 -0400 | [diff] [blame] | 169 | x86_64_start_reservations(real_mode_data); |
| 170 | } |
| 171 | |
| 172 | void __init x86_64_start_reservations(char *real_mode_data) |
| 173 | { |
Yinghai Lu | fa2bbce | 2013-01-24 12:19:49 -0800 | [diff] [blame] | 174 | /* version is always not zero if it is copied */ |
| 175 | if (!boot_params.hdr.version) |
| 176 | copy_bootdata(__va(real_mode_data)); |
Yinghai Lu | 9de819f | 2008-01-30 13:30:46 +0100 | [diff] [blame] | 177 | |
Tejun Heo | 24aa078 | 2011-07-12 11:16:06 +0200 | [diff] [blame] | 178 | memblock_reserve(__pa_symbol(&_text), |
| 179 | __pa_symbol(&__bss_stop) - __pa_symbol(&_text)); |
Andi Kleen | 7517527 | 2008-01-30 13:33:17 +0100 | [diff] [blame] | 180 | |
Thomas Gleixner | 47a3d5d | 2009-08-29 15:03:59 +0200 | [diff] [blame] | 181 | reserve_ebda_region(); |
Andi Kleen | 7517527 | 2008-01-30 13:33:17 +0100 | [diff] [blame] | 182 | |
| 183 | /* |
| 184 | * At this point everything still needed from the boot loader |
| 185 | * or BIOS or kernel text should be early reserved or marked not |
| 186 | * RAM in e820. All other memory is free game. |
| 187 | */ |
| 188 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 189 | start_kernel(); |
| 190 | } |