Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | #include <linux/module.h> |
Adrian Bunk | cd6ed52 | 2006-12-06 20:40:06 -0800 | [diff] [blame] | 2 | #include <linux/reboot.h> |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 3 | #include <linux/init.h> |
| 4 | #include <linux/pm.h> |
| 5 | #include <linux/efi.h> |
| 6 | #include <acpi/reboot.h> |
| 7 | #include <asm/io.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 8 | #include <asm/apic.h> |
Zachary Amsden | 4d37e7e | 2005-09-03 15:56:38 -0700 | [diff] [blame] | 9 | #include <asm/desc.h> |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 10 | #include <asm/hpet.h> |
Jeremy Fitzhardinge | 68db065 | 2008-03-17 16:37:13 -0700 | [diff] [blame] | 11 | #include <asm/pgtable.h> |
Dmitri Vorobiev | 4412620 | 2008-04-28 03:15:59 +0400 | [diff] [blame] | 12 | #include <asm/proto.h> |
Jeremy Fitzhardinge | 973efae | 2007-05-02 19:27:06 +0200 | [diff] [blame] | 13 | #include <asm/reboot_fixups.h> |
Jeremy Fitzhardinge | 07f3331 | 2007-05-02 19:27:11 +0200 | [diff] [blame] | 14 | #include <asm/reboot.h> |
Jaswinder Singh Rajput | 8248771 | 2008-12-27 18:32:28 +0530 | [diff] [blame] | 15 | #include <asm/pci_x86.h> |
Eduardo Habkost | d176720 | 2008-11-17 19:03:24 -0200 | [diff] [blame] | 16 | #include <asm/virtext.h> |
Jaswinder Singh Rajput | 96b89dc | 2009-01-07 21:35:48 +0530 | [diff] [blame] | 17 | #include <asm/cpu.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 18 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 19 | #ifdef CONFIG_X86_32 |
| 20 | # include <linux/dmi.h> |
| 21 | # include <linux/ctype.h> |
| 22 | # include <linux/mc146818rtc.h> |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 23 | #else |
| 24 | # include <asm/iommu.h> |
| 25 | #endif |
| 26 | |
/*
 * Power-off callback, if one has been installed.  It is not initialised
 * here, so it starts out NULL.  Exported for use outside this file.
 */
void (*pm_power_off)(void);
EXPORT_SYMBOL(pm_power_off);
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 32 | |
Jan Beulich | ebdd561 | 2008-05-12 15:43:38 +0200 | [diff] [blame] | 33 | static const struct desc_ptr no_idt = {}; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 34 | static int reboot_mode; |
Eduardo Habkost | 8d00450 | 2008-11-04 12:52:44 -0200 | [diff] [blame] | 35 | enum reboot_type reboot_type = BOOT_KBD; |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 36 | int reboot_force; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 37 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 38 | #if defined(CONFIG_X86_32) && defined(CONFIG_SMP) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 39 | static int reboot_cpu = -1; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 40 | #endif |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 41 | |
Eduardo Habkost | d176720 | 2008-11-17 19:03:24 -0200 | [diff] [blame] | 42 | /* This is set if we need to go through the 'emergency' path. |
| 43 | * When machine_emergency_restart() is called, we may be on |
| 44 | * an inconsistent state and won't be able to do a clean cleanup |
| 45 | */ |
| 46 | static int reboot_emergency; |
| 47 | |
H. Peter Anvin | 14d7ca5 | 2008-11-11 16:19:48 -0800 | [diff] [blame] | 48 | /* This is set by the PCI code if either type 1 or type 2 PCI is detected */ |
| 49 | bool port_cf9_safe = false; |
| 50 | |
| 51 | /* reboot=b[ios] | s[mp] | t[riple] | k[bd] | e[fi] [, [w]arm | [c]old] | p[ci] |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 52 | warm Don't set the cold reboot flag |
| 53 | cold Set the cold reboot flag |
| 54 | bios Reboot by jumping through the BIOS (only for X86_32) |
| 55 | smp Reboot by executing reset on BSP or other CPU (only for X86_32) |
| 56 | triple Force a triple fault (init) |
| 57 | kbd Use the keyboard controller. cold reset (default) |
| 58 | acpi Use the RESET_REG in the FADT |
| 59 | efi Use efi reset_system runtime service |
H. Peter Anvin | 14d7ca5 | 2008-11-11 16:19:48 -0800 | [diff] [blame] | 60 | pci Use the so-called "PCI reset register", CF9 |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 61 | force Avoid anything that could hang. |
| 62 | */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 63 | static int __init reboot_setup(char *str) |
| 64 | { |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 65 | for (;;) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 66 | switch (*str) { |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 67 | case 'w': |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 68 | reboot_mode = 0x1234; |
| 69 | break; |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 70 | |
| 71 | case 'c': |
| 72 | reboot_mode = 0; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 73 | break; |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 74 | |
| 75 | #ifdef CONFIG_X86_32 |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 76 | #ifdef CONFIG_SMP |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 77 | case 's': |
Tobias Klauser | 6f673d8 | 2005-09-13 01:25:48 -0700 | [diff] [blame] | 78 | if (isdigit(*(str+1))) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 79 | reboot_cpu = (int) (*(str+1) - '0'); |
Tobias Klauser | 6f673d8 | 2005-09-13 01:25:48 -0700 | [diff] [blame] | 80 | if (isdigit(*(str+2))) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 81 | reboot_cpu = reboot_cpu*10 + (int)(*(str+2) - '0'); |
| 82 | } |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 83 | /* we will leave sorting out the final value |
| 84 | when we are ready to reboot, since we might not |
| 85 | have set up boot_cpu_id or smp_num_cpu */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 86 | break; |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 87 | #endif /* CONFIG_SMP */ |
| 88 | |
| 89 | case 'b': |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 90 | #endif |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 91 | case 'a': |
| 92 | case 'k': |
| 93 | case 't': |
| 94 | case 'e': |
H. Peter Anvin | 14d7ca5 | 2008-11-11 16:19:48 -0800 | [diff] [blame] | 95 | case 'p': |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 96 | reboot_type = *str; |
| 97 | break; |
| 98 | |
| 99 | case 'f': |
| 100 | reboot_force = 1; |
| 101 | break; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 102 | } |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 103 | |
| 104 | str = strchr(str, ','); |
| 105 | if (str) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 106 | str++; |
| 107 | else |
| 108 | break; |
| 109 | } |
| 110 | return 1; |
| 111 | } |
| 112 | |
| 113 | __setup("reboot=", reboot_setup); |
| 114 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 115 | |
| 116 | #ifdef CONFIG_X86_32 |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 117 | /* |
| 118 | * Reboot options and system auto-detection code provided by |
| 119 | * Dell Inc. so their systems "just work". :-) |
| 120 | */ |
| 121 | |
| 122 | /* |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 123 | * Some machines require the "reboot=b" commandline option, |
| 124 | * this quirk makes that automatic. |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 125 | */ |
Jeff Garzik | 1855256 | 2007-10-03 15:15:40 -0400 | [diff] [blame] | 126 | static int __init set_bios_reboot(const struct dmi_system_id *d) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 127 | { |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 128 | if (reboot_type != BOOT_BIOS) { |
| 129 | reboot_type = BOOT_BIOS; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 130 | printk(KERN_INFO "%s series board detected. Selecting BIOS-method for reboots.\n", d->ident); |
| 131 | } |
| 132 | return 0; |
| 133 | } |
| 134 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 135 | static struct dmi_system_id __initdata reboot_dmi_table[] = { |
Tim Gardner | b9e82af | 2007-06-01 00:46:40 -0700 | [diff] [blame] | 136 | { /* Handle problems with rebooting on Dell E520's */ |
| 137 | .callback = set_bios_reboot, |
| 138 | .ident = "Dell E520", |
| 139 | .matches = { |
| 140 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 141 | DMI_MATCH(DMI_PRODUCT_NAME, "Dell DM061"), |
| 142 | }, |
| 143 | }, |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 144 | { /* Handle problems with rebooting on Dell 1300's */ |
Eric W. Biederman | dd2a130 | 2005-06-25 14:57:55 -0700 | [diff] [blame] | 145 | .callback = set_bios_reboot, |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 146 | .ident = "Dell PowerEdge 1300", |
| 147 | .matches = { |
| 148 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Computer Corporation"), |
| 149 | DMI_MATCH(DMI_PRODUCT_NAME, "PowerEdge 1300/"), |
| 150 | }, |
| 151 | }, |
| 152 | { /* Handle problems with rebooting on Dell 300's */ |
| 153 | .callback = set_bios_reboot, |
| 154 | .ident = "Dell PowerEdge 300", |
| 155 | .matches = { |
| 156 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Computer Corporation"), |
| 157 | DMI_MATCH(DMI_PRODUCT_NAME, "PowerEdge 300/"), |
| 158 | }, |
| 159 | }, |
James Jarvis | df2edcf | 2007-07-21 17:11:11 +0200 | [diff] [blame] | 160 | { /* Handle problems with rebooting on Dell Optiplex 745's SFF*/ |
| 161 | .callback = set_bios_reboot, |
| 162 | .ident = "Dell OptiPlex 745", |
| 163 | .matches = { |
| 164 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 165 | DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 745"), |
James Jarvis | df2edcf | 2007-07-21 17:11:11 +0200 | [diff] [blame] | 166 | }, |
| 167 | }, |
Coleman Kane | fc115bf | 2008-03-04 15:05:41 -0800 | [diff] [blame] | 168 | { /* Handle problems with rebooting on Dell Optiplex 745's DFF*/ |
| 169 | .callback = set_bios_reboot, |
| 170 | .ident = "Dell OptiPlex 745", |
| 171 | .matches = { |
| 172 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 173 | DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 745"), |
| 174 | DMI_MATCH(DMI_BOARD_NAME, "0MM599"), |
| 175 | }, |
| 176 | }, |
Heinz-Ado Arnolds | fc1c892 | 2008-03-12 16:27:56 +0100 | [diff] [blame] | 177 | { /* Handle problems with rebooting on Dell Optiplex 745 with 0KW626 */ |
| 178 | .callback = set_bios_reboot, |
| 179 | .ident = "Dell OptiPlex 745", |
| 180 | .matches = { |
| 181 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 182 | DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 745"), |
| 183 | DMI_MATCH(DMI_BOARD_NAME, "0KW626"), |
| 184 | }, |
| 185 | }, |
Steve Conklin | 093bac1 | 2008-11-14 00:55:51 -0600 | [diff] [blame] | 186 | { /* Handle problems with rebooting on Dell Optiplex 330 with 0KP561 */ |
| 187 | .callback = set_bios_reboot, |
| 188 | .ident = "Dell OptiPlex 330", |
| 189 | .matches = { |
| 190 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 191 | DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 330"), |
| 192 | DMI_MATCH(DMI_BOARD_NAME, "0KP561"), |
| 193 | }, |
| 194 | }, |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 195 | { /* Handle problems with rebooting on Dell 2400's */ |
| 196 | .callback = set_bios_reboot, |
| 197 | .ident = "Dell PowerEdge 2400", |
| 198 | .matches = { |
| 199 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Computer Corporation"), |
| 200 | DMI_MATCH(DMI_PRODUCT_NAME, "PowerEdge 2400"), |
| 201 | }, |
| 202 | }, |
Ingo Molnar | fab3b58 | 2008-07-17 13:50:15 +0200 | [diff] [blame] | 203 | { /* Handle problems with rebooting on Dell T5400's */ |
| 204 | .callback = set_bios_reboot, |
| 205 | .ident = "Dell Precision T5400", |
| 206 | .matches = { |
| 207 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 208 | DMI_MATCH(DMI_PRODUCT_NAME, "Precision WorkStation T5400"), |
| 209 | }, |
| 210 | }, |
Ben Collins | 766c3f9 | 2006-01-06 00:12:20 -0800 | [diff] [blame] | 211 | { /* Handle problems with rebooting on HP laptops */ |
Thierry Vignaud | d91b14c | 2005-11-29 19:34:35 -0800 | [diff] [blame] | 212 | .callback = set_bios_reboot, |
Ben Collins | 766c3f9 | 2006-01-06 00:12:20 -0800 | [diff] [blame] | 213 | .ident = "HP Compaq Laptop", |
Thierry Vignaud | d91b14c | 2005-11-29 19:34:35 -0800 | [diff] [blame] | 214 | .matches = { |
| 215 | DMI_MATCH(DMI_SYS_VENDOR, "Hewlett-Packard"), |
Ben Collins | 766c3f9 | 2006-01-06 00:12:20 -0800 | [diff] [blame] | 216 | DMI_MATCH(DMI_PRODUCT_NAME, "HP Compaq"), |
Thierry Vignaud | d91b14c | 2005-11-29 19:34:35 -0800 | [diff] [blame] | 217 | }, |
| 218 | }, |
Leann Ogasawara | dd4124a | 2009-03-04 11:53:00 -0800 | [diff] [blame] | 219 | { /* Handle problems with rebooting on Dell XPS710 */ |
| 220 | .callback = set_bios_reboot, |
| 221 | .ident = "Dell XPS710", |
| 222 | .matches = { |
| 223 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 224 | DMI_MATCH(DMI_PRODUCT_NAME, "Dell XPS710"), |
| 225 | }, |
| 226 | }, |
Alan Cox | c5da9a2 | 2009-03-26 20:45:28 +0000 | [diff] [blame] | 227 | { /* Handle problems with rebooting on Dell DXP061 */ |
| 228 | .callback = set_bios_reboot, |
| 229 | .ident = "Dell DXP061", |
| 230 | .matches = { |
| 231 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 232 | DMI_MATCH(DMI_PRODUCT_NAME, "Dell DXP061"), |
| 233 | }, |
| 234 | }, |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 235 | { } |
| 236 | }; |
| 237 | |
| 238 | static int __init reboot_init(void) |
| 239 | { |
| 240 | dmi_check_system(reboot_dmi_table); |
| 241 | return 0; |
| 242 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 243 | core_initcall(reboot_init); |
| 244 | |
| 245 | /* The following code and data reboots the machine by switching to real |
| 246 | mode and jumping to the BIOS reset entry point, as if the CPU has |
| 247 | really been reset. The previous version asked the keyboard |
| 248 | controller to pulse the CPU reset line, which is more thorough, but |
| 249 | doesn't work with at least one type of 486 motherboard. It is easy |
| 250 | to stop this code working; hence the copious comments. */ |
Jan Beulich | ebdd561 | 2008-05-12 15:43:38 +0200 | [diff] [blame] | 251 | static const unsigned long long |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 252 | real_mode_gdt_entries [3] = |
| 253 | { |
| 254 | 0x0000000000000000ULL, /* Null descriptor */ |
Jan Beulich | ebdd561 | 2008-05-12 15:43:38 +0200 | [diff] [blame] | 255 | 0x00009b000000ffffULL, /* 16-bit real-mode 64k code at 0x00000000 */ |
| 256 | 0x000093000100ffffULL /* 16-bit real-mode 64k data at 0x00000100 */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 257 | }; |
| 258 | |
Jan Beulich | ebdd561 | 2008-05-12 15:43:38 +0200 | [diff] [blame] | 259 | static const struct desc_ptr |
Rusty Russell | 05f4a3e | 2006-09-25 23:32:22 -0700 | [diff] [blame] | 260 | real_mode_gdt = { sizeof (real_mode_gdt_entries) - 1, (long)real_mode_gdt_entries }, |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 261 | real_mode_idt = { 0x3ff, 0 }; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 262 | |
/*
 * 16-bit protected mode code that disables paging and the cache and
 * then switches to real mode.  machine_real_restart() copies it to low
 * memory with the caller's code placed directly behind it.
 *
 * The instruction that switches to real mode by writing to CR0 must be
 * followed immediately by a far jump instruction, which sets CS to a
 * valid value for real mode and flushes the prefetch queue to avoid
 * running instructions that have already been decoded in protected
 * mode.
 *
 * Step by step:
 *  - CR0 is masked with 0x11, which keeps only PE and ET and so clears
 *    PG (paging) and TS (task switch for coprocessor state save) among
 *    others; CD and NW are then set to disable the cache on a 486.
 *  - CR3 is written, which flushes the TLB now that paging is off.
 *  - CR0 is read back; wbinvd is skipped if neither CD nor NW stuck.
 *  - Finally PE is cleared too (only ET survives in the low byte) and
 *    CR0 is written once more, leaving protected mode.
 *
 * This is more like the state of a 486 after reset.  I don't know if
 * something else should be done for other chips.
 *
 * More could be done here to set up the registers as if a CPU reset had
 * occurred; hopefully real BIOSs don't assume much.
 */
static const unsigned char real_mode_switch[] = {
	0x66, 0x0f, 0x20, 0xc0,				/*    movl  %cr0,%eax        */
	0x66, 0x83, 0xe0, 0x11,				/*    andl  $0x00000011,%eax */
	0x66, 0x0d, 0x00, 0x00, 0x00, 0x60,		/*    orl   $0x60000000,%eax */
	0x66, 0x0f, 0x22, 0xc0,				/*    movl  %eax,%cr0        */
	0x66, 0x0f, 0x22, 0xd8,				/*    movl  %eax,%cr3        */
	0x66, 0x0f, 0x20, 0xc3,				/*    movl  %cr0,%ebx        */
	0x66, 0x81, 0xe3, 0x00, 0x00, 0x00, 0x60,	/*    andl  $0x60000000,%ebx */
	0x74, 0x02,					/*    jz    f                */
	0x0f, 0x09,					/*    wbinvd                 */
	0x24, 0x10,					/* f: andb  $0x10,al         */
	0x66, 0x0f, 0x22, 0xc0				/*    movl  %eax,%cr0        */
};

/* Far jump to the BIOS reset entry point; the default payload for BOOT_BIOS. */
static const unsigned char jump_to_bios[] = {
	0xea, 0x00, 0x00, 0xff, 0xff			/*    ljmp  $0xffff,$0x0000  */
};
| 299 | |
| 300 | /* |
| 301 | * Switch to real mode and then execute the code |
| 302 | * specified by the code and length parameters. |
| 303 | * We assume that length will aways be less that 100! |
| 304 | */ |
Jan Beulich | ebdd561 | 2008-05-12 15:43:38 +0200 | [diff] [blame] | 305 | void machine_real_restart(const unsigned char *code, int length) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 306 | { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 307 | local_irq_disable(); |
| 308 | |
| 309 | /* Write zero to CMOS register number 0x0f, which the BIOS POST |
| 310 | routine will recognize as telling it to do a proper reboot. (Well |
| 311 | that's what this book in front of me says -- it may only apply to |
| 312 | the Phoenix BIOS though, it's not clear). At the same time, |
| 313 | disable NMIs by setting the top bit in the CMOS address register, |
| 314 | as we're about to do peculiar things to the CPU. I'm not sure if |
| 315 | `outb_p' is needed instead of just `outb'. Use it to be on the |
| 316 | safe side. (Yes, CMOS_WRITE does outb_p's. - Paul G.) |
| 317 | */ |
Hisashi Hifumi | 62dbc21 | 2007-05-02 19:27:18 +0200 | [diff] [blame] | 318 | spin_lock(&rtc_lock); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 319 | CMOS_WRITE(0x00, 0x8f); |
Hisashi Hifumi | 62dbc21 | 2007-05-02 19:27:18 +0200 | [diff] [blame] | 320 | spin_unlock(&rtc_lock); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 321 | |
| 322 | /* Remap the kernel at virtual address zero, as well as offset zero |
| 323 | from the kernel segment. This assumes the kernel segment starts at |
| 324 | virtual address PAGE_OFFSET. */ |
Jeremy Fitzhardinge | 68db065 | 2008-03-17 16:37:13 -0700 | [diff] [blame] | 325 | memcpy(swapper_pg_dir, swapper_pg_dir + KERNEL_PGD_BOUNDARY, |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 326 | sizeof(swapper_pg_dir [0]) * KERNEL_PGD_PTRS); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 327 | |
| 328 | /* |
| 329 | * Use `swapper_pg_dir' as our page directory. |
| 330 | */ |
| 331 | load_cr3(swapper_pg_dir); |
| 332 | |
| 333 | /* Write 0x1234 to absolute memory location 0x472. The BIOS reads |
| 334 | this on booting to tell it to "Bypass memory test (also warm |
| 335 | boot)". This seems like a fairly standard thing that gets set by |
| 336 | REBOOT.COM programs, and the previous reset routine did this |
| 337 | too. */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 338 | *((unsigned short *)0x472) = reboot_mode; |
| 339 | |
| 340 | /* For the switch to real mode, copy some code to low memory. It has |
| 341 | to be in the first 64k because it is running in 16-bit mode, and it |
| 342 | has to have the same physical and virtual address, because it turns |
| 343 | off paging. Copy it near the end of the first page, out of the way |
| 344 | of BIOS variables. */ |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 345 | memcpy((void *)(0x1000 - sizeof(real_mode_switch) - 100), |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 346 | real_mode_switch, sizeof (real_mode_switch)); |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 347 | memcpy((void *)(0x1000 - 100), code, length); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 348 | |
| 349 | /* Set up the IDT for real mode. */ |
Zachary Amsden | 4d37e7e | 2005-09-03 15:56:38 -0700 | [diff] [blame] | 350 | load_idt(&real_mode_idt); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 351 | |
| 352 | /* Set up a GDT from which we can load segment descriptors for real |
| 353 | mode. The GDT is not used in real mode; it is just needed here to |
| 354 | prepare the descriptors. */ |
Zachary Amsden | 4d37e7e | 2005-09-03 15:56:38 -0700 | [diff] [blame] | 355 | load_gdt(&real_mode_gdt); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 356 | |
| 357 | /* Load the data segment registers, and thus the descriptors ready for |
| 358 | real mode. The base address of each segment is 0x100, 16 times the |
| 359 | selector value being loaded here. This is so that the segment |
| 360 | registers don't have to be reloaded after switching to real mode: |
| 361 | the values are consistent for real mode operation already. */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 362 | __asm__ __volatile__ ("movl $0x0010,%%eax\n" |
| 363 | "\tmovl %%eax,%%ds\n" |
| 364 | "\tmovl %%eax,%%es\n" |
| 365 | "\tmovl %%eax,%%fs\n" |
| 366 | "\tmovl %%eax,%%gs\n" |
| 367 | "\tmovl %%eax,%%ss" : : : "eax"); |
| 368 | |
| 369 | /* Jump to the 16-bit code that we copied earlier. It disables paging |
| 370 | and the cache, switches to real mode, and jumps to the BIOS reset |
| 371 | entry point. */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 372 | __asm__ __volatile__ ("ljmp $0x0008,%0" |
| 373 | : |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 374 | : "i" ((void *)(0x1000 - sizeof (real_mode_switch) - 100))); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 375 | } |
Alexey Dobriyan | 129f694 | 2005-06-23 00:08:33 -0700 | [diff] [blame] | 376 | #ifdef CONFIG_APM_MODULE |
| 377 | EXPORT_SYMBOL(machine_real_restart); |
| 378 | #endif |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 379 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 380 | #endif /* CONFIG_X86_32 */ |
| 381 | |
/*
 * Poll port 0x64 until bit 0x02 reads as clear, pausing 2us between
 * reads.  Gives up silently after 0x10000 reads.
 * NOTE(review): bit 0x02 is presumably the keyboard controller's
 * "input buffer full" flag -- confirm against the controller docs.
 */
static inline void kb_wait(void)
{
	int reads_left = 0x10000;

	while (reads_left-- > 0 && (inb(0x64) & 0x02) != 0)
		udelay(2);
}
| 392 | |
/*
 * Callback handed to nmi_shootdown_cpus(): turn VMX off on the CPU it
 * runs on.  Neither argument is used.
 */
static void vmxoff_nmi(int cpu, struct die_args *args)
{
	cpu_emergency_vmxoff();
}
| 397 | |
| 398 | /* Use NMIs as IPIs to tell all CPUs to disable virtualization |
| 399 | */ |
| 400 | static void emergency_vmx_disable_all(void) |
| 401 | { |
| 402 | /* Just make sure we won't change CPUs while doing this */ |
| 403 | local_irq_disable(); |
| 404 | |
| 405 | /* We need to disable VMX on all CPUs before rebooting, otherwise |
| 406 | * we risk hanging up the machine, because the CPU ignore INIT |
| 407 | * signals when VMX is enabled. |
| 408 | * |
| 409 | * We can't take any locks and we may be on an inconsistent |
| 410 | * state, so we use NMIs as IPIs to tell the other CPUs to disable |
| 411 | * VMX and halt. |
| 412 | * |
| 413 | * For safety, we will avoid running the nmi_shootdown_cpus() |
| 414 | * stuff unnecessarily, but we don't have a way to check |
| 415 | * if other CPUs have VMX enabled. So we will call it only if the |
| 416 | * CPU we are running on has VMX enabled. |
| 417 | * |
| 418 | * We will miss cases where VMX is not enabled on all CPUs. This |
| 419 | * shouldn't do much harm because KVM always enable VMX on all |
| 420 | * CPUs anyway. But we can miss it on the small window where KVM |
| 421 | * is still enabling VMX. |
| 422 | */ |
| 423 | if (cpu_has_vmx() && cpu_vmx_enabled()) { |
| 424 | /* Disable VMX on this CPU. |
| 425 | */ |
| 426 | cpu_vmxoff(); |
| 427 | |
| 428 | /* Halt and disable VMX on the other CPUs */ |
| 429 | nmi_shootdown_cpus(vmxoff_nmi); |
| 430 | |
| 431 | } |
| 432 | } |
| 433 | |
| 434 | |
/*
 * Board specific reboot fixups.  This weak default does nothing; a
 * non-weak definition elsewhere replaces it at link time.
 */
void __attribute__((weak)) mach_reboot_fixups(void)
{
}
| 438 | |
Jody Belka | 416e2d6 | 2008-02-12 23:37:48 +0000 | [diff] [blame] | 439 | static void native_machine_emergency_restart(void) |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 440 | { |
| 441 | int i; |
| 442 | |
Eduardo Habkost | d176720 | 2008-11-17 19:03:24 -0200 | [diff] [blame] | 443 | if (reboot_emergency) |
| 444 | emergency_vmx_disable_all(); |
| 445 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 446 | /* Tell the BIOS if we want cold or warm reboot */ |
| 447 | *((unsigned short *)__va(0x472)) = reboot_mode; |
| 448 | |
| 449 | for (;;) { |
| 450 | /* Could also try the reset bit in the Hammer NB */ |
| 451 | switch (reboot_type) { |
| 452 | case BOOT_KBD: |
Ingo Molnar | 7432d14 | 2008-03-06 18:29:43 +0100 | [diff] [blame] | 453 | mach_reboot_fixups(); /* for board specific fixups */ |
| 454 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 455 | for (i = 0; i < 10; i++) { |
| 456 | kb_wait(); |
| 457 | udelay(50); |
| 458 | outb(0xfe, 0x64); /* pulse reset low */ |
| 459 | udelay(50); |
| 460 | } |
| 461 | |
| 462 | case BOOT_TRIPLE: |
Jan Beulich | ebdd561 | 2008-05-12 15:43:38 +0200 | [diff] [blame] | 463 | load_idt(&no_idt); |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 464 | __asm__ __volatile__("int3"); |
| 465 | |
| 466 | reboot_type = BOOT_KBD; |
| 467 | break; |
| 468 | |
| 469 | #ifdef CONFIG_X86_32 |
| 470 | case BOOT_BIOS: |
| 471 | machine_real_restart(jump_to_bios, sizeof(jump_to_bios)); |
| 472 | |
| 473 | reboot_type = BOOT_KBD; |
| 474 | break; |
| 475 | #endif |
| 476 | |
| 477 | case BOOT_ACPI: |
| 478 | acpi_reboot(); |
| 479 | reboot_type = BOOT_KBD; |
| 480 | break; |
| 481 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 482 | case BOOT_EFI: |
| 483 | if (efi_enabled) |
H. Peter Anvin | 14d7ca5 | 2008-11-11 16:19:48 -0800 | [diff] [blame] | 484 | efi.reset_system(reboot_mode ? |
| 485 | EFI_RESET_WARM : |
| 486 | EFI_RESET_COLD, |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 487 | EFI_SUCCESS, 0, NULL); |
H. Peter Anvin | b47b928 | 2008-11-24 00:50:09 -0800 | [diff] [blame] | 488 | reboot_type = BOOT_KBD; |
H. Peter Anvin | 14d7ca5 | 2008-11-11 16:19:48 -0800 | [diff] [blame] | 489 | break; |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 490 | |
H. Peter Anvin | 14d7ca5 | 2008-11-11 16:19:48 -0800 | [diff] [blame] | 491 | case BOOT_CF9: |
| 492 | port_cf9_safe = true; |
| 493 | /* fall through */ |
| 494 | |
| 495 | case BOOT_CF9_COND: |
| 496 | if (port_cf9_safe) { |
| 497 | u8 cf9 = inb(0xcf9) & ~6; |
| 498 | outb(cf9|2, 0xcf9); /* Request hard reset */ |
| 499 | udelay(50); |
| 500 | outb(cf9|6, 0xcf9); /* Actually do the reset */ |
| 501 | udelay(50); |
| 502 | } |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 503 | reboot_type = BOOT_KBD; |
| 504 | break; |
| 505 | } |
| 506 | } |
| 507 | } |
| 508 | |
/*
 * Stop the cpus and apics: on SMP, move to the CPU we want to reboot
 * on and stop all the others, then shut down the local APIC and,
 * depending on the configuration, the IO-APIC, the HPET and (64-bit
 * only) the PCI IOMMU.
 */
void native_machine_shutdown(void)
{
#ifdef CONFIG_SMP

	/* The boot cpu is always logical cpu 0 */
	int target_cpu = 0;

#ifdef CONFIG_X86_32
	/* Honour a command line override if it names an online cpu */
	if ((reboot_cpu != -1) && (reboot_cpu < nr_cpu_ids) &&
	    cpu_online(reboot_cpu))
		target_cpu = reboot_cpu;
#endif

	/* Fall back to the current cpu if the chosen one is not online */
	if (!cpu_online(target_cpu))
		target_cpu = smp_processor_id();

	/* Make certain I only run on the appropriate processor */
	set_cpus_allowed_ptr(current, cpumask_of(target_cpu));

	/*
	 * O.K. Now that I'm on the appropriate processor,
	 * stop all of the others.
	 */
	smp_send_stop();
#endif

	lapic_shutdown();

#ifdef CONFIG_X86_IO_APIC
	disable_IO_APIC();
#endif

#ifdef CONFIG_HPET_TIMER
	hpet_disable();
#endif

#ifdef CONFIG_X86_64
	pci_iommu_shutdown();
#endif
}
| 551 | |
Eduardo Habkost | d176720 | 2008-11-17 19:03:24 -0200 | [diff] [blame] | 552 | static void __machine_emergency_restart(int emergency) |
| 553 | { |
| 554 | reboot_emergency = emergency; |
| 555 | machine_ops.emergency_restart(); |
| 556 | } |
| 557 | |
Jody Belka | 416e2d6 | 2008-02-12 23:37:48 +0000 | [diff] [blame] | 558 | static void native_machine_restart(char *__unused) |
Jeremy Fitzhardinge | 973efae | 2007-05-02 19:27:06 +0200 | [diff] [blame] | 559 | { |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 560 | printk("machine restart\n"); |
Jeremy Fitzhardinge | 973efae | 2007-05-02 19:27:06 +0200 | [diff] [blame] | 561 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 562 | if (!reboot_force) |
Eric W. Biederman | 6e3fbee | 2006-01-11 22:43:12 +0100 | [diff] [blame] | 563 | machine_shutdown(); |
Eduardo Habkost | d176720 | 2008-11-17 19:03:24 -0200 | [diff] [blame] | 564 | __machine_emergency_restart(0); |
Jeremy Fitzhardinge | 07f3331 | 2007-05-02 19:27:11 +0200 | [diff] [blame] | 565 | } |
| 566 | |
Jody Belka | 416e2d6 | 2008-02-12 23:37:48 +0000 | [diff] [blame] | 567 | static void native_machine_halt(void) |
Jeremy Fitzhardinge | 07f3331 | 2007-05-02 19:27:11 +0200 | [diff] [blame] | 568 | { |
Ivan Vecera | d3ec5ca | 2008-11-11 14:33:44 +0100 | [diff] [blame] | 569 | /* stop other cpus and apics */ |
| 570 | machine_shutdown(); |
| 571 | |
| 572 | /* stop this cpu */ |
| 573 | stop_this_cpu(NULL); |
Jeremy Fitzhardinge | 07f3331 | 2007-05-02 19:27:11 +0200 | [diff] [blame] | 574 | } |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 575 | |
Jody Belka | 416e2d6 | 2008-02-12 23:37:48 +0000 | [diff] [blame] | 576 | static void native_machine_power_off(void) |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 577 | { |
| 578 | if (pm_power_off) { |
| 579 | if (!reboot_force) |
| 580 | machine_shutdown(); |
| 581 | pm_power_off(); |
| 582 | } |
| 583 | } |
| 584 | |
| 585 | struct machine_ops machine_ops = { |
Jody Belka | 416e2d6 | 2008-02-12 23:37:48 +0000 | [diff] [blame] | 586 | .power_off = native_machine_power_off, |
| 587 | .shutdown = native_machine_shutdown, |
| 588 | .emergency_restart = native_machine_emergency_restart, |
| 589 | .restart = native_machine_restart, |
Glauber Costa | ed23dc6 | 2008-03-17 16:08:38 -0300 | [diff] [blame] | 590 | .halt = native_machine_halt, |
| 591 | #ifdef CONFIG_KEXEC |
| 592 | .crash_shutdown = native_machine_crash_shutdown, |
| 593 | #endif |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 594 | }; |
Jody Belka | 416e2d6 | 2008-02-12 23:37:48 +0000 | [diff] [blame] | 595 | |
| 596 | void machine_power_off(void) |
| 597 | { |
| 598 | machine_ops.power_off(); |
| 599 | } |
| 600 | |
| 601 | void machine_shutdown(void) |
| 602 | { |
| 603 | machine_ops.shutdown(); |
| 604 | } |
| 605 | |
/* Restart the machine with the emergency flag set. */
void machine_emergency_restart(void)
{
	__machine_emergency_restart(1);
}
| 610 | |
| 611 | void machine_restart(char *cmd) |
| 612 | { |
| 613 | machine_ops.restart(cmd); |
| 614 | } |
| 615 | |
| 616 | void machine_halt(void) |
| 617 | { |
| 618 | machine_ops.halt(); |
| 619 | } |
| 620 | |
#ifdef CONFIG_KEXEC
/* Run the crash_shutdown hook in machine_ops with the given registers. */
void machine_crash_shutdown(struct pt_regs *regs)
{
	machine_ops.crash_shutdown(regs);
}
#endif
Eduardo Habkost | 2ddded2 | 2008-11-12 11:34:42 -0200 | [diff] [blame] | 627 | |
| 628 | |
Eduardo Habkost | bb8dd27 | 2008-11-12 11:34:43 -0200 | [diff] [blame] | 629 | #if defined(CONFIG_SMP) |
Eduardo Habkost | 2ddded2 | 2008-11-12 11:34:42 -0200 | [diff] [blame] | 630 | |
| 631 | /* This keeps a track of which one is crashing cpu. */ |
| 632 | static int crashing_cpu; |
| 633 | static nmi_shootdown_cb shootdown_callback; |
| 634 | |
| 635 | static atomic_t waiting_for_crash_ipi; |
| 636 | |
| 637 | static int crash_nmi_callback(struct notifier_block *self, |
| 638 | unsigned long val, void *data) |
| 639 | { |
| 640 | int cpu; |
| 641 | |
| 642 | if (val != DIE_NMI_IPI) |
| 643 | return NOTIFY_OK; |
| 644 | |
| 645 | cpu = raw_smp_processor_id(); |
| 646 | |
| 647 | /* Don't do anything if this handler is invoked on crashing cpu. |
| 648 | * Otherwise, system will completely hang. Crashing cpu can get |
| 649 | * an NMI if system was initially booted with nmi_watchdog parameter. |
| 650 | */ |
| 651 | if (cpu == crashing_cpu) |
| 652 | return NOTIFY_STOP; |
| 653 | local_irq_disable(); |
| 654 | |
| 655 | shootdown_callback(cpu, (struct die_args *)data); |
| 656 | |
| 657 | atomic_dec(&waiting_for_crash_ipi); |
| 658 | /* Assume hlt works */ |
| 659 | halt(); |
| 660 | for (;;) |
| 661 | cpu_relax(); |
| 662 | |
| 663 | return 1; |
| 664 | } |
| 665 | |
| 666 | static void smp_send_nmi_allbutself(void) |
| 667 | { |
Ingo Molnar | dac5f41 | 2009-01-28 15:42:24 +0100 | [diff] [blame] | 668 | apic->send_IPI_allbutself(NMI_VECTOR); |
Eduardo Habkost | 2ddded2 | 2008-11-12 11:34:42 -0200 | [diff] [blame] | 669 | } |
| 670 | |
| 671 | static struct notifier_block crash_nmi_nb = { |
| 672 | .notifier_call = crash_nmi_callback, |
| 673 | }; |
| 674 | |
Eduardo Habkost | bb8dd27 | 2008-11-12 11:34:43 -0200 | [diff] [blame] | 675 | /* Halt all other CPUs, calling the specified function on each of them |
| 676 | * |
| 677 | * This function can be used to halt all other CPUs on crash |
| 678 | * or emergency reboot time. The function passed as parameter |
| 679 | * will be called inside a NMI handler on all CPUs. |
| 680 | */ |
Eduardo Habkost | 2ddded2 | 2008-11-12 11:34:42 -0200 | [diff] [blame] | 681 | void nmi_shootdown_cpus(nmi_shootdown_cb callback) |
| 682 | { |
| 683 | unsigned long msecs; |
Eduardo Habkost | c415b3d | 2008-11-12 11:34:44 -0200 | [diff] [blame] | 684 | local_irq_disable(); |
Eduardo Habkost | 2ddded2 | 2008-11-12 11:34:42 -0200 | [diff] [blame] | 685 | |
| 686 | /* Make a note of crashing cpu. Will be used in NMI callback.*/ |
| 687 | crashing_cpu = safe_smp_processor_id(); |
| 688 | |
| 689 | shootdown_callback = callback; |
| 690 | |
| 691 | atomic_set(&waiting_for_crash_ipi, num_online_cpus() - 1); |
| 692 | /* Would it be better to replace the trap vector here? */ |
| 693 | if (register_die_notifier(&crash_nmi_nb)) |
| 694 | return; /* return what? */ |
| 695 | /* Ensure the new callback function is set before sending |
| 696 | * out the NMI |
| 697 | */ |
| 698 | wmb(); |
| 699 | |
| 700 | smp_send_nmi_allbutself(); |
| 701 | |
| 702 | msecs = 1000; /* Wait at most a second for the other cpus to stop */ |
| 703 | while ((atomic_read(&waiting_for_crash_ipi) > 0) && msecs) { |
| 704 | mdelay(1); |
| 705 | msecs--; |
| 706 | } |
| 707 | |
| 708 | /* Leave the nmi callback set */ |
| 709 | } |
Eduardo Habkost | bb8dd27 | 2008-11-12 11:34:43 -0200 | [diff] [blame] | 710 | #else /* !CONFIG_SMP */ |
| 711 | void nmi_shootdown_cpus(nmi_shootdown_cb callback) |
| 712 | { |
| 713 | /* No other CPUs to shoot down */ |
| 714 | } |
Eduardo Habkost | 2ddded2 | 2008-11-12 11:34:42 -0200 | [diff] [blame] | 715 | #endif |