Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | #include <linux/module.h> |
Adrian Bunk | cd6ed52 | 2006-12-06 20:40:06 -0800 | [diff] [blame] | 2 | #include <linux/reboot.h> |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 3 | #include <linux/init.h> |
| 4 | #include <linux/pm.h> |
| 5 | #include <linux/efi.h> |
| 6 | #include <acpi/reboot.h> |
| 7 | #include <asm/io.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 8 | #include <asm/apic.h> |
Zachary Amsden | 4d37e7e | 2005-09-03 15:56:38 -0700 | [diff] [blame] | 9 | #include <asm/desc.h> |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 10 | #include <asm/hpet.h> |
Jeremy Fitzhardinge | 68db065 | 2008-03-17 16:37:13 -0700 | [diff] [blame] | 11 | #include <asm/pgtable.h> |
Dmitri Vorobiev | 4412620 | 2008-04-28 03:15:59 +0400 | [diff] [blame] | 12 | #include <asm/proto.h> |
Jeremy Fitzhardinge | 973efae | 2007-05-02 19:27:06 +0200 | [diff] [blame] | 13 | #include <asm/reboot_fixups.h> |
Jeremy Fitzhardinge | 07f3331 | 2007-05-02 19:27:11 +0200 | [diff] [blame] | 14 | #include <asm/reboot.h> |
Eduardo Habkost | d176720 | 2008-11-17 19:03:24 -0200 | [diff] [blame] | 15 | #include <asm/virtext.h> |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 16 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 17 | #ifdef CONFIG_X86_32 |
| 18 | # include <linux/dmi.h> |
| 19 | # include <linux/ctype.h> |
| 20 | # include <linux/mc146818rtc.h> |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 21 | #else |
| 22 | # include <asm/iommu.h> |
| 23 | #endif |
| 24 | |
Eduardo Habkost | 2ddded2 | 2008-11-12 11:34:42 -0200 | [diff] [blame] | 25 | #include <mach_ipi.h> |
| 26 | |
| 27 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 28 | /* |
| 29 | * Power off function, if any |
| 30 | */ |
| 31 | void (*pm_power_off)(void); |
Alexey Dobriyan | 129f694 | 2005-06-23 00:08:33 -0700 | [diff] [blame] | 32 | EXPORT_SYMBOL(pm_power_off); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 33 | |
Jan Beulich | ebdd561 | 2008-05-12 15:43:38 +0200 | [diff] [blame] | 34 | static const struct desc_ptr no_idt = {}; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 35 | static int reboot_mode; |
Eduardo Habkost | 8d00450 | 2008-11-04 12:52:44 -0200 | [diff] [blame] | 36 | enum reboot_type reboot_type = BOOT_KBD; |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 37 | int reboot_force; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 38 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 39 | #if defined(CONFIG_X86_32) && defined(CONFIG_SMP) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 40 | static int reboot_cpu = -1; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 41 | #endif |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 42 | |
Eduardo Habkost | d176720 | 2008-11-17 19:03:24 -0200 | [diff] [blame] | 43 | /* This is set if we need to go through the 'emergency' path. |
| 44 | * When machine_emergency_restart() is called, we may be on |
| 45 | * an inconsistent state and won't be able to do a clean cleanup |
| 46 | */ |
| 47 | static int reboot_emergency; |
| 48 | |
H. Peter Anvin | 14d7ca5 | 2008-11-11 16:19:48 -0800 | [diff] [blame] | 49 | /* This is set by the PCI code if either type 1 or type 2 PCI is detected */ |
| 50 | bool port_cf9_safe = false; |
| 51 | |
| 52 | /* reboot=b[ios] | s[mp] | t[riple] | k[bd] | e[fi] [, [w]arm | [c]old] | p[ci] |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 53 | warm Don't set the cold reboot flag |
| 54 | cold Set the cold reboot flag |
| 55 | bios Reboot by jumping through the BIOS (only for X86_32) |
| 56 | smp Reboot by executing reset on BSP or other CPU (only for X86_32) |
| 57 | triple Force a triple fault (init) |
| 58 | kbd Use the keyboard controller. cold reset (default) |
| 59 | acpi Use the RESET_REG in the FADT |
| 60 | efi Use efi reset_system runtime service |
H. Peter Anvin | 14d7ca5 | 2008-11-11 16:19:48 -0800 | [diff] [blame] | 61 | pci Use the so-called "PCI reset register", CF9 |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 62 | force Avoid anything that could hang. |
| 63 | */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 64 | static int __init reboot_setup(char *str) |
| 65 | { |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 66 | for (;;) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 67 | switch (*str) { |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 68 | case 'w': |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 69 | reboot_mode = 0x1234; |
| 70 | break; |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 71 | |
| 72 | case 'c': |
| 73 | reboot_mode = 0; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 74 | break; |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 75 | |
| 76 | #ifdef CONFIG_X86_32 |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 77 | #ifdef CONFIG_SMP |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 78 | case 's': |
Tobias Klauser | 6f673d8 | 2005-09-13 01:25:48 -0700 | [diff] [blame] | 79 | if (isdigit(*(str+1))) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 80 | reboot_cpu = (int) (*(str+1) - '0'); |
Tobias Klauser | 6f673d8 | 2005-09-13 01:25:48 -0700 | [diff] [blame] | 81 | if (isdigit(*(str+2))) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 82 | reboot_cpu = reboot_cpu*10 + (int)(*(str+2) - '0'); |
| 83 | } |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 84 | /* we will leave sorting out the final value |
| 85 | when we are ready to reboot, since we might not |
| 86 | have set up boot_cpu_id or smp_num_cpu */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 87 | break; |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 88 | #endif /* CONFIG_SMP */ |
| 89 | |
| 90 | case 'b': |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 91 | #endif |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 92 | case 'a': |
| 93 | case 'k': |
| 94 | case 't': |
| 95 | case 'e': |
H. Peter Anvin | 14d7ca5 | 2008-11-11 16:19:48 -0800 | [diff] [blame] | 96 | case 'p': |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 97 | reboot_type = *str; |
| 98 | break; |
| 99 | |
| 100 | case 'f': |
| 101 | reboot_force = 1; |
| 102 | break; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 103 | } |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 104 | |
| 105 | str = strchr(str, ','); |
| 106 | if (str) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 107 | str++; |
| 108 | else |
| 109 | break; |
| 110 | } |
| 111 | return 1; |
| 112 | } |
| 113 | |
| 114 | __setup("reboot=", reboot_setup); |
| 115 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 116 | |
| 117 | #ifdef CONFIG_X86_32 |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 118 | /* |
| 119 | * Reboot options and system auto-detection code provided by |
| 120 | * Dell Inc. so their systems "just work". :-) |
| 121 | */ |
| 122 | |
| 123 | /* |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 124 | * Some machines require the "reboot=b" commandline option, |
| 125 | * this quirk makes that automatic. |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 126 | */ |
Jeff Garzik | 1855256 | 2007-10-03 15:15:40 -0400 | [diff] [blame] | 127 | static int __init set_bios_reboot(const struct dmi_system_id *d) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 128 | { |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 129 | if (reboot_type != BOOT_BIOS) { |
| 130 | reboot_type = BOOT_BIOS; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 131 | printk(KERN_INFO "%s series board detected. Selecting BIOS-method for reboots.\n", d->ident); |
| 132 | } |
| 133 | return 0; |
| 134 | } |
| 135 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 136 | static struct dmi_system_id __initdata reboot_dmi_table[] = { |
Tim Gardner | b9e82af | 2007-06-01 00:46:40 -0700 | [diff] [blame] | 137 | { /* Handle problems with rebooting on Dell E520's */ |
| 138 | .callback = set_bios_reboot, |
| 139 | .ident = "Dell E520", |
| 140 | .matches = { |
| 141 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 142 | DMI_MATCH(DMI_PRODUCT_NAME, "Dell DM061"), |
| 143 | }, |
| 144 | }, |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 145 | { /* Handle problems with rebooting on Dell 1300's */ |
Eric W. Biederman | dd2a130 | 2005-06-25 14:57:55 -0700 | [diff] [blame] | 146 | .callback = set_bios_reboot, |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 147 | .ident = "Dell PowerEdge 1300", |
| 148 | .matches = { |
| 149 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Computer Corporation"), |
| 150 | DMI_MATCH(DMI_PRODUCT_NAME, "PowerEdge 1300/"), |
| 151 | }, |
| 152 | }, |
| 153 | { /* Handle problems with rebooting on Dell 300's */ |
| 154 | .callback = set_bios_reboot, |
| 155 | .ident = "Dell PowerEdge 300", |
| 156 | .matches = { |
| 157 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Computer Corporation"), |
| 158 | DMI_MATCH(DMI_PRODUCT_NAME, "PowerEdge 300/"), |
| 159 | }, |
| 160 | }, |
James Jarvis | df2edcf | 2007-07-21 17:11:11 +0200 | [diff] [blame] | 161 | { /* Handle problems with rebooting on Dell Optiplex 745's SFF*/ |
| 162 | .callback = set_bios_reboot, |
| 163 | .ident = "Dell OptiPlex 745", |
| 164 | .matches = { |
| 165 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 166 | DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 745"), |
James Jarvis | df2edcf | 2007-07-21 17:11:11 +0200 | [diff] [blame] | 167 | }, |
| 168 | }, |
Coleman Kane | fc115bf | 2008-03-04 15:05:41 -0800 | [diff] [blame] | 169 | { /* Handle problems with rebooting on Dell Optiplex 745's DFF*/ |
| 170 | .callback = set_bios_reboot, |
| 171 | .ident = "Dell OptiPlex 745", |
| 172 | .matches = { |
| 173 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 174 | DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 745"), |
| 175 | DMI_MATCH(DMI_BOARD_NAME, "0MM599"), |
| 176 | }, |
| 177 | }, |
Heinz-Ado Arnolds | fc1c892 | 2008-03-12 16:27:56 +0100 | [diff] [blame] | 178 | { /* Handle problems with rebooting on Dell Optiplex 745 with 0KW626 */ |
| 179 | .callback = set_bios_reboot, |
| 180 | .ident = "Dell OptiPlex 745", |
| 181 | .matches = { |
| 182 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 183 | DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 745"), |
| 184 | DMI_MATCH(DMI_BOARD_NAME, "0KW626"), |
| 185 | }, |
| 186 | }, |
Steve Conklin | 093bac1 | 2008-11-14 00:55:51 -0600 | [diff] [blame] | 187 | { /* Handle problems with rebooting on Dell Optiplex 330 with 0KP561 */ |
| 188 | .callback = set_bios_reboot, |
| 189 | .ident = "Dell OptiPlex 330", |
| 190 | .matches = { |
| 191 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 192 | DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 330"), |
| 193 | DMI_MATCH(DMI_BOARD_NAME, "0KP561"), |
| 194 | }, |
| 195 | }, |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 196 | { /* Handle problems with rebooting on Dell 2400's */ |
| 197 | .callback = set_bios_reboot, |
| 198 | .ident = "Dell PowerEdge 2400", |
| 199 | .matches = { |
| 200 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Computer Corporation"), |
| 201 | DMI_MATCH(DMI_PRODUCT_NAME, "PowerEdge 2400"), |
| 202 | }, |
| 203 | }, |
Ingo Molnar | fab3b58 | 2008-07-17 13:50:15 +0200 | [diff] [blame] | 204 | { /* Handle problems with rebooting on Dell T5400's */ |
| 205 | .callback = set_bios_reboot, |
| 206 | .ident = "Dell Precision T5400", |
| 207 | .matches = { |
| 208 | DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."), |
| 209 | DMI_MATCH(DMI_PRODUCT_NAME, "Precision WorkStation T5400"), |
| 210 | }, |
| 211 | }, |
Ben Collins | 766c3f9 | 2006-01-06 00:12:20 -0800 | [diff] [blame] | 212 | { /* Handle problems with rebooting on HP laptops */ |
Thierry Vignaud | d91b14c | 2005-11-29 19:34:35 -0800 | [diff] [blame] | 213 | .callback = set_bios_reboot, |
Ben Collins | 766c3f9 | 2006-01-06 00:12:20 -0800 | [diff] [blame] | 214 | .ident = "HP Compaq Laptop", |
Thierry Vignaud | d91b14c | 2005-11-29 19:34:35 -0800 | [diff] [blame] | 215 | .matches = { |
| 216 | DMI_MATCH(DMI_SYS_VENDOR, "Hewlett-Packard"), |
Ben Collins | 766c3f9 | 2006-01-06 00:12:20 -0800 | [diff] [blame] | 217 | DMI_MATCH(DMI_PRODUCT_NAME, "HP Compaq"), |
Thierry Vignaud | d91b14c | 2005-11-29 19:34:35 -0800 | [diff] [blame] | 218 | }, |
| 219 | }, |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 220 | { } |
| 221 | }; |
| 222 | |
| 223 | static int __init reboot_init(void) |
| 224 | { |
| 225 | dmi_check_system(reboot_dmi_table); |
| 226 | return 0; |
| 227 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 228 | core_initcall(reboot_init); |
| 229 | |
/*
 * The code and data below reboot the machine by switching to real mode
 * and jumping to the BIOS reset entry point, as if the CPU had really
 * been reset.  The previous version asked the keyboard controller to
 * pulse the CPU reset line, which is more thorough, but doesn't work
 * with at least one type of 486 motherboard.  It is easy to stop this
 * code working; hence the copious comments.
 */
static const unsigned long long real_mode_gdt_entries[3] = {
	0x0000000000000000ULL,	/* Null descriptor */
	0x00009b000000ffffULL,	/* 16-bit real-mode 64k code at 0x00000000 */
	0x000093000100ffffULL	/* 16-bit real-mode 64k data at 0x00000100 */
};
| 243 | |
Jan Beulich | ebdd561 | 2008-05-12 15:43:38 +0200 | [diff] [blame] | 244 | static const struct desc_ptr |
Rusty Russell | 05f4a3e | 2006-09-25 23:32:22 -0700 | [diff] [blame] | 245 | real_mode_gdt = { sizeof (real_mode_gdt_entries) - 1, (long)real_mode_gdt_entries }, |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 246 | real_mode_idt = { 0x3ff, 0 }; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 247 | |
/*
 * 16-bit protected mode code that disables paging and the cache,
 * switches to real mode and is followed by the jump to the BIOS reset
 * code.
 *
 * The instruction that switches to real mode by writing to CR0 must be
 * followed immediately by a far jump instruction, which sets CS to a
 * valid value for real mode and flushes the prefetch queue, so that no
 * instruction already decoded in protected mode gets executed.
 *
 * The sequence clears all CR0 flags except ET, notably PG (paging), PE
 * (protected-mode enable) and TS (task switch for coprocessor state
 * save).  It flushes the TLB after paging has been disabled, sets CD
 * and NW to disable the cache on a 486, and invalidates the cache.
 * This is more like the state of a 486 after reset; it is not known
 * whether something else should be done for other chips.
 *
 * More could be done here to set up the registers as if a CPU reset
 * had occurred; hopefully real BIOSs don't assume much.
 */
static const unsigned char real_mode_switch[] = {
	0x66, 0x0f, 0x20, 0xc0,				/*    movl  %cr0,%eax        */
	0x66, 0x83, 0xe0, 0x11,				/*    andl  $0x00000011,%eax */
	0x66, 0x0d, 0x00, 0x00, 0x00, 0x60,		/*    orl   $0x60000000,%eax */
	0x66, 0x0f, 0x22, 0xc0,				/*    movl  %eax,%cr0        */
	0x66, 0x0f, 0x22, 0xd8,				/*    movl  %eax,%cr3        */
	0x66, 0x0f, 0x20, 0xc3,				/*    movl  %cr0,%ebx        */
	0x66, 0x81, 0xe3, 0x00, 0x00, 0x00, 0x60,	/*    andl  $0x60000000,%ebx */
	0x74, 0x02,					/*    jz    f                */
	0x0f, 0x09,					/*    wbinvd                 */
	0x24, 0x10,					/* f: andb  $0x10,al         */
	0x66, 0x0f, 0x22, 0xc0				/*    movl  %eax,%cr0        */
};

/* Far jump to the BIOS reset entry point, executed after the switch above */
static const unsigned char jump_to_bios[] = {
	0xea, 0x00, 0x00, 0xff, 0xff			/*    ljmp  $0xffff,$0x0000  */
};
| 284 | |
| 285 | /* |
| 286 | * Switch to real mode and then execute the code |
| 287 | * specified by the code and length parameters. |
| 288 | * We assume that length will aways be less that 100! |
| 289 | */ |
Jan Beulich | ebdd561 | 2008-05-12 15:43:38 +0200 | [diff] [blame] | 290 | void machine_real_restart(const unsigned char *code, int length) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 291 | { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 292 | local_irq_disable(); |
| 293 | |
| 294 | /* Write zero to CMOS register number 0x0f, which the BIOS POST |
| 295 | routine will recognize as telling it to do a proper reboot. (Well |
| 296 | that's what this book in front of me says -- it may only apply to |
| 297 | the Phoenix BIOS though, it's not clear). At the same time, |
| 298 | disable NMIs by setting the top bit in the CMOS address register, |
| 299 | as we're about to do peculiar things to the CPU. I'm not sure if |
| 300 | `outb_p' is needed instead of just `outb'. Use it to be on the |
| 301 | safe side. (Yes, CMOS_WRITE does outb_p's. - Paul G.) |
| 302 | */ |
Hisashi Hifumi | 62dbc21 | 2007-05-02 19:27:18 +0200 | [diff] [blame] | 303 | spin_lock(&rtc_lock); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 304 | CMOS_WRITE(0x00, 0x8f); |
Hisashi Hifumi | 62dbc21 | 2007-05-02 19:27:18 +0200 | [diff] [blame] | 305 | spin_unlock(&rtc_lock); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 306 | |
| 307 | /* Remap the kernel at virtual address zero, as well as offset zero |
| 308 | from the kernel segment. This assumes the kernel segment starts at |
| 309 | virtual address PAGE_OFFSET. */ |
Jeremy Fitzhardinge | 68db065 | 2008-03-17 16:37:13 -0700 | [diff] [blame] | 310 | memcpy(swapper_pg_dir, swapper_pg_dir + KERNEL_PGD_BOUNDARY, |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 311 | sizeof(swapper_pg_dir [0]) * KERNEL_PGD_PTRS); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 312 | |
| 313 | /* |
| 314 | * Use `swapper_pg_dir' as our page directory. |
| 315 | */ |
| 316 | load_cr3(swapper_pg_dir); |
| 317 | |
| 318 | /* Write 0x1234 to absolute memory location 0x472. The BIOS reads |
| 319 | this on booting to tell it to "Bypass memory test (also warm |
| 320 | boot)". This seems like a fairly standard thing that gets set by |
| 321 | REBOOT.COM programs, and the previous reset routine did this |
| 322 | too. */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 323 | *((unsigned short *)0x472) = reboot_mode; |
| 324 | |
| 325 | /* For the switch to real mode, copy some code to low memory. It has |
| 326 | to be in the first 64k because it is running in 16-bit mode, and it |
| 327 | has to have the same physical and virtual address, because it turns |
| 328 | off paging. Copy it near the end of the first page, out of the way |
| 329 | of BIOS variables. */ |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 330 | memcpy((void *)(0x1000 - sizeof(real_mode_switch) - 100), |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 331 | real_mode_switch, sizeof (real_mode_switch)); |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 332 | memcpy((void *)(0x1000 - 100), code, length); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 333 | |
| 334 | /* Set up the IDT for real mode. */ |
Zachary Amsden | 4d37e7e | 2005-09-03 15:56:38 -0700 | [diff] [blame] | 335 | load_idt(&real_mode_idt); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 336 | |
| 337 | /* Set up a GDT from which we can load segment descriptors for real |
| 338 | mode. The GDT is not used in real mode; it is just needed here to |
| 339 | prepare the descriptors. */ |
Zachary Amsden | 4d37e7e | 2005-09-03 15:56:38 -0700 | [diff] [blame] | 340 | load_gdt(&real_mode_gdt); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 341 | |
| 342 | /* Load the data segment registers, and thus the descriptors ready for |
| 343 | real mode. The base address of each segment is 0x100, 16 times the |
| 344 | selector value being loaded here. This is so that the segment |
| 345 | registers don't have to be reloaded after switching to real mode: |
| 346 | the values are consistent for real mode operation already. */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 347 | __asm__ __volatile__ ("movl $0x0010,%%eax\n" |
| 348 | "\tmovl %%eax,%%ds\n" |
| 349 | "\tmovl %%eax,%%es\n" |
| 350 | "\tmovl %%eax,%%fs\n" |
| 351 | "\tmovl %%eax,%%gs\n" |
| 352 | "\tmovl %%eax,%%ss" : : : "eax"); |
| 353 | |
| 354 | /* Jump to the 16-bit code that we copied earlier. It disables paging |
| 355 | and the cache, switches to real mode, and jumps to the BIOS reset |
| 356 | entry point. */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 357 | __asm__ __volatile__ ("ljmp $0x0008,%0" |
| 358 | : |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 359 | : "i" ((void *)(0x1000 - sizeof (real_mode_switch) - 100))); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 360 | } |
Alexey Dobriyan | 129f694 | 2005-06-23 00:08:33 -0700 | [diff] [blame] | 361 | #ifdef CONFIG_APM_MODULE |
| 362 | EXPORT_SYMBOL(machine_real_restart); |
| 363 | #endif |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 364 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 365 | #endif /* CONFIG_X86_32 */ |
| 366 | |
/*
 * Poll port 0x64 until bit 1 (mask 0x02) reads back clear, pausing 2us
 * between polls.  Gives up silently after 0x10000 polls.
 */
static inline void kb_wait(void)
{
	int polls_left = 0x10000;

	while (polls_left-- > 0) {
		if (!(inb(0x64) & 0x02))
			return;
		udelay(2);
	}
}
| 377 | |
/*
 * Callback handed to nmi_shootdown_cpus(): performs the emergency VMX
 * disable on the CPU it runs on.  Neither @cpu nor @args is used.
 */
static void vmxoff_nmi(int cpu, struct die_args *args)
{
	cpu_emergency_vmxoff();
}
| 382 | |
| 383 | /* Use NMIs as IPIs to tell all CPUs to disable virtualization |
| 384 | */ |
| 385 | static void emergency_vmx_disable_all(void) |
| 386 | { |
| 387 | /* Just make sure we won't change CPUs while doing this */ |
| 388 | local_irq_disable(); |
| 389 | |
| 390 | /* We need to disable VMX on all CPUs before rebooting, otherwise |
| 391 | * we risk hanging up the machine, because the CPU ignore INIT |
| 392 | * signals when VMX is enabled. |
| 393 | * |
| 394 | * We can't take any locks and we may be on an inconsistent |
| 395 | * state, so we use NMIs as IPIs to tell the other CPUs to disable |
| 396 | * VMX and halt. |
| 397 | * |
| 398 | * For safety, we will avoid running the nmi_shootdown_cpus() |
| 399 | * stuff unnecessarily, but we don't have a way to check |
| 400 | * if other CPUs have VMX enabled. So we will call it only if the |
| 401 | * CPU we are running on has VMX enabled. |
| 402 | * |
| 403 | * We will miss cases where VMX is not enabled on all CPUs. This |
| 404 | * shouldn't do much harm because KVM always enable VMX on all |
| 405 | * CPUs anyway. But we can miss it on the small window where KVM |
| 406 | * is still enabling VMX. |
| 407 | */ |
| 408 | if (cpu_has_vmx() && cpu_vmx_enabled()) { |
| 409 | /* Disable VMX on this CPU. |
| 410 | */ |
| 411 | cpu_vmxoff(); |
| 412 | |
| 413 | /* Halt and disable VMX on the other CPUs */ |
| 414 | nmi_shootdown_cpus(vmxoff_nmi); |
| 415 | |
| 416 | } |
| 417 | } |
| 418 | |
| 419 | |
/*
 * Weak, empty default for the board specific fixups that run before the
 * keyboard-controller reset.  Presumably a platform file can provide a
 * strong definition to replace it.
 */
void __attribute__((weak)) mach_reboot_fixups(void)
{
}
| 423 | |
Jody Belka | 416e2d6 | 2008-02-12 23:37:48 +0000 | [diff] [blame] | 424 | static void native_machine_emergency_restart(void) |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 425 | { |
| 426 | int i; |
| 427 | |
Eduardo Habkost | d176720 | 2008-11-17 19:03:24 -0200 | [diff] [blame] | 428 | if (reboot_emergency) |
| 429 | emergency_vmx_disable_all(); |
| 430 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 431 | /* Tell the BIOS if we want cold or warm reboot */ |
| 432 | *((unsigned short *)__va(0x472)) = reboot_mode; |
| 433 | |
| 434 | for (;;) { |
| 435 | /* Could also try the reset bit in the Hammer NB */ |
| 436 | switch (reboot_type) { |
| 437 | case BOOT_KBD: |
Ingo Molnar | 7432d14 | 2008-03-06 18:29:43 +0100 | [diff] [blame] | 438 | mach_reboot_fixups(); /* for board specific fixups */ |
| 439 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 440 | for (i = 0; i < 10; i++) { |
| 441 | kb_wait(); |
| 442 | udelay(50); |
| 443 | outb(0xfe, 0x64); /* pulse reset low */ |
| 444 | udelay(50); |
| 445 | } |
| 446 | |
| 447 | case BOOT_TRIPLE: |
Jan Beulich | ebdd561 | 2008-05-12 15:43:38 +0200 | [diff] [blame] | 448 | load_idt(&no_idt); |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 449 | __asm__ __volatile__("int3"); |
| 450 | |
| 451 | reboot_type = BOOT_KBD; |
| 452 | break; |
| 453 | |
| 454 | #ifdef CONFIG_X86_32 |
| 455 | case BOOT_BIOS: |
| 456 | machine_real_restart(jump_to_bios, sizeof(jump_to_bios)); |
| 457 | |
| 458 | reboot_type = BOOT_KBD; |
| 459 | break; |
| 460 | #endif |
| 461 | |
| 462 | case BOOT_ACPI: |
| 463 | acpi_reboot(); |
| 464 | reboot_type = BOOT_KBD; |
| 465 | break; |
| 466 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 467 | case BOOT_EFI: |
| 468 | if (efi_enabled) |
H. Peter Anvin | 14d7ca5 | 2008-11-11 16:19:48 -0800 | [diff] [blame] | 469 | efi.reset_system(reboot_mode ? |
| 470 | EFI_RESET_WARM : |
| 471 | EFI_RESET_COLD, |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 472 | EFI_SUCCESS, 0, NULL); |
H. Peter Anvin | b47b928 | 2008-11-24 00:50:09 -0800 | [diff] [blame] | 473 | reboot_type = BOOT_KBD; |
H. Peter Anvin | 14d7ca5 | 2008-11-11 16:19:48 -0800 | [diff] [blame] | 474 | break; |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 475 | |
H. Peter Anvin | 14d7ca5 | 2008-11-11 16:19:48 -0800 | [diff] [blame] | 476 | case BOOT_CF9: |
| 477 | port_cf9_safe = true; |
| 478 | /* fall through */ |
| 479 | |
| 480 | case BOOT_CF9_COND: |
| 481 | if (port_cf9_safe) { |
| 482 | u8 cf9 = inb(0xcf9) & ~6; |
| 483 | outb(cf9|2, 0xcf9); /* Request hard reset */ |
| 484 | udelay(50); |
| 485 | outb(cf9|6, 0xcf9); /* Actually do the reset */ |
| 486 | udelay(50); |
| 487 | } |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 488 | reboot_type = BOOT_KBD; |
| 489 | break; |
| 490 | } |
| 491 | } |
| 492 | } |
| 493 | |
/*
 * Quiesce the machine before a restart, halt or power-off: on SMP move
 * to the CPU chosen for the reboot and stop all the others, then call
 * the local APIC, IO-APIC, HPET and (on 64-bit) IOMMU shutdown hooks,
 * each only if configured in.
 */
void native_machine_shutdown(void)
{
	/* Stop the cpus and apics */
#ifdef CONFIG_SMP

	/* The boot cpu is always logical cpu 0 */
	int target_cpu = 0;

#ifdef CONFIG_X86_32
	/* Honour a command line override if it names a usable CPU */
	if ((reboot_cpu != -1) && (reboot_cpu < NR_CPUS) &&
	    cpu_online(reboot_cpu))
		target_cpu = reboot_cpu;
#endif

	/* Make certain the cpu I'm about to reboot on is online */
	if (!cpu_online(target_cpu))
		target_cpu = smp_processor_id();

	/* Make certain I only run on the appropriate processor */
	set_cpus_allowed_ptr(current, &cpumask_of_cpu(target_cpu));

	/*
	 * O.K. Now that I'm on the appropriate processor,
	 * stop all of the others.
	 */
	smp_send_stop();
#endif

	lapic_shutdown();

#ifdef CONFIG_X86_IO_APIC
	disable_IO_APIC();
#endif

#ifdef CONFIG_HPET_TIMER
	hpet_disable();
#endif

#ifdef CONFIG_X86_64
	pci_iommu_shutdown();
#endif
}
| 536 | |
Eduardo Habkost | d176720 | 2008-11-17 19:03:24 -0200 | [diff] [blame] | 537 | static void __machine_emergency_restart(int emergency) |
| 538 | { |
| 539 | reboot_emergency = emergency; |
| 540 | machine_ops.emergency_restart(); |
| 541 | } |
| 542 | |
Jody Belka | 416e2d6 | 2008-02-12 23:37:48 +0000 | [diff] [blame] | 543 | static void native_machine_restart(char *__unused) |
Jeremy Fitzhardinge | 973efae | 2007-05-02 19:27:06 +0200 | [diff] [blame] | 544 | { |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 545 | printk("machine restart\n"); |
Jeremy Fitzhardinge | 973efae | 2007-05-02 19:27:06 +0200 | [diff] [blame] | 546 | |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 547 | if (!reboot_force) |
Eric W. Biederman | 6e3fbee | 2006-01-11 22:43:12 +0100 | [diff] [blame] | 548 | machine_shutdown(); |
Eduardo Habkost | d176720 | 2008-11-17 19:03:24 -0200 | [diff] [blame] | 549 | __machine_emergency_restart(0); |
Jeremy Fitzhardinge | 07f3331 | 2007-05-02 19:27:11 +0200 | [diff] [blame] | 550 | } |
| 551 | |
Jody Belka | 416e2d6 | 2008-02-12 23:37:48 +0000 | [diff] [blame] | 552 | static void native_machine_halt(void) |
Jeremy Fitzhardinge | 07f3331 | 2007-05-02 19:27:11 +0200 | [diff] [blame] | 553 | { |
Ivan Vecera | d3ec5ca | 2008-11-11 14:33:44 +0100 | [diff] [blame] | 554 | /* stop other cpus and apics */ |
| 555 | machine_shutdown(); |
| 556 | |
| 557 | /* stop this cpu */ |
| 558 | stop_this_cpu(NULL); |
Jeremy Fitzhardinge | 07f3331 | 2007-05-02 19:27:11 +0200 | [diff] [blame] | 559 | } |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 560 | |
Jody Belka | 416e2d6 | 2008-02-12 23:37:48 +0000 | [diff] [blame] | 561 | static void native_machine_power_off(void) |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 562 | { |
| 563 | if (pm_power_off) { |
| 564 | if (!reboot_force) |
| 565 | machine_shutdown(); |
| 566 | pm_power_off(); |
| 567 | } |
| 568 | } |
| 569 | |
| 570 | struct machine_ops machine_ops = { |
Jody Belka | 416e2d6 | 2008-02-12 23:37:48 +0000 | [diff] [blame] | 571 | .power_off = native_machine_power_off, |
| 572 | .shutdown = native_machine_shutdown, |
| 573 | .emergency_restart = native_machine_emergency_restart, |
| 574 | .restart = native_machine_restart, |
Glauber Costa | ed23dc6 | 2008-03-17 16:08:38 -0300 | [diff] [blame] | 575 | .halt = native_machine_halt, |
| 576 | #ifdef CONFIG_KEXEC |
| 577 | .crash_shutdown = native_machine_crash_shutdown, |
| 578 | #endif |
Miguel Boton | 4d022e3 | 2008-01-30 13:32:51 +0100 | [diff] [blame] | 579 | }; |
Jody Belka | 416e2d6 | 2008-02-12 23:37:48 +0000 | [diff] [blame] | 580 | |
| 581 | void machine_power_off(void) |
| 582 | { |
| 583 | machine_ops.power_off(); |
| 584 | } |
| 585 | |
| 586 | void machine_shutdown(void) |
| 587 | { |
| 588 | machine_ops.shutdown(); |
| 589 | } |
| 590 | |
/*
 * Restart the machine with the emergency flag set, so that
 * reboot_emergency is 1 while the emergency_restart handler runs.
 */
void machine_emergency_restart(void)
{
	__machine_emergency_restart(1);
}
| 595 | |
| 596 | void machine_restart(char *cmd) |
| 597 | { |
| 598 | machine_ops.restart(cmd); |
| 599 | } |
| 600 | |
| 601 | void machine_halt(void) |
| 602 | { |
| 603 | machine_ops.halt(); |
| 604 | } |
| 605 | |
#ifdef CONFIG_KEXEC
/*
 * Run the crash shutdown handler installed in machine_ops.
 * @regs is passed to the handler unchanged.
 */
void machine_crash_shutdown(struct pt_regs *regs)
{
	machine_ops.crash_shutdown(regs);
}
#endif
Eduardo Habkost | 2ddded2 | 2008-11-12 11:34:42 -0200 | [diff] [blame] | 612 | |
| 613 | |
Eduardo Habkost | bb8dd27 | 2008-11-12 11:34:43 -0200 | [diff] [blame] | 614 | #if defined(CONFIG_SMP) |
Eduardo Habkost | 2ddded2 | 2008-11-12 11:34:42 -0200 | [diff] [blame] | 615 | |
| 616 | /* This keeps a track of which one is crashing cpu. */ |
| 617 | static int crashing_cpu; |
| 618 | static nmi_shootdown_cb shootdown_callback; |
| 619 | |
| 620 | static atomic_t waiting_for_crash_ipi; |
| 621 | |
| 622 | static int crash_nmi_callback(struct notifier_block *self, |
| 623 | unsigned long val, void *data) |
| 624 | { |
| 625 | int cpu; |
| 626 | |
| 627 | if (val != DIE_NMI_IPI) |
| 628 | return NOTIFY_OK; |
| 629 | |
| 630 | cpu = raw_smp_processor_id(); |
| 631 | |
| 632 | /* Don't do anything if this handler is invoked on crashing cpu. |
| 633 | * Otherwise, system will completely hang. Crashing cpu can get |
| 634 | * an NMI if system was initially booted with nmi_watchdog parameter. |
| 635 | */ |
| 636 | if (cpu == crashing_cpu) |
| 637 | return NOTIFY_STOP; |
| 638 | local_irq_disable(); |
| 639 | |
| 640 | shootdown_callback(cpu, (struct die_args *)data); |
| 641 | |
| 642 | atomic_dec(&waiting_for_crash_ipi); |
| 643 | /* Assume hlt works */ |
| 644 | halt(); |
| 645 | for (;;) |
| 646 | cpu_relax(); |
| 647 | |
| 648 | return 1; |
| 649 | } |
| 650 | |
| 651 | static void smp_send_nmi_allbutself(void) |
| 652 | { |
Ingo Molnar | 855caa3 | 2008-12-17 13:24:52 +0100 | [diff] [blame] | 653 | send_IPI_allbutself(NMI_VECTOR); |
Eduardo Habkost | 2ddded2 | 2008-11-12 11:34:42 -0200 | [diff] [blame] | 654 | } |
| 655 | |
| 656 | static struct notifier_block crash_nmi_nb = { |
| 657 | .notifier_call = crash_nmi_callback, |
| 658 | }; |
| 659 | |
Eduardo Habkost | bb8dd27 | 2008-11-12 11:34:43 -0200 | [diff] [blame] | 660 | /* Halt all other CPUs, calling the specified function on each of them |
| 661 | * |
| 662 | * This function can be used to halt all other CPUs on crash |
| 663 | * or emergency reboot time. The function passed as parameter |
| 664 | * will be called inside a NMI handler on all CPUs. |
| 665 | */ |
Eduardo Habkost | 2ddded2 | 2008-11-12 11:34:42 -0200 | [diff] [blame] | 666 | void nmi_shootdown_cpus(nmi_shootdown_cb callback) |
| 667 | { |
| 668 | unsigned long msecs; |
Eduardo Habkost | c415b3d | 2008-11-12 11:34:44 -0200 | [diff] [blame] | 669 | local_irq_disable(); |
Eduardo Habkost | 2ddded2 | 2008-11-12 11:34:42 -0200 | [diff] [blame] | 670 | |
| 671 | /* Make a note of crashing cpu. Will be used in NMI callback.*/ |
| 672 | crashing_cpu = safe_smp_processor_id(); |
| 673 | |
| 674 | shootdown_callback = callback; |
| 675 | |
| 676 | atomic_set(&waiting_for_crash_ipi, num_online_cpus() - 1); |
| 677 | /* Would it be better to replace the trap vector here? */ |
| 678 | if (register_die_notifier(&crash_nmi_nb)) |
| 679 | return; /* return what? */ |
| 680 | /* Ensure the new callback function is set before sending |
| 681 | * out the NMI |
| 682 | */ |
| 683 | wmb(); |
| 684 | |
| 685 | smp_send_nmi_allbutself(); |
| 686 | |
| 687 | msecs = 1000; /* Wait at most a second for the other cpus to stop */ |
| 688 | while ((atomic_read(&waiting_for_crash_ipi) > 0) && msecs) { |
| 689 | mdelay(1); |
| 690 | msecs--; |
| 691 | } |
| 692 | |
| 693 | /* Leave the nmi callback set */ |
| 694 | } |
Eduardo Habkost | bb8dd27 | 2008-11-12 11:34:43 -0200 | [diff] [blame] | 695 | #else /* !CONFIG_SMP */ |
| 696 | void nmi_shootdown_cpus(nmi_shootdown_cb callback) |
| 697 | { |
| 698 | /* No other CPUs to shoot down */ |
| 699 | } |
Eduardo Habkost | 2ddded2 | 2008-11-12 11:34:42 -0200 | [diff] [blame] | 700 | #endif |