blob: 4526b3a75ed2aef73579212c7fde9ca6ed15e946 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001#include <linux/module.h>
Adrian Bunkcd6ed522006-12-06 20:40:06 -08002#include <linux/reboot.h>
Miguel Boton4d022e32008-01-30 13:32:51 +01003#include <linux/init.h>
4#include <linux/pm.h>
5#include <linux/efi.h>
6#include <acpi/reboot.h>
7#include <asm/io.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -07008#include <asm/apic.h>
Zachary Amsden4d37e7e2005-09-03 15:56:38 -07009#include <asm/desc.h>
Miguel Boton4d022e32008-01-30 13:32:51 +010010#include <asm/hpet.h>
Jeremy Fitzhardinge68db0652008-03-17 16:37:13 -070011#include <asm/pgtable.h>
Dmitri Vorobiev44126202008-04-28 03:15:59 +040012#include <asm/proto.h>
Jeremy Fitzhardinge973efae2007-05-02 19:27:06 +020013#include <asm/reboot_fixups.h>
Jeremy Fitzhardinge07f33312007-05-02 19:27:11 +020014#include <asm/reboot.h>
Jaswinder Singh Rajput82487712008-12-27 18:32:28 +053015#include <asm/pci_x86.h>
Eduardo Habkostd1767202008-11-17 19:03:24 -020016#include <asm/virtext.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070017
Miguel Boton4d022e32008-01-30 13:32:51 +010018#ifdef CONFIG_X86_32
19# include <linux/dmi.h>
20# include <linux/ctype.h>
21# include <linux/mc146818rtc.h>
Miguel Boton4d022e32008-01-30 13:32:51 +010022#else
23# include <asm/iommu.h>
24#endif
25
Eduardo Habkost2ddded22008-11-12 11:34:42 -020026#include <mach_ipi.h>
Eduardo Habkost2ddded22008-11-12 11:34:42 -020027
Linus Torvalds1da177e2005-04-16 15:20:36 -070028/*
29 * Power off function, if any
30 */
31void (*pm_power_off)(void);
Alexey Dobriyan129f6942005-06-23 00:08:33 -070032EXPORT_SYMBOL(pm_power_off);
Linus Torvalds1da177e2005-04-16 15:20:36 -070033
Jan Beulichebdd5612008-05-12 15:43:38 +020034static const struct desc_ptr no_idt = {};
Linus Torvalds1da177e2005-04-16 15:20:36 -070035static int reboot_mode;
Eduardo Habkost8d004502008-11-04 12:52:44 -020036enum reboot_type reboot_type = BOOT_KBD;
Miguel Boton4d022e32008-01-30 13:32:51 +010037int reboot_force;
Linus Torvalds1da177e2005-04-16 15:20:36 -070038
Miguel Boton4d022e32008-01-30 13:32:51 +010039#if defined(CONFIG_X86_32) && defined(CONFIG_SMP)
Linus Torvalds1da177e2005-04-16 15:20:36 -070040static int reboot_cpu = -1;
Linus Torvalds1da177e2005-04-16 15:20:36 -070041#endif
Miguel Boton4d022e32008-01-30 13:32:51 +010042
Eduardo Habkostd1767202008-11-17 19:03:24 -020043/* This is set if we need to go through the 'emergency' path.
44 * When machine_emergency_restart() is called, we may be on
45 * an inconsistent state and won't be able to do a clean cleanup
46 */
47static int reboot_emergency;
48
H. Peter Anvin14d7ca52008-11-11 16:19:48 -080049/* This is set by the PCI code if either type 1 or type 2 PCI is detected */
50bool port_cf9_safe = false;
51
52/* reboot=b[ios] | s[mp] | t[riple] | k[bd] | e[fi] [, [w]arm | [c]old] | p[ci]
Miguel Boton4d022e32008-01-30 13:32:51 +010053 warm Don't set the cold reboot flag
54 cold Set the cold reboot flag
55 bios Reboot by jumping through the BIOS (only for X86_32)
56 smp Reboot by executing reset on BSP or other CPU (only for X86_32)
57 triple Force a triple fault (init)
58 kbd Use the keyboard controller. cold reset (default)
59 acpi Use the RESET_REG in the FADT
60 efi Use efi reset_system runtime service
H. Peter Anvin14d7ca52008-11-11 16:19:48 -080061 pci Use the so-called "PCI reset register", CF9
Miguel Boton4d022e32008-01-30 13:32:51 +010062 force Avoid anything that could hang.
63 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070064static int __init reboot_setup(char *str)
65{
Miguel Boton4d022e32008-01-30 13:32:51 +010066 for (;;) {
Linus Torvalds1da177e2005-04-16 15:20:36 -070067 switch (*str) {
Miguel Boton4d022e32008-01-30 13:32:51 +010068 case 'w':
Linus Torvalds1da177e2005-04-16 15:20:36 -070069 reboot_mode = 0x1234;
70 break;
Miguel Boton4d022e32008-01-30 13:32:51 +010071
72 case 'c':
73 reboot_mode = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070074 break;
Miguel Boton4d022e32008-01-30 13:32:51 +010075
76#ifdef CONFIG_X86_32
Linus Torvalds1da177e2005-04-16 15:20:36 -070077#ifdef CONFIG_SMP
Miguel Boton4d022e32008-01-30 13:32:51 +010078 case 's':
Tobias Klauser6f673d82005-09-13 01:25:48 -070079 if (isdigit(*(str+1))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -070080 reboot_cpu = (int) (*(str+1) - '0');
Tobias Klauser6f673d82005-09-13 01:25:48 -070081 if (isdigit(*(str+2)))
Linus Torvalds1da177e2005-04-16 15:20:36 -070082 reboot_cpu = reboot_cpu*10 + (int)(*(str+2) - '0');
83 }
Miguel Boton4d022e32008-01-30 13:32:51 +010084 /* we will leave sorting out the final value
85 when we are ready to reboot, since we might not
86 have set up boot_cpu_id or smp_num_cpu */
Linus Torvalds1da177e2005-04-16 15:20:36 -070087 break;
Miguel Boton4d022e32008-01-30 13:32:51 +010088#endif /* CONFIG_SMP */
89
90 case 'b':
Linus Torvalds1da177e2005-04-16 15:20:36 -070091#endif
Miguel Boton4d022e32008-01-30 13:32:51 +010092 case 'a':
93 case 'k':
94 case 't':
95 case 'e':
H. Peter Anvin14d7ca52008-11-11 16:19:48 -080096 case 'p':
Miguel Boton4d022e32008-01-30 13:32:51 +010097 reboot_type = *str;
98 break;
99
100 case 'f':
101 reboot_force = 1;
102 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700103 }
Miguel Boton4d022e32008-01-30 13:32:51 +0100104
105 str = strchr(str, ',');
106 if (str)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700107 str++;
108 else
109 break;
110 }
111 return 1;
112}
113
114__setup("reboot=", reboot_setup);
115
Miguel Boton4d022e32008-01-30 13:32:51 +0100116
117#ifdef CONFIG_X86_32
Linus Torvalds1da177e2005-04-16 15:20:36 -0700118/*
119 * Reboot options and system auto-detection code provided by
120 * Dell Inc. so their systems "just work". :-)
121 */
122
123/*
Miguel Boton4d022e32008-01-30 13:32:51 +0100124 * Some machines require the "reboot=b" commandline option,
125 * this quirk makes that automatic.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700126 */
Jeff Garzik18552562007-10-03 15:15:40 -0400127static int __init set_bios_reboot(const struct dmi_system_id *d)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128{
Miguel Boton4d022e32008-01-30 13:32:51 +0100129 if (reboot_type != BOOT_BIOS) {
130 reboot_type = BOOT_BIOS;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131 printk(KERN_INFO "%s series board detected. Selecting BIOS-method for reboots.\n", d->ident);
132 }
133 return 0;
134}
135
Linus Torvalds1da177e2005-04-16 15:20:36 -0700136static struct dmi_system_id __initdata reboot_dmi_table[] = {
Tim Gardnerb9e82af2007-06-01 00:46:40 -0700137 { /* Handle problems with rebooting on Dell E520's */
138 .callback = set_bios_reboot,
139 .ident = "Dell E520",
140 .matches = {
141 DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."),
142 DMI_MATCH(DMI_PRODUCT_NAME, "Dell DM061"),
143 },
144 },
Linus Torvalds1da177e2005-04-16 15:20:36 -0700145 { /* Handle problems with rebooting on Dell 1300's */
Eric W. Biedermandd2a1302005-06-25 14:57:55 -0700146 .callback = set_bios_reboot,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700147 .ident = "Dell PowerEdge 1300",
148 .matches = {
149 DMI_MATCH(DMI_SYS_VENDOR, "Dell Computer Corporation"),
150 DMI_MATCH(DMI_PRODUCT_NAME, "PowerEdge 1300/"),
151 },
152 },
153 { /* Handle problems with rebooting on Dell 300's */
154 .callback = set_bios_reboot,
155 .ident = "Dell PowerEdge 300",
156 .matches = {
157 DMI_MATCH(DMI_SYS_VENDOR, "Dell Computer Corporation"),
158 DMI_MATCH(DMI_PRODUCT_NAME, "PowerEdge 300/"),
159 },
160 },
James Jarvisdf2edcf2007-07-21 17:11:11 +0200161 { /* Handle problems with rebooting on Dell Optiplex 745's SFF*/
162 .callback = set_bios_reboot,
163 .ident = "Dell OptiPlex 745",
164 .matches = {
165 DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."),
166 DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 745"),
James Jarvisdf2edcf2007-07-21 17:11:11 +0200167 },
168 },
Coleman Kanefc115bf2008-03-04 15:05:41 -0800169 { /* Handle problems with rebooting on Dell Optiplex 745's DFF*/
170 .callback = set_bios_reboot,
171 .ident = "Dell OptiPlex 745",
172 .matches = {
173 DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."),
174 DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 745"),
175 DMI_MATCH(DMI_BOARD_NAME, "0MM599"),
176 },
177 },
Heinz-Ado Arnoldsfc1c89252008-03-12 16:27:56 +0100178 { /* Handle problems with rebooting on Dell Optiplex 745 with 0KW626 */
179 .callback = set_bios_reboot,
180 .ident = "Dell OptiPlex 745",
181 .matches = {
182 DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."),
183 DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 745"),
184 DMI_MATCH(DMI_BOARD_NAME, "0KW626"),
185 },
186 },
Steve Conklin093bac12008-11-14 00:55:51 -0600187 { /* Handle problems with rebooting on Dell Optiplex 330 with 0KP561 */
188 .callback = set_bios_reboot,
189 .ident = "Dell OptiPlex 330",
190 .matches = {
191 DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."),
192 DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 330"),
193 DMI_MATCH(DMI_BOARD_NAME, "0KP561"),
194 },
195 },
Linus Torvalds1da177e2005-04-16 15:20:36 -0700196 { /* Handle problems with rebooting on Dell 2400's */
197 .callback = set_bios_reboot,
198 .ident = "Dell PowerEdge 2400",
199 .matches = {
200 DMI_MATCH(DMI_SYS_VENDOR, "Dell Computer Corporation"),
201 DMI_MATCH(DMI_PRODUCT_NAME, "PowerEdge 2400"),
202 },
203 },
Ingo Molnarfab3b582008-07-17 13:50:15 +0200204 { /* Handle problems with rebooting on Dell T5400's */
205 .callback = set_bios_reboot,
206 .ident = "Dell Precision T5400",
207 .matches = {
208 DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."),
209 DMI_MATCH(DMI_PRODUCT_NAME, "Precision WorkStation T5400"),
210 },
211 },
Ben Collins766c3f92006-01-06 00:12:20 -0800212 { /* Handle problems with rebooting on HP laptops */
Thierry Vignaudd91b14c2005-11-29 19:34:35 -0800213 .callback = set_bios_reboot,
Ben Collins766c3f92006-01-06 00:12:20 -0800214 .ident = "HP Compaq Laptop",
Thierry Vignaudd91b14c2005-11-29 19:34:35 -0800215 .matches = {
216 DMI_MATCH(DMI_SYS_VENDOR, "Hewlett-Packard"),
Ben Collins766c3f92006-01-06 00:12:20 -0800217 DMI_MATCH(DMI_PRODUCT_NAME, "HP Compaq"),
Thierry Vignaudd91b14c2005-11-29 19:34:35 -0800218 },
219 },
Leann Ogasawaradd4124a2009-03-04 11:53:00 -0800220 { /* Handle problems with rebooting on Dell XPS710 */
221 .callback = set_bios_reboot,
222 .ident = "Dell XPS710",
223 .matches = {
224 DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."),
225 DMI_MATCH(DMI_PRODUCT_NAME, "Dell XPS710"),
226 },
227 },
Linus Torvalds1da177e2005-04-16 15:20:36 -0700228 { }
229};
230
231static int __init reboot_init(void)
232{
233 dmi_check_system(reboot_dmi_table);
234 return 0;
235}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700236core_initcall(reboot_init);
237
/*
 * The following code and data reboots the machine by switching to real
 * mode and jumping to the BIOS reset entry point, as if the CPU has
 * really been reset.  The previous version asked the keyboard
 * controller to pulse the CPU reset line, which is more thorough, but
 * doesn't work with at least one type of 486 motherboard.  It is easy
 * to stop this code working; hence the copious comments.
 */
static const unsigned long long real_mode_gdt_entries[3] = {
	/* Null descriptor */
	0x0000000000000000ULL,
	/* 16-bit real-mode 64k code at 0x00000000 */
	0x00009b000000ffffULL,
	/* 16-bit real-mode 64k data at 0x00000100 */
	0x000093000100ffffULL
};
251
Jan Beulichebdd5612008-05-12 15:43:38 +0200252static const struct desc_ptr
Rusty Russell05f4a3e2006-09-25 23:32:22 -0700253real_mode_gdt = { sizeof (real_mode_gdt_entries) - 1, (long)real_mode_gdt_entries },
Miguel Boton4d022e32008-01-30 13:32:51 +0100254real_mode_idt = { 0x3ff, 0 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255
/*
 * This is 16-bit protected mode code to disable paging and the cache,
 * switch to real mode and jump to the BIOS reset code.
 *
 * The instruction that switches to real mode by writing to CR0 must be
 * followed immediately by a far jump instruction, which sets CS to a
 * valid value for real mode, and flushes the prefetch queue to avoid
 * running instructions that have already been decoded in protected
 * mode.
 *
 * Clears all the flags except ET, especially PG (paging), PE
 * (protected-mode enable) and TS (task switch for coprocessor state
 * save).  Flushes the TLB after paging has been disabled.  Sets CD and
 * NW, to disable the cache on a 486, and invalidates the cache.  This
 * is more like the state of a 486 after reset.  I don't know if
 * something else should be done for other chips.
 *
 * More could be done here to set up the registers as if a CPU reset had
 * occurred; hopefully real BIOSs don't assume much.
 */
static const unsigned char real_mode_switch[] = {
	/* movl %cr0,%eax */
	0x66, 0x0f, 0x20, 0xc0,
	/* andl $0x00000011,%eax */
	0x66, 0x83, 0xe0, 0x11,
	/* orl $0x60000000,%eax */
	0x66, 0x0d, 0x00, 0x00, 0x00, 0x60,
	/* movl %eax,%cr0 */
	0x66, 0x0f, 0x22, 0xc0,
	/* movl %eax,%cr3 */
	0x66, 0x0f, 0x22, 0xd8,
	/* movl %cr0,%ebx */
	0x66, 0x0f, 0x20, 0xc3,
	/* andl $0x60000000,%ebx */
	0x66, 0x81, 0xe3, 0x00, 0x00, 0x00, 0x60,
	/* jz f */
	0x74, 0x02,
	/* wbinvd */
	0x0f, 0x09,
	/* f: andb $0x10,%al */
	0x24, 0x10,
	/* movl %eax,%cr0 */
	0x66, 0x0f, 0x22, 0xc0
};
/* Real-mode far jump to the BIOS reset entry point. */
static const unsigned char jump_to_bios[] = {
	/* ljmp $0xffff,$0x0000 */
	0xea, 0x00, 0x00, 0xff, 0xff
};
292
293/*
294 * Switch to real mode and then execute the code
295 * specified by the code and length parameters.
296 * We assume that length will aways be less that 100!
297 */
Jan Beulichebdd5612008-05-12 15:43:38 +0200298void machine_real_restart(const unsigned char *code, int length)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700299{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700300 local_irq_disable();
301
302 /* Write zero to CMOS register number 0x0f, which the BIOS POST
303 routine will recognize as telling it to do a proper reboot. (Well
304 that's what this book in front of me says -- it may only apply to
305 the Phoenix BIOS though, it's not clear). At the same time,
306 disable NMIs by setting the top bit in the CMOS address register,
307 as we're about to do peculiar things to the CPU. I'm not sure if
308 `outb_p' is needed instead of just `outb'. Use it to be on the
309 safe side. (Yes, CMOS_WRITE does outb_p's. - Paul G.)
310 */
Hisashi Hifumi62dbc212007-05-02 19:27:18 +0200311 spin_lock(&rtc_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312 CMOS_WRITE(0x00, 0x8f);
Hisashi Hifumi62dbc212007-05-02 19:27:18 +0200313 spin_unlock(&rtc_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700314
315 /* Remap the kernel at virtual address zero, as well as offset zero
316 from the kernel segment. This assumes the kernel segment starts at
317 virtual address PAGE_OFFSET. */
Jeremy Fitzhardinge68db0652008-03-17 16:37:13 -0700318 memcpy(swapper_pg_dir, swapper_pg_dir + KERNEL_PGD_BOUNDARY,
Miguel Boton4d022e32008-01-30 13:32:51 +0100319 sizeof(swapper_pg_dir [0]) * KERNEL_PGD_PTRS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700320
321 /*
322 * Use `swapper_pg_dir' as our page directory.
323 */
324 load_cr3(swapper_pg_dir);
325
326 /* Write 0x1234 to absolute memory location 0x472. The BIOS reads
327 this on booting to tell it to "Bypass memory test (also warm
328 boot)". This seems like a fairly standard thing that gets set by
329 REBOOT.COM programs, and the previous reset routine did this
330 too. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700331 *((unsigned short *)0x472) = reboot_mode;
332
333 /* For the switch to real mode, copy some code to low memory. It has
334 to be in the first 64k because it is running in 16-bit mode, and it
335 has to have the same physical and virtual address, because it turns
336 off paging. Copy it near the end of the first page, out of the way
337 of BIOS variables. */
Miguel Boton4d022e32008-01-30 13:32:51 +0100338 memcpy((void *)(0x1000 - sizeof(real_mode_switch) - 100),
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339 real_mode_switch, sizeof (real_mode_switch));
Miguel Boton4d022e32008-01-30 13:32:51 +0100340 memcpy((void *)(0x1000 - 100), code, length);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341
342 /* Set up the IDT for real mode. */
Zachary Amsden4d37e7e2005-09-03 15:56:38 -0700343 load_idt(&real_mode_idt);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344
345 /* Set up a GDT from which we can load segment descriptors for real
346 mode. The GDT is not used in real mode; it is just needed here to
347 prepare the descriptors. */
Zachary Amsden4d37e7e2005-09-03 15:56:38 -0700348 load_gdt(&real_mode_gdt);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349
350 /* Load the data segment registers, and thus the descriptors ready for
351 real mode. The base address of each segment is 0x100, 16 times the
352 selector value being loaded here. This is so that the segment
353 registers don't have to be reloaded after switching to real mode:
354 the values are consistent for real mode operation already. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700355 __asm__ __volatile__ ("movl $0x0010,%%eax\n"
356 "\tmovl %%eax,%%ds\n"
357 "\tmovl %%eax,%%es\n"
358 "\tmovl %%eax,%%fs\n"
359 "\tmovl %%eax,%%gs\n"
360 "\tmovl %%eax,%%ss" : : : "eax");
361
362 /* Jump to the 16-bit code that we copied earlier. It disables paging
363 and the cache, switches to real mode, and jumps to the BIOS reset
364 entry point. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700365 __asm__ __volatile__ ("ljmp $0x0008,%0"
366 :
Miguel Boton4d022e32008-01-30 13:32:51 +0100367 : "i" ((void *)(0x1000 - sizeof (real_mode_switch) - 100)));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700368}
Alexey Dobriyan129f6942005-06-23 00:08:33 -0700369#ifdef CONFIG_APM_MODULE
370EXPORT_SYMBOL(machine_real_restart);
371#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700372
Miguel Boton4d022e32008-01-30 13:32:51 +0100373#endif /* CONFIG_X86_32 */
374
/*
 * Poll I/O port 0x64 until bit 1 (0x02) reads as clear, giving up after
 * 0x10000 polls with a 2us delay between them.  Bit 1 is presumably the
 * keyboard controller's "input buffer full" flag -- confirm against the
 * controller documentation.
 */
static inline void kb_wait(void)
{
	int tries = 0;

	while (tries < 0x10000) {
		if (!(inb(0x64) & 0x02))
			return;
		udelay(2);
		tries++;
	}
}
385
/*
 * Callback handed to nmi_shootdown_cpus(): calls cpu_emergency_vmxoff()
 * on the CPU it runs on.  Both arguments are unused.
 */
static void vmxoff_nmi(int cpu, struct die_args *args)
{
	cpu_emergency_vmxoff();
}
390
391/* Use NMIs as IPIs to tell all CPUs to disable virtualization
392 */
393static void emergency_vmx_disable_all(void)
394{
395 /* Just make sure we won't change CPUs while doing this */
396 local_irq_disable();
397
398 /* We need to disable VMX on all CPUs before rebooting, otherwise
399 * we risk hanging up the machine, because the CPU ignore INIT
400 * signals when VMX is enabled.
401 *
402 * We can't take any locks and we may be on an inconsistent
403 * state, so we use NMIs as IPIs to tell the other CPUs to disable
404 * VMX and halt.
405 *
406 * For safety, we will avoid running the nmi_shootdown_cpus()
407 * stuff unnecessarily, but we don't have a way to check
408 * if other CPUs have VMX enabled. So we will call it only if the
409 * CPU we are running on has VMX enabled.
410 *
411 * We will miss cases where VMX is not enabled on all CPUs. This
412 * shouldn't do much harm because KVM always enable VMX on all
413 * CPUs anyway. But we can miss it on the small window where KVM
414 * is still enabling VMX.
415 */
416 if (cpu_has_vmx() && cpu_vmx_enabled()) {
417 /* Disable VMX on this CPU.
418 */
419 cpu_vmxoff();
420
421 /* Halt and disable VMX on the other CPUs */
422 nmi_shootdown_cpus(vmxoff_nmi);
423
424 }
425}
426
427
/*
 * Weak, empty default for the board-specific fixup hook that the
 * keyboard-controller reset path calls before pulsing reset.
 */
void __attribute__((weak)) mach_reboot_fixups(void)
{
	/* nothing to do by default */
}
431
Jody Belka416e2d62008-02-12 23:37:48 +0000432static void native_machine_emergency_restart(void)
Miguel Boton4d022e32008-01-30 13:32:51 +0100433{
434 int i;
435
Eduardo Habkostd1767202008-11-17 19:03:24 -0200436 if (reboot_emergency)
437 emergency_vmx_disable_all();
438
Miguel Boton4d022e32008-01-30 13:32:51 +0100439 /* Tell the BIOS if we want cold or warm reboot */
440 *((unsigned short *)__va(0x472)) = reboot_mode;
441
442 for (;;) {
443 /* Could also try the reset bit in the Hammer NB */
444 switch (reboot_type) {
445 case BOOT_KBD:
Ingo Molnar7432d142008-03-06 18:29:43 +0100446 mach_reboot_fixups(); /* for board specific fixups */
447
Miguel Boton4d022e32008-01-30 13:32:51 +0100448 for (i = 0; i < 10; i++) {
449 kb_wait();
450 udelay(50);
451 outb(0xfe, 0x64); /* pulse reset low */
452 udelay(50);
453 }
454
455 case BOOT_TRIPLE:
Jan Beulichebdd5612008-05-12 15:43:38 +0200456 load_idt(&no_idt);
Miguel Boton4d022e32008-01-30 13:32:51 +0100457 __asm__ __volatile__("int3");
458
459 reboot_type = BOOT_KBD;
460 break;
461
462#ifdef CONFIG_X86_32
463 case BOOT_BIOS:
464 machine_real_restart(jump_to_bios, sizeof(jump_to_bios));
465
466 reboot_type = BOOT_KBD;
467 break;
468#endif
469
470 case BOOT_ACPI:
471 acpi_reboot();
472 reboot_type = BOOT_KBD;
473 break;
474
Miguel Boton4d022e32008-01-30 13:32:51 +0100475 case BOOT_EFI:
476 if (efi_enabled)
H. Peter Anvin14d7ca52008-11-11 16:19:48 -0800477 efi.reset_system(reboot_mode ?
478 EFI_RESET_WARM :
479 EFI_RESET_COLD,
Miguel Boton4d022e32008-01-30 13:32:51 +0100480 EFI_SUCCESS, 0, NULL);
H. Peter Anvinb47b9282008-11-24 00:50:09 -0800481 reboot_type = BOOT_KBD;
H. Peter Anvin14d7ca52008-11-11 16:19:48 -0800482 break;
Miguel Boton4d022e32008-01-30 13:32:51 +0100483
H. Peter Anvin14d7ca52008-11-11 16:19:48 -0800484 case BOOT_CF9:
485 port_cf9_safe = true;
486 /* fall through */
487
488 case BOOT_CF9_COND:
489 if (port_cf9_safe) {
490 u8 cf9 = inb(0xcf9) & ~6;
491 outb(cf9|2, 0xcf9); /* Request hard reset */
492 udelay(50);
493 outb(cf9|6, 0xcf9); /* Actually do the reset */
494 udelay(50);
495 }
Miguel Boton4d022e32008-01-30 13:32:51 +0100496 reboot_type = BOOT_KBD;
497 break;
498 }
499 }
500}
501
/*
 * Quiesce the machine before a restart, halt or power-off.
 *
 * On SMP the current task is first pinned to the CPU that will perform
 * the reboot -- logical CPU 0, or the online CPU chosen with "reboot=s<N>"
 * on 32-bit, or the current CPU if that choice is offline -- and the
 * other CPUs are stopped.  Then the local APIC is shut down and, where
 * configured, the IO-APIC, the HPET and (on 64-bit) the PCI IOMMU too.
 */
void native_machine_shutdown(void)
{
	/* Stop the cpus and apics */
#ifdef CONFIG_SMP

	/* The boot cpu is always logical cpu 0 */
	int reboot_cpu_id = 0;

#ifdef CONFIG_X86_32
	/* See if there has been given a command line override */
	if (reboot_cpu != -1 && reboot_cpu < nr_cpu_ids &&
	    cpu_online(reboot_cpu))
		reboot_cpu_id = reboot_cpu;
#endif

	/* Make certain the cpu I'm about to reboot on is online */
	if (!cpu_online(reboot_cpu_id))
		reboot_cpu_id = smp_processor_id();

	/* Make certain I only run on the appropriate processor */
	set_cpus_allowed_ptr(current, cpumask_of(reboot_cpu_id));

	/*
	 * O.K. Now that I'm on the appropriate processor,
	 * stop all of the others.
	 */
	smp_send_stop();
#endif

	lapic_shutdown();

#ifdef CONFIG_X86_IO_APIC
	disable_IO_APIC();
#endif

#ifdef CONFIG_HPET_TIMER
	hpet_disable();
#endif

#ifdef CONFIG_X86_64
	pci_iommu_shutdown();
#endif
}
544
Eduardo Habkostd1767202008-11-17 19:03:24 -0200545static void __machine_emergency_restart(int emergency)
546{
547 reboot_emergency = emergency;
548 machine_ops.emergency_restart();
549}
550
Jody Belka416e2d62008-02-12 23:37:48 +0000551static void native_machine_restart(char *__unused)
Jeremy Fitzhardinge973efae2007-05-02 19:27:06 +0200552{
Miguel Boton4d022e32008-01-30 13:32:51 +0100553 printk("machine restart\n");
Jeremy Fitzhardinge973efae2007-05-02 19:27:06 +0200554
Miguel Boton4d022e32008-01-30 13:32:51 +0100555 if (!reboot_force)
Eric W. Biederman6e3fbee2006-01-11 22:43:12 +0100556 machine_shutdown();
Eduardo Habkostd1767202008-11-17 19:03:24 -0200557 __machine_emergency_restart(0);
Jeremy Fitzhardinge07f33312007-05-02 19:27:11 +0200558}
559
Jody Belka416e2d62008-02-12 23:37:48 +0000560static void native_machine_halt(void)
Jeremy Fitzhardinge07f33312007-05-02 19:27:11 +0200561{
Ivan Vecerad3ec5ca2008-11-11 14:33:44 +0100562 /* stop other cpus and apics */
563 machine_shutdown();
564
565 /* stop this cpu */
566 stop_this_cpu(NULL);
Jeremy Fitzhardinge07f33312007-05-02 19:27:11 +0200567}
Miguel Boton4d022e32008-01-30 13:32:51 +0100568
Jody Belka416e2d62008-02-12 23:37:48 +0000569static void native_machine_power_off(void)
Miguel Boton4d022e32008-01-30 13:32:51 +0100570{
571 if (pm_power_off) {
572 if (!reboot_force)
573 machine_shutdown();
574 pm_power_off();
575 }
576}
577
578struct machine_ops machine_ops = {
Jody Belka416e2d62008-02-12 23:37:48 +0000579 .power_off = native_machine_power_off,
580 .shutdown = native_machine_shutdown,
581 .emergency_restart = native_machine_emergency_restart,
582 .restart = native_machine_restart,
Glauber Costaed23dc62008-03-17 16:08:38 -0300583 .halt = native_machine_halt,
584#ifdef CONFIG_KEXEC
585 .crash_shutdown = native_machine_crash_shutdown,
586#endif
Miguel Boton4d022e32008-01-30 13:32:51 +0100587};
Jody Belka416e2d62008-02-12 23:37:48 +0000588
589void machine_power_off(void)
590{
591 machine_ops.power_off();
592}
593
594void machine_shutdown(void)
595{
596 machine_ops.shutdown();
597}
598
/* Restart through the emergency path (reboot_emergency is set to 1). */
void machine_emergency_restart(void)
{
	__machine_emergency_restart(1);
}
603
604void machine_restart(char *cmd)
605{
606 machine_ops.restart(cmd);
607}
608
609void machine_halt(void)
610{
611 machine_ops.halt();
612}
613
#ifdef CONFIG_KEXEC
/*
 * Crash-time shutdown via the crash_shutdown operation in machine_ops.
 *
 * @regs: passed through unchanged to the crash_shutdown operation
 */
void machine_crash_shutdown(struct pt_regs *regs)
{
	machine_ops.crash_shutdown(regs);
}
#endif
Eduardo Habkost2ddded22008-11-12 11:34:42 -0200620
621
Eduardo Habkostbb8dd272008-11-12 11:34:43 -0200622#if defined(CONFIG_SMP)
Eduardo Habkost2ddded22008-11-12 11:34:42 -0200623
624/* This keeps a track of which one is crashing cpu. */
625static int crashing_cpu;
626static nmi_shootdown_cb shootdown_callback;
627
628static atomic_t waiting_for_crash_ipi;
629
630static int crash_nmi_callback(struct notifier_block *self,
631 unsigned long val, void *data)
632{
633 int cpu;
634
635 if (val != DIE_NMI_IPI)
636 return NOTIFY_OK;
637
638 cpu = raw_smp_processor_id();
639
640 /* Don't do anything if this handler is invoked on crashing cpu.
641 * Otherwise, system will completely hang. Crashing cpu can get
642 * an NMI if system was initially booted with nmi_watchdog parameter.
643 */
644 if (cpu == crashing_cpu)
645 return NOTIFY_STOP;
646 local_irq_disable();
647
648 shootdown_callback(cpu, (struct die_args *)data);
649
650 atomic_dec(&waiting_for_crash_ipi);
651 /* Assume hlt works */
652 halt();
653 for (;;)
654 cpu_relax();
655
656 return 1;
657}
658
659static void smp_send_nmi_allbutself(void)
660{
Ingo Molnar855caa32008-12-17 13:24:52 +0100661 send_IPI_allbutself(NMI_VECTOR);
Eduardo Habkost2ddded22008-11-12 11:34:42 -0200662}
663
664static struct notifier_block crash_nmi_nb = {
665 .notifier_call = crash_nmi_callback,
666};
667
Eduardo Habkostbb8dd272008-11-12 11:34:43 -0200668/* Halt all other CPUs, calling the specified function on each of them
669 *
670 * This function can be used to halt all other CPUs on crash
671 * or emergency reboot time. The function passed as parameter
672 * will be called inside a NMI handler on all CPUs.
673 */
Eduardo Habkost2ddded22008-11-12 11:34:42 -0200674void nmi_shootdown_cpus(nmi_shootdown_cb callback)
675{
676 unsigned long msecs;
Eduardo Habkostc415b3d2008-11-12 11:34:44 -0200677 local_irq_disable();
Eduardo Habkost2ddded22008-11-12 11:34:42 -0200678
679 /* Make a note of crashing cpu. Will be used in NMI callback.*/
680 crashing_cpu = safe_smp_processor_id();
681
682 shootdown_callback = callback;
683
684 atomic_set(&waiting_for_crash_ipi, num_online_cpus() - 1);
685 /* Would it be better to replace the trap vector here? */
686 if (register_die_notifier(&crash_nmi_nb))
687 return; /* return what? */
688 /* Ensure the new callback function is set before sending
689 * out the NMI
690 */
691 wmb();
692
693 smp_send_nmi_allbutself();
694
695 msecs = 1000; /* Wait at most a second for the other cpus to stop */
696 while ((atomic_read(&waiting_for_crash_ipi) > 0) && msecs) {
697 mdelay(1);
698 msecs--;
699 }
700
701 /* Leave the nmi callback set */
702}
Eduardo Habkostbb8dd272008-11-12 11:34:43 -0200703#else /* !CONFIG_SMP */
704void nmi_shootdown_cpus(nmi_shootdown_cb callback)
705{
706 /* No other CPUs to shoot down */
707}
Eduardo Habkost2ddded22008-11-12 11:34:42 -0200708#endif