blob: 1cc18d439bbbd377bd6941eece6fa2397508d359 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001#include <linux/module.h>
Adrian Bunkcd6ed522006-12-06 20:40:06 -08002#include <linux/reboot.h>
Miguel Boton4d022e32008-01-30 13:32:51 +01003#include <linux/init.h>
4#include <linux/pm.h>
5#include <linux/efi.h>
6#include <acpi/reboot.h>
7#include <asm/io.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -07008#include <asm/apic.h>
Zachary Amsden4d37e7e2005-09-03 15:56:38 -07009#include <asm/desc.h>
Miguel Boton4d022e32008-01-30 13:32:51 +010010#include <asm/hpet.h>
Jeremy Fitzhardinge68db0652008-03-17 16:37:13 -070011#include <asm/pgtable.h>
Dmitri Vorobiev44126202008-04-28 03:15:59 +040012#include <asm/proto.h>
Jeremy Fitzhardinge973efae2007-05-02 19:27:06 +020013#include <asm/reboot_fixups.h>
Jeremy Fitzhardinge07f33312007-05-02 19:27:11 +020014#include <asm/reboot.h>
Jaswinder Singh Rajput82487712008-12-27 18:32:28 +053015#include <asm/pci_x86.h>
Eduardo Habkostd1767202008-11-17 19:03:24 -020016#include <asm/virtext.h>
Jaswinder Singh Rajput96b89dc2009-01-07 21:35:48 +053017#include <asm/cpu.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018
Miguel Boton4d022e32008-01-30 13:32:51 +010019#ifdef CONFIG_X86_32
20# include <linux/dmi.h>
21# include <linux/ctype.h>
22# include <linux/mc146818rtc.h>
Miguel Boton4d022e32008-01-30 13:32:51 +010023#else
24# include <asm/iommu.h>
25#endif
26
Linus Torvalds1da177e2005-04-16 15:20:36 -070027/*
28 * Power off function, if any
29 */
30void (*pm_power_off)(void);
Alexey Dobriyan129f6942005-06-23 00:08:33 -070031EXPORT_SYMBOL(pm_power_off);
Linus Torvalds1da177e2005-04-16 15:20:36 -070032
Jan Beulichebdd5612008-05-12 15:43:38 +020033static const struct desc_ptr no_idt = {};
Linus Torvalds1da177e2005-04-16 15:20:36 -070034static int reboot_mode;
Eduardo Habkost8d004502008-11-04 12:52:44 -020035enum reboot_type reboot_type = BOOT_KBD;
Miguel Boton4d022e32008-01-30 13:32:51 +010036int reboot_force;
Linus Torvalds1da177e2005-04-16 15:20:36 -070037
Miguel Boton4d022e32008-01-30 13:32:51 +010038#if defined(CONFIG_X86_32) && defined(CONFIG_SMP)
Linus Torvalds1da177e2005-04-16 15:20:36 -070039static int reboot_cpu = -1;
Linus Torvalds1da177e2005-04-16 15:20:36 -070040#endif
Miguel Boton4d022e32008-01-30 13:32:51 +010041
Eduardo Habkostd1767202008-11-17 19:03:24 -020042/* This is set if we need to go through the 'emergency' path.
43 * When machine_emergency_restart() is called, we may be on
44 * an inconsistent state and won't be able to do a clean cleanup
45 */
46static int reboot_emergency;
47
H. Peter Anvin14d7ca52008-11-11 16:19:48 -080048/* This is set by the PCI code if either type 1 or type 2 PCI is detected */
49bool port_cf9_safe = false;
50
51/* reboot=b[ios] | s[mp] | t[riple] | k[bd] | e[fi] [, [w]arm | [c]old] | p[ci]
Miguel Boton4d022e32008-01-30 13:32:51 +010052 warm Don't set the cold reboot flag
53 cold Set the cold reboot flag
54 bios Reboot by jumping through the BIOS (only for X86_32)
55 smp Reboot by executing reset on BSP or other CPU (only for X86_32)
56 triple Force a triple fault (init)
57 kbd Use the keyboard controller. cold reset (default)
58 acpi Use the RESET_REG in the FADT
59 efi Use efi reset_system runtime service
H. Peter Anvin14d7ca52008-11-11 16:19:48 -080060 pci Use the so-called "PCI reset register", CF9
Miguel Boton4d022e32008-01-30 13:32:51 +010061 force Avoid anything that could hang.
62 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070063static int __init reboot_setup(char *str)
64{
Miguel Boton4d022e32008-01-30 13:32:51 +010065 for (;;) {
Linus Torvalds1da177e2005-04-16 15:20:36 -070066 switch (*str) {
Miguel Boton4d022e32008-01-30 13:32:51 +010067 case 'w':
Linus Torvalds1da177e2005-04-16 15:20:36 -070068 reboot_mode = 0x1234;
69 break;
Miguel Boton4d022e32008-01-30 13:32:51 +010070
71 case 'c':
72 reboot_mode = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070073 break;
Miguel Boton4d022e32008-01-30 13:32:51 +010074
75#ifdef CONFIG_X86_32
Linus Torvalds1da177e2005-04-16 15:20:36 -070076#ifdef CONFIG_SMP
Miguel Boton4d022e32008-01-30 13:32:51 +010077 case 's':
Tobias Klauser6f673d82005-09-13 01:25:48 -070078 if (isdigit(*(str+1))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -070079 reboot_cpu = (int) (*(str+1) - '0');
Tobias Klauser6f673d82005-09-13 01:25:48 -070080 if (isdigit(*(str+2)))
Linus Torvalds1da177e2005-04-16 15:20:36 -070081 reboot_cpu = reboot_cpu*10 + (int)(*(str+2) - '0');
82 }
Miguel Boton4d022e32008-01-30 13:32:51 +010083 /* we will leave sorting out the final value
84 when we are ready to reboot, since we might not
85 have set up boot_cpu_id or smp_num_cpu */
Linus Torvalds1da177e2005-04-16 15:20:36 -070086 break;
Miguel Boton4d022e32008-01-30 13:32:51 +010087#endif /* CONFIG_SMP */
88
89 case 'b':
Linus Torvalds1da177e2005-04-16 15:20:36 -070090#endif
Miguel Boton4d022e32008-01-30 13:32:51 +010091 case 'a':
92 case 'k':
93 case 't':
94 case 'e':
H. Peter Anvin14d7ca52008-11-11 16:19:48 -080095 case 'p':
Miguel Boton4d022e32008-01-30 13:32:51 +010096 reboot_type = *str;
97 break;
98
99 case 'f':
100 reboot_force = 1;
101 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700102 }
Miguel Boton4d022e32008-01-30 13:32:51 +0100103
104 str = strchr(str, ',');
105 if (str)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700106 str++;
107 else
108 break;
109 }
110 return 1;
111}
112
113__setup("reboot=", reboot_setup);
114
Miguel Boton4d022e32008-01-30 13:32:51 +0100115
116#ifdef CONFIG_X86_32
Linus Torvalds1da177e2005-04-16 15:20:36 -0700117/*
118 * Reboot options and system auto-detection code provided by
119 * Dell Inc. so their systems "just work". :-)
120 */
121
122/*
Miguel Boton4d022e32008-01-30 13:32:51 +0100123 * Some machines require the "reboot=b" commandline option,
124 * this quirk makes that automatic.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700125 */
Jeff Garzik18552562007-10-03 15:15:40 -0400126static int __init set_bios_reboot(const struct dmi_system_id *d)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700127{
Miguel Boton4d022e32008-01-30 13:32:51 +0100128 if (reboot_type != BOOT_BIOS) {
129 reboot_type = BOOT_BIOS;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700130 printk(KERN_INFO "%s series board detected. Selecting BIOS-method for reboots.\n", d->ident);
131 }
132 return 0;
133}
134
Linus Torvalds1da177e2005-04-16 15:20:36 -0700135static struct dmi_system_id __initdata reboot_dmi_table[] = {
Tim Gardnerb9e82af2007-06-01 00:46:40 -0700136 { /* Handle problems with rebooting on Dell E520's */
137 .callback = set_bios_reboot,
138 .ident = "Dell E520",
139 .matches = {
140 DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."),
141 DMI_MATCH(DMI_PRODUCT_NAME, "Dell DM061"),
142 },
143 },
Linus Torvalds1da177e2005-04-16 15:20:36 -0700144 { /* Handle problems with rebooting on Dell 1300's */
Eric W. Biedermandd2a1302005-06-25 14:57:55 -0700145 .callback = set_bios_reboot,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700146 .ident = "Dell PowerEdge 1300",
147 .matches = {
148 DMI_MATCH(DMI_SYS_VENDOR, "Dell Computer Corporation"),
149 DMI_MATCH(DMI_PRODUCT_NAME, "PowerEdge 1300/"),
150 },
151 },
152 { /* Handle problems with rebooting on Dell 300's */
153 .callback = set_bios_reboot,
154 .ident = "Dell PowerEdge 300",
155 .matches = {
156 DMI_MATCH(DMI_SYS_VENDOR, "Dell Computer Corporation"),
157 DMI_MATCH(DMI_PRODUCT_NAME, "PowerEdge 300/"),
158 },
159 },
James Jarvisdf2edcf2007-07-21 17:11:11 +0200160 { /* Handle problems with rebooting on Dell Optiplex 745's SFF*/
161 .callback = set_bios_reboot,
162 .ident = "Dell OptiPlex 745",
163 .matches = {
164 DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."),
165 DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 745"),
James Jarvisdf2edcf2007-07-21 17:11:11 +0200166 },
167 },
Coleman Kanefc115bf2008-03-04 15:05:41 -0800168 { /* Handle problems with rebooting on Dell Optiplex 745's DFF*/
169 .callback = set_bios_reboot,
170 .ident = "Dell OptiPlex 745",
171 .matches = {
172 DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."),
173 DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 745"),
174 DMI_MATCH(DMI_BOARD_NAME, "0MM599"),
175 },
176 },
Heinz-Ado Arnoldsfc1c89252008-03-12 16:27:56 +0100177 { /* Handle problems with rebooting on Dell Optiplex 745 with 0KW626 */
178 .callback = set_bios_reboot,
179 .ident = "Dell OptiPlex 745",
180 .matches = {
181 DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."),
182 DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 745"),
183 DMI_MATCH(DMI_BOARD_NAME, "0KW626"),
184 },
185 },
Steve Conklin093bac12008-11-14 00:55:51 -0600186 { /* Handle problems with rebooting on Dell Optiplex 330 with 0KP561 */
187 .callback = set_bios_reboot,
188 .ident = "Dell OptiPlex 330",
189 .matches = {
190 DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."),
191 DMI_MATCH(DMI_PRODUCT_NAME, "OptiPlex 330"),
192 DMI_MATCH(DMI_BOARD_NAME, "0KP561"),
193 },
194 },
Linus Torvalds1da177e2005-04-16 15:20:36 -0700195 { /* Handle problems with rebooting on Dell 2400's */
196 .callback = set_bios_reboot,
197 .ident = "Dell PowerEdge 2400",
198 .matches = {
199 DMI_MATCH(DMI_SYS_VENDOR, "Dell Computer Corporation"),
200 DMI_MATCH(DMI_PRODUCT_NAME, "PowerEdge 2400"),
201 },
202 },
Ingo Molnarfab3b582008-07-17 13:50:15 +0200203 { /* Handle problems with rebooting on Dell T5400's */
204 .callback = set_bios_reboot,
205 .ident = "Dell Precision T5400",
206 .matches = {
207 DMI_MATCH(DMI_SYS_VENDOR, "Dell Inc."),
208 DMI_MATCH(DMI_PRODUCT_NAME, "Precision WorkStation T5400"),
209 },
210 },
Ben Collins766c3f92006-01-06 00:12:20 -0800211 { /* Handle problems with rebooting on HP laptops */
Thierry Vignaudd91b14c2005-11-29 19:34:35 -0800212 .callback = set_bios_reboot,
Ben Collins766c3f92006-01-06 00:12:20 -0800213 .ident = "HP Compaq Laptop",
Thierry Vignaudd91b14c2005-11-29 19:34:35 -0800214 .matches = {
215 DMI_MATCH(DMI_SYS_VENDOR, "Hewlett-Packard"),
Ben Collins766c3f92006-01-06 00:12:20 -0800216 DMI_MATCH(DMI_PRODUCT_NAME, "HP Compaq"),
Thierry Vignaudd91b14c2005-11-29 19:34:35 -0800217 },
218 },
Linus Torvalds1da177e2005-04-16 15:20:36 -0700219 { }
220};
221
222static int __init reboot_init(void)
223{
224 dmi_check_system(reboot_dmi_table);
225 return 0;
226}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227core_initcall(reboot_init);
228
229/* The following code and data reboots the machine by switching to real
230 mode and jumping to the BIOS reset entry point, as if the CPU has
231 really been reset. The previous version asked the keyboard
232 controller to pulse the CPU reset line, which is more thorough, but
233 doesn't work with at least one type of 486 motherboard. It is easy
234 to stop this code working; hence the copious comments. */
Jan Beulichebdd5612008-05-12 15:43:38 +0200235static const unsigned long long
Linus Torvalds1da177e2005-04-16 15:20:36 -0700236real_mode_gdt_entries [3] =
237{
238 0x0000000000000000ULL, /* Null descriptor */
Jan Beulichebdd5612008-05-12 15:43:38 +0200239 0x00009b000000ffffULL, /* 16-bit real-mode 64k code at 0x00000000 */
240 0x000093000100ffffULL /* 16-bit real-mode 64k data at 0x00000100 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241};
242
Jan Beulichebdd5612008-05-12 15:43:38 +0200243static const struct desc_ptr
Rusty Russell05f4a3e2006-09-25 23:32:22 -0700244real_mode_gdt = { sizeof (real_mode_gdt_entries) - 1, (long)real_mode_gdt_entries },
Miguel Boton4d022e32008-01-30 13:32:51 +0100245real_mode_idt = { 0x3ff, 0 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246
247/* This is 16-bit protected mode code to disable paging and the cache,
248 switch to real mode and jump to the BIOS reset code.
249
250 The instruction that switches to real mode by writing to CR0 must be
251 followed immediately by a far jump instruction, which set CS to a
252 valid value for real mode, and flushes the prefetch queue to avoid
253 running instructions that have already been decoded in protected
254 mode.
255
256 Clears all the flags except ET, especially PG (paging), PE
257 (protected-mode enable) and TS (task switch for coprocessor state
258 save). Flushes the TLB after paging has been disabled. Sets CD and
259 NW, to disable the cache on a 486, and invalidates the cache. This
260 is more like the state of a 486 after reset. I don't know if
261 something else should be done for other chips.
262
263 More could be done here to set up the registers as if a CPU reset had
264 occurred; hopefully real BIOSs don't assume much. */
Jan Beulichebdd5612008-05-12 15:43:38 +0200265static const unsigned char real_mode_switch [] =
Linus Torvalds1da177e2005-04-16 15:20:36 -0700266{
267 0x66, 0x0f, 0x20, 0xc0, /* movl %cr0,%eax */
268 0x66, 0x83, 0xe0, 0x11, /* andl $0x00000011,%eax */
269 0x66, 0x0d, 0x00, 0x00, 0x00, 0x60, /* orl $0x60000000,%eax */
270 0x66, 0x0f, 0x22, 0xc0, /* movl %eax,%cr0 */
271 0x66, 0x0f, 0x22, 0xd8, /* movl %eax,%cr3 */
272 0x66, 0x0f, 0x20, 0xc3, /* movl %cr0,%ebx */
273 0x66, 0x81, 0xe3, 0x00, 0x00, 0x00, 0x60, /* andl $0x60000000,%ebx */
274 0x74, 0x02, /* jz f */
275 0x0f, 0x09, /* wbinvd */
276 0x24, 0x10, /* f: andb $0x10,al */
277 0x66, 0x0f, 0x22, 0xc0 /* movl %eax,%cr0 */
278};
Jan Beulichebdd5612008-05-12 15:43:38 +0200279static const unsigned char jump_to_bios [] =
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280{
281 0xea, 0x00, 0x00, 0xff, 0xff /* ljmp $0xffff,$0x0000 */
282};
283
284/*
285 * Switch to real mode and then execute the code
286 * specified by the code and length parameters.
287 * We assume that length will aways be less that 100!
288 */
Jan Beulichebdd5612008-05-12 15:43:38 +0200289void machine_real_restart(const unsigned char *code, int length)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700291 local_irq_disable();
292
293 /* Write zero to CMOS register number 0x0f, which the BIOS POST
294 routine will recognize as telling it to do a proper reboot. (Well
295 that's what this book in front of me says -- it may only apply to
296 the Phoenix BIOS though, it's not clear). At the same time,
297 disable NMIs by setting the top bit in the CMOS address register,
298 as we're about to do peculiar things to the CPU. I'm not sure if
299 `outb_p' is needed instead of just `outb'. Use it to be on the
300 safe side. (Yes, CMOS_WRITE does outb_p's. - Paul G.)
301 */
Hisashi Hifumi62dbc212007-05-02 19:27:18 +0200302 spin_lock(&rtc_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303 CMOS_WRITE(0x00, 0x8f);
Hisashi Hifumi62dbc212007-05-02 19:27:18 +0200304 spin_unlock(&rtc_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700305
306 /* Remap the kernel at virtual address zero, as well as offset zero
307 from the kernel segment. This assumes the kernel segment starts at
308 virtual address PAGE_OFFSET. */
Jeremy Fitzhardinge68db0652008-03-17 16:37:13 -0700309 memcpy(swapper_pg_dir, swapper_pg_dir + KERNEL_PGD_BOUNDARY,
Miguel Boton4d022e32008-01-30 13:32:51 +0100310 sizeof(swapper_pg_dir [0]) * KERNEL_PGD_PTRS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700311
312 /*
313 * Use `swapper_pg_dir' as our page directory.
314 */
315 load_cr3(swapper_pg_dir);
316
317 /* Write 0x1234 to absolute memory location 0x472. The BIOS reads
318 this on booting to tell it to "Bypass memory test (also warm
319 boot)". This seems like a fairly standard thing that gets set by
320 REBOOT.COM programs, and the previous reset routine did this
321 too. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700322 *((unsigned short *)0x472) = reboot_mode;
323
324 /* For the switch to real mode, copy some code to low memory. It has
325 to be in the first 64k because it is running in 16-bit mode, and it
326 has to have the same physical and virtual address, because it turns
327 off paging. Copy it near the end of the first page, out of the way
328 of BIOS variables. */
Miguel Boton4d022e32008-01-30 13:32:51 +0100329 memcpy((void *)(0x1000 - sizeof(real_mode_switch) - 100),
Linus Torvalds1da177e2005-04-16 15:20:36 -0700330 real_mode_switch, sizeof (real_mode_switch));
Miguel Boton4d022e32008-01-30 13:32:51 +0100331 memcpy((void *)(0x1000 - 100), code, length);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700332
333 /* Set up the IDT for real mode. */
Zachary Amsden4d37e7e2005-09-03 15:56:38 -0700334 load_idt(&real_mode_idt);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335
336 /* Set up a GDT from which we can load segment descriptors for real
337 mode. The GDT is not used in real mode; it is just needed here to
338 prepare the descriptors. */
Zachary Amsden4d37e7e2005-09-03 15:56:38 -0700339 load_gdt(&real_mode_gdt);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700340
341 /* Load the data segment registers, and thus the descriptors ready for
342 real mode. The base address of each segment is 0x100, 16 times the
343 selector value being loaded here. This is so that the segment
344 registers don't have to be reloaded after switching to real mode:
345 the values are consistent for real mode operation already. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700346 __asm__ __volatile__ ("movl $0x0010,%%eax\n"
347 "\tmovl %%eax,%%ds\n"
348 "\tmovl %%eax,%%es\n"
349 "\tmovl %%eax,%%fs\n"
350 "\tmovl %%eax,%%gs\n"
351 "\tmovl %%eax,%%ss" : : : "eax");
352
353 /* Jump to the 16-bit code that we copied earlier. It disables paging
354 and the cache, switches to real mode, and jumps to the BIOS reset
355 entry point. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356 __asm__ __volatile__ ("ljmp $0x0008,%0"
357 :
Miguel Boton4d022e32008-01-30 13:32:51 +0100358 : "i" ((void *)(0x1000 - sizeof (real_mode_switch) - 100)));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700359}
Alexey Dobriyan129f6942005-06-23 00:08:33 -0700360#ifdef CONFIG_APM_MODULE
361EXPORT_SYMBOL(machine_real_restart);
362#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363
Miguel Boton4d022e32008-01-30 13:32:51 +0100364#endif /* CONFIG_X86_32 */
365
366static inline void kb_wait(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700367{
Miguel Boton4d022e32008-01-30 13:32:51 +0100368 int i;
369
Alan Coxc84d6af82008-01-30 13:33:25 +0100370 for (i = 0; i < 0x10000; i++) {
371 if ((inb(0x64) & 0x02) == 0)
Miguel Boton4d022e32008-01-30 13:32:51 +0100372 break;
Alan Coxc84d6af82008-01-30 13:33:25 +0100373 udelay(2);
374 }
Miguel Boton4d022e32008-01-30 13:32:51 +0100375}
376
Eduardo Habkostd1767202008-11-17 19:03:24 -0200377static void vmxoff_nmi(int cpu, struct die_args *args)
378{
379 cpu_emergency_vmxoff();
380}
381
382/* Use NMIs as IPIs to tell all CPUs to disable virtualization
383 */
384static void emergency_vmx_disable_all(void)
385{
386 /* Just make sure we won't change CPUs while doing this */
387 local_irq_disable();
388
389 /* We need to disable VMX on all CPUs before rebooting, otherwise
390 * we risk hanging up the machine, because the CPU ignore INIT
391 * signals when VMX is enabled.
392 *
393 * We can't take any locks and we may be on an inconsistent
394 * state, so we use NMIs as IPIs to tell the other CPUs to disable
395 * VMX and halt.
396 *
397 * For safety, we will avoid running the nmi_shootdown_cpus()
398 * stuff unnecessarily, but we don't have a way to check
399 * if other CPUs have VMX enabled. So we will call it only if the
400 * CPU we are running on has VMX enabled.
401 *
402 * We will miss cases where VMX is not enabled on all CPUs. This
403 * shouldn't do much harm because KVM always enable VMX on all
404 * CPUs anyway. But we can miss it on the small window where KVM
405 * is still enabling VMX.
406 */
407 if (cpu_has_vmx() && cpu_vmx_enabled()) {
408 /* Disable VMX on this CPU.
409 */
410 cpu_vmxoff();
411
412 /* Halt and disable VMX on the other CPUs */
413 nmi_shootdown_cpus(vmxoff_nmi);
414
415 }
416}
417
418
Ingo Molnar7432d142008-03-06 18:29:43 +0100419void __attribute__((weak)) mach_reboot_fixups(void)
420{
421}
422
Jody Belka416e2d62008-02-12 23:37:48 +0000423static void native_machine_emergency_restart(void)
Miguel Boton4d022e32008-01-30 13:32:51 +0100424{
425 int i;
426
Eduardo Habkostd1767202008-11-17 19:03:24 -0200427 if (reboot_emergency)
428 emergency_vmx_disable_all();
429
Miguel Boton4d022e32008-01-30 13:32:51 +0100430 /* Tell the BIOS if we want cold or warm reboot */
431 *((unsigned short *)__va(0x472)) = reboot_mode;
432
433 for (;;) {
434 /* Could also try the reset bit in the Hammer NB */
435 switch (reboot_type) {
436 case BOOT_KBD:
Ingo Molnar7432d142008-03-06 18:29:43 +0100437 mach_reboot_fixups(); /* for board specific fixups */
438
Miguel Boton4d022e32008-01-30 13:32:51 +0100439 for (i = 0; i < 10; i++) {
440 kb_wait();
441 udelay(50);
442 outb(0xfe, 0x64); /* pulse reset low */
443 udelay(50);
444 }
445
446 case BOOT_TRIPLE:
Jan Beulichebdd5612008-05-12 15:43:38 +0200447 load_idt(&no_idt);
Miguel Boton4d022e32008-01-30 13:32:51 +0100448 __asm__ __volatile__("int3");
449
450 reboot_type = BOOT_KBD;
451 break;
452
453#ifdef CONFIG_X86_32
454 case BOOT_BIOS:
455 machine_real_restart(jump_to_bios, sizeof(jump_to_bios));
456
457 reboot_type = BOOT_KBD;
458 break;
459#endif
460
461 case BOOT_ACPI:
462 acpi_reboot();
463 reboot_type = BOOT_KBD;
464 break;
465
Miguel Boton4d022e32008-01-30 13:32:51 +0100466 case BOOT_EFI:
467 if (efi_enabled)
H. Peter Anvin14d7ca52008-11-11 16:19:48 -0800468 efi.reset_system(reboot_mode ?
469 EFI_RESET_WARM :
470 EFI_RESET_COLD,
Miguel Boton4d022e32008-01-30 13:32:51 +0100471 EFI_SUCCESS, 0, NULL);
H. Peter Anvinb47b9282008-11-24 00:50:09 -0800472 reboot_type = BOOT_KBD;
H. Peter Anvin14d7ca52008-11-11 16:19:48 -0800473 break;
Miguel Boton4d022e32008-01-30 13:32:51 +0100474
H. Peter Anvin14d7ca52008-11-11 16:19:48 -0800475 case BOOT_CF9:
476 port_cf9_safe = true;
477 /* fall through */
478
479 case BOOT_CF9_COND:
480 if (port_cf9_safe) {
481 u8 cf9 = inb(0xcf9) & ~6;
482 outb(cf9|2, 0xcf9); /* Request hard reset */
483 udelay(50);
484 outb(cf9|6, 0xcf9); /* Actually do the reset */
485 udelay(50);
486 }
Miguel Boton4d022e32008-01-30 13:32:51 +0100487 reboot_type = BOOT_KBD;
488 break;
489 }
490 }
491}
492
Glauber Costa3c62c622008-03-17 16:08:39 -0300493void native_machine_shutdown(void)
Miguel Boton4d022e32008-01-30 13:32:51 +0100494{
495 /* Stop the cpus and apics */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700496#ifdef CONFIG_SMP
Linus Torvalds1da177e2005-04-16 15:20:36 -0700497
Eric W. Biedermandd2a1302005-06-25 14:57:55 -0700498 /* The boot cpu is always logical cpu 0 */
Mike Travis65c01182008-07-15 14:14:30 -0700499 int reboot_cpu_id = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700500
Miguel Boton4d022e32008-01-30 13:32:51 +0100501#ifdef CONFIG_X86_32
Eric W. Biedermandd2a1302005-06-25 14:57:55 -0700502 /* See if there has been given a command line override */
Mike Travis96289372008-12-31 18:08:46 -0800503 if ((reboot_cpu != -1) && (reboot_cpu < nr_cpu_ids) &&
Mike Travis0bc3cc02008-07-24 18:21:31 -0700504 cpu_online(reboot_cpu))
Eric W. Biedermandd2a1302005-06-25 14:57:55 -0700505 reboot_cpu_id = reboot_cpu;
Miguel Boton4d022e32008-01-30 13:32:51 +0100506#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700507
Miguel Boton4d022e32008-01-30 13:32:51 +0100508 /* Make certain the cpu I'm about to reboot on is online */
Mike Travis0bc3cc02008-07-24 18:21:31 -0700509 if (!cpu_online(reboot_cpu_id))
Eric W. Biedermandd2a1302005-06-25 14:57:55 -0700510 reboot_cpu_id = smp_processor_id();
Eric W. Biedermandd2a1302005-06-25 14:57:55 -0700511
512 /* Make certain I only run on the appropriate processor */
Mike Travis96289372008-12-31 18:08:46 -0800513 set_cpus_allowed_ptr(current, cpumask_of(reboot_cpu_id));
Eric W. Biedermandd2a1302005-06-25 14:57:55 -0700514
Miguel Boton4d022e32008-01-30 13:32:51 +0100515 /* O.K Now that I'm on the appropriate processor,
516 * stop all of the others.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700517 */
518 smp_send_stop();
Miguel Boton4d022e32008-01-30 13:32:51 +0100519#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700520
521 lapic_shutdown();
522
523#ifdef CONFIG_X86_IO_APIC
524 disable_IO_APIC();
525#endif
Miguel Boton4d022e32008-01-30 13:32:51 +0100526
OGAWA Hirofumic86c7fb2007-12-03 17:17:10 +0100527#ifdef CONFIG_HPET_TIMER
528 hpet_disable();
529#endif
Miguel Boton4d022e32008-01-30 13:32:51 +0100530
531#ifdef CONFIG_X86_64
532 pci_iommu_shutdown();
533#endif
Eric W. Biedermandd2a1302005-06-25 14:57:55 -0700534}
535
Eduardo Habkostd1767202008-11-17 19:03:24 -0200536static void __machine_emergency_restart(int emergency)
537{
538 reboot_emergency = emergency;
539 machine_ops.emergency_restart();
540}
541
Jody Belka416e2d62008-02-12 23:37:48 +0000542static void native_machine_restart(char *__unused)
Jeremy Fitzhardinge973efae2007-05-02 19:27:06 +0200543{
Miguel Boton4d022e32008-01-30 13:32:51 +0100544 printk("machine restart\n");
Jeremy Fitzhardinge973efae2007-05-02 19:27:06 +0200545
Miguel Boton4d022e32008-01-30 13:32:51 +0100546 if (!reboot_force)
Eric W. Biederman6e3fbee2006-01-11 22:43:12 +0100547 machine_shutdown();
Eduardo Habkostd1767202008-11-17 19:03:24 -0200548 __machine_emergency_restart(0);
Jeremy Fitzhardinge07f33312007-05-02 19:27:11 +0200549}
550
Jody Belka416e2d62008-02-12 23:37:48 +0000551static void native_machine_halt(void)
Jeremy Fitzhardinge07f33312007-05-02 19:27:11 +0200552{
Ivan Vecerad3ec5ca2008-11-11 14:33:44 +0100553 /* stop other cpus and apics */
554 machine_shutdown();
555
556 /* stop this cpu */
557 stop_this_cpu(NULL);
Jeremy Fitzhardinge07f33312007-05-02 19:27:11 +0200558}
Miguel Boton4d022e32008-01-30 13:32:51 +0100559
Jody Belka416e2d62008-02-12 23:37:48 +0000560static void native_machine_power_off(void)
Miguel Boton4d022e32008-01-30 13:32:51 +0100561{
562 if (pm_power_off) {
563 if (!reboot_force)
564 machine_shutdown();
565 pm_power_off();
566 }
567}
568
569struct machine_ops machine_ops = {
Jody Belka416e2d62008-02-12 23:37:48 +0000570 .power_off = native_machine_power_off,
571 .shutdown = native_machine_shutdown,
572 .emergency_restart = native_machine_emergency_restart,
573 .restart = native_machine_restart,
Glauber Costaed23dc62008-03-17 16:08:38 -0300574 .halt = native_machine_halt,
575#ifdef CONFIG_KEXEC
576 .crash_shutdown = native_machine_crash_shutdown,
577#endif
Miguel Boton4d022e32008-01-30 13:32:51 +0100578};
Jody Belka416e2d62008-02-12 23:37:48 +0000579
580void machine_power_off(void)
581{
582 machine_ops.power_off();
583}
584
585void machine_shutdown(void)
586{
587 machine_ops.shutdown();
588}
589
590void machine_emergency_restart(void)
591{
Eduardo Habkostd1767202008-11-17 19:03:24 -0200592 __machine_emergency_restart(1);
Jody Belka416e2d62008-02-12 23:37:48 +0000593}
594
595void machine_restart(char *cmd)
596{
597 machine_ops.restart(cmd);
598}
599
600void machine_halt(void)
601{
602 machine_ops.halt();
603}
604
Glauber Costaed23dc62008-03-17 16:08:38 -0300605#ifdef CONFIG_KEXEC
606void machine_crash_shutdown(struct pt_regs *regs)
607{
608 machine_ops.crash_shutdown(regs);
609}
610#endif
Eduardo Habkost2ddded22008-11-12 11:34:42 -0200611
612
Eduardo Habkostbb8dd272008-11-12 11:34:43 -0200613#if defined(CONFIG_SMP)
Eduardo Habkost2ddded22008-11-12 11:34:42 -0200614
615/* This keeps a track of which one is crashing cpu. */
616static int crashing_cpu;
617static nmi_shootdown_cb shootdown_callback;
618
619static atomic_t waiting_for_crash_ipi;
620
621static int crash_nmi_callback(struct notifier_block *self,
622 unsigned long val, void *data)
623{
624 int cpu;
625
626 if (val != DIE_NMI_IPI)
627 return NOTIFY_OK;
628
629 cpu = raw_smp_processor_id();
630
631 /* Don't do anything if this handler is invoked on crashing cpu.
632 * Otherwise, system will completely hang. Crashing cpu can get
633 * an NMI if system was initially booted with nmi_watchdog parameter.
634 */
635 if (cpu == crashing_cpu)
636 return NOTIFY_STOP;
637 local_irq_disable();
638
639 shootdown_callback(cpu, (struct die_args *)data);
640
641 atomic_dec(&waiting_for_crash_ipi);
642 /* Assume hlt works */
643 halt();
644 for (;;)
645 cpu_relax();
646
647 return 1;
648}
649
650static void smp_send_nmi_allbutself(void)
651{
Ingo Molnardac5f412009-01-28 15:42:24 +0100652 apic->send_IPI_allbutself(NMI_VECTOR);
Eduardo Habkost2ddded22008-11-12 11:34:42 -0200653}
654
655static struct notifier_block crash_nmi_nb = {
656 .notifier_call = crash_nmi_callback,
657};
658
Eduardo Habkostbb8dd272008-11-12 11:34:43 -0200659/* Halt all other CPUs, calling the specified function on each of them
660 *
661 * This function can be used to halt all other CPUs on crash
662 * or emergency reboot time. The function passed as parameter
663 * will be called inside a NMI handler on all CPUs.
664 */
Eduardo Habkost2ddded22008-11-12 11:34:42 -0200665void nmi_shootdown_cpus(nmi_shootdown_cb callback)
666{
667 unsigned long msecs;
Eduardo Habkostc415b3d2008-11-12 11:34:44 -0200668 local_irq_disable();
Eduardo Habkost2ddded22008-11-12 11:34:42 -0200669
670 /* Make a note of crashing cpu. Will be used in NMI callback.*/
671 crashing_cpu = safe_smp_processor_id();
672
673 shootdown_callback = callback;
674
675 atomic_set(&waiting_for_crash_ipi, num_online_cpus() - 1);
676 /* Would it be better to replace the trap vector here? */
677 if (register_die_notifier(&crash_nmi_nb))
678 return; /* return what? */
679 /* Ensure the new callback function is set before sending
680 * out the NMI
681 */
682 wmb();
683
684 smp_send_nmi_allbutself();
685
686 msecs = 1000; /* Wait at most a second for the other cpus to stop */
687 while ((atomic_read(&waiting_for_crash_ipi) > 0) && msecs) {
688 mdelay(1);
689 msecs--;
690 }
691
692 /* Leave the nmi callback set */
693}
Eduardo Habkostbb8dd272008-11-12 11:34:43 -0200694#else /* !CONFIG_SMP */
695void nmi_shootdown_cpus(nmi_shootdown_cb callback)
696{
697 /* No other CPUs to shoot down */
698}
Eduardo Habkost2ddded22008-11-12 11:34:42 -0200699#endif