1 #include <linux/module.h>
2 #include <linux/reboot.h>
3 #include <linux/init.h>
6 #include <acpi/reboot.h>
11 #include <asm/pgtable.h>
12 #include <asm/proto.h>
13 #include <asm/reboot_fixups.h>
14 #include <asm/reboot.h>
15 #include <asm/pci_x86.h>
16 #include <asm/virtext.h>
20 # include <linux/dmi.h>
21 # include <linux/ctype.h>
22 # include <linux/mc146818rtc.h>
24 # include <asm/iommu.h>
28 * Power off function, if any
30 void (*pm_power_off
)(void);
31 EXPORT_SYMBOL(pm_power_off
);
33 static const struct desc_ptr no_idt
= {};
34 static int reboot_mode
;
35 enum reboot_type reboot_type
= BOOT_KBD
;
38 #if defined(CONFIG_X86_32) && defined(CONFIG_SMP)
39 static int reboot_cpu
= -1;
42 /* This is set if we need to go through the 'emergency' path.
43 * When machine_emergency_restart() is called, we may be in
44 * an inconsistent state and won't be able to do a clean cleanup
46 static int reboot_emergency
;
48 /* This is set by the PCI code if either type 1 or type 2 PCI is detected */
49 bool port_cf9_safe
= false;
51 /* reboot=b[ios] | s[mp] | t[riple] | k[bd] | e[fi] [, [w]arm | [c]old] | p[ci]
52 warm Don't set the cold reboot flag
53 cold Set the cold reboot flag
54 bios Reboot by jumping through the BIOS (only for X86_32)
55 smp Reboot by executing reset on BSP or other CPU (only for X86_32)
56 triple Force a triple fault (init)
57 kbd Use the keyboard controller. cold reset (default)
58 acpi Use the RESET_REG in the FADT
59 efi Use efi reset_system runtime service
60 pci Use the so-called "PCI reset register", CF9
61 force Avoid anything that could hang.
63 static int __init
reboot_setup(char *str
)
78 if (isdigit(*(str
+1))) {
79 reboot_cpu
= (int) (*(str
+1) - '0');
80 if (isdigit(*(str
+2)))
81 reboot_cpu
= reboot_cpu
*10 + (int)(*(str
+2) - '0');
83 /* we will leave sorting out the final value
84 when we are ready to reboot, since we might not
85 have set up boot_cpu_id or smp_num_cpu */
87 #endif /* CONFIG_SMP */
104 str
= strchr(str
, ',');
113 __setup("reboot=", reboot_setup
);
118 * Reboot options and system auto-detection code provided by
119 * Dell Inc. so their systems "just work". :-)
123 * Some machines require the "reboot=b" commandline option,
124 * this quirk makes that automatic.
126 static int __init
set_bios_reboot(const struct dmi_system_id
*d
)
128 if (reboot_type
!= BOOT_BIOS
) {
129 reboot_type
= BOOT_BIOS
;
130 printk(KERN_INFO
"%s series board detected. Selecting BIOS-method for reboots.\n", d
->ident
);
135 static struct dmi_system_id __initdata reboot_dmi_table
[] = {
136 { /* Handle problems with rebooting on Dell E520's */
137 .callback
= set_bios_reboot
,
138 .ident
= "Dell E520",
140 DMI_MATCH(DMI_SYS_VENDOR
, "Dell Inc."),
141 DMI_MATCH(DMI_PRODUCT_NAME
, "Dell DM061"),
144 { /* Handle problems with rebooting on Dell 1300's */
145 .callback
= set_bios_reboot
,
146 .ident
= "Dell PowerEdge 1300",
148 DMI_MATCH(DMI_SYS_VENDOR
, "Dell Computer Corporation"),
149 DMI_MATCH(DMI_PRODUCT_NAME
, "PowerEdge 1300/"),
152 { /* Handle problems with rebooting on Dell 300's */
153 .callback
= set_bios_reboot
,
154 .ident
= "Dell PowerEdge 300",
156 DMI_MATCH(DMI_SYS_VENDOR
, "Dell Computer Corporation"),
157 DMI_MATCH(DMI_PRODUCT_NAME
, "PowerEdge 300/"),
160 { /* Handle problems with rebooting on Dell Optiplex 745's SFF*/
161 .callback
= set_bios_reboot
,
162 .ident
= "Dell OptiPlex 745",
164 DMI_MATCH(DMI_SYS_VENDOR
, "Dell Inc."),
165 DMI_MATCH(DMI_PRODUCT_NAME
, "OptiPlex 745"),
168 { /* Handle problems with rebooting on Dell Optiplex 745's DFF*/
169 .callback
= set_bios_reboot
,
170 .ident
= "Dell OptiPlex 745",
172 DMI_MATCH(DMI_SYS_VENDOR
, "Dell Inc."),
173 DMI_MATCH(DMI_PRODUCT_NAME
, "OptiPlex 745"),
174 DMI_MATCH(DMI_BOARD_NAME
, "0MM599"),
177 { /* Handle problems with rebooting on Dell Optiplex 745 with 0KW626 */
178 .callback
= set_bios_reboot
,
179 .ident
= "Dell OptiPlex 745",
181 DMI_MATCH(DMI_SYS_VENDOR
, "Dell Inc."),
182 DMI_MATCH(DMI_PRODUCT_NAME
, "OptiPlex 745"),
183 DMI_MATCH(DMI_BOARD_NAME
, "0KW626"),
186 { /* Handle problems with rebooting on Dell Optiplex 330 with 0KP561 */
187 .callback
= set_bios_reboot
,
188 .ident
= "Dell OptiPlex 330",
190 DMI_MATCH(DMI_SYS_VENDOR
, "Dell Inc."),
191 DMI_MATCH(DMI_PRODUCT_NAME
, "OptiPlex 330"),
192 DMI_MATCH(DMI_BOARD_NAME
, "0KP561"),
195 { /* Handle problems with rebooting on Dell Optiplex 360 with 0T656F */
196 .callback
= set_bios_reboot
,
197 .ident
= "Dell OptiPlex 360",
199 DMI_MATCH(DMI_SYS_VENDOR
, "Dell Inc."),
200 DMI_MATCH(DMI_PRODUCT_NAME
, "OptiPlex 360"),
201 DMI_MATCH(DMI_BOARD_NAME
, "0T656F"),
204 { /* Handle problems with rebooting on Dell 2400's */
205 .callback
= set_bios_reboot
,
206 .ident
= "Dell PowerEdge 2400",
208 DMI_MATCH(DMI_SYS_VENDOR
, "Dell Computer Corporation"),
209 DMI_MATCH(DMI_PRODUCT_NAME
, "PowerEdge 2400"),
212 { /* Handle problems with rebooting on Dell T5400's */
213 .callback
= set_bios_reboot
,
214 .ident
= "Dell Precision T5400",
216 DMI_MATCH(DMI_SYS_VENDOR
, "Dell Inc."),
217 DMI_MATCH(DMI_PRODUCT_NAME
, "Precision WorkStation T5400"),
220 { /* Handle problems with rebooting on HP laptops */
221 .callback
= set_bios_reboot
,
222 .ident
= "HP Compaq Laptop",
224 DMI_MATCH(DMI_SYS_VENDOR
, "Hewlett-Packard"),
225 DMI_MATCH(DMI_PRODUCT_NAME
, "HP Compaq"),
228 { /* Handle problems with rebooting on Dell XPS710 */
229 .callback
= set_bios_reboot
,
230 .ident
= "Dell XPS710",
232 DMI_MATCH(DMI_SYS_VENDOR
, "Dell Inc."),
233 DMI_MATCH(DMI_PRODUCT_NAME
, "Dell XPS710"),
239 static int __init
reboot_init(void)
241 dmi_check_system(reboot_dmi_table
);
244 core_initcall(reboot_init
);
246 /* The following code and data reboots the machine by switching to real
247 mode and jumping to the BIOS reset entry point, as if the CPU has
248 really been reset. The previous version asked the keyboard
249 controller to pulse the CPU reset line, which is more thorough, but
250 doesn't work with at least one type of 486 motherboard. It is easy
251 to stop this code working; hence the copious comments. */
252 static const unsigned long long
253 real_mode_gdt_entries
[3] =
255 0x0000000000000000ULL
, /* Null descriptor */
256 0x00009b000000ffffULL
, /* 16-bit real-mode 64k code at 0x00000000 */
257 0x000093000100ffffULL
/* 16-bit real-mode 64k data at 0x00000100 */
260 static const struct desc_ptr
261 real_mode_gdt
= { sizeof (real_mode_gdt_entries
) - 1, (long)real_mode_gdt_entries
},
262 real_mode_idt
= { 0x3ff, 0 };
264 /* This is 16-bit protected mode code to disable paging and the cache,
265 switch to real mode and jump to the BIOS reset code.
267 The instruction that switches to real mode by writing to CR0 must be
268 followed immediately by a far jump instruction, which sets CS to a
269 valid value for real mode, and flushes the prefetch queue to avoid
270 running instructions that have already been decoded in protected
273 Clears all the flags except ET, especially PG (paging), PE
274 (protected-mode enable) and TS (task switch for coprocessor state
275 save). Flushes the TLB after paging has been disabled. Sets CD and
276 NW, to disable the cache on a 486, and invalidates the cache. This
277 is more like the state of a 486 after reset. I don't know if
278 something else should be done for other chips.
280 More could be done here to set up the registers as if a CPU reset had
281 occurred; hopefully real BIOSs don't assume much. */
282 static const unsigned char real_mode_switch
[] =
284 0x66, 0x0f, 0x20, 0xc0, /* movl %cr0,%eax */
285 0x66, 0x83, 0xe0, 0x11, /* andl $0x00000011,%eax */
286 0x66, 0x0d, 0x00, 0x00, 0x00, 0x60, /* orl $0x60000000,%eax */
287 0x66, 0x0f, 0x22, 0xc0, /* movl %eax,%cr0 */
288 0x66, 0x0f, 0x22, 0xd8, /* movl %eax,%cr3 */
289 0x66, 0x0f, 0x20, 0xc3, /* movl %cr0,%ebx */
290 0x66, 0x81, 0xe3, 0x00, 0x00, 0x00, 0x60, /* andl $0x60000000,%ebx */
291 0x74, 0x02, /* jz f */
292 0x0f, 0x09, /* wbinvd */
293 0x24, 0x10, /* f: andb $0x10,al */
294 0x66, 0x0f, 0x22, 0xc0 /* movl %eax,%cr0 */
296 static const unsigned char jump_to_bios
[] =
298 0xea, 0x00, 0x00, 0xff, 0xff /* ljmp $0xffff,$0x0000 */
302 * Switch to real mode and then execute the code
303 * specified by the code and length parameters.
304 * We assume that length will always be less than 100!
306 void machine_real_restart(const unsigned char *code
, int length
)
310 /* Write zero to CMOS register number 0x0f, which the BIOS POST
311 routine will recognize as telling it to do a proper reboot. (Well
312 that's what this book in front of me says -- it may only apply to
313 the Phoenix BIOS though, it's not clear). At the same time,
314 disable NMIs by setting the top bit in the CMOS address register,
315 as we're about to do peculiar things to the CPU. I'm not sure if
316 `outb_p' is needed instead of just `outb'. Use it to be on the
317 safe side. (Yes, CMOS_WRITE does outb_p's. - Paul G.)
319 spin_lock(&rtc_lock
);
320 CMOS_WRITE(0x00, 0x8f);
321 spin_unlock(&rtc_lock
);
323 /* Remap the kernel at virtual address zero, as well as offset zero
324 from the kernel segment. This assumes the kernel segment starts at
325 virtual address PAGE_OFFSET. */
326 memcpy(swapper_pg_dir
, swapper_pg_dir
+ KERNEL_PGD_BOUNDARY
,
327 sizeof(swapper_pg_dir
[0]) * KERNEL_PGD_PTRS
);
330 * Use `swapper_pg_dir' as our page directory.
332 load_cr3(swapper_pg_dir
);
334 /* Write 0x1234 to absolute memory location 0x472. The BIOS reads
335 this on booting to tell it to "Bypass memory test (also warm
336 boot)". This seems like a fairly standard thing that gets set by
337 REBOOT.COM programs, and the previous reset routine did this
339 *((unsigned short *)0x472) = reboot_mode
;
341 /* For the switch to real mode, copy some code to low memory. It has
342 to be in the first 64k because it is running in 16-bit mode, and it
343 has to have the same physical and virtual address, because it turns
344 off paging. Copy it near the end of the first page, out of the way
345 of BIOS variables. */
346 memcpy((void *)(0x1000 - sizeof(real_mode_switch
) - 100),
347 real_mode_switch
, sizeof (real_mode_switch
));
348 memcpy((void *)(0x1000 - 100), code
, length
);
350 /* Set up the IDT for real mode. */
351 load_idt(&real_mode_idt
);
353 /* Set up a GDT from which we can load segment descriptors for real
354 mode. The GDT is not used in real mode; it is just needed here to
355 prepare the descriptors. */
356 load_gdt(&real_mode_gdt
);
358 /* Load the data segment registers, and thus the descriptors ready for
359 real mode. The base address of each segment is 0x100, 16 times the
360 selector value being loaded here. This is so that the segment
361 registers don't have to be reloaded after switching to real mode:
362 the values are consistent for real mode operation already. */
363 __asm__
__volatile__ ("movl $0x0010,%%eax\n"
364 "\tmovl %%eax,%%ds\n"
365 "\tmovl %%eax,%%es\n"
366 "\tmovl %%eax,%%fs\n"
367 "\tmovl %%eax,%%gs\n"
368 "\tmovl %%eax,%%ss" : : : "eax");
370 /* Jump to the 16-bit code that we copied earlier. It disables paging
371 and the cache, switches to real mode, and jumps to the BIOS reset
373 __asm__
__volatile__ ("ljmp $0x0008,%0"
375 : "i" ((void *)(0x1000 - sizeof (real_mode_switch
) - 100)));
377 #ifdef CONFIG_APM_MODULE
378 EXPORT_SYMBOL(machine_real_restart
);
381 #endif /* CONFIG_X86_32 */
383 static inline void kb_wait(void)
387 for (i
= 0; i
< 0x10000; i
++) {
388 if ((inb(0x64) & 0x02) == 0)
394 static void vmxoff_nmi(int cpu
, struct die_args
*args
)
396 cpu_emergency_vmxoff();
399 /* Use NMIs as IPIs to tell all CPUs to disable virtualization
401 static void emergency_vmx_disable_all(void)
403 /* Just make sure we won't change CPUs while doing this */
406 /* We need to disable VMX on all CPUs before rebooting, otherwise
407 * we risk hanging up the machine, because the CPU ignores INIT
408 * signals when VMX is enabled.
410 * We can't take any locks and we may be in an inconsistent
411 * state, so we use NMIs as IPIs to tell the other CPUs to disable
414 * For safety, we will avoid running the nmi_shootdown_cpus()
415 * stuff unnecessarily, but we don't have a way to check
416 * if other CPUs have VMX enabled. So we will call it only if the
417 * CPU we are running on has VMX enabled.
419 * We will miss cases where VMX is not enabled on all CPUs. This
420 * shouldn't do much harm because KVM always enables VMX on all
421 * CPUs anyway. But we can miss it on the small window where KVM
422 * is still enabling VMX.
424 if (cpu_has_vmx() && cpu_vmx_enabled()) {
425 /* Disable VMX on this CPU.
429 /* Halt and disable VMX on the other CPUs */
430 nmi_shootdown_cpus(vmxoff_nmi
);
436 void __attribute__((weak
)) mach_reboot_fixups(void)
440 static void native_machine_emergency_restart(void)
444 if (reboot_emergency
)
445 emergency_vmx_disable_all();
447 /* Tell the BIOS if we want cold or warm reboot */
448 *((unsigned short *)__va(0x472)) = reboot_mode
;
451 /* Could also try the reset bit in the Hammer NB */
452 switch (reboot_type
) {
454 mach_reboot_fixups(); /* for board specific fixups */
456 for (i
= 0; i
< 10; i
++) {
459 outb(0xfe, 0x64); /* pulse reset low */
465 __asm__
__volatile__("int3");
467 reboot_type
= BOOT_KBD
;
472 machine_real_restart(jump_to_bios
, sizeof(jump_to_bios
));
474 reboot_type
= BOOT_KBD
;
480 reboot_type
= BOOT_KBD
;
485 efi
.reset_system(reboot_mode
?
488 EFI_SUCCESS
, 0, NULL
);
489 reboot_type
= BOOT_KBD
;
493 port_cf9_safe
= true;
498 u8 cf9
= inb(0xcf9) & ~6;
499 outb(cf9
|2, 0xcf9); /* Request hard reset */
501 outb(cf9
|6, 0xcf9); /* Actually do the reset */
504 reboot_type
= BOOT_KBD
;
510 void native_machine_shutdown(void)
512 /* Stop the cpus and apics */
515 /* The boot cpu is always logical cpu 0 */
516 int reboot_cpu_id
= 0;
519 /* See if there has been given a command line override */
520 if ((reboot_cpu
!= -1) && (reboot_cpu
< nr_cpu_ids
) &&
521 cpu_online(reboot_cpu
))
522 reboot_cpu_id
= reboot_cpu
;
525 /* Make certain the cpu I'm about to reboot on is online */
526 if (!cpu_online(reboot_cpu_id
))
527 reboot_cpu_id
= smp_processor_id();
529 /* Make certain I only run on the appropriate processor */
530 set_cpus_allowed_ptr(current
, cpumask_of(reboot_cpu_id
));
532 /* O.K Now that I'm on the appropriate processor,
533 * stop all of the others.
540 #ifdef CONFIG_X86_IO_APIC
544 #ifdef CONFIG_HPET_TIMER
549 pci_iommu_shutdown();
553 static void __machine_emergency_restart(int emergency
)
555 reboot_emergency
= emergency
;
556 machine_ops
.emergency_restart();
559 static void native_machine_restart(char *__unused
)
561 printk("machine restart\n");
565 __machine_emergency_restart(0);
568 static void native_machine_halt(void)
570 /* stop other cpus and apics */
577 static void native_machine_power_off(void)
586 struct machine_ops machine_ops
= {
587 .power_off
= native_machine_power_off
,
588 .shutdown
= native_machine_shutdown
,
589 .emergency_restart
= native_machine_emergency_restart
,
590 .restart
= native_machine_restart
,
591 .halt
= native_machine_halt
,
593 .crash_shutdown
= native_machine_crash_shutdown
,
597 void machine_power_off(void)
599 machine_ops
.power_off();
602 void machine_shutdown(void)
604 machine_ops
.shutdown();
607 void machine_emergency_restart(void)
609 __machine_emergency_restart(1);
612 void machine_restart(char *cmd
)
614 machine_ops
.restart(cmd
);
617 void machine_halt(void)
623 void machine_crash_shutdown(struct pt_regs
*regs
)
625 machine_ops
.crash_shutdown(regs
);
630 #if defined(CONFIG_SMP)
632 /* This keeps track of which CPU is the crashing one. */
633 static int crashing_cpu
;
634 static nmi_shootdown_cb shootdown_callback
;
636 static atomic_t waiting_for_crash_ipi
;
638 static int crash_nmi_callback(struct notifier_block
*self
,
639 unsigned long val
, void *data
)
643 if (val
!= DIE_NMI_IPI
)
646 cpu
= raw_smp_processor_id();
648 /* Don't do anything if this handler is invoked on the crashing cpu.
649 * Otherwise, the system will completely hang. The crashing cpu can get
650 * an NMI if the system was initially booted with the nmi_watchdog parameter.
652 if (cpu
== crashing_cpu
)
656 shootdown_callback(cpu
, (struct die_args
*)data
);
658 atomic_dec(&waiting_for_crash_ipi
);
659 /* Assume hlt works */
667 static void smp_send_nmi_allbutself(void)
669 apic
->send_IPI_allbutself(NMI_VECTOR
);
672 static struct notifier_block crash_nmi_nb
= {
673 .notifier_call
= crash_nmi_callback
,
676 /* Halt all other CPUs, calling the specified function on each of them
678 * This function can be used to halt all other CPUs on crash
679 * or emergency reboot time. The function passed as parameter
680 * will be called inside an NMI handler on all CPUs.
682 void nmi_shootdown_cpus(nmi_shootdown_cb callback
)
687 /* Make a note of crashing cpu. Will be used in NMI callback.*/
688 crashing_cpu
= safe_smp_processor_id();
690 shootdown_callback
= callback
;
692 atomic_set(&waiting_for_crash_ipi
, num_online_cpus() - 1);
693 /* Would it be better to replace the trap vector here? */
694 if (register_die_notifier(&crash_nmi_nb
))
695 return; /* return what? */
696 /* Ensure the new callback function is set before sending
701 smp_send_nmi_allbutself();
703 msecs
= 1000; /* Wait at most a second for the other cpus to stop */
704 while ((atomic_read(&waiting_for_crash_ipi
) > 0) && msecs
) {
709 /* Leave the nmi callback set */
711 #else /* !CONFIG_SMP */
712 void nmi_shootdown_cpus(nmi_shootdown_cb callback
)
714 /* No other CPUs to shoot down */