blob: 25d5c30735820873acddb33216105563ad19dc3b [file] [log] [blame]
/*
 *  Copyright (C) 1991, 1992  Linus Torvalds
 *  Copyright (C) 2000, 2001, 2002 Andi Kleen, SuSE Labs
 *
 *  Pentium III FXSR, SSE support
 *	Gareth Hughes <gareth@valinux.com>, May 2000
 */

/*
 * Handle hardware traps and faults.
 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <linux/interrupt.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070013#include <linux/kallsyms.h>
Ingo Molnarb5964402008-02-26 11:15:50 +010014#include <linux/spinlock.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070015#include <linux/kprobes.h>
Andrew Morton1e2af922006-09-27 01:51:15 -070016#include <linux/uaccess.h>
Ingo Molnarb5964402008-02-26 11:15:50 +010017#include <linux/utsname.h>
18#include <linux/kdebug.h>
19#include <linux/kernel.h>
20#include <linux/module.h>
21#include <linux/ptrace.h>
22#include <linux/string.h>
23#include <linux/unwind.h>
24#include <linux/delay.h>
25#include <linux/errno.h>
26#include <linux/kexec.h>
27#include <linux/sched.h>
28#include <linux/timer.h>
29#include <linux/init.h>
Jeremy Fitzhardinge91768d62006-12-08 02:36:21 -080030#include <linux/bug.h>
Ingo Molnarb5964402008-02-26 11:15:50 +010031#include <linux/nmi.h>
32#include <linux/mm.h>
Alexander van Heukelumc1d518c2008-10-03 23:17:11 +020033#include <linux/smp.h>
34#include <linux/io.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035
36#ifdef CONFIG_EISA
37#include <linux/ioport.h>
38#include <linux/eisa.h>
39#endif
40
41#ifdef CONFIG_MCA
42#include <linux/mca.h>
43#endif
44
Dave Jiangc0d12172007-07-19 01:49:46 -070045#if defined(CONFIG_EDAC)
46#include <linux/edac.h>
47#endif
48
Ingo Molnarb5964402008-02-26 11:15:50 +010049#include <asm/stacktrace.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070050#include <asm/processor.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070051#include <asm/debugreg.h>
Ingo Molnarb5964402008-02-26 11:15:50 +010052#include <asm/atomic.h>
53#include <asm/system.h>
54#include <asm/unwind.h>
Alexander van Heukelumc1d518c2008-10-03 23:17:11 +020055#include <asm/traps.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070056#include <asm/desc.h>
57#include <asm/i387.h>
Alexander van Heukelumc1d518c2008-10-03 23:17:11 +020058
59#include <mach_traps.h>
60
Alexander van Heukelum081f75b2008-10-03 22:00:39 +020061#ifdef CONFIG_X86_64
62#include <asm/pgalloc.h>
63#include <asm/proto.h>
64#include <asm/pda.h>
65#else
Alexander van Heukelumc1d518c2008-10-03 23:17:11 +020066#include <asm/processor-flags.h>
67#include <asm/arch_hooks.h>
Jaswinder Singh6ac8d512008-07-15 21:09:13 +053068#include <asm/traps.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070069
Alexander van Heukelumeb642f62008-09-09 21:56:11 +020070#include "cpu/mcheck/mce.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -070071
72asmlinkage int system_call(void);
73
Linus Torvalds1da177e2005-04-16 15:20:36 -070074/* Do we ignore FPU interrupts ? */
Ingo Molnarb5964402008-02-26 11:15:50 +010075char ignore_fpu_irq;
Linus Torvalds1da177e2005-04-16 15:20:36 -070076
77/*
78 * The IDT has to be page-aligned to simplify the Pentium
79 * F0 0F bug workaround.. We have a special link segment
80 * for this.
81 */
Glauber de Oliveira Costa010d4f82008-01-30 13:31:12 +010082gate_desc idt_table[256]
Glauber de Oliveira Costa6842ef02008-01-30 13:31:11 +010083 __attribute__((__section__(".data.idt"))) = { { { { 0, 0 } } }, };
Alexander van Heukelum081f75b2008-10-03 22:00:39 +020084#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070085
/* Bitmap with NR_VECTORS bits, exported to GPL modules. */
DECLARE_BITMAP(used_vectors, NR_VECTORS);
EXPORT_SYMBOL_GPL(used_vectors);

/*
 * While non-zero, do_nmi() skips default_do_nmi(). Incremented by
 * stop_nmi() and decremented by restart_nmi().
 */
static int ignore_nmis;
Alan Sterne041c682006-03-27 01:16:30 -080090
Alexander van Heukelum762db432008-09-09 21:55:55 +020091static inline void conditional_sti(struct pt_regs *regs)
92{
93 if (regs->flags & X86_EFLAGS_IF)
94 local_irq_enable();
95}
96
Alexander van Heukelum3d2a71a2008-09-30 18:41:37 +020097static inline void preempt_conditional_sti(struct pt_regs *regs)
98{
99 inc_preempt_count();
100 if (regs->flags & X86_EFLAGS_IF)
101 local_irq_enable();
102}
103
104static inline void preempt_conditional_cli(struct pt_regs *regs)
105{
106 if (regs->flags & X86_EFLAGS_IF)
107 local_irq_disable();
108 dec_preempt_count();
109}
110
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200111#ifdef CONFIG_X86_32
/*
 * Call die(@str, @regs, @err) unless user_mode_vm() reports that
 * @regs describes a user-mode context.
 */
static inline void
die_if_kernel(const char *str, struct pt_regs *regs, long err)
{
	if (!user_mode_vm(regs))
		die(str, regs, err);
}
118
Alexander van Heukelumae821572008-09-30 18:41:35 +0200119/*
120 * Perform the lazy TSS's I/O bitmap copy. If the TSS has an
121 * invalid offset set (the LAZY one) and the faulting thread has
122 * a valid I/O bitmap pointer, we copy the I/O bitmap in the TSS,
123 * we set the offset field correctly and return 1.
124 */
125static int lazy_iobitmap_copy(void)
126{
127 struct thread_struct *thread;
128 struct tss_struct *tss;
129 int cpu;
130
131 cpu = get_cpu();
132 tss = &per_cpu(init_tss, cpu);
133 thread = &current->thread;
134
135 if (tss->x86_tss.io_bitmap_base == INVALID_IO_BITMAP_OFFSET_LAZY &&
136 thread->io_bitmap_ptr) {
137 memcpy(tss->io_bitmap, thread->io_bitmap_ptr,
138 thread->io_bitmap_max);
139 /*
140 * If the previously set map was extending to higher ports
141 * than the current one, pad extra space with 0xff (no access).
142 */
143 if (thread->io_bitmap_max < tss->io_bitmap_max) {
144 memset((char *) tss->io_bitmap +
145 thread->io_bitmap_max, 0xff,
146 tss->io_bitmap_max - thread->io_bitmap_max);
147 }
148 tss->io_bitmap_max = thread->io_bitmap_max;
149 tss->x86_tss.io_bitmap_base = IO_BITMAP_OFFSET;
150 tss->io_bitmap_owner = thread;
151 put_cpu();
152
153 return 1;
154 }
155 put_cpu();
156
157 return 0;
158}
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200159#endif
Alexander van Heukelumae821572008-09-30 18:41:35 +0200160
Ingo Molnarb5964402008-02-26 11:15:50 +0100161static void __kprobes
Alexander van Heukelum3c1326f2008-09-26 14:03:08 +0200162do_trap(int trapnr, int signr, char *str, struct pt_regs *regs,
Ingo Molnarb5964402008-02-26 11:15:50 +0100163 long error_code, siginfo_t *info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700164{
Alexander Nyberg4f339ec2005-06-25 14:58:27 -0700165 struct task_struct *tsk = current;
Alexander Nyberg4f339ec2005-06-25 14:58:27 -0700166
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200167#ifdef CONFIG_X86_32
gorcunov@gmail.com6b6891f2008-03-28 17:56:57 +0300168 if (regs->flags & X86_VM_MASK) {
Alexander van Heukelum3c1326f2008-09-26 14:03:08 +0200169 /*
170 * traps 0, 1, 3, 4, and 5 should be forwarded to vm86.
171 * On nmi (interrupt 2), do_trap should not be called.
172 */
173 if (trapnr < 6)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700174 goto vm86_trap;
175 goto trap_signal;
176 }
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200177#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700178
Vincent Hanquez717b5942005-06-23 00:08:45 -0700179 if (!user_mode(regs))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180 goto kernel_trap;
181
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200182#ifdef CONFIG_X86_32
Ingo Molnarb5964402008-02-26 11:15:50 +0100183trap_signal:
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200184#endif
Ingo Molnarb5964402008-02-26 11:15:50 +0100185 /*
186 * We want error_code and trap_no set for userspace faults and
187 * kernelspace faults which result in die(), but not
188 * kernelspace faults which are fixed up. die() gives the
189 * process no chance to handle the signal and notice the
190 * kernel fault information, so that won't result in polluting
191 * the information about previously queued, but not yet
192 * delivered, faults. See also do_general_protection below.
193 */
194 tsk->thread.error_code = error_code;
195 tsk->thread.trap_no = trapnr;
196
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200197#ifdef CONFIG_X86_64
198 if (show_unhandled_signals && unhandled_signal(tsk, signr) &&
199 printk_ratelimit()) {
200 printk(KERN_INFO
201 "%s[%d] trap %s ip:%lx sp:%lx error:%lx",
202 tsk->comm, tsk->pid, str,
203 regs->ip, regs->sp, error_code);
204 print_vma_addr(" in ", regs->ip);
205 printk("\n");
206 }
207#endif
208
Ingo Molnarb5964402008-02-26 11:15:50 +0100209 if (info)
210 force_sig_info(signr, info, tsk);
211 else
212 force_sig(signr, tsk);
213 return;
214
215kernel_trap:
216 if (!fixup_exception(regs)) {
Andi Kleend1895182007-05-02 19:27:05 +0200217 tsk->thread.error_code = error_code;
218 tsk->thread.trap_no = trapnr;
Ingo Molnarb5964402008-02-26 11:15:50 +0100219 die(str, regs, error_code);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220 }
Ingo Molnarb5964402008-02-26 11:15:50 +0100221 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700222
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200223#ifdef CONFIG_X86_32
Ingo Molnarb5964402008-02-26 11:15:50 +0100224vm86_trap:
225 if (handle_vm86_trap((struct kernel_vm86_regs *) regs,
226 error_code, trapnr))
227 goto trap_signal;
228 return;
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200229#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700230}
231
/*
 * Define do_<name>(): notify the die chain with DIE_TRAP, bail out on
 * NOTIFY_STOP, otherwise conditionally re-enable interrupts and hand
 * the trap to do_trap() without a siginfo.
 */
#define DO_ERROR(trapnr, signr, str, name)				\
dotraplinkage void do_##name(struct pt_regs *regs, long error_code)	\
{									\
	if (notify_die(DIE_TRAP, str, regs, error_code, trapnr, signr)	\
							== NOTIFY_STOP)	\
		return;							\
	conditional_sti(regs);						\
	do_trap(trapnr, signr, str, regs, error_code, NULL);		\
}
241
/*
 * Like DO_ERROR(), but the generated do_<name>() also fills in a
 * siginfo (si_signo = signr, si_errno = 0, si_code = sicode,
 * si_addr = siaddr) and passes it to do_trap(). @siaddr is evaluated
 * inside the handler, so it may refer to 'regs'.
 */
#define DO_ERROR_INFO(trapnr, signr, str, name, sicode, siaddr)		\
dotraplinkage void do_##name(struct pt_regs *regs, long error_code)	\
{									\
	siginfo_t info;							\
	info.si_signo = signr;						\
	info.si_errno = 0;						\
	info.si_code = sicode;						\
	info.si_addr = (void __user *)siaddr;				\
	if (notify_die(DIE_TRAP, str, regs, error_code, trapnr, signr)	\
							== NOTIFY_STOP)	\
		return;							\
	conditional_sti(regs);						\
	do_trap(trapnr, signr, str, regs, error_code, &info);		\
}
256
Alexander van Heukelum3c1326f2008-09-26 14:03:08 +0200257DO_ERROR_INFO(0, SIGFPE, "divide error", divide_error, FPE_INTDIV, regs->ip)
258DO_ERROR(4, SIGSEGV, "overflow", overflow)
259DO_ERROR(5, SIGSEGV, "bounds", bounds)
260DO_ERROR_INFO(6, SIGILL, "invalid opcode", invalid_op, ILL_ILLOPN, regs->ip)
Alexander van Heukelum51bc1ed2008-09-09 21:56:03 +0200261DO_ERROR(9, SIGFPE, "coprocessor segment overrun", coprocessor_segment_overrun)
Alexander van Heukelum6bf77bf2008-09-09 21:56:04 +0200262DO_ERROR(10, SIGSEGV, "invalid TSS", invalid_TSS)
Alexander van Heukelum36d936c2008-09-09 21:56:05 +0200263DO_ERROR(11, SIGBUS, "segment not present", segment_not_present)
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200264#ifdef CONFIG_X86_32
Alexander van Heukelumf5ca8182008-09-09 21:56:06 +0200265DO_ERROR(12, SIGBUS, "stack segment", stack_segment)
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200266#endif
Alexander van Heukelum3c1326f2008-09-26 14:03:08 +0200267DO_ERROR_INFO(17, SIGBUS, "alignment check", alignment_check, BUS_ADRALN, 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200269#ifdef CONFIG_X86_64
270/* Runs on IST stack */
271dotraplinkage void do_stack_segment(struct pt_regs *regs, long error_code)
272{
273 if (notify_die(DIE_TRAP, "stack segment", regs, error_code,
274 12, SIGBUS) == NOTIFY_STOP)
275 return;
276 preempt_conditional_sti(regs);
277 do_trap(12, SIGBUS, "stack segment", regs, error_code, NULL);
278 preempt_conditional_cli(regs);
279}
280
281dotraplinkage void do_double_fault(struct pt_regs *regs, long error_code)
282{
283 static const char str[] = "double fault";
284 struct task_struct *tsk = current;
285
286 /* Return not checked because double check cannot be ignored */
287 notify_die(DIE_TRAP, str, regs, error_code, 8, SIGSEGV);
288
289 tsk->thread.error_code = error_code;
290 tsk->thread.trap_no = 8;
291
Ingo Molnarbd8b96d2008-12-26 09:20:22 +0100292 /*
293 * This is always a kernel trap and never fixable (and thus must
294 * never return).
295 */
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200296 for (;;)
297 die(str, regs, error_code);
298}
299#endif
300
Alexander van Heukelume407d6202008-09-30 18:41:36 +0200301dotraplinkage void __kprobes
Alexander van Heukelum13485ab2008-07-02 01:32:04 +0200302do_general_protection(struct pt_regs *regs, long error_code)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303{
Alexander van Heukelum13485ab2008-07-02 01:32:04 +0200304 struct task_struct *tsk;
Ingo Molnarb5964402008-02-26 11:15:50 +0100305
Alexander van Heukelumc6df0d72008-09-09 21:56:07 +0200306 conditional_sti(regs);
307
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200308#ifdef CONFIG_X86_32
Alexander van Heukelumae821572008-09-30 18:41:35 +0200309 if (lazy_iobitmap_copy()) {
310 /* restart the faulting instruction */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700311 return;
312 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700313
gorcunov@gmail.com6b6891f2008-03-28 17:56:57 +0300314 if (regs->flags & X86_VM_MASK)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315 goto gp_in_vm86;
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200316#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700317
Alexander van Heukelum13485ab2008-07-02 01:32:04 +0200318 tsk = current;
Vincent Hanquez717b5942005-06-23 00:08:45 -0700319 if (!user_mode(regs))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700320 goto gp_in_kernel;
321
Alexander van Heukelum13485ab2008-07-02 01:32:04 +0200322 tsk->thread.error_code = error_code;
323 tsk->thread.trap_no = 13;
Ingo Molnarb5964402008-02-26 11:15:50 +0100324
Alexander van Heukelum13485ab2008-07-02 01:32:04 +0200325 if (show_unhandled_signals && unhandled_signal(tsk, SIGSEGV) &&
326 printk_ratelimit()) {
Masoud Asgharifard Sharbianiabd4f752007-07-22 11:12:28 +0200327 printk(KERN_INFO
Alexander van Heukelum13485ab2008-07-02 01:32:04 +0200328 "%s[%d] general protection ip:%lx sp:%lx error:%lx",
329 tsk->comm, task_pid_nr(tsk),
330 regs->ip, regs->sp, error_code);
Andi Kleen03252912008-01-30 13:33:18 +0100331 print_vma_addr(" in ", regs->ip);
332 printk("\n");
333 }
Masoud Asgharifard Sharbianiabd4f752007-07-22 11:12:28 +0200334
Alexander van Heukelum13485ab2008-07-02 01:32:04 +0200335 force_sig(SIGSEGV, tsk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700336 return;
337
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200338#ifdef CONFIG_X86_32
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339gp_in_vm86:
340 local_irq_enable();
341 handle_vm86_fault((struct kernel_vm86_regs *) regs, error_code);
342 return;
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200343#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344
345gp_in_kernel:
Alexander van Heukelum13485ab2008-07-02 01:32:04 +0200346 if (fixup_exception(regs))
347 return;
348
349 tsk->thread.error_code = error_code;
350 tsk->thread.trap_no = 13;
351 if (notify_die(DIE_GPF, "general protection fault", regs,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700352 error_code, 13, SIGSEGV) == NOTIFY_STOP)
Alexander van Heukelum13485ab2008-07-02 01:32:04 +0200353 return;
354 die("general protection fault", regs, error_code);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700355}
356
Steven Rostedt5deb45e2008-04-19 19:19:55 +0200357static notrace __kprobes void
Ingo Molnarb5964402008-02-26 11:15:50 +0100358mem_parity_error(unsigned char reason, struct pt_regs *regs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700359{
Ingo Molnarb5964402008-02-26 11:15:50 +0100360 printk(KERN_EMERG
361 "Uhhuh. NMI received for unknown reason %02x on CPU %d.\n",
362 reason, smp_processor_id());
363
364 printk(KERN_EMERG
365 "You have some hardware problem, likely on the PCI bus.\n");
Dave Jiangc0d12172007-07-19 01:49:46 -0700366
367#if defined(CONFIG_EDAC)
Ingo Molnarb5964402008-02-26 11:15:50 +0100368 if (edac_handler_set()) {
Dave Jiangc0d12172007-07-19 01:49:46 -0700369 edac_atomic_assert_error();
370 return;
371 }
372#endif
373
Don Zickus8da5add2006-09-26 10:52:27 +0200374 if (panic_on_unrecovered_nmi)
Ingo Molnarb5964402008-02-26 11:15:50 +0100375 panic("NMI: Not continuing");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376
Don Zickusc41c5cd2006-09-26 10:52:27 +0200377 printk(KERN_EMERG "Dazed and confused, but trying to continue\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700378
379 /* Clear and disable the memory parity error line. */
Alexander van Heukelum79704792008-10-03 22:00:36 +0200380 reason = (reason & 0xf) | 4;
381 outb(reason, 0x61);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700382}
383
Steven Rostedt5deb45e2008-04-19 19:19:55 +0200384static notrace __kprobes void
Ingo Molnarb5964402008-02-26 11:15:50 +0100385io_check_error(unsigned char reason, struct pt_regs *regs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700386{
387 unsigned long i;
388
Dave Jones9c107802006-01-09 20:51:32 -0800389 printk(KERN_EMERG "NMI: IOCK error (debug interrupt?)\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700390 show_registers(regs);
391
392 /* Re-enable the IOCK line, wait for a few seconds */
393 reason = (reason & 0xf) | 8;
394 outb(reason, 0x61);
Ingo Molnarb5964402008-02-26 11:15:50 +0100395
Linus Torvalds1da177e2005-04-16 15:20:36 -0700396 i = 2000;
Ingo Molnarb5964402008-02-26 11:15:50 +0100397 while (--i)
398 udelay(1000);
399
Linus Torvalds1da177e2005-04-16 15:20:36 -0700400 reason &= ~8;
401 outb(reason, 0x61);
402}
403
Steven Rostedt5deb45e2008-04-19 19:19:55 +0200404static notrace __kprobes void
Ingo Molnarb5964402008-02-26 11:15:50 +0100405unknown_nmi_error(unsigned char reason, struct pt_regs *regs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700406{
Alexander van Heukelumc1d518c2008-10-03 23:17:11 +0200407 if (notify_die(DIE_NMIUNKNOWN, "nmi", regs, reason, 2, SIGINT) ==
408 NOTIFY_STOP)
Jason Wesseld3597522008-02-15 14:55:53 -0600409 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700410#ifdef CONFIG_MCA
Ingo Molnarb5964402008-02-26 11:15:50 +0100411 /*
412 * Might actually be able to figure out what the guilty party
413 * is:
414 */
415 if (MCA_bus) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700416 mca_handle_nmi();
417 return;
418 }
419#endif
Ingo Molnarb5964402008-02-26 11:15:50 +0100420 printk(KERN_EMERG
421 "Uhhuh. NMI received for unknown reason %02x on CPU %d.\n",
422 reason, smp_processor_id());
423
Don Zickusc41c5cd2006-09-26 10:52:27 +0200424 printk(KERN_EMERG "Do you have a strange power saving mode enabled?\n");
Don Zickus8da5add2006-09-26 10:52:27 +0200425 if (panic_on_unrecovered_nmi)
Ingo Molnarb5964402008-02-26 11:15:50 +0100426 panic("NMI: Not continuing");
Don Zickus8da5add2006-09-26 10:52:27 +0200427
Don Zickusc41c5cd2006-09-26 10:52:27 +0200428 printk(KERN_EMERG "Dazed and confused, but trying to continue\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700429}
430
Steven Rostedt5deb45e2008-04-19 19:19:55 +0200431static notrace __kprobes void default_do_nmi(struct pt_regs *regs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700432{
433 unsigned char reason = 0;
Alexander van Heukelumabd34802008-07-02 18:39:01 +0200434 int cpu;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700435
Alexander van Heukelumabd34802008-07-02 18:39:01 +0200436 cpu = smp_processor_id();
437
438 /* Only the BSP gets external NMIs from the system. */
439 if (!cpu)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700440 reason = get_nmi_reason();
Ingo Molnarb5964402008-02-26 11:15:50 +0100441
Linus Torvalds1da177e2005-04-16 15:20:36 -0700442 if (!(reason & 0xc0)) {
Jan Beulich20c0d2d2006-03-26 01:37:01 -0800443 if (notify_die(DIE_NMI_IPI, "nmi_ipi", regs, reason, 2, SIGINT)
Alexander van Heukeluma8c1be92008-07-02 01:29:44 +0200444 == NOTIFY_STOP)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700445 return;
446#ifdef CONFIG_X86_LOCAL_APIC
447 /*
448 * Ok, so this is none of the documented NMI sources,
449 * so it must be the NMI watchdog.
450 */
Don Zickus3adbbcce2006-09-26 10:52:26 +0200451 if (nmi_watchdog_tick(regs, reason))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700452 return;
Alexander van Heukelumabd34802008-07-02 18:39:01 +0200453 if (!do_nmi_callback(regs, cpu))
Don Zickus3adbbcce2006-09-26 10:52:26 +0200454 unknown_nmi_error(reason, regs);
Ingo Molnarb5964402008-02-26 11:15:50 +0100455#else
456 unknown_nmi_error(reason, regs);
457#endif
Don Zickus2fbe7b22006-09-26 10:52:27 +0200458
Linus Torvalds1da177e2005-04-16 15:20:36 -0700459 return;
460 }
Jan Beulich20c0d2d2006-03-26 01:37:01 -0800461 if (notify_die(DIE_NMI, "nmi", regs, reason, 2, SIGINT) == NOTIFY_STOP)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700462 return;
Alexander van Heukeluma8c1be92008-07-02 01:29:44 +0200463
464 /* AK: following checks seem to be broken on modern chipsets. FIXME */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700465 if (reason & 0x80)
466 mem_parity_error(reason, regs);
467 if (reason & 0x40)
468 io_check_error(reason, regs);
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200469#ifdef CONFIG_X86_32
Linus Torvalds1da177e2005-04-16 15:20:36 -0700470 /*
471 * Reassert NMI in case it became active meanwhile
Ingo Molnarb5964402008-02-26 11:15:50 +0100472 * as it's edge-triggered:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700473 */
474 reassert_nmi();
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200475#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700476}
477
Alexander van Heukelume407d6202008-09-30 18:41:36 +0200478dotraplinkage notrace __kprobes void
479do_nmi(struct pt_regs *regs, long error_code)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700480{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700481 nmi_enter();
482
Hiroshi Shimamoto915b0d02008-12-08 19:19:26 -0800483 inc_irq_stat(__nmi_count);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700484
Andi Kleen8f4e9562007-07-22 11:12:32 +0200485 if (!ignore_nmis)
486 default_do_nmi(regs);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700487
488 nmi_exit();
489}
490
Andi Kleen8f4e9562007-07-22 11:12:32 +0200491void stop_nmi(void)
492{
493 acpi_nmi_disable();
494 ignore_nmis++;
495}
496
497void restart_nmi(void)
498{
499 ignore_nmis--;
500 acpi_nmi_enable();
501}
502
Alexander van Heukelumc1d518c2008-10-03 23:17:11 +0200503/* May run on IST stack. */
Alexander van Heukelume407d6202008-09-30 18:41:36 +0200504dotraplinkage void __kprobes do_int3(struct pt_regs *regs, long error_code)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700505{
Alexander van Heukelumb94da1e2008-09-09 21:55:58 +0200506#ifdef CONFIG_KPROBES
Linus Torvalds1da177e2005-04-16 15:20:36 -0700507 if (notify_die(DIE_INT3, "int3", regs, error_code, 3, SIGTRAP)
508 == NOTIFY_STOP)
Stas Sergeev48c88212005-05-01 08:58:49 -0700509 return;
Alexander van Heukelumb94da1e2008-09-09 21:55:58 +0200510#else
511 if (notify_die(DIE_TRAP, "int3", regs, error_code, 3, SIGTRAP)
512 == NOTIFY_STOP)
513 return;
514#endif
Ingo Molnarb5964402008-02-26 11:15:50 +0100515
Alexander van Heukelum4915a352008-10-03 22:00:34 +0200516 preempt_conditional_sti(regs);
Alexander van Heukelum3c1326f2008-09-26 14:03:08 +0200517 do_trap(3, SIGTRAP, "int3", regs, error_code, NULL);
Alexander van Heukelum4915a352008-10-03 22:00:34 +0200518 preempt_conditional_cli(regs);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700519}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700520
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200521#ifdef CONFIG_X86_64
Ingo Molnarbd8b96d2008-12-26 09:20:22 +0100522/*
523 * Help handler running on IST stack to switch back to user stack
524 * for scheduling or signal handling. The actual stack switch is done in
525 * entry.S
526 */
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200527asmlinkage __kprobes struct pt_regs *sync_regs(struct pt_regs *eregs)
528{
529 struct pt_regs *regs = eregs;
530 /* Did already sync */
531 if (eregs == (struct pt_regs *)eregs->sp)
532 ;
533 /* Exception from user space */
534 else if (user_mode(eregs))
535 regs = task_pt_regs(current);
Ingo Molnarbd8b96d2008-12-26 09:20:22 +0100536 /*
537 * Exception from kernel and interrupts are enabled. Move to
538 * kernel process stack.
539 */
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200540 else if (eregs->flags & X86_EFLAGS_IF)
541 regs = (struct pt_regs *)(eregs->sp -= sizeof(struct pt_regs));
542 if (eregs != regs)
543 *regs = *eregs;
544 return regs;
545}
546#endif
547
Linus Torvalds1da177e2005-04-16 15:20:36 -0700548/*
549 * Our handling of the processor debug registers is non-trivial.
550 * We do not clear them on entry and exit from the kernel. Therefore
551 * it is possible to get a watchpoint trap here from inside the kernel.
552 * However, the code in ./ptrace.c has ensured that the user can
553 * only set watchpoints on userspace addresses. Therefore the in-kernel
554 * watchpoint trap can only occur in code which is reading/writing
555 * from user space. Such code must not hold kernel locks (since it
556 * can equally take a page fault), therefore it is safe to call
557 * force_sig_info even though that claims and releases locks.
Ingo Molnarb5964402008-02-26 11:15:50 +0100558 *
Linus Torvalds1da177e2005-04-16 15:20:36 -0700559 * Code in ./signal.c ensures that the debug control register
560 * is restored before we deliver any signal, and therefore that
561 * user code runs with the correct debug control register even though
562 * we clear it here.
563 *
564 * Being careful here means that we don't have to be as careful in a
565 * lot of more complicated places (task switching can be a bit lazy
566 * about restoring all the debug state, and ptrace doesn't have to
567 * find every occurrence of the TF bit that could be saved away even
568 * by user code)
Alexander van Heukelumc1d518c2008-10-03 23:17:11 +0200569 *
570 * May run on IST stack.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700571 */
Alexander van Heukelume407d6202008-09-30 18:41:36 +0200572dotraplinkage void __kprobes do_debug(struct pt_regs *regs, long error_code)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700573{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700574 struct task_struct *tsk = current;
Alexander van Heukelum3d2a71a2008-09-30 18:41:37 +0200575 unsigned long condition;
Srinivasa Dsda654b72008-09-23 15:23:52 +0530576 int si_code;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700577
Vincent Hanquez1cc6f122005-06-23 00:08:43 -0700578 get_debugreg(condition, 6);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700579
Roland McGrath10faa812008-01-30 13:30:54 +0100580 /*
581 * The processor cleared BTF, so don't mark that we need it set.
582 */
583 clear_tsk_thread_flag(tsk, TIF_DEBUGCTLMSR);
584 tsk->thread.debugctlmsr = 0;
585
Linus Torvalds1da177e2005-04-16 15:20:36 -0700586 if (notify_die(DIE_DEBUG, "debug", regs, condition, error_code,
Alexander van Heukeluma8c1be92008-07-02 01:29:44 +0200587 SIGTRAP) == NOTIFY_STOP)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 return;
Alexander van Heukelum3d2a71a2008-09-30 18:41:37 +0200589
Linus Torvalds1da177e2005-04-16 15:20:36 -0700590 /* It's safe to allow irq's after DR6 has been saved */
Alexander van Heukelum3d2a71a2008-09-30 18:41:37 +0200591 preempt_conditional_sti(regs);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700592
593 /* Mask out spurious debug traps due to lazy DR7 setting */
594 if (condition & (DR_TRAP0|DR_TRAP1|DR_TRAP2|DR_TRAP3)) {
Roland McGrath0f534092008-01-30 13:30:59 +0100595 if (!tsk->thread.debugreg7)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700596 goto clear_dr7;
597 }
598
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200599#ifdef CONFIG_X86_32
gorcunov@gmail.com6b6891f2008-03-28 17:56:57 +0300600 if (regs->flags & X86_VM_MASK)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700601 goto debug_vm86;
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200602#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700603
604 /* Save debug status register where ptrace can see it */
Roland McGrath0f534092008-01-30 13:30:59 +0100605 tsk->thread.debugreg6 = condition;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700606
607 /*
608 * Single-stepping through TF: make sure we ignore any events in
609 * kernel space (but re-enable TF when returning to user mode).
610 */
611 if (condition & DR_STEP) {
Vincent Hanquez717b5942005-06-23 00:08:45 -0700612 if (!user_mode(regs))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700613 goto clear_TF_reenable;
614 }
615
Alexander van Heukelum3d2a71a2008-09-30 18:41:37 +0200616 si_code = get_si_code(condition);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700617 /* Ok, finally something we can handle */
Srinivasa Dsda654b72008-09-23 15:23:52 +0530618 send_sigtrap(tsk, regs, error_code, si_code);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700619
Ingo Molnarb5964402008-02-26 11:15:50 +0100620 /*
621 * Disable additional traps. They'll be re-enabled when
Linus Torvalds1da177e2005-04-16 15:20:36 -0700622 * the signal is delivered.
623 */
624clear_dr7:
Vincent Hanquez1cc6f122005-06-23 00:08:43 -0700625 set_debugreg(0, 7);
Alexander van Heukelum3d2a71a2008-09-30 18:41:37 +0200626 preempt_conditional_cli(regs);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700627 return;
628
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200629#ifdef CONFIG_X86_32
Linus Torvalds1da177e2005-04-16 15:20:36 -0700630debug_vm86:
631 handle_vm86_trap((struct kernel_vm86_regs *) regs, error_code, 1);
Alexander van Heukelum3d2a71a2008-09-30 18:41:37 +0200632 preempt_conditional_cli(regs);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700633 return;
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200634#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700635
636clear_TF_reenable:
637 set_tsk_thread_flag(tsk, TIF_SINGLESTEP);
Ingo Molnar60930152008-03-30 11:45:23 +0200638 regs->flags &= ~X86_EFLAGS_TF;
Alexander van Heukelum3d2a71a2008-09-30 18:41:37 +0200639 preempt_conditional_cli(regs);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700640 return;
641}
642
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200643#ifdef CONFIG_X86_64
644static int kernel_math_error(struct pt_regs *regs, const char *str, int trapnr)
645{
646 if (fixup_exception(regs))
647 return 1;
648
649 notify_die(DIE_GPF, str, regs, 0, trapnr, SIGFPE);
650 /* Illegal floating point operation in the kernel */
651 current->thread.trap_no = trapnr;
652 die(str, regs, 0);
653 return 0;
654}
655#endif
656
Linus Torvalds1da177e2005-04-16 15:20:36 -0700657/*
658 * Note that we play around with the 'TS' bit in an attempt to get
659 * the correct behaviour even in the presence of the asynchronous
660 * IRQ13 behaviour
661 */
H. Peter Anvin65ea5b02008-01-30 13:30:56 +0100662void math_error(void __user *ip)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700663{
Ingo Molnarb5964402008-02-26 11:15:50 +0100664 struct task_struct *task;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700665 siginfo_t info;
H. Peter Anvinadf77ba2008-12-22 17:56:05 -0800666 unsigned short cwd, swd, err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700667
668 /*
669 * Save the info for the exception handler and clear the error.
670 */
671 task = current;
672 save_init_fpu(task);
673 task->thread.trap_no = 16;
674 task->thread.error_code = 0;
675 info.si_signo = SIGFPE;
676 info.si_errno = 0;
H. Peter Anvin65ea5b02008-01-30 13:30:56 +0100677 info.si_addr = ip;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700678 /*
679 * (~cwd & swd) will mask out exceptions that are not set to unmasked
680 * status. 0x3f is the exception bits in these regs, 0x200 is the
681 * C1 reg you need in case of a stack fault, 0x040 is the stack
682 * fault bit. We should only be taking one exception at a time,
683 * so if this combination doesn't produce any single exception,
Alexander van Heukeluma8c1be92008-07-02 01:29:44 +0200684 * then we have a bad program that isn't synchronizing its FPU usage
Linus Torvalds1da177e2005-04-16 15:20:36 -0700685 * and it will suffer the consequences since we won't be able to
686 * fully reproduce the context of the exception
687 */
688 cwd = get_fpu_cwd(task);
689 swd = get_fpu_swd(task);
H. Peter Anvinadf77ba2008-12-22 17:56:05 -0800690
H. Peter Anvina73ad332008-12-25 10:39:01 -0800691 err = swd & ~cwd;
H. Peter Anvinadf77ba2008-12-22 17:56:05 -0800692
693 if (err & 0x001) { /* Invalid op */
Ingo Molnarb5964402008-02-26 11:15:50 +0100694 /*
695 * swd & 0x240 == 0x040: Stack Underflow
696 * swd & 0x240 == 0x240: Stack Overflow
697 * User must clear the SF bit (0x40) if set
698 */
699 info.si_code = FPE_FLTINV;
H. Peter Anvinadf77ba2008-12-22 17:56:05 -0800700 } else if (err & 0x004) { /* Divide by Zero */
Ingo Molnarb5964402008-02-26 11:15:50 +0100701 info.si_code = FPE_FLTDIV;
H. Peter Anvinadf77ba2008-12-22 17:56:05 -0800702 } else if (err & 0x008) { /* Overflow */
Ingo Molnarb5964402008-02-26 11:15:50 +0100703 info.si_code = FPE_FLTOVF;
H. Peter Anvinadf77ba2008-12-22 17:56:05 -0800704 } else if (err & 0x012) { /* Denormal, Underflow */
705 info.si_code = FPE_FLTUND;
706 } else if (err & 0x020) { /* Precision */
Ingo Molnarb5964402008-02-26 11:15:50 +0100707 info.si_code = FPE_FLTRES;
H. Peter Anvinadf77ba2008-12-22 17:56:05 -0800708 } else {
Ingo Molnarbd8b96d2008-12-26 09:20:22 +0100709 /*
710 * If we're using IRQ 13, or supposedly even some trap 16
711 * implementations, it's possible we get a spurious trap...
712 */
H. Peter Anvina73ad332008-12-25 10:39:01 -0800713 return; /* Spurious trap, no error */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700714 }
715 force_sig_info(SIGFPE, &info, task);
716}
717
Alexander van Heukelume407d6202008-09-30 18:41:36 +0200718dotraplinkage void do_coprocessor_error(struct pt_regs *regs, long error_code)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700719{
Alexander van Heukelum252d28f2008-09-09 21:56:09 +0200720 conditional_sti(regs);
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200721
722#ifdef CONFIG_X86_32
Linus Torvalds1da177e2005-04-16 15:20:36 -0700723 ignore_fpu_irq = 1;
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200724#else
725 if (!user_mode(regs) &&
726 kernel_math_error(regs, "kernel x87 math error", 16))
727 return;
728#endif
729
H. Peter Anvin65ea5b02008-01-30 13:30:56 +0100730 math_error((void __user *)regs->ip);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700731}
732
H. Peter Anvin65ea5b02008-01-30 13:30:56 +0100733static void simd_math_error(void __user *ip)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700734{
Ingo Molnarb5964402008-02-26 11:15:50 +0100735 struct task_struct *task;
Ingo Molnarb5964402008-02-26 11:15:50 +0100736 siginfo_t info;
Alexander van Heukelum7b4fd4b2008-07-02 01:33:14 +0200737 unsigned short mxcsr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700738
739 /*
740 * Save the info for the exception handler and clear the error.
741 */
742 task = current;
743 save_init_fpu(task);
744 task->thread.trap_no = 19;
745 task->thread.error_code = 0;
746 info.si_signo = SIGFPE;
747 info.si_errno = 0;
748 info.si_code = __SI_FAULT;
H. Peter Anvin65ea5b02008-01-30 13:30:56 +0100749 info.si_addr = ip;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700750 /*
751 * The SIMD FPU exceptions are handled a little differently, as there
752 * is only a single status/control register. Thus, to determine which
753 * unmasked exception was caught we must mask the exception mask bits
754 * at 0x1f80, and then use these to mask the exception bits at 0x3f.
755 */
756 mxcsr = get_fpu_mxcsr(task);
757 switch (~((mxcsr & 0x1f80) >> 7) & (mxcsr & 0x3f)) {
Ingo Molnarb5964402008-02-26 11:15:50 +0100758 case 0x000:
759 default:
760 break;
761 case 0x001: /* Invalid Op */
762 info.si_code = FPE_FLTINV;
763 break;
764 case 0x002: /* Denormalize */
765 case 0x010: /* Underflow */
766 info.si_code = FPE_FLTUND;
767 break;
768 case 0x004: /* Zero Divide */
769 info.si_code = FPE_FLTDIV;
770 break;
771 case 0x008: /* Overflow */
772 info.si_code = FPE_FLTOVF;
773 break;
774 case 0x020: /* Precision */
775 info.si_code = FPE_FLTRES;
776 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700777 }
778 force_sig_info(SIGFPE, &info, task);
779}
780
Alexander van Heukelume407d6202008-09-30 18:41:36 +0200781dotraplinkage void
782do_simd_coprocessor_error(struct pt_regs *regs, long error_code)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700783{
Alexander van Heukelumb939bde2008-09-09 21:56:12 +0200784 conditional_sti(regs);
785
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200786#ifdef CONFIG_X86_32
Linus Torvalds1da177e2005-04-16 15:20:36 -0700787 if (cpu_has_xmm) {
788 /* Handle SIMD FPU exceptions on PIII+ processors. */
789 ignore_fpu_irq = 1;
H. Peter Anvin65ea5b02008-01-30 13:30:56 +0100790 simd_math_error((void __user *)regs->ip);
Ingo Molnarb5964402008-02-26 11:15:50 +0100791 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700792 }
Ingo Molnarb5964402008-02-26 11:15:50 +0100793 /*
794 * Handle strange cache flush from user space exception
795 * in all other cases. This is undocumented behaviour.
796 */
gorcunov@gmail.com6b6891f2008-03-28 17:56:57 +0300797 if (regs->flags & X86_VM_MASK) {
Ingo Molnarb5964402008-02-26 11:15:50 +0100798 handle_vm86_fault((struct kernel_vm86_regs *)regs, error_code);
799 return;
800 }
801 current->thread.trap_no = 19;
802 current->thread.error_code = error_code;
803 die_if_kernel("cache flush denied", regs, error_code);
804 force_sig(SIGSEGV, current);
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200805#else
806 if (!user_mode(regs) &&
807 kernel_math_error(regs, "kernel simd math error", 19))
808 return;
809 simd_math_error((void __user *)regs->ip);
810#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700811}
812
Alexander van Heukelume407d6202008-09-30 18:41:36 +0200813dotraplinkage void
814do_spurious_interrupt_bug(struct pt_regs *regs, long error_code)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700815{
Alexander van Heukelumcf819782008-09-09 21:56:08 +0200816 conditional_sti(regs);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700817#if 0
818 /* No need to warn about this any longer. */
Ingo Molnarb5964402008-02-26 11:15:50 +0100819 printk(KERN_INFO "Ignoring P6 Local APIC Spurious Interrupt Bug...\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700820#endif
821}
822
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200823#ifdef CONFIG_X86_32
Ingo Molnarb5964402008-02-26 11:15:50 +0100824unsigned long patch_espfix_desc(unsigned long uesp, unsigned long kesp)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700825{
Glauber Costa736f12b2008-05-27 20:14:51 -0700826 struct desc_struct *gdt = get_cpu_gdt_table(smp_processor_id());
Stas Sergeevbe44d2a2006-12-07 02:14:01 +0100827 unsigned long base = (kesp - uesp) & -THREAD_SIZE;
828 unsigned long new_kesp = kesp - base;
829 unsigned long lim_pages = (new_kesp | (THREAD_SIZE - 1)) >> PAGE_SHIFT;
830 __u64 desc = *(__u64 *)&gdt[GDT_ENTRY_ESPFIX_SS];
Ingo Molnarb5964402008-02-26 11:15:50 +0100831
Stas Sergeevbe44d2a2006-12-07 02:14:01 +0100832 /* Set up base for espfix segment */
Ingo Molnarb5964402008-02-26 11:15:50 +0100833 desc &= 0x00f0ff0000000000ULL;
834 desc |= ((((__u64)base) << 16) & 0x000000ffffff0000ULL) |
Stas Sergeevbe44d2a2006-12-07 02:14:01 +0100835 ((((__u64)base) << 32) & 0xff00000000000000ULL) |
836 ((((__u64)lim_pages) << 32) & 0x000f000000000000ULL) |
837 (lim_pages & 0xffff);
838 *(__u64 *)&gdt[GDT_ENTRY_ESPFIX_SS] = desc;
Ingo Molnarb5964402008-02-26 11:15:50 +0100839
Stas Sergeevbe44d2a2006-12-07 02:14:01 +0100840 return new_kesp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700841}
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200842#else
843asmlinkage void __attribute__((weak)) smp_thermal_interrupt(void)
844{
845}
846
847asmlinkage void __attribute__((weak)) mce_threshold_interrupt(void)
848{
849}
850#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700851
852/*
Ingo Molnarb5964402008-02-26 11:15:50 +0100853 * 'math_state_restore()' saves the current math information in the
Linus Torvalds1da177e2005-04-16 15:20:36 -0700854 * old math state array, and gets the new ones from the current task
855 *
856 * Careful.. There are problems with IBM-designed IRQ13 behaviour.
857 * Don't touch unless you *really* know how it works.
858 *
859 * Must be called with kernel preemption disabled (in this case,
860 * local interrupts are disabled at the call-site in entry.S).
861 */
Chuck Ebbertacc20762006-12-07 02:14:01 +0100862asmlinkage void math_state_restore(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700863{
864 struct thread_info *thread = current_thread_info();
865 struct task_struct *tsk = thread->task;
866
Suresh Siddhaaa283f42008-03-10 15:28:05 -0700867 if (!tsk_used_math(tsk)) {
868 local_irq_enable();
869 /*
870 * does a slab alloc which can sleep
871 */
872 if (init_fpu(tsk)) {
873 /*
874 * ran out of memory!
875 */
876 do_group_exit(SIGKILL);
877 return;
878 }
879 local_irq_disable();
880 }
881
Ingo Molnarb5964402008-02-26 11:15:50 +0100882 clts(); /* Allow maths ops (or we recurse) */
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200883#ifdef CONFIG_X86_32
Linus Torvalds1da177e2005-04-16 15:20:36 -0700884 restore_fpu(tsk);
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200885#else
886 /*
887 * Paranoid restore. send a SIGSEGV if we fail to restore the state.
888 */
889 if (unlikely(restore_fpu_checking(tsk))) {
890 stts();
891 force_sig(SIGSEGV, tsk);
892 return;
893 }
894#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700895 thread->status |= TS_USEDFPU; /* So we fnsave on switch_to() */
Chuck Ebbertacc20762006-12-07 02:14:01 +0100896 tsk->fpu_counter++;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700897}
Rusty Russell5992b6d2007-07-19 01:49:21 -0700898EXPORT_SYMBOL_GPL(math_state_restore);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700899
900#ifndef CONFIG_MATH_EMULATION
Linus Torvalds1da177e2005-04-16 15:20:36 -0700901asmlinkage void math_emulate(long arg)
902{
Ingo Molnarb5964402008-02-26 11:15:50 +0100903 printk(KERN_EMERG
904 "math-emulation not enabled and no coprocessor found.\n");
905 printk(KERN_EMERG "killing %s.\n", current->comm);
906 force_sig(SIGFPE, current);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700907 schedule();
908}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700909#endif /* CONFIG_MATH_EMULATION */
910
Alexander van Heukelume407d6202008-09-30 18:41:36 +0200911dotraplinkage void __kprobes
912do_device_not_available(struct pt_regs *regs, long error)
Alexander van Heukelum7643e9b2008-09-09 21:56:02 +0200913{
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200914#ifdef CONFIG_X86_32
Alexander van Heukelum7643e9b2008-09-09 21:56:02 +0200915 if (read_cr0() & X86_CR0_EM) {
916 conditional_sti(regs);
917 math_emulate(0);
918 } else {
919 math_state_restore(); /* interrupts still off */
920 conditional_sti(regs);
921 }
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200922#else
923 math_state_restore();
924#endif
Alexander van Heukelum7643e9b2008-09-09 21:56:02 +0200925}
926
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200927#ifdef CONFIG_X86_32
Alexander van Heukelume407d6202008-09-30 18:41:36 +0200928dotraplinkage void do_iret_error(struct pt_regs *regs, long error_code)
Alexander van Heukelumf8e08702008-09-09 21:56:13 +0200929{
930 siginfo_t info;
931 local_irq_enable();
932
933 info.si_signo = SIGILL;
934 info.si_errno = 0;
935 info.si_code = ILL_BADSTK;
936 info.si_addr = 0;
937 if (notify_die(DIE_TRAP, "iret exception",
938 regs, error_code, 32, SIGILL) == NOTIFY_STOP)
939 return;
Alexander van Heukelum3c1326f2008-09-26 14:03:08 +0200940 do_trap(32, SIGILL, "iret exception", regs, error_code, &info);
Alexander van Heukelumf8e08702008-09-09 21:56:13 +0200941}
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200942#endif
Alexander van Heukelumf8e08702008-09-09 21:56:13 +0200943
Linus Torvalds1da177e2005-04-16 15:20:36 -0700944void __init trap_init(void)
945{
Rusty Russelldbeb2be2007-10-19 20:35:03 +0200946 int i;
947
Linus Torvalds1da177e2005-04-16 15:20:36 -0700948#ifdef CONFIG_EISA
Ingo Molnar927222b2008-01-30 13:33:49 +0100949 void __iomem *p = early_ioremap(0x0FFFD9, 4);
Ingo Molnarb5964402008-02-26 11:15:50 +0100950
951 if (readl(p) == 'E' + ('I'<<8) + ('S'<<16) + ('A'<<24))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700952 EISA_bus = 1;
Ingo Molnar927222b2008-01-30 13:33:49 +0100953 early_iounmap(p, 4);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700954#endif
955
Alexander van Heukelum976382d2008-09-09 21:55:57 +0200956 set_intr_gate(0, &divide_error);
Alexander van Heukelum699d2932008-10-03 22:00:32 +0200957 set_intr_gate_ist(1, &debug, DEBUG_STACK);
958 set_intr_gate_ist(2, &nmi, NMI_STACK);
959 /* int3 can be called from all */
960 set_system_intr_gate_ist(3, &int3, DEBUG_STACK);
961 /* int4 can be called from all */
962 set_system_intr_gate(4, &overflow);
Alexander van Heukelum64f644c2008-09-09 21:56:00 +0200963 set_intr_gate(5, &bounds);
Alexander van Heukelum12394cf2008-09-09 21:56:01 +0200964 set_intr_gate(6, &invalid_op);
Alexander van Heukelum7643e9b2008-09-09 21:56:02 +0200965 set_intr_gate(7, &device_not_available);
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200966#ifdef CONFIG_X86_32
Alexander van Heukeluma8c1be92008-07-02 01:29:44 +0200967 set_task_gate(8, GDT_ENTRY_DOUBLEFAULT_TSS);
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200968#else
969 set_intr_gate_ist(8, &double_fault, DOUBLEFAULT_STACK);
970#endif
Alexander van Heukelum51bc1ed2008-09-09 21:56:03 +0200971 set_intr_gate(9, &coprocessor_segment_overrun);
Alexander van Heukelum6bf77bf2008-09-09 21:56:04 +0200972 set_intr_gate(10, &invalid_TSS);
Alexander van Heukelum36d936c2008-09-09 21:56:05 +0200973 set_intr_gate(11, &segment_not_present);
Alexander van Heukelum699d2932008-10-03 22:00:32 +0200974 set_intr_gate_ist(12, &stack_segment, STACKFAULT_STACK);
Alexander van Heukelumc6df0d72008-09-09 21:56:07 +0200975 set_intr_gate(13, &general_protection);
Ingo Molnarb5964402008-02-26 11:15:50 +0100976 set_intr_gate(14, &page_fault);
Alexander van Heukelumcf819782008-09-09 21:56:08 +0200977 set_intr_gate(15, &spurious_interrupt_bug);
Alexander van Heukelum252d28f2008-09-09 21:56:09 +0200978 set_intr_gate(16, &coprocessor_error);
Alexander van Heukelum5feedfd2008-09-09 21:56:10 +0200979 set_intr_gate(17, &alignment_check);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700980#ifdef CONFIG_X86_MCE
Alexander van Heukelum699d2932008-10-03 22:00:32 +0200981 set_intr_gate_ist(18, &machine_check, MCE_STACK);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700982#endif
Alexander van Heukelumb939bde2008-09-09 21:56:12 +0200983 set_intr_gate(19, &simd_coprocessor_error);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700984
Alexander van Heukelum081f75b2008-10-03 22:00:39 +0200985#ifdef CONFIG_IA32_EMULATION
986 set_system_intr_gate(IA32_SYSCALL_VECTOR, ia32_syscall);
987#endif
988
989#ifdef CONFIG_X86_32
Jan Beulichd43c6e82006-01-06 00:11:49 -0800990 if (cpu_has_fxsr) {
Jan Beulichd43c6e82006-01-06 00:11:49 -0800991 printk(KERN_INFO "Enabling fast FPU save and restore... ");
992 set_in_cr4(X86_CR4_OSFXSR);
993 printk("done.\n");
994 }
995 if (cpu_has_xmm) {
Ingo Molnarb5964402008-02-26 11:15:50 +0100996 printk(KERN_INFO
997 "Enabling unmasked SIMD FPU exception support... ");
Jan Beulichd43c6e82006-01-06 00:11:49 -0800998 set_in_cr4(X86_CR4_OSXMMEXCPT);
999 printk("done.\n");
1000 }
1001
Alexander van Heukelum699d2932008-10-03 22:00:32 +02001002 set_system_trap_gate(SYSCALL_VECTOR, &system_call);
Yinghai Lub77b8812008-12-19 15:23:44 -08001003#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001004
Ingo Molnarb5964402008-02-26 11:15:50 +01001005 /* Reserve all the builtin and the syscall vector: */
Rusty Russelldbeb2be2007-10-19 20:35:03 +02001006 for (i = 0; i < FIRST_EXTERNAL_VECTOR; i++)
1007 set_bit(i, used_vectors);
Ingo Molnarb5964402008-02-26 11:15:50 +01001008
Yinghai Lub77b8812008-12-19 15:23:44 -08001009#ifdef CONFIG_X86_64
1010 set_bit(IA32_SYSCALL_VECTOR, used_vectors);
1011#else
Rusty Russelldbeb2be2007-10-19 20:35:03 +02001012 set_bit(SYSCALL_VECTOR, used_vectors);
Alexander van Heukelum081f75b2008-10-03 22:00:39 +02001013#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001014 /*
Ingo Molnarb5964402008-02-26 11:15:50 +01001015 * Should be a barrier for any external CPU state:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001016 */
1017 cpu_init();
1018
Alexander van Heukelum081f75b2008-10-03 22:00:39 +02001019#ifdef CONFIG_X86_32
Linus Torvalds1da177e2005-04-16 15:20:36 -07001020 trap_init_hook();
Alexander van Heukelum081f75b2008-10-03 22:00:39 +02001021#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001022}