blob: 4a836384dd0ffe95d9aad429292217ad14678b2e [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * linux/arch/x86-64/traps.c
3 *
4 * Copyright (C) 1991, 1992 Linus Torvalds
5 * Copyright (C) 2000, 2001, 2002 Andi Kleen, SuSE Labs
6 *
7 * Pentium III FXSR, SSE support
8 * Gareth Hughes <gareth@valinux.com>, May 2000
9 *
10 * $Id: traps.c,v 1.36 2002/03/24 11:09:10 ak Exp $
11 */
12
13/*
14 * 'Traps.c' handles hardware traps and faults after we have saved some
15 * state in 'entry.S'.
16 */
17#include <linux/config.h>
18#include <linux/sched.h>
19#include <linux/kernel.h>
20#include <linux/string.h>
21#include <linux/errno.h>
22#include <linux/ptrace.h>
23#include <linux/timer.h>
24#include <linux/mm.h>
25#include <linux/init.h>
26#include <linux/delay.h>
27#include <linux/spinlock.h>
28#include <linux/interrupt.h>
29#include <linux/module.h>
30#include <linux/moduleparam.h>
akpm@osdl.org35faa712005-04-16 15:24:54 -070031#include <linux/nmi.h>
Prasanna S Panchamukhi0f2fbdc2005-09-06 15:19:28 -070032#include <linux/kprobes.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070033
34#include <asm/system.h>
35#include <asm/uaccess.h>
36#include <asm/io.h>
37#include <asm/atomic.h>
38#include <asm/debugreg.h>
39#include <asm/desc.h>
40#include <asm/i387.h>
41#include <asm/kdebug.h>
42#include <asm/processor.h>
43
44#include <asm/smp.h>
45#include <asm/pgalloc.h>
46#include <asm/pda.h>
47#include <asm/proto.h>
48#include <asm/nmi.h>
49
Linus Torvalds1da177e2005-04-16 15:20:36 -070050extern struct gate_struct idt_table[256];
51
52asmlinkage void divide_error(void);
53asmlinkage void debug(void);
54asmlinkage void nmi(void);
55asmlinkage void int3(void);
56asmlinkage void overflow(void);
57asmlinkage void bounds(void);
58asmlinkage void invalid_op(void);
59asmlinkage void device_not_available(void);
60asmlinkage void double_fault(void);
61asmlinkage void coprocessor_segment_overrun(void);
62asmlinkage void invalid_TSS(void);
63asmlinkage void segment_not_present(void);
64asmlinkage void stack_segment(void);
65asmlinkage void general_protection(void);
66asmlinkage void page_fault(void);
67asmlinkage void coprocessor_error(void);
68asmlinkage void simd_coprocessor_error(void);
69asmlinkage void reserved(void);
70asmlinkage void alignment_check(void);
71asmlinkage void machine_check(void);
72asmlinkage void spurious_interrupt_bug(void);
73asmlinkage void call_debug(void);
74
75struct notifier_block *die_chain;
76static DEFINE_SPINLOCK(die_notifier_lock);
77
78int register_die_notifier(struct notifier_block *nb)
79{
80 int err = 0;
81 unsigned long flags;
82 spin_lock_irqsave(&die_notifier_lock, flags);
83 err = notifier_chain_register(&die_chain, nb);
84 spin_unlock_irqrestore(&die_notifier_lock, flags);
85 return err;
86}
87
88static inline void conditional_sti(struct pt_regs *regs)
89{
90 if (regs->eflags & X86_EFLAGS_IF)
91 local_irq_enable();
92}
93
/* Upper bound on the raw stack words show_stack() prints; set by "kstack=". */
static int kstack_depth_to_print = 10;
95
#ifdef CONFIG_KALLSYMS
#include <linux/kallsyms.h>
/*
 * Print @address, adding module/symbol/offset information when
 * kallsyms_lookup() can resolve it.
 *
 * Returns the value returned by printk() for the text that was emitted.
 */
int printk_address(unsigned long address)
{
	unsigned long offset = 0, symsize;
	char namebuf[128];
	char *modname;
	char *sep;
	const char *symname;

	symname = kallsyms_lookup(address, &symsize, &offset, &modname, namebuf);
	if (symname == NULL)
		return printk("[<%016lx>]", address);

	if (modname) {
		sep = ":";
	} else {
		/* No module name reported: drop both the name and the ':' separators. */
		sep = "";
		modname = sep;
	}

	return printk("<%016lx>{%s%s%s%s%+ld}",
		      address, sep, modname, sep, symname, offset);
}
#else
/* Without CONFIG_KALLSYMS only the raw address is printed. */
int printk_address(unsigned long address)
{
	return printk("[<%016lx>]", address);
}
#endif
120
Andi Kleen0a658002005-04-16 15:25:17 -0700121static unsigned long *in_exception_stack(unsigned cpu, unsigned long stack,
122 unsigned *usedp, const char **idp)
123{
124 static const char ids[N_EXCEPTION_STACKS][8] = {
125 [DEBUG_STACK - 1] = "#DB",
126 [NMI_STACK - 1] = "NMI",
127 [DOUBLEFAULT_STACK - 1] = "#DF",
128 [STACKFAULT_STACK - 1] = "#SS",
129 [MCE_STACK - 1] = "#MC",
130 };
131 unsigned k;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700132
Andi Kleen0a658002005-04-16 15:25:17 -0700133 for (k = 0; k < N_EXCEPTION_STACKS; k++) {
134 unsigned long end;
135
136 end = per_cpu(init_tss, cpu).ist[k];
137 if (stack >= end)
138 continue;
139 if (stack >= end - EXCEPTION_STKSZ) {
140 if (*usedp & (1U << k))
141 break;
142 *usedp |= 1U << k;
143 *idp = ids[k];
144 return (unsigned long *)end;
145 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700146 }
147 return NULL;
Andi Kleen0a658002005-04-16 15:25:17 -0700148}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700149
150/*
151 * x86-64 can have up to three kernel stacks:
152 * process stack
153 * interrupt stack
Andi Kleen0a658002005-04-16 15:25:17 -0700154 * severe exception (double fault, nmi, stack fault, debug, mce) hardware stack
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 */
156
157void show_trace(unsigned long *stack)
158{
159 unsigned long addr;
Andi Kleen0a658002005-04-16 15:25:17 -0700160 const unsigned cpu = safe_smp_processor_id();
161 unsigned long *irqstack_end = (unsigned long *)cpu_pda[cpu].irqstackptr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700162 int i;
Andi Kleen0a658002005-04-16 15:25:17 -0700163 unsigned used = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700164
165 printk("\nCall Trace:");
Andi Kleen0a658002005-04-16 15:25:17 -0700166
167#define HANDLE_STACK(cond) \
168 do while (cond) { \
169 addr = *stack++; \
170 if (kernel_text_address(addr)) { \
171 /* \
172 * If the address is either in the text segment of the \
173 * kernel, or in the region which contains vmalloc'ed \
174 * memory, it *may* be the address of a calling \
175 * routine; if so, print it so that someone tracing \
176 * down the cause of the crash will be able to figure \
177 * out the call path that was taken. \
178 */ \
179 i += printk_address(addr); \
180 if (i > 50) { \
181 printk("\n "); \
182 i = 0; \
183 } \
184 else \
185 i += printk(" "); \
186 } \
187 } while (0)
188
189 for(i = 0; ; ) {
190 const char *id;
191 unsigned long *estack_end;
192 estack_end = in_exception_stack(cpu, (unsigned long)stack,
193 &used, &id);
194
195 if (estack_end) {
196 i += printk(" <%s> ", id);
197 HANDLE_STACK (stack < estack_end);
198 i += printk(" <EOE> ");
199 stack = (unsigned long *) estack_end[-2];
200 continue;
201 }
202 if (irqstack_end) {
203 unsigned long *irqstack;
204 irqstack = irqstack_end -
205 (IRQSTACKSIZE - 64) / sizeof(*irqstack);
206
207 if (stack >= irqstack && stack < irqstack_end) {
208 i += printk(" <IRQ> ");
209 HANDLE_STACK (stack < irqstack_end);
210 stack = (unsigned long *) (irqstack_end[-1]);
211 irqstack_end = NULL;
212 i += printk(" <EOI> ");
213 continue;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700214 }
215 }
Andi Kleen0a658002005-04-16 15:25:17 -0700216 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217 }
Andi Kleen0a658002005-04-16 15:25:17 -0700218
219 HANDLE_STACK (((long) stack & (THREAD_SIZE-1)) != 0);
220#undef HANDLE_STACK
Linus Torvalds1da177e2005-04-16 15:20:36 -0700221 printk("\n");
222}
223
224void show_stack(struct task_struct *tsk, unsigned long * rsp)
225{
226 unsigned long *stack;
227 int i;
228 const int cpu = safe_smp_processor_id();
229 unsigned long *irqstack_end = (unsigned long *) (cpu_pda[cpu].irqstackptr);
230 unsigned long *irqstack = (unsigned long *) (cpu_pda[cpu].irqstackptr - IRQSTACKSIZE);
231
232 // debugging aid: "show_stack(NULL, NULL);" prints the
233 // back trace for this cpu.
234
235 if (rsp == NULL) {
236 if (tsk)
237 rsp = (unsigned long *)tsk->thread.rsp;
238 else
239 rsp = (unsigned long *)&rsp;
240 }
241
242 stack = rsp;
243 for(i=0; i < kstack_depth_to_print; i++) {
244 if (stack >= irqstack && stack <= irqstack_end) {
245 if (stack == irqstack_end) {
246 stack = (unsigned long *) (irqstack_end[-1]);
247 printk(" <EOI> ");
248 }
249 } else {
250 if (((long) stack & (THREAD_SIZE-1)) == 0)
251 break;
252 }
253 if (i && ((i % 4) == 0))
254 printk("\n ");
255 printk("%016lx ", *stack++);
akpm@osdl.org35faa712005-04-16 15:24:54 -0700256 touch_nmi_watchdog();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700257 }
258 show_trace((unsigned long *)rsp);
259}
260
/*
 * The architecture-independent dump_stack() entry point: print a call trace
 * starting at the address of a local variable of this function.
 */
void dump_stack(void)
{
	unsigned long here;

	show_trace(&here);
}

EXPORT_SYMBOL(dump_stack);
271
272void show_registers(struct pt_regs *regs)
273{
274 int i;
Vincent Hanquez76381fe2005-06-23 00:08:46 -0700275 int in_kernel = !user_mode(regs);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276 unsigned long rsp;
277 const int cpu = safe_smp_processor_id();
278 struct task_struct *cur = cpu_pda[cpu].pcurrent;
279
280 rsp = regs->rsp;
281
282 printk("CPU %d ", cpu);
283 __show_regs(regs);
284 printk("Process %s (pid: %d, threadinfo %p, task %p)\n",
285 cur->comm, cur->pid, cur->thread_info, cur);
286
287 /*
288 * When in-kernel, we also print out the stack and code at the
289 * time of the fault..
290 */
291 if (in_kernel) {
292
293 printk("Stack: ");
294 show_stack(NULL, (unsigned long*)rsp);
295
296 printk("\nCode: ");
297 if(regs->rip < PAGE_OFFSET)
298 goto bad;
299
300 for(i=0;i<20;i++)
301 {
302 unsigned char c;
303 if(__get_user(c, &((unsigned char*)regs->rip)[i])) {
304bad:
305 printk(" Bad RIP value.");
306 break;
307 }
308 printk("%02x ", c);
309 }
310 }
311 printk("\n");
312}
313
314void handle_BUG(struct pt_regs *regs)
315{
316 struct bug_frame f;
317 char tmp;
318
Vincent Hanquez76381fe2005-06-23 00:08:46 -0700319 if (user_mode(regs))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700320 return;
321 if (__copy_from_user(&f, (struct bug_frame *) regs->rip,
322 sizeof(struct bug_frame)))
323 return;
Jan Beulich049cdef2005-09-12 18:49:25 +0200324 if (f.filename >= 0 ||
Linus Torvalds1da177e2005-04-16 15:20:36 -0700325 f.ud2[0] != 0x0f || f.ud2[1] != 0x0b)
326 return;
Jan Beulich049cdef2005-09-12 18:49:25 +0200327 if (__get_user(tmp, (char *)(long)f.filename))
328 f.filename = (int)(long)"unmapped filename";
Linus Torvalds1da177e2005-04-16 15:20:36 -0700329 printk("----------- [cut here ] --------- [please bite here ] ---------\n");
Jan Beulich049cdef2005-09-12 18:49:25 +0200330 printk(KERN_ALERT "Kernel BUG at %.50s:%d\n", (char *)(long)f.filename, f.line);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700331}
332
#ifdef CONFIG_BUG
/* Non-inline wrapper around BUG(); only built when CONFIG_BUG is set. */
void out_of_line_bug(void)
{
	BUG();
}
#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339
340static DEFINE_SPINLOCK(die_lock);
341static int die_owner = -1;
342
Jan Beulich12091402005-09-12 18:49:24 +0200343unsigned long oops_begin(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344{
Jan Beulich12091402005-09-12 18:49:24 +0200345 int cpu = safe_smp_processor_id();
346 unsigned long flags;
347
348 /* racy, but better than risking deadlock. */
349 local_irq_save(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700350 if (!spin_trylock(&die_lock)) {
351 if (cpu == die_owner)
352 /* nested oops. should stop eventually */;
353 else
Jan Beulich12091402005-09-12 18:49:24 +0200354 spin_lock(&die_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700355 }
Jan Beulich12091402005-09-12 18:49:24 +0200356 die_owner = cpu;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700357 console_verbose();
Jan Beulich12091402005-09-12 18:49:24 +0200358 bust_spinlocks(1);
359 return flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700360}
361
Jan Beulich12091402005-09-12 18:49:24 +0200362void oops_end(unsigned long flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363{
364 die_owner = -1;
Jan Beulich12091402005-09-12 18:49:24 +0200365 bust_spinlocks(0);
366 spin_unlock_irqrestore(&die_lock, flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700367 if (panic_on_oops)
Jan Beulich12091402005-09-12 18:49:24 +0200368 panic("Oops");
369}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700370
371void __die(const char * str, struct pt_regs * regs, long err)
372{
373 static int die_counter;
374 printk(KERN_EMERG "%s: %04lx [%u] ", str, err & 0xffff,++die_counter);
375#ifdef CONFIG_PREEMPT
376 printk("PREEMPT ");
377#endif
378#ifdef CONFIG_SMP
379 printk("SMP ");
380#endif
381#ifdef CONFIG_DEBUG_PAGEALLOC
382 printk("DEBUG_PAGEALLOC");
383#endif
384 printk("\n");
385 notify_die(DIE_OOPS, (char *)str, regs, err, 255, SIGSEGV);
386 show_registers(regs);
387 /* Executive summary in case the oops scrolled away */
388 printk(KERN_ALERT "RIP ");
389 printk_address(regs->rip);
390 printk(" RSP <%016lx>\n", regs->rsp);
391}
392
393void die(const char * str, struct pt_regs * regs, long err)
394{
Jan Beulich12091402005-09-12 18:49:24 +0200395 unsigned long flags = oops_begin();
396
Linus Torvalds1da177e2005-04-16 15:20:36 -0700397 handle_BUG(regs);
398 __die(str, regs, err);
Jan Beulich12091402005-09-12 18:49:24 +0200399 oops_end(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700400 do_exit(SIGSEGV);
401}
402static inline void die_if_kernel(const char * str, struct pt_regs * regs, long err)
403{
404 if (!(regs->eflags & VM_MASK) && (regs->cs == __KERNEL_CS))
405 die(str, regs, err);
406}
407
408void die_nmi(char *str, struct pt_regs *regs)
409{
Jan Beulich12091402005-09-12 18:49:24 +0200410 unsigned long flags = oops_begin();
411
Linus Torvalds1da177e2005-04-16 15:20:36 -0700412 /*
413 * We are in trouble anyway, lets at least try
414 * to get a message out.
415 */
416 printk(str, safe_smp_processor_id());
417 show_registers(regs);
418 if (panic_on_timeout || panic_on_oops)
419 panic("nmi watchdog");
420 printk("console shuts up ...\n");
Jan Beulich12091402005-09-12 18:49:24 +0200421 oops_end(flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700422 do_exit(SIGSEGV);
423}
424
Prasanna S Panchamukhi0f2fbdc2005-09-06 15:19:28 -0700425static void __kprobes do_trap(int trapnr, int signr, char *str,
426 struct pt_regs * regs, long error_code,
427 siginfo_t *info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700428{
429 conditional_sti(regs);
430
431#ifdef CONFIG_CHECKING
432 {
433 unsigned long gs;
434 struct x8664_pda *pda = cpu_pda + safe_smp_processor_id();
435 rdmsrl(MSR_GS_BASE, gs);
436 if (gs != (unsigned long)pda) {
437 wrmsrl(MSR_GS_BASE, pda);
438 printk("%s: wrong gs %lx expected %p rip %lx\n", str, gs, pda,
439 regs->rip);
440 }
441 }
442#endif
443
Vincent Hanquez76381fe2005-06-23 00:08:46 -0700444 if (user_mode(regs)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700445 struct task_struct *tsk = current;
446
447 if (exception_trace && unhandled_signal(tsk, signr))
448 printk(KERN_INFO
449 "%s[%d] trap %s rip:%lx rsp:%lx error:%lx\n",
450 tsk->comm, tsk->pid, str,
451 regs->rip,regs->rsp,error_code);
452
453 tsk->thread.error_code = error_code;
454 tsk->thread.trap_no = trapnr;
455 if (info)
456 force_sig_info(signr, info, tsk);
457 else
458 force_sig(signr, tsk);
459 return;
460 }
461
462
463 /* kernel trap */
464 {
465 const struct exception_table_entry *fixup;
466 fixup = search_exception_tables(regs->rip);
467 if (fixup) {
468 regs->rip = fixup->fixup;
469 } else
470 die(str, regs, error_code);
471 return;
472 }
473}
474
/*
 * Define do_<name>(): run the DIE_TRAP notifiers and, unless one of them
 * returns NOTIFY_STOP, hand the trap to do_trap() without a siginfo.
 */
#define DO_ERROR(trapnr, signr, str, name) \
asmlinkage void do_##name(struct pt_regs * regs, long error_code) \
{ \
	if (notify_die(DIE_TRAP, str, regs, error_code, trapnr, signr) \
	    != NOTIFY_STOP) \
		do_trap(trapnr, signr, str, regs, error_code, NULL); \
}
483
/*
 * Like DO_ERROR(), but the generated do_<name>() also fills in a siginfo
 * (si_code = @sicode, si_addr = @siaddr) that is passed on to do_trap().
 * The siginfo is filled in before the notifiers run, so @siaddr is
 * evaluated before any notifier sees @regs.
 */
#define DO_ERROR_INFO(trapnr, signr, str, name, sicode, siaddr) \
asmlinkage void do_##name(struct pt_regs * regs, long error_code) \
{ \
	siginfo_t info; \
	\
	info.si_signo = signr; \
	info.si_errno = 0; \
	info.si_code = sicode; \
	info.si_addr = (void __user *)siaddr; \
	if (notify_die(DIE_TRAP, str, regs, error_code, trapnr, signr) \
	    != NOTIFY_STOP) \
		do_trap(trapnr, signr, str, regs, error_code, &info); \
}
497
498DO_ERROR_INFO( 0, SIGFPE, "divide error", divide_error, FPE_INTDIV, regs->rip)
499DO_ERROR( 4, SIGSEGV, "overflow", overflow)
500DO_ERROR( 5, SIGSEGV, "bounds", bounds)
501DO_ERROR_INFO( 6, SIGILL, "invalid operand", invalid_op, ILL_ILLOPN, regs->rip)
502DO_ERROR( 7, SIGSEGV, "device not available", device_not_available)
503DO_ERROR( 9, SIGFPE, "coprocessor segment overrun", coprocessor_segment_overrun)
504DO_ERROR(10, SIGSEGV, "invalid TSS", invalid_TSS)
505DO_ERROR(11, SIGBUS, "segment not present", segment_not_present)
506DO_ERROR_INFO(17, SIGBUS, "alignment check", alignment_check, BUS_ADRALN, 0)
507DO_ERROR(18, SIGSEGV, "reserved", reserved)
Andi Kleen6fefb0d2005-04-16 15:25:03 -0700508DO_ERROR(12, SIGBUS, "stack segment", stack_segment)
509DO_ERROR( 8, SIGSEGV, "double fault", double_fault)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700510
Prasanna S Panchamukhi0f2fbdc2005-09-06 15:19:28 -0700511asmlinkage void __kprobes do_general_protection(struct pt_regs * regs,
512 long error_code)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700513{
514 conditional_sti(regs);
515
516#ifdef CONFIG_CHECKING
517 {
518 unsigned long gs;
519 struct x8664_pda *pda = cpu_pda + safe_smp_processor_id();
520 rdmsrl(MSR_GS_BASE, gs);
521 if (gs != (unsigned long)pda) {
522 wrmsrl(MSR_GS_BASE, pda);
523 oops_in_progress++;
524 printk("general protection handler: wrong gs %lx expected %p\n", gs, pda);
525 oops_in_progress--;
526 }
527 }
528#endif
529
Vincent Hanquez76381fe2005-06-23 00:08:46 -0700530 if (user_mode(regs)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700531 struct task_struct *tsk = current;
532
533 if (exception_trace && unhandled_signal(tsk, SIGSEGV))
534 printk(KERN_INFO
535 "%s[%d] general protection rip:%lx rsp:%lx error:%lx\n",
536 tsk->comm, tsk->pid,
537 regs->rip,regs->rsp,error_code);
538
539 tsk->thread.error_code = error_code;
540 tsk->thread.trap_no = 13;
541 force_sig(SIGSEGV, tsk);
542 return;
543 }
544
545 /* kernel gp */
546 {
547 const struct exception_table_entry *fixup;
548 fixup = search_exception_tables(regs->rip);
549 if (fixup) {
550 regs->rip = fixup->fixup;
551 return;
552 }
553 if (notify_die(DIE_GPF, "general protection fault", regs,
554 error_code, 13, SIGSEGV) == NOTIFY_STOP)
555 return;
556 die("general protection fault", regs, error_code);
557 }
558}
559
/*
 * Report a memory parity NMI and write the acknowledging value back to
 * port 0x61.  @regs is unused.
 */
static void mem_parity_error(unsigned char reason, struct pt_regs * regs)
{
	unsigned char ack;

	printk("Uhhuh. NMI received. Dazed and confused, but trying to continue\n");
	printk("You probably have a hardware problem with your RAM chips\n");

	/* Clear and disable the memory parity error line. */
	ack = (reason & 0xf) | 4;
	outb(ack, 0x61);
}
569
/*
 * Report an IOCK NMI, dump the registers and toggle bit 3 of port 0x61
 * (set, delay, clear).
 */
static void io_check_error(unsigned char reason, struct pt_regs * regs)
{
	unsigned char ctl;

	printk("NMI: IOCK error (debug interrupt?)\n");
	show_registers(regs);

	/* Re-enable the IOCK line, wait for a few seconds */
	ctl = (reason & 0xf) | 8;
	outb(ctl, 0x61);
	mdelay(2000);
	ctl &= ~8;
	outb(ctl, 0x61);
}
582
/* Log an NMI whose @reason matches none of the handled sources.  @regs is unused. */
static void unknown_nmi_error(unsigned char reason, struct pt_regs * regs)
{
	printk("Uhhuh. NMI received for unknown reason %02x.\n", reason);
	printk("Dazed and confused, but trying to continue\n");
	printk("Do you have a strange power saving mode enabled?\n");
}
588
Andi Kleen6fefb0d2005-04-16 15:25:03 -0700589/* Runs on IST stack. This code must keep interrupts off all the time.
590 Nested NMIs are prevented by the CPU. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700591asmlinkage void default_do_nmi(struct pt_regs *regs)
592{
593 unsigned char reason = 0;
Ashok Raj76e4f662005-06-25 14:55:00 -0700594 int cpu;
595
596 cpu = smp_processor_id();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700597
598 /* Only the BSP gets external NMIs from the system. */
Ashok Raj76e4f662005-06-25 14:55:00 -0700599 if (!cpu)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700600 reason = get_nmi_reason();
601
602 if (!(reason & 0xc0)) {
603 if (notify_die(DIE_NMI_IPI, "nmi_ipi", regs, reason, 0, SIGINT)
604 == NOTIFY_STOP)
605 return;
606#ifdef CONFIG_X86_LOCAL_APIC
607 /*
608 * Ok, so this is none of the documented NMI sources,
609 * so it must be the NMI watchdog.
610 */
611 if (nmi_watchdog > 0) {
612 nmi_watchdog_tick(regs,reason);
613 return;
614 }
615#endif
616 unknown_nmi_error(reason, regs);
617 return;
618 }
619 if (notify_die(DIE_NMI, "nmi", regs, reason, 0, SIGINT) == NOTIFY_STOP)
620 return;
621
622 /* AK: following checks seem to be broken on modern chipsets. FIXME */
623
624 if (reason & 0x80)
625 mem_parity_error(reason, regs);
626 if (reason & 0x40)
627 io_check_error(reason, regs);
628}
629
Prasanna S Panchamukhi0f2fbdc2005-09-06 15:19:28 -0700630asmlinkage void __kprobes do_int3(struct pt_regs * regs, long error_code)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700631{
632 if (notify_die(DIE_INT3, "int3", regs, error_code, 3, SIGTRAP) == NOTIFY_STOP) {
633 return;
634 }
635 do_trap(3, SIGTRAP, "int3", regs, error_code, NULL);
636 return;
637}
638
Andi Kleen6fefb0d2005-04-16 15:25:03 -0700639/* Help handler running on IST stack to switch back to user stack
640 for scheduling or signal handling. The actual stack switch is done in
641 entry.S */
642asmlinkage struct pt_regs *sync_regs(struct pt_regs *eregs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700643{
Andi Kleen6fefb0d2005-04-16 15:25:03 -0700644 struct pt_regs *regs = eregs;
645 /* Did already sync */
646 if (eregs == (struct pt_regs *)eregs->rsp)
647 ;
648 /* Exception from user space */
Vincent Hanquez76381fe2005-06-23 00:08:46 -0700649 else if (user_mode(eregs))
Andi Kleen6fefb0d2005-04-16 15:25:03 -0700650 regs = ((struct pt_regs *)current->thread.rsp0) - 1;
651 /* Exception from kernel and interrupts are enabled. Move to
652 kernel process stack. */
653 else if (eregs->eflags & X86_EFLAGS_IF)
654 regs = (struct pt_regs *)(eregs->rsp -= sizeof(struct pt_regs));
655 if (eregs != regs)
656 *regs = *eregs;
657 return regs;
658}
659
660/* runs on IST stack. */
Prasanna S Panchamukhi0f2fbdc2005-09-06 15:19:28 -0700661asmlinkage void __kprobes do_debug(struct pt_regs * regs,
662 unsigned long error_code)
Andi Kleen6fefb0d2005-04-16 15:25:03 -0700663{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700664 unsigned long condition;
665 struct task_struct *tsk = current;
666 siginfo_t info;
667
Linus Torvalds1da177e2005-04-16 15:20:36 -0700668#ifdef CONFIG_CHECKING
669 {
670 /* RED-PEN interaction with debugger - could destroy gs */
671 unsigned long gs;
672 struct x8664_pda *pda = cpu_pda + safe_smp_processor_id();
673 rdmsrl(MSR_GS_BASE, gs);
674 if (gs != (unsigned long)pda) {
675 wrmsrl(MSR_GS_BASE, pda);
676 printk("debug handler: wrong gs %lx expected %p\n", gs, pda);
677 }
678 }
679#endif
680
Vincent Hanqueze9129e52005-06-23 00:08:46 -0700681 get_debugreg(condition, 6);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700682
683 if (notify_die(DIE_DEBUG, "debug", regs, condition, error_code,
Andi Kleendaeeafe2005-04-16 15:25:13 -0700684 SIGTRAP) == NOTIFY_STOP)
Andi Kleen6fefb0d2005-04-16 15:25:03 -0700685 return;
Andi Kleendaeeafe2005-04-16 15:25:13 -0700686
Linus Torvalds1da177e2005-04-16 15:20:36 -0700687 conditional_sti(regs);
688
689 /* Mask out spurious debug traps due to lazy DR7 setting */
690 if (condition & (DR_TRAP0|DR_TRAP1|DR_TRAP2|DR_TRAP3)) {
691 if (!tsk->thread.debugreg7) {
692 goto clear_dr7;
693 }
694 }
695
696 tsk->thread.debugreg6 = condition;
697
698 /* Mask out spurious TF errors due to lazy TF clearing */
Andi Kleendaeeafe2005-04-16 15:25:13 -0700699 if (condition & DR_STEP) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700700 /*
701 * The TF error should be masked out only if the current
702 * process is not traced and if the TRAP flag has been set
703 * previously by a tracing process (condition detected by
704 * the PT_DTRACE flag); remember that the i386 TRAP flag
705 * can be modified by the process itself in user mode,
706 * allowing programs to debug themselves without the ptrace()
707 * interface.
708 */
Vincent Hanquez76381fe2005-06-23 00:08:46 -0700709 if (!user_mode(regs))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710 goto clear_TF_reenable;
Andi Kleenbe61bff2005-04-16 15:24:57 -0700711 /*
712 * Was the TF flag set by a debugger? If so, clear it now,
713 * so that register information is correct.
714 */
715 if (tsk->ptrace & PT_DTRACE) {
716 regs->eflags &= ~TF_MASK;
717 tsk->ptrace &= ~PT_DTRACE;
718 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700719 }
720
721 /* Ok, finally something we can handle */
722 tsk->thread.trap_no = 1;
723 tsk->thread.error_code = error_code;
724 info.si_signo = SIGTRAP;
725 info.si_errno = 0;
726 info.si_code = TRAP_BRKPT;
Vincent Hanquez76381fe2005-06-23 00:08:46 -0700727 if (!user_mode(regs))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700728 goto clear_dr7;
729
730 info.si_addr = (void __user *)regs->rip;
731 force_sig_info(SIGTRAP, &info, tsk);
732clear_dr7:
Vincent Hanqueze9129e52005-06-23 00:08:46 -0700733 set_debugreg(0UL, 7);
Andi Kleen6fefb0d2005-04-16 15:25:03 -0700734 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700735
736clear_TF_reenable:
737 set_tsk_thread_flag(tsk, TIF_SINGLESTEP);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700738 regs->eflags &= ~TF_MASK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700739}
740
741static int kernel_math_error(struct pt_regs *regs, char *str)
742{
743 const struct exception_table_entry *fixup;
744 fixup = search_exception_tables(regs->rip);
745 if (fixup) {
746 regs->rip = fixup->fixup;
747 return 1;
748 }
749 notify_die(DIE_GPF, str, regs, 0, 16, SIGFPE);
Andi Kleen3a848f62005-04-16 15:25:06 -0700750 /* Illegal floating point operation in the kernel */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700751 die(str, regs, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700752 return 0;
753}
754
755/*
756 * Note that we play around with the 'TS' bit in an attempt to get
757 * the correct behaviour even in the presence of the asynchronous
758 * IRQ13 behaviour
759 */
760asmlinkage void do_coprocessor_error(struct pt_regs *regs)
761{
762 void __user *rip = (void __user *)(regs->rip);
763 struct task_struct * task;
764 siginfo_t info;
765 unsigned short cwd, swd;
766
767 conditional_sti(regs);
Vincent Hanquez76381fe2005-06-23 00:08:46 -0700768 if (!user_mode(regs) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700769 kernel_math_error(regs, "kernel x87 math error"))
770 return;
771
772 /*
773 * Save the info for the exception handler and clear the error.
774 */
775 task = current;
776 save_init_fpu(task);
777 task->thread.trap_no = 16;
778 task->thread.error_code = 0;
779 info.si_signo = SIGFPE;
780 info.si_errno = 0;
781 info.si_code = __SI_FAULT;
782 info.si_addr = rip;
783 /*
784 * (~cwd & swd) will mask out exceptions that are not set to unmasked
785 * status. 0x3f is the exception bits in these regs, 0x200 is the
786 * C1 reg you need in case of a stack fault, 0x040 is the stack
787 * fault bit. We should only be taking one exception at a time,
788 * so if this combination doesn't produce any single exception,
789 * then we have a bad program that isn't synchronizing its FPU usage
790 * and it will suffer the consequences since we won't be able to
791 * fully reproduce the context of the exception
792 */
793 cwd = get_fpu_cwd(task);
794 swd = get_fpu_swd(task);
Chuck Ebbertff347b22005-09-12 18:49:25 +0200795 switch (swd & ~cwd & 0x3f) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700796 case 0x000:
797 default:
798 break;
799 case 0x001: /* Invalid Op */
Chuck Ebbertff347b22005-09-12 18:49:25 +0200800 /*
801 * swd & 0x240 == 0x040: Stack Underflow
802 * swd & 0x240 == 0x240: Stack Overflow
803 * User must clear the SF bit (0x40) if set
804 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700805 info.si_code = FPE_FLTINV;
806 break;
807 case 0x002: /* Denormalize */
808 case 0x010: /* Underflow */
809 info.si_code = FPE_FLTUND;
810 break;
811 case 0x004: /* Zero Divide */
812 info.si_code = FPE_FLTDIV;
813 break;
814 case 0x008: /* Overflow */
815 info.si_code = FPE_FLTOVF;
816 break;
817 case 0x020: /* Precision */
818 info.si_code = FPE_FLTRES;
819 break;
820 }
821 force_sig_info(SIGFPE, &info, task);
822}
823
824asmlinkage void bad_intr(void)
825{
826 printk("bad interrupt");
827}
828
829asmlinkage void do_simd_coprocessor_error(struct pt_regs *regs)
830{
831 void __user *rip = (void __user *)(regs->rip);
832 struct task_struct * task;
833 siginfo_t info;
834 unsigned short mxcsr;
835
836 conditional_sti(regs);
Vincent Hanquez76381fe2005-06-23 00:08:46 -0700837 if (!user_mode(regs) &&
Andi Kleen3a848f62005-04-16 15:25:06 -0700838 kernel_math_error(regs, "kernel simd math error"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700839 return;
840
841 /*
842 * Save the info for the exception handler and clear the error.
843 */
844 task = current;
845 save_init_fpu(task);
846 task->thread.trap_no = 19;
847 task->thread.error_code = 0;
848 info.si_signo = SIGFPE;
849 info.si_errno = 0;
850 info.si_code = __SI_FAULT;
851 info.si_addr = rip;
852 /*
853 * The SIMD FPU exceptions are handled a little differently, as there
854 * is only a single status/control register. Thus, to determine which
855 * unmasked exception was caught we must mask the exception mask bits
856 * at 0x1f80, and then use these to mask the exception bits at 0x3f.
857 */
858 mxcsr = get_fpu_mxcsr(task);
859 switch (~((mxcsr & 0x1f80) >> 7) & (mxcsr & 0x3f)) {
860 case 0x000:
861 default:
862 break;
863 case 0x001: /* Invalid Op */
864 info.si_code = FPE_FLTINV;
865 break;
866 case 0x002: /* Denormalize */
867 case 0x010: /* Underflow */
868 info.si_code = FPE_FLTUND;
869 break;
870 case 0x004: /* Zero Divide */
871 info.si_code = FPE_FLTDIV;
872 break;
873 case 0x008: /* Overflow */
874 info.si_code = FPE_FLTOVF;
875 break;
876 case 0x020: /* Precision */
877 info.si_code = FPE_FLTRES;
878 break;
879 }
880 force_sig_info(SIGFPE, &info, task);
881}
882
883asmlinkage void do_spurious_interrupt_bug(struct pt_regs * regs)
884{
885}
886
887asmlinkage void __attribute__((weak)) smp_thermal_interrupt(void)
888{
889}
890
Jacob Shin89b831e2005-11-05 17:25:53 +0100891asmlinkage void __attribute__((weak)) mce_threshold_interrupt(void)
892{
893}
894
Linus Torvalds1da177e2005-04-16 15:20:36 -0700895/*
896 * 'math_state_restore()' saves the current math information in the
897 * old math state array, and gets the new ones from the current task
898 *
899 * Careful.. There are problems with IBM-designed IRQ13 behaviour.
900 * Don't touch unless you *really* know how it works.
901 */
902asmlinkage void math_state_restore(void)
903{
904 struct task_struct *me = current;
905 clts(); /* Allow maths ops (or we recurse) */
906
907 if (!used_math())
908 init_fpu(me);
909 restore_fpu_checking(&me->thread.i387.fxsave);
910 me->thread_info->status |= TS_USEDFPU;
911}
912
913void do_call_debug(struct pt_regs *regs)
914{
915 notify_die(DIE_CALL, "debug call", regs, 0, 255, SIGINT);
916}
917
918void __init trap_init(void)
919{
920 set_intr_gate(0,&divide_error);
921 set_intr_gate_ist(1,&debug,DEBUG_STACK);
922 set_intr_gate_ist(2,&nmi,NMI_STACK);
923 set_system_gate(3,&int3);
924 set_system_gate(4,&overflow); /* int4-5 can be called from all */
925 set_system_gate(5,&bounds);
926 set_intr_gate(6,&invalid_op);
927 set_intr_gate(7,&device_not_available);
928 set_intr_gate_ist(8,&double_fault, DOUBLEFAULT_STACK);
929 set_intr_gate(9,&coprocessor_segment_overrun);
930 set_intr_gate(10,&invalid_TSS);
931 set_intr_gate(11,&segment_not_present);
932 set_intr_gate_ist(12,&stack_segment,STACKFAULT_STACK);
933 set_intr_gate(13,&general_protection);
934 set_intr_gate(14,&page_fault);
935 set_intr_gate(15,&spurious_interrupt_bug);
936 set_intr_gate(16,&coprocessor_error);
937 set_intr_gate(17,&alignment_check);
938#ifdef CONFIG_X86_MCE
939 set_intr_gate_ist(18,&machine_check, MCE_STACK);
940#endif
941 set_intr_gate(19,&simd_coprocessor_error);
942
943#ifdef CONFIG_IA32_EMULATION
944 set_system_gate(IA32_SYSCALL_VECTOR, ia32_syscall);
945#endif
946
947 set_intr_gate(KDB_VECTOR, call_debug);
948
949 /*
950 * Should be a barrier for any external CPU state.
951 */
952 cpu_init();
953}
954
955
956/* Actual parsing is done early in setup.c. */
957static int __init oops_dummy(char *s)
958{
959 panic_on_oops = 1;
960 return -1;
961}
962__setup("oops=", oops_dummy);
963
964static int __init kstack_setup(char *s)
965{
966 kstack_depth_to_print = simple_strtoul(s,NULL,0);
967 return 0;
968}
969__setup("kstack=", kstack_setup);
970