/*
 * arch/ia64/kernel/crash.c
 *
 * Architecture specific (ia64) functions for kexec based crash dumps.
 *
 * Created by: Khalid Aziz <khalid.aziz@hp.com>
 * Copyright (C) 2005 Hewlett-Packard Development Company, L.P.
 * Copyright (C) 2005 Intel Corp	Zou Nan hai <nanhai.zou@intel.com>
 *
 */
|  | 11 | #include <linux/smp.h> | 
|  | 12 | #include <linux/delay.h> | 
|  | 13 | #include <linux/crash_dump.h> | 
|  | 14 | #include <linux/bootmem.h> | 
|  | 15 | #include <linux/kexec.h> | 
|  | 16 | #include <linux/elfcore.h> | 
|  | 17 | #include <linux/sysctl.h> | 
|  | 18 | #include <linux/init.h> | 
| Christoph Hellwig | 1eeb66a | 2007-05-08 00:27:03 -0700 | [diff] [blame] | 19 | #include <linux/kdebug.h> | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 20 |  | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 21 | #include <asm/mca.h> | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 22 |  | 
|  | 23 | int kdump_status[NR_CPUS]; | 
| Simon Horman | 0ac1fac | 2007-02-14 16:15:02 +0900 | [diff] [blame] | 24 | static atomic_t kdump_cpu_frozen; | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 25 | atomic_t kdump_in_progress; | 
| Hidetoshi Seto | 1726b08 | 2009-08-06 14:51:57 -0700 | [diff] [blame] | 26 | static int kdump_freeze_monarch; | 
| Simon Horman | 0ac1fac | 2007-02-14 16:15:02 +0900 | [diff] [blame] | 27 | static int kdump_on_init = 1; | 
| Hidetoshi Seto | b0247a5 | 2008-04-08 13:31:47 +0900 | [diff] [blame] | 28 | static int kdump_on_fatal_mca = 1; | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 29 |  | 
|  | 30 | static inline Elf64_Word | 
|  | 31 | *append_elf_note(Elf64_Word *buf, char *name, unsigned type, void *data, | 
|  | 32 | size_t data_len) | 
|  | 33 | { | 
|  | 34 | struct elf_note *note = (struct elf_note *)buf; | 
|  | 35 | note->n_namesz = strlen(name) + 1; | 
|  | 36 | note->n_descsz = data_len; | 
|  | 37 | note->n_type   = type; | 
|  | 38 | buf += (sizeof(*note) + 3)/4; | 
|  | 39 | memcpy(buf, name, note->n_namesz); | 
|  | 40 | buf += (note->n_namesz + 3)/4; | 
|  | 41 | memcpy(buf, data, data_len); | 
|  | 42 | buf += (data_len + 3)/4; | 
|  | 43 | return buf; | 
|  | 44 | } | 
|  | 45 |  | 
|  | 46 | static void | 
|  | 47 | final_note(void *buf) | 
|  | 48 | { | 
|  | 49 | memset(buf, 0, sizeof(struct elf_note)); | 
|  | 50 | } | 
|  | 51 |  | 
|  | 52 | extern void ia64_dump_cpu_regs(void *); | 
|  | 53 |  | 
|  | 54 | static DEFINE_PER_CPU(struct elf_prstatus, elf_prstatus); | 
|  | 55 |  | 
|  | 56 | void | 
| Al Viro | ccbebda | 2007-02-09 16:38:10 +0000 | [diff] [blame] | 57 | crash_save_this_cpu(void) | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 58 | { | 
|  | 59 | void *buf; | 
|  | 60 | unsigned long cfm, sof, sol; | 
|  | 61 |  | 
|  | 62 | int cpu = smp_processor_id(); | 
|  | 63 | struct elf_prstatus *prstatus = &per_cpu(elf_prstatus, cpu); | 
|  | 64 |  | 
|  | 65 | elf_greg_t *dst = (elf_greg_t *)&(prstatus->pr_reg); | 
|  | 66 | memset(prstatus, 0, sizeof(*prstatus)); | 
|  | 67 | prstatus->pr_pid = current->pid; | 
|  | 68 |  | 
|  | 69 | ia64_dump_cpu_regs(dst); | 
|  | 70 | cfm = dst[43]; | 
|  | 71 | sol = (cfm >> 7) & 0x7f; | 
|  | 72 | sof = cfm & 0x7f; | 
|  | 73 | dst[46] = (unsigned long)ia64_rse_skip_regs((unsigned long *)dst[46], | 
|  | 74 | sof - sol); | 
|  | 75 |  | 
|  | 76 | buf = (u64 *) per_cpu_ptr(crash_notes, cpu); | 
|  | 77 | if (!buf) | 
|  | 78 | return; | 
| Simon Horman | 6672f76 | 2007-05-08 00:28:22 -0700 | [diff] [blame] | 79 | buf = append_elf_note(buf, KEXEC_CORE_NOTE_NAME, NT_PRSTATUS, prstatus, | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 80 | sizeof(*prstatus)); | 
|  | 81 | final_note(buf); | 
|  | 82 | } | 
|  | 83 |  | 
#ifdef CONFIG_SMP
/*
 * Wait for all other online cpus to report themselves frozen.
 *
 * Polls kdump_cpu_frozen up to 1000 times with a udelay(1000) after each
 * unsuccessful poll.
 *
 * Returns 0 once the count equals num_online_cpus() - 1, or 1 if the
 * polls run out first.
 */
static int
kdump_wait_cpu_freeze(void)
{
	int expected = num_online_cpus() - 1;
	int tries;

	for (tries = 1000; tries > 0; tries--) {
		if (atomic_read(&kdump_cpu_frozen) == expected)
			return 0;
		udelay(1000);
	}
	return 1;
}
#endif
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 98 |  | 
/*
 * Called only after the system has panicked or is otherwise in a critical
 * state.  Does the minimum needed for a kexec'd kernel to run: disables
 * the iosapic and, on SMP, stops every other cpu.
 *
 * @pt: not used by this function.
 */
void
machine_crash_shutdown(struct pt_regs *pt)
{
	kexec_disable_iosapic();
#ifdef CONFIG_SMP
	/*
	 * If kdump_on_init is set and an INIT is asserted at this point,
	 * kdump will be started again via the INIT monarch.
	 */
	local_irq_disable();
	ia64_set_psr_mc();	/* mask MCA/INIT */

	/* Someone else already started a kdump: park this cpu instead. */
	if (atomic_inc_return(&kdump_in_progress) != 1)
		unw_init_running(kdump_cpu_freeze, NULL);

	/*
	 * This cpu is now ready for kdump; stop all the others by IPI or
	 * INIT.  They may receive an INIT from outside and one may even be
	 * the INIT monarch, but all any of them has to do is fall into
	 * kdump_cpu_freeze().
	 *
	 * If an INIT is asserted from here on:
	 * - Every receiver may be a slave, because some cpus could already
	 *   be frozen and INIT might be masked on the monarch.  All slaves
	 *   then freeze soon, since kdump_in_progress sends them into the
	 *   DIE_INIT_SLAVE_LEAVE handling.
	 * - One receiver may be a monarch, but the INIT rendezvous fails
	 *   because at least this cpu has INIT masked and never joins it.
	 *   All slaves and the monarch then freeze soon without waiting,
	 *   since kdump_in_progress makes them skip the INIT rendezvous.
	 */
	kdump_smp_send_stop();

	/* Everyone answered the IPI: nothing more to do. */
	if (kdump_wait_cpu_freeze() == 0)
		return;

	/* Not every cpu responded to the IPI; send INIT to freeze them. */
	kdump_smp_send_init();
	/* Wait again; avoid going ahead if at all possible. */
	kdump_wait_cpu_freeze();
#endif
}
|  | 147 |  | 
|  | 148 | static void | 
|  | 149 | machine_kdump_on_init(void) | 
|  | 150 | { | 
| Takao Indoh | 072f042 | 2008-04-15 05:59:54 -0400 | [diff] [blame] | 151 | crash_save_vmcoreinfo(); | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 152 | local_irq_disable(); | 
|  | 153 | kexec_disable_iosapic(); | 
|  | 154 | machine_kexec(ia64_kimage); | 
|  | 155 | } | 
|  | 156 |  | 
|  | 157 | void | 
|  | 158 | kdump_cpu_freeze(struct unw_frame_info *info, void *arg) | 
|  | 159 | { | 
|  | 160 | int cpuid; | 
| Hidetoshi Seto | 4295ab3 | 2009-08-06 14:51:56 -0700 | [diff] [blame] | 161 |  | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 162 | local_irq_disable(); | 
|  | 163 | cpuid = smp_processor_id(); | 
|  | 164 | crash_save_this_cpu(); | 
|  | 165 | current->thread.ksp = (__u64)info->sw - 16; | 
| Hidetoshi Seto | 4295ab3 | 2009-08-06 14:51:56 -0700 | [diff] [blame] | 166 |  | 
|  | 167 | ia64_set_psr_mc();	/* mask MCA/INIT and stop reentrance */ | 
|  | 168 |  | 
| Simon Horman | 0ac1fac | 2007-02-14 16:15:02 +0900 | [diff] [blame] | 169 | atomic_inc(&kdump_cpu_frozen); | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 170 | kdump_status[cpuid] = 1; | 
|  | 171 | mb(); | 
| Magnus Damm | bcb9b99 | 2007-02-05 15:43:42 +0900 | [diff] [blame] | 172 | for (;;) | 
|  | 173 | cpu_relax(); | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 174 | } | 
|  | 175 |  | 
|  | 176 | static int | 
|  | 177 | kdump_init_notifier(struct notifier_block *self, unsigned long val, void *data) | 
|  | 178 | { | 
|  | 179 | struct ia64_mca_notify_die *nd; | 
|  | 180 | struct die_args *args = data; | 
|  | 181 |  | 
| Hidetoshi Seto | 5959906 | 2009-08-06 14:51:57 -0700 | [diff] [blame] | 182 | if (atomic_read(&kdump_in_progress)) { | 
|  | 183 | switch (val) { | 
|  | 184 | case DIE_INIT_MONARCH_LEAVE: | 
|  | 185 | if (!kdump_freeze_monarch) | 
|  | 186 | break; | 
|  | 187 | /* fall through */ | 
|  | 188 | case DIE_INIT_SLAVE_LEAVE: | 
| Hidetoshi Seto | 0cced40 | 2009-08-06 14:51:58 -0700 | [diff] [blame] | 189 | case DIE_INIT_MONARCH_ENTER: | 
| Hidetoshi Seto | 5959906 | 2009-08-06 14:51:57 -0700 | [diff] [blame] | 190 | case DIE_MCA_RENDZVOUS_LEAVE: | 
|  | 191 | unw_init_running(kdump_cpu_freeze, NULL); | 
|  | 192 | break; | 
|  | 193 | } | 
|  | 194 | } | 
|  | 195 |  | 
| Hidetoshi Seto | b0247a5 | 2008-04-08 13:31:47 +0900 | [diff] [blame] | 196 | if (!kdump_on_init && !kdump_on_fatal_mca) | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 197 | return NOTIFY_DONE; | 
|  | 198 |  | 
| Kenji Kaneshige | 2010d7f | 2007-09-01 16:37:48 +0900 | [diff] [blame] | 199 | if (!ia64_kimage) { | 
|  | 200 | if (val == DIE_INIT_MONARCH_LEAVE) | 
|  | 201 | ia64_mca_printk(KERN_NOTICE | 
|  | 202 | "%s: kdump not configured\n", | 
| Harvey Harrison | d4ed808 | 2008-03-04 15:15:00 -0800 | [diff] [blame] | 203 | __func__); | 
| Kenji Kaneshige | 2010d7f | 2007-09-01 16:37:48 +0900 | [diff] [blame] | 204 | return NOTIFY_DONE; | 
|  | 205 | } | 
|  | 206 |  | 
| Jay Lan | 311f594 | 2007-04-03 17:53:42 -0700 | [diff] [blame] | 207 | if (val != DIE_INIT_MONARCH_LEAVE && | 
| Jay Lan | 311f594 | 2007-04-03 17:53:42 -0700 | [diff] [blame] | 208 | val != DIE_INIT_MONARCH_PROCESS && | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 209 | val != DIE_MCA_MONARCH_LEAVE) | 
|  | 210 | return NOTIFY_DONE; | 
|  | 211 |  | 
|  | 212 | nd = (struct ia64_mca_notify_die *)args->err; | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 213 |  | 
|  | 214 | switch (val) { | 
| Hidetoshi Seto | 3975aff | 2008-04-08 13:33:08 +0900 | [diff] [blame] | 215 | case DIE_INIT_MONARCH_PROCESS: | 
| Hidetoshi Seto | 5959906 | 2009-08-06 14:51:57 -0700 | [diff] [blame] | 216 | /* Reason code 1 means machine check rendezvous*/ | 
|  | 217 | if (kdump_on_init && (nd->sos->rv_rc != 1)) { | 
| Hidetoshi Seto | 1726b08 | 2009-08-06 14:51:57 -0700 | [diff] [blame] | 218 | if (atomic_inc_return(&kdump_in_progress) != 1) | 
|  | 219 | kdump_freeze_monarch = 1; | 
| Hidetoshi Seto | 3975aff | 2008-04-08 13:33:08 +0900 | [diff] [blame] | 220 | } | 
|  | 221 | break; | 
|  | 222 | case DIE_INIT_MONARCH_LEAVE: | 
| Hidetoshi Seto | 5959906 | 2009-08-06 14:51:57 -0700 | [diff] [blame] | 223 | /* Reason code 1 means machine check rendezvous*/ | 
|  | 224 | if (kdump_on_init && (nd->sos->rv_rc != 1)) | 
|  | 225 | machine_kdump_on_init(); | 
| Hidetoshi Seto | 3975aff | 2008-04-08 13:33:08 +0900 | [diff] [blame] | 226 | break; | 
|  | 227 | case DIE_MCA_MONARCH_LEAVE: | 
| Hidetoshi Seto | 4fa2f0e | 2008-04-17 17:00:37 +0900 | [diff] [blame] | 228 | /* *(nd->data) indicate if MCA is recoverable */ | 
|  | 229 | if (kdump_on_fatal_mca && !(*(nd->data))) { | 
| Hidetoshi Seto | 0cced40 | 2009-08-06 14:51:58 -0700 | [diff] [blame] | 230 | if (atomic_inc_return(&kdump_in_progress) == 1) | 
| Hidetoshi Seto | 1726b08 | 2009-08-06 14:51:57 -0700 | [diff] [blame] | 231 | machine_kdump_on_init(); | 
| Hidetoshi Seto | 1726b08 | 2009-08-06 14:51:57 -0700 | [diff] [blame] | 232 | /* We got fatal MCA while kdump!? No way!! */ | 
| Hidetoshi Seto | 3975aff | 2008-04-08 13:33:08 +0900 | [diff] [blame] | 233 | } | 
|  | 234 | break; | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 235 | } | 
|  | 236 | return NOTIFY_DONE; | 
|  | 237 | } | 
|  | 238 |  | 
#ifdef CONFIG_SYSCTL
/* Integer tunables controlling when kdump is triggered; both are mode 0644. */
static ctl_table kdump_ctl_table[] = {
	{
		/* Backed by kdump_on_init. */
		.procname	= "kdump_on_init",
		.data		= &kdump_on_init,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
	{
		/* Backed by kdump_on_fatal_mca. */
		.procname	= "kdump_on_fatal_mca",
		.data		= &kdump_on_fatal_mca,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec,
	},
	{ }	/* empty terminating entry */
};

/* Parent "kernel" directory entry holding the kdump tunables above. */
static ctl_table sys_table[] = {
	{
		.procname	= "kernel",
		.mode		= 0555,
		.child		= kdump_ctl_table,
	},
	{ }	/* empty terminating entry */
};
#endif
|  | 267 |  | 
|  | 268 | static int | 
|  | 269 | machine_crash_setup(void) | 
|  | 270 | { | 
| Jay Lan | 311f594 | 2007-04-03 17:53:42 -0700 | [diff] [blame] | 271 | /* be notified before default_monarch_init_process */ | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 272 | static struct notifier_block kdump_init_notifier_nb = { | 
|  | 273 | .notifier_call = kdump_init_notifier, | 
| Jay Lan | 311f594 | 2007-04-03 17:53:42 -0700 | [diff] [blame] | 274 | .priority = 1, | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 275 | }; | 
|  | 276 | int ret; | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 277 | if((ret = register_die_notifier(&kdump_init_notifier_nb)) != 0) | 
|  | 278 | return ret; | 
|  | 279 | #ifdef CONFIG_SYSCTL | 
| Eric W. Biederman | 0b4d414 | 2007-02-14 00:34:09 -0800 | [diff] [blame] | 280 | register_sysctl_table(sys_table); | 
| Zou Nan hai | a7956113 | 2006-12-07 09:51:35 -0800 | [diff] [blame] | 281 | #endif | 
|  | 282 | return 0; | 
|  | 283 | } | 
|  | 284 |  | 
|  | 285 | __initcall(machine_crash_setup); | 
|  | 286 |  |