| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 1 | /* | 
|  | 2 | *  libata-eh.c - libata error handling | 
|  | 3 | * | 
|  | 4 | *  Maintained by:  Jeff Garzik <jgarzik@pobox.com> | 
|  | 5 | *    		    Please ALWAYS copy linux-ide@vger.kernel.org | 
|  | 6 | *		    on emails. | 
|  | 7 | * | 
|  | 8 | *  Copyright 2006 Tejun Heo <htejun@gmail.com> | 
|  | 9 | * | 
|  | 10 | * | 
|  | 11 | *  This program is free software; you can redistribute it and/or | 
|  | 12 | *  modify it under the terms of the GNU General Public License as | 
|  | 13 | *  published by the Free Software Foundation; either version 2, or | 
|  | 14 | *  (at your option) any later version. | 
|  | 15 | * | 
|  | 16 | *  This program is distributed in the hope that it will be useful, | 
|  | 17 | *  but WITHOUT ANY WARRANTY; without even the implied warranty of | 
|  | 18 | *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU | 
|  | 19 | *  General Public License for more details. | 
|  | 20 | * | 
|  | 21 | *  You should have received a copy of the GNU General Public License | 
|  | 22 | *  along with this program; see the file COPYING.  If not, write to | 
|  | 23 | *  the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, | 
|  | 24 | *  USA. | 
|  | 25 | * | 
|  | 26 | * | 
|  | 27 | *  libata documentation is available via 'make {ps|pdf}docs', | 
|  | 28 | *  as Documentation/DocBook/libata.* | 
|  | 29 | * | 
|  | 30 | *  Hardware documentation available from http://www.t13.org/ and | 
|  | 31 | *  http://www.sata-io.org/ | 
|  | 32 | * | 
|  | 33 | */ | 
|  | 34 |  | 
|  | 35 | #include <linux/config.h> | 
|  | 36 | #include <linux/kernel.h> | 
|  | 37 | #include <scsi/scsi.h> | 
|  | 38 | #include <scsi/scsi_host.h> | 
|  | 39 | #include <scsi/scsi_eh.h> | 
|  | 40 | #include <scsi/scsi_device.h> | 
|  | 41 | #include <scsi/scsi_cmnd.h> | 
| Tejun Heo | f8bbfc2 | 2006-05-19 21:07:05 +0900 | [diff] [blame] | 42 | #include "scsi_transport_api.h" | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 43 |  | 
|  | 44 | #include <linux/libata.h> | 
|  | 45 |  | 
|  | 46 | #include "libata.h" | 
|  | 47 |  | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 48 | static void __ata_port_freeze(struct ata_port *ap); | 
| Tejun Heo | 720ba12 | 2006-05-31 18:28:13 +0900 | [diff] [blame] | 49 | static void ata_eh_finish(struct ata_port *ap); | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 50 |  | 
| Tejun Heo | 0c247c5 | 2006-05-15 20:58:19 +0900 | [diff] [blame] | 51 | static void ata_ering_record(struct ata_ering *ering, int is_io, | 
|  | 52 | unsigned int err_mask) | 
|  | 53 | { | 
|  | 54 | struct ata_ering_entry *ent; | 
|  | 55 |  | 
|  | 56 | WARN_ON(!err_mask); | 
|  | 57 |  | 
|  | 58 | ering->cursor++; | 
|  | 59 | ering->cursor %= ATA_ERING_SIZE; | 
|  | 60 |  | 
|  | 61 | ent = &ering->ring[ering->cursor]; | 
|  | 62 | ent->is_io = is_io; | 
|  | 63 | ent->err_mask = err_mask; | 
|  | 64 | ent->timestamp = get_jiffies_64(); | 
|  | 65 | } | 
|  | 66 |  | 
|  | 67 | static struct ata_ering_entry * ata_ering_top(struct ata_ering *ering) | 
|  | 68 | { | 
|  | 69 | struct ata_ering_entry *ent = &ering->ring[ering->cursor]; | 
|  | 70 | if (!ent->err_mask) | 
|  | 71 | return NULL; | 
|  | 72 | return ent; | 
|  | 73 | } | 
|  | 74 |  | 
|  | 75 | static int ata_ering_map(struct ata_ering *ering, | 
|  | 76 | int (*map_fn)(struct ata_ering_entry *, void *), | 
|  | 77 | void *arg) | 
|  | 78 | { | 
|  | 79 | int idx, rc = 0; | 
|  | 80 | struct ata_ering_entry *ent; | 
|  | 81 |  | 
|  | 82 | idx = ering->cursor; | 
|  | 83 | do { | 
|  | 84 | ent = &ering->ring[idx]; | 
|  | 85 | if (!ent->err_mask) | 
|  | 86 | break; | 
|  | 87 | rc = map_fn(ent, arg); | 
|  | 88 | if (rc) | 
|  | 89 | break; | 
|  | 90 | idx = (idx - 1 + ATA_ERING_SIZE) % ATA_ERING_SIZE; | 
|  | 91 | } while (idx != ering->cursor); | 
|  | 92 |  | 
|  | 93 | return rc; | 
|  | 94 | } | 
|  | 95 |  | 
| Tejun Heo | 64f65ca | 2006-06-24 20:30:18 +0900 | [diff] [blame] | 96 | static unsigned int ata_eh_dev_action(struct ata_device *dev) | 
|  | 97 | { | 
|  | 98 | struct ata_eh_context *ehc = &dev->ap->eh_context; | 
|  | 99 |  | 
|  | 100 | return ehc->i.action | ehc->i.dev_action[dev->devno]; | 
|  | 101 | } | 
|  | 102 |  | 
| Tejun Heo | af181c2 | 2006-06-24 20:30:18 +0900 | [diff] [blame] | 103 | static void ata_eh_clear_action(struct ata_device *dev, | 
|  | 104 | struct ata_eh_info *ehi, unsigned int action) | 
|  | 105 | { | 
|  | 106 | int i; | 
|  | 107 |  | 
|  | 108 | if (!dev) { | 
|  | 109 | ehi->action &= ~action; | 
|  | 110 | for (i = 0; i < ATA_MAX_DEVICES; i++) | 
|  | 111 | ehi->dev_action[i] &= ~action; | 
|  | 112 | } else { | 
|  | 113 | /* doesn't make sense for port-wide EH actions */ | 
|  | 114 | WARN_ON(!(action & ATA_EH_PERDEV_MASK)); | 
|  | 115 |  | 
|  | 116 | /* break ehi->action into ehi->dev_action */ | 
|  | 117 | if (ehi->action & action) { | 
|  | 118 | for (i = 0; i < ATA_MAX_DEVICES; i++) | 
|  | 119 | ehi->dev_action[i] |= ehi->action & action; | 
|  | 120 | ehi->action &= ~action; | 
|  | 121 | } | 
|  | 122 |  | 
|  | 123 | /* turn off the specified per-dev action */ | 
|  | 124 | ehi->dev_action[dev->devno] &= ~action; | 
|  | 125 | } | 
|  | 126 | } | 
|  | 127 |  | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 128 | /** | 
|  | 129 | *	ata_scsi_timed_out - SCSI layer time out callback | 
|  | 130 | *	@cmd: timed out SCSI command | 
|  | 131 | * | 
|  | 132 | *	Handles SCSI layer timeout.  We race with normal completion of | 
|  | 133 | *	the qc for @cmd.  If the qc is already gone, we lose and let | 
|  | 134 | *	the scsi command finish (EH_HANDLED).  Otherwise, the qc has | 
|  | 135 | *	timed out and EH should be invoked.  Prevent ata_qc_complete() | 
|  | 136 | *	from finishing it by setting EH_SCHEDULED and return | 
|  | 137 | *	EH_NOT_HANDLED. | 
|  | 138 | * | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 139 | *	TODO: kill this function once old EH is gone. | 
|  | 140 | * | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 141 | *	LOCKING: | 
|  | 142 | *	Called from timer context | 
|  | 143 | * | 
|  | 144 | *	RETURNS: | 
|  | 145 | *	EH_HANDLED or EH_NOT_HANDLED | 
|  | 146 | */ | 
|  | 147 | enum scsi_eh_timer_return ata_scsi_timed_out(struct scsi_cmnd *cmd) | 
|  | 148 | { | 
|  | 149 | struct Scsi_Host *host = cmd->device->host; | 
| Jeff Garzik | 35bb94b | 2006-04-11 13:12:34 -0400 | [diff] [blame] | 150 | struct ata_port *ap = ata_shost_to_port(host); | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 151 | unsigned long flags; | 
|  | 152 | struct ata_queued_cmd *qc; | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 153 | enum scsi_eh_timer_return ret; | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 154 |  | 
|  | 155 | DPRINTK("ENTER\n"); | 
|  | 156 |  | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 157 | if (ap->ops->error_handler) { | 
|  | 158 | ret = EH_NOT_HANDLED; | 
|  | 159 | goto out; | 
|  | 160 | } | 
|  | 161 |  | 
|  | 162 | ret = EH_HANDLED; | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 163 | spin_lock_irqsave(ap->lock, flags); | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 164 | qc = ata_qc_from_tag(ap, ap->active_tag); | 
|  | 165 | if (qc) { | 
|  | 166 | WARN_ON(qc->scsicmd != cmd); | 
|  | 167 | qc->flags |= ATA_QCFLAG_EH_SCHEDULED; | 
|  | 168 | qc->err_mask |= AC_ERR_TIMEOUT; | 
|  | 169 | ret = EH_NOT_HANDLED; | 
|  | 170 | } | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 171 | spin_unlock_irqrestore(ap->lock, flags); | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 172 |  | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 173 | out: | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 174 | DPRINTK("EXIT, ret=%d\n", ret); | 
|  | 175 | return ret; | 
|  | 176 | } | 
|  | 177 |  | 
|  | 178 | /** | 
|  | 179 | *	ata_scsi_error - SCSI layer error handler callback | 
|  | 180 | *	@host: SCSI host on which error occurred | 
|  | 181 | * | 
|  | 182 | *	Handles SCSI-layer-thrown error events. | 
|  | 183 | * | 
|  | 184 | *	LOCKING: | 
|  | 185 | *	Inherited from SCSI layer (none, can sleep) | 
|  | 186 | * | 
|  | 187 | *	RETURNS: | 
|  | 188 | *	Zero. | 
|  | 189 | */ | 
| Jeff Garzik | 381544b | 2006-04-11 13:04:39 -0400 | [diff] [blame] | 190 | void ata_scsi_error(struct Scsi_Host *host) | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 191 | { | 
| Jeff Garzik | 35bb94b | 2006-04-11 13:12:34 -0400 | [diff] [blame] | 192 | struct ata_port *ap = ata_shost_to_port(host); | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 193 | spinlock_t *ap_lock = ap->lock; | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 194 | int i, repeat_cnt = ATA_EH_MAX_REPEAT; | 
|  | 195 | unsigned long flags; | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 196 |  | 
|  | 197 | DPRINTK("ENTER\n"); | 
|  | 198 |  | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 199 | /* synchronize with port task */ | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 200 | ata_port_flush_task(ap); | 
|  | 201 |  | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 202 | /* synchronize with host_set lock and sort out timeouts */ | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 203 |  | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 204 | /* For new EH, all qcs are finished in one of three ways - | 
|  | 205 | * normal completion, error completion, and SCSI timeout. | 
|  | 206 | * Both cmpletions can race against SCSI timeout.  When normal | 
|  | 207 | * completion wins, the qc never reaches EH.  When error | 
|  | 208 | * completion wins, the qc has ATA_QCFLAG_FAILED set. | 
|  | 209 | * | 
|  | 210 | * When SCSI timeout wins, things are a bit more complex. | 
|  | 211 | * Normal or error completion can occur after the timeout but | 
|  | 212 | * before this point.  In such cases, both types of | 
|  | 213 | * completions are honored.  A scmd is determined to have | 
|  | 214 | * timed out iff its associated qc is active and not failed. | 
|  | 215 | */ | 
|  | 216 | if (ap->ops->error_handler) { | 
|  | 217 | struct scsi_cmnd *scmd, *tmp; | 
|  | 218 | int nr_timedout = 0; | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 219 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 220 | spin_lock_irqsave(ap_lock, flags); | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 221 |  | 
|  | 222 | list_for_each_entry_safe(scmd, tmp, &host->eh_cmd_q, eh_entry) { | 
|  | 223 | struct ata_queued_cmd *qc; | 
|  | 224 |  | 
|  | 225 | for (i = 0; i < ATA_MAX_QUEUE; i++) { | 
|  | 226 | qc = __ata_qc_from_tag(ap, i); | 
|  | 227 | if (qc->flags & ATA_QCFLAG_ACTIVE && | 
|  | 228 | qc->scsicmd == scmd) | 
|  | 229 | break; | 
|  | 230 | } | 
|  | 231 |  | 
|  | 232 | if (i < ATA_MAX_QUEUE) { | 
|  | 233 | /* the scmd has an associated qc */ | 
|  | 234 | if (!(qc->flags & ATA_QCFLAG_FAILED)) { | 
|  | 235 | /* which hasn't failed yet, timeout */ | 
|  | 236 | qc->err_mask |= AC_ERR_TIMEOUT; | 
|  | 237 | qc->flags |= ATA_QCFLAG_FAILED; | 
|  | 238 | nr_timedout++; | 
|  | 239 | } | 
|  | 240 | } else { | 
|  | 241 | /* Normal completion occurred after | 
|  | 242 | * SCSI timeout but before this point. | 
|  | 243 | * Successfully complete it. | 
|  | 244 | */ | 
|  | 245 | scmd->retries = scmd->allowed; | 
|  | 246 | scsi_eh_finish_cmd(scmd, &ap->eh_done_q); | 
|  | 247 | } | 
|  | 248 | } | 
|  | 249 |  | 
|  | 250 | /* If we have timed out qcs.  They belong to EH from | 
|  | 251 | * this point but the state of the controller is | 
|  | 252 | * unknown.  Freeze the port to make sure the IRQ | 
|  | 253 | * handler doesn't diddle with those qcs.  This must | 
|  | 254 | * be done atomically w.r.t. setting QCFLAG_FAILED. | 
|  | 255 | */ | 
|  | 256 | if (nr_timedout) | 
|  | 257 | __ata_port_freeze(ap); | 
|  | 258 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 259 | spin_unlock_irqrestore(ap_lock, flags); | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 260 | } else | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 261 | spin_unlock_wait(ap_lock); | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 262 |  | 
|  | 263 | repeat: | 
|  | 264 | /* invoke error handler */ | 
|  | 265 | if (ap->ops->error_handler) { | 
| Tejun Heo | f3e81b1 | 2006-05-15 20:58:21 +0900 | [diff] [blame] | 266 | /* fetch & clear EH info */ | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 267 | spin_lock_irqsave(ap_lock, flags); | 
| Tejun Heo | f3e81b1 | 2006-05-15 20:58:21 +0900 | [diff] [blame] | 268 |  | 
|  | 269 | memset(&ap->eh_context, 0, sizeof(ap->eh_context)); | 
|  | 270 | ap->eh_context.i = ap->eh_info; | 
|  | 271 | memset(&ap->eh_info, 0, sizeof(ap->eh_info)); | 
|  | 272 |  | 
| Tejun Heo | c6cf9e9 | 2006-05-31 18:27:27 +0900 | [diff] [blame] | 273 | ap->flags |= ATA_FLAG_EH_IN_PROGRESS; | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 274 | ap->flags &= ~ATA_FLAG_EH_PENDING; | 
| Tejun Heo | f3e81b1 | 2006-05-15 20:58:21 +0900 | [diff] [blame] | 275 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 276 | spin_unlock_irqrestore(ap_lock, flags); | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 277 |  | 
| Tejun Heo | 720ba12 | 2006-05-31 18:28:13 +0900 | [diff] [blame] | 278 | /* invoke EH.  if unloading, just finish failed qcs */ | 
|  | 279 | if (!(ap->flags & ATA_FLAG_UNLOADING)) | 
|  | 280 | ap->ops->error_handler(ap); | 
|  | 281 | else | 
|  | 282 | ata_eh_finish(ap); | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 283 |  | 
|  | 284 | /* Exception might have happend after ->error_handler | 
|  | 285 | * recovered the port but before this point.  Repeat | 
|  | 286 | * EH in such case. | 
|  | 287 | */ | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 288 | spin_lock_irqsave(ap_lock, flags); | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 289 |  | 
|  | 290 | if (ap->flags & ATA_FLAG_EH_PENDING) { | 
|  | 291 | if (--repeat_cnt) { | 
|  | 292 | ata_port_printk(ap, KERN_INFO, | 
|  | 293 | "EH pending after completion, " | 
|  | 294 | "repeating EH (cnt=%d)\n", repeat_cnt); | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 295 | spin_unlock_irqrestore(ap_lock, flags); | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 296 | goto repeat; | 
|  | 297 | } | 
|  | 298 | ata_port_printk(ap, KERN_ERR, "EH pending after %d " | 
|  | 299 | "tries, giving up\n", ATA_EH_MAX_REPEAT); | 
|  | 300 | } | 
|  | 301 |  | 
| Tejun Heo | f3e81b1 | 2006-05-15 20:58:21 +0900 | [diff] [blame] | 302 | /* this run is complete, make sure EH info is clear */ | 
|  | 303 | memset(&ap->eh_info, 0, sizeof(ap->eh_info)); | 
|  | 304 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 305 | /* Clear host_eh_scheduled while holding ap_lock such | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 306 | * that if exception occurs after this point but | 
|  | 307 | * before EH completion, SCSI midlayer will | 
|  | 308 | * re-initiate EH. | 
|  | 309 | */ | 
|  | 310 | host->host_eh_scheduled = 0; | 
|  | 311 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 312 | spin_unlock_irqrestore(ap_lock, flags); | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 313 | } else { | 
|  | 314 | WARN_ON(ata_qc_from_tag(ap, ap->active_tag) == NULL); | 
|  | 315 | ap->ops->eng_timeout(ap); | 
|  | 316 | } | 
|  | 317 |  | 
|  | 318 | /* finish or retry handled scmd's and clean up */ | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 319 | WARN_ON(host->host_failed || !list_empty(&host->eh_cmd_q)); | 
|  | 320 |  | 
|  | 321 | scsi_eh_flush_done_q(&ap->eh_done_q); | 
|  | 322 |  | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 323 | /* clean up */ | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 324 | spin_lock_irqsave(ap_lock, flags); | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 325 |  | 
| Tejun Heo | 3e70639 | 2006-05-31 18:28:11 +0900 | [diff] [blame] | 326 | if (ap->flags & ATA_FLAG_LOADING) { | 
|  | 327 | ap->flags &= ~ATA_FLAG_LOADING; | 
|  | 328 | } else { | 
|  | 329 | if (ap->flags & ATA_FLAG_SCSI_HOTPLUG) | 
|  | 330 | queue_work(ata_aux_wq, &ap->hotplug_task); | 
|  | 331 | if (ap->flags & ATA_FLAG_RECOVERED) | 
|  | 332 | ata_port_printk(ap, KERN_INFO, "EH complete\n"); | 
|  | 333 | } | 
| Tejun Heo | 580b210 | 2006-05-31 18:28:05 +0900 | [diff] [blame] | 334 |  | 
|  | 335 | ap->flags &= ~(ATA_FLAG_SCSI_HOTPLUG | ATA_FLAG_RECOVERED); | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 336 |  | 
| Tejun Heo | c6cf9e9 | 2006-05-31 18:27:27 +0900 | [diff] [blame] | 337 | /* tell wait_eh that we're done */ | 
|  | 338 | ap->flags &= ~ATA_FLAG_EH_IN_PROGRESS; | 
|  | 339 | wake_up_all(&ap->eh_wait_q); | 
|  | 340 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 341 | spin_unlock_irqrestore(ap_lock, flags); | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 342 |  | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 343 | DPRINTK("EXIT\n"); | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 344 | } | 
|  | 345 |  | 
|  | 346 | /** | 
| Tejun Heo | c6cf9e9 | 2006-05-31 18:27:27 +0900 | [diff] [blame] | 347 | *	ata_port_wait_eh - Wait for the currently pending EH to complete | 
|  | 348 | *	@ap: Port to wait EH for | 
|  | 349 | * | 
|  | 350 | *	Wait until the currently pending EH is complete. | 
|  | 351 | * | 
|  | 352 | *	LOCKING: | 
|  | 353 | *	Kernel thread context (may sleep). | 
|  | 354 | */ | 
|  | 355 | void ata_port_wait_eh(struct ata_port *ap) | 
|  | 356 | { | 
|  | 357 | unsigned long flags; | 
|  | 358 | DEFINE_WAIT(wait); | 
|  | 359 |  | 
|  | 360 | retry: | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 361 | spin_lock_irqsave(ap->lock, flags); | 
| Tejun Heo | c6cf9e9 | 2006-05-31 18:27:27 +0900 | [diff] [blame] | 362 |  | 
|  | 363 | while (ap->flags & (ATA_FLAG_EH_PENDING | ATA_FLAG_EH_IN_PROGRESS)) { | 
|  | 364 | prepare_to_wait(&ap->eh_wait_q, &wait, TASK_UNINTERRUPTIBLE); | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 365 | spin_unlock_irqrestore(ap->lock, flags); | 
| Tejun Heo | c6cf9e9 | 2006-05-31 18:27:27 +0900 | [diff] [blame] | 366 | schedule(); | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 367 | spin_lock_irqsave(ap->lock, flags); | 
| Tejun Heo | c6cf9e9 | 2006-05-31 18:27:27 +0900 | [diff] [blame] | 368 | } | 
| Tejun Heo | 0a1b622 | 2006-06-11 11:01:38 +0900 | [diff] [blame] | 369 | finish_wait(&ap->eh_wait_q, &wait); | 
| Tejun Heo | c6cf9e9 | 2006-05-31 18:27:27 +0900 | [diff] [blame] | 370 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 371 | spin_unlock_irqrestore(ap->lock, flags); | 
| Tejun Heo | c6cf9e9 | 2006-05-31 18:27:27 +0900 | [diff] [blame] | 372 |  | 
|  | 373 | /* make sure SCSI EH is complete */ | 
|  | 374 | if (scsi_host_in_recovery(ap->host)) { | 
|  | 375 | msleep(10); | 
|  | 376 | goto retry; | 
|  | 377 | } | 
|  | 378 | } | 
|  | 379 |  | 
|  | 380 | /** | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 381 | *	ata_qc_timeout - Handle timeout of queued command | 
|  | 382 | *	@qc: Command that timed out | 
|  | 383 | * | 
|  | 384 | *	Some part of the kernel (currently, only the SCSI layer) | 
|  | 385 | *	has noticed that the active command on port @ap has not | 
|  | 386 | *	completed after a specified length of time.  Handle this | 
|  | 387 | *	condition by disabling DMA (if necessary) and completing | 
|  | 388 | *	transactions, with error if necessary. | 
|  | 389 | * | 
|  | 390 | *	This also handles the case of the "lost interrupt", where | 
|  | 391 | *	for some reason (possibly hardware bug, possibly driver bug) | 
|  | 392 | *	an interrupt was not delivered to the driver, even though the | 
|  | 393 | *	transaction completed successfully. | 
|  | 394 | * | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 395 | *	TODO: kill this function once old EH is gone. | 
|  | 396 | * | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 397 | *	LOCKING: | 
|  | 398 | *	Inherited from SCSI layer (none, can sleep) | 
|  | 399 | */ | 
|  | 400 | static void ata_qc_timeout(struct ata_queued_cmd *qc) | 
|  | 401 | { | 
|  | 402 | struct ata_port *ap = qc->ap; | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 403 | u8 host_stat = 0, drv_stat; | 
|  | 404 | unsigned long flags; | 
|  | 405 |  | 
|  | 406 | DPRINTK("ENTER\n"); | 
|  | 407 |  | 
|  | 408 | ap->hsm_task_state = HSM_ST_IDLE; | 
|  | 409 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 410 | spin_lock_irqsave(ap->lock, flags); | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 411 |  | 
|  | 412 | switch (qc->tf.protocol) { | 
|  | 413 |  | 
|  | 414 | case ATA_PROT_DMA: | 
|  | 415 | case ATA_PROT_ATAPI_DMA: | 
|  | 416 | host_stat = ap->ops->bmdma_status(ap); | 
|  | 417 |  | 
|  | 418 | /* before we do anything else, clear DMA-Start bit */ | 
|  | 419 | ap->ops->bmdma_stop(qc); | 
|  | 420 |  | 
|  | 421 | /* fall through */ | 
|  | 422 |  | 
|  | 423 | default: | 
|  | 424 | ata_altstatus(ap); | 
|  | 425 | drv_stat = ata_chk_status(ap); | 
|  | 426 |  | 
|  | 427 | /* ack bmdma irq events */ | 
|  | 428 | ap->ops->irq_clear(ap); | 
|  | 429 |  | 
| Tejun Heo | f15a1da | 2006-05-15 20:57:56 +0900 | [diff] [blame] | 430 | ata_dev_printk(qc->dev, KERN_ERR, "command 0x%x timeout, " | 
|  | 431 | "stat 0x%x host_stat 0x%x\n", | 
|  | 432 | qc->tf.command, drv_stat, host_stat); | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 433 |  | 
|  | 434 | /* complete taskfile transaction */ | 
| Jeff Garzik | c13b56a | 2006-04-02 10:34:24 -0400 | [diff] [blame] | 435 | qc->err_mask |= AC_ERR_TIMEOUT; | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 436 | break; | 
|  | 437 | } | 
|  | 438 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 439 | spin_unlock_irqrestore(ap->lock, flags); | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 440 |  | 
|  | 441 | ata_eh_qc_complete(qc); | 
|  | 442 |  | 
|  | 443 | DPRINTK("EXIT\n"); | 
|  | 444 | } | 
|  | 445 |  | 
|  | 446 | /** | 
|  | 447 | *	ata_eng_timeout - Handle timeout of queued command | 
|  | 448 | *	@ap: Port on which timed-out command is active | 
|  | 449 | * | 
|  | 450 | *	Some part of the kernel (currently, only the SCSI layer) | 
|  | 451 | *	has noticed that the active command on port @ap has not | 
|  | 452 | *	completed after a specified length of time.  Handle this | 
|  | 453 | *	condition by disabling DMA (if necessary) and completing | 
|  | 454 | *	transactions, with error if necessary. | 
|  | 455 | * | 
|  | 456 | *	This also handles the case of the "lost interrupt", where | 
|  | 457 | *	for some reason (possibly hardware bug, possibly driver bug) | 
|  | 458 | *	an interrupt was not delivered to the driver, even though the | 
|  | 459 | *	transaction completed successfully. | 
|  | 460 | * | 
| Tejun Heo | ad9e276 | 2006-05-15 20:58:12 +0900 | [diff] [blame] | 461 | *	TODO: kill this function once old EH is gone. | 
|  | 462 | * | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 463 | *	LOCKING: | 
|  | 464 | *	Inherited from SCSI layer (none, can sleep) | 
|  | 465 | */ | 
|  | 466 | void ata_eng_timeout(struct ata_port *ap) | 
|  | 467 | { | 
|  | 468 | DPRINTK("ENTER\n"); | 
|  | 469 |  | 
|  | 470 | ata_qc_timeout(ata_qc_from_tag(ap, ap->active_tag)); | 
|  | 471 |  | 
|  | 472 | DPRINTK("EXIT\n"); | 
|  | 473 | } | 
|  | 474 |  | 
| Tejun Heo | f686bcb | 2006-05-15 20:58:05 +0900 | [diff] [blame] | 475 | /** | 
|  | 476 | *	ata_qc_schedule_eh - schedule qc for error handling | 
|  | 477 | *	@qc: command to schedule error handling for | 
|  | 478 | * | 
|  | 479 | *	Schedule error handling for @qc.  EH will kick in as soon as | 
|  | 480 | *	other commands are drained. | 
|  | 481 | * | 
|  | 482 | *	LOCKING: | 
|  | 483 | *	spin_lock_irqsave(host_set lock) | 
|  | 484 | */ | 
|  | 485 | void ata_qc_schedule_eh(struct ata_queued_cmd *qc) | 
|  | 486 | { | 
|  | 487 | struct ata_port *ap = qc->ap; | 
|  | 488 |  | 
|  | 489 | WARN_ON(!ap->ops->error_handler); | 
|  | 490 |  | 
|  | 491 | qc->flags |= ATA_QCFLAG_FAILED; | 
|  | 492 | qc->ap->flags |= ATA_FLAG_EH_PENDING; | 
|  | 493 |  | 
|  | 494 | /* The following will fail if timeout has already expired. | 
|  | 495 | * ata_scsi_error() takes care of such scmds on EH entry. | 
|  | 496 | * Note that ATA_QCFLAG_FAILED is unconditionally set after | 
|  | 497 | * this function completes. | 
|  | 498 | */ | 
|  | 499 | scsi_req_abort_cmd(qc->scsicmd); | 
|  | 500 | } | 
|  | 501 |  | 
| Tejun Heo | 7b70fc0 | 2006-05-15 20:58:07 +0900 | [diff] [blame] | 502 | /** | 
|  | 503 | *	ata_port_schedule_eh - schedule error handling without a qc | 
|  | 504 | *	@ap: ATA port to schedule EH for | 
|  | 505 | * | 
|  | 506 | *	Schedule error handling for @ap.  EH will kick in as soon as | 
|  | 507 | *	all commands are drained. | 
|  | 508 | * | 
|  | 509 | *	LOCKING: | 
|  | 510 | *	spin_lock_irqsave(host_set lock) | 
|  | 511 | */ | 
|  | 512 | void ata_port_schedule_eh(struct ata_port *ap) | 
|  | 513 | { | 
|  | 514 | WARN_ON(!ap->ops->error_handler); | 
|  | 515 |  | 
|  | 516 | ap->flags |= ATA_FLAG_EH_PENDING; | 
| Tejun Heo | f8bbfc2 | 2006-05-19 21:07:05 +0900 | [diff] [blame] | 517 | scsi_schedule_eh(ap->host); | 
| Tejun Heo | 7b70fc0 | 2006-05-15 20:58:07 +0900 | [diff] [blame] | 518 |  | 
|  | 519 | DPRINTK("port EH scheduled\n"); | 
|  | 520 | } | 
|  | 521 |  | 
|  | 522 | /** | 
|  | 523 | *	ata_port_abort - abort all qc's on the port | 
|  | 524 | *	@ap: ATA port to abort qc's for | 
|  | 525 | * | 
|  | 526 | *	Abort all active qc's of @ap and schedule EH. | 
|  | 527 | * | 
|  | 528 | *	LOCKING: | 
|  | 529 | *	spin_lock_irqsave(host_set lock) | 
|  | 530 | * | 
|  | 531 | *	RETURNS: | 
|  | 532 | *	Number of aborted qc's. | 
|  | 533 | */ | 
|  | 534 | int ata_port_abort(struct ata_port *ap) | 
|  | 535 | { | 
|  | 536 | int tag, nr_aborted = 0; | 
|  | 537 |  | 
|  | 538 | WARN_ON(!ap->ops->error_handler); | 
|  | 539 |  | 
|  | 540 | for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { | 
|  | 541 | struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag); | 
|  | 542 |  | 
|  | 543 | if (qc) { | 
|  | 544 | qc->flags |= ATA_QCFLAG_FAILED; | 
|  | 545 | ata_qc_complete(qc); | 
|  | 546 | nr_aborted++; | 
|  | 547 | } | 
|  | 548 | } | 
|  | 549 |  | 
|  | 550 | if (!nr_aborted) | 
|  | 551 | ata_port_schedule_eh(ap); | 
|  | 552 |  | 
|  | 553 | return nr_aborted; | 
|  | 554 | } | 
|  | 555 |  | 
| Tejun Heo | e318049 | 2006-05-15 20:58:09 +0900 | [diff] [blame] | 556 | /** | 
|  | 557 | *	__ata_port_freeze - freeze port | 
|  | 558 | *	@ap: ATA port to freeze | 
|  | 559 | * | 
|  | 560 | *	This function is called when HSM violation or some other | 
|  | 561 | *	condition disrupts normal operation of the port.  Frozen port | 
|  | 562 | *	is not allowed to perform any operation until the port is | 
|  | 563 | *	thawed, which usually follows a successful reset. | 
|  | 564 | * | 
|  | 565 | *	ap->ops->freeze() callback can be used for freezing the port | 
|  | 566 | *	hardware-wise (e.g. mask interrupt and stop DMA engine).  If a | 
|  | 567 | *	port cannot be frozen hardware-wise, the interrupt handler | 
|  | 568 | *	must ack and clear interrupts unconditionally while the port | 
|  | 569 | *	is frozen. | 
|  | 570 | * | 
|  | 571 | *	LOCKING: | 
|  | 572 | *	spin_lock_irqsave(host_set lock) | 
|  | 573 | */ | 
|  | 574 | static void __ata_port_freeze(struct ata_port *ap) | 
|  | 575 | { | 
|  | 576 | WARN_ON(!ap->ops->error_handler); | 
|  | 577 |  | 
|  | 578 | if (ap->ops->freeze) | 
|  | 579 | ap->ops->freeze(ap); | 
|  | 580 |  | 
|  | 581 | ap->flags |= ATA_FLAG_FROZEN; | 
|  | 582 |  | 
|  | 583 | DPRINTK("ata%u port frozen\n", ap->id); | 
|  | 584 | } | 
|  | 585 |  | 
|  | 586 | /** | 
|  | 587 | *	ata_port_freeze - abort & freeze port | 
|  | 588 | *	@ap: ATA port to freeze | 
|  | 589 | * | 
|  | 590 | *	Abort and freeze @ap. | 
|  | 591 | * | 
|  | 592 | *	LOCKING: | 
|  | 593 | *	spin_lock_irqsave(host_set lock) | 
|  | 594 | * | 
|  | 595 | *	RETURNS: | 
|  | 596 | *	Number of aborted commands. | 
|  | 597 | */ | 
|  | 598 | int ata_port_freeze(struct ata_port *ap) | 
|  | 599 | { | 
|  | 600 | int nr_aborted; | 
|  | 601 |  | 
|  | 602 | WARN_ON(!ap->ops->error_handler); | 
|  | 603 |  | 
|  | 604 | nr_aborted = ata_port_abort(ap); | 
|  | 605 | __ata_port_freeze(ap); | 
|  | 606 |  | 
|  | 607 | return nr_aborted; | 
|  | 608 | } | 
|  | 609 |  | 
|  | 610 | /** | 
|  | 611 | *	ata_eh_freeze_port - EH helper to freeze port | 
|  | 612 | *	@ap: ATA port to freeze | 
|  | 613 | * | 
|  | 614 | *	Freeze @ap. | 
|  | 615 | * | 
|  | 616 | *	LOCKING: | 
|  | 617 | *	None. | 
|  | 618 | */ | 
|  | 619 | void ata_eh_freeze_port(struct ata_port *ap) | 
|  | 620 | { | 
|  | 621 | unsigned long flags; | 
|  | 622 |  | 
|  | 623 | if (!ap->ops->error_handler) | 
|  | 624 | return; | 
|  | 625 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 626 | spin_lock_irqsave(ap->lock, flags); | 
| Tejun Heo | e318049 | 2006-05-15 20:58:09 +0900 | [diff] [blame] | 627 | __ata_port_freeze(ap); | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 628 | spin_unlock_irqrestore(ap->lock, flags); | 
| Tejun Heo | e318049 | 2006-05-15 20:58:09 +0900 | [diff] [blame] | 629 | } | 
|  | 630 |  | 
|  | 631 | /** | 
|  | 632 | *	ata_port_thaw_port - EH helper to thaw port | 
|  | 633 | *	@ap: ATA port to thaw | 
|  | 634 | * | 
|  | 635 | *	Thaw frozen port @ap. | 
|  | 636 | * | 
|  | 637 | *	LOCKING: | 
|  | 638 | *	None. | 
|  | 639 | */ | 
|  | 640 | void ata_eh_thaw_port(struct ata_port *ap) | 
|  | 641 | { | 
|  | 642 | unsigned long flags; | 
|  | 643 |  | 
|  | 644 | if (!ap->ops->error_handler) | 
|  | 645 | return; | 
|  | 646 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 647 | spin_lock_irqsave(ap->lock, flags); | 
| Tejun Heo | e318049 | 2006-05-15 20:58:09 +0900 | [diff] [blame] | 648 |  | 
|  | 649 | ap->flags &= ~ATA_FLAG_FROZEN; | 
|  | 650 |  | 
|  | 651 | if (ap->ops->thaw) | 
|  | 652 | ap->ops->thaw(ap); | 
|  | 653 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 654 | spin_unlock_irqrestore(ap->lock, flags); | 
| Tejun Heo | e318049 | 2006-05-15 20:58:09 +0900 | [diff] [blame] | 655 |  | 
|  | 656 | DPRINTK("ata%u port thawed\n", ap->id); | 
|  | 657 | } | 
|  | 658 |  | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 659 | static void ata_eh_scsidone(struct scsi_cmnd *scmd) | 
|  | 660 | { | 
|  | 661 | /* nada */ | 
|  | 662 | } | 
|  | 663 |  | 
|  | 664 | static void __ata_eh_qc_complete(struct ata_queued_cmd *qc) | 
|  | 665 | { | 
|  | 666 | struct ata_port *ap = qc->ap; | 
|  | 667 | struct scsi_cmnd *scmd = qc->scsicmd; | 
|  | 668 | unsigned long flags; | 
|  | 669 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 670 | spin_lock_irqsave(ap->lock, flags); | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 671 | qc->scsidone = ata_eh_scsidone; | 
|  | 672 | __ata_qc_complete(qc); | 
|  | 673 | WARN_ON(ata_tag_valid(qc->tag)); | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 674 | spin_unlock_irqrestore(ap->lock, flags); | 
| Tejun Heo | ece1d63 | 2006-04-02 18:51:53 +0900 | [diff] [blame] | 675 |  | 
|  | 676 | scsi_eh_finish_cmd(scmd, &ap->eh_done_q); | 
|  | 677 | } | 
|  | 678 |  | 
|  | 679 | /** | 
|  | 680 | *	ata_eh_qc_complete - Complete an active ATA command from EH | 
|  | 681 | *	@qc: Command to complete | 
|  | 682 | * | 
|  | 683 | *	Indicate to the mid and upper layers that an ATA command has | 
|  | 684 | *	completed.  To be used from EH. | 
|  | 685 | */ | 
|  | 686 | void ata_eh_qc_complete(struct ata_queued_cmd *qc) | 
|  | 687 | { | 
|  | 688 | struct scsi_cmnd *scmd = qc->scsicmd; | 
|  | 689 | scmd->retries = scmd->allowed; | 
|  | 690 | __ata_eh_qc_complete(qc); | 
|  | 691 | } | 
|  | 692 |  | 
|  | 693 | /** | 
|  | 694 | *	ata_eh_qc_retry - Tell midlayer to retry an ATA command after EH | 
|  | 695 | *	@qc: Command to retry | 
|  | 696 | * | 
|  | 697 | *	Indicate to the mid and upper layers that an ATA command | 
|  | 698 | *	should be retried.  To be used from EH. | 
|  | 699 | * | 
|  | 700 | *	SCSI midlayer limits the number of retries to scmd->allowed. | 
|  | 701 | *	scmd->retries is decremented for commands which get retried | 
|  | 702 | *	due to unrelated failures (qc->err_mask is zero). | 
|  | 703 | */ | 
|  | 704 | void ata_eh_qc_retry(struct ata_queued_cmd *qc) | 
|  | 705 | { | 
|  | 706 | struct scsi_cmnd *scmd = qc->scsicmd; | 
|  | 707 | if (!qc->err_mask && scmd->retries) | 
|  | 708 | scmd->retries--; | 
|  | 709 | __ata_eh_qc_complete(qc); | 
|  | 710 | } | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 711 |  | 
|  | 712 | /** | 
| Tejun Heo | 0ea035a | 2006-05-31 18:28:01 +0900 | [diff] [blame] | 713 | *	ata_eh_detach_dev - detach ATA device | 
|  | 714 | *	@dev: ATA device to detach | 
|  | 715 | * | 
|  | 716 | *	Detach @dev. | 
|  | 717 | * | 
|  | 718 | *	LOCKING: | 
|  | 719 | *	None. | 
|  | 720 | */ | 
|  | 721 | static void ata_eh_detach_dev(struct ata_device *dev) | 
|  | 722 | { | 
|  | 723 | struct ata_port *ap = dev->ap; | 
|  | 724 | unsigned long flags; | 
|  | 725 |  | 
|  | 726 | ata_dev_disable(dev); | 
|  | 727 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 728 | spin_lock_irqsave(ap->lock, flags); | 
| Tejun Heo | 0ea035a | 2006-05-31 18:28:01 +0900 | [diff] [blame] | 729 |  | 
|  | 730 | dev->flags &= ~ATA_DFLAG_DETACH; | 
|  | 731 |  | 
|  | 732 | if (ata_scsi_offline_dev(dev)) { | 
|  | 733 | dev->flags |= ATA_DFLAG_DETACHED; | 
|  | 734 | ap->flags |= ATA_FLAG_SCSI_HOTPLUG; | 
|  | 735 | } | 
|  | 736 |  | 
| Tejun Heo | beb07c1 | 2006-06-24 20:30:19 +0900 | [diff] [blame] | 737 | /* clear per-dev EH actions */ | 
|  | 738 | ata_eh_clear_action(dev, &ap->eh_info, ATA_EH_PERDEV_MASK); | 
|  | 739 | ata_eh_clear_action(dev, &ap->eh_context.i, ATA_EH_PERDEV_MASK); | 
|  | 740 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 741 | spin_unlock_irqrestore(ap->lock, flags); | 
| Tejun Heo | 0ea035a | 2006-05-31 18:28:01 +0900 | [diff] [blame] | 742 | } | 
|  | 743 |  | 
|  | 744 | /** | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 745 | *	ata_eh_about_to_do - about to perform eh_action | 
|  | 746 | *	@ap: target ATA port | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 747 | *	@dev: target ATA dev for per-dev action (can be NULL) | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 748 | *	@action: action about to be performed | 
|  | 749 | * | 
|  | 750 | *	Called just before performing EH actions to clear related bits | 
|  | 751 | *	in @ap->eh_info such that eh actions are not unnecessarily | 
|  | 752 | *	repeated. | 
|  | 753 | * | 
|  | 754 | *	LOCKING: | 
|  | 755 | *	None. | 
|  | 756 | */ | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 757 | static void ata_eh_about_to_do(struct ata_port *ap, struct ata_device *dev, | 
|  | 758 | unsigned int action) | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 759 | { | 
|  | 760 | unsigned long flags; | 
|  | 761 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 762 | spin_lock_irqsave(ap->lock, flags); | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 763 | ata_eh_clear_action(dev, &ap->eh_info, action); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 764 | ap->flags |= ATA_FLAG_RECOVERED; | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 765 | spin_unlock_irqrestore(ap->lock, flags); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 766 | } | 
|  | 767 |  | 
|  | 768 | /** | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 769 | *	ata_eh_done - EH action complete | 
|  | 770 | *	@ap: target ATA port | 
|  | 771 | *	@dev: target ATA dev for per-dev action (can be NULL) | 
|  | 772 | *	@action: action just completed | 
|  | 773 | * | 
|  | 774 | *	Called right after performing EH actions to clear related bits | 
|  | 775 | *	in @ap->eh_context. | 
|  | 776 | * | 
|  | 777 | *	LOCKING: | 
|  | 778 | *	None. | 
|  | 779 | */ | 
|  | 780 | static void ata_eh_done(struct ata_port *ap, struct ata_device *dev, | 
|  | 781 | unsigned int action) | 
|  | 782 | { | 
|  | 783 | ata_eh_clear_action(dev, &ap->eh_context.i, action); | 
|  | 784 | } | 
|  | 785 |  | 
|  | 786 | /** | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 787 | *	ata_err_string - convert err_mask to descriptive string | 
|  | 788 | *	@err_mask: error mask to convert to string | 
|  | 789 | * | 
|  | 790 | *	Convert @err_mask to descriptive string.  Errors are | 
|  | 791 | *	prioritized according to severity and only the most severe | 
|  | 792 | *	error is reported. | 
|  | 793 | * | 
|  | 794 | *	LOCKING: | 
|  | 795 | *	None. | 
|  | 796 | * | 
|  | 797 | *	RETURNS: | 
|  | 798 | *	Descriptive string for @err_mask | 
|  | 799 | */ | 
|  | 800 | static const char * ata_err_string(unsigned int err_mask) | 
|  | 801 | { | 
|  | 802 | if (err_mask & AC_ERR_HOST_BUS) | 
|  | 803 | return "host bus error"; | 
|  | 804 | if (err_mask & AC_ERR_ATA_BUS) | 
|  | 805 | return "ATA bus error"; | 
|  | 806 | if (err_mask & AC_ERR_TIMEOUT) | 
|  | 807 | return "timeout"; | 
|  | 808 | if (err_mask & AC_ERR_HSM) | 
|  | 809 | return "HSM violation"; | 
|  | 810 | if (err_mask & AC_ERR_SYSTEM) | 
|  | 811 | return "internal error"; | 
|  | 812 | if (err_mask & AC_ERR_MEDIA) | 
|  | 813 | return "media error"; | 
|  | 814 | if (err_mask & AC_ERR_INVALID) | 
|  | 815 | return "invalid argument"; | 
|  | 816 | if (err_mask & AC_ERR_DEV) | 
|  | 817 | return "device error"; | 
|  | 818 | return "unknown error"; | 
|  | 819 | } | 
|  | 820 |  | 
|  | 821 | /** | 
| Tejun Heo | e8ee845 | 2006-05-15 21:03:46 +0900 | [diff] [blame] | 822 | *	ata_read_log_page - read a specific log page | 
|  | 823 | *	@dev: target device | 
|  | 824 | *	@page: page to read | 
|  | 825 | *	@buf: buffer to store read page | 
|  | 826 | *	@sectors: number of sectors to read | 
|  | 827 | * | 
|  | 828 | *	Read log page using READ_LOG_EXT command. | 
|  | 829 | * | 
|  | 830 | *	LOCKING: | 
|  | 831 | *	Kernel thread context (may sleep). | 
|  | 832 | * | 
|  | 833 | *	RETURNS: | 
|  | 834 | *	0 on success, AC_ERR_* mask otherwise. | 
|  | 835 | */ | 
|  | 836 | static unsigned int ata_read_log_page(struct ata_device *dev, | 
|  | 837 | u8 page, void *buf, unsigned int sectors) | 
|  | 838 | { | 
|  | 839 | struct ata_taskfile tf; | 
|  | 840 | unsigned int err_mask; | 
|  | 841 |  | 
|  | 842 | DPRINTK("read log page - page %d\n", page); | 
|  | 843 |  | 
|  | 844 | ata_tf_init(dev, &tf); | 
|  | 845 | tf.command = ATA_CMD_READ_LOG_EXT; | 
|  | 846 | tf.lbal = page; | 
|  | 847 | tf.nsect = sectors; | 
|  | 848 | tf.hob_nsect = sectors >> 8; | 
|  | 849 | tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_LBA48 | ATA_TFLAG_DEVICE; | 
|  | 850 | tf.protocol = ATA_PROT_PIO; | 
|  | 851 |  | 
|  | 852 | err_mask = ata_exec_internal(dev, &tf, NULL, DMA_FROM_DEVICE, | 
|  | 853 | buf, sectors * ATA_SECT_SIZE); | 
|  | 854 |  | 
|  | 855 | DPRINTK("EXIT, err_mask=%x\n", err_mask); | 
|  | 856 | return err_mask; | 
|  | 857 | } | 
|  | 858 |  | 
|  | 859 | /** | 
|  | 860 | *	ata_eh_read_log_10h - Read log page 10h for NCQ error details | 
|  | 861 | *	@dev: Device to read log page 10h from | 
|  | 862 | *	@tag: Resulting tag of the failed command | 
|  | 863 | *	@tf: Resulting taskfile registers of the failed command | 
|  | 864 | * | 
|  | 865 | *	Read log page 10h to obtain NCQ error details and clear error | 
|  | 866 | *	condition. | 
|  | 867 | * | 
|  | 868 | *	LOCKING: | 
|  | 869 | *	Kernel thread context (may sleep). | 
|  | 870 | * | 
|  | 871 | *	RETURNS: | 
|  | 872 | *	0 on success, -errno otherwise. | 
|  | 873 | */ | 
|  | 874 | static int ata_eh_read_log_10h(struct ata_device *dev, | 
|  | 875 | int *tag, struct ata_taskfile *tf) | 
|  | 876 | { | 
|  | 877 | u8 *buf = dev->ap->sector_buf; | 
|  | 878 | unsigned int err_mask; | 
|  | 879 | u8 csum; | 
|  | 880 | int i; | 
|  | 881 |  | 
|  | 882 | err_mask = ata_read_log_page(dev, ATA_LOG_SATA_NCQ, buf, 1); | 
|  | 883 | if (err_mask) | 
|  | 884 | return -EIO; | 
|  | 885 |  | 
|  | 886 | csum = 0; | 
|  | 887 | for (i = 0; i < ATA_SECT_SIZE; i++) | 
|  | 888 | csum += buf[i]; | 
|  | 889 | if (csum) | 
|  | 890 | ata_dev_printk(dev, KERN_WARNING, | 
|  | 891 | "invalid checksum 0x%x on log page 10h\n", csum); | 
|  | 892 |  | 
|  | 893 | if (buf[0] & 0x80) | 
|  | 894 | return -ENOENT; | 
|  | 895 |  | 
|  | 896 | *tag = buf[0] & 0x1f; | 
|  | 897 |  | 
|  | 898 | tf->command = buf[2]; | 
|  | 899 | tf->feature = buf[3]; | 
|  | 900 | tf->lbal = buf[4]; | 
|  | 901 | tf->lbam = buf[5]; | 
|  | 902 | tf->lbah = buf[6]; | 
|  | 903 | tf->device = buf[7]; | 
|  | 904 | tf->hob_lbal = buf[8]; | 
|  | 905 | tf->hob_lbam = buf[9]; | 
|  | 906 | tf->hob_lbah = buf[10]; | 
|  | 907 | tf->nsect = buf[12]; | 
|  | 908 | tf->hob_nsect = buf[13]; | 
|  | 909 |  | 
|  | 910 | return 0; | 
|  | 911 | } | 
|  | 912 |  | 
|  | 913 | /** | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 914 | *	atapi_eh_request_sense - perform ATAPI REQUEST_SENSE | 
|  | 915 | *	@dev: device to perform REQUEST_SENSE to | 
|  | 916 | *	@sense_buf: result sense data buffer (SCSI_SENSE_BUFFERSIZE bytes long) | 
|  | 917 | * | 
|  | 918 | *	Perform ATAPI REQUEST_SENSE after the device reported CHECK | 
|  | 919 | *	SENSE.  This function is EH helper. | 
|  | 920 | * | 
|  | 921 | *	LOCKING: | 
|  | 922 | *	Kernel thread context (may sleep). | 
|  | 923 | * | 
|  | 924 | *	RETURNS: | 
|  | 925 | *	0 on success, AC_ERR_* mask on failure | 
|  | 926 | */ | 
|  | 927 | static unsigned int atapi_eh_request_sense(struct ata_device *dev, | 
|  | 928 | unsigned char *sense_buf) | 
|  | 929 | { | 
|  | 930 | struct ata_port *ap = dev->ap; | 
|  | 931 | struct ata_taskfile tf; | 
|  | 932 | u8 cdb[ATAPI_CDB_LEN]; | 
|  | 933 |  | 
|  | 934 | DPRINTK("ATAPI request sense\n"); | 
|  | 935 |  | 
|  | 936 | ata_tf_init(dev, &tf); | 
|  | 937 |  | 
|  | 938 | /* FIXME: is this needed? */ | 
|  | 939 | memset(sense_buf, 0, SCSI_SENSE_BUFFERSIZE); | 
|  | 940 |  | 
|  | 941 | /* XXX: why tf_read here? */ | 
|  | 942 | ap->ops->tf_read(ap, &tf); | 
|  | 943 |  | 
|  | 944 | /* fill these in, for the case where they are -not- overwritten */ | 
|  | 945 | sense_buf[0] = 0x70; | 
|  | 946 | sense_buf[2] = tf.feature >> 4; | 
|  | 947 |  | 
|  | 948 | memset(cdb, 0, ATAPI_CDB_LEN); | 
|  | 949 | cdb[0] = REQUEST_SENSE; | 
|  | 950 | cdb[4] = SCSI_SENSE_BUFFERSIZE; | 
|  | 951 |  | 
|  | 952 | tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE; | 
|  | 953 | tf.command = ATA_CMD_PACKET; | 
|  | 954 |  | 
|  | 955 | /* is it pointless to prefer PIO for "safety reasons"? */ | 
|  | 956 | if (ap->flags & ATA_FLAG_PIO_DMA) { | 
|  | 957 | tf.protocol = ATA_PROT_ATAPI_DMA; | 
|  | 958 | tf.feature |= ATAPI_PKT_DMA; | 
|  | 959 | } else { | 
|  | 960 | tf.protocol = ATA_PROT_ATAPI; | 
|  | 961 | tf.lbam = (8 * 1024) & 0xff; | 
|  | 962 | tf.lbah = (8 * 1024) >> 8; | 
|  | 963 | } | 
|  | 964 |  | 
|  | 965 | return ata_exec_internal(dev, &tf, cdb, DMA_FROM_DEVICE, | 
|  | 966 | sense_buf, SCSI_SENSE_BUFFERSIZE); | 
|  | 967 | } | 
|  | 968 |  | 
|  | 969 | /** | 
|  | 970 | *	ata_eh_analyze_serror - analyze SError for a failed port | 
|  | 971 | *	@ap: ATA port to analyze SError for | 
|  | 972 | * | 
|  | 973 | *	Analyze SError if available and further determine cause of | 
|  | 974 | *	failure. | 
|  | 975 | * | 
|  | 976 | *	LOCKING: | 
|  | 977 | *	None. | 
|  | 978 | */ | 
|  | 979 | static void ata_eh_analyze_serror(struct ata_port *ap) | 
|  | 980 | { | 
|  | 981 | struct ata_eh_context *ehc = &ap->eh_context; | 
|  | 982 | u32 serror = ehc->i.serror; | 
|  | 983 | unsigned int err_mask = 0, action = 0; | 
|  | 984 |  | 
|  | 985 | if (serror & SERR_PERSISTENT) { | 
|  | 986 | err_mask |= AC_ERR_ATA_BUS; | 
|  | 987 | action |= ATA_EH_HARDRESET; | 
|  | 988 | } | 
|  | 989 | if (serror & | 
|  | 990 | (SERR_DATA_RECOVERED | SERR_COMM_RECOVERED | SERR_DATA)) { | 
|  | 991 | err_mask |= AC_ERR_ATA_BUS; | 
|  | 992 | action |= ATA_EH_SOFTRESET; | 
|  | 993 | } | 
|  | 994 | if (serror & SERR_PROTOCOL) { | 
|  | 995 | err_mask |= AC_ERR_HSM; | 
|  | 996 | action |= ATA_EH_SOFTRESET; | 
|  | 997 | } | 
|  | 998 | if (serror & SERR_INTERNAL) { | 
|  | 999 | err_mask |= AC_ERR_SYSTEM; | 
|  | 1000 | action |= ATA_EH_SOFTRESET; | 
|  | 1001 | } | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1002 | if (serror & (SERR_PHYRDY_CHG | SERR_DEV_XCHG)) | 
|  | 1003 | ata_ehi_hotplugged(&ehc->i); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1004 |  | 
|  | 1005 | ehc->i.err_mask |= err_mask; | 
|  | 1006 | ehc->i.action |= action; | 
|  | 1007 | } | 
|  | 1008 |  | 
|  | 1009 | /** | 
| Tejun Heo | e8ee845 | 2006-05-15 21:03:46 +0900 | [diff] [blame] | 1010 | *	ata_eh_analyze_ncq_error - analyze NCQ error | 
|  | 1011 | *	@ap: ATA port to analyze NCQ error for | 
|  | 1012 | * | 
|  | 1013 | *	Read log page 10h, determine the offending qc and acquire | 
|  | 1014 | *	error status TF.  For NCQ device errors, all LLDDs have to do | 
|  | 1015 | *	is setting AC_ERR_DEV in ehi->err_mask.  This function takes | 
|  | 1016 | *	care of the rest. | 
|  | 1017 | * | 
|  | 1018 | *	LOCKING: | 
|  | 1019 | *	Kernel thread context (may sleep). | 
|  | 1020 | */ | 
|  | 1021 | static void ata_eh_analyze_ncq_error(struct ata_port *ap) | 
|  | 1022 | { | 
|  | 1023 | struct ata_eh_context *ehc = &ap->eh_context; | 
|  | 1024 | struct ata_device *dev = ap->device; | 
|  | 1025 | struct ata_queued_cmd *qc; | 
|  | 1026 | struct ata_taskfile tf; | 
|  | 1027 | int tag, rc; | 
|  | 1028 |  | 
|  | 1029 | /* if frozen, we can't do much */ | 
|  | 1030 | if (ap->flags & ATA_FLAG_FROZEN) | 
|  | 1031 | return; | 
|  | 1032 |  | 
|  | 1033 | /* is it NCQ device error? */ | 
|  | 1034 | if (!ap->sactive || !(ehc->i.err_mask & AC_ERR_DEV)) | 
|  | 1035 | return; | 
|  | 1036 |  | 
|  | 1037 | /* has LLDD analyzed already? */ | 
|  | 1038 | for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { | 
|  | 1039 | qc = __ata_qc_from_tag(ap, tag); | 
|  | 1040 |  | 
|  | 1041 | if (!(qc->flags & ATA_QCFLAG_FAILED)) | 
|  | 1042 | continue; | 
|  | 1043 |  | 
|  | 1044 | if (qc->err_mask) | 
|  | 1045 | return; | 
|  | 1046 | } | 
|  | 1047 |  | 
|  | 1048 | /* okay, this error is ours */ | 
|  | 1049 | rc = ata_eh_read_log_10h(dev, &tag, &tf); | 
|  | 1050 | if (rc) { | 
|  | 1051 | ata_port_printk(ap, KERN_ERR, "failed to read log page 10h " | 
|  | 1052 | "(errno=%d)\n", rc); | 
|  | 1053 | return; | 
|  | 1054 | } | 
|  | 1055 |  | 
|  | 1056 | if (!(ap->sactive & (1 << tag))) { | 
|  | 1057 | ata_port_printk(ap, KERN_ERR, "log page 10h reported " | 
|  | 1058 | "inactive tag %d\n", tag); | 
|  | 1059 | return; | 
|  | 1060 | } | 
|  | 1061 |  | 
|  | 1062 | /* we've got the perpetrator, condemn it */ | 
|  | 1063 | qc = __ata_qc_from_tag(ap, tag); | 
|  | 1064 | memcpy(&qc->result_tf, &tf, sizeof(tf)); | 
|  | 1065 | qc->err_mask |= AC_ERR_DEV; | 
|  | 1066 | ehc->i.err_mask &= ~AC_ERR_DEV; | 
|  | 1067 | } | 
|  | 1068 |  | 
|  | 1069 | /** | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1070 | *	ata_eh_analyze_tf - analyze taskfile of a failed qc | 
|  | 1071 | *	@qc: qc to analyze | 
|  | 1072 | *	@tf: Taskfile registers to analyze | 
|  | 1073 | * | 
|  | 1074 | *	Analyze taskfile of @qc and further determine cause of | 
|  | 1075 | *	failure.  This function also requests ATAPI sense data if | 
|  | 1076 | *	avaliable. | 
|  | 1077 | * | 
|  | 1078 | *	LOCKING: | 
|  | 1079 | *	Kernel thread context (may sleep). | 
|  | 1080 | * | 
|  | 1081 | *	RETURNS: | 
|  | 1082 | *	Determined recovery action | 
|  | 1083 | */ | 
|  | 1084 | static unsigned int ata_eh_analyze_tf(struct ata_queued_cmd *qc, | 
|  | 1085 | const struct ata_taskfile *tf) | 
|  | 1086 | { | 
|  | 1087 | unsigned int tmp, action = 0; | 
|  | 1088 | u8 stat = tf->command, err = tf->feature; | 
|  | 1089 |  | 
|  | 1090 | if ((stat & (ATA_BUSY | ATA_DRQ | ATA_DRDY)) != ATA_DRDY) { | 
|  | 1091 | qc->err_mask |= AC_ERR_HSM; | 
|  | 1092 | return ATA_EH_SOFTRESET; | 
|  | 1093 | } | 
|  | 1094 |  | 
|  | 1095 | if (!(qc->err_mask & AC_ERR_DEV)) | 
|  | 1096 | return 0; | 
|  | 1097 |  | 
|  | 1098 | switch (qc->dev->class) { | 
|  | 1099 | case ATA_DEV_ATA: | 
|  | 1100 | if (err & ATA_ICRC) | 
|  | 1101 | qc->err_mask |= AC_ERR_ATA_BUS; | 
|  | 1102 | if (err & ATA_UNC) | 
|  | 1103 | qc->err_mask |= AC_ERR_MEDIA; | 
|  | 1104 | if (err & ATA_IDNF) | 
|  | 1105 | qc->err_mask |= AC_ERR_INVALID; | 
|  | 1106 | break; | 
|  | 1107 |  | 
|  | 1108 | case ATA_DEV_ATAPI: | 
|  | 1109 | tmp = atapi_eh_request_sense(qc->dev, | 
|  | 1110 | qc->scsicmd->sense_buffer); | 
|  | 1111 | if (!tmp) { | 
|  | 1112 | /* ATA_QCFLAG_SENSE_VALID is used to tell | 
|  | 1113 | * atapi_qc_complete() that sense data is | 
|  | 1114 | * already valid. | 
|  | 1115 | * | 
|  | 1116 | * TODO: interpret sense data and set | 
|  | 1117 | * appropriate err_mask. | 
|  | 1118 | */ | 
|  | 1119 | qc->flags |= ATA_QCFLAG_SENSE_VALID; | 
|  | 1120 | } else | 
|  | 1121 | qc->err_mask |= tmp; | 
|  | 1122 | } | 
|  | 1123 |  | 
|  | 1124 | if (qc->err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT | AC_ERR_ATA_BUS)) | 
|  | 1125 | action |= ATA_EH_SOFTRESET; | 
|  | 1126 |  | 
|  | 1127 | return action; | 
|  | 1128 | } | 
|  | 1129 |  | 
|  | 1130 | static int ata_eh_categorize_ering_entry(struct ata_ering_entry *ent) | 
|  | 1131 | { | 
|  | 1132 | if (ent->err_mask & (AC_ERR_ATA_BUS | AC_ERR_TIMEOUT)) | 
|  | 1133 | return 1; | 
|  | 1134 |  | 
|  | 1135 | if (ent->is_io) { | 
|  | 1136 | if (ent->err_mask & AC_ERR_HSM) | 
|  | 1137 | return 1; | 
|  | 1138 | if ((ent->err_mask & | 
|  | 1139 | (AC_ERR_DEV|AC_ERR_MEDIA|AC_ERR_INVALID)) == AC_ERR_DEV) | 
|  | 1140 | return 2; | 
|  | 1141 | } | 
|  | 1142 |  | 
|  | 1143 | return 0; | 
|  | 1144 | } | 
|  | 1145 |  | 
|  | 1146 | struct speed_down_needed_arg { | 
|  | 1147 | u64 since; | 
|  | 1148 | int nr_errors[3]; | 
|  | 1149 | }; | 
|  | 1150 |  | 
|  | 1151 | static int speed_down_needed_cb(struct ata_ering_entry *ent, void *void_arg) | 
|  | 1152 | { | 
|  | 1153 | struct speed_down_needed_arg *arg = void_arg; | 
|  | 1154 |  | 
|  | 1155 | if (ent->timestamp < arg->since) | 
|  | 1156 | return -1; | 
|  | 1157 |  | 
|  | 1158 | arg->nr_errors[ata_eh_categorize_ering_entry(ent)]++; | 
|  | 1159 | return 0; | 
|  | 1160 | } | 
|  | 1161 |  | 
|  | 1162 | /** | 
|  | 1163 | *	ata_eh_speed_down_needed - Determine wheter speed down is necessary | 
|  | 1164 | *	@dev: Device of interest | 
|  | 1165 | * | 
|  | 1166 | *	This function examines error ring of @dev and determines | 
|  | 1167 | *	whether speed down is necessary.  Speed down is necessary if | 
|  | 1168 | *	there have been more than 3 of Cat-1 errors or 10 of Cat-2 | 
|  | 1169 | *	errors during last 15 minutes. | 
|  | 1170 | * | 
|  | 1171 | *	Cat-1 errors are ATA_BUS, TIMEOUT for any command and HSM | 
|  | 1172 | *	violation for known supported commands. | 
|  | 1173 | * | 
|  | 1174 | *	Cat-2 errors are unclassified DEV error for known supported | 
|  | 1175 | *	command. | 
|  | 1176 | * | 
|  | 1177 | *	LOCKING: | 
|  | 1178 | *	Inherited from caller. | 
|  | 1179 | * | 
|  | 1180 | *	RETURNS: | 
|  | 1181 | *	1 if speed down is necessary, 0 otherwise | 
|  | 1182 | */ | 
|  | 1183 | static int ata_eh_speed_down_needed(struct ata_device *dev) | 
|  | 1184 | { | 
|  | 1185 | const u64 interval = 15LLU * 60 * HZ; | 
|  | 1186 | static const int err_limits[3] = { -1, 3, 10 }; | 
|  | 1187 | struct speed_down_needed_arg arg; | 
|  | 1188 | struct ata_ering_entry *ent; | 
|  | 1189 | int err_cat; | 
|  | 1190 | u64 j64; | 
|  | 1191 |  | 
|  | 1192 | ent = ata_ering_top(&dev->ering); | 
|  | 1193 | if (!ent) | 
|  | 1194 | return 0; | 
|  | 1195 |  | 
|  | 1196 | err_cat = ata_eh_categorize_ering_entry(ent); | 
|  | 1197 | if (err_cat == 0) | 
|  | 1198 | return 0; | 
|  | 1199 |  | 
|  | 1200 | memset(&arg, 0, sizeof(arg)); | 
|  | 1201 |  | 
|  | 1202 | j64 = get_jiffies_64(); | 
|  | 1203 | if (j64 >= interval) | 
|  | 1204 | arg.since = j64 - interval; | 
|  | 1205 | else | 
|  | 1206 | arg.since = 0; | 
|  | 1207 |  | 
|  | 1208 | ata_ering_map(&dev->ering, speed_down_needed_cb, &arg); | 
|  | 1209 |  | 
|  | 1210 | return arg.nr_errors[err_cat] > err_limits[err_cat]; | 
|  | 1211 | } | 
|  | 1212 |  | 
|  | 1213 | /** | 
|  | 1214 | *	ata_eh_speed_down - record error and speed down if necessary | 
|  | 1215 | *	@dev: Failed device | 
|  | 1216 | *	@is_io: Did the device fail during normal IO? | 
|  | 1217 | *	@err_mask: err_mask of the error | 
|  | 1218 | * | 
|  | 1219 | *	Record error and examine error history to determine whether | 
|  | 1220 | *	adjusting transmission speed is necessary.  It also sets | 
|  | 1221 | *	transmission limits appropriately if such adjustment is | 
|  | 1222 | *	necessary. | 
|  | 1223 | * | 
|  | 1224 | *	LOCKING: | 
|  | 1225 | *	Kernel thread context (may sleep). | 
|  | 1226 | * | 
|  | 1227 | *	RETURNS: | 
|  | 1228 | *	0 on success, -errno otherwise | 
|  | 1229 | */ | 
|  | 1230 | static int ata_eh_speed_down(struct ata_device *dev, int is_io, | 
|  | 1231 | unsigned int err_mask) | 
|  | 1232 | { | 
|  | 1233 | if (!err_mask) | 
|  | 1234 | return 0; | 
|  | 1235 |  | 
|  | 1236 | /* record error and determine whether speed down is necessary */ | 
|  | 1237 | ata_ering_record(&dev->ering, is_io, err_mask); | 
|  | 1238 |  | 
|  | 1239 | if (!ata_eh_speed_down_needed(dev)) | 
|  | 1240 | return 0; | 
|  | 1241 |  | 
|  | 1242 | /* speed down SATA link speed if possible */ | 
|  | 1243 | if (sata_down_spd_limit(dev->ap) == 0) | 
|  | 1244 | return ATA_EH_HARDRESET; | 
|  | 1245 |  | 
|  | 1246 | /* lower transfer mode */ | 
|  | 1247 | if (ata_down_xfermask_limit(dev, 0) == 0) | 
|  | 1248 | return ATA_EH_SOFTRESET; | 
|  | 1249 |  | 
|  | 1250 | ata_dev_printk(dev, KERN_ERR, | 
|  | 1251 | "speed down requested but no transfer mode left\n"); | 
|  | 1252 | return 0; | 
|  | 1253 | } | 
|  | 1254 |  | 
|  | 1255 | /** | 
|  | 1256 | *	ata_eh_autopsy - analyze error and determine recovery action | 
|  | 1257 | *	@ap: ATA port to perform autopsy on | 
|  | 1258 | * | 
|  | 1259 | *	Analyze why @ap failed and determine which recovery action is | 
|  | 1260 | *	needed.  This function also sets more detailed AC_ERR_* values | 
|  | 1261 | *	and fills sense data for ATAPI CHECK SENSE. | 
|  | 1262 | * | 
|  | 1263 | *	LOCKING: | 
|  | 1264 | *	Kernel thread context (may sleep). | 
|  | 1265 | */ | 
|  | 1266 | static void ata_eh_autopsy(struct ata_port *ap) | 
|  | 1267 | { | 
|  | 1268 | struct ata_eh_context *ehc = &ap->eh_context; | 
|  | 1269 | unsigned int action = ehc->i.action; | 
|  | 1270 | struct ata_device *failed_dev = NULL; | 
|  | 1271 | unsigned int all_err_mask = 0; | 
|  | 1272 | int tag, is_io = 0; | 
|  | 1273 | u32 serror; | 
|  | 1274 | int rc; | 
|  | 1275 |  | 
|  | 1276 | DPRINTK("ENTER\n"); | 
|  | 1277 |  | 
|  | 1278 | /* obtain and analyze SError */ | 
|  | 1279 | rc = sata_scr_read(ap, SCR_ERROR, &serror); | 
|  | 1280 | if (rc == 0) { | 
|  | 1281 | ehc->i.serror |= serror; | 
|  | 1282 | ata_eh_analyze_serror(ap); | 
|  | 1283 | } else if (rc != -EOPNOTSUPP) | 
|  | 1284 | action |= ATA_EH_HARDRESET; | 
|  | 1285 |  | 
| Tejun Heo | e8ee845 | 2006-05-15 21:03:46 +0900 | [diff] [blame] | 1286 | /* analyze NCQ failure */ | 
|  | 1287 | ata_eh_analyze_ncq_error(ap); | 
|  | 1288 |  | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1289 | /* any real error trumps AC_ERR_OTHER */ | 
|  | 1290 | if (ehc->i.err_mask & ~AC_ERR_OTHER) | 
|  | 1291 | ehc->i.err_mask &= ~AC_ERR_OTHER; | 
|  | 1292 |  | 
|  | 1293 | all_err_mask |= ehc->i.err_mask; | 
|  | 1294 |  | 
|  | 1295 | for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { | 
|  | 1296 | struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); | 
|  | 1297 |  | 
|  | 1298 | if (!(qc->flags & ATA_QCFLAG_FAILED)) | 
|  | 1299 | continue; | 
|  | 1300 |  | 
|  | 1301 | /* inherit upper level err_mask */ | 
|  | 1302 | qc->err_mask |= ehc->i.err_mask; | 
|  | 1303 |  | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1304 | /* analyze TF */ | 
|  | 1305 | action |= ata_eh_analyze_tf(qc, &qc->result_tf); | 
|  | 1306 |  | 
|  | 1307 | /* DEV errors are probably spurious in case of ATA_BUS error */ | 
|  | 1308 | if (qc->err_mask & AC_ERR_ATA_BUS) | 
|  | 1309 | qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_MEDIA | | 
|  | 1310 | AC_ERR_INVALID); | 
|  | 1311 |  | 
|  | 1312 | /* any real error trumps unknown error */ | 
|  | 1313 | if (qc->err_mask & ~AC_ERR_OTHER) | 
|  | 1314 | qc->err_mask &= ~AC_ERR_OTHER; | 
|  | 1315 |  | 
|  | 1316 | /* SENSE_VALID trumps dev/unknown error and revalidation */ | 
|  | 1317 | if (qc->flags & ATA_QCFLAG_SENSE_VALID) { | 
|  | 1318 | qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_OTHER); | 
|  | 1319 | action &= ~ATA_EH_REVALIDATE; | 
|  | 1320 | } | 
|  | 1321 |  | 
|  | 1322 | /* accumulate error info */ | 
|  | 1323 | failed_dev = qc->dev; | 
|  | 1324 | all_err_mask |= qc->err_mask; | 
|  | 1325 | if (qc->flags & ATA_QCFLAG_IO) | 
|  | 1326 | is_io = 1; | 
|  | 1327 | } | 
|  | 1328 |  | 
| Tejun Heo | a20f33f | 2006-05-16 12:58:24 +0900 | [diff] [blame] | 1329 | /* enforce default EH actions */ | 
|  | 1330 | if (ap->flags & ATA_FLAG_FROZEN || | 
|  | 1331 | all_err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT)) | 
|  | 1332 | action |= ATA_EH_SOFTRESET; | 
|  | 1333 | else if (all_err_mask) | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1334 | action |= ATA_EH_REVALIDATE; | 
|  | 1335 |  | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 1336 | /* if we have offending qcs and the associated failed device */ | 
|  | 1337 | if (failed_dev) { | 
|  | 1338 | /* speed down */ | 
|  | 1339 | action |= ata_eh_speed_down(failed_dev, is_io, all_err_mask); | 
|  | 1340 |  | 
|  | 1341 | /* perform per-dev EH action only on the offending device */ | 
|  | 1342 | ehc->i.dev_action[failed_dev->devno] |= | 
|  | 1343 | action & ATA_EH_PERDEV_MASK; | 
|  | 1344 | action &= ~ATA_EH_PERDEV_MASK; | 
|  | 1345 | } | 
|  | 1346 |  | 
| Tejun Heo | a20f33f | 2006-05-16 12:58:24 +0900 | [diff] [blame] | 1347 | /* record autopsy result */ | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1348 | ehc->i.dev = failed_dev; | 
|  | 1349 | ehc->i.action = action; | 
|  | 1350 |  | 
|  | 1351 | DPRINTK("EXIT\n"); | 
|  | 1352 | } | 
|  | 1353 |  | 
|  | 1354 | /** | 
|  | 1355 | *	ata_eh_report - report error handling to user | 
|  | 1356 | *	@ap: ATA port EH is going on | 
|  | 1357 | * | 
|  | 1358 | *	Report EH to user. | 
|  | 1359 | * | 
|  | 1360 | *	LOCKING: | 
|  | 1361 | *	None. | 
|  | 1362 | */ | 
|  | 1363 | static void ata_eh_report(struct ata_port *ap) | 
|  | 1364 | { | 
|  | 1365 | struct ata_eh_context *ehc = &ap->eh_context; | 
|  | 1366 | const char *frozen, *desc; | 
|  | 1367 | int tag, nr_failed = 0; | 
|  | 1368 |  | 
|  | 1369 | desc = NULL; | 
|  | 1370 | if (ehc->i.desc[0] != '\0') | 
|  | 1371 | desc = ehc->i.desc; | 
|  | 1372 |  | 
|  | 1373 | for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { | 
|  | 1374 | struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); | 
|  | 1375 |  | 
|  | 1376 | if (!(qc->flags & ATA_QCFLAG_FAILED)) | 
|  | 1377 | continue; | 
|  | 1378 | if (qc->flags & ATA_QCFLAG_SENSE_VALID && !qc->err_mask) | 
|  | 1379 | continue; | 
|  | 1380 |  | 
|  | 1381 | nr_failed++; | 
|  | 1382 | } | 
|  | 1383 |  | 
|  | 1384 | if (!nr_failed && !ehc->i.err_mask) | 
|  | 1385 | return; | 
|  | 1386 |  | 
|  | 1387 | frozen = ""; | 
|  | 1388 | if (ap->flags & ATA_FLAG_FROZEN) | 
|  | 1389 | frozen = " frozen"; | 
|  | 1390 |  | 
|  | 1391 | if (ehc->i.dev) { | 
| Tejun Heo | e8ee845 | 2006-05-15 21:03:46 +0900 | [diff] [blame] | 1392 | ata_dev_printk(ehc->i.dev, KERN_ERR, "exception Emask 0x%x " | 
|  | 1393 | "SAct 0x%x SErr 0x%x action 0x%x%s\n", | 
|  | 1394 | ehc->i.err_mask, ap->sactive, ehc->i.serror, | 
|  | 1395 | ehc->i.action, frozen); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1396 | if (desc) | 
|  | 1397 | ata_dev_printk(ehc->i.dev, KERN_ERR, "(%s)\n", desc); | 
|  | 1398 | } else { | 
| Tejun Heo | e8ee845 | 2006-05-15 21:03:46 +0900 | [diff] [blame] | 1399 | ata_port_printk(ap, KERN_ERR, "exception Emask 0x%x " | 
|  | 1400 | "SAct 0x%x SErr 0x%x action 0x%x%s\n", | 
|  | 1401 | ehc->i.err_mask, ap->sactive, ehc->i.serror, | 
|  | 1402 | ehc->i.action, frozen); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1403 | if (desc) | 
|  | 1404 | ata_port_printk(ap, KERN_ERR, "(%s)\n", desc); | 
|  | 1405 | } | 
|  | 1406 |  | 
|  | 1407 | for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { | 
|  | 1408 | struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); | 
|  | 1409 |  | 
|  | 1410 | if (!(qc->flags & ATA_QCFLAG_FAILED) || !qc->err_mask) | 
|  | 1411 | continue; | 
|  | 1412 |  | 
|  | 1413 | ata_dev_printk(qc->dev, KERN_ERR, "tag %d cmd 0x%x " | 
|  | 1414 | "Emask 0x%x stat 0x%x err 0x%x (%s)\n", | 
|  | 1415 | qc->tag, qc->tf.command, qc->err_mask, | 
|  | 1416 | qc->result_tf.command, qc->result_tf.feature, | 
|  | 1417 | ata_err_string(qc->err_mask)); | 
|  | 1418 | } | 
|  | 1419 | } | 
|  | 1420 |  | 
| Tejun Heo | d87fa38 | 2006-05-31 18:28:24 +0900 | [diff] [blame] | 1421 | static int ata_do_reset(struct ata_port *ap, ata_reset_fn_t reset, | 
|  | 1422 | unsigned int *classes) | 
|  | 1423 | { | 
|  | 1424 | int i, rc; | 
|  | 1425 |  | 
|  | 1426 | for (i = 0; i < ATA_MAX_DEVICES; i++) | 
|  | 1427 | classes[i] = ATA_DEV_UNKNOWN; | 
|  | 1428 |  | 
|  | 1429 | rc = reset(ap, classes); | 
|  | 1430 | if (rc) | 
|  | 1431 | return rc; | 
|  | 1432 |  | 
|  | 1433 | /* If any class isn't ATA_DEV_UNKNOWN, consider classification | 
|  | 1434 | * is complete and convert all ATA_DEV_UNKNOWN to | 
|  | 1435 | * ATA_DEV_NONE. | 
|  | 1436 | */ | 
|  | 1437 | for (i = 0; i < ATA_MAX_DEVICES; i++) | 
|  | 1438 | if (classes[i] != ATA_DEV_UNKNOWN) | 
|  | 1439 | break; | 
|  | 1440 |  | 
|  | 1441 | if (i < ATA_MAX_DEVICES) | 
|  | 1442 | for (i = 0; i < ATA_MAX_DEVICES; i++) | 
|  | 1443 | if (classes[i] == ATA_DEV_UNKNOWN) | 
|  | 1444 | classes[i] = ATA_DEV_NONE; | 
|  | 1445 |  | 
|  | 1446 | return 0; | 
|  | 1447 | } | 
|  | 1448 |  | 
| Tejun Heo | 664faf0 | 2006-05-31 18:27:50 +0900 | [diff] [blame] | 1449 | static int ata_eh_followup_srst_needed(int rc, int classify, | 
|  | 1450 | const unsigned int *classes) | 
|  | 1451 | { | 
|  | 1452 | if (rc == -EAGAIN) | 
|  | 1453 | return 1; | 
|  | 1454 | if (rc != 0) | 
|  | 1455 | return 0; | 
|  | 1456 | if (classify && classes[0] == ATA_DEV_UNKNOWN) | 
|  | 1457 | return 1; | 
|  | 1458 | return 0; | 
|  | 1459 | } | 
|  | 1460 |  | 
|  | 1461 | static int ata_eh_reset(struct ata_port *ap, int classify, | 
| Tejun Heo | f5914a4 | 2006-05-31 18:27:48 +0900 | [diff] [blame] | 1462 | ata_prereset_fn_t prereset, ata_reset_fn_t softreset, | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1463 | ata_reset_fn_t hardreset, ata_postreset_fn_t postreset) | 
|  | 1464 | { | 
|  | 1465 | struct ata_eh_context *ehc = &ap->eh_context; | 
| Tejun Heo | 664faf0 | 2006-05-31 18:27:50 +0900 | [diff] [blame] | 1466 | unsigned int *classes = ehc->classes; | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1467 | int tries = ATA_EH_RESET_TRIES; | 
| Tejun Heo | 3e70639 | 2006-05-31 18:28:11 +0900 | [diff] [blame] | 1468 | int verbose = !(ap->flags & ATA_FLAG_LOADING); | 
| Tejun Heo | f5914a4 | 2006-05-31 18:27:48 +0900 | [diff] [blame] | 1469 | unsigned int action; | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1470 | ata_reset_fn_t reset; | 
| Tejun Heo | 664faf0 | 2006-05-31 18:27:50 +0900 | [diff] [blame] | 1471 | int i, did_followup_srst, rc; | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1472 |  | 
| Tejun Heo | f5914a4 | 2006-05-31 18:27:48 +0900 | [diff] [blame] | 1473 | /* Determine which reset to use and record in ehc->i.action. | 
|  | 1474 | * prereset() may examine and modify it. | 
|  | 1475 | */ | 
|  | 1476 | action = ehc->i.action; | 
|  | 1477 | ehc->i.action &= ~ATA_EH_RESET_MASK; | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1478 | if (softreset && (!hardreset || (!sata_set_spd_needed(ap) && | 
| Tejun Heo | f5914a4 | 2006-05-31 18:27:48 +0900 | [diff] [blame] | 1479 | !(action & ATA_EH_HARDRESET)))) | 
|  | 1480 | ehc->i.action |= ATA_EH_SOFTRESET; | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1481 | else | 
| Tejun Heo | f5914a4 | 2006-05-31 18:27:48 +0900 | [diff] [blame] | 1482 | ehc->i.action |= ATA_EH_HARDRESET; | 
|  | 1483 |  | 
|  | 1484 | if (prereset) { | 
|  | 1485 | rc = prereset(ap); | 
|  | 1486 | if (rc) { | 
|  | 1487 | ata_port_printk(ap, KERN_ERR, | 
|  | 1488 | "prereset failed (errno=%d)\n", rc); | 
|  | 1489 | return rc; | 
|  | 1490 | } | 
|  | 1491 | } | 
|  | 1492 |  | 
|  | 1493 | /* prereset() might have modified ehc->i.action */ | 
|  | 1494 | if (ehc->i.action & ATA_EH_HARDRESET) | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1495 | reset = hardreset; | 
| Tejun Heo | f5914a4 | 2006-05-31 18:27:48 +0900 | [diff] [blame] | 1496 | else if (ehc->i.action & ATA_EH_SOFTRESET) | 
|  | 1497 | reset = softreset; | 
|  | 1498 | else { | 
|  | 1499 | /* prereset told us not to reset, bang classes and return */ | 
|  | 1500 | for (i = 0; i < ATA_MAX_DEVICES; i++) | 
|  | 1501 | classes[i] = ATA_DEV_NONE; | 
|  | 1502 | return 0; | 
|  | 1503 | } | 
|  | 1504 |  | 
|  | 1505 | /* did prereset() screw up?  if so, fix up to avoid oopsing */ | 
|  | 1506 | if (!reset) { | 
|  | 1507 | ata_port_printk(ap, KERN_ERR, "BUG: prereset() requested " | 
|  | 1508 | "invalid reset type\n"); | 
|  | 1509 | if (softreset) | 
|  | 1510 | reset = softreset; | 
|  | 1511 | else | 
|  | 1512 | reset = hardreset; | 
|  | 1513 | } | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1514 |  | 
|  | 1515 | retry: | 
| Tejun Heo | 3e70639 | 2006-05-31 18:28:11 +0900 | [diff] [blame] | 1516 | /* shut up during boot probing */ | 
|  | 1517 | if (verbose) | 
|  | 1518 | ata_port_printk(ap, KERN_INFO, "%s resetting port\n", | 
|  | 1519 | reset == softreset ? "soft" : "hard"); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1520 |  | 
|  | 1521 | /* reset */ | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 1522 | ata_eh_about_to_do(ap, NULL, ATA_EH_RESET_MASK); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1523 | ehc->i.flags |= ATA_EHI_DID_RESET; | 
|  | 1524 |  | 
|  | 1525 | rc = ata_do_reset(ap, reset, classes); | 
|  | 1526 |  | 
| Tejun Heo | 664faf0 | 2006-05-31 18:27:50 +0900 | [diff] [blame] | 1527 | did_followup_srst = 0; | 
|  | 1528 | if (reset == hardreset && | 
|  | 1529 | ata_eh_followup_srst_needed(rc, classify, classes)) { | 
|  | 1530 | /* okay, let's do follow-up softreset */ | 
|  | 1531 | did_followup_srst = 1; | 
|  | 1532 | reset = softreset; | 
|  | 1533 |  | 
|  | 1534 | if (!reset) { | 
|  | 1535 | ata_port_printk(ap, KERN_ERR, | 
|  | 1536 | "follow-up softreset required " | 
|  | 1537 | "but no softreset avaliable\n"); | 
|  | 1538 | return -EINVAL; | 
|  | 1539 | } | 
|  | 1540 |  | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 1541 | ata_eh_about_to_do(ap, NULL, ATA_EH_RESET_MASK); | 
| Tejun Heo | 664faf0 | 2006-05-31 18:27:50 +0900 | [diff] [blame] | 1542 | rc = ata_do_reset(ap, reset, classes); | 
|  | 1543 |  | 
|  | 1544 | if (rc == 0 && classify && | 
|  | 1545 | classes[0] == ATA_DEV_UNKNOWN) { | 
|  | 1546 | ata_port_printk(ap, KERN_ERR, | 
|  | 1547 | "classification failed\n"); | 
|  | 1548 | return -EINVAL; | 
|  | 1549 | } | 
|  | 1550 | } | 
|  | 1551 |  | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1552 | if (rc && --tries) { | 
| Tejun Heo | 664faf0 | 2006-05-31 18:27:50 +0900 | [diff] [blame] | 1553 | const char *type; | 
|  | 1554 |  | 
|  | 1555 | if (reset == softreset) { | 
|  | 1556 | if (did_followup_srst) | 
|  | 1557 | type = "follow-up soft"; | 
|  | 1558 | else | 
|  | 1559 | type = "soft"; | 
|  | 1560 | } else | 
|  | 1561 | type = "hard"; | 
|  | 1562 |  | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1563 | ata_port_printk(ap, KERN_WARNING, | 
| Tejun Heo | 664faf0 | 2006-05-31 18:27:50 +0900 | [diff] [blame] | 1564 | "%sreset failed, retrying in 5 secs\n", type); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1565 | ssleep(5); | 
|  | 1566 |  | 
|  | 1567 | if (reset == hardreset) | 
|  | 1568 | sata_down_spd_limit(ap); | 
|  | 1569 | if (hardreset) | 
|  | 1570 | reset = hardreset; | 
|  | 1571 | goto retry; | 
|  | 1572 | } | 
|  | 1573 |  | 
|  | 1574 | if (rc == 0) { | 
| Tejun Heo | 20952b6 | 2006-05-31 18:27:23 +0900 | [diff] [blame] | 1575 | /* After the reset, the device state is PIO 0 and the | 
|  | 1576 | * controller state is undefined.  Record the mode. | 
|  | 1577 | */ | 
|  | 1578 | for (i = 0; i < ATA_MAX_DEVICES; i++) | 
|  | 1579 | ap->device[i].pio_mode = XFER_PIO_0; | 
|  | 1580 |  | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1581 | if (postreset) | 
|  | 1582 | postreset(ap, classes); | 
|  | 1583 |  | 
|  | 1584 | /* reset successful, schedule revalidation */ | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 1585 | ata_eh_done(ap, NULL, ATA_EH_RESET_MASK); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1586 | ehc->i.action |= ATA_EH_REVALIDATE; | 
|  | 1587 | } | 
|  | 1588 |  | 
|  | 1589 | return rc; | 
|  | 1590 | } | 
|  | 1591 |  | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1592 | static int ata_eh_revalidate_and_attach(struct ata_port *ap, | 
|  | 1593 | struct ata_device **r_failed_dev) | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1594 | { | 
|  | 1595 | struct ata_eh_context *ehc = &ap->eh_context; | 
|  | 1596 | struct ata_device *dev; | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1597 | unsigned long flags; | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1598 | int i, rc = 0; | 
|  | 1599 |  | 
|  | 1600 | DPRINTK("ENTER\n"); | 
|  | 1601 |  | 
|  | 1602 | for (i = 0; i < ATA_MAX_DEVICES; i++) { | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 1603 | unsigned int action; | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1604 |  | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 1605 | dev = &ap->device[i]; | 
| Tejun Heo | 64f65ca | 2006-06-24 20:30:18 +0900 | [diff] [blame] | 1606 | action = ata_eh_dev_action(dev); | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 1607 |  | 
|  | 1608 | if (action & ATA_EH_REVALIDATE && ata_dev_enabled(dev)) { | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1609 | if (ata_port_offline(ap)) { | 
|  | 1610 | rc = -EIO; | 
|  | 1611 | break; | 
|  | 1612 | } | 
|  | 1613 |  | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 1614 | ata_eh_about_to_do(ap, dev, ATA_EH_REVALIDATE); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1615 | rc = ata_dev_revalidate(dev, | 
|  | 1616 | ehc->i.flags & ATA_EHI_DID_RESET); | 
|  | 1617 | if (rc) | 
|  | 1618 | break; | 
|  | 1619 |  | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 1620 | ata_eh_done(ap, dev, ATA_EH_REVALIDATE); | 
|  | 1621 |  | 
| zhao, forrest | 3057ac3 | 2006-06-12 12:01:34 +0800 | [diff] [blame] | 1622 | /* schedule the scsi_rescan_device() here */ | 
|  | 1623 | queue_work(ata_aux_wq, &(ap->scsi_rescan_task)); | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1624 | } else if (dev->class == ATA_DEV_UNKNOWN && | 
|  | 1625 | ehc->tries[dev->devno] && | 
|  | 1626 | ata_class_enabled(ehc->classes[dev->devno])) { | 
|  | 1627 | dev->class = ehc->classes[dev->devno]; | 
|  | 1628 |  | 
|  | 1629 | rc = ata_dev_read_id(dev, &dev->class, 1, dev->id); | 
|  | 1630 | if (rc == 0) | 
|  | 1631 | rc = ata_dev_configure(dev, 1); | 
|  | 1632 |  | 
|  | 1633 | if (rc) { | 
|  | 1634 | dev->class = ATA_DEV_UNKNOWN; | 
|  | 1635 | break; | 
|  | 1636 | } | 
|  | 1637 |  | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 1638 | spin_lock_irqsave(ap->lock, flags); | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1639 | ap->flags |= ATA_FLAG_SCSI_HOTPLUG; | 
| Jeff Garzik | ba6a130 | 2006-06-22 23:46:10 -0400 | [diff] [blame] | 1640 | spin_unlock_irqrestore(ap->lock, flags); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1641 | } | 
|  | 1642 | } | 
|  | 1643 |  | 
| Tejun Heo | 47005f2 | 2006-06-19 18:27:23 +0900 | [diff] [blame] | 1644 | if (rc) | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1645 | *r_failed_dev = dev; | 
|  | 1646 |  | 
|  | 1647 | DPRINTK("EXIT\n"); | 
|  | 1648 | return rc; | 
|  | 1649 | } | 
|  | 1650 |  | 
|  | 1651 | static int ata_port_nr_enabled(struct ata_port *ap) | 
|  | 1652 | { | 
|  | 1653 | int i, cnt = 0; | 
|  | 1654 |  | 
|  | 1655 | for (i = 0; i < ATA_MAX_DEVICES; i++) | 
|  | 1656 | if (ata_dev_enabled(&ap->device[i])) | 
|  | 1657 | cnt++; | 
|  | 1658 | return cnt; | 
|  | 1659 | } | 
|  | 1660 |  | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1661 | static int ata_port_nr_vacant(struct ata_port *ap) | 
|  | 1662 | { | 
|  | 1663 | int i, cnt = 0; | 
|  | 1664 |  | 
|  | 1665 | for (i = 0; i < ATA_MAX_DEVICES; i++) | 
|  | 1666 | if (ap->device[i].class == ATA_DEV_UNKNOWN) | 
|  | 1667 | cnt++; | 
|  | 1668 | return cnt; | 
|  | 1669 | } | 
|  | 1670 |  | 
|  | 1671 | static int ata_eh_skip_recovery(struct ata_port *ap) | 
|  | 1672 | { | 
|  | 1673 | struct ata_eh_context *ehc = &ap->eh_context; | 
|  | 1674 | int i; | 
|  | 1675 |  | 
|  | 1676 | if (ap->flags & ATA_FLAG_FROZEN || ata_port_nr_enabled(ap)) | 
|  | 1677 | return 0; | 
|  | 1678 |  | 
|  | 1679 | /* skip if class codes for all vacant slots are ATA_DEV_NONE */ | 
|  | 1680 | for (i = 0; i < ATA_MAX_DEVICES; i++) { | 
|  | 1681 | struct ata_device *dev = &ap->device[i]; | 
|  | 1682 |  | 
|  | 1683 | if (dev->class == ATA_DEV_UNKNOWN && | 
|  | 1684 | ehc->classes[dev->devno] != ATA_DEV_NONE) | 
|  | 1685 | return 0; | 
|  | 1686 | } | 
|  | 1687 |  | 
|  | 1688 | return 1; | 
|  | 1689 | } | 
|  | 1690 |  | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1691 | /** | 
|  | 1692 | *	ata_eh_recover - recover host port after error | 
|  | 1693 | *	@ap: host port to recover | 
| Tejun Heo | f5914a4 | 2006-05-31 18:27:48 +0900 | [diff] [blame] | 1694 | *	@prereset: prereset method (can be NULL) | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1695 | *	@softreset: softreset method (can be NULL) | 
|  | 1696 | *	@hardreset: hardreset method (can be NULL) | 
|  | 1697 | *	@postreset: postreset method (can be NULL) | 
|  | 1698 | * | 
|  | 1699 | *	This is the alpha and omega, eum and yang, heart and soul of | 
|  | 1700 | *	libata exception handling.  On entry, actions required to | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1701 | *	recover the port and hotplug requests are recorded in | 
|  | 1702 | *	eh_context.  This function executes all the operations with | 
|  | 1703 | *	appropriate retrials and fallbacks to resurrect failed | 
|  | 1704 | *	devices, detach goners and greet newcomers. | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1705 | * | 
|  | 1706 | *	LOCKING: | 
|  | 1707 | *	Kernel thread context (may sleep). | 
|  | 1708 | * | 
|  | 1709 | *	RETURNS: | 
|  | 1710 | *	0 on success, -errno on failure. | 
|  | 1711 | */ | 
| Tejun Heo | f5914a4 | 2006-05-31 18:27:48 +0900 | [diff] [blame] | 1712 | static int ata_eh_recover(struct ata_port *ap, ata_prereset_fn_t prereset, | 
|  | 1713 | ata_reset_fn_t softreset, ata_reset_fn_t hardreset, | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1714 | ata_postreset_fn_t postreset) | 
|  | 1715 | { | 
|  | 1716 | struct ata_eh_context *ehc = &ap->eh_context; | 
|  | 1717 | struct ata_device *dev; | 
|  | 1718 | int down_xfermask, i, rc; | 
|  | 1719 |  | 
|  | 1720 | DPRINTK("ENTER\n"); | 
|  | 1721 |  | 
|  | 1722 | /* prep for recovery */ | 
|  | 1723 | for (i = 0; i < ATA_MAX_DEVICES; i++) { | 
|  | 1724 | dev = &ap->device[i]; | 
|  | 1725 |  | 
|  | 1726 | ehc->tries[dev->devno] = ATA_EH_DEV_TRIES; | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1727 |  | 
|  | 1728 | /* process hotplug request */ | 
|  | 1729 | if (dev->flags & ATA_DFLAG_DETACH) | 
|  | 1730 | ata_eh_detach_dev(dev); | 
|  | 1731 |  | 
|  | 1732 | if (!ata_dev_enabled(dev) && | 
|  | 1733 | ((ehc->i.probe_mask & (1 << dev->devno)) && | 
|  | 1734 | !(ehc->did_probe_mask & (1 << dev->devno)))) { | 
|  | 1735 | ata_eh_detach_dev(dev); | 
|  | 1736 | ata_dev_init(dev); | 
|  | 1737 | ehc->did_probe_mask |= (1 << dev->devno); | 
|  | 1738 | ehc->i.action |= ATA_EH_SOFTRESET; | 
|  | 1739 | } | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1740 | } | 
|  | 1741 |  | 
|  | 1742 | retry: | 
|  | 1743 | down_xfermask = 0; | 
|  | 1744 | rc = 0; | 
|  | 1745 |  | 
| Tejun Heo | aeb2ecd | 2006-06-12 14:11:43 +0900 | [diff] [blame] | 1746 | /* if UNLOADING, finish immediately */ | 
|  | 1747 | if (ap->flags & ATA_FLAG_UNLOADING) | 
|  | 1748 | goto out; | 
|  | 1749 |  | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1750 | /* skip EH if possible. */ | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1751 | if (ata_eh_skip_recovery(ap)) | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1752 | ehc->i.action = 0; | 
|  | 1753 |  | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1754 | for (i = 0; i < ATA_MAX_DEVICES; i++) | 
|  | 1755 | ehc->classes[i] = ATA_DEV_UNKNOWN; | 
|  | 1756 |  | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1757 | /* reset */ | 
|  | 1758 | if (ehc->i.action & ATA_EH_RESET_MASK) { | 
|  | 1759 | ata_eh_freeze_port(ap); | 
|  | 1760 |  | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1761 | rc = ata_eh_reset(ap, ata_port_nr_vacant(ap), prereset, | 
|  | 1762 | softreset, hardreset, postreset); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1763 | if (rc) { | 
|  | 1764 | ata_port_printk(ap, KERN_ERR, | 
|  | 1765 | "reset failed, giving up\n"); | 
|  | 1766 | goto out; | 
|  | 1767 | } | 
|  | 1768 |  | 
|  | 1769 | ata_eh_thaw_port(ap); | 
|  | 1770 | } | 
|  | 1771 |  | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1772 | /* revalidate existing devices and attach new ones */ | 
|  | 1773 | rc = ata_eh_revalidate_and_attach(ap, &dev); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1774 | if (rc) | 
|  | 1775 | goto dev_fail; | 
|  | 1776 |  | 
|  | 1777 | /* configure transfer mode if the port has been reset */ | 
|  | 1778 | if (ehc->i.flags & ATA_EHI_DID_RESET) { | 
|  | 1779 | rc = ata_set_mode(ap, &dev); | 
|  | 1780 | if (rc) { | 
|  | 1781 | down_xfermask = 1; | 
|  | 1782 | goto dev_fail; | 
|  | 1783 | } | 
|  | 1784 | } | 
|  | 1785 |  | 
|  | 1786 | goto out; | 
|  | 1787 |  | 
|  | 1788 | dev_fail: | 
|  | 1789 | switch (rc) { | 
|  | 1790 | case -ENODEV: | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1791 | /* device missing, schedule probing */ | 
|  | 1792 | ehc->i.probe_mask |= (1 << dev->devno); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1793 | case -EINVAL: | 
|  | 1794 | ehc->tries[dev->devno] = 0; | 
|  | 1795 | break; | 
|  | 1796 | case -EIO: | 
|  | 1797 | sata_down_spd_limit(ap); | 
|  | 1798 | default: | 
|  | 1799 | ehc->tries[dev->devno]--; | 
|  | 1800 | if (down_xfermask && | 
|  | 1801 | ata_down_xfermask_limit(dev, ehc->tries[dev->devno] == 1)) | 
|  | 1802 | ehc->tries[dev->devno] = 0; | 
|  | 1803 | } | 
|  | 1804 |  | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1805 | if (ata_dev_enabled(dev) && !ehc->tries[dev->devno]) { | 
|  | 1806 | /* disable device if it has used up all its chances */ | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1807 | ata_dev_disable(dev); | 
|  | 1808 |  | 
| Tejun Heo | 084fe63 | 2006-05-31 18:28:03 +0900 | [diff] [blame] | 1809 | /* detach if offline */ | 
|  | 1810 | if (ata_port_offline(ap)) | 
|  | 1811 | ata_eh_detach_dev(dev); | 
|  | 1812 |  | 
|  | 1813 | /* probe if requested */ | 
|  | 1814 | if ((ehc->i.probe_mask & (1 << dev->devno)) && | 
|  | 1815 | !(ehc->did_probe_mask & (1 << dev->devno))) { | 
|  | 1816 | ata_eh_detach_dev(dev); | 
|  | 1817 | ata_dev_init(dev); | 
|  | 1818 |  | 
|  | 1819 | ehc->tries[dev->devno] = ATA_EH_DEV_TRIES; | 
|  | 1820 | ehc->did_probe_mask |= (1 << dev->devno); | 
|  | 1821 | ehc->i.action |= ATA_EH_SOFTRESET; | 
|  | 1822 | } | 
|  | 1823 | } else { | 
|  | 1824 | /* soft didn't work?  be haaaaard */ | 
|  | 1825 | if (ehc->i.flags & ATA_EHI_DID_RESET) | 
|  | 1826 | ehc->i.action |= ATA_EH_HARDRESET; | 
|  | 1827 | else | 
|  | 1828 | ehc->i.action |= ATA_EH_SOFTRESET; | 
|  | 1829 | } | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1830 |  | 
|  | 1831 | if (ata_port_nr_enabled(ap)) { | 
|  | 1832 | ata_port_printk(ap, KERN_WARNING, "failed to recover some " | 
|  | 1833 | "devices, retrying in 5 secs\n"); | 
|  | 1834 | ssleep(5); | 
|  | 1835 | } else { | 
|  | 1836 | /* no device left, repeat fast */ | 
|  | 1837 | msleep(500); | 
|  | 1838 | } | 
|  | 1839 |  | 
|  | 1840 | goto retry; | 
|  | 1841 |  | 
|  | 1842 | out: | 
|  | 1843 | if (rc) { | 
|  | 1844 | for (i = 0; i < ATA_MAX_DEVICES; i++) | 
|  | 1845 | ata_dev_disable(&ap->device[i]); | 
|  | 1846 | } | 
|  | 1847 |  | 
|  | 1848 | DPRINTK("EXIT, rc=%d\n", rc); | 
|  | 1849 | return rc; | 
|  | 1850 | } | 
|  | 1851 |  | 
|  | 1852 | /** | 
|  | 1853 | *	ata_eh_finish - finish up EH | 
|  | 1854 | *	@ap: host port to finish EH for | 
|  | 1855 | * | 
|  | 1856 | *	Recovery is complete.  Clean up EH states and retry or finish | 
|  | 1857 | *	failed qcs. | 
|  | 1858 | * | 
|  | 1859 | *	LOCKING: | 
|  | 1860 | *	None. | 
|  | 1861 | */ | 
|  | 1862 | static void ata_eh_finish(struct ata_port *ap) | 
|  | 1863 | { | 
|  | 1864 | int tag; | 
|  | 1865 |  | 
|  | 1866 | /* retry or finish qcs */ | 
|  | 1867 | for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { | 
|  | 1868 | struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); | 
|  | 1869 |  | 
|  | 1870 | if (!(qc->flags & ATA_QCFLAG_FAILED)) | 
|  | 1871 | continue; | 
|  | 1872 |  | 
|  | 1873 | if (qc->err_mask) { | 
|  | 1874 | /* FIXME: Once EH migration is complete, | 
|  | 1875 | * generate sense data in this function, | 
|  | 1876 | * considering both err_mask and tf. | 
|  | 1877 | */ | 
|  | 1878 | if (qc->err_mask & AC_ERR_INVALID) | 
|  | 1879 | ata_eh_qc_complete(qc); | 
|  | 1880 | else | 
|  | 1881 | ata_eh_qc_retry(qc); | 
|  | 1882 | } else { | 
|  | 1883 | if (qc->flags & ATA_QCFLAG_SENSE_VALID) { | 
|  | 1884 | ata_eh_qc_complete(qc); | 
|  | 1885 | } else { | 
|  | 1886 | /* feed zero TF to sense generation */ | 
|  | 1887 | memset(&qc->result_tf, 0, sizeof(qc->result_tf)); | 
|  | 1888 | ata_eh_qc_retry(qc); | 
|  | 1889 | } | 
|  | 1890 | } | 
|  | 1891 | } | 
|  | 1892 | } | 
|  | 1893 |  | 
|  | 1894 | /** | 
|  | 1895 | *	ata_do_eh - do standard error handling | 
|  | 1896 | *	@ap: host port to handle error for | 
| Tejun Heo | f5914a4 | 2006-05-31 18:27:48 +0900 | [diff] [blame] | 1897 | *	@prereset: prereset method (can be NULL) | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1898 | *	@softreset: softreset method (can be NULL) | 
|  | 1899 | *	@hardreset: hardreset method (can be NULL) | 
|  | 1900 | *	@postreset: postreset method (can be NULL) | 
|  | 1901 | * | 
|  | 1902 | *	Perform standard error handling sequence. | 
|  | 1903 | * | 
|  | 1904 | *	LOCKING: | 
|  | 1905 | *	Kernel thread context (may sleep). | 
|  | 1906 | */ | 
| Tejun Heo | f5914a4 | 2006-05-31 18:27:48 +0900 | [diff] [blame] | 1907 | void ata_do_eh(struct ata_port *ap, ata_prereset_fn_t prereset, | 
|  | 1908 | ata_reset_fn_t softreset, ata_reset_fn_t hardreset, | 
|  | 1909 | ata_postreset_fn_t postreset) | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1910 | { | 
| Tejun Heo | 3e70639 | 2006-05-31 18:28:11 +0900 | [diff] [blame] | 1911 | if (!(ap->flags & ATA_FLAG_LOADING)) { | 
|  | 1912 | ata_eh_autopsy(ap); | 
|  | 1913 | ata_eh_report(ap); | 
|  | 1914 | } | 
|  | 1915 |  | 
| Tejun Heo | f5914a4 | 2006-05-31 18:27:48 +0900 | [diff] [blame] | 1916 | ata_eh_recover(ap, prereset, softreset, hardreset, postreset); | 
| Tejun Heo | 022bdb0 | 2006-05-15 20:58:22 +0900 | [diff] [blame] | 1917 | ata_eh_finish(ap); | 
|  | 1918 | } |