1c6fd2807SJeff Garzik /* 2c6fd2807SJeff Garzik * libata-eh.c - libata error handling 3c6fd2807SJeff Garzik * 4c6fd2807SJeff Garzik * Maintained by: Jeff Garzik <jgarzik@pobox.com> 5c6fd2807SJeff Garzik * Please ALWAYS copy linux-ide@vger.kernel.org 6c6fd2807SJeff Garzik * on emails. 7c6fd2807SJeff Garzik * 8c6fd2807SJeff Garzik * Copyright 2006 Tejun Heo <htejun@gmail.com> 9c6fd2807SJeff Garzik * 10c6fd2807SJeff Garzik * 11c6fd2807SJeff Garzik * This program is free software; you can redistribute it and/or 12c6fd2807SJeff Garzik * modify it under the terms of the GNU General Public License as 13c6fd2807SJeff Garzik * published by the Free Software Foundation; either version 2, or 14c6fd2807SJeff Garzik * (at your option) any later version. 15c6fd2807SJeff Garzik * 16c6fd2807SJeff Garzik * This program is distributed in the hope that it will be useful, 17c6fd2807SJeff Garzik * but WITHOUT ANY WARRANTY; without even the implied warranty of 18c6fd2807SJeff Garzik * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 19c6fd2807SJeff Garzik * General Public License for more details. 20c6fd2807SJeff Garzik * 21c6fd2807SJeff Garzik * You should have received a copy of the GNU General Public License 22c6fd2807SJeff Garzik * along with this program; see the file COPYING. If not, write to 23c6fd2807SJeff Garzik * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, 24c6fd2807SJeff Garzik * USA. 
25c6fd2807SJeff Garzik * 26c6fd2807SJeff Garzik * 27c6fd2807SJeff Garzik * libata documentation is available via 'make {ps|pdf}docs', 28c6fd2807SJeff Garzik * as Documentation/DocBook/libata.* 29c6fd2807SJeff Garzik * 30c6fd2807SJeff Garzik * Hardware documentation available from http://www.t13.org/ and 31c6fd2807SJeff Garzik * http://www.sata-io.org/ 32c6fd2807SJeff Garzik * 33c6fd2807SJeff Garzik */ 34c6fd2807SJeff Garzik 35c6fd2807SJeff Garzik #include <linux/kernel.h> 36c6fd2807SJeff Garzik #include <scsi/scsi.h> 37c6fd2807SJeff Garzik #include <scsi/scsi_host.h> 38c6fd2807SJeff Garzik #include <scsi/scsi_eh.h> 39c6fd2807SJeff Garzik #include <scsi/scsi_device.h> 40c6fd2807SJeff Garzik #include <scsi/scsi_cmnd.h> 41c6fd2807SJeff Garzik #include "../scsi/scsi_transport_api.h" 42c6fd2807SJeff Garzik 43c6fd2807SJeff Garzik #include <linux/libata.h> 44c6fd2807SJeff Garzik 45c6fd2807SJeff Garzik #include "libata.h" 46c6fd2807SJeff Garzik 477d47e8d4STejun Heo enum { 487d47e8d4STejun Heo ATA_EH_SPDN_NCQ_OFF = (1 << 0), 497d47e8d4STejun Heo ATA_EH_SPDN_SPEED_DOWN = (1 << 1), 507d47e8d4STejun Heo ATA_EH_SPDN_FALLBACK_TO_PIO = (1 << 2), 517d47e8d4STejun Heo }; 527d47e8d4STejun Heo 5331daabdaSTejun Heo /* Waiting in ->prereset can never be reliable. It's sometimes nice 5431daabdaSTejun Heo * to wait there but it can't be depended upon; otherwise, we wouldn't 5531daabdaSTejun Heo * be resetting. Just give it enough time for most drives to spin up. 5631daabdaSTejun Heo */ 5731daabdaSTejun Heo enum { 5831daabdaSTejun Heo ATA_EH_PRERESET_TIMEOUT = 10 * HZ, 59*5ddf24c5STejun Heo ATA_EH_FASTDRAIN_INTERVAL = 3 * HZ, 6031daabdaSTejun Heo }; 6131daabdaSTejun Heo 6231daabdaSTejun Heo /* The following table determines how we sequence resets. Each entry 6331daabdaSTejun Heo * represents timeout for that try. The first try can be soft or 6431daabdaSTejun Heo * hardreset. All others are hardreset if available. 
In most cases 6531daabdaSTejun Heo * the first reset w/ 10sec timeout should succeed. Following entries 6631daabdaSTejun Heo * are mostly for error handling, hotplug and retarded devices. 6731daabdaSTejun Heo */ 6831daabdaSTejun Heo static const unsigned long ata_eh_reset_timeouts[] = { 6931daabdaSTejun Heo 10 * HZ, /* most drives spin up by 10sec */ 7031daabdaSTejun Heo 10 * HZ, /* > 99% working drives spin up before 20sec */ 7131daabdaSTejun Heo 35 * HZ, /* give > 30 secs of idleness for retarded devices */ 7231daabdaSTejun Heo 5 * HZ, /* and sweet one last chance */ 7331daabdaSTejun Heo /* > 1 min has elapsed, give up */ 7431daabdaSTejun Heo }; 7531daabdaSTejun Heo 76c6fd2807SJeff Garzik static void __ata_port_freeze(struct ata_port *ap); 77c6fd2807SJeff Garzik static void ata_eh_finish(struct ata_port *ap); 786ffa01d8STejun Heo #ifdef CONFIG_PM 79c6fd2807SJeff Garzik static void ata_eh_handle_port_suspend(struct ata_port *ap); 80c6fd2807SJeff Garzik static void ata_eh_handle_port_resume(struct ata_port *ap); 816ffa01d8STejun Heo #else /* CONFIG_PM */ 826ffa01d8STejun Heo static void ata_eh_handle_port_suspend(struct ata_port *ap) 836ffa01d8STejun Heo { } 846ffa01d8STejun Heo 856ffa01d8STejun Heo static void ata_eh_handle_port_resume(struct ata_port *ap) 866ffa01d8STejun Heo { } 876ffa01d8STejun Heo #endif /* CONFIG_PM */ 88c6fd2807SJeff Garzik 89b64bbc39STejun Heo static void __ata_ehi_pushv_desc(struct ata_eh_info *ehi, const char *fmt, 90b64bbc39STejun Heo va_list args) 91b64bbc39STejun Heo { 92b64bbc39STejun Heo ehi->desc_len += vscnprintf(ehi->desc + ehi->desc_len, 93b64bbc39STejun Heo ATA_EH_DESC_LEN - ehi->desc_len, 94b64bbc39STejun Heo fmt, args); 95b64bbc39STejun Heo } 96b64bbc39STejun Heo 97b64bbc39STejun Heo /** 98b64bbc39STejun Heo * __ata_ehi_push_desc - push error description without adding separator 99b64bbc39STejun Heo * @ehi: target EHI 100b64bbc39STejun Heo * @fmt: printf format string 101b64bbc39STejun Heo * 102b64bbc39STejun Heo * Format 
string according to @fmt and append it to @ehi->desc. 103b64bbc39STejun Heo * 104b64bbc39STejun Heo * LOCKING: 105b64bbc39STejun Heo * spin_lock_irqsave(host lock) 106b64bbc39STejun Heo */ 107b64bbc39STejun Heo void __ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...) 108b64bbc39STejun Heo { 109b64bbc39STejun Heo va_list args; 110b64bbc39STejun Heo 111b64bbc39STejun Heo va_start(args, fmt); 112b64bbc39STejun Heo __ata_ehi_pushv_desc(ehi, fmt, args); 113b64bbc39STejun Heo va_end(args); 114b64bbc39STejun Heo } 115b64bbc39STejun Heo 116b64bbc39STejun Heo /** 117b64bbc39STejun Heo * ata_ehi_push_desc - push error description with separator 118b64bbc39STejun Heo * @ehi: target EHI 119b64bbc39STejun Heo * @fmt: printf format string 120b64bbc39STejun Heo * 121b64bbc39STejun Heo * Format string according to @fmt and append it to @ehi->desc. 122b64bbc39STejun Heo * If @ehi->desc is not empty, ", " is added in-between. 123b64bbc39STejun Heo * 124b64bbc39STejun Heo * LOCKING: 125b64bbc39STejun Heo * spin_lock_irqsave(host lock) 126b64bbc39STejun Heo */ 127b64bbc39STejun Heo void ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...) 128b64bbc39STejun Heo { 129b64bbc39STejun Heo va_list args; 130b64bbc39STejun Heo 131b64bbc39STejun Heo if (ehi->desc_len) 132b64bbc39STejun Heo __ata_ehi_push_desc(ehi, ", "); 133b64bbc39STejun Heo 134b64bbc39STejun Heo va_start(args, fmt); 135b64bbc39STejun Heo __ata_ehi_pushv_desc(ehi, fmt, args); 136b64bbc39STejun Heo va_end(args); 137b64bbc39STejun Heo } 138b64bbc39STejun Heo 139b64bbc39STejun Heo /** 140b64bbc39STejun Heo * ata_ehi_clear_desc - clean error description 141b64bbc39STejun Heo * @ehi: target EHI 142b64bbc39STejun Heo * 143b64bbc39STejun Heo * Clear @ehi->desc. 
144b64bbc39STejun Heo * 145b64bbc39STejun Heo * LOCKING: 146b64bbc39STejun Heo * spin_lock_irqsave(host lock) 147b64bbc39STejun Heo */ 148b64bbc39STejun Heo void ata_ehi_clear_desc(struct ata_eh_info *ehi) 149b64bbc39STejun Heo { 150b64bbc39STejun Heo ehi->desc[0] = '\0'; 151b64bbc39STejun Heo ehi->desc_len = 0; 152b64bbc39STejun Heo } 153b64bbc39STejun Heo 154c6fd2807SJeff Garzik static void ata_ering_record(struct ata_ering *ering, int is_io, 155c6fd2807SJeff Garzik unsigned int err_mask) 156c6fd2807SJeff Garzik { 157c6fd2807SJeff Garzik struct ata_ering_entry *ent; 158c6fd2807SJeff Garzik 159c6fd2807SJeff Garzik WARN_ON(!err_mask); 160c6fd2807SJeff Garzik 161c6fd2807SJeff Garzik ering->cursor++; 162c6fd2807SJeff Garzik ering->cursor %= ATA_ERING_SIZE; 163c6fd2807SJeff Garzik 164c6fd2807SJeff Garzik ent = &ering->ring[ering->cursor]; 165c6fd2807SJeff Garzik ent->is_io = is_io; 166c6fd2807SJeff Garzik ent->err_mask = err_mask; 167c6fd2807SJeff Garzik ent->timestamp = get_jiffies_64(); 168c6fd2807SJeff Garzik } 169c6fd2807SJeff Garzik 1707d47e8d4STejun Heo static void ata_ering_clear(struct ata_ering *ering) 171c6fd2807SJeff Garzik { 1727d47e8d4STejun Heo memset(ering, 0, sizeof(*ering)); 173c6fd2807SJeff Garzik } 174c6fd2807SJeff Garzik 175c6fd2807SJeff Garzik static int ata_ering_map(struct ata_ering *ering, 176c6fd2807SJeff Garzik int (*map_fn)(struct ata_ering_entry *, void *), 177c6fd2807SJeff Garzik void *arg) 178c6fd2807SJeff Garzik { 179c6fd2807SJeff Garzik int idx, rc = 0; 180c6fd2807SJeff Garzik struct ata_ering_entry *ent; 181c6fd2807SJeff Garzik 182c6fd2807SJeff Garzik idx = ering->cursor; 183c6fd2807SJeff Garzik do { 184c6fd2807SJeff Garzik ent = &ering->ring[idx]; 185c6fd2807SJeff Garzik if (!ent->err_mask) 186c6fd2807SJeff Garzik break; 187c6fd2807SJeff Garzik rc = map_fn(ent, arg); 188c6fd2807SJeff Garzik if (rc) 189c6fd2807SJeff Garzik break; 190c6fd2807SJeff Garzik idx = (idx - 1 + ATA_ERING_SIZE) % ATA_ERING_SIZE; 191c6fd2807SJeff Garzik } while 
(idx != ering->cursor); 192c6fd2807SJeff Garzik 193c6fd2807SJeff Garzik return rc; 194c6fd2807SJeff Garzik } 195c6fd2807SJeff Garzik 196c6fd2807SJeff Garzik static unsigned int ata_eh_dev_action(struct ata_device *dev) 197c6fd2807SJeff Garzik { 198c6fd2807SJeff Garzik struct ata_eh_context *ehc = &dev->ap->eh_context; 199c6fd2807SJeff Garzik 200c6fd2807SJeff Garzik return ehc->i.action | ehc->i.dev_action[dev->devno]; 201c6fd2807SJeff Garzik } 202c6fd2807SJeff Garzik 203c6fd2807SJeff Garzik static void ata_eh_clear_action(struct ata_device *dev, 204c6fd2807SJeff Garzik struct ata_eh_info *ehi, unsigned int action) 205c6fd2807SJeff Garzik { 206c6fd2807SJeff Garzik int i; 207c6fd2807SJeff Garzik 208c6fd2807SJeff Garzik if (!dev) { 209c6fd2807SJeff Garzik ehi->action &= ~action; 210c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_DEVICES; i++) 211c6fd2807SJeff Garzik ehi->dev_action[i] &= ~action; 212c6fd2807SJeff Garzik } else { 213c6fd2807SJeff Garzik /* doesn't make sense for port-wide EH actions */ 214c6fd2807SJeff Garzik WARN_ON(!(action & ATA_EH_PERDEV_MASK)); 215c6fd2807SJeff Garzik 216c6fd2807SJeff Garzik /* break ehi->action into ehi->dev_action */ 217c6fd2807SJeff Garzik if (ehi->action & action) { 218c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_DEVICES; i++) 219c6fd2807SJeff Garzik ehi->dev_action[i] |= ehi->action & action; 220c6fd2807SJeff Garzik ehi->action &= ~action; 221c6fd2807SJeff Garzik } 222c6fd2807SJeff Garzik 223c6fd2807SJeff Garzik /* turn off the specified per-dev action */ 224c6fd2807SJeff Garzik ehi->dev_action[dev->devno] &= ~action; 225c6fd2807SJeff Garzik } 226c6fd2807SJeff Garzik } 227c6fd2807SJeff Garzik 228c6fd2807SJeff Garzik /** 229c6fd2807SJeff Garzik * ata_scsi_timed_out - SCSI layer time out callback 230c6fd2807SJeff Garzik * @cmd: timed out SCSI command 231c6fd2807SJeff Garzik * 232c6fd2807SJeff Garzik * Handles SCSI layer timeout. We race with normal completion of 233c6fd2807SJeff Garzik * the qc for @cmd. 
If the qc is already gone, we lose and let 234c6fd2807SJeff Garzik * the scsi command finish (EH_HANDLED). Otherwise, the qc has 235c6fd2807SJeff Garzik * timed out and EH should be invoked. Prevent ata_qc_complete() 236c6fd2807SJeff Garzik * from finishing it by setting EH_SCHEDULED and return 237c6fd2807SJeff Garzik * EH_NOT_HANDLED. 238c6fd2807SJeff Garzik * 239c6fd2807SJeff Garzik * TODO: kill this function once old EH is gone. 240c6fd2807SJeff Garzik * 241c6fd2807SJeff Garzik * LOCKING: 242c6fd2807SJeff Garzik * Called from timer context 243c6fd2807SJeff Garzik * 244c6fd2807SJeff Garzik * RETURNS: 245c6fd2807SJeff Garzik * EH_HANDLED or EH_NOT_HANDLED 246c6fd2807SJeff Garzik */ 247c6fd2807SJeff Garzik enum scsi_eh_timer_return ata_scsi_timed_out(struct scsi_cmnd *cmd) 248c6fd2807SJeff Garzik { 249c6fd2807SJeff Garzik struct Scsi_Host *host = cmd->device->host; 250c6fd2807SJeff Garzik struct ata_port *ap = ata_shost_to_port(host); 251c6fd2807SJeff Garzik unsigned long flags; 252c6fd2807SJeff Garzik struct ata_queued_cmd *qc; 253c6fd2807SJeff Garzik enum scsi_eh_timer_return ret; 254c6fd2807SJeff Garzik 255c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 256c6fd2807SJeff Garzik 257c6fd2807SJeff Garzik if (ap->ops->error_handler) { 258c6fd2807SJeff Garzik ret = EH_NOT_HANDLED; 259c6fd2807SJeff Garzik goto out; 260c6fd2807SJeff Garzik } 261c6fd2807SJeff Garzik 262c6fd2807SJeff Garzik ret = EH_HANDLED; 263c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 264c6fd2807SJeff Garzik qc = ata_qc_from_tag(ap, ap->active_tag); 265c6fd2807SJeff Garzik if (qc) { 266c6fd2807SJeff Garzik WARN_ON(qc->scsicmd != cmd); 267c6fd2807SJeff Garzik qc->flags |= ATA_QCFLAG_EH_SCHEDULED; 268c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_TIMEOUT; 269c6fd2807SJeff Garzik ret = EH_NOT_HANDLED; 270c6fd2807SJeff Garzik } 271c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 272c6fd2807SJeff Garzik 273c6fd2807SJeff Garzik out: 274c6fd2807SJeff Garzik DPRINTK("EXIT, ret=%d\n", ret); 
275c6fd2807SJeff Garzik return ret; 276c6fd2807SJeff Garzik } 277c6fd2807SJeff Garzik 278c6fd2807SJeff Garzik /** 279c6fd2807SJeff Garzik * ata_scsi_error - SCSI layer error handler callback 280c6fd2807SJeff Garzik * @host: SCSI host on which error occurred 281c6fd2807SJeff Garzik * 282c6fd2807SJeff Garzik * Handles SCSI-layer-thrown error events. 283c6fd2807SJeff Garzik * 284c6fd2807SJeff Garzik * LOCKING: 285c6fd2807SJeff Garzik * Inherited from SCSI layer (none, can sleep) 286c6fd2807SJeff Garzik * 287c6fd2807SJeff Garzik * RETURNS: 288c6fd2807SJeff Garzik * Zero. 289c6fd2807SJeff Garzik */ 290c6fd2807SJeff Garzik void ata_scsi_error(struct Scsi_Host *host) 291c6fd2807SJeff Garzik { 292c6fd2807SJeff Garzik struct ata_port *ap = ata_shost_to_port(host); 293c6fd2807SJeff Garzik int i, repeat_cnt = ATA_EH_MAX_REPEAT; 294c6fd2807SJeff Garzik unsigned long flags; 295c6fd2807SJeff Garzik 296c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 297c6fd2807SJeff Garzik 298c6fd2807SJeff Garzik /* synchronize with port task */ 299c6fd2807SJeff Garzik ata_port_flush_task(ap); 300c6fd2807SJeff Garzik 301cca3974eSJeff Garzik /* synchronize with host lock and sort out timeouts */ 302c6fd2807SJeff Garzik 303c6fd2807SJeff Garzik /* For new EH, all qcs are finished in one of three ways - 304c6fd2807SJeff Garzik * normal completion, error completion, and SCSI timeout. 305c6fd2807SJeff Garzik * Both cmpletions can race against SCSI timeout. When normal 306c6fd2807SJeff Garzik * completion wins, the qc never reaches EH. When error 307c6fd2807SJeff Garzik * completion wins, the qc has ATA_QCFLAG_FAILED set. 308c6fd2807SJeff Garzik * 309c6fd2807SJeff Garzik * When SCSI timeout wins, things are a bit more complex. 310c6fd2807SJeff Garzik * Normal or error completion can occur after the timeout but 311c6fd2807SJeff Garzik * before this point. In such cases, both types of 312c6fd2807SJeff Garzik * completions are honored. 
A scmd is determined to have 313c6fd2807SJeff Garzik * timed out iff its associated qc is active and not failed. 314c6fd2807SJeff Garzik */ 315c6fd2807SJeff Garzik if (ap->ops->error_handler) { 316c6fd2807SJeff Garzik struct scsi_cmnd *scmd, *tmp; 317c6fd2807SJeff Garzik int nr_timedout = 0; 318c6fd2807SJeff Garzik 319c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 320c6fd2807SJeff Garzik 321c6fd2807SJeff Garzik list_for_each_entry_safe(scmd, tmp, &host->eh_cmd_q, eh_entry) { 322c6fd2807SJeff Garzik struct ata_queued_cmd *qc; 323c6fd2807SJeff Garzik 324c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_QUEUE; i++) { 325c6fd2807SJeff Garzik qc = __ata_qc_from_tag(ap, i); 326c6fd2807SJeff Garzik if (qc->flags & ATA_QCFLAG_ACTIVE && 327c6fd2807SJeff Garzik qc->scsicmd == scmd) 328c6fd2807SJeff Garzik break; 329c6fd2807SJeff Garzik } 330c6fd2807SJeff Garzik 331c6fd2807SJeff Garzik if (i < ATA_MAX_QUEUE) { 332c6fd2807SJeff Garzik /* the scmd has an associated qc */ 333c6fd2807SJeff Garzik if (!(qc->flags & ATA_QCFLAG_FAILED)) { 334c6fd2807SJeff Garzik /* which hasn't failed yet, timeout */ 335c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_TIMEOUT; 336c6fd2807SJeff Garzik qc->flags |= ATA_QCFLAG_FAILED; 337c6fd2807SJeff Garzik nr_timedout++; 338c6fd2807SJeff Garzik } 339c6fd2807SJeff Garzik } else { 340c6fd2807SJeff Garzik /* Normal completion occurred after 341c6fd2807SJeff Garzik * SCSI timeout but before this point. 342c6fd2807SJeff Garzik * Successfully complete it. 343c6fd2807SJeff Garzik */ 344c6fd2807SJeff Garzik scmd->retries = scmd->allowed; 345c6fd2807SJeff Garzik scsi_eh_finish_cmd(scmd, &ap->eh_done_q); 346c6fd2807SJeff Garzik } 347c6fd2807SJeff Garzik } 348c6fd2807SJeff Garzik 349c6fd2807SJeff Garzik /* If we have timed out qcs. They belong to EH from 350c6fd2807SJeff Garzik * this point but the state of the controller is 351c6fd2807SJeff Garzik * unknown. Freeze the port to make sure the IRQ 352c6fd2807SJeff Garzik * handler doesn't diddle with those qcs. 
This must 353c6fd2807SJeff Garzik * be done atomically w.r.t. setting QCFLAG_FAILED. 354c6fd2807SJeff Garzik */ 355c6fd2807SJeff Garzik if (nr_timedout) 356c6fd2807SJeff Garzik __ata_port_freeze(ap); 357c6fd2807SJeff Garzik 358c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 359c6fd2807SJeff Garzik } else 360c6fd2807SJeff Garzik spin_unlock_wait(ap->lock); 361c6fd2807SJeff Garzik 362c6fd2807SJeff Garzik repeat: 363c6fd2807SJeff Garzik /* invoke error handler */ 364c6fd2807SJeff Garzik if (ap->ops->error_handler) { 365*5ddf24c5STejun Heo /* kill fast drain timer */ 366*5ddf24c5STejun Heo del_timer_sync(&ap->fastdrain_timer); 367*5ddf24c5STejun Heo 368c6fd2807SJeff Garzik /* process port resume request */ 369c6fd2807SJeff Garzik ata_eh_handle_port_resume(ap); 370c6fd2807SJeff Garzik 371c6fd2807SJeff Garzik /* fetch & clear EH info */ 372c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 373c6fd2807SJeff Garzik 374c6fd2807SJeff Garzik memset(&ap->eh_context, 0, sizeof(ap->eh_context)); 375c6fd2807SJeff Garzik ap->eh_context.i = ap->eh_info; 376c6fd2807SJeff Garzik memset(&ap->eh_info, 0, sizeof(ap->eh_info)); 377c6fd2807SJeff Garzik 378c6fd2807SJeff Garzik ap->pflags |= ATA_PFLAG_EH_IN_PROGRESS; 379c6fd2807SJeff Garzik ap->pflags &= ~ATA_PFLAG_EH_PENDING; 380c6fd2807SJeff Garzik 381c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 382c6fd2807SJeff Garzik 383c6fd2807SJeff Garzik /* invoke EH, skip if unloading or suspended */ 384c6fd2807SJeff Garzik if (!(ap->pflags & (ATA_PFLAG_UNLOADING | ATA_PFLAG_SUSPENDED))) 385c6fd2807SJeff Garzik ap->ops->error_handler(ap); 386c6fd2807SJeff Garzik else 387c6fd2807SJeff Garzik ata_eh_finish(ap); 388c6fd2807SJeff Garzik 389c6fd2807SJeff Garzik /* process port suspend request */ 390c6fd2807SJeff Garzik ata_eh_handle_port_suspend(ap); 391c6fd2807SJeff Garzik 392c6fd2807SJeff Garzik /* Exception might have happend after ->error_handler 393c6fd2807SJeff Garzik * recovered the port but before this point. 
Repeat 394c6fd2807SJeff Garzik * EH in such case. 395c6fd2807SJeff Garzik */ 396c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 397c6fd2807SJeff Garzik 398c6fd2807SJeff Garzik if (ap->pflags & ATA_PFLAG_EH_PENDING) { 399c6fd2807SJeff Garzik if (--repeat_cnt) { 400c6fd2807SJeff Garzik ata_port_printk(ap, KERN_INFO, 401c6fd2807SJeff Garzik "EH pending after completion, " 402c6fd2807SJeff Garzik "repeating EH (cnt=%d)\n", repeat_cnt); 403c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 404c6fd2807SJeff Garzik goto repeat; 405c6fd2807SJeff Garzik } 406c6fd2807SJeff Garzik ata_port_printk(ap, KERN_ERR, "EH pending after %d " 407c6fd2807SJeff Garzik "tries, giving up\n", ATA_EH_MAX_REPEAT); 408914616a3STejun Heo ap->pflags &= ~ATA_PFLAG_EH_PENDING; 409c6fd2807SJeff Garzik } 410c6fd2807SJeff Garzik 411c6fd2807SJeff Garzik /* this run is complete, make sure EH info is clear */ 412c6fd2807SJeff Garzik memset(&ap->eh_info, 0, sizeof(ap->eh_info)); 413c6fd2807SJeff Garzik 414c6fd2807SJeff Garzik /* Clear host_eh_scheduled while holding ap->lock such 415c6fd2807SJeff Garzik * that if exception occurs after this point but 416c6fd2807SJeff Garzik * before EH completion, SCSI midlayer will 417c6fd2807SJeff Garzik * re-initiate EH. 
418c6fd2807SJeff Garzik */ 419c6fd2807SJeff Garzik host->host_eh_scheduled = 0; 420c6fd2807SJeff Garzik 421c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 422c6fd2807SJeff Garzik } else { 423c6fd2807SJeff Garzik WARN_ON(ata_qc_from_tag(ap, ap->active_tag) == NULL); 424c6fd2807SJeff Garzik ap->ops->eng_timeout(ap); 425c6fd2807SJeff Garzik } 426c6fd2807SJeff Garzik 427c6fd2807SJeff Garzik /* finish or retry handled scmd's and clean up */ 428c6fd2807SJeff Garzik WARN_ON(host->host_failed || !list_empty(&host->eh_cmd_q)); 429c6fd2807SJeff Garzik 430c6fd2807SJeff Garzik scsi_eh_flush_done_q(&ap->eh_done_q); 431c6fd2807SJeff Garzik 432c6fd2807SJeff Garzik /* clean up */ 433c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 434c6fd2807SJeff Garzik 435c6fd2807SJeff Garzik if (ap->pflags & ATA_PFLAG_LOADING) 436c6fd2807SJeff Garzik ap->pflags &= ~ATA_PFLAG_LOADING; 437c6fd2807SJeff Garzik else if (ap->pflags & ATA_PFLAG_SCSI_HOTPLUG) 43852bad64dSDavid Howells queue_delayed_work(ata_aux_wq, &ap->hotplug_task, 0); 439c6fd2807SJeff Garzik 440c6fd2807SJeff Garzik if (ap->pflags & ATA_PFLAG_RECOVERED) 441c6fd2807SJeff Garzik ata_port_printk(ap, KERN_INFO, "EH complete\n"); 442c6fd2807SJeff Garzik 443c6fd2807SJeff Garzik ap->pflags &= ~(ATA_PFLAG_SCSI_HOTPLUG | ATA_PFLAG_RECOVERED); 444c6fd2807SJeff Garzik 445c6fd2807SJeff Garzik /* tell wait_eh that we're done */ 446c6fd2807SJeff Garzik ap->pflags &= ~ATA_PFLAG_EH_IN_PROGRESS; 447c6fd2807SJeff Garzik wake_up_all(&ap->eh_wait_q); 448c6fd2807SJeff Garzik 449c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 450c6fd2807SJeff Garzik 451c6fd2807SJeff Garzik DPRINTK("EXIT\n"); 452c6fd2807SJeff Garzik } 453c6fd2807SJeff Garzik 454c6fd2807SJeff Garzik /** 455c6fd2807SJeff Garzik * ata_port_wait_eh - Wait for the currently pending EH to complete 456c6fd2807SJeff Garzik * @ap: Port to wait EH for 457c6fd2807SJeff Garzik * 458c6fd2807SJeff Garzik * Wait until the currently pending EH is complete. 
459c6fd2807SJeff Garzik * 460c6fd2807SJeff Garzik * LOCKING: 461c6fd2807SJeff Garzik * Kernel thread context (may sleep). 462c6fd2807SJeff Garzik */ 463c6fd2807SJeff Garzik void ata_port_wait_eh(struct ata_port *ap) 464c6fd2807SJeff Garzik { 465c6fd2807SJeff Garzik unsigned long flags; 466c6fd2807SJeff Garzik DEFINE_WAIT(wait); 467c6fd2807SJeff Garzik 468c6fd2807SJeff Garzik retry: 469c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 470c6fd2807SJeff Garzik 471c6fd2807SJeff Garzik while (ap->pflags & (ATA_PFLAG_EH_PENDING | ATA_PFLAG_EH_IN_PROGRESS)) { 472c6fd2807SJeff Garzik prepare_to_wait(&ap->eh_wait_q, &wait, TASK_UNINTERRUPTIBLE); 473c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 474c6fd2807SJeff Garzik schedule(); 475c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 476c6fd2807SJeff Garzik } 477c6fd2807SJeff Garzik finish_wait(&ap->eh_wait_q, &wait); 478c6fd2807SJeff Garzik 479c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 480c6fd2807SJeff Garzik 481c6fd2807SJeff Garzik /* make sure SCSI EH is complete */ 482cca3974eSJeff Garzik if (scsi_host_in_recovery(ap->scsi_host)) { 483c6fd2807SJeff Garzik msleep(10); 484c6fd2807SJeff Garzik goto retry; 485c6fd2807SJeff Garzik } 486c6fd2807SJeff Garzik } 487c6fd2807SJeff Garzik 488c6fd2807SJeff Garzik /** 489c6fd2807SJeff Garzik * ata_qc_timeout - Handle timeout of queued command 490c6fd2807SJeff Garzik * @qc: Command that timed out 491c6fd2807SJeff Garzik * 492c6fd2807SJeff Garzik * Some part of the kernel (currently, only the SCSI layer) 493c6fd2807SJeff Garzik * has noticed that the active command on port @ap has not 494c6fd2807SJeff Garzik * completed after a specified length of time. Handle this 495c6fd2807SJeff Garzik * condition by disabling DMA (if necessary) and completing 496c6fd2807SJeff Garzik * transactions, with error if necessary. 
497c6fd2807SJeff Garzik * 498c6fd2807SJeff Garzik * This also handles the case of the "lost interrupt", where 499c6fd2807SJeff Garzik * for some reason (possibly hardware bug, possibly driver bug) 500c6fd2807SJeff Garzik * an interrupt was not delivered to the driver, even though the 501c6fd2807SJeff Garzik * transaction completed successfully. 502c6fd2807SJeff Garzik * 503c6fd2807SJeff Garzik * TODO: kill this function once old EH is gone. 504c6fd2807SJeff Garzik * 505c6fd2807SJeff Garzik * LOCKING: 506c6fd2807SJeff Garzik * Inherited from SCSI layer (none, can sleep) 507c6fd2807SJeff Garzik */ 508c6fd2807SJeff Garzik static void ata_qc_timeout(struct ata_queued_cmd *qc) 509c6fd2807SJeff Garzik { 510c6fd2807SJeff Garzik struct ata_port *ap = qc->ap; 511c6fd2807SJeff Garzik u8 host_stat = 0, drv_stat; 512c6fd2807SJeff Garzik unsigned long flags; 513c6fd2807SJeff Garzik 514c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 515c6fd2807SJeff Garzik 516c6fd2807SJeff Garzik ap->hsm_task_state = HSM_ST_IDLE; 517c6fd2807SJeff Garzik 518c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 519c6fd2807SJeff Garzik 520c6fd2807SJeff Garzik switch (qc->tf.protocol) { 521c6fd2807SJeff Garzik 522c6fd2807SJeff Garzik case ATA_PROT_DMA: 523c6fd2807SJeff Garzik case ATA_PROT_ATAPI_DMA: 524c6fd2807SJeff Garzik host_stat = ap->ops->bmdma_status(ap); 525c6fd2807SJeff Garzik 526c6fd2807SJeff Garzik /* before we do anything else, clear DMA-Start bit */ 527c6fd2807SJeff Garzik ap->ops->bmdma_stop(qc); 528c6fd2807SJeff Garzik 529c6fd2807SJeff Garzik /* fall through */ 530c6fd2807SJeff Garzik 531c6fd2807SJeff Garzik default: 532c6fd2807SJeff Garzik ata_altstatus(ap); 533c6fd2807SJeff Garzik drv_stat = ata_chk_status(ap); 534c6fd2807SJeff Garzik 535c6fd2807SJeff Garzik /* ack bmdma irq events */ 536c6fd2807SJeff Garzik ap->ops->irq_clear(ap); 537c6fd2807SJeff Garzik 538c6fd2807SJeff Garzik ata_dev_printk(qc->dev, KERN_ERR, "command 0x%x timeout, " 539c6fd2807SJeff Garzik "stat 0x%x host_stat 
0x%x\n", 540c6fd2807SJeff Garzik qc->tf.command, drv_stat, host_stat); 541c6fd2807SJeff Garzik 542c6fd2807SJeff Garzik /* complete taskfile transaction */ 543c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_TIMEOUT; 544c6fd2807SJeff Garzik break; 545c6fd2807SJeff Garzik } 546c6fd2807SJeff Garzik 547c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 548c6fd2807SJeff Garzik 549c6fd2807SJeff Garzik ata_eh_qc_complete(qc); 550c6fd2807SJeff Garzik 551c6fd2807SJeff Garzik DPRINTK("EXIT\n"); 552c6fd2807SJeff Garzik } 553c6fd2807SJeff Garzik 554c6fd2807SJeff Garzik /** 555c6fd2807SJeff Garzik * ata_eng_timeout - Handle timeout of queued command 556c6fd2807SJeff Garzik * @ap: Port on which timed-out command is active 557c6fd2807SJeff Garzik * 558c6fd2807SJeff Garzik * Some part of the kernel (currently, only the SCSI layer) 559c6fd2807SJeff Garzik * has noticed that the active command on port @ap has not 560c6fd2807SJeff Garzik * completed after a specified length of time. Handle this 561c6fd2807SJeff Garzik * condition by disabling DMA (if necessary) and completing 562c6fd2807SJeff Garzik * transactions, with error if necessary. 563c6fd2807SJeff Garzik * 564c6fd2807SJeff Garzik * This also handles the case of the "lost interrupt", where 565c6fd2807SJeff Garzik * for some reason (possibly hardware bug, possibly driver bug) 566c6fd2807SJeff Garzik * an interrupt was not delivered to the driver, even though the 567c6fd2807SJeff Garzik * transaction completed successfully. 568c6fd2807SJeff Garzik * 569c6fd2807SJeff Garzik * TODO: kill this function once old EH is gone. 
570c6fd2807SJeff Garzik * 571c6fd2807SJeff Garzik * LOCKING: 572c6fd2807SJeff Garzik * Inherited from SCSI layer (none, can sleep) 573c6fd2807SJeff Garzik */ 574c6fd2807SJeff Garzik void ata_eng_timeout(struct ata_port *ap) 575c6fd2807SJeff Garzik { 576c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 577c6fd2807SJeff Garzik 578c6fd2807SJeff Garzik ata_qc_timeout(ata_qc_from_tag(ap, ap->active_tag)); 579c6fd2807SJeff Garzik 580c6fd2807SJeff Garzik DPRINTK("EXIT\n"); 581c6fd2807SJeff Garzik } 582c6fd2807SJeff Garzik 583*5ddf24c5STejun Heo static int ata_eh_nr_in_flight(struct ata_port *ap) 584*5ddf24c5STejun Heo { 585*5ddf24c5STejun Heo unsigned int tag; 586*5ddf24c5STejun Heo int nr = 0; 587*5ddf24c5STejun Heo 588*5ddf24c5STejun Heo /* count only non-internal commands */ 589*5ddf24c5STejun Heo for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++) 590*5ddf24c5STejun Heo if (ata_qc_from_tag(ap, tag)) 591*5ddf24c5STejun Heo nr++; 592*5ddf24c5STejun Heo 593*5ddf24c5STejun Heo return nr; 594*5ddf24c5STejun Heo } 595*5ddf24c5STejun Heo 596*5ddf24c5STejun Heo void ata_eh_fastdrain_timerfn(unsigned long arg) 597*5ddf24c5STejun Heo { 598*5ddf24c5STejun Heo struct ata_port *ap = (void *)arg; 599*5ddf24c5STejun Heo unsigned long flags; 600*5ddf24c5STejun Heo int cnt; 601*5ddf24c5STejun Heo 602*5ddf24c5STejun Heo spin_lock_irqsave(ap->lock, flags); 603*5ddf24c5STejun Heo 604*5ddf24c5STejun Heo cnt = ata_eh_nr_in_flight(ap); 605*5ddf24c5STejun Heo 606*5ddf24c5STejun Heo /* are we done? */ 607*5ddf24c5STejun Heo if (!cnt) 608*5ddf24c5STejun Heo goto out_unlock; 609*5ddf24c5STejun Heo 610*5ddf24c5STejun Heo if (cnt == ap->fastdrain_cnt) { 611*5ddf24c5STejun Heo unsigned int tag; 612*5ddf24c5STejun Heo 613*5ddf24c5STejun Heo /* No progress during the last interval, tag all 614*5ddf24c5STejun Heo * in-flight qcs as timed out and freeze the port. 
615*5ddf24c5STejun Heo */ 616*5ddf24c5STejun Heo for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++) { 617*5ddf24c5STejun Heo struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag); 618*5ddf24c5STejun Heo if (qc) 619*5ddf24c5STejun Heo qc->err_mask |= AC_ERR_TIMEOUT; 620*5ddf24c5STejun Heo } 621*5ddf24c5STejun Heo 622*5ddf24c5STejun Heo ata_port_freeze(ap); 623*5ddf24c5STejun Heo } else { 624*5ddf24c5STejun Heo /* some qcs have finished, give it another chance */ 625*5ddf24c5STejun Heo ap->fastdrain_cnt = cnt; 626*5ddf24c5STejun Heo ap->fastdrain_timer.expires = 627*5ddf24c5STejun Heo jiffies + ATA_EH_FASTDRAIN_INTERVAL; 628*5ddf24c5STejun Heo add_timer(&ap->fastdrain_timer); 629*5ddf24c5STejun Heo } 630*5ddf24c5STejun Heo 631*5ddf24c5STejun Heo out_unlock: 632*5ddf24c5STejun Heo spin_unlock_irqrestore(ap->lock, flags); 633*5ddf24c5STejun Heo } 634*5ddf24c5STejun Heo 635*5ddf24c5STejun Heo /** 636*5ddf24c5STejun Heo * ata_eh_set_pending - set ATA_PFLAG_EH_PENDING and activate fast drain 637*5ddf24c5STejun Heo * @ap: target ATA port 638*5ddf24c5STejun Heo * @fastdrain: activate fast drain 639*5ddf24c5STejun Heo * 640*5ddf24c5STejun Heo * Set ATA_PFLAG_EH_PENDING and activate fast drain if @fastdrain 641*5ddf24c5STejun Heo * is non-zero and EH wasn't pending before. Fast drain ensures 642*5ddf24c5STejun Heo * that EH kicks in in timely manner. 643*5ddf24c5STejun Heo * 644*5ddf24c5STejun Heo * LOCKING: 645*5ddf24c5STejun Heo * spin_lock_irqsave(host lock) 646*5ddf24c5STejun Heo */ 647*5ddf24c5STejun Heo static void ata_eh_set_pending(struct ata_port *ap, int fastdrain) 648*5ddf24c5STejun Heo { 649*5ddf24c5STejun Heo int cnt; 650*5ddf24c5STejun Heo 651*5ddf24c5STejun Heo /* already scheduled? 
*/ 652*5ddf24c5STejun Heo if (ap->pflags & ATA_PFLAG_EH_PENDING) 653*5ddf24c5STejun Heo return; 654*5ddf24c5STejun Heo 655*5ddf24c5STejun Heo ap->pflags |= ATA_PFLAG_EH_PENDING; 656*5ddf24c5STejun Heo 657*5ddf24c5STejun Heo if (!fastdrain) 658*5ddf24c5STejun Heo return; 659*5ddf24c5STejun Heo 660*5ddf24c5STejun Heo /* do we have in-flight qcs? */ 661*5ddf24c5STejun Heo cnt = ata_eh_nr_in_flight(ap); 662*5ddf24c5STejun Heo if (!cnt) 663*5ddf24c5STejun Heo return; 664*5ddf24c5STejun Heo 665*5ddf24c5STejun Heo /* activate fast drain */ 666*5ddf24c5STejun Heo ap->fastdrain_cnt = cnt; 667*5ddf24c5STejun Heo ap->fastdrain_timer.expires = jiffies + ATA_EH_FASTDRAIN_INTERVAL; 668*5ddf24c5STejun Heo add_timer(&ap->fastdrain_timer); 669*5ddf24c5STejun Heo } 670*5ddf24c5STejun Heo 671c6fd2807SJeff Garzik /** 672c6fd2807SJeff Garzik * ata_qc_schedule_eh - schedule qc for error handling 673c6fd2807SJeff Garzik * @qc: command to schedule error handling for 674c6fd2807SJeff Garzik * 675c6fd2807SJeff Garzik * Schedule error handling for @qc. EH will kick in as soon as 676c6fd2807SJeff Garzik * other commands are drained. 677c6fd2807SJeff Garzik * 678c6fd2807SJeff Garzik * LOCKING: 679cca3974eSJeff Garzik * spin_lock_irqsave(host lock) 680c6fd2807SJeff Garzik */ 681c6fd2807SJeff Garzik void ata_qc_schedule_eh(struct ata_queued_cmd *qc) 682c6fd2807SJeff Garzik { 683c6fd2807SJeff Garzik struct ata_port *ap = qc->ap; 684c6fd2807SJeff Garzik 685c6fd2807SJeff Garzik WARN_ON(!ap->ops->error_handler); 686c6fd2807SJeff Garzik 687c6fd2807SJeff Garzik qc->flags |= ATA_QCFLAG_FAILED; 688*5ddf24c5STejun Heo ata_eh_set_pending(ap, 1); 689c6fd2807SJeff Garzik 690c6fd2807SJeff Garzik /* The following will fail if timeout has already expired. 691c6fd2807SJeff Garzik * ata_scsi_error() takes care of such scmds on EH entry. 692c6fd2807SJeff Garzik * Note that ATA_QCFLAG_FAILED is unconditionally set after 693c6fd2807SJeff Garzik * this function completes. 
694c6fd2807SJeff Garzik */ 695c6fd2807SJeff Garzik scsi_req_abort_cmd(qc->scsicmd); 696c6fd2807SJeff Garzik } 697c6fd2807SJeff Garzik 698c6fd2807SJeff Garzik /** 699c6fd2807SJeff Garzik * ata_port_schedule_eh - schedule error handling without a qc 700c6fd2807SJeff Garzik * @ap: ATA port to schedule EH for 701c6fd2807SJeff Garzik * 702c6fd2807SJeff Garzik * Schedule error handling for @ap. EH will kick in as soon as 703c6fd2807SJeff Garzik * all commands are drained. 704c6fd2807SJeff Garzik * 705c6fd2807SJeff Garzik * LOCKING: 706cca3974eSJeff Garzik * spin_lock_irqsave(host lock) 707c6fd2807SJeff Garzik */ 708c6fd2807SJeff Garzik void ata_port_schedule_eh(struct ata_port *ap) 709c6fd2807SJeff Garzik { 710c6fd2807SJeff Garzik WARN_ON(!ap->ops->error_handler); 711c6fd2807SJeff Garzik 712f4d6d004STejun Heo if (ap->pflags & ATA_PFLAG_INITIALIZING) 713f4d6d004STejun Heo return; 714f4d6d004STejun Heo 715*5ddf24c5STejun Heo ata_eh_set_pending(ap, 1); 716cca3974eSJeff Garzik scsi_schedule_eh(ap->scsi_host); 717c6fd2807SJeff Garzik 718c6fd2807SJeff Garzik DPRINTK("port EH scheduled\n"); 719c6fd2807SJeff Garzik } 720c6fd2807SJeff Garzik 721c6fd2807SJeff Garzik /** 722c6fd2807SJeff Garzik * ata_port_abort - abort all qc's on the port 723c6fd2807SJeff Garzik * @ap: ATA port to abort qc's for 724c6fd2807SJeff Garzik * 725c6fd2807SJeff Garzik * Abort all active qc's of @ap and schedule EH. 726c6fd2807SJeff Garzik * 727c6fd2807SJeff Garzik * LOCKING: 728cca3974eSJeff Garzik * spin_lock_irqsave(host lock) 729c6fd2807SJeff Garzik * 730c6fd2807SJeff Garzik * RETURNS: 731c6fd2807SJeff Garzik * Number of aborted qc's. 
732c6fd2807SJeff Garzik */ 733c6fd2807SJeff Garzik int ata_port_abort(struct ata_port *ap) 734c6fd2807SJeff Garzik { 735c6fd2807SJeff Garzik int tag, nr_aborted = 0; 736c6fd2807SJeff Garzik 737c6fd2807SJeff Garzik WARN_ON(!ap->ops->error_handler); 738c6fd2807SJeff Garzik 739*5ddf24c5STejun Heo /* we're gonna abort all commands, no need for fast drain */ 740*5ddf24c5STejun Heo ata_eh_set_pending(ap, 0); 741*5ddf24c5STejun Heo 742c6fd2807SJeff Garzik for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 743c6fd2807SJeff Garzik struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag); 744c6fd2807SJeff Garzik 745c6fd2807SJeff Garzik if (qc) { 746c6fd2807SJeff Garzik qc->flags |= ATA_QCFLAG_FAILED; 747c6fd2807SJeff Garzik ata_qc_complete(qc); 748c6fd2807SJeff Garzik nr_aborted++; 749c6fd2807SJeff Garzik } 750c6fd2807SJeff Garzik } 751c6fd2807SJeff Garzik 752c6fd2807SJeff Garzik if (!nr_aborted) 753c6fd2807SJeff Garzik ata_port_schedule_eh(ap); 754c6fd2807SJeff Garzik 755c6fd2807SJeff Garzik return nr_aborted; 756c6fd2807SJeff Garzik } 757c6fd2807SJeff Garzik 758c6fd2807SJeff Garzik /** 759c6fd2807SJeff Garzik * __ata_port_freeze - freeze port 760c6fd2807SJeff Garzik * @ap: ATA port to freeze 761c6fd2807SJeff Garzik * 762c6fd2807SJeff Garzik * This function is called when HSM violation or some other 763c6fd2807SJeff Garzik * condition disrupts normal operation of the port. Frozen port 764c6fd2807SJeff Garzik * is not allowed to perform any operation until the port is 765c6fd2807SJeff Garzik * thawed, which usually follows a successful reset. 766c6fd2807SJeff Garzik * 767c6fd2807SJeff Garzik * ap->ops->freeze() callback can be used for freezing the port 768c6fd2807SJeff Garzik * hardware-wise (e.g. mask interrupt and stop DMA engine). If a 769c6fd2807SJeff Garzik * port cannot be frozen hardware-wise, the interrupt handler 770c6fd2807SJeff Garzik * must ack and clear interrupts unconditionally while the port 771c6fd2807SJeff Garzik * is frozen. 
772c6fd2807SJeff Garzik * 773c6fd2807SJeff Garzik * LOCKING: 774cca3974eSJeff Garzik * spin_lock_irqsave(host lock) 775c6fd2807SJeff Garzik */ 776c6fd2807SJeff Garzik static void __ata_port_freeze(struct ata_port *ap) 777c6fd2807SJeff Garzik { 778c6fd2807SJeff Garzik WARN_ON(!ap->ops->error_handler); 779c6fd2807SJeff Garzik 780c6fd2807SJeff Garzik if (ap->ops->freeze) 781c6fd2807SJeff Garzik ap->ops->freeze(ap); 782c6fd2807SJeff Garzik 783c6fd2807SJeff Garzik ap->pflags |= ATA_PFLAG_FROZEN; 784c6fd2807SJeff Garzik 78544877b4eSTejun Heo DPRINTK("ata%u port frozen\n", ap->print_id); 786c6fd2807SJeff Garzik } 787c6fd2807SJeff Garzik 788c6fd2807SJeff Garzik /** 789c6fd2807SJeff Garzik * ata_port_freeze - abort & freeze port 790c6fd2807SJeff Garzik * @ap: ATA port to freeze 791c6fd2807SJeff Garzik * 792c6fd2807SJeff Garzik * Abort and freeze @ap. 793c6fd2807SJeff Garzik * 794c6fd2807SJeff Garzik * LOCKING: 795cca3974eSJeff Garzik * spin_lock_irqsave(host lock) 796c6fd2807SJeff Garzik * 797c6fd2807SJeff Garzik * RETURNS: 798c6fd2807SJeff Garzik * Number of aborted commands. 799c6fd2807SJeff Garzik */ 800c6fd2807SJeff Garzik int ata_port_freeze(struct ata_port *ap) 801c6fd2807SJeff Garzik { 802c6fd2807SJeff Garzik int nr_aborted; 803c6fd2807SJeff Garzik 804c6fd2807SJeff Garzik WARN_ON(!ap->ops->error_handler); 805c6fd2807SJeff Garzik 806c6fd2807SJeff Garzik nr_aborted = ata_port_abort(ap); 807c6fd2807SJeff Garzik __ata_port_freeze(ap); 808c6fd2807SJeff Garzik 809c6fd2807SJeff Garzik return nr_aborted; 810c6fd2807SJeff Garzik } 811c6fd2807SJeff Garzik 812c6fd2807SJeff Garzik /** 813c6fd2807SJeff Garzik * ata_eh_freeze_port - EH helper to freeze port 814c6fd2807SJeff Garzik * @ap: ATA port to freeze 815c6fd2807SJeff Garzik * 816c6fd2807SJeff Garzik * Freeze @ap. 817c6fd2807SJeff Garzik * 818c6fd2807SJeff Garzik * LOCKING: 819c6fd2807SJeff Garzik * None. 
820c6fd2807SJeff Garzik */ 821c6fd2807SJeff Garzik void ata_eh_freeze_port(struct ata_port *ap) 822c6fd2807SJeff Garzik { 823c6fd2807SJeff Garzik unsigned long flags; 824c6fd2807SJeff Garzik 825c6fd2807SJeff Garzik if (!ap->ops->error_handler) 826c6fd2807SJeff Garzik return; 827c6fd2807SJeff Garzik 828c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 829c6fd2807SJeff Garzik __ata_port_freeze(ap); 830c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 831c6fd2807SJeff Garzik } 832c6fd2807SJeff Garzik 833c6fd2807SJeff Garzik /** 834c6fd2807SJeff Garzik * ata_eh_thaw_port - EH helper to thaw port 835c6fd2807SJeff Garzik * @ap: ATA port to thaw 836c6fd2807SJeff Garzik * 837c6fd2807SJeff Garzik * Thaw frozen port @ap. 838c6fd2807SJeff Garzik * 839c6fd2807SJeff Garzik * LOCKING: 840c6fd2807SJeff Garzik * None. 841c6fd2807SJeff Garzik */ 842c6fd2807SJeff Garzik void ata_eh_thaw_port(struct ata_port *ap) 843c6fd2807SJeff Garzik { 844c6fd2807SJeff Garzik unsigned long flags; 845c6fd2807SJeff Garzik 846c6fd2807SJeff Garzik if (!ap->ops->error_handler) 847c6fd2807SJeff Garzik return; 848c6fd2807SJeff Garzik 849c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 850c6fd2807SJeff Garzik 851c6fd2807SJeff Garzik ap->pflags &= ~ATA_PFLAG_FROZEN; 852c6fd2807SJeff Garzik 853c6fd2807SJeff Garzik if (ap->ops->thaw) 854c6fd2807SJeff Garzik ap->ops->thaw(ap); 855c6fd2807SJeff Garzik 856c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 857c6fd2807SJeff Garzik 85844877b4eSTejun Heo DPRINTK("ata%u port thawed\n", ap->print_id); 859c6fd2807SJeff Garzik } 860c6fd2807SJeff Garzik 861c6fd2807SJeff Garzik static void ata_eh_scsidone(struct scsi_cmnd *scmd) 862c6fd2807SJeff Garzik { 863c6fd2807SJeff Garzik /* nada */ 864c6fd2807SJeff Garzik } 865c6fd2807SJeff Garzik 866c6fd2807SJeff Garzik static void __ata_eh_qc_complete(struct ata_queued_cmd *qc) 867c6fd2807SJeff Garzik { 868c6fd2807SJeff Garzik struct ata_port *ap = qc->ap; 869c6fd2807SJeff Garzik struct
scsi_cmnd *scmd = qc->scsicmd; 870c6fd2807SJeff Garzik unsigned long flags; 871c6fd2807SJeff Garzik 872c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 873c6fd2807SJeff Garzik qc->scsidone = ata_eh_scsidone; 874c6fd2807SJeff Garzik __ata_qc_complete(qc); 875c6fd2807SJeff Garzik WARN_ON(ata_tag_valid(qc->tag)); 876c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 877c6fd2807SJeff Garzik 878c6fd2807SJeff Garzik scsi_eh_finish_cmd(scmd, &ap->eh_done_q); 879c6fd2807SJeff Garzik } 880c6fd2807SJeff Garzik 881c6fd2807SJeff Garzik /** 882c6fd2807SJeff Garzik * ata_eh_qc_complete - Complete an active ATA command from EH 883c6fd2807SJeff Garzik * @qc: Command to complete 884c6fd2807SJeff Garzik * 885c6fd2807SJeff Garzik * Indicate to the mid and upper layers that an ATA command has 886c6fd2807SJeff Garzik * completed. To be used from EH. 887c6fd2807SJeff Garzik */ 888c6fd2807SJeff Garzik void ata_eh_qc_complete(struct ata_queued_cmd *qc) 889c6fd2807SJeff Garzik { 890c6fd2807SJeff Garzik struct scsi_cmnd *scmd = qc->scsicmd; 891c6fd2807SJeff Garzik scmd->retries = scmd->allowed; 892c6fd2807SJeff Garzik __ata_eh_qc_complete(qc); 893c6fd2807SJeff Garzik } 894c6fd2807SJeff Garzik 895c6fd2807SJeff Garzik /** 896c6fd2807SJeff Garzik * ata_eh_qc_retry - Tell midlayer to retry an ATA command after EH 897c6fd2807SJeff Garzik * @qc: Command to retry 898c6fd2807SJeff Garzik * 899c6fd2807SJeff Garzik * Indicate to the mid and upper layers that an ATA command 900c6fd2807SJeff Garzik * should be retried. To be used from EH. 901c6fd2807SJeff Garzik * 902c6fd2807SJeff Garzik * SCSI midlayer limits the number of retries to scmd->allowed. 903c6fd2807SJeff Garzik * scmd->retries is decremented for commands which get retried 904c6fd2807SJeff Garzik * due to unrelated failures (qc->err_mask is zero). 
905c6fd2807SJeff Garzik */ 906c6fd2807SJeff Garzik void ata_eh_qc_retry(struct ata_queued_cmd *qc) 907c6fd2807SJeff Garzik { 908c6fd2807SJeff Garzik struct scsi_cmnd *scmd = qc->scsicmd; 909c6fd2807SJeff Garzik if (!qc->err_mask && scmd->retries) 910c6fd2807SJeff Garzik scmd->retries--; 911c6fd2807SJeff Garzik __ata_eh_qc_complete(qc); 912c6fd2807SJeff Garzik } 913c6fd2807SJeff Garzik 914c6fd2807SJeff Garzik /** 915c6fd2807SJeff Garzik * ata_eh_detach_dev - detach ATA device 916c6fd2807SJeff Garzik * @dev: ATA device to detach 917c6fd2807SJeff Garzik * 918c6fd2807SJeff Garzik * Detach @dev. 919c6fd2807SJeff Garzik * 920c6fd2807SJeff Garzik * LOCKING: 921c6fd2807SJeff Garzik * None. 922c6fd2807SJeff Garzik */ 923c6fd2807SJeff Garzik static void ata_eh_detach_dev(struct ata_device *dev) 924c6fd2807SJeff Garzik { 925c6fd2807SJeff Garzik struct ata_port *ap = dev->ap; 926c6fd2807SJeff Garzik unsigned long flags; 927c6fd2807SJeff Garzik 928c6fd2807SJeff Garzik ata_dev_disable(dev); 929c6fd2807SJeff Garzik 930c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 931c6fd2807SJeff Garzik 932c6fd2807SJeff Garzik dev->flags &= ~ATA_DFLAG_DETACH; 933c6fd2807SJeff Garzik 934c6fd2807SJeff Garzik if (ata_scsi_offline_dev(dev)) { 935c6fd2807SJeff Garzik dev->flags |= ATA_DFLAG_DETACHED; 936c6fd2807SJeff Garzik ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG; 937c6fd2807SJeff Garzik } 938c6fd2807SJeff Garzik 939c6fd2807SJeff Garzik /* clear per-dev EH actions */ 940c6fd2807SJeff Garzik ata_eh_clear_action(dev, &ap->eh_info, ATA_EH_PERDEV_MASK); 941c6fd2807SJeff Garzik ata_eh_clear_action(dev, &ap->eh_context.i, ATA_EH_PERDEV_MASK); 942c6fd2807SJeff Garzik 943c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 944c6fd2807SJeff Garzik } 945c6fd2807SJeff Garzik 946c6fd2807SJeff Garzik /** 947c6fd2807SJeff Garzik * ata_eh_about_to_do - about to perform eh_action 948c6fd2807SJeff Garzik * @ap: target ATA port 949c6fd2807SJeff Garzik * @dev: target ATA dev for per-dev action (can be 
NULL) 950c6fd2807SJeff Garzik * @action: action about to be performed 951c6fd2807SJeff Garzik * 952c6fd2807SJeff Garzik * Called just before performing EH actions to clear related bits 953c6fd2807SJeff Garzik * in @ap->eh_info such that eh actions are not unnecessarily 954c6fd2807SJeff Garzik * repeated. 955c6fd2807SJeff Garzik * 956c6fd2807SJeff Garzik * LOCKING: 957c6fd2807SJeff Garzik * None. 958c6fd2807SJeff Garzik */ 959c6fd2807SJeff Garzik static void ata_eh_about_to_do(struct ata_port *ap, struct ata_device *dev, 960c6fd2807SJeff Garzik unsigned int action) 961c6fd2807SJeff Garzik { 962c6fd2807SJeff Garzik unsigned long flags; 963c6fd2807SJeff Garzik struct ata_eh_info *ehi = &ap->eh_info; 964c6fd2807SJeff Garzik struct ata_eh_context *ehc = &ap->eh_context; 965c6fd2807SJeff Garzik 966c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 967c6fd2807SJeff Garzik 968c6fd2807SJeff Garzik /* Reset is represented by combination of actions and EHI 969c6fd2807SJeff Garzik * flags. Suck in all related bits before clearing eh_info to 970c6fd2807SJeff Garzik * avoid losing requested action. 
971c6fd2807SJeff Garzik */ 972c6fd2807SJeff Garzik if (action & ATA_EH_RESET_MASK) { 973c6fd2807SJeff Garzik ehc->i.action |= ehi->action & ATA_EH_RESET_MASK; 974c6fd2807SJeff Garzik ehc->i.flags |= ehi->flags & ATA_EHI_RESET_MODIFIER_MASK; 975c6fd2807SJeff Garzik 976c6fd2807SJeff Garzik /* make sure all reset actions are cleared & clear EHI flags */ 977c6fd2807SJeff Garzik action |= ATA_EH_RESET_MASK; 978c6fd2807SJeff Garzik ehi->flags &= ~ATA_EHI_RESET_MODIFIER_MASK; 979c6fd2807SJeff Garzik } 980c6fd2807SJeff Garzik 981c6fd2807SJeff Garzik ata_eh_clear_action(dev, ehi, action); 982c6fd2807SJeff Garzik 983c6fd2807SJeff Garzik if (!(ehc->i.flags & ATA_EHI_QUIET)) 984c6fd2807SJeff Garzik ap->pflags |= ATA_PFLAG_RECOVERED; 985c6fd2807SJeff Garzik 986c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 987c6fd2807SJeff Garzik } 988c6fd2807SJeff Garzik 989c6fd2807SJeff Garzik /** 990c6fd2807SJeff Garzik * ata_eh_done - EH action complete 991c6fd2807SJeff Garzik * @ap: target ATA port 992c6fd2807SJeff Garzik * @dev: target ATA dev for per-dev action (can be NULL) 993c6fd2807SJeff Garzik * @action: action just completed 994c6fd2807SJeff Garzik * 995c6fd2807SJeff Garzik * Called right after performing EH actions to clear related bits 996c6fd2807SJeff Garzik * in @ap->eh_context. 997c6fd2807SJeff Garzik * 998c6fd2807SJeff Garzik * LOCKING: 999c6fd2807SJeff Garzik * None. 
1000c6fd2807SJeff Garzik */ 1001c6fd2807SJeff Garzik static void ata_eh_done(struct ata_port *ap, struct ata_device *dev, 1002c6fd2807SJeff Garzik unsigned int action) 1003c6fd2807SJeff Garzik { 1004c6fd2807SJeff Garzik /* if reset is complete, clear all reset actions & reset modifier */ 1005c6fd2807SJeff Garzik if (action & ATA_EH_RESET_MASK) { 1006c6fd2807SJeff Garzik action |= ATA_EH_RESET_MASK; 1007c6fd2807SJeff Garzik ap->eh_context.i.flags &= ~ATA_EHI_RESET_MODIFIER_MASK; 1008c6fd2807SJeff Garzik } 1009c6fd2807SJeff Garzik 1010c6fd2807SJeff Garzik ata_eh_clear_action(dev, &ap->eh_context.i, action); 1011c6fd2807SJeff Garzik } 1012c6fd2807SJeff Garzik 1013c6fd2807SJeff Garzik /** 1014c6fd2807SJeff Garzik * ata_err_string - convert err_mask to descriptive string 1015c6fd2807SJeff Garzik * @err_mask: error mask to convert to string 1016c6fd2807SJeff Garzik * 1017c6fd2807SJeff Garzik * Convert @err_mask to descriptive string. Errors are 1018c6fd2807SJeff Garzik * prioritized according to severity and only the most severe 1019c6fd2807SJeff Garzik * error is reported. 1020c6fd2807SJeff Garzik * 1021c6fd2807SJeff Garzik * LOCKING: 1022c6fd2807SJeff Garzik * None. 
1023c6fd2807SJeff Garzik * 1024c6fd2807SJeff Garzik * RETURNS: 1025c6fd2807SJeff Garzik * Descriptive string for @err_mask 1026c6fd2807SJeff Garzik */ 1027c6fd2807SJeff Garzik static const char * ata_err_string(unsigned int err_mask) 1028c6fd2807SJeff Garzik { 1029c6fd2807SJeff Garzik if (err_mask & AC_ERR_HOST_BUS) 1030c6fd2807SJeff Garzik return "host bus error"; 1031c6fd2807SJeff Garzik if (err_mask & AC_ERR_ATA_BUS) 1032c6fd2807SJeff Garzik return "ATA bus error"; 1033c6fd2807SJeff Garzik if (err_mask & AC_ERR_TIMEOUT) 1034c6fd2807SJeff Garzik return "timeout"; 1035c6fd2807SJeff Garzik if (err_mask & AC_ERR_HSM) 1036c6fd2807SJeff Garzik return "HSM violation"; 1037c6fd2807SJeff Garzik if (err_mask & AC_ERR_SYSTEM) 1038c6fd2807SJeff Garzik return "internal error"; 1039c6fd2807SJeff Garzik if (err_mask & AC_ERR_MEDIA) 1040c6fd2807SJeff Garzik return "media error"; 1041c6fd2807SJeff Garzik if (err_mask & AC_ERR_INVALID) 1042c6fd2807SJeff Garzik return "invalid argument"; 1043c6fd2807SJeff Garzik if (err_mask & AC_ERR_DEV) 1044c6fd2807SJeff Garzik return "device error"; 1045c6fd2807SJeff Garzik return "unknown error"; 1046c6fd2807SJeff Garzik } 1047c6fd2807SJeff Garzik 1048c6fd2807SJeff Garzik /** 1049c6fd2807SJeff Garzik * ata_read_log_page - read a specific log page 1050c6fd2807SJeff Garzik * @dev: target device 1051c6fd2807SJeff Garzik * @page: page to read 1052c6fd2807SJeff Garzik * @buf: buffer to store read page 1053c6fd2807SJeff Garzik * @sectors: number of sectors to read 1054c6fd2807SJeff Garzik * 1055c6fd2807SJeff Garzik * Read log page using READ_LOG_EXT command. 1056c6fd2807SJeff Garzik * 1057c6fd2807SJeff Garzik * LOCKING: 1058c6fd2807SJeff Garzik * Kernel thread context (may sleep). 1059c6fd2807SJeff Garzik * 1060c6fd2807SJeff Garzik * RETURNS: 1061c6fd2807SJeff Garzik * 0 on success, AC_ERR_* mask otherwise. 
1062c6fd2807SJeff Garzik */ 1063c6fd2807SJeff Garzik static unsigned int ata_read_log_page(struct ata_device *dev, 1064c6fd2807SJeff Garzik u8 page, void *buf, unsigned int sectors) 1065c6fd2807SJeff Garzik { 1066c6fd2807SJeff Garzik struct ata_taskfile tf; 1067c6fd2807SJeff Garzik unsigned int err_mask; 1068c6fd2807SJeff Garzik 1069c6fd2807SJeff Garzik DPRINTK("read log page - page %d\n", page); 1070c6fd2807SJeff Garzik 1071c6fd2807SJeff Garzik ata_tf_init(dev, &tf); 1072c6fd2807SJeff Garzik tf.command = ATA_CMD_READ_LOG_EXT; 1073c6fd2807SJeff Garzik tf.lbal = page; 1074c6fd2807SJeff Garzik tf.nsect = sectors; 1075c6fd2807SJeff Garzik tf.hob_nsect = sectors >> 8; 1076c6fd2807SJeff Garzik tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_LBA48 | ATA_TFLAG_DEVICE; 1077c6fd2807SJeff Garzik tf.protocol = ATA_PROT_PIO; 1078c6fd2807SJeff Garzik 1079c6fd2807SJeff Garzik err_mask = ata_exec_internal(dev, &tf, NULL, DMA_FROM_DEVICE, 1080c6fd2807SJeff Garzik buf, sectors * ATA_SECT_SIZE); 1081c6fd2807SJeff Garzik 1082c6fd2807SJeff Garzik DPRINTK("EXIT, err_mask=%x\n", err_mask); 1083c6fd2807SJeff Garzik return err_mask; 1084c6fd2807SJeff Garzik } 1085c6fd2807SJeff Garzik 1086c6fd2807SJeff Garzik /** 1087c6fd2807SJeff Garzik * ata_eh_read_log_10h - Read log page 10h for NCQ error details 1088c6fd2807SJeff Garzik * @dev: Device to read log page 10h from 1089c6fd2807SJeff Garzik * @tag: Resulting tag of the failed command 1090c6fd2807SJeff Garzik * @tf: Resulting taskfile registers of the failed command 1091c6fd2807SJeff Garzik * 1092c6fd2807SJeff Garzik * Read log page 10h to obtain NCQ error details and clear error 1093c6fd2807SJeff Garzik * condition. 1094c6fd2807SJeff Garzik * 1095c6fd2807SJeff Garzik * LOCKING: 1096c6fd2807SJeff Garzik * Kernel thread context (may sleep). 1097c6fd2807SJeff Garzik * 1098c6fd2807SJeff Garzik * RETURNS: 1099c6fd2807SJeff Garzik * 0 on success, -errno otherwise. 
1100c6fd2807SJeff Garzik */ 1101c6fd2807SJeff Garzik static int ata_eh_read_log_10h(struct ata_device *dev, 1102c6fd2807SJeff Garzik int *tag, struct ata_taskfile *tf) 1103c6fd2807SJeff Garzik { 1104c6fd2807SJeff Garzik u8 *buf = dev->ap->sector_buf; 1105c6fd2807SJeff Garzik unsigned int err_mask; 1106c6fd2807SJeff Garzik u8 csum; 1107c6fd2807SJeff Garzik int i; 1108c6fd2807SJeff Garzik 1109c6fd2807SJeff Garzik err_mask = ata_read_log_page(dev, ATA_LOG_SATA_NCQ, buf, 1); 1110c6fd2807SJeff Garzik if (err_mask) 1111c6fd2807SJeff Garzik return -EIO; 1112c6fd2807SJeff Garzik 1113c6fd2807SJeff Garzik csum = 0; 1114c6fd2807SJeff Garzik for (i = 0; i < ATA_SECT_SIZE; i++) 1115c6fd2807SJeff Garzik csum += buf[i]; 1116c6fd2807SJeff Garzik if (csum) 1117c6fd2807SJeff Garzik ata_dev_printk(dev, KERN_WARNING, 1118c6fd2807SJeff Garzik "invalid checksum 0x%x on log page 10h\n", csum); 1119c6fd2807SJeff Garzik 1120c6fd2807SJeff Garzik if (buf[0] & 0x80) 1121c6fd2807SJeff Garzik return -ENOENT; 1122c6fd2807SJeff Garzik 1123c6fd2807SJeff Garzik *tag = buf[0] & 0x1f; 1124c6fd2807SJeff Garzik 1125c6fd2807SJeff Garzik tf->command = buf[2]; 1126c6fd2807SJeff Garzik tf->feature = buf[3]; 1127c6fd2807SJeff Garzik tf->lbal = buf[4]; 1128c6fd2807SJeff Garzik tf->lbam = buf[5]; 1129c6fd2807SJeff Garzik tf->lbah = buf[6]; 1130c6fd2807SJeff Garzik tf->device = buf[7]; 1131c6fd2807SJeff Garzik tf->hob_lbal = buf[8]; 1132c6fd2807SJeff Garzik tf->hob_lbam = buf[9]; 1133c6fd2807SJeff Garzik tf->hob_lbah = buf[10]; 1134c6fd2807SJeff Garzik tf->nsect = buf[12]; 1135c6fd2807SJeff Garzik tf->hob_nsect = buf[13]; 1136c6fd2807SJeff Garzik 1137c6fd2807SJeff Garzik return 0; 1138c6fd2807SJeff Garzik } 1139c6fd2807SJeff Garzik 1140c6fd2807SJeff Garzik /** 1141c6fd2807SJeff Garzik * atapi_eh_request_sense - perform ATAPI REQUEST_SENSE 1142c6fd2807SJeff Garzik * @qc: failed command; REQUEST_SENSE is issued to qc->dev and the 1143c6fd2807SJeff Garzik * sense data (SCSI_SENSE_BUFFERSIZE bytes) is stored in qc->scsicmd->sense_buffer
1144c6fd2807SJeff Garzik * 1145c6fd2807SJeff Garzik * Perform ATAPI REQUEST_SENSE after the device reported CHECK 1146c6fd2807SJeff Garzik * SENSE. This function is EH helper. 1147c6fd2807SJeff Garzik * 1148c6fd2807SJeff Garzik * LOCKING: 1149c6fd2807SJeff Garzik * Kernel thread context (may sleep). 1150c6fd2807SJeff Garzik * 1151c6fd2807SJeff Garzik * RETURNS: 1152c6fd2807SJeff Garzik * 0 on success, AC_ERR_* mask on failure 1153c6fd2807SJeff Garzik */ 115456287768SAlbert Lee static unsigned int atapi_eh_request_sense(struct ata_queued_cmd *qc) 1155c6fd2807SJeff Garzik { 115656287768SAlbert Lee struct ata_device *dev = qc->dev; 115756287768SAlbert Lee unsigned char *sense_buf = qc->scsicmd->sense_buffer; 1158c6fd2807SJeff Garzik struct ata_port *ap = dev->ap; 1159c6fd2807SJeff Garzik struct ata_taskfile tf; 1160c6fd2807SJeff Garzik u8 cdb[ATAPI_CDB_LEN]; 1161c6fd2807SJeff Garzik 1162c6fd2807SJeff Garzik DPRINTK("ATAPI request sense\n"); 1163c6fd2807SJeff Garzik 1164c6fd2807SJeff Garzik /* FIXME: is this needed? 
*/ 1165c6fd2807SJeff Garzik memset(sense_buf, 0, SCSI_SENSE_BUFFERSIZE); 1166c6fd2807SJeff Garzik 116756287768SAlbert Lee /* initialize sense_buf with the error register, 116856287768SAlbert Lee * for the case where they are -not- overwritten 116956287768SAlbert Lee */ 1170c6fd2807SJeff Garzik sense_buf[0] = 0x70; 117156287768SAlbert Lee sense_buf[2] = qc->result_tf.feature >> 4; 117256287768SAlbert Lee 117356287768SAlbert Lee /* some devices time out if garbage left in tf */ 117456287768SAlbert Lee ata_tf_init(dev, &tf); 1175c6fd2807SJeff Garzik 1176c6fd2807SJeff Garzik memset(cdb, 0, ATAPI_CDB_LEN); 1177c6fd2807SJeff Garzik cdb[0] = REQUEST_SENSE; 1178c6fd2807SJeff Garzik cdb[4] = SCSI_SENSE_BUFFERSIZE; 1179c6fd2807SJeff Garzik 1180c6fd2807SJeff Garzik tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE; 1181c6fd2807SJeff Garzik tf.command = ATA_CMD_PACKET; 1182c6fd2807SJeff Garzik 1183c6fd2807SJeff Garzik /* is it pointless to prefer PIO for "safety reasons"? */ 1184c6fd2807SJeff Garzik if (ap->flags & ATA_FLAG_PIO_DMA) { 1185c6fd2807SJeff Garzik tf.protocol = ATA_PROT_ATAPI_DMA; 1186c6fd2807SJeff Garzik tf.feature |= ATAPI_PKT_DMA; 1187c6fd2807SJeff Garzik } else { 1188c6fd2807SJeff Garzik tf.protocol = ATA_PROT_ATAPI; 1189c6fd2807SJeff Garzik tf.lbam = (8 * 1024) & 0xff; 1190c6fd2807SJeff Garzik tf.lbah = (8 * 1024) >> 8; 1191c6fd2807SJeff Garzik } 1192c6fd2807SJeff Garzik 1193c6fd2807SJeff Garzik return ata_exec_internal(dev, &tf, cdb, DMA_FROM_DEVICE, 1194c6fd2807SJeff Garzik sense_buf, SCSI_SENSE_BUFFERSIZE); 1195c6fd2807SJeff Garzik } 1196c6fd2807SJeff Garzik 1197c6fd2807SJeff Garzik /** 1198c6fd2807SJeff Garzik * ata_eh_analyze_serror - analyze SError for a failed port 1199c6fd2807SJeff Garzik * @ap: ATA port to analyze SError for 1200c6fd2807SJeff Garzik * 1201c6fd2807SJeff Garzik * Analyze SError if available and further determine cause of 1202c6fd2807SJeff Garzik * failure. 
1203c6fd2807SJeff Garzik * 1204c6fd2807SJeff Garzik * LOCKING: 1205c6fd2807SJeff Garzik * None. 1206c6fd2807SJeff Garzik */ 1207c6fd2807SJeff Garzik static void ata_eh_analyze_serror(struct ata_port *ap) 1208c6fd2807SJeff Garzik { 1209c6fd2807SJeff Garzik struct ata_eh_context *ehc = &ap->eh_context; 1210c6fd2807SJeff Garzik u32 serror = ehc->i.serror; 1211c6fd2807SJeff Garzik unsigned int err_mask = 0, action = 0; 1212c6fd2807SJeff Garzik 1213c6fd2807SJeff Garzik if (serror & SERR_PERSISTENT) { 1214c6fd2807SJeff Garzik err_mask |= AC_ERR_ATA_BUS; 1215c6fd2807SJeff Garzik action |= ATA_EH_HARDRESET; 1216c6fd2807SJeff Garzik } 1217c6fd2807SJeff Garzik if (serror & 1218c6fd2807SJeff Garzik (SERR_DATA_RECOVERED | SERR_COMM_RECOVERED | SERR_DATA)) { 1219c6fd2807SJeff Garzik err_mask |= AC_ERR_ATA_BUS; 1220c6fd2807SJeff Garzik action |= ATA_EH_SOFTRESET; 1221c6fd2807SJeff Garzik } 1222c6fd2807SJeff Garzik if (serror & SERR_PROTOCOL) { 1223c6fd2807SJeff Garzik err_mask |= AC_ERR_HSM; 1224c6fd2807SJeff Garzik action |= ATA_EH_SOFTRESET; 1225c6fd2807SJeff Garzik } 1226c6fd2807SJeff Garzik if (serror & SERR_INTERNAL) { 1227c6fd2807SJeff Garzik err_mask |= AC_ERR_SYSTEM; 1228771b8dadSTejun Heo action |= ATA_EH_HARDRESET; 1229c6fd2807SJeff Garzik } 1230c6fd2807SJeff Garzik if (serror & (SERR_PHYRDY_CHG | SERR_DEV_XCHG)) 1231c6fd2807SJeff Garzik ata_ehi_hotplugged(&ehc->i); 1232c6fd2807SJeff Garzik 1233c6fd2807SJeff Garzik ehc->i.err_mask |= err_mask; 1234c6fd2807SJeff Garzik ehc->i.action |= action; 1235c6fd2807SJeff Garzik } 1236c6fd2807SJeff Garzik 1237c6fd2807SJeff Garzik /** 1238c6fd2807SJeff Garzik * ata_eh_analyze_ncq_error - analyze NCQ error 1239c6fd2807SJeff Garzik * @ap: ATA port to analyze NCQ error for 1240c6fd2807SJeff Garzik * 1241c6fd2807SJeff Garzik * Read log page 10h, determine the offending qc and acquire 1242c6fd2807SJeff Garzik * error status TF. For NCQ device errors, all LLDDs have to do 1243c6fd2807SJeff Garzik * is setting AC_ERR_DEV in ehi->err_mask. 
This function takes 1244c6fd2807SJeff Garzik * care of the rest. 1245c6fd2807SJeff Garzik * 1246c6fd2807SJeff Garzik * LOCKING: 1247c6fd2807SJeff Garzik * Kernel thread context (may sleep). 1248c6fd2807SJeff Garzik */ 1249c6fd2807SJeff Garzik static void ata_eh_analyze_ncq_error(struct ata_port *ap) 1250c6fd2807SJeff Garzik { 1251c6fd2807SJeff Garzik struct ata_eh_context *ehc = &ap->eh_context; 1252c6fd2807SJeff Garzik struct ata_device *dev = ap->device; 1253c6fd2807SJeff Garzik struct ata_queued_cmd *qc; 1254c6fd2807SJeff Garzik struct ata_taskfile tf; 1255c6fd2807SJeff Garzik int tag, rc; 1256c6fd2807SJeff Garzik 1257c6fd2807SJeff Garzik /* if frozen, we can't do much */ 1258c6fd2807SJeff Garzik if (ap->pflags & ATA_PFLAG_FROZEN) 1259c6fd2807SJeff Garzik return; 1260c6fd2807SJeff Garzik 1261c6fd2807SJeff Garzik /* is it NCQ device error? */ 1262c6fd2807SJeff Garzik if (!ap->sactive || !(ehc->i.err_mask & AC_ERR_DEV)) 1263c6fd2807SJeff Garzik return; 1264c6fd2807SJeff Garzik 1265c6fd2807SJeff Garzik /* has LLDD analyzed already? 
*/ 1266c6fd2807SJeff Garzik for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 1267c6fd2807SJeff Garzik qc = __ata_qc_from_tag(ap, tag); 1268c6fd2807SJeff Garzik 1269c6fd2807SJeff Garzik if (!(qc->flags & ATA_QCFLAG_FAILED)) 1270c6fd2807SJeff Garzik continue; 1271c6fd2807SJeff Garzik 1272c6fd2807SJeff Garzik if (qc->err_mask) 1273c6fd2807SJeff Garzik return; 1274c6fd2807SJeff Garzik } 1275c6fd2807SJeff Garzik 1276c6fd2807SJeff Garzik /* okay, this error is ours */ 1277c6fd2807SJeff Garzik rc = ata_eh_read_log_10h(dev, &tag, &tf); 1278c6fd2807SJeff Garzik if (rc) { 1279c6fd2807SJeff Garzik ata_port_printk(ap, KERN_ERR, "failed to read log page 10h " 1280c6fd2807SJeff Garzik "(errno=%d)\n", rc); 1281c6fd2807SJeff Garzik return; 1282c6fd2807SJeff Garzik } 1283c6fd2807SJeff Garzik 1284c6fd2807SJeff Garzik if (!(ap->sactive & (1 << tag))) { 1285c6fd2807SJeff Garzik ata_port_printk(ap, KERN_ERR, "log page 10h reported " 1286c6fd2807SJeff Garzik "inactive tag %d\n", tag); 1287c6fd2807SJeff Garzik return; 1288c6fd2807SJeff Garzik } 1289c6fd2807SJeff Garzik 1290c6fd2807SJeff Garzik /* we've got the perpetrator, condemn it */ 1291c6fd2807SJeff Garzik qc = __ata_qc_from_tag(ap, tag); 1292c6fd2807SJeff Garzik memcpy(&qc->result_tf, &tf, sizeof(tf)); 12935335b729STejun Heo qc->err_mask |= AC_ERR_DEV | AC_ERR_NCQ; 1294c6fd2807SJeff Garzik ehc->i.err_mask &= ~AC_ERR_DEV; 1295c6fd2807SJeff Garzik } 1296c6fd2807SJeff Garzik 1297c6fd2807SJeff Garzik /** 1298c6fd2807SJeff Garzik * ata_eh_analyze_tf - analyze taskfile of a failed qc 1299c6fd2807SJeff Garzik * @qc: qc to analyze 1300c6fd2807SJeff Garzik * @tf: Taskfile registers to analyze 1301c6fd2807SJeff Garzik * 1302c6fd2807SJeff Garzik * Analyze taskfile of @qc and further determine cause of 1303c6fd2807SJeff Garzik * failure. This function also requests ATAPI sense data if 1304c6fd2807SJeff Garzik * available. 1305c6fd2807SJeff Garzik * 1306c6fd2807SJeff Garzik * LOCKING: 1307c6fd2807SJeff Garzik * Kernel thread context (may sleep).
1308c6fd2807SJeff Garzik * 1309c6fd2807SJeff Garzik * RETURNS: 1310c6fd2807SJeff Garzik * Determined recovery action 1311c6fd2807SJeff Garzik */ 1312c6fd2807SJeff Garzik static unsigned int ata_eh_analyze_tf(struct ata_queued_cmd *qc, 1313c6fd2807SJeff Garzik const struct ata_taskfile *tf) 1314c6fd2807SJeff Garzik { 1315c6fd2807SJeff Garzik unsigned int tmp, action = 0; 1316c6fd2807SJeff Garzik u8 stat = tf->command, err = tf->feature; 1317c6fd2807SJeff Garzik 1318c6fd2807SJeff Garzik if ((stat & (ATA_BUSY | ATA_DRQ | ATA_DRDY)) != ATA_DRDY) { 1319c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_HSM; 1320c6fd2807SJeff Garzik return ATA_EH_SOFTRESET; 1321c6fd2807SJeff Garzik } 1322c6fd2807SJeff Garzik 1323a51d644aSTejun Heo if (stat & (ATA_ERR | ATA_DF)) 1324a51d644aSTejun Heo qc->err_mask |= AC_ERR_DEV; 1325a51d644aSTejun Heo else 1326c6fd2807SJeff Garzik return 0; 1327c6fd2807SJeff Garzik 1328c6fd2807SJeff Garzik switch (qc->dev->class) { 1329c6fd2807SJeff Garzik case ATA_DEV_ATA: 1330c6fd2807SJeff Garzik if (err & ATA_ICRC) 1331c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_ATA_BUS; 1332c6fd2807SJeff Garzik if (err & ATA_UNC) 1333c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_MEDIA; 1334c6fd2807SJeff Garzik if (err & ATA_IDNF) 1335c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_INVALID; 1336c6fd2807SJeff Garzik break; 1337c6fd2807SJeff Garzik 1338c6fd2807SJeff Garzik case ATA_DEV_ATAPI: 1339a569a30dSTejun Heo if (!(qc->ap->pflags & ATA_PFLAG_FROZEN)) { 134056287768SAlbert Lee tmp = atapi_eh_request_sense(qc); 1341c6fd2807SJeff Garzik if (!tmp) { 1342a569a30dSTejun Heo /* ATA_QCFLAG_SENSE_VALID is used to 1343a569a30dSTejun Heo * tell atapi_qc_complete() that sense 1344a569a30dSTejun Heo * data is already valid. 1345c6fd2807SJeff Garzik * 1346c6fd2807SJeff Garzik * TODO: interpret sense data and set 1347c6fd2807SJeff Garzik * appropriate err_mask. 
1348c6fd2807SJeff Garzik */ 1349c6fd2807SJeff Garzik qc->flags |= ATA_QCFLAG_SENSE_VALID; 1350c6fd2807SJeff Garzik } else 1351c6fd2807SJeff Garzik qc->err_mask |= tmp; 1352c6fd2807SJeff Garzik } 1353a569a30dSTejun Heo } 1354c6fd2807SJeff Garzik 1355c6fd2807SJeff Garzik if (qc->err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT | AC_ERR_ATA_BUS)) 1356c6fd2807SJeff Garzik action |= ATA_EH_SOFTRESET; 1357c6fd2807SJeff Garzik 1358c6fd2807SJeff Garzik return action; 1359c6fd2807SJeff Garzik } 1360c6fd2807SJeff Garzik 13617d47e8d4STejun Heo static int ata_eh_categorize_error(int is_io, unsigned int err_mask) 1362c6fd2807SJeff Garzik { 13637d47e8d4STejun Heo if (err_mask & AC_ERR_ATA_BUS) 1364c6fd2807SJeff Garzik return 1; 1365c6fd2807SJeff Garzik 13667d47e8d4STejun Heo if (err_mask & AC_ERR_TIMEOUT) 1367c6fd2807SJeff Garzik return 2; 13687d47e8d4STejun Heo 13697d47e8d4STejun Heo if (is_io) { 13707d47e8d4STejun Heo if (err_mask & AC_ERR_HSM) 13717d47e8d4STejun Heo return 2; 13727d47e8d4STejun Heo if ((err_mask & 13737d47e8d4STejun Heo (AC_ERR_DEV|AC_ERR_MEDIA|AC_ERR_INVALID)) == AC_ERR_DEV) 13747d47e8d4STejun Heo return 3; 1375c6fd2807SJeff Garzik } 1376c6fd2807SJeff Garzik 1377c6fd2807SJeff Garzik return 0; 1378c6fd2807SJeff Garzik } 1379c6fd2807SJeff Garzik 13807d47e8d4STejun Heo struct speed_down_verdict_arg { 1381c6fd2807SJeff Garzik u64 since; 13827d47e8d4STejun Heo int nr_errors[4]; 1383c6fd2807SJeff Garzik }; 1384c6fd2807SJeff Garzik 13857d47e8d4STejun Heo static int speed_down_verdict_cb(struct ata_ering_entry *ent, void *void_arg) 1386c6fd2807SJeff Garzik { 13877d47e8d4STejun Heo struct speed_down_verdict_arg *arg = void_arg; 13887d47e8d4STejun Heo int cat = ata_eh_categorize_error(ent->is_io, ent->err_mask); 1389c6fd2807SJeff Garzik 1390c6fd2807SJeff Garzik if (ent->timestamp < arg->since) 1391c6fd2807SJeff Garzik return -1; 1392c6fd2807SJeff Garzik 13937d47e8d4STejun Heo arg->nr_errors[cat]++; 1394c6fd2807SJeff Garzik return 0; 1395c6fd2807SJeff Garzik } 1396c6fd2807SJeff 
Garzik 1397c6fd2807SJeff Garzik /** 13987d47e8d4STejun Heo * ata_eh_speed_down_verdict - Determine speed down verdict 1399c6fd2807SJeff Garzik * @dev: Device of interest 1400c6fd2807SJeff Garzik * 1401c6fd2807SJeff Garzik * This function examines error ring of @dev and determines 14027d47e8d4STejun Heo * whether NCQ needs to be turned off, transfer speed should be 14037d47e8d4STejun Heo * stepped down, or falling back to PIO is necessary. 1404c6fd2807SJeff Garzik * 14057d47e8d4STejun Heo * Cat-1 is ATA_BUS error for any command. 1406c6fd2807SJeff Garzik * 14077d47e8d4STejun Heo * Cat-2 is TIMEOUT for any command or HSM violation for known 14087d47e8d4STejun Heo * supported commands. 14097d47e8d4STejun Heo * 14107d47e8d4STejun Heo * Cat-3 is is unclassified DEV error for known supported 1411c6fd2807SJeff Garzik * command. 1412c6fd2807SJeff Garzik * 14137d47e8d4STejun Heo * NCQ needs to be turned off if there have been more than 3 14147d47e8d4STejun Heo * Cat-2 + Cat-3 errors during last 10 minutes. 14157d47e8d4STejun Heo * 14167d47e8d4STejun Heo * Speed down is necessary if there have been more than 3 Cat-1 + 14177d47e8d4STejun Heo * Cat-2 errors or 10 Cat-3 errors during last 10 minutes. 14187d47e8d4STejun Heo * 14197d47e8d4STejun Heo * Falling back to PIO mode is necessary if there have been more 14207d47e8d4STejun Heo * than 10 Cat-1 + Cat-2 + Cat-3 errors during last 5 minutes. 14217d47e8d4STejun Heo * 1422c6fd2807SJeff Garzik * LOCKING: 1423c6fd2807SJeff Garzik * Inherited from caller. 1424c6fd2807SJeff Garzik * 1425c6fd2807SJeff Garzik * RETURNS: 14267d47e8d4STejun Heo * OR of ATA_EH_SPDN_* flags. 
1427c6fd2807SJeff Garzik */ 14287d47e8d4STejun Heo static unsigned int ata_eh_speed_down_verdict(struct ata_device *dev) 1429c6fd2807SJeff Garzik { 14307d47e8d4STejun Heo const u64 j5mins = 5LLU * 60 * HZ, j10mins = 10LLU * 60 * HZ; 14317d47e8d4STejun Heo u64 j64 = get_jiffies_64(); 14327d47e8d4STejun Heo struct speed_down_verdict_arg arg; 14337d47e8d4STejun Heo unsigned int verdict = 0; 1434c6fd2807SJeff Garzik 14357d47e8d4STejun Heo /* scan past 10 mins of error history */ 1436c6fd2807SJeff Garzik memset(&arg, 0, sizeof(arg)); 14377d47e8d4STejun Heo arg.since = j64 - min(j64, j10mins); 14387d47e8d4STejun Heo ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg); 1439c6fd2807SJeff Garzik 14407d47e8d4STejun Heo if (arg.nr_errors[2] + arg.nr_errors[3] > 3) 14417d47e8d4STejun Heo verdict |= ATA_EH_SPDN_NCQ_OFF; 14427d47e8d4STejun Heo if (arg.nr_errors[1] + arg.nr_errors[2] > 3 || arg.nr_errors[3] > 10) 14437d47e8d4STejun Heo verdict |= ATA_EH_SPDN_SPEED_DOWN; 1444c6fd2807SJeff Garzik 14457d47e8d4STejun Heo /* scan past 3 mins of error history */ 14467d47e8d4STejun Heo memset(&arg, 0, sizeof(arg)); 14477d47e8d4STejun Heo arg.since = j64 - min(j64, j5mins); 14487d47e8d4STejun Heo ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg); 1449c6fd2807SJeff Garzik 14507d47e8d4STejun Heo if (arg.nr_errors[1] + arg.nr_errors[2] + arg.nr_errors[3] > 10) 14517d47e8d4STejun Heo verdict |= ATA_EH_SPDN_FALLBACK_TO_PIO; 14527d47e8d4STejun Heo 14537d47e8d4STejun Heo return verdict; 1454c6fd2807SJeff Garzik } 1455c6fd2807SJeff Garzik 1456c6fd2807SJeff Garzik /** 1457c6fd2807SJeff Garzik * ata_eh_speed_down - record error and speed down if necessary 1458c6fd2807SJeff Garzik * @dev: Failed device 1459c6fd2807SJeff Garzik * @is_io: Did the device fail during normal IO? 
1460c6fd2807SJeff Garzik * @err_mask: err_mask of the error 1461c6fd2807SJeff Garzik * 1462c6fd2807SJeff Garzik * Record error and examine error history to determine whether 1463c6fd2807SJeff Garzik * adjusting transmission speed is necessary. It also sets 1464c6fd2807SJeff Garzik * transmission limits appropriately if such adjustment is 1465c6fd2807SJeff Garzik * necessary. 1466c6fd2807SJeff Garzik * 1467c6fd2807SJeff Garzik * LOCKING: 1468c6fd2807SJeff Garzik * Kernel thread context (may sleep). 1469c6fd2807SJeff Garzik * 1470c6fd2807SJeff Garzik * RETURNS: 14717d47e8d4STejun Heo * Determined recovery action. 1472c6fd2807SJeff Garzik */ 14737d47e8d4STejun Heo static unsigned int ata_eh_speed_down(struct ata_device *dev, int is_io, 1474c6fd2807SJeff Garzik unsigned int err_mask) 1475c6fd2807SJeff Garzik { 14767d47e8d4STejun Heo unsigned int verdict; 14777d47e8d4STejun Heo unsigned int action = 0; 14787d47e8d4STejun Heo 14797d47e8d4STejun Heo /* don't bother if Cat-0 error */ 14807d47e8d4STejun Heo if (ata_eh_categorize_error(is_io, err_mask) == 0) 1481c6fd2807SJeff Garzik return 0; 1482c6fd2807SJeff Garzik 1483c6fd2807SJeff Garzik /* record error and determine whether speed down is necessary */ 1484c6fd2807SJeff Garzik ata_ering_record(&dev->ering, is_io, err_mask); 14857d47e8d4STejun Heo verdict = ata_eh_speed_down_verdict(dev); 1486c6fd2807SJeff Garzik 14877d47e8d4STejun Heo /* turn off NCQ? */ 14887d47e8d4STejun Heo if ((verdict & ATA_EH_SPDN_NCQ_OFF) && 14897d47e8d4STejun Heo (dev->flags & (ATA_DFLAG_PIO | ATA_DFLAG_NCQ | 14907d47e8d4STejun Heo ATA_DFLAG_NCQ_OFF)) == ATA_DFLAG_NCQ) { 14917d47e8d4STejun Heo dev->flags |= ATA_DFLAG_NCQ_OFF; 14927d47e8d4STejun Heo ata_dev_printk(dev, KERN_WARNING, 14937d47e8d4STejun Heo "NCQ disabled due to excessive errors\n"); 14947d47e8d4STejun Heo goto done; 14957d47e8d4STejun Heo } 1496c6fd2807SJeff Garzik 14977d47e8d4STejun Heo /* speed down? 
*/ 14987d47e8d4STejun Heo if (verdict & ATA_EH_SPDN_SPEED_DOWN) { 1499c6fd2807SJeff Garzik /* speed down SATA link speed if possible */ 15007d47e8d4STejun Heo if (sata_down_spd_limit(dev->ap) == 0) { 15017d47e8d4STejun Heo action |= ATA_EH_HARDRESET; 15027d47e8d4STejun Heo goto done; 15037d47e8d4STejun Heo } 1504c6fd2807SJeff Garzik 1505c6fd2807SJeff Garzik /* lower transfer mode */ 15067d47e8d4STejun Heo if (dev->spdn_cnt < 2) { 15077d47e8d4STejun Heo static const int dma_dnxfer_sel[] = 15087d47e8d4STejun Heo { ATA_DNXFER_DMA, ATA_DNXFER_40C }; 15097d47e8d4STejun Heo static const int pio_dnxfer_sel[] = 15107d47e8d4STejun Heo { ATA_DNXFER_PIO, ATA_DNXFER_FORCE_PIO0 }; 15117d47e8d4STejun Heo int sel; 1512c6fd2807SJeff Garzik 15137d47e8d4STejun Heo if (dev->xfer_shift != ATA_SHIFT_PIO) 15147d47e8d4STejun Heo sel = dma_dnxfer_sel[dev->spdn_cnt]; 15157d47e8d4STejun Heo else 15167d47e8d4STejun Heo sel = pio_dnxfer_sel[dev->spdn_cnt]; 15177d47e8d4STejun Heo 15187d47e8d4STejun Heo dev->spdn_cnt++; 15197d47e8d4STejun Heo 15207d47e8d4STejun Heo if (ata_down_xfermask_limit(dev, sel) == 0) { 15217d47e8d4STejun Heo action |= ATA_EH_SOFTRESET; 15227d47e8d4STejun Heo goto done; 15237d47e8d4STejun Heo } 15247d47e8d4STejun Heo } 15257d47e8d4STejun Heo } 15267d47e8d4STejun Heo 15277d47e8d4STejun Heo /* Fall back to PIO? Slowing down to PIO is meaningless for 15287d47e8d4STejun Heo * SATA. Consider it only for PATA. 
15297d47e8d4STejun Heo */ 15307d47e8d4STejun Heo if ((verdict & ATA_EH_SPDN_FALLBACK_TO_PIO) && (dev->spdn_cnt >= 2) && 15317d47e8d4STejun Heo (dev->ap->cbl != ATA_CBL_SATA) && 15327d47e8d4STejun Heo (dev->xfer_shift != ATA_SHIFT_PIO)) { 15337d47e8d4STejun Heo if (ata_down_xfermask_limit(dev, ATA_DNXFER_FORCE_PIO) == 0) { 15347d47e8d4STejun Heo dev->spdn_cnt = 0; 15357d47e8d4STejun Heo action |= ATA_EH_SOFTRESET; 15367d47e8d4STejun Heo goto done; 15377d47e8d4STejun Heo } 15387d47e8d4STejun Heo } 15397d47e8d4STejun Heo 1540c6fd2807SJeff Garzik return 0; 15417d47e8d4STejun Heo done: 15427d47e8d4STejun Heo /* device has been slowed down, blow error history */ 15437d47e8d4STejun Heo ata_ering_clear(&dev->ering); 15447d47e8d4STejun Heo return action; 1545c6fd2807SJeff Garzik } 1546c6fd2807SJeff Garzik 1547c6fd2807SJeff Garzik /** 1548c6fd2807SJeff Garzik * ata_eh_autopsy - analyze error and determine recovery action 1549c6fd2807SJeff Garzik * @ap: ATA port to perform autopsy on 1550c6fd2807SJeff Garzik * 1551c6fd2807SJeff Garzik * Analyze why @ap failed and determine which recovery action is 1552c6fd2807SJeff Garzik * needed. This function also sets more detailed AC_ERR_* values 1553c6fd2807SJeff Garzik * and fills sense data for ATAPI CHECK SENSE. 1554c6fd2807SJeff Garzik * 1555c6fd2807SJeff Garzik * LOCKING: 1556c6fd2807SJeff Garzik * Kernel thread context (may sleep). 
1557c6fd2807SJeff Garzik */ 1558c6fd2807SJeff Garzik static void ata_eh_autopsy(struct ata_port *ap) 1559c6fd2807SJeff Garzik { 1560c6fd2807SJeff Garzik struct ata_eh_context *ehc = &ap->eh_context; 1561c6fd2807SJeff Garzik unsigned int all_err_mask = 0; 1562c6fd2807SJeff Garzik int tag, is_io = 0; 1563c6fd2807SJeff Garzik u32 serror; 1564c6fd2807SJeff Garzik int rc; 1565c6fd2807SJeff Garzik 1566c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 1567c6fd2807SJeff Garzik 1568c6fd2807SJeff Garzik if (ehc->i.flags & ATA_EHI_NO_AUTOPSY) 1569c6fd2807SJeff Garzik return; 1570c6fd2807SJeff Garzik 1571c6fd2807SJeff Garzik /* obtain and analyze SError */ 1572c6fd2807SJeff Garzik rc = sata_scr_read(ap, SCR_ERROR, &serror); 1573c6fd2807SJeff Garzik if (rc == 0) { 1574c6fd2807SJeff Garzik ehc->i.serror |= serror; 1575c6fd2807SJeff Garzik ata_eh_analyze_serror(ap); 15764e57c517STejun Heo } else if (rc != -EOPNOTSUPP) { 15774e57c517STejun Heo /* SError read failed, force hardreset and probing */ 15784e57c517STejun Heo ata_ehi_schedule_probe(&ehc->i); 1579c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_HARDRESET; 15804e57c517STejun Heo ehc->i.err_mask |= AC_ERR_OTHER; 15814e57c517STejun Heo } 1582c6fd2807SJeff Garzik 1583c6fd2807SJeff Garzik /* analyze NCQ failure */ 1584c6fd2807SJeff Garzik ata_eh_analyze_ncq_error(ap); 1585c6fd2807SJeff Garzik 1586c6fd2807SJeff Garzik /* any real error trumps AC_ERR_OTHER */ 1587c6fd2807SJeff Garzik if (ehc->i.err_mask & ~AC_ERR_OTHER) 1588c6fd2807SJeff Garzik ehc->i.err_mask &= ~AC_ERR_OTHER; 1589c6fd2807SJeff Garzik 1590c6fd2807SJeff Garzik all_err_mask |= ehc->i.err_mask; 1591c6fd2807SJeff Garzik 1592c6fd2807SJeff Garzik for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 1593c6fd2807SJeff Garzik struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 1594c6fd2807SJeff Garzik 1595c6fd2807SJeff Garzik if (!(qc->flags & ATA_QCFLAG_FAILED)) 1596c6fd2807SJeff Garzik continue; 1597c6fd2807SJeff Garzik 1598c6fd2807SJeff Garzik /* inherit upper level err_mask */ 
1599c6fd2807SJeff Garzik qc->err_mask |= ehc->i.err_mask; 1600c6fd2807SJeff Garzik 1601c6fd2807SJeff Garzik /* analyze TF */ 1602c6fd2807SJeff Garzik ehc->i.action |= ata_eh_analyze_tf(qc, &qc->result_tf); 1603c6fd2807SJeff Garzik 1604c6fd2807SJeff Garzik /* DEV errors are probably spurious in case of ATA_BUS error */ 1605c6fd2807SJeff Garzik if (qc->err_mask & AC_ERR_ATA_BUS) 1606c6fd2807SJeff Garzik qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_MEDIA | 1607c6fd2807SJeff Garzik AC_ERR_INVALID); 1608c6fd2807SJeff Garzik 1609c6fd2807SJeff Garzik /* any real error trumps unknown error */ 1610c6fd2807SJeff Garzik if (qc->err_mask & ~AC_ERR_OTHER) 1611c6fd2807SJeff Garzik qc->err_mask &= ~AC_ERR_OTHER; 1612c6fd2807SJeff Garzik 1613c6fd2807SJeff Garzik /* SENSE_VALID trumps dev/unknown error and revalidation */ 1614c6fd2807SJeff Garzik if (qc->flags & ATA_QCFLAG_SENSE_VALID) { 1615c6fd2807SJeff Garzik qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_OTHER); 1616c6fd2807SJeff Garzik ehc->i.action &= ~ATA_EH_REVALIDATE; 1617c6fd2807SJeff Garzik } 1618c6fd2807SJeff Garzik 1619c6fd2807SJeff Garzik /* accumulate error info */ 1620c6fd2807SJeff Garzik ehc->i.dev = qc->dev; 1621c6fd2807SJeff Garzik all_err_mask |= qc->err_mask; 1622c6fd2807SJeff Garzik if (qc->flags & ATA_QCFLAG_IO) 1623c6fd2807SJeff Garzik is_io = 1; 1624c6fd2807SJeff Garzik } 1625c6fd2807SJeff Garzik 1626c6fd2807SJeff Garzik /* enforce default EH actions */ 1627c6fd2807SJeff Garzik if (ap->pflags & ATA_PFLAG_FROZEN || 1628c6fd2807SJeff Garzik all_err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT)) 1629c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_SOFTRESET; 1630c6fd2807SJeff Garzik else if (all_err_mask) 1631c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_REVALIDATE; 1632c6fd2807SJeff Garzik 1633c6fd2807SJeff Garzik /* if we have offending qcs and the associated failed device */ 1634c6fd2807SJeff Garzik if (ehc->i.dev) { 1635c6fd2807SJeff Garzik /* speed down */ 1636c6fd2807SJeff Garzik ehc->i.action |= ata_eh_speed_down(ehc->i.dev, is_io, 
1637c6fd2807SJeff Garzik all_err_mask); 1638c6fd2807SJeff Garzik 1639c6fd2807SJeff Garzik /* perform per-dev EH action only on the offending device */ 1640c6fd2807SJeff Garzik ehc->i.dev_action[ehc->i.dev->devno] |= 1641c6fd2807SJeff Garzik ehc->i.action & ATA_EH_PERDEV_MASK; 1642c6fd2807SJeff Garzik ehc->i.action &= ~ATA_EH_PERDEV_MASK; 1643c6fd2807SJeff Garzik } 1644c6fd2807SJeff Garzik 1645c6fd2807SJeff Garzik DPRINTK("EXIT\n"); 1646c6fd2807SJeff Garzik } 1647c6fd2807SJeff Garzik 1648c6fd2807SJeff Garzik /** 1649c6fd2807SJeff Garzik * ata_eh_report - report error handling to user 1650c6fd2807SJeff Garzik * @ap: ATA port EH is going on 1651c6fd2807SJeff Garzik * 1652c6fd2807SJeff Garzik * Report EH to user. 1653c6fd2807SJeff Garzik * 1654c6fd2807SJeff Garzik * LOCKING: 1655c6fd2807SJeff Garzik * None. 1656c6fd2807SJeff Garzik */ 1657c6fd2807SJeff Garzik static void ata_eh_report(struct ata_port *ap) 1658c6fd2807SJeff Garzik { 1659c6fd2807SJeff Garzik struct ata_eh_context *ehc = &ap->eh_context; 1660c6fd2807SJeff Garzik const char *frozen, *desc; 1661c6fd2807SJeff Garzik int tag, nr_failed = 0; 1662c6fd2807SJeff Garzik 1663c6fd2807SJeff Garzik desc = NULL; 1664c6fd2807SJeff Garzik if (ehc->i.desc[0] != '\0') 1665c6fd2807SJeff Garzik desc = ehc->i.desc; 1666c6fd2807SJeff Garzik 1667c6fd2807SJeff Garzik for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 1668c6fd2807SJeff Garzik struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 1669c6fd2807SJeff Garzik 1670c6fd2807SJeff Garzik if (!(qc->flags & ATA_QCFLAG_FAILED)) 1671c6fd2807SJeff Garzik continue; 1672c6fd2807SJeff Garzik if (qc->flags & ATA_QCFLAG_SENSE_VALID && !qc->err_mask) 1673c6fd2807SJeff Garzik continue; 1674c6fd2807SJeff Garzik 1675c6fd2807SJeff Garzik nr_failed++; 1676c6fd2807SJeff Garzik } 1677c6fd2807SJeff Garzik 1678c6fd2807SJeff Garzik if (!nr_failed && !ehc->i.err_mask) 1679c6fd2807SJeff Garzik return; 1680c6fd2807SJeff Garzik 1681c6fd2807SJeff Garzik frozen = ""; 1682c6fd2807SJeff Garzik if 
(ap->pflags & ATA_PFLAG_FROZEN) 1683c6fd2807SJeff Garzik frozen = " frozen"; 1684c6fd2807SJeff Garzik 1685c6fd2807SJeff Garzik if (ehc->i.dev) { 1686c6fd2807SJeff Garzik ata_dev_printk(ehc->i.dev, KERN_ERR, "exception Emask 0x%x " 1687c6fd2807SJeff Garzik "SAct 0x%x SErr 0x%x action 0x%x%s\n", 1688c6fd2807SJeff Garzik ehc->i.err_mask, ap->sactive, ehc->i.serror, 1689c6fd2807SJeff Garzik ehc->i.action, frozen); 1690c6fd2807SJeff Garzik if (desc) 1691b64bbc39STejun Heo ata_dev_printk(ehc->i.dev, KERN_ERR, "%s\n", desc); 1692c6fd2807SJeff Garzik } else { 1693c6fd2807SJeff Garzik ata_port_printk(ap, KERN_ERR, "exception Emask 0x%x " 1694c6fd2807SJeff Garzik "SAct 0x%x SErr 0x%x action 0x%x%s\n", 1695c6fd2807SJeff Garzik ehc->i.err_mask, ap->sactive, ehc->i.serror, 1696c6fd2807SJeff Garzik ehc->i.action, frozen); 1697c6fd2807SJeff Garzik if (desc) 1698b64bbc39STejun Heo ata_port_printk(ap, KERN_ERR, "%s\n", desc); 1699c6fd2807SJeff Garzik } 1700c6fd2807SJeff Garzik 1701c6fd2807SJeff Garzik for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 17028a937581STejun Heo static const char *dma_str[] = { 17038a937581STejun Heo [DMA_BIDIRECTIONAL] = "bidi", 17048a937581STejun Heo [DMA_TO_DEVICE] = "out", 17058a937581STejun Heo [DMA_FROM_DEVICE] = "in", 17068a937581STejun Heo [DMA_NONE] = "", 17078a937581STejun Heo }; 1708c6fd2807SJeff Garzik struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 17098a937581STejun Heo struct ata_taskfile *cmd = &qc->tf, *res = &qc->result_tf; 1710c6fd2807SJeff Garzik 1711c6fd2807SJeff Garzik if (!(qc->flags & ATA_QCFLAG_FAILED) || !qc->err_mask) 1712c6fd2807SJeff Garzik continue; 1713c6fd2807SJeff Garzik 17148a937581STejun Heo ata_dev_printk(qc->dev, KERN_ERR, 17158a937581STejun Heo "cmd %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x " 1716664e8503STejun Heo "tag %d cdb 0x%x data %u %s\n " 17178a937581STejun Heo "res %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x " 17185335b729STejun Heo "Emask 0x%x (%s)%s\n", 
17198a937581STejun Heo cmd->command, cmd->feature, cmd->nsect, 17208a937581STejun Heo cmd->lbal, cmd->lbam, cmd->lbah, 17218a937581STejun Heo cmd->hob_feature, cmd->hob_nsect, 17228a937581STejun Heo cmd->hob_lbal, cmd->hob_lbam, cmd->hob_lbah, 1723726f0785STejun Heo cmd->device, qc->tag, qc->cdb[0], qc->nbytes, 1724664e8503STejun Heo dma_str[qc->dma_dir], 17258a937581STejun Heo res->command, res->feature, res->nsect, 17268a937581STejun Heo res->lbal, res->lbam, res->lbah, 17278a937581STejun Heo res->hob_feature, res->hob_nsect, 17288a937581STejun Heo res->hob_lbal, res->hob_lbam, res->hob_lbah, 17295335b729STejun Heo res->device, qc->err_mask, ata_err_string(qc->err_mask), 17305335b729STejun Heo qc->err_mask & AC_ERR_NCQ ? " <F>" : ""); 1731c6fd2807SJeff Garzik } 1732c6fd2807SJeff Garzik } 1733c6fd2807SJeff Garzik 1734c6fd2807SJeff Garzik static int ata_do_reset(struct ata_port *ap, ata_reset_fn_t reset, 1735d4b2bab4STejun Heo unsigned int *classes, unsigned long deadline) 1736c6fd2807SJeff Garzik { 1737c6fd2807SJeff Garzik int i, rc; 1738c6fd2807SJeff Garzik 1739c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_DEVICES; i++) 1740c6fd2807SJeff Garzik classes[i] = ATA_DEV_UNKNOWN; 1741c6fd2807SJeff Garzik 1742d4b2bab4STejun Heo rc = reset(ap, classes, deadline); 1743c6fd2807SJeff Garzik if (rc) 1744c6fd2807SJeff Garzik return rc; 1745c6fd2807SJeff Garzik 1746c6fd2807SJeff Garzik /* If any class isn't ATA_DEV_UNKNOWN, consider classification 1747c6fd2807SJeff Garzik * is complete and convert all ATA_DEV_UNKNOWN to 1748c6fd2807SJeff Garzik * ATA_DEV_NONE. 
1749c6fd2807SJeff Garzik */ 1750c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_DEVICES; i++) 1751c6fd2807SJeff Garzik if (classes[i] != ATA_DEV_UNKNOWN) 1752c6fd2807SJeff Garzik break; 1753c6fd2807SJeff Garzik 1754c6fd2807SJeff Garzik if (i < ATA_MAX_DEVICES) 1755c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_DEVICES; i++) 1756c6fd2807SJeff Garzik if (classes[i] == ATA_DEV_UNKNOWN) 1757c6fd2807SJeff Garzik classes[i] = ATA_DEV_NONE; 1758c6fd2807SJeff Garzik 1759c6fd2807SJeff Garzik return 0; 1760c6fd2807SJeff Garzik } 1761c6fd2807SJeff Garzik 1762c6fd2807SJeff Garzik static int ata_eh_followup_srst_needed(int rc, int classify, 1763c6fd2807SJeff Garzik const unsigned int *classes) 1764c6fd2807SJeff Garzik { 1765c6fd2807SJeff Garzik if (rc == -EAGAIN) 1766c6fd2807SJeff Garzik return 1; 1767c6fd2807SJeff Garzik if (rc != 0) 1768c6fd2807SJeff Garzik return 0; 1769c6fd2807SJeff Garzik if (classify && classes[0] == ATA_DEV_UNKNOWN) 1770c6fd2807SJeff Garzik return 1; 1771c6fd2807SJeff Garzik return 0; 1772c6fd2807SJeff Garzik } 1773c6fd2807SJeff Garzik 1774c6fd2807SJeff Garzik static int ata_eh_reset(struct ata_port *ap, int classify, 1775c6fd2807SJeff Garzik ata_prereset_fn_t prereset, ata_reset_fn_t softreset, 1776c6fd2807SJeff Garzik ata_reset_fn_t hardreset, ata_postreset_fn_t postreset) 1777c6fd2807SJeff Garzik { 1778c6fd2807SJeff Garzik struct ata_eh_context *ehc = &ap->eh_context; 1779c6fd2807SJeff Garzik unsigned int *classes = ehc->classes; 1780c6fd2807SJeff Garzik int verbose = !(ehc->i.flags & ATA_EHI_QUIET); 178131daabdaSTejun Heo int try = 0; 178231daabdaSTejun Heo unsigned long deadline; 1783c6fd2807SJeff Garzik unsigned int action; 1784c6fd2807SJeff Garzik ata_reset_fn_t reset; 17858b5bb2faSTejun Heo int i, rc; 1786c6fd2807SJeff Garzik 1787c6fd2807SJeff Garzik /* about to reset */ 1788c6fd2807SJeff Garzik ata_eh_about_to_do(ap, NULL, ehc->i.action & ATA_EH_RESET_MASK); 1789c6fd2807SJeff Garzik 1790c6fd2807SJeff Garzik /* Determine which reset to use and record 
in ehc->i.action. 1791c6fd2807SJeff Garzik * prereset() may examine and modify it. 1792c6fd2807SJeff Garzik */ 1793c6fd2807SJeff Garzik action = ehc->i.action; 1794c6fd2807SJeff Garzik ehc->i.action &= ~ATA_EH_RESET_MASK; 1795c6fd2807SJeff Garzik if (softreset && (!hardreset || (!sata_set_spd_needed(ap) && 1796c6fd2807SJeff Garzik !(action & ATA_EH_HARDRESET)))) 1797c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_SOFTRESET; 1798c6fd2807SJeff Garzik else 1799c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_HARDRESET; 1800c6fd2807SJeff Garzik 1801c6fd2807SJeff Garzik if (prereset) { 180231daabdaSTejun Heo rc = prereset(ap, jiffies + ATA_EH_PRERESET_TIMEOUT); 1803c6fd2807SJeff Garzik if (rc) { 1804c961922bSAlan Cox if (rc == -ENOENT) { 18054aa9ab67STejun Heo ata_port_printk(ap, KERN_DEBUG, 18064aa9ab67STejun Heo "port disabled. ignoring.\n"); 1807c961922bSAlan Cox ap->eh_context.i.action &= ~ATA_EH_RESET_MASK; 18084aa9ab67STejun Heo 18094aa9ab67STejun Heo for (i = 0; i < ATA_MAX_DEVICES; i++) 18104aa9ab67STejun Heo classes[i] = ATA_DEV_NONE; 18114aa9ab67STejun Heo 18124aa9ab67STejun Heo rc = 0; 1813c961922bSAlan Cox } else 1814c6fd2807SJeff Garzik ata_port_printk(ap, KERN_ERR, 1815c6fd2807SJeff Garzik "prereset failed (errno=%d)\n", rc); 1816fccb6ea5STejun Heo goto out; 1817c6fd2807SJeff Garzik } 1818c6fd2807SJeff Garzik } 1819c6fd2807SJeff Garzik 1820c6fd2807SJeff Garzik /* prereset() might have modified ehc->i.action */ 1821c6fd2807SJeff Garzik if (ehc->i.action & ATA_EH_HARDRESET) 1822c6fd2807SJeff Garzik reset = hardreset; 1823c6fd2807SJeff Garzik else if (ehc->i.action & ATA_EH_SOFTRESET) 1824c6fd2807SJeff Garzik reset = softreset; 1825c6fd2807SJeff Garzik else { 1826c6fd2807SJeff Garzik /* prereset told us not to reset, bang classes and return */ 1827c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_DEVICES; i++) 1828c6fd2807SJeff Garzik classes[i] = ATA_DEV_NONE; 1829fccb6ea5STejun Heo rc = 0; 1830fccb6ea5STejun Heo goto out; 1831c6fd2807SJeff Garzik } 1832c6fd2807SJeff 
Garzik 1833c6fd2807SJeff Garzik /* did prereset() screw up? if so, fix up to avoid oopsing */ 1834c6fd2807SJeff Garzik if (!reset) { 1835c6fd2807SJeff Garzik if (softreset) 1836c6fd2807SJeff Garzik reset = softreset; 1837c6fd2807SJeff Garzik else 1838c6fd2807SJeff Garzik reset = hardreset; 1839c6fd2807SJeff Garzik } 1840c6fd2807SJeff Garzik 1841c6fd2807SJeff Garzik retry: 184231daabdaSTejun Heo deadline = jiffies + ata_eh_reset_timeouts[try++]; 184331daabdaSTejun Heo 1844c6fd2807SJeff Garzik /* shut up during boot probing */ 1845c6fd2807SJeff Garzik if (verbose) 1846c6fd2807SJeff Garzik ata_port_printk(ap, KERN_INFO, "%s resetting port\n", 1847c6fd2807SJeff Garzik reset == softreset ? "soft" : "hard"); 1848c6fd2807SJeff Garzik 1849c6fd2807SJeff Garzik /* mark that this EH session started with reset */ 18500d64a233STejun Heo if (reset == hardreset) 18510d64a233STejun Heo ehc->i.flags |= ATA_EHI_DID_HARDRESET; 18520d64a233STejun Heo else 18530d64a233STejun Heo ehc->i.flags |= ATA_EHI_DID_SOFTRESET; 1854c6fd2807SJeff Garzik 185531daabdaSTejun Heo rc = ata_do_reset(ap, reset, classes, deadline); 1856c6fd2807SJeff Garzik 1857c6fd2807SJeff Garzik if (reset == hardreset && 1858c6fd2807SJeff Garzik ata_eh_followup_srst_needed(rc, classify, classes)) { 1859c6fd2807SJeff Garzik /* okay, let's do follow-up softreset */ 1860c6fd2807SJeff Garzik reset = softreset; 1861c6fd2807SJeff Garzik 1862c6fd2807SJeff Garzik if (!reset) { 1863c6fd2807SJeff Garzik ata_port_printk(ap, KERN_ERR, 1864c6fd2807SJeff Garzik "follow-up softreset required " 1865c6fd2807SJeff Garzik "but no softreset avaliable\n"); 1866fccb6ea5STejun Heo rc = -EINVAL; 1867fccb6ea5STejun Heo goto out; 1868c6fd2807SJeff Garzik } 1869c6fd2807SJeff Garzik 1870c6fd2807SJeff Garzik ata_eh_about_to_do(ap, NULL, ATA_EH_RESET_MASK); 187131daabdaSTejun Heo rc = ata_do_reset(ap, reset, classes, deadline); 1872c6fd2807SJeff Garzik 1873c6fd2807SJeff Garzik if (rc == 0 && classify && 1874c6fd2807SJeff Garzik classes[0] == 
ATA_DEV_UNKNOWN) { 1875c6fd2807SJeff Garzik ata_port_printk(ap, KERN_ERR, 1876c6fd2807SJeff Garzik "classification failed\n"); 1877fccb6ea5STejun Heo rc = -EINVAL; 1878fccb6ea5STejun Heo goto out; 1879c6fd2807SJeff Garzik } 1880c6fd2807SJeff Garzik } 1881c6fd2807SJeff Garzik 188231daabdaSTejun Heo if (rc && try < ARRAY_SIZE(ata_eh_reset_timeouts)) { 188331daabdaSTejun Heo unsigned long now = jiffies; 1884c6fd2807SJeff Garzik 188531daabdaSTejun Heo if (time_before(now, deadline)) { 188631daabdaSTejun Heo unsigned long delta = deadline - jiffies; 1887c6fd2807SJeff Garzik 188831daabdaSTejun Heo ata_port_printk(ap, KERN_WARNING, "reset failed " 188931daabdaSTejun Heo "(errno=%d), retrying in %u secs\n", 189031daabdaSTejun Heo rc, (jiffies_to_msecs(delta) + 999) / 1000); 1891c6fd2807SJeff Garzik 189231daabdaSTejun Heo schedule_timeout_uninterruptible(delta); 189331daabdaSTejun Heo } 189431daabdaSTejun Heo 1895f1545154STejun Heo if (rc == -EPIPE || 189631daabdaSTejun Heo try == ARRAY_SIZE(ata_eh_reset_timeouts) - 1) 1897c6fd2807SJeff Garzik sata_down_spd_limit(ap); 1898c6fd2807SJeff Garzik if (hardreset) 1899c6fd2807SJeff Garzik reset = hardreset; 1900c6fd2807SJeff Garzik goto retry; 1901c6fd2807SJeff Garzik } 1902c6fd2807SJeff Garzik 1903c6fd2807SJeff Garzik if (rc == 0) { 1904008a7896STejun Heo u32 sstatus; 1905008a7896STejun Heo 1906c6fd2807SJeff Garzik /* After the reset, the device state is PIO 0 and the 1907c6fd2807SJeff Garzik * controller state is undefined. Record the mode. 
1908c6fd2807SJeff Garzik */ 1909c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_DEVICES; i++) 1910c6fd2807SJeff Garzik ap->device[i].pio_mode = XFER_PIO_0; 1911c6fd2807SJeff Garzik 1912008a7896STejun Heo /* record current link speed */ 1913008a7896STejun Heo if (sata_scr_read(ap, SCR_STATUS, &sstatus) == 0) 1914008a7896STejun Heo ap->sata_spd = (sstatus >> 4) & 0xf; 1915008a7896STejun Heo 1916c6fd2807SJeff Garzik if (postreset) 1917c6fd2807SJeff Garzik postreset(ap, classes); 1918c6fd2807SJeff Garzik 1919c6fd2807SJeff Garzik /* reset successful, schedule revalidation */ 1920c6fd2807SJeff Garzik ata_eh_done(ap, NULL, ehc->i.action & ATA_EH_RESET_MASK); 1921c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_REVALIDATE; 1922c6fd2807SJeff Garzik } 1923fccb6ea5STejun Heo out: 1924fccb6ea5STejun Heo /* clear hotplug flag */ 1925fccb6ea5STejun Heo ehc->i.flags &= ~ATA_EHI_HOTPLUGGED; 1926c6fd2807SJeff Garzik return rc; 1927c6fd2807SJeff Garzik } 1928c6fd2807SJeff Garzik 1929c6fd2807SJeff Garzik static int ata_eh_revalidate_and_attach(struct ata_port *ap, 1930c6fd2807SJeff Garzik struct ata_device **r_failed_dev) 1931c6fd2807SJeff Garzik { 1932c6fd2807SJeff Garzik struct ata_eh_context *ehc = &ap->eh_context; 1933c6fd2807SJeff Garzik struct ata_device *dev; 19348c3c52a8STejun Heo unsigned int new_mask = 0; 1935c6fd2807SJeff Garzik unsigned long flags; 1936c6fd2807SJeff Garzik int i, rc = 0; 1937c6fd2807SJeff Garzik 1938c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 1939c6fd2807SJeff Garzik 19408c3c52a8STejun Heo /* For PATA drive side cable detection to work, IDENTIFY must 19418c3c52a8STejun Heo * be done backwards such that PDIAG- is released by the slave 19428c3c52a8STejun Heo * device before the master device is identified. 
19438c3c52a8STejun Heo */ 19448c3c52a8STejun Heo for (i = ATA_MAX_DEVICES - 1; i >= 0; i--) { 1945bff04647STejun Heo unsigned int action, readid_flags = 0; 1946c6fd2807SJeff Garzik 1947c6fd2807SJeff Garzik dev = &ap->device[i]; 1948c6fd2807SJeff Garzik action = ata_eh_dev_action(dev); 1949c6fd2807SJeff Garzik 1950bff04647STejun Heo if (ehc->i.flags & ATA_EHI_DID_RESET) 1951bff04647STejun Heo readid_flags |= ATA_READID_POSTRESET; 1952bff04647STejun Heo 19539666f400STejun Heo if ((action & ATA_EH_REVALIDATE) && ata_dev_enabled(dev)) { 1954c6fd2807SJeff Garzik if (ata_port_offline(ap)) { 1955c6fd2807SJeff Garzik rc = -EIO; 19568c3c52a8STejun Heo goto err; 1957c6fd2807SJeff Garzik } 1958c6fd2807SJeff Garzik 1959c6fd2807SJeff Garzik ata_eh_about_to_do(ap, dev, ATA_EH_REVALIDATE); 1960bff04647STejun Heo rc = ata_dev_revalidate(dev, readid_flags); 1961c6fd2807SJeff Garzik if (rc) 19628c3c52a8STejun Heo goto err; 1963c6fd2807SJeff Garzik 1964c6fd2807SJeff Garzik ata_eh_done(ap, dev, ATA_EH_REVALIDATE); 1965c6fd2807SJeff Garzik 1966baa1e78aSTejun Heo /* Configuration may have changed, reconfigure 1967baa1e78aSTejun Heo * transfer mode. 
1968baa1e78aSTejun Heo */ 1969baa1e78aSTejun Heo ehc->i.flags |= ATA_EHI_SETMODE; 1970baa1e78aSTejun Heo 1971c6fd2807SJeff Garzik /* schedule the scsi_rescan_device() here */ 1972c6fd2807SJeff Garzik queue_work(ata_aux_wq, &(ap->scsi_rescan_task)); 1973c6fd2807SJeff Garzik } else if (dev->class == ATA_DEV_UNKNOWN && 1974c6fd2807SJeff Garzik ehc->tries[dev->devno] && 1975c6fd2807SJeff Garzik ata_class_enabled(ehc->classes[dev->devno])) { 1976c6fd2807SJeff Garzik dev->class = ehc->classes[dev->devno]; 1977c6fd2807SJeff Garzik 1978bff04647STejun Heo rc = ata_dev_read_id(dev, &dev->class, readid_flags, 1979bff04647STejun Heo dev->id); 19808c3c52a8STejun Heo switch (rc) { 19818c3c52a8STejun Heo case 0: 19828c3c52a8STejun Heo new_mask |= 1 << i; 19838c3c52a8STejun Heo break; 19848c3c52a8STejun Heo case -ENOENT: 198555a8e2c8STejun Heo /* IDENTIFY was issued to non-existent 198655a8e2c8STejun Heo * device. No need to reset. Just 198755a8e2c8STejun Heo * thaw and kill the device. 198855a8e2c8STejun Heo */ 198955a8e2c8STejun Heo ata_eh_thaw_port(ap); 199055a8e2c8STejun Heo dev->class = ATA_DEV_UNKNOWN; 1991c6fd2807SJeff Garzik break; 19928c3c52a8STejun Heo default: 19938c3c52a8STejun Heo dev->class = ATA_DEV_UNKNOWN; 19948c3c52a8STejun Heo goto err; 19958c3c52a8STejun Heo } 19968c3c52a8STejun Heo } 1997c6fd2807SJeff Garzik } 1998c6fd2807SJeff Garzik 1999c1c4e8d5STejun Heo /* PDIAG- should have been released, ask cable type if post-reset */ 2000c1c4e8d5STejun Heo if ((ehc->i.flags & ATA_EHI_DID_RESET) && ap->ops->cable_detect) 2001c1c4e8d5STejun Heo ap->cbl = ap->ops->cable_detect(ap); 2002c1c4e8d5STejun Heo 20038c3c52a8STejun Heo /* Configure new devices forward such that user doesn't see 20048c3c52a8STejun Heo * device detection messages backwards. 
20058c3c52a8STejun Heo */ 20068c3c52a8STejun Heo for (i = 0; i < ATA_MAX_DEVICES; i++) { 20078c3c52a8STejun Heo dev = &ap->device[i]; 20088c3c52a8STejun Heo 20098c3c52a8STejun Heo if (!(new_mask & (1 << i))) 20108c3c52a8STejun Heo continue; 20118c3c52a8STejun Heo 20128c3c52a8STejun Heo ehc->i.flags |= ATA_EHI_PRINTINFO; 20138c3c52a8STejun Heo rc = ata_dev_configure(dev); 20148c3c52a8STejun Heo ehc->i.flags &= ~ATA_EHI_PRINTINFO; 20158c3c52a8STejun Heo if (rc) 20168c3c52a8STejun Heo goto err; 20178c3c52a8STejun Heo 2018c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 2019c6fd2807SJeff Garzik ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG; 2020c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2021baa1e78aSTejun Heo 202255a8e2c8STejun Heo /* new device discovered, configure xfermode */ 2023baa1e78aSTejun Heo ehc->i.flags |= ATA_EHI_SETMODE; 2024c6fd2807SJeff Garzik } 2025c6fd2807SJeff Garzik 20268c3c52a8STejun Heo return 0; 20278c3c52a8STejun Heo 20288c3c52a8STejun Heo err: 2029c6fd2807SJeff Garzik *r_failed_dev = dev; 20308c3c52a8STejun Heo DPRINTK("EXIT rc=%d\n", rc); 2031c6fd2807SJeff Garzik return rc; 2032c6fd2807SJeff Garzik } 2033c6fd2807SJeff Garzik 2034c6fd2807SJeff Garzik static int ata_port_nr_enabled(struct ata_port *ap) 2035c6fd2807SJeff Garzik { 2036c6fd2807SJeff Garzik int i, cnt = 0; 2037c6fd2807SJeff Garzik 2038c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_DEVICES; i++) 2039c6fd2807SJeff Garzik if (ata_dev_enabled(&ap->device[i])) 2040c6fd2807SJeff Garzik cnt++; 2041c6fd2807SJeff Garzik return cnt; 2042c6fd2807SJeff Garzik } 2043c6fd2807SJeff Garzik 2044c6fd2807SJeff Garzik static int ata_port_nr_vacant(struct ata_port *ap) 2045c6fd2807SJeff Garzik { 2046c6fd2807SJeff Garzik int i, cnt = 0; 2047c6fd2807SJeff Garzik 2048c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_DEVICES; i++) 2049c6fd2807SJeff Garzik if (ap->device[i].class == ATA_DEV_UNKNOWN) 2050c6fd2807SJeff Garzik cnt++; 2051c6fd2807SJeff Garzik return cnt; 2052c6fd2807SJeff Garzik } 
2053c6fd2807SJeff Garzik 2054c6fd2807SJeff Garzik static int ata_eh_skip_recovery(struct ata_port *ap) 2055c6fd2807SJeff Garzik { 2056c6fd2807SJeff Garzik struct ata_eh_context *ehc = &ap->eh_context; 2057c6fd2807SJeff Garzik int i; 2058c6fd2807SJeff Garzik 2059c6fd2807SJeff Garzik /* thaw frozen port, resume link and recover failed devices */ 2060c6fd2807SJeff Garzik if ((ap->pflags & ATA_PFLAG_FROZEN) || 2061c6fd2807SJeff Garzik (ehc->i.flags & ATA_EHI_RESUME_LINK) || ata_port_nr_enabled(ap)) 2062c6fd2807SJeff Garzik return 0; 2063c6fd2807SJeff Garzik 2064c6fd2807SJeff Garzik /* skip if class codes for all vacant slots are ATA_DEV_NONE */ 2065c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_DEVICES; i++) { 2066c6fd2807SJeff Garzik struct ata_device *dev = &ap->device[i]; 2067c6fd2807SJeff Garzik 2068c6fd2807SJeff Garzik if (dev->class == ATA_DEV_UNKNOWN && 2069c6fd2807SJeff Garzik ehc->classes[dev->devno] != ATA_DEV_NONE) 2070c6fd2807SJeff Garzik return 0; 2071c6fd2807SJeff Garzik } 2072c6fd2807SJeff Garzik 2073c6fd2807SJeff Garzik return 1; 2074c6fd2807SJeff Garzik } 2075c6fd2807SJeff Garzik 2076fee7ca72STejun Heo static void ata_eh_handle_dev_fail(struct ata_device *dev, int err) 2077fee7ca72STejun Heo { 2078fee7ca72STejun Heo struct ata_port *ap = dev->ap; 2079fee7ca72STejun Heo struct ata_eh_context *ehc = &ap->eh_context; 2080fee7ca72STejun Heo 2081fee7ca72STejun Heo ehc->tries[dev->devno]--; 2082fee7ca72STejun Heo 2083fee7ca72STejun Heo switch (err) { 2084fee7ca72STejun Heo case -ENODEV: 2085fee7ca72STejun Heo /* device missing or wrong IDENTIFY data, schedule probing */ 2086fee7ca72STejun Heo ehc->i.probe_mask |= (1 << dev->devno); 2087fee7ca72STejun Heo case -EINVAL: 2088fee7ca72STejun Heo /* give it just one more chance */ 2089fee7ca72STejun Heo ehc->tries[dev->devno] = min(ehc->tries[dev->devno], 1); 2090fee7ca72STejun Heo case -EIO: 2091fee7ca72STejun Heo if (ehc->tries[dev->devno] == 1) { 2092fee7ca72STejun Heo /* This is the last chance, better to slow 
2093fee7ca72STejun Heo * down than lose it. 2094fee7ca72STejun Heo */ 2095fee7ca72STejun Heo sata_down_spd_limit(ap); 2096fee7ca72STejun Heo ata_down_xfermask_limit(dev, ATA_DNXFER_PIO); 2097fee7ca72STejun Heo } 2098fee7ca72STejun Heo } 2099fee7ca72STejun Heo 2100fee7ca72STejun Heo if (ata_dev_enabled(dev) && !ehc->tries[dev->devno]) { 2101fee7ca72STejun Heo /* disable device if it has used up all its chances */ 2102fee7ca72STejun Heo ata_dev_disable(dev); 2103fee7ca72STejun Heo 2104fee7ca72STejun Heo /* detach if offline */ 2105fee7ca72STejun Heo if (ata_port_offline(ap)) 2106fee7ca72STejun Heo ata_eh_detach_dev(dev); 2107fee7ca72STejun Heo 2108fee7ca72STejun Heo /* probe if requested */ 2109fee7ca72STejun Heo if ((ehc->i.probe_mask & (1 << dev->devno)) && 2110fee7ca72STejun Heo !(ehc->did_probe_mask & (1 << dev->devno))) { 2111fee7ca72STejun Heo ata_eh_detach_dev(dev); 2112fee7ca72STejun Heo ata_dev_init(dev); 2113fee7ca72STejun Heo 2114fee7ca72STejun Heo ehc->tries[dev->devno] = ATA_EH_DEV_TRIES; 2115fee7ca72STejun Heo ehc->did_probe_mask |= (1 << dev->devno); 2116fee7ca72STejun Heo ehc->i.action |= ATA_EH_SOFTRESET; 2117fee7ca72STejun Heo } 2118fee7ca72STejun Heo } else { 2119fee7ca72STejun Heo /* soft didn't work? 
be haaaaard */ 2120fee7ca72STejun Heo if (ehc->i.flags & ATA_EHI_DID_RESET) 2121fee7ca72STejun Heo ehc->i.action |= ATA_EH_HARDRESET; 2122fee7ca72STejun Heo else 2123fee7ca72STejun Heo ehc->i.action |= ATA_EH_SOFTRESET; 2124fee7ca72STejun Heo } 2125fee7ca72STejun Heo } 2126fee7ca72STejun Heo 2127c6fd2807SJeff Garzik /** 2128c6fd2807SJeff Garzik * ata_eh_recover - recover host port after error 2129c6fd2807SJeff Garzik * @ap: host port to recover 2130c6fd2807SJeff Garzik * @prereset: prereset method (can be NULL) 2131c6fd2807SJeff Garzik * @softreset: softreset method (can be NULL) 2132c6fd2807SJeff Garzik * @hardreset: hardreset method (can be NULL) 2133c6fd2807SJeff Garzik * @postreset: postreset method (can be NULL) 2134c6fd2807SJeff Garzik * 2135c6fd2807SJeff Garzik * This is the alpha and omega, eum and yang, heart and soul of 2136c6fd2807SJeff Garzik * libata exception handling. On entry, actions required to 2137c6fd2807SJeff Garzik * recover the port and hotplug requests are recorded in 2138c6fd2807SJeff Garzik * eh_context. This function executes all the operations with 2139c6fd2807SJeff Garzik * appropriate retrials and fallbacks to resurrect failed 2140c6fd2807SJeff Garzik * devices, detach goners and greet newcomers. 2141c6fd2807SJeff Garzik * 2142c6fd2807SJeff Garzik * LOCKING: 2143c6fd2807SJeff Garzik * Kernel thread context (may sleep). 2144c6fd2807SJeff Garzik * 2145c6fd2807SJeff Garzik * RETURNS: 2146c6fd2807SJeff Garzik * 0 on success, -errno on failure. 
2147c6fd2807SJeff Garzik */ 2148c6fd2807SJeff Garzik static int ata_eh_recover(struct ata_port *ap, ata_prereset_fn_t prereset, 2149c6fd2807SJeff Garzik ata_reset_fn_t softreset, ata_reset_fn_t hardreset, 2150c6fd2807SJeff Garzik ata_postreset_fn_t postreset) 2151c6fd2807SJeff Garzik { 2152c6fd2807SJeff Garzik struct ata_eh_context *ehc = &ap->eh_context; 2153c6fd2807SJeff Garzik struct ata_device *dev; 21544ae72a1eSTejun Heo int i, rc; 2155c6fd2807SJeff Garzik 2156c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 2157c6fd2807SJeff Garzik 2158c6fd2807SJeff Garzik /* prep for recovery */ 2159c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_DEVICES; i++) { 2160c6fd2807SJeff Garzik dev = &ap->device[i]; 2161c6fd2807SJeff Garzik 2162c6fd2807SJeff Garzik ehc->tries[dev->devno] = ATA_EH_DEV_TRIES; 2163c6fd2807SJeff Garzik 216479a55b72STejun Heo /* collect port action mask recorded in dev actions */ 216579a55b72STejun Heo ehc->i.action |= ehc->i.dev_action[i] & ~ATA_EH_PERDEV_MASK; 216679a55b72STejun Heo ehc->i.dev_action[i] &= ATA_EH_PERDEV_MASK; 216779a55b72STejun Heo 2168c6fd2807SJeff Garzik /* process hotplug request */ 2169c6fd2807SJeff Garzik if (dev->flags & ATA_DFLAG_DETACH) 2170c6fd2807SJeff Garzik ata_eh_detach_dev(dev); 2171c6fd2807SJeff Garzik 2172c6fd2807SJeff Garzik if (!ata_dev_enabled(dev) && 2173c6fd2807SJeff Garzik ((ehc->i.probe_mask & (1 << dev->devno)) && 2174c6fd2807SJeff Garzik !(ehc->did_probe_mask & (1 << dev->devno)))) { 2175c6fd2807SJeff Garzik ata_eh_detach_dev(dev); 2176c6fd2807SJeff Garzik ata_dev_init(dev); 2177c6fd2807SJeff Garzik ehc->did_probe_mask |= (1 << dev->devno); 2178c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_SOFTRESET; 2179c6fd2807SJeff Garzik } 2180c6fd2807SJeff Garzik } 2181c6fd2807SJeff Garzik 2182c6fd2807SJeff Garzik retry: 2183c6fd2807SJeff Garzik rc = 0; 2184c6fd2807SJeff Garzik 2185c6fd2807SJeff Garzik /* if UNLOADING, finish immediately */ 2186c6fd2807SJeff Garzik if (ap->pflags & ATA_PFLAG_UNLOADING) 2187c6fd2807SJeff Garzik goto 
out; 2188c6fd2807SJeff Garzik 2189c6fd2807SJeff Garzik /* skip EH if possible. */ 2190c6fd2807SJeff Garzik if (ata_eh_skip_recovery(ap)) 2191c6fd2807SJeff Garzik ehc->i.action = 0; 2192c6fd2807SJeff Garzik 2193c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_DEVICES; i++) 2194c6fd2807SJeff Garzik ehc->classes[i] = ATA_DEV_UNKNOWN; 2195c6fd2807SJeff Garzik 2196c6fd2807SJeff Garzik /* reset */ 2197c6fd2807SJeff Garzik if (ehc->i.action & ATA_EH_RESET_MASK) { 2198c6fd2807SJeff Garzik ata_eh_freeze_port(ap); 2199c6fd2807SJeff Garzik 2200c6fd2807SJeff Garzik rc = ata_eh_reset(ap, ata_port_nr_vacant(ap), prereset, 2201c6fd2807SJeff Garzik softreset, hardreset, postreset); 2202c6fd2807SJeff Garzik if (rc) { 2203c6fd2807SJeff Garzik ata_port_printk(ap, KERN_ERR, 2204c6fd2807SJeff Garzik "reset failed, giving up\n"); 2205c6fd2807SJeff Garzik goto out; 2206c6fd2807SJeff Garzik } 2207c6fd2807SJeff Garzik 2208c6fd2807SJeff Garzik ata_eh_thaw_port(ap); 2209c6fd2807SJeff Garzik } 2210c6fd2807SJeff Garzik 2211c6fd2807SJeff Garzik /* revalidate existing devices and attach new ones */ 2212c6fd2807SJeff Garzik rc = ata_eh_revalidate_and_attach(ap, &dev); 2213c6fd2807SJeff Garzik if (rc) 2214c6fd2807SJeff Garzik goto dev_fail; 2215c6fd2807SJeff Garzik 2216baa1e78aSTejun Heo /* configure transfer mode if necessary */ 2217baa1e78aSTejun Heo if (ehc->i.flags & ATA_EHI_SETMODE) { 2218c6fd2807SJeff Garzik rc = ata_set_mode(ap, &dev); 22194ae72a1eSTejun Heo if (rc) 2220c6fd2807SJeff Garzik goto dev_fail; 2221baa1e78aSTejun Heo ehc->i.flags &= ~ATA_EHI_SETMODE; 2222c6fd2807SJeff Garzik } 2223c6fd2807SJeff Garzik 2224c6fd2807SJeff Garzik goto out; 2225c6fd2807SJeff Garzik 2226c6fd2807SJeff Garzik dev_fail: 2227fee7ca72STejun Heo ata_eh_handle_dev_fail(dev, rc); 2228c6fd2807SJeff Garzik 2229c6fd2807SJeff Garzik if (ata_port_nr_enabled(ap)) { 2230c6fd2807SJeff Garzik ata_port_printk(ap, KERN_WARNING, "failed to recover some " 2231c6fd2807SJeff Garzik "devices, retrying in 5 secs\n"); 
2232c6fd2807SJeff Garzik ssleep(5); 2233c6fd2807SJeff Garzik } else { 2234c6fd2807SJeff Garzik /* no device left, repeat fast */ 2235c6fd2807SJeff Garzik msleep(500); 2236c6fd2807SJeff Garzik } 2237c6fd2807SJeff Garzik 2238c6fd2807SJeff Garzik goto retry; 2239c6fd2807SJeff Garzik 2240c6fd2807SJeff Garzik out: 2241c6fd2807SJeff Garzik if (rc) { 2242c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_DEVICES; i++) 2243c6fd2807SJeff Garzik ata_dev_disable(&ap->device[i]); 2244c6fd2807SJeff Garzik } 2245c6fd2807SJeff Garzik 2246c6fd2807SJeff Garzik DPRINTK("EXIT, rc=%d\n", rc); 2247c6fd2807SJeff Garzik return rc; 2248c6fd2807SJeff Garzik } 2249c6fd2807SJeff Garzik 2250c6fd2807SJeff Garzik /** 2251c6fd2807SJeff Garzik * ata_eh_finish - finish up EH 2252c6fd2807SJeff Garzik * @ap: host port to finish EH for 2253c6fd2807SJeff Garzik * 2254c6fd2807SJeff Garzik * Recovery is complete. Clean up EH states and retry or finish 2255c6fd2807SJeff Garzik * failed qcs. 2256c6fd2807SJeff Garzik * 2257c6fd2807SJeff Garzik * LOCKING: 2258c6fd2807SJeff Garzik * None. 2259c6fd2807SJeff Garzik */ 2260c6fd2807SJeff Garzik static void ata_eh_finish(struct ata_port *ap) 2261c6fd2807SJeff Garzik { 2262c6fd2807SJeff Garzik int tag; 2263c6fd2807SJeff Garzik 2264c6fd2807SJeff Garzik /* retry or finish qcs */ 2265c6fd2807SJeff Garzik for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 2266c6fd2807SJeff Garzik struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 2267c6fd2807SJeff Garzik 2268c6fd2807SJeff Garzik if (!(qc->flags & ATA_QCFLAG_FAILED)) 2269c6fd2807SJeff Garzik continue; 2270c6fd2807SJeff Garzik 2271c6fd2807SJeff Garzik if (qc->err_mask) { 2272c6fd2807SJeff Garzik /* FIXME: Once EH migration is complete, 2273c6fd2807SJeff Garzik * generate sense data in this function, 2274c6fd2807SJeff Garzik * considering both err_mask and tf. 
2275c6fd2807SJeff Garzik */ 2276c6fd2807SJeff Garzik if (qc->err_mask & AC_ERR_INVALID) 2277c6fd2807SJeff Garzik ata_eh_qc_complete(qc); 2278c6fd2807SJeff Garzik else 2279c6fd2807SJeff Garzik ata_eh_qc_retry(qc); 2280c6fd2807SJeff Garzik } else { 2281c6fd2807SJeff Garzik if (qc->flags & ATA_QCFLAG_SENSE_VALID) { 2282c6fd2807SJeff Garzik ata_eh_qc_complete(qc); 2283c6fd2807SJeff Garzik } else { 2284c6fd2807SJeff Garzik /* feed zero TF to sense generation */ 2285c6fd2807SJeff Garzik memset(&qc->result_tf, 0, sizeof(qc->result_tf)); 2286c6fd2807SJeff Garzik ata_eh_qc_retry(qc); 2287c6fd2807SJeff Garzik } 2288c6fd2807SJeff Garzik } 2289c6fd2807SJeff Garzik } 2290c6fd2807SJeff Garzik } 2291c6fd2807SJeff Garzik 2292c6fd2807SJeff Garzik /** 2293c6fd2807SJeff Garzik * ata_do_eh - do standard error handling 2294c6fd2807SJeff Garzik * @ap: host port to handle error for 2295c6fd2807SJeff Garzik * @prereset: prereset method (can be NULL) 2296c6fd2807SJeff Garzik * @softreset: softreset method (can be NULL) 2297c6fd2807SJeff Garzik * @hardreset: hardreset method (can be NULL) 2298c6fd2807SJeff Garzik * @postreset: postreset method (can be NULL) 2299c6fd2807SJeff Garzik * 2300c6fd2807SJeff Garzik * Perform standard error handling sequence. 2301c6fd2807SJeff Garzik * 2302c6fd2807SJeff Garzik * LOCKING: 2303c6fd2807SJeff Garzik * Kernel thread context (may sleep). 
2304c6fd2807SJeff Garzik */ 2305c6fd2807SJeff Garzik void ata_do_eh(struct ata_port *ap, ata_prereset_fn_t prereset, 2306c6fd2807SJeff Garzik ata_reset_fn_t softreset, ata_reset_fn_t hardreset, 2307c6fd2807SJeff Garzik ata_postreset_fn_t postreset) 2308c6fd2807SJeff Garzik { 2309c6fd2807SJeff Garzik ata_eh_autopsy(ap); 2310c6fd2807SJeff Garzik ata_eh_report(ap); 2311c6fd2807SJeff Garzik ata_eh_recover(ap, prereset, softreset, hardreset, postreset); 2312c6fd2807SJeff Garzik ata_eh_finish(ap); 2313c6fd2807SJeff Garzik } 2314c6fd2807SJeff Garzik 23156ffa01d8STejun Heo #ifdef CONFIG_PM 2316c6fd2807SJeff Garzik /** 2317c6fd2807SJeff Garzik * ata_eh_handle_port_suspend - perform port suspend operation 2318c6fd2807SJeff Garzik * @ap: port to suspend 2319c6fd2807SJeff Garzik * 2320c6fd2807SJeff Garzik * Suspend @ap. 2321c6fd2807SJeff Garzik * 2322c6fd2807SJeff Garzik * LOCKING: 2323c6fd2807SJeff Garzik * Kernel thread context (may sleep). 2324c6fd2807SJeff Garzik */ 2325c6fd2807SJeff Garzik static void ata_eh_handle_port_suspend(struct ata_port *ap) 2326c6fd2807SJeff Garzik { 2327c6fd2807SJeff Garzik unsigned long flags; 2328c6fd2807SJeff Garzik int rc = 0; 2329c6fd2807SJeff Garzik 2330c6fd2807SJeff Garzik /* are we suspending? 
*/ 2331c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 2332c6fd2807SJeff Garzik if (!(ap->pflags & ATA_PFLAG_PM_PENDING) || 2333c6fd2807SJeff Garzik ap->pm_mesg.event == PM_EVENT_ON) { 2334c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2335c6fd2807SJeff Garzik return; 2336c6fd2807SJeff Garzik } 2337c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2338c6fd2807SJeff Garzik 2339c6fd2807SJeff Garzik WARN_ON(ap->pflags & ATA_PFLAG_SUSPENDED); 2340c6fd2807SJeff Garzik 234164578a3dSTejun Heo /* tell ACPI we're suspending */ 234264578a3dSTejun Heo rc = ata_acpi_on_suspend(ap); 234364578a3dSTejun Heo if (rc) 234464578a3dSTejun Heo goto out; 234564578a3dSTejun Heo 2346c6fd2807SJeff Garzik /* suspend */ 2347c6fd2807SJeff Garzik ata_eh_freeze_port(ap); 2348c6fd2807SJeff Garzik 2349c6fd2807SJeff Garzik if (ap->ops->port_suspend) 2350c6fd2807SJeff Garzik rc = ap->ops->port_suspend(ap, ap->pm_mesg); 2351c6fd2807SJeff Garzik 235264578a3dSTejun Heo out: 2353c6fd2807SJeff Garzik /* report result */ 2354c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 2355c6fd2807SJeff Garzik 2356c6fd2807SJeff Garzik ap->pflags &= ~ATA_PFLAG_PM_PENDING; 2357c6fd2807SJeff Garzik if (rc == 0) 2358c6fd2807SJeff Garzik ap->pflags |= ATA_PFLAG_SUSPENDED; 235964578a3dSTejun Heo else if (ap->pflags & ATA_PFLAG_FROZEN) 2360c6fd2807SJeff Garzik ata_port_schedule_eh(ap); 2361c6fd2807SJeff Garzik 2362c6fd2807SJeff Garzik if (ap->pm_result) { 2363c6fd2807SJeff Garzik *ap->pm_result = rc; 2364c6fd2807SJeff Garzik ap->pm_result = NULL; 2365c6fd2807SJeff Garzik } 2366c6fd2807SJeff Garzik 2367c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2368c6fd2807SJeff Garzik 2369c6fd2807SJeff Garzik return; 2370c6fd2807SJeff Garzik } 2371c6fd2807SJeff Garzik 2372c6fd2807SJeff Garzik /** 2373c6fd2807SJeff Garzik * ata_eh_handle_port_resume - perform port resume operation 2374c6fd2807SJeff Garzik * @ap: port to resume 2375c6fd2807SJeff Garzik * 2376c6fd2807SJeff Garzik * 
Resume @ap. 2377c6fd2807SJeff Garzik * 2378c6fd2807SJeff Garzik * LOCKING: 2379c6fd2807SJeff Garzik * Kernel thread context (may sleep). 2380c6fd2807SJeff Garzik */ 2381c6fd2807SJeff Garzik static void ata_eh_handle_port_resume(struct ata_port *ap) 2382c6fd2807SJeff Garzik { 2383c6fd2807SJeff Garzik unsigned long flags; 23849666f400STejun Heo int rc = 0; 2385c6fd2807SJeff Garzik 2386c6fd2807SJeff Garzik /* are we resuming? */ 2387c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 2388c6fd2807SJeff Garzik if (!(ap->pflags & ATA_PFLAG_PM_PENDING) || 2389c6fd2807SJeff Garzik ap->pm_mesg.event != PM_EVENT_ON) { 2390c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2391c6fd2807SJeff Garzik return; 2392c6fd2807SJeff Garzik } 2393c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2394c6fd2807SJeff Garzik 23959666f400STejun Heo WARN_ON(!(ap->pflags & ATA_PFLAG_SUSPENDED)); 2396c6fd2807SJeff Garzik 2397c6fd2807SJeff Garzik if (ap->ops->port_resume) 2398c6fd2807SJeff Garzik rc = ap->ops->port_resume(ap); 2399c6fd2807SJeff Garzik 24006746544cSTejun Heo /* tell ACPI that we're resuming */ 24016746544cSTejun Heo ata_acpi_on_resume(ap); 24026746544cSTejun Heo 24039666f400STejun Heo /* report result */ 2404c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 2405c6fd2807SJeff Garzik ap->pflags &= ~(ATA_PFLAG_PM_PENDING | ATA_PFLAG_SUSPENDED); 2406c6fd2807SJeff Garzik if (ap->pm_result) { 2407c6fd2807SJeff Garzik *ap->pm_result = rc; 2408c6fd2807SJeff Garzik ap->pm_result = NULL; 2409c6fd2807SJeff Garzik } 2410c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2411c6fd2807SJeff Garzik } 24126ffa01d8STejun Heo #endif /* CONFIG_PM */ 2413