1c6fd2807SJeff Garzik /* 2c6fd2807SJeff Garzik * libata-eh.c - libata error handling 3c6fd2807SJeff Garzik * 4c6fd2807SJeff Garzik * Maintained by: Jeff Garzik <jgarzik@pobox.com> 5c6fd2807SJeff Garzik * Please ALWAYS copy linux-ide@vger.kernel.org 6c6fd2807SJeff Garzik * on emails. 7c6fd2807SJeff Garzik * 8c6fd2807SJeff Garzik * Copyright 2006 Tejun Heo <htejun@gmail.com> 9c6fd2807SJeff Garzik * 10c6fd2807SJeff Garzik * 11c6fd2807SJeff Garzik * This program is free software; you can redistribute it and/or 12c6fd2807SJeff Garzik * modify it under the terms of the GNU General Public License as 13c6fd2807SJeff Garzik * published by the Free Software Foundation; either version 2, or 14c6fd2807SJeff Garzik * (at your option) any later version. 15c6fd2807SJeff Garzik * 16c6fd2807SJeff Garzik * This program is distributed in the hope that it will be useful, 17c6fd2807SJeff Garzik * but WITHOUT ANY WARRANTY; without even the implied warranty of 18c6fd2807SJeff Garzik * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 19c6fd2807SJeff Garzik * General Public License for more details. 20c6fd2807SJeff Garzik * 21c6fd2807SJeff Garzik * You should have received a copy of the GNU General Public License 22c6fd2807SJeff Garzik * along with this program; see the file COPYING. If not, write to 23c6fd2807SJeff Garzik * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, 24c6fd2807SJeff Garzik * USA. 25c6fd2807SJeff Garzik * 26c6fd2807SJeff Garzik * 27c6fd2807SJeff Garzik * libata documentation is available via 'make {ps|pdf}docs', 28c6fd2807SJeff Garzik * as Documentation/DocBook/libata.* 29c6fd2807SJeff Garzik * 30c6fd2807SJeff Garzik * Hardware documentation available from http://www.t13.org/ and 31c6fd2807SJeff Garzik * http://www.sata-io.org/ 32c6fd2807SJeff Garzik * 33c6fd2807SJeff Garzik */ 34c6fd2807SJeff Garzik 35c6fd2807SJeff Garzik #include <linux/kernel.h> 36c6fd2807SJeff Garzik #include <scsi/scsi.h> 37c6fd2807SJeff Garzik #include <scsi/scsi_host.h> 38c6fd2807SJeff Garzik #include <scsi/scsi_eh.h> 39c6fd2807SJeff Garzik #include <scsi/scsi_device.h> 40c6fd2807SJeff Garzik #include <scsi/scsi_cmnd.h> 41c6fd2807SJeff Garzik #include "../scsi/scsi_transport_api.h" 42c6fd2807SJeff Garzik 43c6fd2807SJeff Garzik #include <linux/libata.h> 44c6fd2807SJeff Garzik 45c6fd2807SJeff Garzik #include "libata.h" 46c6fd2807SJeff Garzik 477d47e8d4STejun Heo enum { 487d47e8d4STejun Heo ATA_EH_SPDN_NCQ_OFF = (1 << 0), 497d47e8d4STejun Heo ATA_EH_SPDN_SPEED_DOWN = (1 << 1), 507d47e8d4STejun Heo ATA_EH_SPDN_FALLBACK_TO_PIO = (1 << 2), 517d47e8d4STejun Heo }; 527d47e8d4STejun Heo 5331daabdaSTejun Heo /* Waiting in ->prereset can never be reliable. It's sometimes nice 5431daabdaSTejun Heo * to wait there but it can't be depended upon; otherwise, we wouldn't 5531daabdaSTejun Heo * be resetting. Just give it enough time for most drives to spin up. 5631daabdaSTejun Heo */ 5731daabdaSTejun Heo enum { 5831daabdaSTejun Heo ATA_EH_PRERESET_TIMEOUT = 10 * HZ, 595ddf24c5STejun Heo ATA_EH_FASTDRAIN_INTERVAL = 3 * HZ, 6031daabdaSTejun Heo }; 6131daabdaSTejun Heo 6231daabdaSTejun Heo /* The following table determines how we sequence resets. Each entry 6331daabdaSTejun Heo * represents timeout for that try. The first try can be soft or 6431daabdaSTejun Heo * hardreset. All others are hardreset if available. In most cases 6531daabdaSTejun Heo * the first reset w/ 10sec timeout should succeed. Following entries 6631daabdaSTejun Heo * are mostly for error handling, hotplug and retarded devices. 6731daabdaSTejun Heo */ 6831daabdaSTejun Heo static const unsigned long ata_eh_reset_timeouts[] = { 6931daabdaSTejun Heo 10 * HZ, /* most drives spin up by 10sec */ 7031daabdaSTejun Heo 10 * HZ, /* > 99% working drives spin up before 20sec */ 7131daabdaSTejun Heo 35 * HZ, /* give > 30 secs of idleness for retarded devices */ 7231daabdaSTejun Heo 5 * HZ, /* and sweet one last chance */ 7331daabdaSTejun Heo /* > 1 min has elapsed, give up */ 7431daabdaSTejun Heo }; 7531daabdaSTejun Heo 76c6fd2807SJeff Garzik static void __ata_port_freeze(struct ata_port *ap); 77c6fd2807SJeff Garzik static void ata_eh_finish(struct ata_port *ap); 786ffa01d8STejun Heo #ifdef CONFIG_PM 79c6fd2807SJeff Garzik static void ata_eh_handle_port_suspend(struct ata_port *ap); 80c6fd2807SJeff Garzik static void ata_eh_handle_port_resume(struct ata_port *ap); 816ffa01d8STejun Heo #else /* CONFIG_PM */ 826ffa01d8STejun Heo static void ata_eh_handle_port_suspend(struct ata_port *ap) 836ffa01d8STejun Heo { } 846ffa01d8STejun Heo 856ffa01d8STejun Heo static void ata_eh_handle_port_resume(struct ata_port *ap) 866ffa01d8STejun Heo { } 876ffa01d8STejun Heo #endif /* CONFIG_PM */ 88c6fd2807SJeff Garzik 89b64bbc39STejun Heo static void __ata_ehi_pushv_desc(struct ata_eh_info *ehi, const char *fmt, 90b64bbc39STejun Heo va_list args) 91b64bbc39STejun Heo { 92b64bbc39STejun Heo ehi->desc_len += vscnprintf(ehi->desc + ehi->desc_len, 93b64bbc39STejun Heo ATA_EH_DESC_LEN - ehi->desc_len, 94b64bbc39STejun Heo fmt, args); 95b64bbc39STejun Heo } 96b64bbc39STejun Heo 97b64bbc39STejun Heo /** 98b64bbc39STejun Heo * __ata_ehi_push_desc - push error description without adding separator 99b64bbc39STejun Heo * @ehi: target EHI 100b64bbc39STejun Heo * @fmt: printf format string 101b64bbc39STejun Heo * 102b64bbc39STejun Heo * Format string according to @fmt and append it to @ehi->desc. 103b64bbc39STejun Heo * 104b64bbc39STejun Heo * LOCKING: 105b64bbc39STejun Heo * spin_lock_irqsave(host lock) 106b64bbc39STejun Heo */ 107b64bbc39STejun Heo void __ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...) 108b64bbc39STejun Heo { 109b64bbc39STejun Heo va_list args; 110b64bbc39STejun Heo 111b64bbc39STejun Heo va_start(args, fmt); 112b64bbc39STejun Heo __ata_ehi_pushv_desc(ehi, fmt, args); 113b64bbc39STejun Heo va_end(args); 114b64bbc39STejun Heo } 115b64bbc39STejun Heo 116b64bbc39STejun Heo /** 117b64bbc39STejun Heo * ata_ehi_push_desc - push error description with separator 118b64bbc39STejun Heo * @ehi: target EHI 119b64bbc39STejun Heo * @fmt: printf format string 120b64bbc39STejun Heo * 121b64bbc39STejun Heo * Format string according to @fmt and append it to @ehi->desc. 122b64bbc39STejun Heo * If @ehi->desc is not empty, ", " is added in-between. 123b64bbc39STejun Heo * 124b64bbc39STejun Heo * LOCKING: 125b64bbc39STejun Heo * spin_lock_irqsave(host lock) 126b64bbc39STejun Heo */ 127b64bbc39STejun Heo void ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...) 128b64bbc39STejun Heo { 129b64bbc39STejun Heo va_list args; 130b64bbc39STejun Heo 131b64bbc39STejun Heo if (ehi->desc_len) 132b64bbc39STejun Heo __ata_ehi_push_desc(ehi, ", "); 133b64bbc39STejun Heo 134b64bbc39STejun Heo va_start(args, fmt); 135b64bbc39STejun Heo __ata_ehi_pushv_desc(ehi, fmt, args); 136b64bbc39STejun Heo va_end(args); 137b64bbc39STejun Heo } 138b64bbc39STejun Heo 139b64bbc39STejun Heo /** 140b64bbc39STejun Heo * ata_ehi_clear_desc - clean error description 141b64bbc39STejun Heo * @ehi: target EHI 142b64bbc39STejun Heo * 143b64bbc39STejun Heo * Clear @ehi->desc. 144b64bbc39STejun Heo * 145b64bbc39STejun Heo * LOCKING: 146b64bbc39STejun Heo * spin_lock_irqsave(host lock) 147b64bbc39STejun Heo */ 148b64bbc39STejun Heo void ata_ehi_clear_desc(struct ata_eh_info *ehi) 149b64bbc39STejun Heo { 150b64bbc39STejun Heo ehi->desc[0] = '\0'; 151b64bbc39STejun Heo ehi->desc_len = 0; 152b64bbc39STejun Heo } 153b64bbc39STejun Heo 154cbcdd875STejun Heo /** 155cbcdd875STejun Heo * ata_port_desc - append port description 156cbcdd875STejun Heo * @ap: target ATA port 157cbcdd875STejun Heo * @fmt: printf format string 158cbcdd875STejun Heo * 159cbcdd875STejun Heo * Format string according to @fmt and append it to port 160cbcdd875STejun Heo * description. If port description is not empty, " " is added 161cbcdd875STejun Heo * in-between. This function is to be used while initializing 162cbcdd875STejun Heo * ata_host. The description is printed on host registration. 163cbcdd875STejun Heo * 164cbcdd875STejun Heo * LOCKING: 165cbcdd875STejun Heo * None. 166cbcdd875STejun Heo */ 167cbcdd875STejun Heo void ata_port_desc(struct ata_port *ap, const char *fmt, ...) 168cbcdd875STejun Heo { 169cbcdd875STejun Heo va_list args; 170cbcdd875STejun Heo 171cbcdd875STejun Heo WARN_ON(!(ap->pflags & ATA_PFLAG_INITIALIZING)); 172cbcdd875STejun Heo 173cbcdd875STejun Heo if (ap->link.eh_info.desc_len) 174cbcdd875STejun Heo __ata_ehi_push_desc(&ap->link.eh_info, " "); 175cbcdd875STejun Heo 176cbcdd875STejun Heo va_start(args, fmt); 177cbcdd875STejun Heo __ata_ehi_pushv_desc(&ap->link.eh_info, fmt, args); 178cbcdd875STejun Heo va_end(args); 179cbcdd875STejun Heo } 180cbcdd875STejun Heo 181cbcdd875STejun Heo #ifdef CONFIG_PCI 182cbcdd875STejun Heo 183cbcdd875STejun Heo /** 184cbcdd875STejun Heo * ata_port_pbar_desc - append PCI BAR description 185cbcdd875STejun Heo * @ap: target ATA port 186cbcdd875STejun Heo * @bar: target PCI BAR 187cbcdd875STejun Heo * @offset: offset into PCI BAR 188cbcdd875STejun Heo * @name: name of the area 189cbcdd875STejun Heo * 190cbcdd875STejun Heo * If @offset is negative, this function formats a string which 191cbcdd875STejun Heo * contains the name, address, size and type of the BAR and 192cbcdd875STejun Heo * appends it to the port description. If @offset is zero or 193cbcdd875STejun Heo * positive, only name and offsetted address is appended. 194cbcdd875STejun Heo * 195cbcdd875STejun Heo * LOCKING: 196cbcdd875STejun Heo * None. 197cbcdd875STejun Heo */ 198cbcdd875STejun Heo void ata_port_pbar_desc(struct ata_port *ap, int bar, ssize_t offset, 199cbcdd875STejun Heo const char *name) 200cbcdd875STejun Heo { 201cbcdd875STejun Heo struct pci_dev *pdev = to_pci_dev(ap->host->dev); 202cbcdd875STejun Heo char *type = ""; 203cbcdd875STejun Heo unsigned long long start, len; 204cbcdd875STejun Heo 205cbcdd875STejun Heo if (pci_resource_flags(pdev, bar) & IORESOURCE_MEM) 206cbcdd875STejun Heo type = "m"; 207cbcdd875STejun Heo else if (pci_resource_flags(pdev, bar) & IORESOURCE_IO) 208cbcdd875STejun Heo type = "i"; 209cbcdd875STejun Heo 210cbcdd875STejun Heo start = (unsigned long long)pci_resource_start(pdev, bar); 211cbcdd875STejun Heo len = (unsigned long long)pci_resource_len(pdev, bar); 212cbcdd875STejun Heo 213cbcdd875STejun Heo if (offset < 0) 214cbcdd875STejun Heo ata_port_desc(ap, "%s %s%llu@0x%llx", name, type, len, start); 215cbcdd875STejun Heo else 216cbcdd875STejun Heo ata_port_desc(ap, "%s 0x%llx", name, start + offset); 217cbcdd875STejun Heo } 218cbcdd875STejun Heo 219cbcdd875STejun Heo #endif /* CONFIG_PCI */ 220cbcdd875STejun Heo 221c6fd2807SJeff Garzik static void ata_ering_record(struct ata_ering *ering, int is_io, 222c6fd2807SJeff Garzik unsigned int err_mask) 223c6fd2807SJeff Garzik { 224c6fd2807SJeff Garzik struct ata_ering_entry *ent; 225c6fd2807SJeff Garzik 226c6fd2807SJeff Garzik WARN_ON(!err_mask); 227c6fd2807SJeff Garzik 228c6fd2807SJeff Garzik ering->cursor++; 229c6fd2807SJeff Garzik ering->cursor %= ATA_ERING_SIZE; 230c6fd2807SJeff Garzik 231c6fd2807SJeff Garzik ent = &ering->ring[ering->cursor]; 232c6fd2807SJeff Garzik ent->is_io = is_io; 233c6fd2807SJeff Garzik ent->err_mask = err_mask; 234c6fd2807SJeff Garzik ent->timestamp = get_jiffies_64(); 235c6fd2807SJeff Garzik } 236c6fd2807SJeff Garzik 2377d47e8d4STejun Heo static void ata_ering_clear(struct ata_ering *ering) 238c6fd2807SJeff Garzik { 2397d47e8d4STejun Heo memset(ering, 0, sizeof(*ering)); 240c6fd2807SJeff Garzik } 241c6fd2807SJeff Garzik 242c6fd2807SJeff Garzik static int ata_ering_map(struct ata_ering *ering, 243c6fd2807SJeff Garzik int (*map_fn)(struct ata_ering_entry *, void *), 244c6fd2807SJeff Garzik void *arg) 245c6fd2807SJeff Garzik { 246c6fd2807SJeff Garzik int idx, rc = 0; 247c6fd2807SJeff Garzik struct ata_ering_entry *ent; 248c6fd2807SJeff Garzik 249c6fd2807SJeff Garzik idx = ering->cursor; 250c6fd2807SJeff Garzik do { 251c6fd2807SJeff Garzik ent = &ering->ring[idx]; 252c6fd2807SJeff Garzik if (!ent->err_mask) 253c6fd2807SJeff Garzik break; 254c6fd2807SJeff Garzik rc = map_fn(ent, arg); 255c6fd2807SJeff Garzik if (rc) 256c6fd2807SJeff Garzik break; 257c6fd2807SJeff Garzik idx = (idx - 1 + ATA_ERING_SIZE) % ATA_ERING_SIZE; 258c6fd2807SJeff Garzik } while (idx != ering->cursor); 259c6fd2807SJeff Garzik 260c6fd2807SJeff Garzik return rc; 261c6fd2807SJeff Garzik } 262c6fd2807SJeff Garzik 263c6fd2807SJeff Garzik static unsigned int ata_eh_dev_action(struct ata_device *dev) 264c6fd2807SJeff Garzik { 2659af5c9c9STejun Heo struct ata_eh_context *ehc = &dev->link->eh_context; 266c6fd2807SJeff Garzik 267c6fd2807SJeff Garzik return ehc->i.action | ehc->i.dev_action[dev->devno]; 268c6fd2807SJeff Garzik } 269c6fd2807SJeff Garzik 270f58229f8STejun Heo static void ata_eh_clear_action(struct ata_link *link, struct ata_device *dev, 271c6fd2807SJeff Garzik struct ata_eh_info *ehi, unsigned int action) 272c6fd2807SJeff Garzik { 273f58229f8STejun Heo struct ata_device *tdev; 274c6fd2807SJeff Garzik 275c6fd2807SJeff Garzik if (!dev) { 276c6fd2807SJeff Garzik ehi->action &= ~action; 277f58229f8STejun Heo ata_link_for_each_dev(tdev, link) 278f58229f8STejun Heo ehi->dev_action[tdev->devno] &= ~action; 279c6fd2807SJeff Garzik } else { 280c6fd2807SJeff Garzik /* doesn't make sense for port-wide EH actions */ 281c6fd2807SJeff Garzik WARN_ON(!(action & ATA_EH_PERDEV_MASK)); 282c6fd2807SJeff Garzik 283c6fd2807SJeff Garzik /* break ehi->action into ehi->dev_action */ 284c6fd2807SJeff Garzik if (ehi->action & action) { 285f58229f8STejun Heo ata_link_for_each_dev(tdev, link) 286f58229f8STejun Heo ehi->dev_action[tdev->devno] |= 287f58229f8STejun Heo ehi->action & action; 288c6fd2807SJeff Garzik ehi->action &= ~action; 289c6fd2807SJeff Garzik } 290c6fd2807SJeff Garzik 291c6fd2807SJeff Garzik /* turn off the specified per-dev action */ 292c6fd2807SJeff Garzik ehi->dev_action[dev->devno] &= ~action; 293c6fd2807SJeff Garzik } 294c6fd2807SJeff Garzik } 295c6fd2807SJeff Garzik 296c6fd2807SJeff Garzik /** 297c6fd2807SJeff Garzik * ata_scsi_timed_out - SCSI layer time out callback 298c6fd2807SJeff Garzik * @cmd: timed out SCSI command 299c6fd2807SJeff Garzik * 300c6fd2807SJeff Garzik * Handles SCSI layer timeout. We race with normal completion of 301c6fd2807SJeff Garzik * the qc for @cmd. If the qc is already gone, we lose and let 302c6fd2807SJeff Garzik * the scsi command finish (EH_HANDLED). Otherwise, the qc has 303c6fd2807SJeff Garzik * timed out and EH should be invoked. Prevent ata_qc_complete() 304c6fd2807SJeff Garzik * from finishing it by setting EH_SCHEDULED and return 305c6fd2807SJeff Garzik * EH_NOT_HANDLED. 306c6fd2807SJeff Garzik * 307c6fd2807SJeff Garzik * TODO: kill this function once old EH is gone. 308c6fd2807SJeff Garzik * 309c6fd2807SJeff Garzik * LOCKING: 310c6fd2807SJeff Garzik * Called from timer context 311c6fd2807SJeff Garzik * 312c6fd2807SJeff Garzik * RETURNS: 313c6fd2807SJeff Garzik * EH_HANDLED or EH_NOT_HANDLED 314c6fd2807SJeff Garzik */ 315c6fd2807SJeff Garzik enum scsi_eh_timer_return ata_scsi_timed_out(struct scsi_cmnd *cmd) 316c6fd2807SJeff Garzik { 317c6fd2807SJeff Garzik struct Scsi_Host *host = cmd->device->host; 318c6fd2807SJeff Garzik struct ata_port *ap = ata_shost_to_port(host); 319c6fd2807SJeff Garzik unsigned long flags; 320c6fd2807SJeff Garzik struct ata_queued_cmd *qc; 321c6fd2807SJeff Garzik enum scsi_eh_timer_return ret; 322c6fd2807SJeff Garzik 323c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 324c6fd2807SJeff Garzik 325c6fd2807SJeff Garzik if (ap->ops->error_handler) { 326c6fd2807SJeff Garzik ret = EH_NOT_HANDLED; 327c6fd2807SJeff Garzik goto out; 328c6fd2807SJeff Garzik } 329c6fd2807SJeff Garzik 330c6fd2807SJeff Garzik ret = EH_HANDLED; 331c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 3329af5c9c9STejun Heo qc = ata_qc_from_tag(ap, ap->link.active_tag); 333c6fd2807SJeff Garzik if (qc) { 334c6fd2807SJeff Garzik WARN_ON(qc->scsicmd != cmd); 335c6fd2807SJeff Garzik qc->flags |= ATA_QCFLAG_EH_SCHEDULED; 336c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_TIMEOUT; 337c6fd2807SJeff Garzik ret = EH_NOT_HANDLED; 338c6fd2807SJeff Garzik } 339c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 340c6fd2807SJeff Garzik 341c6fd2807SJeff Garzik out: 342c6fd2807SJeff Garzik DPRINTK("EXIT, ret=%d\n", ret); 343c6fd2807SJeff Garzik return ret; 344c6fd2807SJeff Garzik } 345c6fd2807SJeff Garzik 346c6fd2807SJeff Garzik /** 347c6fd2807SJeff Garzik * ata_scsi_error - SCSI layer error handler callback 348c6fd2807SJeff Garzik * @host: SCSI host on which error occurred 349c6fd2807SJeff Garzik * 350c6fd2807SJeff Garzik * Handles SCSI-layer-thrown error events. 351c6fd2807SJeff Garzik * 352c6fd2807SJeff Garzik * LOCKING: 353c6fd2807SJeff Garzik * Inherited from SCSI layer (none, can sleep) 354c6fd2807SJeff Garzik * 355c6fd2807SJeff Garzik * RETURNS: 356c6fd2807SJeff Garzik * Zero. 357c6fd2807SJeff Garzik */ 358c6fd2807SJeff Garzik void ata_scsi_error(struct Scsi_Host *host) 359c6fd2807SJeff Garzik { 360c6fd2807SJeff Garzik struct ata_port *ap = ata_shost_to_port(host); 361*a1e10f7eSTejun Heo int i; 362c6fd2807SJeff Garzik unsigned long flags; 363c6fd2807SJeff Garzik 364c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 365c6fd2807SJeff Garzik 366c6fd2807SJeff Garzik /* synchronize with port task */ 367c6fd2807SJeff Garzik ata_port_flush_task(ap); 368c6fd2807SJeff Garzik 369cca3974eSJeff Garzik /* synchronize with host lock and sort out timeouts */ 370c6fd2807SJeff Garzik 371c6fd2807SJeff Garzik /* For new EH, all qcs are finished in one of three ways - 372c6fd2807SJeff Garzik * normal completion, error completion, and SCSI timeout. 373c6fd2807SJeff Garzik * Both cmpletions can race against SCSI timeout. When normal 374c6fd2807SJeff Garzik * completion wins, the qc never reaches EH. When error 375c6fd2807SJeff Garzik * completion wins, the qc has ATA_QCFLAG_FAILED set. 376c6fd2807SJeff Garzik * 377c6fd2807SJeff Garzik * When SCSI timeout wins, things are a bit more complex. 378c6fd2807SJeff Garzik * Normal or error completion can occur after the timeout but 379c6fd2807SJeff Garzik * before this point. In such cases, both types of 380c6fd2807SJeff Garzik * completions are honored. A scmd is determined to have 381c6fd2807SJeff Garzik * timed out iff its associated qc is active and not failed. 382c6fd2807SJeff Garzik */ 383c6fd2807SJeff Garzik if (ap->ops->error_handler) { 384c6fd2807SJeff Garzik struct scsi_cmnd *scmd, *tmp; 385c6fd2807SJeff Garzik int nr_timedout = 0; 386c6fd2807SJeff Garzik 387c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 388c6fd2807SJeff Garzik 389c6fd2807SJeff Garzik list_for_each_entry_safe(scmd, tmp, &host->eh_cmd_q, eh_entry) { 390c6fd2807SJeff Garzik struct ata_queued_cmd *qc; 391c6fd2807SJeff Garzik 392c6fd2807SJeff Garzik for (i = 0; i < ATA_MAX_QUEUE; i++) { 393c6fd2807SJeff Garzik qc = __ata_qc_from_tag(ap, i); 394c6fd2807SJeff Garzik if (qc->flags & ATA_QCFLAG_ACTIVE && 395c6fd2807SJeff Garzik qc->scsicmd == scmd) 396c6fd2807SJeff Garzik break; 397c6fd2807SJeff Garzik } 398c6fd2807SJeff Garzik 399c6fd2807SJeff Garzik if (i < ATA_MAX_QUEUE) { 400c6fd2807SJeff Garzik /* the scmd has an associated qc */ 401c6fd2807SJeff Garzik if (!(qc->flags & ATA_QCFLAG_FAILED)) { 402c6fd2807SJeff Garzik /* which hasn't failed yet, timeout */ 403c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_TIMEOUT; 404c6fd2807SJeff Garzik qc->flags |= ATA_QCFLAG_FAILED; 405c6fd2807SJeff Garzik nr_timedout++; 406c6fd2807SJeff Garzik } 407c6fd2807SJeff Garzik } else { 408c6fd2807SJeff Garzik /* Normal completion occurred after 409c6fd2807SJeff Garzik * SCSI timeout but before this point. 410c6fd2807SJeff Garzik * Successfully complete it. 411c6fd2807SJeff Garzik */ 412c6fd2807SJeff Garzik scmd->retries = scmd->allowed; 413c6fd2807SJeff Garzik scsi_eh_finish_cmd(scmd, &ap->eh_done_q); 414c6fd2807SJeff Garzik } 415c6fd2807SJeff Garzik } 416c6fd2807SJeff Garzik 417c6fd2807SJeff Garzik /* If we have timed out qcs. They belong to EH from 418c6fd2807SJeff Garzik * this point but the state of the controller is 419c6fd2807SJeff Garzik * unknown. Freeze the port to make sure the IRQ 420c6fd2807SJeff Garzik * handler doesn't diddle with those qcs. This must 421c6fd2807SJeff Garzik * be done atomically w.r.t. setting QCFLAG_FAILED. 422c6fd2807SJeff Garzik */ 423c6fd2807SJeff Garzik if (nr_timedout) 424c6fd2807SJeff Garzik __ata_port_freeze(ap); 425c6fd2807SJeff Garzik 426c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 427*a1e10f7eSTejun Heo 428*a1e10f7eSTejun Heo /* initialize eh_tries */ 429*a1e10f7eSTejun Heo ap->eh_tries = ATA_EH_MAX_TRIES; 430c6fd2807SJeff Garzik } else 431c6fd2807SJeff Garzik spin_unlock_wait(ap->lock); 432c6fd2807SJeff Garzik 433c6fd2807SJeff Garzik repeat: 434c6fd2807SJeff Garzik /* invoke error handler */ 435c6fd2807SJeff Garzik if (ap->ops->error_handler) { 436cf1b86c8STejun Heo struct ata_link *link; 437cf1b86c8STejun Heo 4385ddf24c5STejun Heo /* kill fast drain timer */ 4395ddf24c5STejun Heo del_timer_sync(&ap->fastdrain_timer); 4405ddf24c5STejun Heo 441c6fd2807SJeff Garzik /* process port resume request */ 442c6fd2807SJeff Garzik ata_eh_handle_port_resume(ap); 443c6fd2807SJeff Garzik 444c6fd2807SJeff Garzik /* fetch & clear EH info */ 445c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 446c6fd2807SJeff Garzik 447cf1b86c8STejun Heo __ata_port_for_each_link(link, ap) { 448cf1b86c8STejun Heo memset(&link->eh_context, 0, sizeof(link->eh_context)); 449cf1b86c8STejun Heo link->eh_context.i = link->eh_info; 450cf1b86c8STejun Heo memset(&link->eh_info, 0, sizeof(link->eh_info)); 451cf1b86c8STejun Heo } 452c6fd2807SJeff Garzik 453c6fd2807SJeff Garzik ap->pflags |= ATA_PFLAG_EH_IN_PROGRESS; 454c6fd2807SJeff Garzik ap->pflags &= ~ATA_PFLAG_EH_PENDING; 455c6fd2807SJeff Garzik 456c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 457c6fd2807SJeff Garzik 458c6fd2807SJeff Garzik /* invoke EH, skip if unloading or suspended */ 459c6fd2807SJeff Garzik if (!(ap->pflags & (ATA_PFLAG_UNLOADING | ATA_PFLAG_SUSPENDED))) 460c6fd2807SJeff Garzik ap->ops->error_handler(ap); 461c6fd2807SJeff Garzik else 462c6fd2807SJeff Garzik ata_eh_finish(ap); 463c6fd2807SJeff Garzik 464c6fd2807SJeff Garzik /* process port suspend request */ 465c6fd2807SJeff Garzik ata_eh_handle_port_suspend(ap); 466c6fd2807SJeff Garzik 467c6fd2807SJeff Garzik /* Exception might have happend after ->error_handler 468c6fd2807SJeff Garzik * recovered the port but before this point. Repeat 469c6fd2807SJeff Garzik * EH in such case. 470c6fd2807SJeff Garzik */ 471c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 472c6fd2807SJeff Garzik 473c6fd2807SJeff Garzik if (ap->pflags & ATA_PFLAG_EH_PENDING) { 474*a1e10f7eSTejun Heo if (--ap->eh_tries) { 475c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 476c6fd2807SJeff Garzik goto repeat; 477c6fd2807SJeff Garzik } 478c6fd2807SJeff Garzik ata_port_printk(ap, KERN_ERR, "EH pending after %d " 479*a1e10f7eSTejun Heo "tries, giving up\n", ATA_EH_MAX_TRIES); 480914616a3STejun Heo ap->pflags &= ~ATA_PFLAG_EH_PENDING; 481c6fd2807SJeff Garzik } 482c6fd2807SJeff Garzik 483c6fd2807SJeff Garzik /* this run is complete, make sure EH info is clear */ 484cf1b86c8STejun Heo __ata_port_for_each_link(link, ap) 485cf1b86c8STejun Heo memset(&link->eh_info, 0, sizeof(link->eh_info)); 486c6fd2807SJeff Garzik 487c6fd2807SJeff Garzik /* Clear host_eh_scheduled while holding ap->lock such 488c6fd2807SJeff Garzik * that if exception occurs after this point but 489c6fd2807SJeff Garzik * before EH completion, SCSI midlayer will 490c6fd2807SJeff Garzik * re-initiate EH. 491c6fd2807SJeff Garzik */ 492c6fd2807SJeff Garzik host->host_eh_scheduled = 0; 493c6fd2807SJeff Garzik 494c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 495c6fd2807SJeff Garzik } else { 4969af5c9c9STejun Heo WARN_ON(ata_qc_from_tag(ap, ap->link.active_tag) == NULL); 497c6fd2807SJeff Garzik ap->ops->eng_timeout(ap); 498c6fd2807SJeff Garzik } 499c6fd2807SJeff Garzik 500c6fd2807SJeff Garzik /* finish or retry handled scmd's and clean up */ 501c6fd2807SJeff Garzik WARN_ON(host->host_failed || !list_empty(&host->eh_cmd_q)); 502c6fd2807SJeff Garzik 503c6fd2807SJeff Garzik scsi_eh_flush_done_q(&ap->eh_done_q); 504c6fd2807SJeff Garzik 505c6fd2807SJeff Garzik /* clean up */ 506c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 507c6fd2807SJeff Garzik 508c6fd2807SJeff Garzik if (ap->pflags & ATA_PFLAG_LOADING) 509c6fd2807SJeff Garzik ap->pflags &= ~ATA_PFLAG_LOADING; 510c6fd2807SJeff Garzik else if (ap->pflags & ATA_PFLAG_SCSI_HOTPLUG) 51152bad64dSDavid Howells queue_delayed_work(ata_aux_wq, &ap->hotplug_task, 0); 512c6fd2807SJeff Garzik 513c6fd2807SJeff Garzik if (ap->pflags & ATA_PFLAG_RECOVERED) 514c6fd2807SJeff Garzik ata_port_printk(ap, KERN_INFO, "EH complete\n"); 515c6fd2807SJeff Garzik 516c6fd2807SJeff Garzik ap->pflags &= ~(ATA_PFLAG_SCSI_HOTPLUG | ATA_PFLAG_RECOVERED); 517c6fd2807SJeff Garzik 518c6fd2807SJeff Garzik /* tell wait_eh that we're done */ 519c6fd2807SJeff Garzik ap->pflags &= ~ATA_PFLAG_EH_IN_PROGRESS; 520c6fd2807SJeff Garzik wake_up_all(&ap->eh_wait_q); 521c6fd2807SJeff Garzik 522c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 523c6fd2807SJeff Garzik 524c6fd2807SJeff Garzik DPRINTK("EXIT\n"); 525c6fd2807SJeff Garzik } 526c6fd2807SJeff Garzik 527c6fd2807SJeff Garzik /** 528c6fd2807SJeff Garzik * ata_port_wait_eh - Wait for the currently pending EH to complete 529c6fd2807SJeff Garzik * @ap: Port to wait EH for 530c6fd2807SJeff Garzik * 531c6fd2807SJeff Garzik * Wait until the currently pending EH is complete. 532c6fd2807SJeff Garzik * 533c6fd2807SJeff Garzik * LOCKING: 534c6fd2807SJeff Garzik * Kernel thread context (may sleep). 535c6fd2807SJeff Garzik */ 536c6fd2807SJeff Garzik void ata_port_wait_eh(struct ata_port *ap) 537c6fd2807SJeff Garzik { 538c6fd2807SJeff Garzik unsigned long flags; 539c6fd2807SJeff Garzik DEFINE_WAIT(wait); 540c6fd2807SJeff Garzik 541c6fd2807SJeff Garzik retry: 542c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 543c6fd2807SJeff Garzik 544c6fd2807SJeff Garzik while (ap->pflags & (ATA_PFLAG_EH_PENDING | ATA_PFLAG_EH_IN_PROGRESS)) { 545c6fd2807SJeff Garzik prepare_to_wait(&ap->eh_wait_q, &wait, TASK_UNINTERRUPTIBLE); 546c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 547c6fd2807SJeff Garzik schedule(); 548c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 549c6fd2807SJeff Garzik } 550c6fd2807SJeff Garzik finish_wait(&ap->eh_wait_q, &wait); 551c6fd2807SJeff Garzik 552c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 553c6fd2807SJeff Garzik 554c6fd2807SJeff Garzik /* make sure SCSI EH is complete */ 555cca3974eSJeff Garzik if (scsi_host_in_recovery(ap->scsi_host)) { 556c6fd2807SJeff Garzik msleep(10); 557c6fd2807SJeff Garzik goto retry; 558c6fd2807SJeff Garzik } 559c6fd2807SJeff Garzik } 560c6fd2807SJeff Garzik 561c6fd2807SJeff Garzik /** 562c6fd2807SJeff Garzik * ata_qc_timeout - Handle timeout of queued command 563c6fd2807SJeff Garzik * @qc: Command that timed out 564c6fd2807SJeff Garzik * 565c6fd2807SJeff Garzik * Some part of the kernel (currently, only the SCSI layer) 566c6fd2807SJeff Garzik * has noticed that the active command on port @ap has not 567c6fd2807SJeff Garzik * completed after a specified length of time. Handle this 568c6fd2807SJeff Garzik * condition by disabling DMA (if necessary) and completing 569c6fd2807SJeff Garzik * transactions, with error if necessary. 570c6fd2807SJeff Garzik * 571c6fd2807SJeff Garzik * This also handles the case of the "lost interrupt", where 572c6fd2807SJeff Garzik * for some reason (possibly hardware bug, possibly driver bug) 573c6fd2807SJeff Garzik * an interrupt was not delivered to the driver, even though the 574c6fd2807SJeff Garzik * transaction completed successfully. 575c6fd2807SJeff Garzik * 576c6fd2807SJeff Garzik * TODO: kill this function once old EH is gone. 577c6fd2807SJeff Garzik * 578c6fd2807SJeff Garzik * LOCKING: 579c6fd2807SJeff Garzik * Inherited from SCSI layer (none, can sleep) 580c6fd2807SJeff Garzik */ 581c6fd2807SJeff Garzik static void ata_qc_timeout(struct ata_queued_cmd *qc) 582c6fd2807SJeff Garzik { 583c6fd2807SJeff Garzik struct ata_port *ap = qc->ap; 584c6fd2807SJeff Garzik u8 host_stat = 0, drv_stat; 585c6fd2807SJeff Garzik unsigned long flags; 586c6fd2807SJeff Garzik 587c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 588c6fd2807SJeff Garzik 589c6fd2807SJeff Garzik ap->hsm_task_state = HSM_ST_IDLE; 590c6fd2807SJeff Garzik 591c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 592c6fd2807SJeff Garzik 593c6fd2807SJeff Garzik switch (qc->tf.protocol) { 594c6fd2807SJeff Garzik 595c6fd2807SJeff Garzik case ATA_PROT_DMA: 596c6fd2807SJeff Garzik case ATA_PROT_ATAPI_DMA: 597c6fd2807SJeff Garzik host_stat = ap->ops->bmdma_status(ap); 598c6fd2807SJeff Garzik 599c6fd2807SJeff Garzik /* before we do anything else, clear DMA-Start bit */ 600c6fd2807SJeff Garzik ap->ops->bmdma_stop(qc); 601c6fd2807SJeff Garzik 602c6fd2807SJeff Garzik /* fall through */ 603c6fd2807SJeff Garzik 604c6fd2807SJeff Garzik default: 605c6fd2807SJeff Garzik ata_altstatus(ap); 606c6fd2807SJeff Garzik drv_stat = ata_chk_status(ap); 607c6fd2807SJeff Garzik 608c6fd2807SJeff Garzik /* ack bmdma irq events */ 609c6fd2807SJeff Garzik ap->ops->irq_clear(ap); 610c6fd2807SJeff Garzik 611c6fd2807SJeff Garzik ata_dev_printk(qc->dev, KERN_ERR, "command 0x%x timeout, " 612c6fd2807SJeff Garzik "stat 0x%x host_stat 0x%x\n", 613c6fd2807SJeff Garzik qc->tf.command, drv_stat, host_stat); 614c6fd2807SJeff Garzik 615c6fd2807SJeff Garzik /* complete taskfile transaction */ 616c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_TIMEOUT; 617c6fd2807SJeff Garzik break; 618c6fd2807SJeff Garzik } 619c6fd2807SJeff Garzik 620c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 621c6fd2807SJeff Garzik 622c6fd2807SJeff Garzik ata_eh_qc_complete(qc); 623c6fd2807SJeff Garzik 624c6fd2807SJeff Garzik DPRINTK("EXIT\n"); 625c6fd2807SJeff Garzik } 626c6fd2807SJeff Garzik 627c6fd2807SJeff Garzik /** 628c6fd2807SJeff Garzik * ata_eng_timeout - Handle timeout of queued command 629c6fd2807SJeff Garzik * @ap: Port on which timed-out command is active 630c6fd2807SJeff Garzik * 631c6fd2807SJeff Garzik * Some part of the kernel (currently, only the SCSI layer) 632c6fd2807SJeff Garzik * has noticed that the active command on port @ap has not 633c6fd2807SJeff Garzik * completed after a specified length of time. Handle this 634c6fd2807SJeff Garzik * condition by disabling DMA (if necessary) and completing 635c6fd2807SJeff Garzik * transactions, with error if necessary. 636c6fd2807SJeff Garzik * 637c6fd2807SJeff Garzik * This also handles the case of the "lost interrupt", where 638c6fd2807SJeff Garzik * for some reason (possibly hardware bug, possibly driver bug) 639c6fd2807SJeff Garzik * an interrupt was not delivered to the driver, even though the 640c6fd2807SJeff Garzik * transaction completed successfully. 641c6fd2807SJeff Garzik * 642c6fd2807SJeff Garzik * TODO: kill this function once old EH is gone. 643c6fd2807SJeff Garzik * 644c6fd2807SJeff Garzik * LOCKING: 645c6fd2807SJeff Garzik * Inherited from SCSI layer (none, can sleep) 646c6fd2807SJeff Garzik */ 647c6fd2807SJeff Garzik void ata_eng_timeout(struct ata_port *ap) 648c6fd2807SJeff Garzik { 649c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 650c6fd2807SJeff Garzik 6519af5c9c9STejun Heo ata_qc_timeout(ata_qc_from_tag(ap, ap->link.active_tag)); 652c6fd2807SJeff Garzik 653c6fd2807SJeff Garzik DPRINTK("EXIT\n"); 654c6fd2807SJeff Garzik } 655c6fd2807SJeff Garzik 6565ddf24c5STejun Heo static int ata_eh_nr_in_flight(struct ata_port *ap) 6575ddf24c5STejun Heo { 6585ddf24c5STejun Heo unsigned int tag; 6595ddf24c5STejun Heo int nr = 0; 6605ddf24c5STejun Heo 6615ddf24c5STejun Heo /* count only non-internal commands */ 6625ddf24c5STejun Heo for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++) 6635ddf24c5STejun Heo if (ata_qc_from_tag(ap, tag)) 6645ddf24c5STejun Heo nr++; 6655ddf24c5STejun Heo 6665ddf24c5STejun Heo return nr; 6675ddf24c5STejun Heo } 6685ddf24c5STejun Heo 6695ddf24c5STejun Heo void ata_eh_fastdrain_timerfn(unsigned long arg) 6705ddf24c5STejun Heo { 6715ddf24c5STejun Heo struct ata_port *ap = (void *)arg; 6725ddf24c5STejun Heo unsigned long flags; 6735ddf24c5STejun Heo int cnt; 6745ddf24c5STejun Heo 6755ddf24c5STejun Heo spin_lock_irqsave(ap->lock, flags); 6765ddf24c5STejun Heo 6775ddf24c5STejun Heo cnt = ata_eh_nr_in_flight(ap); 6785ddf24c5STejun Heo 6795ddf24c5STejun Heo /* are we done? */ 6805ddf24c5STejun Heo if (!cnt) 6815ddf24c5STejun Heo goto out_unlock; 6825ddf24c5STejun Heo 6835ddf24c5STejun Heo if (cnt == ap->fastdrain_cnt) { 6845ddf24c5STejun Heo unsigned int tag; 6855ddf24c5STejun Heo 6865ddf24c5STejun Heo /* No progress during the last interval, tag all 6875ddf24c5STejun Heo * in-flight qcs as timed out and freeze the port. 6885ddf24c5STejun Heo */ 6895ddf24c5STejun Heo for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++) { 6905ddf24c5STejun Heo struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag); 6915ddf24c5STejun Heo if (qc) 6925ddf24c5STejun Heo qc->err_mask |= AC_ERR_TIMEOUT; 6935ddf24c5STejun Heo } 6945ddf24c5STejun Heo 6955ddf24c5STejun Heo ata_port_freeze(ap); 6965ddf24c5STejun Heo } else { 6975ddf24c5STejun Heo /* some qcs have finished, give it another chance */ 6985ddf24c5STejun Heo ap->fastdrain_cnt = cnt; 6995ddf24c5STejun Heo ap->fastdrain_timer.expires = 7005ddf24c5STejun Heo jiffies + ATA_EH_FASTDRAIN_INTERVAL; 7015ddf24c5STejun Heo add_timer(&ap->fastdrain_timer); 7025ddf24c5STejun Heo } 7035ddf24c5STejun Heo 7045ddf24c5STejun Heo out_unlock: 7055ddf24c5STejun Heo spin_unlock_irqrestore(ap->lock, flags); 7065ddf24c5STejun Heo } 7075ddf24c5STejun Heo 7085ddf24c5STejun Heo /** 7095ddf24c5STejun Heo * ata_eh_set_pending - set ATA_PFLAG_EH_PENDING and activate fast drain 7105ddf24c5STejun Heo * @ap: target ATA port 7115ddf24c5STejun Heo * @fastdrain: activate fast drain 7125ddf24c5STejun Heo * 7135ddf24c5STejun Heo * Set ATA_PFLAG_EH_PENDING and activate fast drain if @fastdrain 7145ddf24c5STejun Heo * is non-zero and EH wasn't pending before. Fast drain ensures 7155ddf24c5STejun Heo * that EH kicks in in timely manner. 7165ddf24c5STejun Heo * 7175ddf24c5STejun Heo * LOCKING: 7185ddf24c5STejun Heo * spin_lock_irqsave(host lock) 7195ddf24c5STejun Heo */ 7205ddf24c5STejun Heo static void ata_eh_set_pending(struct ata_port *ap, int fastdrain) 7215ddf24c5STejun Heo { 7225ddf24c5STejun Heo int cnt; 7235ddf24c5STejun Heo 7245ddf24c5STejun Heo /* already scheduled? */ 7255ddf24c5STejun Heo if (ap->pflags & ATA_PFLAG_EH_PENDING) 7265ddf24c5STejun Heo return; 7275ddf24c5STejun Heo 7285ddf24c5STejun Heo ap->pflags |= ATA_PFLAG_EH_PENDING; 7295ddf24c5STejun Heo 7305ddf24c5STejun Heo if (!fastdrain) 7315ddf24c5STejun Heo return; 7325ddf24c5STejun Heo 7335ddf24c5STejun Heo /* do we have in-flight qcs? */ 7345ddf24c5STejun Heo cnt = ata_eh_nr_in_flight(ap); 7355ddf24c5STejun Heo if (!cnt) 7365ddf24c5STejun Heo return; 7375ddf24c5STejun Heo 7385ddf24c5STejun Heo /* activate fast drain */ 7395ddf24c5STejun Heo ap->fastdrain_cnt = cnt; 7405ddf24c5STejun Heo ap->fastdrain_timer.expires = jiffies + ATA_EH_FASTDRAIN_INTERVAL; 7415ddf24c5STejun Heo add_timer(&ap->fastdrain_timer); 7425ddf24c5STejun Heo } 7435ddf24c5STejun Heo 744c6fd2807SJeff Garzik /** 745c6fd2807SJeff Garzik * ata_qc_schedule_eh - schedule qc for error handling 746c6fd2807SJeff Garzik * @qc: command to schedule error handling for 747c6fd2807SJeff Garzik * 748c6fd2807SJeff Garzik * Schedule error handling for @qc. EH will kick in as soon as 749c6fd2807SJeff Garzik * other commands are drained. 750c6fd2807SJeff Garzik * 751c6fd2807SJeff Garzik * LOCKING: 752cca3974eSJeff Garzik * spin_lock_irqsave(host lock) 753c6fd2807SJeff Garzik */ 754c6fd2807SJeff Garzik void ata_qc_schedule_eh(struct ata_queued_cmd *qc) 755c6fd2807SJeff Garzik { 756c6fd2807SJeff Garzik struct ata_port *ap = qc->ap; 757c6fd2807SJeff Garzik 758c6fd2807SJeff Garzik WARN_ON(!ap->ops->error_handler); 759c6fd2807SJeff Garzik 760c6fd2807SJeff Garzik qc->flags |= ATA_QCFLAG_FAILED; 7615ddf24c5STejun Heo ata_eh_set_pending(ap, 1); 762c6fd2807SJeff Garzik 763c6fd2807SJeff Garzik /* The following will fail if timeout has already expired. 764c6fd2807SJeff Garzik * ata_scsi_error() takes care of such scmds on EH entry. 765c6fd2807SJeff Garzik * Note that ATA_QCFLAG_FAILED is unconditionally set after 766c6fd2807SJeff Garzik * this function completes. 767c6fd2807SJeff Garzik */ 768c6fd2807SJeff Garzik scsi_req_abort_cmd(qc->scsicmd); 769c6fd2807SJeff Garzik } 770c6fd2807SJeff Garzik 771c6fd2807SJeff Garzik /** 772c6fd2807SJeff Garzik * ata_port_schedule_eh - schedule error handling without a qc 773c6fd2807SJeff Garzik * @ap: ATA port to schedule EH for 774c6fd2807SJeff Garzik * 775c6fd2807SJeff Garzik * Schedule error handling for @ap. EH will kick in as soon as 776c6fd2807SJeff Garzik * all commands are drained. 777c6fd2807SJeff Garzik * 778c6fd2807SJeff Garzik * LOCKING: 779cca3974eSJeff Garzik * spin_lock_irqsave(host lock) 780c6fd2807SJeff Garzik */ 781c6fd2807SJeff Garzik void ata_port_schedule_eh(struct ata_port *ap) 782c6fd2807SJeff Garzik { 783c6fd2807SJeff Garzik WARN_ON(!ap->ops->error_handler); 784c6fd2807SJeff Garzik 785f4d6d004STejun Heo if (ap->pflags & ATA_PFLAG_INITIALIZING) 786f4d6d004STejun Heo return; 787f4d6d004STejun Heo 7885ddf24c5STejun Heo ata_eh_set_pending(ap, 1); 789cca3974eSJeff Garzik scsi_schedule_eh(ap->scsi_host); 790c6fd2807SJeff Garzik 791c6fd2807SJeff Garzik DPRINTK("port EH scheduled\n"); 792c6fd2807SJeff Garzik } 793c6fd2807SJeff Garzik 794dbd82616STejun Heo static int ata_do_link_abort(struct ata_port *ap, struct ata_link *link) 795c6fd2807SJeff Garzik { 796c6fd2807SJeff Garzik int tag, nr_aborted = 0; 797c6fd2807SJeff Garzik 798c6fd2807SJeff Garzik WARN_ON(!ap->ops->error_handler); 799c6fd2807SJeff Garzik 8005ddf24c5STejun Heo /* we're gonna abort all commands, no need for fast drain */ 8015ddf24c5STejun Heo ata_eh_set_pending(ap, 0); 8025ddf24c5STejun Heo 803c6fd2807SJeff Garzik for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 804c6fd2807SJeff Garzik struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag); 805c6fd2807SJeff Garzik 806dbd82616STejun Heo if (qc && (!link || qc->dev->link == link)) { 807c6fd2807SJeff Garzik qc->flags |= ATA_QCFLAG_FAILED; 808c6fd2807SJeff Garzik ata_qc_complete(qc); 809c6fd2807SJeff Garzik nr_aborted++; 810c6fd2807SJeff Garzik } 811c6fd2807SJeff Garzik } 812c6fd2807SJeff Garzik 813c6fd2807SJeff Garzik if (!nr_aborted) 814c6fd2807SJeff Garzik ata_port_schedule_eh(ap); 815c6fd2807SJeff Garzik 816c6fd2807SJeff Garzik return nr_aborted; 817c6fd2807SJeff Garzik } 818c6fd2807SJeff Garzik 819c6fd2807SJeff Garzik /** 820dbd82616STejun Heo * ata_link_abort - abort all qc's on the link 821dbd82616STejun Heo * @link: ATA link to abort qc's for 822dbd82616STejun Heo * 823dbd82616STejun Heo * Abort all active qc's active on @link and schedule EH. 824dbd82616STejun Heo * 825dbd82616STejun Heo * LOCKING: 826dbd82616STejun Heo * spin_lock_irqsave(host lock) 827dbd82616STejun Heo * 828dbd82616STejun Heo * RETURNS: 829dbd82616STejun Heo * Number of aborted qc's. 830dbd82616STejun Heo */ 831dbd82616STejun Heo int ata_link_abort(struct ata_link *link) 832dbd82616STejun Heo { 833dbd82616STejun Heo return ata_do_link_abort(link->ap, link); 834dbd82616STejun Heo } 835dbd82616STejun Heo 836dbd82616STejun Heo /** 837dbd82616STejun Heo * ata_port_abort - abort all qc's on the port 838dbd82616STejun Heo * @ap: ATA port to abort qc's for 839dbd82616STejun Heo * 840dbd82616STejun Heo * Abort all active qc's of @ap and schedule EH. 841dbd82616STejun Heo * 842dbd82616STejun Heo * LOCKING: 843dbd82616STejun Heo * spin_lock_irqsave(host_set lock) 844dbd82616STejun Heo * 845dbd82616STejun Heo * RETURNS: 846dbd82616STejun Heo * Number of aborted qc's. 847dbd82616STejun Heo */ 848dbd82616STejun Heo int ata_port_abort(struct ata_port *ap) 849dbd82616STejun Heo { 850dbd82616STejun Heo return ata_do_link_abort(ap, NULL); 851dbd82616STejun Heo } 852dbd82616STejun Heo 853dbd82616STejun Heo /** 854c6fd2807SJeff Garzik * __ata_port_freeze - freeze port 855c6fd2807SJeff Garzik * @ap: ATA port to freeze 856c6fd2807SJeff Garzik * 857c6fd2807SJeff Garzik * This function is called when HSM violation or some other 858c6fd2807SJeff Garzik * condition disrupts normal operation of the port. Frozen port 859c6fd2807SJeff Garzik * is not allowed to perform any operation until the port is 860c6fd2807SJeff Garzik * thawed, which usually follows a successful reset. 861c6fd2807SJeff Garzik * 862c6fd2807SJeff Garzik * ap->ops->freeze() callback can be used for freezing the port 863c6fd2807SJeff Garzik * hardware-wise (e.g. mask interrupt and stop DMA engine). If a 864c6fd2807SJeff Garzik * port cannot be frozen hardware-wise, the interrupt handler 865c6fd2807SJeff Garzik * must ack and clear interrupts unconditionally while the port 866c6fd2807SJeff Garzik * is frozen. 867c6fd2807SJeff Garzik * 868c6fd2807SJeff Garzik * LOCKING: 869cca3974eSJeff Garzik * spin_lock_irqsave(host lock) 870c6fd2807SJeff Garzik */ 871c6fd2807SJeff Garzik static void __ata_port_freeze(struct ata_port *ap) 872c6fd2807SJeff Garzik { 873c6fd2807SJeff Garzik WARN_ON(!ap->ops->error_handler); 874c6fd2807SJeff Garzik 875c6fd2807SJeff Garzik if (ap->ops->freeze) 876c6fd2807SJeff Garzik ap->ops->freeze(ap); 877c6fd2807SJeff Garzik 878c6fd2807SJeff Garzik ap->pflags |= ATA_PFLAG_FROZEN; 879c6fd2807SJeff Garzik 88044877b4eSTejun Heo DPRINTK("ata%u port frozen\n", ap->print_id); 881c6fd2807SJeff Garzik } 882c6fd2807SJeff Garzik 883c6fd2807SJeff Garzik /** 884c6fd2807SJeff Garzik * ata_port_freeze - abort & freeze port 885c6fd2807SJeff Garzik * @ap: ATA port to freeze 886c6fd2807SJeff Garzik * 887c6fd2807SJeff Garzik * Abort and freeze @ap. 888c6fd2807SJeff Garzik * 889c6fd2807SJeff Garzik * LOCKING: 890cca3974eSJeff Garzik * spin_lock_irqsave(host lock) 891c6fd2807SJeff Garzik * 892c6fd2807SJeff Garzik * RETURNS: 893c6fd2807SJeff Garzik * Number of aborted commands. 894c6fd2807SJeff Garzik */ 895c6fd2807SJeff Garzik int ata_port_freeze(struct ata_port *ap) 896c6fd2807SJeff Garzik { 897c6fd2807SJeff Garzik int nr_aborted; 898c6fd2807SJeff Garzik 899c6fd2807SJeff Garzik WARN_ON(!ap->ops->error_handler); 900c6fd2807SJeff Garzik 901c6fd2807SJeff Garzik nr_aborted = ata_port_abort(ap); 902c6fd2807SJeff Garzik __ata_port_freeze(ap); 903c6fd2807SJeff Garzik 904c6fd2807SJeff Garzik return nr_aborted; 905c6fd2807SJeff Garzik } 906c6fd2807SJeff Garzik 907c6fd2807SJeff Garzik /** 908c6fd2807SJeff Garzik * ata_eh_freeze_port - EH helper to freeze port 909c6fd2807SJeff Garzik * @ap: ATA port to freeze 910c6fd2807SJeff Garzik * 911c6fd2807SJeff Garzik * Freeze @ap. 912c6fd2807SJeff Garzik * 913c6fd2807SJeff Garzik * LOCKING: 914c6fd2807SJeff Garzik * None. 915c6fd2807SJeff Garzik */ 916c6fd2807SJeff Garzik void ata_eh_freeze_port(struct ata_port *ap) 917c6fd2807SJeff Garzik { 918c6fd2807SJeff Garzik unsigned long flags; 919c6fd2807SJeff Garzik 920c6fd2807SJeff Garzik if (!ap->ops->error_handler) 921c6fd2807SJeff Garzik return; 922c6fd2807SJeff Garzik 923c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 924c6fd2807SJeff Garzik __ata_port_freeze(ap); 925c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 926c6fd2807SJeff Garzik } 927c6fd2807SJeff Garzik 928c6fd2807SJeff Garzik /** 929c6fd2807SJeff Garzik * ata_port_thaw_port - EH helper to thaw port 930c6fd2807SJeff Garzik * @ap: ATA port to thaw 931c6fd2807SJeff Garzik * 932c6fd2807SJeff Garzik * Thaw frozen port @ap. 933c6fd2807SJeff Garzik * 934c6fd2807SJeff Garzik * LOCKING: 935c6fd2807SJeff Garzik * None. 936c6fd2807SJeff Garzik */ 937c6fd2807SJeff Garzik void ata_eh_thaw_port(struct ata_port *ap) 938c6fd2807SJeff Garzik { 939c6fd2807SJeff Garzik unsigned long flags; 940c6fd2807SJeff Garzik 941c6fd2807SJeff Garzik if (!ap->ops->error_handler) 942c6fd2807SJeff Garzik return; 943c6fd2807SJeff Garzik 944c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 945c6fd2807SJeff Garzik 946c6fd2807SJeff Garzik ap->pflags &= ~ATA_PFLAG_FROZEN; 947c6fd2807SJeff Garzik 948c6fd2807SJeff Garzik if (ap->ops->thaw) 949c6fd2807SJeff Garzik ap->ops->thaw(ap); 950c6fd2807SJeff Garzik 951c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 952c6fd2807SJeff Garzik 95344877b4eSTejun Heo DPRINTK("ata%u port thawed\n", ap->print_id); 954c6fd2807SJeff Garzik } 955c6fd2807SJeff Garzik 956c6fd2807SJeff Garzik static void ata_eh_scsidone(struct scsi_cmnd *scmd) 957c6fd2807SJeff Garzik { 958c6fd2807SJeff Garzik /* nada */ 959c6fd2807SJeff Garzik } 960c6fd2807SJeff Garzik 961c6fd2807SJeff Garzik static void __ata_eh_qc_complete(struct ata_queued_cmd *qc) 962c6fd2807SJeff Garzik { 963c6fd2807SJeff Garzik struct ata_port *ap = qc->ap; 964c6fd2807SJeff Garzik struct scsi_cmnd *scmd = qc->scsicmd; 965c6fd2807SJeff Garzik unsigned long flags; 966c6fd2807SJeff Garzik 967c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 968c6fd2807SJeff Garzik qc->scsidone = ata_eh_scsidone; 969c6fd2807SJeff Garzik __ata_qc_complete(qc); 970c6fd2807SJeff Garzik WARN_ON(ata_tag_valid(qc->tag)); 971c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 972c6fd2807SJeff Garzik 973c6fd2807SJeff Garzik scsi_eh_finish_cmd(scmd, &ap->eh_done_q); 974c6fd2807SJeff Garzik } 975c6fd2807SJeff Garzik 976c6fd2807SJeff Garzik /** 977c6fd2807SJeff Garzik * ata_eh_qc_complete - Complete an active ATA command from EH 978c6fd2807SJeff Garzik * @qc: Command to complete 979c6fd2807SJeff Garzik * 980c6fd2807SJeff Garzik * Indicate to the mid and upper layers that an ATA command has 981c6fd2807SJeff Garzik * completed. To be used from EH. 982c6fd2807SJeff Garzik */ 983c6fd2807SJeff Garzik void ata_eh_qc_complete(struct ata_queued_cmd *qc) 984c6fd2807SJeff Garzik { 985c6fd2807SJeff Garzik struct scsi_cmnd *scmd = qc->scsicmd; 986c6fd2807SJeff Garzik scmd->retries = scmd->allowed; 987c6fd2807SJeff Garzik __ata_eh_qc_complete(qc); 988c6fd2807SJeff Garzik } 989c6fd2807SJeff Garzik 990c6fd2807SJeff Garzik /** 991c6fd2807SJeff Garzik * ata_eh_qc_retry - Tell midlayer to retry an ATA command after EH 992c6fd2807SJeff Garzik * @qc: Command to retry 993c6fd2807SJeff Garzik * 994c6fd2807SJeff Garzik * Indicate to the mid and upper layers that an ATA command 995c6fd2807SJeff Garzik * should be retried. To be used from EH. 996c6fd2807SJeff Garzik * 997c6fd2807SJeff Garzik * SCSI midlayer limits the number of retries to scmd->allowed. 998c6fd2807SJeff Garzik * scmd->retries is decremented for commands which get retried 999c6fd2807SJeff Garzik * due to unrelated failures (qc->err_mask is zero). 1000c6fd2807SJeff Garzik */ 1001c6fd2807SJeff Garzik void ata_eh_qc_retry(struct ata_queued_cmd *qc) 1002c6fd2807SJeff Garzik { 1003c6fd2807SJeff Garzik struct scsi_cmnd *scmd = qc->scsicmd; 1004c6fd2807SJeff Garzik if (!qc->err_mask && scmd->retries) 1005c6fd2807SJeff Garzik scmd->retries--; 1006c6fd2807SJeff Garzik __ata_eh_qc_complete(qc); 1007c6fd2807SJeff Garzik } 1008c6fd2807SJeff Garzik 1009c6fd2807SJeff Garzik /** 1010c6fd2807SJeff Garzik * ata_eh_detach_dev - detach ATA device 1011c6fd2807SJeff Garzik * @dev: ATA device to detach 1012c6fd2807SJeff Garzik * 1013c6fd2807SJeff Garzik * Detach @dev. 1014c6fd2807SJeff Garzik * 1015c6fd2807SJeff Garzik * LOCKING: 1016c6fd2807SJeff Garzik * None. 1017c6fd2807SJeff Garzik */ 1018c6fd2807SJeff Garzik static void ata_eh_detach_dev(struct ata_device *dev) 1019c6fd2807SJeff Garzik { 1020f58229f8STejun Heo struct ata_link *link = dev->link; 1021f58229f8STejun Heo struct ata_port *ap = link->ap; 1022c6fd2807SJeff Garzik unsigned long flags; 1023c6fd2807SJeff Garzik 1024c6fd2807SJeff Garzik ata_dev_disable(dev); 1025c6fd2807SJeff Garzik 1026c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 1027c6fd2807SJeff Garzik 1028c6fd2807SJeff Garzik dev->flags &= ~ATA_DFLAG_DETACH; 1029c6fd2807SJeff Garzik 1030c6fd2807SJeff Garzik if (ata_scsi_offline_dev(dev)) { 1031c6fd2807SJeff Garzik dev->flags |= ATA_DFLAG_DETACHED; 1032c6fd2807SJeff Garzik ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG; 1033c6fd2807SJeff Garzik } 1034c6fd2807SJeff Garzik 1035c6fd2807SJeff Garzik /* clear per-dev EH actions */ 1036f58229f8STejun Heo ata_eh_clear_action(link, dev, &link->eh_info, ATA_EH_PERDEV_MASK); 1037f58229f8STejun Heo ata_eh_clear_action(link, dev, &link->eh_context.i, ATA_EH_PERDEV_MASK); 1038c6fd2807SJeff Garzik 1039c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 1040c6fd2807SJeff Garzik } 1041c6fd2807SJeff Garzik 1042c6fd2807SJeff Garzik /** 1043c6fd2807SJeff Garzik * ata_eh_about_to_do - about to perform eh_action 1044955e57dfSTejun Heo * @link: target ATA link 1045c6fd2807SJeff Garzik * @dev: target ATA dev for per-dev action (can be NULL) 1046c6fd2807SJeff Garzik * @action: action about to be performed 1047c6fd2807SJeff Garzik * 1048c6fd2807SJeff Garzik * Called just before performing EH actions to clear related bits 1049955e57dfSTejun Heo * in @link->eh_info such that eh actions are not unnecessarily 1050955e57dfSTejun Heo * repeated. 1051c6fd2807SJeff Garzik * 1052c6fd2807SJeff Garzik * LOCKING: 1053c6fd2807SJeff Garzik * None. 1054c6fd2807SJeff Garzik */ 1055955e57dfSTejun Heo static void ata_eh_about_to_do(struct ata_link *link, struct ata_device *dev, 1056c6fd2807SJeff Garzik unsigned int action) 1057c6fd2807SJeff Garzik { 1058955e57dfSTejun Heo struct ata_port *ap = link->ap; 1059955e57dfSTejun Heo struct ata_eh_info *ehi = &link->eh_info; 1060955e57dfSTejun Heo struct ata_eh_context *ehc = &link->eh_context; 1061c6fd2807SJeff Garzik unsigned long flags; 1062c6fd2807SJeff Garzik 1063c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 1064c6fd2807SJeff Garzik 1065c6fd2807SJeff Garzik /* Reset is represented by combination of actions and EHI 1066c6fd2807SJeff Garzik * flags. Suck in all related bits before clearing eh_info to 1067c6fd2807SJeff Garzik * avoid losing requested action. 1068c6fd2807SJeff Garzik */ 1069c6fd2807SJeff Garzik if (action & ATA_EH_RESET_MASK) { 1070c6fd2807SJeff Garzik ehc->i.action |= ehi->action & ATA_EH_RESET_MASK; 1071c6fd2807SJeff Garzik ehc->i.flags |= ehi->flags & ATA_EHI_RESET_MODIFIER_MASK; 1072c6fd2807SJeff Garzik 1073c6fd2807SJeff Garzik /* make sure all reset actions are cleared & clear EHI flags */ 1074c6fd2807SJeff Garzik action |= ATA_EH_RESET_MASK; 1075c6fd2807SJeff Garzik ehi->flags &= ~ATA_EHI_RESET_MODIFIER_MASK; 1076c6fd2807SJeff Garzik } 1077c6fd2807SJeff Garzik 1078955e57dfSTejun Heo ata_eh_clear_action(link, dev, ehi, action); 1079c6fd2807SJeff Garzik 1080c6fd2807SJeff Garzik if (!(ehc->i.flags & ATA_EHI_QUIET)) 1081c6fd2807SJeff Garzik ap->pflags |= ATA_PFLAG_RECOVERED; 1082c6fd2807SJeff Garzik 1083c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 1084c6fd2807SJeff Garzik } 1085c6fd2807SJeff Garzik 1086c6fd2807SJeff Garzik /** 1087c6fd2807SJeff Garzik * ata_eh_done - EH action complete 1088c6fd2807SJeff Garzik * @ap: target ATA port 1089c6fd2807SJeff Garzik * @dev: target ATA dev for per-dev action (can be NULL) 1090c6fd2807SJeff Garzik * @action: action just completed 1091c6fd2807SJeff Garzik * 1092c6fd2807SJeff Garzik * Called right after performing EH actions to clear related bits 1093955e57dfSTejun Heo * in @link->eh_context. 1094c6fd2807SJeff Garzik * 1095c6fd2807SJeff Garzik * LOCKING: 1096c6fd2807SJeff Garzik * None. 1097c6fd2807SJeff Garzik */ 1098955e57dfSTejun Heo static void ata_eh_done(struct ata_link *link, struct ata_device *dev, 1099c6fd2807SJeff Garzik unsigned int action) 1100c6fd2807SJeff Garzik { 1101955e57dfSTejun Heo struct ata_eh_context *ehc = &link->eh_context; 11029af5c9c9STejun Heo 1103c6fd2807SJeff Garzik /* if reset is complete, clear all reset actions & reset modifier */ 1104c6fd2807SJeff Garzik if (action & ATA_EH_RESET_MASK) { 1105c6fd2807SJeff Garzik action |= ATA_EH_RESET_MASK; 11069af5c9c9STejun Heo ehc->i.flags &= ~ATA_EHI_RESET_MODIFIER_MASK; 1107c6fd2807SJeff Garzik } 1108c6fd2807SJeff Garzik 1109955e57dfSTejun Heo ata_eh_clear_action(link, dev, &ehc->i, action); 1110c6fd2807SJeff Garzik } 1111c6fd2807SJeff Garzik 1112c6fd2807SJeff Garzik /** 1113c6fd2807SJeff Garzik * ata_err_string - convert err_mask to descriptive string 1114c6fd2807SJeff Garzik * @err_mask: error mask to convert to string 1115c6fd2807SJeff Garzik * 1116c6fd2807SJeff Garzik * Convert @err_mask to descriptive string. Errors are 1117c6fd2807SJeff Garzik * prioritized according to severity and only the most severe 1118c6fd2807SJeff Garzik * error is reported. 1119c6fd2807SJeff Garzik * 1120c6fd2807SJeff Garzik * LOCKING: 1121c6fd2807SJeff Garzik * None. 1122c6fd2807SJeff Garzik * 1123c6fd2807SJeff Garzik * RETURNS: 1124c6fd2807SJeff Garzik * Descriptive string for @err_mask 1125c6fd2807SJeff Garzik */ 1126c6fd2807SJeff Garzik static const char * ata_err_string(unsigned int err_mask) 1127c6fd2807SJeff Garzik { 1128c6fd2807SJeff Garzik if (err_mask & AC_ERR_HOST_BUS) 1129c6fd2807SJeff Garzik return "host bus error"; 1130c6fd2807SJeff Garzik if (err_mask & AC_ERR_ATA_BUS) 1131c6fd2807SJeff Garzik return "ATA bus error"; 1132c6fd2807SJeff Garzik if (err_mask & AC_ERR_TIMEOUT) 1133c6fd2807SJeff Garzik return "timeout"; 1134c6fd2807SJeff Garzik if (err_mask & AC_ERR_HSM) 1135c6fd2807SJeff Garzik return "HSM violation"; 1136c6fd2807SJeff Garzik if (err_mask & AC_ERR_SYSTEM) 1137c6fd2807SJeff Garzik return "internal error"; 1138c6fd2807SJeff Garzik if (err_mask & AC_ERR_MEDIA) 1139c6fd2807SJeff Garzik return "media error"; 1140c6fd2807SJeff Garzik if (err_mask & AC_ERR_INVALID) 1141c6fd2807SJeff Garzik return "invalid argument"; 1142c6fd2807SJeff Garzik if (err_mask & AC_ERR_DEV) 1143c6fd2807SJeff Garzik return "device error"; 1144c6fd2807SJeff Garzik return "unknown error"; 1145c6fd2807SJeff Garzik } 1146c6fd2807SJeff Garzik 1147c6fd2807SJeff Garzik /** 1148c6fd2807SJeff Garzik * ata_read_log_page - read a specific log page 1149c6fd2807SJeff Garzik * @dev: target device 1150c6fd2807SJeff Garzik * @page: page to read 1151c6fd2807SJeff Garzik * @buf: buffer to store read page 1152c6fd2807SJeff Garzik * @sectors: number of sectors to read 1153c6fd2807SJeff Garzik * 1154c6fd2807SJeff Garzik * Read log page using READ_LOG_EXT command. 1155c6fd2807SJeff Garzik * 1156c6fd2807SJeff Garzik * LOCKING: 1157c6fd2807SJeff Garzik * Kernel thread context (may sleep). 1158c6fd2807SJeff Garzik * 1159c6fd2807SJeff Garzik * RETURNS: 1160c6fd2807SJeff Garzik * 0 on success, AC_ERR_* mask otherwise. 1161c6fd2807SJeff Garzik */ 1162c6fd2807SJeff Garzik static unsigned int ata_read_log_page(struct ata_device *dev, 1163c6fd2807SJeff Garzik u8 page, void *buf, unsigned int sectors) 1164c6fd2807SJeff Garzik { 1165c6fd2807SJeff Garzik struct ata_taskfile tf; 1166c6fd2807SJeff Garzik unsigned int err_mask; 1167c6fd2807SJeff Garzik 1168c6fd2807SJeff Garzik DPRINTK("read log page - page %d\n", page); 1169c6fd2807SJeff Garzik 1170c6fd2807SJeff Garzik ata_tf_init(dev, &tf); 1171c6fd2807SJeff Garzik tf.command = ATA_CMD_READ_LOG_EXT; 1172c6fd2807SJeff Garzik tf.lbal = page; 1173c6fd2807SJeff Garzik tf.nsect = sectors; 1174c6fd2807SJeff Garzik tf.hob_nsect = sectors >> 8; 1175c6fd2807SJeff Garzik tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_LBA48 | ATA_TFLAG_DEVICE; 1176c6fd2807SJeff Garzik tf.protocol = ATA_PROT_PIO; 1177c6fd2807SJeff Garzik 1178c6fd2807SJeff Garzik err_mask = ata_exec_internal(dev, &tf, NULL, DMA_FROM_DEVICE, 1179c6fd2807SJeff Garzik buf, sectors * ATA_SECT_SIZE); 1180c6fd2807SJeff Garzik 1181c6fd2807SJeff Garzik DPRINTK("EXIT, err_mask=%x\n", err_mask); 1182c6fd2807SJeff Garzik return err_mask; 1183c6fd2807SJeff Garzik } 1184c6fd2807SJeff Garzik 1185c6fd2807SJeff Garzik /** 1186c6fd2807SJeff Garzik * ata_eh_read_log_10h - Read log page 10h for NCQ error details 1187c6fd2807SJeff Garzik * @dev: Device to read log page 10h from 1188c6fd2807SJeff Garzik * @tag: Resulting tag of the failed command 1189c6fd2807SJeff Garzik * @tf: Resulting taskfile registers of the failed command 1190c6fd2807SJeff Garzik * 1191c6fd2807SJeff Garzik * Read log page 10h to obtain NCQ error details and clear error 1192c6fd2807SJeff Garzik * condition. 1193c6fd2807SJeff Garzik * 1194c6fd2807SJeff Garzik * LOCKING: 1195c6fd2807SJeff Garzik * Kernel thread context (may sleep). 1196c6fd2807SJeff Garzik * 1197c6fd2807SJeff Garzik * RETURNS: 1198c6fd2807SJeff Garzik * 0 on success, -errno otherwise. 1199c6fd2807SJeff Garzik */ 1200c6fd2807SJeff Garzik static int ata_eh_read_log_10h(struct ata_device *dev, 1201c6fd2807SJeff Garzik int *tag, struct ata_taskfile *tf) 1202c6fd2807SJeff Garzik { 12039af5c9c9STejun Heo u8 *buf = dev->link->ap->sector_buf; 1204c6fd2807SJeff Garzik unsigned int err_mask; 1205c6fd2807SJeff Garzik u8 csum; 1206c6fd2807SJeff Garzik int i; 1207c6fd2807SJeff Garzik 1208c6fd2807SJeff Garzik err_mask = ata_read_log_page(dev, ATA_LOG_SATA_NCQ, buf, 1); 1209c6fd2807SJeff Garzik if (err_mask) 1210c6fd2807SJeff Garzik return -EIO; 1211c6fd2807SJeff Garzik 1212c6fd2807SJeff Garzik csum = 0; 1213c6fd2807SJeff Garzik for (i = 0; i < ATA_SECT_SIZE; i++) 1214c6fd2807SJeff Garzik csum += buf[i]; 1215c6fd2807SJeff Garzik if (csum) 1216c6fd2807SJeff Garzik ata_dev_printk(dev, KERN_WARNING, 1217c6fd2807SJeff Garzik "invalid checksum 0x%x on log page 10h\n", csum); 1218c6fd2807SJeff Garzik 1219c6fd2807SJeff Garzik if (buf[0] & 0x80) 1220c6fd2807SJeff Garzik return -ENOENT; 1221c6fd2807SJeff Garzik 1222c6fd2807SJeff Garzik *tag = buf[0] & 0x1f; 1223c6fd2807SJeff Garzik 1224c6fd2807SJeff Garzik tf->command = buf[2]; 1225c6fd2807SJeff Garzik tf->feature = buf[3]; 1226c6fd2807SJeff Garzik tf->lbal = buf[4]; 1227c6fd2807SJeff Garzik tf->lbam = buf[5]; 1228c6fd2807SJeff Garzik tf->lbah = buf[6]; 1229c6fd2807SJeff Garzik tf->device = buf[7]; 1230c6fd2807SJeff Garzik tf->hob_lbal = buf[8]; 1231c6fd2807SJeff Garzik tf->hob_lbam = buf[9]; 1232c6fd2807SJeff Garzik tf->hob_lbah = buf[10]; 1233c6fd2807SJeff Garzik tf->nsect = buf[12]; 1234c6fd2807SJeff Garzik tf->hob_nsect = buf[13]; 1235c6fd2807SJeff Garzik 1236c6fd2807SJeff Garzik return 0; 1237c6fd2807SJeff Garzik } 1238c6fd2807SJeff Garzik 1239c6fd2807SJeff Garzik /** 1240c6fd2807SJeff Garzik * atapi_eh_request_sense - perform ATAPI REQUEST_SENSE 1241c6fd2807SJeff Garzik * @dev: device to perform REQUEST_SENSE to 1242c6fd2807SJeff Garzik * @sense_buf: result sense data buffer (SCSI_SENSE_BUFFERSIZE bytes long) 1243c6fd2807SJeff Garzik * 1244c6fd2807SJeff Garzik * Perform ATAPI REQUEST_SENSE after the device reported CHECK 1245c6fd2807SJeff Garzik * SENSE. This function is EH helper. 1246c6fd2807SJeff Garzik * 1247c6fd2807SJeff Garzik * LOCKING: 1248c6fd2807SJeff Garzik * Kernel thread context (may sleep). 1249c6fd2807SJeff Garzik * 1250c6fd2807SJeff Garzik * RETURNS: 1251c6fd2807SJeff Garzik * 0 on success, AC_ERR_* mask on failure 1252c6fd2807SJeff Garzik */ 125356287768SAlbert Lee static unsigned int atapi_eh_request_sense(struct ata_queued_cmd *qc) 1254c6fd2807SJeff Garzik { 125556287768SAlbert Lee struct ata_device *dev = qc->dev; 125656287768SAlbert Lee unsigned char *sense_buf = qc->scsicmd->sense_buffer; 12579af5c9c9STejun Heo struct ata_port *ap = dev->link->ap; 1258c6fd2807SJeff Garzik struct ata_taskfile tf; 1259c6fd2807SJeff Garzik u8 cdb[ATAPI_CDB_LEN]; 1260c6fd2807SJeff Garzik 1261c6fd2807SJeff Garzik DPRINTK("ATAPI request sense\n"); 1262c6fd2807SJeff Garzik 1263c6fd2807SJeff Garzik /* FIXME: is this needed? */ 1264c6fd2807SJeff Garzik memset(sense_buf, 0, SCSI_SENSE_BUFFERSIZE); 1265c6fd2807SJeff Garzik 126656287768SAlbert Lee /* initialize sense_buf with the error register, 126756287768SAlbert Lee * for the case where they are -not- overwritten 126856287768SAlbert Lee */ 1269c6fd2807SJeff Garzik sense_buf[0] = 0x70; 127056287768SAlbert Lee sense_buf[2] = qc->result_tf.feature >> 4; 127156287768SAlbert Lee 127256287768SAlbert Lee /* some devices time out if garbage left in tf */ 127356287768SAlbert Lee ata_tf_init(dev, &tf); 1274c6fd2807SJeff Garzik 1275c6fd2807SJeff Garzik memset(cdb, 0, ATAPI_CDB_LEN); 1276c6fd2807SJeff Garzik cdb[0] = REQUEST_SENSE; 1277c6fd2807SJeff Garzik cdb[4] = SCSI_SENSE_BUFFERSIZE; 1278c6fd2807SJeff Garzik 1279c6fd2807SJeff Garzik tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE; 1280c6fd2807SJeff Garzik tf.command = ATA_CMD_PACKET; 1281c6fd2807SJeff Garzik 1282c6fd2807SJeff Garzik /* is it pointless to prefer PIO for "safety reasons"? */ 1283c6fd2807SJeff Garzik if (ap->flags & ATA_FLAG_PIO_DMA) { 1284c6fd2807SJeff Garzik tf.protocol = ATA_PROT_ATAPI_DMA; 1285c6fd2807SJeff Garzik tf.feature |= ATAPI_PKT_DMA; 1286c6fd2807SJeff Garzik } else { 1287c6fd2807SJeff Garzik tf.protocol = ATA_PROT_ATAPI; 1288c6fd2807SJeff Garzik tf.lbam = (8 * 1024) & 0xff; 1289c6fd2807SJeff Garzik tf.lbah = (8 * 1024) >> 8; 1290c6fd2807SJeff Garzik } 1291c6fd2807SJeff Garzik 1292c6fd2807SJeff Garzik return ata_exec_internal(dev, &tf, cdb, DMA_FROM_DEVICE, 1293c6fd2807SJeff Garzik sense_buf, SCSI_SENSE_BUFFERSIZE); 1294c6fd2807SJeff Garzik } 1295c6fd2807SJeff Garzik 1296c6fd2807SJeff Garzik /** 1297c6fd2807SJeff Garzik * ata_eh_analyze_serror - analyze SError for a failed port 12980260731fSTejun Heo * @link: ATA link to analyze SError for 1299c6fd2807SJeff Garzik * 1300c6fd2807SJeff Garzik * Analyze SError if available and further determine cause of 1301c6fd2807SJeff Garzik * failure. 1302c6fd2807SJeff Garzik * 1303c6fd2807SJeff Garzik * LOCKING: 1304c6fd2807SJeff Garzik * None. 1305c6fd2807SJeff Garzik */ 13060260731fSTejun Heo static void ata_eh_analyze_serror(struct ata_link *link) 1307c6fd2807SJeff Garzik { 13080260731fSTejun Heo struct ata_eh_context *ehc = &link->eh_context; 1309c6fd2807SJeff Garzik u32 serror = ehc->i.serror; 1310c6fd2807SJeff Garzik unsigned int err_mask = 0, action = 0; 1311c6fd2807SJeff Garzik 1312c6fd2807SJeff Garzik if (serror & SERR_PERSISTENT) { 1313c6fd2807SJeff Garzik err_mask |= AC_ERR_ATA_BUS; 1314c6fd2807SJeff Garzik action |= ATA_EH_HARDRESET; 1315c6fd2807SJeff Garzik } 1316c6fd2807SJeff Garzik if (serror & 1317c6fd2807SJeff Garzik (SERR_DATA_RECOVERED | SERR_COMM_RECOVERED | SERR_DATA)) { 1318c6fd2807SJeff Garzik err_mask |= AC_ERR_ATA_BUS; 1319c6fd2807SJeff Garzik action |= ATA_EH_SOFTRESET; 1320c6fd2807SJeff Garzik } 1321c6fd2807SJeff Garzik if (serror & SERR_PROTOCOL) { 1322c6fd2807SJeff Garzik err_mask |= AC_ERR_HSM; 1323c6fd2807SJeff Garzik action |= ATA_EH_SOFTRESET; 1324c6fd2807SJeff Garzik } 1325c6fd2807SJeff Garzik if (serror & SERR_INTERNAL) { 1326c6fd2807SJeff Garzik err_mask |= AC_ERR_SYSTEM; 1327771b8dadSTejun Heo action |= ATA_EH_HARDRESET; 1328c6fd2807SJeff Garzik } 1329c6fd2807SJeff Garzik if (serror & (SERR_PHYRDY_CHG | SERR_DEV_XCHG)) 1330c6fd2807SJeff Garzik ata_ehi_hotplugged(&ehc->i); 1331c6fd2807SJeff Garzik 1332c6fd2807SJeff Garzik ehc->i.err_mask |= err_mask; 1333c6fd2807SJeff Garzik ehc->i.action |= action; 1334c6fd2807SJeff Garzik } 1335c6fd2807SJeff Garzik 1336c6fd2807SJeff Garzik /** 1337c6fd2807SJeff Garzik * ata_eh_analyze_ncq_error - analyze NCQ error 13380260731fSTejun Heo * @link: ATA link to analyze NCQ error for 1339c6fd2807SJeff Garzik * 1340c6fd2807SJeff Garzik * Read log page 10h, determine the offending qc and acquire 1341c6fd2807SJeff Garzik * error status TF. For NCQ device errors, all LLDDs have to do 1342c6fd2807SJeff Garzik * is setting AC_ERR_DEV in ehi->err_mask. This function takes 1343c6fd2807SJeff Garzik * care of the rest. 1344c6fd2807SJeff Garzik * 1345c6fd2807SJeff Garzik * LOCKING: 1346c6fd2807SJeff Garzik * Kernel thread context (may sleep). 1347c6fd2807SJeff Garzik */ 13480260731fSTejun Heo static void ata_eh_analyze_ncq_error(struct ata_link *link) 1349c6fd2807SJeff Garzik { 13500260731fSTejun Heo struct ata_port *ap = link->ap; 13510260731fSTejun Heo struct ata_eh_context *ehc = &link->eh_context; 13520260731fSTejun Heo struct ata_device *dev = link->device; 1353c6fd2807SJeff Garzik struct ata_queued_cmd *qc; 1354c6fd2807SJeff Garzik struct ata_taskfile tf; 1355c6fd2807SJeff Garzik int tag, rc; 1356c6fd2807SJeff Garzik 1357c6fd2807SJeff Garzik /* if frozen, we can't do much */ 1358c6fd2807SJeff Garzik if (ap->pflags & ATA_PFLAG_FROZEN) 1359c6fd2807SJeff Garzik return; 1360c6fd2807SJeff Garzik 1361c6fd2807SJeff Garzik /* is it NCQ device error? */ 13620260731fSTejun Heo if (!link->sactive || !(ehc->i.err_mask & AC_ERR_DEV)) 1363c6fd2807SJeff Garzik return; 1364c6fd2807SJeff Garzik 1365c6fd2807SJeff Garzik /* has LLDD analyzed already? */ 1366c6fd2807SJeff Garzik for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 1367c6fd2807SJeff Garzik qc = __ata_qc_from_tag(ap, tag); 1368c6fd2807SJeff Garzik 1369c6fd2807SJeff Garzik if (!(qc->flags & ATA_QCFLAG_FAILED)) 1370c6fd2807SJeff Garzik continue; 1371c6fd2807SJeff Garzik 1372c6fd2807SJeff Garzik if (qc->err_mask) 1373c6fd2807SJeff Garzik return; 1374c6fd2807SJeff Garzik } 1375c6fd2807SJeff Garzik 1376c6fd2807SJeff Garzik /* okay, this error is ours */ 1377c6fd2807SJeff Garzik rc = ata_eh_read_log_10h(dev, &tag, &tf); 1378c6fd2807SJeff Garzik if (rc) { 13790260731fSTejun Heo ata_link_printk(link, KERN_ERR, "failed to read log page 10h " 1380c6fd2807SJeff Garzik "(errno=%d)\n", rc); 1381c6fd2807SJeff Garzik return; 1382c6fd2807SJeff Garzik } 1383c6fd2807SJeff Garzik 13840260731fSTejun Heo if (!(link->sactive & (1 << tag))) { 13850260731fSTejun Heo ata_link_printk(link, KERN_ERR, "log page 10h reported " 1386c6fd2807SJeff Garzik "inactive tag %d\n", tag); 1387c6fd2807SJeff Garzik return; 1388c6fd2807SJeff Garzik } 1389c6fd2807SJeff Garzik 1390c6fd2807SJeff Garzik /* we've got the perpetrator, condemn it */ 1391c6fd2807SJeff Garzik qc = __ata_qc_from_tag(ap, tag); 1392c6fd2807SJeff Garzik memcpy(&qc->result_tf, &tf, sizeof(tf)); 13935335b729STejun Heo qc->err_mask |= AC_ERR_DEV | AC_ERR_NCQ; 1394c6fd2807SJeff Garzik ehc->i.err_mask &= ~AC_ERR_DEV; 1395c6fd2807SJeff Garzik } 1396c6fd2807SJeff Garzik 1397c6fd2807SJeff Garzik /** 1398c6fd2807SJeff Garzik * ata_eh_analyze_tf - analyze taskfile of a failed qc 1399c6fd2807SJeff Garzik * @qc: qc to analyze 1400c6fd2807SJeff Garzik * @tf: Taskfile registers to analyze 1401c6fd2807SJeff Garzik * 1402c6fd2807SJeff Garzik * Analyze taskfile of @qc and further determine cause of 1403c6fd2807SJeff Garzik * failure. This function also requests ATAPI sense data if 1404c6fd2807SJeff Garzik * avaliable. 1405c6fd2807SJeff Garzik * 1406c6fd2807SJeff Garzik * LOCKING: 1407c6fd2807SJeff Garzik * Kernel thread context (may sleep). 1408c6fd2807SJeff Garzik * 1409c6fd2807SJeff Garzik * RETURNS: 1410c6fd2807SJeff Garzik * Determined recovery action 1411c6fd2807SJeff Garzik */ 1412c6fd2807SJeff Garzik static unsigned int ata_eh_analyze_tf(struct ata_queued_cmd *qc, 1413c6fd2807SJeff Garzik const struct ata_taskfile *tf) 1414c6fd2807SJeff Garzik { 1415c6fd2807SJeff Garzik unsigned int tmp, action = 0; 1416c6fd2807SJeff Garzik u8 stat = tf->command, err = tf->feature; 1417c6fd2807SJeff Garzik 1418c6fd2807SJeff Garzik if ((stat & (ATA_BUSY | ATA_DRQ | ATA_DRDY)) != ATA_DRDY) { 1419c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_HSM; 1420c6fd2807SJeff Garzik return ATA_EH_SOFTRESET; 1421c6fd2807SJeff Garzik } 1422c6fd2807SJeff Garzik 1423a51d644aSTejun Heo if (stat & (ATA_ERR | ATA_DF)) 1424a51d644aSTejun Heo qc->err_mask |= AC_ERR_DEV; 1425a51d644aSTejun Heo else 1426c6fd2807SJeff Garzik return 0; 1427c6fd2807SJeff Garzik 1428c6fd2807SJeff Garzik switch (qc->dev->class) { 1429c6fd2807SJeff Garzik case ATA_DEV_ATA: 1430c6fd2807SJeff Garzik if (err & ATA_ICRC) 1431c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_ATA_BUS; 1432c6fd2807SJeff Garzik if (err & ATA_UNC) 1433c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_MEDIA; 1434c6fd2807SJeff Garzik if (err & ATA_IDNF) 1435c6fd2807SJeff Garzik qc->err_mask |= AC_ERR_INVALID; 1436c6fd2807SJeff Garzik break; 1437c6fd2807SJeff Garzik 1438c6fd2807SJeff Garzik case ATA_DEV_ATAPI: 1439a569a30dSTejun Heo if (!(qc->ap->pflags & ATA_PFLAG_FROZEN)) { 144056287768SAlbert Lee tmp = atapi_eh_request_sense(qc); 1441c6fd2807SJeff Garzik if (!tmp) { 1442a569a30dSTejun Heo /* ATA_QCFLAG_SENSE_VALID is used to 1443a569a30dSTejun Heo * tell atapi_qc_complete() that sense 1444a569a30dSTejun Heo * data is already valid. 1445c6fd2807SJeff Garzik * 1446c6fd2807SJeff Garzik * TODO: interpret sense data and set 1447c6fd2807SJeff Garzik * appropriate err_mask. 1448c6fd2807SJeff Garzik */ 1449c6fd2807SJeff Garzik qc->flags |= ATA_QCFLAG_SENSE_VALID; 1450c6fd2807SJeff Garzik } else 1451c6fd2807SJeff Garzik qc->err_mask |= tmp; 1452c6fd2807SJeff Garzik } 1453a569a30dSTejun Heo } 1454c6fd2807SJeff Garzik 1455c6fd2807SJeff Garzik if (qc->err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT | AC_ERR_ATA_BUS)) 1456c6fd2807SJeff Garzik action |= ATA_EH_SOFTRESET; 1457c6fd2807SJeff Garzik 1458c6fd2807SJeff Garzik return action; 1459c6fd2807SJeff Garzik } 1460c6fd2807SJeff Garzik 14617d47e8d4STejun Heo static int ata_eh_categorize_error(int is_io, unsigned int err_mask) 1462c6fd2807SJeff Garzik { 14637d47e8d4STejun Heo if (err_mask & AC_ERR_ATA_BUS) 1464c6fd2807SJeff Garzik return 1; 1465c6fd2807SJeff Garzik 14667d47e8d4STejun Heo if (err_mask & AC_ERR_TIMEOUT) 1467c6fd2807SJeff Garzik return 2; 14687d47e8d4STejun Heo 14697d47e8d4STejun Heo if (is_io) { 14707d47e8d4STejun Heo if (err_mask & AC_ERR_HSM) 14717d47e8d4STejun Heo return 2; 14727d47e8d4STejun Heo if ((err_mask & 14737d47e8d4STejun Heo (AC_ERR_DEV|AC_ERR_MEDIA|AC_ERR_INVALID)) == AC_ERR_DEV) 14747d47e8d4STejun Heo return 3; 1475c6fd2807SJeff Garzik } 1476c6fd2807SJeff Garzik 1477c6fd2807SJeff Garzik return 0; 1478c6fd2807SJeff Garzik } 1479c6fd2807SJeff Garzik 14807d47e8d4STejun Heo struct speed_down_verdict_arg { 1481c6fd2807SJeff Garzik u64 since; 14827d47e8d4STejun Heo int nr_errors[4]; 1483c6fd2807SJeff Garzik }; 1484c6fd2807SJeff Garzik 14857d47e8d4STejun Heo static int speed_down_verdict_cb(struct ata_ering_entry *ent, void *void_arg) 1486c6fd2807SJeff Garzik { 14877d47e8d4STejun Heo struct speed_down_verdict_arg *arg = void_arg; 14887d47e8d4STejun Heo int cat = ata_eh_categorize_error(ent->is_io, ent->err_mask); 1489c6fd2807SJeff Garzik 1490c6fd2807SJeff Garzik if (ent->timestamp < arg->since) 1491c6fd2807SJeff Garzik return -1; 1492c6fd2807SJeff Garzik 14937d47e8d4STejun Heo arg->nr_errors[cat]++; 1494c6fd2807SJeff Garzik return 0; 1495c6fd2807SJeff Garzik } 1496c6fd2807SJeff Garzik 1497c6fd2807SJeff Garzik /** 14987d47e8d4STejun Heo * ata_eh_speed_down_verdict - Determine speed down verdict 1499c6fd2807SJeff Garzik * @dev: Device of interest 1500c6fd2807SJeff Garzik * 1501c6fd2807SJeff Garzik * This function examines error ring of @dev and determines 15027d47e8d4STejun Heo * whether NCQ needs to be turned off, transfer speed should be 15037d47e8d4STejun Heo * stepped down, or falling back to PIO is necessary. 1504c6fd2807SJeff Garzik * 15057d47e8d4STejun Heo * Cat-1 is ATA_BUS error for any command. 1506c6fd2807SJeff Garzik * 15077d47e8d4STejun Heo * Cat-2 is TIMEOUT for any command or HSM violation for known 15087d47e8d4STejun Heo * supported commands. 15097d47e8d4STejun Heo * 15107d47e8d4STejun Heo * Cat-3 is is unclassified DEV error for known supported 1511c6fd2807SJeff Garzik * command. 1512c6fd2807SJeff Garzik * 15137d47e8d4STejun Heo * NCQ needs to be turned off if there have been more than 3 15147d47e8d4STejun Heo * Cat-2 + Cat-3 errors during last 10 minutes. 15157d47e8d4STejun Heo * 15167d47e8d4STejun Heo * Speed down is necessary if there have been more than 3 Cat-1 + 15177d47e8d4STejun Heo * Cat-2 errors or 10 Cat-3 errors during last 10 minutes. 15187d47e8d4STejun Heo * 15197d47e8d4STejun Heo * Falling back to PIO mode is necessary if there have been more 15207d47e8d4STejun Heo * than 10 Cat-1 + Cat-2 + Cat-3 errors during last 5 minutes. 15217d47e8d4STejun Heo * 1522c6fd2807SJeff Garzik * LOCKING: 1523c6fd2807SJeff Garzik * Inherited from caller. 1524c6fd2807SJeff Garzik * 1525c6fd2807SJeff Garzik * RETURNS: 15267d47e8d4STejun Heo * OR of ATA_EH_SPDN_* flags. 1527c6fd2807SJeff Garzik */ 15287d47e8d4STejun Heo static unsigned int ata_eh_speed_down_verdict(struct ata_device *dev) 1529c6fd2807SJeff Garzik { 15307d47e8d4STejun Heo const u64 j5mins = 5LLU * 60 * HZ, j10mins = 10LLU * 60 * HZ; 15317d47e8d4STejun Heo u64 j64 = get_jiffies_64(); 15327d47e8d4STejun Heo struct speed_down_verdict_arg arg; 15337d47e8d4STejun Heo unsigned int verdict = 0; 1534c6fd2807SJeff Garzik 15357d47e8d4STejun Heo /* scan past 10 mins of error history */ 1536c6fd2807SJeff Garzik memset(&arg, 0, sizeof(arg)); 15377d47e8d4STejun Heo arg.since = j64 - min(j64, j10mins); 15387d47e8d4STejun Heo ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg); 1539c6fd2807SJeff Garzik 15407d47e8d4STejun Heo if (arg.nr_errors[2] + arg.nr_errors[3] > 3) 15417d47e8d4STejun Heo verdict |= ATA_EH_SPDN_NCQ_OFF; 15427d47e8d4STejun Heo if (arg.nr_errors[1] + arg.nr_errors[2] > 3 || arg.nr_errors[3] > 10) 15437d47e8d4STejun Heo verdict |= ATA_EH_SPDN_SPEED_DOWN; 1544c6fd2807SJeff Garzik 15457d47e8d4STejun Heo /* scan past 3 mins of error history */ 15467d47e8d4STejun Heo memset(&arg, 0, sizeof(arg)); 15477d47e8d4STejun Heo arg.since = j64 - min(j64, j5mins); 15487d47e8d4STejun Heo ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg); 1549c6fd2807SJeff Garzik 15507d47e8d4STejun Heo if (arg.nr_errors[1] + arg.nr_errors[2] + arg.nr_errors[3] > 10) 15517d47e8d4STejun Heo verdict |= ATA_EH_SPDN_FALLBACK_TO_PIO; 15527d47e8d4STejun Heo 15537d47e8d4STejun Heo return verdict; 1554c6fd2807SJeff Garzik } 1555c6fd2807SJeff Garzik 1556c6fd2807SJeff Garzik /** 1557c6fd2807SJeff Garzik * ata_eh_speed_down - record error and speed down if necessary 1558c6fd2807SJeff Garzik * @dev: Failed device 1559c6fd2807SJeff Garzik * @is_io: Did the device fail during normal IO? 1560c6fd2807SJeff Garzik * @err_mask: err_mask of the error 1561c6fd2807SJeff Garzik * 1562c6fd2807SJeff Garzik * Record error and examine error history to determine whether 1563c6fd2807SJeff Garzik * adjusting transmission speed is necessary. It also sets 1564c6fd2807SJeff Garzik * transmission limits appropriately if such adjustment is 1565c6fd2807SJeff Garzik * necessary. 1566c6fd2807SJeff Garzik * 1567c6fd2807SJeff Garzik * LOCKING: 1568c6fd2807SJeff Garzik * Kernel thread context (may sleep). 1569c6fd2807SJeff Garzik * 1570c6fd2807SJeff Garzik * RETURNS: 15717d47e8d4STejun Heo * Determined recovery action. 1572c6fd2807SJeff Garzik */ 15737d47e8d4STejun Heo static unsigned int ata_eh_speed_down(struct ata_device *dev, int is_io, 1574c6fd2807SJeff Garzik unsigned int err_mask) 1575c6fd2807SJeff Garzik { 15767d47e8d4STejun Heo unsigned int verdict; 15777d47e8d4STejun Heo unsigned int action = 0; 15787d47e8d4STejun Heo 15797d47e8d4STejun Heo /* don't bother if Cat-0 error */ 15807d47e8d4STejun Heo if (ata_eh_categorize_error(is_io, err_mask) == 0) 1581c6fd2807SJeff Garzik return 0; 1582c6fd2807SJeff Garzik 1583c6fd2807SJeff Garzik /* record error and determine whether speed down is necessary */ 1584c6fd2807SJeff Garzik ata_ering_record(&dev->ering, is_io, err_mask); 15857d47e8d4STejun Heo verdict = ata_eh_speed_down_verdict(dev); 1586c6fd2807SJeff Garzik 15877d47e8d4STejun Heo /* turn off NCQ? */ 15887d47e8d4STejun Heo if ((verdict & ATA_EH_SPDN_NCQ_OFF) && 15897d47e8d4STejun Heo (dev->flags & (ATA_DFLAG_PIO | ATA_DFLAG_NCQ | 15907d47e8d4STejun Heo ATA_DFLAG_NCQ_OFF)) == ATA_DFLAG_NCQ) { 15917d47e8d4STejun Heo dev->flags |= ATA_DFLAG_NCQ_OFF; 15927d47e8d4STejun Heo ata_dev_printk(dev, KERN_WARNING, 15937d47e8d4STejun Heo "NCQ disabled due to excessive errors\n"); 15947d47e8d4STejun Heo goto done; 15957d47e8d4STejun Heo } 1596c6fd2807SJeff Garzik 15977d47e8d4STejun Heo /* speed down? */ 15987d47e8d4STejun Heo if (verdict & ATA_EH_SPDN_SPEED_DOWN) { 1599c6fd2807SJeff Garzik /* speed down SATA link speed if possible */ 1600936fd732STejun Heo if (sata_down_spd_limit(dev->link) == 0) { 16017d47e8d4STejun Heo action |= ATA_EH_HARDRESET; 16027d47e8d4STejun Heo goto done; 16037d47e8d4STejun Heo } 1604c6fd2807SJeff Garzik 1605c6fd2807SJeff Garzik /* lower transfer mode */ 16067d47e8d4STejun Heo if (dev->spdn_cnt < 2) { 16077d47e8d4STejun Heo static const int dma_dnxfer_sel[] = 16087d47e8d4STejun Heo { ATA_DNXFER_DMA, ATA_DNXFER_40C }; 16097d47e8d4STejun Heo static const int pio_dnxfer_sel[] = 16107d47e8d4STejun Heo { ATA_DNXFER_PIO, ATA_DNXFER_FORCE_PIO0 }; 16117d47e8d4STejun Heo int sel; 1612c6fd2807SJeff Garzik 16137d47e8d4STejun Heo if (dev->xfer_shift != ATA_SHIFT_PIO) 16147d47e8d4STejun Heo sel = dma_dnxfer_sel[dev->spdn_cnt]; 16157d47e8d4STejun Heo else 16167d47e8d4STejun Heo sel = pio_dnxfer_sel[dev->spdn_cnt]; 16177d47e8d4STejun Heo 16187d47e8d4STejun Heo dev->spdn_cnt++; 16197d47e8d4STejun Heo 16207d47e8d4STejun Heo if (ata_down_xfermask_limit(dev, sel) == 0) { 16217d47e8d4STejun Heo action |= ATA_EH_SOFTRESET; 16227d47e8d4STejun Heo goto done; 16237d47e8d4STejun Heo } 16247d47e8d4STejun Heo } 16257d47e8d4STejun Heo } 16267d47e8d4STejun Heo 16277d47e8d4STejun Heo /* Fall back to PIO? Slowing down to PIO is meaningless for 16287d47e8d4STejun Heo * SATA. Consider it only for PATA. 16297d47e8d4STejun Heo */ 16307d47e8d4STejun Heo if ((verdict & ATA_EH_SPDN_FALLBACK_TO_PIO) && (dev->spdn_cnt >= 2) && 16319af5c9c9STejun Heo (dev->link->ap->cbl != ATA_CBL_SATA) && 16327d47e8d4STejun Heo (dev->xfer_shift != ATA_SHIFT_PIO)) { 16337d47e8d4STejun Heo if (ata_down_xfermask_limit(dev, ATA_DNXFER_FORCE_PIO) == 0) { 16347d47e8d4STejun Heo dev->spdn_cnt = 0; 16357d47e8d4STejun Heo action |= ATA_EH_SOFTRESET; 16367d47e8d4STejun Heo goto done; 16377d47e8d4STejun Heo } 16387d47e8d4STejun Heo } 16397d47e8d4STejun Heo 1640c6fd2807SJeff Garzik return 0; 16417d47e8d4STejun Heo done: 16427d47e8d4STejun Heo /* device has been slowed down, blow error history */ 16437d47e8d4STejun Heo ata_ering_clear(&dev->ering); 16447d47e8d4STejun Heo return action; 1645c6fd2807SJeff Garzik } 1646c6fd2807SJeff Garzik 1647c6fd2807SJeff Garzik /** 16489b1e2658STejun Heo * ata_eh_link_autopsy - analyze error and determine recovery action 16499b1e2658STejun Heo * @link: host link to perform autopsy on 1650c6fd2807SJeff Garzik * 16510260731fSTejun Heo * Analyze why @link failed and determine which recovery actions 16520260731fSTejun Heo * are needed. This function also sets more detailed AC_ERR_* 16530260731fSTejun Heo * values and fills sense data for ATAPI CHECK SENSE. 1654c6fd2807SJeff Garzik * 1655c6fd2807SJeff Garzik * LOCKING: 1656c6fd2807SJeff Garzik * Kernel thread context (may sleep). 1657c6fd2807SJeff Garzik */ 16589b1e2658STejun Heo static void ata_eh_link_autopsy(struct ata_link *link) 1659c6fd2807SJeff Garzik { 16600260731fSTejun Heo struct ata_port *ap = link->ap; 1661936fd732STejun Heo struct ata_eh_context *ehc = &link->eh_context; 1662c6fd2807SJeff Garzik unsigned int all_err_mask = 0; 1663c6fd2807SJeff Garzik int tag, is_io = 0; 1664c6fd2807SJeff Garzik u32 serror; 1665c6fd2807SJeff Garzik int rc; 1666c6fd2807SJeff Garzik 1667c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 1668c6fd2807SJeff Garzik 1669c6fd2807SJeff Garzik if (ehc->i.flags & ATA_EHI_NO_AUTOPSY) 1670c6fd2807SJeff Garzik return; 1671c6fd2807SJeff Garzik 1672c6fd2807SJeff Garzik /* obtain and analyze SError */ 1673936fd732STejun Heo rc = sata_scr_read(link, SCR_ERROR, &serror); 1674c6fd2807SJeff Garzik if (rc == 0) { 1675c6fd2807SJeff Garzik ehc->i.serror |= serror; 16760260731fSTejun Heo ata_eh_analyze_serror(link); 16774e57c517STejun Heo } else if (rc != -EOPNOTSUPP) { 16784e57c517STejun Heo /* SError read failed, force hardreset and probing */ 16794e57c517STejun Heo ata_ehi_schedule_probe(&ehc->i); 1680c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_HARDRESET; 16814e57c517STejun Heo ehc->i.err_mask |= AC_ERR_OTHER; 16824e57c517STejun Heo } 1683c6fd2807SJeff Garzik 1684c6fd2807SJeff Garzik /* analyze NCQ failure */ 16850260731fSTejun Heo ata_eh_analyze_ncq_error(link); 1686c6fd2807SJeff Garzik 1687c6fd2807SJeff Garzik /* any real error trumps AC_ERR_OTHER */ 1688c6fd2807SJeff Garzik if (ehc->i.err_mask & ~AC_ERR_OTHER) 1689c6fd2807SJeff Garzik ehc->i.err_mask &= ~AC_ERR_OTHER; 1690c6fd2807SJeff Garzik 1691c6fd2807SJeff Garzik all_err_mask |= ehc->i.err_mask; 1692c6fd2807SJeff Garzik 1693c6fd2807SJeff Garzik for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 1694c6fd2807SJeff Garzik struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 1695c6fd2807SJeff Garzik 16960260731fSTejun Heo if (!(qc->flags & ATA_QCFLAG_FAILED) || qc->dev->link != link) 1697c6fd2807SJeff Garzik continue; 1698c6fd2807SJeff Garzik 1699c6fd2807SJeff Garzik /* inherit upper level err_mask */ 1700c6fd2807SJeff Garzik qc->err_mask |= ehc->i.err_mask; 1701c6fd2807SJeff Garzik 1702c6fd2807SJeff Garzik /* analyze TF */ 1703c6fd2807SJeff Garzik ehc->i.action |= ata_eh_analyze_tf(qc, &qc->result_tf); 1704c6fd2807SJeff Garzik 1705c6fd2807SJeff Garzik /* DEV errors are probably spurious in case of ATA_BUS error */ 1706c6fd2807SJeff Garzik if (qc->err_mask & AC_ERR_ATA_BUS) 1707c6fd2807SJeff Garzik qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_MEDIA | 1708c6fd2807SJeff Garzik AC_ERR_INVALID); 1709c6fd2807SJeff Garzik 1710c6fd2807SJeff Garzik /* any real error trumps unknown error */ 1711c6fd2807SJeff Garzik if (qc->err_mask & ~AC_ERR_OTHER) 1712c6fd2807SJeff Garzik qc->err_mask &= ~AC_ERR_OTHER; 1713c6fd2807SJeff Garzik 1714c6fd2807SJeff Garzik /* SENSE_VALID trumps dev/unknown error and revalidation */ 1715c6fd2807SJeff Garzik if (qc->flags & ATA_QCFLAG_SENSE_VALID) { 1716c6fd2807SJeff Garzik qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_OTHER); 1717c6fd2807SJeff Garzik ehc->i.action &= ~ATA_EH_REVALIDATE; 1718c6fd2807SJeff Garzik } 1719c6fd2807SJeff Garzik 1720c6fd2807SJeff Garzik /* accumulate error info */ 1721c6fd2807SJeff Garzik ehc->i.dev = qc->dev; 1722c6fd2807SJeff Garzik all_err_mask |= qc->err_mask; 1723c6fd2807SJeff Garzik if (qc->flags & ATA_QCFLAG_IO) 1724c6fd2807SJeff Garzik is_io = 1; 1725c6fd2807SJeff Garzik } 1726c6fd2807SJeff Garzik 1727c6fd2807SJeff Garzik /* enforce default EH actions */ 1728c6fd2807SJeff Garzik if (ap->pflags & ATA_PFLAG_FROZEN || 1729c6fd2807SJeff Garzik all_err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT)) 1730c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_SOFTRESET; 1731c6fd2807SJeff Garzik else if (all_err_mask) 1732c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_REVALIDATE; 1733c6fd2807SJeff Garzik 1734c6fd2807SJeff Garzik /* if we have offending qcs and the associated failed device */ 1735c6fd2807SJeff Garzik if (ehc->i.dev) { 1736c6fd2807SJeff Garzik /* speed down */ 1737c6fd2807SJeff Garzik ehc->i.action |= ata_eh_speed_down(ehc->i.dev, is_io, 1738c6fd2807SJeff Garzik all_err_mask); 1739c6fd2807SJeff Garzik 1740c6fd2807SJeff Garzik /* perform per-dev EH action only on the offending device */ 1741c6fd2807SJeff Garzik ehc->i.dev_action[ehc->i.dev->devno] |= 1742c6fd2807SJeff Garzik ehc->i.action & ATA_EH_PERDEV_MASK; 1743c6fd2807SJeff Garzik ehc->i.action &= ~ATA_EH_PERDEV_MASK; 1744c6fd2807SJeff Garzik } 1745c6fd2807SJeff Garzik 1746c6fd2807SJeff Garzik DPRINTK("EXIT\n"); 1747c6fd2807SJeff Garzik } 1748c6fd2807SJeff Garzik 1749c6fd2807SJeff Garzik /** 17509b1e2658STejun Heo * ata_eh_autopsy - analyze error and determine recovery action 17519b1e2658STejun Heo * @ap: host port to perform autopsy on 17529b1e2658STejun Heo * 17539b1e2658STejun Heo * Analyze all links of @ap and determine why they failed and 17549b1e2658STejun Heo * which recovery actions are needed. 17559b1e2658STejun Heo * 17569b1e2658STejun Heo * LOCKING: 17579b1e2658STejun Heo * Kernel thread context (may sleep). 17589b1e2658STejun Heo */ 17599b1e2658STejun Heo static void ata_eh_autopsy(struct ata_port *ap) 17609b1e2658STejun Heo { 17619b1e2658STejun Heo struct ata_link *link; 17629b1e2658STejun Heo 17639b1e2658STejun Heo __ata_port_for_each_link(link, ap) 17649b1e2658STejun Heo ata_eh_link_autopsy(link); 17659b1e2658STejun Heo } 17669b1e2658STejun Heo 17679b1e2658STejun Heo /** 17689b1e2658STejun Heo * ata_eh_link_report - report error handling to user 17690260731fSTejun Heo * @link: ATA link EH is going on 1770c6fd2807SJeff Garzik * 1771c6fd2807SJeff Garzik * Report EH to user. 1772c6fd2807SJeff Garzik * 1773c6fd2807SJeff Garzik * LOCKING: 1774c6fd2807SJeff Garzik * None. 1775c6fd2807SJeff Garzik */ 17769b1e2658STejun Heo static void ata_eh_link_report(struct ata_link *link) 1777c6fd2807SJeff Garzik { 17780260731fSTejun Heo struct ata_port *ap = link->ap; 17790260731fSTejun Heo struct ata_eh_context *ehc = &link->eh_context; 1780c6fd2807SJeff Garzik const char *frozen, *desc; 1781*a1e10f7eSTejun Heo char tries_buf[6]; 1782c6fd2807SJeff Garzik int tag, nr_failed = 0; 1783c6fd2807SJeff Garzik 1784c6fd2807SJeff Garzik desc = NULL; 1785c6fd2807SJeff Garzik if (ehc->i.desc[0] != '\0') 1786c6fd2807SJeff Garzik desc = ehc->i.desc; 1787c6fd2807SJeff Garzik 1788c6fd2807SJeff Garzik for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 1789c6fd2807SJeff Garzik struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 1790c6fd2807SJeff Garzik 17910260731fSTejun Heo if (!(qc->flags & ATA_QCFLAG_FAILED) || qc->dev->link != link) 1792c6fd2807SJeff Garzik continue; 1793c6fd2807SJeff Garzik if (qc->flags & ATA_QCFLAG_SENSE_VALID && !qc->err_mask) 1794c6fd2807SJeff Garzik continue; 1795c6fd2807SJeff Garzik 1796c6fd2807SJeff Garzik nr_failed++; 1797c6fd2807SJeff Garzik } 1798c6fd2807SJeff Garzik 1799c6fd2807SJeff Garzik if (!nr_failed && !ehc->i.err_mask) 1800c6fd2807SJeff Garzik return; 1801c6fd2807SJeff Garzik 1802c6fd2807SJeff Garzik frozen = ""; 1803c6fd2807SJeff Garzik if (ap->pflags & ATA_PFLAG_FROZEN) 1804c6fd2807SJeff Garzik frozen = " frozen"; 1805c6fd2807SJeff Garzik 1806*a1e10f7eSTejun Heo memset(tries_buf, 0, sizeof(tries_buf)); 1807*a1e10f7eSTejun Heo if (ap->eh_tries < ATA_EH_MAX_TRIES) 1808*a1e10f7eSTejun Heo snprintf(tries_buf, sizeof(tries_buf) - 1, " t%d", 1809*a1e10f7eSTejun Heo ap->eh_tries); 1810*a1e10f7eSTejun Heo 1811c6fd2807SJeff Garzik if (ehc->i.dev) { 1812c6fd2807SJeff Garzik ata_dev_printk(ehc->i.dev, KERN_ERR, "exception Emask 0x%x " 1813*a1e10f7eSTejun Heo "SAct 0x%x SErr 0x%x action 0x%x%s%s\n", 1814*a1e10f7eSTejun Heo ehc->i.err_mask, link->sactive, ehc->i.serror, 1815*a1e10f7eSTejun Heo ehc->i.action, frozen, tries_buf); 1816c6fd2807SJeff Garzik if (desc) 1817b64bbc39STejun Heo ata_dev_printk(ehc->i.dev, KERN_ERR, "%s\n", desc); 1818c6fd2807SJeff Garzik } else { 18190260731fSTejun Heo ata_link_printk(link, KERN_ERR, "exception Emask 0x%x " 1820*a1e10f7eSTejun Heo "SAct 0x%x SErr 0x%x action 0x%x%s%s\n", 1821*a1e10f7eSTejun Heo ehc->i.err_mask, link->sactive, ehc->i.serror, 1822*a1e10f7eSTejun Heo ehc->i.action, frozen, tries_buf); 1823c6fd2807SJeff Garzik if (desc) 18240260731fSTejun Heo ata_link_printk(link, KERN_ERR, "%s\n", desc); 1825c6fd2807SJeff Garzik } 1826c6fd2807SJeff Garzik 1827c6fd2807SJeff Garzik for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 18288a937581STejun Heo static const char *dma_str[] = { 18298a937581STejun Heo [DMA_BIDIRECTIONAL] = "bidi", 18308a937581STejun Heo [DMA_TO_DEVICE] = "out", 18318a937581STejun Heo [DMA_FROM_DEVICE] = "in", 18328a937581STejun Heo [DMA_NONE] = "", 18338a937581STejun Heo }; 1834c6fd2807SJeff Garzik struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 18358a937581STejun Heo struct ata_taskfile *cmd = &qc->tf, *res = &qc->result_tf; 1836c6fd2807SJeff Garzik 18370260731fSTejun Heo if (!(qc->flags & ATA_QCFLAG_FAILED) || 18380260731fSTejun Heo qc->dev->link != link || !qc->err_mask) 1839c6fd2807SJeff Garzik continue; 1840c6fd2807SJeff Garzik 18418a937581STejun Heo ata_dev_printk(qc->dev, KERN_ERR, 18428a937581STejun Heo "cmd %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x " 1843664e8503STejun Heo "tag %d cdb 0x%x data %u %s\n " 18448a937581STejun Heo "res %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x " 18455335b729STejun Heo "Emask 0x%x (%s)%s\n", 18468a937581STejun Heo cmd->command, cmd->feature, cmd->nsect, 18478a937581STejun Heo cmd->lbal, cmd->lbam, cmd->lbah, 18488a937581STejun Heo cmd->hob_feature, cmd->hob_nsect, 18498a937581STejun Heo cmd->hob_lbal, cmd->hob_lbam, cmd->hob_lbah, 1850726f0785STejun Heo cmd->device, qc->tag, qc->cdb[0], qc->nbytes, 1851664e8503STejun Heo dma_str[qc->dma_dir], 18528a937581STejun Heo res->command, res->feature, res->nsect, 18538a937581STejun Heo res->lbal, res->lbam, res->lbah, 18548a937581STejun Heo res->hob_feature, res->hob_nsect, 18558a937581STejun Heo res->hob_lbal, res->hob_lbam, res->hob_lbah, 18565335b729STejun Heo res->device, qc->err_mask, ata_err_string(qc->err_mask), 18575335b729STejun Heo qc->err_mask & AC_ERR_NCQ ? " <F>" : ""); 1858c6fd2807SJeff Garzik } 1859c6fd2807SJeff Garzik } 1860c6fd2807SJeff Garzik 18619b1e2658STejun Heo /** 18629b1e2658STejun Heo * ata_eh_report - report error handling to user 18639b1e2658STejun Heo * @ap: ATA port to report EH about 18649b1e2658STejun Heo * 18659b1e2658STejun Heo * Report EH to user. 18669b1e2658STejun Heo * 18679b1e2658STejun Heo * LOCKING: 18689b1e2658STejun Heo * None. 18699b1e2658STejun Heo */ 18709b1e2658STejun Heo static void ata_eh_report(struct ata_port *ap) 18719b1e2658STejun Heo { 18729b1e2658STejun Heo struct ata_link *link; 18739b1e2658STejun Heo 18749b1e2658STejun Heo __ata_port_for_each_link(link, ap) 18759b1e2658STejun Heo ata_eh_link_report(link); 18769b1e2658STejun Heo } 18779b1e2658STejun Heo 1878cc0680a5STejun Heo static int ata_do_reset(struct ata_link *link, ata_reset_fn_t reset, 1879d4b2bab4STejun Heo unsigned int *classes, unsigned long deadline) 1880c6fd2807SJeff Garzik { 1881f58229f8STejun Heo struct ata_device *dev; 1882f58229f8STejun Heo int rc; 1883c6fd2807SJeff Garzik 1884cc0680a5STejun Heo ata_link_for_each_dev(dev, link) 1885f58229f8STejun Heo classes[dev->devno] = ATA_DEV_UNKNOWN; 1886c6fd2807SJeff Garzik 1887cc0680a5STejun Heo rc = reset(link, classes, deadline); 1888c6fd2807SJeff Garzik if (rc) 1889c6fd2807SJeff Garzik return rc; 1890c6fd2807SJeff Garzik 1891c6fd2807SJeff Garzik /* If any class isn't ATA_DEV_UNKNOWN, consider classification 1892c6fd2807SJeff Garzik * is complete and convert all ATA_DEV_UNKNOWN to 1893c6fd2807SJeff Garzik * ATA_DEV_NONE. 1894c6fd2807SJeff Garzik */ 1895cc0680a5STejun Heo ata_link_for_each_dev(dev, link) 1896f58229f8STejun Heo if (classes[dev->devno] != ATA_DEV_UNKNOWN) 1897c6fd2807SJeff Garzik break; 1898c6fd2807SJeff Garzik 1899f58229f8STejun Heo if (dev) { 1900cc0680a5STejun Heo ata_link_for_each_dev(dev, link) { 1901f58229f8STejun Heo if (classes[dev->devno] == ATA_DEV_UNKNOWN) 1902f58229f8STejun Heo classes[dev->devno] = ATA_DEV_NONE; 1903f58229f8STejun Heo } 1904f58229f8STejun Heo } 1905c6fd2807SJeff Garzik 1906c6fd2807SJeff Garzik return 0; 1907c6fd2807SJeff Garzik } 1908c6fd2807SJeff Garzik 1909c6fd2807SJeff Garzik static int ata_eh_followup_srst_needed(int rc, int classify, 1910c6fd2807SJeff Garzik const unsigned int *classes) 1911c6fd2807SJeff Garzik { 1912c6fd2807SJeff Garzik if (rc == -EAGAIN) 1913c6fd2807SJeff Garzik return 1; 1914c6fd2807SJeff Garzik if (rc != 0) 1915c6fd2807SJeff Garzik return 0; 1916c6fd2807SJeff Garzik if (classify && classes[0] == ATA_DEV_UNKNOWN) 1917c6fd2807SJeff Garzik return 1; 1918c6fd2807SJeff Garzik return 0; 1919c6fd2807SJeff Garzik } 1920c6fd2807SJeff Garzik 1921cc0680a5STejun Heo static int ata_eh_reset(struct ata_link *link, int classify, 1922c6fd2807SJeff Garzik ata_prereset_fn_t prereset, ata_reset_fn_t softreset, 1923c6fd2807SJeff Garzik ata_reset_fn_t hardreset, ata_postreset_fn_t postreset) 1924c6fd2807SJeff Garzik { 1925936fd732STejun Heo struct ata_eh_context *ehc = &link->eh_context; 1926c6fd2807SJeff Garzik unsigned int *classes = ehc->classes; 1927c6fd2807SJeff Garzik int verbose = !(ehc->i.flags & ATA_EHI_QUIET); 192831daabdaSTejun Heo int try = 0; 1929f58229f8STejun Heo struct ata_device *dev; 193031daabdaSTejun Heo unsigned long deadline; 1931c6fd2807SJeff Garzik unsigned int action; 1932c6fd2807SJeff Garzik ata_reset_fn_t reset; 1933f58229f8STejun Heo int rc; 1934c6fd2807SJeff Garzik 1935c6fd2807SJeff Garzik /* about to reset */ 1936955e57dfSTejun Heo ata_eh_about_to_do(link, NULL, ehc->i.action & ATA_EH_RESET_MASK); 1937c6fd2807SJeff Garzik 1938c6fd2807SJeff Garzik /* Determine which reset to use and record in ehc->i.action. 1939c6fd2807SJeff Garzik * prereset() may examine and modify it. 1940c6fd2807SJeff Garzik */ 1941c6fd2807SJeff Garzik action = ehc->i.action; 1942c6fd2807SJeff Garzik ehc->i.action &= ~ATA_EH_RESET_MASK; 1943936fd732STejun Heo if (softreset && (!hardreset || (!sata_set_spd_needed(link) && 1944c6fd2807SJeff Garzik !(action & ATA_EH_HARDRESET)))) 1945c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_SOFTRESET; 1946c6fd2807SJeff Garzik else 1947c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_HARDRESET; 1948c6fd2807SJeff Garzik 1949c6fd2807SJeff Garzik if (prereset) { 1950cc0680a5STejun Heo rc = prereset(link, jiffies + ATA_EH_PRERESET_TIMEOUT); 1951c6fd2807SJeff Garzik if (rc) { 1952c961922bSAlan Cox if (rc == -ENOENT) { 1953cc0680a5STejun Heo ata_link_printk(link, KERN_DEBUG, 19544aa9ab67STejun Heo "port disabled. ignoring.\n"); 19559af5c9c9STejun Heo ehc->i.action &= ~ATA_EH_RESET_MASK; 19564aa9ab67STejun Heo 1957936fd732STejun Heo ata_link_for_each_dev(dev, link) 1958f58229f8STejun Heo classes[dev->devno] = ATA_DEV_NONE; 19594aa9ab67STejun Heo 19604aa9ab67STejun Heo rc = 0; 1961c961922bSAlan Cox } else 1962cc0680a5STejun Heo ata_link_printk(link, KERN_ERR, 1963c6fd2807SJeff Garzik "prereset failed (errno=%d)\n", rc); 1964fccb6ea5STejun Heo goto out; 1965c6fd2807SJeff Garzik } 1966c6fd2807SJeff Garzik } 1967c6fd2807SJeff Garzik 1968c6fd2807SJeff Garzik /* prereset() might have modified ehc->i.action */ 1969c6fd2807SJeff Garzik if (ehc->i.action & ATA_EH_HARDRESET) 1970c6fd2807SJeff Garzik reset = hardreset; 1971c6fd2807SJeff Garzik else if (ehc->i.action & ATA_EH_SOFTRESET) 1972c6fd2807SJeff Garzik reset = softreset; 1973c6fd2807SJeff Garzik else { 1974c6fd2807SJeff Garzik /* prereset told us not to reset, bang classes and return */ 1975936fd732STejun Heo ata_link_for_each_dev(dev, link) 1976f58229f8STejun Heo classes[dev->devno] = ATA_DEV_NONE; 1977fccb6ea5STejun Heo rc = 0; 1978fccb6ea5STejun Heo goto out; 1979c6fd2807SJeff Garzik } 1980c6fd2807SJeff Garzik 1981c6fd2807SJeff Garzik /* did prereset() screw up? if so, fix up to avoid oopsing */ 1982c6fd2807SJeff Garzik if (!reset) { 1983c6fd2807SJeff Garzik if (softreset) 1984c6fd2807SJeff Garzik reset = softreset; 1985c6fd2807SJeff Garzik else 1986c6fd2807SJeff Garzik reset = hardreset; 1987c6fd2807SJeff Garzik } 1988c6fd2807SJeff Garzik 1989c6fd2807SJeff Garzik retry: 199031daabdaSTejun Heo deadline = jiffies + ata_eh_reset_timeouts[try++]; 199131daabdaSTejun Heo 1992c6fd2807SJeff Garzik /* shut up during boot probing */ 1993c6fd2807SJeff Garzik if (verbose) 1994cc0680a5STejun Heo ata_link_printk(link, KERN_INFO, "%s resetting link\n", 1995c6fd2807SJeff Garzik reset == softreset ? "soft" : "hard"); 1996c6fd2807SJeff Garzik 1997c6fd2807SJeff Garzik /* mark that this EH session started with reset */ 19980d64a233STejun Heo if (reset == hardreset) 19990d64a233STejun Heo ehc->i.flags |= ATA_EHI_DID_HARDRESET; 20000d64a233STejun Heo else 20010d64a233STejun Heo ehc->i.flags |= ATA_EHI_DID_SOFTRESET; 2002c6fd2807SJeff Garzik 2003cc0680a5STejun Heo rc = ata_do_reset(link, reset, classes, deadline); 2004c6fd2807SJeff Garzik 2005c6fd2807SJeff Garzik if (reset == hardreset && 2006c6fd2807SJeff Garzik ata_eh_followup_srst_needed(rc, classify, classes)) { 2007c6fd2807SJeff Garzik /* okay, let's do follow-up softreset */ 2008c6fd2807SJeff Garzik reset = softreset; 2009c6fd2807SJeff Garzik 2010c6fd2807SJeff Garzik if (!reset) { 2011cc0680a5STejun Heo ata_link_printk(link, KERN_ERR, 2012c6fd2807SJeff Garzik "follow-up softreset required " 2013c6fd2807SJeff Garzik "but no softreset avaliable\n"); 2014fccb6ea5STejun Heo rc = -EINVAL; 2015fccb6ea5STejun Heo goto out; 2016c6fd2807SJeff Garzik } 2017c6fd2807SJeff Garzik 2018955e57dfSTejun Heo ata_eh_about_to_do(link, NULL, ATA_EH_RESET_MASK); 2019cc0680a5STejun Heo rc = ata_do_reset(link, reset, classes, deadline); 2020c6fd2807SJeff Garzik 2021c6fd2807SJeff Garzik if (rc == 0 && classify && 2022c6fd2807SJeff Garzik classes[0] == ATA_DEV_UNKNOWN) { 2023cc0680a5STejun Heo ata_link_printk(link, KERN_ERR, 2024c6fd2807SJeff Garzik "classification failed\n"); 2025fccb6ea5STejun Heo rc = -EINVAL; 2026fccb6ea5STejun Heo goto out; 2027c6fd2807SJeff Garzik } 2028c6fd2807SJeff Garzik } 2029c6fd2807SJeff Garzik 203031daabdaSTejun Heo if (rc && try < ARRAY_SIZE(ata_eh_reset_timeouts)) { 203131daabdaSTejun Heo unsigned long now = jiffies; 2032c6fd2807SJeff Garzik 203331daabdaSTejun Heo if (time_before(now, deadline)) { 203431daabdaSTejun Heo unsigned long delta = deadline - jiffies; 2035c6fd2807SJeff Garzik 2036cc0680a5STejun Heo ata_link_printk(link, KERN_WARNING, "reset failed " 203731daabdaSTejun Heo "(errno=%d), retrying in %u secs\n", 203831daabdaSTejun Heo rc, (jiffies_to_msecs(delta) + 999) / 1000); 2039c6fd2807SJeff Garzik 204031daabdaSTejun Heo schedule_timeout_uninterruptible(delta); 204131daabdaSTejun Heo } 204231daabdaSTejun Heo 2043f1545154STejun Heo if (rc == -EPIPE || 204431daabdaSTejun Heo try == ARRAY_SIZE(ata_eh_reset_timeouts) - 1) 2045936fd732STejun Heo sata_down_spd_limit(link); 2046c6fd2807SJeff Garzik if (hardreset) 2047c6fd2807SJeff Garzik reset = hardreset; 2048c6fd2807SJeff Garzik goto retry; 2049c6fd2807SJeff Garzik } 2050c6fd2807SJeff Garzik 2051c6fd2807SJeff Garzik if (rc == 0) { 2052008a7896STejun Heo u32 sstatus; 2053008a7896STejun Heo 2054c6fd2807SJeff Garzik /* After the reset, the device state is PIO 0 and the 2055c6fd2807SJeff Garzik * controller state is undefined. Record the mode. 2056c6fd2807SJeff Garzik */ 2057936fd732STejun Heo ata_link_for_each_dev(dev, link) 2058f58229f8STejun Heo dev->pio_mode = XFER_PIO_0; 2059c6fd2807SJeff Garzik 2060008a7896STejun Heo /* record current link speed */ 2061936fd732STejun Heo if (sata_scr_read(link, SCR_STATUS, &sstatus) == 0) 2062936fd732STejun Heo link->sata_spd = (sstatus >> 4) & 0xf; 2063008a7896STejun Heo 2064c6fd2807SJeff Garzik if (postreset) 2065cc0680a5STejun Heo postreset(link, classes); 2066c6fd2807SJeff Garzik 2067c6fd2807SJeff Garzik /* reset successful, schedule revalidation */ 2068955e57dfSTejun Heo ata_eh_done(link, NULL, ehc->i.action & ATA_EH_RESET_MASK); 2069c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_REVALIDATE; 2070c6fd2807SJeff Garzik } 2071fccb6ea5STejun Heo out: 2072fccb6ea5STejun Heo /* clear hotplug flag */ 2073fccb6ea5STejun Heo ehc->i.flags &= ~ATA_EHI_HOTPLUGGED; 2074c6fd2807SJeff Garzik return rc; 2075c6fd2807SJeff Garzik } 2076c6fd2807SJeff Garzik 20770260731fSTejun Heo static int ata_eh_revalidate_and_attach(struct ata_link *link, 2078c6fd2807SJeff Garzik struct ata_device **r_failed_dev) 2079c6fd2807SJeff Garzik { 20800260731fSTejun Heo struct ata_port *ap = link->ap; 20810260731fSTejun Heo struct ata_eh_context *ehc = &link->eh_context; 2082c6fd2807SJeff Garzik struct ata_device *dev; 20838c3c52a8STejun Heo unsigned int new_mask = 0; 2084c6fd2807SJeff Garzik unsigned long flags; 2085f58229f8STejun Heo int rc = 0; 2086c6fd2807SJeff Garzik 2087c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 2088c6fd2807SJeff Garzik 20898c3c52a8STejun Heo /* For PATA drive side cable detection to work, IDENTIFY must 20908c3c52a8STejun Heo * be done backwards such that PDIAG- is released by the slave 20918c3c52a8STejun Heo * device before the master device is identified. 20928c3c52a8STejun Heo */ 20930260731fSTejun Heo ata_link_for_each_dev_reverse(dev, link) { 2094f58229f8STejun Heo unsigned int action = ata_eh_dev_action(dev); 2095f58229f8STejun Heo unsigned int readid_flags = 0; 2096c6fd2807SJeff Garzik 2097bff04647STejun Heo if (ehc->i.flags & ATA_EHI_DID_RESET) 2098bff04647STejun Heo readid_flags |= ATA_READID_POSTRESET; 2099bff04647STejun Heo 21009666f400STejun Heo if ((action & ATA_EH_REVALIDATE) && ata_dev_enabled(dev)) { 21010260731fSTejun Heo if (ata_link_offline(link)) { 2102c6fd2807SJeff Garzik rc = -EIO; 21038c3c52a8STejun Heo goto err; 2104c6fd2807SJeff Garzik } 2105c6fd2807SJeff Garzik 21060260731fSTejun Heo ata_eh_about_to_do(link, dev, ATA_EH_REVALIDATE); 2107bff04647STejun Heo rc = ata_dev_revalidate(dev, readid_flags); 2108c6fd2807SJeff Garzik if (rc) 21098c3c52a8STejun Heo goto err; 2110c6fd2807SJeff Garzik 21110260731fSTejun Heo ata_eh_done(link, dev, ATA_EH_REVALIDATE); 2112c6fd2807SJeff Garzik 2113baa1e78aSTejun Heo /* Configuration may have changed, reconfigure 2114baa1e78aSTejun Heo * transfer mode. 2115baa1e78aSTejun Heo */ 2116baa1e78aSTejun Heo ehc->i.flags |= ATA_EHI_SETMODE; 2117baa1e78aSTejun Heo 2118c6fd2807SJeff Garzik /* schedule the scsi_rescan_device() here */ 2119c6fd2807SJeff Garzik queue_work(ata_aux_wq, &(ap->scsi_rescan_task)); 2120c6fd2807SJeff Garzik } else if (dev->class == ATA_DEV_UNKNOWN && 2121c6fd2807SJeff Garzik ehc->tries[dev->devno] && 2122c6fd2807SJeff Garzik ata_class_enabled(ehc->classes[dev->devno])) { 2123c6fd2807SJeff Garzik dev->class = ehc->classes[dev->devno]; 2124c6fd2807SJeff Garzik 2125bff04647STejun Heo rc = ata_dev_read_id(dev, &dev->class, readid_flags, 2126bff04647STejun Heo dev->id); 21278c3c52a8STejun Heo switch (rc) { 21288c3c52a8STejun Heo case 0: 2129f58229f8STejun Heo new_mask |= 1 << dev->devno; 21308c3c52a8STejun Heo break; 21318c3c52a8STejun Heo case -ENOENT: 213255a8e2c8STejun Heo /* IDENTIFY was issued to non-existent 213355a8e2c8STejun Heo * device. No need to reset. Just 213455a8e2c8STejun Heo * thaw and kill the device. 213555a8e2c8STejun Heo */ 213655a8e2c8STejun Heo ata_eh_thaw_port(ap); 213755a8e2c8STejun Heo dev->class = ATA_DEV_UNKNOWN; 2138c6fd2807SJeff Garzik break; 21398c3c52a8STejun Heo default: 21408c3c52a8STejun Heo dev->class = ATA_DEV_UNKNOWN; 21418c3c52a8STejun Heo goto err; 21428c3c52a8STejun Heo } 21438c3c52a8STejun Heo } 2144c6fd2807SJeff Garzik } 2145c6fd2807SJeff Garzik 2146c1c4e8d5STejun Heo /* PDIAG- should have been released, ask cable type if post-reset */ 21479b1e2658STejun Heo if (ata_is_host_link(link) && ap->ops->cable_detect && 21489b1e2658STejun Heo (ehc->i.flags & ATA_EHI_DID_RESET)) 2149c1c4e8d5STejun Heo ap->cbl = ap->ops->cable_detect(ap); 2150c1c4e8d5STejun Heo 21518c3c52a8STejun Heo /* Configure new devices forward such that user doesn't see 21528c3c52a8STejun Heo * device detection messages backwards. 21538c3c52a8STejun Heo */ 21540260731fSTejun Heo ata_link_for_each_dev(dev, link) { 2155f58229f8STejun Heo if (!(new_mask & (1 << dev->devno))) 21568c3c52a8STejun Heo continue; 21578c3c52a8STejun Heo 21588c3c52a8STejun Heo ehc->i.flags |= ATA_EHI_PRINTINFO; 21598c3c52a8STejun Heo rc = ata_dev_configure(dev); 21608c3c52a8STejun Heo ehc->i.flags &= ~ATA_EHI_PRINTINFO; 21618c3c52a8STejun Heo if (rc) 21628c3c52a8STejun Heo goto err; 21638c3c52a8STejun Heo 2164c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 2165c6fd2807SJeff Garzik ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG; 2166c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2167baa1e78aSTejun Heo 216855a8e2c8STejun Heo /* new device discovered, configure xfermode */ 2169baa1e78aSTejun Heo ehc->i.flags |= ATA_EHI_SETMODE; 2170c6fd2807SJeff Garzik } 2171c6fd2807SJeff Garzik 21728c3c52a8STejun Heo return 0; 21738c3c52a8STejun Heo 21748c3c52a8STejun Heo err: 2175c6fd2807SJeff Garzik *r_failed_dev = dev; 21768c3c52a8STejun Heo DPRINTK("EXIT rc=%d\n", rc); 2177c6fd2807SJeff Garzik return rc; 2178c6fd2807SJeff Garzik } 2179c6fd2807SJeff Garzik 21800260731fSTejun Heo static int ata_link_nr_enabled(struct ata_link *link) 2181c6fd2807SJeff Garzik { 2182f58229f8STejun Heo struct ata_device *dev; 2183f58229f8STejun Heo int cnt = 0; 2184c6fd2807SJeff Garzik 21850260731fSTejun Heo ata_link_for_each_dev(dev, link) 2186f58229f8STejun Heo if (ata_dev_enabled(dev)) 2187c6fd2807SJeff Garzik cnt++; 2188c6fd2807SJeff Garzik return cnt; 2189c6fd2807SJeff Garzik } 2190c6fd2807SJeff Garzik 21910260731fSTejun Heo static int ata_link_nr_vacant(struct ata_link *link) 2192c6fd2807SJeff Garzik { 2193f58229f8STejun Heo struct ata_device *dev; 2194f58229f8STejun Heo int cnt = 0; 2195c6fd2807SJeff Garzik 21960260731fSTejun Heo ata_link_for_each_dev(dev, link) 2197f58229f8STejun Heo if (dev->class == ATA_DEV_UNKNOWN) 2198c6fd2807SJeff Garzik cnt++; 2199c6fd2807SJeff Garzik return cnt; 2200c6fd2807SJeff Garzik } 2201c6fd2807SJeff Garzik 22020260731fSTejun Heo static int ata_eh_skip_recovery(struct ata_link *link) 2203c6fd2807SJeff Garzik { 22040260731fSTejun Heo struct ata_eh_context *ehc = &link->eh_context; 2205f58229f8STejun Heo struct ata_device *dev; 2206c6fd2807SJeff Garzik 2207c6fd2807SJeff Garzik /* thaw frozen port, resume link and recover failed devices */ 22080260731fSTejun Heo if ((link->ap->pflags & ATA_PFLAG_FROZEN) || 22090260731fSTejun Heo (ehc->i.flags & ATA_EHI_RESUME_LINK) || ata_link_nr_enabled(link)) 2210c6fd2807SJeff Garzik return 0; 2211c6fd2807SJeff Garzik 2212c6fd2807SJeff Garzik /* skip if class codes for all vacant slots are ATA_DEV_NONE */ 22130260731fSTejun Heo ata_link_for_each_dev(dev, link) { 2214c6fd2807SJeff Garzik if (dev->class == ATA_DEV_UNKNOWN && 2215c6fd2807SJeff Garzik ehc->classes[dev->devno] != ATA_DEV_NONE) 2216c6fd2807SJeff Garzik return 0; 2217c6fd2807SJeff Garzik } 2218c6fd2807SJeff Garzik 2219c6fd2807SJeff Garzik return 1; 2220c6fd2807SJeff Garzik } 2221c6fd2807SJeff Garzik 22229b1e2658STejun Heo static int ata_eh_handle_dev_fail(struct ata_device *dev, int err) 2223fee7ca72STejun Heo { 22249af5c9c9STejun Heo struct ata_eh_context *ehc = &dev->link->eh_context; 2225fee7ca72STejun Heo 2226fee7ca72STejun Heo ehc->tries[dev->devno]--; 2227fee7ca72STejun Heo 2228fee7ca72STejun Heo switch (err) { 2229fee7ca72STejun Heo case -ENODEV: 2230fee7ca72STejun Heo /* device missing or wrong IDENTIFY data, schedule probing */ 2231fee7ca72STejun Heo ehc->i.probe_mask |= (1 << dev->devno); 2232fee7ca72STejun Heo case -EINVAL: 2233fee7ca72STejun Heo /* give it just one more chance */ 2234fee7ca72STejun Heo ehc->tries[dev->devno] = min(ehc->tries[dev->devno], 1); 2235fee7ca72STejun Heo case -EIO: 2236fee7ca72STejun Heo if (ehc->tries[dev->devno] == 1) { 2237fee7ca72STejun Heo /* This is the last chance, better to slow 2238fee7ca72STejun Heo * down than lose it. 2239fee7ca72STejun Heo */ 2240936fd732STejun Heo sata_down_spd_limit(dev->link); 2241fee7ca72STejun Heo ata_down_xfermask_limit(dev, ATA_DNXFER_PIO); 2242fee7ca72STejun Heo } 2243fee7ca72STejun Heo } 2244fee7ca72STejun Heo 2245fee7ca72STejun Heo if (ata_dev_enabled(dev) && !ehc->tries[dev->devno]) { 2246fee7ca72STejun Heo /* disable device if it has used up all its chances */ 2247fee7ca72STejun Heo ata_dev_disable(dev); 2248fee7ca72STejun Heo 2249fee7ca72STejun Heo /* detach if offline */ 2250936fd732STejun Heo if (ata_link_offline(dev->link)) 2251fee7ca72STejun Heo ata_eh_detach_dev(dev); 2252fee7ca72STejun Heo 2253fee7ca72STejun Heo /* probe if requested */ 2254fee7ca72STejun Heo if ((ehc->i.probe_mask & (1 << dev->devno)) && 2255fee7ca72STejun Heo !(ehc->did_probe_mask & (1 << dev->devno))) { 2256fee7ca72STejun Heo ata_eh_detach_dev(dev); 2257fee7ca72STejun Heo ata_dev_init(dev); 2258fee7ca72STejun Heo 2259fee7ca72STejun Heo ehc->tries[dev->devno] = ATA_EH_DEV_TRIES; 2260fee7ca72STejun Heo ehc->did_probe_mask |= (1 << dev->devno); 2261fee7ca72STejun Heo ehc->i.action |= ATA_EH_SOFTRESET; 2262fee7ca72STejun Heo } 22639b1e2658STejun Heo 22649b1e2658STejun Heo return 1; 2265fee7ca72STejun Heo } else { 2266fee7ca72STejun Heo /* soft didn't work? be haaaaard */ 2267fee7ca72STejun Heo if (ehc->i.flags & ATA_EHI_DID_RESET) 2268fee7ca72STejun Heo ehc->i.action |= ATA_EH_HARDRESET; 2269fee7ca72STejun Heo else 2270fee7ca72STejun Heo ehc->i.action |= ATA_EH_SOFTRESET; 22719b1e2658STejun Heo 22729b1e2658STejun Heo return 0; 2273fee7ca72STejun Heo } 2274fee7ca72STejun Heo } 2275fee7ca72STejun Heo 2276c6fd2807SJeff Garzik /** 2277c6fd2807SJeff Garzik * ata_eh_recover - recover host port after error 2278c6fd2807SJeff Garzik * @ap: host port to recover 2279c6fd2807SJeff Garzik * @prereset: prereset method (can be NULL) 2280c6fd2807SJeff Garzik * @softreset: softreset method (can be NULL) 2281c6fd2807SJeff Garzik * @hardreset: hardreset method (can be NULL) 2282c6fd2807SJeff Garzik * @postreset: postreset method (can be NULL) 22839b1e2658STejun Heo * @r_failed_link: out parameter for failed link 2284c6fd2807SJeff Garzik * 2285c6fd2807SJeff Garzik * This is the alpha and omega, eum and yang, heart and soul of 2286c6fd2807SJeff Garzik * libata exception handling. On entry, actions required to 22879b1e2658STejun Heo * recover each link and hotplug requests are recorded in the 22889b1e2658STejun Heo * link's eh_context. This function executes all the operations 22899b1e2658STejun Heo * with appropriate retrials and fallbacks to resurrect failed 2290c6fd2807SJeff Garzik * devices, detach goners and greet newcomers. 2291c6fd2807SJeff Garzik * 2292c6fd2807SJeff Garzik * LOCKING: 2293c6fd2807SJeff Garzik * Kernel thread context (may sleep). 2294c6fd2807SJeff Garzik * 2295c6fd2807SJeff Garzik * RETURNS: 2296c6fd2807SJeff Garzik * 0 on success, -errno on failure. 2297c6fd2807SJeff Garzik */ 2298c6fd2807SJeff Garzik static int ata_eh_recover(struct ata_port *ap, ata_prereset_fn_t prereset, 2299c6fd2807SJeff Garzik ata_reset_fn_t softreset, ata_reset_fn_t hardreset, 23009b1e2658STejun Heo ata_postreset_fn_t postreset, 23019b1e2658STejun Heo struct ata_link **r_failed_link) 2302c6fd2807SJeff Garzik { 23039b1e2658STejun Heo struct ata_link *link; 2304c6fd2807SJeff Garzik struct ata_device *dev; 23059b1e2658STejun Heo int nr_failed_devs, nr_disabled_devs; 23069b1e2658STejun Heo int reset, rc; 2307c6fd2807SJeff Garzik 2308c6fd2807SJeff Garzik DPRINTK("ENTER\n"); 2309c6fd2807SJeff Garzik 2310c6fd2807SJeff Garzik /* prep for recovery */ 23119b1e2658STejun Heo ata_port_for_each_link(link, ap) { 23129b1e2658STejun Heo struct ata_eh_context *ehc = &link->eh_context; 23139b1e2658STejun Heo 23140260731fSTejun Heo ata_link_for_each_dev(dev, link) { 2315c6fd2807SJeff Garzik ehc->tries[dev->devno] = ATA_EH_DEV_TRIES; 2316c6fd2807SJeff Garzik 231779a55b72STejun Heo /* collect port action mask recorded in dev actions */ 23189b1e2658STejun Heo ehc->i.action |= ehc->i.dev_action[dev->devno] & 23199b1e2658STejun Heo ~ATA_EH_PERDEV_MASK; 2320f58229f8STejun Heo ehc->i.dev_action[dev->devno] &= ATA_EH_PERDEV_MASK; 232179a55b72STejun Heo 2322c6fd2807SJeff Garzik /* process hotplug request */ 2323c6fd2807SJeff Garzik if (dev->flags & ATA_DFLAG_DETACH) 2324c6fd2807SJeff Garzik ata_eh_detach_dev(dev); 2325c6fd2807SJeff Garzik 2326c6fd2807SJeff Garzik if (!ata_dev_enabled(dev) && 2327c6fd2807SJeff Garzik ((ehc->i.probe_mask & (1 << dev->devno)) && 2328c6fd2807SJeff Garzik !(ehc->did_probe_mask & (1 << dev->devno)))) { 2329c6fd2807SJeff Garzik ata_eh_detach_dev(dev); 2330c6fd2807SJeff Garzik ata_dev_init(dev); 2331c6fd2807SJeff Garzik ehc->did_probe_mask |= (1 << dev->devno); 2332c6fd2807SJeff Garzik ehc->i.action |= ATA_EH_SOFTRESET; 2333c6fd2807SJeff Garzik } 2334c6fd2807SJeff Garzik } 23359b1e2658STejun Heo } 2336c6fd2807SJeff Garzik 2337c6fd2807SJeff Garzik retry: 2338c6fd2807SJeff Garzik rc = 0; 23399b1e2658STejun Heo nr_failed_devs = 0; 23409b1e2658STejun Heo nr_disabled_devs = 0; 23419b1e2658STejun Heo reset = 0; 2342c6fd2807SJeff Garzik 2343c6fd2807SJeff Garzik /* if UNLOADING, finish immediately */ 2344c6fd2807SJeff Garzik if (ap->pflags & ATA_PFLAG_UNLOADING) 2345c6fd2807SJeff Garzik goto out; 2346c6fd2807SJeff Garzik 23479b1e2658STejun Heo /* prep for EH */ 23489b1e2658STejun Heo ata_port_for_each_link(link, ap) { 23499b1e2658STejun Heo struct ata_eh_context *ehc = &link->eh_context; 23509b1e2658STejun Heo 2351c6fd2807SJeff Garzik /* skip EH if possible. */ 23520260731fSTejun Heo if (ata_eh_skip_recovery(link)) 2353c6fd2807SJeff Garzik ehc->i.action = 0; 2354c6fd2807SJeff Garzik 23559b1e2658STejun Heo /* do we need to reset? */ 23569b1e2658STejun Heo if (ehc->i.action & ATA_EH_RESET_MASK) 23579b1e2658STejun Heo reset = 1; 23589b1e2658STejun Heo 23590260731fSTejun Heo ata_link_for_each_dev(dev, link) 2360f58229f8STejun Heo ehc->classes[dev->devno] = ATA_DEV_UNKNOWN; 23619b1e2658STejun Heo } 2362c6fd2807SJeff Garzik 2363c6fd2807SJeff Garzik /* reset */ 23649b1e2658STejun Heo if (reset) { 2365c6fd2807SJeff Garzik ata_eh_freeze_port(ap); 2366c6fd2807SJeff Garzik 23679b1e2658STejun Heo ata_port_for_each_link(link, ap) { 23689b1e2658STejun Heo struct ata_eh_context *ehc = &link->eh_context; 23699b1e2658STejun Heo 23709b1e2658STejun Heo if (!(ehc->i.action & ATA_EH_RESET_MASK)) 23719b1e2658STejun Heo continue; 23729b1e2658STejun Heo 23739b1e2658STejun Heo rc = ata_eh_reset(link, ata_link_nr_vacant(link), 23749b1e2658STejun Heo prereset, softreset, hardreset, 23759b1e2658STejun Heo postreset); 2376c6fd2807SJeff Garzik if (rc) { 23770260731fSTejun Heo ata_link_printk(link, KERN_ERR, 2378c6fd2807SJeff Garzik "reset failed, giving up\n"); 2379c6fd2807SJeff Garzik goto out; 2380c6fd2807SJeff Garzik } 23819b1e2658STejun Heo } 2382c6fd2807SJeff Garzik 2383c6fd2807SJeff Garzik ata_eh_thaw_port(ap); 2384c6fd2807SJeff Garzik } 2385c6fd2807SJeff Garzik 23869b1e2658STejun Heo /* the rest */ 23879b1e2658STejun Heo ata_port_for_each_link(link, ap) { 23889b1e2658STejun Heo struct ata_eh_context *ehc = &link->eh_context; 23899b1e2658STejun Heo 2390c6fd2807SJeff Garzik /* revalidate existing devices and attach new ones */ 23910260731fSTejun Heo rc = ata_eh_revalidate_and_attach(link, &dev); 2392c6fd2807SJeff Garzik if (rc) 2393c6fd2807SJeff Garzik goto dev_fail; 2394c6fd2807SJeff Garzik 2395baa1e78aSTejun Heo /* configure transfer mode if necessary */ 2396baa1e78aSTejun Heo if (ehc->i.flags & ATA_EHI_SETMODE) { 23970260731fSTejun Heo rc = ata_set_mode(link, &dev); 23984ae72a1eSTejun Heo if (rc) 2399c6fd2807SJeff Garzik goto dev_fail; 2400baa1e78aSTejun Heo ehc->i.flags &= ~ATA_EHI_SETMODE; 2401c6fd2807SJeff Garzik } 2402c6fd2807SJeff Garzik 24039b1e2658STejun Heo /* this link is okay now */ 24049b1e2658STejun Heo ehc->i.flags = 0; 24059b1e2658STejun Heo continue; 2406c6fd2807SJeff Garzik 2407c6fd2807SJeff Garzik dev_fail: 24089b1e2658STejun Heo nr_failed_devs++; 24099b1e2658STejun Heo if (ata_eh_handle_dev_fail(dev, rc)) 24109b1e2658STejun Heo nr_disabled_devs++; 2411c6fd2807SJeff Garzik 24129b1e2658STejun Heo if (ap->pflags & ATA_PFLAG_FROZEN) 24139b1e2658STejun Heo break; 24149b1e2658STejun Heo } 24159b1e2658STejun Heo 24169b1e2658STejun Heo if (nr_failed_devs) { 24179b1e2658STejun Heo if (nr_failed_devs != nr_disabled_devs) { 24189b1e2658STejun Heo ata_port_printk(ap, KERN_WARNING, "failed to recover " 24199b1e2658STejun Heo "some devices, retrying in 5 secs\n"); 2420c6fd2807SJeff Garzik ssleep(5); 2421c6fd2807SJeff Garzik } else { 24229b1e2658STejun Heo /* no device left to recover, repeat fast */ 2423c6fd2807SJeff Garzik msleep(500); 2424c6fd2807SJeff Garzik } 2425c6fd2807SJeff Garzik 2426c6fd2807SJeff Garzik goto retry; 24279b1e2658STejun Heo } 2428c6fd2807SJeff Garzik 2429c6fd2807SJeff Garzik out: 24309b1e2658STejun Heo if (rc && r_failed_link) 24319b1e2658STejun Heo *r_failed_link = link; 2432c6fd2807SJeff Garzik 2433c6fd2807SJeff Garzik DPRINTK("EXIT, rc=%d\n", rc); 2434c6fd2807SJeff Garzik return rc; 2435c6fd2807SJeff Garzik } 2436c6fd2807SJeff Garzik 2437c6fd2807SJeff Garzik /** 2438c6fd2807SJeff Garzik * ata_eh_finish - finish up EH 2439c6fd2807SJeff Garzik * @ap: host port to finish EH for 2440c6fd2807SJeff Garzik * 2441c6fd2807SJeff Garzik * Recovery is complete. Clean up EH states and retry or finish 2442c6fd2807SJeff Garzik * failed qcs. 2443c6fd2807SJeff Garzik * 2444c6fd2807SJeff Garzik * LOCKING: 2445c6fd2807SJeff Garzik * None. 2446c6fd2807SJeff Garzik */ 2447c6fd2807SJeff Garzik static void ata_eh_finish(struct ata_port *ap) 2448c6fd2807SJeff Garzik { 2449c6fd2807SJeff Garzik int tag; 2450c6fd2807SJeff Garzik 2451c6fd2807SJeff Garzik /* retry or finish qcs */ 2452c6fd2807SJeff Garzik for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 2453c6fd2807SJeff Garzik struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 2454c6fd2807SJeff Garzik 2455c6fd2807SJeff Garzik if (!(qc->flags & ATA_QCFLAG_FAILED)) 2456c6fd2807SJeff Garzik continue; 2457c6fd2807SJeff Garzik 2458c6fd2807SJeff Garzik if (qc->err_mask) { 2459c6fd2807SJeff Garzik /* FIXME: Once EH migration is complete, 2460c6fd2807SJeff Garzik * generate sense data in this function, 2461c6fd2807SJeff Garzik * considering both err_mask and tf. 2462c6fd2807SJeff Garzik */ 2463c6fd2807SJeff Garzik if (qc->err_mask & AC_ERR_INVALID) 2464c6fd2807SJeff Garzik ata_eh_qc_complete(qc); 2465c6fd2807SJeff Garzik else 2466c6fd2807SJeff Garzik ata_eh_qc_retry(qc); 2467c6fd2807SJeff Garzik } else { 2468c6fd2807SJeff Garzik if (qc->flags & ATA_QCFLAG_SENSE_VALID) { 2469c6fd2807SJeff Garzik ata_eh_qc_complete(qc); 2470c6fd2807SJeff Garzik } else { 2471c6fd2807SJeff Garzik /* feed zero TF to sense generation */ 2472c6fd2807SJeff Garzik memset(&qc->result_tf, 0, sizeof(qc->result_tf)); 2473c6fd2807SJeff Garzik ata_eh_qc_retry(qc); 2474c6fd2807SJeff Garzik } 2475c6fd2807SJeff Garzik } 2476c6fd2807SJeff Garzik } 2477c6fd2807SJeff Garzik } 2478c6fd2807SJeff Garzik 2479c6fd2807SJeff Garzik /** 2480c6fd2807SJeff Garzik * ata_do_eh - do standard error handling 2481c6fd2807SJeff Garzik * @ap: host port to handle error for 2482c6fd2807SJeff Garzik * @prereset: prereset method (can be NULL) 2483c6fd2807SJeff Garzik * @softreset: softreset method (can be NULL) 2484c6fd2807SJeff Garzik * @hardreset: hardreset method (can be NULL) 2485c6fd2807SJeff Garzik * @postreset: postreset method (can be NULL) 2486c6fd2807SJeff Garzik * 2487c6fd2807SJeff Garzik * Perform standard error handling sequence. 2488c6fd2807SJeff Garzik * 2489c6fd2807SJeff Garzik * LOCKING: 2490c6fd2807SJeff Garzik * Kernel thread context (may sleep). 2491c6fd2807SJeff Garzik */ 2492c6fd2807SJeff Garzik void ata_do_eh(struct ata_port *ap, ata_prereset_fn_t prereset, 2493c6fd2807SJeff Garzik ata_reset_fn_t softreset, ata_reset_fn_t hardreset, 2494c6fd2807SJeff Garzik ata_postreset_fn_t postreset) 2495c6fd2807SJeff Garzik { 24969b1e2658STejun Heo struct ata_device *dev; 24979b1e2658STejun Heo int rc; 24989b1e2658STejun Heo 24999b1e2658STejun Heo ata_eh_autopsy(ap); 25009b1e2658STejun Heo ata_eh_report(ap); 25019b1e2658STejun Heo 25029b1e2658STejun Heo rc = ata_eh_recover(ap, prereset, softreset, hardreset, postreset, 25039b1e2658STejun Heo NULL); 25049b1e2658STejun Heo if (rc) { 25059b1e2658STejun Heo ata_link_for_each_dev(dev, &ap->link) 25069b1e2658STejun Heo ata_dev_disable(dev); 25079b1e2658STejun Heo } 25089b1e2658STejun Heo 2509c6fd2807SJeff Garzik ata_eh_finish(ap); 2510c6fd2807SJeff Garzik } 2511c6fd2807SJeff Garzik 25126ffa01d8STejun Heo #ifdef CONFIG_PM 2513c6fd2807SJeff Garzik /** 2514c6fd2807SJeff Garzik * ata_eh_handle_port_suspend - perform port suspend operation 2515c6fd2807SJeff Garzik * @ap: port to suspend 2516c6fd2807SJeff Garzik * 2517c6fd2807SJeff Garzik * Suspend @ap. 2518c6fd2807SJeff Garzik * 2519c6fd2807SJeff Garzik * LOCKING: 2520c6fd2807SJeff Garzik * Kernel thread context (may sleep). 2521c6fd2807SJeff Garzik */ 2522c6fd2807SJeff Garzik static void ata_eh_handle_port_suspend(struct ata_port *ap) 2523c6fd2807SJeff Garzik { 2524c6fd2807SJeff Garzik unsigned long flags; 2525c6fd2807SJeff Garzik int rc = 0; 2526c6fd2807SJeff Garzik 2527c6fd2807SJeff Garzik /* are we suspending? */ 2528c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 2529c6fd2807SJeff Garzik if (!(ap->pflags & ATA_PFLAG_PM_PENDING) || 2530c6fd2807SJeff Garzik ap->pm_mesg.event == PM_EVENT_ON) { 2531c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2532c6fd2807SJeff Garzik return; 2533c6fd2807SJeff Garzik } 2534c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2535c6fd2807SJeff Garzik 2536c6fd2807SJeff Garzik WARN_ON(ap->pflags & ATA_PFLAG_SUSPENDED); 2537c6fd2807SJeff Garzik 253864578a3dSTejun Heo /* tell ACPI we're suspending */ 253964578a3dSTejun Heo rc = ata_acpi_on_suspend(ap); 254064578a3dSTejun Heo if (rc) 254164578a3dSTejun Heo goto out; 254264578a3dSTejun Heo 2543c6fd2807SJeff Garzik /* suspend */ 2544c6fd2807SJeff Garzik ata_eh_freeze_port(ap); 2545c6fd2807SJeff Garzik 2546c6fd2807SJeff Garzik if (ap->ops->port_suspend) 2547c6fd2807SJeff Garzik rc = ap->ops->port_suspend(ap, ap->pm_mesg); 2548c6fd2807SJeff Garzik 254964578a3dSTejun Heo out: 2550c6fd2807SJeff Garzik /* report result */ 2551c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 2552c6fd2807SJeff Garzik 2553c6fd2807SJeff Garzik ap->pflags &= ~ATA_PFLAG_PM_PENDING; 2554c6fd2807SJeff Garzik if (rc == 0) 2555c6fd2807SJeff Garzik ap->pflags |= ATA_PFLAG_SUSPENDED; 255664578a3dSTejun Heo else if (ap->pflags & ATA_PFLAG_FROZEN) 2557c6fd2807SJeff Garzik ata_port_schedule_eh(ap); 2558c6fd2807SJeff Garzik 2559c6fd2807SJeff Garzik if (ap->pm_result) { 2560c6fd2807SJeff Garzik *ap->pm_result = rc; 2561c6fd2807SJeff Garzik ap->pm_result = NULL; 2562c6fd2807SJeff Garzik } 2563c6fd2807SJeff Garzik 2564c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2565c6fd2807SJeff Garzik 2566c6fd2807SJeff Garzik return; 2567c6fd2807SJeff Garzik } 2568c6fd2807SJeff Garzik 2569c6fd2807SJeff Garzik /** 2570c6fd2807SJeff Garzik * ata_eh_handle_port_resume - perform port resume operation 2571c6fd2807SJeff Garzik * @ap: port to resume 2572c6fd2807SJeff Garzik * 2573c6fd2807SJeff Garzik * Resume @ap. 2574c6fd2807SJeff Garzik * 2575c6fd2807SJeff Garzik * LOCKING: 2576c6fd2807SJeff Garzik * Kernel thread context (may sleep). 2577c6fd2807SJeff Garzik */ 2578c6fd2807SJeff Garzik static void ata_eh_handle_port_resume(struct ata_port *ap) 2579c6fd2807SJeff Garzik { 2580c6fd2807SJeff Garzik unsigned long flags; 25819666f400STejun Heo int rc = 0; 2582c6fd2807SJeff Garzik 2583c6fd2807SJeff Garzik /* are we resuming? */ 2584c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 2585c6fd2807SJeff Garzik if (!(ap->pflags & ATA_PFLAG_PM_PENDING) || 2586c6fd2807SJeff Garzik ap->pm_mesg.event != PM_EVENT_ON) { 2587c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2588c6fd2807SJeff Garzik return; 2589c6fd2807SJeff Garzik } 2590c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2591c6fd2807SJeff Garzik 25929666f400STejun Heo WARN_ON(!(ap->pflags & ATA_PFLAG_SUSPENDED)); 2593c6fd2807SJeff Garzik 2594c6fd2807SJeff Garzik if (ap->ops->port_resume) 2595c6fd2807SJeff Garzik rc = ap->ops->port_resume(ap); 2596c6fd2807SJeff Garzik 25976746544cSTejun Heo /* tell ACPI that we're resuming */ 25986746544cSTejun Heo ata_acpi_on_resume(ap); 25996746544cSTejun Heo 26009666f400STejun Heo /* report result */ 2601c6fd2807SJeff Garzik spin_lock_irqsave(ap->lock, flags); 2602c6fd2807SJeff Garzik ap->pflags &= ~(ATA_PFLAG_PM_PENDING | ATA_PFLAG_SUSPENDED); 2603c6fd2807SJeff Garzik if (ap->pm_result) { 2604c6fd2807SJeff Garzik *ap->pm_result = rc; 2605c6fd2807SJeff Garzik ap->pm_result = NULL; 2606c6fd2807SJeff Garzik } 2607c6fd2807SJeff Garzik spin_unlock_irqrestore(ap->lock, flags); 2608c6fd2807SJeff Garzik } 26096ffa01d8STejun Heo #endif /* CONFIG_PM */ 2610