1 /* 2 * libata-eh.c - libata error handling 3 * 4 * Maintained by: Jeff Garzik <jgarzik@pobox.com> 5 * Please ALWAYS copy linux-ide@vger.kernel.org 6 * on emails. 7 * 8 * Copyright 2006 Tejun Heo <htejun@gmail.com> 9 * 10 * 11 * This program is free software; you can redistribute it and/or 12 * modify it under the terms of the GNU General Public License as 13 * published by the Free Software Foundation; either version 2, or 14 * (at your option) any later version. 15 * 16 * This program is distributed in the hope that it will be useful, 17 * but WITHOUT ANY WARRANTY; without even the implied warranty of 18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 19 * General Public License for more details. 20 * 21 * You should have received a copy of the GNU General Public License 22 * along with this program; see the file COPYING. If not, write to 23 * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, 24 * USA. 25 * 26 * 27 * libata documentation is available via 'make {ps|pdf}docs', 28 * as Documentation/DocBook/libata.* 29 * 30 * Hardware documentation available from http://www.t13.org/ and 31 * http://www.sata-io.org/ 32 * 33 */ 34 35 #include <linux/kernel.h> 36 #include <linux/blkdev.h> 37 #include <linux/pci.h> 38 #include <scsi/scsi.h> 39 #include <scsi/scsi_host.h> 40 #include <scsi/scsi_eh.h> 41 #include <scsi/scsi_device.h> 42 #include <scsi/scsi_cmnd.h> 43 #include "../scsi/scsi_transport_api.h" 44 45 #include <linux/libata.h> 46 47 #include "libata.h" 48 49 enum { 50 /* speed down verdicts */ 51 ATA_EH_SPDN_NCQ_OFF = (1 << 0), 52 ATA_EH_SPDN_SPEED_DOWN = (1 << 1), 53 ATA_EH_SPDN_FALLBACK_TO_PIO = (1 << 2), 54 ATA_EH_SPDN_KEEP_ERRORS = (1 << 3), 55 56 /* error flags */ 57 ATA_EFLAG_IS_IO = (1 << 0), 58 ATA_EFLAG_DUBIOUS_XFER = (1 << 1), 59 60 /* error categories */ 61 ATA_ECAT_NONE = 0, 62 ATA_ECAT_ATA_BUS = 1, 63 ATA_ECAT_TOUT_HSM = 2, 64 ATA_ECAT_UNK_DEV = 3, 65 ATA_ECAT_DUBIOUS_NONE = 4, 66 ATA_ECAT_DUBIOUS_ATA_BUS = 5, 67 ATA_ECAT_DUBIOUS_TOUT_HSM = 6, 68 ATA_ECAT_DUBIOUS_UNK_DEV = 7, 69 ATA_ECAT_NR = 8, 70 71 ATA_EH_CMD_DFL_TIMEOUT = 5000, 72 73 /* always put at least this amount of time between resets */ 74 ATA_EH_RESET_COOL_DOWN = 5000, 75 76 /* Waiting in ->prereset can never be reliable. It's 77 * sometimes nice to wait there but it can't be depended upon; 78 * otherwise, we wouldn't be resetting. Just give it enough 79 * time for most drives to spin up. 80 */ 81 ATA_EH_PRERESET_TIMEOUT = 10000, 82 ATA_EH_FASTDRAIN_INTERVAL = 3000, 83 84 ATA_EH_UA_TRIES = 5, 85 }; 86 87 /* The following table determines how we sequence resets. Each entry 88 * represents timeout for that try. The first try can be soft or 89 * hardreset. All others are hardreset if available. In most cases 90 * the first reset w/ 10sec timeout should succeed. Following entries 91 * are mostly for error handling, hotplug and retarded devices. 92 */ 93 static const unsigned long ata_eh_reset_timeouts[] = { 94 10000, /* most drives spin up by 10sec */ 95 10000, /* > 99% working drives spin up before 20sec */ 96 35000, /* give > 30 secs of idleness for retarded devices */ 97 5000, /* and sweet one last chance */ 98 ULONG_MAX, /* > 1 min has elapsed, give up */ 99 }; 100 101 static const unsigned long ata_eh_identify_timeouts[] = { 102 5000, /* covers > 99% of successes and not too boring on failures */ 103 10000, /* combined time till here is enough even for media access */ 104 30000, /* for true idiots */ 105 ULONG_MAX, 106 }; 107 108 static const unsigned long ata_eh_other_timeouts[] = { 109 5000, /* same rationale as identify timeout */ 110 10000, /* ditto */ 111 /* but no merciful 30sec for other commands, it just isn't worth it */ 112 ULONG_MAX, 113 }; 114 115 struct ata_eh_cmd_timeout_ent { 116 const u8 *commands; 117 const unsigned long *timeouts; 118 }; 119 120 /* The following table determines timeouts to use for EH internal 121 * commands. Each table entry is a command class and matches the 122 * commands the entry applies to and the timeout table to use. 123 * 124 * On the retry after a command timed out, the next timeout value from 125 * the table is used. If the table doesn't contain further entries, 126 * the last value is used. 127 * 128 * ehc->cmd_timeout_idx keeps track of which timeout to use per 129 * command class, so if SET_FEATURES times out on the first try, the 130 * next try will use the second timeout value only for that class. 131 */ 132 #define CMDS(cmds...) (const u8 []){ cmds, 0 } 133 static const struct ata_eh_cmd_timeout_ent 134 ata_eh_cmd_timeout_table[ATA_EH_CMD_TIMEOUT_TABLE_SIZE] = { 135 { .commands = CMDS(ATA_CMD_ID_ATA, ATA_CMD_ID_ATAPI), 136 .timeouts = ata_eh_identify_timeouts, }, 137 { .commands = CMDS(ATA_CMD_READ_NATIVE_MAX, ATA_CMD_READ_NATIVE_MAX_EXT), 138 .timeouts = ata_eh_other_timeouts, }, 139 { .commands = CMDS(ATA_CMD_SET_MAX, ATA_CMD_SET_MAX_EXT), 140 .timeouts = ata_eh_other_timeouts, }, 141 { .commands = CMDS(ATA_CMD_SET_FEATURES), 142 .timeouts = ata_eh_other_timeouts, }, 143 { .commands = CMDS(ATA_CMD_INIT_DEV_PARAMS), 144 .timeouts = ata_eh_other_timeouts, }, 145 }; 146 #undef CMDS 147 148 static void __ata_port_freeze(struct ata_port *ap); 149 #ifdef CONFIG_PM 150 static void ata_eh_handle_port_suspend(struct ata_port *ap); 151 static void ata_eh_handle_port_resume(struct ata_port *ap); 152 #else /* CONFIG_PM */ 153 static void ata_eh_handle_port_suspend(struct ata_port *ap) 154 { } 155 156 static void ata_eh_handle_port_resume(struct ata_port *ap) 157 { } 158 #endif /* CONFIG_PM */ 159 160 static void __ata_ehi_pushv_desc(struct ata_eh_info *ehi, const char *fmt, 161 va_list args) 162 { 163 ehi->desc_len += vscnprintf(ehi->desc + ehi->desc_len, 164 ATA_EH_DESC_LEN - ehi->desc_len, 165 fmt, args); 166 } 167 168 /** 169 * __ata_ehi_push_desc - push error description without adding separator 170 * @ehi: target EHI 171 * @fmt: printf format string 172 * 173 * Format string according to @fmt and append it to @ehi->desc. 174 * 175 * LOCKING: 176 * spin_lock_irqsave(host lock) 177 */ 178 void __ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...) 179 { 180 va_list args; 181 182 va_start(args, fmt); 183 __ata_ehi_pushv_desc(ehi, fmt, args); 184 va_end(args); 185 } 186 187 /** 188 * ata_ehi_push_desc - push error description with separator 189 * @ehi: target EHI 190 * @fmt: printf format string 191 * 192 * Format string according to @fmt and append it to @ehi->desc. 193 * If @ehi->desc is not empty, ", " is added in-between. 194 * 195 * LOCKING: 196 * spin_lock_irqsave(host lock) 197 */ 198 void ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...) 199 { 200 va_list args; 201 202 if (ehi->desc_len) 203 __ata_ehi_push_desc(ehi, ", "); 204 205 va_start(args, fmt); 206 __ata_ehi_pushv_desc(ehi, fmt, args); 207 va_end(args); 208 } 209 210 /** 211 * ata_ehi_clear_desc - clean error description 212 * @ehi: target EHI 213 * 214 * Clear @ehi->desc. 215 * 216 * LOCKING: 217 * spin_lock_irqsave(host lock) 218 */ 219 void ata_ehi_clear_desc(struct ata_eh_info *ehi) 220 { 221 ehi->desc[0] = '\0'; 222 ehi->desc_len = 0; 223 } 224 225 /** 226 * ata_port_desc - append port description 227 * @ap: target ATA port 228 * @fmt: printf format string 229 * 230 * Format string according to @fmt and append it to port 231 * description. If port description is not empty, " " is added 232 * in-between. This function is to be used while initializing 233 * ata_host. The description is printed on host registration. 234 * 235 * LOCKING: 236 * None. 237 */ 238 void ata_port_desc(struct ata_port *ap, const char *fmt, ...) 239 { 240 va_list args; 241 242 WARN_ON(!(ap->pflags & ATA_PFLAG_INITIALIZING)); 243 244 if (ap->link.eh_info.desc_len) 245 __ata_ehi_push_desc(&ap->link.eh_info, " "); 246 247 va_start(args, fmt); 248 __ata_ehi_pushv_desc(&ap->link.eh_info, fmt, args); 249 va_end(args); 250 } 251 252 #ifdef CONFIG_PCI 253 254 /** 255 * ata_port_pbar_desc - append PCI BAR description 256 * @ap: target ATA port 257 * @bar: target PCI BAR 258 * @offset: offset into PCI BAR 259 * @name: name of the area 260 * 261 * If @offset is negative, this function formats a string which 262 * contains the name, address, size and type of the BAR and 263 * appends it to the port description. If @offset is zero or 264 * positive, only name and offsetted address is appended. 265 * 266 * LOCKING: 267 * None. 268 */ 269 void ata_port_pbar_desc(struct ata_port *ap, int bar, ssize_t offset, 270 const char *name) 271 { 272 struct pci_dev *pdev = to_pci_dev(ap->host->dev); 273 char *type = ""; 274 unsigned long long start, len; 275 276 if (pci_resource_flags(pdev, bar) & IORESOURCE_MEM) 277 type = "m"; 278 else if (pci_resource_flags(pdev, bar) & IORESOURCE_IO) 279 type = "i"; 280 281 start = (unsigned long long)pci_resource_start(pdev, bar); 282 len = (unsigned long long)pci_resource_len(pdev, bar); 283 284 if (offset < 0) 285 ata_port_desc(ap, "%s %s%llu@0x%llx", name, type, len, start); 286 else 287 ata_port_desc(ap, "%s 0x%llx", name, 288 start + (unsigned long long)offset); 289 } 290 291 #endif /* CONFIG_PCI */ 292 293 static int ata_lookup_timeout_table(u8 cmd) 294 { 295 int i; 296 297 for (i = 0; i < ATA_EH_CMD_TIMEOUT_TABLE_SIZE; i++) { 298 const u8 *cur; 299 300 for (cur = ata_eh_cmd_timeout_table[i].commands; *cur; cur++) 301 if (*cur == cmd) 302 return i; 303 } 304 305 return -1; 306 } 307 308 /** 309 * ata_internal_cmd_timeout - determine timeout for an internal command 310 * @dev: target device 311 * @cmd: internal command to be issued 312 * 313 * Determine timeout for internal command @cmd for @dev. 314 * 315 * LOCKING: 316 * EH context. 317 * 318 * RETURNS: 319 * Determined timeout. 320 */ 321 unsigned long ata_internal_cmd_timeout(struct ata_device *dev, u8 cmd) 322 { 323 struct ata_eh_context *ehc = &dev->link->eh_context; 324 int ent = ata_lookup_timeout_table(cmd); 325 int idx; 326 327 if (ent < 0) 328 return ATA_EH_CMD_DFL_TIMEOUT; 329 330 idx = ehc->cmd_timeout_idx[dev->devno][ent]; 331 return ata_eh_cmd_timeout_table[ent].timeouts[idx]; 332 } 333 334 /** 335 * ata_internal_cmd_timed_out - notification for internal command timeout 336 * @dev: target device 337 * @cmd: internal command which timed out 338 * 339 * Notify EH that internal command @cmd for @dev timed out. This 340 * function should be called only for commands whose timeouts are 341 * determined using ata_internal_cmd_timeout(). 342 * 343 * LOCKING: 344 * EH context. 345 */ 346 void ata_internal_cmd_timed_out(struct ata_device *dev, u8 cmd) 347 { 348 struct ata_eh_context *ehc = &dev->link->eh_context; 349 int ent = ata_lookup_timeout_table(cmd); 350 int idx; 351 352 if (ent < 0) 353 return; 354 355 idx = ehc->cmd_timeout_idx[dev->devno][ent]; 356 if (ata_eh_cmd_timeout_table[ent].timeouts[idx + 1] != ULONG_MAX) 357 ehc->cmd_timeout_idx[dev->devno][ent]++; 358 } 359 360 static void ata_ering_record(struct ata_ering *ering, unsigned int eflags, 361 unsigned int err_mask) 362 { 363 struct ata_ering_entry *ent; 364 365 WARN_ON(!err_mask); 366 367 ering->cursor++; 368 ering->cursor %= ATA_ERING_SIZE; 369 370 ent = &ering->ring[ering->cursor]; 371 ent->eflags = eflags; 372 ent->err_mask = err_mask; 373 ent->timestamp = get_jiffies_64(); 374 } 375 376 static struct ata_ering_entry *ata_ering_top(struct ata_ering *ering) 377 { 378 struct ata_ering_entry *ent = &ering->ring[ering->cursor]; 379 380 if (ent->err_mask) 381 return ent; 382 return NULL; 383 } 384 385 static void ata_ering_clear(struct ata_ering *ering) 386 { 387 memset(ering, 0, sizeof(*ering)); 388 } 389 390 static int ata_ering_map(struct ata_ering *ering, 391 int (*map_fn)(struct ata_ering_entry *, void *), 392 void *arg) 393 { 394 int idx, rc = 0; 395 struct ata_ering_entry *ent; 396 397 idx = ering->cursor; 398 do { 399 ent = &ering->ring[idx]; 400 if (!ent->err_mask) 401 break; 402 rc = map_fn(ent, arg); 403 if (rc) 404 break; 405 idx = (idx - 1 + ATA_ERING_SIZE) % ATA_ERING_SIZE; 406 } while (idx != ering->cursor); 407 408 return rc; 409 } 410 411 static unsigned int ata_eh_dev_action(struct ata_device *dev) 412 { 413 struct ata_eh_context *ehc = &dev->link->eh_context; 414 415 return ehc->i.action | ehc->i.dev_action[dev->devno]; 416 } 417 418 static void ata_eh_clear_action(struct ata_link *link, struct ata_device *dev, 419 struct ata_eh_info *ehi, unsigned int action) 420 { 421 struct ata_device *tdev; 422 423 if (!dev) { 424 ehi->action &= ~action; 425 ata_link_for_each_dev(tdev, link) 426 ehi->dev_action[tdev->devno] &= ~action; 427 } else { 428 /* doesn't make sense for port-wide EH actions */ 429 WARN_ON(!(action & ATA_EH_PERDEV_MASK)); 430 431 /* break ehi->action into ehi->dev_action */ 432 if (ehi->action & action) { 433 ata_link_for_each_dev(tdev, link) 434 ehi->dev_action[tdev->devno] |= 435 ehi->action & action; 436 ehi->action &= ~action; 437 } 438 439 /* turn off the specified per-dev action */ 440 ehi->dev_action[dev->devno] &= ~action; 441 } 442 } 443 444 /** 445 * ata_scsi_timed_out - SCSI layer time out callback 446 * @cmd: timed out SCSI command 447 * 448 * Handles SCSI layer timeout. We race with normal completion of 449 * the qc for @cmd. If the qc is already gone, we lose and let 450 * the scsi command finish (EH_HANDLED). Otherwise, the qc has 451 * timed out and EH should be invoked. Prevent ata_qc_complete() 452 * from finishing it by setting EH_SCHEDULED and return 453 * EH_NOT_HANDLED. 454 * 455 * TODO: kill this function once old EH is gone. 456 * 457 * LOCKING: 458 * Called from timer context 459 * 460 * RETURNS: 461 * EH_HANDLED or EH_NOT_HANDLED 462 */ 463 enum blk_eh_timer_return ata_scsi_timed_out(struct scsi_cmnd *cmd) 464 { 465 struct Scsi_Host *host = cmd->device->host; 466 struct ata_port *ap = ata_shost_to_port(host); 467 unsigned long flags; 468 struct ata_queued_cmd *qc; 469 enum blk_eh_timer_return ret; 470 471 DPRINTK("ENTER\n"); 472 473 if (ap->ops->error_handler) { 474 ret = BLK_EH_NOT_HANDLED; 475 goto out; 476 } 477 478 ret = BLK_EH_HANDLED; 479 spin_lock_irqsave(ap->lock, flags); 480 qc = ata_qc_from_tag(ap, ap->link.active_tag); 481 if (qc) { 482 WARN_ON(qc->scsicmd != cmd); 483 qc->flags |= ATA_QCFLAG_EH_SCHEDULED; 484 qc->err_mask |= AC_ERR_TIMEOUT; 485 ret = BLK_EH_NOT_HANDLED; 486 } 487 spin_unlock_irqrestore(ap->lock, flags); 488 489 out: 490 DPRINTK("EXIT, ret=%d\n", ret); 491 return ret; 492 } 493 494 /** 495 * ata_scsi_error - SCSI layer error handler callback 496 * @host: SCSI host on which error occurred 497 * 498 * Handles SCSI-layer-thrown error events. 499 * 500 * LOCKING: 501 * Inherited from SCSI layer (none, can sleep) 502 * 503 * RETURNS: 504 * Zero. 505 */ 506 void ata_scsi_error(struct Scsi_Host *host) 507 { 508 struct ata_port *ap = ata_shost_to_port(host); 509 int i; 510 unsigned long flags; 511 512 DPRINTK("ENTER\n"); 513 514 /* synchronize with port task */ 515 ata_port_flush_task(ap); 516 517 /* synchronize with host lock and sort out timeouts */ 518 519 /* For new EH, all qcs are finished in one of three ways - 520 * normal completion, error completion, and SCSI timeout. 521 * Both cmpletions can race against SCSI timeout. When normal 522 * completion wins, the qc never reaches EH. When error 523 * completion wins, the qc has ATA_QCFLAG_FAILED set. 524 * 525 * When SCSI timeout wins, things are a bit more complex. 526 * Normal or error completion can occur after the timeout but 527 * before this point. In such cases, both types of 528 * completions are honored. A scmd is determined to have 529 * timed out iff its associated qc is active and not failed. 530 */ 531 if (ap->ops->error_handler) { 532 struct scsi_cmnd *scmd, *tmp; 533 int nr_timedout = 0; 534 535 spin_lock_irqsave(ap->lock, flags); 536 537 list_for_each_entry_safe(scmd, tmp, &host->eh_cmd_q, eh_entry) { 538 struct ata_queued_cmd *qc; 539 540 for (i = 0; i < ATA_MAX_QUEUE; i++) { 541 qc = __ata_qc_from_tag(ap, i); 542 if (qc->flags & ATA_QCFLAG_ACTIVE && 543 qc->scsicmd == scmd) 544 break; 545 } 546 547 if (i < ATA_MAX_QUEUE) { 548 /* the scmd has an associated qc */ 549 if (!(qc->flags & ATA_QCFLAG_FAILED)) { 550 /* which hasn't failed yet, timeout */ 551 qc->err_mask |= AC_ERR_TIMEOUT; 552 qc->flags |= ATA_QCFLAG_FAILED; 553 nr_timedout++; 554 } 555 } else { 556 /* Normal completion occurred after 557 * SCSI timeout but before this point. 558 * Successfully complete it. 559 */ 560 scmd->retries = scmd->allowed; 561 scsi_eh_finish_cmd(scmd, &ap->eh_done_q); 562 } 563 } 564 565 /* If we have timed out qcs. They belong to EH from 566 * this point but the state of the controller is 567 * unknown. Freeze the port to make sure the IRQ 568 * handler doesn't diddle with those qcs. This must 569 * be done atomically w.r.t. setting QCFLAG_FAILED. 570 */ 571 if (nr_timedout) 572 __ata_port_freeze(ap); 573 574 spin_unlock_irqrestore(ap->lock, flags); 575 576 /* initialize eh_tries */ 577 ap->eh_tries = ATA_EH_MAX_TRIES; 578 } else 579 spin_unlock_wait(ap->lock); 580 581 repeat: 582 /* invoke error handler */ 583 if (ap->ops->error_handler) { 584 struct ata_link *link; 585 586 /* kill fast drain timer */ 587 del_timer_sync(&ap->fastdrain_timer); 588 589 /* process port resume request */ 590 ata_eh_handle_port_resume(ap); 591 592 /* fetch & clear EH info */ 593 spin_lock_irqsave(ap->lock, flags); 594 595 __ata_port_for_each_link(link, ap) { 596 struct ata_eh_context *ehc = &link->eh_context; 597 struct ata_device *dev; 598 599 memset(&link->eh_context, 0, sizeof(link->eh_context)); 600 link->eh_context.i = link->eh_info; 601 memset(&link->eh_info, 0, sizeof(link->eh_info)); 602 603 ata_link_for_each_dev(dev, link) { 604 int devno = dev->devno; 605 606 ehc->saved_xfer_mode[devno] = dev->xfer_mode; 607 if (ata_ncq_enabled(dev)) 608 ehc->saved_ncq_enabled |= 1 << devno; 609 } 610 611 /* set last reset timestamp to some time in the past */ 612 ehc->last_reset = jiffies - 60 * HZ; 613 } 614 615 ap->pflags |= ATA_PFLAG_EH_IN_PROGRESS; 616 ap->pflags &= ~ATA_PFLAG_EH_PENDING; 617 ap->excl_link = NULL; /* don't maintain exclusion over EH */ 618 619 spin_unlock_irqrestore(ap->lock, flags); 620 621 /* invoke EH, skip if unloading or suspended */ 622 if (!(ap->pflags & (ATA_PFLAG_UNLOADING | ATA_PFLAG_SUSPENDED))) 623 ap->ops->error_handler(ap); 624 else 625 ata_eh_finish(ap); 626 627 /* process port suspend request */ 628 ata_eh_handle_port_suspend(ap); 629 630 /* Exception might have happend after ->error_handler 631 * recovered the port but before this point. Repeat 632 * EH in such case. 633 */ 634 spin_lock_irqsave(ap->lock, flags); 635 636 if (ap->pflags & ATA_PFLAG_EH_PENDING) { 637 if (--ap->eh_tries) { 638 spin_unlock_irqrestore(ap->lock, flags); 639 goto repeat; 640 } 641 ata_port_printk(ap, KERN_ERR, "EH pending after %d " 642 "tries, giving up\n", ATA_EH_MAX_TRIES); 643 ap->pflags &= ~ATA_PFLAG_EH_PENDING; 644 } 645 646 /* this run is complete, make sure EH info is clear */ 647 __ata_port_for_each_link(link, ap) 648 memset(&link->eh_info, 0, sizeof(link->eh_info)); 649 650 /* Clear host_eh_scheduled while holding ap->lock such 651 * that if exception occurs after this point but 652 * before EH completion, SCSI midlayer will 653 * re-initiate EH. 654 */ 655 host->host_eh_scheduled = 0; 656 657 spin_unlock_irqrestore(ap->lock, flags); 658 } else { 659 WARN_ON(ata_qc_from_tag(ap, ap->link.active_tag) == NULL); 660 ap->ops->eng_timeout(ap); 661 } 662 663 /* finish or retry handled scmd's and clean up */ 664 WARN_ON(host->host_failed || !list_empty(&host->eh_cmd_q)); 665 666 scsi_eh_flush_done_q(&ap->eh_done_q); 667 668 /* clean up */ 669 spin_lock_irqsave(ap->lock, flags); 670 671 if (ap->pflags & ATA_PFLAG_LOADING) 672 ap->pflags &= ~ATA_PFLAG_LOADING; 673 else if (ap->pflags & ATA_PFLAG_SCSI_HOTPLUG) 674 queue_delayed_work(ata_aux_wq, &ap->hotplug_task, 0); 675 676 if (ap->pflags & ATA_PFLAG_RECOVERED) 677 ata_port_printk(ap, KERN_INFO, "EH complete\n"); 678 679 ap->pflags &= ~(ATA_PFLAG_SCSI_HOTPLUG | ATA_PFLAG_RECOVERED); 680 681 /* tell wait_eh that we're done */ 682 ap->pflags &= ~ATA_PFLAG_EH_IN_PROGRESS; 683 wake_up_all(&ap->eh_wait_q); 684 685 spin_unlock_irqrestore(ap->lock, flags); 686 687 DPRINTK("EXIT\n"); 688 } 689 690 /** 691 * ata_port_wait_eh - Wait for the currently pending EH to complete 692 * @ap: Port to wait EH for 693 * 694 * Wait until the currently pending EH is complete. 695 * 696 * LOCKING: 697 * Kernel thread context (may sleep). 698 */ 699 void ata_port_wait_eh(struct ata_port *ap) 700 { 701 unsigned long flags; 702 DEFINE_WAIT(wait); 703 704 retry: 705 spin_lock_irqsave(ap->lock, flags); 706 707 while (ap->pflags & (ATA_PFLAG_EH_PENDING | ATA_PFLAG_EH_IN_PROGRESS)) { 708 prepare_to_wait(&ap->eh_wait_q, &wait, TASK_UNINTERRUPTIBLE); 709 spin_unlock_irqrestore(ap->lock, flags); 710 schedule(); 711 spin_lock_irqsave(ap->lock, flags); 712 } 713 finish_wait(&ap->eh_wait_q, &wait); 714 715 spin_unlock_irqrestore(ap->lock, flags); 716 717 /* make sure SCSI EH is complete */ 718 if (scsi_host_in_recovery(ap->scsi_host)) { 719 msleep(10); 720 goto retry; 721 } 722 } 723 724 static int ata_eh_nr_in_flight(struct ata_port *ap) 725 { 726 unsigned int tag; 727 int nr = 0; 728 729 /* count only non-internal commands */ 730 for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++) 731 if (ata_qc_from_tag(ap, tag)) 732 nr++; 733 734 return nr; 735 } 736 737 void ata_eh_fastdrain_timerfn(unsigned long arg) 738 { 739 struct ata_port *ap = (void *)arg; 740 unsigned long flags; 741 int cnt; 742 743 spin_lock_irqsave(ap->lock, flags); 744 745 cnt = ata_eh_nr_in_flight(ap); 746 747 /* are we done? */ 748 if (!cnt) 749 goto out_unlock; 750 751 if (cnt == ap->fastdrain_cnt) { 752 unsigned int tag; 753 754 /* No progress during the last interval, tag all 755 * in-flight qcs as timed out and freeze the port. 756 */ 757 for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++) { 758 struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag); 759 if (qc) 760 qc->err_mask |= AC_ERR_TIMEOUT; 761 } 762 763 ata_port_freeze(ap); 764 } else { 765 /* some qcs have finished, give it another chance */ 766 ap->fastdrain_cnt = cnt; 767 ap->fastdrain_timer.expires = 768 ata_deadline(jiffies, ATA_EH_FASTDRAIN_INTERVAL); 769 add_timer(&ap->fastdrain_timer); 770 } 771 772 out_unlock: 773 spin_unlock_irqrestore(ap->lock, flags); 774 } 775 776 /** 777 * ata_eh_set_pending - set ATA_PFLAG_EH_PENDING and activate fast drain 778 * @ap: target ATA port 779 * @fastdrain: activate fast drain 780 * 781 * Set ATA_PFLAG_EH_PENDING and activate fast drain if @fastdrain 782 * is non-zero and EH wasn't pending before. Fast drain ensures 783 * that EH kicks in in timely manner. 784 * 785 * LOCKING: 786 * spin_lock_irqsave(host lock) 787 */ 788 static void ata_eh_set_pending(struct ata_port *ap, int fastdrain) 789 { 790 int cnt; 791 792 /* already scheduled? */ 793 if (ap->pflags & ATA_PFLAG_EH_PENDING) 794 return; 795 796 ap->pflags |= ATA_PFLAG_EH_PENDING; 797 798 if (!fastdrain) 799 return; 800 801 /* do we have in-flight qcs? */ 802 cnt = ata_eh_nr_in_flight(ap); 803 if (!cnt) 804 return; 805 806 /* activate fast drain */ 807 ap->fastdrain_cnt = cnt; 808 ap->fastdrain_timer.expires = 809 ata_deadline(jiffies, ATA_EH_FASTDRAIN_INTERVAL); 810 add_timer(&ap->fastdrain_timer); 811 } 812 813 /** 814 * ata_qc_schedule_eh - schedule qc for error handling 815 * @qc: command to schedule error handling for 816 * 817 * Schedule error handling for @qc. EH will kick in as soon as 818 * other commands are drained. 819 * 820 * LOCKING: 821 * spin_lock_irqsave(host lock) 822 */ 823 void ata_qc_schedule_eh(struct ata_queued_cmd *qc) 824 { 825 struct ata_port *ap = qc->ap; 826 827 WARN_ON(!ap->ops->error_handler); 828 829 qc->flags |= ATA_QCFLAG_FAILED; 830 ata_eh_set_pending(ap, 1); 831 832 /* The following will fail if timeout has already expired. 833 * ata_scsi_error() takes care of such scmds on EH entry. 834 * Note that ATA_QCFLAG_FAILED is unconditionally set after 835 * this function completes. 836 */ 837 blk_abort_request(qc->scsicmd->request); 838 } 839 840 /** 841 * ata_port_schedule_eh - schedule error handling without a qc 842 * @ap: ATA port to schedule EH for 843 * 844 * Schedule error handling for @ap. EH will kick in as soon as 845 * all commands are drained. 846 * 847 * LOCKING: 848 * spin_lock_irqsave(host lock) 849 */ 850 void ata_port_schedule_eh(struct ata_port *ap) 851 { 852 WARN_ON(!ap->ops->error_handler); 853 854 if (ap->pflags & ATA_PFLAG_INITIALIZING) 855 return; 856 857 ata_eh_set_pending(ap, 1); 858 scsi_schedule_eh(ap->scsi_host); 859 860 DPRINTK("port EH scheduled\n"); 861 } 862 863 static int ata_do_link_abort(struct ata_port *ap, struct ata_link *link) 864 { 865 int tag, nr_aborted = 0; 866 867 WARN_ON(!ap->ops->error_handler); 868 869 /* we're gonna abort all commands, no need for fast drain */ 870 ata_eh_set_pending(ap, 0); 871 872 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 873 struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag); 874 875 if (qc && (!link || qc->dev->link == link)) { 876 qc->flags |= ATA_QCFLAG_FAILED; 877 ata_qc_complete(qc); 878 nr_aborted++; 879 } 880 } 881 882 if (!nr_aborted) 883 ata_port_schedule_eh(ap); 884 885 return nr_aborted; 886 } 887 888 /** 889 * ata_link_abort - abort all qc's on the link 890 * @link: ATA link to abort qc's for 891 * 892 * Abort all active qc's active on @link and schedule EH. 893 * 894 * LOCKING: 895 * spin_lock_irqsave(host lock) 896 * 897 * RETURNS: 898 * Number of aborted qc's. 899 */ 900 int ata_link_abort(struct ata_link *link) 901 { 902 return ata_do_link_abort(link->ap, link); 903 } 904 905 /** 906 * ata_port_abort - abort all qc's on the port 907 * @ap: ATA port to abort qc's for 908 * 909 * Abort all active qc's of @ap and schedule EH. 910 * 911 * LOCKING: 912 * spin_lock_irqsave(host_set lock) 913 * 914 * RETURNS: 915 * Number of aborted qc's. 916 */ 917 int ata_port_abort(struct ata_port *ap) 918 { 919 return ata_do_link_abort(ap, NULL); 920 } 921 922 /** 923 * __ata_port_freeze - freeze port 924 * @ap: ATA port to freeze 925 * 926 * This function is called when HSM violation or some other 927 * condition disrupts normal operation of the port. Frozen port 928 * is not allowed to perform any operation until the port is 929 * thawed, which usually follows a successful reset. 930 * 931 * ap->ops->freeze() callback can be used for freezing the port 932 * hardware-wise (e.g. mask interrupt and stop DMA engine). If a 933 * port cannot be frozen hardware-wise, the interrupt handler 934 * must ack and clear interrupts unconditionally while the port 935 * is frozen. 936 * 937 * LOCKING: 938 * spin_lock_irqsave(host lock) 939 */ 940 static void __ata_port_freeze(struct ata_port *ap) 941 { 942 WARN_ON(!ap->ops->error_handler); 943 944 if (ap->ops->freeze) 945 ap->ops->freeze(ap); 946 947 ap->pflags |= ATA_PFLAG_FROZEN; 948 949 DPRINTK("ata%u port frozen\n", ap->print_id); 950 } 951 952 /** 953 * ata_port_freeze - abort & freeze port 954 * @ap: ATA port to freeze 955 * 956 * Abort and freeze @ap. 957 * 958 * LOCKING: 959 * spin_lock_irqsave(host lock) 960 * 961 * RETURNS: 962 * Number of aborted commands. 963 */ 964 int ata_port_freeze(struct ata_port *ap) 965 { 966 int nr_aborted; 967 968 WARN_ON(!ap->ops->error_handler); 969 970 nr_aborted = ata_port_abort(ap); 971 __ata_port_freeze(ap); 972 973 return nr_aborted; 974 } 975 976 /** 977 * sata_async_notification - SATA async notification handler 978 * @ap: ATA port where async notification is received 979 * 980 * Handler to be called when async notification via SDB FIS is 981 * received. This function schedules EH if necessary. 982 * 983 * LOCKING: 984 * spin_lock_irqsave(host lock) 985 * 986 * RETURNS: 987 * 1 if EH is scheduled, 0 otherwise. 988 */ 989 int sata_async_notification(struct ata_port *ap) 990 { 991 u32 sntf; 992 int rc; 993 994 if (!(ap->flags & ATA_FLAG_AN)) 995 return 0; 996 997 rc = sata_scr_read(&ap->link, SCR_NOTIFICATION, &sntf); 998 if (rc == 0) 999 sata_scr_write(&ap->link, SCR_NOTIFICATION, sntf); 1000 1001 if (!sata_pmp_attached(ap) || rc) { 1002 /* PMP is not attached or SNTF is not available */ 1003 if (!sata_pmp_attached(ap)) { 1004 /* PMP is not attached. Check whether ATAPI 1005 * AN is configured. If so, notify media 1006 * change. 1007 */ 1008 struct ata_device *dev = ap->link.device; 1009 1010 if ((dev->class == ATA_DEV_ATAPI) && 1011 (dev->flags & ATA_DFLAG_AN)) 1012 ata_scsi_media_change_notify(dev); 1013 return 0; 1014 } else { 1015 /* PMP is attached but SNTF is not available. 1016 * ATAPI async media change notification is 1017 * not used. The PMP must be reporting PHY 1018 * status change, schedule EH. 1019 */ 1020 ata_port_schedule_eh(ap); 1021 return 1; 1022 } 1023 } else { 1024 /* PMP is attached and SNTF is available */ 1025 struct ata_link *link; 1026 1027 /* check and notify ATAPI AN */ 1028 ata_port_for_each_link(link, ap) { 1029 if (!(sntf & (1 << link->pmp))) 1030 continue; 1031 1032 if ((link->device->class == ATA_DEV_ATAPI) && 1033 (link->device->flags & ATA_DFLAG_AN)) 1034 ata_scsi_media_change_notify(link->device); 1035 } 1036 1037 /* If PMP is reporting that PHY status of some 1038 * downstream ports has changed, schedule EH. 1039 */ 1040 if (sntf & (1 << SATA_PMP_CTRL_PORT)) { 1041 ata_port_schedule_eh(ap); 1042 return 1; 1043 } 1044 1045 return 0; 1046 } 1047 } 1048 1049 /** 1050 * ata_eh_freeze_port - EH helper to freeze port 1051 * @ap: ATA port to freeze 1052 * 1053 * Freeze @ap. 1054 * 1055 * LOCKING: 1056 * None. 1057 */ 1058 void ata_eh_freeze_port(struct ata_port *ap) 1059 { 1060 unsigned long flags; 1061 1062 if (!ap->ops->error_handler) 1063 return; 1064 1065 spin_lock_irqsave(ap->lock, flags); 1066 __ata_port_freeze(ap); 1067 spin_unlock_irqrestore(ap->lock, flags); 1068 } 1069 1070 /** 1071 * ata_port_thaw_port - EH helper to thaw port 1072 * @ap: ATA port to thaw 1073 * 1074 * Thaw frozen port @ap. 1075 * 1076 * LOCKING: 1077 * None. 1078 */ 1079 void ata_eh_thaw_port(struct ata_port *ap) 1080 { 1081 unsigned long flags; 1082 1083 if (!ap->ops->error_handler) 1084 return; 1085 1086 spin_lock_irqsave(ap->lock, flags); 1087 1088 ap->pflags &= ~ATA_PFLAG_FROZEN; 1089 1090 if (ap->ops->thaw) 1091 ap->ops->thaw(ap); 1092 1093 spin_unlock_irqrestore(ap->lock, flags); 1094 1095 DPRINTK("ata%u port thawed\n", ap->print_id); 1096 } 1097 1098 static void ata_eh_scsidone(struct scsi_cmnd *scmd) 1099 { 1100 /* nada */ 1101 } 1102 1103 static void __ata_eh_qc_complete(struct ata_queued_cmd *qc) 1104 { 1105 struct ata_port *ap = qc->ap; 1106 struct scsi_cmnd *scmd = qc->scsicmd; 1107 unsigned long flags; 1108 1109 spin_lock_irqsave(ap->lock, flags); 1110 qc->scsidone = ata_eh_scsidone; 1111 __ata_qc_complete(qc); 1112 WARN_ON(ata_tag_valid(qc->tag)); 1113 spin_unlock_irqrestore(ap->lock, flags); 1114 1115 scsi_eh_finish_cmd(scmd, &ap->eh_done_q); 1116 } 1117 1118 /** 1119 * ata_eh_qc_complete - Complete an active ATA command from EH 1120 * @qc: Command to complete 1121 * 1122 * Indicate to the mid and upper layers that an ATA command has 1123 * completed. To be used from EH. 1124 */ 1125 void ata_eh_qc_complete(struct ata_queued_cmd *qc) 1126 { 1127 struct scsi_cmnd *scmd = qc->scsicmd; 1128 scmd->retries = scmd->allowed; 1129 __ata_eh_qc_complete(qc); 1130 } 1131 1132 /** 1133 * ata_eh_qc_retry - Tell midlayer to retry an ATA command after EH 1134 * @qc: Command to retry 1135 * 1136 * Indicate to the mid and upper layers that an ATA command 1137 * should be retried. To be used from EH. 1138 * 1139 * SCSI midlayer limits the number of retries to scmd->allowed. 1140 * scmd->retries is decremented for commands which get retried 1141 * due to unrelated failures (qc->err_mask is zero). 1142 */ 1143 void ata_eh_qc_retry(struct ata_queued_cmd *qc) 1144 { 1145 struct scsi_cmnd *scmd = qc->scsicmd; 1146 if (!qc->err_mask && scmd->retries) 1147 scmd->retries--; 1148 __ata_eh_qc_complete(qc); 1149 } 1150 1151 /** 1152 * ata_eh_detach_dev - detach ATA device 1153 * @dev: ATA device to detach 1154 * 1155 * Detach @dev. 1156 * 1157 * LOCKING: 1158 * None. 1159 */ 1160 void ata_eh_detach_dev(struct ata_device *dev) 1161 { 1162 struct ata_link *link = dev->link; 1163 struct ata_port *ap = link->ap; 1164 unsigned long flags; 1165 1166 ata_dev_disable(dev); 1167 1168 spin_lock_irqsave(ap->lock, flags); 1169 1170 dev->flags &= ~ATA_DFLAG_DETACH; 1171 1172 if (ata_scsi_offline_dev(dev)) { 1173 dev->flags |= ATA_DFLAG_DETACHED; 1174 ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG; 1175 } 1176 1177 /* clear per-dev EH actions */ 1178 ata_eh_clear_action(link, dev, &link->eh_info, ATA_EH_PERDEV_MASK); 1179 ata_eh_clear_action(link, dev, &link->eh_context.i, ATA_EH_PERDEV_MASK); 1180 1181 spin_unlock_irqrestore(ap->lock, flags); 1182 } 1183 1184 /** 1185 * ata_eh_about_to_do - about to perform eh_action 1186 * @link: target ATA link 1187 * @dev: target ATA dev for per-dev action (can be NULL) 1188 * @action: action about to be performed 1189 * 1190 * Called just before performing EH actions to clear related bits 1191 * in @link->eh_info such that eh actions are not unnecessarily 1192 * repeated. 1193 * 1194 * LOCKING: 1195 * None. 1196 */ 1197 void ata_eh_about_to_do(struct ata_link *link, struct ata_device *dev, 1198 unsigned int action) 1199 { 1200 struct ata_port *ap = link->ap; 1201 struct ata_eh_info *ehi = &link->eh_info; 1202 struct ata_eh_context *ehc = &link->eh_context; 1203 unsigned long flags; 1204 1205 spin_lock_irqsave(ap->lock, flags); 1206 1207 ata_eh_clear_action(link, dev, ehi, action); 1208 1209 if (!(ehc->i.flags & ATA_EHI_QUIET)) 1210 ap->pflags |= ATA_PFLAG_RECOVERED; 1211 1212 spin_unlock_irqrestore(ap->lock, flags); 1213 } 1214 1215 /** 1216 * ata_eh_done - EH action complete 1217 * @ap: target ATA port 1218 * @dev: target ATA dev for per-dev action (can be NULL) 1219 * @action: action just completed 1220 * 1221 * Called right after performing EH actions to clear related bits 1222 * in @link->eh_context. 1223 * 1224 * LOCKING: 1225 * None. 1226 */ 1227 void ata_eh_done(struct ata_link *link, struct ata_device *dev, 1228 unsigned int action) 1229 { 1230 struct ata_eh_context *ehc = &link->eh_context; 1231 1232 ata_eh_clear_action(link, dev, &ehc->i, action); 1233 } 1234 1235 /** 1236 * ata_err_string - convert err_mask to descriptive string 1237 * @err_mask: error mask to convert to string 1238 * 1239 * Convert @err_mask to descriptive string. Errors are 1240 * prioritized according to severity and only the most severe 1241 * error is reported. 1242 * 1243 * LOCKING: 1244 * None. 1245 * 1246 * RETURNS: 1247 * Descriptive string for @err_mask 1248 */ 1249 static const char *ata_err_string(unsigned int err_mask) 1250 { 1251 if (err_mask & AC_ERR_HOST_BUS) 1252 return "host bus error"; 1253 if (err_mask & AC_ERR_ATA_BUS) 1254 return "ATA bus error"; 1255 if (err_mask & AC_ERR_TIMEOUT) 1256 return "timeout"; 1257 if (err_mask & AC_ERR_HSM) 1258 return "HSM violation"; 1259 if (err_mask & AC_ERR_SYSTEM) 1260 return "internal error"; 1261 if (err_mask & AC_ERR_MEDIA) 1262 return "media error"; 1263 if (err_mask & AC_ERR_INVALID) 1264 return "invalid argument"; 1265 if (err_mask & AC_ERR_DEV) 1266 return "device error"; 1267 return "unknown error"; 1268 } 1269 1270 /** 1271 * ata_read_log_page - read a specific log page 1272 * @dev: target device 1273 * @page: page to read 1274 * @buf: buffer to store read page 1275 * @sectors: number of sectors to read 1276 * 1277 * Read log page using READ_LOG_EXT command. 1278 * 1279 * LOCKING: 1280 * Kernel thread context (may sleep). 1281 * 1282 * RETURNS: 1283 * 0 on success, AC_ERR_* mask otherwise. 1284 */ 1285 static unsigned int ata_read_log_page(struct ata_device *dev, 1286 u8 page, void *buf, unsigned int sectors) 1287 { 1288 struct ata_taskfile tf; 1289 unsigned int err_mask; 1290 1291 DPRINTK("read log page - page %d\n", page); 1292 1293 ata_tf_init(dev, &tf); 1294 tf.command = ATA_CMD_READ_LOG_EXT; 1295 tf.lbal = page; 1296 tf.nsect = sectors; 1297 tf.hob_nsect = sectors >> 8; 1298 tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_LBA48 | ATA_TFLAG_DEVICE; 1299 tf.protocol = ATA_PROT_PIO; 1300 1301 err_mask = ata_exec_internal(dev, &tf, NULL, DMA_FROM_DEVICE, 1302 buf, sectors * ATA_SECT_SIZE, 0); 1303 1304 DPRINTK("EXIT, err_mask=%x\n", err_mask); 1305 return err_mask; 1306 } 1307 1308 /** 1309 * ata_eh_read_log_10h - Read log page 10h for NCQ error details 1310 * @dev: Device to read log page 10h from 1311 * @tag: Resulting tag of the failed command 1312 * @tf: Resulting taskfile registers of the failed command 1313 * 1314 * Read log page 10h to obtain NCQ error details and clear error 1315 * condition. 1316 * 1317 * LOCKING: 1318 * Kernel thread context (may sleep). 1319 * 1320 * RETURNS: 1321 * 0 on success, -errno otherwise. 1322 */ 1323 static int ata_eh_read_log_10h(struct ata_device *dev, 1324 int *tag, struct ata_taskfile *tf) 1325 { 1326 u8 *buf = dev->link->ap->sector_buf; 1327 unsigned int err_mask; 1328 u8 csum; 1329 int i; 1330 1331 err_mask = ata_read_log_page(dev, ATA_LOG_SATA_NCQ, buf, 1); 1332 if (err_mask) 1333 return -EIO; 1334 1335 csum = 0; 1336 for (i = 0; i < ATA_SECT_SIZE; i++) 1337 csum += buf[i]; 1338 if (csum) 1339 ata_dev_printk(dev, KERN_WARNING, 1340 "invalid checksum 0x%x on log page 10h\n", csum); 1341 1342 if (buf[0] & 0x80) 1343 return -ENOENT; 1344 1345 *tag = buf[0] & 0x1f; 1346 1347 tf->command = buf[2]; 1348 tf->feature = buf[3]; 1349 tf->lbal = buf[4]; 1350 tf->lbam = buf[5]; 1351 tf->lbah = buf[6]; 1352 tf->device = buf[7]; 1353 tf->hob_lbal = buf[8]; 1354 tf->hob_lbam = buf[9]; 1355 tf->hob_lbah = buf[10]; 1356 tf->nsect = buf[12]; 1357 tf->hob_nsect = buf[13]; 1358 1359 return 0; 1360 } 1361 1362 /** 1363 * atapi_eh_tur - perform ATAPI TEST_UNIT_READY 1364 * @dev: target ATAPI device 1365 * @r_sense_key: out parameter for sense_key 1366 * 1367 * Perform ATAPI TEST_UNIT_READY. 1368 * 1369 * LOCKING: 1370 * EH context (may sleep). 1371 * 1372 * RETURNS: 1373 * 0 on success, AC_ERR_* mask on failure. 1374 */ 1375 static unsigned int atapi_eh_tur(struct ata_device *dev, u8 *r_sense_key) 1376 { 1377 u8 cdb[ATAPI_CDB_LEN] = { TEST_UNIT_READY, 0, 0, 0, 0, 0 }; 1378 struct ata_taskfile tf; 1379 unsigned int err_mask; 1380 1381 ata_tf_init(dev, &tf); 1382 1383 tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE; 1384 tf.command = ATA_CMD_PACKET; 1385 tf.protocol = ATAPI_PROT_NODATA; 1386 1387 err_mask = ata_exec_internal(dev, &tf, cdb, DMA_NONE, NULL, 0, 0); 1388 if (err_mask == AC_ERR_DEV) 1389 *r_sense_key = tf.feature >> 4; 1390 return err_mask; 1391 } 1392 1393 /** 1394 * atapi_eh_request_sense - perform ATAPI REQUEST_SENSE 1395 * @dev: device to perform REQUEST_SENSE to 1396 * @sense_buf: result sense data buffer (SCSI_SENSE_BUFFERSIZE bytes long) 1397 * @dfl_sense_key: default sense key to use 1398 * 1399 * Perform ATAPI REQUEST_SENSE after the device reported CHECK 1400 * SENSE. This function is EH helper. 1401 * 1402 * LOCKING: 1403 * Kernel thread context (may sleep). 1404 * 1405 * RETURNS: 1406 * 0 on success, AC_ERR_* mask on failure 1407 */ 1408 static unsigned int atapi_eh_request_sense(struct ata_device *dev, 1409 u8 *sense_buf, u8 dfl_sense_key) 1410 { 1411 u8 cdb[ATAPI_CDB_LEN] = 1412 { REQUEST_SENSE, 0, 0, 0, SCSI_SENSE_BUFFERSIZE, 0 }; 1413 struct ata_port *ap = dev->link->ap; 1414 struct ata_taskfile tf; 1415 1416 DPRINTK("ATAPI request sense\n"); 1417 1418 /* FIXME: is this needed? */ 1419 memset(sense_buf, 0, SCSI_SENSE_BUFFERSIZE); 1420 1421 /* initialize sense_buf with the error register, 1422 * for the case where they are -not- overwritten 1423 */ 1424 sense_buf[0] = 0x70; 1425 sense_buf[2] = dfl_sense_key; 1426 1427 /* some devices time out if garbage left in tf */ 1428 ata_tf_init(dev, &tf); 1429 1430 tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE; 1431 tf.command = ATA_CMD_PACKET; 1432 1433 /* is it pointless to prefer PIO for "safety reasons"? */ 1434 if (ap->flags & ATA_FLAG_PIO_DMA) { 1435 tf.protocol = ATAPI_PROT_DMA; 1436 tf.feature |= ATAPI_PKT_DMA; 1437 } else { 1438 tf.protocol = ATAPI_PROT_PIO; 1439 tf.lbam = SCSI_SENSE_BUFFERSIZE; 1440 tf.lbah = 0; 1441 } 1442 1443 return ata_exec_internal(dev, &tf, cdb, DMA_FROM_DEVICE, 1444 sense_buf, SCSI_SENSE_BUFFERSIZE, 0); 1445 } 1446 1447 /** 1448 * ata_eh_analyze_serror - analyze SError for a failed port 1449 * @link: ATA link to analyze SError for 1450 * 1451 * Analyze SError if available and further determine cause of 1452 * failure. 1453 * 1454 * LOCKING: 1455 * None. 1456 */ 1457 static void ata_eh_analyze_serror(struct ata_link *link) 1458 { 1459 struct ata_eh_context *ehc = &link->eh_context; 1460 u32 serror = ehc->i.serror; 1461 unsigned int err_mask = 0, action = 0; 1462 u32 hotplug_mask; 1463 1464 if (serror & (SERR_PERSISTENT | SERR_DATA)) { 1465 err_mask |= AC_ERR_ATA_BUS; 1466 action |= ATA_EH_RESET; 1467 } 1468 if (serror & SERR_PROTOCOL) { 1469 err_mask |= AC_ERR_HSM; 1470 action |= ATA_EH_RESET; 1471 } 1472 if (serror & SERR_INTERNAL) { 1473 err_mask |= AC_ERR_SYSTEM; 1474 action |= ATA_EH_RESET; 1475 } 1476 1477 /* Determine whether a hotplug event has occurred. Both 1478 * SError.N/X are considered hotplug events for enabled or 1479 * host links. For disabled PMP links, only N bit is 1480 * considered as X bit is left at 1 for link plugging. 1481 */ 1482 hotplug_mask = 0; 1483 1484 if (!(link->flags & ATA_LFLAG_DISABLED) || ata_is_host_link(link)) 1485 hotplug_mask = SERR_PHYRDY_CHG | SERR_DEV_XCHG; 1486 else 1487 hotplug_mask = SERR_PHYRDY_CHG; 1488 1489 if (serror & hotplug_mask) 1490 ata_ehi_hotplugged(&ehc->i); 1491 1492 ehc->i.err_mask |= err_mask; 1493 ehc->i.action |= action; 1494 } 1495 1496 /** 1497 * ata_eh_analyze_ncq_error - analyze NCQ error 1498 * @link: ATA link to analyze NCQ error for 1499 * 1500 * Read log page 10h, determine the offending qc and acquire 1501 * error status TF. For NCQ device errors, all LLDDs have to do 1502 * is setting AC_ERR_DEV in ehi->err_mask. This function takes 1503 * care of the rest. 1504 * 1505 * LOCKING: 1506 * Kernel thread context (may sleep). 1507 */ 1508 void ata_eh_analyze_ncq_error(struct ata_link *link) 1509 { 1510 struct ata_port *ap = link->ap; 1511 struct ata_eh_context *ehc = &link->eh_context; 1512 struct ata_device *dev = link->device; 1513 struct ata_queued_cmd *qc; 1514 struct ata_taskfile tf; 1515 int tag, rc; 1516 1517 /* if frozen, we can't do much */ 1518 if (ap->pflags & ATA_PFLAG_FROZEN) 1519 return; 1520 1521 /* is it NCQ device error? */ 1522 if (!link->sactive || !(ehc->i.err_mask & AC_ERR_DEV)) 1523 return; 1524 1525 /* has LLDD analyzed already? */ 1526 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 1527 qc = __ata_qc_from_tag(ap, tag); 1528 1529 if (!(qc->flags & ATA_QCFLAG_FAILED)) 1530 continue; 1531 1532 if (qc->err_mask) 1533 return; 1534 } 1535 1536 /* okay, this error is ours */ 1537 rc = ata_eh_read_log_10h(dev, &tag, &tf); 1538 if (rc) { 1539 ata_link_printk(link, KERN_ERR, "failed to read log page 10h " 1540 "(errno=%d)\n", rc); 1541 return; 1542 } 1543 1544 if (!(link->sactive & (1 << tag))) { 1545 ata_link_printk(link, KERN_ERR, "log page 10h reported " 1546 "inactive tag %d\n", tag); 1547 return; 1548 } 1549 1550 /* we've got the perpetrator, condemn it */ 1551 qc = __ata_qc_from_tag(ap, tag); 1552 memcpy(&qc->result_tf, &tf, sizeof(tf)); 1553 qc->result_tf.flags = ATA_TFLAG_ISADDR | ATA_TFLAG_LBA | ATA_TFLAG_LBA48; 1554 qc->err_mask |= AC_ERR_DEV | AC_ERR_NCQ; 1555 ehc->i.err_mask &= ~AC_ERR_DEV; 1556 } 1557 1558 /** 1559 * ata_eh_analyze_tf - analyze taskfile of a failed qc 1560 * @qc: qc to analyze 1561 * @tf: Taskfile registers to analyze 1562 * 1563 * Analyze taskfile of @qc and further determine cause of 1564 * failure. This function also requests ATAPI sense data if 1565 * avaliable. 1566 * 1567 * LOCKING: 1568 * Kernel thread context (may sleep). 1569 * 1570 * RETURNS: 1571 * Determined recovery action 1572 */ 1573 static unsigned int ata_eh_analyze_tf(struct ata_queued_cmd *qc, 1574 const struct ata_taskfile *tf) 1575 { 1576 unsigned int tmp, action = 0; 1577 u8 stat = tf->command, err = tf->feature; 1578 1579 if ((stat & (ATA_BUSY | ATA_DRQ | ATA_DRDY)) != ATA_DRDY) { 1580 qc->err_mask |= AC_ERR_HSM; 1581 return ATA_EH_RESET; 1582 } 1583 1584 if (stat & (ATA_ERR | ATA_DF)) 1585 qc->err_mask |= AC_ERR_DEV; 1586 else 1587 return 0; 1588 1589 switch (qc->dev->class) { 1590 case ATA_DEV_ATA: 1591 if (err & ATA_ICRC) 1592 qc->err_mask |= AC_ERR_ATA_BUS; 1593 if (err & ATA_UNC) 1594 qc->err_mask |= AC_ERR_MEDIA; 1595 if (err & ATA_IDNF) 1596 qc->err_mask |= AC_ERR_INVALID; 1597 break; 1598 1599 case ATA_DEV_ATAPI: 1600 if (!(qc->ap->pflags & ATA_PFLAG_FROZEN)) { 1601 tmp = atapi_eh_request_sense(qc->dev, 1602 qc->scsicmd->sense_buffer, 1603 qc->result_tf.feature >> 4); 1604 if (!tmp) { 1605 /* ATA_QCFLAG_SENSE_VALID is used to 1606 * tell atapi_qc_complete() that sense 1607 * data is already valid. 1608 * 1609 * TODO: interpret sense data and set 1610 * appropriate err_mask. 1611 */ 1612 qc->flags |= ATA_QCFLAG_SENSE_VALID; 1613 } else 1614 qc->err_mask |= tmp; 1615 } 1616 } 1617 1618 if (qc->err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT | AC_ERR_ATA_BUS)) 1619 action |= ATA_EH_RESET; 1620 1621 return action; 1622 } 1623 1624 static int ata_eh_categorize_error(unsigned int eflags, unsigned int err_mask, 1625 int *xfer_ok) 1626 { 1627 int base = 0; 1628 1629 if (!(eflags & ATA_EFLAG_DUBIOUS_XFER)) 1630 *xfer_ok = 1; 1631 1632 if (!*xfer_ok) 1633 base = ATA_ECAT_DUBIOUS_NONE; 1634 1635 if (err_mask & AC_ERR_ATA_BUS) 1636 return base + ATA_ECAT_ATA_BUS; 1637 1638 if (err_mask & AC_ERR_TIMEOUT) 1639 return base + ATA_ECAT_TOUT_HSM; 1640 1641 if (eflags & ATA_EFLAG_IS_IO) { 1642 if (err_mask & AC_ERR_HSM) 1643 return base + ATA_ECAT_TOUT_HSM; 1644 if ((err_mask & 1645 (AC_ERR_DEV|AC_ERR_MEDIA|AC_ERR_INVALID)) == AC_ERR_DEV) 1646 return base + ATA_ECAT_UNK_DEV; 1647 } 1648 1649 return 0; 1650 } 1651 1652 struct speed_down_verdict_arg { 1653 u64 since; 1654 int xfer_ok; 1655 int nr_errors[ATA_ECAT_NR]; 1656 }; 1657 1658 static int speed_down_verdict_cb(struct ata_ering_entry *ent, void *void_arg) 1659 { 1660 struct speed_down_verdict_arg *arg = void_arg; 1661 int cat; 1662 1663 if (ent->timestamp < arg->since) 1664 return -1; 1665 1666 cat = ata_eh_categorize_error(ent->eflags, ent->err_mask, 1667 &arg->xfer_ok); 1668 arg->nr_errors[cat]++; 1669 1670 return 0; 1671 } 1672 1673 /** 1674 * ata_eh_speed_down_verdict - Determine speed down verdict 1675 * @dev: Device of interest 1676 * 1677 * This function examines error ring of @dev and determines 1678 * whether NCQ needs to be turned off, transfer speed should be 1679 * stepped down, or falling back to PIO is necessary. 1680 * 1681 * ECAT_ATA_BUS : ATA_BUS error for any command 1682 * 1683 * ECAT_TOUT_HSM : TIMEOUT for any command or HSM violation for 1684 * IO commands 1685 * 1686 * ECAT_UNK_DEV : Unknown DEV error for IO commands 1687 * 1688 * ECAT_DUBIOUS_* : Identical to above three but occurred while 1689 * data transfer hasn't been verified. 1690 * 1691 * Verdicts are 1692 * 1693 * NCQ_OFF : Turn off NCQ. 1694 * 1695 * SPEED_DOWN : Speed down transfer speed but don't fall back 1696 * to PIO. 1697 * 1698 * FALLBACK_TO_PIO : Fall back to PIO. 1699 * 1700 * Even if multiple verdicts are returned, only one action is 1701 * taken per error. An action triggered by non-DUBIOUS errors 1702 * clears ering, while one triggered by DUBIOUS_* errors doesn't. 1703 * This is to expedite speed down decisions right after device is 1704 * initially configured. 1705 * 1706 * The followings are speed down rules. #1 and #2 deal with 1707 * DUBIOUS errors. 1708 * 1709 * 1. If more than one DUBIOUS_ATA_BUS or DUBIOUS_TOUT_HSM errors 1710 * occurred during last 5 mins, SPEED_DOWN and FALLBACK_TO_PIO. 1711 * 1712 * 2. If more than one DUBIOUS_TOUT_HSM or DUBIOUS_UNK_DEV errors 1713 * occurred during last 5 mins, NCQ_OFF. 1714 * 1715 * 3. If more than 8 ATA_BUS, TOUT_HSM or UNK_DEV errors 1716 * ocurred during last 5 mins, FALLBACK_TO_PIO 1717 * 1718 * 4. If more than 3 TOUT_HSM or UNK_DEV errors occurred 1719 * during last 10 mins, NCQ_OFF. 1720 * 1721 * 5. If more than 3 ATA_BUS or TOUT_HSM errors, or more than 6 1722 * UNK_DEV errors occurred during last 10 mins, SPEED_DOWN. 1723 * 1724 * LOCKING: 1725 * Inherited from caller. 1726 * 1727 * RETURNS: 1728 * OR of ATA_EH_SPDN_* flags. 1729 */ 1730 static unsigned int ata_eh_speed_down_verdict(struct ata_device *dev) 1731 { 1732 const u64 j5mins = 5LLU * 60 * HZ, j10mins = 10LLU * 60 * HZ; 1733 u64 j64 = get_jiffies_64(); 1734 struct speed_down_verdict_arg arg; 1735 unsigned int verdict = 0; 1736 1737 /* scan past 5 mins of error history */ 1738 memset(&arg, 0, sizeof(arg)); 1739 arg.since = j64 - min(j64, j5mins); 1740 ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg); 1741 1742 if (arg.nr_errors[ATA_ECAT_DUBIOUS_ATA_BUS] + 1743 arg.nr_errors[ATA_ECAT_DUBIOUS_TOUT_HSM] > 1) 1744 verdict |= ATA_EH_SPDN_SPEED_DOWN | 1745 ATA_EH_SPDN_FALLBACK_TO_PIO | ATA_EH_SPDN_KEEP_ERRORS; 1746 1747 if (arg.nr_errors[ATA_ECAT_DUBIOUS_TOUT_HSM] + 1748 arg.nr_errors[ATA_ECAT_DUBIOUS_UNK_DEV] > 1) 1749 verdict |= ATA_EH_SPDN_NCQ_OFF | ATA_EH_SPDN_KEEP_ERRORS; 1750 1751 if (arg.nr_errors[ATA_ECAT_ATA_BUS] + 1752 arg.nr_errors[ATA_ECAT_TOUT_HSM] + 1753 arg.nr_errors[ATA_ECAT_UNK_DEV] > 6) 1754 verdict |= ATA_EH_SPDN_FALLBACK_TO_PIO; 1755 1756 /* scan past 10 mins of error history */ 1757 memset(&arg, 0, sizeof(arg)); 1758 arg.since = j64 - min(j64, j10mins); 1759 ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg); 1760 1761 if (arg.nr_errors[ATA_ECAT_TOUT_HSM] + 1762 arg.nr_errors[ATA_ECAT_UNK_DEV] > 3) 1763 verdict |= ATA_EH_SPDN_NCQ_OFF; 1764 1765 if (arg.nr_errors[ATA_ECAT_ATA_BUS] + 1766 arg.nr_errors[ATA_ECAT_TOUT_HSM] > 3 || 1767 arg.nr_errors[ATA_ECAT_UNK_DEV] > 6) 1768 verdict |= ATA_EH_SPDN_SPEED_DOWN; 1769 1770 return verdict; 1771 } 1772 1773 /** 1774 * ata_eh_speed_down - record error and speed down if necessary 1775 * @dev: Failed device 1776 * @eflags: mask of ATA_EFLAG_* flags 1777 * @err_mask: err_mask of the error 1778 * 1779 * Record error and examine error history to determine whether 1780 * adjusting transmission speed is necessary. It also sets 1781 * transmission limits appropriately if such adjustment is 1782 * necessary. 1783 * 1784 * LOCKING: 1785 * Kernel thread context (may sleep). 1786 * 1787 * RETURNS: 1788 * Determined recovery action. 1789 */ 1790 static unsigned int ata_eh_speed_down(struct ata_device *dev, 1791 unsigned int eflags, unsigned int err_mask) 1792 { 1793 struct ata_link *link = ata_dev_phys_link(dev); 1794 int xfer_ok = 0; 1795 unsigned int verdict; 1796 unsigned int action = 0; 1797 1798 /* don't bother if Cat-0 error */ 1799 if (ata_eh_categorize_error(eflags, err_mask, &xfer_ok) == 0) 1800 return 0; 1801 1802 /* record error and determine whether speed down is necessary */ 1803 ata_ering_record(&dev->ering, eflags, err_mask); 1804 verdict = ata_eh_speed_down_verdict(dev); 1805 1806 /* turn off NCQ? */ 1807 if ((verdict & ATA_EH_SPDN_NCQ_OFF) && 1808 (dev->flags & (ATA_DFLAG_PIO | ATA_DFLAG_NCQ | 1809 ATA_DFLAG_NCQ_OFF)) == ATA_DFLAG_NCQ) { 1810 dev->flags |= ATA_DFLAG_NCQ_OFF; 1811 ata_dev_printk(dev, KERN_WARNING, 1812 "NCQ disabled due to excessive errors\n"); 1813 goto done; 1814 } 1815 1816 /* speed down? */ 1817 if (verdict & ATA_EH_SPDN_SPEED_DOWN) { 1818 /* speed down SATA link speed if possible */ 1819 if (sata_down_spd_limit(link) == 0) { 1820 action |= ATA_EH_RESET; 1821 goto done; 1822 } 1823 1824 /* lower transfer mode */ 1825 if (dev->spdn_cnt < 2) { 1826 static const int dma_dnxfer_sel[] = 1827 { ATA_DNXFER_DMA, ATA_DNXFER_40C }; 1828 static const int pio_dnxfer_sel[] = 1829 { ATA_DNXFER_PIO, ATA_DNXFER_FORCE_PIO0 }; 1830 int sel; 1831 1832 if (dev->xfer_shift != ATA_SHIFT_PIO) 1833 sel = dma_dnxfer_sel[dev->spdn_cnt]; 1834 else 1835 sel = pio_dnxfer_sel[dev->spdn_cnt]; 1836 1837 dev->spdn_cnt++; 1838 1839 if (ata_down_xfermask_limit(dev, sel) == 0) { 1840 action |= ATA_EH_RESET; 1841 goto done; 1842 } 1843 } 1844 } 1845 1846 /* Fall back to PIO? Slowing down to PIO is meaningless for 1847 * SATA ATA devices. Consider it only for PATA and SATAPI. 1848 */ 1849 if ((verdict & ATA_EH_SPDN_FALLBACK_TO_PIO) && (dev->spdn_cnt >= 2) && 1850 (link->ap->cbl != ATA_CBL_SATA || dev->class == ATA_DEV_ATAPI) && 1851 (dev->xfer_shift != ATA_SHIFT_PIO)) { 1852 if (ata_down_xfermask_limit(dev, ATA_DNXFER_FORCE_PIO) == 0) { 1853 dev->spdn_cnt = 0; 1854 action |= ATA_EH_RESET; 1855 goto done; 1856 } 1857 } 1858 1859 return 0; 1860 done: 1861 /* device has been slowed down, blow error history */ 1862 if (!(verdict & ATA_EH_SPDN_KEEP_ERRORS)) 1863 ata_ering_clear(&dev->ering); 1864 return action; 1865 } 1866 1867 /** 1868 * ata_eh_link_autopsy - analyze error and determine recovery action 1869 * @link: host link to perform autopsy on 1870 * 1871 * Analyze why @link failed and determine which recovery actions 1872 * are needed. This function also sets more detailed AC_ERR_* 1873 * values and fills sense data for ATAPI CHECK SENSE. 1874 * 1875 * LOCKING: 1876 * Kernel thread context (may sleep). 1877 */ 1878 static void ata_eh_link_autopsy(struct ata_link *link) 1879 { 1880 struct ata_port *ap = link->ap; 1881 struct ata_eh_context *ehc = &link->eh_context; 1882 struct ata_device *dev; 1883 unsigned int all_err_mask = 0, eflags = 0; 1884 int tag; 1885 u32 serror; 1886 int rc; 1887 1888 DPRINTK("ENTER\n"); 1889 1890 if (ehc->i.flags & ATA_EHI_NO_AUTOPSY) 1891 return; 1892 1893 /* obtain and analyze SError */ 1894 rc = sata_scr_read(link, SCR_ERROR, &serror); 1895 if (rc == 0) { 1896 ehc->i.serror |= serror; 1897 ata_eh_analyze_serror(link); 1898 } else if (rc != -EOPNOTSUPP) { 1899 /* SError read failed, force reset and probing */ 1900 ehc->i.probe_mask |= ATA_ALL_DEVICES; 1901 ehc->i.action |= ATA_EH_RESET; 1902 ehc->i.err_mask |= AC_ERR_OTHER; 1903 } 1904 1905 /* analyze NCQ failure */ 1906 ata_eh_analyze_ncq_error(link); 1907 1908 /* any real error trumps AC_ERR_OTHER */ 1909 if (ehc->i.err_mask & ~AC_ERR_OTHER) 1910 ehc->i.err_mask &= ~AC_ERR_OTHER; 1911 1912 all_err_mask |= ehc->i.err_mask; 1913 1914 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 1915 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 1916 1917 if (!(qc->flags & ATA_QCFLAG_FAILED) || 1918 ata_dev_phys_link(qc->dev) != link) 1919 continue; 1920 1921 /* inherit upper level err_mask */ 1922 qc->err_mask |= ehc->i.err_mask; 1923 1924 /* analyze TF */ 1925 ehc->i.action |= ata_eh_analyze_tf(qc, &qc->result_tf); 1926 1927 /* DEV errors are probably spurious in case of ATA_BUS error */ 1928 if (qc->err_mask & AC_ERR_ATA_BUS) 1929 qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_MEDIA | 1930 AC_ERR_INVALID); 1931 1932 /* any real error trumps unknown error */ 1933 if (qc->err_mask & ~AC_ERR_OTHER) 1934 qc->err_mask &= ~AC_ERR_OTHER; 1935 1936 /* SENSE_VALID trumps dev/unknown error and revalidation */ 1937 if (qc->flags & ATA_QCFLAG_SENSE_VALID) 1938 qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_OTHER); 1939 1940 /* determine whether the command is worth retrying */ 1941 if (!(qc->err_mask & AC_ERR_INVALID) && 1942 ((qc->flags & ATA_QCFLAG_IO) || qc->err_mask != AC_ERR_DEV)) 1943 qc->flags |= ATA_QCFLAG_RETRY; 1944 1945 /* accumulate error info */ 1946 ehc->i.dev = qc->dev; 1947 all_err_mask |= qc->err_mask; 1948 if (qc->flags & ATA_QCFLAG_IO) 1949 eflags |= ATA_EFLAG_IS_IO; 1950 } 1951 1952 /* enforce default EH actions */ 1953 if (ap->pflags & ATA_PFLAG_FROZEN || 1954 all_err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT)) 1955 ehc->i.action |= ATA_EH_RESET; 1956 else if (((eflags & ATA_EFLAG_IS_IO) && all_err_mask) || 1957 (!(eflags & ATA_EFLAG_IS_IO) && (all_err_mask & ~AC_ERR_DEV))) 1958 ehc->i.action |= ATA_EH_REVALIDATE; 1959 1960 /* If we have offending qcs and the associated failed device, 1961 * perform per-dev EH action only on the offending device. 1962 */ 1963 if (ehc->i.dev) { 1964 ehc->i.dev_action[ehc->i.dev->devno] |= 1965 ehc->i.action & ATA_EH_PERDEV_MASK; 1966 ehc->i.action &= ~ATA_EH_PERDEV_MASK; 1967 } 1968 1969 /* propagate timeout to host link */ 1970 if ((all_err_mask & AC_ERR_TIMEOUT) && !ata_is_host_link(link)) 1971 ap->link.eh_context.i.err_mask |= AC_ERR_TIMEOUT; 1972 1973 /* record error and consider speeding down */ 1974 dev = ehc->i.dev; 1975 if (!dev && ((ata_link_max_devices(link) == 1 && 1976 ata_dev_enabled(link->device)))) 1977 dev = link->device; 1978 1979 if (dev) { 1980 if (dev->flags & ATA_DFLAG_DUBIOUS_XFER) 1981 eflags |= ATA_EFLAG_DUBIOUS_XFER; 1982 ehc->i.action |= ata_eh_speed_down(dev, eflags, all_err_mask); 1983 } 1984 1985 DPRINTK("EXIT\n"); 1986 } 1987 1988 /** 1989 * ata_eh_autopsy - analyze error and determine recovery action 1990 * @ap: host port to perform autopsy on 1991 * 1992 * Analyze all links of @ap and determine why they failed and 1993 * which recovery actions are needed. 1994 * 1995 * LOCKING: 1996 * Kernel thread context (may sleep). 1997 */ 1998 void ata_eh_autopsy(struct ata_port *ap) 1999 { 2000 struct ata_link *link; 2001 2002 ata_port_for_each_link(link, ap) 2003 ata_eh_link_autopsy(link); 2004 2005 /* Handle the frigging slave link. Autopsy is done similarly 2006 * but actions and flags are transferred over to the master 2007 * link and handled from there. 2008 */ 2009 if (ap->slave_link) { 2010 struct ata_eh_context *mehc = &ap->link.eh_context; 2011 struct ata_eh_context *sehc = &ap->slave_link->eh_context; 2012 2013 ata_eh_link_autopsy(ap->slave_link); 2014 2015 ata_eh_about_to_do(ap->slave_link, NULL, ATA_EH_ALL_ACTIONS); 2016 mehc->i.action |= sehc->i.action; 2017 mehc->i.dev_action[1] |= sehc->i.dev_action[1]; 2018 mehc->i.flags |= sehc->i.flags; 2019 ata_eh_done(ap->slave_link, NULL, ATA_EH_ALL_ACTIONS); 2020 } 2021 2022 /* Autopsy of fanout ports can affect host link autopsy. 2023 * Perform host link autopsy last. 2024 */ 2025 if (sata_pmp_attached(ap)) 2026 ata_eh_link_autopsy(&ap->link); 2027 } 2028 2029 /** 2030 * ata_eh_link_report - report error handling to user 2031 * @link: ATA link EH is going on 2032 * 2033 * Report EH to user. 2034 * 2035 * LOCKING: 2036 * None. 2037 */ 2038 static void ata_eh_link_report(struct ata_link *link) 2039 { 2040 struct ata_port *ap = link->ap; 2041 struct ata_eh_context *ehc = &link->eh_context; 2042 const char *frozen, *desc; 2043 char tries_buf[6]; 2044 int tag, nr_failed = 0; 2045 2046 if (ehc->i.flags & ATA_EHI_QUIET) 2047 return; 2048 2049 desc = NULL; 2050 if (ehc->i.desc[0] != '\0') 2051 desc = ehc->i.desc; 2052 2053 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 2054 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 2055 2056 if (!(qc->flags & ATA_QCFLAG_FAILED) || 2057 ata_dev_phys_link(qc->dev) != link || 2058 ((qc->flags & ATA_QCFLAG_QUIET) && 2059 qc->err_mask == AC_ERR_DEV)) 2060 continue; 2061 if (qc->flags & ATA_QCFLAG_SENSE_VALID && !qc->err_mask) 2062 continue; 2063 2064 nr_failed++; 2065 } 2066 2067 if (!nr_failed && !ehc->i.err_mask) 2068 return; 2069 2070 frozen = ""; 2071 if (ap->pflags & ATA_PFLAG_FROZEN) 2072 frozen = " frozen"; 2073 2074 memset(tries_buf, 0, sizeof(tries_buf)); 2075 if (ap->eh_tries < ATA_EH_MAX_TRIES) 2076 snprintf(tries_buf, sizeof(tries_buf) - 1, " t%d", 2077 ap->eh_tries); 2078 2079 if (ehc->i.dev) { 2080 ata_dev_printk(ehc->i.dev, KERN_ERR, "exception Emask 0x%x " 2081 "SAct 0x%x SErr 0x%x action 0x%x%s%s\n", 2082 ehc->i.err_mask, link->sactive, ehc->i.serror, 2083 ehc->i.action, frozen, tries_buf); 2084 if (desc) 2085 ata_dev_printk(ehc->i.dev, KERN_ERR, "%s\n", desc); 2086 } else { 2087 ata_link_printk(link, KERN_ERR, "exception Emask 0x%x " 2088 "SAct 0x%x SErr 0x%x action 0x%x%s%s\n", 2089 ehc->i.err_mask, link->sactive, ehc->i.serror, 2090 ehc->i.action, frozen, tries_buf); 2091 if (desc) 2092 ata_link_printk(link, KERN_ERR, "%s\n", desc); 2093 } 2094 2095 if (ehc->i.serror) 2096 ata_link_printk(link, KERN_ERR, 2097 "SError: { %s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s}\n", 2098 ehc->i.serror & SERR_DATA_RECOVERED ? "RecovData " : "", 2099 ehc->i.serror & SERR_COMM_RECOVERED ? "RecovComm " : "", 2100 ehc->i.serror & SERR_DATA ? "UnrecovData " : "", 2101 ehc->i.serror & SERR_PERSISTENT ? "Persist " : "", 2102 ehc->i.serror & SERR_PROTOCOL ? "Proto " : "", 2103 ehc->i.serror & SERR_INTERNAL ? "HostInt " : "", 2104 ehc->i.serror & SERR_PHYRDY_CHG ? "PHYRdyChg " : "", 2105 ehc->i.serror & SERR_PHY_INT_ERR ? "PHYInt " : "", 2106 ehc->i.serror & SERR_COMM_WAKE ? "CommWake " : "", 2107 ehc->i.serror & SERR_10B_8B_ERR ? "10B8B " : "", 2108 ehc->i.serror & SERR_DISPARITY ? "Dispar " : "", 2109 ehc->i.serror & SERR_CRC ? "BadCRC " : "", 2110 ehc->i.serror & SERR_HANDSHAKE ? "Handshk " : "", 2111 ehc->i.serror & SERR_LINK_SEQ_ERR ? "LinkSeq " : "", 2112 ehc->i.serror & SERR_TRANS_ST_ERROR ? "TrStaTrns " : "", 2113 ehc->i.serror & SERR_UNRECOG_FIS ? "UnrecFIS " : "", 2114 ehc->i.serror & SERR_DEV_XCHG ? "DevExch " : ""); 2115 2116 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 2117 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 2118 struct ata_taskfile *cmd = &qc->tf, *res = &qc->result_tf; 2119 const u8 *cdb = qc->cdb; 2120 char data_buf[20] = ""; 2121 char cdb_buf[70] = ""; 2122 2123 if (!(qc->flags & ATA_QCFLAG_FAILED) || 2124 ata_dev_phys_link(qc->dev) != link || !qc->err_mask) 2125 continue; 2126 2127 if (qc->dma_dir != DMA_NONE) { 2128 static const char *dma_str[] = { 2129 [DMA_BIDIRECTIONAL] = "bidi", 2130 [DMA_TO_DEVICE] = "out", 2131 [DMA_FROM_DEVICE] = "in", 2132 }; 2133 static const char *prot_str[] = { 2134 [ATA_PROT_PIO] = "pio", 2135 [ATA_PROT_DMA] = "dma", 2136 [ATA_PROT_NCQ] = "ncq", 2137 [ATAPI_PROT_PIO] = "pio", 2138 [ATAPI_PROT_DMA] = "dma", 2139 }; 2140 2141 snprintf(data_buf, sizeof(data_buf), " %s %u %s", 2142 prot_str[qc->tf.protocol], qc->nbytes, 2143 dma_str[qc->dma_dir]); 2144 } 2145 2146 if (ata_is_atapi(qc->tf.protocol)) 2147 snprintf(cdb_buf, sizeof(cdb_buf), 2148 "cdb %02x %02x %02x %02x %02x %02x %02x %02x " 2149 "%02x %02x %02x %02x %02x %02x %02x %02x\n ", 2150 cdb[0], cdb[1], cdb[2], cdb[3], 2151 cdb[4], cdb[5], cdb[6], cdb[7], 2152 cdb[8], cdb[9], cdb[10], cdb[11], 2153 cdb[12], cdb[13], cdb[14], cdb[15]); 2154 2155 ata_dev_printk(qc->dev, KERN_ERR, 2156 "cmd %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x " 2157 "tag %d%s\n %s" 2158 "res %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x " 2159 "Emask 0x%x (%s)%s\n", 2160 cmd->command, cmd->feature, cmd->nsect, 2161 cmd->lbal, cmd->lbam, cmd->lbah, 2162 cmd->hob_feature, cmd->hob_nsect, 2163 cmd->hob_lbal, cmd->hob_lbam, cmd->hob_lbah, 2164 cmd->device, qc->tag, data_buf, cdb_buf, 2165 res->command, res->feature, res->nsect, 2166 res->lbal, res->lbam, res->lbah, 2167 res->hob_feature, res->hob_nsect, 2168 res->hob_lbal, res->hob_lbam, res->hob_lbah, 2169 res->device, qc->err_mask, ata_err_string(qc->err_mask), 2170 qc->err_mask & AC_ERR_NCQ ? " <F>" : ""); 2171 2172 if (res->command & (ATA_BUSY | ATA_DRDY | ATA_DF | ATA_DRQ | 2173 ATA_ERR)) { 2174 if (res->command & ATA_BUSY) 2175 ata_dev_printk(qc->dev, KERN_ERR, 2176 "status: { Busy }\n"); 2177 else 2178 ata_dev_printk(qc->dev, KERN_ERR, 2179 "status: { %s%s%s%s}\n", 2180 res->command & ATA_DRDY ? "DRDY " : "", 2181 res->command & ATA_DF ? "DF " : "", 2182 res->command & ATA_DRQ ? "DRQ " : "", 2183 res->command & ATA_ERR ? "ERR " : ""); 2184 } 2185 2186 if (cmd->command != ATA_CMD_PACKET && 2187 (res->feature & (ATA_ICRC | ATA_UNC | ATA_IDNF | 2188 ATA_ABORTED))) 2189 ata_dev_printk(qc->dev, KERN_ERR, 2190 "error: { %s%s%s%s}\n", 2191 res->feature & ATA_ICRC ? "ICRC " : "", 2192 res->feature & ATA_UNC ? "UNC " : "", 2193 res->feature & ATA_IDNF ? "IDNF " : "", 2194 res->feature & ATA_ABORTED ? "ABRT " : ""); 2195 } 2196 } 2197 2198 /** 2199 * ata_eh_report - report error handling to user 2200 * @ap: ATA port to report EH about 2201 * 2202 * Report EH to user. 2203 * 2204 * LOCKING: 2205 * None. 2206 */ 2207 void ata_eh_report(struct ata_port *ap) 2208 { 2209 struct ata_link *link; 2210 2211 __ata_port_for_each_link(link, ap) 2212 ata_eh_link_report(link); 2213 } 2214 2215 static int ata_do_reset(struct ata_link *link, ata_reset_fn_t reset, 2216 unsigned int *classes, unsigned long deadline, 2217 bool clear_classes) 2218 { 2219 struct ata_device *dev; 2220 2221 if (clear_classes) 2222 ata_link_for_each_dev(dev, link) 2223 classes[dev->devno] = ATA_DEV_UNKNOWN; 2224 2225 return reset(link, classes, deadline); 2226 } 2227 2228 static int ata_eh_followup_srst_needed(struct ata_link *link, 2229 int rc, const unsigned int *classes) 2230 { 2231 if ((link->flags & ATA_LFLAG_NO_SRST) || ata_link_offline(link)) 2232 return 0; 2233 if (rc == -EAGAIN) 2234 return 1; 2235 if (sata_pmp_supported(link->ap) && ata_is_host_link(link)) 2236 return 1; 2237 return 0; 2238 } 2239 2240 int ata_eh_reset(struct ata_link *link, int classify, 2241 ata_prereset_fn_t prereset, ata_reset_fn_t softreset, 2242 ata_reset_fn_t hardreset, ata_postreset_fn_t postreset) 2243 { 2244 struct ata_port *ap = link->ap; 2245 struct ata_link *slave = ap->slave_link; 2246 struct ata_eh_context *ehc = &link->eh_context; 2247 struct ata_eh_context *sehc = &slave->eh_context; 2248 unsigned int *classes = ehc->classes; 2249 unsigned int lflags = link->flags; 2250 int verbose = !(ehc->i.flags & ATA_EHI_QUIET); 2251 int max_tries = 0, try = 0; 2252 struct ata_link *failed_link; 2253 struct ata_device *dev; 2254 unsigned long deadline, now; 2255 ata_reset_fn_t reset; 2256 unsigned long flags; 2257 u32 sstatus; 2258 int nr_unknown, rc; 2259 2260 /* 2261 * Prepare to reset 2262 */ 2263 while (ata_eh_reset_timeouts[max_tries] != ULONG_MAX) 2264 max_tries++; 2265 if (link->flags & ATA_LFLAG_NO_HRST) 2266 hardreset = NULL; 2267 if (link->flags & ATA_LFLAG_NO_SRST) 2268 softreset = NULL; 2269 2270 now = jiffies; 2271 deadline = ata_deadline(ehc->last_reset, ATA_EH_RESET_COOL_DOWN); 2272 if (time_before(now, deadline)) 2273 schedule_timeout_uninterruptible(deadline - now); 2274 2275 spin_lock_irqsave(ap->lock, flags); 2276 ap->pflags |= ATA_PFLAG_RESETTING; 2277 spin_unlock_irqrestore(ap->lock, flags); 2278 2279 ata_eh_about_to_do(link, NULL, ATA_EH_RESET); 2280 ehc->last_reset = jiffies; 2281 2282 ata_link_for_each_dev(dev, link) { 2283 /* If we issue an SRST then an ATA drive (not ATAPI) 2284 * may change configuration and be in PIO0 timing. If 2285 * we do a hard reset (or are coming from power on) 2286 * this is true for ATA or ATAPI. Until we've set a 2287 * suitable controller mode we should not touch the 2288 * bus as we may be talking too fast. 2289 */ 2290 dev->pio_mode = XFER_PIO_0; 2291 2292 /* If the controller has a pio mode setup function 2293 * then use it to set the chipset to rights. Don't 2294 * touch the DMA setup as that will be dealt with when 2295 * configuring devices. 2296 */ 2297 if (ap->ops->set_piomode) 2298 ap->ops->set_piomode(ap, dev); 2299 } 2300 2301 /* prefer hardreset */ 2302 reset = NULL; 2303 ehc->i.action &= ~ATA_EH_RESET; 2304 if (hardreset) { 2305 reset = hardreset; 2306 ehc->i.action |= ATA_EH_HARDRESET; 2307 } else if (softreset) { 2308 reset = softreset; 2309 ehc->i.action |= ATA_EH_SOFTRESET; 2310 } 2311 2312 if (prereset) { 2313 unsigned long deadline = ata_deadline(jiffies, 2314 ATA_EH_PRERESET_TIMEOUT); 2315 2316 if (slave) { 2317 sehc->i.action &= ~ATA_EH_RESET; 2318 sehc->i.action |= ehc->i.action; 2319 } 2320 2321 rc = prereset(link, deadline); 2322 2323 /* If present, do prereset on slave link too. Reset 2324 * is skipped iff both master and slave links report 2325 * -ENOENT or clear ATA_EH_RESET. 2326 */ 2327 if (slave && (rc == 0 || rc == -ENOENT)) { 2328 int tmp; 2329 2330 tmp = prereset(slave, deadline); 2331 if (tmp != -ENOENT) 2332 rc = tmp; 2333 2334 ehc->i.action |= sehc->i.action; 2335 } 2336 2337 if (rc) { 2338 if (rc == -ENOENT) { 2339 ata_link_printk(link, KERN_DEBUG, 2340 "port disabled. ignoring.\n"); 2341 ehc->i.action &= ~ATA_EH_RESET; 2342 2343 ata_link_for_each_dev(dev, link) 2344 classes[dev->devno] = ATA_DEV_NONE; 2345 2346 rc = 0; 2347 } else 2348 ata_link_printk(link, KERN_ERR, 2349 "prereset failed (errno=%d)\n", rc); 2350 goto out; 2351 } 2352 2353 /* prereset() might have cleared ATA_EH_RESET. If so, 2354 * bang classes and return. 2355 */ 2356 if (reset && !(ehc->i.action & ATA_EH_RESET)) { 2357 ata_link_for_each_dev(dev, link) 2358 classes[dev->devno] = ATA_DEV_NONE; 2359 rc = 0; 2360 goto out; 2361 } 2362 } 2363 2364 retry: 2365 /* 2366 * Perform reset 2367 */ 2368 ehc->last_reset = jiffies; 2369 if (ata_is_host_link(link)) 2370 ata_eh_freeze_port(ap); 2371 2372 deadline = ata_deadline(jiffies, ata_eh_reset_timeouts[try++]); 2373 2374 if (reset) { 2375 if (verbose) 2376 ata_link_printk(link, KERN_INFO, "%s resetting link\n", 2377 reset == softreset ? "soft" : "hard"); 2378 2379 /* mark that this EH session started with reset */ 2380 if (reset == hardreset) 2381 ehc->i.flags |= ATA_EHI_DID_HARDRESET; 2382 else 2383 ehc->i.flags |= ATA_EHI_DID_SOFTRESET; 2384 2385 rc = ata_do_reset(link, reset, classes, deadline, true); 2386 if (rc && rc != -EAGAIN) { 2387 failed_link = link; 2388 goto fail; 2389 } 2390 2391 /* hardreset slave link if existent */ 2392 if (slave && reset == hardreset) { 2393 int tmp; 2394 2395 if (verbose) 2396 ata_link_printk(slave, KERN_INFO, 2397 "hard resetting link\n"); 2398 2399 ata_eh_about_to_do(slave, NULL, ATA_EH_RESET); 2400 tmp = ata_do_reset(slave, reset, classes, deadline, 2401 false); 2402 switch (tmp) { 2403 case -EAGAIN: 2404 rc = -EAGAIN; 2405 case 0: 2406 break; 2407 default: 2408 failed_link = slave; 2409 rc = tmp; 2410 goto fail; 2411 } 2412 } 2413 2414 /* perform follow-up SRST if necessary */ 2415 if (reset == hardreset && 2416 ata_eh_followup_srst_needed(link, rc, classes)) { 2417 reset = softreset; 2418 2419 if (!reset) { 2420 ata_link_printk(link, KERN_ERR, 2421 "follow-up softreset required " 2422 "but no softreset avaliable\n"); 2423 failed_link = link; 2424 rc = -EINVAL; 2425 goto fail; 2426 } 2427 2428 ata_eh_about_to_do(link, NULL, ATA_EH_RESET); 2429 rc = ata_do_reset(link, reset, classes, deadline, true); 2430 } 2431 } else { 2432 if (verbose) 2433 ata_link_printk(link, KERN_INFO, "no reset method " 2434 "available, skipping reset\n"); 2435 if (!(lflags & ATA_LFLAG_ASSUME_CLASS)) 2436 lflags |= ATA_LFLAG_ASSUME_ATA; 2437 } 2438 2439 /* 2440 * Post-reset processing 2441 */ 2442 ata_link_for_each_dev(dev, link) { 2443 /* After the reset, the device state is PIO 0 and the 2444 * controller state is undefined. Reset also wakes up 2445 * drives from sleeping mode. 2446 */ 2447 dev->pio_mode = XFER_PIO_0; 2448 dev->flags &= ~ATA_DFLAG_SLEEPING; 2449 2450 if (ata_phys_link_offline(ata_dev_phys_link(dev))) 2451 continue; 2452 2453 /* apply class override */ 2454 if (lflags & ATA_LFLAG_ASSUME_ATA) 2455 classes[dev->devno] = ATA_DEV_ATA; 2456 else if (lflags & ATA_LFLAG_ASSUME_SEMB) 2457 classes[dev->devno] = ATA_DEV_SEMB_UNSUP; /* not yet */ 2458 } 2459 2460 /* record current link speed */ 2461 if (sata_scr_read(link, SCR_STATUS, &sstatus) == 0) 2462 link->sata_spd = (sstatus >> 4) & 0xf; 2463 if (slave && sata_scr_read(slave, SCR_STATUS, &sstatus) == 0) 2464 slave->sata_spd = (sstatus >> 4) & 0xf; 2465 2466 /* thaw the port */ 2467 if (ata_is_host_link(link)) 2468 ata_eh_thaw_port(ap); 2469 2470 /* postreset() should clear hardware SError. Although SError 2471 * is cleared during link resume, clearing SError here is 2472 * necessary as some PHYs raise hotplug events after SRST. 2473 * This introduces race condition where hotplug occurs between 2474 * reset and here. This race is mediated by cross checking 2475 * link onlineness and classification result later. 2476 */ 2477 if (postreset) { 2478 postreset(link, classes); 2479 if (slave) 2480 postreset(slave, classes); 2481 } 2482 2483 /* clear cached SError */ 2484 spin_lock_irqsave(link->ap->lock, flags); 2485 link->eh_info.serror = 0; 2486 if (slave) 2487 slave->eh_info.serror = 0; 2488 spin_unlock_irqrestore(link->ap->lock, flags); 2489 2490 /* Make sure onlineness and classification result correspond. 2491 * Hotplug could have happened during reset and some 2492 * controllers fail to wait while a drive is spinning up after 2493 * being hotplugged causing misdetection. By cross checking 2494 * link onlineness and classification result, those conditions 2495 * can be reliably detected and retried. 2496 */ 2497 nr_unknown = 0; 2498 ata_link_for_each_dev(dev, link) { 2499 /* convert all ATA_DEV_UNKNOWN to ATA_DEV_NONE */ 2500 if (classes[dev->devno] == ATA_DEV_UNKNOWN) { 2501 classes[dev->devno] = ATA_DEV_NONE; 2502 if (ata_phys_link_online(ata_dev_phys_link(dev))) 2503 nr_unknown++; 2504 } 2505 } 2506 2507 if (classify && nr_unknown) { 2508 if (try < max_tries) { 2509 ata_link_printk(link, KERN_WARNING, "link online but " 2510 "device misclassified, retrying\n"); 2511 failed_link = link; 2512 rc = -EAGAIN; 2513 goto fail; 2514 } 2515 ata_link_printk(link, KERN_WARNING, 2516 "link online but device misclassified, " 2517 "device detection might fail\n"); 2518 } 2519 2520 /* reset successful, schedule revalidation */ 2521 ata_eh_done(link, NULL, ATA_EH_RESET); 2522 if (slave) 2523 ata_eh_done(slave, NULL, ATA_EH_RESET); 2524 ehc->last_reset = jiffies; 2525 ehc->i.action |= ATA_EH_REVALIDATE; 2526 2527 rc = 0; 2528 out: 2529 /* clear hotplug flag */ 2530 ehc->i.flags &= ~ATA_EHI_HOTPLUGGED; 2531 if (slave) 2532 sehc->i.flags &= ~ATA_EHI_HOTPLUGGED; 2533 2534 spin_lock_irqsave(ap->lock, flags); 2535 ap->pflags &= ~ATA_PFLAG_RESETTING; 2536 spin_unlock_irqrestore(ap->lock, flags); 2537 2538 return rc; 2539 2540 fail: 2541 /* if SCR isn't accessible on a fan-out port, PMP needs to be reset */ 2542 if (!ata_is_host_link(link) && 2543 sata_scr_read(link, SCR_STATUS, &sstatus)) 2544 rc = -ERESTART; 2545 2546 if (rc == -ERESTART || try >= max_tries) 2547 goto out; 2548 2549 now = jiffies; 2550 if (time_before(now, deadline)) { 2551 unsigned long delta = deadline - now; 2552 2553 ata_link_printk(failed_link, KERN_WARNING, 2554 "reset failed (errno=%d), retrying in %u secs\n", 2555 rc, DIV_ROUND_UP(jiffies_to_msecs(delta), 1000)); 2556 2557 while (delta) 2558 delta = schedule_timeout_uninterruptible(delta); 2559 } 2560 2561 if (try == max_tries - 1) { 2562 sata_down_spd_limit(link); 2563 if (slave) 2564 sata_down_spd_limit(slave); 2565 } else if (rc == -EPIPE) 2566 sata_down_spd_limit(failed_link); 2567 2568 if (hardreset) 2569 reset = hardreset; 2570 goto retry; 2571 } 2572 2573 static inline void ata_eh_pull_park_action(struct ata_port *ap) 2574 { 2575 struct ata_link *link; 2576 struct ata_device *dev; 2577 unsigned long flags; 2578 2579 /* 2580 * This function can be thought of as an extended version of 2581 * ata_eh_about_to_do() specially crafted to accommodate the 2582 * requirements of ATA_EH_PARK handling. Since the EH thread 2583 * does not leave the do {} while () loop in ata_eh_recover as 2584 * long as the timeout for a park request to *one* device on 2585 * the port has not expired, and since we still want to pick 2586 * up park requests to other devices on the same port or 2587 * timeout updates for the same device, we have to pull 2588 * ATA_EH_PARK actions from eh_info into eh_context.i 2589 * ourselves at the beginning of each pass over the loop. 2590 * 2591 * Additionally, all write accesses to &ap->park_req_pending 2592 * through INIT_COMPLETION() (see below) or complete_all() 2593 * (see ata_scsi_park_store()) are protected by the host lock. 2594 * As a result we have that park_req_pending.done is zero on 2595 * exit from this function, i.e. when ATA_EH_PARK actions for 2596 * *all* devices on port ap have been pulled into the 2597 * respective eh_context structs. If, and only if, 2598 * park_req_pending.done is non-zero by the time we reach 2599 * wait_for_completion_timeout(), another ATA_EH_PARK action 2600 * has been scheduled for at least one of the devices on port 2601 * ap and we have to cycle over the do {} while () loop in 2602 * ata_eh_recover() again. 2603 */ 2604 2605 spin_lock_irqsave(ap->lock, flags); 2606 INIT_COMPLETION(ap->park_req_pending); 2607 ata_port_for_each_link(link, ap) { 2608 ata_link_for_each_dev(dev, link) { 2609 struct ata_eh_info *ehi = &link->eh_info; 2610 2611 link->eh_context.i.dev_action[dev->devno] |= 2612 ehi->dev_action[dev->devno] & ATA_EH_PARK; 2613 ata_eh_clear_action(link, dev, ehi, ATA_EH_PARK); 2614 } 2615 } 2616 spin_unlock_irqrestore(ap->lock, flags); 2617 } 2618 2619 static void ata_eh_park_issue_cmd(struct ata_device *dev, int park) 2620 { 2621 struct ata_eh_context *ehc = &dev->link->eh_context; 2622 struct ata_taskfile tf; 2623 unsigned int err_mask; 2624 2625 ata_tf_init(dev, &tf); 2626 if (park) { 2627 ehc->unloaded_mask |= 1 << dev->devno; 2628 tf.command = ATA_CMD_IDLEIMMEDIATE; 2629 tf.feature = 0x44; 2630 tf.lbal = 0x4c; 2631 tf.lbam = 0x4e; 2632 tf.lbah = 0x55; 2633 } else { 2634 ehc->unloaded_mask &= ~(1 << dev->devno); 2635 tf.command = ATA_CMD_CHK_POWER; 2636 } 2637 2638 tf.flags |= ATA_TFLAG_DEVICE | ATA_TFLAG_ISADDR; 2639 tf.protocol |= ATA_PROT_NODATA; 2640 err_mask = ata_exec_internal(dev, &tf, NULL, DMA_NONE, NULL, 0, 0); 2641 if (park && (err_mask || tf.lbal != 0xc4)) { 2642 ata_dev_printk(dev, KERN_ERR, "head unload failed!\n"); 2643 ehc->unloaded_mask &= ~(1 << dev->devno); 2644 } 2645 } 2646 2647 static int ata_eh_revalidate_and_attach(struct ata_link *link, 2648 struct ata_device **r_failed_dev) 2649 { 2650 struct ata_port *ap = link->ap; 2651 struct ata_eh_context *ehc = &link->eh_context; 2652 struct ata_device *dev; 2653 unsigned int new_mask = 0; 2654 unsigned long flags; 2655 int rc = 0; 2656 2657 DPRINTK("ENTER\n"); 2658 2659 /* For PATA drive side cable detection to work, IDENTIFY must 2660 * be done backwards such that PDIAG- is released by the slave 2661 * device before the master device is identified. 2662 */ 2663 ata_link_for_each_dev_reverse(dev, link) { 2664 unsigned int action = ata_eh_dev_action(dev); 2665 unsigned int readid_flags = 0; 2666 2667 if (ehc->i.flags & ATA_EHI_DID_RESET) 2668 readid_flags |= ATA_READID_POSTRESET; 2669 2670 if ((action & ATA_EH_REVALIDATE) && ata_dev_enabled(dev)) { 2671 WARN_ON(dev->class == ATA_DEV_PMP); 2672 2673 if (ata_phys_link_offline(ata_dev_phys_link(dev))) { 2674 rc = -EIO; 2675 goto err; 2676 } 2677 2678 ata_eh_about_to_do(link, dev, ATA_EH_REVALIDATE); 2679 rc = ata_dev_revalidate(dev, ehc->classes[dev->devno], 2680 readid_flags); 2681 if (rc) 2682 goto err; 2683 2684 ata_eh_done(link, dev, ATA_EH_REVALIDATE); 2685 2686 /* Configuration may have changed, reconfigure 2687 * transfer mode. 2688 */ 2689 ehc->i.flags |= ATA_EHI_SETMODE; 2690 2691 /* schedule the scsi_rescan_device() here */ 2692 queue_work(ata_aux_wq, &(ap->scsi_rescan_task)); 2693 } else if (dev->class == ATA_DEV_UNKNOWN && 2694 ehc->tries[dev->devno] && 2695 ata_class_enabled(ehc->classes[dev->devno])) { 2696 dev->class = ehc->classes[dev->devno]; 2697 2698 if (dev->class == ATA_DEV_PMP) 2699 rc = sata_pmp_attach(dev); 2700 else 2701 rc = ata_dev_read_id(dev, &dev->class, 2702 readid_flags, dev->id); 2703 switch (rc) { 2704 case 0: 2705 new_mask |= 1 << dev->devno; 2706 break; 2707 case -ENOENT: 2708 /* IDENTIFY was issued to non-existent 2709 * device. No need to reset. Just 2710 * thaw and kill the device. 2711 */ 2712 ata_eh_thaw_port(ap); 2713 dev->class = ATA_DEV_UNKNOWN; 2714 break; 2715 default: 2716 dev->class = ATA_DEV_UNKNOWN; 2717 goto err; 2718 } 2719 } 2720 } 2721 2722 /* PDIAG- should have been released, ask cable type if post-reset */ 2723 if ((ehc->i.flags & ATA_EHI_DID_RESET) && ata_is_host_link(link)) { 2724 if (ap->ops->cable_detect) 2725 ap->cbl = ap->ops->cable_detect(ap); 2726 ata_force_cbl(ap); 2727 } 2728 2729 /* Configure new devices forward such that user doesn't see 2730 * device detection messages backwards. 2731 */ 2732 ata_link_for_each_dev(dev, link) { 2733 if (!(new_mask & (1 << dev->devno)) || 2734 dev->class == ATA_DEV_PMP) 2735 continue; 2736 2737 ehc->i.flags |= ATA_EHI_PRINTINFO; 2738 rc = ata_dev_configure(dev); 2739 ehc->i.flags &= ~ATA_EHI_PRINTINFO; 2740 if (rc) 2741 goto err; 2742 2743 spin_lock_irqsave(ap->lock, flags); 2744 ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG; 2745 spin_unlock_irqrestore(ap->lock, flags); 2746 2747 /* new device discovered, configure xfermode */ 2748 ehc->i.flags |= ATA_EHI_SETMODE; 2749 } 2750 2751 return 0; 2752 2753 err: 2754 *r_failed_dev = dev; 2755 DPRINTK("EXIT rc=%d\n", rc); 2756 return rc; 2757 } 2758 2759 /** 2760 * ata_set_mode - Program timings and issue SET FEATURES - XFER 2761 * @link: link on which timings will be programmed 2762 * @r_failed_dev: out paramter for failed device 2763 * 2764 * Set ATA device disk transfer mode (PIO3, UDMA6, etc.). If 2765 * ata_set_mode() fails, pointer to the failing device is 2766 * returned in @r_failed_dev. 2767 * 2768 * LOCKING: 2769 * PCI/etc. bus probe sem. 2770 * 2771 * RETURNS: 2772 * 0 on success, negative errno otherwise 2773 */ 2774 int ata_set_mode(struct ata_link *link, struct ata_device **r_failed_dev) 2775 { 2776 struct ata_port *ap = link->ap; 2777 struct ata_device *dev; 2778 int rc; 2779 2780 /* if data transfer is verified, clear DUBIOUS_XFER on ering top */ 2781 ata_link_for_each_dev(dev, link) { 2782 if (!(dev->flags & ATA_DFLAG_DUBIOUS_XFER)) { 2783 struct ata_ering_entry *ent; 2784 2785 ent = ata_ering_top(&dev->ering); 2786 if (ent) 2787 ent->eflags &= ~ATA_EFLAG_DUBIOUS_XFER; 2788 } 2789 } 2790 2791 /* has private set_mode? */ 2792 if (ap->ops->set_mode) 2793 rc = ap->ops->set_mode(link, r_failed_dev); 2794 else 2795 rc = ata_do_set_mode(link, r_failed_dev); 2796 2797 /* if transfer mode has changed, set DUBIOUS_XFER on device */ 2798 ata_link_for_each_dev(dev, link) { 2799 struct ata_eh_context *ehc = &link->eh_context; 2800 u8 saved_xfer_mode = ehc->saved_xfer_mode[dev->devno]; 2801 u8 saved_ncq = !!(ehc->saved_ncq_enabled & (1 << dev->devno)); 2802 2803 if (dev->xfer_mode != saved_xfer_mode || 2804 ata_ncq_enabled(dev) != saved_ncq) 2805 dev->flags |= ATA_DFLAG_DUBIOUS_XFER; 2806 } 2807 2808 return rc; 2809 } 2810 2811 /** 2812 * atapi_eh_clear_ua - Clear ATAPI UNIT ATTENTION after reset 2813 * @dev: ATAPI device to clear UA for 2814 * 2815 * Resets and other operations can make an ATAPI device raise 2816 * UNIT ATTENTION which causes the next operation to fail. This 2817 * function clears UA. 2818 * 2819 * LOCKING: 2820 * EH context (may sleep). 2821 * 2822 * RETURNS: 2823 * 0 on success, -errno on failure. 2824 */ 2825 static int atapi_eh_clear_ua(struct ata_device *dev) 2826 { 2827 int i; 2828 2829 for (i = 0; i < ATA_EH_UA_TRIES; i++) { 2830 u8 sense_buffer[SCSI_SENSE_BUFFERSIZE]; 2831 u8 sense_key = 0; 2832 unsigned int err_mask; 2833 2834 err_mask = atapi_eh_tur(dev, &sense_key); 2835 if (err_mask != 0 && err_mask != AC_ERR_DEV) { 2836 ata_dev_printk(dev, KERN_WARNING, "TEST_UNIT_READY " 2837 "failed (err_mask=0x%x)\n", err_mask); 2838 return -EIO; 2839 } 2840 2841 if (!err_mask || sense_key != UNIT_ATTENTION) 2842 return 0; 2843 2844 err_mask = atapi_eh_request_sense(dev, sense_buffer, sense_key); 2845 if (err_mask) { 2846 ata_dev_printk(dev, KERN_WARNING, "failed to clear " 2847 "UNIT ATTENTION (err_mask=0x%x)\n", err_mask); 2848 return -EIO; 2849 } 2850 } 2851 2852 ata_dev_printk(dev, KERN_WARNING, 2853 "UNIT ATTENTION persists after %d tries\n", ATA_EH_UA_TRIES); 2854 2855 return 0; 2856 } 2857 2858 static int ata_link_nr_enabled(struct ata_link *link) 2859 { 2860 struct ata_device *dev; 2861 int cnt = 0; 2862 2863 ata_link_for_each_dev(dev, link) 2864 if (ata_dev_enabled(dev)) 2865 cnt++; 2866 return cnt; 2867 } 2868 2869 static int ata_link_nr_vacant(struct ata_link *link) 2870 { 2871 struct ata_device *dev; 2872 int cnt = 0; 2873 2874 ata_link_for_each_dev(dev, link) 2875 if (dev->class == ATA_DEV_UNKNOWN) 2876 cnt++; 2877 return cnt; 2878 } 2879 2880 static int ata_eh_skip_recovery(struct ata_link *link) 2881 { 2882 struct ata_port *ap = link->ap; 2883 struct ata_eh_context *ehc = &link->eh_context; 2884 struct ata_device *dev; 2885 2886 /* skip disabled links */ 2887 if (link->flags & ATA_LFLAG_DISABLED) 2888 return 1; 2889 2890 /* thaw frozen port and recover failed devices */ 2891 if ((ap->pflags & ATA_PFLAG_FROZEN) || ata_link_nr_enabled(link)) 2892 return 0; 2893 2894 /* reset at least once if reset is requested */ 2895 if ((ehc->i.action & ATA_EH_RESET) && 2896 !(ehc->i.flags & ATA_EHI_DID_RESET)) 2897 return 0; 2898 2899 /* skip if class codes for all vacant slots are ATA_DEV_NONE */ 2900 ata_link_for_each_dev(dev, link) { 2901 if (dev->class == ATA_DEV_UNKNOWN && 2902 ehc->classes[dev->devno] != ATA_DEV_NONE) 2903 return 0; 2904 } 2905 2906 return 1; 2907 } 2908 2909 static int ata_eh_schedule_probe(struct ata_device *dev) 2910 { 2911 struct ata_eh_context *ehc = &dev->link->eh_context; 2912 2913 if (!(ehc->i.probe_mask & (1 << dev->devno)) || 2914 (ehc->did_probe_mask & (1 << dev->devno))) 2915 return 0; 2916 2917 ata_eh_detach_dev(dev); 2918 ata_dev_init(dev); 2919 ehc->did_probe_mask |= (1 << dev->devno); 2920 ehc->i.action |= ATA_EH_RESET; 2921 ehc->saved_xfer_mode[dev->devno] = 0; 2922 ehc->saved_ncq_enabled &= ~(1 << dev->devno); 2923 2924 return 1; 2925 } 2926 2927 static int ata_eh_handle_dev_fail(struct ata_device *dev, int err) 2928 { 2929 struct ata_eh_context *ehc = &dev->link->eh_context; 2930 2931 ehc->tries[dev->devno]--; 2932 2933 switch (err) { 2934 case -ENODEV: 2935 /* device missing or wrong IDENTIFY data, schedule probing */ 2936 ehc->i.probe_mask |= (1 << dev->devno); 2937 case -EINVAL: 2938 /* give it just one more chance */ 2939 ehc->tries[dev->devno] = min(ehc->tries[dev->devno], 1); 2940 case -EIO: 2941 if (ehc->tries[dev->devno] == 1 && dev->pio_mode > XFER_PIO_0) { 2942 /* This is the last chance, better to slow 2943 * down than lose it. 2944 */ 2945 sata_down_spd_limit(ata_dev_phys_link(dev)); 2946 ata_down_xfermask_limit(dev, ATA_DNXFER_PIO); 2947 } 2948 } 2949 2950 if (ata_dev_enabled(dev) && !ehc->tries[dev->devno]) { 2951 /* disable device if it has used up all its chances */ 2952 ata_dev_disable(dev); 2953 2954 /* detach if offline */ 2955 if (ata_phys_link_offline(ata_dev_phys_link(dev))) 2956 ata_eh_detach_dev(dev); 2957 2958 /* schedule probe if necessary */ 2959 if (ata_eh_schedule_probe(dev)) { 2960 ehc->tries[dev->devno] = ATA_EH_DEV_TRIES; 2961 memset(ehc->cmd_timeout_idx[dev->devno], 0, 2962 sizeof(ehc->cmd_timeout_idx[dev->devno])); 2963 } 2964 2965 return 1; 2966 } else { 2967 ehc->i.action |= ATA_EH_RESET; 2968 return 0; 2969 } 2970 } 2971 2972 /** 2973 * ata_eh_recover - recover host port after error 2974 * @ap: host port to recover 2975 * @prereset: prereset method (can be NULL) 2976 * @softreset: softreset method (can be NULL) 2977 * @hardreset: hardreset method (can be NULL) 2978 * @postreset: postreset method (can be NULL) 2979 * @r_failed_link: out parameter for failed link 2980 * 2981 * This is the alpha and omega, eum and yang, heart and soul of 2982 * libata exception handling. On entry, actions required to 2983 * recover each link and hotplug requests are recorded in the 2984 * link's eh_context. This function executes all the operations 2985 * with appropriate retrials and fallbacks to resurrect failed 2986 * devices, detach goners and greet newcomers. 2987 * 2988 * LOCKING: 2989 * Kernel thread context (may sleep). 2990 * 2991 * RETURNS: 2992 * 0 on success, -errno on failure. 2993 */ 2994 int ata_eh_recover(struct ata_port *ap, ata_prereset_fn_t prereset, 2995 ata_reset_fn_t softreset, ata_reset_fn_t hardreset, 2996 ata_postreset_fn_t postreset, 2997 struct ata_link **r_failed_link) 2998 { 2999 struct ata_link *link; 3000 struct ata_device *dev; 3001 int nr_failed_devs; 3002 int rc; 3003 unsigned long flags, deadline; 3004 3005 DPRINTK("ENTER\n"); 3006 3007 /* prep for recovery */ 3008 ata_port_for_each_link(link, ap) { 3009 struct ata_eh_context *ehc = &link->eh_context; 3010 3011 /* re-enable link? */ 3012 if (ehc->i.action & ATA_EH_ENABLE_LINK) { 3013 ata_eh_about_to_do(link, NULL, ATA_EH_ENABLE_LINK); 3014 spin_lock_irqsave(ap->lock, flags); 3015 link->flags &= ~ATA_LFLAG_DISABLED; 3016 spin_unlock_irqrestore(ap->lock, flags); 3017 ata_eh_done(link, NULL, ATA_EH_ENABLE_LINK); 3018 } 3019 3020 ata_link_for_each_dev(dev, link) { 3021 if (link->flags & ATA_LFLAG_NO_RETRY) 3022 ehc->tries[dev->devno] = 1; 3023 else 3024 ehc->tries[dev->devno] = ATA_EH_DEV_TRIES; 3025 3026 /* collect port action mask recorded in dev actions */ 3027 ehc->i.action |= ehc->i.dev_action[dev->devno] & 3028 ~ATA_EH_PERDEV_MASK; 3029 ehc->i.dev_action[dev->devno] &= ATA_EH_PERDEV_MASK; 3030 3031 /* process hotplug request */ 3032 if (dev->flags & ATA_DFLAG_DETACH) 3033 ata_eh_detach_dev(dev); 3034 3035 /* schedule probe if necessary */ 3036 if (!ata_dev_enabled(dev)) 3037 ata_eh_schedule_probe(dev); 3038 } 3039 } 3040 3041 retry: 3042 rc = 0; 3043 nr_failed_devs = 0; 3044 3045 /* if UNLOADING, finish immediately */ 3046 if (ap->pflags & ATA_PFLAG_UNLOADING) 3047 goto out; 3048 3049 /* prep for EH */ 3050 ata_port_for_each_link(link, ap) { 3051 struct ata_eh_context *ehc = &link->eh_context; 3052 3053 /* skip EH if possible. */ 3054 if (ata_eh_skip_recovery(link)) 3055 ehc->i.action = 0; 3056 3057 ata_link_for_each_dev(dev, link) 3058 ehc->classes[dev->devno] = ATA_DEV_UNKNOWN; 3059 } 3060 3061 /* reset */ 3062 ata_port_for_each_link(link, ap) { 3063 struct ata_eh_context *ehc = &link->eh_context; 3064 3065 if (!(ehc->i.action & ATA_EH_RESET)) 3066 continue; 3067 3068 rc = ata_eh_reset(link, ata_link_nr_vacant(link), 3069 prereset, softreset, hardreset, postreset); 3070 if (rc) { 3071 ata_link_printk(link, KERN_ERR, 3072 "reset failed, giving up\n"); 3073 goto out; 3074 } 3075 } 3076 3077 do { 3078 unsigned long now; 3079 3080 /* 3081 * clears ATA_EH_PARK in eh_info and resets 3082 * ap->park_req_pending 3083 */ 3084 ata_eh_pull_park_action(ap); 3085 3086 deadline = jiffies; 3087 ata_port_for_each_link(link, ap) { 3088 ata_link_for_each_dev(dev, link) { 3089 struct ata_eh_context *ehc = &link->eh_context; 3090 unsigned long tmp; 3091 3092 if (dev->class != ATA_DEV_ATA) 3093 continue; 3094 if (!(ehc->i.dev_action[dev->devno] & 3095 ATA_EH_PARK)) 3096 continue; 3097 tmp = dev->unpark_deadline; 3098 if (time_before(deadline, tmp)) 3099 deadline = tmp; 3100 else if (time_before_eq(tmp, jiffies)) 3101 continue; 3102 if (ehc->unloaded_mask & (1 << dev->devno)) 3103 continue; 3104 3105 ata_eh_park_issue_cmd(dev, 1); 3106 } 3107 } 3108 3109 now = jiffies; 3110 if (time_before_eq(deadline, now)) 3111 break; 3112 3113 deadline = wait_for_completion_timeout(&ap->park_req_pending, 3114 deadline - now); 3115 } while (deadline); 3116 ata_port_for_each_link(link, ap) { 3117 ata_link_for_each_dev(dev, link) { 3118 if (!(link->eh_context.unloaded_mask & 3119 (1 << dev->devno))) 3120 continue; 3121 3122 ata_eh_park_issue_cmd(dev, 0); 3123 ata_eh_done(link, dev, ATA_EH_PARK); 3124 } 3125 } 3126 3127 /* the rest */ 3128 ata_port_for_each_link(link, ap) { 3129 struct ata_eh_context *ehc = &link->eh_context; 3130 3131 /* revalidate existing devices and attach new ones */ 3132 rc = ata_eh_revalidate_and_attach(link, &dev); 3133 if (rc) 3134 goto dev_fail; 3135 3136 /* if PMP got attached, return, pmp EH will take care of it */ 3137 if (link->device->class == ATA_DEV_PMP) { 3138 ehc->i.action = 0; 3139 return 0; 3140 } 3141 3142 /* configure transfer mode if necessary */ 3143 if (ehc->i.flags & ATA_EHI_SETMODE) { 3144 rc = ata_set_mode(link, &dev); 3145 if (rc) 3146 goto dev_fail; 3147 ehc->i.flags &= ~ATA_EHI_SETMODE; 3148 } 3149 3150 /* If reset has been issued, clear UA to avoid 3151 * disrupting the current users of the device. 3152 */ 3153 if (ehc->i.flags & ATA_EHI_DID_RESET) { 3154 ata_link_for_each_dev(dev, link) { 3155 if (dev->class != ATA_DEV_ATAPI) 3156 continue; 3157 rc = atapi_eh_clear_ua(dev); 3158 if (rc) 3159 goto dev_fail; 3160 } 3161 } 3162 3163 /* configure link power saving */ 3164 if (ehc->i.action & ATA_EH_LPM) 3165 ata_link_for_each_dev(dev, link) 3166 ata_dev_enable_pm(dev, ap->pm_policy); 3167 3168 /* this link is okay now */ 3169 ehc->i.flags = 0; 3170 continue; 3171 3172 dev_fail: 3173 nr_failed_devs++; 3174 ata_eh_handle_dev_fail(dev, rc); 3175 3176 if (ap->pflags & ATA_PFLAG_FROZEN) { 3177 /* PMP reset requires working host port. 3178 * Can't retry if it's frozen. 3179 */ 3180 if (sata_pmp_attached(ap)) 3181 goto out; 3182 break; 3183 } 3184 } 3185 3186 if (nr_failed_devs) 3187 goto retry; 3188 3189 out: 3190 if (rc && r_failed_link) 3191 *r_failed_link = link; 3192 3193 DPRINTK("EXIT, rc=%d\n", rc); 3194 return rc; 3195 } 3196 3197 /** 3198 * ata_eh_finish - finish up EH 3199 * @ap: host port to finish EH for 3200 * 3201 * Recovery is complete. Clean up EH states and retry or finish 3202 * failed qcs. 3203 * 3204 * LOCKING: 3205 * None. 3206 */ 3207 void ata_eh_finish(struct ata_port *ap) 3208 { 3209 int tag; 3210 3211 /* retry or finish qcs */ 3212 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 3213 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 3214 3215 if (!(qc->flags & ATA_QCFLAG_FAILED)) 3216 continue; 3217 3218 if (qc->err_mask) { 3219 /* FIXME: Once EH migration is complete, 3220 * generate sense data in this function, 3221 * considering both err_mask and tf. 3222 */ 3223 if (qc->flags & ATA_QCFLAG_RETRY) 3224 ata_eh_qc_retry(qc); 3225 else 3226 ata_eh_qc_complete(qc); 3227 } else { 3228 if (qc->flags & ATA_QCFLAG_SENSE_VALID) { 3229 ata_eh_qc_complete(qc); 3230 } else { 3231 /* feed zero TF to sense generation */ 3232 memset(&qc->result_tf, 0, sizeof(qc->result_tf)); 3233 ata_eh_qc_retry(qc); 3234 } 3235 } 3236 } 3237 3238 /* make sure nr_active_links is zero after EH */ 3239 WARN_ON(ap->nr_active_links); 3240 ap->nr_active_links = 0; 3241 } 3242 3243 /** 3244 * ata_do_eh - do standard error handling 3245 * @ap: host port to handle error for 3246 * 3247 * @prereset: prereset method (can be NULL) 3248 * @softreset: softreset method (can be NULL) 3249 * @hardreset: hardreset method (can be NULL) 3250 * @postreset: postreset method (can be NULL) 3251 * 3252 * Perform standard error handling sequence. 3253 * 3254 * LOCKING: 3255 * Kernel thread context (may sleep). 3256 */ 3257 void ata_do_eh(struct ata_port *ap, ata_prereset_fn_t prereset, 3258 ata_reset_fn_t softreset, ata_reset_fn_t hardreset, 3259 ata_postreset_fn_t postreset) 3260 { 3261 struct ata_device *dev; 3262 int rc; 3263 3264 ata_eh_autopsy(ap); 3265 ata_eh_report(ap); 3266 3267 rc = ata_eh_recover(ap, prereset, softreset, hardreset, postreset, 3268 NULL); 3269 if (rc) { 3270 ata_link_for_each_dev(dev, &ap->link) 3271 ata_dev_disable(dev); 3272 } 3273 3274 ata_eh_finish(ap); 3275 } 3276 3277 /** 3278 * ata_std_error_handler - standard error handler 3279 * @ap: host port to handle error for 3280 * 3281 * Standard error handler 3282 * 3283 * LOCKING: 3284 * Kernel thread context (may sleep). 3285 */ 3286 void ata_std_error_handler(struct ata_port *ap) 3287 { 3288 struct ata_port_operations *ops = ap->ops; 3289 ata_reset_fn_t hardreset = ops->hardreset; 3290 3291 /* ignore built-in hardreset if SCR access is not available */ 3292 if (ata_is_builtin_hardreset(hardreset) && !sata_scr_valid(&ap->link)) 3293 hardreset = NULL; 3294 3295 ata_do_eh(ap, ops->prereset, ops->softreset, hardreset, ops->postreset); 3296 } 3297 3298 #ifdef CONFIG_PM 3299 /** 3300 * ata_eh_handle_port_suspend - perform port suspend operation 3301 * @ap: port to suspend 3302 * 3303 * Suspend @ap. 3304 * 3305 * LOCKING: 3306 * Kernel thread context (may sleep). 3307 */ 3308 static void ata_eh_handle_port_suspend(struct ata_port *ap) 3309 { 3310 unsigned long flags; 3311 int rc = 0; 3312 3313 /* are we suspending? */ 3314 spin_lock_irqsave(ap->lock, flags); 3315 if (!(ap->pflags & ATA_PFLAG_PM_PENDING) || 3316 ap->pm_mesg.event == PM_EVENT_ON) { 3317 spin_unlock_irqrestore(ap->lock, flags); 3318 return; 3319 } 3320 spin_unlock_irqrestore(ap->lock, flags); 3321 3322 WARN_ON(ap->pflags & ATA_PFLAG_SUSPENDED); 3323 3324 /* tell ACPI we're suspending */ 3325 rc = ata_acpi_on_suspend(ap); 3326 if (rc) 3327 goto out; 3328 3329 /* suspend */ 3330 ata_eh_freeze_port(ap); 3331 3332 if (ap->ops->port_suspend) 3333 rc = ap->ops->port_suspend(ap, ap->pm_mesg); 3334 3335 ata_acpi_set_state(ap, PMSG_SUSPEND); 3336 out: 3337 /* report result */ 3338 spin_lock_irqsave(ap->lock, flags); 3339 3340 ap->pflags &= ~ATA_PFLAG_PM_PENDING; 3341 if (rc == 0) 3342 ap->pflags |= ATA_PFLAG_SUSPENDED; 3343 else if (ap->pflags & ATA_PFLAG_FROZEN) 3344 ata_port_schedule_eh(ap); 3345 3346 if (ap->pm_result) { 3347 *ap->pm_result = rc; 3348 ap->pm_result = NULL; 3349 } 3350 3351 spin_unlock_irqrestore(ap->lock, flags); 3352 3353 return; 3354 } 3355 3356 /** 3357 * ata_eh_handle_port_resume - perform port resume operation 3358 * @ap: port to resume 3359 * 3360 * Resume @ap. 3361 * 3362 * LOCKING: 3363 * Kernel thread context (may sleep). 3364 */ 3365 static void ata_eh_handle_port_resume(struct ata_port *ap) 3366 { 3367 unsigned long flags; 3368 int rc = 0; 3369 3370 /* are we resuming? */ 3371 spin_lock_irqsave(ap->lock, flags); 3372 if (!(ap->pflags & ATA_PFLAG_PM_PENDING) || 3373 ap->pm_mesg.event != PM_EVENT_ON) { 3374 spin_unlock_irqrestore(ap->lock, flags); 3375 return; 3376 } 3377 spin_unlock_irqrestore(ap->lock, flags); 3378 3379 WARN_ON(!(ap->pflags & ATA_PFLAG_SUSPENDED)); 3380 3381 ata_acpi_set_state(ap, PMSG_ON); 3382 3383 if (ap->ops->port_resume) 3384 rc = ap->ops->port_resume(ap); 3385 3386 /* tell ACPI that we're resuming */ 3387 ata_acpi_on_resume(ap); 3388 3389 /* report result */ 3390 spin_lock_irqsave(ap->lock, flags); 3391 ap->pflags &= ~(ATA_PFLAG_PM_PENDING | ATA_PFLAG_SUSPENDED); 3392 if (ap->pm_result) { 3393 *ap->pm_result = rc; 3394 ap->pm_result = NULL; 3395 } 3396 spin_unlock_irqrestore(ap->lock, flags); 3397 } 3398 #endif /* CONFIG_PM */ 3399