1 /* 2 * libata-eh.c - libata error handling 3 * 4 * Maintained by: Jeff Garzik <jgarzik@pobox.com> 5 * Please ALWAYS copy linux-ide@vger.kernel.org 6 * on emails. 7 * 8 * Copyright 2006 Tejun Heo <htejun@gmail.com> 9 * 10 * 11 * This program is free software; you can redistribute it and/or 12 * modify it under the terms of the GNU General Public License as 13 * published by the Free Software Foundation; either version 2, or 14 * (at your option) any later version. 15 * 16 * This program is distributed in the hope that it will be useful, 17 * but WITHOUT ANY WARRANTY; without even the implied warranty of 18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 19 * General Public License for more details. 20 * 21 * You should have received a copy of the GNU General Public License 22 * along with this program; see the file COPYING. If not, write to 23 * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, 24 * USA. 25 * 26 * 27 * libata documentation is available via 'make {ps|pdf}docs', 28 * as Documentation/DocBook/libata.* 29 * 30 * Hardware documentation available from http://www.t13.org/ and 31 * http://www.sata-io.org/ 32 * 33 */ 34 35 #include <linux/kernel.h> 36 #include <linux/blkdev.h> 37 #include <linux/pci.h> 38 #include <scsi/scsi.h> 39 #include <scsi/scsi_host.h> 40 #include <scsi/scsi_eh.h> 41 #include <scsi/scsi_device.h> 42 #include <scsi/scsi_cmnd.h> 43 #include <scsi/scsi_dbg.h> 44 #include "../scsi/scsi_transport_api.h" 45 46 #include <linux/libata.h> 47 48 #include "libata.h" 49 50 enum { 51 /* speed down verdicts */ 52 ATA_EH_SPDN_NCQ_OFF = (1 << 0), 53 ATA_EH_SPDN_SPEED_DOWN = (1 << 1), 54 ATA_EH_SPDN_FALLBACK_TO_PIO = (1 << 2), 55 ATA_EH_SPDN_KEEP_ERRORS = (1 << 3), 56 57 /* error flags */ 58 ATA_EFLAG_IS_IO = (1 << 0), 59 ATA_EFLAG_DUBIOUS_XFER = (1 << 1), 60 ATA_EFLAG_OLD_ER = (1 << 31), 61 62 /* error categories */ 63 ATA_ECAT_NONE = 0, 64 ATA_ECAT_ATA_BUS = 1, 65 ATA_ECAT_TOUT_HSM = 2, 66 ATA_ECAT_UNK_DEV = 3, 67 ATA_ECAT_DUBIOUS_NONE = 4, 68 ATA_ECAT_DUBIOUS_ATA_BUS = 5, 69 ATA_ECAT_DUBIOUS_TOUT_HSM = 6, 70 ATA_ECAT_DUBIOUS_UNK_DEV = 7, 71 ATA_ECAT_NR = 8, 72 73 ATA_EH_CMD_DFL_TIMEOUT = 5000, 74 75 /* always put at least this amount of time between resets */ 76 ATA_EH_RESET_COOL_DOWN = 5000, 77 78 /* Waiting in ->prereset can never be reliable. It's 79 * sometimes nice to wait there but it can't be depended upon; 80 * otherwise, we wouldn't be resetting. Just give it enough 81 * time for most drives to spin up. 82 */ 83 ATA_EH_PRERESET_TIMEOUT = 10000, 84 ATA_EH_FASTDRAIN_INTERVAL = 3000, 85 86 ATA_EH_UA_TRIES = 5, 87 88 /* probe speed down parameters, see ata_eh_schedule_probe() */ 89 ATA_EH_PROBE_TRIAL_INTERVAL = 60000, /* 1 min */ 90 ATA_EH_PROBE_TRIALS = 2, 91 }; 92 93 /* The following table determines how we sequence resets. Each entry 94 * represents timeout for that try. The first try can be soft or 95 * hardreset. All others are hardreset if available. In most cases 96 * the first reset w/ 10sec timeout should succeed. Following entries 97 * are mostly for error handling, hotplug and retarded devices. 98 */ 99 static const unsigned long ata_eh_reset_timeouts[] = { 100 10000, /* most drives spin up by 10sec */ 101 10000, /* > 99% working drives spin up before 20sec */ 102 35000, /* give > 30 secs of idleness for retarded devices */ 103 5000, /* and sweet one last chance */ 104 ULONG_MAX, /* > 1 min has elapsed, give up */ 105 }; 106 107 static const unsigned long ata_eh_identify_timeouts[] = { 108 5000, /* covers > 99% of successes and not too boring on failures */ 109 10000, /* combined time till here is enough even for media access */ 110 30000, /* for true idiots */ 111 ULONG_MAX, 112 }; 113 114 static const unsigned long ata_eh_flush_timeouts[] = { 115 15000, /* be generous with flush */ 116 15000, /* ditto */ 117 30000, /* and even more generous */ 118 ULONG_MAX, 119 }; 120 121 static const unsigned long ata_eh_other_timeouts[] = { 122 5000, /* same rationale as identify timeout */ 123 10000, /* ditto */ 124 /* but no merciful 30sec for other commands, it just isn't worth it */ 125 ULONG_MAX, 126 }; 127 128 struct ata_eh_cmd_timeout_ent { 129 const u8 *commands; 130 const unsigned long *timeouts; 131 }; 132 133 /* The following table determines timeouts to use for EH internal 134 * commands. Each table entry is a command class and matches the 135 * commands the entry applies to and the timeout table to use. 136 * 137 * On the retry after a command timed out, the next timeout value from 138 * the table is used. If the table doesn't contain further entries, 139 * the last value is used. 140 * 141 * ehc->cmd_timeout_idx keeps track of which timeout to use per 142 * command class, so if SET_FEATURES times out on the first try, the 143 * next try will use the second timeout value only for that class. 144 */ 145 #define CMDS(cmds...) (const u8 []){ cmds, 0 } 146 static const struct ata_eh_cmd_timeout_ent 147 ata_eh_cmd_timeout_table[ATA_EH_CMD_TIMEOUT_TABLE_SIZE] = { 148 { .commands = CMDS(ATA_CMD_ID_ATA, ATA_CMD_ID_ATAPI), 149 .timeouts = ata_eh_identify_timeouts, }, 150 { .commands = CMDS(ATA_CMD_READ_NATIVE_MAX, ATA_CMD_READ_NATIVE_MAX_EXT), 151 .timeouts = ata_eh_other_timeouts, }, 152 { .commands = CMDS(ATA_CMD_SET_MAX, ATA_CMD_SET_MAX_EXT), 153 .timeouts = ata_eh_other_timeouts, }, 154 { .commands = CMDS(ATA_CMD_SET_FEATURES), 155 .timeouts = ata_eh_other_timeouts, }, 156 { .commands = CMDS(ATA_CMD_INIT_DEV_PARAMS), 157 .timeouts = ata_eh_other_timeouts, }, 158 { .commands = CMDS(ATA_CMD_FLUSH, ATA_CMD_FLUSH_EXT), 159 .timeouts = ata_eh_flush_timeouts }, 160 }; 161 #undef CMDS 162 163 static void __ata_port_freeze(struct ata_port *ap); 164 #ifdef CONFIG_PM 165 static void ata_eh_handle_port_suspend(struct ata_port *ap); 166 static void ata_eh_handle_port_resume(struct ata_port *ap); 167 #else /* CONFIG_PM */ 168 static void ata_eh_handle_port_suspend(struct ata_port *ap) 169 { } 170 171 static void ata_eh_handle_port_resume(struct ata_port *ap) 172 { } 173 #endif /* CONFIG_PM */ 174 175 static void __ata_ehi_pushv_desc(struct ata_eh_info *ehi, const char *fmt, 176 va_list args) 177 { 178 ehi->desc_len += vscnprintf(ehi->desc + ehi->desc_len, 179 ATA_EH_DESC_LEN - ehi->desc_len, 180 fmt, args); 181 } 182 183 /** 184 * __ata_ehi_push_desc - push error description without adding separator 185 * @ehi: target EHI 186 * @fmt: printf format string 187 * 188 * Format string according to @fmt and append it to @ehi->desc. 189 * 190 * LOCKING: 191 * spin_lock_irqsave(host lock) 192 */ 193 void __ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...) 194 { 195 va_list args; 196 197 va_start(args, fmt); 198 __ata_ehi_pushv_desc(ehi, fmt, args); 199 va_end(args); 200 } 201 202 /** 203 * ata_ehi_push_desc - push error description with separator 204 * @ehi: target EHI 205 * @fmt: printf format string 206 * 207 * Format string according to @fmt and append it to @ehi->desc. 208 * If @ehi->desc is not empty, ", " is added in-between. 209 * 210 * LOCKING: 211 * spin_lock_irqsave(host lock) 212 */ 213 void ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...) 214 { 215 va_list args; 216 217 if (ehi->desc_len) 218 __ata_ehi_push_desc(ehi, ", "); 219 220 va_start(args, fmt); 221 __ata_ehi_pushv_desc(ehi, fmt, args); 222 va_end(args); 223 } 224 225 /** 226 * ata_ehi_clear_desc - clean error description 227 * @ehi: target EHI 228 * 229 * Clear @ehi->desc. 230 * 231 * LOCKING: 232 * spin_lock_irqsave(host lock) 233 */ 234 void ata_ehi_clear_desc(struct ata_eh_info *ehi) 235 { 236 ehi->desc[0] = '\0'; 237 ehi->desc_len = 0; 238 } 239 240 /** 241 * ata_port_desc - append port description 242 * @ap: target ATA port 243 * @fmt: printf format string 244 * 245 * Format string according to @fmt and append it to port 246 * description. If port description is not empty, " " is added 247 * in-between. This function is to be used while initializing 248 * ata_host. The description is printed on host registration. 249 * 250 * LOCKING: 251 * None. 252 */ 253 void ata_port_desc(struct ata_port *ap, const char *fmt, ...) 254 { 255 va_list args; 256 257 WARN_ON(!(ap->pflags & ATA_PFLAG_INITIALIZING)); 258 259 if (ap->link.eh_info.desc_len) 260 __ata_ehi_push_desc(&ap->link.eh_info, " "); 261 262 va_start(args, fmt); 263 __ata_ehi_pushv_desc(&ap->link.eh_info, fmt, args); 264 va_end(args); 265 } 266 267 #ifdef CONFIG_PCI 268 269 /** 270 * ata_port_pbar_desc - append PCI BAR description 271 * @ap: target ATA port 272 * @bar: target PCI BAR 273 * @offset: offset into PCI BAR 274 * @name: name of the area 275 * 276 * If @offset is negative, this function formats a string which 277 * contains the name, address, size and type of the BAR and 278 * appends it to the port description. If @offset is zero or 279 * positive, only name and offsetted address is appended. 280 * 281 * LOCKING: 282 * None. 283 */ 284 void ata_port_pbar_desc(struct ata_port *ap, int bar, ssize_t offset, 285 const char *name) 286 { 287 struct pci_dev *pdev = to_pci_dev(ap->host->dev); 288 char *type = ""; 289 unsigned long long start, len; 290 291 if (pci_resource_flags(pdev, bar) & IORESOURCE_MEM) 292 type = "m"; 293 else if (pci_resource_flags(pdev, bar) & IORESOURCE_IO) 294 type = "i"; 295 296 start = (unsigned long long)pci_resource_start(pdev, bar); 297 len = (unsigned long long)pci_resource_len(pdev, bar); 298 299 if (offset < 0) 300 ata_port_desc(ap, "%s %s%llu@0x%llx", name, type, len, start); 301 else 302 ata_port_desc(ap, "%s 0x%llx", name, 303 start + (unsigned long long)offset); 304 } 305 306 #endif /* CONFIG_PCI */ 307 308 static int ata_lookup_timeout_table(u8 cmd) 309 { 310 int i; 311 312 for (i = 0; i < ATA_EH_CMD_TIMEOUT_TABLE_SIZE; i++) { 313 const u8 *cur; 314 315 for (cur = ata_eh_cmd_timeout_table[i].commands; *cur; cur++) 316 if (*cur == cmd) 317 return i; 318 } 319 320 return -1; 321 } 322 323 /** 324 * ata_internal_cmd_timeout - determine timeout for an internal command 325 * @dev: target device 326 * @cmd: internal command to be issued 327 * 328 * Determine timeout for internal command @cmd for @dev. 329 * 330 * LOCKING: 331 * EH context. 332 * 333 * RETURNS: 334 * Determined timeout. 335 */ 336 unsigned long ata_internal_cmd_timeout(struct ata_device *dev, u8 cmd) 337 { 338 struct ata_eh_context *ehc = &dev->link->eh_context; 339 int ent = ata_lookup_timeout_table(cmd); 340 int idx; 341 342 if (ent < 0) 343 return ATA_EH_CMD_DFL_TIMEOUT; 344 345 idx = ehc->cmd_timeout_idx[dev->devno][ent]; 346 return ata_eh_cmd_timeout_table[ent].timeouts[idx]; 347 } 348 349 /** 350 * ata_internal_cmd_timed_out - notification for internal command timeout 351 * @dev: target device 352 * @cmd: internal command which timed out 353 * 354 * Notify EH that internal command @cmd for @dev timed out. This 355 * function should be called only for commands whose timeouts are 356 * determined using ata_internal_cmd_timeout(). 357 * 358 * LOCKING: 359 * EH context. 360 */ 361 void ata_internal_cmd_timed_out(struct ata_device *dev, u8 cmd) 362 { 363 struct ata_eh_context *ehc = &dev->link->eh_context; 364 int ent = ata_lookup_timeout_table(cmd); 365 int idx; 366 367 if (ent < 0) 368 return; 369 370 idx = ehc->cmd_timeout_idx[dev->devno][ent]; 371 if (ata_eh_cmd_timeout_table[ent].timeouts[idx + 1] != ULONG_MAX) 372 ehc->cmd_timeout_idx[dev->devno][ent]++; 373 } 374 375 static void ata_ering_record(struct ata_ering *ering, unsigned int eflags, 376 unsigned int err_mask) 377 { 378 struct ata_ering_entry *ent; 379 380 WARN_ON(!err_mask); 381 382 ering->cursor++; 383 ering->cursor %= ATA_ERING_SIZE; 384 385 ent = &ering->ring[ering->cursor]; 386 ent->eflags = eflags; 387 ent->err_mask = err_mask; 388 ent->timestamp = get_jiffies_64(); 389 } 390 391 static struct ata_ering_entry *ata_ering_top(struct ata_ering *ering) 392 { 393 struct ata_ering_entry *ent = &ering->ring[ering->cursor]; 394 395 if (ent->err_mask) 396 return ent; 397 return NULL; 398 } 399 400 int ata_ering_map(struct ata_ering *ering, 401 int (*map_fn)(struct ata_ering_entry *, void *), 402 void *arg) 403 { 404 int idx, rc = 0; 405 struct ata_ering_entry *ent; 406 407 idx = ering->cursor; 408 do { 409 ent = &ering->ring[idx]; 410 if (!ent->err_mask) 411 break; 412 rc = map_fn(ent, arg); 413 if (rc) 414 break; 415 idx = (idx - 1 + ATA_ERING_SIZE) % ATA_ERING_SIZE; 416 } while (idx != ering->cursor); 417 418 return rc; 419 } 420 421 int ata_ering_clear_cb(struct ata_ering_entry *ent, void *void_arg) 422 { 423 ent->eflags |= ATA_EFLAG_OLD_ER; 424 return 0; 425 } 426 427 static void ata_ering_clear(struct ata_ering *ering) 428 { 429 ata_ering_map(ering, ata_ering_clear_cb, NULL); 430 } 431 432 static unsigned int ata_eh_dev_action(struct ata_device *dev) 433 { 434 struct ata_eh_context *ehc = &dev->link->eh_context; 435 436 return ehc->i.action | ehc->i.dev_action[dev->devno]; 437 } 438 439 static void ata_eh_clear_action(struct ata_link *link, struct ata_device *dev, 440 struct ata_eh_info *ehi, unsigned int action) 441 { 442 struct ata_device *tdev; 443 444 if (!dev) { 445 ehi->action &= ~action; 446 ata_for_each_dev(tdev, link, ALL) 447 ehi->dev_action[tdev->devno] &= ~action; 448 } else { 449 /* doesn't make sense for port-wide EH actions */ 450 WARN_ON(!(action & ATA_EH_PERDEV_MASK)); 451 452 /* break ehi->action into ehi->dev_action */ 453 if (ehi->action & action) { 454 ata_for_each_dev(tdev, link, ALL) 455 ehi->dev_action[tdev->devno] |= 456 ehi->action & action; 457 ehi->action &= ~action; 458 } 459 460 /* turn off the specified per-dev action */ 461 ehi->dev_action[dev->devno] &= ~action; 462 } 463 } 464 465 /** 466 * ata_eh_acquire - acquire EH ownership 467 * @ap: ATA port to acquire EH ownership for 468 * 469 * Acquire EH ownership for @ap. This is the basic exclusion 470 * mechanism for ports sharing a host. Only one port hanging off 471 * the same host can claim the ownership of EH. 472 * 473 * LOCKING: 474 * EH context. 475 */ 476 void ata_eh_acquire(struct ata_port *ap) 477 { 478 mutex_lock(&ap->host->eh_mutex); 479 WARN_ON_ONCE(ap->host->eh_owner); 480 ap->host->eh_owner = current; 481 } 482 483 /** 484 * ata_eh_release - release EH ownership 485 * @ap: ATA port to release EH ownership for 486 * 487 * Release EH ownership for @ap if the caller. The caller must 488 * have acquired EH ownership using ata_eh_acquire() previously. 489 * 490 * LOCKING: 491 * EH context. 492 */ 493 void ata_eh_release(struct ata_port *ap) 494 { 495 WARN_ON_ONCE(ap->host->eh_owner != current); 496 ap->host->eh_owner = NULL; 497 mutex_unlock(&ap->host->eh_mutex); 498 } 499 500 /** 501 * ata_scsi_timed_out - SCSI layer time out callback 502 * @cmd: timed out SCSI command 503 * 504 * Handles SCSI layer timeout. We race with normal completion of 505 * the qc for @cmd. If the qc is already gone, we lose and let 506 * the scsi command finish (EH_HANDLED). Otherwise, the qc has 507 * timed out and EH should be invoked. Prevent ata_qc_complete() 508 * from finishing it by setting EH_SCHEDULED and return 509 * EH_NOT_HANDLED. 510 * 511 * TODO: kill this function once old EH is gone. 512 * 513 * LOCKING: 514 * Called from timer context 515 * 516 * RETURNS: 517 * EH_HANDLED or EH_NOT_HANDLED 518 */ 519 enum blk_eh_timer_return ata_scsi_timed_out(struct scsi_cmnd *cmd) 520 { 521 struct Scsi_Host *host = cmd->device->host; 522 struct ata_port *ap = ata_shost_to_port(host); 523 unsigned long flags; 524 struct ata_queued_cmd *qc; 525 enum blk_eh_timer_return ret; 526 527 DPRINTK("ENTER\n"); 528 529 if (ap->ops->error_handler) { 530 ret = BLK_EH_NOT_HANDLED; 531 goto out; 532 } 533 534 ret = BLK_EH_HANDLED; 535 spin_lock_irqsave(ap->lock, flags); 536 qc = ata_qc_from_tag(ap, ap->link.active_tag); 537 if (qc) { 538 WARN_ON(qc->scsicmd != cmd); 539 qc->flags |= ATA_QCFLAG_EH_SCHEDULED; 540 qc->err_mask |= AC_ERR_TIMEOUT; 541 ret = BLK_EH_NOT_HANDLED; 542 } 543 spin_unlock_irqrestore(ap->lock, flags); 544 545 out: 546 DPRINTK("EXIT, ret=%d\n", ret); 547 return ret; 548 } 549 550 static void ata_eh_unload(struct ata_port *ap) 551 { 552 struct ata_link *link; 553 struct ata_device *dev; 554 unsigned long flags; 555 556 /* Restore SControl IPM and SPD for the next driver and 557 * disable attached devices. 558 */ 559 ata_for_each_link(link, ap, PMP_FIRST) { 560 sata_scr_write(link, SCR_CONTROL, link->saved_scontrol & 0xff0); 561 ata_for_each_dev(dev, link, ALL) 562 ata_dev_disable(dev); 563 } 564 565 /* freeze and set UNLOADED */ 566 spin_lock_irqsave(ap->lock, flags); 567 568 ata_port_freeze(ap); /* won't be thawed */ 569 ap->pflags &= ~ATA_PFLAG_EH_PENDING; /* clear pending from freeze */ 570 ap->pflags |= ATA_PFLAG_UNLOADED; 571 572 spin_unlock_irqrestore(ap->lock, flags); 573 } 574 575 /** 576 * ata_scsi_error - SCSI layer error handler callback 577 * @host: SCSI host on which error occurred 578 * 579 * Handles SCSI-layer-thrown error events. 580 * 581 * LOCKING: 582 * Inherited from SCSI layer (none, can sleep) 583 * 584 * RETURNS: 585 * Zero. 586 */ 587 void ata_scsi_error(struct Scsi_Host *host) 588 { 589 struct ata_port *ap = ata_shost_to_port(host); 590 int i; 591 unsigned long flags; 592 593 DPRINTK("ENTER\n"); 594 595 /* make sure sff pio task is not running */ 596 ata_sff_flush_pio_task(ap); 597 598 /* synchronize with host lock and sort out timeouts */ 599 600 /* For new EH, all qcs are finished in one of three ways - 601 * normal completion, error completion, and SCSI timeout. 602 * Both completions can race against SCSI timeout. When normal 603 * completion wins, the qc never reaches EH. When error 604 * completion wins, the qc has ATA_QCFLAG_FAILED set. 605 * 606 * When SCSI timeout wins, things are a bit more complex. 607 * Normal or error completion can occur after the timeout but 608 * before this point. In such cases, both types of 609 * completions are honored. A scmd is determined to have 610 * timed out iff its associated qc is active and not failed. 611 */ 612 if (ap->ops->error_handler) { 613 struct scsi_cmnd *scmd, *tmp; 614 int nr_timedout = 0; 615 616 spin_lock_irqsave(ap->lock, flags); 617 618 /* This must occur under the ap->lock as we don't want 619 a polled recovery to race the real interrupt handler 620 621 The lost_interrupt handler checks for any completed but 622 non-notified command and completes much like an IRQ handler. 623 624 We then fall into the error recovery code which will treat 625 this as if normal completion won the race */ 626 627 if (ap->ops->lost_interrupt) 628 ap->ops->lost_interrupt(ap); 629 630 list_for_each_entry_safe(scmd, tmp, &host->eh_cmd_q, eh_entry) { 631 struct ata_queued_cmd *qc; 632 633 for (i = 0; i < ATA_MAX_QUEUE; i++) { 634 qc = __ata_qc_from_tag(ap, i); 635 if (qc->flags & ATA_QCFLAG_ACTIVE && 636 qc->scsicmd == scmd) 637 break; 638 } 639 640 if (i < ATA_MAX_QUEUE) { 641 /* the scmd has an associated qc */ 642 if (!(qc->flags & ATA_QCFLAG_FAILED)) { 643 /* which hasn't failed yet, timeout */ 644 qc->err_mask |= AC_ERR_TIMEOUT; 645 qc->flags |= ATA_QCFLAG_FAILED; 646 nr_timedout++; 647 } 648 } else { 649 /* Normal completion occurred after 650 * SCSI timeout but before this point. 651 * Successfully complete it. 652 */ 653 scmd->retries = scmd->allowed; 654 scsi_eh_finish_cmd(scmd, &ap->eh_done_q); 655 } 656 } 657 658 /* If we have timed out qcs. They belong to EH from 659 * this point but the state of the controller is 660 * unknown. Freeze the port to make sure the IRQ 661 * handler doesn't diddle with those qcs. This must 662 * be done atomically w.r.t. setting QCFLAG_FAILED. 663 */ 664 if (nr_timedout) 665 __ata_port_freeze(ap); 666 667 spin_unlock_irqrestore(ap->lock, flags); 668 669 /* initialize eh_tries */ 670 ap->eh_tries = ATA_EH_MAX_TRIES; 671 } else 672 spin_unlock_wait(ap->lock); 673 674 /* If we timed raced normal completion and there is nothing to 675 recover nr_timedout == 0 why exactly are we doing error recovery ? */ 676 677 /* invoke error handler */ 678 if (ap->ops->error_handler) { 679 struct ata_link *link; 680 681 /* acquire EH ownership */ 682 ata_eh_acquire(ap); 683 repeat: 684 /* kill fast drain timer */ 685 del_timer_sync(&ap->fastdrain_timer); 686 687 /* process port resume request */ 688 ata_eh_handle_port_resume(ap); 689 690 /* fetch & clear EH info */ 691 spin_lock_irqsave(ap->lock, flags); 692 693 ata_for_each_link(link, ap, HOST_FIRST) { 694 struct ata_eh_context *ehc = &link->eh_context; 695 struct ata_device *dev; 696 697 memset(&link->eh_context, 0, sizeof(link->eh_context)); 698 link->eh_context.i = link->eh_info; 699 memset(&link->eh_info, 0, sizeof(link->eh_info)); 700 701 ata_for_each_dev(dev, link, ENABLED) { 702 int devno = dev->devno; 703 704 ehc->saved_xfer_mode[devno] = dev->xfer_mode; 705 if (ata_ncq_enabled(dev)) 706 ehc->saved_ncq_enabled |= 1 << devno; 707 } 708 } 709 710 ap->pflags |= ATA_PFLAG_EH_IN_PROGRESS; 711 ap->pflags &= ~ATA_PFLAG_EH_PENDING; 712 ap->excl_link = NULL; /* don't maintain exclusion over EH */ 713 714 spin_unlock_irqrestore(ap->lock, flags); 715 716 /* invoke EH, skip if unloading or suspended */ 717 if (!(ap->pflags & (ATA_PFLAG_UNLOADING | ATA_PFLAG_SUSPENDED))) 718 ap->ops->error_handler(ap); 719 else { 720 /* if unloading, commence suicide */ 721 if ((ap->pflags & ATA_PFLAG_UNLOADING) && 722 !(ap->pflags & ATA_PFLAG_UNLOADED)) 723 ata_eh_unload(ap); 724 ata_eh_finish(ap); 725 } 726 727 /* process port suspend request */ 728 ata_eh_handle_port_suspend(ap); 729 730 /* Exception might have happend after ->error_handler 731 * recovered the port but before this point. Repeat 732 * EH in such case. 733 */ 734 spin_lock_irqsave(ap->lock, flags); 735 736 if (ap->pflags & ATA_PFLAG_EH_PENDING) { 737 if (--ap->eh_tries) { 738 spin_unlock_irqrestore(ap->lock, flags); 739 goto repeat; 740 } 741 ata_port_printk(ap, KERN_ERR, "EH pending after %d " 742 "tries, giving up\n", ATA_EH_MAX_TRIES); 743 ap->pflags &= ~ATA_PFLAG_EH_PENDING; 744 } 745 746 /* this run is complete, make sure EH info is clear */ 747 ata_for_each_link(link, ap, HOST_FIRST) 748 memset(&link->eh_info, 0, sizeof(link->eh_info)); 749 750 /* Clear host_eh_scheduled while holding ap->lock such 751 * that if exception occurs after this point but 752 * before EH completion, SCSI midlayer will 753 * re-initiate EH. 754 */ 755 host->host_eh_scheduled = 0; 756 757 spin_unlock_irqrestore(ap->lock, flags); 758 ata_eh_release(ap); 759 } else { 760 WARN_ON(ata_qc_from_tag(ap, ap->link.active_tag) == NULL); 761 ap->ops->eng_timeout(ap); 762 } 763 764 /* finish or retry handled scmd's and clean up */ 765 WARN_ON(host->host_failed || !list_empty(&host->eh_cmd_q)); 766 767 scsi_eh_flush_done_q(&ap->eh_done_q); 768 769 /* clean up */ 770 spin_lock_irqsave(ap->lock, flags); 771 772 if (ap->pflags & ATA_PFLAG_LOADING) 773 ap->pflags &= ~ATA_PFLAG_LOADING; 774 else if (ap->pflags & ATA_PFLAG_SCSI_HOTPLUG) 775 schedule_delayed_work(&ap->hotplug_task, 0); 776 777 if (ap->pflags & ATA_PFLAG_RECOVERED) 778 ata_port_printk(ap, KERN_INFO, "EH complete\n"); 779 780 ap->pflags &= ~(ATA_PFLAG_SCSI_HOTPLUG | ATA_PFLAG_RECOVERED); 781 782 /* tell wait_eh that we're done */ 783 ap->pflags &= ~ATA_PFLAG_EH_IN_PROGRESS; 784 wake_up_all(&ap->eh_wait_q); 785 786 spin_unlock_irqrestore(ap->lock, flags); 787 788 DPRINTK("EXIT\n"); 789 } 790 791 /** 792 * ata_port_wait_eh - Wait for the currently pending EH to complete 793 * @ap: Port to wait EH for 794 * 795 * Wait until the currently pending EH is complete. 796 * 797 * LOCKING: 798 * Kernel thread context (may sleep). 799 */ 800 void ata_port_wait_eh(struct ata_port *ap) 801 { 802 unsigned long flags; 803 DEFINE_WAIT(wait); 804 805 retry: 806 spin_lock_irqsave(ap->lock, flags); 807 808 while (ap->pflags & (ATA_PFLAG_EH_PENDING | ATA_PFLAG_EH_IN_PROGRESS)) { 809 prepare_to_wait(&ap->eh_wait_q, &wait, TASK_UNINTERRUPTIBLE); 810 spin_unlock_irqrestore(ap->lock, flags); 811 schedule(); 812 spin_lock_irqsave(ap->lock, flags); 813 } 814 finish_wait(&ap->eh_wait_q, &wait); 815 816 spin_unlock_irqrestore(ap->lock, flags); 817 818 /* make sure SCSI EH is complete */ 819 if (scsi_host_in_recovery(ap->scsi_host)) { 820 ata_msleep(ap, 10); 821 goto retry; 822 } 823 } 824 825 static int ata_eh_nr_in_flight(struct ata_port *ap) 826 { 827 unsigned int tag; 828 int nr = 0; 829 830 /* count only non-internal commands */ 831 for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++) 832 if (ata_qc_from_tag(ap, tag)) 833 nr++; 834 835 return nr; 836 } 837 838 void ata_eh_fastdrain_timerfn(unsigned long arg) 839 { 840 struct ata_port *ap = (void *)arg; 841 unsigned long flags; 842 int cnt; 843 844 spin_lock_irqsave(ap->lock, flags); 845 846 cnt = ata_eh_nr_in_flight(ap); 847 848 /* are we done? */ 849 if (!cnt) 850 goto out_unlock; 851 852 if (cnt == ap->fastdrain_cnt) { 853 unsigned int tag; 854 855 /* No progress during the last interval, tag all 856 * in-flight qcs as timed out and freeze the port. 857 */ 858 for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++) { 859 struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag); 860 if (qc) 861 qc->err_mask |= AC_ERR_TIMEOUT; 862 } 863 864 ata_port_freeze(ap); 865 } else { 866 /* some qcs have finished, give it another chance */ 867 ap->fastdrain_cnt = cnt; 868 ap->fastdrain_timer.expires = 869 ata_deadline(jiffies, ATA_EH_FASTDRAIN_INTERVAL); 870 add_timer(&ap->fastdrain_timer); 871 } 872 873 out_unlock: 874 spin_unlock_irqrestore(ap->lock, flags); 875 } 876 877 /** 878 * ata_eh_set_pending - set ATA_PFLAG_EH_PENDING and activate fast drain 879 * @ap: target ATA port 880 * @fastdrain: activate fast drain 881 * 882 * Set ATA_PFLAG_EH_PENDING and activate fast drain if @fastdrain 883 * is non-zero and EH wasn't pending before. Fast drain ensures 884 * that EH kicks in in timely manner. 885 * 886 * LOCKING: 887 * spin_lock_irqsave(host lock) 888 */ 889 static void ata_eh_set_pending(struct ata_port *ap, int fastdrain) 890 { 891 int cnt; 892 893 /* already scheduled? */ 894 if (ap->pflags & ATA_PFLAG_EH_PENDING) 895 return; 896 897 ap->pflags |= ATA_PFLAG_EH_PENDING; 898 899 if (!fastdrain) 900 return; 901 902 /* do we have in-flight qcs? */ 903 cnt = ata_eh_nr_in_flight(ap); 904 if (!cnt) 905 return; 906 907 /* activate fast drain */ 908 ap->fastdrain_cnt = cnt; 909 ap->fastdrain_timer.expires = 910 ata_deadline(jiffies, ATA_EH_FASTDRAIN_INTERVAL); 911 add_timer(&ap->fastdrain_timer); 912 } 913 914 /** 915 * ata_qc_schedule_eh - schedule qc for error handling 916 * @qc: command to schedule error handling for 917 * 918 * Schedule error handling for @qc. EH will kick in as soon as 919 * other commands are drained. 920 * 921 * LOCKING: 922 * spin_lock_irqsave(host lock) 923 */ 924 void ata_qc_schedule_eh(struct ata_queued_cmd *qc) 925 { 926 struct ata_port *ap = qc->ap; 927 struct request_queue *q = qc->scsicmd->device->request_queue; 928 unsigned long flags; 929 930 WARN_ON(!ap->ops->error_handler); 931 932 qc->flags |= ATA_QCFLAG_FAILED; 933 ata_eh_set_pending(ap, 1); 934 935 /* The following will fail if timeout has already expired. 936 * ata_scsi_error() takes care of such scmds on EH entry. 937 * Note that ATA_QCFLAG_FAILED is unconditionally set after 938 * this function completes. 939 */ 940 spin_lock_irqsave(q->queue_lock, flags); 941 blk_abort_request(qc->scsicmd->request); 942 spin_unlock_irqrestore(q->queue_lock, flags); 943 } 944 945 /** 946 * ata_port_schedule_eh - schedule error handling without a qc 947 * @ap: ATA port to schedule EH for 948 * 949 * Schedule error handling for @ap. EH will kick in as soon as 950 * all commands are drained. 951 * 952 * LOCKING: 953 * spin_lock_irqsave(host lock) 954 */ 955 void ata_port_schedule_eh(struct ata_port *ap) 956 { 957 WARN_ON(!ap->ops->error_handler); 958 959 if (ap->pflags & ATA_PFLAG_INITIALIZING) 960 return; 961 962 ata_eh_set_pending(ap, 1); 963 scsi_schedule_eh(ap->scsi_host); 964 965 DPRINTK("port EH scheduled\n"); 966 } 967 968 static int ata_do_link_abort(struct ata_port *ap, struct ata_link *link) 969 { 970 int tag, nr_aborted = 0; 971 972 WARN_ON(!ap->ops->error_handler); 973 974 /* we're gonna abort all commands, no need for fast drain */ 975 ata_eh_set_pending(ap, 0); 976 977 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 978 struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag); 979 980 if (qc && (!link || qc->dev->link == link)) { 981 qc->flags |= ATA_QCFLAG_FAILED; 982 ata_qc_complete(qc); 983 nr_aborted++; 984 } 985 } 986 987 if (!nr_aborted) 988 ata_port_schedule_eh(ap); 989 990 return nr_aborted; 991 } 992 993 /** 994 * ata_link_abort - abort all qc's on the link 995 * @link: ATA link to abort qc's for 996 * 997 * Abort all active qc's active on @link and schedule EH. 998 * 999 * LOCKING: 1000 * spin_lock_irqsave(host lock) 1001 * 1002 * RETURNS: 1003 * Number of aborted qc's. 1004 */ 1005 int ata_link_abort(struct ata_link *link) 1006 { 1007 return ata_do_link_abort(link->ap, link); 1008 } 1009 1010 /** 1011 * ata_port_abort - abort all qc's on the port 1012 * @ap: ATA port to abort qc's for 1013 * 1014 * Abort all active qc's of @ap and schedule EH. 1015 * 1016 * LOCKING: 1017 * spin_lock_irqsave(host_set lock) 1018 * 1019 * RETURNS: 1020 * Number of aborted qc's. 1021 */ 1022 int ata_port_abort(struct ata_port *ap) 1023 { 1024 return ata_do_link_abort(ap, NULL); 1025 } 1026 1027 /** 1028 * __ata_port_freeze - freeze port 1029 * @ap: ATA port to freeze 1030 * 1031 * This function is called when HSM violation or some other 1032 * condition disrupts normal operation of the port. Frozen port 1033 * is not allowed to perform any operation until the port is 1034 * thawed, which usually follows a successful reset. 1035 * 1036 * ap->ops->freeze() callback can be used for freezing the port 1037 * hardware-wise (e.g. mask interrupt and stop DMA engine). If a 1038 * port cannot be frozen hardware-wise, the interrupt handler 1039 * must ack and clear interrupts unconditionally while the port 1040 * is frozen. 1041 * 1042 * LOCKING: 1043 * spin_lock_irqsave(host lock) 1044 */ 1045 static void __ata_port_freeze(struct ata_port *ap) 1046 { 1047 WARN_ON(!ap->ops->error_handler); 1048 1049 if (ap->ops->freeze) 1050 ap->ops->freeze(ap); 1051 1052 ap->pflags |= ATA_PFLAG_FROZEN; 1053 1054 DPRINTK("ata%u port frozen\n", ap->print_id); 1055 } 1056 1057 /** 1058 * ata_port_freeze - abort & freeze port 1059 * @ap: ATA port to freeze 1060 * 1061 * Abort and freeze @ap. The freeze operation must be called 1062 * first, because some hardware requires special operations 1063 * before the taskfile registers are accessible. 1064 * 1065 * LOCKING: 1066 * spin_lock_irqsave(host lock) 1067 * 1068 * RETURNS: 1069 * Number of aborted commands. 1070 */ 1071 int ata_port_freeze(struct ata_port *ap) 1072 { 1073 int nr_aborted; 1074 1075 WARN_ON(!ap->ops->error_handler); 1076 1077 __ata_port_freeze(ap); 1078 nr_aborted = ata_port_abort(ap); 1079 1080 return nr_aborted; 1081 } 1082 1083 /** 1084 * sata_async_notification - SATA async notification handler 1085 * @ap: ATA port where async notification is received 1086 * 1087 * Handler to be called when async notification via SDB FIS is 1088 * received. This function schedules EH if necessary. 1089 * 1090 * LOCKING: 1091 * spin_lock_irqsave(host lock) 1092 * 1093 * RETURNS: 1094 * 1 if EH is scheduled, 0 otherwise. 1095 */ 1096 int sata_async_notification(struct ata_port *ap) 1097 { 1098 u32 sntf; 1099 int rc; 1100 1101 if (!(ap->flags & ATA_FLAG_AN)) 1102 return 0; 1103 1104 rc = sata_scr_read(&ap->link, SCR_NOTIFICATION, &sntf); 1105 if (rc == 0) 1106 sata_scr_write(&ap->link, SCR_NOTIFICATION, sntf); 1107 1108 if (!sata_pmp_attached(ap) || rc) { 1109 /* PMP is not attached or SNTF is not available */ 1110 if (!sata_pmp_attached(ap)) { 1111 /* PMP is not attached. Check whether ATAPI 1112 * AN is configured. If so, notify media 1113 * change. 1114 */ 1115 struct ata_device *dev = ap->link.device; 1116 1117 if ((dev->class == ATA_DEV_ATAPI) && 1118 (dev->flags & ATA_DFLAG_AN)) 1119 ata_scsi_media_change_notify(dev); 1120 return 0; 1121 } else { 1122 /* PMP is attached but SNTF is not available. 1123 * ATAPI async media change notification is 1124 * not used. The PMP must be reporting PHY 1125 * status change, schedule EH. 1126 */ 1127 ata_port_schedule_eh(ap); 1128 return 1; 1129 } 1130 } else { 1131 /* PMP is attached and SNTF is available */ 1132 struct ata_link *link; 1133 1134 /* check and notify ATAPI AN */ 1135 ata_for_each_link(link, ap, EDGE) { 1136 if (!(sntf & (1 << link->pmp))) 1137 continue; 1138 1139 if ((link->device->class == ATA_DEV_ATAPI) && 1140 (link->device->flags & ATA_DFLAG_AN)) 1141 ata_scsi_media_change_notify(link->device); 1142 } 1143 1144 /* If PMP is reporting that PHY status of some 1145 * downstream ports has changed, schedule EH. 1146 */ 1147 if (sntf & (1 << SATA_PMP_CTRL_PORT)) { 1148 ata_port_schedule_eh(ap); 1149 return 1; 1150 } 1151 1152 return 0; 1153 } 1154 } 1155 1156 /** 1157 * ata_eh_freeze_port - EH helper to freeze port 1158 * @ap: ATA port to freeze 1159 * 1160 * Freeze @ap. 1161 * 1162 * LOCKING: 1163 * None. 1164 */ 1165 void ata_eh_freeze_port(struct ata_port *ap) 1166 { 1167 unsigned long flags; 1168 1169 if (!ap->ops->error_handler) 1170 return; 1171 1172 spin_lock_irqsave(ap->lock, flags); 1173 __ata_port_freeze(ap); 1174 spin_unlock_irqrestore(ap->lock, flags); 1175 } 1176 1177 /** 1178 * ata_port_thaw_port - EH helper to thaw port 1179 * @ap: ATA port to thaw 1180 * 1181 * Thaw frozen port @ap. 1182 * 1183 * LOCKING: 1184 * None. 1185 */ 1186 void ata_eh_thaw_port(struct ata_port *ap) 1187 { 1188 unsigned long flags; 1189 1190 if (!ap->ops->error_handler) 1191 return; 1192 1193 spin_lock_irqsave(ap->lock, flags); 1194 1195 ap->pflags &= ~ATA_PFLAG_FROZEN; 1196 1197 if (ap->ops->thaw) 1198 ap->ops->thaw(ap); 1199 1200 spin_unlock_irqrestore(ap->lock, flags); 1201 1202 DPRINTK("ata%u port thawed\n", ap->print_id); 1203 } 1204 1205 static void ata_eh_scsidone(struct scsi_cmnd *scmd) 1206 { 1207 /* nada */ 1208 } 1209 1210 static void __ata_eh_qc_complete(struct ata_queued_cmd *qc) 1211 { 1212 struct ata_port *ap = qc->ap; 1213 struct scsi_cmnd *scmd = qc->scsicmd; 1214 unsigned long flags; 1215 1216 spin_lock_irqsave(ap->lock, flags); 1217 qc->scsidone = ata_eh_scsidone; 1218 __ata_qc_complete(qc); 1219 WARN_ON(ata_tag_valid(qc->tag)); 1220 spin_unlock_irqrestore(ap->lock, flags); 1221 1222 scsi_eh_finish_cmd(scmd, &ap->eh_done_q); 1223 } 1224 1225 /** 1226 * ata_eh_qc_complete - Complete an active ATA command from EH 1227 * @qc: Command to complete 1228 * 1229 * Indicate to the mid and upper layers that an ATA command has 1230 * completed. To be used from EH. 1231 */ 1232 void ata_eh_qc_complete(struct ata_queued_cmd *qc) 1233 { 1234 struct scsi_cmnd *scmd = qc->scsicmd; 1235 scmd->retries = scmd->allowed; 1236 __ata_eh_qc_complete(qc); 1237 } 1238 1239 /** 1240 * ata_eh_qc_retry - Tell midlayer to retry an ATA command after EH 1241 * @qc: Command to retry 1242 * 1243 * Indicate to the mid and upper layers that an ATA command 1244 * should be retried. To be used from EH. 1245 * 1246 * SCSI midlayer limits the number of retries to scmd->allowed. 1247 * scmd->retries is decremented for commands which get retried 1248 * due to unrelated failures (qc->err_mask is zero). 1249 */ 1250 void ata_eh_qc_retry(struct ata_queued_cmd *qc) 1251 { 1252 struct scsi_cmnd *scmd = qc->scsicmd; 1253 if (!qc->err_mask && scmd->retries) 1254 scmd->retries--; 1255 __ata_eh_qc_complete(qc); 1256 } 1257 1258 /** 1259 * ata_dev_disable - disable ATA device 1260 * @dev: ATA device to disable 1261 * 1262 * Disable @dev. 1263 * 1264 * Locking: 1265 * EH context. 1266 */ 1267 void ata_dev_disable(struct ata_device *dev) 1268 { 1269 if (!ata_dev_enabled(dev)) 1270 return; 1271 1272 if (ata_msg_drv(dev->link->ap)) 1273 ata_dev_printk(dev, KERN_WARNING, "disabled\n"); 1274 ata_acpi_on_disable(dev); 1275 ata_down_xfermask_limit(dev, ATA_DNXFER_FORCE_PIO0 | ATA_DNXFER_QUIET); 1276 dev->class++; 1277 1278 /* From now till the next successful probe, ering is used to 1279 * track probe failures. Clear accumulated device error info. 1280 */ 1281 ata_ering_clear(&dev->ering); 1282 } 1283 1284 /** 1285 * ata_eh_detach_dev - detach ATA device 1286 * @dev: ATA device to detach 1287 * 1288 * Detach @dev. 1289 * 1290 * LOCKING: 1291 * None. 1292 */ 1293 void ata_eh_detach_dev(struct ata_device *dev) 1294 { 1295 struct ata_link *link = dev->link; 1296 struct ata_port *ap = link->ap; 1297 struct ata_eh_context *ehc = &link->eh_context; 1298 unsigned long flags; 1299 1300 ata_dev_disable(dev); 1301 1302 spin_lock_irqsave(ap->lock, flags); 1303 1304 dev->flags &= ~ATA_DFLAG_DETACH; 1305 1306 if (ata_scsi_offline_dev(dev)) { 1307 dev->flags |= ATA_DFLAG_DETACHED; 1308 ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG; 1309 } 1310 1311 /* clear per-dev EH info */ 1312 ata_eh_clear_action(link, dev, &link->eh_info, ATA_EH_PERDEV_MASK); 1313 ata_eh_clear_action(link, dev, &link->eh_context.i, ATA_EH_PERDEV_MASK); 1314 ehc->saved_xfer_mode[dev->devno] = 0; 1315 ehc->saved_ncq_enabled &= ~(1 << dev->devno); 1316 1317 spin_unlock_irqrestore(ap->lock, flags); 1318 } 1319 1320 /** 1321 * ata_eh_about_to_do - about to perform eh_action 1322 * @link: target ATA link 1323 * @dev: target ATA dev for per-dev action (can be NULL) 1324 * @action: action about to be performed 1325 * 1326 * Called just before performing EH actions to clear related bits 1327 * in @link->eh_info such that eh actions are not unnecessarily 1328 * repeated. 1329 * 1330 * LOCKING: 1331 * None. 1332 */ 1333 void ata_eh_about_to_do(struct ata_link *link, struct ata_device *dev, 1334 unsigned int action) 1335 { 1336 struct ata_port *ap = link->ap; 1337 struct ata_eh_info *ehi = &link->eh_info; 1338 struct ata_eh_context *ehc = &link->eh_context; 1339 unsigned long flags; 1340 1341 spin_lock_irqsave(ap->lock, flags); 1342 1343 ata_eh_clear_action(link, dev, ehi, action); 1344 1345 /* About to take EH action, set RECOVERED. Ignore actions on 1346 * slave links as master will do them again. 1347 */ 1348 if (!(ehc->i.flags & ATA_EHI_QUIET) && link != ap->slave_link) 1349 ap->pflags |= ATA_PFLAG_RECOVERED; 1350 1351 spin_unlock_irqrestore(ap->lock, flags); 1352 } 1353 1354 /** 1355 * ata_eh_done - EH action complete 1356 * @ap: target ATA port 1357 * @dev: target ATA dev for per-dev action (can be NULL) 1358 * @action: action just completed 1359 * 1360 * Called right after performing EH actions to clear related bits 1361 * in @link->eh_context. 1362 * 1363 * LOCKING: 1364 * None. 1365 */ 1366 void ata_eh_done(struct ata_link *link, struct ata_device *dev, 1367 unsigned int action) 1368 { 1369 struct ata_eh_context *ehc = &link->eh_context; 1370 1371 ata_eh_clear_action(link, dev, &ehc->i, action); 1372 } 1373 1374 /** 1375 * ata_err_string - convert err_mask to descriptive string 1376 * @err_mask: error mask to convert to string 1377 * 1378 * Convert @err_mask to descriptive string. Errors are 1379 * prioritized according to severity and only the most severe 1380 * error is reported. 1381 * 1382 * LOCKING: 1383 * None. 1384 * 1385 * RETURNS: 1386 * Descriptive string for @err_mask 1387 */ 1388 static const char *ata_err_string(unsigned int err_mask) 1389 { 1390 if (err_mask & AC_ERR_HOST_BUS) 1391 return "host bus error"; 1392 if (err_mask & AC_ERR_ATA_BUS) 1393 return "ATA bus error"; 1394 if (err_mask & AC_ERR_TIMEOUT) 1395 return "timeout"; 1396 if (err_mask & AC_ERR_HSM) 1397 return "HSM violation"; 1398 if (err_mask & AC_ERR_SYSTEM) 1399 return "internal error"; 1400 if (err_mask & AC_ERR_MEDIA) 1401 return "media error"; 1402 if (err_mask & AC_ERR_INVALID) 1403 return "invalid argument"; 1404 if (err_mask & AC_ERR_DEV) 1405 return "device error"; 1406 return "unknown error"; 1407 } 1408 1409 /** 1410 * ata_read_log_page - read a specific log page 1411 * @dev: target device 1412 * @page: page to read 1413 * @buf: buffer to store read page 1414 * @sectors: number of sectors to read 1415 * 1416 * Read log page using READ_LOG_EXT command. 1417 * 1418 * LOCKING: 1419 * Kernel thread context (may sleep). 1420 * 1421 * RETURNS: 1422 * 0 on success, AC_ERR_* mask otherwise. 1423 */ 1424 static unsigned int ata_read_log_page(struct ata_device *dev, 1425 u8 page, void *buf, unsigned int sectors) 1426 { 1427 struct ata_taskfile tf; 1428 unsigned int err_mask; 1429 1430 DPRINTK("read log page - page %d\n", page); 1431 1432 ata_tf_init(dev, &tf); 1433 tf.command = ATA_CMD_READ_LOG_EXT; 1434 tf.lbal = page; 1435 tf.nsect = sectors; 1436 tf.hob_nsect = sectors >> 8; 1437 tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_LBA48 | ATA_TFLAG_DEVICE; 1438 tf.protocol = ATA_PROT_PIO; 1439 1440 err_mask = ata_exec_internal(dev, &tf, NULL, DMA_FROM_DEVICE, 1441 buf, sectors * ATA_SECT_SIZE, 0); 1442 1443 DPRINTK("EXIT, err_mask=%x\n", err_mask); 1444 return err_mask; 1445 } 1446 1447 /** 1448 * ata_eh_read_log_10h - Read log page 10h for NCQ error details 1449 * @dev: Device to read log page 10h from 1450 * @tag: Resulting tag of the failed command 1451 * @tf: Resulting taskfile registers of the failed command 1452 * 1453 * Read log page 10h to obtain NCQ error details and clear error 1454 * condition. 1455 * 1456 * LOCKING: 1457 * Kernel thread context (may sleep). 1458 * 1459 * RETURNS: 1460 * 0 on success, -errno otherwise. 1461 */ 1462 static int ata_eh_read_log_10h(struct ata_device *dev, 1463 int *tag, struct ata_taskfile *tf) 1464 { 1465 u8 *buf = dev->link->ap->sector_buf; 1466 unsigned int err_mask; 1467 u8 csum; 1468 int i; 1469 1470 err_mask = ata_read_log_page(dev, ATA_LOG_SATA_NCQ, buf, 1); 1471 if (err_mask) 1472 return -EIO; 1473 1474 csum = 0; 1475 for (i = 0; i < ATA_SECT_SIZE; i++) 1476 csum += buf[i]; 1477 if (csum) 1478 ata_dev_printk(dev, KERN_WARNING, 1479 "invalid checksum 0x%x on log page 10h\n", csum); 1480 1481 if (buf[0] & 0x80) 1482 return -ENOENT; 1483 1484 *tag = buf[0] & 0x1f; 1485 1486 tf->command = buf[2]; 1487 tf->feature = buf[3]; 1488 tf->lbal = buf[4]; 1489 tf->lbam = buf[5]; 1490 tf->lbah = buf[6]; 1491 tf->device = buf[7]; 1492 tf->hob_lbal = buf[8]; 1493 tf->hob_lbam = buf[9]; 1494 tf->hob_lbah = buf[10]; 1495 tf->nsect = buf[12]; 1496 tf->hob_nsect = buf[13]; 1497 1498 return 0; 1499 } 1500 1501 /** 1502 * atapi_eh_tur - perform ATAPI TEST_UNIT_READY 1503 * @dev: target ATAPI device 1504 * @r_sense_key: out parameter for sense_key 1505 * 1506 * Perform ATAPI TEST_UNIT_READY. 1507 * 1508 * LOCKING: 1509 * EH context (may sleep). 1510 * 1511 * RETURNS: 1512 * 0 on success, AC_ERR_* mask on failure. 1513 */ 1514 static unsigned int atapi_eh_tur(struct ata_device *dev, u8 *r_sense_key) 1515 { 1516 u8 cdb[ATAPI_CDB_LEN] = { TEST_UNIT_READY, 0, 0, 0, 0, 0 }; 1517 struct ata_taskfile tf; 1518 unsigned int err_mask; 1519 1520 ata_tf_init(dev, &tf); 1521 1522 tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE; 1523 tf.command = ATA_CMD_PACKET; 1524 tf.protocol = ATAPI_PROT_NODATA; 1525 1526 err_mask = ata_exec_internal(dev, &tf, cdb, DMA_NONE, NULL, 0, 0); 1527 if (err_mask == AC_ERR_DEV) 1528 *r_sense_key = tf.feature >> 4; 1529 return err_mask; 1530 } 1531 1532 /** 1533 * atapi_eh_request_sense - perform ATAPI REQUEST_SENSE 1534 * @dev: device to perform REQUEST_SENSE to 1535 * @sense_buf: result sense data buffer (SCSI_SENSE_BUFFERSIZE bytes long) 1536 * @dfl_sense_key: default sense key to use 1537 * 1538 * Perform ATAPI REQUEST_SENSE after the device reported CHECK 1539 * SENSE. This function is EH helper. 1540 * 1541 * LOCKING: 1542 * Kernel thread context (may sleep). 1543 * 1544 * RETURNS: 1545 * 0 on success, AC_ERR_* mask on failure 1546 */ 1547 static unsigned int atapi_eh_request_sense(struct ata_device *dev, 1548 u8 *sense_buf, u8 dfl_sense_key) 1549 { 1550 u8 cdb[ATAPI_CDB_LEN] = 1551 { REQUEST_SENSE, 0, 0, 0, SCSI_SENSE_BUFFERSIZE, 0 }; 1552 struct ata_port *ap = dev->link->ap; 1553 struct ata_taskfile tf; 1554 1555 DPRINTK("ATAPI request sense\n"); 1556 1557 /* FIXME: is this needed? */ 1558 memset(sense_buf, 0, SCSI_SENSE_BUFFERSIZE); 1559 1560 /* initialize sense_buf with the error register, 1561 * for the case where they are -not- overwritten 1562 */ 1563 sense_buf[0] = 0x70; 1564 sense_buf[2] = dfl_sense_key; 1565 1566 /* some devices time out if garbage left in tf */ 1567 ata_tf_init(dev, &tf); 1568 1569 tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE; 1570 tf.command = ATA_CMD_PACKET; 1571 1572 /* is it pointless to prefer PIO for "safety reasons"? */ 1573 if (ap->flags & ATA_FLAG_PIO_DMA) { 1574 tf.protocol = ATAPI_PROT_DMA; 1575 tf.feature |= ATAPI_PKT_DMA; 1576 } else { 1577 tf.protocol = ATAPI_PROT_PIO; 1578 tf.lbam = SCSI_SENSE_BUFFERSIZE; 1579 tf.lbah = 0; 1580 } 1581 1582 return ata_exec_internal(dev, &tf, cdb, DMA_FROM_DEVICE, 1583 sense_buf, SCSI_SENSE_BUFFERSIZE, 0); 1584 } 1585 1586 /** 1587 * ata_eh_analyze_serror - analyze SError for a failed port 1588 * @link: ATA link to analyze SError for 1589 * 1590 * Analyze SError if available and further determine cause of 1591 * failure. 1592 * 1593 * LOCKING: 1594 * None. 1595 */ 1596 static void ata_eh_analyze_serror(struct ata_link *link) 1597 { 1598 struct ata_eh_context *ehc = &link->eh_context; 1599 u32 serror = ehc->i.serror; 1600 unsigned int err_mask = 0, action = 0; 1601 u32 hotplug_mask; 1602 1603 if (serror & (SERR_PERSISTENT | SERR_DATA)) { 1604 err_mask |= AC_ERR_ATA_BUS; 1605 action |= ATA_EH_RESET; 1606 } 1607 if (serror & SERR_PROTOCOL) { 1608 err_mask |= AC_ERR_HSM; 1609 action |= ATA_EH_RESET; 1610 } 1611 if (serror & SERR_INTERNAL) { 1612 err_mask |= AC_ERR_SYSTEM; 1613 action |= ATA_EH_RESET; 1614 } 1615 1616 /* Determine whether a hotplug event has occurred. Both 1617 * SError.N/X are considered hotplug events for enabled or 1618 * host links. For disabled PMP links, only N bit is 1619 * considered as X bit is left at 1 for link plugging. 1620 */ 1621 if (link->lpm_policy != ATA_LPM_MAX_POWER) 1622 hotplug_mask = 0; /* hotplug doesn't work w/ LPM */ 1623 else if (!(link->flags & ATA_LFLAG_DISABLED) || ata_is_host_link(link)) 1624 hotplug_mask = SERR_PHYRDY_CHG | SERR_DEV_XCHG; 1625 else 1626 hotplug_mask = SERR_PHYRDY_CHG; 1627 1628 if (serror & hotplug_mask) 1629 ata_ehi_hotplugged(&ehc->i); 1630 1631 ehc->i.err_mask |= err_mask; 1632 ehc->i.action |= action; 1633 } 1634 1635 /** 1636 * ata_eh_analyze_ncq_error - analyze NCQ error 1637 * @link: ATA link to analyze NCQ error for 1638 * 1639 * Read log page 10h, determine the offending qc and acquire 1640 * error status TF. For NCQ device errors, all LLDDs have to do 1641 * is setting AC_ERR_DEV in ehi->err_mask. This function takes 1642 * care of the rest. 1643 * 1644 * LOCKING: 1645 * Kernel thread context (may sleep). 1646 */ 1647 void ata_eh_analyze_ncq_error(struct ata_link *link) 1648 { 1649 struct ata_port *ap = link->ap; 1650 struct ata_eh_context *ehc = &link->eh_context; 1651 struct ata_device *dev = link->device; 1652 struct ata_queued_cmd *qc; 1653 struct ata_taskfile tf; 1654 int tag, rc; 1655 1656 /* if frozen, we can't do much */ 1657 if (ap->pflags & ATA_PFLAG_FROZEN) 1658 return; 1659 1660 /* is it NCQ device error? */ 1661 if (!link->sactive || !(ehc->i.err_mask & AC_ERR_DEV)) 1662 return; 1663 1664 /* has LLDD analyzed already? */ 1665 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 1666 qc = __ata_qc_from_tag(ap, tag); 1667 1668 if (!(qc->flags & ATA_QCFLAG_FAILED)) 1669 continue; 1670 1671 if (qc->err_mask) 1672 return; 1673 } 1674 1675 /* okay, this error is ours */ 1676 memset(&tf, 0, sizeof(tf)); 1677 rc = ata_eh_read_log_10h(dev, &tag, &tf); 1678 if (rc) { 1679 ata_link_printk(link, KERN_ERR, "failed to read log page 10h " 1680 "(errno=%d)\n", rc); 1681 return; 1682 } 1683 1684 if (!(link->sactive & (1 << tag))) { 1685 ata_link_printk(link, KERN_ERR, "log page 10h reported " 1686 "inactive tag %d\n", tag); 1687 return; 1688 } 1689 1690 /* we've got the perpetrator, condemn it */ 1691 qc = __ata_qc_from_tag(ap, tag); 1692 memcpy(&qc->result_tf, &tf, sizeof(tf)); 1693 qc->result_tf.flags = ATA_TFLAG_ISADDR | ATA_TFLAG_LBA | ATA_TFLAG_LBA48; 1694 qc->err_mask |= AC_ERR_DEV | AC_ERR_NCQ; 1695 ehc->i.err_mask &= ~AC_ERR_DEV; 1696 } 1697 1698 /** 1699 * ata_eh_analyze_tf - analyze taskfile of a failed qc 1700 * @qc: qc to analyze 1701 * @tf: Taskfile registers to analyze 1702 * 1703 * Analyze taskfile of @qc and further determine cause of 1704 * failure. This function also requests ATAPI sense data if 1705 * avaliable. 1706 * 1707 * LOCKING: 1708 * Kernel thread context (may sleep). 1709 * 1710 * RETURNS: 1711 * Determined recovery action 1712 */ 1713 static unsigned int ata_eh_analyze_tf(struct ata_queued_cmd *qc, 1714 const struct ata_taskfile *tf) 1715 { 1716 unsigned int tmp, action = 0; 1717 u8 stat = tf->command, err = tf->feature; 1718 1719 if ((stat & (ATA_BUSY | ATA_DRQ | ATA_DRDY)) != ATA_DRDY) { 1720 qc->err_mask |= AC_ERR_HSM; 1721 return ATA_EH_RESET; 1722 } 1723 1724 if (stat & (ATA_ERR | ATA_DF)) 1725 qc->err_mask |= AC_ERR_DEV; 1726 else 1727 return 0; 1728 1729 switch (qc->dev->class) { 1730 case ATA_DEV_ATA: 1731 if (err & ATA_ICRC) 1732 qc->err_mask |= AC_ERR_ATA_BUS; 1733 if (err & ATA_UNC) 1734 qc->err_mask |= AC_ERR_MEDIA; 1735 if (err & ATA_IDNF) 1736 qc->err_mask |= AC_ERR_INVALID; 1737 break; 1738 1739 case ATA_DEV_ATAPI: 1740 if (!(qc->ap->pflags & ATA_PFLAG_FROZEN)) { 1741 tmp = atapi_eh_request_sense(qc->dev, 1742 qc->scsicmd->sense_buffer, 1743 qc->result_tf.feature >> 4); 1744 if (!tmp) { 1745 /* ATA_QCFLAG_SENSE_VALID is used to 1746 * tell atapi_qc_complete() that sense 1747 * data is already valid. 1748 * 1749 * TODO: interpret sense data and set 1750 * appropriate err_mask. 1751 */ 1752 qc->flags |= ATA_QCFLAG_SENSE_VALID; 1753 } else 1754 qc->err_mask |= tmp; 1755 } 1756 } 1757 1758 if (qc->err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT | AC_ERR_ATA_BUS)) 1759 action |= ATA_EH_RESET; 1760 1761 return action; 1762 } 1763 1764 static int ata_eh_categorize_error(unsigned int eflags, unsigned int err_mask, 1765 int *xfer_ok) 1766 { 1767 int base = 0; 1768 1769 if (!(eflags & ATA_EFLAG_DUBIOUS_XFER)) 1770 *xfer_ok = 1; 1771 1772 if (!*xfer_ok) 1773 base = ATA_ECAT_DUBIOUS_NONE; 1774 1775 if (err_mask & AC_ERR_ATA_BUS) 1776 return base + ATA_ECAT_ATA_BUS; 1777 1778 if (err_mask & AC_ERR_TIMEOUT) 1779 return base + ATA_ECAT_TOUT_HSM; 1780 1781 if (eflags & ATA_EFLAG_IS_IO) { 1782 if (err_mask & AC_ERR_HSM) 1783 return base + ATA_ECAT_TOUT_HSM; 1784 if ((err_mask & 1785 (AC_ERR_DEV|AC_ERR_MEDIA|AC_ERR_INVALID)) == AC_ERR_DEV) 1786 return base + ATA_ECAT_UNK_DEV; 1787 } 1788 1789 return 0; 1790 } 1791 1792 struct speed_down_verdict_arg { 1793 u64 since; 1794 int xfer_ok; 1795 int nr_errors[ATA_ECAT_NR]; 1796 }; 1797 1798 static int speed_down_verdict_cb(struct ata_ering_entry *ent, void *void_arg) 1799 { 1800 struct speed_down_verdict_arg *arg = void_arg; 1801 int cat; 1802 1803 if ((ent->eflags & ATA_EFLAG_OLD_ER) || (ent->timestamp < arg->since)) 1804 return -1; 1805 1806 cat = ata_eh_categorize_error(ent->eflags, ent->err_mask, 1807 &arg->xfer_ok); 1808 arg->nr_errors[cat]++; 1809 1810 return 0; 1811 } 1812 1813 /** 1814 * ata_eh_speed_down_verdict - Determine speed down verdict 1815 * @dev: Device of interest 1816 * 1817 * This function examines error ring of @dev and determines 1818 * whether NCQ needs to be turned off, transfer speed should be 1819 * stepped down, or falling back to PIO is necessary. 1820 * 1821 * ECAT_ATA_BUS : ATA_BUS error for any command 1822 * 1823 * ECAT_TOUT_HSM : TIMEOUT for any command or HSM violation for 1824 * IO commands 1825 * 1826 * ECAT_UNK_DEV : Unknown DEV error for IO commands 1827 * 1828 * ECAT_DUBIOUS_* : Identical to above three but occurred while 1829 * data transfer hasn't been verified. 1830 * 1831 * Verdicts are 1832 * 1833 * NCQ_OFF : Turn off NCQ. 1834 * 1835 * SPEED_DOWN : Speed down transfer speed but don't fall back 1836 * to PIO. 1837 * 1838 * FALLBACK_TO_PIO : Fall back to PIO. 1839 * 1840 * Even if multiple verdicts are returned, only one action is 1841 * taken per error. An action triggered by non-DUBIOUS errors 1842 * clears ering, while one triggered by DUBIOUS_* errors doesn't. 1843 * This is to expedite speed down decisions right after device is 1844 * initially configured. 1845 * 1846 * The followings are speed down rules. #1 and #2 deal with 1847 * DUBIOUS errors. 1848 * 1849 * 1. If more than one DUBIOUS_ATA_BUS or DUBIOUS_TOUT_HSM errors 1850 * occurred during last 5 mins, SPEED_DOWN and FALLBACK_TO_PIO. 1851 * 1852 * 2. If more than one DUBIOUS_TOUT_HSM or DUBIOUS_UNK_DEV errors 1853 * occurred during last 5 mins, NCQ_OFF. 1854 * 1855 * 3. If more than 8 ATA_BUS, TOUT_HSM or UNK_DEV errors 1856 * ocurred during last 5 mins, FALLBACK_TO_PIO 1857 * 1858 * 4. If more than 3 TOUT_HSM or UNK_DEV errors occurred 1859 * during last 10 mins, NCQ_OFF. 1860 * 1861 * 5. If more than 3 ATA_BUS or TOUT_HSM errors, or more than 6 1862 * UNK_DEV errors occurred during last 10 mins, SPEED_DOWN. 1863 * 1864 * LOCKING: 1865 * Inherited from caller. 1866 * 1867 * RETURNS: 1868 * OR of ATA_EH_SPDN_* flags. 1869 */ 1870 static unsigned int ata_eh_speed_down_verdict(struct ata_device *dev) 1871 { 1872 const u64 j5mins = 5LLU * 60 * HZ, j10mins = 10LLU * 60 * HZ; 1873 u64 j64 = get_jiffies_64(); 1874 struct speed_down_verdict_arg arg; 1875 unsigned int verdict = 0; 1876 1877 /* scan past 5 mins of error history */ 1878 memset(&arg, 0, sizeof(arg)); 1879 arg.since = j64 - min(j64, j5mins); 1880 ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg); 1881 1882 if (arg.nr_errors[ATA_ECAT_DUBIOUS_ATA_BUS] + 1883 arg.nr_errors[ATA_ECAT_DUBIOUS_TOUT_HSM] > 1) 1884 verdict |= ATA_EH_SPDN_SPEED_DOWN | 1885 ATA_EH_SPDN_FALLBACK_TO_PIO | ATA_EH_SPDN_KEEP_ERRORS; 1886 1887 if (arg.nr_errors[ATA_ECAT_DUBIOUS_TOUT_HSM] + 1888 arg.nr_errors[ATA_ECAT_DUBIOUS_UNK_DEV] > 1) 1889 verdict |= ATA_EH_SPDN_NCQ_OFF | ATA_EH_SPDN_KEEP_ERRORS; 1890 1891 if (arg.nr_errors[ATA_ECAT_ATA_BUS] + 1892 arg.nr_errors[ATA_ECAT_TOUT_HSM] + 1893 arg.nr_errors[ATA_ECAT_UNK_DEV] > 6) 1894 verdict |= ATA_EH_SPDN_FALLBACK_TO_PIO; 1895 1896 /* scan past 10 mins of error history */ 1897 memset(&arg, 0, sizeof(arg)); 1898 arg.since = j64 - min(j64, j10mins); 1899 ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg); 1900 1901 if (arg.nr_errors[ATA_ECAT_TOUT_HSM] + 1902 arg.nr_errors[ATA_ECAT_UNK_DEV] > 3) 1903 verdict |= ATA_EH_SPDN_NCQ_OFF; 1904 1905 if (arg.nr_errors[ATA_ECAT_ATA_BUS] + 1906 arg.nr_errors[ATA_ECAT_TOUT_HSM] > 3 || 1907 arg.nr_errors[ATA_ECAT_UNK_DEV] > 6) 1908 verdict |= ATA_EH_SPDN_SPEED_DOWN; 1909 1910 return verdict; 1911 } 1912 1913 /** 1914 * ata_eh_speed_down - record error and speed down if necessary 1915 * @dev: Failed device 1916 * @eflags: mask of ATA_EFLAG_* flags 1917 * @err_mask: err_mask of the error 1918 * 1919 * Record error and examine error history to determine whether 1920 * adjusting transmission speed is necessary. It also sets 1921 * transmission limits appropriately if such adjustment is 1922 * necessary. 1923 * 1924 * LOCKING: 1925 * Kernel thread context (may sleep). 1926 * 1927 * RETURNS: 1928 * Determined recovery action. 1929 */ 1930 static unsigned int ata_eh_speed_down(struct ata_device *dev, 1931 unsigned int eflags, unsigned int err_mask) 1932 { 1933 struct ata_link *link = ata_dev_phys_link(dev); 1934 int xfer_ok = 0; 1935 unsigned int verdict; 1936 unsigned int action = 0; 1937 1938 /* don't bother if Cat-0 error */ 1939 if (ata_eh_categorize_error(eflags, err_mask, &xfer_ok) == 0) 1940 return 0; 1941 1942 /* record error and determine whether speed down is necessary */ 1943 ata_ering_record(&dev->ering, eflags, err_mask); 1944 verdict = ata_eh_speed_down_verdict(dev); 1945 1946 /* turn off NCQ? */ 1947 if ((verdict & ATA_EH_SPDN_NCQ_OFF) && 1948 (dev->flags & (ATA_DFLAG_PIO | ATA_DFLAG_NCQ | 1949 ATA_DFLAG_NCQ_OFF)) == ATA_DFLAG_NCQ) { 1950 dev->flags |= ATA_DFLAG_NCQ_OFF; 1951 ata_dev_printk(dev, KERN_WARNING, 1952 "NCQ disabled due to excessive errors\n"); 1953 goto done; 1954 } 1955 1956 /* speed down? */ 1957 if (verdict & ATA_EH_SPDN_SPEED_DOWN) { 1958 /* speed down SATA link speed if possible */ 1959 if (sata_down_spd_limit(link, 0) == 0) { 1960 action |= ATA_EH_RESET; 1961 goto done; 1962 } 1963 1964 /* lower transfer mode */ 1965 if (dev->spdn_cnt < 2) { 1966 static const int dma_dnxfer_sel[] = 1967 { ATA_DNXFER_DMA, ATA_DNXFER_40C }; 1968 static const int pio_dnxfer_sel[] = 1969 { ATA_DNXFER_PIO, ATA_DNXFER_FORCE_PIO0 }; 1970 int sel; 1971 1972 if (dev->xfer_shift != ATA_SHIFT_PIO) 1973 sel = dma_dnxfer_sel[dev->spdn_cnt]; 1974 else 1975 sel = pio_dnxfer_sel[dev->spdn_cnt]; 1976 1977 dev->spdn_cnt++; 1978 1979 if (ata_down_xfermask_limit(dev, sel) == 0) { 1980 action |= ATA_EH_RESET; 1981 goto done; 1982 } 1983 } 1984 } 1985 1986 /* Fall back to PIO? Slowing down to PIO is meaningless for 1987 * SATA ATA devices. Consider it only for PATA and SATAPI. 1988 */ 1989 if ((verdict & ATA_EH_SPDN_FALLBACK_TO_PIO) && (dev->spdn_cnt >= 2) && 1990 (link->ap->cbl != ATA_CBL_SATA || dev->class == ATA_DEV_ATAPI) && 1991 (dev->xfer_shift != ATA_SHIFT_PIO)) { 1992 if (ata_down_xfermask_limit(dev, ATA_DNXFER_FORCE_PIO) == 0) { 1993 dev->spdn_cnt = 0; 1994 action |= ATA_EH_RESET; 1995 goto done; 1996 } 1997 } 1998 1999 return 0; 2000 done: 2001 /* device has been slowed down, blow error history */ 2002 if (!(verdict & ATA_EH_SPDN_KEEP_ERRORS)) 2003 ata_ering_clear(&dev->ering); 2004 return action; 2005 } 2006 2007 /** 2008 * ata_eh_link_autopsy - analyze error and determine recovery action 2009 * @link: host link to perform autopsy on 2010 * 2011 * Analyze why @link failed and determine which recovery actions 2012 * are needed. This function also sets more detailed AC_ERR_* 2013 * values and fills sense data for ATAPI CHECK SENSE. 2014 * 2015 * LOCKING: 2016 * Kernel thread context (may sleep). 2017 */ 2018 static void ata_eh_link_autopsy(struct ata_link *link) 2019 { 2020 struct ata_port *ap = link->ap; 2021 struct ata_eh_context *ehc = &link->eh_context; 2022 struct ata_device *dev; 2023 unsigned int all_err_mask = 0, eflags = 0; 2024 int tag; 2025 u32 serror; 2026 int rc; 2027 2028 DPRINTK("ENTER\n"); 2029 2030 if (ehc->i.flags & ATA_EHI_NO_AUTOPSY) 2031 return; 2032 2033 /* obtain and analyze SError */ 2034 rc = sata_scr_read(link, SCR_ERROR, &serror); 2035 if (rc == 0) { 2036 ehc->i.serror |= serror; 2037 ata_eh_analyze_serror(link); 2038 } else if (rc != -EOPNOTSUPP) { 2039 /* SError read failed, force reset and probing */ 2040 ehc->i.probe_mask |= ATA_ALL_DEVICES; 2041 ehc->i.action |= ATA_EH_RESET; 2042 ehc->i.err_mask |= AC_ERR_OTHER; 2043 } 2044 2045 /* analyze NCQ failure */ 2046 ata_eh_analyze_ncq_error(link); 2047 2048 /* any real error trumps AC_ERR_OTHER */ 2049 if (ehc->i.err_mask & ~AC_ERR_OTHER) 2050 ehc->i.err_mask &= ~AC_ERR_OTHER; 2051 2052 all_err_mask |= ehc->i.err_mask; 2053 2054 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 2055 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 2056 2057 if (!(qc->flags & ATA_QCFLAG_FAILED) || 2058 ata_dev_phys_link(qc->dev) != link) 2059 continue; 2060 2061 /* inherit upper level err_mask */ 2062 qc->err_mask |= ehc->i.err_mask; 2063 2064 /* analyze TF */ 2065 ehc->i.action |= ata_eh_analyze_tf(qc, &qc->result_tf); 2066 2067 /* DEV errors are probably spurious in case of ATA_BUS error */ 2068 if (qc->err_mask & AC_ERR_ATA_BUS) 2069 qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_MEDIA | 2070 AC_ERR_INVALID); 2071 2072 /* any real error trumps unknown error */ 2073 if (qc->err_mask & ~AC_ERR_OTHER) 2074 qc->err_mask &= ~AC_ERR_OTHER; 2075 2076 /* SENSE_VALID trumps dev/unknown error and revalidation */ 2077 if (qc->flags & ATA_QCFLAG_SENSE_VALID) 2078 qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_OTHER); 2079 2080 /* determine whether the command is worth retrying */ 2081 if (qc->flags & ATA_QCFLAG_IO || 2082 (!(qc->err_mask & AC_ERR_INVALID) && 2083 qc->err_mask != AC_ERR_DEV)) 2084 qc->flags |= ATA_QCFLAG_RETRY; 2085 2086 /* accumulate error info */ 2087 ehc->i.dev = qc->dev; 2088 all_err_mask |= qc->err_mask; 2089 if (qc->flags & ATA_QCFLAG_IO) 2090 eflags |= ATA_EFLAG_IS_IO; 2091 } 2092 2093 /* enforce default EH actions */ 2094 if (ap->pflags & ATA_PFLAG_FROZEN || 2095 all_err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT)) 2096 ehc->i.action |= ATA_EH_RESET; 2097 else if (((eflags & ATA_EFLAG_IS_IO) && all_err_mask) || 2098 (!(eflags & ATA_EFLAG_IS_IO) && (all_err_mask & ~AC_ERR_DEV))) 2099 ehc->i.action |= ATA_EH_REVALIDATE; 2100 2101 /* If we have offending qcs and the associated failed device, 2102 * perform per-dev EH action only on the offending device. 2103 */ 2104 if (ehc->i.dev) { 2105 ehc->i.dev_action[ehc->i.dev->devno] |= 2106 ehc->i.action & ATA_EH_PERDEV_MASK; 2107 ehc->i.action &= ~ATA_EH_PERDEV_MASK; 2108 } 2109 2110 /* propagate timeout to host link */ 2111 if ((all_err_mask & AC_ERR_TIMEOUT) && !ata_is_host_link(link)) 2112 ap->link.eh_context.i.err_mask |= AC_ERR_TIMEOUT; 2113 2114 /* record error and consider speeding down */ 2115 dev = ehc->i.dev; 2116 if (!dev && ((ata_link_max_devices(link) == 1 && 2117 ata_dev_enabled(link->device)))) 2118 dev = link->device; 2119 2120 if (dev) { 2121 if (dev->flags & ATA_DFLAG_DUBIOUS_XFER) 2122 eflags |= ATA_EFLAG_DUBIOUS_XFER; 2123 ehc->i.action |= ata_eh_speed_down(dev, eflags, all_err_mask); 2124 } 2125 2126 DPRINTK("EXIT\n"); 2127 } 2128 2129 /** 2130 * ata_eh_autopsy - analyze error and determine recovery action 2131 * @ap: host port to perform autopsy on 2132 * 2133 * Analyze all links of @ap and determine why they failed and 2134 * which recovery actions are needed. 2135 * 2136 * LOCKING: 2137 * Kernel thread context (may sleep). 2138 */ 2139 void ata_eh_autopsy(struct ata_port *ap) 2140 { 2141 struct ata_link *link; 2142 2143 ata_for_each_link(link, ap, EDGE) 2144 ata_eh_link_autopsy(link); 2145 2146 /* Handle the frigging slave link. Autopsy is done similarly 2147 * but actions and flags are transferred over to the master 2148 * link and handled from there. 2149 */ 2150 if (ap->slave_link) { 2151 struct ata_eh_context *mehc = &ap->link.eh_context; 2152 struct ata_eh_context *sehc = &ap->slave_link->eh_context; 2153 2154 /* transfer control flags from master to slave */ 2155 sehc->i.flags |= mehc->i.flags & ATA_EHI_TO_SLAVE_MASK; 2156 2157 /* perform autopsy on the slave link */ 2158 ata_eh_link_autopsy(ap->slave_link); 2159 2160 /* transfer actions from slave to master and clear slave */ 2161 ata_eh_about_to_do(ap->slave_link, NULL, ATA_EH_ALL_ACTIONS); 2162 mehc->i.action |= sehc->i.action; 2163 mehc->i.dev_action[1] |= sehc->i.dev_action[1]; 2164 mehc->i.flags |= sehc->i.flags; 2165 ata_eh_done(ap->slave_link, NULL, ATA_EH_ALL_ACTIONS); 2166 } 2167 2168 /* Autopsy of fanout ports can affect host link autopsy. 2169 * Perform host link autopsy last. 2170 */ 2171 if (sata_pmp_attached(ap)) 2172 ata_eh_link_autopsy(&ap->link); 2173 } 2174 2175 /** 2176 * ata_get_cmd_descript - get description for ATA command 2177 * @command: ATA command code to get description for 2178 * 2179 * Return a textual description of the given command, or NULL if the 2180 * command is not known. 2181 * 2182 * LOCKING: 2183 * None 2184 */ 2185 const char *ata_get_cmd_descript(u8 command) 2186 { 2187 #ifdef CONFIG_ATA_VERBOSE_ERROR 2188 static const struct 2189 { 2190 u8 command; 2191 const char *text; 2192 } cmd_descr[] = { 2193 { ATA_CMD_DEV_RESET, "DEVICE RESET" }, 2194 { ATA_CMD_CHK_POWER, "CHECK POWER MODE" }, 2195 { ATA_CMD_STANDBY, "STANDBY" }, 2196 { ATA_CMD_IDLE, "IDLE" }, 2197 { ATA_CMD_EDD, "EXECUTE DEVICE DIAGNOSTIC" }, 2198 { ATA_CMD_DOWNLOAD_MICRO, "DOWNLOAD MICROCODE" }, 2199 { ATA_CMD_NOP, "NOP" }, 2200 { ATA_CMD_FLUSH, "FLUSH CACHE" }, 2201 { ATA_CMD_FLUSH_EXT, "FLUSH CACHE EXT" }, 2202 { ATA_CMD_ID_ATA, "IDENTIFY DEVICE" }, 2203 { ATA_CMD_ID_ATAPI, "IDENTIFY PACKET DEVICE" }, 2204 { ATA_CMD_SERVICE, "SERVICE" }, 2205 { ATA_CMD_READ, "READ DMA" }, 2206 { ATA_CMD_READ_EXT, "READ DMA EXT" }, 2207 { ATA_CMD_READ_QUEUED, "READ DMA QUEUED" }, 2208 { ATA_CMD_READ_STREAM_EXT, "READ STREAM EXT" }, 2209 { ATA_CMD_READ_STREAM_DMA_EXT, "READ STREAM DMA EXT" }, 2210 { ATA_CMD_WRITE, "WRITE DMA" }, 2211 { ATA_CMD_WRITE_EXT, "WRITE DMA EXT" }, 2212 { ATA_CMD_WRITE_QUEUED, "WRITE DMA QUEUED EXT" }, 2213 { ATA_CMD_WRITE_STREAM_EXT, "WRITE STREAM EXT" }, 2214 { ATA_CMD_WRITE_STREAM_DMA_EXT, "WRITE STREAM DMA EXT" }, 2215 { ATA_CMD_WRITE_FUA_EXT, "WRITE DMA FUA EXT" }, 2216 { ATA_CMD_WRITE_QUEUED_FUA_EXT, "WRITE DMA QUEUED FUA EXT" }, 2217 { ATA_CMD_FPDMA_READ, "READ FPDMA QUEUED" }, 2218 { ATA_CMD_FPDMA_WRITE, "WRITE FPDMA QUEUED" }, 2219 { ATA_CMD_PIO_READ, "READ SECTOR(S)" }, 2220 { ATA_CMD_PIO_READ_EXT, "READ SECTOR(S) EXT" }, 2221 { ATA_CMD_PIO_WRITE, "WRITE SECTOR(S)" }, 2222 { ATA_CMD_PIO_WRITE_EXT, "WRITE SECTOR(S) EXT" }, 2223 { ATA_CMD_READ_MULTI, "READ MULTIPLE" }, 2224 { ATA_CMD_READ_MULTI_EXT, "READ MULTIPLE EXT" }, 2225 { ATA_CMD_WRITE_MULTI, "WRITE MULTIPLE" }, 2226 { ATA_CMD_WRITE_MULTI_EXT, "WRITE MULTIPLE EXT" }, 2227 { ATA_CMD_WRITE_MULTI_FUA_EXT, "WRITE MULTIPLE FUA EXT" }, 2228 { ATA_CMD_SET_FEATURES, "SET FEATURES" }, 2229 { ATA_CMD_SET_MULTI, "SET MULTIPLE MODE" }, 2230 { ATA_CMD_VERIFY, "READ VERIFY SECTOR(S)" }, 2231 { ATA_CMD_VERIFY_EXT, "READ VERIFY SECTOR(S) EXT" }, 2232 { ATA_CMD_WRITE_UNCORR_EXT, "WRITE UNCORRECTABLE EXT" }, 2233 { ATA_CMD_STANDBYNOW1, "STANDBY IMMEDIATE" }, 2234 { ATA_CMD_IDLEIMMEDIATE, "IDLE IMMEDIATE" }, 2235 { ATA_CMD_SLEEP, "SLEEP" }, 2236 { ATA_CMD_INIT_DEV_PARAMS, "INITIALIZE DEVICE PARAMETERS" }, 2237 { ATA_CMD_READ_NATIVE_MAX, "READ NATIVE MAX ADDRESS" }, 2238 { ATA_CMD_READ_NATIVE_MAX_EXT, "READ NATIVE MAX ADDRESS EXT" }, 2239 { ATA_CMD_SET_MAX, "SET MAX ADDRESS" }, 2240 { ATA_CMD_SET_MAX_EXT, "SET MAX ADDRESS EXT" }, 2241 { ATA_CMD_READ_LOG_EXT, "READ LOG EXT" }, 2242 { ATA_CMD_WRITE_LOG_EXT, "WRITE LOG EXT" }, 2243 { ATA_CMD_READ_LOG_DMA_EXT, "READ LOG DMA EXT" }, 2244 { ATA_CMD_WRITE_LOG_DMA_EXT, "WRITE LOG DMA EXT" }, 2245 { ATA_CMD_TRUSTED_RCV, "TRUSTED RECEIVE" }, 2246 { ATA_CMD_TRUSTED_RCV_DMA, "TRUSTED RECEIVE DMA" }, 2247 { ATA_CMD_TRUSTED_SND, "TRUSTED SEND" }, 2248 { ATA_CMD_TRUSTED_SND_DMA, "TRUSTED SEND DMA" }, 2249 { ATA_CMD_PMP_READ, "READ BUFFER" }, 2250 { ATA_CMD_PMP_WRITE, "WRITE BUFFER" }, 2251 { ATA_CMD_CONF_OVERLAY, "DEVICE CONFIGURATION OVERLAY" }, 2252 { ATA_CMD_SEC_SET_PASS, "SECURITY SET PASSWORD" }, 2253 { ATA_CMD_SEC_UNLOCK, "SECURITY UNLOCK" }, 2254 { ATA_CMD_SEC_ERASE_PREP, "SECURITY ERASE PREPARE" }, 2255 { ATA_CMD_SEC_ERASE_UNIT, "SECURITY ERASE UNIT" }, 2256 { ATA_CMD_SEC_FREEZE_LOCK, "SECURITY FREEZE LOCK" }, 2257 { ATA_CMD_SEC_DISABLE_PASS, "SECURITY DISABLE PASSWORD" }, 2258 { ATA_CMD_CONFIG_STREAM, "CONFIGURE STREAM" }, 2259 { ATA_CMD_SMART, "SMART" }, 2260 { ATA_CMD_MEDIA_LOCK, "DOOR LOCK" }, 2261 { ATA_CMD_MEDIA_UNLOCK, "DOOR UNLOCK" }, 2262 { ATA_CMD_DSM, "DATA SET MANAGEMENT" }, 2263 { ATA_CMD_CHK_MED_CRD_TYP, "CHECK MEDIA CARD TYPE" }, 2264 { ATA_CMD_CFA_REQ_EXT_ERR, "CFA REQUEST EXTENDED ERROR" }, 2265 { ATA_CMD_CFA_WRITE_NE, "CFA WRITE SECTORS WITHOUT ERASE" }, 2266 { ATA_CMD_CFA_TRANS_SECT, "CFA TRANSLATE SECTOR" }, 2267 { ATA_CMD_CFA_ERASE, "CFA ERASE SECTORS" }, 2268 { ATA_CMD_CFA_WRITE_MULT_NE, "CFA WRITE MULTIPLE WITHOUT ERASE" }, 2269 { ATA_CMD_READ_LONG, "READ LONG (with retries)" }, 2270 { ATA_CMD_READ_LONG_ONCE, "READ LONG (without retries)" }, 2271 { ATA_CMD_WRITE_LONG, "WRITE LONG (with retries)" }, 2272 { ATA_CMD_WRITE_LONG_ONCE, "WRITE LONG (without retries)" }, 2273 { ATA_CMD_RESTORE, "RECALIBRATE" }, 2274 { 0, NULL } /* terminate list */ 2275 }; 2276 2277 unsigned int i; 2278 for (i = 0; cmd_descr[i].text; i++) 2279 if (cmd_descr[i].command == command) 2280 return cmd_descr[i].text; 2281 #endif 2282 2283 return NULL; 2284 } 2285 2286 /** 2287 * ata_eh_link_report - report error handling to user 2288 * @link: ATA link EH is going on 2289 * 2290 * Report EH to user. 2291 * 2292 * LOCKING: 2293 * None. 2294 */ 2295 static void ata_eh_link_report(struct ata_link *link) 2296 { 2297 struct ata_port *ap = link->ap; 2298 struct ata_eh_context *ehc = &link->eh_context; 2299 const char *frozen, *desc; 2300 char tries_buf[6]; 2301 int tag, nr_failed = 0; 2302 2303 if (ehc->i.flags & ATA_EHI_QUIET) 2304 return; 2305 2306 desc = NULL; 2307 if (ehc->i.desc[0] != '\0') 2308 desc = ehc->i.desc; 2309 2310 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 2311 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 2312 2313 if (!(qc->flags & ATA_QCFLAG_FAILED) || 2314 ata_dev_phys_link(qc->dev) != link || 2315 ((qc->flags & ATA_QCFLAG_QUIET) && 2316 qc->err_mask == AC_ERR_DEV)) 2317 continue; 2318 if (qc->flags & ATA_QCFLAG_SENSE_VALID && !qc->err_mask) 2319 continue; 2320 2321 nr_failed++; 2322 } 2323 2324 if (!nr_failed && !ehc->i.err_mask) 2325 return; 2326 2327 frozen = ""; 2328 if (ap->pflags & ATA_PFLAG_FROZEN) 2329 frozen = " frozen"; 2330 2331 memset(tries_buf, 0, sizeof(tries_buf)); 2332 if (ap->eh_tries < ATA_EH_MAX_TRIES) 2333 snprintf(tries_buf, sizeof(tries_buf) - 1, " t%d", 2334 ap->eh_tries); 2335 2336 if (ehc->i.dev) { 2337 ata_dev_printk(ehc->i.dev, KERN_ERR, "exception Emask 0x%x " 2338 "SAct 0x%x SErr 0x%x action 0x%x%s%s\n", 2339 ehc->i.err_mask, link->sactive, ehc->i.serror, 2340 ehc->i.action, frozen, tries_buf); 2341 if (desc) 2342 ata_dev_printk(ehc->i.dev, KERN_ERR, "%s\n", desc); 2343 } else { 2344 ata_link_printk(link, KERN_ERR, "exception Emask 0x%x " 2345 "SAct 0x%x SErr 0x%x action 0x%x%s%s\n", 2346 ehc->i.err_mask, link->sactive, ehc->i.serror, 2347 ehc->i.action, frozen, tries_buf); 2348 if (desc) 2349 ata_link_printk(link, KERN_ERR, "%s\n", desc); 2350 } 2351 2352 #ifdef CONFIG_ATA_VERBOSE_ERROR 2353 if (ehc->i.serror) 2354 ata_link_printk(link, KERN_ERR, 2355 "SError: { %s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s}\n", 2356 ehc->i.serror & SERR_DATA_RECOVERED ? "RecovData " : "", 2357 ehc->i.serror & SERR_COMM_RECOVERED ? "RecovComm " : "", 2358 ehc->i.serror & SERR_DATA ? "UnrecovData " : "", 2359 ehc->i.serror & SERR_PERSISTENT ? "Persist " : "", 2360 ehc->i.serror & SERR_PROTOCOL ? "Proto " : "", 2361 ehc->i.serror & SERR_INTERNAL ? "HostInt " : "", 2362 ehc->i.serror & SERR_PHYRDY_CHG ? "PHYRdyChg " : "", 2363 ehc->i.serror & SERR_PHY_INT_ERR ? "PHYInt " : "", 2364 ehc->i.serror & SERR_COMM_WAKE ? "CommWake " : "", 2365 ehc->i.serror & SERR_10B_8B_ERR ? "10B8B " : "", 2366 ehc->i.serror & SERR_DISPARITY ? "Dispar " : "", 2367 ehc->i.serror & SERR_CRC ? "BadCRC " : "", 2368 ehc->i.serror & SERR_HANDSHAKE ? "Handshk " : "", 2369 ehc->i.serror & SERR_LINK_SEQ_ERR ? "LinkSeq " : "", 2370 ehc->i.serror & SERR_TRANS_ST_ERROR ? "TrStaTrns " : "", 2371 ehc->i.serror & SERR_UNRECOG_FIS ? "UnrecFIS " : "", 2372 ehc->i.serror & SERR_DEV_XCHG ? "DevExch " : ""); 2373 #endif 2374 2375 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 2376 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 2377 struct ata_taskfile *cmd = &qc->tf, *res = &qc->result_tf; 2378 const u8 *cdb = qc->cdb; 2379 char data_buf[20] = ""; 2380 char cdb_buf[70] = ""; 2381 2382 if (!(qc->flags & ATA_QCFLAG_FAILED) || 2383 ata_dev_phys_link(qc->dev) != link || !qc->err_mask) 2384 continue; 2385 2386 if (qc->dma_dir != DMA_NONE) { 2387 static const char *dma_str[] = { 2388 [DMA_BIDIRECTIONAL] = "bidi", 2389 [DMA_TO_DEVICE] = "out", 2390 [DMA_FROM_DEVICE] = "in", 2391 }; 2392 static const char *prot_str[] = { 2393 [ATA_PROT_PIO] = "pio", 2394 [ATA_PROT_DMA] = "dma", 2395 [ATA_PROT_NCQ] = "ncq", 2396 [ATAPI_PROT_PIO] = "pio", 2397 [ATAPI_PROT_DMA] = "dma", 2398 }; 2399 2400 snprintf(data_buf, sizeof(data_buf), " %s %u %s", 2401 prot_str[qc->tf.protocol], qc->nbytes, 2402 dma_str[qc->dma_dir]); 2403 } 2404 2405 if (ata_is_atapi(qc->tf.protocol)) { 2406 if (qc->scsicmd) 2407 scsi_print_command(qc->scsicmd); 2408 else 2409 snprintf(cdb_buf, sizeof(cdb_buf), 2410 "cdb %02x %02x %02x %02x %02x %02x %02x %02x " 2411 "%02x %02x %02x %02x %02x %02x %02x %02x\n ", 2412 cdb[0], cdb[1], cdb[2], cdb[3], 2413 cdb[4], cdb[5], cdb[6], cdb[7], 2414 cdb[8], cdb[9], cdb[10], cdb[11], 2415 cdb[12], cdb[13], cdb[14], cdb[15]); 2416 } else { 2417 const char *descr = ata_get_cmd_descript(cmd->command); 2418 if (descr) 2419 ata_dev_printk(qc->dev, KERN_ERR, 2420 "failed command: %s\n", descr); 2421 } 2422 2423 ata_dev_printk(qc->dev, KERN_ERR, 2424 "cmd %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x " 2425 "tag %d%s\n %s" 2426 "res %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x " 2427 "Emask 0x%x (%s)%s\n", 2428 cmd->command, cmd->feature, cmd->nsect, 2429 cmd->lbal, cmd->lbam, cmd->lbah, 2430 cmd->hob_feature, cmd->hob_nsect, 2431 cmd->hob_lbal, cmd->hob_lbam, cmd->hob_lbah, 2432 cmd->device, qc->tag, data_buf, cdb_buf, 2433 res->command, res->feature, res->nsect, 2434 res->lbal, res->lbam, res->lbah, 2435 res->hob_feature, res->hob_nsect, 2436 res->hob_lbal, res->hob_lbam, res->hob_lbah, 2437 res->device, qc->err_mask, ata_err_string(qc->err_mask), 2438 qc->err_mask & AC_ERR_NCQ ? " <F>" : ""); 2439 2440 #ifdef CONFIG_ATA_VERBOSE_ERROR 2441 if (res->command & (ATA_BUSY | ATA_DRDY | ATA_DF | ATA_DRQ | 2442 ATA_ERR)) { 2443 if (res->command & ATA_BUSY) 2444 ata_dev_printk(qc->dev, KERN_ERR, 2445 "status: { Busy }\n"); 2446 else 2447 ata_dev_printk(qc->dev, KERN_ERR, 2448 "status: { %s%s%s%s}\n", 2449 res->command & ATA_DRDY ? "DRDY " : "", 2450 res->command & ATA_DF ? "DF " : "", 2451 res->command & ATA_DRQ ? "DRQ " : "", 2452 res->command & ATA_ERR ? "ERR " : ""); 2453 } 2454 2455 if (cmd->command != ATA_CMD_PACKET && 2456 (res->feature & (ATA_ICRC | ATA_UNC | ATA_IDNF | 2457 ATA_ABORTED))) 2458 ata_dev_printk(qc->dev, KERN_ERR, 2459 "error: { %s%s%s%s}\n", 2460 res->feature & ATA_ICRC ? "ICRC " : "", 2461 res->feature & ATA_UNC ? "UNC " : "", 2462 res->feature & ATA_IDNF ? "IDNF " : "", 2463 res->feature & ATA_ABORTED ? "ABRT " : ""); 2464 #endif 2465 } 2466 } 2467 2468 /** 2469 * ata_eh_report - report error handling to user 2470 * @ap: ATA port to report EH about 2471 * 2472 * Report EH to user. 2473 * 2474 * LOCKING: 2475 * None. 2476 */ 2477 void ata_eh_report(struct ata_port *ap) 2478 { 2479 struct ata_link *link; 2480 2481 ata_for_each_link(link, ap, HOST_FIRST) 2482 ata_eh_link_report(link); 2483 } 2484 2485 static int ata_do_reset(struct ata_link *link, ata_reset_fn_t reset, 2486 unsigned int *classes, unsigned long deadline, 2487 bool clear_classes) 2488 { 2489 struct ata_device *dev; 2490 2491 if (clear_classes) 2492 ata_for_each_dev(dev, link, ALL) 2493 classes[dev->devno] = ATA_DEV_UNKNOWN; 2494 2495 return reset(link, classes, deadline); 2496 } 2497 2498 static int ata_eh_followup_srst_needed(struct ata_link *link, 2499 int rc, const unsigned int *classes) 2500 { 2501 if ((link->flags & ATA_LFLAG_NO_SRST) || ata_link_offline(link)) 2502 return 0; 2503 if (rc == -EAGAIN) 2504 return 1; 2505 if (sata_pmp_supported(link->ap) && ata_is_host_link(link)) 2506 return 1; 2507 return 0; 2508 } 2509 2510 int ata_eh_reset(struct ata_link *link, int classify, 2511 ata_prereset_fn_t prereset, ata_reset_fn_t softreset, 2512 ata_reset_fn_t hardreset, ata_postreset_fn_t postreset) 2513 { 2514 struct ata_port *ap = link->ap; 2515 struct ata_link *slave = ap->slave_link; 2516 struct ata_eh_context *ehc = &link->eh_context; 2517 struct ata_eh_context *sehc = slave ? &slave->eh_context : NULL; 2518 unsigned int *classes = ehc->classes; 2519 unsigned int lflags = link->flags; 2520 int verbose = !(ehc->i.flags & ATA_EHI_QUIET); 2521 int max_tries = 0, try = 0; 2522 struct ata_link *failed_link; 2523 struct ata_device *dev; 2524 unsigned long deadline, now; 2525 ata_reset_fn_t reset; 2526 unsigned long flags; 2527 u32 sstatus; 2528 int nr_unknown, rc; 2529 2530 /* 2531 * Prepare to reset 2532 */ 2533 while (ata_eh_reset_timeouts[max_tries] != ULONG_MAX) 2534 max_tries++; 2535 if (link->flags & ATA_LFLAG_NO_HRST) 2536 hardreset = NULL; 2537 if (link->flags & ATA_LFLAG_NO_SRST) 2538 softreset = NULL; 2539 2540 /* make sure each reset attemp is at least COOL_DOWN apart */ 2541 if (ehc->i.flags & ATA_EHI_DID_RESET) { 2542 now = jiffies; 2543 WARN_ON(time_after(ehc->last_reset, now)); 2544 deadline = ata_deadline(ehc->last_reset, 2545 ATA_EH_RESET_COOL_DOWN); 2546 if (time_before(now, deadline)) 2547 schedule_timeout_uninterruptible(deadline - now); 2548 } 2549 2550 spin_lock_irqsave(ap->lock, flags); 2551 ap->pflags |= ATA_PFLAG_RESETTING; 2552 spin_unlock_irqrestore(ap->lock, flags); 2553 2554 ata_eh_about_to_do(link, NULL, ATA_EH_RESET); 2555 2556 ata_for_each_dev(dev, link, ALL) { 2557 /* If we issue an SRST then an ATA drive (not ATAPI) 2558 * may change configuration and be in PIO0 timing. If 2559 * we do a hard reset (or are coming from power on) 2560 * this is true for ATA or ATAPI. Until we've set a 2561 * suitable controller mode we should not touch the 2562 * bus as we may be talking too fast. 2563 */ 2564 dev->pio_mode = XFER_PIO_0; 2565 2566 /* If the controller has a pio mode setup function 2567 * then use it to set the chipset to rights. Don't 2568 * touch the DMA setup as that will be dealt with when 2569 * configuring devices. 2570 */ 2571 if (ap->ops->set_piomode) 2572 ap->ops->set_piomode(ap, dev); 2573 } 2574 2575 /* prefer hardreset */ 2576 reset = NULL; 2577 ehc->i.action &= ~ATA_EH_RESET; 2578 if (hardreset) { 2579 reset = hardreset; 2580 ehc->i.action |= ATA_EH_HARDRESET; 2581 } else if (softreset) { 2582 reset = softreset; 2583 ehc->i.action |= ATA_EH_SOFTRESET; 2584 } 2585 2586 if (prereset) { 2587 unsigned long deadline = ata_deadline(jiffies, 2588 ATA_EH_PRERESET_TIMEOUT); 2589 2590 if (slave) { 2591 sehc->i.action &= ~ATA_EH_RESET; 2592 sehc->i.action |= ehc->i.action; 2593 } 2594 2595 rc = prereset(link, deadline); 2596 2597 /* If present, do prereset on slave link too. Reset 2598 * is skipped iff both master and slave links report 2599 * -ENOENT or clear ATA_EH_RESET. 2600 */ 2601 if (slave && (rc == 0 || rc == -ENOENT)) { 2602 int tmp; 2603 2604 tmp = prereset(slave, deadline); 2605 if (tmp != -ENOENT) 2606 rc = tmp; 2607 2608 ehc->i.action |= sehc->i.action; 2609 } 2610 2611 if (rc) { 2612 if (rc == -ENOENT) { 2613 ata_link_printk(link, KERN_DEBUG, 2614 "port disabled. ignoring.\n"); 2615 ehc->i.action &= ~ATA_EH_RESET; 2616 2617 ata_for_each_dev(dev, link, ALL) 2618 classes[dev->devno] = ATA_DEV_NONE; 2619 2620 rc = 0; 2621 } else 2622 ata_link_printk(link, KERN_ERR, 2623 "prereset failed (errno=%d)\n", rc); 2624 goto out; 2625 } 2626 2627 /* prereset() might have cleared ATA_EH_RESET. If so, 2628 * bang classes, thaw and return. 2629 */ 2630 if (reset && !(ehc->i.action & ATA_EH_RESET)) { 2631 ata_for_each_dev(dev, link, ALL) 2632 classes[dev->devno] = ATA_DEV_NONE; 2633 if ((ap->pflags & ATA_PFLAG_FROZEN) && 2634 ata_is_host_link(link)) 2635 ata_eh_thaw_port(ap); 2636 rc = 0; 2637 goto out; 2638 } 2639 } 2640 2641 retry: 2642 /* 2643 * Perform reset 2644 */ 2645 if (ata_is_host_link(link)) 2646 ata_eh_freeze_port(ap); 2647 2648 deadline = ata_deadline(jiffies, ata_eh_reset_timeouts[try++]); 2649 2650 if (reset) { 2651 if (verbose) 2652 ata_link_printk(link, KERN_INFO, "%s resetting link\n", 2653 reset == softreset ? "soft" : "hard"); 2654 2655 /* mark that this EH session started with reset */ 2656 ehc->last_reset = jiffies; 2657 if (reset == hardreset) 2658 ehc->i.flags |= ATA_EHI_DID_HARDRESET; 2659 else 2660 ehc->i.flags |= ATA_EHI_DID_SOFTRESET; 2661 2662 rc = ata_do_reset(link, reset, classes, deadline, true); 2663 if (rc && rc != -EAGAIN) { 2664 failed_link = link; 2665 goto fail; 2666 } 2667 2668 /* hardreset slave link if existent */ 2669 if (slave && reset == hardreset) { 2670 int tmp; 2671 2672 if (verbose) 2673 ata_link_printk(slave, KERN_INFO, 2674 "hard resetting link\n"); 2675 2676 ata_eh_about_to_do(slave, NULL, ATA_EH_RESET); 2677 tmp = ata_do_reset(slave, reset, classes, deadline, 2678 false); 2679 switch (tmp) { 2680 case -EAGAIN: 2681 rc = -EAGAIN; 2682 case 0: 2683 break; 2684 default: 2685 failed_link = slave; 2686 rc = tmp; 2687 goto fail; 2688 } 2689 } 2690 2691 /* perform follow-up SRST if necessary */ 2692 if (reset == hardreset && 2693 ata_eh_followup_srst_needed(link, rc, classes)) { 2694 reset = softreset; 2695 2696 if (!reset) { 2697 ata_link_printk(link, KERN_ERR, 2698 "follow-up softreset required " 2699 "but no softreset avaliable\n"); 2700 failed_link = link; 2701 rc = -EINVAL; 2702 goto fail; 2703 } 2704 2705 ata_eh_about_to_do(link, NULL, ATA_EH_RESET); 2706 rc = ata_do_reset(link, reset, classes, deadline, true); 2707 if (rc) { 2708 failed_link = link; 2709 goto fail; 2710 } 2711 } 2712 } else { 2713 if (verbose) 2714 ata_link_printk(link, KERN_INFO, "no reset method " 2715 "available, skipping reset\n"); 2716 if (!(lflags & ATA_LFLAG_ASSUME_CLASS)) 2717 lflags |= ATA_LFLAG_ASSUME_ATA; 2718 } 2719 2720 /* 2721 * Post-reset processing 2722 */ 2723 ata_for_each_dev(dev, link, ALL) { 2724 /* After the reset, the device state is PIO 0 and the 2725 * controller state is undefined. Reset also wakes up 2726 * drives from sleeping mode. 2727 */ 2728 dev->pio_mode = XFER_PIO_0; 2729 dev->flags &= ~ATA_DFLAG_SLEEPING; 2730 2731 if (ata_phys_link_offline(ata_dev_phys_link(dev))) 2732 continue; 2733 2734 /* apply class override */ 2735 if (lflags & ATA_LFLAG_ASSUME_ATA) 2736 classes[dev->devno] = ATA_DEV_ATA; 2737 else if (lflags & ATA_LFLAG_ASSUME_SEMB) 2738 classes[dev->devno] = ATA_DEV_SEMB_UNSUP; 2739 } 2740 2741 /* record current link speed */ 2742 if (sata_scr_read(link, SCR_STATUS, &sstatus) == 0) 2743 link->sata_spd = (sstatus >> 4) & 0xf; 2744 if (slave && sata_scr_read(slave, SCR_STATUS, &sstatus) == 0) 2745 slave->sata_spd = (sstatus >> 4) & 0xf; 2746 2747 /* thaw the port */ 2748 if (ata_is_host_link(link)) 2749 ata_eh_thaw_port(ap); 2750 2751 /* postreset() should clear hardware SError. Although SError 2752 * is cleared during link resume, clearing SError here is 2753 * necessary as some PHYs raise hotplug events after SRST. 2754 * This introduces race condition where hotplug occurs between 2755 * reset and here. This race is mediated by cross checking 2756 * link onlineness and classification result later. 2757 */ 2758 if (postreset) { 2759 postreset(link, classes); 2760 if (slave) 2761 postreset(slave, classes); 2762 } 2763 2764 /* 2765 * Some controllers can't be frozen very well and may set 2766 * spuruious error conditions during reset. Clear accumulated 2767 * error information. As reset is the final recovery action, 2768 * nothing is lost by doing this. 2769 */ 2770 spin_lock_irqsave(link->ap->lock, flags); 2771 memset(&link->eh_info, 0, sizeof(link->eh_info)); 2772 if (slave) 2773 memset(&slave->eh_info, 0, sizeof(link->eh_info)); 2774 ap->pflags &= ~ATA_PFLAG_EH_PENDING; 2775 spin_unlock_irqrestore(link->ap->lock, flags); 2776 2777 /* 2778 * Make sure onlineness and classification result correspond. 2779 * Hotplug could have happened during reset and some 2780 * controllers fail to wait while a drive is spinning up after 2781 * being hotplugged causing misdetection. By cross checking 2782 * link on/offlineness and classification result, those 2783 * conditions can be reliably detected and retried. 2784 */ 2785 nr_unknown = 0; 2786 ata_for_each_dev(dev, link, ALL) { 2787 if (ata_phys_link_online(ata_dev_phys_link(dev))) { 2788 if (classes[dev->devno] == ATA_DEV_UNKNOWN) { 2789 ata_dev_printk(dev, KERN_DEBUG, "link online " 2790 "but device misclassifed\n"); 2791 classes[dev->devno] = ATA_DEV_NONE; 2792 nr_unknown++; 2793 } 2794 } else if (ata_phys_link_offline(ata_dev_phys_link(dev))) { 2795 if (ata_class_enabled(classes[dev->devno])) 2796 ata_dev_printk(dev, KERN_DEBUG, "link offline, " 2797 "clearing class %d to NONE\n", 2798 classes[dev->devno]); 2799 classes[dev->devno] = ATA_DEV_NONE; 2800 } else if (classes[dev->devno] == ATA_DEV_UNKNOWN) { 2801 ata_dev_printk(dev, KERN_DEBUG, "link status unknown, " 2802 "clearing UNKNOWN to NONE\n"); 2803 classes[dev->devno] = ATA_DEV_NONE; 2804 } 2805 } 2806 2807 if (classify && nr_unknown) { 2808 if (try < max_tries) { 2809 ata_link_printk(link, KERN_WARNING, "link online but " 2810 "%d devices misclassified, retrying\n", 2811 nr_unknown); 2812 failed_link = link; 2813 rc = -EAGAIN; 2814 goto fail; 2815 } 2816 ata_link_printk(link, KERN_WARNING, 2817 "link online but %d devices misclassified, " 2818 "device detection might fail\n", nr_unknown); 2819 } 2820 2821 /* reset successful, schedule revalidation */ 2822 ata_eh_done(link, NULL, ATA_EH_RESET); 2823 if (slave) 2824 ata_eh_done(slave, NULL, ATA_EH_RESET); 2825 ehc->last_reset = jiffies; /* update to completion time */ 2826 ehc->i.action |= ATA_EH_REVALIDATE; 2827 link->lpm_policy = ATA_LPM_UNKNOWN; /* reset LPM state */ 2828 2829 rc = 0; 2830 out: 2831 /* clear hotplug flag */ 2832 ehc->i.flags &= ~ATA_EHI_HOTPLUGGED; 2833 if (slave) 2834 sehc->i.flags &= ~ATA_EHI_HOTPLUGGED; 2835 2836 spin_lock_irqsave(ap->lock, flags); 2837 ap->pflags &= ~ATA_PFLAG_RESETTING; 2838 spin_unlock_irqrestore(ap->lock, flags); 2839 2840 return rc; 2841 2842 fail: 2843 /* if SCR isn't accessible on a fan-out port, PMP needs to be reset */ 2844 if (!ata_is_host_link(link) && 2845 sata_scr_read(link, SCR_STATUS, &sstatus)) 2846 rc = -ERESTART; 2847 2848 if (rc == -ERESTART || try >= max_tries) 2849 goto out; 2850 2851 now = jiffies; 2852 if (time_before(now, deadline)) { 2853 unsigned long delta = deadline - now; 2854 2855 ata_link_printk(failed_link, KERN_WARNING, 2856 "reset failed (errno=%d), retrying in %u secs\n", 2857 rc, DIV_ROUND_UP(jiffies_to_msecs(delta), 1000)); 2858 2859 ata_eh_release(ap); 2860 while (delta) 2861 delta = schedule_timeout_uninterruptible(delta); 2862 ata_eh_acquire(ap); 2863 } 2864 2865 if (try == max_tries - 1) { 2866 sata_down_spd_limit(link, 0); 2867 if (slave) 2868 sata_down_spd_limit(slave, 0); 2869 } else if (rc == -EPIPE) 2870 sata_down_spd_limit(failed_link, 0); 2871 2872 if (hardreset) 2873 reset = hardreset; 2874 goto retry; 2875 } 2876 2877 static inline void ata_eh_pull_park_action(struct ata_port *ap) 2878 { 2879 struct ata_link *link; 2880 struct ata_device *dev; 2881 unsigned long flags; 2882 2883 /* 2884 * This function can be thought of as an extended version of 2885 * ata_eh_about_to_do() specially crafted to accommodate the 2886 * requirements of ATA_EH_PARK handling. Since the EH thread 2887 * does not leave the do {} while () loop in ata_eh_recover as 2888 * long as the timeout for a park request to *one* device on 2889 * the port has not expired, and since we still want to pick 2890 * up park requests to other devices on the same port or 2891 * timeout updates for the same device, we have to pull 2892 * ATA_EH_PARK actions from eh_info into eh_context.i 2893 * ourselves at the beginning of each pass over the loop. 2894 * 2895 * Additionally, all write accesses to &ap->park_req_pending 2896 * through INIT_COMPLETION() (see below) or complete_all() 2897 * (see ata_scsi_park_store()) are protected by the host lock. 2898 * As a result we have that park_req_pending.done is zero on 2899 * exit from this function, i.e. when ATA_EH_PARK actions for 2900 * *all* devices on port ap have been pulled into the 2901 * respective eh_context structs. If, and only if, 2902 * park_req_pending.done is non-zero by the time we reach 2903 * wait_for_completion_timeout(), another ATA_EH_PARK action 2904 * has been scheduled for at least one of the devices on port 2905 * ap and we have to cycle over the do {} while () loop in 2906 * ata_eh_recover() again. 2907 */ 2908 2909 spin_lock_irqsave(ap->lock, flags); 2910 INIT_COMPLETION(ap->park_req_pending); 2911 ata_for_each_link(link, ap, EDGE) { 2912 ata_for_each_dev(dev, link, ALL) { 2913 struct ata_eh_info *ehi = &link->eh_info; 2914 2915 link->eh_context.i.dev_action[dev->devno] |= 2916 ehi->dev_action[dev->devno] & ATA_EH_PARK; 2917 ata_eh_clear_action(link, dev, ehi, ATA_EH_PARK); 2918 } 2919 } 2920 spin_unlock_irqrestore(ap->lock, flags); 2921 } 2922 2923 static void ata_eh_park_issue_cmd(struct ata_device *dev, int park) 2924 { 2925 struct ata_eh_context *ehc = &dev->link->eh_context; 2926 struct ata_taskfile tf; 2927 unsigned int err_mask; 2928 2929 ata_tf_init(dev, &tf); 2930 if (park) { 2931 ehc->unloaded_mask |= 1 << dev->devno; 2932 tf.command = ATA_CMD_IDLEIMMEDIATE; 2933 tf.feature = 0x44; 2934 tf.lbal = 0x4c; 2935 tf.lbam = 0x4e; 2936 tf.lbah = 0x55; 2937 } else { 2938 ehc->unloaded_mask &= ~(1 << dev->devno); 2939 tf.command = ATA_CMD_CHK_POWER; 2940 } 2941 2942 tf.flags |= ATA_TFLAG_DEVICE | ATA_TFLAG_ISADDR; 2943 tf.protocol |= ATA_PROT_NODATA; 2944 err_mask = ata_exec_internal(dev, &tf, NULL, DMA_NONE, NULL, 0, 0); 2945 if (park && (err_mask || tf.lbal != 0xc4)) { 2946 ata_dev_printk(dev, KERN_ERR, "head unload failed!\n"); 2947 ehc->unloaded_mask &= ~(1 << dev->devno); 2948 } 2949 } 2950 2951 static int ata_eh_revalidate_and_attach(struct ata_link *link, 2952 struct ata_device **r_failed_dev) 2953 { 2954 struct ata_port *ap = link->ap; 2955 struct ata_eh_context *ehc = &link->eh_context; 2956 struct ata_device *dev; 2957 unsigned int new_mask = 0; 2958 unsigned long flags; 2959 int rc = 0; 2960 2961 DPRINTK("ENTER\n"); 2962 2963 /* For PATA drive side cable detection to work, IDENTIFY must 2964 * be done backwards such that PDIAG- is released by the slave 2965 * device before the master device is identified. 2966 */ 2967 ata_for_each_dev(dev, link, ALL_REVERSE) { 2968 unsigned int action = ata_eh_dev_action(dev); 2969 unsigned int readid_flags = 0; 2970 2971 if (ehc->i.flags & ATA_EHI_DID_RESET) 2972 readid_flags |= ATA_READID_POSTRESET; 2973 2974 if ((action & ATA_EH_REVALIDATE) && ata_dev_enabled(dev)) { 2975 WARN_ON(dev->class == ATA_DEV_PMP); 2976 2977 if (ata_phys_link_offline(ata_dev_phys_link(dev))) { 2978 rc = -EIO; 2979 goto err; 2980 } 2981 2982 ata_eh_about_to_do(link, dev, ATA_EH_REVALIDATE); 2983 rc = ata_dev_revalidate(dev, ehc->classes[dev->devno], 2984 readid_flags); 2985 if (rc) 2986 goto err; 2987 2988 ata_eh_done(link, dev, ATA_EH_REVALIDATE); 2989 2990 /* Configuration may have changed, reconfigure 2991 * transfer mode. 2992 */ 2993 ehc->i.flags |= ATA_EHI_SETMODE; 2994 2995 /* schedule the scsi_rescan_device() here */ 2996 schedule_work(&(ap->scsi_rescan_task)); 2997 } else if (dev->class == ATA_DEV_UNKNOWN && 2998 ehc->tries[dev->devno] && 2999 ata_class_enabled(ehc->classes[dev->devno])) { 3000 /* Temporarily set dev->class, it will be 3001 * permanently set once all configurations are 3002 * complete. This is necessary because new 3003 * device configuration is done in two 3004 * separate loops. 3005 */ 3006 dev->class = ehc->classes[dev->devno]; 3007 3008 if (dev->class == ATA_DEV_PMP) 3009 rc = sata_pmp_attach(dev); 3010 else 3011 rc = ata_dev_read_id(dev, &dev->class, 3012 readid_flags, dev->id); 3013 3014 /* read_id might have changed class, store and reset */ 3015 ehc->classes[dev->devno] = dev->class; 3016 dev->class = ATA_DEV_UNKNOWN; 3017 3018 switch (rc) { 3019 case 0: 3020 /* clear error info accumulated during probe */ 3021 ata_ering_clear(&dev->ering); 3022 new_mask |= 1 << dev->devno; 3023 break; 3024 case -ENOENT: 3025 /* IDENTIFY was issued to non-existent 3026 * device. No need to reset. Just 3027 * thaw and ignore the device. 3028 */ 3029 ata_eh_thaw_port(ap); 3030 break; 3031 default: 3032 goto err; 3033 } 3034 } 3035 } 3036 3037 /* PDIAG- should have been released, ask cable type if post-reset */ 3038 if ((ehc->i.flags & ATA_EHI_DID_RESET) && ata_is_host_link(link)) { 3039 if (ap->ops->cable_detect) 3040 ap->cbl = ap->ops->cable_detect(ap); 3041 ata_force_cbl(ap); 3042 } 3043 3044 /* Configure new devices forward such that user doesn't see 3045 * device detection messages backwards. 3046 */ 3047 ata_for_each_dev(dev, link, ALL) { 3048 if (!(new_mask & (1 << dev->devno))) 3049 continue; 3050 3051 dev->class = ehc->classes[dev->devno]; 3052 3053 if (dev->class == ATA_DEV_PMP) 3054 continue; 3055 3056 ehc->i.flags |= ATA_EHI_PRINTINFO; 3057 rc = ata_dev_configure(dev); 3058 ehc->i.flags &= ~ATA_EHI_PRINTINFO; 3059 if (rc) { 3060 dev->class = ATA_DEV_UNKNOWN; 3061 goto err; 3062 } 3063 3064 spin_lock_irqsave(ap->lock, flags); 3065 ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG; 3066 spin_unlock_irqrestore(ap->lock, flags); 3067 3068 /* new device discovered, configure xfermode */ 3069 ehc->i.flags |= ATA_EHI_SETMODE; 3070 } 3071 3072 return 0; 3073 3074 err: 3075 *r_failed_dev = dev; 3076 DPRINTK("EXIT rc=%d\n", rc); 3077 return rc; 3078 } 3079 3080 /** 3081 * ata_set_mode - Program timings and issue SET FEATURES - XFER 3082 * @link: link on which timings will be programmed 3083 * @r_failed_dev: out parameter for failed device 3084 * 3085 * Set ATA device disk transfer mode (PIO3, UDMA6, etc.). If 3086 * ata_set_mode() fails, pointer to the failing device is 3087 * returned in @r_failed_dev. 3088 * 3089 * LOCKING: 3090 * PCI/etc. bus probe sem. 3091 * 3092 * RETURNS: 3093 * 0 on success, negative errno otherwise 3094 */ 3095 int ata_set_mode(struct ata_link *link, struct ata_device **r_failed_dev) 3096 { 3097 struct ata_port *ap = link->ap; 3098 struct ata_device *dev; 3099 int rc; 3100 3101 /* if data transfer is verified, clear DUBIOUS_XFER on ering top */ 3102 ata_for_each_dev(dev, link, ENABLED) { 3103 if (!(dev->flags & ATA_DFLAG_DUBIOUS_XFER)) { 3104 struct ata_ering_entry *ent; 3105 3106 ent = ata_ering_top(&dev->ering); 3107 if (ent) 3108 ent->eflags &= ~ATA_EFLAG_DUBIOUS_XFER; 3109 } 3110 } 3111 3112 /* has private set_mode? */ 3113 if (ap->ops->set_mode) 3114 rc = ap->ops->set_mode(link, r_failed_dev); 3115 else 3116 rc = ata_do_set_mode(link, r_failed_dev); 3117 3118 /* if transfer mode has changed, set DUBIOUS_XFER on device */ 3119 ata_for_each_dev(dev, link, ENABLED) { 3120 struct ata_eh_context *ehc = &link->eh_context; 3121 u8 saved_xfer_mode = ehc->saved_xfer_mode[dev->devno]; 3122 u8 saved_ncq = !!(ehc->saved_ncq_enabled & (1 << dev->devno)); 3123 3124 if (dev->xfer_mode != saved_xfer_mode || 3125 ata_ncq_enabled(dev) != saved_ncq) 3126 dev->flags |= ATA_DFLAG_DUBIOUS_XFER; 3127 } 3128 3129 return rc; 3130 } 3131 3132 /** 3133 * atapi_eh_clear_ua - Clear ATAPI UNIT ATTENTION after reset 3134 * @dev: ATAPI device to clear UA for 3135 * 3136 * Resets and other operations can make an ATAPI device raise 3137 * UNIT ATTENTION which causes the next operation to fail. This 3138 * function clears UA. 3139 * 3140 * LOCKING: 3141 * EH context (may sleep). 3142 * 3143 * RETURNS: 3144 * 0 on success, -errno on failure. 3145 */ 3146 static int atapi_eh_clear_ua(struct ata_device *dev) 3147 { 3148 int i; 3149 3150 for (i = 0; i < ATA_EH_UA_TRIES; i++) { 3151 u8 *sense_buffer = dev->link->ap->sector_buf; 3152 u8 sense_key = 0; 3153 unsigned int err_mask; 3154 3155 err_mask = atapi_eh_tur(dev, &sense_key); 3156 if (err_mask != 0 && err_mask != AC_ERR_DEV) { 3157 ata_dev_printk(dev, KERN_WARNING, "TEST_UNIT_READY " 3158 "failed (err_mask=0x%x)\n", err_mask); 3159 return -EIO; 3160 } 3161 3162 if (!err_mask || sense_key != UNIT_ATTENTION) 3163 return 0; 3164 3165 err_mask = atapi_eh_request_sense(dev, sense_buffer, sense_key); 3166 if (err_mask) { 3167 ata_dev_printk(dev, KERN_WARNING, "failed to clear " 3168 "UNIT ATTENTION (err_mask=0x%x)\n", err_mask); 3169 return -EIO; 3170 } 3171 } 3172 3173 ata_dev_printk(dev, KERN_WARNING, 3174 "UNIT ATTENTION persists after %d tries\n", ATA_EH_UA_TRIES); 3175 3176 return 0; 3177 } 3178 3179 /** 3180 * ata_eh_maybe_retry_flush - Retry FLUSH if necessary 3181 * @dev: ATA device which may need FLUSH retry 3182 * 3183 * If @dev failed FLUSH, it needs to be reported upper layer 3184 * immediately as it means that @dev failed to remap and already 3185 * lost at least a sector and further FLUSH retrials won't make 3186 * any difference to the lost sector. However, if FLUSH failed 3187 * for other reasons, for example transmission error, FLUSH needs 3188 * to be retried. 3189 * 3190 * This function determines whether FLUSH failure retry is 3191 * necessary and performs it if so. 3192 * 3193 * RETURNS: 3194 * 0 if EH can continue, -errno if EH needs to be repeated. 3195 */ 3196 static int ata_eh_maybe_retry_flush(struct ata_device *dev) 3197 { 3198 struct ata_link *link = dev->link; 3199 struct ata_port *ap = link->ap; 3200 struct ata_queued_cmd *qc; 3201 struct ata_taskfile tf; 3202 unsigned int err_mask; 3203 int rc = 0; 3204 3205 /* did flush fail for this device? */ 3206 if (!ata_tag_valid(link->active_tag)) 3207 return 0; 3208 3209 qc = __ata_qc_from_tag(ap, link->active_tag); 3210 if (qc->dev != dev || (qc->tf.command != ATA_CMD_FLUSH_EXT && 3211 qc->tf.command != ATA_CMD_FLUSH)) 3212 return 0; 3213 3214 /* if the device failed it, it should be reported to upper layers */ 3215 if (qc->err_mask & AC_ERR_DEV) 3216 return 0; 3217 3218 /* flush failed for some other reason, give it another shot */ 3219 ata_tf_init(dev, &tf); 3220 3221 tf.command = qc->tf.command; 3222 tf.flags |= ATA_TFLAG_DEVICE; 3223 tf.protocol = ATA_PROT_NODATA; 3224 3225 ata_dev_printk(dev, KERN_WARNING, "retrying FLUSH 0x%x Emask 0x%x\n", 3226 tf.command, qc->err_mask); 3227 3228 err_mask = ata_exec_internal(dev, &tf, NULL, DMA_NONE, NULL, 0, 0); 3229 if (!err_mask) { 3230 /* 3231 * FLUSH is complete but there's no way to 3232 * successfully complete a failed command from EH. 3233 * Making sure retry is allowed at least once and 3234 * retrying it should do the trick - whatever was in 3235 * the cache is already on the platter and this won't 3236 * cause infinite loop. 3237 */ 3238 qc->scsicmd->allowed = max(qc->scsicmd->allowed, 1); 3239 } else { 3240 ata_dev_printk(dev, KERN_WARNING, "FLUSH failed Emask 0x%x\n", 3241 err_mask); 3242 rc = -EIO; 3243 3244 /* if device failed it, report it to upper layers */ 3245 if (err_mask & AC_ERR_DEV) { 3246 qc->err_mask |= AC_ERR_DEV; 3247 qc->result_tf = tf; 3248 if (!(ap->pflags & ATA_PFLAG_FROZEN)) 3249 rc = 0; 3250 } 3251 } 3252 return rc; 3253 } 3254 3255 /** 3256 * ata_eh_set_lpm - configure SATA interface power management 3257 * @link: link to configure power management 3258 * @policy: the link power management policy 3259 * @r_failed_dev: out parameter for failed device 3260 * 3261 * Enable SATA Interface power management. This will enable 3262 * Device Interface Power Management (DIPM) for min_power 3263 * policy, and then call driver specific callbacks for 3264 * enabling Host Initiated Power management. 3265 * 3266 * LOCKING: 3267 * EH context. 3268 * 3269 * RETURNS: 3270 * 0 on success, -errno on failure. 3271 */ 3272 static int ata_eh_set_lpm(struct ata_link *link, enum ata_lpm_policy policy, 3273 struct ata_device **r_failed_dev) 3274 { 3275 struct ata_port *ap = ata_is_host_link(link) ? link->ap : NULL; 3276 struct ata_eh_context *ehc = &link->eh_context; 3277 struct ata_device *dev, *link_dev = NULL, *lpm_dev = NULL; 3278 enum ata_lpm_policy old_policy = link->lpm_policy; 3279 unsigned int hints = ATA_LPM_EMPTY | ATA_LPM_HIPM; 3280 unsigned int err_mask; 3281 int rc; 3282 3283 /* if the link or host doesn't do LPM, noop */ 3284 if ((link->flags & ATA_LFLAG_NO_LPM) || (ap && !ap->ops->set_lpm)) 3285 return 0; 3286 3287 /* 3288 * DIPM is enabled only for MIN_POWER as some devices 3289 * misbehave when the host NACKs transition to SLUMBER. Order 3290 * device and link configurations such that the host always 3291 * allows DIPM requests. 3292 */ 3293 ata_for_each_dev(dev, link, ENABLED) { 3294 bool hipm = ata_id_has_hipm(dev->id); 3295 bool dipm = ata_id_has_dipm(dev->id); 3296 3297 /* find the first enabled and LPM enabled devices */ 3298 if (!link_dev) 3299 link_dev = dev; 3300 3301 if (!lpm_dev && (hipm || dipm)) 3302 lpm_dev = dev; 3303 3304 hints &= ~ATA_LPM_EMPTY; 3305 if (!hipm) 3306 hints &= ~ATA_LPM_HIPM; 3307 3308 /* disable DIPM before changing link config */ 3309 if (policy != ATA_LPM_MIN_POWER && dipm) { 3310 err_mask = ata_dev_set_feature(dev, 3311 SETFEATURES_SATA_DISABLE, SATA_DIPM); 3312 if (err_mask && err_mask != AC_ERR_DEV) { 3313 ata_dev_printk(dev, KERN_WARNING, 3314 "failed to disable DIPM, Emask 0x%x\n", 3315 err_mask); 3316 rc = -EIO; 3317 goto fail; 3318 } 3319 } 3320 } 3321 3322 if (ap) { 3323 rc = ap->ops->set_lpm(link, policy, hints); 3324 if (!rc && ap->slave_link) 3325 rc = ap->ops->set_lpm(ap->slave_link, policy, hints); 3326 } else 3327 rc = sata_pmp_set_lpm(link, policy, hints); 3328 3329 /* 3330 * Attribute link config failure to the first (LPM) enabled 3331 * device on the link. 3332 */ 3333 if (rc) { 3334 if (rc == -EOPNOTSUPP) { 3335 link->flags |= ATA_LFLAG_NO_LPM; 3336 return 0; 3337 } 3338 dev = lpm_dev ? lpm_dev : link_dev; 3339 goto fail; 3340 } 3341 3342 /* 3343 * Low level driver acked the transition. Issue DIPM command 3344 * with the new policy set. 3345 */ 3346 link->lpm_policy = policy; 3347 if (ap && ap->slave_link) 3348 ap->slave_link->lpm_policy = policy; 3349 3350 /* host config updated, enable DIPM if transitioning to MIN_POWER */ 3351 ata_for_each_dev(dev, link, ENABLED) { 3352 if (policy == ATA_LPM_MIN_POWER && ata_id_has_dipm(dev->id)) { 3353 err_mask = ata_dev_set_feature(dev, 3354 SETFEATURES_SATA_ENABLE, SATA_DIPM); 3355 if (err_mask && err_mask != AC_ERR_DEV) { 3356 ata_dev_printk(dev, KERN_WARNING, 3357 "failed to enable DIPM, Emask 0x%x\n", 3358 err_mask); 3359 rc = -EIO; 3360 goto fail; 3361 } 3362 } 3363 } 3364 3365 return 0; 3366 3367 fail: 3368 /* restore the old policy */ 3369 link->lpm_policy = old_policy; 3370 if (ap && ap->slave_link) 3371 ap->slave_link->lpm_policy = old_policy; 3372 3373 /* if no device or only one more chance is left, disable LPM */ 3374 if (!dev || ehc->tries[dev->devno] <= 2) { 3375 ata_link_printk(link, KERN_WARNING, 3376 "disabling LPM on the link\n"); 3377 link->flags |= ATA_LFLAG_NO_LPM; 3378 } 3379 if (r_failed_dev) 3380 *r_failed_dev = dev; 3381 return rc; 3382 } 3383 3384 static int ata_link_nr_enabled(struct ata_link *link) 3385 { 3386 struct ata_device *dev; 3387 int cnt = 0; 3388 3389 ata_for_each_dev(dev, link, ENABLED) 3390 cnt++; 3391 return cnt; 3392 } 3393 3394 static int ata_link_nr_vacant(struct ata_link *link) 3395 { 3396 struct ata_device *dev; 3397 int cnt = 0; 3398 3399 ata_for_each_dev(dev, link, ALL) 3400 if (dev->class == ATA_DEV_UNKNOWN) 3401 cnt++; 3402 return cnt; 3403 } 3404 3405 static int ata_eh_skip_recovery(struct ata_link *link) 3406 { 3407 struct ata_port *ap = link->ap; 3408 struct ata_eh_context *ehc = &link->eh_context; 3409 struct ata_device *dev; 3410 3411 /* skip disabled links */ 3412 if (link->flags & ATA_LFLAG_DISABLED) 3413 return 1; 3414 3415 /* skip if explicitly requested */ 3416 if (ehc->i.flags & ATA_EHI_NO_RECOVERY) 3417 return 1; 3418 3419 /* thaw frozen port and recover failed devices */ 3420 if ((ap->pflags & ATA_PFLAG_FROZEN) || ata_link_nr_enabled(link)) 3421 return 0; 3422 3423 /* reset at least once if reset is requested */ 3424 if ((ehc->i.action & ATA_EH_RESET) && 3425 !(ehc->i.flags & ATA_EHI_DID_RESET)) 3426 return 0; 3427 3428 /* skip if class codes for all vacant slots are ATA_DEV_NONE */ 3429 ata_for_each_dev(dev, link, ALL) { 3430 if (dev->class == ATA_DEV_UNKNOWN && 3431 ehc->classes[dev->devno] != ATA_DEV_NONE) 3432 return 0; 3433 } 3434 3435 return 1; 3436 } 3437 3438 static int ata_count_probe_trials_cb(struct ata_ering_entry *ent, void *void_arg) 3439 { 3440 u64 interval = msecs_to_jiffies(ATA_EH_PROBE_TRIAL_INTERVAL); 3441 u64 now = get_jiffies_64(); 3442 int *trials = void_arg; 3443 3444 if (ent->timestamp < now - min(now, interval)) 3445 return -1; 3446 3447 (*trials)++; 3448 return 0; 3449 } 3450 3451 static int ata_eh_schedule_probe(struct ata_device *dev) 3452 { 3453 struct ata_eh_context *ehc = &dev->link->eh_context; 3454 struct ata_link *link = ata_dev_phys_link(dev); 3455 int trials = 0; 3456 3457 if (!(ehc->i.probe_mask & (1 << dev->devno)) || 3458 (ehc->did_probe_mask & (1 << dev->devno))) 3459 return 0; 3460 3461 ata_eh_detach_dev(dev); 3462 ata_dev_init(dev); 3463 ehc->did_probe_mask |= (1 << dev->devno); 3464 ehc->i.action |= ATA_EH_RESET; 3465 ehc->saved_xfer_mode[dev->devno] = 0; 3466 ehc->saved_ncq_enabled &= ~(1 << dev->devno); 3467 3468 /* the link maybe in a deep sleep, wake it up */ 3469 if (link->lpm_policy > ATA_LPM_MAX_POWER) { 3470 if (ata_is_host_link(link)) 3471 link->ap->ops->set_lpm(link, ATA_LPM_MAX_POWER, 3472 ATA_LPM_EMPTY); 3473 else 3474 sata_pmp_set_lpm(link, ATA_LPM_MAX_POWER, 3475 ATA_LPM_EMPTY); 3476 } 3477 3478 /* Record and count probe trials on the ering. The specific 3479 * error mask used is irrelevant. Because a successful device 3480 * detection clears the ering, this count accumulates only if 3481 * there are consecutive failed probes. 3482 * 3483 * If the count is equal to or higher than ATA_EH_PROBE_TRIALS 3484 * in the last ATA_EH_PROBE_TRIAL_INTERVAL, link speed is 3485 * forced to 1.5Gbps. 3486 * 3487 * This is to work around cases where failed link speed 3488 * negotiation results in device misdetection leading to 3489 * infinite DEVXCHG or PHRDY CHG events. 3490 */ 3491 ata_ering_record(&dev->ering, 0, AC_ERR_OTHER); 3492 ata_ering_map(&dev->ering, ata_count_probe_trials_cb, &trials); 3493 3494 if (trials > ATA_EH_PROBE_TRIALS) 3495 sata_down_spd_limit(link, 1); 3496 3497 return 1; 3498 } 3499 3500 static int ata_eh_handle_dev_fail(struct ata_device *dev, int err) 3501 { 3502 struct ata_eh_context *ehc = &dev->link->eh_context; 3503 3504 /* -EAGAIN from EH routine indicates retry without prejudice. 3505 * The requester is responsible for ensuring forward progress. 3506 */ 3507 if (err != -EAGAIN) 3508 ehc->tries[dev->devno]--; 3509 3510 switch (err) { 3511 case -ENODEV: 3512 /* device missing or wrong IDENTIFY data, schedule probing */ 3513 ehc->i.probe_mask |= (1 << dev->devno); 3514 case -EINVAL: 3515 /* give it just one more chance */ 3516 ehc->tries[dev->devno] = min(ehc->tries[dev->devno], 1); 3517 case -EIO: 3518 if (ehc->tries[dev->devno] == 1) { 3519 /* This is the last chance, better to slow 3520 * down than lose it. 3521 */ 3522 sata_down_spd_limit(ata_dev_phys_link(dev), 0); 3523 if (dev->pio_mode > XFER_PIO_0) 3524 ata_down_xfermask_limit(dev, ATA_DNXFER_PIO); 3525 } 3526 } 3527 3528 if (ata_dev_enabled(dev) && !ehc->tries[dev->devno]) { 3529 /* disable device if it has used up all its chances */ 3530 ata_dev_disable(dev); 3531 3532 /* detach if offline */ 3533 if (ata_phys_link_offline(ata_dev_phys_link(dev))) 3534 ata_eh_detach_dev(dev); 3535 3536 /* schedule probe if necessary */ 3537 if (ata_eh_schedule_probe(dev)) { 3538 ehc->tries[dev->devno] = ATA_EH_DEV_TRIES; 3539 memset(ehc->cmd_timeout_idx[dev->devno], 0, 3540 sizeof(ehc->cmd_timeout_idx[dev->devno])); 3541 } 3542 3543 return 1; 3544 } else { 3545 ehc->i.action |= ATA_EH_RESET; 3546 return 0; 3547 } 3548 } 3549 3550 /** 3551 * ata_eh_recover - recover host port after error 3552 * @ap: host port to recover 3553 * @prereset: prereset method (can be NULL) 3554 * @softreset: softreset method (can be NULL) 3555 * @hardreset: hardreset method (can be NULL) 3556 * @postreset: postreset method (can be NULL) 3557 * @r_failed_link: out parameter for failed link 3558 * 3559 * This is the alpha and omega, eum and yang, heart and soul of 3560 * libata exception handling. On entry, actions required to 3561 * recover each link and hotplug requests are recorded in the 3562 * link's eh_context. This function executes all the operations 3563 * with appropriate retrials and fallbacks to resurrect failed 3564 * devices, detach goners and greet newcomers. 3565 * 3566 * LOCKING: 3567 * Kernel thread context (may sleep). 3568 * 3569 * RETURNS: 3570 * 0 on success, -errno on failure. 3571 */ 3572 int ata_eh_recover(struct ata_port *ap, ata_prereset_fn_t prereset, 3573 ata_reset_fn_t softreset, ata_reset_fn_t hardreset, 3574 ata_postreset_fn_t postreset, 3575 struct ata_link **r_failed_link) 3576 { 3577 struct ata_link *link; 3578 struct ata_device *dev; 3579 int rc, nr_fails; 3580 unsigned long flags, deadline; 3581 3582 DPRINTK("ENTER\n"); 3583 3584 /* prep for recovery */ 3585 ata_for_each_link(link, ap, EDGE) { 3586 struct ata_eh_context *ehc = &link->eh_context; 3587 3588 /* re-enable link? */ 3589 if (ehc->i.action & ATA_EH_ENABLE_LINK) { 3590 ata_eh_about_to_do(link, NULL, ATA_EH_ENABLE_LINK); 3591 spin_lock_irqsave(ap->lock, flags); 3592 link->flags &= ~ATA_LFLAG_DISABLED; 3593 spin_unlock_irqrestore(ap->lock, flags); 3594 ata_eh_done(link, NULL, ATA_EH_ENABLE_LINK); 3595 } 3596 3597 ata_for_each_dev(dev, link, ALL) { 3598 if (link->flags & ATA_LFLAG_NO_RETRY) 3599 ehc->tries[dev->devno] = 1; 3600 else 3601 ehc->tries[dev->devno] = ATA_EH_DEV_TRIES; 3602 3603 /* collect port action mask recorded in dev actions */ 3604 ehc->i.action |= ehc->i.dev_action[dev->devno] & 3605 ~ATA_EH_PERDEV_MASK; 3606 ehc->i.dev_action[dev->devno] &= ATA_EH_PERDEV_MASK; 3607 3608 /* process hotplug request */ 3609 if (dev->flags & ATA_DFLAG_DETACH) 3610 ata_eh_detach_dev(dev); 3611 3612 /* schedule probe if necessary */ 3613 if (!ata_dev_enabled(dev)) 3614 ata_eh_schedule_probe(dev); 3615 } 3616 } 3617 3618 retry: 3619 rc = 0; 3620 3621 /* if UNLOADING, finish immediately */ 3622 if (ap->pflags & ATA_PFLAG_UNLOADING) 3623 goto out; 3624 3625 /* prep for EH */ 3626 ata_for_each_link(link, ap, EDGE) { 3627 struct ata_eh_context *ehc = &link->eh_context; 3628 3629 /* skip EH if possible. */ 3630 if (ata_eh_skip_recovery(link)) 3631 ehc->i.action = 0; 3632 3633 ata_for_each_dev(dev, link, ALL) 3634 ehc->classes[dev->devno] = ATA_DEV_UNKNOWN; 3635 } 3636 3637 /* reset */ 3638 ata_for_each_link(link, ap, EDGE) { 3639 struct ata_eh_context *ehc = &link->eh_context; 3640 3641 if (!(ehc->i.action & ATA_EH_RESET)) 3642 continue; 3643 3644 rc = ata_eh_reset(link, ata_link_nr_vacant(link), 3645 prereset, softreset, hardreset, postreset); 3646 if (rc) { 3647 ata_link_printk(link, KERN_ERR, 3648 "reset failed, giving up\n"); 3649 goto out; 3650 } 3651 } 3652 3653 do { 3654 unsigned long now; 3655 3656 /* 3657 * clears ATA_EH_PARK in eh_info and resets 3658 * ap->park_req_pending 3659 */ 3660 ata_eh_pull_park_action(ap); 3661 3662 deadline = jiffies; 3663 ata_for_each_link(link, ap, EDGE) { 3664 ata_for_each_dev(dev, link, ALL) { 3665 struct ata_eh_context *ehc = &link->eh_context; 3666 unsigned long tmp; 3667 3668 if (dev->class != ATA_DEV_ATA) 3669 continue; 3670 if (!(ehc->i.dev_action[dev->devno] & 3671 ATA_EH_PARK)) 3672 continue; 3673 tmp = dev->unpark_deadline; 3674 if (time_before(deadline, tmp)) 3675 deadline = tmp; 3676 else if (time_before_eq(tmp, jiffies)) 3677 continue; 3678 if (ehc->unloaded_mask & (1 << dev->devno)) 3679 continue; 3680 3681 ata_eh_park_issue_cmd(dev, 1); 3682 } 3683 } 3684 3685 now = jiffies; 3686 if (time_before_eq(deadline, now)) 3687 break; 3688 3689 ata_eh_release(ap); 3690 deadline = wait_for_completion_timeout(&ap->park_req_pending, 3691 deadline - now); 3692 ata_eh_acquire(ap); 3693 } while (deadline); 3694 ata_for_each_link(link, ap, EDGE) { 3695 ata_for_each_dev(dev, link, ALL) { 3696 if (!(link->eh_context.unloaded_mask & 3697 (1 << dev->devno))) 3698 continue; 3699 3700 ata_eh_park_issue_cmd(dev, 0); 3701 ata_eh_done(link, dev, ATA_EH_PARK); 3702 } 3703 } 3704 3705 /* the rest */ 3706 nr_fails = 0; 3707 ata_for_each_link(link, ap, PMP_FIRST) { 3708 struct ata_eh_context *ehc = &link->eh_context; 3709 3710 if (sata_pmp_attached(ap) && ata_is_host_link(link)) 3711 goto config_lpm; 3712 3713 /* revalidate existing devices and attach new ones */ 3714 rc = ata_eh_revalidate_and_attach(link, &dev); 3715 if (rc) 3716 goto rest_fail; 3717 3718 /* if PMP got attached, return, pmp EH will take care of it */ 3719 if (link->device->class == ATA_DEV_PMP) { 3720 ehc->i.action = 0; 3721 return 0; 3722 } 3723 3724 /* configure transfer mode if necessary */ 3725 if (ehc->i.flags & ATA_EHI_SETMODE) { 3726 rc = ata_set_mode(link, &dev); 3727 if (rc) 3728 goto rest_fail; 3729 ehc->i.flags &= ~ATA_EHI_SETMODE; 3730 } 3731 3732 /* If reset has been issued, clear UA to avoid 3733 * disrupting the current users of the device. 3734 */ 3735 if (ehc->i.flags & ATA_EHI_DID_RESET) { 3736 ata_for_each_dev(dev, link, ALL) { 3737 if (dev->class != ATA_DEV_ATAPI) 3738 continue; 3739 rc = atapi_eh_clear_ua(dev); 3740 if (rc) 3741 goto rest_fail; 3742 } 3743 } 3744 3745 /* retry flush if necessary */ 3746 ata_for_each_dev(dev, link, ALL) { 3747 if (dev->class != ATA_DEV_ATA) 3748 continue; 3749 rc = ata_eh_maybe_retry_flush(dev); 3750 if (rc) 3751 goto rest_fail; 3752 } 3753 3754 config_lpm: 3755 /* configure link power saving */ 3756 if (link->lpm_policy != ap->target_lpm_policy) { 3757 rc = ata_eh_set_lpm(link, ap->target_lpm_policy, &dev); 3758 if (rc) 3759 goto rest_fail; 3760 } 3761 3762 /* this link is okay now */ 3763 ehc->i.flags = 0; 3764 continue; 3765 3766 rest_fail: 3767 nr_fails++; 3768 if (dev) 3769 ata_eh_handle_dev_fail(dev, rc); 3770 3771 if (ap->pflags & ATA_PFLAG_FROZEN) { 3772 /* PMP reset requires working host port. 3773 * Can't retry if it's frozen. 3774 */ 3775 if (sata_pmp_attached(ap)) 3776 goto out; 3777 break; 3778 } 3779 } 3780 3781 if (nr_fails) 3782 goto retry; 3783 3784 out: 3785 if (rc && r_failed_link) 3786 *r_failed_link = link; 3787 3788 DPRINTK("EXIT, rc=%d\n", rc); 3789 return rc; 3790 } 3791 3792 /** 3793 * ata_eh_finish - finish up EH 3794 * @ap: host port to finish EH for 3795 * 3796 * Recovery is complete. Clean up EH states and retry or finish 3797 * failed qcs. 3798 * 3799 * LOCKING: 3800 * None. 3801 */ 3802 void ata_eh_finish(struct ata_port *ap) 3803 { 3804 int tag; 3805 3806 /* retry or finish qcs */ 3807 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 3808 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 3809 3810 if (!(qc->flags & ATA_QCFLAG_FAILED)) 3811 continue; 3812 3813 if (qc->err_mask) { 3814 /* FIXME: Once EH migration is complete, 3815 * generate sense data in this function, 3816 * considering both err_mask and tf. 3817 */ 3818 if (qc->flags & ATA_QCFLAG_RETRY) 3819 ata_eh_qc_retry(qc); 3820 else 3821 ata_eh_qc_complete(qc); 3822 } else { 3823 if (qc->flags & ATA_QCFLAG_SENSE_VALID) { 3824 ata_eh_qc_complete(qc); 3825 } else { 3826 /* feed zero TF to sense generation */ 3827 memset(&qc->result_tf, 0, sizeof(qc->result_tf)); 3828 ata_eh_qc_retry(qc); 3829 } 3830 } 3831 } 3832 3833 /* make sure nr_active_links is zero after EH */ 3834 WARN_ON(ap->nr_active_links); 3835 ap->nr_active_links = 0; 3836 } 3837 3838 /** 3839 * ata_do_eh - do standard error handling 3840 * @ap: host port to handle error for 3841 * 3842 * @prereset: prereset method (can be NULL) 3843 * @softreset: softreset method (can be NULL) 3844 * @hardreset: hardreset method (can be NULL) 3845 * @postreset: postreset method (can be NULL) 3846 * 3847 * Perform standard error handling sequence. 3848 * 3849 * LOCKING: 3850 * Kernel thread context (may sleep). 3851 */ 3852 void ata_do_eh(struct ata_port *ap, ata_prereset_fn_t prereset, 3853 ata_reset_fn_t softreset, ata_reset_fn_t hardreset, 3854 ata_postreset_fn_t postreset) 3855 { 3856 struct ata_device *dev; 3857 int rc; 3858 3859 ata_eh_autopsy(ap); 3860 ata_eh_report(ap); 3861 3862 rc = ata_eh_recover(ap, prereset, softreset, hardreset, postreset, 3863 NULL); 3864 if (rc) { 3865 ata_for_each_dev(dev, &ap->link, ALL) 3866 ata_dev_disable(dev); 3867 } 3868 3869 ata_eh_finish(ap); 3870 } 3871 3872 /** 3873 * ata_std_error_handler - standard error handler 3874 * @ap: host port to handle error for 3875 * 3876 * Standard error handler 3877 * 3878 * LOCKING: 3879 * Kernel thread context (may sleep). 3880 */ 3881 void ata_std_error_handler(struct ata_port *ap) 3882 { 3883 struct ata_port_operations *ops = ap->ops; 3884 ata_reset_fn_t hardreset = ops->hardreset; 3885 3886 /* ignore built-in hardreset if SCR access is not available */ 3887 if (hardreset == sata_std_hardreset && !sata_scr_valid(&ap->link)) 3888 hardreset = NULL; 3889 3890 ata_do_eh(ap, ops->prereset, ops->softreset, hardreset, ops->postreset); 3891 } 3892 3893 #ifdef CONFIG_PM 3894 /** 3895 * ata_eh_handle_port_suspend - perform port suspend operation 3896 * @ap: port to suspend 3897 * 3898 * Suspend @ap. 3899 * 3900 * LOCKING: 3901 * Kernel thread context (may sleep). 3902 */ 3903 static void ata_eh_handle_port_suspend(struct ata_port *ap) 3904 { 3905 unsigned long flags; 3906 int rc = 0; 3907 3908 /* are we suspending? */ 3909 spin_lock_irqsave(ap->lock, flags); 3910 if (!(ap->pflags & ATA_PFLAG_PM_PENDING) || 3911 ap->pm_mesg.event == PM_EVENT_ON) { 3912 spin_unlock_irqrestore(ap->lock, flags); 3913 return; 3914 } 3915 spin_unlock_irqrestore(ap->lock, flags); 3916 3917 WARN_ON(ap->pflags & ATA_PFLAG_SUSPENDED); 3918 3919 /* tell ACPI we're suspending */ 3920 rc = ata_acpi_on_suspend(ap); 3921 if (rc) 3922 goto out; 3923 3924 /* suspend */ 3925 ata_eh_freeze_port(ap); 3926 3927 if (ap->ops->port_suspend) 3928 rc = ap->ops->port_suspend(ap, ap->pm_mesg); 3929 3930 ata_acpi_set_state(ap, PMSG_SUSPEND); 3931 out: 3932 /* report result */ 3933 spin_lock_irqsave(ap->lock, flags); 3934 3935 ap->pflags &= ~ATA_PFLAG_PM_PENDING; 3936 if (rc == 0) 3937 ap->pflags |= ATA_PFLAG_SUSPENDED; 3938 else if (ap->pflags & ATA_PFLAG_FROZEN) 3939 ata_port_schedule_eh(ap); 3940 3941 if (ap->pm_result) { 3942 *ap->pm_result = rc; 3943 ap->pm_result = NULL; 3944 } 3945 3946 spin_unlock_irqrestore(ap->lock, flags); 3947 3948 return; 3949 } 3950 3951 /** 3952 * ata_eh_handle_port_resume - perform port resume operation 3953 * @ap: port to resume 3954 * 3955 * Resume @ap. 3956 * 3957 * LOCKING: 3958 * Kernel thread context (may sleep). 3959 */ 3960 static void ata_eh_handle_port_resume(struct ata_port *ap) 3961 { 3962 struct ata_link *link; 3963 struct ata_device *dev; 3964 unsigned long flags; 3965 int rc = 0; 3966 3967 /* are we resuming? */ 3968 spin_lock_irqsave(ap->lock, flags); 3969 if (!(ap->pflags & ATA_PFLAG_PM_PENDING) || 3970 ap->pm_mesg.event != PM_EVENT_ON) { 3971 spin_unlock_irqrestore(ap->lock, flags); 3972 return; 3973 } 3974 spin_unlock_irqrestore(ap->lock, flags); 3975 3976 WARN_ON(!(ap->pflags & ATA_PFLAG_SUSPENDED)); 3977 3978 /* 3979 * Error timestamps are in jiffies which doesn't run while 3980 * suspended and PHY events during resume isn't too uncommon. 3981 * When the two are combined, it can lead to unnecessary speed 3982 * downs if the machine is suspended and resumed repeatedly. 3983 * Clear error history. 3984 */ 3985 ata_for_each_link(link, ap, HOST_FIRST) 3986 ata_for_each_dev(dev, link, ALL) 3987 ata_ering_clear(&dev->ering); 3988 3989 ata_acpi_set_state(ap, PMSG_ON); 3990 3991 if (ap->ops->port_resume) 3992 rc = ap->ops->port_resume(ap); 3993 3994 /* tell ACPI that we're resuming */ 3995 ata_acpi_on_resume(ap); 3996 3997 /* report result */ 3998 spin_lock_irqsave(ap->lock, flags); 3999 ap->pflags &= ~(ATA_PFLAG_PM_PENDING | ATA_PFLAG_SUSPENDED); 4000 if (ap->pm_result) { 4001 *ap->pm_result = rc; 4002 ap->pm_result = NULL; 4003 } 4004 spin_unlock_irqrestore(ap->lock, flags); 4005 } 4006 #endif /* CONFIG_PM */ 4007