1 /* 2 * libata-eh.c - libata error handling 3 * 4 * Maintained by: Jeff Garzik <jgarzik@pobox.com> 5 * Please ALWAYS copy linux-ide@vger.kernel.org 6 * on emails. 7 * 8 * Copyright 2006 Tejun Heo <htejun@gmail.com> 9 * 10 * 11 * This program is free software; you can redistribute it and/or 12 * modify it under the terms of the GNU General Public License as 13 * published by the Free Software Foundation; either version 2, or 14 * (at your option) any later version. 15 * 16 * This program is distributed in the hope that it will be useful, 17 * but WITHOUT ANY WARRANTY; without even the implied warranty of 18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 19 * General Public License for more details. 20 * 21 * You should have received a copy of the GNU General Public License 22 * along with this program; see the file COPYING. If not, write to 23 * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, 24 * USA. 25 * 26 * 27 * libata documentation is available via 'make {ps|pdf}docs', 28 * as Documentation/DocBook/libata.* 29 * 30 * Hardware documentation available from http://www.t13.org/ and 31 * http://www.sata-io.org/ 32 * 33 */ 34 35 #include <linux/kernel.h> 36 #include <linux/blkdev.h> 37 #include <linux/pci.h> 38 #include <scsi/scsi.h> 39 #include <scsi/scsi_host.h> 40 #include <scsi/scsi_eh.h> 41 #include <scsi/scsi_device.h> 42 #include <scsi/scsi_cmnd.h> 43 #include <scsi/scsi_dbg.h> 44 #include "../scsi/scsi_transport_api.h" 45 46 #include <linux/libata.h> 47 48 #include "libata.h" 49 50 enum { 51 /* speed down verdicts */ 52 ATA_EH_SPDN_NCQ_OFF = (1 << 0), 53 ATA_EH_SPDN_SPEED_DOWN = (1 << 1), 54 ATA_EH_SPDN_FALLBACK_TO_PIO = (1 << 2), 55 ATA_EH_SPDN_KEEP_ERRORS = (1 << 3), 56 57 /* error flags */ 58 ATA_EFLAG_IS_IO = (1 << 0), 59 ATA_EFLAG_DUBIOUS_XFER = (1 << 1), 60 61 /* error categories */ 62 ATA_ECAT_NONE = 0, 63 ATA_ECAT_ATA_BUS = 1, 64 ATA_ECAT_TOUT_HSM = 2, 65 ATA_ECAT_UNK_DEV = 3, 66 ATA_ECAT_DUBIOUS_NONE = 4, 67 ATA_ECAT_DUBIOUS_ATA_BUS = 5, 68 ATA_ECAT_DUBIOUS_TOUT_HSM = 6, 69 ATA_ECAT_DUBIOUS_UNK_DEV = 7, 70 ATA_ECAT_NR = 8, 71 72 ATA_EH_CMD_DFL_TIMEOUT = 5000, 73 74 /* always put at least this amount of time between resets */ 75 ATA_EH_RESET_COOL_DOWN = 5000, 76 77 /* Waiting in ->prereset can never be reliable. It's 78 * sometimes nice to wait there but it can't be depended upon; 79 * otherwise, we wouldn't be resetting. Just give it enough 80 * time for most drives to spin up. 81 */ 82 ATA_EH_PRERESET_TIMEOUT = 10000, 83 ATA_EH_FASTDRAIN_INTERVAL = 3000, 84 85 ATA_EH_UA_TRIES = 5, 86 87 /* probe speed down parameters, see ata_eh_schedule_probe() */ 88 ATA_EH_PROBE_TRIAL_INTERVAL = 60000, /* 1 min */ 89 ATA_EH_PROBE_TRIALS = 2, 90 }; 91 92 /* The following table determines how we sequence resets. Each entry 93 * represents timeout for that try. The first try can be soft or 94 * hardreset. All others are hardreset if available. In most cases 95 * the first reset w/ 10sec timeout should succeed. Following entries 96 * are mostly for error handling, hotplug and retarded devices. 97 */ 98 static const unsigned long ata_eh_reset_timeouts[] = { 99 10000, /* most drives spin up by 10sec */ 100 10000, /* > 99% working drives spin up before 20sec */ 101 35000, /* give > 30 secs of idleness for retarded devices */ 102 5000, /* and sweet one last chance */ 103 ULONG_MAX, /* > 1 min has elapsed, give up */ 104 }; 105 106 static const unsigned long ata_eh_identify_timeouts[] = { 107 5000, /* covers > 99% of successes and not too boring on failures */ 108 10000, /* combined time till here is enough even for media access */ 109 30000, /* for true idiots */ 110 ULONG_MAX, 111 }; 112 113 static const unsigned long ata_eh_flush_timeouts[] = { 114 15000, /* be generous with flush */ 115 15000, /* ditto */ 116 30000, /* and even more generous */ 117 ULONG_MAX, 118 }; 119 120 static const unsigned long ata_eh_other_timeouts[] = { 121 5000, /* same rationale as identify timeout */ 122 10000, /* ditto */ 123 /* but no merciful 30sec for other commands, it just isn't worth it */ 124 ULONG_MAX, 125 }; 126 127 struct ata_eh_cmd_timeout_ent { 128 const u8 *commands; 129 const unsigned long *timeouts; 130 }; 131 132 /* The following table determines timeouts to use for EH internal 133 * commands. Each table entry is a command class and matches the 134 * commands the entry applies to and the timeout table to use. 135 * 136 * On the retry after a command timed out, the next timeout value from 137 * the table is used. If the table doesn't contain further entries, 138 * the last value is used. 139 * 140 * ehc->cmd_timeout_idx keeps track of which timeout to use per 141 * command class, so if SET_FEATURES times out on the first try, the 142 * next try will use the second timeout value only for that class. 143 */ 144 #define CMDS(cmds...) (const u8 []){ cmds, 0 } 145 static const struct ata_eh_cmd_timeout_ent 146 ata_eh_cmd_timeout_table[ATA_EH_CMD_TIMEOUT_TABLE_SIZE] = { 147 { .commands = CMDS(ATA_CMD_ID_ATA, ATA_CMD_ID_ATAPI), 148 .timeouts = ata_eh_identify_timeouts, }, 149 { .commands = CMDS(ATA_CMD_READ_NATIVE_MAX, ATA_CMD_READ_NATIVE_MAX_EXT), 150 .timeouts = ata_eh_other_timeouts, }, 151 { .commands = CMDS(ATA_CMD_SET_MAX, ATA_CMD_SET_MAX_EXT), 152 .timeouts = ata_eh_other_timeouts, }, 153 { .commands = CMDS(ATA_CMD_SET_FEATURES), 154 .timeouts = ata_eh_other_timeouts, }, 155 { .commands = CMDS(ATA_CMD_INIT_DEV_PARAMS), 156 .timeouts = ata_eh_other_timeouts, }, 157 { .commands = CMDS(ATA_CMD_FLUSH, ATA_CMD_FLUSH_EXT), 158 .timeouts = ata_eh_flush_timeouts }, 159 }; 160 #undef CMDS 161 162 static void __ata_port_freeze(struct ata_port *ap); 163 #ifdef CONFIG_PM 164 static void ata_eh_handle_port_suspend(struct ata_port *ap); 165 static void ata_eh_handle_port_resume(struct ata_port *ap); 166 #else /* CONFIG_PM */ 167 static void ata_eh_handle_port_suspend(struct ata_port *ap) 168 { } 169 170 static void ata_eh_handle_port_resume(struct ata_port *ap) 171 { } 172 #endif /* CONFIG_PM */ 173 174 static void __ata_ehi_pushv_desc(struct ata_eh_info *ehi, const char *fmt, 175 va_list args) 176 { 177 ehi->desc_len += vscnprintf(ehi->desc + ehi->desc_len, 178 ATA_EH_DESC_LEN - ehi->desc_len, 179 fmt, args); 180 } 181 182 /** 183 * __ata_ehi_push_desc - push error description without adding separator 184 * @ehi: target EHI 185 * @fmt: printf format string 186 * 187 * Format string according to @fmt and append it to @ehi->desc. 188 * 189 * LOCKING: 190 * spin_lock_irqsave(host lock) 191 */ 192 void __ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...) 193 { 194 va_list args; 195 196 va_start(args, fmt); 197 __ata_ehi_pushv_desc(ehi, fmt, args); 198 va_end(args); 199 } 200 201 /** 202 * ata_ehi_push_desc - push error description with separator 203 * @ehi: target EHI 204 * @fmt: printf format string 205 * 206 * Format string according to @fmt and append it to @ehi->desc. 207 * If @ehi->desc is not empty, ", " is added in-between. 208 * 209 * LOCKING: 210 * spin_lock_irqsave(host lock) 211 */ 212 void ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...) 213 { 214 va_list args; 215 216 if (ehi->desc_len) 217 __ata_ehi_push_desc(ehi, ", "); 218 219 va_start(args, fmt); 220 __ata_ehi_pushv_desc(ehi, fmt, args); 221 va_end(args); 222 } 223 224 /** 225 * ata_ehi_clear_desc - clean error description 226 * @ehi: target EHI 227 * 228 * Clear @ehi->desc. 229 * 230 * LOCKING: 231 * spin_lock_irqsave(host lock) 232 */ 233 void ata_ehi_clear_desc(struct ata_eh_info *ehi) 234 { 235 ehi->desc[0] = '\0'; 236 ehi->desc_len = 0; 237 } 238 239 /** 240 * ata_port_desc - append port description 241 * @ap: target ATA port 242 * @fmt: printf format string 243 * 244 * Format string according to @fmt and append it to port 245 * description. If port description is not empty, " " is added 246 * in-between. This function is to be used while initializing 247 * ata_host. The description is printed on host registration. 248 * 249 * LOCKING: 250 * None. 251 */ 252 void ata_port_desc(struct ata_port *ap, const char *fmt, ...) 253 { 254 va_list args; 255 256 WARN_ON(!(ap->pflags & ATA_PFLAG_INITIALIZING)); 257 258 if (ap->link.eh_info.desc_len) 259 __ata_ehi_push_desc(&ap->link.eh_info, " "); 260 261 va_start(args, fmt); 262 __ata_ehi_pushv_desc(&ap->link.eh_info, fmt, args); 263 va_end(args); 264 } 265 266 #ifdef CONFIG_PCI 267 268 /** 269 * ata_port_pbar_desc - append PCI BAR description 270 * @ap: target ATA port 271 * @bar: target PCI BAR 272 * @offset: offset into PCI BAR 273 * @name: name of the area 274 * 275 * If @offset is negative, this function formats a string which 276 * contains the name, address, size and type of the BAR and 277 * appends it to the port description. If @offset is zero or 278 * positive, only name and offsetted address is appended. 279 * 280 * LOCKING: 281 * None. 282 */ 283 void ata_port_pbar_desc(struct ata_port *ap, int bar, ssize_t offset, 284 const char *name) 285 { 286 struct pci_dev *pdev = to_pci_dev(ap->host->dev); 287 char *type = ""; 288 unsigned long long start, len; 289 290 if (pci_resource_flags(pdev, bar) & IORESOURCE_MEM) 291 type = "m"; 292 else if (pci_resource_flags(pdev, bar) & IORESOURCE_IO) 293 type = "i"; 294 295 start = (unsigned long long)pci_resource_start(pdev, bar); 296 len = (unsigned long long)pci_resource_len(pdev, bar); 297 298 if (offset < 0) 299 ata_port_desc(ap, "%s %s%llu@0x%llx", name, type, len, start); 300 else 301 ata_port_desc(ap, "%s 0x%llx", name, 302 start + (unsigned long long)offset); 303 } 304 305 #endif /* CONFIG_PCI */ 306 307 static int ata_lookup_timeout_table(u8 cmd) 308 { 309 int i; 310 311 for (i = 0; i < ATA_EH_CMD_TIMEOUT_TABLE_SIZE; i++) { 312 const u8 *cur; 313 314 for (cur = ata_eh_cmd_timeout_table[i].commands; *cur; cur++) 315 if (*cur == cmd) 316 return i; 317 } 318 319 return -1; 320 } 321 322 /** 323 * ata_internal_cmd_timeout - determine timeout for an internal command 324 * @dev: target device 325 * @cmd: internal command to be issued 326 * 327 * Determine timeout for internal command @cmd for @dev. 328 * 329 * LOCKING: 330 * EH context. 331 * 332 * RETURNS: 333 * Determined timeout. 334 */ 335 unsigned long ata_internal_cmd_timeout(struct ata_device *dev, u8 cmd) 336 { 337 struct ata_eh_context *ehc = &dev->link->eh_context; 338 int ent = ata_lookup_timeout_table(cmd); 339 int idx; 340 341 if (ent < 0) 342 return ATA_EH_CMD_DFL_TIMEOUT; 343 344 idx = ehc->cmd_timeout_idx[dev->devno][ent]; 345 return ata_eh_cmd_timeout_table[ent].timeouts[idx]; 346 } 347 348 /** 349 * ata_internal_cmd_timed_out - notification for internal command timeout 350 * @dev: target device 351 * @cmd: internal command which timed out 352 * 353 * Notify EH that internal command @cmd for @dev timed out. This 354 * function should be called only for commands whose timeouts are 355 * determined using ata_internal_cmd_timeout(). 356 * 357 * LOCKING: 358 * EH context. 359 */ 360 void ata_internal_cmd_timed_out(struct ata_device *dev, u8 cmd) 361 { 362 struct ata_eh_context *ehc = &dev->link->eh_context; 363 int ent = ata_lookup_timeout_table(cmd); 364 int idx; 365 366 if (ent < 0) 367 return; 368 369 idx = ehc->cmd_timeout_idx[dev->devno][ent]; 370 if (ata_eh_cmd_timeout_table[ent].timeouts[idx + 1] != ULONG_MAX) 371 ehc->cmd_timeout_idx[dev->devno][ent]++; 372 } 373 374 static void ata_ering_record(struct ata_ering *ering, unsigned int eflags, 375 unsigned int err_mask) 376 { 377 struct ata_ering_entry *ent; 378 379 WARN_ON(!err_mask); 380 381 ering->cursor++; 382 ering->cursor %= ATA_ERING_SIZE; 383 384 ent = &ering->ring[ering->cursor]; 385 ent->eflags = eflags; 386 ent->err_mask = err_mask; 387 ent->timestamp = get_jiffies_64(); 388 } 389 390 static struct ata_ering_entry *ata_ering_top(struct ata_ering *ering) 391 { 392 struct ata_ering_entry *ent = &ering->ring[ering->cursor]; 393 394 if (ent->err_mask) 395 return ent; 396 return NULL; 397 } 398 399 static void ata_ering_clear(struct ata_ering *ering) 400 { 401 memset(ering, 0, sizeof(*ering)); 402 } 403 404 static int ata_ering_map(struct ata_ering *ering, 405 int (*map_fn)(struct ata_ering_entry *, void *), 406 void *arg) 407 { 408 int idx, rc = 0; 409 struct ata_ering_entry *ent; 410 411 idx = ering->cursor; 412 do { 413 ent = &ering->ring[idx]; 414 if (!ent->err_mask) 415 break; 416 rc = map_fn(ent, arg); 417 if (rc) 418 break; 419 idx = (idx - 1 + ATA_ERING_SIZE) % ATA_ERING_SIZE; 420 } while (idx != ering->cursor); 421 422 return rc; 423 } 424 425 static unsigned int ata_eh_dev_action(struct ata_device *dev) 426 { 427 struct ata_eh_context *ehc = &dev->link->eh_context; 428 429 return ehc->i.action | ehc->i.dev_action[dev->devno]; 430 } 431 432 static void ata_eh_clear_action(struct ata_link *link, struct ata_device *dev, 433 struct ata_eh_info *ehi, unsigned int action) 434 { 435 struct ata_device *tdev; 436 437 if (!dev) { 438 ehi->action &= ~action; 439 ata_for_each_dev(tdev, link, ALL) 440 ehi->dev_action[tdev->devno] &= ~action; 441 } else { 442 /* doesn't make sense for port-wide EH actions */ 443 WARN_ON(!(action & ATA_EH_PERDEV_MASK)); 444 445 /* break ehi->action into ehi->dev_action */ 446 if (ehi->action & action) { 447 ata_for_each_dev(tdev, link, ALL) 448 ehi->dev_action[tdev->devno] |= 449 ehi->action & action; 450 ehi->action &= ~action; 451 } 452 453 /* turn off the specified per-dev action */ 454 ehi->dev_action[dev->devno] &= ~action; 455 } 456 } 457 458 /** 459 * ata_scsi_timed_out - SCSI layer time out callback 460 * @cmd: timed out SCSI command 461 * 462 * Handles SCSI layer timeout. We race with normal completion of 463 * the qc for @cmd. If the qc is already gone, we lose and let 464 * the scsi command finish (EH_HANDLED). Otherwise, the qc has 465 * timed out and EH should be invoked. Prevent ata_qc_complete() 466 * from finishing it by setting EH_SCHEDULED and return 467 * EH_NOT_HANDLED. 468 * 469 * TODO: kill this function once old EH is gone. 470 * 471 * LOCKING: 472 * Called from timer context 473 * 474 * RETURNS: 475 * EH_HANDLED or EH_NOT_HANDLED 476 */ 477 enum blk_eh_timer_return ata_scsi_timed_out(struct scsi_cmnd *cmd) 478 { 479 struct Scsi_Host *host = cmd->device->host; 480 struct ata_port *ap = ata_shost_to_port(host); 481 unsigned long flags; 482 struct ata_queued_cmd *qc; 483 enum blk_eh_timer_return ret; 484 485 DPRINTK("ENTER\n"); 486 487 if (ap->ops->error_handler) { 488 ret = BLK_EH_NOT_HANDLED; 489 goto out; 490 } 491 492 ret = BLK_EH_HANDLED; 493 spin_lock_irqsave(ap->lock, flags); 494 qc = ata_qc_from_tag(ap, ap->link.active_tag); 495 if (qc) { 496 WARN_ON(qc->scsicmd != cmd); 497 qc->flags |= ATA_QCFLAG_EH_SCHEDULED; 498 qc->err_mask |= AC_ERR_TIMEOUT; 499 ret = BLK_EH_NOT_HANDLED; 500 } 501 spin_unlock_irqrestore(ap->lock, flags); 502 503 out: 504 DPRINTK("EXIT, ret=%d\n", ret); 505 return ret; 506 } 507 508 static void ata_eh_unload(struct ata_port *ap) 509 { 510 struct ata_link *link; 511 struct ata_device *dev; 512 unsigned long flags; 513 514 /* Restore SControl IPM and SPD for the next driver and 515 * disable attached devices. 516 */ 517 ata_for_each_link(link, ap, PMP_FIRST) { 518 sata_scr_write(link, SCR_CONTROL, link->saved_scontrol & 0xff0); 519 ata_for_each_dev(dev, link, ALL) 520 ata_dev_disable(dev); 521 } 522 523 /* freeze and set UNLOADED */ 524 spin_lock_irqsave(ap->lock, flags); 525 526 ata_port_freeze(ap); /* won't be thawed */ 527 ap->pflags &= ~ATA_PFLAG_EH_PENDING; /* clear pending from freeze */ 528 ap->pflags |= ATA_PFLAG_UNLOADED; 529 530 spin_unlock_irqrestore(ap->lock, flags); 531 } 532 533 /** 534 * ata_scsi_error - SCSI layer error handler callback 535 * @host: SCSI host on which error occurred 536 * 537 * Handles SCSI-layer-thrown error events. 538 * 539 * LOCKING: 540 * Inherited from SCSI layer (none, can sleep) 541 * 542 * RETURNS: 543 * Zero. 544 */ 545 void ata_scsi_error(struct Scsi_Host *host) 546 { 547 struct ata_port *ap = ata_shost_to_port(host); 548 int i; 549 unsigned long flags; 550 551 DPRINTK("ENTER\n"); 552 553 /* synchronize with port task */ 554 ata_port_flush_task(ap); 555 556 /* synchronize with host lock and sort out timeouts */ 557 558 /* For new EH, all qcs are finished in one of three ways - 559 * normal completion, error completion, and SCSI timeout. 560 * Both completions can race against SCSI timeout. When normal 561 * completion wins, the qc never reaches EH. When error 562 * completion wins, the qc has ATA_QCFLAG_FAILED set. 563 * 564 * When SCSI timeout wins, things are a bit more complex. 565 * Normal or error completion can occur after the timeout but 566 * before this point. In such cases, both types of 567 * completions are honored. A scmd is determined to have 568 * timed out iff its associated qc is active and not failed. 569 */ 570 if (ap->ops->error_handler) { 571 struct scsi_cmnd *scmd, *tmp; 572 int nr_timedout = 0; 573 574 spin_lock_irqsave(ap->lock, flags); 575 576 /* This must occur under the ap->lock as we don't want 577 a polled recovery to race the real interrupt handler 578 579 The lost_interrupt handler checks for any completed but 580 non-notified command and completes much like an IRQ handler. 581 582 We then fall into the error recovery code which will treat 583 this as if normal completion won the race */ 584 585 if (ap->ops->lost_interrupt) 586 ap->ops->lost_interrupt(ap); 587 588 list_for_each_entry_safe(scmd, tmp, &host->eh_cmd_q, eh_entry) { 589 struct ata_queued_cmd *qc; 590 591 for (i = 0; i < ATA_MAX_QUEUE; i++) { 592 qc = __ata_qc_from_tag(ap, i); 593 if (qc->flags & ATA_QCFLAG_ACTIVE && 594 qc->scsicmd == scmd) 595 break; 596 } 597 598 if (i < ATA_MAX_QUEUE) { 599 /* the scmd has an associated qc */ 600 if (!(qc->flags & ATA_QCFLAG_FAILED)) { 601 /* which hasn't failed yet, timeout */ 602 qc->err_mask |= AC_ERR_TIMEOUT; 603 qc->flags |= ATA_QCFLAG_FAILED; 604 nr_timedout++; 605 } 606 } else { 607 /* Normal completion occurred after 608 * SCSI timeout but before this point. 609 * Successfully complete it. 610 */ 611 scmd->retries = scmd->allowed; 612 scsi_eh_finish_cmd(scmd, &ap->eh_done_q); 613 } 614 } 615 616 /* If we have timed out qcs. They belong to EH from 617 * this point but the state of the controller is 618 * unknown. Freeze the port to make sure the IRQ 619 * handler doesn't diddle with those qcs. This must 620 * be done atomically w.r.t. setting QCFLAG_FAILED. 621 */ 622 if (nr_timedout) 623 __ata_port_freeze(ap); 624 625 spin_unlock_irqrestore(ap->lock, flags); 626 627 /* initialize eh_tries */ 628 ap->eh_tries = ATA_EH_MAX_TRIES; 629 } else 630 spin_unlock_wait(ap->lock); 631 632 /* If we timed raced normal completion and there is nothing to 633 recover nr_timedout == 0 why exactly are we doing error recovery ? */ 634 635 repeat: 636 /* invoke error handler */ 637 if (ap->ops->error_handler) { 638 struct ata_link *link; 639 640 /* kill fast drain timer */ 641 del_timer_sync(&ap->fastdrain_timer); 642 643 /* process port resume request */ 644 ata_eh_handle_port_resume(ap); 645 646 /* fetch & clear EH info */ 647 spin_lock_irqsave(ap->lock, flags); 648 649 ata_for_each_link(link, ap, HOST_FIRST) { 650 struct ata_eh_context *ehc = &link->eh_context; 651 struct ata_device *dev; 652 653 memset(&link->eh_context, 0, sizeof(link->eh_context)); 654 link->eh_context.i = link->eh_info; 655 memset(&link->eh_info, 0, sizeof(link->eh_info)); 656 657 ata_for_each_dev(dev, link, ENABLED) { 658 int devno = dev->devno; 659 660 ehc->saved_xfer_mode[devno] = dev->xfer_mode; 661 if (ata_ncq_enabled(dev)) 662 ehc->saved_ncq_enabled |= 1 << devno; 663 } 664 } 665 666 ap->pflags |= ATA_PFLAG_EH_IN_PROGRESS; 667 ap->pflags &= ~ATA_PFLAG_EH_PENDING; 668 ap->excl_link = NULL; /* don't maintain exclusion over EH */ 669 670 spin_unlock_irqrestore(ap->lock, flags); 671 672 /* invoke EH, skip if unloading or suspended */ 673 if (!(ap->pflags & (ATA_PFLAG_UNLOADING | ATA_PFLAG_SUSPENDED))) 674 ap->ops->error_handler(ap); 675 else { 676 /* if unloading, commence suicide */ 677 if ((ap->pflags & ATA_PFLAG_UNLOADING) && 678 !(ap->pflags & ATA_PFLAG_UNLOADED)) 679 ata_eh_unload(ap); 680 ata_eh_finish(ap); 681 } 682 683 /* process port suspend request */ 684 ata_eh_handle_port_suspend(ap); 685 686 /* Exception might have happend after ->error_handler 687 * recovered the port but before this point. Repeat 688 * EH in such case. 689 */ 690 spin_lock_irqsave(ap->lock, flags); 691 692 if (ap->pflags & ATA_PFLAG_EH_PENDING) { 693 if (--ap->eh_tries) { 694 spin_unlock_irqrestore(ap->lock, flags); 695 goto repeat; 696 } 697 ata_port_printk(ap, KERN_ERR, "EH pending after %d " 698 "tries, giving up\n", ATA_EH_MAX_TRIES); 699 ap->pflags &= ~ATA_PFLAG_EH_PENDING; 700 } 701 702 /* this run is complete, make sure EH info is clear */ 703 ata_for_each_link(link, ap, HOST_FIRST) 704 memset(&link->eh_info, 0, sizeof(link->eh_info)); 705 706 /* Clear host_eh_scheduled while holding ap->lock such 707 * that if exception occurs after this point but 708 * before EH completion, SCSI midlayer will 709 * re-initiate EH. 710 */ 711 host->host_eh_scheduled = 0; 712 713 spin_unlock_irqrestore(ap->lock, flags); 714 } else { 715 WARN_ON(ata_qc_from_tag(ap, ap->link.active_tag) == NULL); 716 ap->ops->eng_timeout(ap); 717 } 718 719 /* finish or retry handled scmd's and clean up */ 720 WARN_ON(host->host_failed || !list_empty(&host->eh_cmd_q)); 721 722 scsi_eh_flush_done_q(&ap->eh_done_q); 723 724 /* clean up */ 725 spin_lock_irqsave(ap->lock, flags); 726 727 if (ap->pflags & ATA_PFLAG_LOADING) 728 ap->pflags &= ~ATA_PFLAG_LOADING; 729 else if (ap->pflags & ATA_PFLAG_SCSI_HOTPLUG) 730 queue_delayed_work(ata_aux_wq, &ap->hotplug_task, 0); 731 732 if (ap->pflags & ATA_PFLAG_RECOVERED) 733 ata_port_printk(ap, KERN_INFO, "EH complete\n"); 734 735 ap->pflags &= ~(ATA_PFLAG_SCSI_HOTPLUG | ATA_PFLAG_RECOVERED); 736 737 /* tell wait_eh that we're done */ 738 ap->pflags &= ~ATA_PFLAG_EH_IN_PROGRESS; 739 wake_up_all(&ap->eh_wait_q); 740 741 spin_unlock_irqrestore(ap->lock, flags); 742 743 DPRINTK("EXIT\n"); 744 } 745 746 /** 747 * ata_port_wait_eh - Wait for the currently pending EH to complete 748 * @ap: Port to wait EH for 749 * 750 * Wait until the currently pending EH is complete. 751 * 752 * LOCKING: 753 * Kernel thread context (may sleep). 754 */ 755 void ata_port_wait_eh(struct ata_port *ap) 756 { 757 unsigned long flags; 758 DEFINE_WAIT(wait); 759 760 retry: 761 spin_lock_irqsave(ap->lock, flags); 762 763 while (ap->pflags & (ATA_PFLAG_EH_PENDING | ATA_PFLAG_EH_IN_PROGRESS)) { 764 prepare_to_wait(&ap->eh_wait_q, &wait, TASK_UNINTERRUPTIBLE); 765 spin_unlock_irqrestore(ap->lock, flags); 766 schedule(); 767 spin_lock_irqsave(ap->lock, flags); 768 } 769 finish_wait(&ap->eh_wait_q, &wait); 770 771 spin_unlock_irqrestore(ap->lock, flags); 772 773 /* make sure SCSI EH is complete */ 774 if (scsi_host_in_recovery(ap->scsi_host)) { 775 msleep(10); 776 goto retry; 777 } 778 } 779 780 static int ata_eh_nr_in_flight(struct ata_port *ap) 781 { 782 unsigned int tag; 783 int nr = 0; 784 785 /* count only non-internal commands */ 786 for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++) 787 if (ata_qc_from_tag(ap, tag)) 788 nr++; 789 790 return nr; 791 } 792 793 void ata_eh_fastdrain_timerfn(unsigned long arg) 794 { 795 struct ata_port *ap = (void *)arg; 796 unsigned long flags; 797 int cnt; 798 799 spin_lock_irqsave(ap->lock, flags); 800 801 cnt = ata_eh_nr_in_flight(ap); 802 803 /* are we done? */ 804 if (!cnt) 805 goto out_unlock; 806 807 if (cnt == ap->fastdrain_cnt) { 808 unsigned int tag; 809 810 /* No progress during the last interval, tag all 811 * in-flight qcs as timed out and freeze the port. 812 */ 813 for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++) { 814 struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag); 815 if (qc) 816 qc->err_mask |= AC_ERR_TIMEOUT; 817 } 818 819 ata_port_freeze(ap); 820 } else { 821 /* some qcs have finished, give it another chance */ 822 ap->fastdrain_cnt = cnt; 823 ap->fastdrain_timer.expires = 824 ata_deadline(jiffies, ATA_EH_FASTDRAIN_INTERVAL); 825 add_timer(&ap->fastdrain_timer); 826 } 827 828 out_unlock: 829 spin_unlock_irqrestore(ap->lock, flags); 830 } 831 832 /** 833 * ata_eh_set_pending - set ATA_PFLAG_EH_PENDING and activate fast drain 834 * @ap: target ATA port 835 * @fastdrain: activate fast drain 836 * 837 * Set ATA_PFLAG_EH_PENDING and activate fast drain if @fastdrain 838 * is non-zero and EH wasn't pending before. Fast drain ensures 839 * that EH kicks in in timely manner. 840 * 841 * LOCKING: 842 * spin_lock_irqsave(host lock) 843 */ 844 static void ata_eh_set_pending(struct ata_port *ap, int fastdrain) 845 { 846 int cnt; 847 848 /* already scheduled? */ 849 if (ap->pflags & ATA_PFLAG_EH_PENDING) 850 return; 851 852 ap->pflags |= ATA_PFLAG_EH_PENDING; 853 854 if (!fastdrain) 855 return; 856 857 /* do we have in-flight qcs? */ 858 cnt = ata_eh_nr_in_flight(ap); 859 if (!cnt) 860 return; 861 862 /* activate fast drain */ 863 ap->fastdrain_cnt = cnt; 864 ap->fastdrain_timer.expires = 865 ata_deadline(jiffies, ATA_EH_FASTDRAIN_INTERVAL); 866 add_timer(&ap->fastdrain_timer); 867 } 868 869 /** 870 * ata_qc_schedule_eh - schedule qc for error handling 871 * @qc: command to schedule error handling for 872 * 873 * Schedule error handling for @qc. EH will kick in as soon as 874 * other commands are drained. 875 * 876 * LOCKING: 877 * spin_lock_irqsave(host lock) 878 */ 879 void ata_qc_schedule_eh(struct ata_queued_cmd *qc) 880 { 881 struct ata_port *ap = qc->ap; 882 883 WARN_ON(!ap->ops->error_handler); 884 885 qc->flags |= ATA_QCFLAG_FAILED; 886 ata_eh_set_pending(ap, 1); 887 888 /* The following will fail if timeout has already expired. 889 * ata_scsi_error() takes care of such scmds on EH entry. 890 * Note that ATA_QCFLAG_FAILED is unconditionally set after 891 * this function completes. 892 */ 893 blk_abort_request(qc->scsicmd->request); 894 } 895 896 /** 897 * ata_port_schedule_eh - schedule error handling without a qc 898 * @ap: ATA port to schedule EH for 899 * 900 * Schedule error handling for @ap. EH will kick in as soon as 901 * all commands are drained. 902 * 903 * LOCKING: 904 * spin_lock_irqsave(host lock) 905 */ 906 void ata_port_schedule_eh(struct ata_port *ap) 907 { 908 WARN_ON(!ap->ops->error_handler); 909 910 if (ap->pflags & ATA_PFLAG_INITIALIZING) 911 return; 912 913 ata_eh_set_pending(ap, 1); 914 scsi_schedule_eh(ap->scsi_host); 915 916 DPRINTK("port EH scheduled\n"); 917 } 918 919 static int ata_do_link_abort(struct ata_port *ap, struct ata_link *link) 920 { 921 int tag, nr_aborted = 0; 922 923 WARN_ON(!ap->ops->error_handler); 924 925 /* we're gonna abort all commands, no need for fast drain */ 926 ata_eh_set_pending(ap, 0); 927 928 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 929 struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag); 930 931 if (qc && (!link || qc->dev->link == link)) { 932 qc->flags |= ATA_QCFLAG_FAILED; 933 ata_qc_complete(qc); 934 nr_aborted++; 935 } 936 } 937 938 if (!nr_aborted) 939 ata_port_schedule_eh(ap); 940 941 return nr_aborted; 942 } 943 944 /** 945 * ata_link_abort - abort all qc's on the link 946 * @link: ATA link to abort qc's for 947 * 948 * Abort all active qc's active on @link and schedule EH. 949 * 950 * LOCKING: 951 * spin_lock_irqsave(host lock) 952 * 953 * RETURNS: 954 * Number of aborted qc's. 955 */ 956 int ata_link_abort(struct ata_link *link) 957 { 958 return ata_do_link_abort(link->ap, link); 959 } 960 961 /** 962 * ata_port_abort - abort all qc's on the port 963 * @ap: ATA port to abort qc's for 964 * 965 * Abort all active qc's of @ap and schedule EH. 966 * 967 * LOCKING: 968 * spin_lock_irqsave(host_set lock) 969 * 970 * RETURNS: 971 * Number of aborted qc's. 972 */ 973 int ata_port_abort(struct ata_port *ap) 974 { 975 return ata_do_link_abort(ap, NULL); 976 } 977 978 /** 979 * __ata_port_freeze - freeze port 980 * @ap: ATA port to freeze 981 * 982 * This function is called when HSM violation or some other 983 * condition disrupts normal operation of the port. Frozen port 984 * is not allowed to perform any operation until the port is 985 * thawed, which usually follows a successful reset. 986 * 987 * ap->ops->freeze() callback can be used for freezing the port 988 * hardware-wise (e.g. mask interrupt and stop DMA engine). If a 989 * port cannot be frozen hardware-wise, the interrupt handler 990 * must ack and clear interrupts unconditionally while the port 991 * is frozen. 992 * 993 * LOCKING: 994 * spin_lock_irqsave(host lock) 995 */ 996 static void __ata_port_freeze(struct ata_port *ap) 997 { 998 WARN_ON(!ap->ops->error_handler); 999 1000 if (ap->ops->freeze) 1001 ap->ops->freeze(ap); 1002 1003 ap->pflags |= ATA_PFLAG_FROZEN; 1004 1005 DPRINTK("ata%u port frozen\n", ap->print_id); 1006 } 1007 1008 /** 1009 * ata_port_freeze - abort & freeze port 1010 * @ap: ATA port to freeze 1011 * 1012 * Abort and freeze @ap. The freeze operation must be called 1013 * first, because some hardware requires special operations 1014 * before the taskfile registers are accessible. 1015 * 1016 * LOCKING: 1017 * spin_lock_irqsave(host lock) 1018 * 1019 * RETURNS: 1020 * Number of aborted commands. 1021 */ 1022 int ata_port_freeze(struct ata_port *ap) 1023 { 1024 int nr_aborted; 1025 1026 WARN_ON(!ap->ops->error_handler); 1027 1028 __ata_port_freeze(ap); 1029 nr_aborted = ata_port_abort(ap); 1030 1031 return nr_aborted; 1032 } 1033 1034 /** 1035 * sata_async_notification - SATA async notification handler 1036 * @ap: ATA port where async notification is received 1037 * 1038 * Handler to be called when async notification via SDB FIS is 1039 * received. This function schedules EH if necessary. 1040 * 1041 * LOCKING: 1042 * spin_lock_irqsave(host lock) 1043 * 1044 * RETURNS: 1045 * 1 if EH is scheduled, 0 otherwise. 1046 */ 1047 int sata_async_notification(struct ata_port *ap) 1048 { 1049 u32 sntf; 1050 int rc; 1051 1052 if (!(ap->flags & ATA_FLAG_AN)) 1053 return 0; 1054 1055 rc = sata_scr_read(&ap->link, SCR_NOTIFICATION, &sntf); 1056 if (rc == 0) 1057 sata_scr_write(&ap->link, SCR_NOTIFICATION, sntf); 1058 1059 if (!sata_pmp_attached(ap) || rc) { 1060 /* PMP is not attached or SNTF is not available */ 1061 if (!sata_pmp_attached(ap)) { 1062 /* PMP is not attached. Check whether ATAPI 1063 * AN is configured. If so, notify media 1064 * change. 1065 */ 1066 struct ata_device *dev = ap->link.device; 1067 1068 if ((dev->class == ATA_DEV_ATAPI) && 1069 (dev->flags & ATA_DFLAG_AN)) 1070 ata_scsi_media_change_notify(dev); 1071 return 0; 1072 } else { 1073 /* PMP is attached but SNTF is not available. 1074 * ATAPI async media change notification is 1075 * not used. The PMP must be reporting PHY 1076 * status change, schedule EH. 1077 */ 1078 ata_port_schedule_eh(ap); 1079 return 1; 1080 } 1081 } else { 1082 /* PMP is attached and SNTF is available */ 1083 struct ata_link *link; 1084 1085 /* check and notify ATAPI AN */ 1086 ata_for_each_link(link, ap, EDGE) { 1087 if (!(sntf & (1 << link->pmp))) 1088 continue; 1089 1090 if ((link->device->class == ATA_DEV_ATAPI) && 1091 (link->device->flags & ATA_DFLAG_AN)) 1092 ata_scsi_media_change_notify(link->device); 1093 } 1094 1095 /* If PMP is reporting that PHY status of some 1096 * downstream ports has changed, schedule EH. 1097 */ 1098 if (sntf & (1 << SATA_PMP_CTRL_PORT)) { 1099 ata_port_schedule_eh(ap); 1100 return 1; 1101 } 1102 1103 return 0; 1104 } 1105 } 1106 1107 /** 1108 * ata_eh_freeze_port - EH helper to freeze port 1109 * @ap: ATA port to freeze 1110 * 1111 * Freeze @ap. 1112 * 1113 * LOCKING: 1114 * None. 1115 */ 1116 void ata_eh_freeze_port(struct ata_port *ap) 1117 { 1118 unsigned long flags; 1119 1120 if (!ap->ops->error_handler) 1121 return; 1122 1123 spin_lock_irqsave(ap->lock, flags); 1124 __ata_port_freeze(ap); 1125 spin_unlock_irqrestore(ap->lock, flags); 1126 } 1127 1128 /** 1129 * ata_port_thaw_port - EH helper to thaw port 1130 * @ap: ATA port to thaw 1131 * 1132 * Thaw frozen port @ap. 1133 * 1134 * LOCKING: 1135 * None. 1136 */ 1137 void ata_eh_thaw_port(struct ata_port *ap) 1138 { 1139 unsigned long flags; 1140 1141 if (!ap->ops->error_handler) 1142 return; 1143 1144 spin_lock_irqsave(ap->lock, flags); 1145 1146 ap->pflags &= ~ATA_PFLAG_FROZEN; 1147 1148 if (ap->ops->thaw) 1149 ap->ops->thaw(ap); 1150 1151 spin_unlock_irqrestore(ap->lock, flags); 1152 1153 DPRINTK("ata%u port thawed\n", ap->print_id); 1154 } 1155 1156 static void ata_eh_scsidone(struct scsi_cmnd *scmd) 1157 { 1158 /* nada */ 1159 } 1160 1161 static void __ata_eh_qc_complete(struct ata_queued_cmd *qc) 1162 { 1163 struct ata_port *ap = qc->ap; 1164 struct scsi_cmnd *scmd = qc->scsicmd; 1165 unsigned long flags; 1166 1167 spin_lock_irqsave(ap->lock, flags); 1168 qc->scsidone = ata_eh_scsidone; 1169 __ata_qc_complete(qc); 1170 WARN_ON(ata_tag_valid(qc->tag)); 1171 spin_unlock_irqrestore(ap->lock, flags); 1172 1173 scsi_eh_finish_cmd(scmd, &ap->eh_done_q); 1174 } 1175 1176 /** 1177 * ata_eh_qc_complete - Complete an active ATA command from EH 1178 * @qc: Command to complete 1179 * 1180 * Indicate to the mid and upper layers that an ATA command has 1181 * completed. To be used from EH. 1182 */ 1183 void ata_eh_qc_complete(struct ata_queued_cmd *qc) 1184 { 1185 struct scsi_cmnd *scmd = qc->scsicmd; 1186 scmd->retries = scmd->allowed; 1187 __ata_eh_qc_complete(qc); 1188 } 1189 1190 /** 1191 * ata_eh_qc_retry - Tell midlayer to retry an ATA command after EH 1192 * @qc: Command to retry 1193 * 1194 * Indicate to the mid and upper layers that an ATA command 1195 * should be retried. To be used from EH. 1196 * 1197 * SCSI midlayer limits the number of retries to scmd->allowed. 1198 * scmd->retries is decremented for commands which get retried 1199 * due to unrelated failures (qc->err_mask is zero). 1200 */ 1201 void ata_eh_qc_retry(struct ata_queued_cmd *qc) 1202 { 1203 struct scsi_cmnd *scmd = qc->scsicmd; 1204 if (!qc->err_mask && scmd->retries) 1205 scmd->retries--; 1206 __ata_eh_qc_complete(qc); 1207 } 1208 1209 /** 1210 * ata_dev_disable - disable ATA device 1211 * @dev: ATA device to disable 1212 * 1213 * Disable @dev. 1214 * 1215 * Locking: 1216 * EH context. 1217 */ 1218 void ata_dev_disable(struct ata_device *dev) 1219 { 1220 if (!ata_dev_enabled(dev)) 1221 return; 1222 1223 if (ata_msg_drv(dev->link->ap)) 1224 ata_dev_printk(dev, KERN_WARNING, "disabled\n"); 1225 ata_acpi_on_disable(dev); 1226 ata_down_xfermask_limit(dev, ATA_DNXFER_FORCE_PIO0 | ATA_DNXFER_QUIET); 1227 dev->class++; 1228 1229 /* From now till the next successful probe, ering is used to 1230 * track probe failures. Clear accumulated device error info. 1231 */ 1232 ata_ering_clear(&dev->ering); 1233 } 1234 1235 /** 1236 * ata_eh_detach_dev - detach ATA device 1237 * @dev: ATA device to detach 1238 * 1239 * Detach @dev. 1240 * 1241 * LOCKING: 1242 * None. 1243 */ 1244 void ata_eh_detach_dev(struct ata_device *dev) 1245 { 1246 struct ata_link *link = dev->link; 1247 struct ata_port *ap = link->ap; 1248 struct ata_eh_context *ehc = &link->eh_context; 1249 unsigned long flags; 1250 1251 ata_dev_disable(dev); 1252 1253 spin_lock_irqsave(ap->lock, flags); 1254 1255 dev->flags &= ~ATA_DFLAG_DETACH; 1256 1257 if (ata_scsi_offline_dev(dev)) { 1258 dev->flags |= ATA_DFLAG_DETACHED; 1259 ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG; 1260 } 1261 1262 /* clear per-dev EH info */ 1263 ata_eh_clear_action(link, dev, &link->eh_info, ATA_EH_PERDEV_MASK); 1264 ata_eh_clear_action(link, dev, &link->eh_context.i, ATA_EH_PERDEV_MASK); 1265 ehc->saved_xfer_mode[dev->devno] = 0; 1266 ehc->saved_ncq_enabled &= ~(1 << dev->devno); 1267 1268 spin_unlock_irqrestore(ap->lock, flags); 1269 } 1270 1271 /** 1272 * ata_eh_about_to_do - about to perform eh_action 1273 * @link: target ATA link 1274 * @dev: target ATA dev for per-dev action (can be NULL) 1275 * @action: action about to be performed 1276 * 1277 * Called just before performing EH actions to clear related bits 1278 * in @link->eh_info such that eh actions are not unnecessarily 1279 * repeated. 1280 * 1281 * LOCKING: 1282 * None. 1283 */ 1284 void ata_eh_about_to_do(struct ata_link *link, struct ata_device *dev, 1285 unsigned int action) 1286 { 1287 struct ata_port *ap = link->ap; 1288 struct ata_eh_info *ehi = &link->eh_info; 1289 struct ata_eh_context *ehc = &link->eh_context; 1290 unsigned long flags; 1291 1292 spin_lock_irqsave(ap->lock, flags); 1293 1294 ata_eh_clear_action(link, dev, ehi, action); 1295 1296 /* About to take EH action, set RECOVERED. Ignore actions on 1297 * slave links as master will do them again. 1298 */ 1299 if (!(ehc->i.flags & ATA_EHI_QUIET) && link != ap->slave_link) 1300 ap->pflags |= ATA_PFLAG_RECOVERED; 1301 1302 spin_unlock_irqrestore(ap->lock, flags); 1303 } 1304 1305 /** 1306 * ata_eh_done - EH action complete 1307 * @ap: target ATA port 1308 * @dev: target ATA dev for per-dev action (can be NULL) 1309 * @action: action just completed 1310 * 1311 * Called right after performing EH actions to clear related bits 1312 * in @link->eh_context. 1313 * 1314 * LOCKING: 1315 * None. 1316 */ 1317 void ata_eh_done(struct ata_link *link, struct ata_device *dev, 1318 unsigned int action) 1319 { 1320 struct ata_eh_context *ehc = &link->eh_context; 1321 1322 ata_eh_clear_action(link, dev, &ehc->i, action); 1323 } 1324 1325 /** 1326 * ata_err_string - convert err_mask to descriptive string 1327 * @err_mask: error mask to convert to string 1328 * 1329 * Convert @err_mask to descriptive string. Errors are 1330 * prioritized according to severity and only the most severe 1331 * error is reported. 1332 * 1333 * LOCKING: 1334 * None. 1335 * 1336 * RETURNS: 1337 * Descriptive string for @err_mask 1338 */ 1339 static const char *ata_err_string(unsigned int err_mask) 1340 { 1341 if (err_mask & AC_ERR_HOST_BUS) 1342 return "host bus error"; 1343 if (err_mask & AC_ERR_ATA_BUS) 1344 return "ATA bus error"; 1345 if (err_mask & AC_ERR_TIMEOUT) 1346 return "timeout"; 1347 if (err_mask & AC_ERR_HSM) 1348 return "HSM violation"; 1349 if (err_mask & AC_ERR_SYSTEM) 1350 return "internal error"; 1351 if (err_mask & AC_ERR_MEDIA) 1352 return "media error"; 1353 if (err_mask & AC_ERR_INVALID) 1354 return "invalid argument"; 1355 if (err_mask & AC_ERR_DEV) 1356 return "device error"; 1357 return "unknown error"; 1358 } 1359 1360 /** 1361 * ata_read_log_page - read a specific log page 1362 * @dev: target device 1363 * @page: page to read 1364 * @buf: buffer to store read page 1365 * @sectors: number of sectors to read 1366 * 1367 * Read log page using READ_LOG_EXT command. 1368 * 1369 * LOCKING: 1370 * Kernel thread context (may sleep). 1371 * 1372 * RETURNS: 1373 * 0 on success, AC_ERR_* mask otherwise. 1374 */ 1375 static unsigned int ata_read_log_page(struct ata_device *dev, 1376 u8 page, void *buf, unsigned int sectors) 1377 { 1378 struct ata_taskfile tf; 1379 unsigned int err_mask; 1380 1381 DPRINTK("read log page - page %d\n", page); 1382 1383 ata_tf_init(dev, &tf); 1384 tf.command = ATA_CMD_READ_LOG_EXT; 1385 tf.lbal = page; 1386 tf.nsect = sectors; 1387 tf.hob_nsect = sectors >> 8; 1388 tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_LBA48 | ATA_TFLAG_DEVICE; 1389 tf.protocol = ATA_PROT_PIO; 1390 1391 err_mask = ata_exec_internal(dev, &tf, NULL, DMA_FROM_DEVICE, 1392 buf, sectors * ATA_SECT_SIZE, 0); 1393 1394 DPRINTK("EXIT, err_mask=%x\n", err_mask); 1395 return err_mask; 1396 } 1397 1398 /** 1399 * ata_eh_read_log_10h - Read log page 10h for NCQ error details 1400 * @dev: Device to read log page 10h from 1401 * @tag: Resulting tag of the failed command 1402 * @tf: Resulting taskfile registers of the failed command 1403 * 1404 * Read log page 10h to obtain NCQ error details and clear error 1405 * condition. 1406 * 1407 * LOCKING: 1408 * Kernel thread context (may sleep). 1409 * 1410 * RETURNS: 1411 * 0 on success, -errno otherwise. 1412 */ 1413 static int ata_eh_read_log_10h(struct ata_device *dev, 1414 int *tag, struct ata_taskfile *tf) 1415 { 1416 u8 *buf = dev->link->ap->sector_buf; 1417 unsigned int err_mask; 1418 u8 csum; 1419 int i; 1420 1421 err_mask = ata_read_log_page(dev, ATA_LOG_SATA_NCQ, buf, 1); 1422 if (err_mask) 1423 return -EIO; 1424 1425 csum = 0; 1426 for (i = 0; i < ATA_SECT_SIZE; i++) 1427 csum += buf[i]; 1428 if (csum) 1429 ata_dev_printk(dev, KERN_WARNING, 1430 "invalid checksum 0x%x on log page 10h\n", csum); 1431 1432 if (buf[0] & 0x80) 1433 return -ENOENT; 1434 1435 *tag = buf[0] & 0x1f; 1436 1437 tf->command = buf[2]; 1438 tf->feature = buf[3]; 1439 tf->lbal = buf[4]; 1440 tf->lbam = buf[5]; 1441 tf->lbah = buf[6]; 1442 tf->device = buf[7]; 1443 tf->hob_lbal = buf[8]; 1444 tf->hob_lbam = buf[9]; 1445 tf->hob_lbah = buf[10]; 1446 tf->nsect = buf[12]; 1447 tf->hob_nsect = buf[13]; 1448 1449 return 0; 1450 } 1451 1452 /** 1453 * atapi_eh_tur - perform ATAPI TEST_UNIT_READY 1454 * @dev: target ATAPI device 1455 * @r_sense_key: out parameter for sense_key 1456 * 1457 * Perform ATAPI TEST_UNIT_READY. 1458 * 1459 * LOCKING: 1460 * EH context (may sleep). 1461 * 1462 * RETURNS: 1463 * 0 on success, AC_ERR_* mask on failure. 1464 */ 1465 static unsigned int atapi_eh_tur(struct ata_device *dev, u8 *r_sense_key) 1466 { 1467 u8 cdb[ATAPI_CDB_LEN] = { TEST_UNIT_READY, 0, 0, 0, 0, 0 }; 1468 struct ata_taskfile tf; 1469 unsigned int err_mask; 1470 1471 ata_tf_init(dev, &tf); 1472 1473 tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE; 1474 tf.command = ATA_CMD_PACKET; 1475 tf.protocol = ATAPI_PROT_NODATA; 1476 1477 err_mask = ata_exec_internal(dev, &tf, cdb, DMA_NONE, NULL, 0, 0); 1478 if (err_mask == AC_ERR_DEV) 1479 *r_sense_key = tf.feature >> 4; 1480 return err_mask; 1481 } 1482 1483 /** 1484 * atapi_eh_request_sense - perform ATAPI REQUEST_SENSE 1485 * @dev: device to perform REQUEST_SENSE to 1486 * @sense_buf: result sense data buffer (SCSI_SENSE_BUFFERSIZE bytes long) 1487 * @dfl_sense_key: default sense key to use 1488 * 1489 * Perform ATAPI REQUEST_SENSE after the device reported CHECK 1490 * SENSE. This function is EH helper. 1491 * 1492 * LOCKING: 1493 * Kernel thread context (may sleep). 1494 * 1495 * RETURNS: 1496 * 0 on success, AC_ERR_* mask on failure 1497 */ 1498 static unsigned int atapi_eh_request_sense(struct ata_device *dev, 1499 u8 *sense_buf, u8 dfl_sense_key) 1500 { 1501 u8 cdb[ATAPI_CDB_LEN] = 1502 { REQUEST_SENSE, 0, 0, 0, SCSI_SENSE_BUFFERSIZE, 0 }; 1503 struct ata_port *ap = dev->link->ap; 1504 struct ata_taskfile tf; 1505 1506 DPRINTK("ATAPI request sense\n"); 1507 1508 /* FIXME: is this needed? */ 1509 memset(sense_buf, 0, SCSI_SENSE_BUFFERSIZE); 1510 1511 /* initialize sense_buf with the error register, 1512 * for the case where they are -not- overwritten 1513 */ 1514 sense_buf[0] = 0x70; 1515 sense_buf[2] = dfl_sense_key; 1516 1517 /* some devices time out if garbage left in tf */ 1518 ata_tf_init(dev, &tf); 1519 1520 tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE; 1521 tf.command = ATA_CMD_PACKET; 1522 1523 /* is it pointless to prefer PIO for "safety reasons"? */ 1524 if (ap->flags & ATA_FLAG_PIO_DMA) { 1525 tf.protocol = ATAPI_PROT_DMA; 1526 tf.feature |= ATAPI_PKT_DMA; 1527 } else { 1528 tf.protocol = ATAPI_PROT_PIO; 1529 tf.lbam = SCSI_SENSE_BUFFERSIZE; 1530 tf.lbah = 0; 1531 } 1532 1533 return ata_exec_internal(dev, &tf, cdb, DMA_FROM_DEVICE, 1534 sense_buf, SCSI_SENSE_BUFFERSIZE, 0); 1535 } 1536 1537 /** 1538 * ata_eh_analyze_serror - analyze SError for a failed port 1539 * @link: ATA link to analyze SError for 1540 * 1541 * Analyze SError if available and further determine cause of 1542 * failure. 1543 * 1544 * LOCKING: 1545 * None. 1546 */ 1547 static void ata_eh_analyze_serror(struct ata_link *link) 1548 { 1549 struct ata_eh_context *ehc = &link->eh_context; 1550 u32 serror = ehc->i.serror; 1551 unsigned int err_mask = 0, action = 0; 1552 u32 hotplug_mask; 1553 1554 if (serror & (SERR_PERSISTENT | SERR_DATA)) { 1555 err_mask |= AC_ERR_ATA_BUS; 1556 action |= ATA_EH_RESET; 1557 } 1558 if (serror & SERR_PROTOCOL) { 1559 err_mask |= AC_ERR_HSM; 1560 action |= ATA_EH_RESET; 1561 } 1562 if (serror & SERR_INTERNAL) { 1563 err_mask |= AC_ERR_SYSTEM; 1564 action |= ATA_EH_RESET; 1565 } 1566 1567 /* Determine whether a hotplug event has occurred. Both 1568 * SError.N/X are considered hotplug events for enabled or 1569 * host links. For disabled PMP links, only N bit is 1570 * considered as X bit is left at 1 for link plugging. 1571 */ 1572 hotplug_mask = 0; 1573 1574 if (!(link->flags & ATA_LFLAG_DISABLED) || ata_is_host_link(link)) 1575 hotplug_mask = SERR_PHYRDY_CHG | SERR_DEV_XCHG; 1576 else 1577 hotplug_mask = SERR_PHYRDY_CHG; 1578 1579 if (serror & hotplug_mask) 1580 ata_ehi_hotplugged(&ehc->i); 1581 1582 ehc->i.err_mask |= err_mask; 1583 ehc->i.action |= action; 1584 } 1585 1586 /** 1587 * ata_eh_analyze_ncq_error - analyze NCQ error 1588 * @link: ATA link to analyze NCQ error for 1589 * 1590 * Read log page 10h, determine the offending qc and acquire 1591 * error status TF. For NCQ device errors, all LLDDs have to do 1592 * is setting AC_ERR_DEV in ehi->err_mask. This function takes 1593 * care of the rest. 1594 * 1595 * LOCKING: 1596 * Kernel thread context (may sleep). 1597 */ 1598 void ata_eh_analyze_ncq_error(struct ata_link *link) 1599 { 1600 struct ata_port *ap = link->ap; 1601 struct ata_eh_context *ehc = &link->eh_context; 1602 struct ata_device *dev = link->device; 1603 struct ata_queued_cmd *qc; 1604 struct ata_taskfile tf; 1605 int tag, rc; 1606 1607 /* if frozen, we can't do much */ 1608 if (ap->pflags & ATA_PFLAG_FROZEN) 1609 return; 1610 1611 /* is it NCQ device error? */ 1612 if (!link->sactive || !(ehc->i.err_mask & AC_ERR_DEV)) 1613 return; 1614 1615 /* has LLDD analyzed already? */ 1616 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 1617 qc = __ata_qc_from_tag(ap, tag); 1618 1619 if (!(qc->flags & ATA_QCFLAG_FAILED)) 1620 continue; 1621 1622 if (qc->err_mask) 1623 return; 1624 } 1625 1626 /* okay, this error is ours */ 1627 rc = ata_eh_read_log_10h(dev, &tag, &tf); 1628 if (rc) { 1629 ata_link_printk(link, KERN_ERR, "failed to read log page 10h " 1630 "(errno=%d)\n", rc); 1631 return; 1632 } 1633 1634 if (!(link->sactive & (1 << tag))) { 1635 ata_link_printk(link, KERN_ERR, "log page 10h reported " 1636 "inactive tag %d\n", tag); 1637 return; 1638 } 1639 1640 /* we've got the perpetrator, condemn it */ 1641 qc = __ata_qc_from_tag(ap, tag); 1642 memcpy(&qc->result_tf, &tf, sizeof(tf)); 1643 qc->result_tf.flags = ATA_TFLAG_ISADDR | ATA_TFLAG_LBA | ATA_TFLAG_LBA48; 1644 qc->err_mask |= AC_ERR_DEV | AC_ERR_NCQ; 1645 ehc->i.err_mask &= ~AC_ERR_DEV; 1646 } 1647 1648 /** 1649 * ata_eh_analyze_tf - analyze taskfile of a failed qc 1650 * @qc: qc to analyze 1651 * @tf: Taskfile registers to analyze 1652 * 1653 * Analyze taskfile of @qc and further determine cause of 1654 * failure. This function also requests ATAPI sense data if 1655 * avaliable. 1656 * 1657 * LOCKING: 1658 * Kernel thread context (may sleep). 1659 * 1660 * RETURNS: 1661 * Determined recovery action 1662 */ 1663 static unsigned int ata_eh_analyze_tf(struct ata_queued_cmd *qc, 1664 const struct ata_taskfile *tf) 1665 { 1666 unsigned int tmp, action = 0; 1667 u8 stat = tf->command, err = tf->feature; 1668 1669 if ((stat & (ATA_BUSY | ATA_DRQ | ATA_DRDY)) != ATA_DRDY) { 1670 qc->err_mask |= AC_ERR_HSM; 1671 return ATA_EH_RESET; 1672 } 1673 1674 if (stat & (ATA_ERR | ATA_DF)) 1675 qc->err_mask |= AC_ERR_DEV; 1676 else 1677 return 0; 1678 1679 switch (qc->dev->class) { 1680 case ATA_DEV_ATA: 1681 if (err & ATA_ICRC) 1682 qc->err_mask |= AC_ERR_ATA_BUS; 1683 if (err & ATA_UNC) 1684 qc->err_mask |= AC_ERR_MEDIA; 1685 if (err & ATA_IDNF) 1686 qc->err_mask |= AC_ERR_INVALID; 1687 break; 1688 1689 case ATA_DEV_ATAPI: 1690 if (!(qc->ap->pflags & ATA_PFLAG_FROZEN)) { 1691 tmp = atapi_eh_request_sense(qc->dev, 1692 qc->scsicmd->sense_buffer, 1693 qc->result_tf.feature >> 4); 1694 if (!tmp) { 1695 /* ATA_QCFLAG_SENSE_VALID is used to 1696 * tell atapi_qc_complete() that sense 1697 * data is already valid. 1698 * 1699 * TODO: interpret sense data and set 1700 * appropriate err_mask. 1701 */ 1702 qc->flags |= ATA_QCFLAG_SENSE_VALID; 1703 } else 1704 qc->err_mask |= tmp; 1705 } 1706 } 1707 1708 if (qc->err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT | AC_ERR_ATA_BUS)) 1709 action |= ATA_EH_RESET; 1710 1711 return action; 1712 } 1713 1714 static int ata_eh_categorize_error(unsigned int eflags, unsigned int err_mask, 1715 int *xfer_ok) 1716 { 1717 int base = 0; 1718 1719 if (!(eflags & ATA_EFLAG_DUBIOUS_XFER)) 1720 *xfer_ok = 1; 1721 1722 if (!*xfer_ok) 1723 base = ATA_ECAT_DUBIOUS_NONE; 1724 1725 if (err_mask & AC_ERR_ATA_BUS) 1726 return base + ATA_ECAT_ATA_BUS; 1727 1728 if (err_mask & AC_ERR_TIMEOUT) 1729 return base + ATA_ECAT_TOUT_HSM; 1730 1731 if (eflags & ATA_EFLAG_IS_IO) { 1732 if (err_mask & AC_ERR_HSM) 1733 return base + ATA_ECAT_TOUT_HSM; 1734 if ((err_mask & 1735 (AC_ERR_DEV|AC_ERR_MEDIA|AC_ERR_INVALID)) == AC_ERR_DEV) 1736 return base + ATA_ECAT_UNK_DEV; 1737 } 1738 1739 return 0; 1740 } 1741 1742 struct speed_down_verdict_arg { 1743 u64 since; 1744 int xfer_ok; 1745 int nr_errors[ATA_ECAT_NR]; 1746 }; 1747 1748 static int speed_down_verdict_cb(struct ata_ering_entry *ent, void *void_arg) 1749 { 1750 struct speed_down_verdict_arg *arg = void_arg; 1751 int cat; 1752 1753 if (ent->timestamp < arg->since) 1754 return -1; 1755 1756 cat = ata_eh_categorize_error(ent->eflags, ent->err_mask, 1757 &arg->xfer_ok); 1758 arg->nr_errors[cat]++; 1759 1760 return 0; 1761 } 1762 1763 /** 1764 * ata_eh_speed_down_verdict - Determine speed down verdict 1765 * @dev: Device of interest 1766 * 1767 * This function examines error ring of @dev and determines 1768 * whether NCQ needs to be turned off, transfer speed should be 1769 * stepped down, or falling back to PIO is necessary. 1770 * 1771 * ECAT_ATA_BUS : ATA_BUS error for any command 1772 * 1773 * ECAT_TOUT_HSM : TIMEOUT for any command or HSM violation for 1774 * IO commands 1775 * 1776 * ECAT_UNK_DEV : Unknown DEV error for IO commands 1777 * 1778 * ECAT_DUBIOUS_* : Identical to above three but occurred while 1779 * data transfer hasn't been verified. 1780 * 1781 * Verdicts are 1782 * 1783 * NCQ_OFF : Turn off NCQ. 1784 * 1785 * SPEED_DOWN : Speed down transfer speed but don't fall back 1786 * to PIO. 1787 * 1788 * FALLBACK_TO_PIO : Fall back to PIO. 1789 * 1790 * Even if multiple verdicts are returned, only one action is 1791 * taken per error. An action triggered by non-DUBIOUS errors 1792 * clears ering, while one triggered by DUBIOUS_* errors doesn't. 1793 * This is to expedite speed down decisions right after device is 1794 * initially configured. 1795 * 1796 * The followings are speed down rules. #1 and #2 deal with 1797 * DUBIOUS errors. 1798 * 1799 * 1. If more than one DUBIOUS_ATA_BUS or DUBIOUS_TOUT_HSM errors 1800 * occurred during last 5 mins, SPEED_DOWN and FALLBACK_TO_PIO. 1801 * 1802 * 2. If more than one DUBIOUS_TOUT_HSM or DUBIOUS_UNK_DEV errors 1803 * occurred during last 5 mins, NCQ_OFF. 1804 * 1805 * 3. If more than 8 ATA_BUS, TOUT_HSM or UNK_DEV errors 1806 * ocurred during last 5 mins, FALLBACK_TO_PIO 1807 * 1808 * 4. If more than 3 TOUT_HSM or UNK_DEV errors occurred 1809 * during last 10 mins, NCQ_OFF. 1810 * 1811 * 5. If more than 3 ATA_BUS or TOUT_HSM errors, or more than 6 1812 * UNK_DEV errors occurred during last 10 mins, SPEED_DOWN. 1813 * 1814 * LOCKING: 1815 * Inherited from caller. 1816 * 1817 * RETURNS: 1818 * OR of ATA_EH_SPDN_* flags. 1819 */ 1820 static unsigned int ata_eh_speed_down_verdict(struct ata_device *dev) 1821 { 1822 const u64 j5mins = 5LLU * 60 * HZ, j10mins = 10LLU * 60 * HZ; 1823 u64 j64 = get_jiffies_64(); 1824 struct speed_down_verdict_arg arg; 1825 unsigned int verdict = 0; 1826 1827 /* scan past 5 mins of error history */ 1828 memset(&arg, 0, sizeof(arg)); 1829 arg.since = j64 - min(j64, j5mins); 1830 ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg); 1831 1832 if (arg.nr_errors[ATA_ECAT_DUBIOUS_ATA_BUS] + 1833 arg.nr_errors[ATA_ECAT_DUBIOUS_TOUT_HSM] > 1) 1834 verdict |= ATA_EH_SPDN_SPEED_DOWN | 1835 ATA_EH_SPDN_FALLBACK_TO_PIO | ATA_EH_SPDN_KEEP_ERRORS; 1836 1837 if (arg.nr_errors[ATA_ECAT_DUBIOUS_TOUT_HSM] + 1838 arg.nr_errors[ATA_ECAT_DUBIOUS_UNK_DEV] > 1) 1839 verdict |= ATA_EH_SPDN_NCQ_OFF | ATA_EH_SPDN_KEEP_ERRORS; 1840 1841 if (arg.nr_errors[ATA_ECAT_ATA_BUS] + 1842 arg.nr_errors[ATA_ECAT_TOUT_HSM] + 1843 arg.nr_errors[ATA_ECAT_UNK_DEV] > 6) 1844 verdict |= ATA_EH_SPDN_FALLBACK_TO_PIO; 1845 1846 /* scan past 10 mins of error history */ 1847 memset(&arg, 0, sizeof(arg)); 1848 arg.since = j64 - min(j64, j10mins); 1849 ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg); 1850 1851 if (arg.nr_errors[ATA_ECAT_TOUT_HSM] + 1852 arg.nr_errors[ATA_ECAT_UNK_DEV] > 3) 1853 verdict |= ATA_EH_SPDN_NCQ_OFF; 1854 1855 if (arg.nr_errors[ATA_ECAT_ATA_BUS] + 1856 arg.nr_errors[ATA_ECAT_TOUT_HSM] > 3 || 1857 arg.nr_errors[ATA_ECAT_UNK_DEV] > 6) 1858 verdict |= ATA_EH_SPDN_SPEED_DOWN; 1859 1860 return verdict; 1861 } 1862 1863 /** 1864 * ata_eh_speed_down - record error and speed down if necessary 1865 * @dev: Failed device 1866 * @eflags: mask of ATA_EFLAG_* flags 1867 * @err_mask: err_mask of the error 1868 * 1869 * Record error and examine error history to determine whether 1870 * adjusting transmission speed is necessary. It also sets 1871 * transmission limits appropriately if such adjustment is 1872 * necessary. 1873 * 1874 * LOCKING: 1875 * Kernel thread context (may sleep). 1876 * 1877 * RETURNS: 1878 * Determined recovery action. 1879 */ 1880 static unsigned int ata_eh_speed_down(struct ata_device *dev, 1881 unsigned int eflags, unsigned int err_mask) 1882 { 1883 struct ata_link *link = ata_dev_phys_link(dev); 1884 int xfer_ok = 0; 1885 unsigned int verdict; 1886 unsigned int action = 0; 1887 1888 /* don't bother if Cat-0 error */ 1889 if (ata_eh_categorize_error(eflags, err_mask, &xfer_ok) == 0) 1890 return 0; 1891 1892 /* record error and determine whether speed down is necessary */ 1893 ata_ering_record(&dev->ering, eflags, err_mask); 1894 verdict = ata_eh_speed_down_verdict(dev); 1895 1896 /* turn off NCQ? */ 1897 if ((verdict & ATA_EH_SPDN_NCQ_OFF) && 1898 (dev->flags & (ATA_DFLAG_PIO | ATA_DFLAG_NCQ | 1899 ATA_DFLAG_NCQ_OFF)) == ATA_DFLAG_NCQ) { 1900 dev->flags |= ATA_DFLAG_NCQ_OFF; 1901 ata_dev_printk(dev, KERN_WARNING, 1902 "NCQ disabled due to excessive errors\n"); 1903 goto done; 1904 } 1905 1906 /* speed down? */ 1907 if (verdict & ATA_EH_SPDN_SPEED_DOWN) { 1908 /* speed down SATA link speed if possible */ 1909 if (sata_down_spd_limit(link, 0) == 0) { 1910 action |= ATA_EH_RESET; 1911 goto done; 1912 } 1913 1914 /* lower transfer mode */ 1915 if (dev->spdn_cnt < 2) { 1916 static const int dma_dnxfer_sel[] = 1917 { ATA_DNXFER_DMA, ATA_DNXFER_40C }; 1918 static const int pio_dnxfer_sel[] = 1919 { ATA_DNXFER_PIO, ATA_DNXFER_FORCE_PIO0 }; 1920 int sel; 1921 1922 if (dev->xfer_shift != ATA_SHIFT_PIO) 1923 sel = dma_dnxfer_sel[dev->spdn_cnt]; 1924 else 1925 sel = pio_dnxfer_sel[dev->spdn_cnt]; 1926 1927 dev->spdn_cnt++; 1928 1929 if (ata_down_xfermask_limit(dev, sel) == 0) { 1930 action |= ATA_EH_RESET; 1931 goto done; 1932 } 1933 } 1934 } 1935 1936 /* Fall back to PIO? Slowing down to PIO is meaningless for 1937 * SATA ATA devices. Consider it only for PATA and SATAPI. 1938 */ 1939 if ((verdict & ATA_EH_SPDN_FALLBACK_TO_PIO) && (dev->spdn_cnt >= 2) && 1940 (link->ap->cbl != ATA_CBL_SATA || dev->class == ATA_DEV_ATAPI) && 1941 (dev->xfer_shift != ATA_SHIFT_PIO)) { 1942 if (ata_down_xfermask_limit(dev, ATA_DNXFER_FORCE_PIO) == 0) { 1943 dev->spdn_cnt = 0; 1944 action |= ATA_EH_RESET; 1945 goto done; 1946 } 1947 } 1948 1949 return 0; 1950 done: 1951 /* device has been slowed down, blow error history */ 1952 if (!(verdict & ATA_EH_SPDN_KEEP_ERRORS)) 1953 ata_ering_clear(&dev->ering); 1954 return action; 1955 } 1956 1957 /** 1958 * ata_eh_link_autopsy - analyze error and determine recovery action 1959 * @link: host link to perform autopsy on 1960 * 1961 * Analyze why @link failed and determine which recovery actions 1962 * are needed. This function also sets more detailed AC_ERR_* 1963 * values and fills sense data for ATAPI CHECK SENSE. 1964 * 1965 * LOCKING: 1966 * Kernel thread context (may sleep). 1967 */ 1968 static void ata_eh_link_autopsy(struct ata_link *link) 1969 { 1970 struct ata_port *ap = link->ap; 1971 struct ata_eh_context *ehc = &link->eh_context; 1972 struct ata_device *dev; 1973 unsigned int all_err_mask = 0, eflags = 0; 1974 int tag; 1975 u32 serror; 1976 int rc; 1977 1978 DPRINTK("ENTER\n"); 1979 1980 if (ehc->i.flags & ATA_EHI_NO_AUTOPSY) 1981 return; 1982 1983 /* obtain and analyze SError */ 1984 rc = sata_scr_read(link, SCR_ERROR, &serror); 1985 if (rc == 0) { 1986 ehc->i.serror |= serror; 1987 ata_eh_analyze_serror(link); 1988 } else if (rc != -EOPNOTSUPP) { 1989 /* SError read failed, force reset and probing */ 1990 ehc->i.probe_mask |= ATA_ALL_DEVICES; 1991 ehc->i.action |= ATA_EH_RESET; 1992 ehc->i.err_mask |= AC_ERR_OTHER; 1993 } 1994 1995 /* analyze NCQ failure */ 1996 ata_eh_analyze_ncq_error(link); 1997 1998 /* any real error trumps AC_ERR_OTHER */ 1999 if (ehc->i.err_mask & ~AC_ERR_OTHER) 2000 ehc->i.err_mask &= ~AC_ERR_OTHER; 2001 2002 all_err_mask |= ehc->i.err_mask; 2003 2004 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 2005 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 2006 2007 if (!(qc->flags & ATA_QCFLAG_FAILED) || 2008 ata_dev_phys_link(qc->dev) != link) 2009 continue; 2010 2011 /* inherit upper level err_mask */ 2012 qc->err_mask |= ehc->i.err_mask; 2013 2014 /* analyze TF */ 2015 ehc->i.action |= ata_eh_analyze_tf(qc, &qc->result_tf); 2016 2017 /* DEV errors are probably spurious in case of ATA_BUS error */ 2018 if (qc->err_mask & AC_ERR_ATA_BUS) 2019 qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_MEDIA | 2020 AC_ERR_INVALID); 2021 2022 /* any real error trumps unknown error */ 2023 if (qc->err_mask & ~AC_ERR_OTHER) 2024 qc->err_mask &= ~AC_ERR_OTHER; 2025 2026 /* SENSE_VALID trumps dev/unknown error and revalidation */ 2027 if (qc->flags & ATA_QCFLAG_SENSE_VALID) 2028 qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_OTHER); 2029 2030 /* determine whether the command is worth retrying */ 2031 if (!(qc->err_mask & AC_ERR_INVALID) && 2032 ((qc->flags & ATA_QCFLAG_IO) || qc->err_mask != AC_ERR_DEV)) 2033 qc->flags |= ATA_QCFLAG_RETRY; 2034 2035 /* accumulate error info */ 2036 ehc->i.dev = qc->dev; 2037 all_err_mask |= qc->err_mask; 2038 if (qc->flags & ATA_QCFLAG_IO) 2039 eflags |= ATA_EFLAG_IS_IO; 2040 } 2041 2042 /* enforce default EH actions */ 2043 if (ap->pflags & ATA_PFLAG_FROZEN || 2044 all_err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT)) 2045 ehc->i.action |= ATA_EH_RESET; 2046 else if (((eflags & ATA_EFLAG_IS_IO) && all_err_mask) || 2047 (!(eflags & ATA_EFLAG_IS_IO) && (all_err_mask & ~AC_ERR_DEV))) 2048 ehc->i.action |= ATA_EH_REVALIDATE; 2049 2050 /* If we have offending qcs and the associated failed device, 2051 * perform per-dev EH action only on the offending device. 2052 */ 2053 if (ehc->i.dev) { 2054 ehc->i.dev_action[ehc->i.dev->devno] |= 2055 ehc->i.action & ATA_EH_PERDEV_MASK; 2056 ehc->i.action &= ~ATA_EH_PERDEV_MASK; 2057 } 2058 2059 /* propagate timeout to host link */ 2060 if ((all_err_mask & AC_ERR_TIMEOUT) && !ata_is_host_link(link)) 2061 ap->link.eh_context.i.err_mask |= AC_ERR_TIMEOUT; 2062 2063 /* record error and consider speeding down */ 2064 dev = ehc->i.dev; 2065 if (!dev && ((ata_link_max_devices(link) == 1 && 2066 ata_dev_enabled(link->device)))) 2067 dev = link->device; 2068 2069 if (dev) { 2070 if (dev->flags & ATA_DFLAG_DUBIOUS_XFER) 2071 eflags |= ATA_EFLAG_DUBIOUS_XFER; 2072 ehc->i.action |= ata_eh_speed_down(dev, eflags, all_err_mask); 2073 } 2074 2075 DPRINTK("EXIT\n"); 2076 } 2077 2078 /** 2079 * ata_eh_autopsy - analyze error and determine recovery action 2080 * @ap: host port to perform autopsy on 2081 * 2082 * Analyze all links of @ap and determine why they failed and 2083 * which recovery actions are needed. 2084 * 2085 * LOCKING: 2086 * Kernel thread context (may sleep). 2087 */ 2088 void ata_eh_autopsy(struct ata_port *ap) 2089 { 2090 struct ata_link *link; 2091 2092 ata_for_each_link(link, ap, EDGE) 2093 ata_eh_link_autopsy(link); 2094 2095 /* Handle the frigging slave link. Autopsy is done similarly 2096 * but actions and flags are transferred over to the master 2097 * link and handled from there. 2098 */ 2099 if (ap->slave_link) { 2100 struct ata_eh_context *mehc = &ap->link.eh_context; 2101 struct ata_eh_context *sehc = &ap->slave_link->eh_context; 2102 2103 /* transfer control flags from master to slave */ 2104 sehc->i.flags |= mehc->i.flags & ATA_EHI_TO_SLAVE_MASK; 2105 2106 /* perform autopsy on the slave link */ 2107 ata_eh_link_autopsy(ap->slave_link); 2108 2109 /* transfer actions from slave to master and clear slave */ 2110 ata_eh_about_to_do(ap->slave_link, NULL, ATA_EH_ALL_ACTIONS); 2111 mehc->i.action |= sehc->i.action; 2112 mehc->i.dev_action[1] |= sehc->i.dev_action[1]; 2113 mehc->i.flags |= sehc->i.flags; 2114 ata_eh_done(ap->slave_link, NULL, ATA_EH_ALL_ACTIONS); 2115 } 2116 2117 /* Autopsy of fanout ports can affect host link autopsy. 2118 * Perform host link autopsy last. 2119 */ 2120 if (sata_pmp_attached(ap)) 2121 ata_eh_link_autopsy(&ap->link); 2122 } 2123 2124 /** 2125 * ata_get_cmd_descript - get description for ATA command 2126 * @command: ATA command code to get description for 2127 * 2128 * Return a textual description of the given command, or NULL if the 2129 * command is not known. 2130 * 2131 * LOCKING: 2132 * None 2133 */ 2134 const char *ata_get_cmd_descript(u8 command) 2135 { 2136 #ifdef CONFIG_ATA_VERBOSE_ERROR 2137 static const struct 2138 { 2139 u8 command; 2140 const char *text; 2141 } cmd_descr[] = { 2142 { ATA_CMD_DEV_RESET, "DEVICE RESET" }, 2143 { ATA_CMD_CHK_POWER, "CHECK POWER MODE" }, 2144 { ATA_CMD_STANDBY, "STANDBY" }, 2145 { ATA_CMD_IDLE, "IDLE" }, 2146 { ATA_CMD_EDD, "EXECUTE DEVICE DIAGNOSTIC" }, 2147 { ATA_CMD_DOWNLOAD_MICRO, "DOWNLOAD MICROCODE" }, 2148 { ATA_CMD_NOP, "NOP" }, 2149 { ATA_CMD_FLUSH, "FLUSH CACHE" }, 2150 { ATA_CMD_FLUSH_EXT, "FLUSH CACHE EXT" }, 2151 { ATA_CMD_ID_ATA, "IDENTIFY DEVICE" }, 2152 { ATA_CMD_ID_ATAPI, "IDENTIFY PACKET DEVICE" }, 2153 { ATA_CMD_SERVICE, "SERVICE" }, 2154 { ATA_CMD_READ, "READ DMA" }, 2155 { ATA_CMD_READ_EXT, "READ DMA EXT" }, 2156 { ATA_CMD_READ_QUEUED, "READ DMA QUEUED" }, 2157 { ATA_CMD_READ_STREAM_EXT, "READ STREAM EXT" }, 2158 { ATA_CMD_READ_STREAM_DMA_EXT, "READ STREAM DMA EXT" }, 2159 { ATA_CMD_WRITE, "WRITE DMA" }, 2160 { ATA_CMD_WRITE_EXT, "WRITE DMA EXT" }, 2161 { ATA_CMD_WRITE_QUEUED, "WRITE DMA QUEUED EXT" }, 2162 { ATA_CMD_WRITE_STREAM_EXT, "WRITE STREAM EXT" }, 2163 { ATA_CMD_WRITE_STREAM_DMA_EXT, "WRITE STREAM DMA EXT" }, 2164 { ATA_CMD_WRITE_FUA_EXT, "WRITE DMA FUA EXT" }, 2165 { ATA_CMD_WRITE_QUEUED_FUA_EXT, "WRITE DMA QUEUED FUA EXT" }, 2166 { ATA_CMD_FPDMA_READ, "READ FPDMA QUEUED" }, 2167 { ATA_CMD_FPDMA_WRITE, "WRITE FPDMA QUEUED" }, 2168 { ATA_CMD_PIO_READ, "READ SECTOR(S)" }, 2169 { ATA_CMD_PIO_READ_EXT, "READ SECTOR(S) EXT" }, 2170 { ATA_CMD_PIO_WRITE, "WRITE SECTOR(S)" }, 2171 { ATA_CMD_PIO_WRITE_EXT, "WRITE SECTOR(S) EXT" }, 2172 { ATA_CMD_READ_MULTI, "READ MULTIPLE" }, 2173 { ATA_CMD_READ_MULTI_EXT, "READ MULTIPLE EXT" }, 2174 { ATA_CMD_WRITE_MULTI, "WRITE MULTIPLE" }, 2175 { ATA_CMD_WRITE_MULTI_EXT, "WRITE MULTIPLE EXT" }, 2176 { ATA_CMD_WRITE_MULTI_FUA_EXT, "WRITE MULTIPLE FUA EXT" }, 2177 { ATA_CMD_SET_FEATURES, "SET FEATURES" }, 2178 { ATA_CMD_SET_MULTI, "SET MULTIPLE MODE" }, 2179 { ATA_CMD_VERIFY, "READ VERIFY SECTOR(S)" }, 2180 { ATA_CMD_VERIFY_EXT, "READ VERIFY SECTOR(S) EXT" }, 2181 { ATA_CMD_WRITE_UNCORR_EXT, "WRITE UNCORRECTABLE EXT" }, 2182 { ATA_CMD_STANDBYNOW1, "STANDBY IMMEDIATE" }, 2183 { ATA_CMD_IDLEIMMEDIATE, "IDLE IMMEDIATE" }, 2184 { ATA_CMD_SLEEP, "SLEEP" }, 2185 { ATA_CMD_INIT_DEV_PARAMS, "INITIALIZE DEVICE PARAMETERS" }, 2186 { ATA_CMD_READ_NATIVE_MAX, "READ NATIVE MAX ADDRESS" }, 2187 { ATA_CMD_READ_NATIVE_MAX_EXT, "READ NATIVE MAX ADDRESS EXT" }, 2188 { ATA_CMD_SET_MAX, "SET MAX ADDRESS" }, 2189 { ATA_CMD_SET_MAX_EXT, "SET MAX ADDRESS EXT" }, 2190 { ATA_CMD_READ_LOG_EXT, "READ LOG EXT" }, 2191 { ATA_CMD_WRITE_LOG_EXT, "WRITE LOG EXT" }, 2192 { ATA_CMD_READ_LOG_DMA_EXT, "READ LOG DMA EXT" }, 2193 { ATA_CMD_WRITE_LOG_DMA_EXT, "WRITE LOG DMA EXT" }, 2194 { ATA_CMD_TRUSTED_RCV, "TRUSTED RECEIVE" }, 2195 { ATA_CMD_TRUSTED_RCV_DMA, "TRUSTED RECEIVE DMA" }, 2196 { ATA_CMD_TRUSTED_SND, "TRUSTED SEND" }, 2197 { ATA_CMD_TRUSTED_SND_DMA, "TRUSTED SEND DMA" }, 2198 { ATA_CMD_PMP_READ, "READ BUFFER" }, 2199 { ATA_CMD_PMP_WRITE, "WRITE BUFFER" }, 2200 { ATA_CMD_CONF_OVERLAY, "DEVICE CONFIGURATION OVERLAY" }, 2201 { ATA_CMD_SEC_SET_PASS, "SECURITY SET PASSWORD" }, 2202 { ATA_CMD_SEC_UNLOCK, "SECURITY UNLOCK" }, 2203 { ATA_CMD_SEC_ERASE_PREP, "SECURITY ERASE PREPARE" }, 2204 { ATA_CMD_SEC_ERASE_UNIT, "SECURITY ERASE UNIT" }, 2205 { ATA_CMD_SEC_FREEZE_LOCK, "SECURITY FREEZE LOCK" }, 2206 { ATA_CMD_SEC_DISABLE_PASS, "SECURITY DISABLE PASSWORD" }, 2207 { ATA_CMD_CONFIG_STREAM, "CONFIGURE STREAM" }, 2208 { ATA_CMD_SMART, "SMART" }, 2209 { ATA_CMD_MEDIA_LOCK, "DOOR LOCK" }, 2210 { ATA_CMD_MEDIA_UNLOCK, "DOOR UNLOCK" }, 2211 { ATA_CMD_CHK_MED_CRD_TYP, "CHECK MEDIA CARD TYPE" }, 2212 { ATA_CMD_CFA_REQ_EXT_ERR, "CFA REQUEST EXTENDED ERROR" }, 2213 { ATA_CMD_CFA_WRITE_NE, "CFA WRITE SECTORS WITHOUT ERASE" }, 2214 { ATA_CMD_CFA_TRANS_SECT, "CFA TRANSLATE SECTOR" }, 2215 { ATA_CMD_CFA_ERASE, "CFA ERASE SECTORS" }, 2216 { ATA_CMD_CFA_WRITE_MULT_NE, "CFA WRITE MULTIPLE WITHOUT ERASE" }, 2217 { ATA_CMD_READ_LONG, "READ LONG (with retries)" }, 2218 { ATA_CMD_READ_LONG_ONCE, "READ LONG (without retries)" }, 2219 { ATA_CMD_WRITE_LONG, "WRITE LONG (with retries)" }, 2220 { ATA_CMD_WRITE_LONG_ONCE, "WRITE LONG (without retries)" }, 2221 { ATA_CMD_RESTORE, "RECALIBRATE" }, 2222 { 0, NULL } /* terminate list */ 2223 }; 2224 2225 unsigned int i; 2226 for (i = 0; cmd_descr[i].text; i++) 2227 if (cmd_descr[i].command == command) 2228 return cmd_descr[i].text; 2229 #endif 2230 2231 return NULL; 2232 } 2233 2234 /** 2235 * ata_eh_link_report - report error handling to user 2236 * @link: ATA link EH is going on 2237 * 2238 * Report EH to user. 2239 * 2240 * LOCKING: 2241 * None. 2242 */ 2243 static void ata_eh_link_report(struct ata_link *link) 2244 { 2245 struct ata_port *ap = link->ap; 2246 struct ata_eh_context *ehc = &link->eh_context; 2247 const char *frozen, *desc; 2248 char tries_buf[6]; 2249 int tag, nr_failed = 0; 2250 2251 if (ehc->i.flags & ATA_EHI_QUIET) 2252 return; 2253 2254 desc = NULL; 2255 if (ehc->i.desc[0] != '\0') 2256 desc = ehc->i.desc; 2257 2258 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 2259 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 2260 2261 if (!(qc->flags & ATA_QCFLAG_FAILED) || 2262 ata_dev_phys_link(qc->dev) != link || 2263 ((qc->flags & ATA_QCFLAG_QUIET) && 2264 qc->err_mask == AC_ERR_DEV)) 2265 continue; 2266 if (qc->flags & ATA_QCFLAG_SENSE_VALID && !qc->err_mask) 2267 continue; 2268 2269 nr_failed++; 2270 } 2271 2272 if (!nr_failed && !ehc->i.err_mask) 2273 return; 2274 2275 frozen = ""; 2276 if (ap->pflags & ATA_PFLAG_FROZEN) 2277 frozen = " frozen"; 2278 2279 memset(tries_buf, 0, sizeof(tries_buf)); 2280 if (ap->eh_tries < ATA_EH_MAX_TRIES) 2281 snprintf(tries_buf, sizeof(tries_buf) - 1, " t%d", 2282 ap->eh_tries); 2283 2284 if (ehc->i.dev) { 2285 ata_dev_printk(ehc->i.dev, KERN_ERR, "exception Emask 0x%x " 2286 "SAct 0x%x SErr 0x%x action 0x%x%s%s\n", 2287 ehc->i.err_mask, link->sactive, ehc->i.serror, 2288 ehc->i.action, frozen, tries_buf); 2289 if (desc) 2290 ata_dev_printk(ehc->i.dev, KERN_ERR, "%s\n", desc); 2291 } else { 2292 ata_link_printk(link, KERN_ERR, "exception Emask 0x%x " 2293 "SAct 0x%x SErr 0x%x action 0x%x%s%s\n", 2294 ehc->i.err_mask, link->sactive, ehc->i.serror, 2295 ehc->i.action, frozen, tries_buf); 2296 if (desc) 2297 ata_link_printk(link, KERN_ERR, "%s\n", desc); 2298 } 2299 2300 #ifdef CONFIG_ATA_VERBOSE_ERROR 2301 if (ehc->i.serror) 2302 ata_link_printk(link, KERN_ERR, 2303 "SError: { %s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s}\n", 2304 ehc->i.serror & SERR_DATA_RECOVERED ? "RecovData " : "", 2305 ehc->i.serror & SERR_COMM_RECOVERED ? "RecovComm " : "", 2306 ehc->i.serror & SERR_DATA ? "UnrecovData " : "", 2307 ehc->i.serror & SERR_PERSISTENT ? "Persist " : "", 2308 ehc->i.serror & SERR_PROTOCOL ? "Proto " : "", 2309 ehc->i.serror & SERR_INTERNAL ? "HostInt " : "", 2310 ehc->i.serror & SERR_PHYRDY_CHG ? "PHYRdyChg " : "", 2311 ehc->i.serror & SERR_PHY_INT_ERR ? "PHYInt " : "", 2312 ehc->i.serror & SERR_COMM_WAKE ? "CommWake " : "", 2313 ehc->i.serror & SERR_10B_8B_ERR ? "10B8B " : "", 2314 ehc->i.serror & SERR_DISPARITY ? "Dispar " : "", 2315 ehc->i.serror & SERR_CRC ? "BadCRC " : "", 2316 ehc->i.serror & SERR_HANDSHAKE ? "Handshk " : "", 2317 ehc->i.serror & SERR_LINK_SEQ_ERR ? "LinkSeq " : "", 2318 ehc->i.serror & SERR_TRANS_ST_ERROR ? "TrStaTrns " : "", 2319 ehc->i.serror & SERR_UNRECOG_FIS ? "UnrecFIS " : "", 2320 ehc->i.serror & SERR_DEV_XCHG ? "DevExch " : ""); 2321 #endif 2322 2323 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 2324 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 2325 struct ata_taskfile *cmd = &qc->tf, *res = &qc->result_tf; 2326 const u8 *cdb = qc->cdb; 2327 char data_buf[20] = ""; 2328 char cdb_buf[70] = ""; 2329 2330 if (!(qc->flags & ATA_QCFLAG_FAILED) || 2331 ata_dev_phys_link(qc->dev) != link || !qc->err_mask) 2332 continue; 2333 2334 if (qc->dma_dir != DMA_NONE) { 2335 static const char *dma_str[] = { 2336 [DMA_BIDIRECTIONAL] = "bidi", 2337 [DMA_TO_DEVICE] = "out", 2338 [DMA_FROM_DEVICE] = "in", 2339 }; 2340 static const char *prot_str[] = { 2341 [ATA_PROT_PIO] = "pio", 2342 [ATA_PROT_DMA] = "dma", 2343 [ATA_PROT_NCQ] = "ncq", 2344 [ATAPI_PROT_PIO] = "pio", 2345 [ATAPI_PROT_DMA] = "dma", 2346 }; 2347 2348 snprintf(data_buf, sizeof(data_buf), " %s %u %s", 2349 prot_str[qc->tf.protocol], qc->nbytes, 2350 dma_str[qc->dma_dir]); 2351 } 2352 2353 if (ata_is_atapi(qc->tf.protocol)) { 2354 if (qc->scsicmd) 2355 scsi_print_command(qc->scsicmd); 2356 else 2357 snprintf(cdb_buf, sizeof(cdb_buf), 2358 "cdb %02x %02x %02x %02x %02x %02x %02x %02x " 2359 "%02x %02x %02x %02x %02x %02x %02x %02x\n ", 2360 cdb[0], cdb[1], cdb[2], cdb[3], 2361 cdb[4], cdb[5], cdb[6], cdb[7], 2362 cdb[8], cdb[9], cdb[10], cdb[11], 2363 cdb[12], cdb[13], cdb[14], cdb[15]); 2364 } else { 2365 const char *descr = ata_get_cmd_descript(cmd->command); 2366 if (descr) 2367 ata_dev_printk(qc->dev, KERN_ERR, 2368 "failed command: %s\n", descr); 2369 } 2370 2371 ata_dev_printk(qc->dev, KERN_ERR, 2372 "cmd %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x " 2373 "tag %d%s\n %s" 2374 "res %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x " 2375 "Emask 0x%x (%s)%s\n", 2376 cmd->command, cmd->feature, cmd->nsect, 2377 cmd->lbal, cmd->lbam, cmd->lbah, 2378 cmd->hob_feature, cmd->hob_nsect, 2379 cmd->hob_lbal, cmd->hob_lbam, cmd->hob_lbah, 2380 cmd->device, qc->tag, data_buf, cdb_buf, 2381 res->command, res->feature, res->nsect, 2382 res->lbal, res->lbam, res->lbah, 2383 res->hob_feature, res->hob_nsect, 2384 res->hob_lbal, res->hob_lbam, res->hob_lbah, 2385 res->device, qc->err_mask, ata_err_string(qc->err_mask), 2386 qc->err_mask & AC_ERR_NCQ ? " <F>" : ""); 2387 2388 #ifdef CONFIG_ATA_VERBOSE_ERROR 2389 if (res->command & (ATA_BUSY | ATA_DRDY | ATA_DF | ATA_DRQ | 2390 ATA_ERR)) { 2391 if (res->command & ATA_BUSY) 2392 ata_dev_printk(qc->dev, KERN_ERR, 2393 "status: { Busy }\n"); 2394 else 2395 ata_dev_printk(qc->dev, KERN_ERR, 2396 "status: { %s%s%s%s}\n", 2397 res->command & ATA_DRDY ? "DRDY " : "", 2398 res->command & ATA_DF ? "DF " : "", 2399 res->command & ATA_DRQ ? "DRQ " : "", 2400 res->command & ATA_ERR ? "ERR " : ""); 2401 } 2402 2403 if (cmd->command != ATA_CMD_PACKET && 2404 (res->feature & (ATA_ICRC | ATA_UNC | ATA_IDNF | 2405 ATA_ABORTED))) 2406 ata_dev_printk(qc->dev, KERN_ERR, 2407 "error: { %s%s%s%s}\n", 2408 res->feature & ATA_ICRC ? "ICRC " : "", 2409 res->feature & ATA_UNC ? "UNC " : "", 2410 res->feature & ATA_IDNF ? "IDNF " : "", 2411 res->feature & ATA_ABORTED ? "ABRT " : ""); 2412 #endif 2413 } 2414 } 2415 2416 /** 2417 * ata_eh_report - report error handling to user 2418 * @ap: ATA port to report EH about 2419 * 2420 * Report EH to user. 2421 * 2422 * LOCKING: 2423 * None. 2424 */ 2425 void ata_eh_report(struct ata_port *ap) 2426 { 2427 struct ata_link *link; 2428 2429 ata_for_each_link(link, ap, HOST_FIRST) 2430 ata_eh_link_report(link); 2431 } 2432 2433 static int ata_do_reset(struct ata_link *link, ata_reset_fn_t reset, 2434 unsigned int *classes, unsigned long deadline, 2435 bool clear_classes) 2436 { 2437 struct ata_device *dev; 2438 2439 if (clear_classes) 2440 ata_for_each_dev(dev, link, ALL) 2441 classes[dev->devno] = ATA_DEV_UNKNOWN; 2442 2443 return reset(link, classes, deadline); 2444 } 2445 2446 static int ata_eh_followup_srst_needed(struct ata_link *link, 2447 int rc, const unsigned int *classes) 2448 { 2449 if ((link->flags & ATA_LFLAG_NO_SRST) || ata_link_offline(link)) 2450 return 0; 2451 if (rc == -EAGAIN) 2452 return 1; 2453 if (sata_pmp_supported(link->ap) && ata_is_host_link(link)) 2454 return 1; 2455 return 0; 2456 } 2457 2458 int ata_eh_reset(struct ata_link *link, int classify, 2459 ata_prereset_fn_t prereset, ata_reset_fn_t softreset, 2460 ata_reset_fn_t hardreset, ata_postreset_fn_t postreset) 2461 { 2462 struct ata_port *ap = link->ap; 2463 struct ata_link *slave = ap->slave_link; 2464 struct ata_eh_context *ehc = &link->eh_context; 2465 struct ata_eh_context *sehc = slave ? &slave->eh_context : NULL; 2466 unsigned int *classes = ehc->classes; 2467 unsigned int lflags = link->flags; 2468 int verbose = !(ehc->i.flags & ATA_EHI_QUIET); 2469 int max_tries = 0, try = 0; 2470 struct ata_link *failed_link; 2471 struct ata_device *dev; 2472 unsigned long deadline, now; 2473 ata_reset_fn_t reset; 2474 unsigned long flags; 2475 u32 sstatus; 2476 int nr_unknown, rc; 2477 2478 /* 2479 * Prepare to reset 2480 */ 2481 while (ata_eh_reset_timeouts[max_tries] != ULONG_MAX) 2482 max_tries++; 2483 if (link->flags & ATA_LFLAG_NO_HRST) 2484 hardreset = NULL; 2485 if (link->flags & ATA_LFLAG_NO_SRST) 2486 softreset = NULL; 2487 2488 /* make sure each reset attemp is at least COOL_DOWN apart */ 2489 if (ehc->i.flags & ATA_EHI_DID_RESET) { 2490 now = jiffies; 2491 WARN_ON(time_after(ehc->last_reset, now)); 2492 deadline = ata_deadline(ehc->last_reset, 2493 ATA_EH_RESET_COOL_DOWN); 2494 if (time_before(now, deadline)) 2495 schedule_timeout_uninterruptible(deadline - now); 2496 } 2497 2498 spin_lock_irqsave(ap->lock, flags); 2499 ap->pflags |= ATA_PFLAG_RESETTING; 2500 spin_unlock_irqrestore(ap->lock, flags); 2501 2502 ata_eh_about_to_do(link, NULL, ATA_EH_RESET); 2503 2504 ata_for_each_dev(dev, link, ALL) { 2505 /* If we issue an SRST then an ATA drive (not ATAPI) 2506 * may change configuration and be in PIO0 timing. If 2507 * we do a hard reset (or are coming from power on) 2508 * this is true for ATA or ATAPI. Until we've set a 2509 * suitable controller mode we should not touch the 2510 * bus as we may be talking too fast. 2511 */ 2512 dev->pio_mode = XFER_PIO_0; 2513 2514 /* If the controller has a pio mode setup function 2515 * then use it to set the chipset to rights. Don't 2516 * touch the DMA setup as that will be dealt with when 2517 * configuring devices. 2518 */ 2519 if (ap->ops->set_piomode) 2520 ap->ops->set_piomode(ap, dev); 2521 } 2522 2523 /* prefer hardreset */ 2524 reset = NULL; 2525 ehc->i.action &= ~ATA_EH_RESET; 2526 if (hardreset) { 2527 reset = hardreset; 2528 ehc->i.action |= ATA_EH_HARDRESET; 2529 } else if (softreset) { 2530 reset = softreset; 2531 ehc->i.action |= ATA_EH_SOFTRESET; 2532 } 2533 2534 if (prereset) { 2535 unsigned long deadline = ata_deadline(jiffies, 2536 ATA_EH_PRERESET_TIMEOUT); 2537 2538 if (slave) { 2539 sehc->i.action &= ~ATA_EH_RESET; 2540 sehc->i.action |= ehc->i.action; 2541 } 2542 2543 rc = prereset(link, deadline); 2544 2545 /* If present, do prereset on slave link too. Reset 2546 * is skipped iff both master and slave links report 2547 * -ENOENT or clear ATA_EH_RESET. 2548 */ 2549 if (slave && (rc == 0 || rc == -ENOENT)) { 2550 int tmp; 2551 2552 tmp = prereset(slave, deadline); 2553 if (tmp != -ENOENT) 2554 rc = tmp; 2555 2556 ehc->i.action |= sehc->i.action; 2557 } 2558 2559 if (rc) { 2560 if (rc == -ENOENT) { 2561 ata_link_printk(link, KERN_DEBUG, 2562 "port disabled. ignoring.\n"); 2563 ehc->i.action &= ~ATA_EH_RESET; 2564 2565 ata_for_each_dev(dev, link, ALL) 2566 classes[dev->devno] = ATA_DEV_NONE; 2567 2568 rc = 0; 2569 } else 2570 ata_link_printk(link, KERN_ERR, 2571 "prereset failed (errno=%d)\n", rc); 2572 goto out; 2573 } 2574 2575 /* prereset() might have cleared ATA_EH_RESET. If so, 2576 * bang classes, thaw and return. 2577 */ 2578 if (reset && !(ehc->i.action & ATA_EH_RESET)) { 2579 ata_for_each_dev(dev, link, ALL) 2580 classes[dev->devno] = ATA_DEV_NONE; 2581 if ((ap->pflags & ATA_PFLAG_FROZEN) && 2582 ata_is_host_link(link)) 2583 ata_eh_thaw_port(ap); 2584 rc = 0; 2585 goto out; 2586 } 2587 } 2588 2589 retry: 2590 /* 2591 * Perform reset 2592 */ 2593 if (ata_is_host_link(link)) 2594 ata_eh_freeze_port(ap); 2595 2596 deadline = ata_deadline(jiffies, ata_eh_reset_timeouts[try++]); 2597 2598 if (reset) { 2599 if (verbose) 2600 ata_link_printk(link, KERN_INFO, "%s resetting link\n", 2601 reset == softreset ? "soft" : "hard"); 2602 2603 /* mark that this EH session started with reset */ 2604 ehc->last_reset = jiffies; 2605 if (reset == hardreset) 2606 ehc->i.flags |= ATA_EHI_DID_HARDRESET; 2607 else 2608 ehc->i.flags |= ATA_EHI_DID_SOFTRESET; 2609 2610 rc = ata_do_reset(link, reset, classes, deadline, true); 2611 if (rc && rc != -EAGAIN) { 2612 failed_link = link; 2613 goto fail; 2614 } 2615 2616 /* hardreset slave link if existent */ 2617 if (slave && reset == hardreset) { 2618 int tmp; 2619 2620 if (verbose) 2621 ata_link_printk(slave, KERN_INFO, 2622 "hard resetting link\n"); 2623 2624 ata_eh_about_to_do(slave, NULL, ATA_EH_RESET); 2625 tmp = ata_do_reset(slave, reset, classes, deadline, 2626 false); 2627 switch (tmp) { 2628 case -EAGAIN: 2629 rc = -EAGAIN; 2630 case 0: 2631 break; 2632 default: 2633 failed_link = slave; 2634 rc = tmp; 2635 goto fail; 2636 } 2637 } 2638 2639 /* perform follow-up SRST if necessary */ 2640 if (reset == hardreset && 2641 ata_eh_followup_srst_needed(link, rc, classes)) { 2642 reset = softreset; 2643 2644 if (!reset) { 2645 ata_link_printk(link, KERN_ERR, 2646 "follow-up softreset required " 2647 "but no softreset avaliable\n"); 2648 failed_link = link; 2649 rc = -EINVAL; 2650 goto fail; 2651 } 2652 2653 ata_eh_about_to_do(link, NULL, ATA_EH_RESET); 2654 rc = ata_do_reset(link, reset, classes, deadline, true); 2655 if (rc) { 2656 failed_link = link; 2657 goto fail; 2658 } 2659 } 2660 } else { 2661 if (verbose) 2662 ata_link_printk(link, KERN_INFO, "no reset method " 2663 "available, skipping reset\n"); 2664 if (!(lflags & ATA_LFLAG_ASSUME_CLASS)) 2665 lflags |= ATA_LFLAG_ASSUME_ATA; 2666 } 2667 2668 /* 2669 * Post-reset processing 2670 */ 2671 ata_for_each_dev(dev, link, ALL) { 2672 /* After the reset, the device state is PIO 0 and the 2673 * controller state is undefined. Reset also wakes up 2674 * drives from sleeping mode. 2675 */ 2676 dev->pio_mode = XFER_PIO_0; 2677 dev->flags &= ~ATA_DFLAG_SLEEPING; 2678 2679 if (ata_phys_link_offline(ata_dev_phys_link(dev))) 2680 continue; 2681 2682 /* apply class override */ 2683 if (lflags & ATA_LFLAG_ASSUME_ATA) 2684 classes[dev->devno] = ATA_DEV_ATA; 2685 else if (lflags & ATA_LFLAG_ASSUME_SEMB) 2686 classes[dev->devno] = ATA_DEV_SEMB_UNSUP; 2687 } 2688 2689 /* record current link speed */ 2690 if (sata_scr_read(link, SCR_STATUS, &sstatus) == 0) 2691 link->sata_spd = (sstatus >> 4) & 0xf; 2692 if (slave && sata_scr_read(slave, SCR_STATUS, &sstatus) == 0) 2693 slave->sata_spd = (sstatus >> 4) & 0xf; 2694 2695 /* thaw the port */ 2696 if (ata_is_host_link(link)) 2697 ata_eh_thaw_port(ap); 2698 2699 /* postreset() should clear hardware SError. Although SError 2700 * is cleared during link resume, clearing SError here is 2701 * necessary as some PHYs raise hotplug events after SRST. 2702 * This introduces race condition where hotplug occurs between 2703 * reset and here. This race is mediated by cross checking 2704 * link onlineness and classification result later. 2705 */ 2706 if (postreset) { 2707 postreset(link, classes); 2708 if (slave) 2709 postreset(slave, classes); 2710 } 2711 2712 /* 2713 * Some controllers can't be frozen very well and may set 2714 * spuruious error conditions during reset. Clear accumulated 2715 * error information. As reset is the final recovery action, 2716 * nothing is lost by doing this. 2717 */ 2718 spin_lock_irqsave(link->ap->lock, flags); 2719 memset(&link->eh_info, 0, sizeof(link->eh_info)); 2720 if (slave) 2721 memset(&slave->eh_info, 0, sizeof(link->eh_info)); 2722 ap->pflags &= ~ATA_PFLAG_EH_PENDING; 2723 spin_unlock_irqrestore(link->ap->lock, flags); 2724 2725 /* 2726 * Make sure onlineness and classification result correspond. 2727 * Hotplug could have happened during reset and some 2728 * controllers fail to wait while a drive is spinning up after 2729 * being hotplugged causing misdetection. By cross checking 2730 * link on/offlineness and classification result, those 2731 * conditions can be reliably detected and retried. 2732 */ 2733 nr_unknown = 0; 2734 ata_for_each_dev(dev, link, ALL) { 2735 if (ata_phys_link_online(ata_dev_phys_link(dev))) { 2736 if (classes[dev->devno] == ATA_DEV_UNKNOWN) { 2737 ata_dev_printk(dev, KERN_DEBUG, "link online " 2738 "but device misclassifed\n"); 2739 classes[dev->devno] = ATA_DEV_NONE; 2740 nr_unknown++; 2741 } 2742 } else if (ata_phys_link_offline(ata_dev_phys_link(dev))) { 2743 if (ata_class_enabled(classes[dev->devno])) 2744 ata_dev_printk(dev, KERN_DEBUG, "link offline, " 2745 "clearing class %d to NONE\n", 2746 classes[dev->devno]); 2747 classes[dev->devno] = ATA_DEV_NONE; 2748 } else if (classes[dev->devno] == ATA_DEV_UNKNOWN) { 2749 ata_dev_printk(dev, KERN_DEBUG, "link status unknown, " 2750 "clearing UNKNOWN to NONE\n"); 2751 classes[dev->devno] = ATA_DEV_NONE; 2752 } 2753 } 2754 2755 if (classify && nr_unknown) { 2756 if (try < max_tries) { 2757 ata_link_printk(link, KERN_WARNING, "link online but " 2758 "%d devices misclassified, retrying\n", 2759 nr_unknown); 2760 failed_link = link; 2761 rc = -EAGAIN; 2762 goto fail; 2763 } 2764 ata_link_printk(link, KERN_WARNING, 2765 "link online but %d devices misclassified, " 2766 "device detection might fail\n", nr_unknown); 2767 } 2768 2769 /* reset successful, schedule revalidation */ 2770 ata_eh_done(link, NULL, ATA_EH_RESET); 2771 if (slave) 2772 ata_eh_done(slave, NULL, ATA_EH_RESET); 2773 ehc->last_reset = jiffies; /* update to completion time */ 2774 ehc->i.action |= ATA_EH_REVALIDATE; 2775 2776 rc = 0; 2777 out: 2778 /* clear hotplug flag */ 2779 ehc->i.flags &= ~ATA_EHI_HOTPLUGGED; 2780 if (slave) 2781 sehc->i.flags &= ~ATA_EHI_HOTPLUGGED; 2782 2783 spin_lock_irqsave(ap->lock, flags); 2784 ap->pflags &= ~ATA_PFLAG_RESETTING; 2785 spin_unlock_irqrestore(ap->lock, flags); 2786 2787 return rc; 2788 2789 fail: 2790 /* if SCR isn't accessible on a fan-out port, PMP needs to be reset */ 2791 if (!ata_is_host_link(link) && 2792 sata_scr_read(link, SCR_STATUS, &sstatus)) 2793 rc = -ERESTART; 2794 2795 if (rc == -ERESTART || try >= max_tries) 2796 goto out; 2797 2798 now = jiffies; 2799 if (time_before(now, deadline)) { 2800 unsigned long delta = deadline - now; 2801 2802 ata_link_printk(failed_link, KERN_WARNING, 2803 "reset failed (errno=%d), retrying in %u secs\n", 2804 rc, DIV_ROUND_UP(jiffies_to_msecs(delta), 1000)); 2805 2806 while (delta) 2807 delta = schedule_timeout_uninterruptible(delta); 2808 } 2809 2810 if (try == max_tries - 1) { 2811 sata_down_spd_limit(link, 0); 2812 if (slave) 2813 sata_down_spd_limit(slave, 0); 2814 } else if (rc == -EPIPE) 2815 sata_down_spd_limit(failed_link, 0); 2816 2817 if (hardreset) 2818 reset = hardreset; 2819 goto retry; 2820 } 2821 2822 static inline void ata_eh_pull_park_action(struct ata_port *ap) 2823 { 2824 struct ata_link *link; 2825 struct ata_device *dev; 2826 unsigned long flags; 2827 2828 /* 2829 * This function can be thought of as an extended version of 2830 * ata_eh_about_to_do() specially crafted to accommodate the 2831 * requirements of ATA_EH_PARK handling. Since the EH thread 2832 * does not leave the do {} while () loop in ata_eh_recover as 2833 * long as the timeout for a park request to *one* device on 2834 * the port has not expired, and since we still want to pick 2835 * up park requests to other devices on the same port or 2836 * timeout updates for the same device, we have to pull 2837 * ATA_EH_PARK actions from eh_info into eh_context.i 2838 * ourselves at the beginning of each pass over the loop. 2839 * 2840 * Additionally, all write accesses to &ap->park_req_pending 2841 * through INIT_COMPLETION() (see below) or complete_all() 2842 * (see ata_scsi_park_store()) are protected by the host lock. 2843 * As a result we have that park_req_pending.done is zero on 2844 * exit from this function, i.e. when ATA_EH_PARK actions for 2845 * *all* devices on port ap have been pulled into the 2846 * respective eh_context structs. If, and only if, 2847 * park_req_pending.done is non-zero by the time we reach 2848 * wait_for_completion_timeout(), another ATA_EH_PARK action 2849 * has been scheduled for at least one of the devices on port 2850 * ap and we have to cycle over the do {} while () loop in 2851 * ata_eh_recover() again. 2852 */ 2853 2854 spin_lock_irqsave(ap->lock, flags); 2855 INIT_COMPLETION(ap->park_req_pending); 2856 ata_for_each_link(link, ap, EDGE) { 2857 ata_for_each_dev(dev, link, ALL) { 2858 struct ata_eh_info *ehi = &link->eh_info; 2859 2860 link->eh_context.i.dev_action[dev->devno] |= 2861 ehi->dev_action[dev->devno] & ATA_EH_PARK; 2862 ata_eh_clear_action(link, dev, ehi, ATA_EH_PARK); 2863 } 2864 } 2865 spin_unlock_irqrestore(ap->lock, flags); 2866 } 2867 2868 static void ata_eh_park_issue_cmd(struct ata_device *dev, int park) 2869 { 2870 struct ata_eh_context *ehc = &dev->link->eh_context; 2871 struct ata_taskfile tf; 2872 unsigned int err_mask; 2873 2874 ata_tf_init(dev, &tf); 2875 if (park) { 2876 ehc->unloaded_mask |= 1 << dev->devno; 2877 tf.command = ATA_CMD_IDLEIMMEDIATE; 2878 tf.feature = 0x44; 2879 tf.lbal = 0x4c; 2880 tf.lbam = 0x4e; 2881 tf.lbah = 0x55; 2882 } else { 2883 ehc->unloaded_mask &= ~(1 << dev->devno); 2884 tf.command = ATA_CMD_CHK_POWER; 2885 } 2886 2887 tf.flags |= ATA_TFLAG_DEVICE | ATA_TFLAG_ISADDR; 2888 tf.protocol |= ATA_PROT_NODATA; 2889 err_mask = ata_exec_internal(dev, &tf, NULL, DMA_NONE, NULL, 0, 0); 2890 if (park && (err_mask || tf.lbal != 0xc4)) { 2891 ata_dev_printk(dev, KERN_ERR, "head unload failed!\n"); 2892 ehc->unloaded_mask &= ~(1 << dev->devno); 2893 } 2894 } 2895 2896 static int ata_eh_revalidate_and_attach(struct ata_link *link, 2897 struct ata_device **r_failed_dev) 2898 { 2899 struct ata_port *ap = link->ap; 2900 struct ata_eh_context *ehc = &link->eh_context; 2901 struct ata_device *dev; 2902 unsigned int new_mask = 0; 2903 unsigned long flags; 2904 int rc = 0; 2905 2906 DPRINTK("ENTER\n"); 2907 2908 /* For PATA drive side cable detection to work, IDENTIFY must 2909 * be done backwards such that PDIAG- is released by the slave 2910 * device before the master device is identified. 2911 */ 2912 ata_for_each_dev(dev, link, ALL_REVERSE) { 2913 unsigned int action = ata_eh_dev_action(dev); 2914 unsigned int readid_flags = 0; 2915 2916 if (ehc->i.flags & ATA_EHI_DID_RESET) 2917 readid_flags |= ATA_READID_POSTRESET; 2918 2919 if ((action & ATA_EH_REVALIDATE) && ata_dev_enabled(dev)) { 2920 WARN_ON(dev->class == ATA_DEV_PMP); 2921 2922 if (ata_phys_link_offline(ata_dev_phys_link(dev))) { 2923 rc = -EIO; 2924 goto err; 2925 } 2926 2927 ata_eh_about_to_do(link, dev, ATA_EH_REVALIDATE); 2928 rc = ata_dev_revalidate(dev, ehc->classes[dev->devno], 2929 readid_flags); 2930 if (rc) 2931 goto err; 2932 2933 ata_eh_done(link, dev, ATA_EH_REVALIDATE); 2934 2935 /* Configuration may have changed, reconfigure 2936 * transfer mode. 2937 */ 2938 ehc->i.flags |= ATA_EHI_SETMODE; 2939 2940 /* schedule the scsi_rescan_device() here */ 2941 queue_work(ata_aux_wq, &(ap->scsi_rescan_task)); 2942 } else if (dev->class == ATA_DEV_UNKNOWN && 2943 ehc->tries[dev->devno] && 2944 ata_class_enabled(ehc->classes[dev->devno])) { 2945 /* Temporarily set dev->class, it will be 2946 * permanently set once all configurations are 2947 * complete. This is necessary because new 2948 * device configuration is done in two 2949 * separate loops. 2950 */ 2951 dev->class = ehc->classes[dev->devno]; 2952 2953 if (dev->class == ATA_DEV_PMP) 2954 rc = sata_pmp_attach(dev); 2955 else 2956 rc = ata_dev_read_id(dev, &dev->class, 2957 readid_flags, dev->id); 2958 2959 /* read_id might have changed class, store and reset */ 2960 ehc->classes[dev->devno] = dev->class; 2961 dev->class = ATA_DEV_UNKNOWN; 2962 2963 switch (rc) { 2964 case 0: 2965 /* clear error info accumulated during probe */ 2966 ata_ering_clear(&dev->ering); 2967 new_mask |= 1 << dev->devno; 2968 break; 2969 case -ENOENT: 2970 /* IDENTIFY was issued to non-existent 2971 * device. No need to reset. Just 2972 * thaw and ignore the device. 2973 */ 2974 ata_eh_thaw_port(ap); 2975 break; 2976 default: 2977 goto err; 2978 } 2979 } 2980 } 2981 2982 /* PDIAG- should have been released, ask cable type if post-reset */ 2983 if ((ehc->i.flags & ATA_EHI_DID_RESET) && ata_is_host_link(link)) { 2984 if (ap->ops->cable_detect) 2985 ap->cbl = ap->ops->cable_detect(ap); 2986 ata_force_cbl(ap); 2987 } 2988 2989 /* Configure new devices forward such that user doesn't see 2990 * device detection messages backwards. 2991 */ 2992 ata_for_each_dev(dev, link, ALL) { 2993 if (!(new_mask & (1 << dev->devno))) 2994 continue; 2995 2996 dev->class = ehc->classes[dev->devno]; 2997 2998 if (dev->class == ATA_DEV_PMP) 2999 continue; 3000 3001 ehc->i.flags |= ATA_EHI_PRINTINFO; 3002 rc = ata_dev_configure(dev); 3003 ehc->i.flags &= ~ATA_EHI_PRINTINFO; 3004 if (rc) { 3005 dev->class = ATA_DEV_UNKNOWN; 3006 goto err; 3007 } 3008 3009 spin_lock_irqsave(ap->lock, flags); 3010 ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG; 3011 spin_unlock_irqrestore(ap->lock, flags); 3012 3013 /* new device discovered, configure xfermode */ 3014 ehc->i.flags |= ATA_EHI_SETMODE; 3015 } 3016 3017 return 0; 3018 3019 err: 3020 *r_failed_dev = dev; 3021 DPRINTK("EXIT rc=%d\n", rc); 3022 return rc; 3023 } 3024 3025 /** 3026 * ata_set_mode - Program timings and issue SET FEATURES - XFER 3027 * @link: link on which timings will be programmed 3028 * @r_failed_dev: out parameter for failed device 3029 * 3030 * Set ATA device disk transfer mode (PIO3, UDMA6, etc.). If 3031 * ata_set_mode() fails, pointer to the failing device is 3032 * returned in @r_failed_dev. 3033 * 3034 * LOCKING: 3035 * PCI/etc. bus probe sem. 3036 * 3037 * RETURNS: 3038 * 0 on success, negative errno otherwise 3039 */ 3040 int ata_set_mode(struct ata_link *link, struct ata_device **r_failed_dev) 3041 { 3042 struct ata_port *ap = link->ap; 3043 struct ata_device *dev; 3044 int rc; 3045 3046 /* if data transfer is verified, clear DUBIOUS_XFER on ering top */ 3047 ata_for_each_dev(dev, link, ENABLED) { 3048 if (!(dev->flags & ATA_DFLAG_DUBIOUS_XFER)) { 3049 struct ata_ering_entry *ent; 3050 3051 ent = ata_ering_top(&dev->ering); 3052 if (ent) 3053 ent->eflags &= ~ATA_EFLAG_DUBIOUS_XFER; 3054 } 3055 } 3056 3057 /* has private set_mode? */ 3058 if (ap->ops->set_mode) 3059 rc = ap->ops->set_mode(link, r_failed_dev); 3060 else 3061 rc = ata_do_set_mode(link, r_failed_dev); 3062 3063 /* if transfer mode has changed, set DUBIOUS_XFER on device */ 3064 ata_for_each_dev(dev, link, ENABLED) { 3065 struct ata_eh_context *ehc = &link->eh_context; 3066 u8 saved_xfer_mode = ehc->saved_xfer_mode[dev->devno]; 3067 u8 saved_ncq = !!(ehc->saved_ncq_enabled & (1 << dev->devno)); 3068 3069 if (dev->xfer_mode != saved_xfer_mode || 3070 ata_ncq_enabled(dev) != saved_ncq) 3071 dev->flags |= ATA_DFLAG_DUBIOUS_XFER; 3072 } 3073 3074 return rc; 3075 } 3076 3077 /** 3078 * atapi_eh_clear_ua - Clear ATAPI UNIT ATTENTION after reset 3079 * @dev: ATAPI device to clear UA for 3080 * 3081 * Resets and other operations can make an ATAPI device raise 3082 * UNIT ATTENTION which causes the next operation to fail. This 3083 * function clears UA. 3084 * 3085 * LOCKING: 3086 * EH context (may sleep). 3087 * 3088 * RETURNS: 3089 * 0 on success, -errno on failure. 3090 */ 3091 static int atapi_eh_clear_ua(struct ata_device *dev) 3092 { 3093 int i; 3094 3095 for (i = 0; i < ATA_EH_UA_TRIES; i++) { 3096 u8 *sense_buffer = dev->link->ap->sector_buf; 3097 u8 sense_key = 0; 3098 unsigned int err_mask; 3099 3100 err_mask = atapi_eh_tur(dev, &sense_key); 3101 if (err_mask != 0 && err_mask != AC_ERR_DEV) { 3102 ata_dev_printk(dev, KERN_WARNING, "TEST_UNIT_READY " 3103 "failed (err_mask=0x%x)\n", err_mask); 3104 return -EIO; 3105 } 3106 3107 if (!err_mask || sense_key != UNIT_ATTENTION) 3108 return 0; 3109 3110 err_mask = atapi_eh_request_sense(dev, sense_buffer, sense_key); 3111 if (err_mask) { 3112 ata_dev_printk(dev, KERN_WARNING, "failed to clear " 3113 "UNIT ATTENTION (err_mask=0x%x)\n", err_mask); 3114 return -EIO; 3115 } 3116 } 3117 3118 ata_dev_printk(dev, KERN_WARNING, 3119 "UNIT ATTENTION persists after %d tries\n", ATA_EH_UA_TRIES); 3120 3121 return 0; 3122 } 3123 3124 /** 3125 * ata_eh_maybe_retry_flush - Retry FLUSH if necessary 3126 * @dev: ATA device which may need FLUSH retry 3127 * 3128 * If @dev failed FLUSH, it needs to be reported upper layer 3129 * immediately as it means that @dev failed to remap and already 3130 * lost at least a sector and further FLUSH retrials won't make 3131 * any difference to the lost sector. However, if FLUSH failed 3132 * for other reasons, for example transmission error, FLUSH needs 3133 * to be retried. 3134 * 3135 * This function determines whether FLUSH failure retry is 3136 * necessary and performs it if so. 3137 * 3138 * RETURNS: 3139 * 0 if EH can continue, -errno if EH needs to be repeated. 3140 */ 3141 static int ata_eh_maybe_retry_flush(struct ata_device *dev) 3142 { 3143 struct ata_link *link = dev->link; 3144 struct ata_port *ap = link->ap; 3145 struct ata_queued_cmd *qc; 3146 struct ata_taskfile tf; 3147 unsigned int err_mask; 3148 int rc = 0; 3149 3150 /* did flush fail for this device? */ 3151 if (!ata_tag_valid(link->active_tag)) 3152 return 0; 3153 3154 qc = __ata_qc_from_tag(ap, link->active_tag); 3155 if (qc->dev != dev || (qc->tf.command != ATA_CMD_FLUSH_EXT && 3156 qc->tf.command != ATA_CMD_FLUSH)) 3157 return 0; 3158 3159 /* if the device failed it, it should be reported to upper layers */ 3160 if (qc->err_mask & AC_ERR_DEV) 3161 return 0; 3162 3163 /* flush failed for some other reason, give it another shot */ 3164 ata_tf_init(dev, &tf); 3165 3166 tf.command = qc->tf.command; 3167 tf.flags |= ATA_TFLAG_DEVICE; 3168 tf.protocol = ATA_PROT_NODATA; 3169 3170 ata_dev_printk(dev, KERN_WARNING, "retrying FLUSH 0x%x Emask 0x%x\n", 3171 tf.command, qc->err_mask); 3172 3173 err_mask = ata_exec_internal(dev, &tf, NULL, DMA_NONE, NULL, 0, 0); 3174 if (!err_mask) { 3175 /* 3176 * FLUSH is complete but there's no way to 3177 * successfully complete a failed command from EH. 3178 * Making sure retry is allowed at least once and 3179 * retrying it should do the trick - whatever was in 3180 * the cache is already on the platter and this won't 3181 * cause infinite loop. 3182 */ 3183 qc->scsicmd->allowed = max(qc->scsicmd->allowed, 1); 3184 } else { 3185 ata_dev_printk(dev, KERN_WARNING, "FLUSH failed Emask 0x%x\n", 3186 err_mask); 3187 rc = -EIO; 3188 3189 /* if device failed it, report it to upper layers */ 3190 if (err_mask & AC_ERR_DEV) { 3191 qc->err_mask |= AC_ERR_DEV; 3192 qc->result_tf = tf; 3193 if (!(ap->pflags & ATA_PFLAG_FROZEN)) 3194 rc = 0; 3195 } 3196 } 3197 return rc; 3198 } 3199 3200 static int ata_link_nr_enabled(struct ata_link *link) 3201 { 3202 struct ata_device *dev; 3203 int cnt = 0; 3204 3205 ata_for_each_dev(dev, link, ENABLED) 3206 cnt++; 3207 return cnt; 3208 } 3209 3210 static int ata_link_nr_vacant(struct ata_link *link) 3211 { 3212 struct ata_device *dev; 3213 int cnt = 0; 3214 3215 ata_for_each_dev(dev, link, ALL) 3216 if (dev->class == ATA_DEV_UNKNOWN) 3217 cnt++; 3218 return cnt; 3219 } 3220 3221 static int ata_eh_skip_recovery(struct ata_link *link) 3222 { 3223 struct ata_port *ap = link->ap; 3224 struct ata_eh_context *ehc = &link->eh_context; 3225 struct ata_device *dev; 3226 3227 /* skip disabled links */ 3228 if (link->flags & ATA_LFLAG_DISABLED) 3229 return 1; 3230 3231 /* thaw frozen port and recover failed devices */ 3232 if ((ap->pflags & ATA_PFLAG_FROZEN) || ata_link_nr_enabled(link)) 3233 return 0; 3234 3235 /* reset at least once if reset is requested */ 3236 if ((ehc->i.action & ATA_EH_RESET) && 3237 !(ehc->i.flags & ATA_EHI_DID_RESET)) 3238 return 0; 3239 3240 /* skip if class codes for all vacant slots are ATA_DEV_NONE */ 3241 ata_for_each_dev(dev, link, ALL) { 3242 if (dev->class == ATA_DEV_UNKNOWN && 3243 ehc->classes[dev->devno] != ATA_DEV_NONE) 3244 return 0; 3245 } 3246 3247 return 1; 3248 } 3249 3250 static int ata_count_probe_trials_cb(struct ata_ering_entry *ent, void *void_arg) 3251 { 3252 u64 interval = msecs_to_jiffies(ATA_EH_PROBE_TRIAL_INTERVAL); 3253 u64 now = get_jiffies_64(); 3254 int *trials = void_arg; 3255 3256 if (ent->timestamp < now - min(now, interval)) 3257 return -1; 3258 3259 (*trials)++; 3260 return 0; 3261 } 3262 3263 static int ata_eh_schedule_probe(struct ata_device *dev) 3264 { 3265 struct ata_eh_context *ehc = &dev->link->eh_context; 3266 struct ata_link *link = ata_dev_phys_link(dev); 3267 int trials = 0; 3268 3269 if (!(ehc->i.probe_mask & (1 << dev->devno)) || 3270 (ehc->did_probe_mask & (1 << dev->devno))) 3271 return 0; 3272 3273 ata_eh_detach_dev(dev); 3274 ata_dev_init(dev); 3275 ehc->did_probe_mask |= (1 << dev->devno); 3276 ehc->i.action |= ATA_EH_RESET; 3277 ehc->saved_xfer_mode[dev->devno] = 0; 3278 ehc->saved_ncq_enabled &= ~(1 << dev->devno); 3279 3280 /* Record and count probe trials on the ering. The specific 3281 * error mask used is irrelevant. Because a successful device 3282 * detection clears the ering, this count accumulates only if 3283 * there are consecutive failed probes. 3284 * 3285 * If the count is equal to or higher than ATA_EH_PROBE_TRIALS 3286 * in the last ATA_EH_PROBE_TRIAL_INTERVAL, link speed is 3287 * forced to 1.5Gbps. 3288 * 3289 * This is to work around cases where failed link speed 3290 * negotiation results in device misdetection leading to 3291 * infinite DEVXCHG or PHRDY CHG events. 3292 */ 3293 ata_ering_record(&dev->ering, 0, AC_ERR_OTHER); 3294 ata_ering_map(&dev->ering, ata_count_probe_trials_cb, &trials); 3295 3296 if (trials > ATA_EH_PROBE_TRIALS) 3297 sata_down_spd_limit(link, 1); 3298 3299 return 1; 3300 } 3301 3302 static int ata_eh_handle_dev_fail(struct ata_device *dev, int err) 3303 { 3304 struct ata_eh_context *ehc = &dev->link->eh_context; 3305 3306 /* -EAGAIN from EH routine indicates retry without prejudice. 3307 * The requester is responsible for ensuring forward progress. 3308 */ 3309 if (err != -EAGAIN) 3310 ehc->tries[dev->devno]--; 3311 3312 switch (err) { 3313 case -ENODEV: 3314 /* device missing or wrong IDENTIFY data, schedule probing */ 3315 ehc->i.probe_mask |= (1 << dev->devno); 3316 case -EINVAL: 3317 /* give it just one more chance */ 3318 ehc->tries[dev->devno] = min(ehc->tries[dev->devno], 1); 3319 case -EIO: 3320 if (ehc->tries[dev->devno] == 1) { 3321 /* This is the last chance, better to slow 3322 * down than lose it. 3323 */ 3324 sata_down_spd_limit(ata_dev_phys_link(dev), 0); 3325 if (dev->pio_mode > XFER_PIO_0) 3326 ata_down_xfermask_limit(dev, ATA_DNXFER_PIO); 3327 } 3328 } 3329 3330 if (ata_dev_enabled(dev) && !ehc->tries[dev->devno]) { 3331 /* disable device if it has used up all its chances */ 3332 ata_dev_disable(dev); 3333 3334 /* detach if offline */ 3335 if (ata_phys_link_offline(ata_dev_phys_link(dev))) 3336 ata_eh_detach_dev(dev); 3337 3338 /* schedule probe if necessary */ 3339 if (ata_eh_schedule_probe(dev)) { 3340 ehc->tries[dev->devno] = ATA_EH_DEV_TRIES; 3341 memset(ehc->cmd_timeout_idx[dev->devno], 0, 3342 sizeof(ehc->cmd_timeout_idx[dev->devno])); 3343 } 3344 3345 return 1; 3346 } else { 3347 ehc->i.action |= ATA_EH_RESET; 3348 return 0; 3349 } 3350 } 3351 3352 /** 3353 * ata_eh_recover - recover host port after error 3354 * @ap: host port to recover 3355 * @prereset: prereset method (can be NULL) 3356 * @softreset: softreset method (can be NULL) 3357 * @hardreset: hardreset method (can be NULL) 3358 * @postreset: postreset method (can be NULL) 3359 * @r_failed_link: out parameter for failed link 3360 * 3361 * This is the alpha and omega, eum and yang, heart and soul of 3362 * libata exception handling. On entry, actions required to 3363 * recover each link and hotplug requests are recorded in the 3364 * link's eh_context. This function executes all the operations 3365 * with appropriate retrials and fallbacks to resurrect failed 3366 * devices, detach goners and greet newcomers. 3367 * 3368 * LOCKING: 3369 * Kernel thread context (may sleep). 3370 * 3371 * RETURNS: 3372 * 0 on success, -errno on failure. 3373 */ 3374 int ata_eh_recover(struct ata_port *ap, ata_prereset_fn_t prereset, 3375 ata_reset_fn_t softreset, ata_reset_fn_t hardreset, 3376 ata_postreset_fn_t postreset, 3377 struct ata_link **r_failed_link) 3378 { 3379 struct ata_link *link; 3380 struct ata_device *dev; 3381 int nr_failed_devs; 3382 int rc; 3383 unsigned long flags, deadline; 3384 3385 DPRINTK("ENTER\n"); 3386 3387 /* prep for recovery */ 3388 ata_for_each_link(link, ap, EDGE) { 3389 struct ata_eh_context *ehc = &link->eh_context; 3390 3391 /* re-enable link? */ 3392 if (ehc->i.action & ATA_EH_ENABLE_LINK) { 3393 ata_eh_about_to_do(link, NULL, ATA_EH_ENABLE_LINK); 3394 spin_lock_irqsave(ap->lock, flags); 3395 link->flags &= ~ATA_LFLAG_DISABLED; 3396 spin_unlock_irqrestore(ap->lock, flags); 3397 ata_eh_done(link, NULL, ATA_EH_ENABLE_LINK); 3398 } 3399 3400 ata_for_each_dev(dev, link, ALL) { 3401 if (link->flags & ATA_LFLAG_NO_RETRY) 3402 ehc->tries[dev->devno] = 1; 3403 else 3404 ehc->tries[dev->devno] = ATA_EH_DEV_TRIES; 3405 3406 /* collect port action mask recorded in dev actions */ 3407 ehc->i.action |= ehc->i.dev_action[dev->devno] & 3408 ~ATA_EH_PERDEV_MASK; 3409 ehc->i.dev_action[dev->devno] &= ATA_EH_PERDEV_MASK; 3410 3411 /* process hotplug request */ 3412 if (dev->flags & ATA_DFLAG_DETACH) 3413 ata_eh_detach_dev(dev); 3414 3415 /* schedule probe if necessary */ 3416 if (!ata_dev_enabled(dev)) 3417 ata_eh_schedule_probe(dev); 3418 } 3419 } 3420 3421 retry: 3422 rc = 0; 3423 nr_failed_devs = 0; 3424 3425 /* if UNLOADING, finish immediately */ 3426 if (ap->pflags & ATA_PFLAG_UNLOADING) 3427 goto out; 3428 3429 /* prep for EH */ 3430 ata_for_each_link(link, ap, EDGE) { 3431 struct ata_eh_context *ehc = &link->eh_context; 3432 3433 /* skip EH if possible. */ 3434 if (ata_eh_skip_recovery(link)) 3435 ehc->i.action = 0; 3436 3437 ata_for_each_dev(dev, link, ALL) 3438 ehc->classes[dev->devno] = ATA_DEV_UNKNOWN; 3439 } 3440 3441 /* reset */ 3442 ata_for_each_link(link, ap, EDGE) { 3443 struct ata_eh_context *ehc = &link->eh_context; 3444 3445 if (!(ehc->i.action & ATA_EH_RESET)) 3446 continue; 3447 3448 rc = ata_eh_reset(link, ata_link_nr_vacant(link), 3449 prereset, softreset, hardreset, postreset); 3450 if (rc) { 3451 ata_link_printk(link, KERN_ERR, 3452 "reset failed, giving up\n"); 3453 goto out; 3454 } 3455 } 3456 3457 do { 3458 unsigned long now; 3459 3460 /* 3461 * clears ATA_EH_PARK in eh_info and resets 3462 * ap->park_req_pending 3463 */ 3464 ata_eh_pull_park_action(ap); 3465 3466 deadline = jiffies; 3467 ata_for_each_link(link, ap, EDGE) { 3468 ata_for_each_dev(dev, link, ALL) { 3469 struct ata_eh_context *ehc = &link->eh_context; 3470 unsigned long tmp; 3471 3472 if (dev->class != ATA_DEV_ATA) 3473 continue; 3474 if (!(ehc->i.dev_action[dev->devno] & 3475 ATA_EH_PARK)) 3476 continue; 3477 tmp = dev->unpark_deadline; 3478 if (time_before(deadline, tmp)) 3479 deadline = tmp; 3480 else if (time_before_eq(tmp, jiffies)) 3481 continue; 3482 if (ehc->unloaded_mask & (1 << dev->devno)) 3483 continue; 3484 3485 ata_eh_park_issue_cmd(dev, 1); 3486 } 3487 } 3488 3489 now = jiffies; 3490 if (time_before_eq(deadline, now)) 3491 break; 3492 3493 deadline = wait_for_completion_timeout(&ap->park_req_pending, 3494 deadline - now); 3495 } while (deadline); 3496 ata_for_each_link(link, ap, EDGE) { 3497 ata_for_each_dev(dev, link, ALL) { 3498 if (!(link->eh_context.unloaded_mask & 3499 (1 << dev->devno))) 3500 continue; 3501 3502 ata_eh_park_issue_cmd(dev, 0); 3503 ata_eh_done(link, dev, ATA_EH_PARK); 3504 } 3505 } 3506 3507 /* the rest */ 3508 ata_for_each_link(link, ap, EDGE) { 3509 struct ata_eh_context *ehc = &link->eh_context; 3510 3511 /* revalidate existing devices and attach new ones */ 3512 rc = ata_eh_revalidate_and_attach(link, &dev); 3513 if (rc) 3514 goto dev_fail; 3515 3516 /* if PMP got attached, return, pmp EH will take care of it */ 3517 if (link->device->class == ATA_DEV_PMP) { 3518 ehc->i.action = 0; 3519 return 0; 3520 } 3521 3522 /* configure transfer mode if necessary */ 3523 if (ehc->i.flags & ATA_EHI_SETMODE) { 3524 rc = ata_set_mode(link, &dev); 3525 if (rc) 3526 goto dev_fail; 3527 ehc->i.flags &= ~ATA_EHI_SETMODE; 3528 } 3529 3530 /* If reset has been issued, clear UA to avoid 3531 * disrupting the current users of the device. 3532 */ 3533 if (ehc->i.flags & ATA_EHI_DID_RESET) { 3534 ata_for_each_dev(dev, link, ALL) { 3535 if (dev->class != ATA_DEV_ATAPI) 3536 continue; 3537 rc = atapi_eh_clear_ua(dev); 3538 if (rc) 3539 goto dev_fail; 3540 } 3541 } 3542 3543 /* retry flush if necessary */ 3544 ata_for_each_dev(dev, link, ALL) { 3545 if (dev->class != ATA_DEV_ATA) 3546 continue; 3547 rc = ata_eh_maybe_retry_flush(dev); 3548 if (rc) 3549 goto dev_fail; 3550 } 3551 3552 /* configure link power saving */ 3553 if (ehc->i.action & ATA_EH_LPM) 3554 ata_for_each_dev(dev, link, ALL) 3555 ata_dev_enable_pm(dev, ap->pm_policy); 3556 3557 /* this link is okay now */ 3558 ehc->i.flags = 0; 3559 continue; 3560 3561 dev_fail: 3562 nr_failed_devs++; 3563 ata_eh_handle_dev_fail(dev, rc); 3564 3565 if (ap->pflags & ATA_PFLAG_FROZEN) { 3566 /* PMP reset requires working host port. 3567 * Can't retry if it's frozen. 3568 */ 3569 if (sata_pmp_attached(ap)) 3570 goto out; 3571 break; 3572 } 3573 } 3574 3575 if (nr_failed_devs) 3576 goto retry; 3577 3578 out: 3579 if (rc && r_failed_link) 3580 *r_failed_link = link; 3581 3582 DPRINTK("EXIT, rc=%d\n", rc); 3583 return rc; 3584 } 3585 3586 /** 3587 * ata_eh_finish - finish up EH 3588 * @ap: host port to finish EH for 3589 * 3590 * Recovery is complete. Clean up EH states and retry or finish 3591 * failed qcs. 3592 * 3593 * LOCKING: 3594 * None. 3595 */ 3596 void ata_eh_finish(struct ata_port *ap) 3597 { 3598 int tag; 3599 3600 /* retry or finish qcs */ 3601 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) { 3602 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag); 3603 3604 if (!(qc->flags & ATA_QCFLAG_FAILED)) 3605 continue; 3606 3607 if (qc->err_mask) { 3608 /* FIXME: Once EH migration is complete, 3609 * generate sense data in this function, 3610 * considering both err_mask and tf. 3611 */ 3612 if (qc->flags & ATA_QCFLAG_RETRY) 3613 ata_eh_qc_retry(qc); 3614 else 3615 ata_eh_qc_complete(qc); 3616 } else { 3617 if (qc->flags & ATA_QCFLAG_SENSE_VALID) { 3618 ata_eh_qc_complete(qc); 3619 } else { 3620 /* feed zero TF to sense generation */ 3621 memset(&qc->result_tf, 0, sizeof(qc->result_tf)); 3622 ata_eh_qc_retry(qc); 3623 } 3624 } 3625 } 3626 3627 /* make sure nr_active_links is zero after EH */ 3628 WARN_ON(ap->nr_active_links); 3629 ap->nr_active_links = 0; 3630 } 3631 3632 /** 3633 * ata_do_eh - do standard error handling 3634 * @ap: host port to handle error for 3635 * 3636 * @prereset: prereset method (can be NULL) 3637 * @softreset: softreset method (can be NULL) 3638 * @hardreset: hardreset method (can be NULL) 3639 * @postreset: postreset method (can be NULL) 3640 * 3641 * Perform standard error handling sequence. 3642 * 3643 * LOCKING: 3644 * Kernel thread context (may sleep). 3645 */ 3646 void ata_do_eh(struct ata_port *ap, ata_prereset_fn_t prereset, 3647 ata_reset_fn_t softreset, ata_reset_fn_t hardreset, 3648 ata_postreset_fn_t postreset) 3649 { 3650 struct ata_device *dev; 3651 int rc; 3652 3653 ata_eh_autopsy(ap); 3654 ata_eh_report(ap); 3655 3656 rc = ata_eh_recover(ap, prereset, softreset, hardreset, postreset, 3657 NULL); 3658 if (rc) { 3659 ata_for_each_dev(dev, &ap->link, ALL) 3660 ata_dev_disable(dev); 3661 } 3662 3663 ata_eh_finish(ap); 3664 } 3665 3666 /** 3667 * ata_std_error_handler - standard error handler 3668 * @ap: host port to handle error for 3669 * 3670 * Standard error handler 3671 * 3672 * LOCKING: 3673 * Kernel thread context (may sleep). 3674 */ 3675 void ata_std_error_handler(struct ata_port *ap) 3676 { 3677 struct ata_port_operations *ops = ap->ops; 3678 ata_reset_fn_t hardreset = ops->hardreset; 3679 3680 /* ignore built-in hardreset if SCR access is not available */ 3681 if (ata_is_builtin_hardreset(hardreset) && !sata_scr_valid(&ap->link)) 3682 hardreset = NULL; 3683 3684 ata_do_eh(ap, ops->prereset, ops->softreset, hardreset, ops->postreset); 3685 } 3686 3687 #ifdef CONFIG_PM 3688 /** 3689 * ata_eh_handle_port_suspend - perform port suspend operation 3690 * @ap: port to suspend 3691 * 3692 * Suspend @ap. 3693 * 3694 * LOCKING: 3695 * Kernel thread context (may sleep). 3696 */ 3697 static void ata_eh_handle_port_suspend(struct ata_port *ap) 3698 { 3699 unsigned long flags; 3700 int rc = 0; 3701 3702 /* are we suspending? */ 3703 spin_lock_irqsave(ap->lock, flags); 3704 if (!(ap->pflags & ATA_PFLAG_PM_PENDING) || 3705 ap->pm_mesg.event == PM_EVENT_ON) { 3706 spin_unlock_irqrestore(ap->lock, flags); 3707 return; 3708 } 3709 spin_unlock_irqrestore(ap->lock, flags); 3710 3711 WARN_ON(ap->pflags & ATA_PFLAG_SUSPENDED); 3712 3713 /* tell ACPI we're suspending */ 3714 rc = ata_acpi_on_suspend(ap); 3715 if (rc) 3716 goto out; 3717 3718 /* suspend */ 3719 ata_eh_freeze_port(ap); 3720 3721 if (ap->ops->port_suspend) 3722 rc = ap->ops->port_suspend(ap, ap->pm_mesg); 3723 3724 ata_acpi_set_state(ap, PMSG_SUSPEND); 3725 out: 3726 /* report result */ 3727 spin_lock_irqsave(ap->lock, flags); 3728 3729 ap->pflags &= ~ATA_PFLAG_PM_PENDING; 3730 if (rc == 0) 3731 ap->pflags |= ATA_PFLAG_SUSPENDED; 3732 else if (ap->pflags & ATA_PFLAG_FROZEN) 3733 ata_port_schedule_eh(ap); 3734 3735 if (ap->pm_result) { 3736 *ap->pm_result = rc; 3737 ap->pm_result = NULL; 3738 } 3739 3740 spin_unlock_irqrestore(ap->lock, flags); 3741 3742 return; 3743 } 3744 3745 /** 3746 * ata_eh_handle_port_resume - perform port resume operation 3747 * @ap: port to resume 3748 * 3749 * Resume @ap. 3750 * 3751 * LOCKING: 3752 * Kernel thread context (may sleep). 3753 */ 3754 static void ata_eh_handle_port_resume(struct ata_port *ap) 3755 { 3756 struct ata_link *link; 3757 struct ata_device *dev; 3758 unsigned long flags; 3759 int rc = 0; 3760 3761 /* are we resuming? */ 3762 spin_lock_irqsave(ap->lock, flags); 3763 if (!(ap->pflags & ATA_PFLAG_PM_PENDING) || 3764 ap->pm_mesg.event != PM_EVENT_ON) { 3765 spin_unlock_irqrestore(ap->lock, flags); 3766 return; 3767 } 3768 spin_unlock_irqrestore(ap->lock, flags); 3769 3770 WARN_ON(!(ap->pflags & ATA_PFLAG_SUSPENDED)); 3771 3772 /* 3773 * Error timestamps are in jiffies which doesn't run while 3774 * suspended and PHY events during resume isn't too uncommon. 3775 * When the two are combined, it can lead to unnecessary speed 3776 * downs if the machine is suspended and resumed repeatedly. 3777 * Clear error history. 3778 */ 3779 ata_for_each_link(link, ap, HOST_FIRST) 3780 ata_for_each_dev(dev, link, ALL) 3781 ata_ering_clear(&dev->ering); 3782 3783 ata_acpi_set_state(ap, PMSG_ON); 3784 3785 if (ap->ops->port_resume) 3786 rc = ap->ops->port_resume(ap); 3787 3788 /* tell ACPI that we're resuming */ 3789 ata_acpi_on_resume(ap); 3790 3791 /* report result */ 3792 spin_lock_irqsave(ap->lock, flags); 3793 ap->pflags &= ~(ATA_PFLAG_PM_PENDING | ATA_PFLAG_SUSPENDED); 3794 if (ap->pm_result) { 3795 *ap->pm_result = rc; 3796 ap->pm_result = NULL; 3797 } 3798 spin_unlock_irqrestore(ap->lock, flags); 3799 } 3800 #endif /* CONFIG_PM */ 3801