Merge branch 'i2c-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/jdelvar...

[cascardo/linux.git] / drivers / ata / libata-eh.c
diff --git a/drivers/ata/libata-eh.c b/drivers/ata/libata-eh.c

index ea89091..fa22f94 100644 (file)
--- a/drivers/ata/libata-eh.c
+++ b/drivers/ata/libata-eh.c
@@ -547,7 +547,7 @@ void ata_scsi_error(struct Scsi_Host *host)
  
         /* For new EH, all qcs are finished in one of three ways -
          * normal completion, error completion, and SCSI timeout.
-        * Both cmpletions can race against SCSI timeout.  When normal
+        * Both completions can race against SCSI timeout.  When normal
          * completion wins, the qc never reaches EH.  When error
          * completion wins, the qc has ATA_QCFLAG_FAILED set.
          *
@@ -562,7 +562,19 @@ void ata_scsi_error(struct Scsi_Host *host)
                 int nr_timedout = 0;
  
                 spin_lock_irqsave(ap->lock, flags);
-
+               
+               /* This must occur under the ap->lock as we don't want
+                  a polled recovery to race the real interrupt handler.
+                  
+                  The lost_interrupt handler checks for any completed but
+                  non-notified command and completes much like an IRQ handler.
+                  
+                  We then fall into the error recovery code which will treat
+                  this as if normal completion won the race */
+
+               if (ap->ops->lost_interrupt)
+                       ap->ops->lost_interrupt(ap);
+                       
                 list_for_each_entry_safe(scmd, tmp, &host->eh_cmd_q, eh_entry) {
                         struct ata_queued_cmd *qc;
  
@@ -606,6 +618,9 @@ void ata_scsi_error(struct Scsi_Host *host)
                 ap->eh_tries = ATA_EH_MAX_TRIES;
         } else
                 spin_unlock_wait(ap->lock);
+               
+       /* If we raced normal completion and there is nothing to recover
+          (nr_timedout == 0), why exactly are we doing error recovery? */
  
   repeat:
         /* invoke error handler */
@@ -2768,6 +2783,12 @@ static int ata_eh_revalidate_and_attach(struct ata_link *link,
                 } else if (dev->class == ATA_DEV_UNKNOWN &&
                            ehc->tries[dev->devno] &&
                            ata_class_enabled(ehc->classes[dev->devno])) {
+                       /* Temporarily set dev->class, it will be
+                        * permanently set once all configurations are
+                        * complete.  This is necessary because new
+                        * device configuration is done in two
+                        * separate loops.
+                        */
                         dev->class = ehc->classes[dev->devno];
  
                         if (dev->class == ATA_DEV_PMP)
@@ -2775,6 +2796,11 @@ static int ata_eh_revalidate_and_attach(struct ata_link *link,
                         else
                                 rc = ata_dev_read_id(dev, &dev->class,
                                                      readid_flags, dev->id);
+
+                       /* read_id might have changed class, store and reset */
+                       ehc->classes[dev->devno] = dev->class;
+                       dev->class = ATA_DEV_UNKNOWN;
+
                         switch (rc) {
                         case 0:
                                 /* clear error info accumulated during probe */
@@ -2784,13 +2810,11 @@ static int ata_eh_revalidate_and_attach(struct ata_link *link,
                         case -ENOENT:
                                 /* IDENTIFY was issued to non-existent
                                  * device.  No need to reset.  Just
-                                * thaw and kill the device.
+                                * thaw and ignore the device.
                                  */
                                 ata_eh_thaw_port(ap);
-                               dev->class = ATA_DEV_UNKNOWN;
                                 break;
                         default:
-                               dev->class = ATA_DEV_UNKNOWN;
                                 goto err;
                         }
                 }
@@ -2811,11 +2835,15 @@ static int ata_eh_revalidate_and_attach(struct ata_link *link,
                     dev->class == ATA_DEV_PMP)
                         continue;
  
+               dev->class = ehc->classes[dev->devno];
+
                 ehc->i.flags |= ATA_EHI_PRINTINFO;
                 rc = ata_dev_configure(dev);
                 ehc->i.flags &= ~ATA_EHI_PRINTINFO;
-               if (rc)
+               if (rc) {
+                       dev->class = ATA_DEV_UNKNOWN;
                         goto err;
+               }
  
                 spin_lock_irqsave(ap->lock, flags);
                 ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG;
@@ -2836,7 +2864,7 @@ static int ata_eh_revalidate_and_attach(struct ata_link *link,
  /**
   *     ata_set_mode - Program timings and issue SET FEATURES - XFER
   *     @link: link on which timings will be programmed
- *     @r_failed_dev: out paramter for failed device
+ *     @r_failed_dev: out parameter for failed device
   *
   *     Set ATA device disk transfer mode (PIO3, UDMA6, etc.).  If
   *     ata_set_mode() fails, pointer to the failing device is
@@ -3479,6 +3507,8 @@ static void ata_eh_handle_port_suspend(struct ata_port *ap)
   */
  static void ata_eh_handle_port_resume(struct ata_port *ap)
  {
+       struct ata_link *link;
+       struct ata_device *dev;
         unsigned long flags;
         int rc = 0;
  
@@ -3493,6 +3523,17 @@ static void ata_eh_handle_port_resume(struct ata_port *ap)
  
         WARN_ON(!(ap->pflags & ATA_PFLAG_SUSPENDED));
  
+       /*
+        * Error timestamps are in jiffies, which don't advance while
+        * suspended, and PHY events during resume aren't too uncommon.
+        * When the two are combined, it can lead to unnecessary speed
+        * downs if the machine is suspended and resumed repeatedly.
+        * Clear error history.
+        */
+       ata_for_each_link(link, ap, HOST_FIRST)
+               ata_for_each_dev(dev, link, ALL)
+                       ata_ering_clear(&dev->ering);
+
         ata_acpi_set_state(ap, PMSG_ON);
  
         if (ap->ops->port_resume)