blob: 2c34de841e110c1903f6e3d4b40d693ef08fe2d6 [file] [log] [blame]
Tejun Heoece1d632006-04-02 18:51:53 +09001/*
2 * libata-eh.c - libata error handling
3 *
4 * Maintained by: Jeff Garzik <jgarzik@pobox.com>
5 * Please ALWAYS copy linux-ide@vger.kernel.org
6 * on emails.
7 *
8 * Copyright 2006 Tejun Heo <htejun@gmail.com>
9 *
10 *
11 * This program is free software; you can redistribute it and/or
12 * modify it under the terms of the GNU General Public License as
13 * published by the Free Software Foundation; either version 2, or
14 * (at your option) any later version.
15 *
16 * This program is distributed in the hope that it will be useful,
17 * but WITHOUT ANY WARRANTY; without even the implied warranty of
18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
19 * General Public License for more details.
20 *
21 * You should have received a copy of the GNU General Public License
22 * along with this program; see the file COPYING. If not, write to
23 * the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139,
24 * USA.
25 *
26 *
27 * libata documentation is available via 'make {ps|pdf}docs',
28 * as Documentation/DocBook/libata.*
29 *
30 * Hardware documentation available from http://www.t13.org/ and
31 * http://www.sata-io.org/
32 *
33 */
34
Tejun Heoece1d632006-04-02 18:51:53 +090035#include <linux/kernel.h>
Jens Axboe242f9dc2008-09-14 05:55:09 -070036#include <linux/blkdev.h>
Jeff Garzik28555682007-10-11 17:12:35 -040037#include <linux/pci.h>
Tejun Heoece1d632006-04-02 18:51:53 +090038#include <scsi/scsi.h>
39#include <scsi/scsi_host.h>
40#include <scsi/scsi_eh.h>
41#include <scsi/scsi_device.h>
42#include <scsi/scsi_cmnd.h>
Jeff Garzikc6fd2802006-08-10 07:31:37 -040043#include "../scsi/scsi_transport_api.h"
Tejun Heoece1d632006-04-02 18:51:53 +090044
45#include <linux/libata.h>
46
47#include "libata.h"
48
Tejun Heo7d47e8d2007-02-02 16:22:31 +090049enum {
Tejun Heo3884f7b2007-11-27 19:28:56 +090050 /* speed down verdicts */
Tejun Heo7d47e8d2007-02-02 16:22:31 +090051 ATA_EH_SPDN_NCQ_OFF = (1 << 0),
52 ATA_EH_SPDN_SPEED_DOWN = (1 << 1),
53 ATA_EH_SPDN_FALLBACK_TO_PIO = (1 << 2),
Tejun Heo76326ac2007-11-27 19:28:59 +090054 ATA_EH_SPDN_KEEP_ERRORS = (1 << 3),
Tejun Heo3884f7b2007-11-27 19:28:56 +090055
56 /* error flags */
57 ATA_EFLAG_IS_IO = (1 << 0),
Tejun Heo76326ac2007-11-27 19:28:59 +090058 ATA_EFLAG_DUBIOUS_XFER = (1 << 1),
Tejun Heo3884f7b2007-11-27 19:28:56 +090059
60 /* error categories */
61 ATA_ECAT_NONE = 0,
62 ATA_ECAT_ATA_BUS = 1,
63 ATA_ECAT_TOUT_HSM = 2,
64 ATA_ECAT_UNK_DEV = 3,
Tejun Heo75f9caf2008-01-03 01:21:14 +090065 ATA_ECAT_DUBIOUS_NONE = 4,
66 ATA_ECAT_DUBIOUS_ATA_BUS = 5,
67 ATA_ECAT_DUBIOUS_TOUT_HSM = 6,
68 ATA_ECAT_DUBIOUS_UNK_DEV = 7,
69 ATA_ECAT_NR = 8,
Tejun Heo7d47e8d2007-02-02 16:22:31 +090070
Tejun Heo87fbc5a2008-05-20 02:17:54 +090071 ATA_EH_CMD_DFL_TIMEOUT = 5000,
72
Tejun Heo0a2c0f52008-05-20 02:17:52 +090073 /* always put at least this amount of time between resets */
74 ATA_EH_RESET_COOL_DOWN = 5000,
75
Tejun Heo341c2c92008-05-20 02:17:51 +090076 /* Waiting in ->prereset can never be reliable. It's
77 * sometimes nice to wait there but it can't be depended upon;
78 * otherwise, we wouldn't be resetting. Just give it enough
79 * time for most drives to spin up.
80 */
81 ATA_EH_PRERESET_TIMEOUT = 10000,
82 ATA_EH_FASTDRAIN_INTERVAL = 3000,
Tejun Heo11fc33d2008-08-30 14:20:01 +020083
84 ATA_EH_UA_TRIES = 5,
Tejun Heoc2c7a892009-01-29 20:31:34 +090085
86 /* probe speed down parameters, see ata_eh_schedule_probe() */
87 ATA_EH_PROBE_TRIAL_INTERVAL = 60000, /* 1 min */
88 ATA_EH_PROBE_TRIALS = 2,
Tejun Heo31daabd2007-02-02 16:50:52 +090089};
90
91/* The following table determines how we sequence resets. Each entry
92 * represents timeout for that try. The first try can be soft or
93 * hardreset. All others are hardreset if available. In most cases
94 * the first reset w/ 10sec timeout should succeed. Following entries
95 * are mostly for error handling, hotplug and retarded devices.
96 */
97static const unsigned long ata_eh_reset_timeouts[] = {
Tejun Heo341c2c92008-05-20 02:17:51 +090098 10000, /* most drives spin up by 10sec */
99 10000, /* > 99% working drives spin up before 20sec */
100 35000, /* give > 30 secs of idleness for retarded devices */
101 5000, /* and sweet one last chance */
Tejun Heod8af0eb2008-05-20 02:17:53 +0900102 ULONG_MAX, /* > 1 min has elapsed, give up */
Tejun Heo31daabd2007-02-02 16:50:52 +0900103};
104
Tejun Heo87fbc5a2008-05-20 02:17:54 +0900105static const unsigned long ata_eh_identify_timeouts[] = {
106 5000, /* covers > 99% of successes and not too boring on failures */
107 10000, /* combined time till here is enough even for media access */
108 30000, /* for true idiots */
109 ULONG_MAX,
110};
111
112static const unsigned long ata_eh_other_timeouts[] = {
113 5000, /* same rationale as identify timeout */
114 10000, /* ditto */
115 /* but no merciful 30sec for other commands, it just isn't worth it */
116 ULONG_MAX,
117};
118
119struct ata_eh_cmd_timeout_ent {
120 const u8 *commands;
121 const unsigned long *timeouts;
122};
123
124/* The following table determines timeouts to use for EH internal
125 * commands. Each table entry is a command class and matches the
126 * commands the entry applies to and the timeout table to use.
127 *
128 * On the retry after a command timed out, the next timeout value from
129 * the table is used. If the table doesn't contain further entries,
130 * the last value is used.
131 *
132 * ehc->cmd_timeout_idx keeps track of which timeout to use per
133 * command class, so if SET_FEATURES times out on the first try, the
134 * next try will use the second timeout value only for that class.
135 */
136#define CMDS(cmds...) (const u8 []){ cmds, 0 }
137static const struct ata_eh_cmd_timeout_ent
138ata_eh_cmd_timeout_table[ATA_EH_CMD_TIMEOUT_TABLE_SIZE] = {
139 { .commands = CMDS(ATA_CMD_ID_ATA, ATA_CMD_ID_ATAPI),
140 .timeouts = ata_eh_identify_timeouts, },
141 { .commands = CMDS(ATA_CMD_READ_NATIVE_MAX, ATA_CMD_READ_NATIVE_MAX_EXT),
142 .timeouts = ata_eh_other_timeouts, },
143 { .commands = CMDS(ATA_CMD_SET_MAX, ATA_CMD_SET_MAX_EXT),
144 .timeouts = ata_eh_other_timeouts, },
145 { .commands = CMDS(ATA_CMD_SET_FEATURES),
146 .timeouts = ata_eh_other_timeouts, },
147 { .commands = CMDS(ATA_CMD_INIT_DEV_PARAMS),
148 .timeouts = ata_eh_other_timeouts, },
149};
150#undef CMDS
151
Tejun Heoad9e2762006-05-15 20:58:12 +0900152static void __ata_port_freeze(struct ata_port *ap);
Tejun Heo6ffa01d2007-03-02 17:32:47 +0900153#ifdef CONFIG_PM
Tejun Heo500530f2006-07-03 16:07:27 +0900154static void ata_eh_handle_port_suspend(struct ata_port *ap);
155static void ata_eh_handle_port_resume(struct ata_port *ap);
Tejun Heo6ffa01d2007-03-02 17:32:47 +0900156#else /* CONFIG_PM */
157static void ata_eh_handle_port_suspend(struct ata_port *ap)
158{ }
159
160static void ata_eh_handle_port_resume(struct ata_port *ap)
161{ }
Tejun Heo6ffa01d2007-03-02 17:32:47 +0900162#endif /* CONFIG_PM */
Tejun Heoad9e2762006-05-15 20:58:12 +0900163
Tejun Heob64bbc32007-07-16 14:29:39 +0900164static void __ata_ehi_pushv_desc(struct ata_eh_info *ehi, const char *fmt,
165 va_list args)
166{
167 ehi->desc_len += vscnprintf(ehi->desc + ehi->desc_len,
168 ATA_EH_DESC_LEN - ehi->desc_len,
169 fmt, args);
170}
171
172/**
173 * __ata_ehi_push_desc - push error description without adding separator
174 * @ehi: target EHI
175 * @fmt: printf format string
176 *
177 * Format string according to @fmt and append it to @ehi->desc.
178 *
179 * LOCKING:
180 * spin_lock_irqsave(host lock)
181 */
182void __ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...)
183{
184 va_list args;
185
186 va_start(args, fmt);
187 __ata_ehi_pushv_desc(ehi, fmt, args);
188 va_end(args);
189}
190
191/**
192 * ata_ehi_push_desc - push error description with separator
193 * @ehi: target EHI
194 * @fmt: printf format string
195 *
196 * Format string according to @fmt and append it to @ehi->desc.
197 * If @ehi->desc is not empty, ", " is added in-between.
198 *
199 * LOCKING:
200 * spin_lock_irqsave(host lock)
201 */
202void ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...)
203{
204 va_list args;
205
206 if (ehi->desc_len)
207 __ata_ehi_push_desc(ehi, ", ");
208
209 va_start(args, fmt);
210 __ata_ehi_pushv_desc(ehi, fmt, args);
211 va_end(args);
212}
213
214/**
215 * ata_ehi_clear_desc - clean error description
216 * @ehi: target EHI
217 *
218 * Clear @ehi->desc.
219 *
220 * LOCKING:
221 * spin_lock_irqsave(host lock)
222 */
223void ata_ehi_clear_desc(struct ata_eh_info *ehi)
224{
225 ehi->desc[0] = '\0';
226 ehi->desc_len = 0;
227}
228
Tejun Heocbcdd872007-08-18 13:14:55 +0900229/**
230 * ata_port_desc - append port description
231 * @ap: target ATA port
232 * @fmt: printf format string
233 *
234 * Format string according to @fmt and append it to port
235 * description. If port description is not empty, " " is added
236 * in-between. This function is to be used while initializing
237 * ata_host. The description is printed on host registration.
238 *
239 * LOCKING:
240 * None.
241 */
242void ata_port_desc(struct ata_port *ap, const char *fmt, ...)
243{
244 va_list args;
245
246 WARN_ON(!(ap->pflags & ATA_PFLAG_INITIALIZING));
247
248 if (ap->link.eh_info.desc_len)
249 __ata_ehi_push_desc(&ap->link.eh_info, " ");
250
251 va_start(args, fmt);
252 __ata_ehi_pushv_desc(&ap->link.eh_info, fmt, args);
253 va_end(args);
254}
255
256#ifdef CONFIG_PCI
257
258/**
259 * ata_port_pbar_desc - append PCI BAR description
260 * @ap: target ATA port
261 * @bar: target PCI BAR
262 * @offset: offset into PCI BAR
263 * @name: name of the area
264 *
265 * If @offset is negative, this function formats a string which
266 * contains the name, address, size and type of the BAR and
267 * appends it to the port description. If @offset is zero or
268 * positive, only name and offsetted address is appended.
269 *
270 * LOCKING:
271 * None.
272 */
273void ata_port_pbar_desc(struct ata_port *ap, int bar, ssize_t offset,
274 const char *name)
275{
276 struct pci_dev *pdev = to_pci_dev(ap->host->dev);
277 char *type = "";
278 unsigned long long start, len;
279
280 if (pci_resource_flags(pdev, bar) & IORESOURCE_MEM)
281 type = "m";
282 else if (pci_resource_flags(pdev, bar) & IORESOURCE_IO)
283 type = "i";
284
285 start = (unsigned long long)pci_resource_start(pdev, bar);
286 len = (unsigned long long)pci_resource_len(pdev, bar);
287
288 if (offset < 0)
289 ata_port_desc(ap, "%s %s%llu@0x%llx", name, type, len, start);
290 else
Andrew Mortone6a73ab2007-12-13 16:01:37 -0800291 ata_port_desc(ap, "%s 0x%llx", name,
292 start + (unsigned long long)offset);
Tejun Heocbcdd872007-08-18 13:14:55 +0900293}
294
295#endif /* CONFIG_PCI */
296
Tejun Heo87fbc5a2008-05-20 02:17:54 +0900297static int ata_lookup_timeout_table(u8 cmd)
298{
299 int i;
300
301 for (i = 0; i < ATA_EH_CMD_TIMEOUT_TABLE_SIZE; i++) {
302 const u8 *cur;
303
304 for (cur = ata_eh_cmd_timeout_table[i].commands; *cur; cur++)
305 if (*cur == cmd)
306 return i;
307 }
308
309 return -1;
310}
311
312/**
313 * ata_internal_cmd_timeout - determine timeout for an internal command
314 * @dev: target device
315 * @cmd: internal command to be issued
316 *
317 * Determine timeout for internal command @cmd for @dev.
318 *
319 * LOCKING:
320 * EH context.
321 *
322 * RETURNS:
323 * Determined timeout.
324 */
325unsigned long ata_internal_cmd_timeout(struct ata_device *dev, u8 cmd)
326{
327 struct ata_eh_context *ehc = &dev->link->eh_context;
328 int ent = ata_lookup_timeout_table(cmd);
329 int idx;
330
331 if (ent < 0)
332 return ATA_EH_CMD_DFL_TIMEOUT;
333
334 idx = ehc->cmd_timeout_idx[dev->devno][ent];
335 return ata_eh_cmd_timeout_table[ent].timeouts[idx];
336}
337
338/**
339 * ata_internal_cmd_timed_out - notification for internal command timeout
340 * @dev: target device
341 * @cmd: internal command which timed out
342 *
343 * Notify EH that internal command @cmd for @dev timed out. This
344 * function should be called only for commands whose timeouts are
345 * determined using ata_internal_cmd_timeout().
346 *
347 * LOCKING:
348 * EH context.
349 */
350void ata_internal_cmd_timed_out(struct ata_device *dev, u8 cmd)
351{
352 struct ata_eh_context *ehc = &dev->link->eh_context;
353 int ent = ata_lookup_timeout_table(cmd);
354 int idx;
355
356 if (ent < 0)
357 return;
358
359 idx = ehc->cmd_timeout_idx[dev->devno][ent];
360 if (ata_eh_cmd_timeout_table[ent].timeouts[idx + 1] != ULONG_MAX)
361 ehc->cmd_timeout_idx[dev->devno][ent]++;
362}
363
Tejun Heo3884f7b2007-11-27 19:28:56 +0900364static void ata_ering_record(struct ata_ering *ering, unsigned int eflags,
Tejun Heo0c247c52006-05-15 20:58:19 +0900365 unsigned int err_mask)
366{
367 struct ata_ering_entry *ent;
368
369 WARN_ON(!err_mask);
370
371 ering->cursor++;
372 ering->cursor %= ATA_ERING_SIZE;
373
374 ent = &ering->ring[ering->cursor];
Tejun Heo3884f7b2007-11-27 19:28:56 +0900375 ent->eflags = eflags;
Tejun Heo0c247c52006-05-15 20:58:19 +0900376 ent->err_mask = err_mask;
377 ent->timestamp = get_jiffies_64();
378}
379
Tejun Heo76326ac2007-11-27 19:28:59 +0900380static struct ata_ering_entry *ata_ering_top(struct ata_ering *ering)
381{
382 struct ata_ering_entry *ent = &ering->ring[ering->cursor];
383
384 if (ent->err_mask)
385 return ent;
386 return NULL;
387}
388
Tejun Heo7d47e8d2007-02-02 16:22:31 +0900389static void ata_ering_clear(struct ata_ering *ering)
Tejun Heo0c247c52006-05-15 20:58:19 +0900390{
Tejun Heo7d47e8d2007-02-02 16:22:31 +0900391 memset(ering, 0, sizeof(*ering));
Tejun Heo0c247c52006-05-15 20:58:19 +0900392}
393
394static int ata_ering_map(struct ata_ering *ering,
395 int (*map_fn)(struct ata_ering_entry *, void *),
396 void *arg)
397{
398 int idx, rc = 0;
399 struct ata_ering_entry *ent;
400
401 idx = ering->cursor;
402 do {
403 ent = &ering->ring[idx];
404 if (!ent->err_mask)
405 break;
406 rc = map_fn(ent, arg);
407 if (rc)
408 break;
409 idx = (idx - 1 + ATA_ERING_SIZE) % ATA_ERING_SIZE;
410 } while (idx != ering->cursor);
411
412 return rc;
413}
414
Tejun Heo64f65ca2006-06-24 20:30:18 +0900415static unsigned int ata_eh_dev_action(struct ata_device *dev)
416{
Tejun Heo9af5c9c2007-08-06 18:36:22 +0900417 struct ata_eh_context *ehc = &dev->link->eh_context;
Tejun Heo64f65ca2006-06-24 20:30:18 +0900418
419 return ehc->i.action | ehc->i.dev_action[dev->devno];
420}
421
Tejun Heof58229f2007-08-06 18:36:23 +0900422static void ata_eh_clear_action(struct ata_link *link, struct ata_device *dev,
Tejun Heoaf181c22006-06-24 20:30:18 +0900423 struct ata_eh_info *ehi, unsigned int action)
424{
Tejun Heof58229f2007-08-06 18:36:23 +0900425 struct ata_device *tdev;
Tejun Heoaf181c22006-06-24 20:30:18 +0900426
427 if (!dev) {
428 ehi->action &= ~action;
Tejun Heo1eca4362008-11-03 20:03:17 +0900429 ata_for_each_dev(tdev, link, ALL)
Tejun Heof58229f2007-08-06 18:36:23 +0900430 ehi->dev_action[tdev->devno] &= ~action;
Tejun Heoaf181c22006-06-24 20:30:18 +0900431 } else {
432 /* doesn't make sense for port-wide EH actions */
433 WARN_ON(!(action & ATA_EH_PERDEV_MASK));
434
435 /* break ehi->action into ehi->dev_action */
436 if (ehi->action & action) {
Tejun Heo1eca4362008-11-03 20:03:17 +0900437 ata_for_each_dev(tdev, link, ALL)
Tejun Heof58229f2007-08-06 18:36:23 +0900438 ehi->dev_action[tdev->devno] |=
439 ehi->action & action;
Tejun Heoaf181c22006-06-24 20:30:18 +0900440 ehi->action &= ~action;
441 }
442
443 /* turn off the specified per-dev action */
444 ehi->dev_action[dev->devno] &= ~action;
445 }
446}
447
Tejun Heoece1d632006-04-02 18:51:53 +0900448/**
449 * ata_scsi_timed_out - SCSI layer time out callback
450 * @cmd: timed out SCSI command
451 *
452 * Handles SCSI layer timeout. We race with normal completion of
453 * the qc for @cmd. If the qc is already gone, we lose and let
454 * the scsi command finish (EH_HANDLED). Otherwise, the qc has
455 * timed out and EH should be invoked. Prevent ata_qc_complete()
456 * from finishing it by setting EH_SCHEDULED and return
457 * EH_NOT_HANDLED.
458 *
Tejun Heoad9e2762006-05-15 20:58:12 +0900459 * TODO: kill this function once old EH is gone.
460 *
Tejun Heoece1d632006-04-02 18:51:53 +0900461 * LOCKING:
462 * Called from timer context
463 *
464 * RETURNS:
465 * EH_HANDLED or EH_NOT_HANDLED
466 */
Jens Axboe242f9dc2008-09-14 05:55:09 -0700467enum blk_eh_timer_return ata_scsi_timed_out(struct scsi_cmnd *cmd)
Tejun Heoece1d632006-04-02 18:51:53 +0900468{
469 struct Scsi_Host *host = cmd->device->host;
Jeff Garzik35bb94b2006-04-11 13:12:34 -0400470 struct ata_port *ap = ata_shost_to_port(host);
Tejun Heoece1d632006-04-02 18:51:53 +0900471 unsigned long flags;
472 struct ata_queued_cmd *qc;
Jens Axboe242f9dc2008-09-14 05:55:09 -0700473 enum blk_eh_timer_return ret;
Tejun Heoece1d632006-04-02 18:51:53 +0900474
475 DPRINTK("ENTER\n");
476
Tejun Heoad9e2762006-05-15 20:58:12 +0900477 if (ap->ops->error_handler) {
Jens Axboe242f9dc2008-09-14 05:55:09 -0700478 ret = BLK_EH_NOT_HANDLED;
Tejun Heoad9e2762006-05-15 20:58:12 +0900479 goto out;
480 }
481
Jens Axboe242f9dc2008-09-14 05:55:09 -0700482 ret = BLK_EH_HANDLED;
Jeff Garzikba6a1302006-06-22 23:46:10 -0400483 spin_lock_irqsave(ap->lock, flags);
Tejun Heo9af5c9c2007-08-06 18:36:22 +0900484 qc = ata_qc_from_tag(ap, ap->link.active_tag);
Tejun Heoece1d632006-04-02 18:51:53 +0900485 if (qc) {
486 WARN_ON(qc->scsicmd != cmd);
487 qc->flags |= ATA_QCFLAG_EH_SCHEDULED;
488 qc->err_mask |= AC_ERR_TIMEOUT;
Jens Axboe242f9dc2008-09-14 05:55:09 -0700489 ret = BLK_EH_NOT_HANDLED;
Tejun Heoece1d632006-04-02 18:51:53 +0900490 }
Jeff Garzikba6a1302006-06-22 23:46:10 -0400491 spin_unlock_irqrestore(ap->lock, flags);
Tejun Heoece1d632006-04-02 18:51:53 +0900492
Tejun Heoad9e2762006-05-15 20:58:12 +0900493 out:
Tejun Heoece1d632006-04-02 18:51:53 +0900494 DPRINTK("EXIT, ret=%d\n", ret);
495 return ret;
496}
497
Tejun Heoece180d2008-11-03 20:04:37 +0900498static void ata_eh_unload(struct ata_port *ap)
499{
500 struct ata_link *link;
501 struct ata_device *dev;
502 unsigned long flags;
503
504 /* Restore SControl IPM and SPD for the next driver and
505 * disable attached devices.
506 */
507 ata_for_each_link(link, ap, PMP_FIRST) {
508 sata_scr_write(link, SCR_CONTROL, link->saved_scontrol & 0xff0);
509 ata_for_each_dev(dev, link, ALL)
510 ata_dev_disable(dev);
511 }
512
513 /* freeze and set UNLOADED */
514 spin_lock_irqsave(ap->lock, flags);
515
516 ata_port_freeze(ap); /* won't be thawed */
517 ap->pflags &= ~ATA_PFLAG_EH_PENDING; /* clear pending from freeze */
518 ap->pflags |= ATA_PFLAG_UNLOADED;
519
520 spin_unlock_irqrestore(ap->lock, flags);
521}
522
Tejun Heoece1d632006-04-02 18:51:53 +0900523/**
524 * ata_scsi_error - SCSI layer error handler callback
525 * @host: SCSI host on which error occurred
526 *
527 * Handles SCSI-layer-thrown error events.
528 *
529 * LOCKING:
530 * Inherited from SCSI layer (none, can sleep)
531 *
532 * RETURNS:
533 * Zero.
534 */
Jeff Garzik381544b2006-04-11 13:04:39 -0400535void ata_scsi_error(struct Scsi_Host *host)
Tejun Heoece1d632006-04-02 18:51:53 +0900536{
Jeff Garzik35bb94b2006-04-11 13:12:34 -0400537 struct ata_port *ap = ata_shost_to_port(host);
Tejun Heoa1e10f72007-08-18 13:28:49 +0900538 int i;
Tejun Heoad9e2762006-05-15 20:58:12 +0900539 unsigned long flags;
Tejun Heoece1d632006-04-02 18:51:53 +0900540
541 DPRINTK("ENTER\n");
542
Tejun Heoad9e2762006-05-15 20:58:12 +0900543 /* synchronize with port task */
Tejun Heoece1d632006-04-02 18:51:53 +0900544 ata_port_flush_task(ap);
545
Jeff Garzikcca39742006-08-24 03:19:22 -0400546 /* synchronize with host lock and sort out timeouts */
Tejun Heoece1d632006-04-02 18:51:53 +0900547
Tejun Heoad9e2762006-05-15 20:58:12 +0900548 /* For new EH, all qcs are finished in one of three ways -
549 * normal completion, error completion, and SCSI timeout.
Alan Coxc96f1732009-03-24 10:23:46 +0000550 * Both completions can race against SCSI timeout. When normal
Tejun Heoad9e2762006-05-15 20:58:12 +0900551 * completion wins, the qc never reaches EH. When error
552 * completion wins, the qc has ATA_QCFLAG_FAILED set.
553 *
554 * When SCSI timeout wins, things are a bit more complex.
555 * Normal or error completion can occur after the timeout but
556 * before this point. In such cases, both types of
557 * completions are honored. A scmd is determined to have
558 * timed out iff its associated qc is active and not failed.
559 */
560 if (ap->ops->error_handler) {
561 struct scsi_cmnd *scmd, *tmp;
562 int nr_timedout = 0;
Tejun Heoece1d632006-04-02 18:51:53 +0900563
Tejun Heoe30349d2006-07-03 03:02:15 +0900564 spin_lock_irqsave(ap->lock, flags);
Alan Coxc96f1732009-03-24 10:23:46 +0000565
566 /* This must occur under the ap->lock as we don't want
567 a polled recovery to race the real interrupt handler
568
569 The lost_interrupt handler checks for any completed but
570 non-notified command and completes much like an IRQ handler.
571
572 We then fall into the error recovery code which will treat
573 this as if normal completion won the race */
Tejun Heoad9e2762006-05-15 20:58:12 +0900574
Alan Coxc96f1732009-03-24 10:23:46 +0000575 if (ap->ops->lost_interrupt)
576 ap->ops->lost_interrupt(ap);
577
Tejun Heoad9e2762006-05-15 20:58:12 +0900578 list_for_each_entry_safe(scmd, tmp, &host->eh_cmd_q, eh_entry) {
579 struct ata_queued_cmd *qc;
580
581 for (i = 0; i < ATA_MAX_QUEUE; i++) {
582 qc = __ata_qc_from_tag(ap, i);
583 if (qc->flags & ATA_QCFLAG_ACTIVE &&
584 qc->scsicmd == scmd)
585 break;
586 }
587
588 if (i < ATA_MAX_QUEUE) {
589 /* the scmd has an associated qc */
590 if (!(qc->flags & ATA_QCFLAG_FAILED)) {
591 /* which hasn't failed yet, timeout */
592 qc->err_mask |= AC_ERR_TIMEOUT;
593 qc->flags |= ATA_QCFLAG_FAILED;
594 nr_timedout++;
595 }
596 } else {
597 /* Normal completion occurred after
598 * SCSI timeout but before this point.
599 * Successfully complete it.
600 */
601 scmd->retries = scmd->allowed;
602 scsi_eh_finish_cmd(scmd, &ap->eh_done_q);
603 }
604 }
605
606 /* If we have timed out qcs. They belong to EH from
607 * this point but the state of the controller is
608 * unknown. Freeze the port to make sure the IRQ
609 * handler doesn't diddle with those qcs. This must
610 * be done atomically w.r.t. setting QCFLAG_FAILED.
611 */
612 if (nr_timedout)
613 __ata_port_freeze(ap);
614
Tejun Heoe30349d2006-07-03 03:02:15 +0900615 spin_unlock_irqrestore(ap->lock, flags);
Tejun Heoa1e10f72007-08-18 13:28:49 +0900616
617 /* initialize eh_tries */
618 ap->eh_tries = ATA_EH_MAX_TRIES;
Tejun Heoad9e2762006-05-15 20:58:12 +0900619 } else
Tejun Heoe30349d2006-07-03 03:02:15 +0900620 spin_unlock_wait(ap->lock);
Alan Coxc96f1732009-03-24 10:23:46 +0000621
622 /* If we timed raced normal completion and there is nothing to
623 recover nr_timedout == 0 why exactly are we doing error recovery ? */
Tejun Heoad9e2762006-05-15 20:58:12 +0900624
625 repeat:
626 /* invoke error handler */
627 if (ap->ops->error_handler) {
Tejun Heocf1b86c2007-08-06 18:36:23 +0900628 struct ata_link *link;
629
Tejun Heo5ddf24c2007-07-16 14:29:41 +0900630 /* kill fast drain timer */
631 del_timer_sync(&ap->fastdrain_timer);
632
Tejun Heo500530f2006-07-03 16:07:27 +0900633 /* process port resume request */
634 ata_eh_handle_port_resume(ap);
635
Tejun Heof3e81b12006-05-15 20:58:21 +0900636 /* fetch & clear EH info */
Tejun Heoe30349d2006-07-03 03:02:15 +0900637 spin_lock_irqsave(ap->lock, flags);
Tejun Heof3e81b12006-05-15 20:58:21 +0900638
Tejun Heo1eca4362008-11-03 20:03:17 +0900639 ata_for_each_link(link, ap, HOST_FIRST) {
Tejun Heo00115e02007-11-27 19:28:58 +0900640 struct ata_eh_context *ehc = &link->eh_context;
641 struct ata_device *dev;
642
Tejun Heocf1b86c2007-08-06 18:36:23 +0900643 memset(&link->eh_context, 0, sizeof(link->eh_context));
644 link->eh_context.i = link->eh_info;
645 memset(&link->eh_info, 0, sizeof(link->eh_info));
Tejun Heo00115e02007-11-27 19:28:58 +0900646
Tejun Heo1eca4362008-11-03 20:03:17 +0900647 ata_for_each_dev(dev, link, ENABLED) {
Tejun Heo00115e02007-11-27 19:28:58 +0900648 int devno = dev->devno;
649
650 ehc->saved_xfer_mode[devno] = dev->xfer_mode;
651 if (ata_ncq_enabled(dev))
652 ehc->saved_ncq_enabled |= 1 << devno;
653 }
Tejun Heocf1b86c2007-08-06 18:36:23 +0900654 }
Tejun Heof3e81b12006-05-15 20:58:21 +0900655
Tejun Heob51e9e52006-06-29 01:29:30 +0900656 ap->pflags |= ATA_PFLAG_EH_IN_PROGRESS;
657 ap->pflags &= ~ATA_PFLAG_EH_PENDING;
Tejun Heoda917d62007-09-23 13:14:12 +0900658 ap->excl_link = NULL; /* don't maintain exclusion over EH */
Tejun Heof3e81b12006-05-15 20:58:21 +0900659
Tejun Heoe30349d2006-07-03 03:02:15 +0900660 spin_unlock_irqrestore(ap->lock, flags);
Tejun Heoad9e2762006-05-15 20:58:12 +0900661
Tejun Heo500530f2006-07-03 16:07:27 +0900662 /* invoke EH, skip if unloading or suspended */
663 if (!(ap->pflags & (ATA_PFLAG_UNLOADING | ATA_PFLAG_SUSPENDED)))
Tejun Heo720ba122006-05-31 18:28:13 +0900664 ap->ops->error_handler(ap);
Tejun Heoece180d2008-11-03 20:04:37 +0900665 else {
666 /* if unloading, commence suicide */
667 if ((ap->pflags & ATA_PFLAG_UNLOADING) &&
668 !(ap->pflags & ATA_PFLAG_UNLOADED))
669 ata_eh_unload(ap);
Tejun Heo720ba122006-05-31 18:28:13 +0900670 ata_eh_finish(ap);
Tejun Heoece180d2008-11-03 20:04:37 +0900671 }
Tejun Heoad9e2762006-05-15 20:58:12 +0900672
Tejun Heo500530f2006-07-03 16:07:27 +0900673 /* process port suspend request */
674 ata_eh_handle_port_suspend(ap);
675
Tejun Heoad9e2762006-05-15 20:58:12 +0900676 /* Exception might have happend after ->error_handler
677 * recovered the port but before this point. Repeat
678 * EH in such case.
679 */
Tejun Heoe30349d2006-07-03 03:02:15 +0900680 spin_lock_irqsave(ap->lock, flags);
Tejun Heoad9e2762006-05-15 20:58:12 +0900681
Tejun Heob51e9e52006-06-29 01:29:30 +0900682 if (ap->pflags & ATA_PFLAG_EH_PENDING) {
Tejun Heoa1e10f72007-08-18 13:28:49 +0900683 if (--ap->eh_tries) {
Tejun Heoe30349d2006-07-03 03:02:15 +0900684 spin_unlock_irqrestore(ap->lock, flags);
Tejun Heoad9e2762006-05-15 20:58:12 +0900685 goto repeat;
686 }
687 ata_port_printk(ap, KERN_ERR, "EH pending after %d "
Tejun Heoa1e10f72007-08-18 13:28:49 +0900688 "tries, giving up\n", ATA_EH_MAX_TRIES);
Tejun Heo914616a2007-06-25 21:47:11 +0900689 ap->pflags &= ~ATA_PFLAG_EH_PENDING;
Tejun Heoad9e2762006-05-15 20:58:12 +0900690 }
691
Tejun Heof3e81b12006-05-15 20:58:21 +0900692 /* this run is complete, make sure EH info is clear */
Tejun Heo1eca4362008-11-03 20:03:17 +0900693 ata_for_each_link(link, ap, HOST_FIRST)
Tejun Heocf1b86c2007-08-06 18:36:23 +0900694 memset(&link->eh_info, 0, sizeof(link->eh_info));
Tejun Heof3e81b12006-05-15 20:58:21 +0900695
Tejun Heoe30349d2006-07-03 03:02:15 +0900696 /* Clear host_eh_scheduled while holding ap->lock such
Tejun Heoad9e2762006-05-15 20:58:12 +0900697 * that if exception occurs after this point but
698 * before EH completion, SCSI midlayer will
699 * re-initiate EH.
700 */
701 host->host_eh_scheduled = 0;
702
Tejun Heoe30349d2006-07-03 03:02:15 +0900703 spin_unlock_irqrestore(ap->lock, flags);
Tejun Heoad9e2762006-05-15 20:58:12 +0900704 } else {
Tejun Heo9af5c9c2007-08-06 18:36:22 +0900705 WARN_ON(ata_qc_from_tag(ap, ap->link.active_tag) == NULL);
Tejun Heoad9e2762006-05-15 20:58:12 +0900706 ap->ops->eng_timeout(ap);
707 }
708
709 /* finish or retry handled scmd's and clean up */
Tejun Heoece1d632006-04-02 18:51:53 +0900710 WARN_ON(host->host_failed || !list_empty(&host->eh_cmd_q));
711
712 scsi_eh_flush_done_q(&ap->eh_done_q);
713
Tejun Heoad9e2762006-05-15 20:58:12 +0900714 /* clean up */
Tejun Heoe30349d2006-07-03 03:02:15 +0900715 spin_lock_irqsave(ap->lock, flags);
Tejun Heoad9e2762006-05-15 20:58:12 +0900716
Tejun Heo1cdaf532006-07-03 16:07:26 +0900717 if (ap->pflags & ATA_PFLAG_LOADING)
Tejun Heob51e9e52006-06-29 01:29:30 +0900718 ap->pflags &= ~ATA_PFLAG_LOADING;
Tejun Heo1cdaf532006-07-03 16:07:26 +0900719 else if (ap->pflags & ATA_PFLAG_SCSI_HOTPLUG)
David Howells52bad642006-11-22 14:54:01 +0000720 queue_delayed_work(ata_aux_wq, &ap->hotplug_task, 0);
Tejun Heo1cdaf532006-07-03 16:07:26 +0900721
722 if (ap->pflags & ATA_PFLAG_RECOVERED)
723 ata_port_printk(ap, KERN_INFO, "EH complete\n");
Tejun Heo580b21022006-05-31 18:28:05 +0900724
Tejun Heob51e9e52006-06-29 01:29:30 +0900725 ap->pflags &= ~(ATA_PFLAG_SCSI_HOTPLUG | ATA_PFLAG_RECOVERED);
Tejun Heoad9e2762006-05-15 20:58:12 +0900726
Tejun Heoc6cf9e92006-05-31 18:27:27 +0900727 /* tell wait_eh that we're done */
Tejun Heob51e9e52006-06-29 01:29:30 +0900728 ap->pflags &= ~ATA_PFLAG_EH_IN_PROGRESS;
Tejun Heoc6cf9e92006-05-31 18:27:27 +0900729 wake_up_all(&ap->eh_wait_q);
730
Tejun Heoe30349d2006-07-03 03:02:15 +0900731 spin_unlock_irqrestore(ap->lock, flags);
Tejun Heoad9e2762006-05-15 20:58:12 +0900732
Tejun Heoece1d632006-04-02 18:51:53 +0900733 DPRINTK("EXIT\n");
Tejun Heoece1d632006-04-02 18:51:53 +0900734}
735
736/**
Tejun Heoc6cf9e92006-05-31 18:27:27 +0900737 * ata_port_wait_eh - Wait for the currently pending EH to complete
738 * @ap: Port to wait EH for
739 *
740 * Wait until the currently pending EH is complete.
741 *
742 * LOCKING:
743 * Kernel thread context (may sleep).
744 */
745void ata_port_wait_eh(struct ata_port *ap)
746{
747 unsigned long flags;
748 DEFINE_WAIT(wait);
749
750 retry:
Jeff Garzikba6a1302006-06-22 23:46:10 -0400751 spin_lock_irqsave(ap->lock, flags);
Tejun Heoc6cf9e92006-05-31 18:27:27 +0900752
Tejun Heob51e9e52006-06-29 01:29:30 +0900753 while (ap->pflags & (ATA_PFLAG_EH_PENDING | ATA_PFLAG_EH_IN_PROGRESS)) {
Tejun Heoc6cf9e92006-05-31 18:27:27 +0900754 prepare_to_wait(&ap->eh_wait_q, &wait, TASK_UNINTERRUPTIBLE);
Jeff Garzikba6a1302006-06-22 23:46:10 -0400755 spin_unlock_irqrestore(ap->lock, flags);
Tejun Heoc6cf9e92006-05-31 18:27:27 +0900756 schedule();
Jeff Garzikba6a1302006-06-22 23:46:10 -0400757 spin_lock_irqsave(ap->lock, flags);
Tejun Heoc6cf9e92006-05-31 18:27:27 +0900758 }
Tejun Heo0a1b6222006-06-11 11:01:38 +0900759 finish_wait(&ap->eh_wait_q, &wait);
Tejun Heoc6cf9e92006-05-31 18:27:27 +0900760
Jeff Garzikba6a1302006-06-22 23:46:10 -0400761 spin_unlock_irqrestore(ap->lock, flags);
Tejun Heoc6cf9e92006-05-31 18:27:27 +0900762
763 /* make sure SCSI EH is complete */
Jeff Garzikcca39742006-08-24 03:19:22 -0400764 if (scsi_host_in_recovery(ap->scsi_host)) {
Tejun Heoc6cf9e92006-05-31 18:27:27 +0900765 msleep(10);
766 goto retry;
767 }
768}
769
Tejun Heo5ddf24c2007-07-16 14:29:41 +0900770static int ata_eh_nr_in_flight(struct ata_port *ap)
771{
772 unsigned int tag;
773 int nr = 0;
774
775 /* count only non-internal commands */
776 for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++)
777 if (ata_qc_from_tag(ap, tag))
778 nr++;
779
780 return nr;
781}
782
783void ata_eh_fastdrain_timerfn(unsigned long arg)
784{
785 struct ata_port *ap = (void *)arg;
786 unsigned long flags;
787 int cnt;
788
789 spin_lock_irqsave(ap->lock, flags);
790
791 cnt = ata_eh_nr_in_flight(ap);
792
793 /* are we done? */
794 if (!cnt)
795 goto out_unlock;
796
797 if (cnt == ap->fastdrain_cnt) {
798 unsigned int tag;
799
800 /* No progress during the last interval, tag all
801 * in-flight qcs as timed out and freeze the port.
802 */
803 for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++) {
804 struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag);
805 if (qc)
806 qc->err_mask |= AC_ERR_TIMEOUT;
807 }
808
809 ata_port_freeze(ap);
810 } else {
811 /* some qcs have finished, give it another chance */
812 ap->fastdrain_cnt = cnt;
813 ap->fastdrain_timer.expires =
Tejun Heo341c2c92008-05-20 02:17:51 +0900814 ata_deadline(jiffies, ATA_EH_FASTDRAIN_INTERVAL);
Tejun Heo5ddf24c2007-07-16 14:29:41 +0900815 add_timer(&ap->fastdrain_timer);
816 }
817
818 out_unlock:
819 spin_unlock_irqrestore(ap->lock, flags);
820}
821
822/**
823 * ata_eh_set_pending - set ATA_PFLAG_EH_PENDING and activate fast drain
824 * @ap: target ATA port
825 * @fastdrain: activate fast drain
826 *
827 * Set ATA_PFLAG_EH_PENDING and activate fast drain if @fastdrain
828 * is non-zero and EH wasn't pending before. Fast drain ensures
829 * that EH kicks in in timely manner.
830 *
831 * LOCKING:
832 * spin_lock_irqsave(host lock)
833 */
834static void ata_eh_set_pending(struct ata_port *ap, int fastdrain)
835{
836 int cnt;
837
838 /* already scheduled? */
839 if (ap->pflags & ATA_PFLAG_EH_PENDING)
840 return;
841
842 ap->pflags |= ATA_PFLAG_EH_PENDING;
843
844 if (!fastdrain)
845 return;
846
847 /* do we have in-flight qcs? */
848 cnt = ata_eh_nr_in_flight(ap);
849 if (!cnt)
850 return;
851
852 /* activate fast drain */
853 ap->fastdrain_cnt = cnt;
Tejun Heo341c2c92008-05-20 02:17:51 +0900854 ap->fastdrain_timer.expires =
855 ata_deadline(jiffies, ATA_EH_FASTDRAIN_INTERVAL);
Tejun Heo5ddf24c2007-07-16 14:29:41 +0900856 add_timer(&ap->fastdrain_timer);
857}
858
Tejun Heof686bcb2006-05-15 20:58:05 +0900859/**
860 * ata_qc_schedule_eh - schedule qc for error handling
861 * @qc: command to schedule error handling for
862 *
863 * Schedule error handling for @qc. EH will kick in as soon as
864 * other commands are drained.
865 *
866 * LOCKING:
Jeff Garzikcca39742006-08-24 03:19:22 -0400867 * spin_lock_irqsave(host lock)
Tejun Heof686bcb2006-05-15 20:58:05 +0900868 */
869void ata_qc_schedule_eh(struct ata_queued_cmd *qc)
870{
871 struct ata_port *ap = qc->ap;
872
873 WARN_ON(!ap->ops->error_handler);
874
875 qc->flags |= ATA_QCFLAG_FAILED;
Tejun Heo5ddf24c2007-07-16 14:29:41 +0900876 ata_eh_set_pending(ap, 1);
Tejun Heof686bcb2006-05-15 20:58:05 +0900877
878 /* The following will fail if timeout has already expired.
879 * ata_scsi_error() takes care of such scmds on EH entry.
880 * Note that ATA_QCFLAG_FAILED is unconditionally set after
881 * this function completes.
882 */
Jens Axboe242f9dc2008-09-14 05:55:09 -0700883 blk_abort_request(qc->scsicmd->request);
Tejun Heof686bcb2006-05-15 20:58:05 +0900884}
885
Tejun Heo7b70fc02006-05-15 20:58:07 +0900886/**
887 * ata_port_schedule_eh - schedule error handling without a qc
888 * @ap: ATA port to schedule EH for
889 *
890 * Schedule error handling for @ap. EH will kick in as soon as
891 * all commands are drained.
892 *
893 * LOCKING:
Jeff Garzikcca39742006-08-24 03:19:22 -0400894 * spin_lock_irqsave(host lock)
Tejun Heo7b70fc02006-05-15 20:58:07 +0900895 */
896void ata_port_schedule_eh(struct ata_port *ap)
897{
898 WARN_ON(!ap->ops->error_handler);
899
Tejun Heof4d6d002007-05-01 11:50:15 +0200900 if (ap->pflags & ATA_PFLAG_INITIALIZING)
901 return;
902
Tejun Heo5ddf24c2007-07-16 14:29:41 +0900903 ata_eh_set_pending(ap, 1);
Jeff Garzikcca39742006-08-24 03:19:22 -0400904 scsi_schedule_eh(ap->scsi_host);
Tejun Heo7b70fc02006-05-15 20:58:07 +0900905
906 DPRINTK("port EH scheduled\n");
907}
908
Tejun Heodbd82612007-08-06 18:36:23 +0900909static int ata_do_link_abort(struct ata_port *ap, struct ata_link *link)
Tejun Heo7b70fc02006-05-15 20:58:07 +0900910{
911 int tag, nr_aborted = 0;
912
913 WARN_ON(!ap->ops->error_handler);
914
Tejun Heo5ddf24c2007-07-16 14:29:41 +0900915 /* we're gonna abort all commands, no need for fast drain */
916 ata_eh_set_pending(ap, 0);
917
Tejun Heo7b70fc02006-05-15 20:58:07 +0900918 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) {
919 struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag);
920
Tejun Heodbd82612007-08-06 18:36:23 +0900921 if (qc && (!link || qc->dev->link == link)) {
Tejun Heo7b70fc02006-05-15 20:58:07 +0900922 qc->flags |= ATA_QCFLAG_FAILED;
923 ata_qc_complete(qc);
924 nr_aborted++;
925 }
926 }
927
928 if (!nr_aborted)
929 ata_port_schedule_eh(ap);
930
931 return nr_aborted;
932}
933
Tejun Heoe3180492006-05-15 20:58:09 +0900934/**
Tejun Heodbd82612007-08-06 18:36:23 +0900935 * ata_link_abort - abort all qc's on the link
936 * @link: ATA link to abort qc's for
937 *
938 * Abort all active qc's active on @link and schedule EH.
939 *
940 * LOCKING:
941 * spin_lock_irqsave(host lock)
942 *
943 * RETURNS:
944 * Number of aborted qc's.
945 */
946int ata_link_abort(struct ata_link *link)
947{
948 return ata_do_link_abort(link->ap, link);
949}
950
951/**
952 * ata_port_abort - abort all qc's on the port
953 * @ap: ATA port to abort qc's for
954 *
955 * Abort all active qc's of @ap and schedule EH.
956 *
957 * LOCKING:
958 * spin_lock_irqsave(host_set lock)
959 *
960 * RETURNS:
961 * Number of aborted qc's.
962 */
963int ata_port_abort(struct ata_port *ap)
964{
965 return ata_do_link_abort(ap, NULL);
966}
967
968/**
Tejun Heoe3180492006-05-15 20:58:09 +0900969 * __ata_port_freeze - freeze port
970 * @ap: ATA port to freeze
971 *
972 * This function is called when HSM violation or some other
973 * condition disrupts normal operation of the port. Frozen port
974 * is not allowed to perform any operation until the port is
975 * thawed, which usually follows a successful reset.
976 *
977 * ap->ops->freeze() callback can be used for freezing the port
978 * hardware-wise (e.g. mask interrupt and stop DMA engine). If a
979 * port cannot be frozen hardware-wise, the interrupt handler
980 * must ack and clear interrupts unconditionally while the port
981 * is frozen.
982 *
983 * LOCKING:
Jeff Garzikcca39742006-08-24 03:19:22 -0400984 * spin_lock_irqsave(host lock)
Tejun Heoe3180492006-05-15 20:58:09 +0900985 */
986static void __ata_port_freeze(struct ata_port *ap)
987{
988 WARN_ON(!ap->ops->error_handler);
989
990 if (ap->ops->freeze)
991 ap->ops->freeze(ap);
992
Tejun Heob51e9e52006-06-29 01:29:30 +0900993 ap->pflags |= ATA_PFLAG_FROZEN;
Tejun Heoe3180492006-05-15 20:58:09 +0900994
Tejun Heo44877b42007-02-21 01:06:51 +0900995 DPRINTK("ata%u port frozen\n", ap->print_id);
Tejun Heoe3180492006-05-15 20:58:09 +0900996}
997
998/**
999 * ata_port_freeze - abort & freeze port
1000 * @ap: ATA port to freeze
1001 *
Jeff Garzik54c38442009-04-07 19:13:15 -04001002 * Abort and freeze @ap. The freeze operation must be called
1003 * first, because some hardware requires special operations
1004 * before the taskfile registers are accessible.
Tejun Heoe3180492006-05-15 20:58:09 +09001005 *
1006 * LOCKING:
Jeff Garzikcca39742006-08-24 03:19:22 -04001007 * spin_lock_irqsave(host lock)
Tejun Heoe3180492006-05-15 20:58:09 +09001008 *
1009 * RETURNS:
1010 * Number of aborted commands.
1011 */
1012int ata_port_freeze(struct ata_port *ap)
1013{
1014 int nr_aborted;
1015
1016 WARN_ON(!ap->ops->error_handler);
1017
Tejun Heoe3180492006-05-15 20:58:09 +09001018 __ata_port_freeze(ap);
Jeff Garzik54c38442009-04-07 19:13:15 -04001019 nr_aborted = ata_port_abort(ap);
Tejun Heoe3180492006-05-15 20:58:09 +09001020
1021 return nr_aborted;
1022}
1023
1024/**
Tejun Heo7d77b242007-09-23 13:14:13 +09001025 * sata_async_notification - SATA async notification handler
1026 * @ap: ATA port where async notification is received
1027 *
1028 * Handler to be called when async notification via SDB FIS is
1029 * received. This function schedules EH if necessary.
1030 *
1031 * LOCKING:
1032 * spin_lock_irqsave(host lock)
1033 *
1034 * RETURNS:
1035 * 1 if EH is scheduled, 0 otherwise.
1036 */
1037int sata_async_notification(struct ata_port *ap)
1038{
1039 u32 sntf;
1040 int rc;
1041
1042 if (!(ap->flags & ATA_FLAG_AN))
1043 return 0;
1044
1045 rc = sata_scr_read(&ap->link, SCR_NOTIFICATION, &sntf);
1046 if (rc == 0)
1047 sata_scr_write(&ap->link, SCR_NOTIFICATION, sntf);
1048
Tejun Heo071f44b2008-04-07 22:47:22 +09001049 if (!sata_pmp_attached(ap) || rc) {
Tejun Heo7d77b242007-09-23 13:14:13 +09001050 /* PMP is not attached or SNTF is not available */
Tejun Heo071f44b2008-04-07 22:47:22 +09001051 if (!sata_pmp_attached(ap)) {
Tejun Heo7d77b242007-09-23 13:14:13 +09001052 /* PMP is not attached. Check whether ATAPI
1053 * AN is configured. If so, notify media
1054 * change.
1055 */
1056 struct ata_device *dev = ap->link.device;
1057
1058 if ((dev->class == ATA_DEV_ATAPI) &&
1059 (dev->flags & ATA_DFLAG_AN))
1060 ata_scsi_media_change_notify(dev);
1061 return 0;
1062 } else {
1063 /* PMP is attached but SNTF is not available.
1064 * ATAPI async media change notification is
1065 * not used. The PMP must be reporting PHY
1066 * status change, schedule EH.
1067 */
1068 ata_port_schedule_eh(ap);
1069 return 1;
1070 }
1071 } else {
1072 /* PMP is attached and SNTF is available */
1073 struct ata_link *link;
1074
1075 /* check and notify ATAPI AN */
Tejun Heo1eca4362008-11-03 20:03:17 +09001076 ata_for_each_link(link, ap, EDGE) {
Tejun Heo7d77b242007-09-23 13:14:13 +09001077 if (!(sntf & (1 << link->pmp)))
1078 continue;
1079
1080 if ((link->device->class == ATA_DEV_ATAPI) &&
1081 (link->device->flags & ATA_DFLAG_AN))
1082 ata_scsi_media_change_notify(link->device);
1083 }
1084
1085 /* If PMP is reporting that PHY status of some
1086 * downstream ports has changed, schedule EH.
1087 */
1088 if (sntf & (1 << SATA_PMP_CTRL_PORT)) {
1089 ata_port_schedule_eh(ap);
1090 return 1;
1091 }
1092
1093 return 0;
1094 }
1095}
1096
1097/**
Tejun Heoe3180492006-05-15 20:58:09 +09001098 * ata_eh_freeze_port - EH helper to freeze port
1099 * @ap: ATA port to freeze
1100 *
1101 * Freeze @ap.
1102 *
1103 * LOCKING:
1104 * None.
1105 */
1106void ata_eh_freeze_port(struct ata_port *ap)
1107{
1108 unsigned long flags;
1109
1110 if (!ap->ops->error_handler)
1111 return;
1112
Jeff Garzikba6a1302006-06-22 23:46:10 -04001113 spin_lock_irqsave(ap->lock, flags);
Tejun Heoe3180492006-05-15 20:58:09 +09001114 __ata_port_freeze(ap);
Jeff Garzikba6a1302006-06-22 23:46:10 -04001115 spin_unlock_irqrestore(ap->lock, flags);
Tejun Heoe3180492006-05-15 20:58:09 +09001116}
1117
1118/**
1119 * ata_port_thaw_port - EH helper to thaw port
1120 * @ap: ATA port to thaw
1121 *
1122 * Thaw frozen port @ap.
1123 *
1124 * LOCKING:
1125 * None.
1126 */
1127void ata_eh_thaw_port(struct ata_port *ap)
1128{
1129 unsigned long flags;
1130
1131 if (!ap->ops->error_handler)
1132 return;
1133
Jeff Garzikba6a1302006-06-22 23:46:10 -04001134 spin_lock_irqsave(ap->lock, flags);
Tejun Heoe3180492006-05-15 20:58:09 +09001135
Tejun Heob51e9e52006-06-29 01:29:30 +09001136 ap->pflags &= ~ATA_PFLAG_FROZEN;
Tejun Heoe3180492006-05-15 20:58:09 +09001137
1138 if (ap->ops->thaw)
1139 ap->ops->thaw(ap);
1140
Jeff Garzikba6a1302006-06-22 23:46:10 -04001141 spin_unlock_irqrestore(ap->lock, flags);
Tejun Heoe3180492006-05-15 20:58:09 +09001142
Tejun Heo44877b42007-02-21 01:06:51 +09001143 DPRINTK("ata%u port thawed\n", ap->print_id);
Tejun Heoe3180492006-05-15 20:58:09 +09001144}
1145
Tejun Heoece1d632006-04-02 18:51:53 +09001146static void ata_eh_scsidone(struct scsi_cmnd *scmd)
1147{
1148 /* nada */
1149}
1150
1151static void __ata_eh_qc_complete(struct ata_queued_cmd *qc)
1152{
1153 struct ata_port *ap = qc->ap;
1154 struct scsi_cmnd *scmd = qc->scsicmd;
1155 unsigned long flags;
1156
Jeff Garzikba6a1302006-06-22 23:46:10 -04001157 spin_lock_irqsave(ap->lock, flags);
Tejun Heoece1d632006-04-02 18:51:53 +09001158 qc->scsidone = ata_eh_scsidone;
1159 __ata_qc_complete(qc);
1160 WARN_ON(ata_tag_valid(qc->tag));
Jeff Garzikba6a1302006-06-22 23:46:10 -04001161 spin_unlock_irqrestore(ap->lock, flags);
Tejun Heoece1d632006-04-02 18:51:53 +09001162
1163 scsi_eh_finish_cmd(scmd, &ap->eh_done_q);
1164}
1165
1166/**
1167 * ata_eh_qc_complete - Complete an active ATA command from EH
1168 * @qc: Command to complete
1169 *
1170 * Indicate to the mid and upper layers that an ATA command has
1171 * completed. To be used from EH.
1172 */
1173void ata_eh_qc_complete(struct ata_queued_cmd *qc)
1174{
1175 struct scsi_cmnd *scmd = qc->scsicmd;
1176 scmd->retries = scmd->allowed;
1177 __ata_eh_qc_complete(qc);
1178}
1179
1180/**
1181 * ata_eh_qc_retry - Tell midlayer to retry an ATA command after EH
1182 * @qc: Command to retry
1183 *
1184 * Indicate to the mid and upper layers that an ATA command
1185 * should be retried. To be used from EH.
1186 *
1187 * SCSI midlayer limits the number of retries to scmd->allowed.
1188 * scmd->retries is decremented for commands which get retried
1189 * due to unrelated failures (qc->err_mask is zero).
1190 */
1191void ata_eh_qc_retry(struct ata_queued_cmd *qc)
1192{
1193 struct scsi_cmnd *scmd = qc->scsicmd;
1194 if (!qc->err_mask && scmd->retries)
1195 scmd->retries--;
1196 __ata_eh_qc_complete(qc);
1197}
Tejun Heo022bdb02006-05-15 20:58:22 +09001198
1199/**
Tejun Heo678afac2009-01-29 20:31:30 +09001200 * ata_dev_disable - disable ATA device
1201 * @dev: ATA device to disable
1202 *
1203 * Disable @dev.
1204 *
1205 * Locking:
1206 * EH context.
1207 */
1208void ata_dev_disable(struct ata_device *dev)
1209{
1210 if (!ata_dev_enabled(dev))
1211 return;
1212
1213 if (ata_msg_drv(dev->link->ap))
1214 ata_dev_printk(dev, KERN_WARNING, "disabled\n");
1215 ata_acpi_on_disable(dev);
1216 ata_down_xfermask_limit(dev, ATA_DNXFER_FORCE_PIO0 | ATA_DNXFER_QUIET);
1217 dev->class++;
Tejun Heo99cf6102009-01-29 20:31:32 +09001218
1219 /* From now till the next successful probe, ering is used to
1220 * track probe failures. Clear accumulated device error info.
1221 */
1222 ata_ering_clear(&dev->ering);
Tejun Heo678afac2009-01-29 20:31:30 +09001223}
1224
1225/**
Tejun Heo0ea035a2006-05-31 18:28:01 +09001226 * ata_eh_detach_dev - detach ATA device
1227 * @dev: ATA device to detach
1228 *
1229 * Detach @dev.
1230 *
1231 * LOCKING:
1232 * None.
1233 */
Tejun Heofb7fd612007-09-23 13:14:12 +09001234void ata_eh_detach_dev(struct ata_device *dev)
Tejun Heo0ea035a2006-05-31 18:28:01 +09001235{
Tejun Heof58229f2007-08-06 18:36:23 +09001236 struct ata_link *link = dev->link;
1237 struct ata_port *ap = link->ap;
Tejun Heo90484eb2008-10-26 15:43:03 +09001238 struct ata_eh_context *ehc = &link->eh_context;
Tejun Heo0ea035a2006-05-31 18:28:01 +09001239 unsigned long flags;
1240
1241 ata_dev_disable(dev);
1242
Jeff Garzikba6a1302006-06-22 23:46:10 -04001243 spin_lock_irqsave(ap->lock, flags);
Tejun Heo0ea035a2006-05-31 18:28:01 +09001244
1245 dev->flags &= ~ATA_DFLAG_DETACH;
1246
1247 if (ata_scsi_offline_dev(dev)) {
1248 dev->flags |= ATA_DFLAG_DETACHED;
Tejun Heob51e9e52006-06-29 01:29:30 +09001249 ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG;
Tejun Heo0ea035a2006-05-31 18:28:01 +09001250 }
1251
Tejun Heo90484eb2008-10-26 15:43:03 +09001252 /* clear per-dev EH info */
Tejun Heof58229f2007-08-06 18:36:23 +09001253 ata_eh_clear_action(link, dev, &link->eh_info, ATA_EH_PERDEV_MASK);
1254 ata_eh_clear_action(link, dev, &link->eh_context.i, ATA_EH_PERDEV_MASK);
Tejun Heo90484eb2008-10-26 15:43:03 +09001255 ehc->saved_xfer_mode[dev->devno] = 0;
1256 ehc->saved_ncq_enabled &= ~(1 << dev->devno);
Tejun Heobeb07c12006-06-24 20:30:19 +09001257
Jeff Garzikba6a1302006-06-22 23:46:10 -04001258 spin_unlock_irqrestore(ap->lock, flags);
Tejun Heo0ea035a2006-05-31 18:28:01 +09001259}
1260
1261/**
Tejun Heo022bdb02006-05-15 20:58:22 +09001262 * ata_eh_about_to_do - about to perform eh_action
Tejun Heo955e57d2007-08-06 18:36:23 +09001263 * @link: target ATA link
Tejun Heo47005f22006-06-19 18:27:23 +09001264 * @dev: target ATA dev for per-dev action (can be NULL)
Tejun Heo022bdb02006-05-15 20:58:22 +09001265 * @action: action about to be performed
1266 *
1267 * Called just before performing EH actions to clear related bits
Tejun Heo955e57d2007-08-06 18:36:23 +09001268 * in @link->eh_info such that eh actions are not unnecessarily
1269 * repeated.
Tejun Heo022bdb02006-05-15 20:58:22 +09001270 *
1271 * LOCKING:
1272 * None.
1273 */
Tejun Heofb7fd612007-09-23 13:14:12 +09001274void ata_eh_about_to_do(struct ata_link *link, struct ata_device *dev,
1275 unsigned int action)
Tejun Heo022bdb02006-05-15 20:58:22 +09001276{
Tejun Heo955e57d2007-08-06 18:36:23 +09001277 struct ata_port *ap = link->ap;
1278 struct ata_eh_info *ehi = &link->eh_info;
1279 struct ata_eh_context *ehc = &link->eh_context;
Tejun Heo022bdb02006-05-15 20:58:22 +09001280 unsigned long flags;
1281
Jeff Garzikba6a1302006-06-22 23:46:10 -04001282 spin_lock_irqsave(ap->lock, flags);
Tejun Heo1cdaf532006-07-03 16:07:26 +09001283
Tejun Heo955e57d2007-08-06 18:36:23 +09001284 ata_eh_clear_action(link, dev, ehi, action);
Tejun Heo13abf502006-07-10 23:18:46 +09001285
Tejun Heoa568d1d2008-10-21 20:37:21 +09001286 /* About to take EH action, set RECOVERED. Ignore actions on
1287 * slave links as master will do them again.
1288 */
1289 if (!(ehc->i.flags & ATA_EHI_QUIET) && link != ap->slave_link)
Tejun Heo1cdaf532006-07-03 16:07:26 +09001290 ap->pflags |= ATA_PFLAG_RECOVERED;
1291
Jeff Garzikba6a1302006-06-22 23:46:10 -04001292 spin_unlock_irqrestore(ap->lock, flags);
Tejun Heo022bdb02006-05-15 20:58:22 +09001293}
1294
1295/**
Tejun Heo47005f22006-06-19 18:27:23 +09001296 * ata_eh_done - EH action complete
Tejun Heo955e57d2007-08-06 18:36:23 +09001297* @ap: target ATA port
Tejun Heo47005f22006-06-19 18:27:23 +09001298 * @dev: target ATA dev for per-dev action (can be NULL)
1299 * @action: action just completed
1300 *
1301 * Called right after performing EH actions to clear related bits
Tejun Heo955e57d2007-08-06 18:36:23 +09001302 * in @link->eh_context.
Tejun Heo47005f22006-06-19 18:27:23 +09001303 *
1304 * LOCKING:
1305 * None.
1306 */
Tejun Heofb7fd612007-09-23 13:14:12 +09001307void ata_eh_done(struct ata_link *link, struct ata_device *dev,
1308 unsigned int action)
Tejun Heo47005f22006-06-19 18:27:23 +09001309{
Tejun Heo955e57d2007-08-06 18:36:23 +09001310 struct ata_eh_context *ehc = &link->eh_context;
Tejun Heo9af5c9c2007-08-06 18:36:22 +09001311
Tejun Heo955e57d2007-08-06 18:36:23 +09001312 ata_eh_clear_action(link, dev, &ehc->i, action);
Tejun Heo47005f22006-06-19 18:27:23 +09001313}
1314
1315/**
Tejun Heo022bdb02006-05-15 20:58:22 +09001316 * ata_err_string - convert err_mask to descriptive string
1317 * @err_mask: error mask to convert to string
1318 *
1319 * Convert @err_mask to descriptive string. Errors are
1320 * prioritized according to severity and only the most severe
1321 * error is reported.
1322 *
1323 * LOCKING:
1324 * None.
1325 *
1326 * RETURNS:
1327 * Descriptive string for @err_mask
1328 */
Jeff Garzik2dcb4072007-10-19 06:42:56 -04001329static const char *ata_err_string(unsigned int err_mask)
Tejun Heo022bdb02006-05-15 20:58:22 +09001330{
1331 if (err_mask & AC_ERR_HOST_BUS)
1332 return "host bus error";
1333 if (err_mask & AC_ERR_ATA_BUS)
1334 return "ATA bus error";
1335 if (err_mask & AC_ERR_TIMEOUT)
1336 return "timeout";
1337 if (err_mask & AC_ERR_HSM)
1338 return "HSM violation";
1339 if (err_mask & AC_ERR_SYSTEM)
1340 return "internal error";
1341 if (err_mask & AC_ERR_MEDIA)
1342 return "media error";
1343 if (err_mask & AC_ERR_INVALID)
1344 return "invalid argument";
1345 if (err_mask & AC_ERR_DEV)
1346 return "device error";
1347 return "unknown error";
1348}
1349
1350/**
Tejun Heoe8ee8452006-05-15 21:03:46 +09001351 * ata_read_log_page - read a specific log page
1352 * @dev: target device
1353 * @page: page to read
1354 * @buf: buffer to store read page
1355 * @sectors: number of sectors to read
1356 *
1357 * Read log page using READ_LOG_EXT command.
1358 *
1359 * LOCKING:
1360 * Kernel thread context (may sleep).
1361 *
1362 * RETURNS:
1363 * 0 on success, AC_ERR_* mask otherwise.
1364 */
1365static unsigned int ata_read_log_page(struct ata_device *dev,
1366 u8 page, void *buf, unsigned int sectors)
1367{
1368 struct ata_taskfile tf;
1369 unsigned int err_mask;
1370
1371 DPRINTK("read log page - page %d\n", page);
1372
1373 ata_tf_init(dev, &tf);
1374 tf.command = ATA_CMD_READ_LOG_EXT;
1375 tf.lbal = page;
1376 tf.nsect = sectors;
1377 tf.hob_nsect = sectors >> 8;
1378 tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_LBA48 | ATA_TFLAG_DEVICE;
1379 tf.protocol = ATA_PROT_PIO;
1380
1381 err_mask = ata_exec_internal(dev, &tf, NULL, DMA_FROM_DEVICE,
Tejun Heo2b789102007-10-09 15:05:44 +09001382 buf, sectors * ATA_SECT_SIZE, 0);
Tejun Heoe8ee8452006-05-15 21:03:46 +09001383
1384 DPRINTK("EXIT, err_mask=%x\n", err_mask);
1385 return err_mask;
1386}
1387
1388/**
1389 * ata_eh_read_log_10h - Read log page 10h for NCQ error details
1390 * @dev: Device to read log page 10h from
1391 * @tag: Resulting tag of the failed command
1392 * @tf: Resulting taskfile registers of the failed command
1393 *
1394 * Read log page 10h to obtain NCQ error details and clear error
1395 * condition.
1396 *
1397 * LOCKING:
1398 * Kernel thread context (may sleep).
1399 *
1400 * RETURNS:
1401 * 0 on success, -errno otherwise.
1402 */
1403static int ata_eh_read_log_10h(struct ata_device *dev,
1404 int *tag, struct ata_taskfile *tf)
1405{
Tejun Heo9af5c9c2007-08-06 18:36:22 +09001406 u8 *buf = dev->link->ap->sector_buf;
Tejun Heoe8ee8452006-05-15 21:03:46 +09001407 unsigned int err_mask;
1408 u8 csum;
1409 int i;
1410
1411 err_mask = ata_read_log_page(dev, ATA_LOG_SATA_NCQ, buf, 1);
1412 if (err_mask)
1413 return -EIO;
1414
1415 csum = 0;
1416 for (i = 0; i < ATA_SECT_SIZE; i++)
1417 csum += buf[i];
1418 if (csum)
1419 ata_dev_printk(dev, KERN_WARNING,
1420 "invalid checksum 0x%x on log page 10h\n", csum);
1421
1422 if (buf[0] & 0x80)
1423 return -ENOENT;
1424
1425 *tag = buf[0] & 0x1f;
1426
1427 tf->command = buf[2];
1428 tf->feature = buf[3];
1429 tf->lbal = buf[4];
1430 tf->lbam = buf[5];
1431 tf->lbah = buf[6];
1432 tf->device = buf[7];
1433 tf->hob_lbal = buf[8];
1434 tf->hob_lbam = buf[9];
1435 tf->hob_lbah = buf[10];
1436 tf->nsect = buf[12];
1437 tf->hob_nsect = buf[13];
1438
1439 return 0;
1440}
1441
1442/**
Tejun Heo11fc33d2008-08-30 14:20:01 +02001443 * atapi_eh_tur - perform ATAPI TEST_UNIT_READY
1444 * @dev: target ATAPI device
1445 * @r_sense_key: out parameter for sense_key
1446 *
1447 * Perform ATAPI TEST_UNIT_READY.
1448 *
1449 * LOCKING:
1450 * EH context (may sleep).
1451 *
1452 * RETURNS:
1453 * 0 on success, AC_ERR_* mask on failure.
1454 */
1455static unsigned int atapi_eh_tur(struct ata_device *dev, u8 *r_sense_key)
1456{
1457 u8 cdb[ATAPI_CDB_LEN] = { TEST_UNIT_READY, 0, 0, 0, 0, 0 };
1458 struct ata_taskfile tf;
1459 unsigned int err_mask;
1460
1461 ata_tf_init(dev, &tf);
1462
1463 tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE;
1464 tf.command = ATA_CMD_PACKET;
1465 tf.protocol = ATAPI_PROT_NODATA;
1466
1467 err_mask = ata_exec_internal(dev, &tf, cdb, DMA_NONE, NULL, 0, 0);
1468 if (err_mask == AC_ERR_DEV)
1469 *r_sense_key = tf.feature >> 4;
1470 return err_mask;
1471}
1472
1473/**
Tejun Heo022bdb02006-05-15 20:58:22 +09001474 * atapi_eh_request_sense - perform ATAPI REQUEST_SENSE
1475 * @dev: device to perform REQUEST_SENSE to
1476 * @sense_buf: result sense data buffer (SCSI_SENSE_BUFFERSIZE bytes long)
Tejun Heo3eabddb2008-06-10 18:28:05 +09001477 * @dfl_sense_key: default sense key to use
Tejun Heo022bdb02006-05-15 20:58:22 +09001478 *
1479 * Perform ATAPI REQUEST_SENSE after the device reported CHECK
1480 * SENSE. This function is EH helper.
1481 *
1482 * LOCKING:
1483 * Kernel thread context (may sleep).
1484 *
1485 * RETURNS:
1486 * 0 on success, AC_ERR_* mask on failure
1487 */
Tejun Heo3eabddb2008-06-10 18:28:05 +09001488static unsigned int atapi_eh_request_sense(struct ata_device *dev,
1489 u8 *sense_buf, u8 dfl_sense_key)
Tejun Heo022bdb02006-05-15 20:58:22 +09001490{
Tejun Heo3eabddb2008-06-10 18:28:05 +09001491 u8 cdb[ATAPI_CDB_LEN] =
1492 { REQUEST_SENSE, 0, 0, 0, SCSI_SENSE_BUFFERSIZE, 0 };
Tejun Heo9af5c9c2007-08-06 18:36:22 +09001493 struct ata_port *ap = dev->link->ap;
Tejun Heo022bdb02006-05-15 20:58:22 +09001494 struct ata_taskfile tf;
Tejun Heo022bdb02006-05-15 20:58:22 +09001495
1496 DPRINTK("ATAPI request sense\n");
1497
Tejun Heo022bdb02006-05-15 20:58:22 +09001498 /* FIXME: is this needed? */
1499 memset(sense_buf, 0, SCSI_SENSE_BUFFERSIZE);
1500
Albert Lee56287762007-04-02 11:30:46 +08001501 /* initialize sense_buf with the error register,
1502 * for the case where they are -not- overwritten
1503 */
Tejun Heo022bdb02006-05-15 20:58:22 +09001504 sense_buf[0] = 0x70;
Tejun Heo3eabddb2008-06-10 18:28:05 +09001505 sense_buf[2] = dfl_sense_key;
Albert Lee56287762007-04-02 11:30:46 +08001506
Jeff Garzika617c092007-05-21 20:14:23 -04001507 /* some devices time out if garbage left in tf */
Albert Lee56287762007-04-02 11:30:46 +08001508 ata_tf_init(dev, &tf);
Tejun Heo022bdb02006-05-15 20:58:22 +09001509
Tejun Heo022bdb02006-05-15 20:58:22 +09001510 tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE;
1511 tf.command = ATA_CMD_PACKET;
1512
1513 /* is it pointless to prefer PIO for "safety reasons"? */
1514 if (ap->flags & ATA_FLAG_PIO_DMA) {
Tejun Heo0dc36882007-12-18 16:34:43 -05001515 tf.protocol = ATAPI_PROT_DMA;
Tejun Heo022bdb02006-05-15 20:58:22 +09001516 tf.feature |= ATAPI_PKT_DMA;
1517 } else {
Tejun Heo0dc36882007-12-18 16:34:43 -05001518 tf.protocol = ATAPI_PROT_PIO;
Tejun Heof2dfc1a2007-12-12 12:12:46 +09001519 tf.lbam = SCSI_SENSE_BUFFERSIZE;
1520 tf.lbah = 0;
Tejun Heo022bdb02006-05-15 20:58:22 +09001521 }
1522
1523 return ata_exec_internal(dev, &tf, cdb, DMA_FROM_DEVICE,
Tejun Heo2b789102007-10-09 15:05:44 +09001524 sense_buf, SCSI_SENSE_BUFFERSIZE, 0);
Tejun Heo022bdb02006-05-15 20:58:22 +09001525}
1526
1527/**
1528 * ata_eh_analyze_serror - analyze SError for a failed port
Tejun Heo02607312007-08-06 18:36:23 +09001529 * @link: ATA link to analyze SError for
Tejun Heo022bdb02006-05-15 20:58:22 +09001530 *
1531 * Analyze SError if available and further determine cause of
1532 * failure.
1533 *
1534 * LOCKING:
1535 * None.
1536 */
Tejun Heo02607312007-08-06 18:36:23 +09001537static void ata_eh_analyze_serror(struct ata_link *link)
Tejun Heo022bdb02006-05-15 20:58:22 +09001538{
Tejun Heo02607312007-08-06 18:36:23 +09001539 struct ata_eh_context *ehc = &link->eh_context;
Tejun Heo022bdb02006-05-15 20:58:22 +09001540 u32 serror = ehc->i.serror;
1541 unsigned int err_mask = 0, action = 0;
Tejun Heof9df58c2007-09-23 13:14:13 +09001542 u32 hotplug_mask;
Tejun Heo022bdb02006-05-15 20:58:22 +09001543
Tejun Heoe0614db2008-05-19 01:15:09 +09001544 if (serror & (SERR_PERSISTENT | SERR_DATA)) {
Tejun Heo022bdb02006-05-15 20:58:22 +09001545 err_mask |= AC_ERR_ATA_BUS;
Tejun Heocf480622008-01-24 00:05:14 +09001546 action |= ATA_EH_RESET;
Tejun Heo022bdb02006-05-15 20:58:22 +09001547 }
1548 if (serror & SERR_PROTOCOL) {
1549 err_mask |= AC_ERR_HSM;
Tejun Heocf480622008-01-24 00:05:14 +09001550 action |= ATA_EH_RESET;
Tejun Heo022bdb02006-05-15 20:58:22 +09001551 }
1552 if (serror & SERR_INTERNAL) {
1553 err_mask |= AC_ERR_SYSTEM;
Tejun Heocf480622008-01-24 00:05:14 +09001554 action |= ATA_EH_RESET;
Tejun Heo022bdb02006-05-15 20:58:22 +09001555 }
Tejun Heof9df58c2007-09-23 13:14:13 +09001556
1557 /* Determine whether a hotplug event has occurred. Both
1558 * SError.N/X are considered hotplug events for enabled or
1559 * host links. For disabled PMP links, only N bit is
1560 * considered as X bit is left at 1 for link plugging.
1561 */
1562 hotplug_mask = 0;
1563
1564 if (!(link->flags & ATA_LFLAG_DISABLED) || ata_is_host_link(link))
1565 hotplug_mask = SERR_PHYRDY_CHG | SERR_DEV_XCHG;
1566 else
1567 hotplug_mask = SERR_PHYRDY_CHG;
1568
1569 if (serror & hotplug_mask)
Tejun Heo084fe632006-05-31 18:28:03 +09001570 ata_ehi_hotplugged(&ehc->i);
Tejun Heo022bdb02006-05-15 20:58:22 +09001571
1572 ehc->i.err_mask |= err_mask;
1573 ehc->i.action |= action;
1574}
1575
1576/**
Tejun Heoe8ee8452006-05-15 21:03:46 +09001577 * ata_eh_analyze_ncq_error - analyze NCQ error
Tejun Heo02607312007-08-06 18:36:23 +09001578 * @link: ATA link to analyze NCQ error for
Tejun Heoe8ee8452006-05-15 21:03:46 +09001579 *
1580 * Read log page 10h, determine the offending qc and acquire
1581 * error status TF. For NCQ device errors, all LLDDs have to do
1582 * is setting AC_ERR_DEV in ehi->err_mask. This function takes
1583 * care of the rest.
1584 *
1585 * LOCKING:
1586 * Kernel thread context (may sleep).
1587 */
Mark Lord10acf3b2008-05-02 02:14:53 -04001588void ata_eh_analyze_ncq_error(struct ata_link *link)
Tejun Heoe8ee8452006-05-15 21:03:46 +09001589{
Tejun Heo02607312007-08-06 18:36:23 +09001590 struct ata_port *ap = link->ap;
1591 struct ata_eh_context *ehc = &link->eh_context;
1592 struct ata_device *dev = link->device;
Tejun Heoe8ee8452006-05-15 21:03:46 +09001593 struct ata_queued_cmd *qc;
1594 struct ata_taskfile tf;
1595 int tag, rc;
1596
1597 /* if frozen, we can't do much */
Tejun Heob51e9e52006-06-29 01:29:30 +09001598 if (ap->pflags & ATA_PFLAG_FROZEN)
Tejun Heoe8ee8452006-05-15 21:03:46 +09001599 return;
1600
1601 /* is it NCQ device error? */
Tejun Heo02607312007-08-06 18:36:23 +09001602 if (!link->sactive || !(ehc->i.err_mask & AC_ERR_DEV))
Tejun Heoe8ee8452006-05-15 21:03:46 +09001603 return;
1604
1605 /* has LLDD analyzed already? */
1606 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) {
1607 qc = __ata_qc_from_tag(ap, tag);
1608
1609 if (!(qc->flags & ATA_QCFLAG_FAILED))
1610 continue;
1611
1612 if (qc->err_mask)
1613 return;
1614 }
1615
1616 /* okay, this error is ours */
1617 rc = ata_eh_read_log_10h(dev, &tag, &tf);
1618 if (rc) {
Tejun Heo02607312007-08-06 18:36:23 +09001619 ata_link_printk(link, KERN_ERR, "failed to read log page 10h "
Tejun Heoe8ee8452006-05-15 21:03:46 +09001620 "(errno=%d)\n", rc);
1621 return;
1622 }
1623
Tejun Heo02607312007-08-06 18:36:23 +09001624 if (!(link->sactive & (1 << tag))) {
1625 ata_link_printk(link, KERN_ERR, "log page 10h reported "
Tejun Heoe8ee8452006-05-15 21:03:46 +09001626 "inactive tag %d\n", tag);
1627 return;
1628 }
1629
1630 /* we've got the perpetrator, condemn it */
1631 qc = __ata_qc_from_tag(ap, tag);
1632 memcpy(&qc->result_tf, &tf, sizeof(tf));
Mark Lorda6116c92008-04-23 22:36:25 -04001633 qc->result_tf.flags = ATA_TFLAG_ISADDR | ATA_TFLAG_LBA | ATA_TFLAG_LBA48;
Tejun Heo5335b722007-07-16 14:29:40 +09001634 qc->err_mask |= AC_ERR_DEV | AC_ERR_NCQ;
Tejun Heoe8ee8452006-05-15 21:03:46 +09001635 ehc->i.err_mask &= ~AC_ERR_DEV;
1636}
1637
1638/**
Tejun Heo022bdb02006-05-15 20:58:22 +09001639 * ata_eh_analyze_tf - analyze taskfile of a failed qc
1640 * @qc: qc to analyze
1641 * @tf: Taskfile registers to analyze
1642 *
1643 * Analyze taskfile of @qc and further determine cause of
1644 * failure. This function also requests ATAPI sense data if
1645 * avaliable.
1646 *
1647 * LOCKING:
1648 * Kernel thread context (may sleep).
1649 *
1650 * RETURNS:
1651 * Determined recovery action
1652 */
1653static unsigned int ata_eh_analyze_tf(struct ata_queued_cmd *qc,
1654 const struct ata_taskfile *tf)
1655{
1656 unsigned int tmp, action = 0;
1657 u8 stat = tf->command, err = tf->feature;
1658
1659 if ((stat & (ATA_BUSY | ATA_DRQ | ATA_DRDY)) != ATA_DRDY) {
1660 qc->err_mask |= AC_ERR_HSM;
Tejun Heocf480622008-01-24 00:05:14 +09001661 return ATA_EH_RESET;
Tejun Heo022bdb02006-05-15 20:58:22 +09001662 }
1663
Tejun Heoa51d6442007-03-20 15:24:11 +09001664 if (stat & (ATA_ERR | ATA_DF))
1665 qc->err_mask |= AC_ERR_DEV;
1666 else
Tejun Heo022bdb02006-05-15 20:58:22 +09001667 return 0;
1668
1669 switch (qc->dev->class) {
1670 case ATA_DEV_ATA:
1671 if (err & ATA_ICRC)
1672 qc->err_mask |= AC_ERR_ATA_BUS;
1673 if (err & ATA_UNC)
1674 qc->err_mask |= AC_ERR_MEDIA;
1675 if (err & ATA_IDNF)
1676 qc->err_mask |= AC_ERR_INVALID;
1677 break;
1678
1679 case ATA_DEV_ATAPI:
Tejun Heoa569a302006-11-21 10:40:51 +09001680 if (!(qc->ap->pflags & ATA_PFLAG_FROZEN)) {
Tejun Heo3eabddb2008-06-10 18:28:05 +09001681 tmp = atapi_eh_request_sense(qc->dev,
1682 qc->scsicmd->sense_buffer,
1683 qc->result_tf.feature >> 4);
Tejun Heoa569a302006-11-21 10:40:51 +09001684 if (!tmp) {
1685 /* ATA_QCFLAG_SENSE_VALID is used to
1686 * tell atapi_qc_complete() that sense
1687 * data is already valid.
1688 *
1689 * TODO: interpret sense data and set
1690 * appropriate err_mask.
1691 */
1692 qc->flags |= ATA_QCFLAG_SENSE_VALID;
1693 } else
1694 qc->err_mask |= tmp;
1695 }
Tejun Heo022bdb02006-05-15 20:58:22 +09001696 }
1697
1698 if (qc->err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT | AC_ERR_ATA_BUS))
Tejun Heocf480622008-01-24 00:05:14 +09001699 action |= ATA_EH_RESET;
Tejun Heo022bdb02006-05-15 20:58:22 +09001700
1701 return action;
1702}
1703
Tejun Heo76326ac2007-11-27 19:28:59 +09001704static int ata_eh_categorize_error(unsigned int eflags, unsigned int err_mask,
1705 int *xfer_ok)
Tejun Heo022bdb02006-05-15 20:58:22 +09001706{
Tejun Heo76326ac2007-11-27 19:28:59 +09001707 int base = 0;
1708
1709 if (!(eflags & ATA_EFLAG_DUBIOUS_XFER))
1710 *xfer_ok = 1;
1711
1712 if (!*xfer_ok)
Tejun Heo75f9caf2008-01-03 01:21:14 +09001713 base = ATA_ECAT_DUBIOUS_NONE;
Tejun Heo76326ac2007-11-27 19:28:59 +09001714
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001715 if (err_mask & AC_ERR_ATA_BUS)
Tejun Heo76326ac2007-11-27 19:28:59 +09001716 return base + ATA_ECAT_ATA_BUS;
Tejun Heo022bdb02006-05-15 20:58:22 +09001717
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001718 if (err_mask & AC_ERR_TIMEOUT)
Tejun Heo76326ac2007-11-27 19:28:59 +09001719 return base + ATA_ECAT_TOUT_HSM;
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001720
Tejun Heo3884f7b2007-11-27 19:28:56 +09001721 if (eflags & ATA_EFLAG_IS_IO) {
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001722 if (err_mask & AC_ERR_HSM)
Tejun Heo76326ac2007-11-27 19:28:59 +09001723 return base + ATA_ECAT_TOUT_HSM;
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001724 if ((err_mask &
1725 (AC_ERR_DEV|AC_ERR_MEDIA|AC_ERR_INVALID)) == AC_ERR_DEV)
Tejun Heo76326ac2007-11-27 19:28:59 +09001726 return base + ATA_ECAT_UNK_DEV;
Tejun Heo022bdb02006-05-15 20:58:22 +09001727 }
1728
1729 return 0;
1730}
1731
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001732struct speed_down_verdict_arg {
Tejun Heo022bdb02006-05-15 20:58:22 +09001733 u64 since;
Tejun Heo76326ac2007-11-27 19:28:59 +09001734 int xfer_ok;
Tejun Heo3884f7b2007-11-27 19:28:56 +09001735 int nr_errors[ATA_ECAT_NR];
Tejun Heo022bdb02006-05-15 20:58:22 +09001736};
1737
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001738static int speed_down_verdict_cb(struct ata_ering_entry *ent, void *void_arg)
Tejun Heo022bdb02006-05-15 20:58:22 +09001739{
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001740 struct speed_down_verdict_arg *arg = void_arg;
Tejun Heo76326ac2007-11-27 19:28:59 +09001741 int cat;
Tejun Heo022bdb02006-05-15 20:58:22 +09001742
1743 if (ent->timestamp < arg->since)
1744 return -1;
1745
Tejun Heo76326ac2007-11-27 19:28:59 +09001746 cat = ata_eh_categorize_error(ent->eflags, ent->err_mask,
1747 &arg->xfer_ok);
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001748 arg->nr_errors[cat]++;
Tejun Heo76326ac2007-11-27 19:28:59 +09001749
Tejun Heo022bdb02006-05-15 20:58:22 +09001750 return 0;
1751}
1752
1753/**
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001754 * ata_eh_speed_down_verdict - Determine speed down verdict
Tejun Heo022bdb02006-05-15 20:58:22 +09001755 * @dev: Device of interest
1756 *
1757 * This function examines error ring of @dev and determines
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001758 * whether NCQ needs to be turned off, transfer speed should be
1759 * stepped down, or falling back to PIO is necessary.
Tejun Heo022bdb02006-05-15 20:58:22 +09001760 *
Tejun Heo3884f7b2007-11-27 19:28:56 +09001761 * ECAT_ATA_BUS : ATA_BUS error for any command
Tejun Heo022bdb02006-05-15 20:58:22 +09001762 *
Tejun Heo3884f7b2007-11-27 19:28:56 +09001763 * ECAT_TOUT_HSM : TIMEOUT for any command or HSM violation for
1764 * IO commands
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001765 *
Tejun Heo3884f7b2007-11-27 19:28:56 +09001766 * ECAT_UNK_DEV : Unknown DEV error for IO commands
Tejun Heo022bdb02006-05-15 20:58:22 +09001767 *
Tejun Heo76326ac2007-11-27 19:28:59 +09001768 * ECAT_DUBIOUS_* : Identical to above three but occurred while
1769 * data transfer hasn't been verified.
1770 *
Tejun Heo3884f7b2007-11-27 19:28:56 +09001771 * Verdicts are
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001772 *
Tejun Heo3884f7b2007-11-27 19:28:56 +09001773 * NCQ_OFF : Turn off NCQ.
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001774 *
Tejun Heo3884f7b2007-11-27 19:28:56 +09001775 * SPEED_DOWN : Speed down transfer speed but don't fall back
1776 * to PIO.
1777 *
1778 * FALLBACK_TO_PIO : Fall back to PIO.
1779 *
1780 * Even if multiple verdicts are returned, only one action is
Tejun Heo76326ac2007-11-27 19:28:59 +09001781 * taken per error. An action triggered by non-DUBIOUS errors
1782 * clears ering, while one triggered by DUBIOUS_* errors doesn't.
1783 * This is to expedite speed down decisions right after device is
1784 * initially configured.
Tejun Heo3884f7b2007-11-27 19:28:56 +09001785 *
Tejun Heo76326ac2007-11-27 19:28:59 +09001786 * The followings are speed down rules. #1 and #2 deal with
1787 * DUBIOUS errors.
1788 *
1789 * 1. If more than one DUBIOUS_ATA_BUS or DUBIOUS_TOUT_HSM errors
1790 * occurred during last 5 mins, SPEED_DOWN and FALLBACK_TO_PIO.
1791 *
1792 * 2. If more than one DUBIOUS_TOUT_HSM or DUBIOUS_UNK_DEV errors
1793 * occurred during last 5 mins, NCQ_OFF.
1794 *
1795 * 3. If more than 8 ATA_BUS, TOUT_HSM or UNK_DEV errors
Tejun Heo3884f7b2007-11-27 19:28:56 +09001796 * ocurred during last 5 mins, FALLBACK_TO_PIO
1797 *
Tejun Heo76326ac2007-11-27 19:28:59 +09001798 * 4. If more than 3 TOUT_HSM or UNK_DEV errors occurred
Tejun Heo3884f7b2007-11-27 19:28:56 +09001799 * during last 10 mins, NCQ_OFF.
1800 *
Tejun Heo76326ac2007-11-27 19:28:59 +09001801 * 5. If more than 3 ATA_BUS or TOUT_HSM errors, or more than 6
Tejun Heo3884f7b2007-11-27 19:28:56 +09001802 * UNK_DEV errors occurred during last 10 mins, SPEED_DOWN.
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001803 *
Tejun Heo022bdb02006-05-15 20:58:22 +09001804 * LOCKING:
1805 * Inherited from caller.
1806 *
1807 * RETURNS:
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001808 * OR of ATA_EH_SPDN_* flags.
Tejun Heo022bdb02006-05-15 20:58:22 +09001809 */
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001810static unsigned int ata_eh_speed_down_verdict(struct ata_device *dev)
Tejun Heo022bdb02006-05-15 20:58:22 +09001811{
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001812 const u64 j5mins = 5LLU * 60 * HZ, j10mins = 10LLU * 60 * HZ;
1813 u64 j64 = get_jiffies_64();
1814 struct speed_down_verdict_arg arg;
1815 unsigned int verdict = 0;
Tejun Heo022bdb02006-05-15 20:58:22 +09001816
Tejun Heo3884f7b2007-11-27 19:28:56 +09001817 /* scan past 5 mins of error history */
1818 memset(&arg, 0, sizeof(arg));
1819 arg.since = j64 - min(j64, j5mins);
1820 ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg);
1821
Tejun Heo76326ac2007-11-27 19:28:59 +09001822 if (arg.nr_errors[ATA_ECAT_DUBIOUS_ATA_BUS] +
1823 arg.nr_errors[ATA_ECAT_DUBIOUS_TOUT_HSM] > 1)
1824 verdict |= ATA_EH_SPDN_SPEED_DOWN |
1825 ATA_EH_SPDN_FALLBACK_TO_PIO | ATA_EH_SPDN_KEEP_ERRORS;
1826
1827 if (arg.nr_errors[ATA_ECAT_DUBIOUS_TOUT_HSM] +
1828 arg.nr_errors[ATA_ECAT_DUBIOUS_UNK_DEV] > 1)
1829 verdict |= ATA_EH_SPDN_NCQ_OFF | ATA_EH_SPDN_KEEP_ERRORS;
1830
Tejun Heo3884f7b2007-11-27 19:28:56 +09001831 if (arg.nr_errors[ATA_ECAT_ATA_BUS] +
1832 arg.nr_errors[ATA_ECAT_TOUT_HSM] +
Tejun Heo663f99b2007-11-27 19:28:57 +09001833 arg.nr_errors[ATA_ECAT_UNK_DEV] > 6)
Tejun Heo3884f7b2007-11-27 19:28:56 +09001834 verdict |= ATA_EH_SPDN_FALLBACK_TO_PIO;
1835
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001836 /* scan past 10 mins of error history */
Tejun Heo022bdb02006-05-15 20:58:22 +09001837 memset(&arg, 0, sizeof(arg));
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001838 arg.since = j64 - min(j64, j10mins);
1839 ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg);
Tejun Heo022bdb02006-05-15 20:58:22 +09001840
Tejun Heo3884f7b2007-11-27 19:28:56 +09001841 if (arg.nr_errors[ATA_ECAT_TOUT_HSM] +
1842 arg.nr_errors[ATA_ECAT_UNK_DEV] > 3)
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001843 verdict |= ATA_EH_SPDN_NCQ_OFF;
Tejun Heo3884f7b2007-11-27 19:28:56 +09001844
1845 if (arg.nr_errors[ATA_ECAT_ATA_BUS] +
1846 arg.nr_errors[ATA_ECAT_TOUT_HSM] > 3 ||
Tejun Heo663f99b2007-11-27 19:28:57 +09001847 arg.nr_errors[ATA_ECAT_UNK_DEV] > 6)
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001848 verdict |= ATA_EH_SPDN_SPEED_DOWN;
Tejun Heo022bdb02006-05-15 20:58:22 +09001849
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001850 return verdict;
Tejun Heo022bdb02006-05-15 20:58:22 +09001851}
1852
1853/**
1854 * ata_eh_speed_down - record error and speed down if necessary
1855 * @dev: Failed device
Tejun Heo3884f7b2007-11-27 19:28:56 +09001856 * @eflags: mask of ATA_EFLAG_* flags
Tejun Heo022bdb02006-05-15 20:58:22 +09001857 * @err_mask: err_mask of the error
1858 *
1859 * Record error and examine error history to determine whether
1860 * adjusting transmission speed is necessary. It also sets
1861 * transmission limits appropriately if such adjustment is
1862 * necessary.
1863 *
1864 * LOCKING:
1865 * Kernel thread context (may sleep).
1866 *
1867 * RETURNS:
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001868 * Determined recovery action.
Tejun Heo022bdb02006-05-15 20:58:22 +09001869 */
Tejun Heo3884f7b2007-11-27 19:28:56 +09001870static unsigned int ata_eh_speed_down(struct ata_device *dev,
1871 unsigned int eflags, unsigned int err_mask)
Tejun Heo022bdb02006-05-15 20:58:22 +09001872{
Tejun Heob1c72912008-07-31 17:02:43 +09001873 struct ata_link *link = ata_dev_phys_link(dev);
Tejun Heo76326ac2007-11-27 19:28:59 +09001874 int xfer_ok = 0;
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001875 unsigned int verdict;
1876 unsigned int action = 0;
1877
1878 /* don't bother if Cat-0 error */
Tejun Heo76326ac2007-11-27 19:28:59 +09001879 if (ata_eh_categorize_error(eflags, err_mask, &xfer_ok) == 0)
Tejun Heo022bdb02006-05-15 20:58:22 +09001880 return 0;
1881
1882 /* record error and determine whether speed down is necessary */
Tejun Heo3884f7b2007-11-27 19:28:56 +09001883 ata_ering_record(&dev->ering, eflags, err_mask);
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001884 verdict = ata_eh_speed_down_verdict(dev);
Tejun Heo022bdb02006-05-15 20:58:22 +09001885
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001886 /* turn off NCQ? */
1887 if ((verdict & ATA_EH_SPDN_NCQ_OFF) &&
1888 (dev->flags & (ATA_DFLAG_PIO | ATA_DFLAG_NCQ |
1889 ATA_DFLAG_NCQ_OFF)) == ATA_DFLAG_NCQ) {
1890 dev->flags |= ATA_DFLAG_NCQ_OFF;
1891 ata_dev_printk(dev, KERN_WARNING,
1892 "NCQ disabled due to excessive errors\n");
1893 goto done;
1894 }
Tejun Heo022bdb02006-05-15 20:58:22 +09001895
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001896 /* speed down? */
1897 if (verdict & ATA_EH_SPDN_SPEED_DOWN) {
1898 /* speed down SATA link speed if possible */
Tejun Heoa07d4992009-01-29 20:31:33 +09001899 if (sata_down_spd_limit(link, 0) == 0) {
Tejun Heocf480622008-01-24 00:05:14 +09001900 action |= ATA_EH_RESET;
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001901 goto done;
1902 }
Tejun Heo022bdb02006-05-15 20:58:22 +09001903
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001904 /* lower transfer mode */
1905 if (dev->spdn_cnt < 2) {
1906 static const int dma_dnxfer_sel[] =
1907 { ATA_DNXFER_DMA, ATA_DNXFER_40C };
1908 static const int pio_dnxfer_sel[] =
1909 { ATA_DNXFER_PIO, ATA_DNXFER_FORCE_PIO0 };
1910 int sel;
Tejun Heo022bdb02006-05-15 20:58:22 +09001911
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001912 if (dev->xfer_shift != ATA_SHIFT_PIO)
1913 sel = dma_dnxfer_sel[dev->spdn_cnt];
1914 else
1915 sel = pio_dnxfer_sel[dev->spdn_cnt];
1916
1917 dev->spdn_cnt++;
1918
1919 if (ata_down_xfermask_limit(dev, sel) == 0) {
Tejun Heocf480622008-01-24 00:05:14 +09001920 action |= ATA_EH_RESET;
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001921 goto done;
1922 }
1923 }
1924 }
1925
1926 /* Fall back to PIO? Slowing down to PIO is meaningless for
Tejun Heo663f99b2007-11-27 19:28:57 +09001927 * SATA ATA devices. Consider it only for PATA and SATAPI.
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001928 */
1929 if ((verdict & ATA_EH_SPDN_FALLBACK_TO_PIO) && (dev->spdn_cnt >= 2) &&
Tejun Heo663f99b2007-11-27 19:28:57 +09001930 (link->ap->cbl != ATA_CBL_SATA || dev->class == ATA_DEV_ATAPI) &&
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001931 (dev->xfer_shift != ATA_SHIFT_PIO)) {
1932 if (ata_down_xfermask_limit(dev, ATA_DNXFER_FORCE_PIO) == 0) {
1933 dev->spdn_cnt = 0;
Tejun Heocf480622008-01-24 00:05:14 +09001934 action |= ATA_EH_RESET;
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001935 goto done;
1936 }
1937 }
1938
Tejun Heo022bdb02006-05-15 20:58:22 +09001939 return 0;
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001940 done:
1941 /* device has been slowed down, blow error history */
Tejun Heo76326ac2007-11-27 19:28:59 +09001942 if (!(verdict & ATA_EH_SPDN_KEEP_ERRORS))
1943 ata_ering_clear(&dev->ering);
Tejun Heo7d47e8d2007-02-02 16:22:31 +09001944 return action;
Tejun Heo022bdb02006-05-15 20:58:22 +09001945}
1946
1947/**
Tejun Heo9b1e2652007-08-06 18:36:24 +09001948 * ata_eh_link_autopsy - analyze error and determine recovery action
1949 * @link: host link to perform autopsy on
Tejun Heo022bdb02006-05-15 20:58:22 +09001950 *
Tejun Heo02607312007-08-06 18:36:23 +09001951 * Analyze why @link failed and determine which recovery actions
1952 * are needed. This function also sets more detailed AC_ERR_*
1953 * values and fills sense data for ATAPI CHECK SENSE.
Tejun Heo022bdb02006-05-15 20:58:22 +09001954 *
1955 * LOCKING:
1956 * Kernel thread context (may sleep).
1957 */
Tejun Heo9b1e2652007-08-06 18:36:24 +09001958static void ata_eh_link_autopsy(struct ata_link *link)
Tejun Heo022bdb02006-05-15 20:58:22 +09001959{
Tejun Heo02607312007-08-06 18:36:23 +09001960 struct ata_port *ap = link->ap;
Tejun Heo936fd732007-08-06 18:36:23 +09001961 struct ata_eh_context *ehc = &link->eh_context;
Tejun Heodfcc1732007-10-31 10:17:05 +09001962 struct ata_device *dev;
Tejun Heo3884f7b2007-11-27 19:28:56 +09001963 unsigned int all_err_mask = 0, eflags = 0;
1964 int tag;
Tejun Heo022bdb02006-05-15 20:58:22 +09001965 u32 serror;
1966 int rc;
1967
1968 DPRINTK("ENTER\n");
1969
Tejun Heo1cdaf532006-07-03 16:07:26 +09001970 if (ehc->i.flags & ATA_EHI_NO_AUTOPSY)
1971 return;
1972
Tejun Heo022bdb02006-05-15 20:58:22 +09001973 /* obtain and analyze SError */
Tejun Heo936fd732007-08-06 18:36:23 +09001974 rc = sata_scr_read(link, SCR_ERROR, &serror);
Tejun Heo022bdb02006-05-15 20:58:22 +09001975 if (rc == 0) {
1976 ehc->i.serror |= serror;
Tejun Heo02607312007-08-06 18:36:23 +09001977 ata_eh_analyze_serror(link);
Tejun Heo4e57c512007-07-16 14:29:41 +09001978 } else if (rc != -EOPNOTSUPP) {
Tejun Heocf480622008-01-24 00:05:14 +09001979 /* SError read failed, force reset and probing */
Tejun Heob558edd2008-01-24 00:05:14 +09001980 ehc->i.probe_mask |= ATA_ALL_DEVICES;
Tejun Heocf480622008-01-24 00:05:14 +09001981 ehc->i.action |= ATA_EH_RESET;
Tejun Heo4e57c512007-07-16 14:29:41 +09001982 ehc->i.err_mask |= AC_ERR_OTHER;
1983 }
Tejun Heo022bdb02006-05-15 20:58:22 +09001984
Tejun Heoe8ee8452006-05-15 21:03:46 +09001985 /* analyze NCQ failure */
Tejun Heo02607312007-08-06 18:36:23 +09001986 ata_eh_analyze_ncq_error(link);
Tejun Heoe8ee8452006-05-15 21:03:46 +09001987
Tejun Heo022bdb02006-05-15 20:58:22 +09001988 /* any real error trumps AC_ERR_OTHER */
1989 if (ehc->i.err_mask & ~AC_ERR_OTHER)
1990 ehc->i.err_mask &= ~AC_ERR_OTHER;
1991
1992 all_err_mask |= ehc->i.err_mask;
1993
1994 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) {
1995 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag);
1996
Tejun Heob1c72912008-07-31 17:02:43 +09001997 if (!(qc->flags & ATA_QCFLAG_FAILED) ||
1998 ata_dev_phys_link(qc->dev) != link)
Tejun Heo022bdb02006-05-15 20:58:22 +09001999 continue;
2000
2001 /* inherit upper level err_mask */
2002 qc->err_mask |= ehc->i.err_mask;
2003
Tejun Heo022bdb02006-05-15 20:58:22 +09002004 /* analyze TF */
Tejun Heo4528e4d2006-07-08 20:17:26 +09002005 ehc->i.action |= ata_eh_analyze_tf(qc, &qc->result_tf);
Tejun Heo022bdb02006-05-15 20:58:22 +09002006
2007 /* DEV errors are probably spurious in case of ATA_BUS error */
2008 if (qc->err_mask & AC_ERR_ATA_BUS)
2009 qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_MEDIA |
2010 AC_ERR_INVALID);
2011
2012 /* any real error trumps unknown error */
2013 if (qc->err_mask & ~AC_ERR_OTHER)
2014 qc->err_mask &= ~AC_ERR_OTHER;
2015
2016 /* SENSE_VALID trumps dev/unknown error and revalidation */
Tejun Heof90f0822007-10-26 16:12:41 +09002017 if (qc->flags & ATA_QCFLAG_SENSE_VALID)
Tejun Heo022bdb02006-05-15 20:58:22 +09002018 qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_OTHER);
Tejun Heo022bdb02006-05-15 20:58:22 +09002019
Tejun Heo03faab72008-03-27 19:14:24 +09002020 /* determine whether the command is worth retrying */
2021 if (!(qc->err_mask & AC_ERR_INVALID) &&
2022 ((qc->flags & ATA_QCFLAG_IO) || qc->err_mask != AC_ERR_DEV))
2023 qc->flags |= ATA_QCFLAG_RETRY;
2024
Tejun Heo022bdb02006-05-15 20:58:22 +09002025 /* accumulate error info */
Tejun Heo4528e4d2006-07-08 20:17:26 +09002026 ehc->i.dev = qc->dev;
Tejun Heo022bdb02006-05-15 20:58:22 +09002027 all_err_mask |= qc->err_mask;
2028 if (qc->flags & ATA_QCFLAG_IO)
Tejun Heo3884f7b2007-11-27 19:28:56 +09002029 eflags |= ATA_EFLAG_IS_IO;
Tejun Heo022bdb02006-05-15 20:58:22 +09002030 }
2031
Tejun Heoa20f33f2006-05-16 12:58:24 +09002032 /* enforce default EH actions */
Tejun Heob51e9e52006-06-29 01:29:30 +09002033 if (ap->pflags & ATA_PFLAG_FROZEN ||
Tejun Heoa20f33f2006-05-16 12:58:24 +09002034 all_err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT))
Tejun Heocf480622008-01-24 00:05:14 +09002035 ehc->i.action |= ATA_EH_RESET;
Tejun Heo3884f7b2007-11-27 19:28:56 +09002036 else if (((eflags & ATA_EFLAG_IS_IO) && all_err_mask) ||
2037 (!(eflags & ATA_EFLAG_IS_IO) && (all_err_mask & ~AC_ERR_DEV)))
Tejun Heo4528e4d2006-07-08 20:17:26 +09002038 ehc->i.action |= ATA_EH_REVALIDATE;
Tejun Heo022bdb02006-05-15 20:58:22 +09002039
Tejun Heodfcc1732007-10-31 10:17:05 +09002040 /* If we have offending qcs and the associated failed device,
2041 * perform per-dev EH action only on the offending device.
2042 */
Tejun Heo4528e4d2006-07-08 20:17:26 +09002043 if (ehc->i.dev) {
Tejun Heo4528e4d2006-07-08 20:17:26 +09002044 ehc->i.dev_action[ehc->i.dev->devno] |=
2045 ehc->i.action & ATA_EH_PERDEV_MASK;
2046 ehc->i.action &= ~ATA_EH_PERDEV_MASK;
Tejun Heo47005f22006-06-19 18:27:23 +09002047 }
2048
Tejun Heo2695e362008-01-10 13:41:23 +09002049 /* propagate timeout to host link */
2050 if ((all_err_mask & AC_ERR_TIMEOUT) && !ata_is_host_link(link))
2051 ap->link.eh_context.i.err_mask |= AC_ERR_TIMEOUT;
2052
2053 /* record error and consider speeding down */
Tejun Heodfcc1732007-10-31 10:17:05 +09002054 dev = ehc->i.dev;
Tejun Heo2695e362008-01-10 13:41:23 +09002055 if (!dev && ((ata_link_max_devices(link) == 1 &&
2056 ata_dev_enabled(link->device))))
2057 dev = link->device;
Tejun Heodfcc1732007-10-31 10:17:05 +09002058
Tejun Heo76326ac2007-11-27 19:28:59 +09002059 if (dev) {
2060 if (dev->flags & ATA_DFLAG_DUBIOUS_XFER)
2061 eflags |= ATA_EFLAG_DUBIOUS_XFER;
Tejun Heo3884f7b2007-11-27 19:28:56 +09002062 ehc->i.action |= ata_eh_speed_down(dev, eflags, all_err_mask);
Tejun Heo76326ac2007-11-27 19:28:59 +09002063 }
Tejun Heodfcc1732007-10-31 10:17:05 +09002064
Tejun Heo022bdb02006-05-15 20:58:22 +09002065 DPRINTK("EXIT\n");
2066}
2067
2068/**
Tejun Heo9b1e2652007-08-06 18:36:24 +09002069 * ata_eh_autopsy - analyze error and determine recovery action
2070 * @ap: host port to perform autopsy on
2071 *
2072 * Analyze all links of @ap and determine why they failed and
2073 * which recovery actions are needed.
2074 *
2075 * LOCKING:
2076 * Kernel thread context (may sleep).
2077 */
Tejun Heofb7fd612007-09-23 13:14:12 +09002078void ata_eh_autopsy(struct ata_port *ap)
Tejun Heo9b1e2652007-08-06 18:36:24 +09002079{
2080 struct ata_link *link;
2081
Tejun Heo1eca4362008-11-03 20:03:17 +09002082 ata_for_each_link(link, ap, EDGE)
Tejun Heo9b1e2652007-08-06 18:36:24 +09002083 ata_eh_link_autopsy(link);
Tejun Heo2695e362008-01-10 13:41:23 +09002084
Tejun Heob1c72912008-07-31 17:02:43 +09002085 /* Handle the frigging slave link. Autopsy is done similarly
2086 * but actions and flags are transferred over to the master
2087 * link and handled from there.
2088 */
2089 if (ap->slave_link) {
2090 struct ata_eh_context *mehc = &ap->link.eh_context;
2091 struct ata_eh_context *sehc = &ap->slave_link->eh_context;
2092
Tejun Heo848e4c62008-10-21 14:26:39 +09002093 /* transfer control flags from master to slave */
2094 sehc->i.flags |= mehc->i.flags & ATA_EHI_TO_SLAVE_MASK;
2095
2096 /* perform autopsy on the slave link */
Tejun Heob1c72912008-07-31 17:02:43 +09002097 ata_eh_link_autopsy(ap->slave_link);
2098
Tejun Heo848e4c62008-10-21 14:26:39 +09002099 /* transfer actions from slave to master and clear slave */
Tejun Heob1c72912008-07-31 17:02:43 +09002100 ata_eh_about_to_do(ap->slave_link, NULL, ATA_EH_ALL_ACTIONS);
2101 mehc->i.action |= sehc->i.action;
2102 mehc->i.dev_action[1] |= sehc->i.dev_action[1];
2103 mehc->i.flags |= sehc->i.flags;
2104 ata_eh_done(ap->slave_link, NULL, ATA_EH_ALL_ACTIONS);
2105 }
2106
Tejun Heo2695e362008-01-10 13:41:23 +09002107 /* Autopsy of fanout ports can affect host link autopsy.
2108 * Perform host link autopsy last.
2109 */
Tejun Heo071f44b2008-04-07 22:47:22 +09002110 if (sata_pmp_attached(ap))
Tejun Heo2695e362008-01-10 13:41:23 +09002111 ata_eh_link_autopsy(&ap->link);
Tejun Heo9b1e2652007-08-06 18:36:24 +09002112}
2113
2114/**
2115 * ata_eh_link_report - report error handling to user
Tejun Heo02607312007-08-06 18:36:23 +09002116 * @link: ATA link EH is going on
Tejun Heo022bdb02006-05-15 20:58:22 +09002117 *
2118 * Report EH to user.
2119 *
2120 * LOCKING:
2121 * None.
2122 */
Tejun Heo9b1e2652007-08-06 18:36:24 +09002123static void ata_eh_link_report(struct ata_link *link)
Tejun Heo022bdb02006-05-15 20:58:22 +09002124{
Tejun Heo02607312007-08-06 18:36:23 +09002125 struct ata_port *ap = link->ap;
2126 struct ata_eh_context *ehc = &link->eh_context;
Tejun Heo022bdb02006-05-15 20:58:22 +09002127 const char *frozen, *desc;
Tejun Heoa1e10f72007-08-18 13:28:49 +09002128 char tries_buf[6];
Tejun Heo022bdb02006-05-15 20:58:22 +09002129 int tag, nr_failed = 0;
2130
Tejun Heo94ff3d52007-10-09 14:57:56 +09002131 if (ehc->i.flags & ATA_EHI_QUIET)
2132 return;
2133
Tejun Heo022bdb02006-05-15 20:58:22 +09002134 desc = NULL;
2135 if (ehc->i.desc[0] != '\0')
2136 desc = ehc->i.desc;
2137
2138 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) {
2139 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag);
2140
Tejun Heob1c72912008-07-31 17:02:43 +09002141 if (!(qc->flags & ATA_QCFLAG_FAILED) ||
2142 ata_dev_phys_link(qc->dev) != link ||
Tejun Heoe027bd32007-10-26 16:19:26 +09002143 ((qc->flags & ATA_QCFLAG_QUIET) &&
2144 qc->err_mask == AC_ERR_DEV))
Tejun Heo022bdb02006-05-15 20:58:22 +09002145 continue;
2146 if (qc->flags & ATA_QCFLAG_SENSE_VALID && !qc->err_mask)
2147 continue;
2148
2149 nr_failed++;
2150 }
2151
2152 if (!nr_failed && !ehc->i.err_mask)
2153 return;
2154
2155 frozen = "";
Tejun Heob51e9e52006-06-29 01:29:30 +09002156 if (ap->pflags & ATA_PFLAG_FROZEN)
Tejun Heo022bdb02006-05-15 20:58:22 +09002157 frozen = " frozen";
2158
Tejun Heoa1e10f72007-08-18 13:28:49 +09002159 memset(tries_buf, 0, sizeof(tries_buf));
2160 if (ap->eh_tries < ATA_EH_MAX_TRIES)
2161 snprintf(tries_buf, sizeof(tries_buf) - 1, " t%d",
2162 ap->eh_tries);
2163
Tejun Heo022bdb02006-05-15 20:58:22 +09002164 if (ehc->i.dev) {
Tejun Heoe8ee8452006-05-15 21:03:46 +09002165 ata_dev_printk(ehc->i.dev, KERN_ERR, "exception Emask 0x%x "
Tejun Heoa1e10f72007-08-18 13:28:49 +09002166 "SAct 0x%x SErr 0x%x action 0x%x%s%s\n",
2167 ehc->i.err_mask, link->sactive, ehc->i.serror,
2168 ehc->i.action, frozen, tries_buf);
Tejun Heo022bdb02006-05-15 20:58:22 +09002169 if (desc)
Tejun Heob64bbc32007-07-16 14:29:39 +09002170 ata_dev_printk(ehc->i.dev, KERN_ERR, "%s\n", desc);
Tejun Heo022bdb02006-05-15 20:58:22 +09002171 } else {
Tejun Heo02607312007-08-06 18:36:23 +09002172 ata_link_printk(link, KERN_ERR, "exception Emask 0x%x "
Tejun Heoa1e10f72007-08-18 13:28:49 +09002173 "SAct 0x%x SErr 0x%x action 0x%x%s%s\n",
2174 ehc->i.err_mask, link->sactive, ehc->i.serror,
2175 ehc->i.action, frozen, tries_buf);
Tejun Heo022bdb02006-05-15 20:58:22 +09002176 if (desc)
Tejun Heo02607312007-08-06 18:36:23 +09002177 ata_link_printk(link, KERN_ERR, "%s\n", desc);
Tejun Heo022bdb02006-05-15 20:58:22 +09002178 }
2179
Robert Hancock1333e192007-10-02 11:22:02 -04002180 if (ehc->i.serror)
Tejun Heoda0e21d2008-07-31 16:08:38 +09002181 ata_link_printk(link, KERN_ERR,
Robert Hancock1333e192007-10-02 11:22:02 -04002182 "SError: { %s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s}\n",
2183 ehc->i.serror & SERR_DATA_RECOVERED ? "RecovData " : "",
2184 ehc->i.serror & SERR_COMM_RECOVERED ? "RecovComm " : "",
2185 ehc->i.serror & SERR_DATA ? "UnrecovData " : "",
2186 ehc->i.serror & SERR_PERSISTENT ? "Persist " : "",
2187 ehc->i.serror & SERR_PROTOCOL ? "Proto " : "",
2188 ehc->i.serror & SERR_INTERNAL ? "HostInt " : "",
2189 ehc->i.serror & SERR_PHYRDY_CHG ? "PHYRdyChg " : "",
2190 ehc->i.serror & SERR_PHY_INT_ERR ? "PHYInt " : "",
2191 ehc->i.serror & SERR_COMM_WAKE ? "CommWake " : "",
2192 ehc->i.serror & SERR_10B_8B_ERR ? "10B8B " : "",
2193 ehc->i.serror & SERR_DISPARITY ? "Dispar " : "",
2194 ehc->i.serror & SERR_CRC ? "BadCRC " : "",
2195 ehc->i.serror & SERR_HANDSHAKE ? "Handshk " : "",
2196 ehc->i.serror & SERR_LINK_SEQ_ERR ? "LinkSeq " : "",
2197 ehc->i.serror & SERR_TRANS_ST_ERROR ? "TrStaTrns " : "",
2198 ehc->i.serror & SERR_UNRECOG_FIS ? "UnrecFIS " : "",
Jeff Garzik2dcb4072007-10-19 06:42:56 -04002199 ehc->i.serror & SERR_DEV_XCHG ? "DevExch " : "");
Robert Hancock1333e192007-10-02 11:22:02 -04002200
Tejun Heo022bdb02006-05-15 20:58:22 +09002201 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) {
2202 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag);
Tejun Heo8a937582006-11-14 22:36:12 +09002203 struct ata_taskfile *cmd = &qc->tf, *res = &qc->result_tf;
Tejun Heoabb6a882007-11-28 23:16:09 +09002204 const u8 *cdb = qc->cdb;
2205 char data_buf[20] = "";
2206 char cdb_buf[70] = "";
Tejun Heo022bdb02006-05-15 20:58:22 +09002207
Tejun Heo02607312007-08-06 18:36:23 +09002208 if (!(qc->flags & ATA_QCFLAG_FAILED) ||
Tejun Heob1c72912008-07-31 17:02:43 +09002209 ata_dev_phys_link(qc->dev) != link || !qc->err_mask)
Tejun Heo022bdb02006-05-15 20:58:22 +09002210 continue;
2211
Tejun Heoabb6a882007-11-28 23:16:09 +09002212 if (qc->dma_dir != DMA_NONE) {
2213 static const char *dma_str[] = {
2214 [DMA_BIDIRECTIONAL] = "bidi",
2215 [DMA_TO_DEVICE] = "out",
2216 [DMA_FROM_DEVICE] = "in",
2217 };
2218 static const char *prot_str[] = {
2219 [ATA_PROT_PIO] = "pio",
2220 [ATA_PROT_DMA] = "dma",
2221 [ATA_PROT_NCQ] = "ncq",
Tejun Heo0dc36882007-12-18 16:34:43 -05002222 [ATAPI_PROT_PIO] = "pio",
2223 [ATAPI_PROT_DMA] = "dma",
Tejun Heoabb6a882007-11-28 23:16:09 +09002224 };
2225
2226 snprintf(data_buf, sizeof(data_buf), " %s %u %s",
2227 prot_str[qc->tf.protocol], qc->nbytes,
2228 dma_str[qc->dma_dir]);
2229 }
2230
Jeff Garzike39eec12007-12-01 18:05:39 -05002231 if (ata_is_atapi(qc->tf.protocol))
Tejun Heoabb6a882007-11-28 23:16:09 +09002232 snprintf(cdb_buf, sizeof(cdb_buf),
2233 "cdb %02x %02x %02x %02x %02x %02x %02x %02x "
2234 "%02x %02x %02x %02x %02x %02x %02x %02x\n ",
2235 cdb[0], cdb[1], cdb[2], cdb[3],
2236 cdb[4], cdb[5], cdb[6], cdb[7],
2237 cdb[8], cdb[9], cdb[10], cdb[11],
2238 cdb[12], cdb[13], cdb[14], cdb[15]);
2239
Tejun Heo8a937582006-11-14 22:36:12 +09002240 ata_dev_printk(qc->dev, KERN_ERR,
2241 "cmd %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x "
Tejun Heoabb6a882007-11-28 23:16:09 +09002242 "tag %d%s\n %s"
Tejun Heo8a937582006-11-14 22:36:12 +09002243 "res %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x "
Tejun Heo5335b722007-07-16 14:29:40 +09002244 "Emask 0x%x (%s)%s\n",
Tejun Heo8a937582006-11-14 22:36:12 +09002245 cmd->command, cmd->feature, cmd->nsect,
2246 cmd->lbal, cmd->lbam, cmd->lbah,
2247 cmd->hob_feature, cmd->hob_nsect,
2248 cmd->hob_lbal, cmd->hob_lbam, cmd->hob_lbah,
Tejun Heoabb6a882007-11-28 23:16:09 +09002249 cmd->device, qc->tag, data_buf, cdb_buf,
Tejun Heo8a937582006-11-14 22:36:12 +09002250 res->command, res->feature, res->nsect,
2251 res->lbal, res->lbam, res->lbah,
2252 res->hob_feature, res->hob_nsect,
2253 res->hob_lbal, res->hob_lbam, res->hob_lbah,
Tejun Heo5335b722007-07-16 14:29:40 +09002254 res->device, qc->err_mask, ata_err_string(qc->err_mask),
2255 qc->err_mask & AC_ERR_NCQ ? " <F>" : "");
Robert Hancock1333e192007-10-02 11:22:02 -04002256
2257 if (res->command & (ATA_BUSY | ATA_DRDY | ATA_DF | ATA_DRQ |
Jeff Garzik2dcb4072007-10-19 06:42:56 -04002258 ATA_ERR)) {
Robert Hancock1333e192007-10-02 11:22:02 -04002259 if (res->command & ATA_BUSY)
2260 ata_dev_printk(qc->dev, KERN_ERR,
Jeff Garzik2dcb4072007-10-19 06:42:56 -04002261 "status: { Busy }\n");
Robert Hancock1333e192007-10-02 11:22:02 -04002262 else
2263 ata_dev_printk(qc->dev, KERN_ERR,
2264 "status: { %s%s%s%s}\n",
2265 res->command & ATA_DRDY ? "DRDY " : "",
2266 res->command & ATA_DF ? "DF " : "",
2267 res->command & ATA_DRQ ? "DRQ " : "",
Jeff Garzik2dcb4072007-10-19 06:42:56 -04002268 res->command & ATA_ERR ? "ERR " : "");
Robert Hancock1333e192007-10-02 11:22:02 -04002269 }
2270
2271 if (cmd->command != ATA_CMD_PACKET &&
2272 (res->feature & (ATA_ICRC | ATA_UNC | ATA_IDNF |
2273 ATA_ABORTED)))
2274 ata_dev_printk(qc->dev, KERN_ERR,
2275 "error: { %s%s%s%s}\n",
2276 res->feature & ATA_ICRC ? "ICRC " : "",
2277 res->feature & ATA_UNC ? "UNC " : "",
2278 res->feature & ATA_IDNF ? "IDNF " : "",
Jeff Garzik2dcb4072007-10-19 06:42:56 -04002279 res->feature & ATA_ABORTED ? "ABRT " : "");
Tejun Heo022bdb02006-05-15 20:58:22 +09002280 }
2281}
2282
Tejun Heo9b1e2652007-08-06 18:36:24 +09002283/**
2284 * ata_eh_report - report error handling to user
2285 * @ap: ATA port to report EH about
2286 *
2287 * Report EH to user.
2288 *
2289 * LOCKING:
2290 * None.
2291 */
Tejun Heofb7fd612007-09-23 13:14:12 +09002292void ata_eh_report(struct ata_port *ap)
Tejun Heo9b1e2652007-08-06 18:36:24 +09002293{
2294 struct ata_link *link;
2295
Tejun Heo1eca4362008-11-03 20:03:17 +09002296 ata_for_each_link(link, ap, HOST_FIRST)
Tejun Heo9b1e2652007-08-06 18:36:24 +09002297 ata_eh_link_report(link);
2298}
2299
Tejun Heocc0680a2007-08-06 18:36:23 +09002300static int ata_do_reset(struct ata_link *link, ata_reset_fn_t reset,
Tejun Heob1c72912008-07-31 17:02:43 +09002301 unsigned int *classes, unsigned long deadline,
2302 bool clear_classes)
Tejun Heod87fa382006-05-31 18:28:24 +09002303{
Tejun Heof58229f2007-08-06 18:36:23 +09002304 struct ata_device *dev;
Tejun Heod87fa382006-05-31 18:28:24 +09002305
Tejun Heob1c72912008-07-31 17:02:43 +09002306 if (clear_classes)
Tejun Heo1eca4362008-11-03 20:03:17 +09002307 ata_for_each_dev(dev, link, ALL)
Tejun Heob1c72912008-07-31 17:02:43 +09002308 classes[dev->devno] = ATA_DEV_UNKNOWN;
Tejun Heod87fa382006-05-31 18:28:24 +09002309
Tejun Heof0465192008-05-19 01:15:08 +09002310 return reset(link, classes, deadline);
Tejun Heod87fa382006-05-31 18:28:24 +09002311}
2312
Tejun Heoae791c02007-09-23 13:14:12 +09002313static int ata_eh_followup_srst_needed(struct ata_link *link,
Tejun Heo5dbfc9c2008-07-31 16:08:02 +09002314 int rc, const unsigned int *classes)
Tejun Heo664faf02006-05-31 18:27:50 +09002315{
Tejun Heo45db2f62008-04-08 01:46:56 +09002316 if ((link->flags & ATA_LFLAG_NO_SRST) || ata_link_offline(link))
Tejun Heoae791c02007-09-23 13:14:12 +09002317 return 0;
Tejun Heo5dbfc9c2008-07-31 16:08:02 +09002318 if (rc == -EAGAIN)
2319 return 1;
Tejun Heo071f44b2008-04-07 22:47:22 +09002320 if (sata_pmp_supported(link->ap) && ata_is_host_link(link))
Tejun Heo3495de72007-09-23 13:19:53 +09002321 return 1;
Tejun Heo664faf02006-05-31 18:27:50 +09002322 return 0;
2323}
2324
Tejun Heofb7fd612007-09-23 13:14:12 +09002325int ata_eh_reset(struct ata_link *link, int classify,
2326 ata_prereset_fn_t prereset, ata_reset_fn_t softreset,
2327 ata_reset_fn_t hardreset, ata_postreset_fn_t postreset)
Tejun Heo022bdb02006-05-15 20:58:22 +09002328{
Tejun Heoafaa5c32007-10-09 15:06:10 +09002329 struct ata_port *ap = link->ap;
Tejun Heob1c72912008-07-31 17:02:43 +09002330 struct ata_link *slave = ap->slave_link;
Tejun Heo936fd732007-08-06 18:36:23 +09002331 struct ata_eh_context *ehc = &link->eh_context;
Bartlomiej Zolnierkiewicz705d2012009-07-26 16:21:01 +02002332 struct ata_eh_context *sehc = slave ? &slave->eh_context : NULL;
Tejun Heo664faf02006-05-31 18:27:50 +09002333 unsigned int *classes = ehc->classes;
Tejun Heo416dc9e2007-10-31 10:17:03 +09002334 unsigned int lflags = link->flags;
Tejun Heo1cdaf532006-07-03 16:07:26 +09002335 int verbose = !(ehc->i.flags & ATA_EHI_QUIET);
Tejun Heod8af0eb2008-05-20 02:17:53 +09002336 int max_tries = 0, try = 0;
Tejun Heob1c72912008-07-31 17:02:43 +09002337 struct ata_link *failed_link;
Tejun Heof58229f2007-08-06 18:36:23 +09002338 struct ata_device *dev;
Tejun Heo416dc9e2007-10-31 10:17:03 +09002339 unsigned long deadline, now;
Tejun Heo022bdb02006-05-15 20:58:22 +09002340 ata_reset_fn_t reset;
Tejun Heoafaa5c32007-10-09 15:06:10 +09002341 unsigned long flags;
Tejun Heo416dc9e2007-10-31 10:17:03 +09002342 u32 sstatus;
Tejun Heob1c72912008-07-31 17:02:43 +09002343 int nr_unknown, rc;
Tejun Heo022bdb02006-05-15 20:58:22 +09002344
Tejun Heo932648b2008-05-19 01:15:06 +09002345 /*
2346 * Prepare to reset
2347 */
Tejun Heod8af0eb2008-05-20 02:17:53 +09002348 while (ata_eh_reset_timeouts[max_tries] != ULONG_MAX)
2349 max_tries++;
Tejun Heo05944bd2008-08-13 20:19:09 +09002350 if (link->flags & ATA_LFLAG_NO_HRST)
2351 hardreset = NULL;
2352 if (link->flags & ATA_LFLAG_NO_SRST)
2353 softreset = NULL;
Tejun Heod8af0eb2008-05-20 02:17:53 +09002354
Tejun Heo19b72322008-11-04 17:08:40 +09002355 /* make sure each reset attemp is at least COOL_DOWN apart */
2356 if (ehc->i.flags & ATA_EHI_DID_RESET) {
2357 now = jiffies;
2358 WARN_ON(time_after(ehc->last_reset, now));
2359 deadline = ata_deadline(ehc->last_reset,
2360 ATA_EH_RESET_COOL_DOWN);
2361 if (time_before(now, deadline))
2362 schedule_timeout_uninterruptible(deadline - now);
2363 }
Tejun Heo0a2c0f52008-05-20 02:17:52 +09002364
Tejun Heoafaa5c32007-10-09 15:06:10 +09002365 spin_lock_irqsave(ap->lock, flags);
2366 ap->pflags |= ATA_PFLAG_RESETTING;
2367 spin_unlock_irqrestore(ap->lock, flags);
2368
Tejun Heocf480622008-01-24 00:05:14 +09002369 ata_eh_about_to_do(link, NULL, ATA_EH_RESET);
Tejun Heo13abf502006-07-10 23:18:46 +09002370
Tejun Heo1eca4362008-11-03 20:03:17 +09002371 ata_for_each_dev(dev, link, ALL) {
Tejun Heocdeab112007-10-29 16:41:09 +09002372 /* If we issue an SRST then an ATA drive (not ATAPI)
2373 * may change configuration and be in PIO0 timing. If
2374 * we do a hard reset (or are coming from power on)
2375 * this is true for ATA or ATAPI. Until we've set a
2376 * suitable controller mode we should not touch the
2377 * bus as we may be talking too fast.
2378 */
2379 dev->pio_mode = XFER_PIO_0;
2380
2381 /* If the controller has a pio mode setup function
2382 * then use it to set the chipset to rights. Don't
2383 * touch the DMA setup as that will be dealt with when
2384 * configuring devices.
2385 */
2386 if (ap->ops->set_piomode)
2387 ap->ops->set_piomode(ap, dev);
2388 }
2389
Tejun Heocf480622008-01-24 00:05:14 +09002390 /* prefer hardreset */
Tejun Heo932648b2008-05-19 01:15:06 +09002391 reset = NULL;
Tejun Heocf480622008-01-24 00:05:14 +09002392 ehc->i.action &= ~ATA_EH_RESET;
2393 if (hardreset) {
2394 reset = hardreset;
Tejun Heoa6740502008-07-31 16:07:04 +09002395 ehc->i.action |= ATA_EH_HARDRESET;
Tejun Heo4f7faa32008-01-30 18:18:26 +09002396 } else if (softreset) {
Tejun Heocf480622008-01-24 00:05:14 +09002397 reset = softreset;
Tejun Heoa6740502008-07-31 16:07:04 +09002398 ehc->i.action |= ATA_EH_SOFTRESET;
Tejun Heocf480622008-01-24 00:05:14 +09002399 }
Tejun Heof5914a42006-05-31 18:27:48 +09002400
2401 if (prereset) {
Tejun Heob1c72912008-07-31 17:02:43 +09002402 unsigned long deadline = ata_deadline(jiffies,
2403 ATA_EH_PRERESET_TIMEOUT);
2404
2405 if (slave) {
2406 sehc->i.action &= ~ATA_EH_RESET;
2407 sehc->i.action |= ehc->i.action;
2408 }
2409
2410 rc = prereset(link, deadline);
2411
2412 /* If present, do prereset on slave link too. Reset
2413 * is skipped iff both master and slave links report
2414 * -ENOENT or clear ATA_EH_RESET.
2415 */
2416 if (slave && (rc == 0 || rc == -ENOENT)) {
2417 int tmp;
2418
2419 tmp = prereset(slave, deadline);
2420 if (tmp != -ENOENT)
2421 rc = tmp;
2422
2423 ehc->i.action |= sehc->i.action;
2424 }
2425
Tejun Heof5914a42006-05-31 18:27:48 +09002426 if (rc) {
Alan Coxc9619222006-09-26 17:53:38 +01002427 if (rc == -ENOENT) {
Tejun Heocc0680a2007-08-06 18:36:23 +09002428 ata_link_printk(link, KERN_DEBUG,
Tejun Heo4aa9ab62007-03-12 17:24:08 +09002429 "port disabled. ignoring.\n");
Tejun Heocf480622008-01-24 00:05:14 +09002430 ehc->i.action &= ~ATA_EH_RESET;
Tejun Heo4aa9ab62007-03-12 17:24:08 +09002431
Tejun Heo1eca4362008-11-03 20:03:17 +09002432 ata_for_each_dev(dev, link, ALL)
Tejun Heof58229f2007-08-06 18:36:23 +09002433 classes[dev->devno] = ATA_DEV_NONE;
Tejun Heo4aa9ab62007-03-12 17:24:08 +09002434
2435 rc = 0;
Alan Coxc9619222006-09-26 17:53:38 +01002436 } else
Tejun Heocc0680a2007-08-06 18:36:23 +09002437 ata_link_printk(link, KERN_ERR,
Tejun Heof5914a42006-05-31 18:27:48 +09002438 "prereset failed (errno=%d)\n", rc);
Tejun Heofccb6ea2007-07-16 14:29:41 +09002439 goto out;
Tejun Heof5914a42006-05-31 18:27:48 +09002440 }
Tejun Heof5914a42006-05-31 18:27:48 +09002441
Tejun Heo932648b2008-05-19 01:15:06 +09002442 /* prereset() might have cleared ATA_EH_RESET. If so,
Tejun Heod6515e62009-03-04 15:59:30 +09002443 * bang classes, thaw and return.
Tejun Heo932648b2008-05-19 01:15:06 +09002444 */
2445 if (reset && !(ehc->i.action & ATA_EH_RESET)) {
Tejun Heo1eca4362008-11-03 20:03:17 +09002446 ata_for_each_dev(dev, link, ALL)
Tejun Heo932648b2008-05-19 01:15:06 +09002447 classes[dev->devno] = ATA_DEV_NONE;
Tejun Heod6515e62009-03-04 15:59:30 +09002448 if ((ap->pflags & ATA_PFLAG_FROZEN) &&
2449 ata_is_host_link(link))
2450 ata_eh_thaw_port(ap);
Tejun Heo932648b2008-05-19 01:15:06 +09002451 rc = 0;
2452 goto out;
2453 }
Tejun Heof5914a42006-05-31 18:27:48 +09002454 }
2455
Tejun Heo022bdb02006-05-15 20:58:22 +09002456 retry:
Tejun Heo932648b2008-05-19 01:15:06 +09002457 /*
2458 * Perform reset
2459 */
Tejun Heodc98c322008-05-19 01:15:07 +09002460 if (ata_is_host_link(link))
2461 ata_eh_freeze_port(ap);
2462
Tejun Heo341c2c92008-05-20 02:17:51 +09002463 deadline = ata_deadline(jiffies, ata_eh_reset_timeouts[try++]);
Tejun Heo31daabd2007-02-02 16:50:52 +09002464
Tejun Heo932648b2008-05-19 01:15:06 +09002465 if (reset) {
2466 if (verbose)
2467 ata_link_printk(link, KERN_INFO, "%s resetting link\n",
2468 reset == softreset ? "soft" : "hard");
Tejun Heo022bdb02006-05-15 20:58:22 +09002469
Tejun Heo932648b2008-05-19 01:15:06 +09002470 /* mark that this EH session started with reset */
Tejun Heo19b72322008-11-04 17:08:40 +09002471 ehc->last_reset = jiffies;
Tejun Heo932648b2008-05-19 01:15:06 +09002472 if (reset == hardreset)
2473 ehc->i.flags |= ATA_EHI_DID_HARDRESET;
2474 else
2475 ehc->i.flags |= ATA_EHI_DID_SOFTRESET;
Tejun Heo022bdb02006-05-15 20:58:22 +09002476
Tejun Heob1c72912008-07-31 17:02:43 +09002477 rc = ata_do_reset(link, reset, classes, deadline, true);
2478 if (rc && rc != -EAGAIN) {
2479 failed_link = link;
Tejun Heo5dbfc9c2008-07-31 16:08:02 +09002480 goto fail;
Tejun Heob1c72912008-07-31 17:02:43 +09002481 }
Tejun Heo022bdb02006-05-15 20:58:22 +09002482
Tejun Heob1c72912008-07-31 17:02:43 +09002483 /* hardreset slave link if existent */
2484 if (slave && reset == hardreset) {
2485 int tmp;
2486
2487 if (verbose)
2488 ata_link_printk(slave, KERN_INFO,
2489 "hard resetting link\n");
2490
2491 ata_eh_about_to_do(slave, NULL, ATA_EH_RESET);
2492 tmp = ata_do_reset(slave, reset, classes, deadline,
2493 false);
2494 switch (tmp) {
2495 case -EAGAIN:
2496 rc = -EAGAIN;
2497 case 0:
2498 break;
2499 default:
2500 failed_link = slave;
2501 rc = tmp;
2502 goto fail;
2503 }
2504 }
2505
2506 /* perform follow-up SRST if necessary */
Tejun Heo932648b2008-05-19 01:15:06 +09002507 if (reset == hardreset &&
Tejun Heo5dbfc9c2008-07-31 16:08:02 +09002508 ata_eh_followup_srst_needed(link, rc, classes)) {
Tejun Heo932648b2008-05-19 01:15:06 +09002509 reset = softreset;
Tejun Heo664faf02006-05-31 18:27:50 +09002510
Tejun Heo932648b2008-05-19 01:15:06 +09002511 if (!reset) {
2512 ata_link_printk(link, KERN_ERR,
2513 "follow-up softreset required "
2514 "but no softreset avaliable\n");
Tejun Heob1c72912008-07-31 17:02:43 +09002515 failed_link = link;
Tejun Heo932648b2008-05-19 01:15:06 +09002516 rc = -EINVAL;
2517 goto fail;
2518 }
2519
2520 ata_eh_about_to_do(link, NULL, ATA_EH_RESET);
Tejun Heob1c72912008-07-31 17:02:43 +09002521 rc = ata_do_reset(link, reset, classes, deadline, true);
Tejun Heofe2c4d02009-07-08 12:16:37 +09002522 if (rc) {
2523 failed_link = link;
2524 goto fail;
2525 }
Tejun Heo664faf02006-05-31 18:27:50 +09002526 }
Tejun Heo932648b2008-05-19 01:15:06 +09002527 } else {
2528 if (verbose)
2529 ata_link_printk(link, KERN_INFO, "no reset method "
2530 "available, skipping reset\n");
2531 if (!(lflags & ATA_LFLAG_ASSUME_CLASS))
2532 lflags |= ATA_LFLAG_ASSUME_ATA;
Tejun Heo664faf02006-05-31 18:27:50 +09002533 }
2534
Tejun Heo932648b2008-05-19 01:15:06 +09002535 /*
2536 * Post-reset processing
2537 */
Tejun Heo1eca4362008-11-03 20:03:17 +09002538 ata_for_each_dev(dev, link, ALL) {
Tejun Heo416dc9e2007-10-31 10:17:03 +09002539 /* After the reset, the device state is PIO 0 and the
2540 * controller state is undefined. Reset also wakes up
2541 * drives from sleeping mode.
2542 */
2543 dev->pio_mode = XFER_PIO_0;
2544 dev->flags &= ~ATA_DFLAG_SLEEPING;
Tejun Heo664faf02006-05-31 18:27:50 +09002545
Tejun Heo816ab892008-10-22 00:31:34 +09002546 if (!ata_phys_link_offline(ata_dev_phys_link(dev))) {
2547 /* apply class override */
2548 if (lflags & ATA_LFLAG_ASSUME_ATA)
2549 classes[dev->devno] = ATA_DEV_ATA;
2550 else if (lflags & ATA_LFLAG_ASSUME_SEMB)
2551 classes[dev->devno] = ATA_DEV_SEMB_UNSUP;
2552 } else
2553 classes[dev->devno] = ATA_DEV_NONE;
Tejun Heo022bdb02006-05-15 20:58:22 +09002554 }
2555
Tejun Heo416dc9e2007-10-31 10:17:03 +09002556 /* record current link speed */
2557 if (sata_scr_read(link, SCR_STATUS, &sstatus) == 0)
2558 link->sata_spd = (sstatus >> 4) & 0xf;
Tejun Heob1c72912008-07-31 17:02:43 +09002559 if (slave && sata_scr_read(slave, SCR_STATUS, &sstatus) == 0)
2560 slave->sata_spd = (sstatus >> 4) & 0xf;
Tejun Heo008a7892007-07-16 14:29:40 +09002561
Tejun Heodc98c322008-05-19 01:15:07 +09002562 /* thaw the port */
2563 if (ata_is_host_link(link))
2564 ata_eh_thaw_port(ap);
2565
Tejun Heof0465192008-05-19 01:15:08 +09002566 /* postreset() should clear hardware SError. Although SError
2567 * is cleared during link resume, clearing SError here is
2568 * necessary as some PHYs raise hotplug events after SRST.
2569 * This introduces race condition where hotplug occurs between
2570 * reset and here. This race is mediated by cross checking
2571 * link onlineness and classification result later.
2572 */
Tejun Heob1c72912008-07-31 17:02:43 +09002573 if (postreset) {
Tejun Heo416dc9e2007-10-31 10:17:03 +09002574 postreset(link, classes);
Tejun Heob1c72912008-07-31 17:02:43 +09002575 if (slave)
2576 postreset(slave, classes);
2577 }
Tejun Heo20952b62006-05-31 18:27:23 +09002578
Tejun Heo1e641062009-07-17 11:58:33 +09002579 /*
2580 * Some controllers can't be frozen very well and may set
2581 * spuruious error conditions during reset. Clear accumulated
2582 * error information. As reset is the final recovery action,
2583 * nothing is lost by doing this.
2584 */
Tejun Heof0465192008-05-19 01:15:08 +09002585 spin_lock_irqsave(link->ap->lock, flags);
Tejun Heo1e641062009-07-17 11:58:33 +09002586 memset(&link->eh_info, 0, sizeof(link->eh_info));
Tejun Heob1c72912008-07-31 17:02:43 +09002587 if (slave)
Tejun Heo1e641062009-07-17 11:58:33 +09002588 memset(&slave->eh_info, 0, sizeof(link->eh_info));
2589 ap->pflags &= ~ATA_PFLAG_EH_PENDING;
Tejun Heof0465192008-05-19 01:15:08 +09002590 spin_unlock_irqrestore(link->ap->lock, flags);
2591
2592 /* Make sure onlineness and classification result correspond.
2593 * Hotplug could have happened during reset and some
2594 * controllers fail to wait while a drive is spinning up after
2595 * being hotplugged causing misdetection. By cross checking
2596 * link onlineness and classification result, those conditions
2597 * can be reliably detected and retried.
2598 */
Tejun Heob1c72912008-07-31 17:02:43 +09002599 nr_unknown = 0;
Tejun Heo1eca4362008-11-03 20:03:17 +09002600 ata_for_each_dev(dev, link, ALL) {
Tejun Heof0465192008-05-19 01:15:08 +09002601 /* convert all ATA_DEV_UNKNOWN to ATA_DEV_NONE */
Tejun Heob1c72912008-07-31 17:02:43 +09002602 if (classes[dev->devno] == ATA_DEV_UNKNOWN) {
Tejun Heof0465192008-05-19 01:15:08 +09002603 classes[dev->devno] = ATA_DEV_NONE;
Tejun Heob1c72912008-07-31 17:02:43 +09002604 if (ata_phys_link_online(ata_dev_phys_link(dev)))
2605 nr_unknown++;
2606 }
Tejun Heof0465192008-05-19 01:15:08 +09002607 }
2608
Tejun Heob1c72912008-07-31 17:02:43 +09002609 if (classify && nr_unknown) {
Tejun Heof0465192008-05-19 01:15:08 +09002610 if (try < max_tries) {
2611 ata_link_printk(link, KERN_WARNING, "link online but "
2612 "device misclassified, retrying\n");
Tejun Heob1c72912008-07-31 17:02:43 +09002613 failed_link = link;
Tejun Heof0465192008-05-19 01:15:08 +09002614 rc = -EAGAIN;
2615 goto fail;
2616 }
2617 ata_link_printk(link, KERN_WARNING,
2618 "link online but device misclassified, "
2619 "device detection might fail\n");
2620 }
2621
Tejun Heo416dc9e2007-10-31 10:17:03 +09002622 /* reset successful, schedule revalidation */
Tejun Heocf480622008-01-24 00:05:14 +09002623 ata_eh_done(link, NULL, ATA_EH_RESET);
Tejun Heob1c72912008-07-31 17:02:43 +09002624 if (slave)
2625 ata_eh_done(slave, NULL, ATA_EH_RESET);
Tejun Heo19b72322008-11-04 17:08:40 +09002626 ehc->last_reset = jiffies; /* update to completion time */
Tejun Heo416dc9e2007-10-31 10:17:03 +09002627 ehc->i.action |= ATA_EH_REVALIDATE;
Tejun Heoae791c02007-09-23 13:14:12 +09002628
Tejun Heo416dc9e2007-10-31 10:17:03 +09002629 rc = 0;
Tejun Heofccb6ea2007-07-16 14:29:41 +09002630 out:
2631 /* clear hotplug flag */
2632 ehc->i.flags &= ~ATA_EHI_HOTPLUGGED;
Tejun Heob1c72912008-07-31 17:02:43 +09002633 if (slave)
2634 sehc->i.flags &= ~ATA_EHI_HOTPLUGGED;
Tejun Heoafaa5c32007-10-09 15:06:10 +09002635
2636 spin_lock_irqsave(ap->lock, flags);
2637 ap->pflags &= ~ATA_PFLAG_RESETTING;
2638 spin_unlock_irqrestore(ap->lock, flags);
2639
Tejun Heo022bdb02006-05-15 20:58:22 +09002640 return rc;
Tejun Heo416dc9e2007-10-31 10:17:03 +09002641
2642 fail:
Tejun Heo5958e302008-04-07 22:47:20 +09002643 /* if SCR isn't accessible on a fan-out port, PMP needs to be reset */
2644 if (!ata_is_host_link(link) &&
2645 sata_scr_read(link, SCR_STATUS, &sstatus))
2646 rc = -ERESTART;
2647
Tejun Heo416dc9e2007-10-31 10:17:03 +09002648 if (rc == -ERESTART || try >= max_tries)
2649 goto out;
2650
2651 now = jiffies;
2652 if (time_before(now, deadline)) {
2653 unsigned long delta = deadline - now;
2654
Tejun Heob1c72912008-07-31 17:02:43 +09002655 ata_link_printk(failed_link, KERN_WARNING,
Tejun Heo0a2c0f52008-05-20 02:17:52 +09002656 "reset failed (errno=%d), retrying in %u secs\n",
2657 rc, DIV_ROUND_UP(jiffies_to_msecs(delta), 1000));
Tejun Heo416dc9e2007-10-31 10:17:03 +09002658
2659 while (delta)
2660 delta = schedule_timeout_uninterruptible(delta);
2661 }
2662
Tejun Heob1c72912008-07-31 17:02:43 +09002663 if (try == max_tries - 1) {
Tejun Heoa07d4992009-01-29 20:31:33 +09002664 sata_down_spd_limit(link, 0);
Tejun Heob1c72912008-07-31 17:02:43 +09002665 if (slave)
Tejun Heoa07d4992009-01-29 20:31:33 +09002666 sata_down_spd_limit(slave, 0);
Tejun Heob1c72912008-07-31 17:02:43 +09002667 } else if (rc == -EPIPE)
Tejun Heoa07d4992009-01-29 20:31:33 +09002668 sata_down_spd_limit(failed_link, 0);
Tejun Heob1c72912008-07-31 17:02:43 +09002669
Tejun Heo416dc9e2007-10-31 10:17:03 +09002670 if (hardreset)
2671 reset = hardreset;
2672 goto retry;
Tejun Heo022bdb02006-05-15 20:58:22 +09002673}
2674
Elias Oltmanns45fabbb2008-09-21 11:54:08 +02002675static inline void ata_eh_pull_park_action(struct ata_port *ap)
2676{
2677 struct ata_link *link;
2678 struct ata_device *dev;
2679 unsigned long flags;
2680
2681 /*
2682 * This function can be thought of as an extended version of
2683 * ata_eh_about_to_do() specially crafted to accommodate the
2684 * requirements of ATA_EH_PARK handling. Since the EH thread
2685 * does not leave the do {} while () loop in ata_eh_recover as
2686 * long as the timeout for a park request to *one* device on
2687 * the port has not expired, and since we still want to pick
2688 * up park requests to other devices on the same port or
2689 * timeout updates for the same device, we have to pull
2690 * ATA_EH_PARK actions from eh_info into eh_context.i
2691 * ourselves at the beginning of each pass over the loop.
2692 *
2693 * Additionally, all write accesses to &ap->park_req_pending
2694 * through INIT_COMPLETION() (see below) or complete_all()
2695 * (see ata_scsi_park_store()) are protected by the host lock.
2696 * As a result we have that park_req_pending.done is zero on
2697 * exit from this function, i.e. when ATA_EH_PARK actions for
2698 * *all* devices on port ap have been pulled into the
2699 * respective eh_context structs. If, and only if,
2700 * park_req_pending.done is non-zero by the time we reach
2701 * wait_for_completion_timeout(), another ATA_EH_PARK action
2702 * has been scheduled for at least one of the devices on port
2703 * ap and we have to cycle over the do {} while () loop in
2704 * ata_eh_recover() again.
2705 */
2706
2707 spin_lock_irqsave(ap->lock, flags);
2708 INIT_COMPLETION(ap->park_req_pending);
Tejun Heo1eca4362008-11-03 20:03:17 +09002709 ata_for_each_link(link, ap, EDGE) {
2710 ata_for_each_dev(dev, link, ALL) {
Elias Oltmanns45fabbb2008-09-21 11:54:08 +02002711 struct ata_eh_info *ehi = &link->eh_info;
2712
2713 link->eh_context.i.dev_action[dev->devno] |=
2714 ehi->dev_action[dev->devno] & ATA_EH_PARK;
2715 ata_eh_clear_action(link, dev, ehi, ATA_EH_PARK);
2716 }
2717 }
2718 spin_unlock_irqrestore(ap->lock, flags);
2719}
2720
2721static void ata_eh_park_issue_cmd(struct ata_device *dev, int park)
2722{
2723 struct ata_eh_context *ehc = &dev->link->eh_context;
2724 struct ata_taskfile tf;
2725 unsigned int err_mask;
2726
2727 ata_tf_init(dev, &tf);
2728 if (park) {
2729 ehc->unloaded_mask |= 1 << dev->devno;
2730 tf.command = ATA_CMD_IDLEIMMEDIATE;
2731 tf.feature = 0x44;
2732 tf.lbal = 0x4c;
2733 tf.lbam = 0x4e;
2734 tf.lbah = 0x55;
2735 } else {
2736 ehc->unloaded_mask &= ~(1 << dev->devno);
2737 tf.command = ATA_CMD_CHK_POWER;
2738 }
2739
2740 tf.flags |= ATA_TFLAG_DEVICE | ATA_TFLAG_ISADDR;
2741 tf.protocol |= ATA_PROT_NODATA;
2742 err_mask = ata_exec_internal(dev, &tf, NULL, DMA_NONE, NULL, 0, 0);
2743 if (park && (err_mask || tf.lbal != 0xc4)) {
2744 ata_dev_printk(dev, KERN_ERR, "head unload failed!\n");
2745 ehc->unloaded_mask &= ~(1 << dev->devno);
2746 }
2747}
2748
Tejun Heo02607312007-08-06 18:36:23 +09002749static int ata_eh_revalidate_and_attach(struct ata_link *link,
Tejun Heo084fe632006-05-31 18:28:03 +09002750 struct ata_device **r_failed_dev)
Tejun Heo022bdb02006-05-15 20:58:22 +09002751{
Tejun Heo02607312007-08-06 18:36:23 +09002752 struct ata_port *ap = link->ap;
2753 struct ata_eh_context *ehc = &link->eh_context;
Tejun Heo022bdb02006-05-15 20:58:22 +09002754 struct ata_device *dev;
Tejun Heo8c3c52a2007-03-22 22:24:19 +09002755 unsigned int new_mask = 0;
Tejun Heo084fe632006-05-31 18:28:03 +09002756 unsigned long flags;
Tejun Heof58229f2007-08-06 18:36:23 +09002757 int rc = 0;
Tejun Heo022bdb02006-05-15 20:58:22 +09002758
2759 DPRINTK("ENTER\n");
2760
Tejun Heo8c3c52a2007-03-22 22:24:19 +09002761 /* For PATA drive side cable detection to work, IDENTIFY must
2762 * be done backwards such that PDIAG- is released by the slave
2763 * device before the master device is identified.
2764 */
Tejun Heo1eca4362008-11-03 20:03:17 +09002765 ata_for_each_dev(dev, link, ALL_REVERSE) {
Tejun Heof58229f2007-08-06 18:36:23 +09002766 unsigned int action = ata_eh_dev_action(dev);
2767 unsigned int readid_flags = 0;
Tejun Heo47005f22006-06-19 18:27:23 +09002768
Tejun Heobff04642006-11-10 18:08:10 +09002769 if (ehc->i.flags & ATA_EHI_DID_RESET)
2770 readid_flags |= ATA_READID_POSTRESET;
2771
Tejun Heo9666f402007-05-04 21:27:47 +02002772 if ((action & ATA_EH_REVALIDATE) && ata_dev_enabled(dev)) {
Tejun Heo633273a2007-09-23 13:19:54 +09002773 WARN_ON(dev->class == ATA_DEV_PMP);
2774
Tejun Heob1c72912008-07-31 17:02:43 +09002775 if (ata_phys_link_offline(ata_dev_phys_link(dev))) {
Tejun Heo022bdb02006-05-15 20:58:22 +09002776 rc = -EIO;
Tejun Heo8c3c52a2007-03-22 22:24:19 +09002777 goto err;
Tejun Heo022bdb02006-05-15 20:58:22 +09002778 }
2779
Tejun Heo02607312007-08-06 18:36:23 +09002780 ata_eh_about_to_do(link, dev, ATA_EH_REVALIDATE);
Tejun Heo422c9da2007-09-23 13:14:12 +09002781 rc = ata_dev_revalidate(dev, ehc->classes[dev->devno],
2782 readid_flags);
Tejun Heo022bdb02006-05-15 20:58:22 +09002783 if (rc)
Tejun Heo8c3c52a2007-03-22 22:24:19 +09002784 goto err;
Tejun Heo022bdb02006-05-15 20:58:22 +09002785
Tejun Heo02607312007-08-06 18:36:23 +09002786 ata_eh_done(link, dev, ATA_EH_REVALIDATE);
Tejun Heo47005f22006-06-19 18:27:23 +09002787
Tejun Heobaa1e782006-11-01 18:39:27 +09002788 /* Configuration may have changed, reconfigure
2789 * transfer mode.
2790 */
2791 ehc->i.flags |= ATA_EHI_SETMODE;
2792
zhao, forrest3057ac32006-06-12 12:01:34 +08002793 /* schedule the scsi_rescan_device() here */
2794 queue_work(ata_aux_wq, &(ap->scsi_rescan_task));
Tejun Heo084fe632006-05-31 18:28:03 +09002795 } else if (dev->class == ATA_DEV_UNKNOWN &&
2796 ehc->tries[dev->devno] &&
2797 ata_class_enabled(ehc->classes[dev->devno])) {
Tejun Heo842faa62009-05-10 01:06:54 +09002798 /* Temporarily set dev->class, it will be
2799 * permanently set once all configurations are
2800 * complete. This is necessary because new
2801 * device configuration is done in two
2802 * separate loops.
2803 */
Tejun Heo084fe632006-05-31 18:28:03 +09002804 dev->class = ehc->classes[dev->devno];
2805
Tejun Heo633273a2007-09-23 13:19:54 +09002806 if (dev->class == ATA_DEV_PMP)
2807 rc = sata_pmp_attach(dev);
2808 else
2809 rc = ata_dev_read_id(dev, &dev->class,
2810 readid_flags, dev->id);
Tejun Heo842faa62009-05-10 01:06:54 +09002811
2812 /* read_id might have changed class, store and reset */
2813 ehc->classes[dev->devno] = dev->class;
2814 dev->class = ATA_DEV_UNKNOWN;
2815
Tejun Heo8c3c52a2007-03-22 22:24:19 +09002816 switch (rc) {
2817 case 0:
Tejun Heo99cf6102009-01-29 20:31:32 +09002818 /* clear error info accumulated during probe */
2819 ata_ering_clear(&dev->ering);
Tejun Heof58229f2007-08-06 18:36:23 +09002820 new_mask |= 1 << dev->devno;
Tejun Heo8c3c52a2007-03-22 22:24:19 +09002821 break;
2822 case -ENOENT:
Tejun Heo55a8e2c2006-11-10 18:08:10 +09002823 /* IDENTIFY was issued to non-existent
2824 * device. No need to reset. Just
Tejun Heo842faa62009-05-10 01:06:54 +09002825 * thaw and ignore the device.
Tejun Heo55a8e2c2006-11-10 18:08:10 +09002826 */
2827 ata_eh_thaw_port(ap);
Tejun Heo084fe632006-05-31 18:28:03 +09002828 break;
Tejun Heo8c3c52a2007-03-22 22:24:19 +09002829 default:
Tejun Heo8c3c52a2007-03-22 22:24:19 +09002830 goto err;
Tejun Heo55a8e2c2006-11-10 18:08:10 +09002831 }
Tejun Heo022bdb02006-05-15 20:58:22 +09002832 }
2833 }
2834
Tejun Heoc1c4e8d2007-04-23 02:05:53 +09002835 /* PDIAG- should have been released, ask cable type if post-reset */
Tejun Heo33267322008-02-13 09:15:09 +09002836 if ((ehc->i.flags & ATA_EHI_DID_RESET) && ata_is_host_link(link)) {
2837 if (ap->ops->cable_detect)
2838 ap->cbl = ap->ops->cable_detect(ap);
2839 ata_force_cbl(ap);
2840 }
Tejun Heoc1c4e8d2007-04-23 02:05:53 +09002841
Tejun Heo8c3c52a2007-03-22 22:24:19 +09002842 /* Configure new devices forward such that user doesn't see
2843 * device detection messages backwards.
2844 */
Tejun Heo1eca4362008-11-03 20:03:17 +09002845 ata_for_each_dev(dev, link, ALL) {
Tejun Heo633273a2007-09-23 13:19:54 +09002846 if (!(new_mask & (1 << dev->devno)) ||
2847 dev->class == ATA_DEV_PMP)
Tejun Heo8c3c52a2007-03-22 22:24:19 +09002848 continue;
2849
Tejun Heo842faa62009-05-10 01:06:54 +09002850 dev->class = ehc->classes[dev->devno];
2851
Tejun Heo8c3c52a2007-03-22 22:24:19 +09002852 ehc->i.flags |= ATA_EHI_PRINTINFO;
2853 rc = ata_dev_configure(dev);
2854 ehc->i.flags &= ~ATA_EHI_PRINTINFO;
Tejun Heo842faa62009-05-10 01:06:54 +09002855 if (rc) {
2856 dev->class = ATA_DEV_UNKNOWN;
Tejun Heo8c3c52a2007-03-22 22:24:19 +09002857 goto err;
Tejun Heo842faa62009-05-10 01:06:54 +09002858 }
Tejun Heo8c3c52a2007-03-22 22:24:19 +09002859
2860 spin_lock_irqsave(ap->lock, flags);
2861 ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG;
2862 spin_unlock_irqrestore(ap->lock, flags);
2863
2864 /* new device discovered, configure xfermode */
2865 ehc->i.flags |= ATA_EHI_SETMODE;
2866 }
2867
2868 return 0;
2869
2870 err:
2871 *r_failed_dev = dev;
2872 DPRINTK("EXIT rc=%d\n", rc);
Tejun Heo022bdb02006-05-15 20:58:22 +09002873 return rc;
2874}
2875
Tejun Heo6f1d1e32007-11-27 19:28:55 +09002876/**
2877 * ata_set_mode - Program timings and issue SET FEATURES - XFER
2878 * @link: link on which timings will be programmed
Martin Olsson98a17082009-04-22 18:21:29 +02002879 * @r_failed_dev: out parameter for failed device
Tejun Heo6f1d1e32007-11-27 19:28:55 +09002880 *
2881 * Set ATA device disk transfer mode (PIO3, UDMA6, etc.). If
2882 * ata_set_mode() fails, pointer to the failing device is
2883 * returned in @r_failed_dev.
2884 *
2885 * LOCKING:
2886 * PCI/etc. bus probe sem.
2887 *
2888 * RETURNS:
2889 * 0 on success, negative errno otherwise
2890 */
2891int ata_set_mode(struct ata_link *link, struct ata_device **r_failed_dev)
2892{
2893 struct ata_port *ap = link->ap;
Tejun Heo00115e02007-11-27 19:28:58 +09002894 struct ata_device *dev;
2895 int rc;
Tejun Heo6f1d1e32007-11-27 19:28:55 +09002896
Tejun Heo76326ac2007-11-27 19:28:59 +09002897 /* if data transfer is verified, clear DUBIOUS_XFER on ering top */
Tejun Heo1eca4362008-11-03 20:03:17 +09002898 ata_for_each_dev(dev, link, ENABLED) {
Tejun Heo76326ac2007-11-27 19:28:59 +09002899 if (!(dev->flags & ATA_DFLAG_DUBIOUS_XFER)) {
2900 struct ata_ering_entry *ent;
2901
2902 ent = ata_ering_top(&dev->ering);
2903 if (ent)
2904 ent->eflags &= ~ATA_EFLAG_DUBIOUS_XFER;
2905 }
2906 }
2907
Tejun Heo6f1d1e32007-11-27 19:28:55 +09002908 /* has private set_mode? */
2909 if (ap->ops->set_mode)
Tejun Heo00115e02007-11-27 19:28:58 +09002910 rc = ap->ops->set_mode(link, r_failed_dev);
2911 else
2912 rc = ata_do_set_mode(link, r_failed_dev);
2913
2914 /* if transfer mode has changed, set DUBIOUS_XFER on device */
Tejun Heo1eca4362008-11-03 20:03:17 +09002915 ata_for_each_dev(dev, link, ENABLED) {
Tejun Heo00115e02007-11-27 19:28:58 +09002916 struct ata_eh_context *ehc = &link->eh_context;
2917 u8 saved_xfer_mode = ehc->saved_xfer_mode[dev->devno];
2918 u8 saved_ncq = !!(ehc->saved_ncq_enabled & (1 << dev->devno));
2919
2920 if (dev->xfer_mode != saved_xfer_mode ||
2921 ata_ncq_enabled(dev) != saved_ncq)
2922 dev->flags |= ATA_DFLAG_DUBIOUS_XFER;
2923 }
2924
2925 return rc;
Tejun Heo6f1d1e32007-11-27 19:28:55 +09002926}
2927
Tejun Heo11fc33d2008-08-30 14:20:01 +02002928/**
2929 * atapi_eh_clear_ua - Clear ATAPI UNIT ATTENTION after reset
2930 * @dev: ATAPI device to clear UA for
2931 *
2932 * Resets and other operations can make an ATAPI device raise
2933 * UNIT ATTENTION which causes the next operation to fail. This
2934 * function clears UA.
2935 *
2936 * LOCKING:
2937 * EH context (may sleep).
2938 *
2939 * RETURNS:
2940 * 0 on success, -errno on failure.
2941 */
2942static int atapi_eh_clear_ua(struct ata_device *dev)
2943{
2944 int i;
2945
2946 for (i = 0; i < ATA_EH_UA_TRIES; i++) {
Tejun Heob5357082009-03-02 18:55:16 +09002947 u8 *sense_buffer = dev->link->ap->sector_buf;
Tejun Heo11fc33d2008-08-30 14:20:01 +02002948 u8 sense_key = 0;
2949 unsigned int err_mask;
2950
2951 err_mask = atapi_eh_tur(dev, &sense_key);
2952 if (err_mask != 0 && err_mask != AC_ERR_DEV) {
2953 ata_dev_printk(dev, KERN_WARNING, "TEST_UNIT_READY "
2954 "failed (err_mask=0x%x)\n", err_mask);
2955 return -EIO;
2956 }
2957
2958 if (!err_mask || sense_key != UNIT_ATTENTION)
2959 return 0;
2960
2961 err_mask = atapi_eh_request_sense(dev, sense_buffer, sense_key);
2962 if (err_mask) {
2963 ata_dev_printk(dev, KERN_WARNING, "failed to clear "
2964 "UNIT ATTENTION (err_mask=0x%x)\n", err_mask);
2965 return -EIO;
2966 }
2967 }
2968
2969 ata_dev_printk(dev, KERN_WARNING,
2970 "UNIT ATTENTION persists after %d tries\n", ATA_EH_UA_TRIES);
2971
2972 return 0;
2973}
2974
Tejun Heo02607312007-08-06 18:36:23 +09002975static int ata_link_nr_enabled(struct ata_link *link)
Tejun Heo022bdb02006-05-15 20:58:22 +09002976{
Tejun Heof58229f2007-08-06 18:36:23 +09002977 struct ata_device *dev;
2978 int cnt = 0;
Tejun Heo022bdb02006-05-15 20:58:22 +09002979
Tejun Heo1eca4362008-11-03 20:03:17 +09002980 ata_for_each_dev(dev, link, ENABLED)
2981 cnt++;
Tejun Heo022bdb02006-05-15 20:58:22 +09002982 return cnt;
2983}
2984
Tejun Heo02607312007-08-06 18:36:23 +09002985static int ata_link_nr_vacant(struct ata_link *link)
Tejun Heo084fe632006-05-31 18:28:03 +09002986{
Tejun Heof58229f2007-08-06 18:36:23 +09002987 struct ata_device *dev;
2988 int cnt = 0;
Tejun Heo084fe632006-05-31 18:28:03 +09002989
Tejun Heo1eca4362008-11-03 20:03:17 +09002990 ata_for_each_dev(dev, link, ALL)
Tejun Heof58229f2007-08-06 18:36:23 +09002991 if (dev->class == ATA_DEV_UNKNOWN)
Tejun Heo084fe632006-05-31 18:28:03 +09002992 cnt++;
2993 return cnt;
2994}
2995
Tejun Heo02607312007-08-06 18:36:23 +09002996static int ata_eh_skip_recovery(struct ata_link *link)
Tejun Heo084fe632006-05-31 18:28:03 +09002997{
Tejun Heo672b2d62008-01-24 00:05:14 +09002998 struct ata_port *ap = link->ap;
Tejun Heo02607312007-08-06 18:36:23 +09002999 struct ata_eh_context *ehc = &link->eh_context;
Tejun Heof58229f2007-08-06 18:36:23 +09003000 struct ata_device *dev;
Tejun Heo084fe632006-05-31 18:28:03 +09003001
Tejun Heof9df58c2007-09-23 13:14:13 +09003002 /* skip disabled links */
3003 if (link->flags & ATA_LFLAG_DISABLED)
3004 return 1;
3005
Tejun Heo672b2d62008-01-24 00:05:14 +09003006 /* thaw frozen port and recover failed devices */
3007 if ((ap->pflags & ATA_PFLAG_FROZEN) || ata_link_nr_enabled(link))
3008 return 0;
3009
3010 /* reset at least once if reset is requested */
3011 if ((ehc->i.action & ATA_EH_RESET) &&
3012 !(ehc->i.flags & ATA_EHI_DID_RESET))
Tejun Heo084fe632006-05-31 18:28:03 +09003013 return 0;
3014
3015 /* skip if class codes for all vacant slots are ATA_DEV_NONE */
Tejun Heo1eca4362008-11-03 20:03:17 +09003016 ata_for_each_dev(dev, link, ALL) {
Tejun Heo084fe632006-05-31 18:28:03 +09003017 if (dev->class == ATA_DEV_UNKNOWN &&
3018 ehc->classes[dev->devno] != ATA_DEV_NONE)
3019 return 0;
3020 }
3021
3022 return 1;
3023}
3024
Tejun Heoc2c7a892009-01-29 20:31:34 +09003025static int ata_count_probe_trials_cb(struct ata_ering_entry *ent, void *void_arg)
3026{
3027 u64 interval = msecs_to_jiffies(ATA_EH_PROBE_TRIAL_INTERVAL);
3028 u64 now = get_jiffies_64();
3029 int *trials = void_arg;
3030
3031 if (ent->timestamp < now - min(now, interval))
3032 return -1;
3033
3034 (*trials)++;
3035 return 0;
3036}
3037
Tejun Heo02c05a22007-11-27 19:28:54 +09003038static int ata_eh_schedule_probe(struct ata_device *dev)
3039{
3040 struct ata_eh_context *ehc = &dev->link->eh_context;
Tejun Heoc2c7a892009-01-29 20:31:34 +09003041 struct ata_link *link = ata_dev_phys_link(dev);
3042 int trials = 0;
Tejun Heo02c05a22007-11-27 19:28:54 +09003043
3044 if (!(ehc->i.probe_mask & (1 << dev->devno)) ||
3045 (ehc->did_probe_mask & (1 << dev->devno)))
3046 return 0;
3047
3048 ata_eh_detach_dev(dev);
3049 ata_dev_init(dev);
3050 ehc->did_probe_mask |= (1 << dev->devno);
Tejun Heocf480622008-01-24 00:05:14 +09003051 ehc->i.action |= ATA_EH_RESET;
Tejun Heo00115e02007-11-27 19:28:58 +09003052 ehc->saved_xfer_mode[dev->devno] = 0;
3053 ehc->saved_ncq_enabled &= ~(1 << dev->devno);
Tejun Heo02c05a22007-11-27 19:28:54 +09003054
Tejun Heoc2c7a892009-01-29 20:31:34 +09003055 /* Record and count probe trials on the ering. The specific
3056 * error mask used is irrelevant. Because a successful device
3057 * detection clears the ering, this count accumulates only if
3058 * there are consecutive failed probes.
3059 *
3060 * If the count is equal to or higher than ATA_EH_PROBE_TRIALS
3061 * in the last ATA_EH_PROBE_TRIAL_INTERVAL, link speed is
3062 * forced to 1.5Gbps.
3063 *
3064 * This is to work around cases where failed link speed
3065 * negotiation results in device misdetection leading to
3066 * infinite DEVXCHG or PHRDY CHG events.
3067 */
3068 ata_ering_record(&dev->ering, 0, AC_ERR_OTHER);
3069 ata_ering_map(&dev->ering, ata_count_probe_trials_cb, &trials);
3070
3071 if (trials > ATA_EH_PROBE_TRIALS)
3072 sata_down_spd_limit(link, 1);
3073
Tejun Heo02c05a22007-11-27 19:28:54 +09003074 return 1;
3075}
3076
Tejun Heo9b1e2652007-08-06 18:36:24 +09003077static int ata_eh_handle_dev_fail(struct ata_device *dev, int err)
Tejun Heofee7ca72007-07-01 19:05:58 +09003078{
Tejun Heo9af5c9c2007-08-06 18:36:22 +09003079 struct ata_eh_context *ehc = &dev->link->eh_context;
Tejun Heofee7ca72007-07-01 19:05:58 +09003080
Tejun Heocf9a5902009-01-29 20:31:35 +09003081 /* -EAGAIN from EH routine indicates retry without prejudice.
3082 * The requester is responsible for ensuring forward progress.
3083 */
3084 if (err != -EAGAIN)
3085 ehc->tries[dev->devno]--;
Tejun Heofee7ca72007-07-01 19:05:58 +09003086
3087 switch (err) {
3088 case -ENODEV:
3089 /* device missing or wrong IDENTIFY data, schedule probing */
3090 ehc->i.probe_mask |= (1 << dev->devno);
3091 case -EINVAL:
3092 /* give it just one more chance */
3093 ehc->tries[dev->devno] = min(ehc->tries[dev->devno], 1);
3094 case -EIO:
Tejun Heod89293a2009-01-29 20:31:29 +09003095 if (ehc->tries[dev->devno] == 1) {
Tejun Heofee7ca72007-07-01 19:05:58 +09003096 /* This is the last chance, better to slow
3097 * down than lose it.
3098 */
Tejun Heoa07d4992009-01-29 20:31:33 +09003099 sata_down_spd_limit(ata_dev_phys_link(dev), 0);
Tejun Heod89293a2009-01-29 20:31:29 +09003100 if (dev->pio_mode > XFER_PIO_0)
3101 ata_down_xfermask_limit(dev, ATA_DNXFER_PIO);
Tejun Heofee7ca72007-07-01 19:05:58 +09003102 }
3103 }
3104
3105 if (ata_dev_enabled(dev) && !ehc->tries[dev->devno]) {
3106 /* disable device if it has used up all its chances */
3107 ata_dev_disable(dev);
3108
3109 /* detach if offline */
Tejun Heob1c72912008-07-31 17:02:43 +09003110 if (ata_phys_link_offline(ata_dev_phys_link(dev)))
Tejun Heofee7ca72007-07-01 19:05:58 +09003111 ata_eh_detach_dev(dev);
3112
Tejun Heo02c05a22007-11-27 19:28:54 +09003113 /* schedule probe if necessary */
Tejun Heo87fbc5a2008-05-20 02:17:54 +09003114 if (ata_eh_schedule_probe(dev)) {
Tejun Heofee7ca72007-07-01 19:05:58 +09003115 ehc->tries[dev->devno] = ATA_EH_DEV_TRIES;
Tejun Heo87fbc5a2008-05-20 02:17:54 +09003116 memset(ehc->cmd_timeout_idx[dev->devno], 0,
3117 sizeof(ehc->cmd_timeout_idx[dev->devno]));
3118 }
Tejun Heo9b1e2652007-08-06 18:36:24 +09003119
3120 return 1;
Tejun Heofee7ca72007-07-01 19:05:58 +09003121 } else {
Tejun Heocf480622008-01-24 00:05:14 +09003122 ehc->i.action |= ATA_EH_RESET;
Tejun Heo9b1e2652007-08-06 18:36:24 +09003123 return 0;
Tejun Heofee7ca72007-07-01 19:05:58 +09003124 }
3125}
3126
Tejun Heo022bdb02006-05-15 20:58:22 +09003127/**
3128 * ata_eh_recover - recover host port after error
3129 * @ap: host port to recover
Tejun Heof5914a42006-05-31 18:27:48 +09003130 * @prereset: prereset method (can be NULL)
Tejun Heo022bdb02006-05-15 20:58:22 +09003131 * @softreset: softreset method (can be NULL)
3132 * @hardreset: hardreset method (can be NULL)
3133 * @postreset: postreset method (can be NULL)
Tejun Heo9b1e2652007-08-06 18:36:24 +09003134 * @r_failed_link: out parameter for failed link
Tejun Heo022bdb02006-05-15 20:58:22 +09003135 *
3136 * This is the alpha and omega, eum and yang, heart and soul of
3137 * libata exception handling. On entry, actions required to
Tejun Heo9b1e2652007-08-06 18:36:24 +09003138 * recover each link and hotplug requests are recorded in the
3139 * link's eh_context. This function executes all the operations
3140 * with appropriate retrials and fallbacks to resurrect failed
Tejun Heo084fe632006-05-31 18:28:03 +09003141 * devices, detach goners and greet newcomers.
Tejun Heo022bdb02006-05-15 20:58:22 +09003142 *
3143 * LOCKING:
3144 * Kernel thread context (may sleep).
3145 *
3146 * RETURNS:
3147 * 0 on success, -errno on failure.
3148 */
Tejun Heofb7fd612007-09-23 13:14:12 +09003149int ata_eh_recover(struct ata_port *ap, ata_prereset_fn_t prereset,
3150 ata_reset_fn_t softreset, ata_reset_fn_t hardreset,
3151 ata_postreset_fn_t postreset,
3152 struct ata_link **r_failed_link)
Tejun Heo022bdb02006-05-15 20:58:22 +09003153{
Tejun Heo9b1e2652007-08-06 18:36:24 +09003154 struct ata_link *link;
Tejun Heo022bdb02006-05-15 20:58:22 +09003155 struct ata_device *dev;
Tejun Heo0a2c0f52008-05-20 02:17:52 +09003156 int nr_failed_devs;
Tejun Heodc98c322008-05-19 01:15:07 +09003157 int rc;
Elias Oltmanns45fabbb2008-09-21 11:54:08 +02003158 unsigned long flags, deadline;
Tejun Heo022bdb02006-05-15 20:58:22 +09003159
3160 DPRINTK("ENTER\n");
3161
3162 /* prep for recovery */
Tejun Heo1eca4362008-11-03 20:03:17 +09003163 ata_for_each_link(link, ap, EDGE) {
Tejun Heo9b1e2652007-08-06 18:36:24 +09003164 struct ata_eh_context *ehc = &link->eh_context;
Tejun Heo084fe632006-05-31 18:28:03 +09003165
Tejun Heof9df58c2007-09-23 13:14:13 +09003166 /* re-enable link? */
3167 if (ehc->i.action & ATA_EH_ENABLE_LINK) {
3168 ata_eh_about_to_do(link, NULL, ATA_EH_ENABLE_LINK);
3169 spin_lock_irqsave(ap->lock, flags);
3170 link->flags &= ~ATA_LFLAG_DISABLED;
3171 spin_unlock_irqrestore(ap->lock, flags);
3172 ata_eh_done(link, NULL, ATA_EH_ENABLE_LINK);
3173 }
3174
Tejun Heo1eca4362008-11-03 20:03:17 +09003175 ata_for_each_dev(dev, link, ALL) {
Tejun Heofd995f72007-09-23 13:14:12 +09003176 if (link->flags & ATA_LFLAG_NO_RETRY)
3177 ehc->tries[dev->devno] = 1;
3178 else
3179 ehc->tries[dev->devno] = ATA_EH_DEV_TRIES;
Tejun Heo79a55b72007-01-18 17:22:18 +09003180
Tejun Heo9b1e2652007-08-06 18:36:24 +09003181 /* collect port action mask recorded in dev actions */
3182 ehc->i.action |= ehc->i.dev_action[dev->devno] &
3183 ~ATA_EH_PERDEV_MASK;
3184 ehc->i.dev_action[dev->devno] &= ATA_EH_PERDEV_MASK;
Tejun Heo084fe632006-05-31 18:28:03 +09003185
Tejun Heo9b1e2652007-08-06 18:36:24 +09003186 /* process hotplug request */
3187 if (dev->flags & ATA_DFLAG_DETACH)
3188 ata_eh_detach_dev(dev);
3189
Tejun Heo02c05a22007-11-27 19:28:54 +09003190 /* schedule probe if necessary */
3191 if (!ata_dev_enabled(dev))
3192 ata_eh_schedule_probe(dev);
Tejun Heo084fe632006-05-31 18:28:03 +09003193 }
Tejun Heo022bdb02006-05-15 20:58:22 +09003194 }
3195
3196 retry:
Tejun Heo022bdb02006-05-15 20:58:22 +09003197 rc = 0;
Tejun Heo9b1e2652007-08-06 18:36:24 +09003198 nr_failed_devs = 0;
Tejun Heo022bdb02006-05-15 20:58:22 +09003199
Tejun Heoaeb2ecd2006-06-12 14:11:43 +09003200 /* if UNLOADING, finish immediately */
Tejun Heob51e9e52006-06-29 01:29:30 +09003201 if (ap->pflags & ATA_PFLAG_UNLOADING)
Tejun Heoaeb2ecd2006-06-12 14:11:43 +09003202 goto out;
3203
Tejun Heo9b1e2652007-08-06 18:36:24 +09003204 /* prep for EH */
Tejun Heo1eca4362008-11-03 20:03:17 +09003205 ata_for_each_link(link, ap, EDGE) {
Tejun Heo9b1e2652007-08-06 18:36:24 +09003206 struct ata_eh_context *ehc = &link->eh_context;
Tejun Heo022bdb02006-05-15 20:58:22 +09003207
Tejun Heo9b1e2652007-08-06 18:36:24 +09003208 /* skip EH if possible. */
3209 if (ata_eh_skip_recovery(link))
3210 ehc->i.action = 0;
3211
Tejun Heo1eca4362008-11-03 20:03:17 +09003212 ata_for_each_dev(dev, link, ALL)
Tejun Heo9b1e2652007-08-06 18:36:24 +09003213 ehc->classes[dev->devno] = ATA_DEV_UNKNOWN;
3214 }
Tejun Heo084fe632006-05-31 18:28:03 +09003215
Tejun Heo022bdb02006-05-15 20:58:22 +09003216 /* reset */
Tejun Heo1eca4362008-11-03 20:03:17 +09003217 ata_for_each_link(link, ap, EDGE) {
Tejun Heodc98c322008-05-19 01:15:07 +09003218 struct ata_eh_context *ehc = &link->eh_context;
Tejun Heo022bdb02006-05-15 20:58:22 +09003219
Tejun Heodc98c322008-05-19 01:15:07 +09003220 if (!(ehc->i.action & ATA_EH_RESET))
3221 continue;
Tejun Heo9b1e2652007-08-06 18:36:24 +09003222
Tejun Heodc98c322008-05-19 01:15:07 +09003223 rc = ata_eh_reset(link, ata_link_nr_vacant(link),
3224 prereset, softreset, hardreset, postreset);
3225 if (rc) {
3226 ata_link_printk(link, KERN_ERR,
3227 "reset failed, giving up\n");
3228 goto out;
Tejun Heo022bdb02006-05-15 20:58:22 +09003229 }
Tejun Heo022bdb02006-05-15 20:58:22 +09003230 }
3231
Elias Oltmanns45fabbb2008-09-21 11:54:08 +02003232 do {
3233 unsigned long now;
3234
3235 /*
3236 * clears ATA_EH_PARK in eh_info and resets
3237 * ap->park_req_pending
3238 */
3239 ata_eh_pull_park_action(ap);
3240
3241 deadline = jiffies;
Tejun Heo1eca4362008-11-03 20:03:17 +09003242 ata_for_each_link(link, ap, EDGE) {
3243 ata_for_each_dev(dev, link, ALL) {
Elias Oltmanns45fabbb2008-09-21 11:54:08 +02003244 struct ata_eh_context *ehc = &link->eh_context;
3245 unsigned long tmp;
3246
3247 if (dev->class != ATA_DEV_ATA)
3248 continue;
3249 if (!(ehc->i.dev_action[dev->devno] &
3250 ATA_EH_PARK))
3251 continue;
3252 tmp = dev->unpark_deadline;
3253 if (time_before(deadline, tmp))
3254 deadline = tmp;
3255 else if (time_before_eq(tmp, jiffies))
3256 continue;
3257 if (ehc->unloaded_mask & (1 << dev->devno))
3258 continue;
3259
3260 ata_eh_park_issue_cmd(dev, 1);
3261 }
3262 }
3263
3264 now = jiffies;
3265 if (time_before_eq(deadline, now))
3266 break;
3267
3268 deadline = wait_for_completion_timeout(&ap->park_req_pending,
3269 deadline - now);
3270 } while (deadline);
Tejun Heo1eca4362008-11-03 20:03:17 +09003271 ata_for_each_link(link, ap, EDGE) {
3272 ata_for_each_dev(dev, link, ALL) {
Elias Oltmanns45fabbb2008-09-21 11:54:08 +02003273 if (!(link->eh_context.unloaded_mask &
3274 (1 << dev->devno)))
3275 continue;
3276
3277 ata_eh_park_issue_cmd(dev, 0);
3278 ata_eh_done(link, dev, ATA_EH_PARK);
3279 }
3280 }
3281
Tejun Heo9b1e2652007-08-06 18:36:24 +09003282 /* the rest */
Tejun Heo1eca4362008-11-03 20:03:17 +09003283 ata_for_each_link(link, ap, EDGE) {
Tejun Heo9b1e2652007-08-06 18:36:24 +09003284 struct ata_eh_context *ehc = &link->eh_context;
Tejun Heo022bdb02006-05-15 20:58:22 +09003285
Tejun Heo9b1e2652007-08-06 18:36:24 +09003286 /* revalidate existing devices and attach new ones */
3287 rc = ata_eh_revalidate_and_attach(link, &dev);
Tejun Heo4ae72a12007-02-02 16:22:30 +09003288 if (rc)
Tejun Heo022bdb02006-05-15 20:58:22 +09003289 goto dev_fail;
Tejun Heo9b1e2652007-08-06 18:36:24 +09003290
Tejun Heo633273a2007-09-23 13:19:54 +09003291 /* if PMP got attached, return, pmp EH will take care of it */
3292 if (link->device->class == ATA_DEV_PMP) {
3293 ehc->i.action = 0;
3294 return 0;
3295 }
3296
Tejun Heo9b1e2652007-08-06 18:36:24 +09003297 /* configure transfer mode if necessary */
3298 if (ehc->i.flags & ATA_EHI_SETMODE) {
3299 rc = ata_set_mode(link, &dev);
3300 if (rc)
3301 goto dev_fail;
3302 ehc->i.flags &= ~ATA_EHI_SETMODE;
3303 }
3304
Tejun Heo11fc33d2008-08-30 14:20:01 +02003305 /* If reset has been issued, clear UA to avoid
3306 * disrupting the current users of the device.
3307 */
3308 if (ehc->i.flags & ATA_EHI_DID_RESET) {
Tejun Heo1eca4362008-11-03 20:03:17 +09003309 ata_for_each_dev(dev, link, ALL) {
Tejun Heo11fc33d2008-08-30 14:20:01 +02003310 if (dev->class != ATA_DEV_ATAPI)
3311 continue;
3312 rc = atapi_eh_clear_ua(dev);
3313 if (rc)
3314 goto dev_fail;
3315 }
3316 }
3317
3318 /* configure link power saving */
Tejun Heo3ec25eb2008-03-27 18:37:14 +09003319 if (ehc->i.action & ATA_EH_LPM)
Tejun Heo1eca4362008-11-03 20:03:17 +09003320 ata_for_each_dev(dev, link, ALL)
Kristen Carlson Accardica773292007-10-25 00:58:59 -04003321 ata_dev_enable_pm(dev, ap->pm_policy);
3322
Tejun Heo9b1e2652007-08-06 18:36:24 +09003323 /* this link is okay now */
3324 ehc->i.flags = 0;
3325 continue;
3326
Jeff Garzik2dcb4072007-10-19 06:42:56 -04003327dev_fail:
Tejun Heo9b1e2652007-08-06 18:36:24 +09003328 nr_failed_devs++;
Tejun Heo0a2c0f52008-05-20 02:17:52 +09003329 ata_eh_handle_dev_fail(dev, rc);
Tejun Heo9b1e2652007-08-06 18:36:24 +09003330
Tejun Heob06ce3e2007-10-09 15:06:48 +09003331 if (ap->pflags & ATA_PFLAG_FROZEN) {
3332 /* PMP reset requires working host port.
3333 * Can't retry if it's frozen.
3334 */
Tejun Heo071f44b2008-04-07 22:47:22 +09003335 if (sata_pmp_attached(ap))
Tejun Heob06ce3e2007-10-09 15:06:48 +09003336 goto out;
Tejun Heo9b1e2652007-08-06 18:36:24 +09003337 break;
Tejun Heob06ce3e2007-10-09 15:06:48 +09003338 }
Tejun Heo022bdb02006-05-15 20:58:22 +09003339 }
3340
Tejun Heo0a2c0f52008-05-20 02:17:52 +09003341 if (nr_failed_devs)
Tejun Heo9b1e2652007-08-06 18:36:24 +09003342 goto retry;
Tejun Heo022bdb02006-05-15 20:58:22 +09003343
Tejun Heo022bdb02006-05-15 20:58:22 +09003344 out:
Tejun Heo9b1e2652007-08-06 18:36:24 +09003345 if (rc && r_failed_link)
3346 *r_failed_link = link;
Tejun Heo022bdb02006-05-15 20:58:22 +09003347
3348 DPRINTK("EXIT, rc=%d\n", rc);
3349 return rc;
3350}
3351
3352/**
3353 * ata_eh_finish - finish up EH
3354 * @ap: host port to finish EH for
3355 *
3356 * Recovery is complete. Clean up EH states and retry or finish
3357 * failed qcs.
3358 *
3359 * LOCKING:
3360 * None.
3361 */
Tejun Heofb7fd612007-09-23 13:14:12 +09003362void ata_eh_finish(struct ata_port *ap)
Tejun Heo022bdb02006-05-15 20:58:22 +09003363{
3364 int tag;
3365
3366 /* retry or finish qcs */
3367 for (tag = 0; tag < ATA_MAX_QUEUE; tag++) {
3368 struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag);
3369
3370 if (!(qc->flags & ATA_QCFLAG_FAILED))
3371 continue;
3372
3373 if (qc->err_mask) {
3374 /* FIXME: Once EH migration is complete,
3375 * generate sense data in this function,
3376 * considering both err_mask and tf.
3377 */
Tejun Heo03faab72008-03-27 19:14:24 +09003378 if (qc->flags & ATA_QCFLAG_RETRY)
Tejun Heo022bdb02006-05-15 20:58:22 +09003379 ata_eh_qc_retry(qc);
Tejun Heo03faab72008-03-27 19:14:24 +09003380 else
3381 ata_eh_qc_complete(qc);
Tejun Heo022bdb02006-05-15 20:58:22 +09003382 } else {
3383 if (qc->flags & ATA_QCFLAG_SENSE_VALID) {
3384 ata_eh_qc_complete(qc);
3385 } else {
3386 /* feed zero TF to sense generation */
3387 memset(&qc->result_tf, 0, sizeof(qc->result_tf));
3388 ata_eh_qc_retry(qc);
3389 }
3390 }
3391 }
Tejun Heoda917d62007-09-23 13:14:12 +09003392
3393 /* make sure nr_active_links is zero after EH */
3394 WARN_ON(ap->nr_active_links);
3395 ap->nr_active_links = 0;
Tejun Heo022bdb02006-05-15 20:58:22 +09003396}
3397
3398/**
3399 * ata_do_eh - do standard error handling
3400 * @ap: host port to handle error for
Tejun Heoa1efdab2008-03-25 12:22:50 +09003401 *
Tejun Heof5914a42006-05-31 18:27:48 +09003402 * @prereset: prereset method (can be NULL)
Tejun Heo022bdb02006-05-15 20:58:22 +09003403 * @softreset: softreset method (can be NULL)
3404 * @hardreset: hardreset method (can be NULL)
3405 * @postreset: postreset method (can be NULL)
3406 *
3407 * Perform standard error handling sequence.
3408 *
3409 * LOCKING:
3410 * Kernel thread context (may sleep).
3411 */
Tejun Heof5914a42006-05-31 18:27:48 +09003412void ata_do_eh(struct ata_port *ap, ata_prereset_fn_t prereset,
3413 ata_reset_fn_t softreset, ata_reset_fn_t hardreset,
3414 ata_postreset_fn_t postreset)
Tejun Heo022bdb02006-05-15 20:58:22 +09003415{
Tejun Heo9b1e2652007-08-06 18:36:24 +09003416 struct ata_device *dev;
3417 int rc;
3418
3419 ata_eh_autopsy(ap);
3420 ata_eh_report(ap);
3421
3422 rc = ata_eh_recover(ap, prereset, softreset, hardreset, postreset,
3423 NULL);
3424 if (rc) {
Tejun Heo1eca4362008-11-03 20:03:17 +09003425 ata_for_each_dev(dev, &ap->link, ALL)
Tejun Heo9b1e2652007-08-06 18:36:24 +09003426 ata_dev_disable(dev);
3427 }
3428
Tejun Heo022bdb02006-05-15 20:58:22 +09003429 ata_eh_finish(ap);
3430}
Tejun Heo500530f2006-07-03 16:07:27 +09003431
Tejun Heoa1efdab2008-03-25 12:22:50 +09003432/**
3433 * ata_std_error_handler - standard error handler
3434 * @ap: host port to handle error for
3435 *
3436 * Standard error handler
3437 *
3438 * LOCKING:
3439 * Kernel thread context (may sleep).
3440 */
3441void ata_std_error_handler(struct ata_port *ap)
3442{
3443 struct ata_port_operations *ops = ap->ops;
3444 ata_reset_fn_t hardreset = ops->hardreset;
3445
Tejun Heo57c9efd2008-04-07 22:47:19 +09003446 /* ignore built-in hardreset if SCR access is not available */
3447 if (ata_is_builtin_hardreset(hardreset) && !sata_scr_valid(&ap->link))
Tejun Heoa1efdab2008-03-25 12:22:50 +09003448 hardreset = NULL;
3449
3450 ata_do_eh(ap, ops->prereset, ops->softreset, hardreset, ops->postreset);
3451}
3452
Tejun Heo6ffa01d2007-03-02 17:32:47 +09003453#ifdef CONFIG_PM
Tejun Heo500530f2006-07-03 16:07:27 +09003454/**
3455 * ata_eh_handle_port_suspend - perform port suspend operation
3456 * @ap: port to suspend
3457 *
3458 * Suspend @ap.
3459 *
3460 * LOCKING:
3461 * Kernel thread context (may sleep).
3462 */
3463static void ata_eh_handle_port_suspend(struct ata_port *ap)
3464{
3465 unsigned long flags;
3466 int rc = 0;
3467
3468 /* are we suspending? */
3469 spin_lock_irqsave(ap->lock, flags);
3470 if (!(ap->pflags & ATA_PFLAG_PM_PENDING) ||
3471 ap->pm_mesg.event == PM_EVENT_ON) {
3472 spin_unlock_irqrestore(ap->lock, flags);
3473 return;
3474 }
3475 spin_unlock_irqrestore(ap->lock, flags);
3476
3477 WARN_ON(ap->pflags & ATA_PFLAG_SUSPENDED);
3478
Tejun Heo64578a32007-05-15 03:28:16 +09003479 /* tell ACPI we're suspending */
3480 rc = ata_acpi_on_suspend(ap);
3481 if (rc)
3482 goto out;
3483
Tejun Heo500530f2006-07-03 16:07:27 +09003484 /* suspend */
3485 ata_eh_freeze_port(ap);
3486
3487 if (ap->ops->port_suspend)
3488 rc = ap->ops->port_suspend(ap, ap->pm_mesg);
3489
Shaohua Libd3adca2007-11-02 09:32:38 +08003490 ata_acpi_set_state(ap, PMSG_SUSPEND);
Tejun Heo64578a32007-05-15 03:28:16 +09003491 out:
Tejun Heo500530f2006-07-03 16:07:27 +09003492 /* report result */
3493 spin_lock_irqsave(ap->lock, flags);
3494
3495 ap->pflags &= ~ATA_PFLAG_PM_PENDING;
3496 if (rc == 0)
3497 ap->pflags |= ATA_PFLAG_SUSPENDED;
Tejun Heo64578a32007-05-15 03:28:16 +09003498 else if (ap->pflags & ATA_PFLAG_FROZEN)
Tejun Heo500530f2006-07-03 16:07:27 +09003499 ata_port_schedule_eh(ap);
3500
3501 if (ap->pm_result) {
3502 *ap->pm_result = rc;
3503 ap->pm_result = NULL;
3504 }
3505
3506 spin_unlock_irqrestore(ap->lock, flags);
3507
3508 return;
3509}
3510
3511/**
3512 * ata_eh_handle_port_resume - perform port resume operation
3513 * @ap: port to resume
3514 *
3515 * Resume @ap.
3516 *
Tejun Heo500530f2006-07-03 16:07:27 +09003517 * LOCKING:
3518 * Kernel thread context (may sleep).
3519 */
3520static void ata_eh_handle_port_resume(struct ata_port *ap)
3521{
Tejun Heo6f9c1ea2009-04-23 09:55:28 +09003522 struct ata_link *link;
3523 struct ata_device *dev;
Tejun Heo500530f2006-07-03 16:07:27 +09003524 unsigned long flags;
Tejun Heo9666f402007-05-04 21:27:47 +02003525 int rc = 0;
Tejun Heo500530f2006-07-03 16:07:27 +09003526
3527 /* are we resuming? */
3528 spin_lock_irqsave(ap->lock, flags);
3529 if (!(ap->pflags & ATA_PFLAG_PM_PENDING) ||
3530 ap->pm_mesg.event != PM_EVENT_ON) {
3531 spin_unlock_irqrestore(ap->lock, flags);
3532 return;
3533 }
3534 spin_unlock_irqrestore(ap->lock, flags);
3535
Tejun Heo9666f402007-05-04 21:27:47 +02003536 WARN_ON(!(ap->pflags & ATA_PFLAG_SUSPENDED));
Tejun Heo500530f2006-07-03 16:07:27 +09003537
Tejun Heo6f9c1ea2009-04-23 09:55:28 +09003538 /*
3539 * Error timestamps are in jiffies which doesn't run while
3540 * suspended and PHY events during resume isn't too uncommon.
3541 * When the two are combined, it can lead to unnecessary speed
3542 * downs if the machine is suspended and resumed repeatedly.
3543 * Clear error history.
3544 */
3545 ata_for_each_link(link, ap, HOST_FIRST)
3546 ata_for_each_dev(dev, link, ALL)
3547 ata_ering_clear(&dev->ering);
3548
Shaohua Libd3adca2007-11-02 09:32:38 +08003549 ata_acpi_set_state(ap, PMSG_ON);
3550
Tejun Heo500530f2006-07-03 16:07:27 +09003551 if (ap->ops->port_resume)
3552 rc = ap->ops->port_resume(ap);
3553
Tejun Heo67465442007-05-15 03:28:16 +09003554 /* tell ACPI that we're resuming */
3555 ata_acpi_on_resume(ap);
3556
Tejun Heo9666f402007-05-04 21:27:47 +02003557 /* report result */
Tejun Heo500530f2006-07-03 16:07:27 +09003558 spin_lock_irqsave(ap->lock, flags);
3559 ap->pflags &= ~(ATA_PFLAG_PM_PENDING | ATA_PFLAG_SUSPENDED);
3560 if (ap->pm_result) {
3561 *ap->pm_result = rc;
3562 ap->pm_result = NULL;
3563 }
3564 spin_unlock_irqrestore(ap->lock, flags);
3565}
Tejun Heo6ffa01d2007-03-02 17:32:47 +09003566#endif /* CONFIG_PM */