• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  *  libata-eh.c - libata error handling
3  *
4  *  Maintained by:  Tejun Heo <tj@kernel.org>
5  *    		    Please ALWAYS copy linux-ide@vger.kernel.org
6  *		    on emails.
7  *
8  *  Copyright 2006 Tejun Heo <htejun@gmail.com>
9  *
10  *
11  *  This program is free software; you can redistribute it and/or
12  *  modify it under the terms of the GNU General Public License as
13  *  published by the Free Software Foundation; either version 2, or
14  *  (at your option) any later version.
15  *
16  *  This program is distributed in the hope that it will be useful,
17  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
18  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
19  *  General Public License for more details.
20  *
21  *  You should have received a copy of the GNU General Public License
22  *  along with this program; see the file COPYING.  If not, write to
23  *  the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139,
24  *  USA.
25  *
26  *
27  *  libata documentation is available via 'make {ps|pdf}docs',
28  *  as Documentation/driver-api/libata.rst
29  *
30  *  Hardware documentation available from http://www.t13.org/ and
31  *  http://www.sata-io.org/
32  *
33  */
34 
35 #include <linux/kernel.h>
36 #include <linux/blkdev.h>
37 #include <linux/export.h>
38 #include <linux/pci.h>
39 #include <scsi/scsi.h>
40 #include <scsi/scsi_host.h>
41 #include <scsi/scsi_eh.h>
42 #include <scsi/scsi_device.h>
43 #include <scsi/scsi_cmnd.h>
44 #include <scsi/scsi_dbg.h>
45 #include "../scsi/scsi_transport_api.h"
46 
47 #include <linux/libata.h>
48 
49 #include <trace/events/libata.h>
50 #include "libata.h"
51 
52 enum {
53 	/* speed down verdicts */
54 	ATA_EH_SPDN_NCQ_OFF		= (1 << 0),
55 	ATA_EH_SPDN_SPEED_DOWN		= (1 << 1),
56 	ATA_EH_SPDN_FALLBACK_TO_PIO	= (1 << 2),
57 	ATA_EH_SPDN_KEEP_ERRORS		= (1 << 3),
58 
59 	/* error flags */
60 	ATA_EFLAG_IS_IO			= (1 << 0),
61 	ATA_EFLAG_DUBIOUS_XFER		= (1 << 1),
62 	ATA_EFLAG_OLD_ER                = (1 << 31),
63 
64 	/* error categories */
65 	ATA_ECAT_NONE			= 0,
66 	ATA_ECAT_ATA_BUS		= 1,
67 	ATA_ECAT_TOUT_HSM		= 2,
68 	ATA_ECAT_UNK_DEV		= 3,
69 	ATA_ECAT_DUBIOUS_NONE		= 4,
70 	ATA_ECAT_DUBIOUS_ATA_BUS	= 5,
71 	ATA_ECAT_DUBIOUS_TOUT_HSM	= 6,
72 	ATA_ECAT_DUBIOUS_UNK_DEV	= 7,
73 	ATA_ECAT_NR			= 8,
74 
75 	ATA_EH_CMD_DFL_TIMEOUT		=  5000,
76 
77 	/* always put at least this amount of time between resets */
78 	ATA_EH_RESET_COOL_DOWN		=  5000,
79 
80 	/* Waiting in ->prereset can never be reliable.  It's
81 	 * sometimes nice to wait there but it can't be depended upon;
82 	 * otherwise, we wouldn't be resetting.  Just give it enough
83 	 * time for most drives to spin up.
84 	 */
85 	ATA_EH_PRERESET_TIMEOUT		= 10000,
86 	ATA_EH_FASTDRAIN_INTERVAL	=  3000,
87 
88 	ATA_EH_UA_TRIES			= 5,
89 
90 	/* probe speed down parameters, see ata_eh_schedule_probe() */
91 	ATA_EH_PROBE_TRIAL_INTERVAL	= 60000,	/* 1 min */
92 	ATA_EH_PROBE_TRIALS		= 2,
93 };
94 
95 /* The following table determines how we sequence resets.  Each entry
96  * represents timeout for that try.  The first try can be soft or
97  * hardreset.  All others are hardreset if available.  In most cases
98  * the first reset w/ 10sec timeout should succeed.  Following entries
99  * are mostly for error handling, hotplug and those outlier devices that
100  * take an exceptionally long time to recover from reset.
101  */
102 static const unsigned long ata_eh_reset_timeouts[] = {
103 	10000,	/* most drives spin up by 10sec */
104 	10000,	/* > 99% working drives spin up before 20sec */
105 	35000,	/* give > 30 secs of idleness for outlier devices */
106 	 5000,	/* and sweet one last chance */
107 	ULONG_MAX, /* > 1 min has elapsed, give up */
108 };
109 
110 static const unsigned long ata_eh_identify_timeouts[] = {
111 	 5000,	/* covers > 99% of successes and not too boring on failures */
112 	10000,  /* combined time till here is enough even for media access */
113 	30000,	/* for true idiots */
114 	ULONG_MAX,
115 };
116 
117 static const unsigned long ata_eh_flush_timeouts[] = {
118 	15000,	/* be generous with flush */
119 	15000,  /* ditto */
120 	30000,	/* and even more generous */
121 	ULONG_MAX,
122 };
123 
124 static const unsigned long ata_eh_other_timeouts[] = {
125 	 5000,	/* same rationale as identify timeout */
126 	10000,	/* ditto */
127 	/* but no merciful 30sec for other commands, it just isn't worth it */
128 	ULONG_MAX,
129 };
130 
131 struct ata_eh_cmd_timeout_ent {
132 	const u8		*commands;
133 	const unsigned long	*timeouts;
134 };
135 
136 /* The following table determines timeouts to use for EH internal
137  * commands.  Each table entry is a command class and matches the
138  * commands the entry applies to and the timeout table to use.
139  *
140  * On the retry after a command timed out, the next timeout value from
141  * the table is used.  If the table doesn't contain further entries,
142  * the last value is used.
143  *
144  * ehc->cmd_timeout_idx keeps track of which timeout to use per
145  * command class, so if SET_FEATURES times out on the first try, the
146  * next try will use the second timeout value only for that class.
147  */
148 #define CMDS(cmds...)	(const u8 []){ cmds, 0 }
149 static const struct ata_eh_cmd_timeout_ent
150 ata_eh_cmd_timeout_table[ATA_EH_CMD_TIMEOUT_TABLE_SIZE] = {
151 	{ .commands = CMDS(ATA_CMD_ID_ATA, ATA_CMD_ID_ATAPI),
152 	  .timeouts = ata_eh_identify_timeouts, },
153 	{ .commands = CMDS(ATA_CMD_READ_NATIVE_MAX, ATA_CMD_READ_NATIVE_MAX_EXT),
154 	  .timeouts = ata_eh_other_timeouts, },
155 	{ .commands = CMDS(ATA_CMD_SET_MAX, ATA_CMD_SET_MAX_EXT),
156 	  .timeouts = ata_eh_other_timeouts, },
157 	{ .commands = CMDS(ATA_CMD_SET_FEATURES),
158 	  .timeouts = ata_eh_other_timeouts, },
159 	{ .commands = CMDS(ATA_CMD_INIT_DEV_PARAMS),
160 	  .timeouts = ata_eh_other_timeouts, },
161 	{ .commands = CMDS(ATA_CMD_FLUSH, ATA_CMD_FLUSH_EXT),
162 	  .timeouts = ata_eh_flush_timeouts },
163 };
164 #undef CMDS
165 
166 static void __ata_port_freeze(struct ata_port *ap);
167 #ifdef CONFIG_PM
168 static void ata_eh_handle_port_suspend(struct ata_port *ap);
169 static void ata_eh_handle_port_resume(struct ata_port *ap);
170 #else /* CONFIG_PM */
ata_eh_handle_port_suspend(struct ata_port * ap)171 static void ata_eh_handle_port_suspend(struct ata_port *ap)
172 { }
173 
ata_eh_handle_port_resume(struct ata_port * ap)174 static void ata_eh_handle_port_resume(struct ata_port *ap)
175 { }
176 #endif /* CONFIG_PM */
177 
__ata_ehi_pushv_desc(struct ata_eh_info * ehi,const char * fmt,va_list args)178 static __printf(2, 0) void __ata_ehi_pushv_desc(struct ata_eh_info *ehi,
179 				 const char *fmt, va_list args)
180 {
181 	ehi->desc_len += vscnprintf(ehi->desc + ehi->desc_len,
182 				     ATA_EH_DESC_LEN - ehi->desc_len,
183 				     fmt, args);
184 }
185 
186 /**
187  *	__ata_ehi_push_desc - push error description without adding separator
188  *	@ehi: target EHI
189  *	@fmt: printf format string
190  *
191  *	Format string according to @fmt and append it to @ehi->desc.
192  *
193  *	LOCKING:
194  *	spin_lock_irqsave(host lock)
195  */
__ata_ehi_push_desc(struct ata_eh_info * ehi,const char * fmt,...)196 void __ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...)
197 {
198 	va_list args;
199 
200 	va_start(args, fmt);
201 	__ata_ehi_pushv_desc(ehi, fmt, args);
202 	va_end(args);
203 }
204 
205 /**
206  *	ata_ehi_push_desc - push error description with separator
207  *	@ehi: target EHI
208  *	@fmt: printf format string
209  *
210  *	Format string according to @fmt and append it to @ehi->desc.
211  *	If @ehi->desc is not empty, ", " is added in-between.
212  *
213  *	LOCKING:
214  *	spin_lock_irqsave(host lock)
215  */
ata_ehi_push_desc(struct ata_eh_info * ehi,const char * fmt,...)216 void ata_ehi_push_desc(struct ata_eh_info *ehi, const char *fmt, ...)
217 {
218 	va_list args;
219 
220 	if (ehi->desc_len)
221 		__ata_ehi_push_desc(ehi, ", ");
222 
223 	va_start(args, fmt);
224 	__ata_ehi_pushv_desc(ehi, fmt, args);
225 	va_end(args);
226 }
227 
228 /**
229  *	ata_ehi_clear_desc - clean error description
230  *	@ehi: target EHI
231  *
232  *	Clear @ehi->desc.
233  *
234  *	LOCKING:
235  *	spin_lock_irqsave(host lock)
236  */
ata_ehi_clear_desc(struct ata_eh_info * ehi)237 void ata_ehi_clear_desc(struct ata_eh_info *ehi)
238 {
239 	ehi->desc[0] = '\0';
240 	ehi->desc_len = 0;
241 }
242 
243 /**
244  *	ata_port_desc - append port description
245  *	@ap: target ATA port
246  *	@fmt: printf format string
247  *
248  *	Format string according to @fmt and append it to port
249  *	description.  If port description is not empty, " " is added
250  *	in-between.  This function is to be used while initializing
251  *	ata_host.  The description is printed on host registration.
252  *
253  *	LOCKING:
254  *	None.
255  */
ata_port_desc(struct ata_port * ap,const char * fmt,...)256 void ata_port_desc(struct ata_port *ap, const char *fmt, ...)
257 {
258 	va_list args;
259 
260 	WARN_ON(!(ap->pflags & ATA_PFLAG_INITIALIZING));
261 
262 	if (ap->link.eh_info.desc_len)
263 		__ata_ehi_push_desc(&ap->link.eh_info, " ");
264 
265 	va_start(args, fmt);
266 	__ata_ehi_pushv_desc(&ap->link.eh_info, fmt, args);
267 	va_end(args);
268 }
269 
270 #ifdef CONFIG_PCI
271 
272 /**
273  *	ata_port_pbar_desc - append PCI BAR description
274  *	@ap: target ATA port
275  *	@bar: target PCI BAR
276  *	@offset: offset into PCI BAR
277  *	@name: name of the area
278  *
279  *	If @offset is negative, this function formats a string which
280  *	contains the name, address, size and type of the BAR and
281  *	appends it to the port description.  If @offset is zero or
282  *	positive, only name and offsetted address is appended.
283  *
284  *	LOCKING:
285  *	None.
286  */
ata_port_pbar_desc(struct ata_port * ap,int bar,ssize_t offset,const char * name)287 void ata_port_pbar_desc(struct ata_port *ap, int bar, ssize_t offset,
288 			const char *name)
289 {
290 	struct pci_dev *pdev = to_pci_dev(ap->host->dev);
291 	char *type = "";
292 	unsigned long long start, len;
293 
294 	if (pci_resource_flags(pdev, bar) & IORESOURCE_MEM)
295 		type = "m";
296 	else if (pci_resource_flags(pdev, bar) & IORESOURCE_IO)
297 		type = "i";
298 
299 	start = (unsigned long long)pci_resource_start(pdev, bar);
300 	len = (unsigned long long)pci_resource_len(pdev, bar);
301 
302 	if (offset < 0)
303 		ata_port_desc(ap, "%s %s%llu@0x%llx", name, type, len, start);
304 	else
305 		ata_port_desc(ap, "%s 0x%llx", name,
306 				start + (unsigned long long)offset);
307 }
308 
309 #endif /* CONFIG_PCI */
310 
ata_lookup_timeout_table(u8 cmd)311 static int ata_lookup_timeout_table(u8 cmd)
312 {
313 	int i;
314 
315 	for (i = 0; i < ATA_EH_CMD_TIMEOUT_TABLE_SIZE; i++) {
316 		const u8 *cur;
317 
318 		for (cur = ata_eh_cmd_timeout_table[i].commands; *cur; cur++)
319 			if (*cur == cmd)
320 				return i;
321 	}
322 
323 	return -1;
324 }
325 
326 /**
327  *	ata_internal_cmd_timeout - determine timeout for an internal command
328  *	@dev: target device
329  *	@cmd: internal command to be issued
330  *
331  *	Determine timeout for internal command @cmd for @dev.
332  *
333  *	LOCKING:
334  *	EH context.
335  *
336  *	RETURNS:
337  *	Determined timeout.
338  */
ata_internal_cmd_timeout(struct ata_device * dev,u8 cmd)339 unsigned long ata_internal_cmd_timeout(struct ata_device *dev, u8 cmd)
340 {
341 	struct ata_eh_context *ehc = &dev->link->eh_context;
342 	int ent = ata_lookup_timeout_table(cmd);
343 	int idx;
344 
345 	if (ent < 0)
346 		return ATA_EH_CMD_DFL_TIMEOUT;
347 
348 	idx = ehc->cmd_timeout_idx[dev->devno][ent];
349 	return ata_eh_cmd_timeout_table[ent].timeouts[idx];
350 }
351 
352 /**
353  *	ata_internal_cmd_timed_out - notification for internal command timeout
354  *	@dev: target device
355  *	@cmd: internal command which timed out
356  *
357  *	Notify EH that internal command @cmd for @dev timed out.  This
358  *	function should be called only for commands whose timeouts are
359  *	determined using ata_internal_cmd_timeout().
360  *
361  *	LOCKING:
362  *	EH context.
363  */
ata_internal_cmd_timed_out(struct ata_device * dev,u8 cmd)364 void ata_internal_cmd_timed_out(struct ata_device *dev, u8 cmd)
365 {
366 	struct ata_eh_context *ehc = &dev->link->eh_context;
367 	int ent = ata_lookup_timeout_table(cmd);
368 	int idx;
369 
370 	if (ent < 0)
371 		return;
372 
373 	idx = ehc->cmd_timeout_idx[dev->devno][ent];
374 	if (ata_eh_cmd_timeout_table[ent].timeouts[idx + 1] != ULONG_MAX)
375 		ehc->cmd_timeout_idx[dev->devno][ent]++;
376 }
377 
ata_ering_record(struct ata_ering * ering,unsigned int eflags,unsigned int err_mask)378 static void ata_ering_record(struct ata_ering *ering, unsigned int eflags,
379 			     unsigned int err_mask)
380 {
381 	struct ata_ering_entry *ent;
382 
383 	WARN_ON(!err_mask);
384 
385 	ering->cursor++;
386 	ering->cursor %= ATA_ERING_SIZE;
387 
388 	ent = &ering->ring[ering->cursor];
389 	ent->eflags = eflags;
390 	ent->err_mask = err_mask;
391 	ent->timestamp = get_jiffies_64();
392 }
393 
ata_ering_top(struct ata_ering * ering)394 static struct ata_ering_entry *ata_ering_top(struct ata_ering *ering)
395 {
396 	struct ata_ering_entry *ent = &ering->ring[ering->cursor];
397 
398 	if (ent->err_mask)
399 		return ent;
400 	return NULL;
401 }
402 
ata_ering_map(struct ata_ering * ering,int (* map_fn)(struct ata_ering_entry *,void *),void * arg)403 int ata_ering_map(struct ata_ering *ering,
404 		  int (*map_fn)(struct ata_ering_entry *, void *),
405 		  void *arg)
406 {
407 	int idx, rc = 0;
408 	struct ata_ering_entry *ent;
409 
410 	idx = ering->cursor;
411 	do {
412 		ent = &ering->ring[idx];
413 		if (!ent->err_mask)
414 			break;
415 		rc = map_fn(ent, arg);
416 		if (rc)
417 			break;
418 		idx = (idx - 1 + ATA_ERING_SIZE) % ATA_ERING_SIZE;
419 	} while (idx != ering->cursor);
420 
421 	return rc;
422 }
423 
ata_ering_clear_cb(struct ata_ering_entry * ent,void * void_arg)424 static int ata_ering_clear_cb(struct ata_ering_entry *ent, void *void_arg)
425 {
426 	ent->eflags |= ATA_EFLAG_OLD_ER;
427 	return 0;
428 }
429 
ata_ering_clear(struct ata_ering * ering)430 static void ata_ering_clear(struct ata_ering *ering)
431 {
432 	ata_ering_map(ering, ata_ering_clear_cb, NULL);
433 }
434 
ata_eh_dev_action(struct ata_device * dev)435 static unsigned int ata_eh_dev_action(struct ata_device *dev)
436 {
437 	struct ata_eh_context *ehc = &dev->link->eh_context;
438 
439 	return ehc->i.action | ehc->i.dev_action[dev->devno];
440 }
441 
ata_eh_clear_action(struct ata_link * link,struct ata_device * dev,struct ata_eh_info * ehi,unsigned int action)442 static void ata_eh_clear_action(struct ata_link *link, struct ata_device *dev,
443 				struct ata_eh_info *ehi, unsigned int action)
444 {
445 	struct ata_device *tdev;
446 
447 	if (!dev) {
448 		ehi->action &= ~action;
449 		ata_for_each_dev(tdev, link, ALL)
450 			ehi->dev_action[tdev->devno] &= ~action;
451 	} else {
452 		/* doesn't make sense for port-wide EH actions */
453 		WARN_ON(!(action & ATA_EH_PERDEV_MASK));
454 
455 		/* break ehi->action into ehi->dev_action */
456 		if (ehi->action & action) {
457 			ata_for_each_dev(tdev, link, ALL)
458 				ehi->dev_action[tdev->devno] |=
459 					ehi->action & action;
460 			ehi->action &= ~action;
461 		}
462 
463 		/* turn off the specified per-dev action */
464 		ehi->dev_action[dev->devno] &= ~action;
465 	}
466 }
467 
468 /**
469  *	ata_eh_acquire - acquire EH ownership
470  *	@ap: ATA port to acquire EH ownership for
471  *
472  *	Acquire EH ownership for @ap.  This is the basic exclusion
473  *	mechanism for ports sharing a host.  Only one port hanging off
474  *	the same host can claim the ownership of EH.
475  *
476  *	LOCKING:
477  *	EH context.
478  */
ata_eh_acquire(struct ata_port * ap)479 void ata_eh_acquire(struct ata_port *ap)
480 {
481 	mutex_lock(&ap->host->eh_mutex);
482 	WARN_ON_ONCE(ap->host->eh_owner);
483 	ap->host->eh_owner = current;
484 }
485 
486 /**
487  *	ata_eh_release - release EH ownership
488  *	@ap: ATA port to release EH ownership for
489  *
490  *	Release EH ownership for @ap if the caller.  The caller must
491  *	have acquired EH ownership using ata_eh_acquire() previously.
492  *
493  *	LOCKING:
494  *	EH context.
495  */
ata_eh_release(struct ata_port * ap)496 void ata_eh_release(struct ata_port *ap)
497 {
498 	WARN_ON_ONCE(ap->host->eh_owner != current);
499 	ap->host->eh_owner = NULL;
500 	mutex_unlock(&ap->host->eh_mutex);
501 }
502 
503 /**
504  *	ata_scsi_timed_out - SCSI layer time out callback
505  *	@cmd: timed out SCSI command
506  *
507  *	Handles SCSI layer timeout.  We race with normal completion of
508  *	the qc for @cmd.  If the qc is already gone, we lose and let
509  *	the scsi command finish (EH_HANDLED).  Otherwise, the qc has
510  *	timed out and EH should be invoked.  Prevent ata_qc_complete()
511  *	from finishing it by setting EH_SCHEDULED and return
512  *	EH_NOT_HANDLED.
513  *
514  *	TODO: kill this function once old EH is gone.
515  *
516  *	LOCKING:
517  *	Called from timer context
518  *
519  *	RETURNS:
520  *	EH_HANDLED or EH_NOT_HANDLED
521  */
ata_scsi_timed_out(struct scsi_cmnd * cmd)522 enum blk_eh_timer_return ata_scsi_timed_out(struct scsi_cmnd *cmd)
523 {
524 	struct Scsi_Host *host = cmd->device->host;
525 	struct ata_port *ap = ata_shost_to_port(host);
526 	unsigned long flags;
527 	struct ata_queued_cmd *qc;
528 	enum blk_eh_timer_return ret;
529 
530 	DPRINTK("ENTER\n");
531 
532 	if (ap->ops->error_handler) {
533 		ret = BLK_EH_NOT_HANDLED;
534 		goto out;
535 	}
536 
537 	ret = BLK_EH_HANDLED;
538 	spin_lock_irqsave(ap->lock, flags);
539 	qc = ata_qc_from_tag(ap, ap->link.active_tag);
540 	if (qc) {
541 		WARN_ON(qc->scsicmd != cmd);
542 		qc->flags |= ATA_QCFLAG_EH_SCHEDULED;
543 		qc->err_mask |= AC_ERR_TIMEOUT;
544 		ret = BLK_EH_NOT_HANDLED;
545 	}
546 	spin_unlock_irqrestore(ap->lock, flags);
547 
548  out:
549 	DPRINTK("EXIT, ret=%d\n", ret);
550 	return ret;
551 }
552 EXPORT_SYMBOL(ata_scsi_timed_out);
553 
ata_eh_unload(struct ata_port * ap)554 static void ata_eh_unload(struct ata_port *ap)
555 {
556 	struct ata_link *link;
557 	struct ata_device *dev;
558 	unsigned long flags;
559 
560 	/* Restore SControl IPM and SPD for the next driver and
561 	 * disable attached devices.
562 	 */
563 	ata_for_each_link(link, ap, PMP_FIRST) {
564 		sata_scr_write(link, SCR_CONTROL, link->saved_scontrol & 0xff0);
565 		ata_for_each_dev(dev, link, ALL)
566 			ata_dev_disable(dev);
567 	}
568 
569 	/* freeze and set UNLOADED */
570 	spin_lock_irqsave(ap->lock, flags);
571 
572 	ata_port_freeze(ap);			/* won't be thawed */
573 	ap->pflags &= ~ATA_PFLAG_EH_PENDING;	/* clear pending from freeze */
574 	ap->pflags |= ATA_PFLAG_UNLOADED;
575 
576 	spin_unlock_irqrestore(ap->lock, flags);
577 }
578 
579 /**
580  *	ata_scsi_error - SCSI layer error handler callback
581  *	@host: SCSI host on which error occurred
582  *
583  *	Handles SCSI-layer-thrown error events.
584  *
585  *	LOCKING:
586  *	Inherited from SCSI layer (none, can sleep)
587  *
588  *	RETURNS:
589  *	Zero.
590  */
ata_scsi_error(struct Scsi_Host * host)591 void ata_scsi_error(struct Scsi_Host *host)
592 {
593 	struct ata_port *ap = ata_shost_to_port(host);
594 	unsigned long flags;
595 	LIST_HEAD(eh_work_q);
596 
597 	DPRINTK("ENTER\n");
598 
599 	spin_lock_irqsave(host->host_lock, flags);
600 	list_splice_init(&host->eh_cmd_q, &eh_work_q);
601 	spin_unlock_irqrestore(host->host_lock, flags);
602 
603 	ata_scsi_cmd_error_handler(host, ap, &eh_work_q);
604 
605 	/* If we timed raced normal completion and there is nothing to
606 	   recover nr_timedout == 0 why exactly are we doing error recovery ? */
607 	ata_scsi_port_error_handler(host, ap);
608 
609 	/* finish or retry handled scmd's and clean up */
610 	WARN_ON(!list_empty(&eh_work_q));
611 
612 	DPRINTK("EXIT\n");
613 }
614 
615 /**
616  * ata_scsi_cmd_error_handler - error callback for a list of commands
617  * @host:	scsi host containing the port
618  * @ap:		ATA port within the host
619  * @eh_work_q:	list of commands to process
620  *
621  * process the given list of commands and return those finished to the
622  * ap->eh_done_q.  This function is the first part of the libata error
623  * handler which processes a given list of failed commands.
624  */
ata_scsi_cmd_error_handler(struct Scsi_Host * host,struct ata_port * ap,struct list_head * eh_work_q)625 void ata_scsi_cmd_error_handler(struct Scsi_Host *host, struct ata_port *ap,
626 				struct list_head *eh_work_q)
627 {
628 	int i;
629 	unsigned long flags;
630 
631 	/* make sure sff pio task is not running */
632 	ata_sff_flush_pio_task(ap);
633 
634 	/* synchronize with host lock and sort out timeouts */
635 
636 	/* For new EH, all qcs are finished in one of three ways -
637 	 * normal completion, error completion, and SCSI timeout.
638 	 * Both completions can race against SCSI timeout.  When normal
639 	 * completion wins, the qc never reaches EH.  When error
640 	 * completion wins, the qc has ATA_QCFLAG_FAILED set.
641 	 *
642 	 * When SCSI timeout wins, things are a bit more complex.
643 	 * Normal or error completion can occur after the timeout but
644 	 * before this point.  In such cases, both types of
645 	 * completions are honored.  A scmd is determined to have
646 	 * timed out iff its associated qc is active and not failed.
647 	 */
648 	spin_lock_irqsave(ap->lock, flags);
649 	if (ap->ops->error_handler) {
650 		struct scsi_cmnd *scmd, *tmp;
651 		int nr_timedout = 0;
652 
653 		/* This must occur under the ap->lock as we don't want
654 		   a polled recovery to race the real interrupt handler
655 
656 		   The lost_interrupt handler checks for any completed but
657 		   non-notified command and completes much like an IRQ handler.
658 
659 		   We then fall into the error recovery code which will treat
660 		   this as if normal completion won the race */
661 
662 		if (ap->ops->lost_interrupt)
663 			ap->ops->lost_interrupt(ap);
664 
665 		list_for_each_entry_safe(scmd, tmp, eh_work_q, eh_entry) {
666 			struct ata_queued_cmd *qc;
667 
668 			for (i = 0; i < ATA_MAX_QUEUE; i++) {
669 				qc = __ata_qc_from_tag(ap, i);
670 				if (qc->flags & ATA_QCFLAG_ACTIVE &&
671 				    qc->scsicmd == scmd)
672 					break;
673 			}
674 
675 			if (i < ATA_MAX_QUEUE) {
676 				/* the scmd has an associated qc */
677 				if (!(qc->flags & ATA_QCFLAG_FAILED)) {
678 					/* which hasn't failed yet, timeout */
679 					qc->err_mask |= AC_ERR_TIMEOUT;
680 					qc->flags |= ATA_QCFLAG_FAILED;
681 					nr_timedout++;
682 				}
683 			} else {
684 				/* Normal completion occurred after
685 				 * SCSI timeout but before this point.
686 				 * Successfully complete it.
687 				 */
688 				scmd->retries = scmd->allowed;
689 				scsi_eh_finish_cmd(scmd, &ap->eh_done_q);
690 			}
691 		}
692 
693 		/* If we have timed out qcs.  They belong to EH from
694 		 * this point but the state of the controller is
695 		 * unknown.  Freeze the port to make sure the IRQ
696 		 * handler doesn't diddle with those qcs.  This must
697 		 * be done atomically w.r.t. setting QCFLAG_FAILED.
698 		 */
699 		if (nr_timedout)
700 			__ata_port_freeze(ap);
701 
702 
703 		/* initialize eh_tries */
704 		ap->eh_tries = ATA_EH_MAX_TRIES;
705 	}
706 	spin_unlock_irqrestore(ap->lock, flags);
707 
708 }
709 EXPORT_SYMBOL(ata_scsi_cmd_error_handler);
710 
711 /**
712  * ata_scsi_port_error_handler - recover the port after the commands
713  * @host:	SCSI host containing the port
714  * @ap:		the ATA port
715  *
716  * Handle the recovery of the port @ap after all the commands
717  * have been recovered.
718  */
ata_scsi_port_error_handler(struct Scsi_Host * host,struct ata_port * ap)719 void ata_scsi_port_error_handler(struct Scsi_Host *host, struct ata_port *ap)
720 {
721 	unsigned long flags;
722 
723 	/* invoke error handler */
724 	if (ap->ops->error_handler) {
725 		struct ata_link *link;
726 
727 		/* acquire EH ownership */
728 		ata_eh_acquire(ap);
729  repeat:
730 		/* kill fast drain timer */
731 		del_timer_sync(&ap->fastdrain_timer);
732 
733 		/* process port resume request */
734 		ata_eh_handle_port_resume(ap);
735 
736 		/* fetch & clear EH info */
737 		spin_lock_irqsave(ap->lock, flags);
738 
739 		ata_for_each_link(link, ap, HOST_FIRST) {
740 			struct ata_eh_context *ehc = &link->eh_context;
741 			struct ata_device *dev;
742 
743 			memset(&link->eh_context, 0, sizeof(link->eh_context));
744 			link->eh_context.i = link->eh_info;
745 			memset(&link->eh_info, 0, sizeof(link->eh_info));
746 
747 			ata_for_each_dev(dev, link, ENABLED) {
748 				int devno = dev->devno;
749 
750 				ehc->saved_xfer_mode[devno] = dev->xfer_mode;
751 				if (ata_ncq_enabled(dev))
752 					ehc->saved_ncq_enabled |= 1 << devno;
753 			}
754 		}
755 
756 		ap->pflags |= ATA_PFLAG_EH_IN_PROGRESS;
757 		ap->pflags &= ~ATA_PFLAG_EH_PENDING;
758 		ap->excl_link = NULL;	/* don't maintain exclusion over EH */
759 
760 		spin_unlock_irqrestore(ap->lock, flags);
761 
762 		/* invoke EH, skip if unloading or suspended */
763 		if (!(ap->pflags & (ATA_PFLAG_UNLOADING | ATA_PFLAG_SUSPENDED)))
764 			ap->ops->error_handler(ap);
765 		else {
766 			/* if unloading, commence suicide */
767 			if ((ap->pflags & ATA_PFLAG_UNLOADING) &&
768 			    !(ap->pflags & ATA_PFLAG_UNLOADED))
769 				ata_eh_unload(ap);
770 			ata_eh_finish(ap);
771 		}
772 
773 		/* process port suspend request */
774 		ata_eh_handle_port_suspend(ap);
775 
776 		/* Exception might have happened after ->error_handler
777 		 * recovered the port but before this point.  Repeat
778 		 * EH in such case.
779 		 */
780 		spin_lock_irqsave(ap->lock, flags);
781 
782 		if (ap->pflags & ATA_PFLAG_EH_PENDING) {
783 			if (--ap->eh_tries) {
784 				spin_unlock_irqrestore(ap->lock, flags);
785 				goto repeat;
786 			}
787 			ata_port_err(ap,
788 				     "EH pending after %d tries, giving up\n",
789 				     ATA_EH_MAX_TRIES);
790 			ap->pflags &= ~ATA_PFLAG_EH_PENDING;
791 		}
792 
793 		/* this run is complete, make sure EH info is clear */
794 		ata_for_each_link(link, ap, HOST_FIRST)
795 			memset(&link->eh_info, 0, sizeof(link->eh_info));
796 
797 		/* end eh (clear host_eh_scheduled) while holding
798 		 * ap->lock such that if exception occurs after this
799 		 * point but before EH completion, SCSI midlayer will
800 		 * re-initiate EH.
801 		 */
802 		ap->ops->end_eh(ap);
803 
804 		spin_unlock_irqrestore(ap->lock, flags);
805 		ata_eh_release(ap);
806 	} else {
807 		WARN_ON(ata_qc_from_tag(ap, ap->link.active_tag) == NULL);
808 		ap->ops->eng_timeout(ap);
809 	}
810 
811 	scsi_eh_flush_done_q(&ap->eh_done_q);
812 
813 	/* clean up */
814 	spin_lock_irqsave(ap->lock, flags);
815 
816 	if (ap->pflags & ATA_PFLAG_LOADING)
817 		ap->pflags &= ~ATA_PFLAG_LOADING;
818 	else if (ap->pflags & ATA_PFLAG_SCSI_HOTPLUG)
819 		schedule_delayed_work(&ap->hotplug_task, 0);
820 
821 	if (ap->pflags & ATA_PFLAG_RECOVERED)
822 		ata_port_info(ap, "EH complete\n");
823 
824 	ap->pflags &= ~(ATA_PFLAG_SCSI_HOTPLUG | ATA_PFLAG_RECOVERED);
825 
826 	/* tell wait_eh that we're done */
827 	ap->pflags &= ~ATA_PFLAG_EH_IN_PROGRESS;
828 	wake_up_all(&ap->eh_wait_q);
829 
830 	spin_unlock_irqrestore(ap->lock, flags);
831 }
832 EXPORT_SYMBOL_GPL(ata_scsi_port_error_handler);
833 
834 /**
835  *	ata_port_wait_eh - Wait for the currently pending EH to complete
836  *	@ap: Port to wait EH for
837  *
838  *	Wait until the currently pending EH is complete.
839  *
840  *	LOCKING:
841  *	Kernel thread context (may sleep).
842  */
ata_port_wait_eh(struct ata_port * ap)843 void ata_port_wait_eh(struct ata_port *ap)
844 {
845 	unsigned long flags;
846 	DEFINE_WAIT(wait);
847 
848  retry:
849 	spin_lock_irqsave(ap->lock, flags);
850 
851 	while (ap->pflags & (ATA_PFLAG_EH_PENDING | ATA_PFLAG_EH_IN_PROGRESS)) {
852 		prepare_to_wait(&ap->eh_wait_q, &wait, TASK_UNINTERRUPTIBLE);
853 		spin_unlock_irqrestore(ap->lock, flags);
854 		schedule();
855 		spin_lock_irqsave(ap->lock, flags);
856 	}
857 	finish_wait(&ap->eh_wait_q, &wait);
858 
859 	spin_unlock_irqrestore(ap->lock, flags);
860 
861 	/* make sure SCSI EH is complete */
862 	if (scsi_host_in_recovery(ap->scsi_host)) {
863 		ata_msleep(ap, 10);
864 		goto retry;
865 	}
866 }
867 EXPORT_SYMBOL_GPL(ata_port_wait_eh);
868 
ata_eh_nr_in_flight(struct ata_port * ap)869 static int ata_eh_nr_in_flight(struct ata_port *ap)
870 {
871 	unsigned int tag;
872 	int nr = 0;
873 
874 	/* count only non-internal commands */
875 	for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++)
876 		if (ata_qc_from_tag(ap, tag))
877 			nr++;
878 
879 	return nr;
880 }
881 
ata_eh_fastdrain_timerfn(unsigned long arg)882 void ata_eh_fastdrain_timerfn(unsigned long arg)
883 {
884 	struct ata_port *ap = (void *)arg;
885 	unsigned long flags;
886 	int cnt;
887 
888 	spin_lock_irqsave(ap->lock, flags);
889 
890 	cnt = ata_eh_nr_in_flight(ap);
891 
892 	/* are we done? */
893 	if (!cnt)
894 		goto out_unlock;
895 
896 	if (cnt == ap->fastdrain_cnt) {
897 		unsigned int tag;
898 
899 		/* No progress during the last interval, tag all
900 		 * in-flight qcs as timed out and freeze the port.
901 		 */
902 		for (tag = 0; tag < ATA_MAX_QUEUE - 1; tag++) {
903 			struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag);
904 			if (qc)
905 				qc->err_mask |= AC_ERR_TIMEOUT;
906 		}
907 
908 		ata_port_freeze(ap);
909 	} else {
910 		/* some qcs have finished, give it another chance */
911 		ap->fastdrain_cnt = cnt;
912 		ap->fastdrain_timer.expires =
913 			ata_deadline(jiffies, ATA_EH_FASTDRAIN_INTERVAL);
914 		add_timer(&ap->fastdrain_timer);
915 	}
916 
917  out_unlock:
918 	spin_unlock_irqrestore(ap->lock, flags);
919 }
920 
921 /**
922  *	ata_eh_set_pending - set ATA_PFLAG_EH_PENDING and activate fast drain
923  *	@ap: target ATA port
924  *	@fastdrain: activate fast drain
925  *
926  *	Set ATA_PFLAG_EH_PENDING and activate fast drain if @fastdrain
927  *	is non-zero and EH wasn't pending before.  Fast drain ensures
928  *	that EH kicks in in timely manner.
929  *
930  *	LOCKING:
931  *	spin_lock_irqsave(host lock)
932  */
ata_eh_set_pending(struct ata_port * ap,int fastdrain)933 static void ata_eh_set_pending(struct ata_port *ap, int fastdrain)
934 {
935 	int cnt;
936 
937 	/* already scheduled? */
938 	if (ap->pflags & ATA_PFLAG_EH_PENDING)
939 		return;
940 
941 	ap->pflags |= ATA_PFLAG_EH_PENDING;
942 
943 	if (!fastdrain)
944 		return;
945 
946 	/* do we have in-flight qcs? */
947 	cnt = ata_eh_nr_in_flight(ap);
948 	if (!cnt)
949 		return;
950 
951 	/* activate fast drain */
952 	ap->fastdrain_cnt = cnt;
953 	ap->fastdrain_timer.expires =
954 		ata_deadline(jiffies, ATA_EH_FASTDRAIN_INTERVAL);
955 	add_timer(&ap->fastdrain_timer);
956 }
957 
958 /**
959  *	ata_qc_schedule_eh - schedule qc for error handling
960  *	@qc: command to schedule error handling for
961  *
962  *	Schedule error handling for @qc.  EH will kick in as soon as
963  *	other commands are drained.
964  *
965  *	LOCKING:
966  *	spin_lock_irqsave(host lock)
967  */
ata_qc_schedule_eh(struct ata_queued_cmd * qc)968 void ata_qc_schedule_eh(struct ata_queued_cmd *qc)
969 {
970 	struct ata_port *ap = qc->ap;
971 	struct request_queue *q = qc->scsicmd->device->request_queue;
972 	unsigned long flags;
973 
974 	WARN_ON(!ap->ops->error_handler);
975 
976 	qc->flags |= ATA_QCFLAG_FAILED;
977 	ata_eh_set_pending(ap, 1);
978 
979 	/* The following will fail if timeout has already expired.
980 	 * ata_scsi_error() takes care of such scmds on EH entry.
981 	 * Note that ATA_QCFLAG_FAILED is unconditionally set after
982 	 * this function completes.
983 	 */
984 	spin_lock_irqsave(q->queue_lock, flags);
985 	blk_abort_request(qc->scsicmd->request);
986 	spin_unlock_irqrestore(q->queue_lock, flags);
987 }
988 
989 /**
990  * ata_std_sched_eh - non-libsas ata_ports issue eh with this common routine
991  * @ap: ATA port to schedule EH for
992  *
993  *	LOCKING: inherited from ata_port_schedule_eh
994  *	spin_lock_irqsave(host lock)
995  */
ata_std_sched_eh(struct ata_port * ap)996 void ata_std_sched_eh(struct ata_port *ap)
997 {
998 	WARN_ON(!ap->ops->error_handler);
999 
1000 	if (ap->pflags & ATA_PFLAG_INITIALIZING)
1001 		return;
1002 
1003 	ata_eh_set_pending(ap, 1);
1004 	scsi_schedule_eh(ap->scsi_host);
1005 
1006 	DPRINTK("port EH scheduled\n");
1007 }
1008 EXPORT_SYMBOL_GPL(ata_std_sched_eh);
1009 
1010 /**
1011  * ata_std_end_eh - non-libsas ata_ports complete eh with this common routine
1012  * @ap: ATA port to end EH for
1013  *
1014  * In the libata object model there is a 1:1 mapping of ata_port to
1015  * shost, so host fields can be directly manipulated under ap->lock, in
1016  * the libsas case we need to hold a lock at the ha->level to coordinate
1017  * these events.
1018  *
1019  *	LOCKING:
1020  *	spin_lock_irqsave(host lock)
1021  */
ata_std_end_eh(struct ata_port * ap)1022 void ata_std_end_eh(struct ata_port *ap)
1023 {
1024 	struct Scsi_Host *host = ap->scsi_host;
1025 
1026 	host->host_eh_scheduled = 0;
1027 }
1028 EXPORT_SYMBOL(ata_std_end_eh);
1029 
1030 
1031 /**
1032  *	ata_port_schedule_eh - schedule error handling without a qc
1033  *	@ap: ATA port to schedule EH for
1034  *
1035  *	Schedule error handling for @ap.  EH will kick in as soon as
1036  *	all commands are drained.
1037  *
1038  *	LOCKING:
1039  *	spin_lock_irqsave(host lock)
1040  */
ata_port_schedule_eh(struct ata_port * ap)1041 void ata_port_schedule_eh(struct ata_port *ap)
1042 {
1043 	/* see: ata_std_sched_eh, unless you know better */
1044 	ap->ops->sched_eh(ap);
1045 }
1046 
ata_do_link_abort(struct ata_port * ap,struct ata_link * link)1047 static int ata_do_link_abort(struct ata_port *ap, struct ata_link *link)
1048 {
1049 	int tag, nr_aborted = 0;
1050 
1051 	WARN_ON(!ap->ops->error_handler);
1052 
1053 	/* we're gonna abort all commands, no need for fast drain */
1054 	ata_eh_set_pending(ap, 0);
1055 
1056 	for (tag = 0; tag < ATA_MAX_QUEUE; tag++) {
1057 		struct ata_queued_cmd *qc = ata_qc_from_tag(ap, tag);
1058 
1059 		if (qc && (!link || qc->dev->link == link)) {
1060 			qc->flags |= ATA_QCFLAG_FAILED;
1061 			ata_qc_complete(qc);
1062 			nr_aborted++;
1063 		}
1064 	}
1065 
1066 	if (!nr_aborted)
1067 		ata_port_schedule_eh(ap);
1068 
1069 	return nr_aborted;
1070 }
1071 
1072 /**
1073  *	ata_link_abort - abort all qc's on the link
1074  *	@link: ATA link to abort qc's for
1075  *
1076  *	Abort all active qc's active on @link and schedule EH.
1077  *
1078  *	LOCKING:
1079  *	spin_lock_irqsave(host lock)
1080  *
1081  *	RETURNS:
1082  *	Number of aborted qc's.
1083  */
ata_link_abort(struct ata_link * link)1084 int ata_link_abort(struct ata_link *link)
1085 {
1086 	return ata_do_link_abort(link->ap, link);
1087 }
1088 
1089 /**
1090  *	ata_port_abort - abort all qc's on the port
1091  *	@ap: ATA port to abort qc's for
1092  *
1093  *	Abort all active qc's of @ap and schedule EH.
1094  *
1095  *	LOCKING:
1096  *	spin_lock_irqsave(host_set lock)
1097  *
1098  *	RETURNS:
1099  *	Number of aborted qc's.
1100  */
ata_port_abort(struct ata_port * ap)1101 int ata_port_abort(struct ata_port *ap)
1102 {
1103 	return ata_do_link_abort(ap, NULL);
1104 }
1105 
1106 /**
1107  *	__ata_port_freeze - freeze port
1108  *	@ap: ATA port to freeze
1109  *
1110  *	This function is called when HSM violation or some other
1111  *	condition disrupts normal operation of the port.  Frozen port
1112  *	is not allowed to perform any operation until the port is
1113  *	thawed, which usually follows a successful reset.
1114  *
1115  *	ap->ops->freeze() callback can be used for freezing the port
1116  *	hardware-wise (e.g. mask interrupt and stop DMA engine).  If a
1117  *	port cannot be frozen hardware-wise, the interrupt handler
1118  *	must ack and clear interrupts unconditionally while the port
1119  *	is frozen.
1120  *
1121  *	LOCKING:
1122  *	spin_lock_irqsave(host lock)
1123  */
__ata_port_freeze(struct ata_port * ap)1124 static void __ata_port_freeze(struct ata_port *ap)
1125 {
1126 	WARN_ON(!ap->ops->error_handler);
1127 
1128 	if (ap->ops->freeze)
1129 		ap->ops->freeze(ap);
1130 
1131 	ap->pflags |= ATA_PFLAG_FROZEN;
1132 
1133 	DPRINTK("ata%u port frozen\n", ap->print_id);
1134 }
1135 
1136 /**
1137  *	ata_port_freeze - abort & freeze port
1138  *	@ap: ATA port to freeze
1139  *
1140  *	Abort and freeze @ap.  The freeze operation must be called
1141  *	first, because some hardware requires special operations
1142  *	before the taskfile registers are accessible.
1143  *
1144  *	LOCKING:
1145  *	spin_lock_irqsave(host lock)
1146  *
1147  *	RETURNS:
1148  *	Number of aborted commands.
1149  */
ata_port_freeze(struct ata_port * ap)1150 int ata_port_freeze(struct ata_port *ap)
1151 {
1152 	int nr_aborted;
1153 
1154 	WARN_ON(!ap->ops->error_handler);
1155 
1156 	__ata_port_freeze(ap);
1157 	nr_aborted = ata_port_abort(ap);
1158 
1159 	return nr_aborted;
1160 }
1161 
1162 /**
1163  *	sata_async_notification - SATA async notification handler
1164  *	@ap: ATA port where async notification is received
1165  *
1166  *	Handler to be called when async notification via SDB FIS is
1167  *	received.  This function schedules EH if necessary.
1168  *
1169  *	LOCKING:
1170  *	spin_lock_irqsave(host lock)
1171  *
1172  *	RETURNS:
1173  *	1 if EH is scheduled, 0 otherwise.
1174  */
sata_async_notification(struct ata_port * ap)1175 int sata_async_notification(struct ata_port *ap)
1176 {
1177 	u32 sntf;
1178 	int rc;
1179 
1180 	if (!(ap->flags & ATA_FLAG_AN))
1181 		return 0;
1182 
1183 	rc = sata_scr_read(&ap->link, SCR_NOTIFICATION, &sntf);
1184 	if (rc == 0)
1185 		sata_scr_write(&ap->link, SCR_NOTIFICATION, sntf);
1186 
1187 	if (!sata_pmp_attached(ap) || rc) {
1188 		/* PMP is not attached or SNTF is not available */
1189 		if (!sata_pmp_attached(ap)) {
1190 			/* PMP is not attached.  Check whether ATAPI
1191 			 * AN is configured.  If so, notify media
1192 			 * change.
1193 			 */
1194 			struct ata_device *dev = ap->link.device;
1195 
1196 			if ((dev->class == ATA_DEV_ATAPI) &&
1197 			    (dev->flags & ATA_DFLAG_AN))
1198 				ata_scsi_media_change_notify(dev);
1199 			return 0;
1200 		} else {
1201 			/* PMP is attached but SNTF is not available.
1202 			 * ATAPI async media change notification is
1203 			 * not used.  The PMP must be reporting PHY
1204 			 * status change, schedule EH.
1205 			 */
1206 			ata_port_schedule_eh(ap);
1207 			return 1;
1208 		}
1209 	} else {
1210 		/* PMP is attached and SNTF is available */
1211 		struct ata_link *link;
1212 
1213 		/* check and notify ATAPI AN */
1214 		ata_for_each_link(link, ap, EDGE) {
1215 			if (!(sntf & (1 << link->pmp)))
1216 				continue;
1217 
1218 			if ((link->device->class == ATA_DEV_ATAPI) &&
1219 			    (link->device->flags & ATA_DFLAG_AN))
1220 				ata_scsi_media_change_notify(link->device);
1221 		}
1222 
1223 		/* If PMP is reporting that PHY status of some
1224 		 * downstream ports has changed, schedule EH.
1225 		 */
1226 		if (sntf & (1 << SATA_PMP_CTRL_PORT)) {
1227 			ata_port_schedule_eh(ap);
1228 			return 1;
1229 		}
1230 
1231 		return 0;
1232 	}
1233 }
1234 
1235 /**
1236  *	ata_eh_freeze_port - EH helper to freeze port
1237  *	@ap: ATA port to freeze
1238  *
1239  *	Freeze @ap.
1240  *
1241  *	LOCKING:
1242  *	None.
1243  */
ata_eh_freeze_port(struct ata_port * ap)1244 void ata_eh_freeze_port(struct ata_port *ap)
1245 {
1246 	unsigned long flags;
1247 
1248 	if (!ap->ops->error_handler)
1249 		return;
1250 
1251 	spin_lock_irqsave(ap->lock, flags);
1252 	__ata_port_freeze(ap);
1253 	spin_unlock_irqrestore(ap->lock, flags);
1254 }
1255 
1256 /**
1257  *	ata_port_thaw_port - EH helper to thaw port
1258  *	@ap: ATA port to thaw
1259  *
1260  *	Thaw frozen port @ap.
1261  *
1262  *	LOCKING:
1263  *	None.
1264  */
ata_eh_thaw_port(struct ata_port * ap)1265 void ata_eh_thaw_port(struct ata_port *ap)
1266 {
1267 	unsigned long flags;
1268 
1269 	if (!ap->ops->error_handler)
1270 		return;
1271 
1272 	spin_lock_irqsave(ap->lock, flags);
1273 
1274 	ap->pflags &= ~ATA_PFLAG_FROZEN;
1275 
1276 	if (ap->ops->thaw)
1277 		ap->ops->thaw(ap);
1278 
1279 	spin_unlock_irqrestore(ap->lock, flags);
1280 
1281 	DPRINTK("ata%u port thawed\n", ap->print_id);
1282 }
1283 
ata_eh_scsidone(struct scsi_cmnd * scmd)1284 static void ata_eh_scsidone(struct scsi_cmnd *scmd)
1285 {
1286 	/* nada */
1287 }
1288 
__ata_eh_qc_complete(struct ata_queued_cmd * qc)1289 static void __ata_eh_qc_complete(struct ata_queued_cmd *qc)
1290 {
1291 	struct ata_port *ap = qc->ap;
1292 	struct scsi_cmnd *scmd = qc->scsicmd;
1293 	unsigned long flags;
1294 
1295 	spin_lock_irqsave(ap->lock, flags);
1296 	qc->scsidone = ata_eh_scsidone;
1297 	__ata_qc_complete(qc);
1298 	WARN_ON(ata_tag_valid(qc->tag));
1299 	spin_unlock_irqrestore(ap->lock, flags);
1300 
1301 	scsi_eh_finish_cmd(scmd, &ap->eh_done_q);
1302 }
1303 
1304 /**
1305  *	ata_eh_qc_complete - Complete an active ATA command from EH
1306  *	@qc: Command to complete
1307  *
1308  *	Indicate to the mid and upper layers that an ATA command has
1309  *	completed.  To be used from EH.
1310  */
ata_eh_qc_complete(struct ata_queued_cmd * qc)1311 void ata_eh_qc_complete(struct ata_queued_cmd *qc)
1312 {
1313 	struct scsi_cmnd *scmd = qc->scsicmd;
1314 	scmd->retries = scmd->allowed;
1315 	__ata_eh_qc_complete(qc);
1316 }
1317 
1318 /**
1319  *	ata_eh_qc_retry - Tell midlayer to retry an ATA command after EH
1320  *	@qc: Command to retry
1321  *
1322  *	Indicate to the mid and upper layers that an ATA command
1323  *	should be retried.  To be used from EH.
1324  *
1325  *	SCSI midlayer limits the number of retries to scmd->allowed.
1326  *	scmd->allowed is incremented for commands which get retried
1327  *	due to unrelated failures (qc->err_mask is zero).
1328  */
ata_eh_qc_retry(struct ata_queued_cmd * qc)1329 void ata_eh_qc_retry(struct ata_queued_cmd *qc)
1330 {
1331 	struct scsi_cmnd *scmd = qc->scsicmd;
1332 	if (!qc->err_mask)
1333 		scmd->allowed++;
1334 	__ata_eh_qc_complete(qc);
1335 }
1336 
1337 /**
1338  *	ata_dev_disable - disable ATA device
1339  *	@dev: ATA device to disable
1340  *
1341  *	Disable @dev.
1342  *
1343  *	Locking:
1344  *	EH context.
1345  */
ata_dev_disable(struct ata_device * dev)1346 void ata_dev_disable(struct ata_device *dev)
1347 {
1348 	if (!ata_dev_enabled(dev))
1349 		return;
1350 
1351 	if (ata_msg_drv(dev->link->ap))
1352 		ata_dev_warn(dev, "disabled\n");
1353 	ata_acpi_on_disable(dev);
1354 	ata_down_xfermask_limit(dev, ATA_DNXFER_FORCE_PIO0 | ATA_DNXFER_QUIET);
1355 	dev->class++;
1356 
1357 	/* From now till the next successful probe, ering is used to
1358 	 * track probe failures.  Clear accumulated device error info.
1359 	 */
1360 	ata_ering_clear(&dev->ering);
1361 }
1362 
1363 /**
1364  *	ata_eh_detach_dev - detach ATA device
1365  *	@dev: ATA device to detach
1366  *
1367  *	Detach @dev.
1368  *
1369  *	LOCKING:
1370  *	None.
1371  */
ata_eh_detach_dev(struct ata_device * dev)1372 void ata_eh_detach_dev(struct ata_device *dev)
1373 {
1374 	struct ata_link *link = dev->link;
1375 	struct ata_port *ap = link->ap;
1376 	struct ata_eh_context *ehc = &link->eh_context;
1377 	unsigned long flags;
1378 
1379 	ata_dev_disable(dev);
1380 
1381 	spin_lock_irqsave(ap->lock, flags);
1382 
1383 	dev->flags &= ~ATA_DFLAG_DETACH;
1384 
1385 	if (ata_scsi_offline_dev(dev)) {
1386 		dev->flags |= ATA_DFLAG_DETACHED;
1387 		ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG;
1388 	}
1389 
1390 	/* clear per-dev EH info */
1391 	ata_eh_clear_action(link, dev, &link->eh_info, ATA_EH_PERDEV_MASK);
1392 	ata_eh_clear_action(link, dev, &link->eh_context.i, ATA_EH_PERDEV_MASK);
1393 	ehc->saved_xfer_mode[dev->devno] = 0;
1394 	ehc->saved_ncq_enabled &= ~(1 << dev->devno);
1395 
1396 	spin_unlock_irqrestore(ap->lock, flags);
1397 }
1398 
1399 /**
1400  *	ata_eh_about_to_do - about to perform eh_action
1401  *	@link: target ATA link
1402  *	@dev: target ATA dev for per-dev action (can be NULL)
1403  *	@action: action about to be performed
1404  *
1405  *	Called just before performing EH actions to clear related bits
1406  *	in @link->eh_info such that eh actions are not unnecessarily
1407  *	repeated.
1408  *
1409  *	LOCKING:
1410  *	None.
1411  */
ata_eh_about_to_do(struct ata_link * link,struct ata_device * dev,unsigned int action)1412 void ata_eh_about_to_do(struct ata_link *link, struct ata_device *dev,
1413 			unsigned int action)
1414 {
1415 	struct ata_port *ap = link->ap;
1416 	struct ata_eh_info *ehi = &link->eh_info;
1417 	struct ata_eh_context *ehc = &link->eh_context;
1418 	unsigned long flags;
1419 
1420 	spin_lock_irqsave(ap->lock, flags);
1421 
1422 	ata_eh_clear_action(link, dev, ehi, action);
1423 
1424 	/* About to take EH action, set RECOVERED.  Ignore actions on
1425 	 * slave links as master will do them again.
1426 	 */
1427 	if (!(ehc->i.flags & ATA_EHI_QUIET) && link != ap->slave_link)
1428 		ap->pflags |= ATA_PFLAG_RECOVERED;
1429 
1430 	spin_unlock_irqrestore(ap->lock, flags);
1431 }
1432 
1433 /**
1434  *	ata_eh_done - EH action complete
1435  *	@link: ATA link for which EH actions are complete
1436  *	@dev: target ATA dev for per-dev action (can be NULL)
1437  *	@action: action just completed
1438  *
1439  *	Called right after performing EH actions to clear related bits
1440  *	in @link->eh_context.
1441  *
1442  *	LOCKING:
1443  *	None.
1444  */
ata_eh_done(struct ata_link * link,struct ata_device * dev,unsigned int action)1445 void ata_eh_done(struct ata_link *link, struct ata_device *dev,
1446 		 unsigned int action)
1447 {
1448 	struct ata_eh_context *ehc = &link->eh_context;
1449 
1450 	ata_eh_clear_action(link, dev, &ehc->i, action);
1451 }
1452 
1453 /**
1454  *	ata_err_string - convert err_mask to descriptive string
1455  *	@err_mask: error mask to convert to string
1456  *
1457  *	Convert @err_mask to descriptive string.  Errors are
1458  *	prioritized according to severity and only the most severe
1459  *	error is reported.
1460  *
1461  *	LOCKING:
1462  *	None.
1463  *
1464  *	RETURNS:
1465  *	Descriptive string for @err_mask
1466  */
ata_err_string(unsigned int err_mask)1467 static const char *ata_err_string(unsigned int err_mask)
1468 {
1469 	if (err_mask & AC_ERR_HOST_BUS)
1470 		return "host bus error";
1471 	if (err_mask & AC_ERR_ATA_BUS)
1472 		return "ATA bus error";
1473 	if (err_mask & AC_ERR_TIMEOUT)
1474 		return "timeout";
1475 	if (err_mask & AC_ERR_HSM)
1476 		return "HSM violation";
1477 	if (err_mask & AC_ERR_SYSTEM)
1478 		return "internal error";
1479 	if (err_mask & AC_ERR_MEDIA)
1480 		return "media error";
1481 	if (err_mask & AC_ERR_INVALID)
1482 		return "invalid argument";
1483 	if (err_mask & AC_ERR_DEV)
1484 		return "device error";
1485 	return "unknown error";
1486 }
1487 
1488 /**
1489  *	ata_eh_read_log_10h - Read log page 10h for NCQ error details
1490  *	@dev: Device to read log page 10h from
1491  *	@tag: Resulting tag of the failed command
1492  *	@tf: Resulting taskfile registers of the failed command
1493  *
1494  *	Read log page 10h to obtain NCQ error details and clear error
1495  *	condition.
1496  *
1497  *	LOCKING:
1498  *	Kernel thread context (may sleep).
1499  *
1500  *	RETURNS:
1501  *	0 on success, -errno otherwise.
1502  */
ata_eh_read_log_10h(struct ata_device * dev,int * tag,struct ata_taskfile * tf)1503 static int ata_eh_read_log_10h(struct ata_device *dev,
1504 			       int *tag, struct ata_taskfile *tf)
1505 {
1506 	u8 *buf = dev->link->ap->sector_buf;
1507 	unsigned int err_mask;
1508 	u8 csum;
1509 	int i;
1510 
1511 	err_mask = ata_read_log_page(dev, ATA_LOG_SATA_NCQ, 0, buf, 1);
1512 	if (err_mask)
1513 		return -EIO;
1514 
1515 	csum = 0;
1516 	for (i = 0; i < ATA_SECT_SIZE; i++)
1517 		csum += buf[i];
1518 	if (csum)
1519 		ata_dev_warn(dev, "invalid checksum 0x%x on log page 10h\n",
1520 			     csum);
1521 
1522 	if (buf[0] & 0x80)
1523 		return -ENOENT;
1524 
1525 	*tag = buf[0] & 0x1f;
1526 
1527 	tf->command = buf[2];
1528 	tf->feature = buf[3];
1529 	tf->lbal = buf[4];
1530 	tf->lbam = buf[5];
1531 	tf->lbah = buf[6];
1532 	tf->device = buf[7];
1533 	tf->hob_lbal = buf[8];
1534 	tf->hob_lbam = buf[9];
1535 	tf->hob_lbah = buf[10];
1536 	tf->nsect = buf[12];
1537 	tf->hob_nsect = buf[13];
1538 	if (dev->class == ATA_DEV_ZAC && ata_id_has_ncq_autosense(dev->id))
1539 		tf->auxiliary = buf[14] << 16 | buf[15] << 8 | buf[16];
1540 
1541 	return 0;
1542 }
1543 
1544 /**
1545  *	atapi_eh_tur - perform ATAPI TEST_UNIT_READY
1546  *	@dev: target ATAPI device
1547  *	@r_sense_key: out parameter for sense_key
1548  *
1549  *	Perform ATAPI TEST_UNIT_READY.
1550  *
1551  *	LOCKING:
1552  *	EH context (may sleep).
1553  *
1554  *	RETURNS:
1555  *	0 on success, AC_ERR_* mask on failure.
1556  */
atapi_eh_tur(struct ata_device * dev,u8 * r_sense_key)1557 unsigned int atapi_eh_tur(struct ata_device *dev, u8 *r_sense_key)
1558 {
1559 	u8 cdb[ATAPI_CDB_LEN] = { TEST_UNIT_READY, 0, 0, 0, 0, 0 };
1560 	struct ata_taskfile tf;
1561 	unsigned int err_mask;
1562 
1563 	ata_tf_init(dev, &tf);
1564 
1565 	tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE;
1566 	tf.command = ATA_CMD_PACKET;
1567 	tf.protocol = ATAPI_PROT_NODATA;
1568 
1569 	err_mask = ata_exec_internal(dev, &tf, cdb, DMA_NONE, NULL, 0, 0);
1570 	if (err_mask == AC_ERR_DEV)
1571 		*r_sense_key = tf.feature >> 4;
1572 	return err_mask;
1573 }
1574 
1575 /**
1576  *	ata_eh_request_sense - perform REQUEST_SENSE_DATA_EXT
1577  *	@qc: qc to perform REQUEST_SENSE_SENSE_DATA_EXT to
1578  *	@cmd: scsi command for which the sense code should be set
1579  *
1580  *	Perform REQUEST_SENSE_DATA_EXT after the device reported CHECK
1581  *	SENSE.  This function is an EH helper.
1582  *
1583  *	LOCKING:
1584  *	Kernel thread context (may sleep).
1585  */
ata_eh_request_sense(struct ata_queued_cmd * qc,struct scsi_cmnd * cmd)1586 static void ata_eh_request_sense(struct ata_queued_cmd *qc,
1587 				 struct scsi_cmnd *cmd)
1588 {
1589 	struct ata_device *dev = qc->dev;
1590 	struct ata_taskfile tf;
1591 	unsigned int err_mask;
1592 
1593 	if (qc->ap->pflags & ATA_PFLAG_FROZEN) {
1594 		ata_dev_warn(dev, "sense data available but port frozen\n");
1595 		return;
1596 	}
1597 
1598 	if (!cmd || qc->flags & ATA_QCFLAG_SENSE_VALID)
1599 		return;
1600 
1601 	if (!ata_id_sense_reporting_enabled(dev->id)) {
1602 		ata_dev_warn(qc->dev, "sense data reporting disabled\n");
1603 		return;
1604 	}
1605 
1606 	DPRINTK("ATA request sense\n");
1607 
1608 	ata_tf_init(dev, &tf);
1609 	tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE;
1610 	tf.flags |= ATA_TFLAG_LBA | ATA_TFLAG_LBA48;
1611 	tf.command = ATA_CMD_REQ_SENSE_DATA;
1612 	tf.protocol = ATA_PROT_NODATA;
1613 
1614 	err_mask = ata_exec_internal(dev, &tf, NULL, DMA_NONE, NULL, 0, 0);
1615 	/* Ignore err_mask; ATA_ERR might be set */
1616 	if (tf.command & ATA_SENSE) {
1617 		ata_scsi_set_sense(dev, cmd, tf.lbah, tf.lbam, tf.lbal);
1618 		qc->flags |= ATA_QCFLAG_SENSE_VALID;
1619 	} else {
1620 		ata_dev_warn(dev, "request sense failed stat %02x emask %x\n",
1621 			     tf.command, err_mask);
1622 	}
1623 }
1624 
1625 /**
1626  *	atapi_eh_request_sense - perform ATAPI REQUEST_SENSE
1627  *	@dev: device to perform REQUEST_SENSE to
1628  *	@sense_buf: result sense data buffer (SCSI_SENSE_BUFFERSIZE bytes long)
1629  *	@dfl_sense_key: default sense key to use
1630  *
1631  *	Perform ATAPI REQUEST_SENSE after the device reported CHECK
1632  *	SENSE.  This function is EH helper.
1633  *
1634  *	LOCKING:
1635  *	Kernel thread context (may sleep).
1636  *
1637  *	RETURNS:
1638  *	0 on success, AC_ERR_* mask on failure
1639  */
atapi_eh_request_sense(struct ata_device * dev,u8 * sense_buf,u8 dfl_sense_key)1640 unsigned int atapi_eh_request_sense(struct ata_device *dev,
1641 					   u8 *sense_buf, u8 dfl_sense_key)
1642 {
1643 	u8 cdb[ATAPI_CDB_LEN] =
1644 		{ REQUEST_SENSE, 0, 0, 0, SCSI_SENSE_BUFFERSIZE, 0 };
1645 	struct ata_port *ap = dev->link->ap;
1646 	struct ata_taskfile tf;
1647 
1648 	DPRINTK("ATAPI request sense\n");
1649 
1650 	memset(sense_buf, 0, SCSI_SENSE_BUFFERSIZE);
1651 
1652 	/* initialize sense_buf with the error register,
1653 	 * for the case where they are -not- overwritten
1654 	 */
1655 	sense_buf[0] = 0x70;
1656 	sense_buf[2] = dfl_sense_key;
1657 
1658 	/* some devices time out if garbage left in tf */
1659 	ata_tf_init(dev, &tf);
1660 
1661 	tf.flags |= ATA_TFLAG_ISADDR | ATA_TFLAG_DEVICE;
1662 	tf.command = ATA_CMD_PACKET;
1663 
1664 	/* is it pointless to prefer PIO for "safety reasons"? */
1665 	if (ap->flags & ATA_FLAG_PIO_DMA) {
1666 		tf.protocol = ATAPI_PROT_DMA;
1667 		tf.feature |= ATAPI_PKT_DMA;
1668 	} else {
1669 		tf.protocol = ATAPI_PROT_PIO;
1670 		tf.lbam = SCSI_SENSE_BUFFERSIZE;
1671 		tf.lbah = 0;
1672 	}
1673 
1674 	return ata_exec_internal(dev, &tf, cdb, DMA_FROM_DEVICE,
1675 				 sense_buf, SCSI_SENSE_BUFFERSIZE, 0);
1676 }
1677 
1678 /**
1679  *	ata_eh_analyze_serror - analyze SError for a failed port
1680  *	@link: ATA link to analyze SError for
1681  *
1682  *	Analyze SError if available and further determine cause of
1683  *	failure.
1684  *
1685  *	LOCKING:
1686  *	None.
1687  */
ata_eh_analyze_serror(struct ata_link * link)1688 static void ata_eh_analyze_serror(struct ata_link *link)
1689 {
1690 	struct ata_eh_context *ehc = &link->eh_context;
1691 	u32 serror = ehc->i.serror;
1692 	unsigned int err_mask = 0, action = 0;
1693 	u32 hotplug_mask;
1694 
1695 	if (serror & (SERR_PERSISTENT | SERR_DATA)) {
1696 		err_mask |= AC_ERR_ATA_BUS;
1697 		action |= ATA_EH_RESET;
1698 	}
1699 	if (serror & SERR_PROTOCOL) {
1700 		err_mask |= AC_ERR_HSM;
1701 		action |= ATA_EH_RESET;
1702 	}
1703 	if (serror & SERR_INTERNAL) {
1704 		err_mask |= AC_ERR_SYSTEM;
1705 		action |= ATA_EH_RESET;
1706 	}
1707 
1708 	/* Determine whether a hotplug event has occurred.  Both
1709 	 * SError.N/X are considered hotplug events for enabled or
1710 	 * host links.  For disabled PMP links, only N bit is
1711 	 * considered as X bit is left at 1 for link plugging.
1712 	 */
1713 	if (link->lpm_policy > ATA_LPM_MAX_POWER)
1714 		hotplug_mask = 0;	/* hotplug doesn't work w/ LPM */
1715 	else if (!(link->flags & ATA_LFLAG_DISABLED) || ata_is_host_link(link))
1716 		hotplug_mask = SERR_PHYRDY_CHG | SERR_DEV_XCHG;
1717 	else
1718 		hotplug_mask = SERR_PHYRDY_CHG;
1719 
1720 	if (serror & hotplug_mask)
1721 		ata_ehi_hotplugged(&ehc->i);
1722 
1723 	ehc->i.err_mask |= err_mask;
1724 	ehc->i.action |= action;
1725 }
1726 
1727 /**
1728  *	ata_eh_analyze_ncq_error - analyze NCQ error
1729  *	@link: ATA link to analyze NCQ error for
1730  *
1731  *	Read log page 10h, determine the offending qc and acquire
1732  *	error status TF.  For NCQ device errors, all LLDDs have to do
1733  *	is setting AC_ERR_DEV in ehi->err_mask.  This function takes
1734  *	care of the rest.
1735  *
1736  *	LOCKING:
1737  *	Kernel thread context (may sleep).
1738  */
ata_eh_analyze_ncq_error(struct ata_link * link)1739 void ata_eh_analyze_ncq_error(struct ata_link *link)
1740 {
1741 	struct ata_port *ap = link->ap;
1742 	struct ata_eh_context *ehc = &link->eh_context;
1743 	struct ata_device *dev = link->device;
1744 	struct ata_queued_cmd *qc;
1745 	struct ata_taskfile tf;
1746 	int tag, rc;
1747 
1748 	/* if frozen, we can't do much */
1749 	if (ap->pflags & ATA_PFLAG_FROZEN)
1750 		return;
1751 
1752 	/* is it NCQ device error? */
1753 	if (!link->sactive || !(ehc->i.err_mask & AC_ERR_DEV))
1754 		return;
1755 
1756 	/* has LLDD analyzed already? */
1757 	for (tag = 0; tag < ATA_MAX_QUEUE; tag++) {
1758 		qc = __ata_qc_from_tag(ap, tag);
1759 
1760 		if (!(qc->flags & ATA_QCFLAG_FAILED))
1761 			continue;
1762 
1763 		if (qc->err_mask)
1764 			return;
1765 	}
1766 
1767 	/* okay, this error is ours */
1768 	memset(&tf, 0, sizeof(tf));
1769 	rc = ata_eh_read_log_10h(dev, &tag, &tf);
1770 	if (rc) {
1771 		ata_link_err(link, "failed to read log page 10h (errno=%d)\n",
1772 			     rc);
1773 		return;
1774 	}
1775 
1776 	if (!(link->sactive & (1 << tag))) {
1777 		ata_link_err(link, "log page 10h reported inactive tag %d\n",
1778 			     tag);
1779 		return;
1780 	}
1781 
1782 	/* we've got the perpetrator, condemn it */
1783 	qc = __ata_qc_from_tag(ap, tag);
1784 	memcpy(&qc->result_tf, &tf, sizeof(tf));
1785 	qc->result_tf.flags = ATA_TFLAG_ISADDR | ATA_TFLAG_LBA | ATA_TFLAG_LBA48;
1786 	qc->err_mask |= AC_ERR_DEV | AC_ERR_NCQ;
1787 	if (dev->class == ATA_DEV_ZAC &&
1788 	    ((qc->result_tf.command & ATA_SENSE) || qc->result_tf.auxiliary)) {
1789 		char sense_key, asc, ascq;
1790 
1791 		sense_key = (qc->result_tf.auxiliary >> 16) & 0xff;
1792 		asc = (qc->result_tf.auxiliary >> 8) & 0xff;
1793 		ascq = qc->result_tf.auxiliary & 0xff;
1794 		ata_scsi_set_sense(dev, qc->scsicmd, sense_key, asc, ascq);
1795 		ata_scsi_set_sense_information(dev, qc->scsicmd,
1796 					       &qc->result_tf);
1797 		qc->flags |= ATA_QCFLAG_SENSE_VALID;
1798 	}
1799 
1800 	ehc->i.err_mask &= ~AC_ERR_DEV;
1801 }
1802 
1803 /**
1804  *	ata_eh_analyze_tf - analyze taskfile of a failed qc
1805  *	@qc: qc to analyze
1806  *	@tf: Taskfile registers to analyze
1807  *
1808  *	Analyze taskfile of @qc and further determine cause of
1809  *	failure.  This function also requests ATAPI sense data if
1810  *	available.
1811  *
1812  *	LOCKING:
1813  *	Kernel thread context (may sleep).
1814  *
1815  *	RETURNS:
1816  *	Determined recovery action
1817  */
ata_eh_analyze_tf(struct ata_queued_cmd * qc,const struct ata_taskfile * tf)1818 static unsigned int ata_eh_analyze_tf(struct ata_queued_cmd *qc,
1819 				      const struct ata_taskfile *tf)
1820 {
1821 	unsigned int tmp, action = 0;
1822 	u8 stat = tf->command, err = tf->feature;
1823 
1824 	if ((stat & (ATA_BUSY | ATA_DRQ | ATA_DRDY)) != ATA_DRDY) {
1825 		qc->err_mask |= AC_ERR_HSM;
1826 		return ATA_EH_RESET;
1827 	}
1828 
1829 	if (stat & (ATA_ERR | ATA_DF)) {
1830 		qc->err_mask |= AC_ERR_DEV;
1831 		/*
1832 		 * Sense data reporting does not work if the
1833 		 * device fault bit is set.
1834 		 */
1835 		if (stat & ATA_DF)
1836 			stat &= ~ATA_SENSE;
1837 	} else {
1838 		return 0;
1839 	}
1840 
1841 	switch (qc->dev->class) {
1842 	case ATA_DEV_ZAC:
1843 		if (stat & ATA_SENSE)
1844 			ata_eh_request_sense(qc, qc->scsicmd);
1845 		/* fall through */
1846 	case ATA_DEV_ATA:
1847 		if (err & ATA_ICRC)
1848 			qc->err_mask |= AC_ERR_ATA_BUS;
1849 		if (err & (ATA_UNC | ATA_AMNF))
1850 			qc->err_mask |= AC_ERR_MEDIA;
1851 		if (err & ATA_IDNF)
1852 			qc->err_mask |= AC_ERR_INVALID;
1853 		break;
1854 
1855 	case ATA_DEV_ATAPI:
1856 		if (!(qc->ap->pflags & ATA_PFLAG_FROZEN)) {
1857 			tmp = atapi_eh_request_sense(qc->dev,
1858 						qc->scsicmd->sense_buffer,
1859 						qc->result_tf.feature >> 4);
1860 			if (!tmp)
1861 				qc->flags |= ATA_QCFLAG_SENSE_VALID;
1862 			else
1863 				qc->err_mask |= tmp;
1864 		}
1865 	}
1866 
1867 	if (qc->flags & ATA_QCFLAG_SENSE_VALID) {
1868 		int ret = scsi_check_sense(qc->scsicmd);
1869 		/*
1870 		 * SUCCESS here means that the sense code could
1871 		 * evaluated and should be passed to the upper layers
1872 		 * for correct evaluation.
1873 		 * FAILED means the sense code could not interpreted
1874 		 * and the device would need to be reset.
1875 		 * NEEDS_RETRY and ADD_TO_MLQUEUE means that the
1876 		 * command would need to be retried.
1877 		 */
1878 		if (ret == NEEDS_RETRY || ret == ADD_TO_MLQUEUE) {
1879 			qc->flags |= ATA_QCFLAG_RETRY;
1880 			qc->err_mask |= AC_ERR_OTHER;
1881 		} else if (ret != SUCCESS) {
1882 			qc->err_mask |= AC_ERR_HSM;
1883 		}
1884 	}
1885 	if (qc->err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT | AC_ERR_ATA_BUS))
1886 		action |= ATA_EH_RESET;
1887 
1888 	return action;
1889 }
1890 
ata_eh_categorize_error(unsigned int eflags,unsigned int err_mask,int * xfer_ok)1891 static int ata_eh_categorize_error(unsigned int eflags, unsigned int err_mask,
1892 				   int *xfer_ok)
1893 {
1894 	int base = 0;
1895 
1896 	if (!(eflags & ATA_EFLAG_DUBIOUS_XFER))
1897 		*xfer_ok = 1;
1898 
1899 	if (!*xfer_ok)
1900 		base = ATA_ECAT_DUBIOUS_NONE;
1901 
1902 	if (err_mask & AC_ERR_ATA_BUS)
1903 		return base + ATA_ECAT_ATA_BUS;
1904 
1905 	if (err_mask & AC_ERR_TIMEOUT)
1906 		return base + ATA_ECAT_TOUT_HSM;
1907 
1908 	if (eflags & ATA_EFLAG_IS_IO) {
1909 		if (err_mask & AC_ERR_HSM)
1910 			return base + ATA_ECAT_TOUT_HSM;
1911 		if ((err_mask &
1912 		     (AC_ERR_DEV|AC_ERR_MEDIA|AC_ERR_INVALID)) == AC_ERR_DEV)
1913 			return base + ATA_ECAT_UNK_DEV;
1914 	}
1915 
1916 	return 0;
1917 }
1918 
1919 struct speed_down_verdict_arg {
1920 	u64 since;
1921 	int xfer_ok;
1922 	int nr_errors[ATA_ECAT_NR];
1923 };
1924 
speed_down_verdict_cb(struct ata_ering_entry * ent,void * void_arg)1925 static int speed_down_verdict_cb(struct ata_ering_entry *ent, void *void_arg)
1926 {
1927 	struct speed_down_verdict_arg *arg = void_arg;
1928 	int cat;
1929 
1930 	if ((ent->eflags & ATA_EFLAG_OLD_ER) || (ent->timestamp < arg->since))
1931 		return -1;
1932 
1933 	cat = ata_eh_categorize_error(ent->eflags, ent->err_mask,
1934 				      &arg->xfer_ok);
1935 	arg->nr_errors[cat]++;
1936 
1937 	return 0;
1938 }
1939 
1940 /**
1941  *	ata_eh_speed_down_verdict - Determine speed down verdict
1942  *	@dev: Device of interest
1943  *
1944  *	This function examines error ring of @dev and determines
1945  *	whether NCQ needs to be turned off, transfer speed should be
1946  *	stepped down, or falling back to PIO is necessary.
1947  *
1948  *	ECAT_ATA_BUS	: ATA_BUS error for any command
1949  *
1950  *	ECAT_TOUT_HSM	: TIMEOUT for any command or HSM violation for
1951  *			  IO commands
1952  *
1953  *	ECAT_UNK_DEV	: Unknown DEV error for IO commands
1954  *
1955  *	ECAT_DUBIOUS_*	: Identical to above three but occurred while
1956  *			  data transfer hasn't been verified.
1957  *
1958  *	Verdicts are
1959  *
1960  *	NCQ_OFF		: Turn off NCQ.
1961  *
1962  *	SPEED_DOWN	: Speed down transfer speed but don't fall back
1963  *			  to PIO.
1964  *
1965  *	FALLBACK_TO_PIO	: Fall back to PIO.
1966  *
1967  *	Even if multiple verdicts are returned, only one action is
1968  *	taken per error.  An action triggered by non-DUBIOUS errors
1969  *	clears ering, while one triggered by DUBIOUS_* errors doesn't.
1970  *	This is to expedite speed down decisions right after device is
1971  *	initially configured.
1972  *
1973  *	The following are speed down rules.  #1 and #2 deal with
1974  *	DUBIOUS errors.
1975  *
1976  *	1. If more than one DUBIOUS_ATA_BUS or DUBIOUS_TOUT_HSM errors
1977  *	   occurred during last 5 mins, SPEED_DOWN and FALLBACK_TO_PIO.
1978  *
1979  *	2. If more than one DUBIOUS_TOUT_HSM or DUBIOUS_UNK_DEV errors
1980  *	   occurred during last 5 mins, NCQ_OFF.
1981  *
1982  *	3. If more than 8 ATA_BUS, TOUT_HSM or UNK_DEV errors
1983  *	   occurred during last 5 mins, FALLBACK_TO_PIO
1984  *
1985  *	4. If more than 3 TOUT_HSM or UNK_DEV errors occurred
1986  *	   during last 10 mins, NCQ_OFF.
1987  *
1988  *	5. If more than 3 ATA_BUS or TOUT_HSM errors, or more than 6
1989  *	   UNK_DEV errors occurred during last 10 mins, SPEED_DOWN.
1990  *
1991  *	LOCKING:
1992  *	Inherited from caller.
1993  *
1994  *	RETURNS:
1995  *	OR of ATA_EH_SPDN_* flags.
1996  */
ata_eh_speed_down_verdict(struct ata_device * dev)1997 static unsigned int ata_eh_speed_down_verdict(struct ata_device *dev)
1998 {
1999 	const u64 j5mins = 5LLU * 60 * HZ, j10mins = 10LLU * 60 * HZ;
2000 	u64 j64 = get_jiffies_64();
2001 	struct speed_down_verdict_arg arg;
2002 	unsigned int verdict = 0;
2003 
2004 	/* scan past 5 mins of error history */
2005 	memset(&arg, 0, sizeof(arg));
2006 	arg.since = j64 - min(j64, j5mins);
2007 	ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg);
2008 
2009 	if (arg.nr_errors[ATA_ECAT_DUBIOUS_ATA_BUS] +
2010 	    arg.nr_errors[ATA_ECAT_DUBIOUS_TOUT_HSM] > 1)
2011 		verdict |= ATA_EH_SPDN_SPEED_DOWN |
2012 			ATA_EH_SPDN_FALLBACK_TO_PIO | ATA_EH_SPDN_KEEP_ERRORS;
2013 
2014 	if (arg.nr_errors[ATA_ECAT_DUBIOUS_TOUT_HSM] +
2015 	    arg.nr_errors[ATA_ECAT_DUBIOUS_UNK_DEV] > 1)
2016 		verdict |= ATA_EH_SPDN_NCQ_OFF | ATA_EH_SPDN_KEEP_ERRORS;
2017 
2018 	if (arg.nr_errors[ATA_ECAT_ATA_BUS] +
2019 	    arg.nr_errors[ATA_ECAT_TOUT_HSM] +
2020 	    arg.nr_errors[ATA_ECAT_UNK_DEV] > 6)
2021 		verdict |= ATA_EH_SPDN_FALLBACK_TO_PIO;
2022 
2023 	/* scan past 10 mins of error history */
2024 	memset(&arg, 0, sizeof(arg));
2025 	arg.since = j64 - min(j64, j10mins);
2026 	ata_ering_map(&dev->ering, speed_down_verdict_cb, &arg);
2027 
2028 	if (arg.nr_errors[ATA_ECAT_TOUT_HSM] +
2029 	    arg.nr_errors[ATA_ECAT_UNK_DEV] > 3)
2030 		verdict |= ATA_EH_SPDN_NCQ_OFF;
2031 
2032 	if (arg.nr_errors[ATA_ECAT_ATA_BUS] +
2033 	    arg.nr_errors[ATA_ECAT_TOUT_HSM] > 3 ||
2034 	    arg.nr_errors[ATA_ECAT_UNK_DEV] > 6)
2035 		verdict |= ATA_EH_SPDN_SPEED_DOWN;
2036 
2037 	return verdict;
2038 }
2039 
2040 /**
2041  *	ata_eh_speed_down - record error and speed down if necessary
2042  *	@dev: Failed device
2043  *	@eflags: mask of ATA_EFLAG_* flags
2044  *	@err_mask: err_mask of the error
2045  *
2046  *	Record error and examine error history to determine whether
2047  *	adjusting transmission speed is necessary.  It also sets
2048  *	transmission limits appropriately if such adjustment is
2049  *	necessary.
2050  *
2051  *	LOCKING:
2052  *	Kernel thread context (may sleep).
2053  *
2054  *	RETURNS:
2055  *	Determined recovery action.
2056  */
ata_eh_speed_down(struct ata_device * dev,unsigned int eflags,unsigned int err_mask)2057 static unsigned int ata_eh_speed_down(struct ata_device *dev,
2058 				unsigned int eflags, unsigned int err_mask)
2059 {
2060 	struct ata_link *link = ata_dev_phys_link(dev);
2061 	int xfer_ok = 0;
2062 	unsigned int verdict;
2063 	unsigned int action = 0;
2064 
2065 	/* don't bother if Cat-0 error */
2066 	if (ata_eh_categorize_error(eflags, err_mask, &xfer_ok) == 0)
2067 		return 0;
2068 
2069 	/* record error and determine whether speed down is necessary */
2070 	ata_ering_record(&dev->ering, eflags, err_mask);
2071 	verdict = ata_eh_speed_down_verdict(dev);
2072 
2073 	/* turn off NCQ? */
2074 	if ((verdict & ATA_EH_SPDN_NCQ_OFF) &&
2075 	    (dev->flags & (ATA_DFLAG_PIO | ATA_DFLAG_NCQ |
2076 			   ATA_DFLAG_NCQ_OFF)) == ATA_DFLAG_NCQ) {
2077 		dev->flags |= ATA_DFLAG_NCQ_OFF;
2078 		ata_dev_warn(dev, "NCQ disabled due to excessive errors\n");
2079 		goto done;
2080 	}
2081 
2082 	/* speed down? */
2083 	if (verdict & ATA_EH_SPDN_SPEED_DOWN) {
2084 		/* speed down SATA link speed if possible */
2085 		if (sata_down_spd_limit(link, 0) == 0) {
2086 			action |= ATA_EH_RESET;
2087 			goto done;
2088 		}
2089 
2090 		/* lower transfer mode */
2091 		if (dev->spdn_cnt < 2) {
2092 			static const int dma_dnxfer_sel[] =
2093 				{ ATA_DNXFER_DMA, ATA_DNXFER_40C };
2094 			static const int pio_dnxfer_sel[] =
2095 				{ ATA_DNXFER_PIO, ATA_DNXFER_FORCE_PIO0 };
2096 			int sel;
2097 
2098 			if (dev->xfer_shift != ATA_SHIFT_PIO)
2099 				sel = dma_dnxfer_sel[dev->spdn_cnt];
2100 			else
2101 				sel = pio_dnxfer_sel[dev->spdn_cnt];
2102 
2103 			dev->spdn_cnt++;
2104 
2105 			if (ata_down_xfermask_limit(dev, sel) == 0) {
2106 				action |= ATA_EH_RESET;
2107 				goto done;
2108 			}
2109 		}
2110 	}
2111 
2112 	/* Fall back to PIO?  Slowing down to PIO is meaningless for
2113 	 * SATA ATA devices.  Consider it only for PATA and SATAPI.
2114 	 */
2115 	if ((verdict & ATA_EH_SPDN_FALLBACK_TO_PIO) && (dev->spdn_cnt >= 2) &&
2116 	    (link->ap->cbl != ATA_CBL_SATA || dev->class == ATA_DEV_ATAPI) &&
2117 	    (dev->xfer_shift != ATA_SHIFT_PIO)) {
2118 		if (ata_down_xfermask_limit(dev, ATA_DNXFER_FORCE_PIO) == 0) {
2119 			dev->spdn_cnt = 0;
2120 			action |= ATA_EH_RESET;
2121 			goto done;
2122 		}
2123 	}
2124 
2125 	return 0;
2126  done:
2127 	/* device has been slowed down, blow error history */
2128 	if (!(verdict & ATA_EH_SPDN_KEEP_ERRORS))
2129 		ata_ering_clear(&dev->ering);
2130 	return action;
2131 }
2132 
2133 /**
2134  *	ata_eh_worth_retry - analyze error and decide whether to retry
2135  *	@qc: qc to possibly retry
2136  *
2137  *	Look at the cause of the error and decide if a retry
2138  * 	might be useful or not.  We don't want to retry media errors
2139  *	because the drive itself has probably already taken 10-30 seconds
2140  *	doing its own internal retries before reporting the failure.
2141  */
ata_eh_worth_retry(struct ata_queued_cmd * qc)2142 static inline int ata_eh_worth_retry(struct ata_queued_cmd *qc)
2143 {
2144 	if (qc->err_mask & AC_ERR_MEDIA)
2145 		return 0;	/* don't retry media errors */
2146 	if (qc->flags & ATA_QCFLAG_IO)
2147 		return 1;	/* otherwise retry anything from fs stack */
2148 	if (qc->err_mask & AC_ERR_INVALID)
2149 		return 0;	/* don't retry these */
2150 	return qc->err_mask != AC_ERR_DEV;  /* retry if not dev error */
2151 }
2152 
2153 /**
2154  *	ata_eh_link_autopsy - analyze error and determine recovery action
2155  *	@link: host link to perform autopsy on
2156  *
2157  *	Analyze why @link failed and determine which recovery actions
2158  *	are needed.  This function also sets more detailed AC_ERR_*
2159  *	values and fills sense data for ATAPI CHECK SENSE.
2160  *
2161  *	LOCKING:
2162  *	Kernel thread context (may sleep).
2163  */
ata_eh_link_autopsy(struct ata_link * link)2164 static void ata_eh_link_autopsy(struct ata_link *link)
2165 {
2166 	struct ata_port *ap = link->ap;
2167 	struct ata_eh_context *ehc = &link->eh_context;
2168 	struct ata_device *dev;
2169 	unsigned int all_err_mask = 0, eflags = 0;
2170 	int tag;
2171 	u32 serror;
2172 	int rc;
2173 
2174 	DPRINTK("ENTER\n");
2175 
2176 	if (ehc->i.flags & ATA_EHI_NO_AUTOPSY)
2177 		return;
2178 
2179 	/* obtain and analyze SError */
2180 	rc = sata_scr_read(link, SCR_ERROR, &serror);
2181 	if (rc == 0) {
2182 		ehc->i.serror |= serror;
2183 		ata_eh_analyze_serror(link);
2184 	} else if (rc != -EOPNOTSUPP) {
2185 		/* SError read failed, force reset and probing */
2186 		ehc->i.probe_mask |= ATA_ALL_DEVICES;
2187 		ehc->i.action |= ATA_EH_RESET;
2188 		ehc->i.err_mask |= AC_ERR_OTHER;
2189 	}
2190 
2191 	/* analyze NCQ failure */
2192 	ata_eh_analyze_ncq_error(link);
2193 
2194 	/* any real error trumps AC_ERR_OTHER */
2195 	if (ehc->i.err_mask & ~AC_ERR_OTHER)
2196 		ehc->i.err_mask &= ~AC_ERR_OTHER;
2197 
2198 	all_err_mask |= ehc->i.err_mask;
2199 
2200 	for (tag = 0; tag < ATA_MAX_QUEUE; tag++) {
2201 		struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag);
2202 
2203 		if (!(qc->flags & ATA_QCFLAG_FAILED) ||
2204 		    ata_dev_phys_link(qc->dev) != link)
2205 			continue;
2206 
2207 		/* inherit upper level err_mask */
2208 		qc->err_mask |= ehc->i.err_mask;
2209 
2210 		/* analyze TF */
2211 		ehc->i.action |= ata_eh_analyze_tf(qc, &qc->result_tf);
2212 
2213 		/* DEV errors are probably spurious in case of ATA_BUS error */
2214 		if (qc->err_mask & AC_ERR_ATA_BUS)
2215 			qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_MEDIA |
2216 					  AC_ERR_INVALID);
2217 
2218 		/* any real error trumps unknown error */
2219 		if (qc->err_mask & ~AC_ERR_OTHER)
2220 			qc->err_mask &= ~AC_ERR_OTHER;
2221 
2222 		/*
2223 		 * SENSE_VALID trumps dev/unknown error and revalidation. Upper
2224 		 * layers will determine whether the command is worth retrying
2225 		 * based on the sense data and device class/type. Otherwise,
2226 		 * determine directly if the command is worth retrying using its
2227 		 * error mask and flags.
2228 		 */
2229 		if (qc->flags & ATA_QCFLAG_SENSE_VALID)
2230 			qc->err_mask &= ~(AC_ERR_DEV | AC_ERR_OTHER);
2231 		else if (ata_eh_worth_retry(qc))
2232 			qc->flags |= ATA_QCFLAG_RETRY;
2233 
2234 		/* accumulate error info */
2235 		ehc->i.dev = qc->dev;
2236 		all_err_mask |= qc->err_mask;
2237 		if (qc->flags & ATA_QCFLAG_IO)
2238 			eflags |= ATA_EFLAG_IS_IO;
2239 		trace_ata_eh_link_autopsy_qc(qc);
2240 	}
2241 
2242 	/* enforce default EH actions */
2243 	if (ap->pflags & ATA_PFLAG_FROZEN ||
2244 	    all_err_mask & (AC_ERR_HSM | AC_ERR_TIMEOUT))
2245 		ehc->i.action |= ATA_EH_RESET;
2246 	else if (((eflags & ATA_EFLAG_IS_IO) && all_err_mask) ||
2247 		 (!(eflags & ATA_EFLAG_IS_IO) && (all_err_mask & ~AC_ERR_DEV)))
2248 		ehc->i.action |= ATA_EH_REVALIDATE;
2249 
2250 	/* If we have offending qcs and the associated failed device,
2251 	 * perform per-dev EH action only on the offending device.
2252 	 */
2253 	if (ehc->i.dev) {
2254 		ehc->i.dev_action[ehc->i.dev->devno] |=
2255 			ehc->i.action & ATA_EH_PERDEV_MASK;
2256 		ehc->i.action &= ~ATA_EH_PERDEV_MASK;
2257 	}
2258 
2259 	/* propagate timeout to host link */
2260 	if ((all_err_mask & AC_ERR_TIMEOUT) && !ata_is_host_link(link))
2261 		ap->link.eh_context.i.err_mask |= AC_ERR_TIMEOUT;
2262 
2263 	/* record error and consider speeding down */
2264 	dev = ehc->i.dev;
2265 	if (!dev && ((ata_link_max_devices(link) == 1 &&
2266 		      ata_dev_enabled(link->device))))
2267 	    dev = link->device;
2268 
2269 	if (dev) {
2270 		if (dev->flags & ATA_DFLAG_DUBIOUS_XFER)
2271 			eflags |= ATA_EFLAG_DUBIOUS_XFER;
2272 		ehc->i.action |= ata_eh_speed_down(dev, eflags, all_err_mask);
2273 		trace_ata_eh_link_autopsy(dev, ehc->i.action, all_err_mask);
2274 	}
2275 	DPRINTK("EXIT\n");
2276 }
2277 
2278 /**
2279  *	ata_eh_autopsy - analyze error and determine recovery action
2280  *	@ap: host port to perform autopsy on
2281  *
2282  *	Analyze all links of @ap and determine why they failed and
2283  *	which recovery actions are needed.
2284  *
2285  *	LOCKING:
2286  *	Kernel thread context (may sleep).
2287  */
ata_eh_autopsy(struct ata_port * ap)2288 void ata_eh_autopsy(struct ata_port *ap)
2289 {
2290 	struct ata_link *link;
2291 
2292 	ata_for_each_link(link, ap, EDGE)
2293 		ata_eh_link_autopsy(link);
2294 
2295 	/* Handle the frigging slave link.  Autopsy is done similarly
2296 	 * but actions and flags are transferred over to the master
2297 	 * link and handled from there.
2298 	 */
2299 	if (ap->slave_link) {
2300 		struct ata_eh_context *mehc = &ap->link.eh_context;
2301 		struct ata_eh_context *sehc = &ap->slave_link->eh_context;
2302 
2303 		/* transfer control flags from master to slave */
2304 		sehc->i.flags |= mehc->i.flags & ATA_EHI_TO_SLAVE_MASK;
2305 
2306 		/* perform autopsy on the slave link */
2307 		ata_eh_link_autopsy(ap->slave_link);
2308 
2309 		/* transfer actions from slave to master and clear slave */
2310 		ata_eh_about_to_do(ap->slave_link, NULL, ATA_EH_ALL_ACTIONS);
2311 		mehc->i.action		|= sehc->i.action;
2312 		mehc->i.dev_action[1]	|= sehc->i.dev_action[1];
2313 		mehc->i.flags		|= sehc->i.flags;
2314 		ata_eh_done(ap->slave_link, NULL, ATA_EH_ALL_ACTIONS);
2315 	}
2316 
2317 	/* Autopsy of fanout ports can affect host link autopsy.
2318 	 * Perform host link autopsy last.
2319 	 */
2320 	if (sata_pmp_attached(ap))
2321 		ata_eh_link_autopsy(&ap->link);
2322 }
2323 
2324 /**
2325  *	ata_get_cmd_descript - get description for ATA command
2326  *	@command: ATA command code to get description for
2327  *
2328  *	Return a textual description of the given command, or NULL if the
2329  *	command is not known.
2330  *
2331  *	LOCKING:
2332  *	None
2333  */
ata_get_cmd_descript(u8 command)2334 const char *ata_get_cmd_descript(u8 command)
2335 {
2336 #ifdef CONFIG_ATA_VERBOSE_ERROR
2337 	static const struct
2338 	{
2339 		u8 command;
2340 		const char *text;
2341 	} cmd_descr[] = {
2342 		{ ATA_CMD_DEV_RESET,		"DEVICE RESET" },
2343 		{ ATA_CMD_CHK_POWER,		"CHECK POWER MODE" },
2344 		{ ATA_CMD_STANDBY,		"STANDBY" },
2345 		{ ATA_CMD_IDLE,			"IDLE" },
2346 		{ ATA_CMD_EDD,			"EXECUTE DEVICE DIAGNOSTIC" },
2347 		{ ATA_CMD_DOWNLOAD_MICRO,	"DOWNLOAD MICROCODE" },
2348 		{ ATA_CMD_DOWNLOAD_MICRO_DMA,	"DOWNLOAD MICROCODE DMA" },
2349 		{ ATA_CMD_NOP,			"NOP" },
2350 		{ ATA_CMD_FLUSH,		"FLUSH CACHE" },
2351 		{ ATA_CMD_FLUSH_EXT,		"FLUSH CACHE EXT" },
2352 		{ ATA_CMD_ID_ATA,		"IDENTIFY DEVICE" },
2353 		{ ATA_CMD_ID_ATAPI,		"IDENTIFY PACKET DEVICE" },
2354 		{ ATA_CMD_SERVICE,		"SERVICE" },
2355 		{ ATA_CMD_READ,			"READ DMA" },
2356 		{ ATA_CMD_READ_EXT,		"READ DMA EXT" },
2357 		{ ATA_CMD_READ_QUEUED,		"READ DMA QUEUED" },
2358 		{ ATA_CMD_READ_STREAM_EXT,	"READ STREAM EXT" },
2359 		{ ATA_CMD_READ_STREAM_DMA_EXT,  "READ STREAM DMA EXT" },
2360 		{ ATA_CMD_WRITE,		"WRITE DMA" },
2361 		{ ATA_CMD_WRITE_EXT,		"WRITE DMA EXT" },
2362 		{ ATA_CMD_WRITE_QUEUED,		"WRITE DMA QUEUED EXT" },
2363 		{ ATA_CMD_WRITE_STREAM_EXT,	"WRITE STREAM EXT" },
2364 		{ ATA_CMD_WRITE_STREAM_DMA_EXT, "WRITE STREAM DMA EXT" },
2365 		{ ATA_CMD_WRITE_FUA_EXT,	"WRITE DMA FUA EXT" },
2366 		{ ATA_CMD_WRITE_QUEUED_FUA_EXT, "WRITE DMA QUEUED FUA EXT" },
2367 		{ ATA_CMD_FPDMA_READ,		"READ FPDMA QUEUED" },
2368 		{ ATA_CMD_FPDMA_WRITE,		"WRITE FPDMA QUEUED" },
2369 		{ ATA_CMD_FPDMA_SEND,		"SEND FPDMA QUEUED" },
2370 		{ ATA_CMD_FPDMA_RECV,		"RECEIVE FPDMA QUEUED" },
2371 		{ ATA_CMD_PIO_READ,		"READ SECTOR(S)" },
2372 		{ ATA_CMD_PIO_READ_EXT,		"READ SECTOR(S) EXT" },
2373 		{ ATA_CMD_PIO_WRITE,		"WRITE SECTOR(S)" },
2374 		{ ATA_CMD_PIO_WRITE_EXT,	"WRITE SECTOR(S) EXT" },
2375 		{ ATA_CMD_READ_MULTI,		"READ MULTIPLE" },
2376 		{ ATA_CMD_READ_MULTI_EXT,	"READ MULTIPLE EXT" },
2377 		{ ATA_CMD_WRITE_MULTI,		"WRITE MULTIPLE" },
2378 		{ ATA_CMD_WRITE_MULTI_EXT,	"WRITE MULTIPLE EXT" },
2379 		{ ATA_CMD_WRITE_MULTI_FUA_EXT,	"WRITE MULTIPLE FUA EXT" },
2380 		{ ATA_CMD_SET_FEATURES,		"SET FEATURES" },
2381 		{ ATA_CMD_SET_MULTI,		"SET MULTIPLE MODE" },
2382 		{ ATA_CMD_VERIFY,		"READ VERIFY SECTOR(S)" },
2383 		{ ATA_CMD_VERIFY_EXT,		"READ VERIFY SECTOR(S) EXT" },
2384 		{ ATA_CMD_WRITE_UNCORR_EXT,	"WRITE UNCORRECTABLE EXT" },
2385 		{ ATA_CMD_STANDBYNOW1,		"STANDBY IMMEDIATE" },
2386 		{ ATA_CMD_IDLEIMMEDIATE,	"IDLE IMMEDIATE" },
2387 		{ ATA_CMD_SLEEP,		"SLEEP" },
2388 		{ ATA_CMD_INIT_DEV_PARAMS,	"INITIALIZE DEVICE PARAMETERS" },
2389 		{ ATA_CMD_READ_NATIVE_MAX,	"READ NATIVE MAX ADDRESS" },
2390 		{ ATA_CMD_READ_NATIVE_MAX_EXT,	"READ NATIVE MAX ADDRESS EXT" },
2391 		{ ATA_CMD_SET_MAX,		"SET MAX ADDRESS" },
2392 		{ ATA_CMD_SET_MAX_EXT,		"SET MAX ADDRESS EXT" },
2393 		{ ATA_CMD_READ_LOG_EXT,		"READ LOG EXT" },
2394 		{ ATA_CMD_WRITE_LOG_EXT,	"WRITE LOG EXT" },
2395 		{ ATA_CMD_READ_LOG_DMA_EXT,	"READ LOG DMA EXT" },
2396 		{ ATA_CMD_WRITE_LOG_DMA_EXT,	"WRITE LOG DMA EXT" },
2397 		{ ATA_CMD_TRUSTED_NONDATA,	"TRUSTED NON-DATA" },
2398 		{ ATA_CMD_TRUSTED_RCV,		"TRUSTED RECEIVE" },
2399 		{ ATA_CMD_TRUSTED_RCV_DMA,	"TRUSTED RECEIVE DMA" },
2400 		{ ATA_CMD_TRUSTED_SND,		"TRUSTED SEND" },
2401 		{ ATA_CMD_TRUSTED_SND_DMA,	"TRUSTED SEND DMA" },
2402 		{ ATA_CMD_PMP_READ,		"READ BUFFER" },
2403 		{ ATA_CMD_PMP_READ_DMA,		"READ BUFFER DMA" },
2404 		{ ATA_CMD_PMP_WRITE,		"WRITE BUFFER" },
2405 		{ ATA_CMD_PMP_WRITE_DMA,	"WRITE BUFFER DMA" },
2406 		{ ATA_CMD_CONF_OVERLAY,		"DEVICE CONFIGURATION OVERLAY" },
2407 		{ ATA_CMD_SEC_SET_PASS,		"SECURITY SET PASSWORD" },
2408 		{ ATA_CMD_SEC_UNLOCK,		"SECURITY UNLOCK" },
2409 		{ ATA_CMD_SEC_ERASE_PREP,	"SECURITY ERASE PREPARE" },
2410 		{ ATA_CMD_SEC_ERASE_UNIT,	"SECURITY ERASE UNIT" },
2411 		{ ATA_CMD_SEC_FREEZE_LOCK,	"SECURITY FREEZE LOCK" },
2412 		{ ATA_CMD_SEC_DISABLE_PASS,	"SECURITY DISABLE PASSWORD" },
2413 		{ ATA_CMD_CONFIG_STREAM,	"CONFIGURE STREAM" },
2414 		{ ATA_CMD_SMART,		"SMART" },
2415 		{ ATA_CMD_MEDIA_LOCK,		"DOOR LOCK" },
2416 		{ ATA_CMD_MEDIA_UNLOCK,		"DOOR UNLOCK" },
2417 		{ ATA_CMD_DSM,			"DATA SET MANAGEMENT" },
2418 		{ ATA_CMD_CHK_MED_CRD_TYP,	"CHECK MEDIA CARD TYPE" },
2419 		{ ATA_CMD_CFA_REQ_EXT_ERR,	"CFA REQUEST EXTENDED ERROR" },
2420 		{ ATA_CMD_CFA_WRITE_NE,		"CFA WRITE SECTORS WITHOUT ERASE" },
2421 		{ ATA_CMD_CFA_TRANS_SECT,	"CFA TRANSLATE SECTOR" },
2422 		{ ATA_CMD_CFA_ERASE,		"CFA ERASE SECTORS" },
2423 		{ ATA_CMD_CFA_WRITE_MULT_NE,	"CFA WRITE MULTIPLE WITHOUT ERASE" },
2424 		{ ATA_CMD_REQ_SENSE_DATA,	"REQUEST SENSE DATA EXT" },
2425 		{ ATA_CMD_SANITIZE_DEVICE,	"SANITIZE DEVICE" },
2426 		{ ATA_CMD_ZAC_MGMT_IN,		"ZAC MANAGEMENT IN" },
2427 		{ ATA_CMD_ZAC_MGMT_OUT,		"ZAC MANAGEMENT OUT" },
2428 		{ ATA_CMD_READ_LONG,		"READ LONG (with retries)" },
2429 		{ ATA_CMD_READ_LONG_ONCE,	"READ LONG (without retries)" },
2430 		{ ATA_CMD_WRITE_LONG,		"WRITE LONG (with retries)" },
2431 		{ ATA_CMD_WRITE_LONG_ONCE,	"WRITE LONG (without retries)" },
2432 		{ ATA_CMD_RESTORE,		"RECALIBRATE" },
2433 		{ 0,				NULL } /* terminate list */
2434 	};
2435 
2436 	unsigned int i;
2437 	for (i = 0; cmd_descr[i].text; i++)
2438 		if (cmd_descr[i].command == command)
2439 			return cmd_descr[i].text;
2440 #endif
2441 
2442 	return NULL;
2443 }
2444 EXPORT_SYMBOL_GPL(ata_get_cmd_descript);
2445 
2446 /**
2447  *	ata_eh_link_report - report error handling to user
2448  *	@link: ATA link EH is going on
2449  *
2450  *	Report EH to user.
2451  *
2452  *	LOCKING:
2453  *	None.
2454  */
ata_eh_link_report(struct ata_link * link)2455 static void ata_eh_link_report(struct ata_link *link)
2456 {
2457 	struct ata_port *ap = link->ap;
2458 	struct ata_eh_context *ehc = &link->eh_context;
2459 	const char *frozen, *desc;
2460 	char tries_buf[6] = "";
2461 	int tag, nr_failed = 0;
2462 
2463 	if (ehc->i.flags & ATA_EHI_QUIET)
2464 		return;
2465 
2466 	desc = NULL;
2467 	if (ehc->i.desc[0] != '\0')
2468 		desc = ehc->i.desc;
2469 
2470 	for (tag = 0; tag < ATA_MAX_QUEUE; tag++) {
2471 		struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag);
2472 
2473 		if (!(qc->flags & ATA_QCFLAG_FAILED) ||
2474 		    ata_dev_phys_link(qc->dev) != link ||
2475 		    ((qc->flags & ATA_QCFLAG_QUIET) &&
2476 		     qc->err_mask == AC_ERR_DEV))
2477 			continue;
2478 		if (qc->flags & ATA_QCFLAG_SENSE_VALID && !qc->err_mask)
2479 			continue;
2480 
2481 		nr_failed++;
2482 	}
2483 
2484 	if (!nr_failed && !ehc->i.err_mask)
2485 		return;
2486 
2487 	frozen = "";
2488 	if (ap->pflags & ATA_PFLAG_FROZEN)
2489 		frozen = " frozen";
2490 
2491 	if (ap->eh_tries < ATA_EH_MAX_TRIES)
2492 		snprintf(tries_buf, sizeof(tries_buf), " t%d",
2493 			 ap->eh_tries);
2494 
2495 	if (ehc->i.dev) {
2496 		ata_dev_err(ehc->i.dev, "exception Emask 0x%x "
2497 			    "SAct 0x%x SErr 0x%x action 0x%x%s%s\n",
2498 			    ehc->i.err_mask, link->sactive, ehc->i.serror,
2499 			    ehc->i.action, frozen, tries_buf);
2500 		if (desc)
2501 			ata_dev_err(ehc->i.dev, "%s\n", desc);
2502 	} else {
2503 		ata_link_err(link, "exception Emask 0x%x "
2504 			     "SAct 0x%x SErr 0x%x action 0x%x%s%s\n",
2505 			     ehc->i.err_mask, link->sactive, ehc->i.serror,
2506 			     ehc->i.action, frozen, tries_buf);
2507 		if (desc)
2508 			ata_link_err(link, "%s\n", desc);
2509 	}
2510 
2511 #ifdef CONFIG_ATA_VERBOSE_ERROR
2512 	if (ehc->i.serror)
2513 		ata_link_err(link,
2514 		  "SError: { %s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s}\n",
2515 		  ehc->i.serror & SERR_DATA_RECOVERED ? "RecovData " : "",
2516 		  ehc->i.serror & SERR_COMM_RECOVERED ? "RecovComm " : "",
2517 		  ehc->i.serror & SERR_DATA ? "UnrecovData " : "",
2518 		  ehc->i.serror & SERR_PERSISTENT ? "Persist " : "",
2519 		  ehc->i.serror & SERR_PROTOCOL ? "Proto " : "",
2520 		  ehc->i.serror & SERR_INTERNAL ? "HostInt " : "",
2521 		  ehc->i.serror & SERR_PHYRDY_CHG ? "PHYRdyChg " : "",
2522 		  ehc->i.serror & SERR_PHY_INT_ERR ? "PHYInt " : "",
2523 		  ehc->i.serror & SERR_COMM_WAKE ? "CommWake " : "",
2524 		  ehc->i.serror & SERR_10B_8B_ERR ? "10B8B " : "",
2525 		  ehc->i.serror & SERR_DISPARITY ? "Dispar " : "",
2526 		  ehc->i.serror & SERR_CRC ? "BadCRC " : "",
2527 		  ehc->i.serror & SERR_HANDSHAKE ? "Handshk " : "",
2528 		  ehc->i.serror & SERR_LINK_SEQ_ERR ? "LinkSeq " : "",
2529 		  ehc->i.serror & SERR_TRANS_ST_ERROR ? "TrStaTrns " : "",
2530 		  ehc->i.serror & SERR_UNRECOG_FIS ? "UnrecFIS " : "",
2531 		  ehc->i.serror & SERR_DEV_XCHG ? "DevExch " : "");
2532 #endif
2533 
2534 	for (tag = 0; tag < ATA_MAX_QUEUE; tag++) {
2535 		struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag);
2536 		struct ata_taskfile *cmd = &qc->tf, *res = &qc->result_tf;
2537 		char data_buf[20] = "";
2538 		char cdb_buf[70] = "";
2539 
2540 		if (!(qc->flags & ATA_QCFLAG_FAILED) ||
2541 		    ata_dev_phys_link(qc->dev) != link || !qc->err_mask)
2542 			continue;
2543 
2544 		if (qc->dma_dir != DMA_NONE) {
2545 			static const char *dma_str[] = {
2546 				[DMA_BIDIRECTIONAL]	= "bidi",
2547 				[DMA_TO_DEVICE]		= "out",
2548 				[DMA_FROM_DEVICE]	= "in",
2549 			};
2550 			const char *prot_str = NULL;
2551 
2552 			switch (qc->tf.protocol) {
2553 			case ATA_PROT_UNKNOWN:
2554 				prot_str = "unknown";
2555 				break;
2556 			case ATA_PROT_NODATA:
2557 				prot_str = "nodata";
2558 				break;
2559 			case ATA_PROT_PIO:
2560 				prot_str = "pio";
2561 				break;
2562 			case ATA_PROT_DMA:
2563 				prot_str = "dma";
2564 				break;
2565 			case ATA_PROT_NCQ:
2566 				prot_str = "ncq dma";
2567 				break;
2568 			case ATA_PROT_NCQ_NODATA:
2569 				prot_str = "ncq nodata";
2570 				break;
2571 			case ATAPI_PROT_NODATA:
2572 				prot_str = "nodata";
2573 				break;
2574 			case ATAPI_PROT_PIO:
2575 				prot_str = "pio";
2576 				break;
2577 			case ATAPI_PROT_DMA:
2578 				prot_str = "dma";
2579 				break;
2580 			}
2581 			snprintf(data_buf, sizeof(data_buf), " %s %u %s",
2582 				 prot_str, qc->nbytes, dma_str[qc->dma_dir]);
2583 		}
2584 
2585 		if (ata_is_atapi(qc->tf.protocol)) {
2586 			const u8 *cdb = qc->cdb;
2587 			size_t cdb_len = qc->dev->cdb_len;
2588 
2589 			if (qc->scsicmd) {
2590 				cdb = qc->scsicmd->cmnd;
2591 				cdb_len = qc->scsicmd->cmd_len;
2592 			}
2593 			__scsi_format_command(cdb_buf, sizeof(cdb_buf),
2594 					      cdb, cdb_len);
2595 		} else {
2596 			const char *descr = ata_get_cmd_descript(cmd->command);
2597 			if (descr)
2598 				ata_dev_err(qc->dev, "failed command: %s\n",
2599 					    descr);
2600 		}
2601 
2602 		ata_dev_err(qc->dev,
2603 			"cmd %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x "
2604 			"tag %d%s\n         %s"
2605 			"res %02x/%02x:%02x:%02x:%02x:%02x/%02x:%02x:%02x:%02x:%02x/%02x "
2606 			"Emask 0x%x (%s)%s\n",
2607 			cmd->command, cmd->feature, cmd->nsect,
2608 			cmd->lbal, cmd->lbam, cmd->lbah,
2609 			cmd->hob_feature, cmd->hob_nsect,
2610 			cmd->hob_lbal, cmd->hob_lbam, cmd->hob_lbah,
2611 			cmd->device, qc->tag, data_buf, cdb_buf,
2612 			res->command, res->feature, res->nsect,
2613 			res->lbal, res->lbam, res->lbah,
2614 			res->hob_feature, res->hob_nsect,
2615 			res->hob_lbal, res->hob_lbam, res->hob_lbah,
2616 			res->device, qc->err_mask, ata_err_string(qc->err_mask),
2617 			qc->err_mask & AC_ERR_NCQ ? " <F>" : "");
2618 
2619 #ifdef CONFIG_ATA_VERBOSE_ERROR
2620 		if (res->command & (ATA_BUSY | ATA_DRDY | ATA_DF | ATA_DRQ |
2621 				    ATA_SENSE | ATA_ERR)) {
2622 			if (res->command & ATA_BUSY)
2623 				ata_dev_err(qc->dev, "status: { Busy }\n");
2624 			else
2625 				ata_dev_err(qc->dev, "status: { %s%s%s%s%s}\n",
2626 				  res->command & ATA_DRDY ? "DRDY " : "",
2627 				  res->command & ATA_DF ? "DF " : "",
2628 				  res->command & ATA_DRQ ? "DRQ " : "",
2629 				  res->command & ATA_SENSE ? "SENSE " : "",
2630 				  res->command & ATA_ERR ? "ERR " : "");
2631 		}
2632 
2633 		if (cmd->command != ATA_CMD_PACKET &&
2634 		    (res->feature & (ATA_ICRC | ATA_UNC | ATA_AMNF |
2635 				     ATA_IDNF | ATA_ABORTED)))
2636 			ata_dev_err(qc->dev, "error: { %s%s%s%s%s}\n",
2637 			  res->feature & ATA_ICRC ? "ICRC " : "",
2638 			  res->feature & ATA_UNC ? "UNC " : "",
2639 			  res->feature & ATA_AMNF ? "AMNF " : "",
2640 			  res->feature & ATA_IDNF ? "IDNF " : "",
2641 			  res->feature & ATA_ABORTED ? "ABRT " : "");
2642 #endif
2643 	}
2644 }
2645 
2646 /**
2647  *	ata_eh_report - report error handling to user
2648  *	@ap: ATA port to report EH about
2649  *
2650  *	Report EH to user.
2651  *
2652  *	LOCKING:
2653  *	None.
2654  */
ata_eh_report(struct ata_port * ap)2655 void ata_eh_report(struct ata_port *ap)
2656 {
2657 	struct ata_link *link;
2658 
2659 	ata_for_each_link(link, ap, HOST_FIRST)
2660 		ata_eh_link_report(link);
2661 }
2662 
ata_do_reset(struct ata_link * link,ata_reset_fn_t reset,unsigned int * classes,unsigned long deadline,bool clear_classes)2663 static int ata_do_reset(struct ata_link *link, ata_reset_fn_t reset,
2664 			unsigned int *classes, unsigned long deadline,
2665 			bool clear_classes)
2666 {
2667 	struct ata_device *dev;
2668 
2669 	if (clear_classes)
2670 		ata_for_each_dev(dev, link, ALL)
2671 			classes[dev->devno] = ATA_DEV_UNKNOWN;
2672 
2673 	return reset(link, classes, deadline);
2674 }
2675 
ata_eh_followup_srst_needed(struct ata_link * link,int rc)2676 static int ata_eh_followup_srst_needed(struct ata_link *link, int rc)
2677 {
2678 	if ((link->flags & ATA_LFLAG_NO_SRST) || ata_link_offline(link))
2679 		return 0;
2680 	if (rc == -EAGAIN)
2681 		return 1;
2682 	if (sata_pmp_supported(link->ap) && ata_is_host_link(link))
2683 		return 1;
2684 	return 0;
2685 }
2686 
ata_eh_reset(struct ata_link * link,int classify,ata_prereset_fn_t prereset,ata_reset_fn_t softreset,ata_reset_fn_t hardreset,ata_postreset_fn_t postreset)2687 int ata_eh_reset(struct ata_link *link, int classify,
2688 		 ata_prereset_fn_t prereset, ata_reset_fn_t softreset,
2689 		 ata_reset_fn_t hardreset, ata_postreset_fn_t postreset)
2690 {
2691 	struct ata_port *ap = link->ap;
2692 	struct ata_link *slave = ap->slave_link;
2693 	struct ata_eh_context *ehc = &link->eh_context;
2694 	struct ata_eh_context *sehc = slave ? &slave->eh_context : NULL;
2695 	unsigned int *classes = ehc->classes;
2696 	unsigned int lflags = link->flags;
2697 	int verbose = !(ehc->i.flags & ATA_EHI_QUIET);
2698 	int max_tries = 0, try = 0;
2699 	struct ata_link *failed_link;
2700 	struct ata_device *dev;
2701 	unsigned long deadline, now;
2702 	ata_reset_fn_t reset;
2703 	unsigned long flags;
2704 	u32 sstatus;
2705 	int nr_unknown, rc;
2706 
2707 	/*
2708 	 * Prepare to reset
2709 	 */
2710 	while (ata_eh_reset_timeouts[max_tries] != ULONG_MAX)
2711 		max_tries++;
2712 	if (link->flags & ATA_LFLAG_RST_ONCE)
2713 		max_tries = 1;
2714 	if (link->flags & ATA_LFLAG_NO_HRST)
2715 		hardreset = NULL;
2716 	if (link->flags & ATA_LFLAG_NO_SRST)
2717 		softreset = NULL;
2718 
2719 	/* make sure each reset attempt is at least COOL_DOWN apart */
2720 	if (ehc->i.flags & ATA_EHI_DID_RESET) {
2721 		now = jiffies;
2722 		WARN_ON(time_after(ehc->last_reset, now));
2723 		deadline = ata_deadline(ehc->last_reset,
2724 					ATA_EH_RESET_COOL_DOWN);
2725 		if (time_before(now, deadline))
2726 			schedule_timeout_uninterruptible(deadline - now);
2727 	}
2728 
2729 	spin_lock_irqsave(ap->lock, flags);
2730 	ap->pflags |= ATA_PFLAG_RESETTING;
2731 	spin_unlock_irqrestore(ap->lock, flags);
2732 
2733 	ata_eh_about_to_do(link, NULL, ATA_EH_RESET);
2734 
2735 	ata_for_each_dev(dev, link, ALL) {
2736 		/* If we issue an SRST then an ATA drive (not ATAPI)
2737 		 * may change configuration and be in PIO0 timing. If
2738 		 * we do a hard reset (or are coming from power on)
2739 		 * this is true for ATA or ATAPI. Until we've set a
2740 		 * suitable controller mode we should not touch the
2741 		 * bus as we may be talking too fast.
2742 		 */
2743 		dev->pio_mode = XFER_PIO_0;
2744 		dev->dma_mode = 0xff;
2745 
2746 		/* If the controller has a pio mode setup function
2747 		 * then use it to set the chipset to rights. Don't
2748 		 * touch the DMA setup as that will be dealt with when
2749 		 * configuring devices.
2750 		 */
2751 		if (ap->ops->set_piomode)
2752 			ap->ops->set_piomode(ap, dev);
2753 	}
2754 
2755 	/* prefer hardreset */
2756 	reset = NULL;
2757 	ehc->i.action &= ~ATA_EH_RESET;
2758 	if (hardreset) {
2759 		reset = hardreset;
2760 		ehc->i.action |= ATA_EH_HARDRESET;
2761 	} else if (softreset) {
2762 		reset = softreset;
2763 		ehc->i.action |= ATA_EH_SOFTRESET;
2764 	}
2765 
2766 	if (prereset) {
2767 		unsigned long deadline = ata_deadline(jiffies,
2768 						      ATA_EH_PRERESET_TIMEOUT);
2769 
2770 		if (slave) {
2771 			sehc->i.action &= ~ATA_EH_RESET;
2772 			sehc->i.action |= ehc->i.action;
2773 		}
2774 
2775 		rc = prereset(link, deadline);
2776 
2777 		/* If present, do prereset on slave link too.  Reset
2778 		 * is skipped iff both master and slave links report
2779 		 * -ENOENT or clear ATA_EH_RESET.
2780 		 */
2781 		if (slave && (rc == 0 || rc == -ENOENT)) {
2782 			int tmp;
2783 
2784 			tmp = prereset(slave, deadline);
2785 			if (tmp != -ENOENT)
2786 				rc = tmp;
2787 
2788 			ehc->i.action |= sehc->i.action;
2789 		}
2790 
2791 		if (rc) {
2792 			if (rc == -ENOENT) {
2793 				ata_link_dbg(link, "port disabled--ignoring\n");
2794 				ehc->i.action &= ~ATA_EH_RESET;
2795 
2796 				ata_for_each_dev(dev, link, ALL)
2797 					classes[dev->devno] = ATA_DEV_NONE;
2798 
2799 				rc = 0;
2800 			} else
2801 				ata_link_err(link,
2802 					     "prereset failed (errno=%d)\n",
2803 					     rc);
2804 			goto out;
2805 		}
2806 
2807 		/* prereset() might have cleared ATA_EH_RESET.  If so,
2808 		 * bang classes, thaw and return.
2809 		 */
2810 		if (reset && !(ehc->i.action & ATA_EH_RESET)) {
2811 			ata_for_each_dev(dev, link, ALL)
2812 				classes[dev->devno] = ATA_DEV_NONE;
2813 			if ((ap->pflags & ATA_PFLAG_FROZEN) &&
2814 			    ata_is_host_link(link))
2815 				ata_eh_thaw_port(ap);
2816 			rc = 0;
2817 			goto out;
2818 		}
2819 	}
2820 
2821  retry:
2822 	/*
2823 	 * Perform reset
2824 	 */
2825 	if (ata_is_host_link(link))
2826 		ata_eh_freeze_port(ap);
2827 
2828 	deadline = ata_deadline(jiffies, ata_eh_reset_timeouts[try++]);
2829 
2830 	if (reset) {
2831 		if (verbose)
2832 			ata_link_info(link, "%s resetting link\n",
2833 				      reset == softreset ? "soft" : "hard");
2834 
2835 		/* mark that this EH session started with reset */
2836 		ehc->last_reset = jiffies;
2837 		if (reset == hardreset)
2838 			ehc->i.flags |= ATA_EHI_DID_HARDRESET;
2839 		else
2840 			ehc->i.flags |= ATA_EHI_DID_SOFTRESET;
2841 
2842 		rc = ata_do_reset(link, reset, classes, deadline, true);
2843 		if (rc && rc != -EAGAIN) {
2844 			failed_link = link;
2845 			goto fail;
2846 		}
2847 
2848 		/* hardreset slave link if existent */
2849 		if (slave && reset == hardreset) {
2850 			int tmp;
2851 
2852 			if (verbose)
2853 				ata_link_info(slave, "hard resetting link\n");
2854 
2855 			ata_eh_about_to_do(slave, NULL, ATA_EH_RESET);
2856 			tmp = ata_do_reset(slave, reset, classes, deadline,
2857 					   false);
2858 			switch (tmp) {
2859 			case -EAGAIN:
2860 				rc = -EAGAIN;
2861 			case 0:
2862 				break;
2863 			default:
2864 				failed_link = slave;
2865 				rc = tmp;
2866 				goto fail;
2867 			}
2868 		}
2869 
2870 		/* perform follow-up SRST if necessary */
2871 		if (reset == hardreset &&
2872 		    ata_eh_followup_srst_needed(link, rc)) {
2873 			reset = softreset;
2874 
2875 			if (!reset) {
2876 				ata_link_err(link,
2877 	     "follow-up softreset required but no softreset available\n");
2878 				failed_link = link;
2879 				rc = -EINVAL;
2880 				goto fail;
2881 			}
2882 
2883 			ata_eh_about_to_do(link, NULL, ATA_EH_RESET);
2884 			rc = ata_do_reset(link, reset, classes, deadline, true);
2885 			if (rc) {
2886 				failed_link = link;
2887 				goto fail;
2888 			}
2889 		}
2890 	} else {
2891 		if (verbose)
2892 			ata_link_info(link,
2893 	"no reset method available, skipping reset\n");
2894 		if (!(lflags & ATA_LFLAG_ASSUME_CLASS))
2895 			lflags |= ATA_LFLAG_ASSUME_ATA;
2896 	}
2897 
2898 	/*
2899 	 * Post-reset processing
2900 	 */
2901 	ata_for_each_dev(dev, link, ALL) {
2902 		/* After the reset, the device state is PIO 0 and the
2903 		 * controller state is undefined.  Reset also wakes up
2904 		 * drives from sleeping mode.
2905 		 */
2906 		dev->pio_mode = XFER_PIO_0;
2907 		dev->flags &= ~ATA_DFLAG_SLEEPING;
2908 
2909 		if (ata_phys_link_offline(ata_dev_phys_link(dev)))
2910 			continue;
2911 
2912 		/* apply class override */
2913 		if (lflags & ATA_LFLAG_ASSUME_ATA)
2914 			classes[dev->devno] = ATA_DEV_ATA;
2915 		else if (lflags & ATA_LFLAG_ASSUME_SEMB)
2916 			classes[dev->devno] = ATA_DEV_SEMB_UNSUP;
2917 	}
2918 
2919 	/* record current link speed */
2920 	if (sata_scr_read(link, SCR_STATUS, &sstatus) == 0)
2921 		link->sata_spd = (sstatus >> 4) & 0xf;
2922 	if (slave && sata_scr_read(slave, SCR_STATUS, &sstatus) == 0)
2923 		slave->sata_spd = (sstatus >> 4) & 0xf;
2924 
2925 	/* thaw the port */
2926 	if (ata_is_host_link(link))
2927 		ata_eh_thaw_port(ap);
2928 
2929 	/* postreset() should clear hardware SError.  Although SError
2930 	 * is cleared during link resume, clearing SError here is
2931 	 * necessary as some PHYs raise hotplug events after SRST.
2932 	 * This introduces race condition where hotplug occurs between
2933 	 * reset and here.  This race is mediated by cross checking
2934 	 * link onlineness and classification result later.
2935 	 */
2936 	if (postreset) {
2937 		postreset(link, classes);
2938 		if (slave)
2939 			postreset(slave, classes);
2940 	}
2941 
2942 	/*
2943 	 * Some controllers can't be frozen very well and may set spurious
2944 	 * error conditions during reset.  Clear accumulated error
2945 	 * information and re-thaw the port if frozen.  As reset is the
2946 	 * final recovery action and we cross check link onlineness against
2947 	 * device classification later, no hotplug event is lost by this.
2948 	 */
2949 	spin_lock_irqsave(link->ap->lock, flags);
2950 	memset(&link->eh_info, 0, sizeof(link->eh_info));
2951 	if (slave)
2952 		memset(&slave->eh_info, 0, sizeof(link->eh_info));
2953 	ap->pflags &= ~ATA_PFLAG_EH_PENDING;
2954 	spin_unlock_irqrestore(link->ap->lock, flags);
2955 
2956 	if (ap->pflags & ATA_PFLAG_FROZEN)
2957 		ata_eh_thaw_port(ap);
2958 
2959 	/*
2960 	 * Make sure onlineness and classification result correspond.
2961 	 * Hotplug could have happened during reset and some
2962 	 * controllers fail to wait while a drive is spinning up after
2963 	 * being hotplugged causing misdetection.  By cross checking
2964 	 * link on/offlineness and classification result, those
2965 	 * conditions can be reliably detected and retried.
2966 	 */
2967 	nr_unknown = 0;
2968 	ata_for_each_dev(dev, link, ALL) {
2969 		if (ata_phys_link_online(ata_dev_phys_link(dev))) {
2970 			if (classes[dev->devno] == ATA_DEV_UNKNOWN) {
2971 				ata_dev_dbg(dev, "link online but device misclassified\n");
2972 				classes[dev->devno] = ATA_DEV_NONE;
2973 				nr_unknown++;
2974 			}
2975 		} else if (ata_phys_link_offline(ata_dev_phys_link(dev))) {
2976 			if (ata_class_enabled(classes[dev->devno]))
2977 				ata_dev_dbg(dev,
2978 					    "link offline, clearing class %d to NONE\n",
2979 					    classes[dev->devno]);
2980 			classes[dev->devno] = ATA_DEV_NONE;
2981 		} else if (classes[dev->devno] == ATA_DEV_UNKNOWN) {
2982 			ata_dev_dbg(dev,
2983 				    "link status unknown, clearing UNKNOWN to NONE\n");
2984 			classes[dev->devno] = ATA_DEV_NONE;
2985 		}
2986 	}
2987 
2988 	if (classify && nr_unknown) {
2989 		if (try < max_tries) {
2990 			ata_link_warn(link,
2991 				      "link online but %d devices misclassified, retrying\n",
2992 				      nr_unknown);
2993 			failed_link = link;
2994 			rc = -EAGAIN;
2995 			goto fail;
2996 		}
2997 		ata_link_warn(link,
2998 			      "link online but %d devices misclassified, "
2999 			      "device detection might fail\n", nr_unknown);
3000 	}
3001 
3002 	/* reset successful, schedule revalidation */
3003 	ata_eh_done(link, NULL, ATA_EH_RESET);
3004 	if (slave)
3005 		ata_eh_done(slave, NULL, ATA_EH_RESET);
3006 	ehc->last_reset = jiffies;		/* update to completion time */
3007 	ehc->i.action |= ATA_EH_REVALIDATE;
3008 	link->lpm_policy = ATA_LPM_UNKNOWN;	/* reset LPM state */
3009 
3010 	rc = 0;
3011  out:
3012 	/* clear hotplug flag */
3013 	ehc->i.flags &= ~ATA_EHI_HOTPLUGGED;
3014 	if (slave)
3015 		sehc->i.flags &= ~ATA_EHI_HOTPLUGGED;
3016 
3017 	spin_lock_irqsave(ap->lock, flags);
3018 	ap->pflags &= ~ATA_PFLAG_RESETTING;
3019 	spin_unlock_irqrestore(ap->lock, flags);
3020 
3021 	return rc;
3022 
3023  fail:
3024 	/* if SCR isn't accessible on a fan-out port, PMP needs to be reset */
3025 	if (!ata_is_host_link(link) &&
3026 	    sata_scr_read(link, SCR_STATUS, &sstatus))
3027 		rc = -ERESTART;
3028 
3029 	if (try >= max_tries) {
3030 		/*
3031 		 * Thaw host port even if reset failed, so that the port
3032 		 * can be retried on the next phy event.  This risks
3033 		 * repeated EH runs but seems to be a better tradeoff than
3034 		 * shutting down a port after a botched hotplug attempt.
3035 		 */
3036 		if (ata_is_host_link(link))
3037 			ata_eh_thaw_port(ap);
3038 		goto out;
3039 	}
3040 
3041 	now = jiffies;
3042 	if (time_before(now, deadline)) {
3043 		unsigned long delta = deadline - now;
3044 
3045 		ata_link_warn(failed_link,
3046 			"reset failed (errno=%d), retrying in %u secs\n",
3047 			rc, DIV_ROUND_UP(jiffies_to_msecs(delta), 1000));
3048 
3049 		ata_eh_release(ap);
3050 		while (delta)
3051 			delta = schedule_timeout_uninterruptible(delta);
3052 		ata_eh_acquire(ap);
3053 	}
3054 
3055 	/*
3056 	 * While disks spinup behind PMP, some controllers fail sending SRST.
3057 	 * They need to be reset - as well as the PMP - before retrying.
3058 	 */
3059 	if (rc == -ERESTART) {
3060 		if (ata_is_host_link(link))
3061 			ata_eh_thaw_port(ap);
3062 		goto out;
3063 	}
3064 
3065 	if (try == max_tries - 1) {
3066 		sata_down_spd_limit(link, 0);
3067 		if (slave)
3068 			sata_down_spd_limit(slave, 0);
3069 	} else if (rc == -EPIPE)
3070 		sata_down_spd_limit(failed_link, 0);
3071 
3072 	if (hardreset)
3073 		reset = hardreset;
3074 	goto retry;
3075 }
3076 
ata_eh_pull_park_action(struct ata_port * ap)3077 static inline void ata_eh_pull_park_action(struct ata_port *ap)
3078 {
3079 	struct ata_link *link;
3080 	struct ata_device *dev;
3081 	unsigned long flags;
3082 
3083 	/*
3084 	 * This function can be thought of as an extended version of
3085 	 * ata_eh_about_to_do() specially crafted to accommodate the
3086 	 * requirements of ATA_EH_PARK handling. Since the EH thread
3087 	 * does not leave the do {} while () loop in ata_eh_recover as
3088 	 * long as the timeout for a park request to *one* device on
3089 	 * the port has not expired, and since we still want to pick
3090 	 * up park requests to other devices on the same port or
3091 	 * timeout updates for the same device, we have to pull
3092 	 * ATA_EH_PARK actions from eh_info into eh_context.i
3093 	 * ourselves at the beginning of each pass over the loop.
3094 	 *
3095 	 * Additionally, all write accesses to &ap->park_req_pending
3096 	 * through reinit_completion() (see below) or complete_all()
3097 	 * (see ata_scsi_park_store()) are protected by the host lock.
3098 	 * As a result we have that park_req_pending.done is zero on
3099 	 * exit from this function, i.e. when ATA_EH_PARK actions for
3100 	 * *all* devices on port ap have been pulled into the
3101 	 * respective eh_context structs. If, and only if,
3102 	 * park_req_pending.done is non-zero by the time we reach
3103 	 * wait_for_completion_timeout(), another ATA_EH_PARK action
3104 	 * has been scheduled for at least one of the devices on port
3105 	 * ap and we have to cycle over the do {} while () loop in
3106 	 * ata_eh_recover() again.
3107 	 */
3108 
3109 	spin_lock_irqsave(ap->lock, flags);
3110 	reinit_completion(&ap->park_req_pending);
3111 	ata_for_each_link(link, ap, EDGE) {
3112 		ata_for_each_dev(dev, link, ALL) {
3113 			struct ata_eh_info *ehi = &link->eh_info;
3114 
3115 			link->eh_context.i.dev_action[dev->devno] |=
3116 				ehi->dev_action[dev->devno] & ATA_EH_PARK;
3117 			ata_eh_clear_action(link, dev, ehi, ATA_EH_PARK);
3118 		}
3119 	}
3120 	spin_unlock_irqrestore(ap->lock, flags);
3121 }
3122 
ata_eh_park_issue_cmd(struct ata_device * dev,int park)3123 static void ata_eh_park_issue_cmd(struct ata_device *dev, int park)
3124 {
3125 	struct ata_eh_context *ehc = &dev->link->eh_context;
3126 	struct ata_taskfile tf;
3127 	unsigned int err_mask;
3128 
3129 	ata_tf_init(dev, &tf);
3130 	if (park) {
3131 		ehc->unloaded_mask |= 1 << dev->devno;
3132 		tf.command = ATA_CMD_IDLEIMMEDIATE;
3133 		tf.feature = 0x44;
3134 		tf.lbal = 0x4c;
3135 		tf.lbam = 0x4e;
3136 		tf.lbah = 0x55;
3137 	} else {
3138 		ehc->unloaded_mask &= ~(1 << dev->devno);
3139 		tf.command = ATA_CMD_CHK_POWER;
3140 	}
3141 
3142 	tf.flags |= ATA_TFLAG_DEVICE | ATA_TFLAG_ISADDR;
3143 	tf.protocol = ATA_PROT_NODATA;
3144 	err_mask = ata_exec_internal(dev, &tf, NULL, DMA_NONE, NULL, 0, 0);
3145 	if (park && (err_mask || tf.lbal != 0xc4)) {
3146 		ata_dev_err(dev, "head unload failed!\n");
3147 		ehc->unloaded_mask &= ~(1 << dev->devno);
3148 	}
3149 }
3150 
ata_eh_revalidate_and_attach(struct ata_link * link,struct ata_device ** r_failed_dev)3151 static int ata_eh_revalidate_and_attach(struct ata_link *link,
3152 					struct ata_device **r_failed_dev)
3153 {
3154 	struct ata_port *ap = link->ap;
3155 	struct ata_eh_context *ehc = &link->eh_context;
3156 	struct ata_device *dev;
3157 	unsigned int new_mask = 0;
3158 	unsigned long flags;
3159 	int rc = 0;
3160 
3161 	DPRINTK("ENTER\n");
3162 
3163 	/* For PATA drive side cable detection to work, IDENTIFY must
3164 	 * be done backwards such that PDIAG- is released by the slave
3165 	 * device before the master device is identified.
3166 	 */
3167 	ata_for_each_dev(dev, link, ALL_REVERSE) {
3168 		unsigned int action = ata_eh_dev_action(dev);
3169 		unsigned int readid_flags = 0;
3170 
3171 		if (ehc->i.flags & ATA_EHI_DID_RESET)
3172 			readid_flags |= ATA_READID_POSTRESET;
3173 
3174 		if ((action & ATA_EH_REVALIDATE) && ata_dev_enabled(dev)) {
3175 			WARN_ON(dev->class == ATA_DEV_PMP);
3176 
3177 			if (ata_phys_link_offline(ata_dev_phys_link(dev))) {
3178 				rc = -EIO;
3179 				goto err;
3180 			}
3181 
3182 			ata_eh_about_to_do(link, dev, ATA_EH_REVALIDATE);
3183 			rc = ata_dev_revalidate(dev, ehc->classes[dev->devno],
3184 						readid_flags);
3185 			if (rc)
3186 				goto err;
3187 
3188 			ata_eh_done(link, dev, ATA_EH_REVALIDATE);
3189 
3190 			/* Configuration may have changed, reconfigure
3191 			 * transfer mode.
3192 			 */
3193 			ehc->i.flags |= ATA_EHI_SETMODE;
3194 
3195 			/* schedule the scsi_rescan_device() here */
3196 			schedule_work(&(ap->scsi_rescan_task));
3197 		} else if (dev->class == ATA_DEV_UNKNOWN &&
3198 			   ehc->tries[dev->devno] &&
3199 			   ata_class_enabled(ehc->classes[dev->devno])) {
3200 			/* Temporarily set dev->class, it will be
3201 			 * permanently set once all configurations are
3202 			 * complete.  This is necessary because new
3203 			 * device configuration is done in two
3204 			 * separate loops.
3205 			 */
3206 			dev->class = ehc->classes[dev->devno];
3207 
3208 			if (dev->class == ATA_DEV_PMP)
3209 				rc = sata_pmp_attach(dev);
3210 			else
3211 				rc = ata_dev_read_id(dev, &dev->class,
3212 						     readid_flags, dev->id);
3213 
3214 			/* read_id might have changed class, store and reset */
3215 			ehc->classes[dev->devno] = dev->class;
3216 			dev->class = ATA_DEV_UNKNOWN;
3217 
3218 			switch (rc) {
3219 			case 0:
3220 				/* clear error info accumulated during probe */
3221 				ata_ering_clear(&dev->ering);
3222 				new_mask |= 1 << dev->devno;
3223 				break;
3224 			case -ENOENT:
3225 				/* IDENTIFY was issued to non-existent
3226 				 * device.  No need to reset.  Just
3227 				 * thaw and ignore the device.
3228 				 */
3229 				ata_eh_thaw_port(ap);
3230 				break;
3231 			default:
3232 				goto err;
3233 			}
3234 		}
3235 	}
3236 
3237 	/* PDIAG- should have been released, ask cable type if post-reset */
3238 	if ((ehc->i.flags & ATA_EHI_DID_RESET) && ata_is_host_link(link)) {
3239 		if (ap->ops->cable_detect)
3240 			ap->cbl = ap->ops->cable_detect(ap);
3241 		ata_force_cbl(ap);
3242 	}
3243 
3244 	/* Configure new devices forward such that user doesn't see
3245 	 * device detection messages backwards.
3246 	 */
3247 	ata_for_each_dev(dev, link, ALL) {
3248 		if (!(new_mask & (1 << dev->devno)))
3249 			continue;
3250 
3251 		dev->class = ehc->classes[dev->devno];
3252 
3253 		if (dev->class == ATA_DEV_PMP)
3254 			continue;
3255 
3256 		ehc->i.flags |= ATA_EHI_PRINTINFO;
3257 		rc = ata_dev_configure(dev);
3258 		ehc->i.flags &= ~ATA_EHI_PRINTINFO;
3259 		if (rc) {
3260 			dev->class = ATA_DEV_UNKNOWN;
3261 			goto err;
3262 		}
3263 
3264 		spin_lock_irqsave(ap->lock, flags);
3265 		ap->pflags |= ATA_PFLAG_SCSI_HOTPLUG;
3266 		spin_unlock_irqrestore(ap->lock, flags);
3267 
3268 		/* new device discovered, configure xfermode */
3269 		ehc->i.flags |= ATA_EHI_SETMODE;
3270 	}
3271 
3272 	return 0;
3273 
3274  err:
3275 	*r_failed_dev = dev;
3276 	DPRINTK("EXIT rc=%d\n", rc);
3277 	return rc;
3278 }
3279 
3280 /**
3281  *	ata_set_mode - Program timings and issue SET FEATURES - XFER
3282  *	@link: link on which timings will be programmed
3283  *	@r_failed_dev: out parameter for failed device
3284  *
3285  *	Set ATA device disk transfer mode (PIO3, UDMA6, etc.).  If
3286  *	ata_set_mode() fails, pointer to the failing device is
3287  *	returned in @r_failed_dev.
3288  *
3289  *	LOCKING:
3290  *	PCI/etc. bus probe sem.
3291  *
3292  *	RETURNS:
3293  *	0 on success, negative errno otherwise
3294  */
ata_set_mode(struct ata_link * link,struct ata_device ** r_failed_dev)3295 int ata_set_mode(struct ata_link *link, struct ata_device **r_failed_dev)
3296 {
3297 	struct ata_port *ap = link->ap;
3298 	struct ata_device *dev;
3299 	int rc;
3300 
3301 	/* if data transfer is verified, clear DUBIOUS_XFER on ering top */
3302 	ata_for_each_dev(dev, link, ENABLED) {
3303 		if (!(dev->flags & ATA_DFLAG_DUBIOUS_XFER)) {
3304 			struct ata_ering_entry *ent;
3305 
3306 			ent = ata_ering_top(&dev->ering);
3307 			if (ent)
3308 				ent->eflags &= ~ATA_EFLAG_DUBIOUS_XFER;
3309 		}
3310 	}
3311 
3312 	/* has private set_mode? */
3313 	if (ap->ops->set_mode)
3314 		rc = ap->ops->set_mode(link, r_failed_dev);
3315 	else
3316 		rc = ata_do_set_mode(link, r_failed_dev);
3317 
3318 	/* if transfer mode has changed, set DUBIOUS_XFER on device */
3319 	ata_for_each_dev(dev, link, ENABLED) {
3320 		struct ata_eh_context *ehc = &link->eh_context;
3321 		u8 saved_xfer_mode = ehc->saved_xfer_mode[dev->devno];
3322 		u8 saved_ncq = !!(ehc->saved_ncq_enabled & (1 << dev->devno));
3323 
3324 		if (dev->xfer_mode != saved_xfer_mode ||
3325 		    ata_ncq_enabled(dev) != saved_ncq)
3326 			dev->flags |= ATA_DFLAG_DUBIOUS_XFER;
3327 	}
3328 
3329 	return rc;
3330 }
3331 
3332 /**
3333  *	atapi_eh_clear_ua - Clear ATAPI UNIT ATTENTION after reset
3334  *	@dev: ATAPI device to clear UA for
3335  *
3336  *	Resets and other operations can make an ATAPI device raise
3337  *	UNIT ATTENTION which causes the next operation to fail.  This
3338  *	function clears UA.
3339  *
3340  *	LOCKING:
3341  *	EH context (may sleep).
3342  *
3343  *	RETURNS:
3344  *	0 on success, -errno on failure.
3345  */
atapi_eh_clear_ua(struct ata_device * dev)3346 static int atapi_eh_clear_ua(struct ata_device *dev)
3347 {
3348 	int i;
3349 
3350 	for (i = 0; i < ATA_EH_UA_TRIES; i++) {
3351 		u8 *sense_buffer = dev->link->ap->sector_buf;
3352 		u8 sense_key = 0;
3353 		unsigned int err_mask;
3354 
3355 		err_mask = atapi_eh_tur(dev, &sense_key);
3356 		if (err_mask != 0 && err_mask != AC_ERR_DEV) {
3357 			ata_dev_warn(dev,
3358 				     "TEST_UNIT_READY failed (err_mask=0x%x)\n",
3359 				     err_mask);
3360 			return -EIO;
3361 		}
3362 
3363 		if (!err_mask || sense_key != UNIT_ATTENTION)
3364 			return 0;
3365 
3366 		err_mask = atapi_eh_request_sense(dev, sense_buffer, sense_key);
3367 		if (err_mask) {
3368 			ata_dev_warn(dev, "failed to clear "
3369 				"UNIT ATTENTION (err_mask=0x%x)\n", err_mask);
3370 			return -EIO;
3371 		}
3372 	}
3373 
3374 	ata_dev_warn(dev, "UNIT ATTENTION persists after %d tries\n",
3375 		     ATA_EH_UA_TRIES);
3376 
3377 	return 0;
3378 }
3379 
3380 /**
3381  *	ata_eh_maybe_retry_flush - Retry FLUSH if necessary
3382  *	@dev: ATA device which may need FLUSH retry
3383  *
3384  *	If @dev failed FLUSH, it needs to be reported upper layer
3385  *	immediately as it means that @dev failed to remap and already
3386  *	lost at least a sector and further FLUSH retrials won't make
3387  *	any difference to the lost sector.  However, if FLUSH failed
3388  *	for other reasons, for example transmission error, FLUSH needs
3389  *	to be retried.
3390  *
3391  *	This function determines whether FLUSH failure retry is
3392  *	necessary and performs it if so.
3393  *
3394  *	RETURNS:
3395  *	0 if EH can continue, -errno if EH needs to be repeated.
3396  */
ata_eh_maybe_retry_flush(struct ata_device * dev)3397 static int ata_eh_maybe_retry_flush(struct ata_device *dev)
3398 {
3399 	struct ata_link *link = dev->link;
3400 	struct ata_port *ap = link->ap;
3401 	struct ata_queued_cmd *qc;
3402 	struct ata_taskfile tf;
3403 	unsigned int err_mask;
3404 	int rc = 0;
3405 
3406 	/* did flush fail for this device? */
3407 	if (!ata_tag_valid(link->active_tag))
3408 		return 0;
3409 
3410 	qc = __ata_qc_from_tag(ap, link->active_tag);
3411 	if (qc->dev != dev || (qc->tf.command != ATA_CMD_FLUSH_EXT &&
3412 			       qc->tf.command != ATA_CMD_FLUSH))
3413 		return 0;
3414 
3415 	/* if the device failed it, it should be reported to upper layers */
3416 	if (qc->err_mask & AC_ERR_DEV)
3417 		return 0;
3418 
3419 	/* flush failed for some other reason, give it another shot */
3420 	ata_tf_init(dev, &tf);
3421 
3422 	tf.command = qc->tf.command;
3423 	tf.flags |= ATA_TFLAG_DEVICE;
3424 	tf.protocol = ATA_PROT_NODATA;
3425 
3426 	ata_dev_warn(dev, "retrying FLUSH 0x%x Emask 0x%x\n",
3427 		       tf.command, qc->err_mask);
3428 
3429 	err_mask = ata_exec_internal(dev, &tf, NULL, DMA_NONE, NULL, 0, 0);
3430 	if (!err_mask) {
3431 		/*
3432 		 * FLUSH is complete but there's no way to
3433 		 * successfully complete a failed command from EH.
3434 		 * Making sure retry is allowed at least once and
3435 		 * retrying it should do the trick - whatever was in
3436 		 * the cache is already on the platter and this won't
3437 		 * cause infinite loop.
3438 		 */
3439 		qc->scsicmd->allowed = max(qc->scsicmd->allowed, 1);
3440 	} else {
3441 		ata_dev_warn(dev, "FLUSH failed Emask 0x%x\n",
3442 			       err_mask);
3443 		rc = -EIO;
3444 
3445 		/* if device failed it, report it to upper layers */
3446 		if (err_mask & AC_ERR_DEV) {
3447 			qc->err_mask |= AC_ERR_DEV;
3448 			qc->result_tf = tf;
3449 			if (!(ap->pflags & ATA_PFLAG_FROZEN))
3450 				rc = 0;
3451 		}
3452 	}
3453 	return rc;
3454 }
3455 
3456 /**
3457  *	ata_eh_set_lpm - configure SATA interface power management
3458  *	@link: link to configure power management
3459  *	@policy: the link power management policy
3460  *	@r_failed_dev: out parameter for failed device
3461  *
3462  *	Enable SATA Interface power management.  This will enable
3463  *	Device Interface Power Management (DIPM) for min_power
3464  * 	policy, and then call driver specific callbacks for
3465  *	enabling Host Initiated Power management.
3466  *
3467  *	LOCKING:
3468  *	EH context.
3469  *
3470  *	RETURNS:
3471  *	0 on success, -errno on failure.
3472  */
ata_eh_set_lpm(struct ata_link * link,enum ata_lpm_policy policy,struct ata_device ** r_failed_dev)3473 static int ata_eh_set_lpm(struct ata_link *link, enum ata_lpm_policy policy,
3474 			  struct ata_device **r_failed_dev)
3475 {
3476 	struct ata_port *ap = ata_is_host_link(link) ? link->ap : NULL;
3477 	struct ata_eh_context *ehc = &link->eh_context;
3478 	struct ata_device *dev, *link_dev = NULL, *lpm_dev = NULL;
3479 	enum ata_lpm_policy old_policy = link->lpm_policy;
3480 	bool no_dipm = link->ap->flags & ATA_FLAG_NO_DIPM;
3481 	unsigned int hints = ATA_LPM_EMPTY | ATA_LPM_HIPM;
3482 	unsigned int err_mask;
3483 	int rc;
3484 
3485 	/* if the link or host doesn't do LPM, noop */
3486 	if ((link->flags & ATA_LFLAG_NO_LPM) || (ap && !ap->ops->set_lpm))
3487 		return 0;
3488 
3489 	/*
3490 	 * DIPM is enabled only for MIN_POWER as some devices
3491 	 * misbehave when the host NACKs transition to SLUMBER.  Order
3492 	 * device and link configurations such that the host always
3493 	 * allows DIPM requests.
3494 	 */
3495 	ata_for_each_dev(dev, link, ENABLED) {
3496 		bool hipm = ata_id_has_hipm(dev->id);
3497 		bool dipm = ata_id_has_dipm(dev->id) && !no_dipm;
3498 
3499 		/* find the first enabled and LPM enabled devices */
3500 		if (!link_dev)
3501 			link_dev = dev;
3502 
3503 		if (!lpm_dev && (hipm || dipm))
3504 			lpm_dev = dev;
3505 
3506 		hints &= ~ATA_LPM_EMPTY;
3507 		if (!hipm)
3508 			hints &= ~ATA_LPM_HIPM;
3509 
3510 		/* disable DIPM before changing link config */
3511 		if (policy != ATA_LPM_MIN_POWER && dipm) {
3512 			err_mask = ata_dev_set_feature(dev,
3513 					SETFEATURES_SATA_DISABLE, SATA_DIPM);
3514 			if (err_mask && err_mask != AC_ERR_DEV) {
3515 				ata_dev_warn(dev,
3516 					     "failed to disable DIPM, Emask 0x%x\n",
3517 					     err_mask);
3518 				rc = -EIO;
3519 				goto fail;
3520 			}
3521 		}
3522 	}
3523 
3524 	if (ap) {
3525 		rc = ap->ops->set_lpm(link, policy, hints);
3526 		if (!rc && ap->slave_link)
3527 			rc = ap->ops->set_lpm(ap->slave_link, policy, hints);
3528 	} else
3529 		rc = sata_pmp_set_lpm(link, policy, hints);
3530 
3531 	/*
3532 	 * Attribute link config failure to the first (LPM) enabled
3533 	 * device on the link.
3534 	 */
3535 	if (rc) {
3536 		if (rc == -EOPNOTSUPP) {
3537 			link->flags |= ATA_LFLAG_NO_LPM;
3538 			return 0;
3539 		}
3540 		dev = lpm_dev ? lpm_dev : link_dev;
3541 		goto fail;
3542 	}
3543 
3544 	/*
3545 	 * Low level driver acked the transition.  Issue DIPM command
3546 	 * with the new policy set.
3547 	 */
3548 	link->lpm_policy = policy;
3549 	if (ap && ap->slave_link)
3550 		ap->slave_link->lpm_policy = policy;
3551 
3552 	/* host config updated, enable DIPM if transitioning to MIN_POWER */
3553 	ata_for_each_dev(dev, link, ENABLED) {
3554 		if (policy == ATA_LPM_MIN_POWER && !no_dipm &&
3555 		    ata_id_has_dipm(dev->id)) {
3556 			err_mask = ata_dev_set_feature(dev,
3557 					SETFEATURES_SATA_ENABLE, SATA_DIPM);
3558 			if (err_mask && err_mask != AC_ERR_DEV) {
3559 				ata_dev_warn(dev,
3560 					"failed to enable DIPM, Emask 0x%x\n",
3561 					err_mask);
3562 				rc = -EIO;
3563 				goto fail;
3564 			}
3565 		}
3566 	}
3567 
3568 	link->last_lpm_change = jiffies;
3569 	link->flags |= ATA_LFLAG_CHANGED;
3570 
3571 	return 0;
3572 
3573 fail:
3574 	/* restore the old policy */
3575 	link->lpm_policy = old_policy;
3576 	if (ap && ap->slave_link)
3577 		ap->slave_link->lpm_policy = old_policy;
3578 
3579 	/* if no device or only one more chance is left, disable LPM */
3580 	if (!dev || ehc->tries[dev->devno] <= 2) {
3581 		ata_link_warn(link, "disabling LPM on the link\n");
3582 		link->flags |= ATA_LFLAG_NO_LPM;
3583 	}
3584 	if (r_failed_dev)
3585 		*r_failed_dev = dev;
3586 	return rc;
3587 }
3588 
ata_link_nr_enabled(struct ata_link * link)3589 int ata_link_nr_enabled(struct ata_link *link)
3590 {
3591 	struct ata_device *dev;
3592 	int cnt = 0;
3593 
3594 	ata_for_each_dev(dev, link, ENABLED)
3595 		cnt++;
3596 	return cnt;
3597 }
3598 
ata_link_nr_vacant(struct ata_link * link)3599 static int ata_link_nr_vacant(struct ata_link *link)
3600 {
3601 	struct ata_device *dev;
3602 	int cnt = 0;
3603 
3604 	ata_for_each_dev(dev, link, ALL)
3605 		if (dev->class == ATA_DEV_UNKNOWN)
3606 			cnt++;
3607 	return cnt;
3608 }
3609 
ata_eh_skip_recovery(struct ata_link * link)3610 static int ata_eh_skip_recovery(struct ata_link *link)
3611 {
3612 	struct ata_port *ap = link->ap;
3613 	struct ata_eh_context *ehc = &link->eh_context;
3614 	struct ata_device *dev;
3615 
3616 	/* skip disabled links */
3617 	if (link->flags & ATA_LFLAG_DISABLED)
3618 		return 1;
3619 
3620 	/* skip if explicitly requested */
3621 	if (ehc->i.flags & ATA_EHI_NO_RECOVERY)
3622 		return 1;
3623 
3624 	/* thaw frozen port and recover failed devices */
3625 	if ((ap->pflags & ATA_PFLAG_FROZEN) || ata_link_nr_enabled(link))
3626 		return 0;
3627 
3628 	/* reset at least once if reset is requested */
3629 	if ((ehc->i.action & ATA_EH_RESET) &&
3630 	    !(ehc->i.flags & ATA_EHI_DID_RESET))
3631 		return 0;
3632 
3633 	/* skip if class codes for all vacant slots are ATA_DEV_NONE */
3634 	ata_for_each_dev(dev, link, ALL) {
3635 		if (dev->class == ATA_DEV_UNKNOWN &&
3636 		    ehc->classes[dev->devno] != ATA_DEV_NONE)
3637 			return 0;
3638 	}
3639 
3640 	return 1;
3641 }
3642 
ata_count_probe_trials_cb(struct ata_ering_entry * ent,void * void_arg)3643 static int ata_count_probe_trials_cb(struct ata_ering_entry *ent, void *void_arg)
3644 {
3645 	u64 interval = msecs_to_jiffies(ATA_EH_PROBE_TRIAL_INTERVAL);
3646 	u64 now = get_jiffies_64();
3647 	int *trials = void_arg;
3648 
3649 	if ((ent->eflags & ATA_EFLAG_OLD_ER) ||
3650 	    (ent->timestamp < now - min(now, interval)))
3651 		return -1;
3652 
3653 	(*trials)++;
3654 	return 0;
3655 }
3656 
ata_eh_schedule_probe(struct ata_device * dev)3657 static int ata_eh_schedule_probe(struct ata_device *dev)
3658 {
3659 	struct ata_eh_context *ehc = &dev->link->eh_context;
3660 	struct ata_link *link = ata_dev_phys_link(dev);
3661 	int trials = 0;
3662 
3663 	if (!(ehc->i.probe_mask & (1 << dev->devno)) ||
3664 	    (ehc->did_probe_mask & (1 << dev->devno)))
3665 		return 0;
3666 
3667 	ata_eh_detach_dev(dev);
3668 	ata_dev_init(dev);
3669 	ehc->did_probe_mask |= (1 << dev->devno);
3670 	ehc->i.action |= ATA_EH_RESET;
3671 	ehc->saved_xfer_mode[dev->devno] = 0;
3672 	ehc->saved_ncq_enabled &= ~(1 << dev->devno);
3673 
3674 	/* the link maybe in a deep sleep, wake it up */
3675 	if (link->lpm_policy > ATA_LPM_MAX_POWER) {
3676 		if (ata_is_host_link(link))
3677 			link->ap->ops->set_lpm(link, ATA_LPM_MAX_POWER,
3678 					       ATA_LPM_EMPTY);
3679 		else
3680 			sata_pmp_set_lpm(link, ATA_LPM_MAX_POWER,
3681 					 ATA_LPM_EMPTY);
3682 	}
3683 
3684 	/* Record and count probe trials on the ering.  The specific
3685 	 * error mask used is irrelevant.  Because a successful device
3686 	 * detection clears the ering, this count accumulates only if
3687 	 * there are consecutive failed probes.
3688 	 *
3689 	 * If the count is equal to or higher than ATA_EH_PROBE_TRIALS
3690 	 * in the last ATA_EH_PROBE_TRIAL_INTERVAL, link speed is
3691 	 * forced to 1.5Gbps.
3692 	 *
3693 	 * This is to work around cases where failed link speed
3694 	 * negotiation results in device misdetection leading to
3695 	 * infinite DEVXCHG or PHRDY CHG events.
3696 	 */
3697 	ata_ering_record(&dev->ering, 0, AC_ERR_OTHER);
3698 	ata_ering_map(&dev->ering, ata_count_probe_trials_cb, &trials);
3699 
3700 	if (trials > ATA_EH_PROBE_TRIALS)
3701 		sata_down_spd_limit(link, 1);
3702 
3703 	return 1;
3704 }
3705 
ata_eh_handle_dev_fail(struct ata_device * dev,int err)3706 static int ata_eh_handle_dev_fail(struct ata_device *dev, int err)
3707 {
3708 	struct ata_eh_context *ehc = &dev->link->eh_context;
3709 
3710 	/* -EAGAIN from EH routine indicates retry without prejudice.
3711 	 * The requester is responsible for ensuring forward progress.
3712 	 */
3713 	if (err != -EAGAIN)
3714 		ehc->tries[dev->devno]--;
3715 
3716 	switch (err) {
3717 	case -ENODEV:
3718 		/* device missing or wrong IDENTIFY data, schedule probing */
3719 		ehc->i.probe_mask |= (1 << dev->devno);
3720 	case -EINVAL:
3721 		/* give it just one more chance */
3722 		ehc->tries[dev->devno] = min(ehc->tries[dev->devno], 1);
3723 	case -EIO:
3724 		if (ehc->tries[dev->devno] == 1) {
3725 			/* This is the last chance, better to slow
3726 			 * down than lose it.
3727 			 */
3728 			sata_down_spd_limit(ata_dev_phys_link(dev), 0);
3729 			if (dev->pio_mode > XFER_PIO_0)
3730 				ata_down_xfermask_limit(dev, ATA_DNXFER_PIO);
3731 		}
3732 	}
3733 
3734 	if (ata_dev_enabled(dev) && !ehc->tries[dev->devno]) {
3735 		/* disable device if it has used up all its chances */
3736 		ata_dev_disable(dev);
3737 
3738 		/* detach if offline */
3739 		if (ata_phys_link_offline(ata_dev_phys_link(dev)))
3740 			ata_eh_detach_dev(dev);
3741 
3742 		/* schedule probe if necessary */
3743 		if (ata_eh_schedule_probe(dev)) {
3744 			ehc->tries[dev->devno] = ATA_EH_DEV_TRIES;
3745 			memset(ehc->cmd_timeout_idx[dev->devno], 0,
3746 			       sizeof(ehc->cmd_timeout_idx[dev->devno]));
3747 		}
3748 
3749 		return 1;
3750 	} else {
3751 		ehc->i.action |= ATA_EH_RESET;
3752 		return 0;
3753 	}
3754 }
3755 
3756 /**
3757  *	ata_eh_recover - recover host port after error
3758  *	@ap: host port to recover
3759  *	@prereset: prereset method (can be NULL)
3760  *	@softreset: softreset method (can be NULL)
3761  *	@hardreset: hardreset method (can be NULL)
3762  *	@postreset: postreset method (can be NULL)
3763  *	@r_failed_link: out parameter for failed link
3764  *
3765  *	This is the alpha and omega, eum and yang, heart and soul of
3766  *	libata exception handling.  On entry, actions required to
3767  *	recover each link and hotplug requests are recorded in the
3768  *	link's eh_context.  This function executes all the operations
3769  *	with appropriate retrials and fallbacks to resurrect failed
3770  *	devices, detach goners and greet newcomers.
3771  *
3772  *	LOCKING:
3773  *	Kernel thread context (may sleep).
3774  *
3775  *	RETURNS:
3776  *	0 on success, -errno on failure.
3777  */
ata_eh_recover(struct ata_port * ap,ata_prereset_fn_t prereset,ata_reset_fn_t softreset,ata_reset_fn_t hardreset,ata_postreset_fn_t postreset,struct ata_link ** r_failed_link)3778 int ata_eh_recover(struct ata_port *ap, ata_prereset_fn_t prereset,
3779 		   ata_reset_fn_t softreset, ata_reset_fn_t hardreset,
3780 		   ata_postreset_fn_t postreset,
3781 		   struct ata_link **r_failed_link)
3782 {
3783 	struct ata_link *link;
3784 	struct ata_device *dev;
3785 	int rc, nr_fails;
3786 	unsigned long flags, deadline;
3787 
3788 	DPRINTK("ENTER\n");
3789 
3790 	/* prep for recovery */
3791 	ata_for_each_link(link, ap, EDGE) {
3792 		struct ata_eh_context *ehc = &link->eh_context;
3793 
3794 		/* re-enable link? */
3795 		if (ehc->i.action & ATA_EH_ENABLE_LINK) {
3796 			ata_eh_about_to_do(link, NULL, ATA_EH_ENABLE_LINK);
3797 			spin_lock_irqsave(ap->lock, flags);
3798 			link->flags &= ~ATA_LFLAG_DISABLED;
3799 			spin_unlock_irqrestore(ap->lock, flags);
3800 			ata_eh_done(link, NULL, ATA_EH_ENABLE_LINK);
3801 		}
3802 
3803 		ata_for_each_dev(dev, link, ALL) {
3804 			if (link->flags & ATA_LFLAG_NO_RETRY)
3805 				ehc->tries[dev->devno] = 1;
3806 			else
3807 				ehc->tries[dev->devno] = ATA_EH_DEV_TRIES;
3808 
3809 			/* collect port action mask recorded in dev actions */
3810 			ehc->i.action |= ehc->i.dev_action[dev->devno] &
3811 					 ~ATA_EH_PERDEV_MASK;
3812 			ehc->i.dev_action[dev->devno] &= ATA_EH_PERDEV_MASK;
3813 
3814 			/* process hotplug request */
3815 			if (dev->flags & ATA_DFLAG_DETACH)
3816 				ata_eh_detach_dev(dev);
3817 
3818 			/* schedule probe if necessary */
3819 			if (!ata_dev_enabled(dev))
3820 				ata_eh_schedule_probe(dev);
3821 		}
3822 	}
3823 
3824  retry:
3825 	rc = 0;
3826 
3827 	/* if UNLOADING, finish immediately */
3828 	if (ap->pflags & ATA_PFLAG_UNLOADING)
3829 		goto out;
3830 
3831 	/* prep for EH */
3832 	ata_for_each_link(link, ap, EDGE) {
3833 		struct ata_eh_context *ehc = &link->eh_context;
3834 
3835 		/* skip EH if possible. */
3836 		if (ata_eh_skip_recovery(link))
3837 			ehc->i.action = 0;
3838 
3839 		ata_for_each_dev(dev, link, ALL)
3840 			ehc->classes[dev->devno] = ATA_DEV_UNKNOWN;
3841 	}
3842 
3843 	/* reset */
3844 	ata_for_each_link(link, ap, EDGE) {
3845 		struct ata_eh_context *ehc = &link->eh_context;
3846 
3847 		if (!(ehc->i.action & ATA_EH_RESET))
3848 			continue;
3849 
3850 		rc = ata_eh_reset(link, ata_link_nr_vacant(link),
3851 				  prereset, softreset, hardreset, postreset);
3852 		if (rc) {
3853 			ata_link_err(link, "reset failed, giving up\n");
3854 			goto out;
3855 		}
3856 	}
3857 
3858 	do {
3859 		unsigned long now;
3860 
3861 		/*
3862 		 * clears ATA_EH_PARK in eh_info and resets
3863 		 * ap->park_req_pending
3864 		 */
3865 		ata_eh_pull_park_action(ap);
3866 
3867 		deadline = jiffies;
3868 		ata_for_each_link(link, ap, EDGE) {
3869 			ata_for_each_dev(dev, link, ALL) {
3870 				struct ata_eh_context *ehc = &link->eh_context;
3871 				unsigned long tmp;
3872 
3873 				if (dev->class != ATA_DEV_ATA &&
3874 				    dev->class != ATA_DEV_ZAC)
3875 					continue;
3876 				if (!(ehc->i.dev_action[dev->devno] &
3877 				      ATA_EH_PARK))
3878 					continue;
3879 				tmp = dev->unpark_deadline;
3880 				if (time_before(deadline, tmp))
3881 					deadline = tmp;
3882 				else if (time_before_eq(tmp, jiffies))
3883 					continue;
3884 				if (ehc->unloaded_mask & (1 << dev->devno))
3885 					continue;
3886 
3887 				ata_eh_park_issue_cmd(dev, 1);
3888 			}
3889 		}
3890 
3891 		now = jiffies;
3892 		if (time_before_eq(deadline, now))
3893 			break;
3894 
3895 		ata_eh_release(ap);
3896 		deadline = wait_for_completion_timeout(&ap->park_req_pending,
3897 						       deadline - now);
3898 		ata_eh_acquire(ap);
3899 	} while (deadline);
3900 	ata_for_each_link(link, ap, EDGE) {
3901 		ata_for_each_dev(dev, link, ALL) {
3902 			if (!(link->eh_context.unloaded_mask &
3903 			      (1 << dev->devno)))
3904 				continue;
3905 
3906 			ata_eh_park_issue_cmd(dev, 0);
3907 			ata_eh_done(link, dev, ATA_EH_PARK);
3908 		}
3909 	}
3910 
3911 	/* the rest */
3912 	nr_fails = 0;
3913 	ata_for_each_link(link, ap, PMP_FIRST) {
3914 		struct ata_eh_context *ehc = &link->eh_context;
3915 
3916 		if (sata_pmp_attached(ap) && ata_is_host_link(link))
3917 			goto config_lpm;
3918 
3919 		/* revalidate existing devices and attach new ones */
3920 		rc = ata_eh_revalidate_and_attach(link, &dev);
3921 		if (rc)
3922 			goto rest_fail;
3923 
3924 		/* if PMP got attached, return, pmp EH will take care of it */
3925 		if (link->device->class == ATA_DEV_PMP) {
3926 			ehc->i.action = 0;
3927 			return 0;
3928 		}
3929 
3930 		/* configure transfer mode if necessary */
3931 		if (ehc->i.flags & ATA_EHI_SETMODE) {
3932 			rc = ata_set_mode(link, &dev);
3933 			if (rc)
3934 				goto rest_fail;
3935 			ehc->i.flags &= ~ATA_EHI_SETMODE;
3936 		}
3937 
3938 		/* If reset has been issued, clear UA to avoid
3939 		 * disrupting the current users of the device.
3940 		 */
3941 		if (ehc->i.flags & ATA_EHI_DID_RESET) {
3942 			ata_for_each_dev(dev, link, ALL) {
3943 				if (dev->class != ATA_DEV_ATAPI)
3944 					continue;
3945 				rc = atapi_eh_clear_ua(dev);
3946 				if (rc)
3947 					goto rest_fail;
3948 				if (zpodd_dev_enabled(dev))
3949 					zpodd_post_poweron(dev);
3950 			}
3951 		}
3952 
3953 		/* retry flush if necessary */
3954 		ata_for_each_dev(dev, link, ALL) {
3955 			if (dev->class != ATA_DEV_ATA &&
3956 			    dev->class != ATA_DEV_ZAC)
3957 				continue;
3958 			rc = ata_eh_maybe_retry_flush(dev);
3959 			if (rc)
3960 				goto rest_fail;
3961 		}
3962 
3963 	config_lpm:
3964 		/* configure link power saving */
3965 		if (link->lpm_policy != ap->target_lpm_policy) {
3966 			rc = ata_eh_set_lpm(link, ap->target_lpm_policy, &dev);
3967 			if (rc)
3968 				goto rest_fail;
3969 		}
3970 
3971 		/* this link is okay now */
3972 		ehc->i.flags = 0;
3973 		continue;
3974 
3975 	rest_fail:
3976 		nr_fails++;
3977 		if (dev)
3978 			ata_eh_handle_dev_fail(dev, rc);
3979 
3980 		if (ap->pflags & ATA_PFLAG_FROZEN) {
3981 			/* PMP reset requires working host port.
3982 			 * Can't retry if it's frozen.
3983 			 */
3984 			if (sata_pmp_attached(ap))
3985 				goto out;
3986 			break;
3987 		}
3988 	}
3989 
3990 	if (nr_fails)
3991 		goto retry;
3992 
3993  out:
3994 	if (rc && r_failed_link)
3995 		*r_failed_link = link;
3996 
3997 	DPRINTK("EXIT, rc=%d\n", rc);
3998 	return rc;
3999 }
4000 
4001 /**
4002  *	ata_eh_finish - finish up EH
4003  *	@ap: host port to finish EH for
4004  *
4005  *	Recovery is complete.  Clean up EH states and retry or finish
4006  *	failed qcs.
4007  *
4008  *	LOCKING:
4009  *	None.
4010  */
ata_eh_finish(struct ata_port * ap)4011 void ata_eh_finish(struct ata_port *ap)
4012 {
4013 	int tag;
4014 
4015 	/* retry or finish qcs */
4016 	for (tag = 0; tag < ATA_MAX_QUEUE; tag++) {
4017 		struct ata_queued_cmd *qc = __ata_qc_from_tag(ap, tag);
4018 
4019 		if (!(qc->flags & ATA_QCFLAG_FAILED))
4020 			continue;
4021 
4022 		if (qc->err_mask) {
4023 			/* FIXME: Once EH migration is complete,
4024 			 * generate sense data in this function,
4025 			 * considering both err_mask and tf.
4026 			 */
4027 			if (qc->flags & ATA_QCFLAG_RETRY)
4028 				ata_eh_qc_retry(qc);
4029 			else
4030 				ata_eh_qc_complete(qc);
4031 		} else {
4032 			if (qc->flags & ATA_QCFLAG_SENSE_VALID) {
4033 				ata_eh_qc_complete(qc);
4034 			} else {
4035 				/* feed zero TF to sense generation */
4036 				memset(&qc->result_tf, 0, sizeof(qc->result_tf));
4037 				ata_eh_qc_retry(qc);
4038 			}
4039 		}
4040 	}
4041 
4042 	/* make sure nr_active_links is zero after EH */
4043 	WARN_ON(ap->nr_active_links);
4044 	ap->nr_active_links = 0;
4045 }
4046 
4047 /**
4048  *	ata_do_eh - do standard error handling
4049  *	@ap: host port to handle error for
4050  *
4051  *	@prereset: prereset method (can be NULL)
4052  *	@softreset: softreset method (can be NULL)
4053  *	@hardreset: hardreset method (can be NULL)
4054  *	@postreset: postreset method (can be NULL)
4055  *
4056  *	Perform standard error handling sequence.
4057  *
4058  *	LOCKING:
4059  *	Kernel thread context (may sleep).
4060  */
ata_do_eh(struct ata_port * ap,ata_prereset_fn_t prereset,ata_reset_fn_t softreset,ata_reset_fn_t hardreset,ata_postreset_fn_t postreset)4061 void ata_do_eh(struct ata_port *ap, ata_prereset_fn_t prereset,
4062 	       ata_reset_fn_t softreset, ata_reset_fn_t hardreset,
4063 	       ata_postreset_fn_t postreset)
4064 {
4065 	struct ata_device *dev;
4066 	int rc;
4067 
4068 	ata_eh_autopsy(ap);
4069 	ata_eh_report(ap);
4070 
4071 	rc = ata_eh_recover(ap, prereset, softreset, hardreset, postreset,
4072 			    NULL);
4073 	if (rc) {
4074 		ata_for_each_dev(dev, &ap->link, ALL)
4075 			ata_dev_disable(dev);
4076 	}
4077 
4078 	ata_eh_finish(ap);
4079 }
4080 
4081 /**
4082  *	ata_std_error_handler - standard error handler
4083  *	@ap: host port to handle error for
4084  *
4085  *	Standard error handler
4086  *
4087  *	LOCKING:
4088  *	Kernel thread context (may sleep).
4089  */
ata_std_error_handler(struct ata_port * ap)4090 void ata_std_error_handler(struct ata_port *ap)
4091 {
4092 	struct ata_port_operations *ops = ap->ops;
4093 	ata_reset_fn_t hardreset = ops->hardreset;
4094 
4095 	/* ignore built-in hardreset if SCR access is not available */
4096 	if (hardreset == sata_std_hardreset && !sata_scr_valid(&ap->link))
4097 		hardreset = NULL;
4098 
4099 	ata_do_eh(ap, ops->prereset, ops->softreset, hardreset, ops->postreset);
4100 }
4101 
4102 #ifdef CONFIG_PM
4103 /**
4104  *	ata_eh_handle_port_suspend - perform port suspend operation
4105  *	@ap: port to suspend
4106  *
4107  *	Suspend @ap.
4108  *
4109  *	LOCKING:
4110  *	Kernel thread context (may sleep).
4111  */
ata_eh_handle_port_suspend(struct ata_port * ap)4112 static void ata_eh_handle_port_suspend(struct ata_port *ap)
4113 {
4114 	unsigned long flags;
4115 	int rc = 0;
4116 	struct ata_device *dev;
4117 
4118 	/* are we suspending? */
4119 	spin_lock_irqsave(ap->lock, flags);
4120 	if (!(ap->pflags & ATA_PFLAG_PM_PENDING) ||
4121 	    ap->pm_mesg.event & PM_EVENT_RESUME) {
4122 		spin_unlock_irqrestore(ap->lock, flags);
4123 		return;
4124 	}
4125 	spin_unlock_irqrestore(ap->lock, flags);
4126 
4127 	WARN_ON(ap->pflags & ATA_PFLAG_SUSPENDED);
4128 
4129 	/*
4130 	 * If we have a ZPODD attached, check its zero
4131 	 * power ready status before the port is frozen.
4132 	 * Only needed for runtime suspend.
4133 	 */
4134 	if (PMSG_IS_AUTO(ap->pm_mesg)) {
4135 		ata_for_each_dev(dev, &ap->link, ENABLED) {
4136 			if (zpodd_dev_enabled(dev))
4137 				zpodd_on_suspend(dev);
4138 		}
4139 	}
4140 
4141 	/* tell ACPI we're suspending */
4142 	rc = ata_acpi_on_suspend(ap);
4143 	if (rc)
4144 		goto out;
4145 
4146 	/* suspend */
4147 	ata_eh_freeze_port(ap);
4148 
4149 	if (ap->ops->port_suspend)
4150 		rc = ap->ops->port_suspend(ap, ap->pm_mesg);
4151 
4152 	ata_acpi_set_state(ap, ap->pm_mesg);
4153  out:
4154 	/* update the flags */
4155 	spin_lock_irqsave(ap->lock, flags);
4156 
4157 	ap->pflags &= ~ATA_PFLAG_PM_PENDING;
4158 	if (rc == 0)
4159 		ap->pflags |= ATA_PFLAG_SUSPENDED;
4160 	else if (ap->pflags & ATA_PFLAG_FROZEN)
4161 		ata_port_schedule_eh(ap);
4162 
4163 	spin_unlock_irqrestore(ap->lock, flags);
4164 
4165 	return;
4166 }
4167 
4168 /**
4169  *	ata_eh_handle_port_resume - perform port resume operation
4170  *	@ap: port to resume
4171  *
4172  *	Resume @ap.
4173  *
4174  *	LOCKING:
4175  *	Kernel thread context (may sleep).
4176  */
ata_eh_handle_port_resume(struct ata_port * ap)4177 static void ata_eh_handle_port_resume(struct ata_port *ap)
4178 {
4179 	struct ata_link *link;
4180 	struct ata_device *dev;
4181 	unsigned long flags;
4182 
4183 	/* are we resuming? */
4184 	spin_lock_irqsave(ap->lock, flags);
4185 	if (!(ap->pflags & ATA_PFLAG_PM_PENDING) ||
4186 	    !(ap->pm_mesg.event & PM_EVENT_RESUME)) {
4187 		spin_unlock_irqrestore(ap->lock, flags);
4188 		return;
4189 	}
4190 	spin_unlock_irqrestore(ap->lock, flags);
4191 
4192 	WARN_ON(!(ap->pflags & ATA_PFLAG_SUSPENDED));
4193 
4194 	/*
4195 	 * Error timestamps are in jiffies which doesn't run while
4196 	 * suspended and PHY events during resume isn't too uncommon.
4197 	 * When the two are combined, it can lead to unnecessary speed
4198 	 * downs if the machine is suspended and resumed repeatedly.
4199 	 * Clear error history.
4200 	 */
4201 	ata_for_each_link(link, ap, HOST_FIRST)
4202 		ata_for_each_dev(dev, link, ALL)
4203 			ata_ering_clear(&dev->ering);
4204 
4205 	ata_acpi_set_state(ap, ap->pm_mesg);
4206 
4207 	if (ap->ops->port_resume)
4208 		ap->ops->port_resume(ap);
4209 
4210 	/* tell ACPI that we're resuming */
4211 	ata_acpi_on_resume(ap);
4212 
4213 	/* update the flags */
4214 	spin_lock_irqsave(ap->lock, flags);
4215 	ap->pflags &= ~(ATA_PFLAG_PM_PENDING | ATA_PFLAG_SUSPENDED);
4216 	spin_unlock_irqrestore(ap->lock, flags);
4217 }
4218 #endif /* CONFIG_PM */
4219