xref: /openbmc/linux/drivers/dma/ioat/dma.c (revision dfd4f649)
1 /*
2  * Intel I/OAT DMA Linux driver
3  * Copyright(c) 2004 - 2015 Intel Corporation.
4  *
5  * This program is free software; you can redistribute it and/or modify it
6  * under the terms and conditions of the GNU General Public License,
7  * version 2, as published by the Free Software Foundation.
8  *
9  * This program is distributed in the hope that it will be useful, but WITHOUT
10  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
12  * more details.
13  *
14  * The full GNU General Public License is included in this distribution in
15  * the file called "COPYING".
16  *
17  */
18 
19 /*
20  * This driver supports an Intel I/OAT DMA engine, which does asynchronous
21  * copy operations.
22  */
23 
24 #include <linux/init.h>
25 #include <linux/module.h>
26 #include <linux/slab.h>
27 #include <linux/pci.h>
28 #include <linux/interrupt.h>
29 #include <linux/dmaengine.h>
30 #include <linux/delay.h>
31 #include <linux/dma-mapping.h>
32 #include <linux/workqueue.h>
33 #include <linux/prefetch.h>
34 #include <linux/sizes.h>
35 #include "dma.h"
36 #include "registers.h"
37 #include "hw.h"
38 
39 #include "../dmaengine.h"
40 
41 static char *chanerr_str[] = {
42 	"DMA Transfer Source Address Error",
43 	"DMA Transfer Destination Address Error",
44 	"Next Descriptor Address Error",
45 	"Descriptor Error",
46 	"Chan Address Value Error",
47 	"CHANCMD Error",
48 	"Chipset Uncorrectable Data Integrity Error",
49 	"DMA Uncorrectable Data Integrity Error",
50 	"Read Data Error",
51 	"Write Data Error",
52 	"Descriptor Control Error",
53 	"Descriptor Transfer Size Error",
54 	"Completion Address Error",
55 	"Interrupt Configuration Error",
56 	"Super extended descriptor Address Error",
57 	"Unaffiliated Error",
58 	"CRC or XOR P Error",
59 	"XOR Q Error",
60 	"Descriptor Count Error",
61 	"DIF All F detect Error",
62 	"Guard Tag verification Error",
63 	"Application Tag verification Error",
64 	"Reference Tag verification Error",
65 	"Bundle Bit Error",
66 	"Result DIF All F detect Error",
67 	"Result Guard Tag verification Error",
68 	"Result Application Tag verification Error",
69 	"Result Reference Tag verification Error",
70 };
71 
72 static void ioat_eh(struct ioatdma_chan *ioat_chan);
73 
74 static void ioat_print_chanerrs(struct ioatdma_chan *ioat_chan, u32 chanerr)
75 {
76 	int i;
77 
78 	for (i = 0; i < ARRAY_SIZE(chanerr_str); i++) {
79 		if ((chanerr >> i) & 1) {
80 			dev_err(to_dev(ioat_chan), "Err(%d): %s\n",
81 				i, chanerr_str[i]);
82 		}
83 	}
84 }
85 
86 /**
87  * ioat_dma_do_interrupt - handler used for single vector interrupt mode
88  * @irq: interrupt id
89  * @data: interrupt data
90  */
91 irqreturn_t ioat_dma_do_interrupt(int irq, void *data)
92 {
93 	struct ioatdma_device *instance = data;
94 	struct ioatdma_chan *ioat_chan;
95 	unsigned long attnstatus;
96 	int bit;
97 	u8 intrctrl;
98 
99 	intrctrl = readb(instance->reg_base + IOAT_INTRCTRL_OFFSET);
100 
101 	if (!(intrctrl & IOAT_INTRCTRL_MASTER_INT_EN))
102 		return IRQ_NONE;
103 
104 	if (!(intrctrl & IOAT_INTRCTRL_INT_STATUS)) {
105 		writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET);
106 		return IRQ_NONE;
107 	}
108 
109 	attnstatus = readl(instance->reg_base + IOAT_ATTNSTATUS_OFFSET);
110 	for_each_set_bit(bit, &attnstatus, BITS_PER_LONG) {
111 		ioat_chan = ioat_chan_by_index(instance, bit);
112 		if (test_bit(IOAT_RUN, &ioat_chan->state))
113 			tasklet_schedule(&ioat_chan->cleanup_task);
114 	}
115 
116 	writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET);
117 	return IRQ_HANDLED;
118 }
119 
120 /**
121  * ioat_dma_do_interrupt_msix - handler used for vector-per-channel interrupt mode
122  * @irq: interrupt id
123  * @data: interrupt data
124  */
125 irqreturn_t ioat_dma_do_interrupt_msix(int irq, void *data)
126 {
127 	struct ioatdma_chan *ioat_chan = data;
128 
129 	if (test_bit(IOAT_RUN, &ioat_chan->state))
130 		tasklet_schedule(&ioat_chan->cleanup_task);
131 
132 	return IRQ_HANDLED;
133 }
134 
135 void ioat_stop(struct ioatdma_chan *ioat_chan)
136 {
137 	struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
138 	struct pci_dev *pdev = ioat_dma->pdev;
139 	int chan_id = chan_num(ioat_chan);
140 	struct msix_entry *msix;
141 
142 	/* 1/ stop irq from firing tasklets
143 	 * 2/ stop the tasklet from re-arming irqs
144 	 */
145 	clear_bit(IOAT_RUN, &ioat_chan->state);
146 
147 	/* flush inflight interrupts */
148 	switch (ioat_dma->irq_mode) {
149 	case IOAT_MSIX:
150 		msix = &ioat_dma->msix_entries[chan_id];
151 		synchronize_irq(msix->vector);
152 		break;
153 	case IOAT_MSI:
154 	case IOAT_INTX:
155 		synchronize_irq(pdev->irq);
156 		break;
157 	default:
158 		break;
159 	}
160 
161 	/* flush inflight timers */
162 	del_timer_sync(&ioat_chan->timer);
163 
164 	/* flush inflight tasklet runs */
165 	tasklet_kill(&ioat_chan->cleanup_task);
166 
167 	/* final cleanup now that everything is quiesced and can't re-arm */
168 	ioat_cleanup_event((unsigned long)&ioat_chan->dma_chan);
169 }
170 
171 static void __ioat_issue_pending(struct ioatdma_chan *ioat_chan)
172 {
173 	ioat_chan->dmacount += ioat_ring_pending(ioat_chan);
174 	ioat_chan->issued = ioat_chan->head;
175 	writew(ioat_chan->dmacount,
176 	       ioat_chan->reg_base + IOAT_CHAN_DMACOUNT_OFFSET);
177 	dev_dbg(to_dev(ioat_chan),
178 		"%s: head: %#x tail: %#x issued: %#x count: %#x\n",
179 		__func__, ioat_chan->head, ioat_chan->tail,
180 		ioat_chan->issued, ioat_chan->dmacount);
181 }
182 
183 void ioat_issue_pending(struct dma_chan *c)
184 {
185 	struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
186 
187 	if (ioat_ring_pending(ioat_chan)) {
188 		spin_lock_bh(&ioat_chan->prep_lock);
189 		__ioat_issue_pending(ioat_chan);
190 		spin_unlock_bh(&ioat_chan->prep_lock);
191 	}
192 }
193 
194 /**
195  * ioat_update_pending - log pending descriptors
196  * @ioat: ioat+ channel
197  *
198  * Check if the number of unsubmitted descriptors has exceeded the
199  * watermark.  Called with prep_lock held
200  */
201 static void ioat_update_pending(struct ioatdma_chan *ioat_chan)
202 {
203 	if (ioat_ring_pending(ioat_chan) > ioat_pending_level)
204 		__ioat_issue_pending(ioat_chan);
205 }
206 
207 static void __ioat_start_null_desc(struct ioatdma_chan *ioat_chan)
208 {
209 	struct ioat_ring_ent *desc;
210 	struct ioat_dma_descriptor *hw;
211 
212 	if (ioat_ring_space(ioat_chan) < 1) {
213 		dev_err(to_dev(ioat_chan),
214 			"Unable to start null desc - ring full\n");
215 		return;
216 	}
217 
218 	dev_dbg(to_dev(ioat_chan),
219 		"%s: head: %#x tail: %#x issued: %#x\n",
220 		__func__, ioat_chan->head, ioat_chan->tail, ioat_chan->issued);
221 	desc = ioat_get_ring_ent(ioat_chan, ioat_chan->head);
222 
223 	hw = desc->hw;
224 	hw->ctl = 0;
225 	hw->ctl_f.null = 1;
226 	hw->ctl_f.int_en = 1;
227 	hw->ctl_f.compl_write = 1;
228 	/* set size to non-zero value (channel returns error when size is 0) */
229 	hw->size = NULL_DESC_BUFFER_SIZE;
230 	hw->src_addr = 0;
231 	hw->dst_addr = 0;
232 	async_tx_ack(&desc->txd);
233 	ioat_set_chainaddr(ioat_chan, desc->txd.phys);
234 	dump_desc_dbg(ioat_chan, desc);
235 	/* make sure descriptors are written before we submit */
236 	wmb();
237 	ioat_chan->head += 1;
238 	__ioat_issue_pending(ioat_chan);
239 }
240 
241 void ioat_start_null_desc(struct ioatdma_chan *ioat_chan)
242 {
243 	spin_lock_bh(&ioat_chan->prep_lock);
244 	if (!test_bit(IOAT_CHAN_DOWN, &ioat_chan->state))
245 		__ioat_start_null_desc(ioat_chan);
246 	spin_unlock_bh(&ioat_chan->prep_lock);
247 }
248 
249 static void __ioat_restart_chan(struct ioatdma_chan *ioat_chan)
250 {
251 	/* set the tail to be re-issued */
252 	ioat_chan->issued = ioat_chan->tail;
253 	ioat_chan->dmacount = 0;
254 	mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
255 
256 	dev_dbg(to_dev(ioat_chan),
257 		"%s: head: %#x tail: %#x issued: %#x count: %#x\n",
258 		__func__, ioat_chan->head, ioat_chan->tail,
259 		ioat_chan->issued, ioat_chan->dmacount);
260 
261 	if (ioat_ring_pending(ioat_chan)) {
262 		struct ioat_ring_ent *desc;
263 
264 		desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail);
265 		ioat_set_chainaddr(ioat_chan, desc->txd.phys);
266 		__ioat_issue_pending(ioat_chan);
267 	} else
268 		__ioat_start_null_desc(ioat_chan);
269 }
270 
271 static int ioat_quiesce(struct ioatdma_chan *ioat_chan, unsigned long tmo)
272 {
273 	unsigned long end = jiffies + tmo;
274 	int err = 0;
275 	u32 status;
276 
277 	status = ioat_chansts(ioat_chan);
278 	if (is_ioat_active(status) || is_ioat_idle(status))
279 		ioat_suspend(ioat_chan);
280 	while (is_ioat_active(status) || is_ioat_idle(status)) {
281 		if (tmo && time_after(jiffies, end)) {
282 			err = -ETIMEDOUT;
283 			break;
284 		}
285 		status = ioat_chansts(ioat_chan);
286 		cpu_relax();
287 	}
288 
289 	return err;
290 }
291 
292 static int ioat_reset_sync(struct ioatdma_chan *ioat_chan, unsigned long tmo)
293 {
294 	unsigned long end = jiffies + tmo;
295 	int err = 0;
296 
297 	ioat_reset(ioat_chan);
298 	while (ioat_reset_pending(ioat_chan)) {
299 		if (end && time_after(jiffies, end)) {
300 			err = -ETIMEDOUT;
301 			break;
302 		}
303 		cpu_relax();
304 	}
305 
306 	return err;
307 }
308 
309 static dma_cookie_t ioat_tx_submit_unlock(struct dma_async_tx_descriptor *tx)
310 	__releases(&ioat_chan->prep_lock)
311 {
312 	struct dma_chan *c = tx->chan;
313 	struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
314 	dma_cookie_t cookie;
315 
316 	cookie = dma_cookie_assign(tx);
317 	dev_dbg(to_dev(ioat_chan), "%s: cookie: %d\n", __func__, cookie);
318 
319 	if (!test_and_set_bit(IOAT_CHAN_ACTIVE, &ioat_chan->state))
320 		mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
321 
322 	/* make descriptor updates visible before advancing ioat->head,
323 	 * this is purposefully not smp_wmb() since we are also
324 	 * publishing the descriptor updates to a dma device
325 	 */
326 	wmb();
327 
328 	ioat_chan->head += ioat_chan->produce;
329 
330 	ioat_update_pending(ioat_chan);
331 	spin_unlock_bh(&ioat_chan->prep_lock);
332 
333 	return cookie;
334 }
335 
336 static struct ioat_ring_ent *
337 ioat_alloc_ring_ent(struct dma_chan *chan, int idx, gfp_t flags)
338 {
339 	struct ioat_dma_descriptor *hw;
340 	struct ioat_ring_ent *desc;
341 	struct ioatdma_chan *ioat_chan = to_ioat_chan(chan);
342 	int chunk;
343 	dma_addr_t phys;
344 	u8 *pos;
345 	off_t offs;
346 
347 	chunk = idx / IOAT_DESCS_PER_2M;
348 	idx &= (IOAT_DESCS_PER_2M - 1);
349 	offs = idx * IOAT_DESC_SZ;
350 	pos = (u8 *)ioat_chan->descs[chunk].virt + offs;
351 	phys = ioat_chan->descs[chunk].hw + offs;
352 	hw = (struct ioat_dma_descriptor *)pos;
353 	memset(hw, 0, sizeof(*hw));
354 
355 	desc = kmem_cache_zalloc(ioat_cache, flags);
356 	if (!desc)
357 		return NULL;
358 
359 	dma_async_tx_descriptor_init(&desc->txd, chan);
360 	desc->txd.tx_submit = ioat_tx_submit_unlock;
361 	desc->hw = hw;
362 	desc->txd.phys = phys;
363 	return desc;
364 }
365 
366 void ioat_free_ring_ent(struct ioat_ring_ent *desc, struct dma_chan *chan)
367 {
368 	kmem_cache_free(ioat_cache, desc);
369 }
370 
371 struct ioat_ring_ent **
372 ioat_alloc_ring(struct dma_chan *c, int order, gfp_t flags)
373 {
374 	struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
375 	struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
376 	struct ioat_ring_ent **ring;
377 	int total_descs = 1 << order;
378 	int i, chunks;
379 
380 	/* allocate the array to hold the software ring */
381 	ring = kcalloc(total_descs, sizeof(*ring), flags);
382 	if (!ring)
383 		return NULL;
384 
385 	ioat_chan->desc_chunks = chunks = (total_descs * IOAT_DESC_SZ) / SZ_2M;
386 
387 	for (i = 0; i < chunks; i++) {
388 		struct ioat_descs *descs = &ioat_chan->descs[i];
389 
390 		descs->virt = dma_alloc_coherent(to_dev(ioat_chan),
391 						 SZ_2M, &descs->hw, flags);
392 		if (!descs->virt && (i > 0)) {
393 			int idx;
394 
395 			for (idx = 0; idx < i; idx++) {
396 				dma_free_coherent(to_dev(ioat_chan), SZ_2M,
397 						  descs->virt, descs->hw);
398 				descs->virt = NULL;
399 				descs->hw = 0;
400 			}
401 
402 			ioat_chan->desc_chunks = 0;
403 			kfree(ring);
404 			return NULL;
405 		}
406 	}
407 
408 	for (i = 0; i < total_descs; i++) {
409 		ring[i] = ioat_alloc_ring_ent(c, i, flags);
410 		if (!ring[i]) {
411 			int idx;
412 
413 			while (i--)
414 				ioat_free_ring_ent(ring[i], c);
415 
416 			for (idx = 0; idx < ioat_chan->desc_chunks; idx++) {
417 				dma_free_coherent(to_dev(ioat_chan),
418 						  SZ_2M,
419 						  ioat_chan->descs[idx].virt,
420 						  ioat_chan->descs[idx].hw);
421 				ioat_chan->descs[idx].virt = NULL;
422 				ioat_chan->descs[idx].hw = 0;
423 			}
424 
425 			ioat_chan->desc_chunks = 0;
426 			kfree(ring);
427 			return NULL;
428 		}
429 		set_desc_id(ring[i], i);
430 	}
431 
432 	/* link descs */
433 	for (i = 0; i < total_descs-1; i++) {
434 		struct ioat_ring_ent *next = ring[i+1];
435 		struct ioat_dma_descriptor *hw = ring[i]->hw;
436 
437 		hw->next = next->txd.phys;
438 	}
439 	ring[i]->hw->next = ring[0]->txd.phys;
440 
441 	/* setup descriptor pre-fetching for v3.4 */
442 	if (ioat_dma->cap & IOAT_CAP_DPS) {
443 		u16 drsctl = IOAT_CHAN_DRSZ_2MB | IOAT_CHAN_DRS_EN;
444 
445 		if (chunks == 1)
446 			drsctl |= IOAT_CHAN_DRS_AUTOWRAP;
447 
448 		writew(drsctl, ioat_chan->reg_base + IOAT_CHAN_DRSCTL_OFFSET);
449 
450 	}
451 
452 	return ring;
453 }
454 
455 /**
456  * ioat_check_space_lock - verify space and grab ring producer lock
457  * @ioat: ioat,3 channel (ring) to operate on
458  * @num_descs: allocation length
459  */
460 int ioat_check_space_lock(struct ioatdma_chan *ioat_chan, int num_descs)
461 	__acquires(&ioat_chan->prep_lock)
462 {
463 	spin_lock_bh(&ioat_chan->prep_lock);
464 	/* never allow the last descriptor to be consumed, we need at
465 	 * least one free at all times to allow for on-the-fly ring
466 	 * resizing.
467 	 */
468 	if (likely(ioat_ring_space(ioat_chan) > num_descs)) {
469 		dev_dbg(to_dev(ioat_chan), "%s: num_descs: %d (%x:%x:%x)\n",
470 			__func__, num_descs, ioat_chan->head,
471 			ioat_chan->tail, ioat_chan->issued);
472 		ioat_chan->produce = num_descs;
473 		return 0;  /* with ioat->prep_lock held */
474 	}
475 	spin_unlock_bh(&ioat_chan->prep_lock);
476 
477 	dev_dbg_ratelimited(to_dev(ioat_chan),
478 			    "%s: ring full! num_descs: %d (%x:%x:%x)\n",
479 			    __func__, num_descs, ioat_chan->head,
480 			    ioat_chan->tail, ioat_chan->issued);
481 
482 	/* progress reclaim in the allocation failure case we may be
483 	 * called under bh_disabled so we need to trigger the timer
484 	 * event directly
485 	 */
486 	if (time_is_before_jiffies(ioat_chan->timer.expires)
487 	    && timer_pending(&ioat_chan->timer)) {
488 		mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
489 		ioat_timer_event(&ioat_chan->timer);
490 	}
491 
492 	return -ENOMEM;
493 }
494 
495 static bool desc_has_ext(struct ioat_ring_ent *desc)
496 {
497 	struct ioat_dma_descriptor *hw = desc->hw;
498 
499 	if (hw->ctl_f.op == IOAT_OP_XOR ||
500 	    hw->ctl_f.op == IOAT_OP_XOR_VAL) {
501 		struct ioat_xor_descriptor *xor = desc->xor;
502 
503 		if (src_cnt_to_sw(xor->ctl_f.src_cnt) > 5)
504 			return true;
505 	} else if (hw->ctl_f.op == IOAT_OP_PQ ||
506 		   hw->ctl_f.op == IOAT_OP_PQ_VAL) {
507 		struct ioat_pq_descriptor *pq = desc->pq;
508 
509 		if (src_cnt_to_sw(pq->ctl_f.src_cnt) > 3)
510 			return true;
511 	}
512 
513 	return false;
514 }
515 
516 static void
517 ioat_free_sed(struct ioatdma_device *ioat_dma, struct ioat_sed_ent *sed)
518 {
519 	if (!sed)
520 		return;
521 
522 	dma_pool_free(ioat_dma->sed_hw_pool[sed->hw_pool], sed->hw, sed->dma);
523 	kmem_cache_free(ioat_sed_cache, sed);
524 }
525 
526 static u64 ioat_get_current_completion(struct ioatdma_chan *ioat_chan)
527 {
528 	u64 phys_complete;
529 	u64 completion;
530 
531 	completion = *ioat_chan->completion;
532 	phys_complete = ioat_chansts_to_addr(completion);
533 
534 	dev_dbg(to_dev(ioat_chan), "%s: phys_complete: %#llx\n", __func__,
535 		(unsigned long long) phys_complete);
536 
537 	return phys_complete;
538 }
539 
540 static bool ioat_cleanup_preamble(struct ioatdma_chan *ioat_chan,
541 				   u64 *phys_complete)
542 {
543 	*phys_complete = ioat_get_current_completion(ioat_chan);
544 	if (*phys_complete == ioat_chan->last_completion)
545 		return false;
546 
547 	clear_bit(IOAT_COMPLETION_ACK, &ioat_chan->state);
548 	mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
549 
550 	return true;
551 }
552 
553 static void
554 desc_get_errstat(struct ioatdma_chan *ioat_chan, struct ioat_ring_ent *desc)
555 {
556 	struct ioat_dma_descriptor *hw = desc->hw;
557 
558 	switch (hw->ctl_f.op) {
559 	case IOAT_OP_PQ_VAL:
560 	case IOAT_OP_PQ_VAL_16S:
561 	{
562 		struct ioat_pq_descriptor *pq = desc->pq;
563 
564 		/* check if there's error written */
565 		if (!pq->dwbes_f.wbes)
566 			return;
567 
568 		/* need to set a chanerr var for checking to clear later */
569 
570 		if (pq->dwbes_f.p_val_err)
571 			*desc->result |= SUM_CHECK_P_RESULT;
572 
573 		if (pq->dwbes_f.q_val_err)
574 			*desc->result |= SUM_CHECK_Q_RESULT;
575 
576 		return;
577 	}
578 	default:
579 		return;
580 	}
581 }
582 
583 /**
584  * __cleanup - reclaim used descriptors
585  * @ioat: channel (ring) to clean
586  */
587 static void __cleanup(struct ioatdma_chan *ioat_chan, dma_addr_t phys_complete)
588 {
589 	struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
590 	struct ioat_ring_ent *desc;
591 	bool seen_current = false;
592 	int idx = ioat_chan->tail, i;
593 	u16 active;
594 
595 	dev_dbg(to_dev(ioat_chan), "%s: head: %#x tail: %#x issued: %#x\n",
596 		__func__, ioat_chan->head, ioat_chan->tail, ioat_chan->issued);
597 
598 	/*
599 	 * At restart of the channel, the completion address and the
600 	 * channel status will be 0 due to starting a new chain. Since
601 	 * it's new chain and the first descriptor "fails", there is
602 	 * nothing to clean up. We do not want to reap the entire submitted
603 	 * chain due to this 0 address value and then BUG.
604 	 */
605 	if (!phys_complete)
606 		return;
607 
608 	active = ioat_ring_active(ioat_chan);
609 	for (i = 0; i < active && !seen_current; i++) {
610 		struct dma_async_tx_descriptor *tx;
611 
612 		prefetch(ioat_get_ring_ent(ioat_chan, idx + i + 1));
613 		desc = ioat_get_ring_ent(ioat_chan, idx + i);
614 		dump_desc_dbg(ioat_chan, desc);
615 
616 		/* set err stat if we are using dwbes */
617 		if (ioat_dma->cap & IOAT_CAP_DWBES)
618 			desc_get_errstat(ioat_chan, desc);
619 
620 		tx = &desc->txd;
621 		if (tx->cookie) {
622 			dma_cookie_complete(tx);
623 			dma_descriptor_unmap(tx);
624 			dmaengine_desc_get_callback_invoke(tx, NULL);
625 			tx->callback = NULL;
626 			tx->callback_result = NULL;
627 		}
628 
629 		if (tx->phys == phys_complete)
630 			seen_current = true;
631 
632 		/* skip extended descriptors */
633 		if (desc_has_ext(desc)) {
634 			BUG_ON(i + 1 >= active);
635 			i++;
636 		}
637 
638 		/* cleanup super extended descriptors */
639 		if (desc->sed) {
640 			ioat_free_sed(ioat_dma, desc->sed);
641 			desc->sed = NULL;
642 		}
643 	}
644 
645 	/* finish all descriptor reads before incrementing tail */
646 	smp_mb();
647 	ioat_chan->tail = idx + i;
648 	/* no active descs have written a completion? */
649 	BUG_ON(active && !seen_current);
650 	ioat_chan->last_completion = phys_complete;
651 
652 	if (active - i == 0) {
653 		dev_dbg(to_dev(ioat_chan), "%s: cancel completion timeout\n",
654 			__func__);
655 		mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT);
656 	}
657 
658 	/* microsecond delay by sysfs variable  per pending descriptor */
659 	if (ioat_chan->intr_coalesce != ioat_chan->prev_intr_coalesce) {
660 		writew(min((ioat_chan->intr_coalesce * (active - i)),
661 		       IOAT_INTRDELAY_MASK),
662 		       ioat_chan->ioat_dma->reg_base + IOAT_INTRDELAY_OFFSET);
663 		ioat_chan->prev_intr_coalesce = ioat_chan->intr_coalesce;
664 	}
665 }
666 
667 static void ioat_cleanup(struct ioatdma_chan *ioat_chan)
668 {
669 	u64 phys_complete;
670 
671 	spin_lock_bh(&ioat_chan->cleanup_lock);
672 
673 	if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
674 		__cleanup(ioat_chan, phys_complete);
675 
676 	if (is_ioat_halted(*ioat_chan->completion)) {
677 		u32 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
678 
679 		if (chanerr &
680 		    (IOAT_CHANERR_HANDLE_MASK | IOAT_CHANERR_RECOVER_MASK)) {
681 			mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT);
682 			ioat_eh(ioat_chan);
683 		}
684 	}
685 
686 	spin_unlock_bh(&ioat_chan->cleanup_lock);
687 }
688 
689 void ioat_cleanup_event(unsigned long data)
690 {
691 	struct ioatdma_chan *ioat_chan = to_ioat_chan((void *)data);
692 
693 	ioat_cleanup(ioat_chan);
694 	if (!test_bit(IOAT_RUN, &ioat_chan->state))
695 		return;
696 	writew(IOAT_CHANCTRL_RUN, ioat_chan->reg_base + IOAT_CHANCTRL_OFFSET);
697 }
698 
699 static void ioat_restart_channel(struct ioatdma_chan *ioat_chan)
700 {
701 	u64 phys_complete;
702 
703 	/* set the completion address register again */
704 	writel(lower_32_bits(ioat_chan->completion_dma),
705 	       ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_LOW);
706 	writel(upper_32_bits(ioat_chan->completion_dma),
707 	       ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_HIGH);
708 
709 	ioat_quiesce(ioat_chan, 0);
710 	if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
711 		__cleanup(ioat_chan, phys_complete);
712 
713 	__ioat_restart_chan(ioat_chan);
714 }
715 
716 
717 static void ioat_abort_descs(struct ioatdma_chan *ioat_chan)
718 {
719 	struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
720 	struct ioat_ring_ent *desc;
721 	u16 active;
722 	int idx = ioat_chan->tail, i;
723 
724 	/*
725 	 * We assume that the failed descriptor has been processed.
726 	 * Now we are just returning all the remaining submitted
727 	 * descriptors to abort.
728 	 */
729 	active = ioat_ring_active(ioat_chan);
730 
731 	/* we skip the failed descriptor that tail points to */
732 	for (i = 1; i < active; i++) {
733 		struct dma_async_tx_descriptor *tx;
734 
735 		prefetch(ioat_get_ring_ent(ioat_chan, idx + i + 1));
736 		desc = ioat_get_ring_ent(ioat_chan, idx + i);
737 
738 		tx = &desc->txd;
739 		if (tx->cookie) {
740 			struct dmaengine_result res;
741 
742 			dma_cookie_complete(tx);
743 			dma_descriptor_unmap(tx);
744 			res.result = DMA_TRANS_ABORTED;
745 			dmaengine_desc_get_callback_invoke(tx, &res);
746 			tx->callback = NULL;
747 			tx->callback_result = NULL;
748 		}
749 
750 		/* skip extended descriptors */
751 		if (desc_has_ext(desc)) {
752 			WARN_ON(i + 1 >= active);
753 			i++;
754 		}
755 
756 		/* cleanup super extended descriptors */
757 		if (desc->sed) {
758 			ioat_free_sed(ioat_dma, desc->sed);
759 			desc->sed = NULL;
760 		}
761 	}
762 
763 	smp_mb(); /* finish all descriptor reads before incrementing tail */
764 	ioat_chan->tail = idx + active;
765 
766 	desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail);
767 	ioat_chan->last_completion = *ioat_chan->completion = desc->txd.phys;
768 }
769 
770 static void ioat_eh(struct ioatdma_chan *ioat_chan)
771 {
772 	struct pci_dev *pdev = to_pdev(ioat_chan);
773 	struct ioat_dma_descriptor *hw;
774 	struct dma_async_tx_descriptor *tx;
775 	u64 phys_complete;
776 	struct ioat_ring_ent *desc;
777 	u32 err_handled = 0;
778 	u32 chanerr_int;
779 	u32 chanerr;
780 	bool abort = false;
781 	struct dmaengine_result res;
782 
783 	/* cleanup so tail points to descriptor that caused the error */
784 	if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
785 		__cleanup(ioat_chan, phys_complete);
786 
787 	chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
788 	pci_read_config_dword(pdev, IOAT_PCI_CHANERR_INT_OFFSET, &chanerr_int);
789 
790 	dev_dbg(to_dev(ioat_chan), "%s: error = %x:%x\n",
791 		__func__, chanerr, chanerr_int);
792 
793 	desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail);
794 	hw = desc->hw;
795 	dump_desc_dbg(ioat_chan, desc);
796 
797 	switch (hw->ctl_f.op) {
798 	case IOAT_OP_XOR_VAL:
799 		if (chanerr & IOAT_CHANERR_XOR_P_OR_CRC_ERR) {
800 			*desc->result |= SUM_CHECK_P_RESULT;
801 			err_handled |= IOAT_CHANERR_XOR_P_OR_CRC_ERR;
802 		}
803 		break;
804 	case IOAT_OP_PQ_VAL:
805 	case IOAT_OP_PQ_VAL_16S:
806 		if (chanerr & IOAT_CHANERR_XOR_P_OR_CRC_ERR) {
807 			*desc->result |= SUM_CHECK_P_RESULT;
808 			err_handled |= IOAT_CHANERR_XOR_P_OR_CRC_ERR;
809 		}
810 		if (chanerr & IOAT_CHANERR_XOR_Q_ERR) {
811 			*desc->result |= SUM_CHECK_Q_RESULT;
812 			err_handled |= IOAT_CHANERR_XOR_Q_ERR;
813 		}
814 		break;
815 	}
816 
817 	if (chanerr & IOAT_CHANERR_RECOVER_MASK) {
818 		if (chanerr & IOAT_CHANERR_READ_DATA_ERR) {
819 			res.result = DMA_TRANS_READ_FAILED;
820 			err_handled |= IOAT_CHANERR_READ_DATA_ERR;
821 		} else if (chanerr & IOAT_CHANERR_WRITE_DATA_ERR) {
822 			res.result = DMA_TRANS_WRITE_FAILED;
823 			err_handled |= IOAT_CHANERR_WRITE_DATA_ERR;
824 		}
825 
826 		abort = true;
827 	} else
828 		res.result = DMA_TRANS_NOERROR;
829 
830 	/* fault on unhandled error or spurious halt */
831 	if (chanerr ^ err_handled || chanerr == 0) {
832 		dev_err(to_dev(ioat_chan), "%s: fatal error (%x:%x)\n",
833 			__func__, chanerr, err_handled);
834 		dev_err(to_dev(ioat_chan), "Errors handled:\n");
835 		ioat_print_chanerrs(ioat_chan, err_handled);
836 		dev_err(to_dev(ioat_chan), "Errors not handled:\n");
837 		ioat_print_chanerrs(ioat_chan, (chanerr & ~err_handled));
838 
839 		BUG();
840 	}
841 
842 	/* cleanup the faulty descriptor since we are continuing */
843 	tx = &desc->txd;
844 	if (tx->cookie) {
845 		dma_cookie_complete(tx);
846 		dma_descriptor_unmap(tx);
847 		dmaengine_desc_get_callback_invoke(tx, &res);
848 		tx->callback = NULL;
849 		tx->callback_result = NULL;
850 	}
851 
852 	/* mark faulting descriptor as complete */
853 	*ioat_chan->completion = desc->txd.phys;
854 
855 	spin_lock_bh(&ioat_chan->prep_lock);
856 	/* we need abort all descriptors */
857 	if (abort) {
858 		ioat_abort_descs(ioat_chan);
859 		/* clean up the channel, we could be in weird state */
860 		ioat_reset_hw(ioat_chan);
861 	}
862 
863 	writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
864 	pci_write_config_dword(pdev, IOAT_PCI_CHANERR_INT_OFFSET, chanerr_int);
865 
866 	ioat_restart_channel(ioat_chan);
867 	spin_unlock_bh(&ioat_chan->prep_lock);
868 }
869 
870 static void check_active(struct ioatdma_chan *ioat_chan)
871 {
872 	if (ioat_ring_active(ioat_chan)) {
873 		mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
874 		return;
875 	}
876 
877 	if (test_and_clear_bit(IOAT_CHAN_ACTIVE, &ioat_chan->state))
878 		mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT);
879 }
880 
881 void ioat_timer_event(struct timer_list *t)
882 {
883 	struct ioatdma_chan *ioat_chan = from_timer(ioat_chan, t, timer);
884 	dma_addr_t phys_complete;
885 	u64 status;
886 
887 	status = ioat_chansts(ioat_chan);
888 
889 	/* when halted due to errors check for channel
890 	 * programming errors before advancing the completion state
891 	 */
892 	if (is_ioat_halted(status)) {
893 		u32 chanerr;
894 
895 		chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
896 		dev_err(to_dev(ioat_chan), "%s: Channel halted (%x)\n",
897 			__func__, chanerr);
898 		dev_err(to_dev(ioat_chan), "Errors:\n");
899 		ioat_print_chanerrs(ioat_chan, chanerr);
900 
901 		if (test_bit(IOAT_RUN, &ioat_chan->state)) {
902 			spin_lock_bh(&ioat_chan->cleanup_lock);
903 			spin_lock_bh(&ioat_chan->prep_lock);
904 			set_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
905 			spin_unlock_bh(&ioat_chan->prep_lock);
906 
907 			ioat_abort_descs(ioat_chan);
908 			dev_warn(to_dev(ioat_chan), "Reset channel...\n");
909 			ioat_reset_hw(ioat_chan);
910 			dev_warn(to_dev(ioat_chan), "Restart channel...\n");
911 			ioat_restart_channel(ioat_chan);
912 
913 			spin_lock_bh(&ioat_chan->prep_lock);
914 			clear_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
915 			spin_unlock_bh(&ioat_chan->prep_lock);
916 			spin_unlock_bh(&ioat_chan->cleanup_lock);
917 		}
918 
919 		return;
920 	}
921 
922 	spin_lock_bh(&ioat_chan->cleanup_lock);
923 
924 	/* handle the no-actives case */
925 	if (!ioat_ring_active(ioat_chan)) {
926 		spin_lock_bh(&ioat_chan->prep_lock);
927 		check_active(ioat_chan);
928 		spin_unlock_bh(&ioat_chan->prep_lock);
929 		spin_unlock_bh(&ioat_chan->cleanup_lock);
930 		return;
931 	}
932 
933 	/* if we haven't made progress and we have already
934 	 * acknowledged a pending completion once, then be more
935 	 * forceful with a restart
936 	 */
937 	if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
938 		__cleanup(ioat_chan, phys_complete);
939 	else if (test_bit(IOAT_COMPLETION_ACK, &ioat_chan->state)) {
940 		u32 chanerr;
941 
942 		chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
943 		dev_err(to_dev(ioat_chan), "CHANSTS: %#Lx CHANERR: %#x\n",
944 			status, chanerr);
945 		dev_err(to_dev(ioat_chan), "Errors:\n");
946 		ioat_print_chanerrs(ioat_chan, chanerr);
947 
948 		dev_dbg(to_dev(ioat_chan), "Active descriptors: %d\n",
949 			ioat_ring_active(ioat_chan));
950 
951 		spin_lock_bh(&ioat_chan->prep_lock);
952 		set_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
953 		spin_unlock_bh(&ioat_chan->prep_lock);
954 
955 		ioat_abort_descs(ioat_chan);
956 		dev_warn(to_dev(ioat_chan), "Resetting channel...\n");
957 		ioat_reset_hw(ioat_chan);
958 		dev_warn(to_dev(ioat_chan), "Restarting channel...\n");
959 		ioat_restart_channel(ioat_chan);
960 
961 		spin_lock_bh(&ioat_chan->prep_lock);
962 		clear_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
963 		spin_unlock_bh(&ioat_chan->prep_lock);
964 		spin_unlock_bh(&ioat_chan->cleanup_lock);
965 		return;
966 	} else
967 		set_bit(IOAT_COMPLETION_ACK, &ioat_chan->state);
968 
969 	mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
970 	spin_unlock_bh(&ioat_chan->cleanup_lock);
971 }
972 
973 enum dma_status
974 ioat_tx_status(struct dma_chan *c, dma_cookie_t cookie,
975 		struct dma_tx_state *txstate)
976 {
977 	struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
978 	enum dma_status ret;
979 
980 	ret = dma_cookie_status(c, cookie, txstate);
981 	if (ret == DMA_COMPLETE)
982 		return ret;
983 
984 	ioat_cleanup(ioat_chan);
985 
986 	return dma_cookie_status(c, cookie, txstate);
987 }
988 
989 int ioat_reset_hw(struct ioatdma_chan *ioat_chan)
990 {
991 	/* throw away whatever the channel was doing and get it
992 	 * initialized, with ioat3 specific workarounds
993 	 */
994 	struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
995 	struct pci_dev *pdev = ioat_dma->pdev;
996 	u32 chanerr;
997 	u16 dev_id;
998 	int err;
999 
1000 	ioat_quiesce(ioat_chan, msecs_to_jiffies(100));
1001 
1002 	chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
1003 	writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
1004 
1005 	if (ioat_dma->version < IOAT_VER_3_3) {
1006 		/* clear any pending errors */
1007 		err = pci_read_config_dword(pdev,
1008 				IOAT_PCI_CHANERR_INT_OFFSET, &chanerr);
1009 		if (err) {
1010 			dev_err(&pdev->dev,
1011 				"channel error register unreachable\n");
1012 			return err;
1013 		}
1014 		pci_write_config_dword(pdev,
1015 				IOAT_PCI_CHANERR_INT_OFFSET, chanerr);
1016 
1017 		/* Clear DMAUNCERRSTS Cfg-Reg Parity Error status bit
1018 		 * (workaround for spurious config parity error after restart)
1019 		 */
1020 		pci_read_config_word(pdev, IOAT_PCI_DEVICE_ID_OFFSET, &dev_id);
1021 		if (dev_id == PCI_DEVICE_ID_INTEL_IOAT_TBG0) {
1022 			pci_write_config_dword(pdev,
1023 					       IOAT_PCI_DMAUNCERRSTS_OFFSET,
1024 					       0x10);
1025 		}
1026 	}
1027 
1028 	if (is_bwd_ioat(pdev) && (ioat_dma->irq_mode == IOAT_MSIX)) {
1029 		ioat_dma->msixtba0 = readq(ioat_dma->reg_base + 0x1000);
1030 		ioat_dma->msixdata0 = readq(ioat_dma->reg_base + 0x1008);
1031 		ioat_dma->msixpba = readq(ioat_dma->reg_base + 0x1800);
1032 	}
1033 
1034 
1035 	err = ioat_reset_sync(ioat_chan, msecs_to_jiffies(200));
1036 	if (!err) {
1037 		if (is_bwd_ioat(pdev) && (ioat_dma->irq_mode == IOAT_MSIX)) {
1038 			writeq(ioat_dma->msixtba0, ioat_dma->reg_base + 0x1000);
1039 			writeq(ioat_dma->msixdata0, ioat_dma->reg_base + 0x1008);
1040 			writeq(ioat_dma->msixpba, ioat_dma->reg_base + 0x1800);
1041 		}
1042 	}
1043 
1044 	if (err)
1045 		dev_err(&pdev->dev, "Failed to reset: %d\n", err);
1046 
1047 	return err;
1048 }
1049