Linux 4.19.133
[linux/fpc-iii.git] / drivers / dma / ioat / dma.c
blobb94cece58b984fb0ab1a09e50b33ea7a5901816b
/*
 * Intel I/OAT DMA Linux driver
 * Copyright(c) 2004 - 2015 Intel Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * The full GNU General Public License is included in this distribution in
 * the file called "COPYING".
 *
 */

/*
 * This driver supports an Intel I/OAT DMA engine, which does asynchronous
 * copy operations.
 */
24 #include <linux/init.h>
25 #include <linux/module.h>
26 #include <linux/slab.h>
27 #include <linux/pci.h>
28 #include <linux/interrupt.h>
29 #include <linux/dmaengine.h>
30 #include <linux/delay.h>
31 #include <linux/dma-mapping.h>
32 #include <linux/workqueue.h>
33 #include <linux/prefetch.h>
34 #include <linux/sizes.h>
35 #include "dma.h"
36 #include "registers.h"
37 #include "hw.h"
39 #include "../dmaengine.h"
/*
 * Human-readable names for the channel error bits.  The array index is
 * the bit position tested in the CHANERR value by ioat_print_chanerrs().
 * Both the pointers and the strings are read-only, so the table is fully
 * const-qualified.
 */
static const char * const chanerr_str[] = {
	"DMA Transfer Source Address Error",
	"DMA Transfer Destination Address Error",
	"Next Descriptor Address Error",
	"Descriptor Error",
	"Chan Address Value Error",
	"CHANCMD Error",
	"Chipset Uncorrectable Data Integrity Error",
	"DMA Uncorrectable Data Integrity Error",
	"Read Data Error",
	"Write Data Error",
	"Descriptor Control Error",
	"Descriptor Transfer Size Error",
	"Completion Address Error",
	"Interrupt Configuration Error",
	"Super extended descriptor Address Error",
	"Unaffiliated Error",
	"CRC or XOR P Error",
	"XOR Q Error",
	"Descriptor Count Error",
	"DIF All F detect Error",
	"Guard Tag verification Error",
	"Application Tag verification Error",
	"Reference Tag verification Error",
	"Bundle Bit Error",
	"Result DIF All F detect Error",
	"Result Guard Tag verification Error",
	"Result Application Tag verification Error",
	"Result Reference Tag verification Error",
};
/* Forward declaration: ioat_cleanup() calls ioat_eh() before its definition. */
static void ioat_eh(struct ioatdma_chan *ioat_chan);
74 static void ioat_print_chanerrs(struct ioatdma_chan *ioat_chan, u32 chanerr)
76 int i;
78 for (i = 0; i < ARRAY_SIZE(chanerr_str); i++) {
79 if ((chanerr >> i) & 1) {
80 dev_err(to_dev(ioat_chan), "Err(%d): %s\n",
81 i, chanerr_str[i]);
86 /**
87 * ioat_dma_do_interrupt - handler used for single vector interrupt mode
88 * @irq: interrupt id
89 * @data: interrupt data
91 irqreturn_t ioat_dma_do_interrupt(int irq, void *data)
93 struct ioatdma_device *instance = data;
94 struct ioatdma_chan *ioat_chan;
95 unsigned long attnstatus;
96 int bit;
97 u8 intrctrl;
99 intrctrl = readb(instance->reg_base + IOAT_INTRCTRL_OFFSET);
101 if (!(intrctrl & IOAT_INTRCTRL_MASTER_INT_EN))
102 return IRQ_NONE;
104 if (!(intrctrl & IOAT_INTRCTRL_INT_STATUS)) {
105 writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET);
106 return IRQ_NONE;
109 attnstatus = readl(instance->reg_base + IOAT_ATTNSTATUS_OFFSET);
110 for_each_set_bit(bit, &attnstatus, BITS_PER_LONG) {
111 ioat_chan = ioat_chan_by_index(instance, bit);
112 if (test_bit(IOAT_RUN, &ioat_chan->state))
113 tasklet_schedule(&ioat_chan->cleanup_task);
116 writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET);
117 return IRQ_HANDLED;
121 * ioat_dma_do_interrupt_msix - handler used for vector-per-channel interrupt mode
122 * @irq: interrupt id
123 * @data: interrupt data
125 irqreturn_t ioat_dma_do_interrupt_msix(int irq, void *data)
127 struct ioatdma_chan *ioat_chan = data;
129 if (test_bit(IOAT_RUN, &ioat_chan->state))
130 tasklet_schedule(&ioat_chan->cleanup_task);
132 return IRQ_HANDLED;
135 void ioat_stop(struct ioatdma_chan *ioat_chan)
137 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
138 struct pci_dev *pdev = ioat_dma->pdev;
139 int chan_id = chan_num(ioat_chan);
140 struct msix_entry *msix;
142 /* 1/ stop irq from firing tasklets
143 * 2/ stop the tasklet from re-arming irqs
145 clear_bit(IOAT_RUN, &ioat_chan->state);
147 /* flush inflight interrupts */
148 switch (ioat_dma->irq_mode) {
149 case IOAT_MSIX:
150 msix = &ioat_dma->msix_entries[chan_id];
151 synchronize_irq(msix->vector);
152 break;
153 case IOAT_MSI:
154 case IOAT_INTX:
155 synchronize_irq(pdev->irq);
156 break;
157 default:
158 break;
161 /* flush inflight timers */
162 del_timer_sync(&ioat_chan->timer);
164 /* flush inflight tasklet runs */
165 tasklet_kill(&ioat_chan->cleanup_task);
167 /* final cleanup now that everything is quiesced and can't re-arm */
168 ioat_cleanup_event((unsigned long)&ioat_chan->dma_chan);
171 static void __ioat_issue_pending(struct ioatdma_chan *ioat_chan)
173 ioat_chan->dmacount += ioat_ring_pending(ioat_chan);
174 ioat_chan->issued = ioat_chan->head;
175 writew(ioat_chan->dmacount,
176 ioat_chan->reg_base + IOAT_CHAN_DMACOUNT_OFFSET);
177 dev_dbg(to_dev(ioat_chan),
178 "%s: head: %#x tail: %#x issued: %#x count: %#x\n",
179 __func__, ioat_chan->head, ioat_chan->tail,
180 ioat_chan->issued, ioat_chan->dmacount);
183 void ioat_issue_pending(struct dma_chan *c)
185 struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
187 if (ioat_ring_pending(ioat_chan)) {
188 spin_lock_bh(&ioat_chan->prep_lock);
189 __ioat_issue_pending(ioat_chan);
190 spin_unlock_bh(&ioat_chan->prep_lock);
195 * ioat_update_pending - log pending descriptors
196 * @ioat: ioat+ channel
198 * Check if the number of unsubmitted descriptors has exceeded the
199 * watermark. Called with prep_lock held
201 static void ioat_update_pending(struct ioatdma_chan *ioat_chan)
203 if (ioat_ring_pending(ioat_chan) > ioat_pending_level)
204 __ioat_issue_pending(ioat_chan);
207 static void __ioat_start_null_desc(struct ioatdma_chan *ioat_chan)
209 struct ioat_ring_ent *desc;
210 struct ioat_dma_descriptor *hw;
212 if (ioat_ring_space(ioat_chan) < 1) {
213 dev_err(to_dev(ioat_chan),
214 "Unable to start null desc - ring full\n");
215 return;
218 dev_dbg(to_dev(ioat_chan),
219 "%s: head: %#x tail: %#x issued: %#x\n",
220 __func__, ioat_chan->head, ioat_chan->tail, ioat_chan->issued);
221 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->head);
223 hw = desc->hw;
224 hw->ctl = 0;
225 hw->ctl_f.null = 1;
226 hw->ctl_f.int_en = 1;
227 hw->ctl_f.compl_write = 1;
228 /* set size to non-zero value (channel returns error when size is 0) */
229 hw->size = NULL_DESC_BUFFER_SIZE;
230 hw->src_addr = 0;
231 hw->dst_addr = 0;
232 async_tx_ack(&desc->txd);
233 ioat_set_chainaddr(ioat_chan, desc->txd.phys);
234 dump_desc_dbg(ioat_chan, desc);
235 /* make sure descriptors are written before we submit */
236 wmb();
237 ioat_chan->head += 1;
238 __ioat_issue_pending(ioat_chan);
241 void ioat_start_null_desc(struct ioatdma_chan *ioat_chan)
243 spin_lock_bh(&ioat_chan->prep_lock);
244 if (!test_bit(IOAT_CHAN_DOWN, &ioat_chan->state))
245 __ioat_start_null_desc(ioat_chan);
246 spin_unlock_bh(&ioat_chan->prep_lock);
249 static void __ioat_restart_chan(struct ioatdma_chan *ioat_chan)
251 /* set the tail to be re-issued */
252 ioat_chan->issued = ioat_chan->tail;
253 ioat_chan->dmacount = 0;
254 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
256 dev_dbg(to_dev(ioat_chan),
257 "%s: head: %#x tail: %#x issued: %#x count: %#x\n",
258 __func__, ioat_chan->head, ioat_chan->tail,
259 ioat_chan->issued, ioat_chan->dmacount);
261 if (ioat_ring_pending(ioat_chan)) {
262 struct ioat_ring_ent *desc;
264 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail);
265 ioat_set_chainaddr(ioat_chan, desc->txd.phys);
266 __ioat_issue_pending(ioat_chan);
267 } else
268 __ioat_start_null_desc(ioat_chan);
271 static int ioat_quiesce(struct ioatdma_chan *ioat_chan, unsigned long tmo)
273 unsigned long end = jiffies + tmo;
274 int err = 0;
275 u32 status;
277 status = ioat_chansts(ioat_chan);
278 if (is_ioat_active(status) || is_ioat_idle(status))
279 ioat_suspend(ioat_chan);
280 while (is_ioat_active(status) || is_ioat_idle(status)) {
281 if (tmo && time_after(jiffies, end)) {
282 err = -ETIMEDOUT;
283 break;
285 status = ioat_chansts(ioat_chan);
286 cpu_relax();
289 return err;
292 static int ioat_reset_sync(struct ioatdma_chan *ioat_chan, unsigned long tmo)
294 unsigned long end = jiffies + tmo;
295 int err = 0;
297 ioat_reset(ioat_chan);
298 while (ioat_reset_pending(ioat_chan)) {
299 if (end && time_after(jiffies, end)) {
300 err = -ETIMEDOUT;
301 break;
303 cpu_relax();
306 return err;
309 static dma_cookie_t ioat_tx_submit_unlock(struct dma_async_tx_descriptor *tx)
310 __releases(&ioat_chan->prep_lock)
312 struct dma_chan *c = tx->chan;
313 struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
314 dma_cookie_t cookie;
316 cookie = dma_cookie_assign(tx);
317 dev_dbg(to_dev(ioat_chan), "%s: cookie: %d\n", __func__, cookie);
319 if (!test_and_set_bit(IOAT_CHAN_ACTIVE, &ioat_chan->state))
320 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
322 /* make descriptor updates visible before advancing ioat->head,
323 * this is purposefully not smp_wmb() since we are also
324 * publishing the descriptor updates to a dma device
326 wmb();
328 ioat_chan->head += ioat_chan->produce;
330 ioat_update_pending(ioat_chan);
331 spin_unlock_bh(&ioat_chan->prep_lock);
333 return cookie;
336 static struct ioat_ring_ent *
337 ioat_alloc_ring_ent(struct dma_chan *chan, int idx, gfp_t flags)
339 struct ioat_dma_descriptor *hw;
340 struct ioat_ring_ent *desc;
341 struct ioatdma_chan *ioat_chan = to_ioat_chan(chan);
342 int chunk;
343 dma_addr_t phys;
344 u8 *pos;
345 off_t offs;
347 chunk = idx / IOAT_DESCS_PER_2M;
348 idx &= (IOAT_DESCS_PER_2M - 1);
349 offs = idx * IOAT_DESC_SZ;
350 pos = (u8 *)ioat_chan->descs[chunk].virt + offs;
351 phys = ioat_chan->descs[chunk].hw + offs;
352 hw = (struct ioat_dma_descriptor *)pos;
353 memset(hw, 0, sizeof(*hw));
355 desc = kmem_cache_zalloc(ioat_cache, flags);
356 if (!desc)
357 return NULL;
359 dma_async_tx_descriptor_init(&desc->txd, chan);
360 desc->txd.tx_submit = ioat_tx_submit_unlock;
361 desc->hw = hw;
362 desc->txd.phys = phys;
363 return desc;
366 void ioat_free_ring_ent(struct ioat_ring_ent *desc, struct dma_chan *chan)
368 kmem_cache_free(ioat_cache, desc);
371 struct ioat_ring_ent **
372 ioat_alloc_ring(struct dma_chan *c, int order, gfp_t flags)
374 struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
375 struct ioat_ring_ent **ring;
376 int total_descs = 1 << order;
377 int i, chunks;
379 /* allocate the array to hold the software ring */
380 ring = kcalloc(total_descs, sizeof(*ring), flags);
381 if (!ring)
382 return NULL;
384 ioat_chan->desc_chunks = chunks = (total_descs * IOAT_DESC_SZ) / SZ_2M;
386 for (i = 0; i < chunks; i++) {
387 struct ioat_descs *descs = &ioat_chan->descs[i];
389 descs->virt = dma_alloc_coherent(to_dev(ioat_chan),
390 SZ_2M, &descs->hw, flags);
391 if (!descs->virt) {
392 int idx;
394 for (idx = 0; idx < i; idx++) {
395 descs = &ioat_chan->descs[idx];
396 dma_free_coherent(to_dev(ioat_chan), SZ_2M,
397 descs->virt, descs->hw);
398 descs->virt = NULL;
399 descs->hw = 0;
402 ioat_chan->desc_chunks = 0;
403 kfree(ring);
404 return NULL;
408 for (i = 0; i < total_descs; i++) {
409 ring[i] = ioat_alloc_ring_ent(c, i, flags);
410 if (!ring[i]) {
411 int idx;
413 while (i--)
414 ioat_free_ring_ent(ring[i], c);
416 for (idx = 0; idx < ioat_chan->desc_chunks; idx++) {
417 dma_free_coherent(to_dev(ioat_chan),
418 SZ_2M,
419 ioat_chan->descs[idx].virt,
420 ioat_chan->descs[idx].hw);
421 ioat_chan->descs[idx].virt = NULL;
422 ioat_chan->descs[idx].hw = 0;
425 ioat_chan->desc_chunks = 0;
426 kfree(ring);
427 return NULL;
429 set_desc_id(ring[i], i);
432 /* link descs */
433 for (i = 0; i < total_descs-1; i++) {
434 struct ioat_ring_ent *next = ring[i+1];
435 struct ioat_dma_descriptor *hw = ring[i]->hw;
437 hw->next = next->txd.phys;
439 ring[i]->hw->next = ring[0]->txd.phys;
441 return ring;
445 * ioat_check_space_lock - verify space and grab ring producer lock
446 * @ioat: ioat,3 channel (ring) to operate on
447 * @num_descs: allocation length
449 int ioat_check_space_lock(struct ioatdma_chan *ioat_chan, int num_descs)
450 __acquires(&ioat_chan->prep_lock)
452 spin_lock_bh(&ioat_chan->prep_lock);
453 /* never allow the last descriptor to be consumed, we need at
454 * least one free at all times to allow for on-the-fly ring
455 * resizing.
457 if (likely(ioat_ring_space(ioat_chan) > num_descs)) {
458 dev_dbg(to_dev(ioat_chan), "%s: num_descs: %d (%x:%x:%x)\n",
459 __func__, num_descs, ioat_chan->head,
460 ioat_chan->tail, ioat_chan->issued);
461 ioat_chan->produce = num_descs;
462 return 0; /* with ioat->prep_lock held */
464 spin_unlock_bh(&ioat_chan->prep_lock);
466 dev_dbg_ratelimited(to_dev(ioat_chan),
467 "%s: ring full! num_descs: %d (%x:%x:%x)\n",
468 __func__, num_descs, ioat_chan->head,
469 ioat_chan->tail, ioat_chan->issued);
471 /* progress reclaim in the allocation failure case we may be
472 * called under bh_disabled so we need to trigger the timer
473 * event directly
475 if (time_is_before_jiffies(ioat_chan->timer.expires)
476 && timer_pending(&ioat_chan->timer)) {
477 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
478 ioat_timer_event(&ioat_chan->timer);
481 return -ENOMEM;
484 static bool desc_has_ext(struct ioat_ring_ent *desc)
486 struct ioat_dma_descriptor *hw = desc->hw;
488 if (hw->ctl_f.op == IOAT_OP_XOR ||
489 hw->ctl_f.op == IOAT_OP_XOR_VAL) {
490 struct ioat_xor_descriptor *xor = desc->xor;
492 if (src_cnt_to_sw(xor->ctl_f.src_cnt) > 5)
493 return true;
494 } else if (hw->ctl_f.op == IOAT_OP_PQ ||
495 hw->ctl_f.op == IOAT_OP_PQ_VAL) {
496 struct ioat_pq_descriptor *pq = desc->pq;
498 if (src_cnt_to_sw(pq->ctl_f.src_cnt) > 3)
499 return true;
502 return false;
505 static void
506 ioat_free_sed(struct ioatdma_device *ioat_dma, struct ioat_sed_ent *sed)
508 if (!sed)
509 return;
511 dma_pool_free(ioat_dma->sed_hw_pool[sed->hw_pool], sed->hw, sed->dma);
512 kmem_cache_free(ioat_sed_cache, sed);
515 static u64 ioat_get_current_completion(struct ioatdma_chan *ioat_chan)
517 u64 phys_complete;
518 u64 completion;
520 completion = *ioat_chan->completion;
521 phys_complete = ioat_chansts_to_addr(completion);
523 dev_dbg(to_dev(ioat_chan), "%s: phys_complete: %#llx\n", __func__,
524 (unsigned long long) phys_complete);
526 return phys_complete;
529 static bool ioat_cleanup_preamble(struct ioatdma_chan *ioat_chan,
530 u64 *phys_complete)
532 *phys_complete = ioat_get_current_completion(ioat_chan);
533 if (*phys_complete == ioat_chan->last_completion)
534 return false;
536 clear_bit(IOAT_COMPLETION_ACK, &ioat_chan->state);
537 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
539 return true;
542 static void
543 desc_get_errstat(struct ioatdma_chan *ioat_chan, struct ioat_ring_ent *desc)
545 struct ioat_dma_descriptor *hw = desc->hw;
547 switch (hw->ctl_f.op) {
548 case IOAT_OP_PQ_VAL:
549 case IOAT_OP_PQ_VAL_16S:
551 struct ioat_pq_descriptor *pq = desc->pq;
553 /* check if there's error written */
554 if (!pq->dwbes_f.wbes)
555 return;
557 /* need to set a chanerr var for checking to clear later */
559 if (pq->dwbes_f.p_val_err)
560 *desc->result |= SUM_CHECK_P_RESULT;
562 if (pq->dwbes_f.q_val_err)
563 *desc->result |= SUM_CHECK_Q_RESULT;
565 return;
567 default:
568 return;
573 * __cleanup - reclaim used descriptors
574 * @ioat: channel (ring) to clean
576 static void __cleanup(struct ioatdma_chan *ioat_chan, dma_addr_t phys_complete)
578 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
579 struct ioat_ring_ent *desc;
580 bool seen_current = false;
581 int idx = ioat_chan->tail, i;
582 u16 active;
584 dev_dbg(to_dev(ioat_chan), "%s: head: %#x tail: %#x issued: %#x\n",
585 __func__, ioat_chan->head, ioat_chan->tail, ioat_chan->issued);
588 * At restart of the channel, the completion address and the
589 * channel status will be 0 due to starting a new chain. Since
590 * it's new chain and the first descriptor "fails", there is
591 * nothing to clean up. We do not want to reap the entire submitted
592 * chain due to this 0 address value and then BUG.
594 if (!phys_complete)
595 return;
597 active = ioat_ring_active(ioat_chan);
598 for (i = 0; i < active && !seen_current; i++) {
599 struct dma_async_tx_descriptor *tx;
601 prefetch(ioat_get_ring_ent(ioat_chan, idx + i + 1));
602 desc = ioat_get_ring_ent(ioat_chan, idx + i);
603 dump_desc_dbg(ioat_chan, desc);
605 /* set err stat if we are using dwbes */
606 if (ioat_dma->cap & IOAT_CAP_DWBES)
607 desc_get_errstat(ioat_chan, desc);
609 tx = &desc->txd;
610 if (tx->cookie) {
611 dma_cookie_complete(tx);
612 dma_descriptor_unmap(tx);
613 dmaengine_desc_get_callback_invoke(tx, NULL);
614 tx->callback = NULL;
615 tx->callback_result = NULL;
618 if (tx->phys == phys_complete)
619 seen_current = true;
621 /* skip extended descriptors */
622 if (desc_has_ext(desc)) {
623 BUG_ON(i + 1 >= active);
624 i++;
627 /* cleanup super extended descriptors */
628 if (desc->sed) {
629 ioat_free_sed(ioat_dma, desc->sed);
630 desc->sed = NULL;
634 /* finish all descriptor reads before incrementing tail */
635 smp_mb();
636 ioat_chan->tail = idx + i;
637 /* no active descs have written a completion? */
638 BUG_ON(active && !seen_current);
639 ioat_chan->last_completion = phys_complete;
641 if (active - i == 0) {
642 dev_dbg(to_dev(ioat_chan), "%s: cancel completion timeout\n",
643 __func__);
644 mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT);
647 /* microsecond delay by sysfs variable per pending descriptor */
648 if (ioat_chan->intr_coalesce != ioat_chan->prev_intr_coalesce) {
649 writew(min((ioat_chan->intr_coalesce * (active - i)),
650 IOAT_INTRDELAY_MASK),
651 ioat_chan->ioat_dma->reg_base + IOAT_INTRDELAY_OFFSET);
652 ioat_chan->prev_intr_coalesce = ioat_chan->intr_coalesce;
656 static void ioat_cleanup(struct ioatdma_chan *ioat_chan)
658 u64 phys_complete;
660 spin_lock_bh(&ioat_chan->cleanup_lock);
662 if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
663 __cleanup(ioat_chan, phys_complete);
665 if (is_ioat_halted(*ioat_chan->completion)) {
666 u32 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
668 if (chanerr &
669 (IOAT_CHANERR_HANDLE_MASK | IOAT_CHANERR_RECOVER_MASK)) {
670 mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT);
671 ioat_eh(ioat_chan);
675 spin_unlock_bh(&ioat_chan->cleanup_lock);
678 void ioat_cleanup_event(unsigned long data)
680 struct ioatdma_chan *ioat_chan = to_ioat_chan((void *)data);
682 ioat_cleanup(ioat_chan);
683 if (!test_bit(IOAT_RUN, &ioat_chan->state))
684 return;
685 writew(IOAT_CHANCTRL_RUN, ioat_chan->reg_base + IOAT_CHANCTRL_OFFSET);
688 static void ioat_restart_channel(struct ioatdma_chan *ioat_chan)
690 u64 phys_complete;
692 /* set the completion address register again */
693 writel(lower_32_bits(ioat_chan->completion_dma),
694 ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_LOW);
695 writel(upper_32_bits(ioat_chan->completion_dma),
696 ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_HIGH);
698 ioat_quiesce(ioat_chan, 0);
699 if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
700 __cleanup(ioat_chan, phys_complete);
702 __ioat_restart_chan(ioat_chan);
706 static void ioat_abort_descs(struct ioatdma_chan *ioat_chan)
708 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
709 struct ioat_ring_ent *desc;
710 u16 active;
711 int idx = ioat_chan->tail, i;
714 * We assume that the failed descriptor has been processed.
715 * Now we are just returning all the remaining submitted
716 * descriptors to abort.
718 active = ioat_ring_active(ioat_chan);
720 /* we skip the failed descriptor that tail points to */
721 for (i = 1; i < active; i++) {
722 struct dma_async_tx_descriptor *tx;
724 prefetch(ioat_get_ring_ent(ioat_chan, idx + i + 1));
725 desc = ioat_get_ring_ent(ioat_chan, idx + i);
727 tx = &desc->txd;
728 if (tx->cookie) {
729 struct dmaengine_result res;
731 dma_cookie_complete(tx);
732 dma_descriptor_unmap(tx);
733 res.result = DMA_TRANS_ABORTED;
734 dmaengine_desc_get_callback_invoke(tx, &res);
735 tx->callback = NULL;
736 tx->callback_result = NULL;
739 /* skip extended descriptors */
740 if (desc_has_ext(desc)) {
741 WARN_ON(i + 1 >= active);
742 i++;
745 /* cleanup super extended descriptors */
746 if (desc->sed) {
747 ioat_free_sed(ioat_dma, desc->sed);
748 desc->sed = NULL;
752 smp_mb(); /* finish all descriptor reads before incrementing tail */
753 ioat_chan->tail = idx + active;
755 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail);
756 ioat_chan->last_completion = *ioat_chan->completion = desc->txd.phys;
759 static void ioat_eh(struct ioatdma_chan *ioat_chan)
761 struct pci_dev *pdev = to_pdev(ioat_chan);
762 struct ioat_dma_descriptor *hw;
763 struct dma_async_tx_descriptor *tx;
764 u64 phys_complete;
765 struct ioat_ring_ent *desc;
766 u32 err_handled = 0;
767 u32 chanerr_int;
768 u32 chanerr;
769 bool abort = false;
770 struct dmaengine_result res;
772 /* cleanup so tail points to descriptor that caused the error */
773 if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
774 __cleanup(ioat_chan, phys_complete);
776 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
777 pci_read_config_dword(pdev, IOAT_PCI_CHANERR_INT_OFFSET, &chanerr_int);
779 dev_dbg(to_dev(ioat_chan), "%s: error = %x:%x\n",
780 __func__, chanerr, chanerr_int);
782 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail);
783 hw = desc->hw;
784 dump_desc_dbg(ioat_chan, desc);
786 switch (hw->ctl_f.op) {
787 case IOAT_OP_XOR_VAL:
788 if (chanerr & IOAT_CHANERR_XOR_P_OR_CRC_ERR) {
789 *desc->result |= SUM_CHECK_P_RESULT;
790 err_handled |= IOAT_CHANERR_XOR_P_OR_CRC_ERR;
792 break;
793 case IOAT_OP_PQ_VAL:
794 case IOAT_OP_PQ_VAL_16S:
795 if (chanerr & IOAT_CHANERR_XOR_P_OR_CRC_ERR) {
796 *desc->result |= SUM_CHECK_P_RESULT;
797 err_handled |= IOAT_CHANERR_XOR_P_OR_CRC_ERR;
799 if (chanerr & IOAT_CHANERR_XOR_Q_ERR) {
800 *desc->result |= SUM_CHECK_Q_RESULT;
801 err_handled |= IOAT_CHANERR_XOR_Q_ERR;
803 break;
806 if (chanerr & IOAT_CHANERR_RECOVER_MASK) {
807 if (chanerr & IOAT_CHANERR_READ_DATA_ERR) {
808 res.result = DMA_TRANS_READ_FAILED;
809 err_handled |= IOAT_CHANERR_READ_DATA_ERR;
810 } else if (chanerr & IOAT_CHANERR_WRITE_DATA_ERR) {
811 res.result = DMA_TRANS_WRITE_FAILED;
812 err_handled |= IOAT_CHANERR_WRITE_DATA_ERR;
815 abort = true;
816 } else
817 res.result = DMA_TRANS_NOERROR;
819 /* fault on unhandled error or spurious halt */
820 if (chanerr ^ err_handled || chanerr == 0) {
821 dev_err(to_dev(ioat_chan), "%s: fatal error (%x:%x)\n",
822 __func__, chanerr, err_handled);
823 dev_err(to_dev(ioat_chan), "Errors handled:\n");
824 ioat_print_chanerrs(ioat_chan, err_handled);
825 dev_err(to_dev(ioat_chan), "Errors not handled:\n");
826 ioat_print_chanerrs(ioat_chan, (chanerr & ~err_handled));
828 BUG();
831 /* cleanup the faulty descriptor since we are continuing */
832 tx = &desc->txd;
833 if (tx->cookie) {
834 dma_cookie_complete(tx);
835 dma_descriptor_unmap(tx);
836 dmaengine_desc_get_callback_invoke(tx, &res);
837 tx->callback = NULL;
838 tx->callback_result = NULL;
841 /* mark faulting descriptor as complete */
842 *ioat_chan->completion = desc->txd.phys;
844 spin_lock_bh(&ioat_chan->prep_lock);
845 /* we need abort all descriptors */
846 if (abort) {
847 ioat_abort_descs(ioat_chan);
848 /* clean up the channel, we could be in weird state */
849 ioat_reset_hw(ioat_chan);
852 writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
853 pci_write_config_dword(pdev, IOAT_PCI_CHANERR_INT_OFFSET, chanerr_int);
855 ioat_restart_channel(ioat_chan);
856 spin_unlock_bh(&ioat_chan->prep_lock);
859 static void check_active(struct ioatdma_chan *ioat_chan)
861 if (ioat_ring_active(ioat_chan)) {
862 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
863 return;
866 if (test_and_clear_bit(IOAT_CHAN_ACTIVE, &ioat_chan->state))
867 mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT);
870 void ioat_timer_event(struct timer_list *t)
872 struct ioatdma_chan *ioat_chan = from_timer(ioat_chan, t, timer);
873 dma_addr_t phys_complete;
874 u64 status;
876 status = ioat_chansts(ioat_chan);
878 /* when halted due to errors check for channel
879 * programming errors before advancing the completion state
881 if (is_ioat_halted(status)) {
882 u32 chanerr;
884 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
885 dev_err(to_dev(ioat_chan), "%s: Channel halted (%x)\n",
886 __func__, chanerr);
887 dev_err(to_dev(ioat_chan), "Errors:\n");
888 ioat_print_chanerrs(ioat_chan, chanerr);
890 if (test_bit(IOAT_RUN, &ioat_chan->state)) {
891 spin_lock_bh(&ioat_chan->cleanup_lock);
892 spin_lock_bh(&ioat_chan->prep_lock);
893 set_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
894 spin_unlock_bh(&ioat_chan->prep_lock);
896 ioat_abort_descs(ioat_chan);
897 dev_warn(to_dev(ioat_chan), "Reset channel...\n");
898 ioat_reset_hw(ioat_chan);
899 dev_warn(to_dev(ioat_chan), "Restart channel...\n");
900 ioat_restart_channel(ioat_chan);
902 spin_lock_bh(&ioat_chan->prep_lock);
903 clear_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
904 spin_unlock_bh(&ioat_chan->prep_lock);
905 spin_unlock_bh(&ioat_chan->cleanup_lock);
908 return;
911 spin_lock_bh(&ioat_chan->cleanup_lock);
913 /* handle the no-actives case */
914 if (!ioat_ring_active(ioat_chan)) {
915 spin_lock_bh(&ioat_chan->prep_lock);
916 check_active(ioat_chan);
917 spin_unlock_bh(&ioat_chan->prep_lock);
918 spin_unlock_bh(&ioat_chan->cleanup_lock);
919 return;
922 /* if we haven't made progress and we have already
923 * acknowledged a pending completion once, then be more
924 * forceful with a restart
926 if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
927 __cleanup(ioat_chan, phys_complete);
928 else if (test_bit(IOAT_COMPLETION_ACK, &ioat_chan->state)) {
929 u32 chanerr;
931 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
932 dev_err(to_dev(ioat_chan), "CHANSTS: %#Lx CHANERR: %#x\n",
933 status, chanerr);
934 dev_err(to_dev(ioat_chan), "Errors:\n");
935 ioat_print_chanerrs(ioat_chan, chanerr);
937 dev_dbg(to_dev(ioat_chan), "Active descriptors: %d\n",
938 ioat_ring_active(ioat_chan));
940 spin_lock_bh(&ioat_chan->prep_lock);
941 set_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
942 spin_unlock_bh(&ioat_chan->prep_lock);
944 ioat_abort_descs(ioat_chan);
945 dev_warn(to_dev(ioat_chan), "Resetting channel...\n");
946 ioat_reset_hw(ioat_chan);
947 dev_warn(to_dev(ioat_chan), "Restarting channel...\n");
948 ioat_restart_channel(ioat_chan);
950 spin_lock_bh(&ioat_chan->prep_lock);
951 clear_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
952 spin_unlock_bh(&ioat_chan->prep_lock);
953 spin_unlock_bh(&ioat_chan->cleanup_lock);
954 return;
955 } else
956 set_bit(IOAT_COMPLETION_ACK, &ioat_chan->state);
958 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
959 spin_unlock_bh(&ioat_chan->cleanup_lock);
962 enum dma_status
963 ioat_tx_status(struct dma_chan *c, dma_cookie_t cookie,
964 struct dma_tx_state *txstate)
966 struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
967 enum dma_status ret;
969 ret = dma_cookie_status(c, cookie, txstate);
970 if (ret == DMA_COMPLETE)
971 return ret;
973 ioat_cleanup(ioat_chan);
975 return dma_cookie_status(c, cookie, txstate);
978 int ioat_reset_hw(struct ioatdma_chan *ioat_chan)
980 /* throw away whatever the channel was doing and get it
981 * initialized, with ioat3 specific workarounds
983 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
984 struct pci_dev *pdev = ioat_dma->pdev;
985 u32 chanerr;
986 u16 dev_id;
987 int err;
989 ioat_quiesce(ioat_chan, msecs_to_jiffies(100));
991 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
992 writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
994 if (ioat_dma->version < IOAT_VER_3_3) {
995 /* clear any pending errors */
996 err = pci_read_config_dword(pdev,
997 IOAT_PCI_CHANERR_INT_OFFSET, &chanerr);
998 if (err) {
999 dev_err(&pdev->dev,
1000 "channel error register unreachable\n");
1001 return err;
1003 pci_write_config_dword(pdev,
1004 IOAT_PCI_CHANERR_INT_OFFSET, chanerr);
1006 /* Clear DMAUNCERRSTS Cfg-Reg Parity Error status bit
1007 * (workaround for spurious config parity error after restart)
1009 pci_read_config_word(pdev, IOAT_PCI_DEVICE_ID_OFFSET, &dev_id);
1010 if (dev_id == PCI_DEVICE_ID_INTEL_IOAT_TBG0) {
1011 pci_write_config_dword(pdev,
1012 IOAT_PCI_DMAUNCERRSTS_OFFSET,
1013 0x10);
1017 if (is_bwd_ioat(pdev) && (ioat_dma->irq_mode == IOAT_MSIX)) {
1018 ioat_dma->msixtba0 = readq(ioat_dma->reg_base + 0x1000);
1019 ioat_dma->msixdata0 = readq(ioat_dma->reg_base + 0x1008);
1020 ioat_dma->msixpba = readq(ioat_dma->reg_base + 0x1800);
1024 err = ioat_reset_sync(ioat_chan, msecs_to_jiffies(200));
1025 if (!err) {
1026 if (is_bwd_ioat(pdev) && (ioat_dma->irq_mode == IOAT_MSIX)) {
1027 writeq(ioat_dma->msixtba0, ioat_dma->reg_base + 0x1000);
1028 writeq(ioat_dma->msixdata0, ioat_dma->reg_base + 0x1008);
1029 writeq(ioat_dma->msixpba, ioat_dma->reg_base + 0x1800);
1033 if (err)
1034 dev_err(&pdev->dev, "Failed to reset: %d\n", err);
1036 return err;