perf tools: Don't clone maps from parent when synthesizing forks
[linux/fpc-iii.git] / drivers / dma / ioat / dma.c
blob23fb2fa040002daeb3e248036efa261b63b3769e
1 /*
2 * Intel I/OAT DMA Linux driver
3 * Copyright(c) 2004 - 2015 Intel Corporation.
5 * This program is free software; you can redistribute it and/or modify it
6 * under the terms and conditions of the GNU General Public License,
7 * version 2, as published by the Free Software Foundation.
9 * This program is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
12 * more details.
14 * The full GNU General Public License is included in this distribution in
15 * the file called "COPYING".
20 * This driver supports an Intel I/OAT DMA engine, which does asynchronous
21 * copy operations.
24 #include <linux/init.h>
25 #include <linux/module.h>
26 #include <linux/slab.h>
27 #include <linux/pci.h>
28 #include <linux/interrupt.h>
29 #include <linux/dmaengine.h>
30 #include <linux/delay.h>
31 #include <linux/dma-mapping.h>
32 #include <linux/workqueue.h>
33 #include <linux/prefetch.h>
34 #include <linux/sizes.h>
35 #include "dma.h"
36 #include "registers.h"
37 #include "hw.h"
39 #include "../dmaengine.h"
/*
 * Human-readable names for the channel error bits.  The array index is the
 * bit position tested against the CHANERR value by ioat_print_chanerrs().
 * Neither the pointers nor the strings are ever written, so both are const.
 */
static const char * const chanerr_str[] = {
	"DMA Transfer Source Address Error",
	"DMA Transfer Destination Address Error",
	"Next Descriptor Address Error",
	"Descriptor Error",
	"Chan Address Value Error",
	"CHANCMD Error",
	"Chipset Uncorrectable Data Integrity Error",
	"DMA Uncorrectable Data Integrity Error",
	"Read Data Error",
	"Write Data Error",
	"Descriptor Control Error",
	"Descriptor Transfer Size Error",
	"Completion Address Error",
	"Interrupt Configuration Error",
	"Super extended descriptor Address Error",
	"Unaffiliated Error",
	"CRC or XOR P Error",
	"XOR Q Error",
	"Descriptor Count Error",
	"DIF All F detect Error",
	"Guard Tag verification Error",
	"Application Tag verification Error",
	"Reference Tag verification Error",
	"Bundle Bit Error",
	"Result DIF All F detect Error",
	"Result Guard Tag verification Error",
	"Result Application Tag verification Error",
	"Result Reference Tag verification Error",
};
72 static void ioat_eh(struct ioatdma_chan *ioat_chan);
74 static void ioat_print_chanerrs(struct ioatdma_chan *ioat_chan, u32 chanerr)
76 int i;
78 for (i = 0; i < ARRAY_SIZE(chanerr_str); i++) {
79 if ((chanerr >> i) & 1) {
80 dev_err(to_dev(ioat_chan), "Err(%d): %s\n",
81 i, chanerr_str[i]);
86 /**
87 * ioat_dma_do_interrupt - handler used for single vector interrupt mode
88 * @irq: interrupt id
89 * @data: interrupt data
91 irqreturn_t ioat_dma_do_interrupt(int irq, void *data)
93 struct ioatdma_device *instance = data;
94 struct ioatdma_chan *ioat_chan;
95 unsigned long attnstatus;
96 int bit;
97 u8 intrctrl;
99 intrctrl = readb(instance->reg_base + IOAT_INTRCTRL_OFFSET);
101 if (!(intrctrl & IOAT_INTRCTRL_MASTER_INT_EN))
102 return IRQ_NONE;
104 if (!(intrctrl & IOAT_INTRCTRL_INT_STATUS)) {
105 writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET);
106 return IRQ_NONE;
109 attnstatus = readl(instance->reg_base + IOAT_ATTNSTATUS_OFFSET);
110 for_each_set_bit(bit, &attnstatus, BITS_PER_LONG) {
111 ioat_chan = ioat_chan_by_index(instance, bit);
112 if (test_bit(IOAT_RUN, &ioat_chan->state))
113 tasklet_schedule(&ioat_chan->cleanup_task);
116 writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET);
117 return IRQ_HANDLED;
121 * ioat_dma_do_interrupt_msix - handler used for vector-per-channel interrupt mode
122 * @irq: interrupt id
123 * @data: interrupt data
125 irqreturn_t ioat_dma_do_interrupt_msix(int irq, void *data)
127 struct ioatdma_chan *ioat_chan = data;
129 if (test_bit(IOAT_RUN, &ioat_chan->state))
130 tasklet_schedule(&ioat_chan->cleanup_task);
132 return IRQ_HANDLED;
135 void ioat_stop(struct ioatdma_chan *ioat_chan)
137 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
138 struct pci_dev *pdev = ioat_dma->pdev;
139 int chan_id = chan_num(ioat_chan);
140 struct msix_entry *msix;
142 /* 1/ stop irq from firing tasklets
143 * 2/ stop the tasklet from re-arming irqs
145 clear_bit(IOAT_RUN, &ioat_chan->state);
147 /* flush inflight interrupts */
148 switch (ioat_dma->irq_mode) {
149 case IOAT_MSIX:
150 msix = &ioat_dma->msix_entries[chan_id];
151 synchronize_irq(msix->vector);
152 break;
153 case IOAT_MSI:
154 case IOAT_INTX:
155 synchronize_irq(pdev->irq);
156 break;
157 default:
158 break;
161 /* flush inflight timers */
162 del_timer_sync(&ioat_chan->timer);
164 /* flush inflight tasklet runs */
165 tasklet_kill(&ioat_chan->cleanup_task);
167 /* final cleanup now that everything is quiesced and can't re-arm */
168 ioat_cleanup_event((unsigned long)&ioat_chan->dma_chan);
171 static void __ioat_issue_pending(struct ioatdma_chan *ioat_chan)
173 ioat_chan->dmacount += ioat_ring_pending(ioat_chan);
174 ioat_chan->issued = ioat_chan->head;
175 writew(ioat_chan->dmacount,
176 ioat_chan->reg_base + IOAT_CHAN_DMACOUNT_OFFSET);
177 dev_dbg(to_dev(ioat_chan),
178 "%s: head: %#x tail: %#x issued: %#x count: %#x\n",
179 __func__, ioat_chan->head, ioat_chan->tail,
180 ioat_chan->issued, ioat_chan->dmacount);
183 void ioat_issue_pending(struct dma_chan *c)
185 struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
187 if (ioat_ring_pending(ioat_chan)) {
188 spin_lock_bh(&ioat_chan->prep_lock);
189 __ioat_issue_pending(ioat_chan);
190 spin_unlock_bh(&ioat_chan->prep_lock);
195 * ioat_update_pending - log pending descriptors
196 * @ioat: ioat+ channel
198 * Check if the number of unsubmitted descriptors has exceeded the
199 * watermark. Called with prep_lock held
201 static void ioat_update_pending(struct ioatdma_chan *ioat_chan)
203 if (ioat_ring_pending(ioat_chan) > ioat_pending_level)
204 __ioat_issue_pending(ioat_chan);
207 static void __ioat_start_null_desc(struct ioatdma_chan *ioat_chan)
209 struct ioat_ring_ent *desc;
210 struct ioat_dma_descriptor *hw;
212 if (ioat_ring_space(ioat_chan) < 1) {
213 dev_err(to_dev(ioat_chan),
214 "Unable to start null desc - ring full\n");
215 return;
218 dev_dbg(to_dev(ioat_chan),
219 "%s: head: %#x tail: %#x issued: %#x\n",
220 __func__, ioat_chan->head, ioat_chan->tail, ioat_chan->issued);
221 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->head);
223 hw = desc->hw;
224 hw->ctl = 0;
225 hw->ctl_f.null = 1;
226 hw->ctl_f.int_en = 1;
227 hw->ctl_f.compl_write = 1;
228 /* set size to non-zero value (channel returns error when size is 0) */
229 hw->size = NULL_DESC_BUFFER_SIZE;
230 hw->src_addr = 0;
231 hw->dst_addr = 0;
232 async_tx_ack(&desc->txd);
233 ioat_set_chainaddr(ioat_chan, desc->txd.phys);
234 dump_desc_dbg(ioat_chan, desc);
235 /* make sure descriptors are written before we submit */
236 wmb();
237 ioat_chan->head += 1;
238 __ioat_issue_pending(ioat_chan);
241 void ioat_start_null_desc(struct ioatdma_chan *ioat_chan)
243 spin_lock_bh(&ioat_chan->prep_lock);
244 if (!test_bit(IOAT_CHAN_DOWN, &ioat_chan->state))
245 __ioat_start_null_desc(ioat_chan);
246 spin_unlock_bh(&ioat_chan->prep_lock);
249 static void __ioat_restart_chan(struct ioatdma_chan *ioat_chan)
251 /* set the tail to be re-issued */
252 ioat_chan->issued = ioat_chan->tail;
253 ioat_chan->dmacount = 0;
254 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
256 dev_dbg(to_dev(ioat_chan),
257 "%s: head: %#x tail: %#x issued: %#x count: %#x\n",
258 __func__, ioat_chan->head, ioat_chan->tail,
259 ioat_chan->issued, ioat_chan->dmacount);
261 if (ioat_ring_pending(ioat_chan)) {
262 struct ioat_ring_ent *desc;
264 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail);
265 ioat_set_chainaddr(ioat_chan, desc->txd.phys);
266 __ioat_issue_pending(ioat_chan);
267 } else
268 __ioat_start_null_desc(ioat_chan);
271 static int ioat_quiesce(struct ioatdma_chan *ioat_chan, unsigned long tmo)
273 unsigned long end = jiffies + tmo;
274 int err = 0;
275 u32 status;
277 status = ioat_chansts(ioat_chan);
278 if (is_ioat_active(status) || is_ioat_idle(status))
279 ioat_suspend(ioat_chan);
280 while (is_ioat_active(status) || is_ioat_idle(status)) {
281 if (tmo && time_after(jiffies, end)) {
282 err = -ETIMEDOUT;
283 break;
285 status = ioat_chansts(ioat_chan);
286 cpu_relax();
289 return err;
292 static int ioat_reset_sync(struct ioatdma_chan *ioat_chan, unsigned long tmo)
294 unsigned long end = jiffies + tmo;
295 int err = 0;
297 ioat_reset(ioat_chan);
298 while (ioat_reset_pending(ioat_chan)) {
299 if (end && time_after(jiffies, end)) {
300 err = -ETIMEDOUT;
301 break;
303 cpu_relax();
306 return err;
309 static dma_cookie_t ioat_tx_submit_unlock(struct dma_async_tx_descriptor *tx)
310 __releases(&ioat_chan->prep_lock)
312 struct dma_chan *c = tx->chan;
313 struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
314 dma_cookie_t cookie;
316 cookie = dma_cookie_assign(tx);
317 dev_dbg(to_dev(ioat_chan), "%s: cookie: %d\n", __func__, cookie);
319 if (!test_and_set_bit(IOAT_CHAN_ACTIVE, &ioat_chan->state))
320 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
322 /* make descriptor updates visible before advancing ioat->head,
323 * this is purposefully not smp_wmb() since we are also
324 * publishing the descriptor updates to a dma device
326 wmb();
328 ioat_chan->head += ioat_chan->produce;
330 ioat_update_pending(ioat_chan);
331 spin_unlock_bh(&ioat_chan->prep_lock);
333 return cookie;
336 static struct ioat_ring_ent *
337 ioat_alloc_ring_ent(struct dma_chan *chan, int idx, gfp_t flags)
339 struct ioat_dma_descriptor *hw;
340 struct ioat_ring_ent *desc;
341 struct ioatdma_chan *ioat_chan = to_ioat_chan(chan);
342 int chunk;
343 dma_addr_t phys;
344 u8 *pos;
345 off_t offs;
347 chunk = idx / IOAT_DESCS_PER_2M;
348 idx &= (IOAT_DESCS_PER_2M - 1);
349 offs = idx * IOAT_DESC_SZ;
350 pos = (u8 *)ioat_chan->descs[chunk].virt + offs;
351 phys = ioat_chan->descs[chunk].hw + offs;
352 hw = (struct ioat_dma_descriptor *)pos;
353 memset(hw, 0, sizeof(*hw));
355 desc = kmem_cache_zalloc(ioat_cache, flags);
356 if (!desc)
357 return NULL;
359 dma_async_tx_descriptor_init(&desc->txd, chan);
360 desc->txd.tx_submit = ioat_tx_submit_unlock;
361 desc->hw = hw;
362 desc->txd.phys = phys;
363 return desc;
366 void ioat_free_ring_ent(struct ioat_ring_ent *desc, struct dma_chan *chan)
368 kmem_cache_free(ioat_cache, desc);
371 struct ioat_ring_ent **
372 ioat_alloc_ring(struct dma_chan *c, int order, gfp_t flags)
374 struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
375 struct ioat_ring_ent **ring;
376 int total_descs = 1 << order;
377 int i, chunks;
379 /* allocate the array to hold the software ring */
380 ring = kcalloc(total_descs, sizeof(*ring), flags);
381 if (!ring)
382 return NULL;
384 ioat_chan->desc_chunks = chunks = (total_descs * IOAT_DESC_SZ) / SZ_2M;
386 for (i = 0; i < chunks; i++) {
387 struct ioat_descs *descs = &ioat_chan->descs[i];
389 descs->virt = dma_alloc_coherent(to_dev(ioat_chan),
390 SZ_2M, &descs->hw, flags);
391 if (!descs->virt && (i > 0)) {
392 int idx;
394 for (idx = 0; idx < i; idx++) {
395 dma_free_coherent(to_dev(ioat_chan), SZ_2M,
396 descs->virt, descs->hw);
397 descs->virt = NULL;
398 descs->hw = 0;
401 ioat_chan->desc_chunks = 0;
402 kfree(ring);
403 return NULL;
407 for (i = 0; i < total_descs; i++) {
408 ring[i] = ioat_alloc_ring_ent(c, i, flags);
409 if (!ring[i]) {
410 int idx;
412 while (i--)
413 ioat_free_ring_ent(ring[i], c);
415 for (idx = 0; idx < ioat_chan->desc_chunks; idx++) {
416 dma_free_coherent(to_dev(ioat_chan),
417 SZ_2M,
418 ioat_chan->descs[idx].virt,
419 ioat_chan->descs[idx].hw);
420 ioat_chan->descs[idx].virt = NULL;
421 ioat_chan->descs[idx].hw = 0;
424 ioat_chan->desc_chunks = 0;
425 kfree(ring);
426 return NULL;
428 set_desc_id(ring[i], i);
431 /* link descs */
432 for (i = 0; i < total_descs-1; i++) {
433 struct ioat_ring_ent *next = ring[i+1];
434 struct ioat_dma_descriptor *hw = ring[i]->hw;
436 hw->next = next->txd.phys;
438 ring[i]->hw->next = ring[0]->txd.phys;
440 return ring;
444 * ioat_check_space_lock - verify space and grab ring producer lock
445 * @ioat: ioat,3 channel (ring) to operate on
446 * @num_descs: allocation length
448 int ioat_check_space_lock(struct ioatdma_chan *ioat_chan, int num_descs)
449 __acquires(&ioat_chan->prep_lock)
451 spin_lock_bh(&ioat_chan->prep_lock);
452 /* never allow the last descriptor to be consumed, we need at
453 * least one free at all times to allow for on-the-fly ring
454 * resizing.
456 if (likely(ioat_ring_space(ioat_chan) > num_descs)) {
457 dev_dbg(to_dev(ioat_chan), "%s: num_descs: %d (%x:%x:%x)\n",
458 __func__, num_descs, ioat_chan->head,
459 ioat_chan->tail, ioat_chan->issued);
460 ioat_chan->produce = num_descs;
461 return 0; /* with ioat->prep_lock held */
463 spin_unlock_bh(&ioat_chan->prep_lock);
465 dev_dbg_ratelimited(to_dev(ioat_chan),
466 "%s: ring full! num_descs: %d (%x:%x:%x)\n",
467 __func__, num_descs, ioat_chan->head,
468 ioat_chan->tail, ioat_chan->issued);
470 /* progress reclaim in the allocation failure case we may be
471 * called under bh_disabled so we need to trigger the timer
472 * event directly
474 if (time_is_before_jiffies(ioat_chan->timer.expires)
475 && timer_pending(&ioat_chan->timer)) {
476 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
477 ioat_timer_event(&ioat_chan->timer);
480 return -ENOMEM;
483 static bool desc_has_ext(struct ioat_ring_ent *desc)
485 struct ioat_dma_descriptor *hw = desc->hw;
487 if (hw->ctl_f.op == IOAT_OP_XOR ||
488 hw->ctl_f.op == IOAT_OP_XOR_VAL) {
489 struct ioat_xor_descriptor *xor = desc->xor;
491 if (src_cnt_to_sw(xor->ctl_f.src_cnt) > 5)
492 return true;
493 } else if (hw->ctl_f.op == IOAT_OP_PQ ||
494 hw->ctl_f.op == IOAT_OP_PQ_VAL) {
495 struct ioat_pq_descriptor *pq = desc->pq;
497 if (src_cnt_to_sw(pq->ctl_f.src_cnt) > 3)
498 return true;
501 return false;
504 static void
505 ioat_free_sed(struct ioatdma_device *ioat_dma, struct ioat_sed_ent *sed)
507 if (!sed)
508 return;
510 dma_pool_free(ioat_dma->sed_hw_pool[sed->hw_pool], sed->hw, sed->dma);
511 kmem_cache_free(ioat_sed_cache, sed);
514 static u64 ioat_get_current_completion(struct ioatdma_chan *ioat_chan)
516 u64 phys_complete;
517 u64 completion;
519 completion = *ioat_chan->completion;
520 phys_complete = ioat_chansts_to_addr(completion);
522 dev_dbg(to_dev(ioat_chan), "%s: phys_complete: %#llx\n", __func__,
523 (unsigned long long) phys_complete);
525 return phys_complete;
528 static bool ioat_cleanup_preamble(struct ioatdma_chan *ioat_chan,
529 u64 *phys_complete)
531 *phys_complete = ioat_get_current_completion(ioat_chan);
532 if (*phys_complete == ioat_chan->last_completion)
533 return false;
535 clear_bit(IOAT_COMPLETION_ACK, &ioat_chan->state);
536 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
538 return true;
541 static void
542 desc_get_errstat(struct ioatdma_chan *ioat_chan, struct ioat_ring_ent *desc)
544 struct ioat_dma_descriptor *hw = desc->hw;
546 switch (hw->ctl_f.op) {
547 case IOAT_OP_PQ_VAL:
548 case IOAT_OP_PQ_VAL_16S:
550 struct ioat_pq_descriptor *pq = desc->pq;
552 /* check if there's error written */
553 if (!pq->dwbes_f.wbes)
554 return;
556 /* need to set a chanerr var for checking to clear later */
558 if (pq->dwbes_f.p_val_err)
559 *desc->result |= SUM_CHECK_P_RESULT;
561 if (pq->dwbes_f.q_val_err)
562 *desc->result |= SUM_CHECK_Q_RESULT;
564 return;
566 default:
567 return;
572 * __cleanup - reclaim used descriptors
573 * @ioat: channel (ring) to clean
575 static void __cleanup(struct ioatdma_chan *ioat_chan, dma_addr_t phys_complete)
577 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
578 struct ioat_ring_ent *desc;
579 bool seen_current = false;
580 int idx = ioat_chan->tail, i;
581 u16 active;
583 dev_dbg(to_dev(ioat_chan), "%s: head: %#x tail: %#x issued: %#x\n",
584 __func__, ioat_chan->head, ioat_chan->tail, ioat_chan->issued);
587 * At restart of the channel, the completion address and the
588 * channel status will be 0 due to starting a new chain. Since
589 * it's new chain and the first descriptor "fails", there is
590 * nothing to clean up. We do not want to reap the entire submitted
591 * chain due to this 0 address value and then BUG.
593 if (!phys_complete)
594 return;
596 active = ioat_ring_active(ioat_chan);
597 for (i = 0; i < active && !seen_current; i++) {
598 struct dma_async_tx_descriptor *tx;
600 prefetch(ioat_get_ring_ent(ioat_chan, idx + i + 1));
601 desc = ioat_get_ring_ent(ioat_chan, idx + i);
602 dump_desc_dbg(ioat_chan, desc);
604 /* set err stat if we are using dwbes */
605 if (ioat_dma->cap & IOAT_CAP_DWBES)
606 desc_get_errstat(ioat_chan, desc);
608 tx = &desc->txd;
609 if (tx->cookie) {
610 dma_cookie_complete(tx);
611 dma_descriptor_unmap(tx);
612 dmaengine_desc_get_callback_invoke(tx, NULL);
613 tx->callback = NULL;
614 tx->callback_result = NULL;
617 if (tx->phys == phys_complete)
618 seen_current = true;
620 /* skip extended descriptors */
621 if (desc_has_ext(desc)) {
622 BUG_ON(i + 1 >= active);
623 i++;
626 /* cleanup super extended descriptors */
627 if (desc->sed) {
628 ioat_free_sed(ioat_dma, desc->sed);
629 desc->sed = NULL;
633 /* finish all descriptor reads before incrementing tail */
634 smp_mb();
635 ioat_chan->tail = idx + i;
636 /* no active descs have written a completion? */
637 BUG_ON(active && !seen_current);
638 ioat_chan->last_completion = phys_complete;
640 if (active - i == 0) {
641 dev_dbg(to_dev(ioat_chan), "%s: cancel completion timeout\n",
642 __func__);
643 mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT);
646 /* microsecond delay by sysfs variable per pending descriptor */
647 if (ioat_chan->intr_coalesce != ioat_chan->prev_intr_coalesce) {
648 writew(min((ioat_chan->intr_coalesce * (active - i)),
649 IOAT_INTRDELAY_MASK),
650 ioat_chan->ioat_dma->reg_base + IOAT_INTRDELAY_OFFSET);
651 ioat_chan->prev_intr_coalesce = ioat_chan->intr_coalesce;
655 static void ioat_cleanup(struct ioatdma_chan *ioat_chan)
657 u64 phys_complete;
659 spin_lock_bh(&ioat_chan->cleanup_lock);
661 if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
662 __cleanup(ioat_chan, phys_complete);
664 if (is_ioat_halted(*ioat_chan->completion)) {
665 u32 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
667 if (chanerr &
668 (IOAT_CHANERR_HANDLE_MASK | IOAT_CHANERR_RECOVER_MASK)) {
669 mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT);
670 ioat_eh(ioat_chan);
674 spin_unlock_bh(&ioat_chan->cleanup_lock);
677 void ioat_cleanup_event(unsigned long data)
679 struct ioatdma_chan *ioat_chan = to_ioat_chan((void *)data);
681 ioat_cleanup(ioat_chan);
682 if (!test_bit(IOAT_RUN, &ioat_chan->state))
683 return;
684 writew(IOAT_CHANCTRL_RUN, ioat_chan->reg_base + IOAT_CHANCTRL_OFFSET);
687 static void ioat_restart_channel(struct ioatdma_chan *ioat_chan)
689 u64 phys_complete;
691 /* set the completion address register again */
692 writel(lower_32_bits(ioat_chan->completion_dma),
693 ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_LOW);
694 writel(upper_32_bits(ioat_chan->completion_dma),
695 ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_HIGH);
697 ioat_quiesce(ioat_chan, 0);
698 if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
699 __cleanup(ioat_chan, phys_complete);
701 __ioat_restart_chan(ioat_chan);
705 static void ioat_abort_descs(struct ioatdma_chan *ioat_chan)
707 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
708 struct ioat_ring_ent *desc;
709 u16 active;
710 int idx = ioat_chan->tail, i;
713 * We assume that the failed descriptor has been processed.
714 * Now we are just returning all the remaining submitted
715 * descriptors to abort.
717 active = ioat_ring_active(ioat_chan);
719 /* we skip the failed descriptor that tail points to */
720 for (i = 1; i < active; i++) {
721 struct dma_async_tx_descriptor *tx;
723 prefetch(ioat_get_ring_ent(ioat_chan, idx + i + 1));
724 desc = ioat_get_ring_ent(ioat_chan, idx + i);
726 tx = &desc->txd;
727 if (tx->cookie) {
728 struct dmaengine_result res;
730 dma_cookie_complete(tx);
731 dma_descriptor_unmap(tx);
732 res.result = DMA_TRANS_ABORTED;
733 dmaengine_desc_get_callback_invoke(tx, &res);
734 tx->callback = NULL;
735 tx->callback_result = NULL;
738 /* skip extended descriptors */
739 if (desc_has_ext(desc)) {
740 WARN_ON(i + 1 >= active);
741 i++;
744 /* cleanup super extended descriptors */
745 if (desc->sed) {
746 ioat_free_sed(ioat_dma, desc->sed);
747 desc->sed = NULL;
751 smp_mb(); /* finish all descriptor reads before incrementing tail */
752 ioat_chan->tail = idx + active;
754 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail);
755 ioat_chan->last_completion = *ioat_chan->completion = desc->txd.phys;
758 static void ioat_eh(struct ioatdma_chan *ioat_chan)
760 struct pci_dev *pdev = to_pdev(ioat_chan);
761 struct ioat_dma_descriptor *hw;
762 struct dma_async_tx_descriptor *tx;
763 u64 phys_complete;
764 struct ioat_ring_ent *desc;
765 u32 err_handled = 0;
766 u32 chanerr_int;
767 u32 chanerr;
768 bool abort = false;
769 struct dmaengine_result res;
771 /* cleanup so tail points to descriptor that caused the error */
772 if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
773 __cleanup(ioat_chan, phys_complete);
775 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
776 pci_read_config_dword(pdev, IOAT_PCI_CHANERR_INT_OFFSET, &chanerr_int);
778 dev_dbg(to_dev(ioat_chan), "%s: error = %x:%x\n",
779 __func__, chanerr, chanerr_int);
781 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail);
782 hw = desc->hw;
783 dump_desc_dbg(ioat_chan, desc);
785 switch (hw->ctl_f.op) {
786 case IOAT_OP_XOR_VAL:
787 if (chanerr & IOAT_CHANERR_XOR_P_OR_CRC_ERR) {
788 *desc->result |= SUM_CHECK_P_RESULT;
789 err_handled |= IOAT_CHANERR_XOR_P_OR_CRC_ERR;
791 break;
792 case IOAT_OP_PQ_VAL:
793 case IOAT_OP_PQ_VAL_16S:
794 if (chanerr & IOAT_CHANERR_XOR_P_OR_CRC_ERR) {
795 *desc->result |= SUM_CHECK_P_RESULT;
796 err_handled |= IOAT_CHANERR_XOR_P_OR_CRC_ERR;
798 if (chanerr & IOAT_CHANERR_XOR_Q_ERR) {
799 *desc->result |= SUM_CHECK_Q_RESULT;
800 err_handled |= IOAT_CHANERR_XOR_Q_ERR;
802 break;
805 if (chanerr & IOAT_CHANERR_RECOVER_MASK) {
806 if (chanerr & IOAT_CHANERR_READ_DATA_ERR) {
807 res.result = DMA_TRANS_READ_FAILED;
808 err_handled |= IOAT_CHANERR_READ_DATA_ERR;
809 } else if (chanerr & IOAT_CHANERR_WRITE_DATA_ERR) {
810 res.result = DMA_TRANS_WRITE_FAILED;
811 err_handled |= IOAT_CHANERR_WRITE_DATA_ERR;
814 abort = true;
815 } else
816 res.result = DMA_TRANS_NOERROR;
818 /* fault on unhandled error or spurious halt */
819 if (chanerr ^ err_handled || chanerr == 0) {
820 dev_err(to_dev(ioat_chan), "%s: fatal error (%x:%x)\n",
821 __func__, chanerr, err_handled);
822 dev_err(to_dev(ioat_chan), "Errors handled:\n");
823 ioat_print_chanerrs(ioat_chan, err_handled);
824 dev_err(to_dev(ioat_chan), "Errors not handled:\n");
825 ioat_print_chanerrs(ioat_chan, (chanerr & ~err_handled));
827 BUG();
830 /* cleanup the faulty descriptor since we are continuing */
831 tx = &desc->txd;
832 if (tx->cookie) {
833 dma_cookie_complete(tx);
834 dma_descriptor_unmap(tx);
835 dmaengine_desc_get_callback_invoke(tx, &res);
836 tx->callback = NULL;
837 tx->callback_result = NULL;
840 /* mark faulting descriptor as complete */
841 *ioat_chan->completion = desc->txd.phys;
843 spin_lock_bh(&ioat_chan->prep_lock);
844 /* we need abort all descriptors */
845 if (abort) {
846 ioat_abort_descs(ioat_chan);
847 /* clean up the channel, we could be in weird state */
848 ioat_reset_hw(ioat_chan);
851 writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
852 pci_write_config_dword(pdev, IOAT_PCI_CHANERR_INT_OFFSET, chanerr_int);
854 ioat_restart_channel(ioat_chan);
855 spin_unlock_bh(&ioat_chan->prep_lock);
858 static void check_active(struct ioatdma_chan *ioat_chan)
860 if (ioat_ring_active(ioat_chan)) {
861 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
862 return;
865 if (test_and_clear_bit(IOAT_CHAN_ACTIVE, &ioat_chan->state))
866 mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT);
869 void ioat_timer_event(struct timer_list *t)
871 struct ioatdma_chan *ioat_chan = from_timer(ioat_chan, t, timer);
872 dma_addr_t phys_complete;
873 u64 status;
875 status = ioat_chansts(ioat_chan);
877 /* when halted due to errors check for channel
878 * programming errors before advancing the completion state
880 if (is_ioat_halted(status)) {
881 u32 chanerr;
883 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
884 dev_err(to_dev(ioat_chan), "%s: Channel halted (%x)\n",
885 __func__, chanerr);
886 dev_err(to_dev(ioat_chan), "Errors:\n");
887 ioat_print_chanerrs(ioat_chan, chanerr);
889 if (test_bit(IOAT_RUN, &ioat_chan->state)) {
890 spin_lock_bh(&ioat_chan->cleanup_lock);
891 spin_lock_bh(&ioat_chan->prep_lock);
892 set_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
893 spin_unlock_bh(&ioat_chan->prep_lock);
895 ioat_abort_descs(ioat_chan);
896 dev_warn(to_dev(ioat_chan), "Reset channel...\n");
897 ioat_reset_hw(ioat_chan);
898 dev_warn(to_dev(ioat_chan), "Restart channel...\n");
899 ioat_restart_channel(ioat_chan);
901 spin_lock_bh(&ioat_chan->prep_lock);
902 clear_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
903 spin_unlock_bh(&ioat_chan->prep_lock);
904 spin_unlock_bh(&ioat_chan->cleanup_lock);
907 return;
910 spin_lock_bh(&ioat_chan->cleanup_lock);
912 /* handle the no-actives case */
913 if (!ioat_ring_active(ioat_chan)) {
914 spin_lock_bh(&ioat_chan->prep_lock);
915 check_active(ioat_chan);
916 spin_unlock_bh(&ioat_chan->prep_lock);
917 spin_unlock_bh(&ioat_chan->cleanup_lock);
918 return;
921 /* if we haven't made progress and we have already
922 * acknowledged a pending completion once, then be more
923 * forceful with a restart
925 if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
926 __cleanup(ioat_chan, phys_complete);
927 else if (test_bit(IOAT_COMPLETION_ACK, &ioat_chan->state)) {
928 u32 chanerr;
930 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
931 dev_err(to_dev(ioat_chan), "CHANSTS: %#Lx CHANERR: %#x\n",
932 status, chanerr);
933 dev_err(to_dev(ioat_chan), "Errors:\n");
934 ioat_print_chanerrs(ioat_chan, chanerr);
936 dev_dbg(to_dev(ioat_chan), "Active descriptors: %d\n",
937 ioat_ring_active(ioat_chan));
939 spin_lock_bh(&ioat_chan->prep_lock);
940 set_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
941 spin_unlock_bh(&ioat_chan->prep_lock);
943 ioat_abort_descs(ioat_chan);
944 dev_warn(to_dev(ioat_chan), "Resetting channel...\n");
945 ioat_reset_hw(ioat_chan);
946 dev_warn(to_dev(ioat_chan), "Restarting channel...\n");
947 ioat_restart_channel(ioat_chan);
949 spin_lock_bh(&ioat_chan->prep_lock);
950 clear_bit(IOAT_CHAN_DOWN, &ioat_chan->state);
951 spin_unlock_bh(&ioat_chan->prep_lock);
952 spin_unlock_bh(&ioat_chan->cleanup_lock);
953 return;
954 } else
955 set_bit(IOAT_COMPLETION_ACK, &ioat_chan->state);
957 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
958 spin_unlock_bh(&ioat_chan->cleanup_lock);
961 enum dma_status
962 ioat_tx_status(struct dma_chan *c, dma_cookie_t cookie,
963 struct dma_tx_state *txstate)
965 struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
966 enum dma_status ret;
968 ret = dma_cookie_status(c, cookie, txstate);
969 if (ret == DMA_COMPLETE)
970 return ret;
972 ioat_cleanup(ioat_chan);
974 return dma_cookie_status(c, cookie, txstate);
977 int ioat_reset_hw(struct ioatdma_chan *ioat_chan)
979 /* throw away whatever the channel was doing and get it
980 * initialized, with ioat3 specific workarounds
982 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
983 struct pci_dev *pdev = ioat_dma->pdev;
984 u32 chanerr;
985 u16 dev_id;
986 int err;
988 ioat_quiesce(ioat_chan, msecs_to_jiffies(100));
990 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
991 writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
993 if (ioat_dma->version < IOAT_VER_3_3) {
994 /* clear any pending errors */
995 err = pci_read_config_dword(pdev,
996 IOAT_PCI_CHANERR_INT_OFFSET, &chanerr);
997 if (err) {
998 dev_err(&pdev->dev,
999 "channel error register unreachable\n");
1000 return err;
1002 pci_write_config_dword(pdev,
1003 IOAT_PCI_CHANERR_INT_OFFSET, chanerr);
1005 /* Clear DMAUNCERRSTS Cfg-Reg Parity Error status bit
1006 * (workaround for spurious config parity error after restart)
1008 pci_read_config_word(pdev, IOAT_PCI_DEVICE_ID_OFFSET, &dev_id);
1009 if (dev_id == PCI_DEVICE_ID_INTEL_IOAT_TBG0) {
1010 pci_write_config_dword(pdev,
1011 IOAT_PCI_DMAUNCERRSTS_OFFSET,
1012 0x10);
1016 if (is_bwd_ioat(pdev) && (ioat_dma->irq_mode == IOAT_MSIX)) {
1017 ioat_dma->msixtba0 = readq(ioat_dma->reg_base + 0x1000);
1018 ioat_dma->msixdata0 = readq(ioat_dma->reg_base + 0x1008);
1019 ioat_dma->msixpba = readq(ioat_dma->reg_base + 0x1800);
1023 err = ioat_reset_sync(ioat_chan, msecs_to_jiffies(200));
1024 if (!err) {
1025 if (is_bwd_ioat(pdev) && (ioat_dma->irq_mode == IOAT_MSIX)) {
1026 writeq(ioat_dma->msixtba0, ioat_dma->reg_base + 0x1000);
1027 writeq(ioat_dma->msixdata0, ioat_dma->reg_base + 0x1008);
1028 writeq(ioat_dma->msixpba, ioat_dma->reg_base + 0x1800);
1032 if (err)
1033 dev_err(&pdev->dev, "Failed to reset: %d\n", err);
1035 return err;