/*
 * Intel I/OAT DMA Linux driver
 * Copyright(c) 2004 - 2015 Intel Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * The full GNU General Public License is included in this distribution in
 * the file called "COPYING".
 */

/*
 * This driver supports an Intel I/OAT DMA engine, which does asynchronous
 * copy operations.
 */

#include <linux/init.h>
#include <linux/module.h>
#include <linux/slab.h>
#include <linux/pci.h>
#include <linux/interrupt.h>
#include <linux/dmaengine.h>
#include <linux/delay.h>
#include <linux/dma-mapping.h>
#include <linux/workqueue.h>
#include <linux/prefetch.h>
#include "dma.h"
#include "registers.h"
#include "hw.h"

#include "../dmaengine.h"

static void ioat_eh(struct ioatdma_chan *ioat_chan);

/**
 * ioat_dma_do_interrupt - handler used for single vector interrupt mode
 * @irq: interrupt id
 * @data: interrupt data
 */
irqreturn_t ioat_dma_do_interrupt(int irq, void *data)
{
	struct ioatdma_device *instance = data;
	struct ioatdma_chan *ioat_chan;
	unsigned long attnstatus;
	int bit;
	u8 intrctrl;

	intrctrl = readb(instance->reg_base + IOAT_INTRCTRL_OFFSET);

	if (!(intrctrl & IOAT_INTRCTRL_MASTER_INT_EN))
		return IRQ_NONE;

	if (!(intrctrl & IOAT_INTRCTRL_INT_STATUS)) {
		writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET);
		return IRQ_NONE;
	}

	attnstatus = readl(instance->reg_base + IOAT_ATTNSTATUS_OFFSET);
	for_each_set_bit(bit, &attnstatus, BITS_PER_LONG) {
		ioat_chan = ioat_chan_by_index(instance, bit);
		if (test_bit(IOAT_RUN, &ioat_chan->state))
			tasklet_schedule(&ioat_chan->cleanup_task);
	}

	writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET);
	return IRQ_HANDLED;
}

/**
 * ioat_dma_do_interrupt_msix - handler used for vector-per-channel interrupt mode
 * @irq: interrupt id
 * @data: interrupt data
 */
irqreturn_t ioat_dma_do_interrupt_msix(int irq, void *data)
{
	struct ioatdma_chan *ioat_chan = data;

	if (test_bit(IOAT_RUN, &ioat_chan->state))
		tasklet_schedule(&ioat_chan->cleanup_task);

	return IRQ_HANDLED;
}

void ioat_stop(struct ioatdma_chan *ioat_chan)
{
	struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
	struct pci_dev *pdev = ioat_dma->pdev;
	int chan_id = chan_num(ioat_chan);
	struct msix_entry *msix;

	/* 1/ stop irq from firing tasklets
	 * 2/ stop the tasklet from re-arming irqs
	 */
	clear_bit(IOAT_RUN, &ioat_chan->state);

	/* flush inflight interrupts */
	switch (ioat_dma->irq_mode) {
	case IOAT_MSIX:
		msix = &ioat_dma->msix_entries[chan_id];
		synchronize_irq(msix->vector);
		break;
	case IOAT_MSI:
	case IOAT_INTX:
		synchronize_irq(pdev->irq);
		break;
	default:
		break;
	}

	/* flush inflight timers */
	del_timer_sync(&ioat_chan->timer);

	/* flush inflight tasklet runs */
	tasklet_kill(&ioat_chan->cleanup_task);

	/* final cleanup now that everything is quiesced and can't re-arm */
	ioat_cleanup_event((unsigned long)&ioat_chan->dma_chan);
}
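
/*
 * __ioat_issue_pending - push everything prepped but not yet issued to the
 * hardware by writing the updated descriptor count to the DMACOUNT register
 * and advancing ->issued to ->head.  Callers are expected to hold prep_lock
 * around this (ioat_issue_pending below takes it explicitly).
 */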
static void __ioat_issue_pending(struct ioatdma_chan *ioat_chan)
{
	ioat_chan->dmacount += ioat_ring_pending(ioat_chan);
	ioat_chan->issued = ioat_chan->head;
	writew(ioat_chan->dmacount,
	       ioat_chan->reg_base + IOAT_CHAN_DMACOUNT_OFFSET);
	dev_dbg(to_dev(ioat_chan),
		"%s: head: %#x tail: %#x issued: %#x count: %#x\n",
		__func__, ioat_chan->head, ioat_chan->tail,
		ioat_chan->issued, ioat_chan->dmacount);
}

void ioat_issue_pending(struct dma_chan *c)
{
	struct ioatdma_chan *ioat_chan = to_ioat_chan(c);

	if (ioat_ring_pending(ioat_chan)) {
		spin_lock_bh(&ioat_chan->prep_lock);
		__ioat_issue_pending(ioat_chan);
		spin_unlock_bh(&ioat_chan->prep_lock);
	}
}

/**
 * ioat_update_pending - log pending descriptors
 * @ioat: ioat+ channel
 *
 * Check if the number of unsubmitted descriptors has exceeded the
 * watermark.  Called with prep_lock held
 */
static void ioat_update_pending(struct ioatdma_chan *ioat_chan)
{
	if (ioat_ring_pending(ioat_chan) > ioat_pending_level)
		__ioat_issue_pending(ioat_chan);
}
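
/*
 * __ioat_start_null_desc - queue a NULL descriptor at the current head.
 * The descriptor requests an interrupt and a completion write, and the
 * channel's chain address register is pointed at it, so this is used to
 * (re)start an otherwise empty hardware chain.  Called under prep_lock.
 */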
static void __ioat_start_null_desc(struct ioatdma_chan *ioat_chan)
{
	struct ioat_ring_ent *desc;
	struct ioat_dma_descriptor *hw;

	if (ioat_ring_space(ioat_chan) < 1) {
		dev_err(to_dev(ioat_chan),
			"Unable to start null desc - ring full\n");
		return;
	}

	dev_dbg(to_dev(ioat_chan),
		"%s: head: %#x tail: %#x issued: %#x\n",
		__func__, ioat_chan->head, ioat_chan->tail, ioat_chan->issued);
	desc = ioat_get_ring_ent(ioat_chan, ioat_chan->head);

	hw = desc->hw;
	hw->ctl = 0;
	hw->ctl_f.null = 1;
	hw->ctl_f.int_en = 1;
	hw->ctl_f.compl_write = 1;
	/* set size to non-zero value (channel returns error when size is 0) */
	hw->size = NULL_DESC_BUFFER_SIZE;
	async_tx_ack(&desc->txd);
	ioat_set_chainaddr(ioat_chan, desc->txd.phys);
	dump_desc_dbg(ioat_chan, desc);
	/* make sure descriptors are written before we submit */
	wmb();
	ioat_chan->head += 1;
	__ioat_issue_pending(ioat_chan);
}

void ioat_start_null_desc(struct ioatdma_chan *ioat_chan)
{
	spin_lock_bh(&ioat_chan->prep_lock);
	if (!test_bit(IOAT_CHAN_DOWN, &ioat_chan->state))
		__ioat_start_null_desc(ioat_chan);
	spin_unlock_bh(&ioat_chan->prep_lock);
}

static void __ioat_restart_chan(struct ioatdma_chan *ioat_chan)
{
	/* set the tail to be re-issued */
	ioat_chan->issued = ioat_chan->tail;
	ioat_chan->dmacount = 0;
	mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);

	dev_dbg(to_dev(ioat_chan),
		"%s: head: %#x tail: %#x issued: %#x count: %#x\n",
		__func__, ioat_chan->head, ioat_chan->tail,
		ioat_chan->issued, ioat_chan->dmacount);

	if (ioat_ring_pending(ioat_chan)) {
		struct ioat_ring_ent *desc;

		desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail);
		ioat_set_chainaddr(ioat_chan, desc->txd.phys);
		__ioat_issue_pending(ioat_chan);
	} else
		__ioat_start_null_desc(ioat_chan);
}
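
/*
 * ioat_quiesce - suspend the channel and poll the status register until it
 * is no longer active/idle or until @tmo jiffies have elapsed (tmo == 0
 * means wait indefinitely).  Returns 0 on success or -ETIMEDOUT.
 */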
static int ioat_quiesce(struct ioatdma_chan *ioat_chan, unsigned long tmo)
{
	unsigned long end = jiffies + tmo;
	int err = 0;
	u64 status;

	status = ioat_chansts(ioat_chan);
	if (is_ioat_active(status) || is_ioat_idle(status))
		ioat_suspend(ioat_chan);
	while (is_ioat_active(status) || is_ioat_idle(status)) {
		if (tmo && time_after(jiffies, end)) {
			err = -ETIMEDOUT;
			break;
		}

		status = ioat_chansts(ioat_chan);
		cpu_relax();
	}

	return err;
}

static int ioat_reset_sync(struct ioatdma_chan *ioat_chan, unsigned long tmo)
{
	unsigned long end = jiffies + tmo;
	int err = 0;

	ioat_reset(ioat_chan);
	while (ioat_reset_pending(ioat_chan)) {
		if (end && time_after(jiffies, end)) {
			err = -ETIMEDOUT;
			break;
		}

		cpu_relax();
	}

	return err;
}
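
/*
 * ioat_tx_submit_unlock - ->tx_submit hook for the ring descriptors.  The
 * producer lock is taken by ioat_check_space_lock() when descriptor slots
 * are reserved; this routine assigns the cookie, publishes the new head,
 * and drops prep_lock on the way out (hence the __releases annotation).
 */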
static dma_cookie_t ioat_tx_submit_unlock(struct dma_async_tx_descriptor *tx)
	__releases(&ioat_chan->prep_lock)
{
	struct dma_chan *c = tx->chan;
	struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
	dma_cookie_t cookie;

	cookie = dma_cookie_assign(tx);
	dev_dbg(to_dev(ioat_chan), "%s: cookie: %d\n", __func__, cookie);

	if (!test_and_set_bit(IOAT_CHAN_ACTIVE, &ioat_chan->state))
		mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);

	/* make descriptor updates visible before advancing ioat->head,
	 * this is purposefully not smp_wmb() since we are also
	 * publishing the descriptor updates to a dma device
	 */
	wmb();

	ioat_chan->head += ioat_chan->produce;

	ioat_update_pending(ioat_chan);
	spin_unlock_bh(&ioat_chan->prep_lock);

	return cookie;
}

static struct ioat_ring_ent *
ioat_alloc_ring_ent(struct dma_chan *chan, gfp_t flags)
{
	struct ioat_dma_descriptor *hw;
	struct ioat_ring_ent *desc;
	struct ioatdma_device *ioat_dma;
	dma_addr_t phys;

	ioat_dma = to_ioatdma_device(chan->device);
	hw = pci_pool_alloc(ioat_dma->dma_pool, flags, &phys);
	if (!hw)
		return NULL;
	memset(hw, 0, sizeof(*hw));

	desc = kmem_cache_zalloc(ioat_cache, flags);
	if (!desc) {
		pci_pool_free(ioat_dma->dma_pool, hw, phys);
		return NULL;
	}

	dma_async_tx_descriptor_init(&desc->txd, chan);
	desc->txd.tx_submit = ioat_tx_submit_unlock;
	desc->hw = hw;
	desc->txd.phys = phys;
	return desc;
}

void ioat_free_ring_ent(struct ioat_ring_ent *desc, struct dma_chan *chan)
{
	struct ioatdma_device *ioat_dma;

	ioat_dma = to_ioatdma_device(chan->device);
	pci_pool_free(ioat_dma->dma_pool, desc->hw, desc->txd.phys);
	kmem_cache_free(ioat_cache, desc);
}
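
/*
 * ioat_alloc_ring - allocate a power-of-two software ring (1 << order
 * entries) and hardware-link the descriptors into a circle by chaining
 * each hw->next to the physical address of the following entry.
 */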
struct ioat_ring_ent **
ioat_alloc_ring(struct dma_chan *c, int order, gfp_t flags)
{
	struct ioat_ring_ent **ring;
	int descs = 1 << order;
	int i;

	if (order > ioat_get_max_alloc_order())
		return NULL;

	/* allocate the array to hold the software ring */
	ring = kcalloc(descs, sizeof(*ring), flags);
	if (!ring)
		return NULL;
	for (i = 0; i < descs; i++) {
		ring[i] = ioat_alloc_ring_ent(c, flags);
		if (!ring[i]) {
			while (i--)
				ioat_free_ring_ent(ring[i], c);
			kfree(ring);
			return NULL;
		}
		set_desc_id(ring[i], i);
	}

	/* link descs */
	for (i = 0; i < descs-1; i++) {
		struct ioat_ring_ent *next = ring[i+1];
		struct ioat_dma_descriptor *hw = ring[i]->hw;

		hw->next = next->txd.phys;
	}
	ring[i]->hw->next = ring[0]->txd.phys;

	return ring;
}
static bool reshape_ring(struct ioatdma_chan *ioat_chan, int order)
{
	/* reshape differs from normal ring allocation in that we want
	 * to allocate a new software ring while only
	 * extending/truncating the hardware ring
	 */
	struct dma_chan *c = &ioat_chan->dma_chan;
	const u32 curr_size = ioat_ring_size(ioat_chan);
	const u16 active = ioat_ring_active(ioat_chan);
	const u32 new_size = 1 << order;
	struct ioat_ring_ent **ring;
	u16 i;

	if (order > ioat_get_max_alloc_order())
		return false;

	/* double check that we have at least 1 free descriptor */
	if (active == curr_size)
		return false;

	/* when shrinking, verify that we can hold the current active
	 * set in the new ring
	 */
	if (active >= new_size)
		return false;

	/* allocate the array to hold the software ring */
	ring = kcalloc(new_size, sizeof(*ring), GFP_NOWAIT);
	if (!ring)
		return false;

	/* allocate/trim descriptors as needed */
	if (new_size > curr_size) {
		/* copy current descriptors to the new ring */
		for (i = 0; i < curr_size; i++) {
			u16 curr_idx = (ioat_chan->tail+i) & (curr_size-1);
			u16 new_idx = (ioat_chan->tail+i) & (new_size-1);

			ring[new_idx] = ioat_chan->ring[curr_idx];
			set_desc_id(ring[new_idx], new_idx);
		}

		/* add new descriptors to the ring */
		for (i = curr_size; i < new_size; i++) {
			u16 new_idx = (ioat_chan->tail+i) & (new_size-1);

			ring[new_idx] = ioat_alloc_ring_ent(c, GFP_NOWAIT);
			if (!ring[new_idx]) {
				while (i--) {
					u16 new_idx = (ioat_chan->tail+i) &
						(new_size-1);

					ioat_free_ring_ent(ring[new_idx], c);
				}
				kfree(ring);
				return false;
			}
			set_desc_id(ring[new_idx], new_idx);
		}

		/* hw link new descriptors */
		for (i = curr_size-1; i < new_size; i++) {
			u16 new_idx = (ioat_chan->tail+i) & (new_size-1);
			struct ioat_ring_ent *next =
				ring[(new_idx+1) & (new_size-1)];
			struct ioat_dma_descriptor *hw = ring[new_idx]->hw;

			hw->next = next->txd.phys;
		}
	} else {
		struct ioat_dma_descriptor *hw;
		struct ioat_ring_ent *next;

		/* copy current descriptors to the new ring, dropping the
		 * removed descriptors
		 */
		for (i = 0; i < new_size; i++) {
			u16 curr_idx = (ioat_chan->tail+i) & (curr_size-1);
			u16 new_idx = (ioat_chan->tail+i) & (new_size-1);

			ring[new_idx] = ioat_chan->ring[curr_idx];
			set_desc_id(ring[new_idx], new_idx);
		}

		/* free deleted descriptors */
		for (i = new_size; i < curr_size; i++) {
			struct ioat_ring_ent *ent;

			ent = ioat_get_ring_ent(ioat_chan, ioat_chan->tail+i);
			ioat_free_ring_ent(ent, c);
		}

		/* fix up hardware ring */
		hw = ring[(ioat_chan->tail+new_size-1) & (new_size-1)]->hw;
		next = ring[(ioat_chan->tail+new_size) & (new_size-1)];
		hw->next = next->txd.phys;
	}

	dev_dbg(to_dev(ioat_chan), "%s: allocated %d descriptors\n",
		__func__, new_size);

	kfree(ioat_chan->ring);
	ioat_chan->ring = ring;
	ioat_chan->alloc_order = order;

	return true;
}

/**
 * ioat_check_space_lock - verify space and grab ring producer lock
 * @ioat: ioat,3 channel (ring) to operate on
 * @num_descs: allocation length
 */
int ioat_check_space_lock(struct ioatdma_chan *ioat_chan, int num_descs)
	__acquires(&ioat_chan->prep_lock)
{
	bool retry;

 retry:
	spin_lock_bh(&ioat_chan->prep_lock);
	/* never allow the last descriptor to be consumed, we need at
	 * least one free at all times to allow for on-the-fly ring
	 * resizing.
	 */
	if (likely(ioat_ring_space(ioat_chan) > num_descs)) {
		dev_dbg(to_dev(ioat_chan), "%s: num_descs: %d (%x:%x:%x)\n",
			__func__, num_descs, ioat_chan->head,
			ioat_chan->tail, ioat_chan->issued);
		ioat_chan->produce = num_descs;
		return 0;  /* with ioat->prep_lock held */
	}
	retry = test_and_set_bit(IOAT_RESHAPE_PENDING, &ioat_chan->state);
	spin_unlock_bh(&ioat_chan->prep_lock);

	/* is another cpu already trying to expand the ring? */
	if (retry)
		goto retry;

	spin_lock_bh(&ioat_chan->cleanup_lock);
	spin_lock_bh(&ioat_chan->prep_lock);
	retry = reshape_ring(ioat_chan, ioat_chan->alloc_order + 1);
	clear_bit(IOAT_RESHAPE_PENDING, &ioat_chan->state);
	spin_unlock_bh(&ioat_chan->prep_lock);
	spin_unlock_bh(&ioat_chan->cleanup_lock);

	/* if we were able to expand the ring retry the allocation */
	if (retry)
		goto retry;

	dev_dbg_ratelimited(to_dev(ioat_chan),
			    "%s: ring full! num_descs: %d (%x:%x:%x)\n",
			    __func__, num_descs, ioat_chan->head,
			    ioat_chan->tail, ioat_chan->issued);

	/* progress reclaim in the allocation failure case we may be
	 * called under bh_disabled so we need to trigger the timer
	 * event directly
	 */
	if (time_is_before_jiffies(ioat_chan->timer.expires)
	    && timer_pending(&ioat_chan->timer)) {
		mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
		ioat_timer_event((unsigned long)ioat_chan);
	}

	return -ENOMEM;
}
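
/*
 * desc_has_ext - true when the operation occupies a second ring slot for
 * an extended descriptor: xor/xor_val with more than 5 sources, or
 * pq/pq_val with more than 3 sources, per the source-count checks below.
 */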
static bool desc_has_ext(struct ioat_ring_ent *desc)
{
	struct ioat_dma_descriptor *hw = desc->hw;

	if (hw->ctl_f.op == IOAT_OP_XOR ||
	    hw->ctl_f.op == IOAT_OP_XOR_VAL) {
		struct ioat_xor_descriptor *xor = desc->xor;

		if (src_cnt_to_sw(xor->ctl_f.src_cnt) > 5)
			return true;
	} else if (hw->ctl_f.op == IOAT_OP_PQ ||
		   hw->ctl_f.op == IOAT_OP_PQ_VAL) {
		struct ioat_pq_descriptor *pq = desc->pq;

		if (src_cnt_to_sw(pq->ctl_f.src_cnt) > 3)
			return true;
	}

	return false;
}

static void
ioat_free_sed(struct ioatdma_device *ioat_dma, struct ioat_sed_ent *sed)
{
	if (!sed)
		return;

	dma_pool_free(ioat_dma->sed_hw_pool[sed->hw_pool], sed->hw, sed->dma);
	kmem_cache_free(ioat_sed_cache, sed);
}
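
/*
 * The hardware writes channel status, including the address of the last
 * completed descriptor, to the completion writeback area; the helper
 * below reads that area and extracts the physical completion address.
 */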
static u64 ioat_get_current_completion(struct ioatdma_chan *ioat_chan)
{
	u64 phys_complete;
	u64 completion;

	completion = *ioat_chan->completion;
	phys_complete = ioat_chansts_to_addr(completion);

	dev_dbg(to_dev(ioat_chan), "%s: phys_complete: %#llx\n", __func__,
		(unsigned long long) phys_complete);

	return phys_complete;
}

static bool ioat_cleanup_preamble(struct ioatdma_chan *ioat_chan,
				  u64 *phys_complete)
{
	*phys_complete = ioat_get_current_completion(ioat_chan);
	if (*phys_complete == ioat_chan->last_completion)
		return false;

	clear_bit(IOAT_COMPLETION_ACK, &ioat_chan->state);
	mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);

	return true;
}

static void
desc_get_errstat(struct ioatdma_chan *ioat_chan, struct ioat_ring_ent *desc)
{
	struct ioat_dma_descriptor *hw = desc->hw;

	switch (hw->ctl_f.op) {
	case IOAT_OP_PQ_VAL:
	case IOAT_OP_PQ_VAL_16S:
	{
		struct ioat_pq_descriptor *pq = desc->pq;

		/* check if there's error written */
		if (!pq->dwbes_f.wbes)
			return;

		/* need to set a chanerr var for checking to clear later */

		if (pq->dwbes_f.p_val_err)
			*desc->result |= SUM_CHECK_P_RESULT;

		if (pq->dwbes_f.q_val_err)
			*desc->result |= SUM_CHECK_Q_RESULT;

		return;
	}
	default:
		return;
	}
}

/**
 * __cleanup - reclaim used descriptors
 * @ioat: channel (ring) to clean
 */
static void __cleanup(struct ioatdma_chan *ioat_chan, dma_addr_t phys_complete)
{
	struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
	struct ioat_ring_ent *desc;
	bool seen_current = false;
	int idx = ioat_chan->tail, i;
	u16 active;

	dev_dbg(to_dev(ioat_chan), "%s: head: %#x tail: %#x issued: %#x\n",
		__func__, ioat_chan->head, ioat_chan->tail, ioat_chan->issued);

	/*
	 * At restart of the channel, the completion address and the
	 * channel status will be 0 due to starting a new chain. Since
	 * it's new chain and the first descriptor "fails", there is
	 * nothing to clean up. We do not want to reap the entire submitted
	 * chain due to this 0 address value and then BUG.
	 */
	if (!phys_complete)
		return;

	active = ioat_ring_active(ioat_chan);
	for (i = 0; i < active && !seen_current; i++) {
		struct dma_async_tx_descriptor *tx;

		smp_read_barrier_depends();
		prefetch(ioat_get_ring_ent(ioat_chan, idx + i + 1));
		desc = ioat_get_ring_ent(ioat_chan, idx + i);
		dump_desc_dbg(ioat_chan, desc);

		/* set err stat if we are using dwbes */
		if (ioat_dma->cap & IOAT_CAP_DWBES)
			desc_get_errstat(ioat_chan, desc);

		tx = &desc->txd;
		if (tx->cookie) {
			dma_cookie_complete(tx);
			dma_descriptor_unmap(tx);
			if (tx->callback) {
				tx->callback(tx->callback_param);
				tx->callback = NULL;
			}
		}

		if (tx->phys == phys_complete)
			seen_current = true;

		/* skip extended descriptors */
		if (desc_has_ext(desc)) {
			BUG_ON(i + 1 >= active);
			i++;
		}

		/* cleanup super extended descriptors */
		if (desc->sed) {
			ioat_free_sed(ioat_dma, desc->sed);
			desc->sed = NULL;
		}
	}

	/* finish all descriptor reads before incrementing tail */
	smp_mb();
	ioat_chan->tail = idx + i;
	/* no active descs have written a completion? */
	BUG_ON(active && !seen_current);
	ioat_chan->last_completion = phys_complete;

	if (active - i == 0) {
		dev_dbg(to_dev(ioat_chan), "%s: cancel completion timeout\n",
			__func__);
		mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT);
	}

	/* 5 microsecond delay per pending descriptor */
	writew(min((5 * (active - i)), IOAT_INTRDELAY_MASK),
	       ioat_chan->ioat_dma->reg_base + IOAT_INTRDELAY_OFFSET);
}
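
/*
 * ioat_cleanup - reclaim finished descriptors under cleanup_lock and, if
 * the completion area reports a halted channel with a handleable CHANERR
 * bit set, defer the timer and invoke the error handler.
 */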
static void ioat_cleanup(struct ioatdma_chan *ioat_chan)
{
	u64 phys_complete;

	spin_lock_bh(&ioat_chan->cleanup_lock);

	if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
		__cleanup(ioat_chan, phys_complete);

	if (is_ioat_halted(*ioat_chan->completion)) {
		u32 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);

		if (chanerr & IOAT_CHANERR_HANDLE_MASK) {
			mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT);
			ioat_eh(ioat_chan);
		}
	}

	spin_unlock_bh(&ioat_chan->cleanup_lock);
}

void ioat_cleanup_event(unsigned long data)
{
	struct ioatdma_chan *ioat_chan = to_ioat_chan((void *)data);

	ioat_cleanup(ioat_chan);
	if (!test_bit(IOAT_RUN, &ioat_chan->state))
		return;
	writew(IOAT_CHANCTRL_RUN, ioat_chan->reg_base + IOAT_CHANCTRL_OFFSET);
}

static void ioat_restart_channel(struct ioatdma_chan *ioat_chan)
{
	u64 phys_complete;

	ioat_quiesce(ioat_chan, 0);
	if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
		__cleanup(ioat_chan, phys_complete);

	__ioat_restart_chan(ioat_chan);
}
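
/*
 * ioat_eh - channel error handler.  Reads CHANERR (and its PCI config
 * space copy), records validate failures in the descriptor's result
 * field, and treats anything it could not account for as fatal.  The
 * faulting descriptor is completed and the channel restarted from tail.
 */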
static void ioat_eh(struct ioatdma_chan *ioat_chan)
{
	struct pci_dev *pdev = to_pdev(ioat_chan);
	struct ioat_dma_descriptor *hw;
	struct dma_async_tx_descriptor *tx;
	u64 phys_complete;
	struct ioat_ring_ent *desc;
	u32 err_handled = 0;
	u32 chanerr_int;
	u32 chanerr;

	/* cleanup so tail points to descriptor that caused the error */
	if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
		__cleanup(ioat_chan, phys_complete);

	chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
	pci_read_config_dword(pdev, IOAT_PCI_CHANERR_INT_OFFSET, &chanerr_int);

	dev_dbg(to_dev(ioat_chan), "%s: error = %x:%x\n",
		__func__, chanerr, chanerr_int);

	desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail);
	hw = desc->hw;
	dump_desc_dbg(ioat_chan, desc);

	switch (hw->ctl_f.op) {
	case IOAT_OP_XOR_VAL:
		if (chanerr & IOAT_CHANERR_XOR_P_OR_CRC_ERR) {
			*desc->result |= SUM_CHECK_P_RESULT;
			err_handled |= IOAT_CHANERR_XOR_P_OR_CRC_ERR;
		}
		break;
	case IOAT_OP_PQ_VAL:
	case IOAT_OP_PQ_VAL_16S:
		if (chanerr & IOAT_CHANERR_XOR_P_OR_CRC_ERR) {
			*desc->result |= SUM_CHECK_P_RESULT;
			err_handled |= IOAT_CHANERR_XOR_P_OR_CRC_ERR;
		}
		if (chanerr & IOAT_CHANERR_XOR_Q_ERR) {
			*desc->result |= SUM_CHECK_Q_RESULT;
			err_handled |= IOAT_CHANERR_XOR_Q_ERR;
		}
		break;
	}

	/* fault on unhandled error or spurious halt */
	if (chanerr ^ err_handled || chanerr == 0) {
		dev_err(to_dev(ioat_chan), "%s: fatal error (%x:%x)\n",
			__func__, chanerr, err_handled);
		BUG();
	} else { /* cleanup the faulty descriptor */
		tx = &desc->txd;
		if (tx->cookie) {
			dma_cookie_complete(tx);
			dma_descriptor_unmap(tx);
			if (tx->callback) {
				tx->callback(tx->callback_param);
				tx->callback = NULL;
			}
		}
	}

	writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
	pci_write_config_dword(pdev, IOAT_PCI_CHANERR_INT_OFFSET, chanerr_int);

	/* mark faulting descriptor as complete */
	*ioat_chan->completion = desc->txd.phys;

	spin_lock_bh(&ioat_chan->prep_lock);
	ioat_restart_channel(ioat_chan);
	spin_unlock_bh(&ioat_chan->prep_lock);
}
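
/*
 * check_active - timer-context helper: re-arm the completion timeout while
 * work is outstanding, fall back to the idle timeout when the channel goes
 * quiet, and opportunistically shrink an oversized ring back toward the
 * default allocation order.
 */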
static void check_active(struct ioatdma_chan *ioat_chan)
{
	if (ioat_ring_active(ioat_chan)) {
		mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
		return;
	}

	if (test_and_clear_bit(IOAT_CHAN_ACTIVE, &ioat_chan->state))
		mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT);
	else if (ioat_chan->alloc_order > ioat_get_alloc_order()) {
		/* if the ring is idle, empty, and oversized try to step
		 * down the size
		 */
		reshape_ring(ioat_chan, ioat_chan->alloc_order - 1);

		/* keep shrinking until we get back to our minimum
		 * default size
		 */
		if (ioat_chan->alloc_order > ioat_get_alloc_order())
			mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT);
	}
}

void ioat_timer_event(unsigned long data)
{
	struct ioatdma_chan *ioat_chan = to_ioat_chan((void *)data);
	dma_addr_t phys_complete;
	u64 status;

	status = ioat_chansts(ioat_chan);

	/* when halted due to errors check for channel
	 * programming errors before advancing the completion state
	 */
	if (is_ioat_halted(status)) {
		u32 chanerr;

		chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
		dev_err(to_dev(ioat_chan), "%s: Channel halted (%x)\n",
			__func__, chanerr);
		if (test_bit(IOAT_RUN, &ioat_chan->state))
			BUG_ON(is_ioat_bug(chanerr));
		else /* we never got off the ground */
			return;
	}

	/* if we haven't made progress and we have already
	 * acknowledged a pending completion once, then be more
	 * forceful with a restart
	 */
	spin_lock_bh(&ioat_chan->cleanup_lock);
	if (ioat_cleanup_preamble(ioat_chan, &phys_complete))
		__cleanup(ioat_chan, phys_complete);
	else if (test_bit(IOAT_COMPLETION_ACK, &ioat_chan->state)) {
		spin_lock_bh(&ioat_chan->prep_lock);
		ioat_restart_channel(ioat_chan);
		spin_unlock_bh(&ioat_chan->prep_lock);
		spin_unlock_bh(&ioat_chan->cleanup_lock);
		return;
	} else {
		set_bit(IOAT_COMPLETION_ACK, &ioat_chan->state);
		mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
	}

	if (ioat_ring_active(ioat_chan))
		mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT);
	else {
		spin_lock_bh(&ioat_chan->prep_lock);
		check_active(ioat_chan);
		spin_unlock_bh(&ioat_chan->prep_lock);
	}
	spin_unlock_bh(&ioat_chan->cleanup_lock);
}

enum dma_status
ioat_tx_status(struct dma_chan *c, dma_cookie_t cookie,
	       struct dma_tx_state *txstate)
{
	struct ioatdma_chan *ioat_chan = to_ioat_chan(c);
	enum dma_status ret;

	ret = dma_cookie_status(c, cookie, txstate);
	if (ret == DMA_COMPLETE)
		return ret;

	ioat_cleanup(ioat_chan);

	return dma_cookie_status(c, cookie, txstate);
}
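
/*
 * ioat_irq_reinit - for devices flagged by is_bwd_ioat(), tear down the
 * current interrupt mode (MSI-X per channel, MSI, or INTx) and call
 * ioat_dma_setup_interrupts() to request vectors again from scratch.
 */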
static int ioat_irq_reinit(struct ioatdma_device *ioat_dma)
{
	struct pci_dev *pdev = ioat_dma->pdev;
	int irq = pdev->irq, i;

	if (!is_bwd_ioat(pdev))
		return 0;

	switch (ioat_dma->irq_mode) {
	case IOAT_MSIX:
		for (i = 0; i < ioat_dma->dma_dev.chancnt; i++) {
			struct msix_entry *msix = &ioat_dma->msix_entries[i];
			struct ioatdma_chan *ioat_chan;

			ioat_chan = ioat_chan_by_index(ioat_dma, i);
			devm_free_irq(&pdev->dev, msix->vector, ioat_chan);
		}

		pci_disable_msix(pdev);
		break;
	case IOAT_MSI:
		pci_disable_msi(pdev);
		/* fall through */
	case IOAT_INTX:
		devm_free_irq(&pdev->dev, irq, ioat_dma);
		break;
	default:
		return 0;
	}
	ioat_dma->irq_mode = IOAT_NOIRQ;

	return ioat_dma_setup_interrupts(ioat_dma);
}

int ioat_reset_hw(struct ioatdma_chan *ioat_chan)
{
	/* throw away whatever the channel was doing and get it
	 * initialized, with ioat3 specific workarounds
	 */
	struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma;
	struct pci_dev *pdev = ioat_dma->pdev;
	u32 chanerr;
	u16 dev_id;
	int err;

	ioat_quiesce(ioat_chan, msecs_to_jiffies(100));

	chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
	writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET);

	if (ioat_dma->version < IOAT_VER_3_3) {
		/* clear any pending errors */
		err = pci_read_config_dword(pdev,
				IOAT_PCI_CHANERR_INT_OFFSET, &chanerr);
		if (err) {
			dev_err(&pdev->dev,
				"channel error register unreachable\n");
			return err;
		}
		pci_write_config_dword(pdev,
				IOAT_PCI_CHANERR_INT_OFFSET, chanerr);

		/* Clear DMAUNCERRSTS Cfg-Reg Parity Error status bit
		 * (workaround for spurious config parity error after restart)
		 */
		pci_read_config_word(pdev, IOAT_PCI_DEVICE_ID_OFFSET, &dev_id);
		if (dev_id == PCI_DEVICE_ID_INTEL_IOAT_TBG0) {
			pci_write_config_dword(pdev,
					IOAT_PCI_DMAUNCERRSTS_OFFSET,
					0x10);
		}
	}

	err = ioat_reset_sync(ioat_chan, msecs_to_jiffies(200));
	if (!err)
		err = ioat_irq_reinit(ioat_dma);

	if (err)
		dev_err(&pdev->dev, "Failed to reset: %d\n", err);

	return err;
}