ARM: mm: Recreate kernel mappings in early_paging_init()
[linux/fpc-iii.git] / drivers / net / wireless / b43 / dma.c
blobc51d2dc489e45bd3a9b2aac36bf9fa2130453e72
1 /*
3 Broadcom B43 wireless driver
5 DMA ringbuffer and descriptor allocation/management
7 Copyright (c) 2005, 2006 Michael Buesch <m@bues.ch>
9 Some code in this file is derived from the b44.c driver
10 Copyright (C) 2002 David S. Miller
11 Copyright (C) Pekka Pietikainen
13 This program is free software; you can redistribute it and/or modify
14 it under the terms of the GNU General Public License as published by
15 the Free Software Foundation; either version 2 of the License, or
16 (at your option) any later version.
18 This program is distributed in the hope that it will be useful,
19 but WITHOUT ANY WARRANTY; without even the implied warranty of
20 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
21 GNU General Public License for more details.
23 You should have received a copy of the GNU General Public License
24 along with this program; see the file COPYING. If not, write to
25 the Free Software Foundation, Inc., 51 Franklin Steet, Fifth Floor,
26 Boston, MA 02110-1301, USA.
30 #include "b43.h"
31 #include "dma.h"
32 #include "main.h"
33 #include "debugfs.h"
34 #include "xmit.h"
36 #include <linux/dma-mapping.h>
37 #include <linux/pci.h>
38 #include <linux/delay.h>
39 #include <linux/skbuff.h>
40 #include <linux/etherdevice.h>
41 #include <linux/slab.h>
42 #include <asm/div64.h>
45 /* Required number of TX DMA slots per TX frame.
46 * This currently is 2, because we put the header and the ieee80211 frame
47 * into separate slots. */
48 #define TX_SLOTS_PER_FRAME 2
50 static u32 b43_dma_address(struct b43_dma *dma, dma_addr_t dmaaddr,
51 enum b43_addrtype addrtype)
53 u32 uninitialized_var(addr);
55 switch (addrtype) {
56 case B43_DMA_ADDR_LOW:
57 addr = lower_32_bits(dmaaddr);
58 if (dma->translation_in_low) {
59 addr &= ~SSB_DMA_TRANSLATION_MASK;
60 addr |= dma->translation;
62 break;
63 case B43_DMA_ADDR_HIGH:
64 addr = upper_32_bits(dmaaddr);
65 if (!dma->translation_in_low) {
66 addr &= ~SSB_DMA_TRANSLATION_MASK;
67 addr |= dma->translation;
69 break;
70 case B43_DMA_ADDR_EXT:
71 if (dma->translation_in_low)
72 addr = lower_32_bits(dmaaddr);
73 else
74 addr = upper_32_bits(dmaaddr);
75 addr &= SSB_DMA_TRANSLATION_MASK;
76 addr >>= SSB_DMA_TRANSLATION_SHIFT;
77 break;
80 return addr;
83 /* 32bit DMA ops. */
84 static
85 struct b43_dmadesc_generic *op32_idx2desc(struct b43_dmaring *ring,
86 int slot,
87 struct b43_dmadesc_meta **meta)
89 struct b43_dmadesc32 *desc;
91 *meta = &(ring->meta[slot]);
92 desc = ring->descbase;
93 desc = &(desc[slot]);
95 return (struct b43_dmadesc_generic *)desc;
98 static void op32_fill_descriptor(struct b43_dmaring *ring,
99 struct b43_dmadesc_generic *desc,
100 dma_addr_t dmaaddr, u16 bufsize,
101 int start, int end, int irq)
103 struct b43_dmadesc32 *descbase = ring->descbase;
104 int slot;
105 u32 ctl;
106 u32 addr;
107 u32 addrext;
109 slot = (int)(&(desc->dma32) - descbase);
110 B43_WARN_ON(!(slot >= 0 && slot < ring->nr_slots));
112 addr = b43_dma_address(&ring->dev->dma, dmaaddr, B43_DMA_ADDR_LOW);
113 addrext = b43_dma_address(&ring->dev->dma, dmaaddr, B43_DMA_ADDR_EXT);
115 ctl = bufsize & B43_DMA32_DCTL_BYTECNT;
116 if (slot == ring->nr_slots - 1)
117 ctl |= B43_DMA32_DCTL_DTABLEEND;
118 if (start)
119 ctl |= B43_DMA32_DCTL_FRAMESTART;
120 if (end)
121 ctl |= B43_DMA32_DCTL_FRAMEEND;
122 if (irq)
123 ctl |= B43_DMA32_DCTL_IRQ;
124 ctl |= (addrext << B43_DMA32_DCTL_ADDREXT_SHIFT)
125 & B43_DMA32_DCTL_ADDREXT_MASK;
127 desc->dma32.control = cpu_to_le32(ctl);
128 desc->dma32.address = cpu_to_le32(addr);
131 static void op32_poke_tx(struct b43_dmaring *ring, int slot)
133 b43_dma_write(ring, B43_DMA32_TXINDEX,
134 (u32) (slot * sizeof(struct b43_dmadesc32)));
137 static void op32_tx_suspend(struct b43_dmaring *ring)
139 b43_dma_write(ring, B43_DMA32_TXCTL, b43_dma_read(ring, B43_DMA32_TXCTL)
140 | B43_DMA32_TXSUSPEND);
143 static void op32_tx_resume(struct b43_dmaring *ring)
145 b43_dma_write(ring, B43_DMA32_TXCTL, b43_dma_read(ring, B43_DMA32_TXCTL)
146 & ~B43_DMA32_TXSUSPEND);
149 static int op32_get_current_rxslot(struct b43_dmaring *ring)
151 u32 val;
153 val = b43_dma_read(ring, B43_DMA32_RXSTATUS);
154 val &= B43_DMA32_RXDPTR;
156 return (val / sizeof(struct b43_dmadesc32));
159 static void op32_set_current_rxslot(struct b43_dmaring *ring, int slot)
161 b43_dma_write(ring, B43_DMA32_RXINDEX,
162 (u32) (slot * sizeof(struct b43_dmadesc32)));
165 static const struct b43_dma_ops dma32_ops = {
166 .idx2desc = op32_idx2desc,
167 .fill_descriptor = op32_fill_descriptor,
168 .poke_tx = op32_poke_tx,
169 .tx_suspend = op32_tx_suspend,
170 .tx_resume = op32_tx_resume,
171 .get_current_rxslot = op32_get_current_rxslot,
172 .set_current_rxslot = op32_set_current_rxslot,
175 /* 64bit DMA ops. */
176 static
177 struct b43_dmadesc_generic *op64_idx2desc(struct b43_dmaring *ring,
178 int slot,
179 struct b43_dmadesc_meta **meta)
181 struct b43_dmadesc64 *desc;
183 *meta = &(ring->meta[slot]);
184 desc = ring->descbase;
185 desc = &(desc[slot]);
187 return (struct b43_dmadesc_generic *)desc;
190 static void op64_fill_descriptor(struct b43_dmaring *ring,
191 struct b43_dmadesc_generic *desc,
192 dma_addr_t dmaaddr, u16 bufsize,
193 int start, int end, int irq)
195 struct b43_dmadesc64 *descbase = ring->descbase;
196 int slot;
197 u32 ctl0 = 0, ctl1 = 0;
198 u32 addrlo, addrhi;
199 u32 addrext;
201 slot = (int)(&(desc->dma64) - descbase);
202 B43_WARN_ON(!(slot >= 0 && slot < ring->nr_slots));
204 addrlo = b43_dma_address(&ring->dev->dma, dmaaddr, B43_DMA_ADDR_LOW);
205 addrhi = b43_dma_address(&ring->dev->dma, dmaaddr, B43_DMA_ADDR_HIGH);
206 addrext = b43_dma_address(&ring->dev->dma, dmaaddr, B43_DMA_ADDR_EXT);
208 if (slot == ring->nr_slots - 1)
209 ctl0 |= B43_DMA64_DCTL0_DTABLEEND;
210 if (start)
211 ctl0 |= B43_DMA64_DCTL0_FRAMESTART;
212 if (end)
213 ctl0 |= B43_DMA64_DCTL0_FRAMEEND;
214 if (irq)
215 ctl0 |= B43_DMA64_DCTL0_IRQ;
216 ctl1 |= bufsize & B43_DMA64_DCTL1_BYTECNT;
217 ctl1 |= (addrext << B43_DMA64_DCTL1_ADDREXT_SHIFT)
218 & B43_DMA64_DCTL1_ADDREXT_MASK;
220 desc->dma64.control0 = cpu_to_le32(ctl0);
221 desc->dma64.control1 = cpu_to_le32(ctl1);
222 desc->dma64.address_low = cpu_to_le32(addrlo);
223 desc->dma64.address_high = cpu_to_le32(addrhi);
226 static void op64_poke_tx(struct b43_dmaring *ring, int slot)
228 b43_dma_write(ring, B43_DMA64_TXINDEX,
229 (u32) (slot * sizeof(struct b43_dmadesc64)));
232 static void op64_tx_suspend(struct b43_dmaring *ring)
234 b43_dma_write(ring, B43_DMA64_TXCTL, b43_dma_read(ring, B43_DMA64_TXCTL)
235 | B43_DMA64_TXSUSPEND);
238 static void op64_tx_resume(struct b43_dmaring *ring)
240 b43_dma_write(ring, B43_DMA64_TXCTL, b43_dma_read(ring, B43_DMA64_TXCTL)
241 & ~B43_DMA64_TXSUSPEND);
244 static int op64_get_current_rxslot(struct b43_dmaring *ring)
246 u32 val;
248 val = b43_dma_read(ring, B43_DMA64_RXSTATUS);
249 val &= B43_DMA64_RXSTATDPTR;
251 return (val / sizeof(struct b43_dmadesc64));
254 static void op64_set_current_rxslot(struct b43_dmaring *ring, int slot)
256 b43_dma_write(ring, B43_DMA64_RXINDEX,
257 (u32) (slot * sizeof(struct b43_dmadesc64)));
260 static const struct b43_dma_ops dma64_ops = {
261 .idx2desc = op64_idx2desc,
262 .fill_descriptor = op64_fill_descriptor,
263 .poke_tx = op64_poke_tx,
264 .tx_suspend = op64_tx_suspend,
265 .tx_resume = op64_tx_resume,
266 .get_current_rxslot = op64_get_current_rxslot,
267 .set_current_rxslot = op64_set_current_rxslot,
270 static inline int free_slots(struct b43_dmaring *ring)
272 return (ring->nr_slots - ring->used_slots);
275 static inline int next_slot(struct b43_dmaring *ring, int slot)
277 B43_WARN_ON(!(slot >= -1 && slot <= ring->nr_slots - 1));
278 if (slot == ring->nr_slots - 1)
279 return 0;
280 return slot + 1;
283 static inline int prev_slot(struct b43_dmaring *ring, int slot)
285 B43_WARN_ON(!(slot >= 0 && slot <= ring->nr_slots - 1));
286 if (slot == 0)
287 return ring->nr_slots - 1;
288 return slot - 1;
291 #ifdef CONFIG_B43_DEBUG
292 static void update_max_used_slots(struct b43_dmaring *ring,
293 int current_used_slots)
295 if (current_used_slots <= ring->max_used_slots)
296 return;
297 ring->max_used_slots = current_used_slots;
298 if (b43_debug(ring->dev, B43_DBG_DMAVERBOSE)) {
299 b43dbg(ring->dev->wl,
300 "max_used_slots increased to %d on %s ring %d\n",
301 ring->max_used_slots,
302 ring->tx ? "TX" : "RX", ring->index);
305 #else
306 static inline
307 void update_max_used_slots(struct b43_dmaring *ring, int current_used_slots)
310 #endif /* DEBUG */
312 /* Request a slot for usage. */
313 static inline int request_slot(struct b43_dmaring *ring)
315 int slot;
317 B43_WARN_ON(!ring->tx);
318 B43_WARN_ON(ring->stopped);
319 B43_WARN_ON(free_slots(ring) == 0);
321 slot = next_slot(ring, ring->current_slot);
322 ring->current_slot = slot;
323 ring->used_slots++;
325 update_max_used_slots(ring, ring->used_slots);
327 return slot;
330 static u16 b43_dmacontroller_base(enum b43_dmatype type, int controller_idx)
332 static const u16 map64[] = {
333 B43_MMIO_DMA64_BASE0,
334 B43_MMIO_DMA64_BASE1,
335 B43_MMIO_DMA64_BASE2,
336 B43_MMIO_DMA64_BASE3,
337 B43_MMIO_DMA64_BASE4,
338 B43_MMIO_DMA64_BASE5,
340 static const u16 map32[] = {
341 B43_MMIO_DMA32_BASE0,
342 B43_MMIO_DMA32_BASE1,
343 B43_MMIO_DMA32_BASE2,
344 B43_MMIO_DMA32_BASE3,
345 B43_MMIO_DMA32_BASE4,
346 B43_MMIO_DMA32_BASE5,
349 if (type == B43_DMA_64BIT) {
350 B43_WARN_ON(!(controller_idx >= 0 &&
351 controller_idx < ARRAY_SIZE(map64)));
352 return map64[controller_idx];
354 B43_WARN_ON(!(controller_idx >= 0 &&
355 controller_idx < ARRAY_SIZE(map32)));
356 return map32[controller_idx];
359 static inline
360 dma_addr_t map_descbuffer(struct b43_dmaring *ring,
361 unsigned char *buf, size_t len, int tx)
363 dma_addr_t dmaaddr;
365 if (tx) {
366 dmaaddr = dma_map_single(ring->dev->dev->dma_dev,
367 buf, len, DMA_TO_DEVICE);
368 } else {
369 dmaaddr = dma_map_single(ring->dev->dev->dma_dev,
370 buf, len, DMA_FROM_DEVICE);
373 return dmaaddr;
376 static inline
377 void unmap_descbuffer(struct b43_dmaring *ring,
378 dma_addr_t addr, size_t len, int tx)
380 if (tx) {
381 dma_unmap_single(ring->dev->dev->dma_dev,
382 addr, len, DMA_TO_DEVICE);
383 } else {
384 dma_unmap_single(ring->dev->dev->dma_dev,
385 addr, len, DMA_FROM_DEVICE);
389 static inline
390 void sync_descbuffer_for_cpu(struct b43_dmaring *ring,
391 dma_addr_t addr, size_t len)
393 B43_WARN_ON(ring->tx);
394 dma_sync_single_for_cpu(ring->dev->dev->dma_dev,
395 addr, len, DMA_FROM_DEVICE);
398 static inline
399 void sync_descbuffer_for_device(struct b43_dmaring *ring,
400 dma_addr_t addr, size_t len)
402 B43_WARN_ON(ring->tx);
403 dma_sync_single_for_device(ring->dev->dev->dma_dev,
404 addr, len, DMA_FROM_DEVICE);
407 static inline
408 void free_descriptor_buffer(struct b43_dmaring *ring,
409 struct b43_dmadesc_meta *meta)
411 if (meta->skb) {
412 if (ring->tx)
413 ieee80211_free_txskb(ring->dev->wl->hw, meta->skb);
414 else
415 dev_kfree_skb_any(meta->skb);
416 meta->skb = NULL;
420 static int alloc_ringmemory(struct b43_dmaring *ring)
422 /* The specs call for 4K buffers for 30- and 32-bit DMA with 4K
423 * alignment and 8K buffers for 64-bit DMA with 8K alignment.
424 * In practice we could use smaller buffers for the latter, but the
425 * alignment is really important because of the hardware bug. If bit
426 * 0x00001000 is used in DMA address, some hardware (like BCM4331)
427 * copies that bit into B43_DMA64_RXSTATUS and we get false values from
428 * B43_DMA64_RXSTATDPTR. Let's just use 8K buffers even if we don't use
429 * more than 256 slots for ring.
431 u16 ring_mem_size = (ring->type == B43_DMA_64BIT) ?
432 B43_DMA64_RINGMEMSIZE : B43_DMA32_RINGMEMSIZE;
434 ring->descbase = dma_zalloc_coherent(ring->dev->dev->dma_dev,
435 ring_mem_size, &(ring->dmabase),
436 GFP_KERNEL);
437 if (!ring->descbase)
438 return -ENOMEM;
440 return 0;
443 static void free_ringmemory(struct b43_dmaring *ring)
445 u16 ring_mem_size = (ring->type == B43_DMA_64BIT) ?
446 B43_DMA64_RINGMEMSIZE : B43_DMA32_RINGMEMSIZE;
447 dma_free_coherent(ring->dev->dev->dma_dev, ring_mem_size,
448 ring->descbase, ring->dmabase);
451 /* Reset the RX DMA channel */
452 static int b43_dmacontroller_rx_reset(struct b43_wldev *dev, u16 mmio_base,
453 enum b43_dmatype type)
455 int i;
456 u32 value;
457 u16 offset;
459 might_sleep();
461 offset = (type == B43_DMA_64BIT) ? B43_DMA64_RXCTL : B43_DMA32_RXCTL;
462 b43_write32(dev, mmio_base + offset, 0);
463 for (i = 0; i < 10; i++) {
464 offset = (type == B43_DMA_64BIT) ? B43_DMA64_RXSTATUS :
465 B43_DMA32_RXSTATUS;
466 value = b43_read32(dev, mmio_base + offset);
467 if (type == B43_DMA_64BIT) {
468 value &= B43_DMA64_RXSTAT;
469 if (value == B43_DMA64_RXSTAT_DISABLED) {
470 i = -1;
471 break;
473 } else {
474 value &= B43_DMA32_RXSTATE;
475 if (value == B43_DMA32_RXSTAT_DISABLED) {
476 i = -1;
477 break;
480 msleep(1);
482 if (i != -1) {
483 b43err(dev->wl, "DMA RX reset timed out\n");
484 return -ENODEV;
487 return 0;
490 /* Reset the TX DMA channel */
491 static int b43_dmacontroller_tx_reset(struct b43_wldev *dev, u16 mmio_base,
492 enum b43_dmatype type)
494 int i;
495 u32 value;
496 u16 offset;
498 might_sleep();
500 for (i = 0; i < 10; i++) {
501 offset = (type == B43_DMA_64BIT) ? B43_DMA64_TXSTATUS :
502 B43_DMA32_TXSTATUS;
503 value = b43_read32(dev, mmio_base + offset);
504 if (type == B43_DMA_64BIT) {
505 value &= B43_DMA64_TXSTAT;
506 if (value == B43_DMA64_TXSTAT_DISABLED ||
507 value == B43_DMA64_TXSTAT_IDLEWAIT ||
508 value == B43_DMA64_TXSTAT_STOPPED)
509 break;
510 } else {
511 value &= B43_DMA32_TXSTATE;
512 if (value == B43_DMA32_TXSTAT_DISABLED ||
513 value == B43_DMA32_TXSTAT_IDLEWAIT ||
514 value == B43_DMA32_TXSTAT_STOPPED)
515 break;
517 msleep(1);
519 offset = (type == B43_DMA_64BIT) ? B43_DMA64_TXCTL : B43_DMA32_TXCTL;
520 b43_write32(dev, mmio_base + offset, 0);
521 for (i = 0; i < 10; i++) {
522 offset = (type == B43_DMA_64BIT) ? B43_DMA64_TXSTATUS :
523 B43_DMA32_TXSTATUS;
524 value = b43_read32(dev, mmio_base + offset);
525 if (type == B43_DMA_64BIT) {
526 value &= B43_DMA64_TXSTAT;
527 if (value == B43_DMA64_TXSTAT_DISABLED) {
528 i = -1;
529 break;
531 } else {
532 value &= B43_DMA32_TXSTATE;
533 if (value == B43_DMA32_TXSTAT_DISABLED) {
534 i = -1;
535 break;
538 msleep(1);
540 if (i != -1) {
541 b43err(dev->wl, "DMA TX reset timed out\n");
542 return -ENODEV;
544 /* ensure the reset is completed. */
545 msleep(1);
547 return 0;
550 /* Check if a DMA mapping address is invalid. */
551 static bool b43_dma_mapping_error(struct b43_dmaring *ring,
552 dma_addr_t addr,
553 size_t buffersize, bool dma_to_device)
555 if (unlikely(dma_mapping_error(ring->dev->dev->dma_dev, addr)))
556 return 1;
558 switch (ring->type) {
559 case B43_DMA_30BIT:
560 if ((u64)addr + buffersize > (1ULL << 30))
561 goto address_error;
562 break;
563 case B43_DMA_32BIT:
564 if ((u64)addr + buffersize > (1ULL << 32))
565 goto address_error;
566 break;
567 case B43_DMA_64BIT:
568 /* Currently we can't have addresses beyond
569 * 64bit in the kernel. */
570 break;
573 /* The address is OK. */
574 return 0;
576 address_error:
577 /* We can't support this address. Unmap it again. */
578 unmap_descbuffer(ring, addr, buffersize, dma_to_device);
580 return 1;
583 static bool b43_rx_buffer_is_poisoned(struct b43_dmaring *ring, struct sk_buff *skb)
585 unsigned char *f = skb->data + ring->frameoffset;
587 return ((f[0] & f[1] & f[2] & f[3] & f[4] & f[5] & f[6] & f[7]) == 0xFF);
590 static void b43_poison_rx_buffer(struct b43_dmaring *ring, struct sk_buff *skb)
592 struct b43_rxhdr_fw4 *rxhdr;
593 unsigned char *frame;
595 /* This poisons the RX buffer to detect DMA failures. */
597 rxhdr = (struct b43_rxhdr_fw4 *)(skb->data);
598 rxhdr->frame_len = 0;
600 B43_WARN_ON(ring->rx_buffersize < ring->frameoffset + sizeof(struct b43_plcp_hdr6) + 2);
601 frame = skb->data + ring->frameoffset;
602 memset(frame, 0xFF, sizeof(struct b43_plcp_hdr6) + 2 /* padding */);
605 static int setup_rx_descbuffer(struct b43_dmaring *ring,
606 struct b43_dmadesc_generic *desc,
607 struct b43_dmadesc_meta *meta, gfp_t gfp_flags)
609 dma_addr_t dmaaddr;
610 struct sk_buff *skb;
612 B43_WARN_ON(ring->tx);
614 skb = __dev_alloc_skb(ring->rx_buffersize, gfp_flags);
615 if (unlikely(!skb))
616 return -ENOMEM;
617 b43_poison_rx_buffer(ring, skb);
618 dmaaddr = map_descbuffer(ring, skb->data, ring->rx_buffersize, 0);
619 if (b43_dma_mapping_error(ring, dmaaddr, ring->rx_buffersize, 0)) {
620 /* ugh. try to realloc in zone_dma */
621 gfp_flags |= GFP_DMA;
623 dev_kfree_skb_any(skb);
625 skb = __dev_alloc_skb(ring->rx_buffersize, gfp_flags);
626 if (unlikely(!skb))
627 return -ENOMEM;
628 b43_poison_rx_buffer(ring, skb);
629 dmaaddr = map_descbuffer(ring, skb->data,
630 ring->rx_buffersize, 0);
631 if (b43_dma_mapping_error(ring, dmaaddr, ring->rx_buffersize, 0)) {
632 b43err(ring->dev->wl, "RX DMA buffer allocation failed\n");
633 dev_kfree_skb_any(skb);
634 return -EIO;
638 meta->skb = skb;
639 meta->dmaaddr = dmaaddr;
640 ring->ops->fill_descriptor(ring, desc, dmaaddr,
641 ring->rx_buffersize, 0, 0, 0);
643 return 0;
646 /* Allocate the initial descbuffers.
647 * This is used for an RX ring only.
649 static int alloc_initial_descbuffers(struct b43_dmaring *ring)
651 int i, err = -ENOMEM;
652 struct b43_dmadesc_generic *desc;
653 struct b43_dmadesc_meta *meta;
655 for (i = 0; i < ring->nr_slots; i++) {
656 desc = ring->ops->idx2desc(ring, i, &meta);
658 err = setup_rx_descbuffer(ring, desc, meta, GFP_KERNEL);
659 if (err) {
660 b43err(ring->dev->wl,
661 "Failed to allocate initial descbuffers\n");
662 goto err_unwind;
665 mb();
666 ring->used_slots = ring->nr_slots;
667 err = 0;
668 out:
669 return err;
671 err_unwind:
672 for (i--; i >= 0; i--) {
673 desc = ring->ops->idx2desc(ring, i, &meta);
675 unmap_descbuffer(ring, meta->dmaaddr, ring->rx_buffersize, 0);
676 dev_kfree_skb(meta->skb);
678 goto out;
681 /* Do initial setup of the DMA controller.
682 * Reset the controller, write the ring busaddress
683 * and switch the "enable" bit on.
685 static int dmacontroller_setup(struct b43_dmaring *ring)
687 int err = 0;
688 u32 value;
689 u32 addrext;
690 bool parity = ring->dev->dma.parity;
691 u32 addrlo;
692 u32 addrhi;
694 if (ring->tx) {
695 if (ring->type == B43_DMA_64BIT) {
696 u64 ringbase = (u64) (ring->dmabase);
697 addrext = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_EXT);
698 addrlo = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_LOW);
699 addrhi = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_HIGH);
701 value = B43_DMA64_TXENABLE;
702 value |= (addrext << B43_DMA64_TXADDREXT_SHIFT)
703 & B43_DMA64_TXADDREXT_MASK;
704 if (!parity)
705 value |= B43_DMA64_TXPARITYDISABLE;
706 b43_dma_write(ring, B43_DMA64_TXCTL, value);
707 b43_dma_write(ring, B43_DMA64_TXRINGLO, addrlo);
708 b43_dma_write(ring, B43_DMA64_TXRINGHI, addrhi);
709 } else {
710 u32 ringbase = (u32) (ring->dmabase);
711 addrext = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_EXT);
712 addrlo = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_LOW);
714 value = B43_DMA32_TXENABLE;
715 value |= (addrext << B43_DMA32_TXADDREXT_SHIFT)
716 & B43_DMA32_TXADDREXT_MASK;
717 if (!parity)
718 value |= B43_DMA32_TXPARITYDISABLE;
719 b43_dma_write(ring, B43_DMA32_TXCTL, value);
720 b43_dma_write(ring, B43_DMA32_TXRING, addrlo);
722 } else {
723 err = alloc_initial_descbuffers(ring);
724 if (err)
725 goto out;
726 if (ring->type == B43_DMA_64BIT) {
727 u64 ringbase = (u64) (ring->dmabase);
728 addrext = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_EXT);
729 addrlo = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_LOW);
730 addrhi = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_HIGH);
732 value = (ring->frameoffset << B43_DMA64_RXFROFF_SHIFT);
733 value |= B43_DMA64_RXENABLE;
734 value |= (addrext << B43_DMA64_RXADDREXT_SHIFT)
735 & B43_DMA64_RXADDREXT_MASK;
736 if (!parity)
737 value |= B43_DMA64_RXPARITYDISABLE;
738 b43_dma_write(ring, B43_DMA64_RXCTL, value);
739 b43_dma_write(ring, B43_DMA64_RXRINGLO, addrlo);
740 b43_dma_write(ring, B43_DMA64_RXRINGHI, addrhi);
741 b43_dma_write(ring, B43_DMA64_RXINDEX, ring->nr_slots *
742 sizeof(struct b43_dmadesc64));
743 } else {
744 u32 ringbase = (u32) (ring->dmabase);
745 addrext = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_EXT);
746 addrlo = b43_dma_address(&ring->dev->dma, ringbase, B43_DMA_ADDR_LOW);
748 value = (ring->frameoffset << B43_DMA32_RXFROFF_SHIFT);
749 value |= B43_DMA32_RXENABLE;
750 value |= (addrext << B43_DMA32_RXADDREXT_SHIFT)
751 & B43_DMA32_RXADDREXT_MASK;
752 if (!parity)
753 value |= B43_DMA32_RXPARITYDISABLE;
754 b43_dma_write(ring, B43_DMA32_RXCTL, value);
755 b43_dma_write(ring, B43_DMA32_RXRING, addrlo);
756 b43_dma_write(ring, B43_DMA32_RXINDEX, ring->nr_slots *
757 sizeof(struct b43_dmadesc32));
761 out:
762 return err;
765 /* Shutdown the DMA controller. */
766 static void dmacontroller_cleanup(struct b43_dmaring *ring)
768 if (ring->tx) {
769 b43_dmacontroller_tx_reset(ring->dev, ring->mmio_base,
770 ring->type);
771 if (ring->type == B43_DMA_64BIT) {
772 b43_dma_write(ring, B43_DMA64_TXRINGLO, 0);
773 b43_dma_write(ring, B43_DMA64_TXRINGHI, 0);
774 } else
775 b43_dma_write(ring, B43_DMA32_TXRING, 0);
776 } else {
777 b43_dmacontroller_rx_reset(ring->dev, ring->mmio_base,
778 ring->type);
779 if (ring->type == B43_DMA_64BIT) {
780 b43_dma_write(ring, B43_DMA64_RXRINGLO, 0);
781 b43_dma_write(ring, B43_DMA64_RXRINGHI, 0);
782 } else
783 b43_dma_write(ring, B43_DMA32_RXRING, 0);
787 static void free_all_descbuffers(struct b43_dmaring *ring)
789 struct b43_dmadesc_meta *meta;
790 int i;
792 if (!ring->used_slots)
793 return;
794 for (i = 0; i < ring->nr_slots; i++) {
795 /* get meta - ignore returned value */
796 ring->ops->idx2desc(ring, i, &meta);
798 if (!meta->skb || b43_dma_ptr_is_poisoned(meta->skb)) {
799 B43_WARN_ON(!ring->tx);
800 continue;
802 if (ring->tx) {
803 unmap_descbuffer(ring, meta->dmaaddr,
804 meta->skb->len, 1);
805 } else {
806 unmap_descbuffer(ring, meta->dmaaddr,
807 ring->rx_buffersize, 0);
809 free_descriptor_buffer(ring, meta);
813 static u64 supported_dma_mask(struct b43_wldev *dev)
815 u32 tmp;
816 u16 mmio_base;
818 switch (dev->dev->bus_type) {
819 #ifdef CONFIG_B43_BCMA
820 case B43_BUS_BCMA:
821 tmp = bcma_aread32(dev->dev->bdev, BCMA_IOST);
822 if (tmp & BCMA_IOST_DMA64)
823 return DMA_BIT_MASK(64);
824 break;
825 #endif
826 #ifdef CONFIG_B43_SSB
827 case B43_BUS_SSB:
828 tmp = ssb_read32(dev->dev->sdev, SSB_TMSHIGH);
829 if (tmp & SSB_TMSHIGH_DMA64)
830 return DMA_BIT_MASK(64);
831 break;
832 #endif
835 mmio_base = b43_dmacontroller_base(0, 0);
836 b43_write32(dev, mmio_base + B43_DMA32_TXCTL, B43_DMA32_TXADDREXT_MASK);
837 tmp = b43_read32(dev, mmio_base + B43_DMA32_TXCTL);
838 if (tmp & B43_DMA32_TXADDREXT_MASK)
839 return DMA_BIT_MASK(32);
841 return DMA_BIT_MASK(30);
844 static enum b43_dmatype dma_mask_to_engine_type(u64 dmamask)
846 if (dmamask == DMA_BIT_MASK(30))
847 return B43_DMA_30BIT;
848 if (dmamask == DMA_BIT_MASK(32))
849 return B43_DMA_32BIT;
850 if (dmamask == DMA_BIT_MASK(64))
851 return B43_DMA_64BIT;
852 B43_WARN_ON(1);
853 return B43_DMA_30BIT;
856 /* Main initialization function. */
857 static
858 struct b43_dmaring *b43_setup_dmaring(struct b43_wldev *dev,
859 int controller_index,
860 int for_tx,
861 enum b43_dmatype type)
863 struct b43_dmaring *ring;
864 int i, err;
865 dma_addr_t dma_test;
867 ring = kzalloc(sizeof(*ring), GFP_KERNEL);
868 if (!ring)
869 goto out;
871 ring->nr_slots = B43_RXRING_SLOTS;
872 if (for_tx)
873 ring->nr_slots = B43_TXRING_SLOTS;
875 ring->meta = kcalloc(ring->nr_slots, sizeof(struct b43_dmadesc_meta),
876 GFP_KERNEL);
877 if (!ring->meta)
878 goto err_kfree_ring;
879 for (i = 0; i < ring->nr_slots; i++)
880 ring->meta->skb = B43_DMA_PTR_POISON;
882 ring->type = type;
883 ring->dev = dev;
884 ring->mmio_base = b43_dmacontroller_base(type, controller_index);
885 ring->index = controller_index;
886 if (type == B43_DMA_64BIT)
887 ring->ops = &dma64_ops;
888 else
889 ring->ops = &dma32_ops;
890 if (for_tx) {
891 ring->tx = true;
892 ring->current_slot = -1;
893 } else {
894 if (ring->index == 0) {
895 switch (dev->fw.hdr_format) {
896 case B43_FW_HDR_598:
897 ring->rx_buffersize = B43_DMA0_RX_FW598_BUFSIZE;
898 ring->frameoffset = B43_DMA0_RX_FW598_FO;
899 break;
900 case B43_FW_HDR_410:
901 case B43_FW_HDR_351:
902 ring->rx_buffersize = B43_DMA0_RX_FW351_BUFSIZE;
903 ring->frameoffset = B43_DMA0_RX_FW351_FO;
904 break;
906 } else
907 B43_WARN_ON(1);
909 #ifdef CONFIG_B43_DEBUG
910 ring->last_injected_overflow = jiffies;
911 #endif
913 if (for_tx) {
914 /* Assumption: B43_TXRING_SLOTS can be divided by TX_SLOTS_PER_FRAME */
915 BUILD_BUG_ON(B43_TXRING_SLOTS % TX_SLOTS_PER_FRAME != 0);
917 ring->txhdr_cache = kcalloc(ring->nr_slots / TX_SLOTS_PER_FRAME,
918 b43_txhdr_size(dev),
919 GFP_KERNEL);
920 if (!ring->txhdr_cache)
921 goto err_kfree_meta;
923 /* test for ability to dma to txhdr_cache */
924 dma_test = dma_map_single(dev->dev->dma_dev,
925 ring->txhdr_cache,
926 b43_txhdr_size(dev),
927 DMA_TO_DEVICE);
929 if (b43_dma_mapping_error(ring, dma_test,
930 b43_txhdr_size(dev), 1)) {
931 /* ugh realloc */
932 kfree(ring->txhdr_cache);
933 ring->txhdr_cache = kcalloc(ring->nr_slots / TX_SLOTS_PER_FRAME,
934 b43_txhdr_size(dev),
935 GFP_KERNEL | GFP_DMA);
936 if (!ring->txhdr_cache)
937 goto err_kfree_meta;
939 dma_test = dma_map_single(dev->dev->dma_dev,
940 ring->txhdr_cache,
941 b43_txhdr_size(dev),
942 DMA_TO_DEVICE);
944 if (b43_dma_mapping_error(ring, dma_test,
945 b43_txhdr_size(dev), 1)) {
947 b43err(dev->wl,
948 "TXHDR DMA allocation failed\n");
949 goto err_kfree_txhdr_cache;
953 dma_unmap_single(dev->dev->dma_dev,
954 dma_test, b43_txhdr_size(dev),
955 DMA_TO_DEVICE);
958 err = alloc_ringmemory(ring);
959 if (err)
960 goto err_kfree_txhdr_cache;
961 err = dmacontroller_setup(ring);
962 if (err)
963 goto err_free_ringmemory;
965 out:
966 return ring;
968 err_free_ringmemory:
969 free_ringmemory(ring);
970 err_kfree_txhdr_cache:
971 kfree(ring->txhdr_cache);
972 err_kfree_meta:
973 kfree(ring->meta);
974 err_kfree_ring:
975 kfree(ring);
976 ring = NULL;
977 goto out;
980 #define divide(a, b) ({ \
981 typeof(a) __a = a; \
982 do_div(__a, b); \
983 __a; \
986 #define modulo(a, b) ({ \
987 typeof(a) __a = a; \
988 do_div(__a, b); \
991 /* Main cleanup function. */
992 static void b43_destroy_dmaring(struct b43_dmaring *ring,
993 const char *ringname)
995 if (!ring)
996 return;
998 #ifdef CONFIG_B43_DEBUG
1000 /* Print some statistics. */
1001 u64 failed_packets = ring->nr_failed_tx_packets;
1002 u64 succeed_packets = ring->nr_succeed_tx_packets;
1003 u64 nr_packets = failed_packets + succeed_packets;
1004 u64 permille_failed = 0, average_tries = 0;
1006 if (nr_packets)
1007 permille_failed = divide(failed_packets * 1000, nr_packets);
1008 if (nr_packets)
1009 average_tries = divide(ring->nr_total_packet_tries * 100, nr_packets);
1011 b43dbg(ring->dev->wl, "DMA-%u %s: "
1012 "Used slots %d/%d, Failed frames %llu/%llu = %llu.%01llu%%, "
1013 "Average tries %llu.%02llu\n",
1014 (unsigned int)(ring->type), ringname,
1015 ring->max_used_slots,
1016 ring->nr_slots,
1017 (unsigned long long)failed_packets,
1018 (unsigned long long)nr_packets,
1019 (unsigned long long)divide(permille_failed, 10),
1020 (unsigned long long)modulo(permille_failed, 10),
1021 (unsigned long long)divide(average_tries, 100),
1022 (unsigned long long)modulo(average_tries, 100));
1024 #endif /* DEBUG */
1026 /* Device IRQs are disabled prior entering this function,
1027 * so no need to take care of concurrency with rx handler stuff.
1029 dmacontroller_cleanup(ring);
1030 free_all_descbuffers(ring);
1031 free_ringmemory(ring);
1033 kfree(ring->txhdr_cache);
1034 kfree(ring->meta);
1035 kfree(ring);
1038 #define destroy_ring(dma, ring) do { \
1039 b43_destroy_dmaring((dma)->ring, __stringify(ring)); \
1040 (dma)->ring = NULL; \
1041 } while (0)
1043 void b43_dma_free(struct b43_wldev *dev)
1045 struct b43_dma *dma;
1047 if (b43_using_pio_transfers(dev))
1048 return;
1049 dma = &dev->dma;
1051 destroy_ring(dma, rx_ring);
1052 destroy_ring(dma, tx_ring_AC_BK);
1053 destroy_ring(dma, tx_ring_AC_BE);
1054 destroy_ring(dma, tx_ring_AC_VI);
1055 destroy_ring(dma, tx_ring_AC_VO);
1056 destroy_ring(dma, tx_ring_mcast);
1059 static int b43_dma_set_mask(struct b43_wldev *dev, u64 mask)
1061 u64 orig_mask = mask;
1062 bool fallback = false;
1063 int err;
1065 /* Try to set the DMA mask. If it fails, try falling back to a
1066 * lower mask, as we can always also support a lower one. */
1067 while (1) {
1068 err = dma_set_mask(dev->dev->dma_dev, mask);
1069 if (!err) {
1070 err = dma_set_coherent_mask(dev->dev->dma_dev, mask);
1071 if (!err)
1072 break;
1074 if (mask == DMA_BIT_MASK(64)) {
1075 mask = DMA_BIT_MASK(32);
1076 fallback = true;
1077 continue;
1079 if (mask == DMA_BIT_MASK(32)) {
1080 mask = DMA_BIT_MASK(30);
1081 fallback = true;
1082 continue;
1084 b43err(dev->wl, "The machine/kernel does not support "
1085 "the required %u-bit DMA mask\n",
1086 (unsigned int)dma_mask_to_engine_type(orig_mask));
1087 return -EOPNOTSUPP;
1089 if (fallback) {
1090 b43info(dev->wl, "DMA mask fallback from %u-bit to %u-bit\n",
1091 (unsigned int)dma_mask_to_engine_type(orig_mask),
1092 (unsigned int)dma_mask_to_engine_type(mask));
1095 return 0;
1098 /* Some hardware with 64-bit DMA seems to be bugged and looks for translation
1099 * bit in low address word instead of high one.
1101 static bool b43_dma_translation_in_low_word(struct b43_wldev *dev,
1102 enum b43_dmatype type)
1104 if (type != B43_DMA_64BIT)
1105 return 1;
1107 #ifdef CONFIG_B43_SSB
1108 if (dev->dev->bus_type == B43_BUS_SSB &&
1109 dev->dev->sdev->bus->bustype == SSB_BUSTYPE_PCI &&
1110 !(pci_is_pcie(dev->dev->sdev->bus->host_pci) &&
1111 ssb_read32(dev->dev->sdev, SSB_TMSHIGH) & SSB_TMSHIGH_DMA64))
1112 return 1;
1113 #endif
1114 return 0;
1117 int b43_dma_init(struct b43_wldev *dev)
1119 struct b43_dma *dma = &dev->dma;
1120 int err;
1121 u64 dmamask;
1122 enum b43_dmatype type;
1124 dmamask = supported_dma_mask(dev);
1125 type = dma_mask_to_engine_type(dmamask);
1126 err = b43_dma_set_mask(dev, dmamask);
1127 if (err)
1128 return err;
1130 switch (dev->dev->bus_type) {
1131 #ifdef CONFIG_B43_BCMA
1132 case B43_BUS_BCMA:
1133 dma->translation = bcma_core_dma_translation(dev->dev->bdev);
1134 break;
1135 #endif
1136 #ifdef CONFIG_B43_SSB
1137 case B43_BUS_SSB:
1138 dma->translation = ssb_dma_translation(dev->dev->sdev);
1139 break;
1140 #endif
1142 dma->translation_in_low = b43_dma_translation_in_low_word(dev, type);
1144 dma->parity = true;
1145 #ifdef CONFIG_B43_BCMA
1146 /* TODO: find out which SSB devices need disabling parity */
1147 if (dev->dev->bus_type == B43_BUS_BCMA)
1148 dma->parity = false;
1149 #endif
1151 err = -ENOMEM;
1152 /* setup TX DMA channels. */
1153 dma->tx_ring_AC_BK = b43_setup_dmaring(dev, 0, 1, type);
1154 if (!dma->tx_ring_AC_BK)
1155 goto out;
1157 dma->tx_ring_AC_BE = b43_setup_dmaring(dev, 1, 1, type);
1158 if (!dma->tx_ring_AC_BE)
1159 goto err_destroy_bk;
1161 dma->tx_ring_AC_VI = b43_setup_dmaring(dev, 2, 1, type);
1162 if (!dma->tx_ring_AC_VI)
1163 goto err_destroy_be;
1165 dma->tx_ring_AC_VO = b43_setup_dmaring(dev, 3, 1, type);
1166 if (!dma->tx_ring_AC_VO)
1167 goto err_destroy_vi;
1169 dma->tx_ring_mcast = b43_setup_dmaring(dev, 4, 1, type);
1170 if (!dma->tx_ring_mcast)
1171 goto err_destroy_vo;
1173 /* setup RX DMA channel. */
1174 dma->rx_ring = b43_setup_dmaring(dev, 0, 0, type);
1175 if (!dma->rx_ring)
1176 goto err_destroy_mcast;
1178 /* No support for the TX status DMA ring. */
1179 B43_WARN_ON(dev->dev->core_rev < 5);
1181 b43dbg(dev->wl, "%u-bit DMA initialized\n",
1182 (unsigned int)type);
1183 err = 0;
1184 out:
1185 return err;
1187 err_destroy_mcast:
1188 destroy_ring(dma, tx_ring_mcast);
1189 err_destroy_vo:
1190 destroy_ring(dma, tx_ring_AC_VO);
1191 err_destroy_vi:
1192 destroy_ring(dma, tx_ring_AC_VI);
1193 err_destroy_be:
1194 destroy_ring(dma, tx_ring_AC_BE);
1195 err_destroy_bk:
1196 destroy_ring(dma, tx_ring_AC_BK);
1197 return err;
1200 /* Generate a cookie for the TX header. */
1201 static u16 generate_cookie(struct b43_dmaring *ring, int slot)
1203 u16 cookie;
1205 /* Use the upper 4 bits of the cookie as
1206 * DMA controller ID and store the slot number
1207 * in the lower 12 bits.
1208 * Note that the cookie must never be 0, as this
1209 * is a special value used in RX path.
1210 * It can also not be 0xFFFF because that is special
1211 * for multicast frames.
1213 cookie = (((u16)ring->index + 1) << 12);
1214 B43_WARN_ON(slot & ~0x0FFF);
1215 cookie |= (u16)slot;
1217 return cookie;
1220 /* Inspect a cookie and find out to which controller/slot it belongs. */
1221 static
1222 struct b43_dmaring *parse_cookie(struct b43_wldev *dev, u16 cookie, int *slot)
1224 struct b43_dma *dma = &dev->dma;
1225 struct b43_dmaring *ring = NULL;
1227 switch (cookie & 0xF000) {
1228 case 0x1000:
1229 ring = dma->tx_ring_AC_BK;
1230 break;
1231 case 0x2000:
1232 ring = dma->tx_ring_AC_BE;
1233 break;
1234 case 0x3000:
1235 ring = dma->tx_ring_AC_VI;
1236 break;
1237 case 0x4000:
1238 ring = dma->tx_ring_AC_VO;
1239 break;
1240 case 0x5000:
1241 ring = dma->tx_ring_mcast;
1242 break;
1244 *slot = (cookie & 0x0FFF);
1245 if (unlikely(!ring || *slot < 0 || *slot >= ring->nr_slots)) {
1246 b43dbg(dev->wl, "TX-status contains "
1247 "invalid cookie: 0x%04X\n", cookie);
1248 return NULL;
1251 return ring;
1254 static int dma_tx_fragment(struct b43_dmaring *ring,
1255 struct sk_buff *skb)
1257 const struct b43_dma_ops *ops = ring->ops;
1258 struct ieee80211_tx_info *info = IEEE80211_SKB_CB(skb);
1259 struct b43_private_tx_info *priv_info = b43_get_priv_tx_info(info);
1260 u8 *header;
1261 int slot, old_top_slot, old_used_slots;
1262 int err;
1263 struct b43_dmadesc_generic *desc;
1264 struct b43_dmadesc_meta *meta;
1265 struct b43_dmadesc_meta *meta_hdr;
1266 u16 cookie;
1267 size_t hdrsize = b43_txhdr_size(ring->dev);
1269 /* Important note: If the number of used DMA slots per TX frame
1270 * is changed here, the TX_SLOTS_PER_FRAME definition at the top of
1271 * the file has to be updated, too!
1274 old_top_slot = ring->current_slot;
1275 old_used_slots = ring->used_slots;
1277 /* Get a slot for the header. */
1278 slot = request_slot(ring);
1279 desc = ops->idx2desc(ring, slot, &meta_hdr);
1280 memset(meta_hdr, 0, sizeof(*meta_hdr));
1282 header = &(ring->txhdr_cache[(slot / TX_SLOTS_PER_FRAME) * hdrsize]);
1283 cookie = generate_cookie(ring, slot);
1284 err = b43_generate_txhdr(ring->dev, header,
1285 skb, info, cookie);
1286 if (unlikely(err)) {
1287 ring->current_slot = old_top_slot;
1288 ring->used_slots = old_used_slots;
1289 return err;
1292 meta_hdr->dmaaddr = map_descbuffer(ring, (unsigned char *)header,
1293 hdrsize, 1);
1294 if (b43_dma_mapping_error(ring, meta_hdr->dmaaddr, hdrsize, 1)) {
1295 ring->current_slot = old_top_slot;
1296 ring->used_slots = old_used_slots;
1297 return -EIO;
1299 ops->fill_descriptor(ring, desc, meta_hdr->dmaaddr,
1300 hdrsize, 1, 0, 0);
1302 /* Get a slot for the payload. */
1303 slot = request_slot(ring);
1304 desc = ops->idx2desc(ring, slot, &meta);
1305 memset(meta, 0, sizeof(*meta));
1307 meta->skb = skb;
1308 meta->is_last_fragment = true;
1309 priv_info->bouncebuffer = NULL;
1311 meta->dmaaddr = map_descbuffer(ring, skb->data, skb->len, 1);
1312 /* create a bounce buffer in zone_dma on mapping failure. */
1313 if (b43_dma_mapping_error(ring, meta->dmaaddr, skb->len, 1)) {
1314 priv_info->bouncebuffer = kmemdup(skb->data, skb->len,
1315 GFP_ATOMIC | GFP_DMA);
1316 if (!priv_info->bouncebuffer) {
1317 ring->current_slot = old_top_slot;
1318 ring->used_slots = old_used_slots;
1319 err = -ENOMEM;
1320 goto out_unmap_hdr;
1323 meta->dmaaddr = map_descbuffer(ring, priv_info->bouncebuffer, skb->len, 1);
1324 if (b43_dma_mapping_error(ring, meta->dmaaddr, skb->len, 1)) {
1325 kfree(priv_info->bouncebuffer);
1326 priv_info->bouncebuffer = NULL;
1327 ring->current_slot = old_top_slot;
1328 ring->used_slots = old_used_slots;
1329 err = -EIO;
1330 goto out_unmap_hdr;
1334 ops->fill_descriptor(ring, desc, meta->dmaaddr, skb->len, 0, 1, 1);
1336 if (info->flags & IEEE80211_TX_CTL_SEND_AFTER_DTIM) {
1337 /* Tell the firmware about the cookie of the last
1338 * mcast frame, so it can clear the more-data bit in it. */
1339 b43_shm_write16(ring->dev, B43_SHM_SHARED,
1340 B43_SHM_SH_MCASTCOOKIE, cookie);
1342 /* Now transfer the whole frame. */
1343 wmb();
1344 ops->poke_tx(ring, next_slot(ring, slot));
1345 return 0;
1347 out_unmap_hdr:
1348 unmap_descbuffer(ring, meta_hdr->dmaaddr,
1349 hdrsize, 1);
1350 return err;
1353 static inline int should_inject_overflow(struct b43_dmaring *ring)
1355 #ifdef CONFIG_B43_DEBUG
1356 if (unlikely(b43_debug(ring->dev, B43_DBG_DMAOVERFLOW))) {
1357 /* Check if we should inject another ringbuffer overflow
1358 * to test handling of this situation in the stack. */
1359 unsigned long next_overflow;
1361 next_overflow = ring->last_injected_overflow + HZ;
1362 if (time_after(jiffies, next_overflow)) {
1363 ring->last_injected_overflow = jiffies;
1364 b43dbg(ring->dev->wl,
1365 "Injecting TX ring overflow on "
1366 "DMA controller %d\n", ring->index);
1367 return 1;
1370 #endif /* CONFIG_B43_DEBUG */
1371 return 0;
1374 /* Static mapping of mac80211's queues (priorities) to b43 DMA rings. */
1375 static struct b43_dmaring *select_ring_by_priority(struct b43_wldev *dev,
1376 u8 queue_prio)
1378 struct b43_dmaring *ring;
1380 if (dev->qos_enabled) {
1381 /* 0 = highest priority */
1382 switch (queue_prio) {
1383 default:
1384 B43_WARN_ON(1);
1385 /* fallthrough */
1386 case 0:
1387 ring = dev->dma.tx_ring_AC_VO;
1388 break;
1389 case 1:
1390 ring = dev->dma.tx_ring_AC_VI;
1391 break;
1392 case 2:
1393 ring = dev->dma.tx_ring_AC_BE;
1394 break;
1395 case 3:
1396 ring = dev->dma.tx_ring_AC_BK;
1397 break;
1399 } else
1400 ring = dev->dma.tx_ring_AC_BE;
1402 return ring;
1405 int b43_dma_tx(struct b43_wldev *dev, struct sk_buff *skb)
1407 struct b43_dmaring *ring;
1408 struct ieee80211_hdr *hdr;
1409 int err = 0;
1410 struct ieee80211_tx_info *info = IEEE80211_SKB_CB(skb);
1412 hdr = (struct ieee80211_hdr *)skb->data;
1413 if (info->flags & IEEE80211_TX_CTL_SEND_AFTER_DTIM) {
1414 /* The multicast ring will be sent after the DTIM */
1415 ring = dev->dma.tx_ring_mcast;
1416 /* Set the more-data bit. Ucode will clear it on
1417 * the last frame for us. */
1418 hdr->frame_control |= cpu_to_le16(IEEE80211_FCTL_MOREDATA);
1419 } else {
1420 /* Decide by priority where to put this frame. */
1421 ring = select_ring_by_priority(
1422 dev, skb_get_queue_mapping(skb));
1425 B43_WARN_ON(!ring->tx);
1427 if (unlikely(ring->stopped)) {
1428 /* We get here only because of a bug in mac80211.
1429 * Because of a race, one packet may be queued after
1430 * the queue is stopped, thus we got called when we shouldn't.
1431 * For now, just refuse the transmit. */
1432 if (b43_debug(dev, B43_DBG_DMAVERBOSE))
1433 b43err(dev->wl, "Packet after queue stopped\n");
1434 err = -ENOSPC;
1435 goto out;
1438 if (unlikely(WARN_ON(free_slots(ring) < TX_SLOTS_PER_FRAME))) {
1439 /* If we get here, we have a real error with the queue
1440 * full, but queues not stopped. */
1441 b43err(dev->wl, "DMA queue overflow\n");
1442 err = -ENOSPC;
1443 goto out;
1446 /* Assign the queue number to the ring (if not already done before)
1447 * so TX status handling can use it. The queue to ring mapping is
1448 * static, so we don't need to store it per frame. */
1449 ring->queue_prio = skb_get_queue_mapping(skb);
1451 err = dma_tx_fragment(ring, skb);
1452 if (unlikely(err == -ENOKEY)) {
1453 /* Drop this packet, as we don't have the encryption key
1454 * anymore and must not transmit it unencrypted. */
1455 ieee80211_free_txskb(dev->wl->hw, skb);
1456 err = 0;
1457 goto out;
1459 if (unlikely(err)) {
1460 b43err(dev->wl, "DMA tx mapping failure\n");
1461 goto out;
1463 if ((free_slots(ring) < TX_SLOTS_PER_FRAME) ||
1464 should_inject_overflow(ring)) {
1465 /* This TX ring is full. */
1466 unsigned int skb_mapping = skb_get_queue_mapping(skb);
1467 ieee80211_stop_queue(dev->wl->hw, skb_mapping);
1468 dev->wl->tx_queue_stopped[skb_mapping] = 1;
1469 ring->stopped = true;
1470 if (b43_debug(dev, B43_DBG_DMAVERBOSE)) {
1471 b43dbg(dev->wl, "Stopped TX ring %d\n", ring->index);
1474 out:
1476 return err;
1479 void b43_dma_handle_txstatus(struct b43_wldev *dev,
1480 const struct b43_txstatus *status)
1482 const struct b43_dma_ops *ops;
1483 struct b43_dmaring *ring;
1484 struct b43_dmadesc_meta *meta;
1485 static const struct b43_txstatus fake; /* filled with 0 */
1486 const struct b43_txstatus *txstat;
1487 int slot, firstused;
1488 bool frame_succeed;
1489 int skip;
1490 static u8 err_out1, err_out2;
1492 ring = parse_cookie(dev, status->cookie, &slot);
1493 if (unlikely(!ring))
1494 return;
1495 B43_WARN_ON(!ring->tx);
1497 /* Sanity check: TX packets are processed in-order on one ring.
1498 * Check if the slot deduced from the cookie really is the first
1499 * used slot. */
1500 firstused = ring->current_slot - ring->used_slots + 1;
1501 if (firstused < 0)
1502 firstused = ring->nr_slots + firstused;
1504 skip = 0;
1505 if (unlikely(slot != firstused)) {
1506 /* This possibly is a firmware bug and will result in
1507 * malfunction, memory leaks and/or stall of DMA functionality.
1509 if (slot == next_slot(ring, next_slot(ring, firstused))) {
1510 /* If a single header/data pair was missed, skip over
1511 * the first two slots in an attempt to recover.
1513 slot = firstused;
1514 skip = 2;
1515 if (!err_out1) {
1516 /* Report the error once. */
1517 b43dbg(dev->wl,
1518 "Skip on DMA ring %d slot %d.\n",
1519 ring->index, slot);
1520 err_out1 = 1;
1522 } else {
1523 /* More than a single header/data pair were missed.
1524 * Report this error once.
1526 if (!err_out2)
1527 b43dbg(dev->wl,
1528 "Out of order TX status report on DMA ring %d. Expected %d, but got %d\n",
1529 ring->index, firstused, slot);
1530 err_out2 = 1;
1531 return;
1535 ops = ring->ops;
1536 while (1) {
1537 B43_WARN_ON(slot < 0 || slot >= ring->nr_slots);
1538 /* get meta - ignore returned value */
1539 ops->idx2desc(ring, slot, &meta);
1541 if (b43_dma_ptr_is_poisoned(meta->skb)) {
1542 b43dbg(dev->wl, "Poisoned TX slot %d (first=%d) "
1543 "on ring %d\n",
1544 slot, firstused, ring->index);
1545 break;
1548 if (meta->skb) {
1549 struct b43_private_tx_info *priv_info =
1550 b43_get_priv_tx_info(IEEE80211_SKB_CB(meta->skb));
1552 unmap_descbuffer(ring, meta->dmaaddr,
1553 meta->skb->len, 1);
1554 kfree(priv_info->bouncebuffer);
1555 priv_info->bouncebuffer = NULL;
1556 } else {
1557 unmap_descbuffer(ring, meta->dmaaddr,
1558 b43_txhdr_size(dev), 1);
1561 if (meta->is_last_fragment) {
1562 struct ieee80211_tx_info *info;
1564 if (unlikely(!meta->skb)) {
1565 /* This is a scatter-gather fragment of a frame,
1566 * so the skb pointer must not be NULL.
1568 b43dbg(dev->wl, "TX status unexpected NULL skb "
1569 "at slot %d (first=%d) on ring %d\n",
1570 slot, firstused, ring->index);
1571 break;
1574 info = IEEE80211_SKB_CB(meta->skb);
1577 * Call back to inform the ieee80211 subsystem about
1578 * the status of the transmission. When skipping over
1579 * a missed TX status report, use a status structure
1580 * filled with zeros to indicate that the frame was not
1581 * sent (frame_count 0) and not acknowledged
1583 if (unlikely(skip))
1584 txstat = &fake;
1585 else
1586 txstat = status;
1588 frame_succeed = b43_fill_txstatus_report(dev, info,
1589 txstat);
1590 #ifdef CONFIG_B43_DEBUG
1591 if (frame_succeed)
1592 ring->nr_succeed_tx_packets++;
1593 else
1594 ring->nr_failed_tx_packets++;
1595 ring->nr_total_packet_tries += status->frame_count;
1596 #endif /* DEBUG */
1597 ieee80211_tx_status(dev->wl->hw, meta->skb);
1599 /* skb will be freed by ieee80211_tx_status().
1600 * Poison our pointer. */
1601 meta->skb = B43_DMA_PTR_POISON;
1602 } else {
1603 /* No need to call free_descriptor_buffer here, as
1604 * this is only the txhdr, which is not allocated.
1606 if (unlikely(meta->skb)) {
1607 b43dbg(dev->wl, "TX status unexpected non-NULL skb "
1608 "at slot %d (first=%d) on ring %d\n",
1609 slot, firstused, ring->index);
1610 break;
1614 /* Everything unmapped and free'd. So it's not used anymore. */
1615 ring->used_slots--;
1617 if (meta->is_last_fragment && !skip) {
1618 /* This is the last scatter-gather
1619 * fragment of the frame. We are done. */
1620 break;
1622 slot = next_slot(ring, slot);
1623 if (skip > 0)
1624 --skip;
1626 if (ring->stopped) {
1627 B43_WARN_ON(free_slots(ring) < TX_SLOTS_PER_FRAME);
1628 ring->stopped = false;
1631 if (dev->wl->tx_queue_stopped[ring->queue_prio]) {
1632 dev->wl->tx_queue_stopped[ring->queue_prio] = 0;
1633 } else {
1634 /* If the driver queue is running wake the corresponding
1635 * mac80211 queue. */
1636 ieee80211_wake_queue(dev->wl->hw, ring->queue_prio);
1637 if (b43_debug(dev, B43_DBG_DMAVERBOSE)) {
1638 b43dbg(dev->wl, "Woke up TX ring %d\n", ring->index);
1641 /* Add work to the queue. */
1642 ieee80211_queue_work(dev->wl->hw, &dev->wl->tx_work);
1645 static void dma_rx(struct b43_dmaring *ring, int *slot)
1647 const struct b43_dma_ops *ops = ring->ops;
1648 struct b43_dmadesc_generic *desc;
1649 struct b43_dmadesc_meta *meta;
1650 struct b43_rxhdr_fw4 *rxhdr;
1651 struct sk_buff *skb;
1652 u16 len;
1653 int err;
1654 dma_addr_t dmaaddr;
1656 desc = ops->idx2desc(ring, *slot, &meta);
1658 sync_descbuffer_for_cpu(ring, meta->dmaaddr, ring->rx_buffersize);
1659 skb = meta->skb;
1661 rxhdr = (struct b43_rxhdr_fw4 *)skb->data;
1662 len = le16_to_cpu(rxhdr->frame_len);
1663 if (len == 0) {
1664 int i = 0;
1666 do {
1667 udelay(2);
1668 barrier();
1669 len = le16_to_cpu(rxhdr->frame_len);
1670 } while (len == 0 && i++ < 5);
1671 if (unlikely(len == 0)) {
1672 dmaaddr = meta->dmaaddr;
1673 goto drop_recycle_buffer;
1676 if (unlikely(b43_rx_buffer_is_poisoned(ring, skb))) {
1677 /* Something went wrong with the DMA.
1678 * The device did not touch the buffer and did not overwrite the poison. */
1679 b43dbg(ring->dev->wl, "DMA RX: Dropping poisoned buffer.\n");
1680 dmaaddr = meta->dmaaddr;
1681 goto drop_recycle_buffer;
1683 if (unlikely(len + ring->frameoffset > ring->rx_buffersize)) {
1684 /* The data did not fit into one descriptor buffer
1685 * and is split over multiple buffers.
1686 * This should never happen, as we try to allocate buffers
1687 * big enough. So simply ignore this packet.
1689 int cnt = 0;
1690 s32 tmp = len;
1692 while (1) {
1693 desc = ops->idx2desc(ring, *slot, &meta);
1694 /* recycle the descriptor buffer. */
1695 b43_poison_rx_buffer(ring, meta->skb);
1696 sync_descbuffer_for_device(ring, meta->dmaaddr,
1697 ring->rx_buffersize);
1698 *slot = next_slot(ring, *slot);
1699 cnt++;
1700 tmp -= ring->rx_buffersize;
1701 if (tmp <= 0)
1702 break;
1704 b43err(ring->dev->wl, "DMA RX buffer too small "
1705 "(len: %u, buffer: %u, nr-dropped: %d)\n",
1706 len, ring->rx_buffersize, cnt);
1707 goto drop;
1710 dmaaddr = meta->dmaaddr;
1711 err = setup_rx_descbuffer(ring, desc, meta, GFP_ATOMIC);
1712 if (unlikely(err)) {
1713 b43dbg(ring->dev->wl, "DMA RX: setup_rx_descbuffer() failed\n");
1714 goto drop_recycle_buffer;
1717 unmap_descbuffer(ring, dmaaddr, ring->rx_buffersize, 0);
1718 skb_put(skb, len + ring->frameoffset);
1719 skb_pull(skb, ring->frameoffset);
1721 b43_rx(ring->dev, skb, rxhdr);
1722 drop:
1723 return;
1725 drop_recycle_buffer:
1726 /* Poison and recycle the RX buffer. */
1727 b43_poison_rx_buffer(ring, skb);
1728 sync_descbuffer_for_device(ring, dmaaddr, ring->rx_buffersize);
1731 void b43_dma_handle_rx_overflow(struct b43_dmaring *ring)
1733 int current_slot, previous_slot;
1735 B43_WARN_ON(ring->tx);
1737 /* Device has filled all buffers, drop all packets and let TCP
1738 * decrease speed.
1739 * Decrement RX index by one will let the device to see all slots
1740 * as free again
1743 *TODO: How to increase rx_drop in mac80211?
1745 current_slot = ring->ops->get_current_rxslot(ring);
1746 previous_slot = prev_slot(ring, current_slot);
1747 ring->ops->set_current_rxslot(ring, previous_slot);
1750 void b43_dma_rx(struct b43_dmaring *ring)
1752 const struct b43_dma_ops *ops = ring->ops;
1753 int slot, current_slot;
1754 int used_slots = 0;
1756 B43_WARN_ON(ring->tx);
1757 current_slot = ops->get_current_rxslot(ring);
1758 B43_WARN_ON(!(current_slot >= 0 && current_slot < ring->nr_slots));
1760 slot = ring->current_slot;
1761 for (; slot != current_slot; slot = next_slot(ring, slot)) {
1762 dma_rx(ring, &slot);
1763 update_max_used_slots(ring, ++used_slots);
1765 wmb();
1766 ops->set_current_rxslot(ring, slot);
1767 ring->current_slot = slot;
1770 static void b43_dma_tx_suspend_ring(struct b43_dmaring *ring)
1772 B43_WARN_ON(!ring->tx);
1773 ring->ops->tx_suspend(ring);
1776 static void b43_dma_tx_resume_ring(struct b43_dmaring *ring)
1778 B43_WARN_ON(!ring->tx);
1779 ring->ops->tx_resume(ring);
1782 void b43_dma_tx_suspend(struct b43_wldev *dev)
1784 b43_power_saving_ctl_bits(dev, B43_PS_AWAKE);
1785 b43_dma_tx_suspend_ring(dev->dma.tx_ring_AC_BK);
1786 b43_dma_tx_suspend_ring(dev->dma.tx_ring_AC_BE);
1787 b43_dma_tx_suspend_ring(dev->dma.tx_ring_AC_VI);
1788 b43_dma_tx_suspend_ring(dev->dma.tx_ring_AC_VO);
1789 b43_dma_tx_suspend_ring(dev->dma.tx_ring_mcast);
1792 void b43_dma_tx_resume(struct b43_wldev *dev)
1794 b43_dma_tx_resume_ring(dev->dma.tx_ring_mcast);
1795 b43_dma_tx_resume_ring(dev->dma.tx_ring_AC_VO);
1796 b43_dma_tx_resume_ring(dev->dma.tx_ring_AC_VI);
1797 b43_dma_tx_resume_ring(dev->dma.tx_ring_AC_BE);
1798 b43_dma_tx_resume_ring(dev->dma.tx_ring_AC_BK);
1799 b43_power_saving_ctl_bits(dev, 0);
1802 static void direct_fifo_rx(struct b43_wldev *dev, enum b43_dmatype type,
1803 u16 mmio_base, bool enable)
1805 u32 ctl;
1807 if (type == B43_DMA_64BIT) {
1808 ctl = b43_read32(dev, mmio_base + B43_DMA64_RXCTL);
1809 ctl &= ~B43_DMA64_RXDIRECTFIFO;
1810 if (enable)
1811 ctl |= B43_DMA64_RXDIRECTFIFO;
1812 b43_write32(dev, mmio_base + B43_DMA64_RXCTL, ctl);
1813 } else {
1814 ctl = b43_read32(dev, mmio_base + B43_DMA32_RXCTL);
1815 ctl &= ~B43_DMA32_RXDIRECTFIFO;
1816 if (enable)
1817 ctl |= B43_DMA32_RXDIRECTFIFO;
1818 b43_write32(dev, mmio_base + B43_DMA32_RXCTL, ctl);
1822 /* Enable/Disable Direct FIFO Receive Mode (PIO) on a RX engine.
1823 * This is called from PIO code, so DMA structures are not available. */
1824 void b43_dma_direct_fifo_rx(struct b43_wldev *dev,
1825 unsigned int engine_index, bool enable)
1827 enum b43_dmatype type;
1828 u16 mmio_base;
1830 type = dma_mask_to_engine_type(supported_dma_mask(dev));
1832 mmio_base = b43_dmacontroller_base(type, engine_index);
1833 direct_fifo_rx(dev, type, mmio_base, enable);