/*
 * Linux driver for VMware's vmxnet3 ethernet NIC.
 *
 * Copyright (C) 2008-2009, VMware, Inc. All Rights Reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License as published by the
 * Free Software Foundation; version 2 of the License and no later version.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE, GOOD TITLE or
 * NON INFRINGEMENT. See the GNU General Public License for more
 * details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * The full GNU General Public License is included in this distribution in
 * the file called "COPYING".
 *
 * Maintained by: Shreyas Bhatewara <pv-drivers@vmware.com>
 *
 */
#include <linux/module.h>
#include <net/ip6_checksum.h>

#include "vmxnet3_int.h"

char vmxnet3_driver_name[] = "vmxnet3";
#define VMXNET3_DRIVER_DESC "VMware vmxnet3 virtual NIC driver"

/*
 * Last entry must be all 0s
 */
static const struct pci_device_id vmxnet3_pciid_table[] = {
	{PCI_VDEVICE(VMWARE, PCI_DEVICE_ID_VMWARE_VMXNET3)},
	{0}
};

MODULE_DEVICE_TABLE(pci, vmxnet3_pciid_table);

static int enable_mq = 1;
static void
vmxnet3_write_mac_addr(struct vmxnet3_adapter *adapter, u8 *mac);

/*
 *    Enable/Disable the given intr
 */
static void
vmxnet3_enable_intr(struct vmxnet3_adapter *adapter, unsigned intr_idx)
{
	VMXNET3_WRITE_BAR0_REG(adapter, VMXNET3_REG_IMR + intr_idx * 8, 0);
}


static void
vmxnet3_disable_intr(struct vmxnet3_adapter *adapter, unsigned intr_idx)
{
	VMXNET3_WRITE_BAR0_REG(adapter, VMXNET3_REG_IMR + intr_idx * 8, 1);
}
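/* Note: each interrupt vector appears to have its own IMR slot spaced 8 bytes
 * apart in BAR0 (hence the "intr_idx * 8" above); writing 0 unmasks the
 * vector and writing 1 masks it. This reading of the register layout is
 * inferred from the two helpers above rather than stated in this file.
 */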
/*
 *    Enable/Disable all intrs used by the device
 */
static void
vmxnet3_enable_all_intrs(struct vmxnet3_adapter *adapter)
{
	int i;

	for (i = 0; i < adapter->intr.num_intrs; i++)
		vmxnet3_enable_intr(adapter, i);
	adapter->shared->devRead.intrConf.intrCtrl &=
				cpu_to_le32(~VMXNET3_IC_DISABLE_ALL);
}


static void
vmxnet3_disable_all_intrs(struct vmxnet3_adapter *adapter)
{
	int i;

	adapter->shared->devRead.intrConf.intrCtrl |=
				cpu_to_le32(VMXNET3_IC_DISABLE_ALL);
	for (i = 0; i < adapter->intr.num_intrs; i++)
		vmxnet3_disable_intr(adapter, i);
}
static void
vmxnet3_ack_events(struct vmxnet3_adapter *adapter, u32 events)
{
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_ECR, events);
}


static bool
vmxnet3_tq_stopped(struct vmxnet3_tx_queue *tq, struct vmxnet3_adapter *adapter)
{
	return tq->stopped;
}


static void
vmxnet3_tq_start(struct vmxnet3_tx_queue *tq, struct vmxnet3_adapter *adapter)
{
	tq->stopped = false;
	netif_start_subqueue(adapter->netdev, tq - adapter->tx_queue);
}


static void
vmxnet3_tq_wake(struct vmxnet3_tx_queue *tq, struct vmxnet3_adapter *adapter)
{
	tq->stopped = false;
	netif_wake_subqueue(adapter->netdev, (tq - adapter->tx_queue));
}


static void
vmxnet3_tq_stop(struct vmxnet3_tx_queue *tq, struct vmxnet3_adapter *adapter)
{
	tq->stopped = true;
	netif_stop_subqueue(adapter->netdev, (tq - adapter->tx_queue));
}
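/* The expression "tq - adapter->tx_queue" above is plain pointer arithmetic:
 * tx_queue is an array embedded in the adapter, so the difference is the
 * queue's index, which doubles as the netdev subqueue number.
 */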
/*
 * Check the link state. This may start or stop the tx queue.
 */
static void
vmxnet3_check_link(struct vmxnet3_adapter *adapter, bool affectTxQueue)
{
	u32 ret;
	int i;
	unsigned long flags;

	spin_lock_irqsave(&adapter->cmd_lock, flags);
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD, VMXNET3_CMD_GET_LINK);
	ret = VMXNET3_READ_BAR1_REG(adapter, VMXNET3_REG_CMD);
	spin_unlock_irqrestore(&adapter->cmd_lock, flags);

	adapter->link_speed = ret >> 16;
	if (ret & 1) { /* Link is up. */
		netdev_info(adapter->netdev, "NIC Link is Up %d Mbps\n",
			    adapter->link_speed);
		netif_carrier_on(adapter->netdev);

		if (affectTxQueue) {
			for (i = 0; i < adapter->num_tx_queues; i++)
				vmxnet3_tq_start(&adapter->tx_queue[i],
						 adapter);
		}
	} else {
		netdev_info(adapter->netdev, "NIC Link is Down\n");
		netif_carrier_off(adapter->netdev);

		if (affectTxQueue) {
			for (i = 0; i < adapter->num_tx_queues; i++)
				vmxnet3_tq_stop(&adapter->tx_queue[i], adapter);
		}
	}
}
static void
vmxnet3_process_events(struct vmxnet3_adapter *adapter)
{
	int i;
	unsigned long flags;
	u32 events = le32_to_cpu(adapter->shared->ecr);

	if (!events)
		return;

	vmxnet3_ack_events(adapter, events);

	/* Check if link state has changed */
	if (events & VMXNET3_ECR_LINK)
		vmxnet3_check_link(adapter, true);

	/* Check if there is an error on xmit/recv queues */
	if (events & (VMXNET3_ECR_TQERR | VMXNET3_ECR_RQERR)) {
		spin_lock_irqsave(&adapter->cmd_lock, flags);
		VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD,
				       VMXNET3_CMD_GET_QUEUE_STATUS);
		spin_unlock_irqrestore(&adapter->cmd_lock, flags);

		for (i = 0; i < adapter->num_tx_queues; i++)
			if (adapter->tqd_start[i].status.stopped)
				dev_err(&adapter->netdev->dev,
					"%s: tq[%d] error 0x%x\n",
					adapter->netdev->name, i, le32_to_cpu(
					adapter->tqd_start[i].status.error));
		for (i = 0; i < adapter->num_rx_queues; i++)
			if (adapter->rqd_start[i].status.stopped)
				dev_err(&adapter->netdev->dev,
					"%s: rq[%d] error 0x%x\n",
					adapter->netdev->name, i,
					adapter->rqd_start[i].status.error);

		schedule_work(&adapter->work);
	}
}
#ifdef __BIG_ENDIAN_BITFIELD
/*
 * The device expects the bitfields in shared structures to be written in
 * little endian. When CPU is big endian, the following routines are used to
 * correctly read and write into ABI.
 * The general technique used here is : double word bitfields are defined in
 * opposite order for big endian architecture. Then before reading them in
 * driver the complete double word is translated using le32_to_cpu. Similarly
 * After the driver writes into bitfields, cpu_to_le32 is used to translate the
 * double words into required format.
 * In order to avoid touching bits in shared structure more than once, temporary
 * descriptors are used. These are passed as srcDesc to following functions.
 */
static void vmxnet3_RxDescToCPU(const struct Vmxnet3_RxDesc *srcDesc,
				struct Vmxnet3_RxDesc *dstDesc)
{
	u32 *src = (u32 *)srcDesc + 2;
	u32 *dst = (u32 *)dstDesc + 2;
	dstDesc->addr = le64_to_cpu(srcDesc->addr);
	*dst = le32_to_cpu(*src);
	dstDesc->ext1 = le32_to_cpu(srcDesc->ext1);
}

static void vmxnet3_TxDescToLe(const struct Vmxnet3_TxDesc *srcDesc,
			       struct Vmxnet3_TxDesc *dstDesc)
{
	int i;
	u32 *src = (u32 *)(srcDesc + 1);
	u32 *dst = (u32 *)(dstDesc + 1);

	/* Working backwards so that the gen bit is set at the end. */
	for (i = 2; i > 0; i--) {
		src--;
		dst--;
		*dst = cpu_to_le32(*src);
	}
}


static void vmxnet3_RxCompToCPU(const struct Vmxnet3_RxCompDesc *srcDesc,
				struct Vmxnet3_RxCompDesc *dstDesc)
{
	int i;
	u32 *src = (u32 *)srcDesc;
	u32 *dst = (u32 *)dstDesc;
	for (i = 0; i < sizeof(struct Vmxnet3_RxCompDesc) / sizeof(u32); i++) {
		*dst = le32_to_cpu(*src);
		src++;
		dst++;
	}
}


/* Used to read bitfield values from double words. */
static u32 get_bitfield32(const __le32 *bitfield, u32 pos, u32 size)
{
	u32 temp = le32_to_cpu(*bitfield);
	u32 mask = ((1 << size) - 1) << pos;
	temp &= mask;
	temp >>= pos;
	return temp;
}


#endif  /* __BIG_ENDIAN_BITFIELD */
#ifdef __BIG_ENDIAN_BITFIELD

#   define VMXNET3_TXDESC_GET_GEN(txdesc) get_bitfield32(((const __le32 *) \
			txdesc) + VMXNET3_TXD_GEN_DWORD_SHIFT, \
			VMXNET3_TXD_GEN_SHIFT, VMXNET3_TXD_GEN_SIZE)
#   define VMXNET3_TXDESC_GET_EOP(txdesc) get_bitfield32(((const __le32 *) \
			txdesc) + VMXNET3_TXD_EOP_DWORD_SHIFT, \
			VMXNET3_TXD_EOP_SHIFT, VMXNET3_TXD_EOP_SIZE)
#   define VMXNET3_TCD_GET_GEN(tcd) get_bitfield32(((const __le32 *)tcd) + \
			VMXNET3_TCD_GEN_DWORD_SHIFT, VMXNET3_TCD_GEN_SHIFT, \
			VMXNET3_TCD_GEN_SIZE)
#   define VMXNET3_TCD_GET_TXIDX(tcd) get_bitfield32((const __le32 *)tcd, \
			VMXNET3_TCD_TXIDX_SHIFT, VMXNET3_TCD_TXIDX_SIZE)
#   define vmxnet3_getRxComp(dstrcd, rcd, tmp) do { \
			(dstrcd) = (tmp); \
			vmxnet3_RxCompToCPU((rcd), (tmp)); \
		} while (0)
#   define vmxnet3_getRxDesc(dstrxd, rxd, tmp) do { \
			(dstrxd) = (tmp); \
			vmxnet3_RxDescToCPU((rxd), (tmp)); \
		} while (0)

#else

#   define VMXNET3_TXDESC_GET_GEN(txdesc) ((txdesc)->gen)
#   define VMXNET3_TXDESC_GET_EOP(txdesc) ((txdesc)->eop)
#   define VMXNET3_TCD_GET_GEN(tcd) ((tcd)->gen)
#   define VMXNET3_TCD_GET_TXIDX(tcd) ((tcd)->txdIdx)
#   define vmxnet3_getRxComp(dstrcd, rcd, tmp) (dstrcd) = (rcd)
#   define vmxnet3_getRxDesc(dstrxd, rxd, tmp) (dstrxd) = (rxd)

#endif /* __BIG_ENDIAN_BITFIELD  */
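/* Summary of the two builds above: on little-endian hosts the accessor macros
 * read and write descriptor bitfields in place, while on big-endian hosts
 * vmxnet3_getRxComp()/vmxnet3_getRxDesc() first copy the descriptor into a
 * temporary and byte-swap it, so callers always see host-order values.
 */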
static void
vmxnet3_unmap_tx_buf(struct vmxnet3_tx_buf_info *tbi,
		     struct pci_dev *pdev)
{
	if (tbi->map_type == VMXNET3_MAP_SINGLE)
		dma_unmap_single(&pdev->dev, tbi->dma_addr, tbi->len,
				 PCI_DMA_TODEVICE);
	else if (tbi->map_type == VMXNET3_MAP_PAGE)
		dma_unmap_page(&pdev->dev, tbi->dma_addr, tbi->len,
			       PCI_DMA_TODEVICE);
	else
		BUG_ON(tbi->map_type != VMXNET3_MAP_NONE);

	tbi->map_type = VMXNET3_MAP_NONE; /* to help debugging */
}
static int
vmxnet3_unmap_pkt(u32 eop_idx, struct vmxnet3_tx_queue *tq,
		  struct pci_dev *pdev, struct vmxnet3_adapter *adapter)
{
	struct sk_buff *skb;
	int entries = 0;

	/* no out of order completion */
	BUG_ON(tq->buf_info[eop_idx].sop_idx != tq->tx_ring.next2comp);
	BUG_ON(VMXNET3_TXDESC_GET_EOP(&(tq->tx_ring.base[eop_idx].txd)) != 1);

	skb = tq->buf_info[eop_idx].skb;
	BUG_ON(skb == NULL);
	tq->buf_info[eop_idx].skb = NULL;

	VMXNET3_INC_RING_IDX_ONLY(eop_idx, tq->tx_ring.size);

	while (tq->tx_ring.next2comp != eop_idx) {
		vmxnet3_unmap_tx_buf(tq->buf_info + tq->tx_ring.next2comp,
				     pdev);

		/* update next2comp w/o tx_lock. Since we are marking more,
		 * instead of less, tx ring entries avail, the worst case is
		 * that the tx routine incorrectly re-queues a pkt due to
		 * insufficient tx ring entries.
		 */
		vmxnet3_cmd_ring_adv_next2comp(&tq->tx_ring);
		entries++;
	}

	dev_kfree_skb_any(skb);
	return entries;
}
static int
vmxnet3_tq_tx_complete(struct vmxnet3_tx_queue *tq,
		       struct vmxnet3_adapter *adapter)
{
	int completed = 0;
	union Vmxnet3_GenericDesc *gdesc;

	gdesc = tq->comp_ring.base + tq->comp_ring.next2proc;
	while (VMXNET3_TCD_GET_GEN(&gdesc->tcd) == tq->comp_ring.gen) {
		completed += vmxnet3_unmap_pkt(VMXNET3_TCD_GET_TXIDX(
					       &gdesc->tcd), tq, adapter->pdev,
					       adapter);

		vmxnet3_comp_ring_adv_next2proc(&tq->comp_ring);
		gdesc = tq->comp_ring.base + tq->comp_ring.next2proc;
	}

	if (completed) {
		spin_lock(&tq->tx_lock);
		if (unlikely(vmxnet3_tq_stopped(tq, adapter) &&
			     vmxnet3_cmd_ring_desc_avail(&tq->tx_ring) >
			     VMXNET3_WAKE_QUEUE_THRESHOLD(tq) &&
			     netif_carrier_ok(adapter->netdev))) {
			vmxnet3_tq_wake(tq, adapter);
		}
		spin_unlock(&tq->tx_lock);
	}
	return completed;
}
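/* Ownership of a completion descriptor is signalled by its gen bit: the
 * loop above consumes entries only while VMXNET3_TCD_GET_GEN() matches
 * comp_ring.gen, and the gen value flips each time the ring wraps, so a
 * stale descriptor from the previous pass is never mistaken for a new one.
 */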
static void
vmxnet3_tq_cleanup(struct vmxnet3_tx_queue *tq,
		   struct vmxnet3_adapter *adapter)
{
	int i;

	while (tq->tx_ring.next2comp != tq->tx_ring.next2fill) {
		struct vmxnet3_tx_buf_info *tbi;

		tbi = tq->buf_info + tq->tx_ring.next2comp;

		vmxnet3_unmap_tx_buf(tbi, adapter->pdev);
		if (tbi->skb) {
			dev_kfree_skb_any(tbi->skb);
			tbi->skb = NULL;
		}
		vmxnet3_cmd_ring_adv_next2comp(&tq->tx_ring);
	}

	/* sanity check, verify all buffers are indeed unmapped and freed */
	for (i = 0; i < tq->tx_ring.size; i++) {
		BUG_ON(tq->buf_info[i].skb != NULL ||
		       tq->buf_info[i].map_type != VMXNET3_MAP_NONE);
	}

	tq->tx_ring.gen = VMXNET3_INIT_GEN;
	tq->tx_ring.next2fill = tq->tx_ring.next2comp = 0;

	tq->comp_ring.gen = VMXNET3_INIT_GEN;
	tq->comp_ring.next2proc = 0;
}
static void
vmxnet3_tq_destroy(struct vmxnet3_tx_queue *tq,
		   struct vmxnet3_adapter *adapter)
{
	if (tq->tx_ring.base) {
		dma_free_coherent(&adapter->pdev->dev, tq->tx_ring.size *
				  sizeof(struct Vmxnet3_TxDesc),
				  tq->tx_ring.base, tq->tx_ring.basePA);
		tq->tx_ring.base = NULL;
	}
	if (tq->data_ring.base) {
		dma_free_coherent(&adapter->pdev->dev, tq->data_ring.size *
				  sizeof(struct Vmxnet3_TxDataDesc),
				  tq->data_ring.base, tq->data_ring.basePA);
		tq->data_ring.base = NULL;
	}
	if (tq->comp_ring.base) {
		dma_free_coherent(&adapter->pdev->dev, tq->comp_ring.size *
				  sizeof(struct Vmxnet3_TxCompDesc),
				  tq->comp_ring.base, tq->comp_ring.basePA);
		tq->comp_ring.base = NULL;
	}
	if (tq->buf_info) {
		dma_free_coherent(&adapter->pdev->dev,
				  tq->tx_ring.size * sizeof(tq->buf_info[0]),
				  tq->buf_info, tq->buf_info_pa);
		tq->buf_info = NULL;
	}
}
/* Destroy all tx queues */
static void
vmxnet3_tq_destroy_all(struct vmxnet3_adapter *adapter)
{
	int i;

	for (i = 0; i < adapter->num_tx_queues; i++)
		vmxnet3_tq_destroy(&adapter->tx_queue[i], adapter);
}
static void
vmxnet3_tq_init(struct vmxnet3_tx_queue *tq,
		struct vmxnet3_adapter *adapter)
{
	int i;

	/* reset the tx ring contents to 0 and reset the tx ring states */
	memset(tq->tx_ring.base, 0, tq->tx_ring.size *
	       sizeof(struct Vmxnet3_TxDesc));
	tq->tx_ring.next2fill = tq->tx_ring.next2comp = 0;
	tq->tx_ring.gen = VMXNET3_INIT_GEN;

	memset(tq->data_ring.base, 0, tq->data_ring.size *
	       sizeof(struct Vmxnet3_TxDataDesc));

	/* reset the tx comp ring contents to 0 and reset comp ring states */
	memset(tq->comp_ring.base, 0, tq->comp_ring.size *
	       sizeof(struct Vmxnet3_TxCompDesc));
	tq->comp_ring.next2proc = 0;
	tq->comp_ring.gen = VMXNET3_INIT_GEN;

	/* reset the bookkeeping data */
	memset(tq->buf_info, 0, sizeof(tq->buf_info[0]) * tq->tx_ring.size);
	for (i = 0; i < tq->tx_ring.size; i++)
		tq->buf_info[i].map_type = VMXNET3_MAP_NONE;

	/* stats are not reset */
}
static int
vmxnet3_tq_create(struct vmxnet3_tx_queue *tq,
		  struct vmxnet3_adapter *adapter)
{
	size_t sz;

	BUG_ON(tq->tx_ring.base || tq->data_ring.base ||
	       tq->comp_ring.base || tq->buf_info);

	tq->tx_ring.base = dma_alloc_coherent(&adapter->pdev->dev,
			tq->tx_ring.size * sizeof(struct Vmxnet3_TxDesc),
			&tq->tx_ring.basePA, GFP_KERNEL);
	if (!tq->tx_ring.base) {
		netdev_err(adapter->netdev, "failed to allocate tx ring\n");
		goto err;
	}

	tq->data_ring.base = dma_alloc_coherent(&adapter->pdev->dev,
			tq->data_ring.size * sizeof(struct Vmxnet3_TxDataDesc),
			&tq->data_ring.basePA, GFP_KERNEL);
	if (!tq->data_ring.base) {
		netdev_err(adapter->netdev, "failed to allocate data ring\n");
		goto err;
	}

	tq->comp_ring.base = dma_alloc_coherent(&adapter->pdev->dev,
			tq->comp_ring.size * sizeof(struct Vmxnet3_TxCompDesc),
			&tq->comp_ring.basePA, GFP_KERNEL);
	if (!tq->comp_ring.base) {
		netdev_err(adapter->netdev, "failed to allocate tx comp ring\n");
		goto err;
	}

	sz = tq->tx_ring.size * sizeof(tq->buf_info[0]);
	tq->buf_info = dma_zalloc_coherent(&adapter->pdev->dev, sz,
					   &tq->buf_info_pa, GFP_KERNEL);
	if (!tq->buf_info)
		goto err;

	return 0;

err:
	vmxnet3_tq_destroy(tq, adapter);
	return -ENOMEM;
}
static void
vmxnet3_tq_cleanup_all(struct vmxnet3_adapter *adapter)
{
	int i;

	for (i = 0; i < adapter->num_tx_queues; i++)
		vmxnet3_tq_cleanup(&adapter->tx_queue[i], adapter);
}
/*
 *    starting from ring->next2fill, allocate rx buffers for the given ring
 *    of the rx queue and update the rx desc. stop after @num_to_alloc buffers
 *    are allocated or allocation fails
 */

static int
vmxnet3_rq_alloc_rx_buf(struct vmxnet3_rx_queue *rq, u32 ring_idx,
			int num_to_alloc, struct vmxnet3_adapter *adapter)
{
	int num_allocated = 0;
	struct vmxnet3_rx_buf_info *rbi_base = rq->buf_info[ring_idx];
	struct vmxnet3_cmd_ring *ring = &rq->rx_ring[ring_idx];
	u32 val;

	while (num_allocated <= num_to_alloc) {
		struct vmxnet3_rx_buf_info *rbi;
		union Vmxnet3_GenericDesc *gd;

		rbi = rbi_base + ring->next2fill;
		gd = ring->base + ring->next2fill;

		if (rbi->buf_type == VMXNET3_RX_BUF_SKB) {
			if (rbi->skb == NULL) {
				rbi->skb = __netdev_alloc_skb_ip_align(adapter->netdev,
								       rbi->len,
								       GFP_KERNEL);
				if (unlikely(rbi->skb == NULL)) {
					rq->stats.rx_buf_alloc_failure++;
					break;
				}

				rbi->dma_addr = dma_map_single(
						&adapter->pdev->dev,
						rbi->skb->data, rbi->len,
						PCI_DMA_FROMDEVICE);
				if (dma_mapping_error(&adapter->pdev->dev,
						      rbi->dma_addr)) {
					dev_kfree_skb_any(rbi->skb);
					rq->stats.rx_buf_alloc_failure++;
					break;
				}
			} else {
				/* rx buffer skipped by the device */
			}
			val = VMXNET3_RXD_BTYPE_HEAD << VMXNET3_RXD_BTYPE_SHIFT;
		} else {
			BUG_ON(rbi->buf_type != VMXNET3_RX_BUF_PAGE ||
			       rbi->len != PAGE_SIZE);

			if (rbi->page == NULL) {
				rbi->page = alloc_page(GFP_ATOMIC);
				if (unlikely(rbi->page == NULL)) {
					rq->stats.rx_buf_alloc_failure++;
					break;
				}
				rbi->dma_addr = dma_map_page(
						&adapter->pdev->dev,
						rbi->page, 0, PAGE_SIZE,
						PCI_DMA_FROMDEVICE);
				if (dma_mapping_error(&adapter->pdev->dev,
						      rbi->dma_addr)) {
					rq->stats.rx_buf_alloc_failure++;
					break;
				}
			} else {
				/* rx buffers skipped by the device */
			}
			val = VMXNET3_RXD_BTYPE_BODY << VMXNET3_RXD_BTYPE_SHIFT;
		}

		gd->rxd.addr = cpu_to_le64(rbi->dma_addr);
		gd->dword[2] = cpu_to_le32((!ring->gen << VMXNET3_RXD_GEN_SHIFT)
					   | val | rbi->len);

		/* Fill the last buffer but dont mark it ready, or else the
		 * device will think that the queue is full */
		if (num_allocated == num_to_alloc)
			break;

		gd->dword[2] |= cpu_to_le32(ring->gen << VMXNET3_RXD_GEN_SHIFT);
		num_allocated++;
		vmxnet3_cmd_ring_adv_next2fill(ring);
	}

	netdev_dbg(adapter->netdev,
		   "alloc_rx_buf: %d allocated, next2fill %u, next2comp %u\n",
		   num_allocated, ring->next2fill, ring->next2comp);

	/* so that the device can distinguish a full ring and an empty ring */
	BUG_ON(num_allocated != 0 && ring->next2fill == ring->next2comp);

	return num_allocated;
}
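/* The gen bit is deliberately the last thing handed to the device in the
 * loop above: dword[2] is first written with the *inverted* gen value and
 * only OR-ed with the current gen once the buffer is fully set up, so the
 * device never sees a half-initialized rx descriptor as ready.
 */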
static void
vmxnet3_append_frag(struct sk_buff *skb, struct Vmxnet3_RxCompDesc *rcd,
		    struct vmxnet3_rx_buf_info *rbi)
{
	struct skb_frag_struct *frag = skb_shinfo(skb)->frags +
		skb_shinfo(skb)->nr_frags;

	BUG_ON(skb_shinfo(skb)->nr_frags >= MAX_SKB_FRAGS);

	__skb_frag_set_page(frag, rbi->page);
	frag->page_offset = 0;
	skb_frag_size_set(frag, rcd->len);
	skb->data_len += rcd->len;
	skb->truesize += PAGE_SIZE;
	skb_shinfo(skb)->nr_frags++;
}
670 vmxnet3_map_pkt(struct sk_buff
*skb
, struct vmxnet3_tx_ctx
*ctx
,
671 struct vmxnet3_tx_queue
*tq
, struct pci_dev
*pdev
,
672 struct vmxnet3_adapter
*adapter
)
675 unsigned long buf_offset
;
677 union Vmxnet3_GenericDesc
*gdesc
;
678 struct vmxnet3_tx_buf_info
*tbi
= NULL
;
680 BUG_ON(ctx
->copy_size
> skb_headlen(skb
));
682 /* use the previous gen bit for the SOP desc */
683 dw2
= (tq
->tx_ring
.gen
^ 0x1) << VMXNET3_TXD_GEN_SHIFT
;
685 ctx
->sop_txd
= tq
->tx_ring
.base
+ tq
->tx_ring
.next2fill
;
686 gdesc
= ctx
->sop_txd
; /* both loops below can be skipped */
688 /* no need to map the buffer if headers are copied */
689 if (ctx
->copy_size
) {
690 ctx
->sop_txd
->txd
.addr
= cpu_to_le64(tq
->data_ring
.basePA
+
691 tq
->tx_ring
.next2fill
*
692 sizeof(struct Vmxnet3_TxDataDesc
));
693 ctx
->sop_txd
->dword
[2] = cpu_to_le32(dw2
| ctx
->copy_size
);
694 ctx
->sop_txd
->dword
[3] = 0;
696 tbi
= tq
->buf_info
+ tq
->tx_ring
.next2fill
;
697 tbi
->map_type
= VMXNET3_MAP_NONE
;
699 netdev_dbg(adapter
->netdev
,
700 "txd[%u]: 0x%Lx 0x%x 0x%x\n",
701 tq
->tx_ring
.next2fill
,
702 le64_to_cpu(ctx
->sop_txd
->txd
.addr
),
703 ctx
->sop_txd
->dword
[2], ctx
->sop_txd
->dword
[3]);
704 vmxnet3_cmd_ring_adv_next2fill(&tq
->tx_ring
);
706 /* use the right gen for non-SOP desc */
707 dw2
= tq
->tx_ring
.gen
<< VMXNET3_TXD_GEN_SHIFT
;
710 /* linear part can use multiple tx desc if it's big */
711 len
= skb_headlen(skb
) - ctx
->copy_size
;
712 buf_offset
= ctx
->copy_size
;
716 if (len
< VMXNET3_MAX_TX_BUF_SIZE
) {
720 buf_size
= VMXNET3_MAX_TX_BUF_SIZE
;
721 /* spec says that for TxDesc.len, 0 == 2^14 */
724 tbi
= tq
->buf_info
+ tq
->tx_ring
.next2fill
;
725 tbi
->map_type
= VMXNET3_MAP_SINGLE
;
726 tbi
->dma_addr
= dma_map_single(&adapter
->pdev
->dev
,
727 skb
->data
+ buf_offset
, buf_size
,
729 if (dma_mapping_error(&adapter
->pdev
->dev
, tbi
->dma_addr
))
734 gdesc
= tq
->tx_ring
.base
+ tq
->tx_ring
.next2fill
;
735 BUG_ON(gdesc
->txd
.gen
== tq
->tx_ring
.gen
);
737 gdesc
->txd
.addr
= cpu_to_le64(tbi
->dma_addr
);
738 gdesc
->dword
[2] = cpu_to_le32(dw2
);
741 netdev_dbg(adapter
->netdev
,
742 "txd[%u]: 0x%Lx 0x%x 0x%x\n",
743 tq
->tx_ring
.next2fill
, le64_to_cpu(gdesc
->txd
.addr
),
744 le32_to_cpu(gdesc
->dword
[2]), gdesc
->dword
[3]);
745 vmxnet3_cmd_ring_adv_next2fill(&tq
->tx_ring
);
746 dw2
= tq
->tx_ring
.gen
<< VMXNET3_TXD_GEN_SHIFT
;
749 buf_offset
+= buf_size
;
752 for (i
= 0; i
< skb_shinfo(skb
)->nr_frags
; i
++) {
753 const struct skb_frag_struct
*frag
= &skb_shinfo(skb
)->frags
[i
];
757 len
= skb_frag_size(frag
);
759 tbi
= tq
->buf_info
+ tq
->tx_ring
.next2fill
;
760 if (len
< VMXNET3_MAX_TX_BUF_SIZE
) {
764 buf_size
= VMXNET3_MAX_TX_BUF_SIZE
;
765 /* spec says that for TxDesc.len, 0 == 2^14 */
767 tbi
->map_type
= VMXNET3_MAP_PAGE
;
768 tbi
->dma_addr
= skb_frag_dma_map(&adapter
->pdev
->dev
, frag
,
769 buf_offset
, buf_size
,
771 if (dma_mapping_error(&adapter
->pdev
->dev
, tbi
->dma_addr
))
776 gdesc
= tq
->tx_ring
.base
+ tq
->tx_ring
.next2fill
;
777 BUG_ON(gdesc
->txd
.gen
== tq
->tx_ring
.gen
);
779 gdesc
->txd
.addr
= cpu_to_le64(tbi
->dma_addr
);
780 gdesc
->dword
[2] = cpu_to_le32(dw2
);
783 netdev_dbg(adapter
->netdev
,
784 "txd[%u]: 0x%llx %u %u\n",
785 tq
->tx_ring
.next2fill
, le64_to_cpu(gdesc
->txd
.addr
),
786 le32_to_cpu(gdesc
->dword
[2]), gdesc
->dword
[3]);
787 vmxnet3_cmd_ring_adv_next2fill(&tq
->tx_ring
);
788 dw2
= tq
->tx_ring
.gen
<< VMXNET3_TXD_GEN_SHIFT
;
791 buf_offset
+= buf_size
;
795 ctx
->eop_txd
= gdesc
;
797 /* set the last buf_info for the pkt */
799 tbi
->sop_idx
= ctx
->sop_txd
- tq
->tx_ring
.base
;
/* Init all tx queues */
static void
vmxnet3_tq_init_all(struct vmxnet3_adapter *adapter)
{
	int i;

	for (i = 0; i < adapter->num_tx_queues; i++)
		vmxnet3_tq_init(&adapter->tx_queue[i], adapter);
}
/*
 *    parse and copy relevant protocol headers:
 *      For a tso pkt, relevant headers are L2/3/4 including options
 *      For a pkt requesting csum offloading, they are L2/3 and may include L4
 *      if it's a TCP/UDP pkt
 *
 * Returns:
 *    -1:  error happens during parsing
 *     0:  protocol headers parsed, but too big to be copied
 *     1:  protocol headers parsed and copied
 *
 * Other effects:
 *    1. related *ctx fields are updated.
 *    2. ctx->copy_size is # of bytes copied
 *    3. the portion copied is guaranteed to be in the linear part
 *
 */
static int
vmxnet3_parse_and_copy_hdr(struct sk_buff *skb, struct vmxnet3_tx_queue *tq,
			   struct vmxnet3_tx_ctx *ctx,
			   struct vmxnet3_adapter *adapter)
{
	struct Vmxnet3_TxDataDesc *tdd;
	u8 protocol = 0;

	if (ctx->mss) {	/* TSO */
		ctx->eth_ip_hdr_size = skb_transport_offset(skb);
		ctx->l4_hdr_size = tcp_hdrlen(skb);
		ctx->copy_size = ctx->eth_ip_hdr_size + ctx->l4_hdr_size;
	} else {
		if (skb->ip_summed == CHECKSUM_PARTIAL) {
			ctx->eth_ip_hdr_size = skb_checksum_start_offset(skb);

			if (ctx->ipv4) {
				const struct iphdr *iph = ip_hdr(skb);

				protocol = iph->protocol;
			} else if (ctx->ipv6) {
				const struct ipv6hdr *ipv6h = ipv6_hdr(skb);

				protocol = ipv6h->nexthdr;
			}

			switch (protocol) {
			case IPPROTO_TCP:
				ctx->l4_hdr_size = tcp_hdrlen(skb);
				break;
			case IPPROTO_UDP:
				ctx->l4_hdr_size = sizeof(struct udphdr);
				break;
			default:
				ctx->l4_hdr_size = 0;
				break;
			}

			ctx->copy_size = min(ctx->eth_ip_hdr_size +
					 ctx->l4_hdr_size, skb->len);
		} else {
			ctx->eth_ip_hdr_size = 0;
			ctx->l4_hdr_size = 0;
			/* copy as much as allowed */
			ctx->copy_size = min((unsigned int)VMXNET3_HDR_COPY_SIZE,
					     skb_headlen(skb));
		}

		if (skb->len <= VMXNET3_HDR_COPY_SIZE)
			ctx->copy_size = skb->len;

		/* make sure headers are accessible directly */
		if (unlikely(!pskb_may_pull(skb, ctx->copy_size)))
			goto err;
	}

	if (unlikely(ctx->copy_size > VMXNET3_HDR_COPY_SIZE)) {
		tq->stats.oversized_hdr++;
		ctx->copy_size = 0;
		return 0;
	}

	tdd = tq->data_ring.base + tq->tx_ring.next2fill;

	memcpy(tdd->data, skb->data, ctx->copy_size);
	netdev_dbg(adapter->netdev,
		   "copy %u bytes to dataRing[%u]\n",
		   ctx->copy_size, tq->tx_ring.next2fill);
	return 1;

err:
	return -1;
}
static void
vmxnet3_prepare_tso(struct sk_buff *skb,
		    struct vmxnet3_tx_ctx *ctx)
{
	struct tcphdr *tcph = tcp_hdr(skb);

	if (ctx->ipv4) {
		struct iphdr *iph = ip_hdr(skb);

		iph->check = 0;
		tcph->check = ~csum_tcpudp_magic(iph->saddr, iph->daddr, 0,
						 IPPROTO_TCP, 0);
	} else if (ctx->ipv6) {
		struct ipv6hdr *iph = ipv6_hdr(skb);

		tcph->check = ~csum_ipv6_magic(&iph->saddr, &iph->daddr, 0,
					       IPPROTO_TCP, 0);
	}
}

static int txd_estimate(const struct sk_buff *skb)
{
	int count = VMXNET3_TXD_NEEDED(skb_headlen(skb)) + 1;
	int i;

	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
		const struct skb_frag_struct *frag = &skb_shinfo(skb)->frags[i];

		count += VMXNET3_TXD_NEEDED(skb_frag_size(frag));
	}
	return count;
}
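/* Rough worked example (assuming VMXNET3_TXD_NEEDED() divides a length by the
 * 16 KB VMXNET3_MAX_TX_BUF_SIZE, rounding up): a packet with a 20 KB linear
 * area and one 3 KB fragment would estimate 2 + 1 descriptors for the linear
 * part plus 1 for the fragment, i.e. count == 4.
 */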
942 * Transmits a pkt thru a given tq
944 * NETDEV_TX_OK: descriptors are setup successfully
945 * NETDEV_TX_OK: error occurred, the pkt is dropped
946 * NETDEV_TX_BUSY: tx ring is full, queue is stopped
949 * 1. tx ring may be changed
950 * 2. tq stats may be updated accordingly
951 * 3. shared->txNumDeferred may be updated
955 vmxnet3_tq_xmit(struct sk_buff
*skb
, struct vmxnet3_tx_queue
*tq
,
956 struct vmxnet3_adapter
*adapter
, struct net_device
*netdev
)
961 struct vmxnet3_tx_ctx ctx
;
962 union Vmxnet3_GenericDesc
*gdesc
;
963 #ifdef __BIG_ENDIAN_BITFIELD
964 /* Use temporary descriptor to avoid touching bits multiple times */
965 union Vmxnet3_GenericDesc tempTxDesc
;
968 count
= txd_estimate(skb
);
970 ctx
.ipv4
= (vlan_get_protocol(skb
) == cpu_to_be16(ETH_P_IP
));
971 ctx
.ipv6
= (vlan_get_protocol(skb
) == cpu_to_be16(ETH_P_IPV6
));
973 ctx
.mss
= skb_shinfo(skb
)->gso_size
;
975 if (skb_header_cloned(skb
)) {
976 if (unlikely(pskb_expand_head(skb
, 0, 0,
978 tq
->stats
.drop_tso
++;
981 tq
->stats
.copy_skb_header
++;
983 vmxnet3_prepare_tso(skb
, &ctx
);
985 if (unlikely(count
> VMXNET3_MAX_TXD_PER_PKT
)) {
987 /* non-tso pkts must not use more than
988 * VMXNET3_MAX_TXD_PER_PKT entries
990 if (skb_linearize(skb
) != 0) {
991 tq
->stats
.drop_too_many_frags
++;
994 tq
->stats
.linearized
++;
996 /* recalculate the # of descriptors to use */
997 count
= VMXNET3_TXD_NEEDED(skb_headlen(skb
)) + 1;
1001 spin_lock_irqsave(&tq
->tx_lock
, flags
);
1003 if (count
> vmxnet3_cmd_ring_desc_avail(&tq
->tx_ring
)) {
1004 tq
->stats
.tx_ring_full
++;
1005 netdev_dbg(adapter
->netdev
,
1006 "tx queue stopped on %s, next2comp %u"
1007 " next2fill %u\n", adapter
->netdev
->name
,
1008 tq
->tx_ring
.next2comp
, tq
->tx_ring
.next2fill
);
1010 vmxnet3_tq_stop(tq
, adapter
);
1011 spin_unlock_irqrestore(&tq
->tx_lock
, flags
);
1012 return NETDEV_TX_BUSY
;
1016 ret
= vmxnet3_parse_and_copy_hdr(skb
, tq
, &ctx
, adapter
);
1018 BUG_ON(ret
<= 0 && ctx
.copy_size
!= 0);
1019 /* hdrs parsed, check against other limits */
1021 if (unlikely(ctx
.eth_ip_hdr_size
+ ctx
.l4_hdr_size
>
1022 VMXNET3_MAX_TX_BUF_SIZE
)) {
1026 if (skb
->ip_summed
== CHECKSUM_PARTIAL
) {
1027 if (unlikely(ctx
.eth_ip_hdr_size
+
1029 VMXNET3_MAX_CSUM_OFFSET
)) {
1035 tq
->stats
.drop_hdr_inspect_err
++;
1036 goto unlock_drop_pkt
;
1039 /* fill tx descs related to addr & len */
1040 if (vmxnet3_map_pkt(skb
, &ctx
, tq
, adapter
->pdev
, adapter
))
1041 goto unlock_drop_pkt
;
1043 /* setup the EOP desc */
1044 ctx
.eop_txd
->dword
[3] = cpu_to_le32(VMXNET3_TXD_CQ
| VMXNET3_TXD_EOP
);
1046 /* setup the SOP desc */
1047 #ifdef __BIG_ENDIAN_BITFIELD
1048 gdesc
= &tempTxDesc
;
1049 gdesc
->dword
[2] = ctx
.sop_txd
->dword
[2];
1050 gdesc
->dword
[3] = ctx
.sop_txd
->dword
[3];
1052 gdesc
= ctx
.sop_txd
;
1055 gdesc
->txd
.hlen
= ctx
.eth_ip_hdr_size
+ ctx
.l4_hdr_size
;
1056 gdesc
->txd
.om
= VMXNET3_OM_TSO
;
1057 gdesc
->txd
.msscof
= ctx
.mss
;
1058 le32_add_cpu(&tq
->shared
->txNumDeferred
, (skb
->len
-
1059 gdesc
->txd
.hlen
+ ctx
.mss
- 1) / ctx
.mss
);
1061 if (skb
->ip_summed
== CHECKSUM_PARTIAL
) {
1062 gdesc
->txd
.hlen
= ctx
.eth_ip_hdr_size
;
1063 gdesc
->txd
.om
= VMXNET3_OM_CSUM
;
1064 gdesc
->txd
.msscof
= ctx
.eth_ip_hdr_size
+
1068 gdesc
->txd
.msscof
= 0;
1070 le32_add_cpu(&tq
->shared
->txNumDeferred
, 1);
1073 if (skb_vlan_tag_present(skb
)) {
1075 gdesc
->txd
.tci
= skb_vlan_tag_get(skb
);
1078 /* finally flips the GEN bit of the SOP desc. */
1079 gdesc
->dword
[2] = cpu_to_le32(le32_to_cpu(gdesc
->dword
[2]) ^
1081 #ifdef __BIG_ENDIAN_BITFIELD
1082 /* Finished updating in bitfields of Tx Desc, so write them in original
1085 vmxnet3_TxDescToLe((struct Vmxnet3_TxDesc
*)gdesc
,
1086 (struct Vmxnet3_TxDesc
*)ctx
.sop_txd
);
1087 gdesc
= ctx
.sop_txd
;
1089 netdev_dbg(adapter
->netdev
,
1090 "txd[%u]: SOP 0x%Lx 0x%x 0x%x\n",
1092 tq
->tx_ring
.base
), le64_to_cpu(gdesc
->txd
.addr
),
1093 le32_to_cpu(gdesc
->dword
[2]), le32_to_cpu(gdesc
->dword
[3]));
1095 spin_unlock_irqrestore(&tq
->tx_lock
, flags
);
1097 if (le32_to_cpu(tq
->shared
->txNumDeferred
) >=
1098 le32_to_cpu(tq
->shared
->txThreshold
)) {
1099 tq
->shared
->txNumDeferred
= 0;
1100 VMXNET3_WRITE_BAR0_REG(adapter
,
1101 VMXNET3_REG_TXPROD
+ tq
->qid
* 8,
1102 tq
->tx_ring
.next2fill
);
1105 return NETDEV_TX_OK
;
1108 tq
->stats
.drop_oversized_hdr
++;
1110 spin_unlock_irqrestore(&tq
->tx_lock
, flags
);
1112 tq
->stats
.drop_total
++;
1113 dev_kfree_skb_any(skb
);
1114 return NETDEV_TX_OK
;
static netdev_tx_t
vmxnet3_xmit_frame(struct sk_buff *skb, struct net_device *netdev)
{
	struct vmxnet3_adapter *adapter = netdev_priv(netdev);

	BUG_ON(skb->queue_mapping > adapter->num_tx_queues);
	return vmxnet3_tq_xmit(skb,
			       &adapter->tx_queue[skb->queue_mapping],
			       adapter, netdev);
}
static void
vmxnet3_rx_csum(struct vmxnet3_adapter *adapter,
		struct sk_buff *skb,
		union Vmxnet3_GenericDesc *gdesc)
{
	if (!gdesc->rcd.cnc && adapter->netdev->features & NETIF_F_RXCSUM) {
		/* typical case: TCP/UDP over IP and both csums are correct */
		if ((le32_to_cpu(gdesc->dword[3]) & VMXNET3_RCD_CSUM_OK) ==
							VMXNET3_RCD_CSUM_OK) {
			skb->ip_summed = CHECKSUM_UNNECESSARY;
			BUG_ON(!(gdesc->rcd.tcp || gdesc->rcd.udp));
			BUG_ON(!(gdesc->rcd.v4 || gdesc->rcd.v6));
			BUG_ON(gdesc->rcd.frg);
		} else {
			if (gdesc->rcd.csum) {
				skb->csum = htons(gdesc->rcd.csum);
				skb->ip_summed = CHECKSUM_PARTIAL;
			} else {
				skb_checksum_none_assert(skb);
			}
		}
	} else {
		skb_checksum_none_assert(skb);
	}
}
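/* Two outcomes above: when the device validated both L3/L4 checksums the skb
 * is marked CHECKSUM_UNNECESSARY so the stack skips verification; when only a
 * partial checksum value is reported it is stored in skb->csum with
 * CHECKSUM_PARTIAL, and in every other case the skb is left unchecked.
 */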
static void
vmxnet3_rx_error(struct vmxnet3_rx_queue *rq, struct Vmxnet3_RxCompDesc *rcd,
		 struct vmxnet3_rx_ctx *ctx, struct vmxnet3_adapter *adapter)
{
	rq->stats.drop_err++;
	if (!rcd->fcs)
		rq->stats.drop_fcs++;

	rq->stats.drop_total++;

	/*
	 * We do not unmap and chain the rx buffer to the skb.
	 * We basically pretend this buffer is not used and will be recycled
	 * by vmxnet3_rq_alloc_rx_buf()
	 */

	/*
	 * ctx->skb may be NULL if this is the first and the only one
	 * desc for the pkt
	 */
	if (ctx->skb)
		dev_kfree_skb_irq(ctx->skb);

	ctx->skb = NULL;
}
static u32
vmxnet3_get_hdr_len(struct vmxnet3_adapter *adapter, struct sk_buff *skb,
		    union Vmxnet3_GenericDesc *gdesc)
{
	u32 hlen, maplen;
	union {
		void *ptr;
		struct ethhdr *eth;
		struct iphdr *ipv4;
		struct ipv6hdr *ipv6;
		struct tcphdr *tcp;
	} hdr;
	BUG_ON(gdesc->rcd.tcp == 0);

	maplen = skb_headlen(skb);
	if (unlikely(sizeof(struct iphdr) + sizeof(struct tcphdr) > maplen))
		return 0;

	hdr.eth = eth_hdr(skb);
	if (gdesc->rcd.v4) {
		BUG_ON(hdr.eth->h_proto != htons(ETH_P_IP));
		hdr.ptr += sizeof(struct ethhdr);
		BUG_ON(hdr.ipv4->protocol != IPPROTO_TCP);
		hlen = hdr.ipv4->ihl << 2;
		hdr.ptr += hdr.ipv4->ihl << 2;
	} else if (gdesc->rcd.v6) {
		BUG_ON(hdr.eth->h_proto != htons(ETH_P_IPV6));
		hdr.ptr += sizeof(struct ethhdr);
		/* Use an estimated value, since we also need to handle
		 * TSO case.
		 */
		if (hdr.ipv6->nexthdr != IPPROTO_TCP)
			return sizeof(struct ipv6hdr) + sizeof(struct tcphdr);
		hlen = sizeof(struct ipv6hdr);
		hdr.ptr += sizeof(struct ipv6hdr);
	} else {
		/* Non-IP pkt, dont estimate header length */
		return 0;
	}

	if (hlen + sizeof(struct tcphdr) > maplen)
		return 0;

	return (hlen + (hdr.tcp->doff << 2));
}
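/* The length returned above is only an estimate good enough for computing
 * gso_size for an aggregated packet: IPv6 extension headers are not walked,
 * and a 0 return tells the caller the headers could not be sized from the
 * linear part.
 */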
1231 vmxnet3_rq_rx_complete(struct vmxnet3_rx_queue
*rq
,
1232 struct vmxnet3_adapter
*adapter
, int quota
)
1234 static const u32 rxprod_reg
[2] = {
1235 VMXNET3_REG_RXPROD
, VMXNET3_REG_RXPROD2
1238 bool skip_page_frags
= false;
1239 struct Vmxnet3_RxCompDesc
*rcd
;
1240 struct vmxnet3_rx_ctx
*ctx
= &rq
->rx_ctx
;
1241 u16 segCnt
= 0, mss
= 0;
1242 #ifdef __BIG_ENDIAN_BITFIELD
1243 struct Vmxnet3_RxDesc rxCmdDesc
;
1244 struct Vmxnet3_RxCompDesc rxComp
;
1246 vmxnet3_getRxComp(rcd
, &rq
->comp_ring
.base
[rq
->comp_ring
.next2proc
].rcd
,
1248 while (rcd
->gen
== rq
->comp_ring
.gen
) {
1249 struct vmxnet3_rx_buf_info
*rbi
;
1250 struct sk_buff
*skb
, *new_skb
= NULL
;
1251 struct page
*new_page
= NULL
;
1252 dma_addr_t new_dma_addr
;
1254 struct Vmxnet3_RxDesc
*rxd
;
1256 struct vmxnet3_cmd_ring
*ring
= NULL
;
1257 if (num_pkts
>= quota
) {
1258 /* we may stop even before we see the EOP desc of
1263 BUG_ON(rcd
->rqID
!= rq
->qid
&& rcd
->rqID
!= rq
->qid2
);
1265 ring_idx
= rcd
->rqID
< adapter
->num_rx_queues
? 0 : 1;
1266 ring
= rq
->rx_ring
+ ring_idx
;
1267 vmxnet3_getRxDesc(rxd
, &rq
->rx_ring
[ring_idx
].base
[idx
].rxd
,
1269 rbi
= rq
->buf_info
[ring_idx
] + idx
;
1271 BUG_ON(rxd
->addr
!= rbi
->dma_addr
||
1272 rxd
->len
!= rbi
->len
);
1274 if (unlikely(rcd
->eop
&& rcd
->err
)) {
1275 vmxnet3_rx_error(rq
, rcd
, ctx
, adapter
);
1279 if (rcd
->sop
) { /* first buf of the pkt */
1280 BUG_ON(rxd
->btype
!= VMXNET3_RXD_BTYPE_HEAD
||
1281 rcd
->rqID
!= rq
->qid
);
1283 BUG_ON(rbi
->buf_type
!= VMXNET3_RX_BUF_SKB
);
1284 BUG_ON(ctx
->skb
!= NULL
|| rbi
->skb
== NULL
);
1286 if (unlikely(rcd
->len
== 0)) {
1287 /* Pretend the rx buffer is skipped. */
1288 BUG_ON(!(rcd
->sop
&& rcd
->eop
));
1289 netdev_dbg(adapter
->netdev
,
1290 "rxRing[%u][%u] 0 length\n",
1295 skip_page_frags
= false;
1296 ctx
->skb
= rbi
->skb
;
1297 new_skb
= netdev_alloc_skb_ip_align(adapter
->netdev
,
1299 if (new_skb
== NULL
) {
1300 /* Skb allocation failed, do not handover this
1301 * skb to stack. Reuse it. Drop the existing pkt
1303 rq
->stats
.rx_buf_alloc_failure
++;
1305 rq
->stats
.drop_total
++;
1306 skip_page_frags
= true;
1309 new_dma_addr
= dma_map_single(&adapter
->pdev
->dev
,
1310 new_skb
->data
, rbi
->len
,
1311 PCI_DMA_FROMDEVICE
);
1312 if (dma_mapping_error(&adapter
->pdev
->dev
,
1314 dev_kfree_skb(new_skb
);
1315 /* Skb allocation failed, do not handover this
1316 * skb to stack. Reuse it. Drop the existing pkt
1318 rq
->stats
.rx_buf_alloc_failure
++;
1320 rq
->stats
.drop_total
++;
1321 skip_page_frags
= true;
1325 dma_unmap_single(&adapter
->pdev
->dev
, rbi
->dma_addr
,
1327 PCI_DMA_FROMDEVICE
);
1330 if (rcd
->rssType
!= VMXNET3_RCD_RSS_TYPE_NONE
&&
1331 (adapter
->netdev
->features
& NETIF_F_RXHASH
))
1332 skb_set_hash(ctx
->skb
,
1333 le32_to_cpu(rcd
->rssHash
),
1336 skb_put(ctx
->skb
, rcd
->len
);
1338 /* Immediate refill */
1340 rbi
->dma_addr
= new_dma_addr
;
1341 rxd
->addr
= cpu_to_le64(rbi
->dma_addr
);
1342 rxd
->len
= rbi
->len
;
1343 if (adapter
->version
== 2 &&
1344 rcd
->type
== VMXNET3_CDTYPE_RXCOMP_LRO
) {
1345 struct Vmxnet3_RxCompDescExt
*rcdlro
;
1346 rcdlro
= (struct Vmxnet3_RxCompDescExt
*)rcd
;
1348 segCnt
= rcdlro
->segCnt
;
1349 BUG_ON(segCnt
<= 1);
1351 if (unlikely(segCnt
<= 1))
1357 BUG_ON(ctx
->skb
== NULL
&& !skip_page_frags
);
1359 /* non SOP buffer must be type 1 in most cases */
1360 BUG_ON(rbi
->buf_type
!= VMXNET3_RX_BUF_PAGE
);
1361 BUG_ON(rxd
->btype
!= VMXNET3_RXD_BTYPE_BODY
);
1363 /* If an sop buffer was dropped, skip all
1364 * following non-sop fragments. They will be reused.
1366 if (skip_page_frags
)
1370 new_page
= alloc_page(GFP_ATOMIC
);
1371 /* Replacement page frag could not be allocated.
1372 * Reuse this page. Drop the pkt and free the
1373 * skb which contained this page as a frag. Skip
1374 * processing all the following non-sop frags.
1376 if (unlikely(!new_page
)) {
1377 rq
->stats
.rx_buf_alloc_failure
++;
1378 dev_kfree_skb(ctx
->skb
);
1380 skip_page_frags
= true;
1383 new_dma_addr
= dma_map_page(&adapter
->pdev
->dev
,
1386 PCI_DMA_FROMDEVICE
);
1387 if (dma_mapping_error(&adapter
->pdev
->dev
,
1390 rq
->stats
.rx_buf_alloc_failure
++;
1391 dev_kfree_skb(ctx
->skb
);
1393 skip_page_frags
= true;
1397 dma_unmap_page(&adapter
->pdev
->dev
,
1398 rbi
->dma_addr
, rbi
->len
,
1399 PCI_DMA_FROMDEVICE
);
1401 vmxnet3_append_frag(ctx
->skb
, rcd
, rbi
);
1403 /* Immediate refill */
1404 rbi
->page
= new_page
;
1405 rbi
->dma_addr
= new_dma_addr
;
1406 rxd
->addr
= cpu_to_le64(rbi
->dma_addr
);
1407 rxd
->len
= rbi
->len
;
1414 u32 mtu
= adapter
->netdev
->mtu
;
1415 skb
->len
+= skb
->data_len
;
1417 vmxnet3_rx_csum(adapter
, skb
,
1418 (union Vmxnet3_GenericDesc
*)rcd
);
1419 skb
->protocol
= eth_type_trans(skb
, adapter
->netdev
);
1420 if (!rcd
->tcp
|| !adapter
->lro
)
1423 if (segCnt
!= 0 && mss
!= 0) {
1424 skb_shinfo(skb
)->gso_type
= rcd
->v4
?
1425 SKB_GSO_TCPV4
: SKB_GSO_TCPV6
;
1426 skb_shinfo(skb
)->gso_size
= mss
;
1427 skb_shinfo(skb
)->gso_segs
= segCnt
;
1428 } else if (segCnt
!= 0 || skb
->len
> mtu
) {
1431 hlen
= vmxnet3_get_hdr_len(adapter
, skb
,
1432 (union Vmxnet3_GenericDesc
*)rcd
);
1436 skb_shinfo(skb
)->gso_type
=
1437 rcd
->v4
? SKB_GSO_TCPV4
: SKB_GSO_TCPV6
;
1439 skb_shinfo(skb
)->gso_segs
= segCnt
;
1440 skb_shinfo(skb
)->gso_size
=
1441 DIV_ROUND_UP(skb
->len
-
1444 skb_shinfo(skb
)->gso_size
= mtu
- hlen
;
1448 if (unlikely(rcd
->ts
))
1449 __vlan_hwaccel_put_tag(skb
, htons(ETH_P_8021Q
), rcd
->tci
);
1451 if (adapter
->netdev
->features
& NETIF_F_LRO
)
1452 netif_receive_skb(skb
);
1454 napi_gro_receive(&rq
->napi
, skb
);
1461 /* device may have skipped some rx descs */
1462 ring
->next2comp
= idx
;
1463 num_to_alloc
= vmxnet3_cmd_ring_desc_avail(ring
);
1464 ring
= rq
->rx_ring
+ ring_idx
;
1465 while (num_to_alloc
) {
1466 vmxnet3_getRxDesc(rxd
, &ring
->base
[ring
->next2fill
].rxd
,
1470 /* Recv desc is ready to be used by the device */
1471 rxd
->gen
= ring
->gen
;
1472 vmxnet3_cmd_ring_adv_next2fill(ring
);
1476 /* if needed, update the register */
1477 if (unlikely(rq
->shared
->updateRxProd
)) {
1478 VMXNET3_WRITE_BAR0_REG(adapter
,
1479 rxprod_reg
[ring_idx
] + rq
->qid
* 8,
1483 vmxnet3_comp_ring_adv_next2proc(&rq
->comp_ring
);
1484 vmxnet3_getRxComp(rcd
,
1485 &rq
->comp_ring
.base
[rq
->comp_ring
.next2proc
].rcd
, &rxComp
);
static void
vmxnet3_rq_cleanup(struct vmxnet3_rx_queue *rq,
		   struct vmxnet3_adapter *adapter)
{
	u32 i, ring_idx;
	struct Vmxnet3_RxDesc *rxd;

	for (ring_idx = 0; ring_idx < 2; ring_idx++) {
		for (i = 0; i < rq->rx_ring[ring_idx].size; i++) {
#ifdef __BIG_ENDIAN_BITFIELD
			struct Vmxnet3_RxDesc rxDesc;
#endif
			vmxnet3_getRxDesc(rxd,
				&rq->rx_ring[ring_idx].base[i].rxd, &rxDesc);

			if (rxd->btype == VMXNET3_RXD_BTYPE_HEAD &&
					rq->buf_info[ring_idx][i].skb) {
				dma_unmap_single(&adapter->pdev->dev, rxd->addr,
						 rxd->len, PCI_DMA_FROMDEVICE);
				dev_kfree_skb(rq->buf_info[ring_idx][i].skb);
				rq->buf_info[ring_idx][i].skb = NULL;
			} else if (rxd->btype == VMXNET3_RXD_BTYPE_BODY &&
					rq->buf_info[ring_idx][i].page) {
				dma_unmap_page(&adapter->pdev->dev, rxd->addr,
					       rxd->len, PCI_DMA_FROMDEVICE);
				put_page(rq->buf_info[ring_idx][i].page);
				rq->buf_info[ring_idx][i].page = NULL;
			}
		}

		rq->rx_ring[ring_idx].gen = VMXNET3_INIT_GEN;
		rq->rx_ring[ring_idx].next2fill =
					rq->rx_ring[ring_idx].next2comp = 0;
	}

	rq->comp_ring.gen = VMXNET3_INIT_GEN;
	rq->comp_ring.next2proc = 0;
}
static void
vmxnet3_rq_cleanup_all(struct vmxnet3_adapter *adapter)
{
	int i;

	for (i = 0; i < adapter->num_rx_queues; i++)
		vmxnet3_rq_cleanup(&adapter->rx_queue[i], adapter);
}
static void vmxnet3_rq_destroy(struct vmxnet3_rx_queue *rq,
			       struct vmxnet3_adapter *adapter)
{
	int i;
	int j;

	/* all rx buffers must have already been freed */
	for (i = 0; i < 2; i++) {
		if (rq->buf_info[i]) {
			for (j = 0; j < rq->rx_ring[i].size; j++)
				BUG_ON(rq->buf_info[i][j].page != NULL);
		}
	}


	for (i = 0; i < 2; i++) {
		if (rq->rx_ring[i].base) {
			dma_free_coherent(&adapter->pdev->dev,
					  rq->rx_ring[i].size
					  * sizeof(struct Vmxnet3_RxDesc),
					  rq->rx_ring[i].base,
					  rq->rx_ring[i].basePA);
			rq->rx_ring[i].base = NULL;
		}
	}

	if (rq->comp_ring.base) {
		dma_free_coherent(&adapter->pdev->dev, rq->comp_ring.size
				  * sizeof(struct Vmxnet3_RxCompDesc),
				  rq->comp_ring.base, rq->comp_ring.basePA);
		rq->comp_ring.base = NULL;
	}

	if (rq->buf_info[0]) {
		size_t sz = sizeof(struct vmxnet3_rx_buf_info) *
			(rq->rx_ring[0].size + rq->rx_ring[1].size);
		dma_free_coherent(&adapter->pdev->dev, sz, rq->buf_info[0],
				  rq->buf_info_pa);
		rq->buf_info[0] = rq->buf_info[1] = NULL;
	}
}
static int
vmxnet3_rq_init(struct vmxnet3_rx_queue *rq,
		struct vmxnet3_adapter *adapter)
{
	int i;

	/* initialize buf_info */
	for (i = 0; i < rq->rx_ring[0].size; i++) {

		/* 1st buf for a pkt is skbuff */
		if (i % adapter->rx_buf_per_pkt == 0) {
			rq->buf_info[0][i].buf_type = VMXNET3_RX_BUF_SKB;
			rq->buf_info[0][i].len = adapter->skb_buf_size;
		} else { /* subsequent bufs for a pkt is frag */
			rq->buf_info[0][i].buf_type = VMXNET3_RX_BUF_PAGE;
			rq->buf_info[0][i].len = PAGE_SIZE;
		}
	}
	for (i = 0; i < rq->rx_ring[1].size; i++) {
		rq->buf_info[1][i].buf_type = VMXNET3_RX_BUF_PAGE;
		rq->buf_info[1][i].len = PAGE_SIZE;
	}

	/* reset internal state and allocate buffers for both rings */
	for (i = 0; i < 2; i++) {
		rq->rx_ring[i].next2fill = rq->rx_ring[i].next2comp = 0;

		memset(rq->rx_ring[i].base, 0, rq->rx_ring[i].size *
		       sizeof(struct Vmxnet3_RxDesc));
		rq->rx_ring[i].gen = VMXNET3_INIT_GEN;
	}
	if (vmxnet3_rq_alloc_rx_buf(rq, 0, rq->rx_ring[0].size - 1,
				    adapter) == 0) {
		/* at least has 1 rx buffer for the 1st ring */
		return -ENOMEM;
	}
	vmxnet3_rq_alloc_rx_buf(rq, 1, rq->rx_ring[1].size - 1, adapter);

	/* reset the comp ring */
	rq->comp_ring.next2proc = 0;
	memset(rq->comp_ring.base, 0, rq->comp_ring.size *
	       sizeof(struct Vmxnet3_RxCompDesc));
	rq->comp_ring.gen = VMXNET3_INIT_GEN;

	/* reset rxctx */
	rq->rx_ctx.skb = NULL;

	/* stats are not reset */
	return 0;
}
static int
vmxnet3_rq_init_all(struct vmxnet3_adapter *adapter)
{
	int i, err = 0;

	for (i = 0; i < adapter->num_rx_queues; i++) {
		err = vmxnet3_rq_init(&adapter->rx_queue[i], adapter);
		if (unlikely(err)) {
			dev_err(&adapter->netdev->dev, "%s: failed to "
				"initialize rx queue%i\n",
				adapter->netdev->name, i);
			break;
		}
	}
	return err;
}
static int
vmxnet3_rq_create(struct vmxnet3_rx_queue *rq, struct vmxnet3_adapter *adapter)
{
	int i;
	size_t sz;
	struct vmxnet3_rx_buf_info *bi;

	for (i = 0; i < 2; i++) {

		sz = rq->rx_ring[i].size * sizeof(struct Vmxnet3_RxDesc);
		rq->rx_ring[i].base = dma_alloc_coherent(
						&adapter->pdev->dev, sz,
						&rq->rx_ring[i].basePA,
						GFP_KERNEL);
		if (!rq->rx_ring[i].base) {
			netdev_err(adapter->netdev,
				   "failed to allocate rx ring %d\n", i);
			goto err;
		}
	}

	sz = rq->comp_ring.size * sizeof(struct Vmxnet3_RxCompDesc);
	rq->comp_ring.base = dma_alloc_coherent(&adapter->pdev->dev, sz,
						&rq->comp_ring.basePA,
						GFP_KERNEL);
	if (!rq->comp_ring.base) {
		netdev_err(adapter->netdev, "failed to allocate rx comp ring\n");
		goto err;
	}

	sz = sizeof(struct vmxnet3_rx_buf_info) * (rq->rx_ring[0].size +
						   rq->rx_ring[1].size);
	bi = dma_zalloc_coherent(&adapter->pdev->dev, sz, &rq->buf_info_pa,
				 GFP_KERNEL);
	if (!bi)
		goto err;

	rq->buf_info[0] = bi;
	rq->buf_info[1] = bi + rq->rx_ring[0].size;

	return 0;

err:
	vmxnet3_rq_destroy(rq, adapter);
	return -ENOMEM;
}
static int
vmxnet3_rq_create_all(struct vmxnet3_adapter *adapter)
{
	int i, err = 0;

	for (i = 0; i < adapter->num_rx_queues; i++) {
		err = vmxnet3_rq_create(&adapter->rx_queue[i], adapter);
		if (unlikely(err)) {
			dev_err(&adapter->netdev->dev,
				"%s: failed to create rx queue%i\n",
				adapter->netdev->name, i);
			goto err_out;
		}
	}
	return err;
err_out:
	vmxnet3_rq_destroy_all(adapter);
	return err;
}
/* Multiple queue aware polling function for tx and rx */

static int
vmxnet3_do_poll(struct vmxnet3_adapter *adapter, int budget)
{
	int rcd_done = 0, i;
	if (unlikely(adapter->shared->ecr))
		vmxnet3_process_events(adapter);
	for (i = 0; i < adapter->num_tx_queues; i++)
		vmxnet3_tq_tx_complete(&adapter->tx_queue[i], adapter);

	for (i = 0; i < adapter->num_rx_queues; i++)
		rcd_done += vmxnet3_rq_rx_complete(&adapter->rx_queue[i],
						   adapter, budget);
	return rcd_done;
}


static int
vmxnet3_poll(struct napi_struct *napi, int budget)
{
	struct vmxnet3_rx_queue *rx_queue = container_of(napi,
					  struct vmxnet3_rx_queue, napi);
	int rxd_done;

	rxd_done = vmxnet3_do_poll(rx_queue->adapter, budget);

	if (rxd_done < budget) {
		napi_complete(napi);
		vmxnet3_enable_all_intrs(rx_queue->adapter);
	}
	return rxd_done;
}

/*
 * NAPI polling function for MSI-X mode with multiple Rx queues
 * Returns the # of the NAPI credit consumed (# of rx descriptors processed)
 */

static int
vmxnet3_poll_rx_only(struct napi_struct *napi, int budget)
{
	struct vmxnet3_rx_queue *rq = container_of(napi,
						struct vmxnet3_rx_queue, napi);
	struct vmxnet3_adapter *adapter = rq->adapter;
	int rxd_done;

	/* When sharing interrupt with corresponding tx queue, process
	 * tx completions in that queue as well
	 */
	if (adapter->share_intr == VMXNET3_INTR_BUDDYSHARE) {
		struct vmxnet3_tx_queue *tq =
				&adapter->tx_queue[rq - adapter->rx_queue];
		vmxnet3_tq_tx_complete(tq, adapter);
	}

	rxd_done = vmxnet3_rq_rx_complete(rq, adapter, budget);

	if (rxd_done < budget) {
		napi_complete(napi);
		vmxnet3_enable_intr(adapter, rq->comp_ring.intr_idx);
	}
	return rxd_done;
}
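/* Both poll routines above follow the usual NAPI contract: interrupts for
 * the queue stay masked while work remains, and are re-enabled only after
 * napi_complete() when fewer than 'budget' rx descriptors were processed.
 */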
#ifdef CONFIG_PCI_MSI

/*
 * Handle completion interrupts on tx queues
 * Returns whether or not the intr is handled
 */

static irqreturn_t
vmxnet3_msix_tx(int irq, void *data)
{
	struct vmxnet3_tx_queue *tq = data;
	struct vmxnet3_adapter *adapter = tq->adapter;

	if (adapter->intr.mask_mode == VMXNET3_IMM_ACTIVE)
		vmxnet3_disable_intr(adapter, tq->comp_ring.intr_idx);

	/* Handle the case where only one irq is allocate for all tx queues */
	if (adapter->share_intr == VMXNET3_INTR_TXSHARE) {
		int i;
		for (i = 0; i < adapter->num_tx_queues; i++) {
			struct vmxnet3_tx_queue *txq = &adapter->tx_queue[i];
			vmxnet3_tq_tx_complete(txq, adapter);
		}
	} else {
		vmxnet3_tq_tx_complete(tq, adapter);
	}
	vmxnet3_enable_intr(adapter, tq->comp_ring.intr_idx);

	return IRQ_HANDLED;
}


/*
 * Handle completion interrupts on rx queues. Returns whether or not the
 * intr is handled
 */

static irqreturn_t
vmxnet3_msix_rx(int irq, void *data)
{
	struct vmxnet3_rx_queue *rq = data;
	struct vmxnet3_adapter *adapter = rq->adapter;

	/* disable intr if needed */
	if (adapter->intr.mask_mode == VMXNET3_IMM_ACTIVE)
		vmxnet3_disable_intr(adapter, rq->comp_ring.intr_idx);
	napi_schedule(&rq->napi);

	return IRQ_HANDLED;
}

/*
 *----------------------------------------------------------------------------
 *
 * vmxnet3_msix_event --
 *
 *    vmxnet3 msix event intr handler
 *
 * Result:
 *    whether or not the intr is handled
 *
 *----------------------------------------------------------------------------
 */

static irqreturn_t
vmxnet3_msix_event(int irq, void *data)
{
	struct net_device *dev = data;
	struct vmxnet3_adapter *adapter = netdev_priv(dev);

	/* disable intr if needed */
	if (adapter->intr.mask_mode == VMXNET3_IMM_ACTIVE)
		vmxnet3_disable_intr(adapter, adapter->intr.event_intr_idx);

	if (adapter->shared->ecr)
		vmxnet3_process_events(adapter);

	vmxnet3_enable_intr(adapter, adapter->intr.event_intr_idx);

	return IRQ_HANDLED;
}

#endif /* CONFIG_PCI_MSI  */
/* Interrupt handler for vmxnet3  */
static irqreturn_t
vmxnet3_intr(int irq, void *dev_id)
{
	struct net_device *dev = dev_id;
	struct vmxnet3_adapter *adapter = netdev_priv(dev);

	if (adapter->intr.type == VMXNET3_IT_INTX) {
		u32 icr = VMXNET3_READ_BAR1_REG(adapter, VMXNET3_REG_ICR);
		if (unlikely(icr == 0))
			/* not ours */
			return IRQ_NONE;
	}


	/* disable intr if needed */
	if (adapter->intr.mask_mode == VMXNET3_IMM_ACTIVE)
		vmxnet3_disable_all_intrs(adapter);

	napi_schedule(&adapter->rx_queue[0].napi);

	return IRQ_HANDLED;
}

#ifdef CONFIG_NET_POLL_CONTROLLER

/* netpoll callback. */
static void
vmxnet3_netpoll(struct net_device *netdev)
{
	struct vmxnet3_adapter *adapter = netdev_priv(netdev);

	switch (adapter->intr.type) {
#ifdef CONFIG_PCI_MSI
	case VMXNET3_IT_MSIX: {
		int i;
		for (i = 0; i < adapter->num_rx_queues; i++)
			vmxnet3_msix_rx(0, &adapter->rx_queue[i]);
		break;
	}
#endif
	case VMXNET3_IT_MSI:
	default:
		vmxnet3_intr(0, adapter->netdev);
		break;
	}

}
#endif	/* CONFIG_NET_POLL_CONTROLLER */
1927 vmxnet3_request_irqs(struct vmxnet3_adapter
*adapter
)
1929 struct vmxnet3_intr
*intr
= &adapter
->intr
;
1933 #ifdef CONFIG_PCI_MSI
1934 if (adapter
->intr
.type
== VMXNET3_IT_MSIX
) {
1935 for (i
= 0; i
< adapter
->num_tx_queues
; i
++) {
1936 if (adapter
->share_intr
!= VMXNET3_INTR_BUDDYSHARE
) {
1937 sprintf(adapter
->tx_queue
[i
].name
, "%s-tx-%d",
1938 adapter
->netdev
->name
, vector
);
1940 intr
->msix_entries
[vector
].vector
,
1942 adapter
->tx_queue
[i
].name
,
1943 &adapter
->tx_queue
[i
]);
1945 sprintf(adapter
->tx_queue
[i
].name
, "%s-rxtx-%d",
1946 adapter
->netdev
->name
, vector
);
1949 dev_err(&adapter
->netdev
->dev
,
1950 "Failed to request irq for MSIX, %s, "
1952 adapter
->tx_queue
[i
].name
, err
);
1956 /* Handle the case where only 1 MSIx was allocated for
1958 if (adapter
->share_intr
== VMXNET3_INTR_TXSHARE
) {
1959 for (; i
< adapter
->num_tx_queues
; i
++)
1960 adapter
->tx_queue
[i
].comp_ring
.intr_idx
1965 adapter
->tx_queue
[i
].comp_ring
.intr_idx
1969 if (adapter
->share_intr
== VMXNET3_INTR_BUDDYSHARE
)
1972 for (i
= 0; i
< adapter
->num_rx_queues
; i
++) {
1973 if (adapter
->share_intr
!= VMXNET3_INTR_BUDDYSHARE
)
1974 sprintf(adapter
->rx_queue
[i
].name
, "%s-rx-%d",
1975 adapter
->netdev
->name
, vector
);
1977 sprintf(adapter
->rx_queue
[i
].name
, "%s-rxtx-%d",
1978 adapter
->netdev
->name
, vector
);
1979 err
= request_irq(intr
->msix_entries
[vector
].vector
,
1981 adapter
->rx_queue
[i
].name
,
1982 &(adapter
->rx_queue
[i
]));
1984 netdev_err(adapter
->netdev
,
1985 "Failed to request irq for MSIX, "
1987 adapter
->rx_queue
[i
].name
, err
);
1991 adapter
->rx_queue
[i
].comp_ring
.intr_idx
= vector
++;
1994 sprintf(intr
->event_msi_vector_name
, "%s-event-%d",
1995 adapter
->netdev
->name
, vector
);
1996 err
= request_irq(intr
->msix_entries
[vector
].vector
,
1997 vmxnet3_msix_event
, 0,
1998 intr
->event_msi_vector_name
, adapter
->netdev
);
1999 intr
->event_intr_idx
= vector
;
2001 } else if (intr
->type
== VMXNET3_IT_MSI
) {
2002 adapter
->num_rx_queues
= 1;
2003 err
= request_irq(adapter
->pdev
->irq
, vmxnet3_intr
, 0,
2004 adapter
->netdev
->name
, adapter
->netdev
);
2007 adapter
->num_rx_queues
= 1;
2008 err
= request_irq(adapter
->pdev
->irq
, vmxnet3_intr
,
2009 IRQF_SHARED
, adapter
->netdev
->name
,
2011 #ifdef CONFIG_PCI_MSI
2014 intr
->num_intrs
= vector
+ 1;
2016 netdev_err(adapter
->netdev
,
2017 "Failed to request irq (intr type:%d), error %d\n",
2020 /* Number of rx queues will not change after this */
2021 for (i
= 0; i
< adapter
->num_rx_queues
; i
++) {
2022 struct vmxnet3_rx_queue
*rq
= &adapter
->rx_queue
[i
];
2024 rq
->qid2
= i
+ adapter
->num_rx_queues
;
2029 /* init our intr settings */
2030 for (i
= 0; i
< intr
->num_intrs
; i
++)
2031 intr
->mod_levels
[i
] = UPT1_IML_ADAPTIVE
;
2032 if (adapter
->intr
.type
!= VMXNET3_IT_MSIX
) {
2033 adapter
->intr
.event_intr_idx
= 0;
2034 for (i
= 0; i
< adapter
->num_tx_queues
; i
++)
2035 adapter
->tx_queue
[i
].comp_ring
.intr_idx
= 0;
2036 adapter
->rx_queue
[0].comp_ring
.intr_idx
= 0;
2039 netdev_info(adapter
->netdev
,
2040 "intr type %u, mode %u, %u vectors allocated\n",
2041 intr
->type
, intr
->mask_mode
, intr
->num_intrs
);
static void
vmxnet3_free_irqs(struct vmxnet3_adapter *adapter)
{
	struct vmxnet3_intr *intr = &adapter->intr;
	BUG_ON(intr->type == VMXNET3_IT_AUTO || intr->num_intrs <= 0);

	switch (intr->type) {
#ifdef CONFIG_PCI_MSI
	case VMXNET3_IT_MSIX:
	{
		int i, vector = 0;

		if (adapter->share_intr != VMXNET3_INTR_BUDDYSHARE) {
			for (i = 0; i < adapter->num_tx_queues; i++) {
				free_irq(intr->msix_entries[vector++].vector,
					 &(adapter->tx_queue[i]));
				if (adapter->share_intr == VMXNET3_INTR_TXSHARE)
					break;
			}
		}

		for (i = 0; i < adapter->num_rx_queues; i++) {
			free_irq(intr->msix_entries[vector++].vector,
				 &(adapter->rx_queue[i]));
		}

		free_irq(intr->msix_entries[vector].vector,
			 adapter->netdev);
		BUG_ON(vector >= intr->num_intrs);
		break;
	}
#endif
	case VMXNET3_IT_MSI:
		free_irq(adapter->pdev->irq, adapter->netdev);
		break;
	case VMXNET3_IT_INTX:
		free_irq(adapter->pdev->irq, adapter->netdev);
		break;
	default:
		BUG();
	}
}
static void
vmxnet3_restore_vlan(struct vmxnet3_adapter *adapter)
{
	u32 *vfTable = adapter->shared->devRead.rxFilterConf.vfTable;
	u16 vid;

	/* allow untagged pkts */
	VMXNET3_SET_VFTABLE_ENTRY(vfTable, 0);

	for_each_set_bit(vid, adapter->active_vlans, VLAN_N_VID)
		VMXNET3_SET_VFTABLE_ENTRY(vfTable, vid);
}


static int
vmxnet3_vlan_rx_add_vid(struct net_device *netdev, __be16 proto, u16 vid)
{
	struct vmxnet3_adapter *adapter = netdev_priv(netdev);

	if (!(netdev->flags & IFF_PROMISC)) {
		u32 *vfTable = adapter->shared->devRead.rxFilterConf.vfTable;
		unsigned long flags;

		VMXNET3_SET_VFTABLE_ENTRY(vfTable, vid);
		spin_lock_irqsave(&adapter->cmd_lock, flags);
		VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD,
				       VMXNET3_CMD_UPDATE_VLAN_FILTERS);
		spin_unlock_irqrestore(&adapter->cmd_lock, flags);
	}

	set_bit(vid, adapter->active_vlans);

	return 0;
}


static int
vmxnet3_vlan_rx_kill_vid(struct net_device *netdev, __be16 proto, u16 vid)
{
	struct vmxnet3_adapter *adapter = netdev_priv(netdev);

	if (!(netdev->flags & IFF_PROMISC)) {
		u32 *vfTable = adapter->shared->devRead.rxFilterConf.vfTable;
		unsigned long flags;

		VMXNET3_CLEAR_VFTABLE_ENTRY(vfTable, vid);
		spin_lock_irqsave(&adapter->cmd_lock, flags);
		VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD,
				       VMXNET3_CMD_UPDATE_VLAN_FILTERS);
		spin_unlock_irqrestore(&adapter->cmd_lock, flags);
	}

	clear_bit(vid, adapter->active_vlans);

	return 0;
}
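/* vfTable is the device's VLAN filter bitmap indexed by VLAN id (one bit per
 * id, VLAN_N_VID == 4096 ids); the helpers above flip the relevant bit and
 * then issue VMXNET3_CMD_UPDATE_VLAN_FILTERS so the device re-reads it.
 */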
static u8 *
vmxnet3_copy_mc(struct net_device *netdev)
{
	u8 *buf = NULL;
	u32 sz = netdev_mc_count(netdev) * ETH_ALEN;

	/* struct Vmxnet3_RxFilterConf.mfTableLen is u16. */
	if (sz <= 0xffff) {
		/* We may be called with BH disabled */
		buf = kmalloc(sz, GFP_ATOMIC);
		if (buf) {
			struct netdev_hw_addr *ha;
			int i = 0;

			netdev_for_each_mc_addr(ha, netdev)
				memcpy(buf + i++ * ETH_ALEN, ha->addr,
				       ETH_ALEN);
		}
	}
	return buf;
}
static void
vmxnet3_set_mc(struct net_device *netdev)
{
	struct vmxnet3_adapter *adapter = netdev_priv(netdev);
	unsigned long flags;
	struct Vmxnet3_RxFilterConf *rxConf =
					&adapter->shared->devRead.rxFilterConf;
	u8 *new_table = NULL;
	dma_addr_t new_table_pa = 0;
	u32 new_mode = VMXNET3_RXM_UCAST;

	if (netdev->flags & IFF_PROMISC) {
		u32 *vfTable = adapter->shared->devRead.rxFilterConf.vfTable;
		memset(vfTable, 0, VMXNET3_VFT_SIZE * sizeof(*vfTable));

		new_mode |= VMXNET3_RXM_PROMISC;
	} else {
		vmxnet3_restore_vlan(adapter);
	}

	if (netdev->flags & IFF_BROADCAST)
		new_mode |= VMXNET3_RXM_BCAST;

	if (netdev->flags & IFF_ALLMULTI)
		new_mode |= VMXNET3_RXM_ALL_MULTI;
	else
		if (!netdev_mc_empty(netdev)) {
			new_table = vmxnet3_copy_mc(netdev);
			if (new_table) {
				size_t sz = netdev_mc_count(netdev) * ETH_ALEN;

				rxConf->mfTableLen = cpu_to_le16(sz);
				new_table_pa = dma_map_single(
							&adapter->pdev->dev,
							new_table,
							sz,
							PCI_DMA_TODEVICE);
			}

			if (!dma_mapping_error(&adapter->pdev->dev,
					       new_table_pa)) {
				new_mode |= VMXNET3_RXM_MCAST;
				rxConf->mfTablePA = cpu_to_le64(new_table_pa);
			} else {
				netdev_info(netdev,
					    "failed to copy mcast list, setting ALL_MULTI\n");
				new_mode |= VMXNET3_RXM_ALL_MULTI;
			}
		}

	if (!(new_mode & VMXNET3_RXM_MCAST)) {
		rxConf->mfTableLen = 0;
		rxConf->mfTablePA = 0;
	}

	spin_lock_irqsave(&adapter->cmd_lock, flags);
	if (new_mode != rxConf->rxMode) {
		rxConf->rxMode = cpu_to_le32(new_mode);
		VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD,
				       VMXNET3_CMD_UPDATE_RX_MODE);
		VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD,
				       VMXNET3_CMD_UPDATE_VLAN_FILTERS);
	}

	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD,
			       VMXNET3_CMD_UPDATE_MAC_FILTERS);
	spin_unlock_irqrestore(&adapter->cmd_lock, flags);

	if (new_table_pa)
		dma_unmap_single(&adapter->pdev->dev, new_table_pa,
				 rxConf->mfTableLen, PCI_DMA_TODEVICE);
	kfree(new_table);
}
static void
vmxnet3_rq_destroy_all(struct vmxnet3_adapter *adapter)
{
	int i;

	for (i = 0; i < adapter->num_rx_queues; i++)
		vmxnet3_rq_destroy(&adapter->rx_queue[i], adapter);
}
/*
 *   Set up driver_shared based on settings in adapter.
 */

static void
vmxnet3_setup_driver_shared(struct vmxnet3_adapter *adapter)
{
	struct Vmxnet3_DriverShared *shared = adapter->shared;
	struct Vmxnet3_DSDevRead *devRead = &shared->devRead;
	struct Vmxnet3_TxQueueConf *tqc;
	struct Vmxnet3_RxQueueConf *rqc;
	int i;

	memset(shared, 0, sizeof(*shared));

	/* driver settings */
	shared->magic = cpu_to_le32(VMXNET3_REV1_MAGIC);
	devRead->misc.driverInfo.version = cpu_to_le32(
						VMXNET3_DRIVER_VERSION_NUM);
	devRead->misc.driverInfo.gos.gosBits = (sizeof(void *) == 4 ?
				VMXNET3_GOS_BITS_32 : VMXNET3_GOS_BITS_64);
	devRead->misc.driverInfo.gos.gosType = VMXNET3_GOS_TYPE_LINUX;
	*((u32 *)&devRead->misc.driverInfo.gos) = cpu_to_le32(
				*((u32 *)&devRead->misc.driverInfo.gos));
	devRead->misc.driverInfo.vmxnet3RevSpt = cpu_to_le32(1);
	devRead->misc.driverInfo.uptVerSpt = cpu_to_le32(1);

	devRead->misc.ddPA = cpu_to_le64(adapter->adapter_pa);
	devRead->misc.ddLen = cpu_to_le32(sizeof(struct vmxnet3_adapter));

	/* set up feature flags */
	if (adapter->netdev->features & NETIF_F_RXCSUM)
		devRead->misc.uptFeatures |= UPT1_F_RXCSUM;

	if (adapter->netdev->features & NETIF_F_LRO) {
		devRead->misc.uptFeatures |= UPT1_F_LRO;
		devRead->misc.maxNumRxSG = cpu_to_le16(1 + MAX_SKB_FRAGS);
	}
	if (adapter->netdev->features & NETIF_F_HW_VLAN_CTAG_RX)
		devRead->misc.uptFeatures |= UPT1_F_RXVLAN;

	devRead->misc.mtu = cpu_to_le32(adapter->netdev->mtu);
	devRead->misc.queueDescPA = cpu_to_le64(adapter->queue_desc_pa);
	devRead->misc.queueDescLen = cpu_to_le32(
		adapter->num_tx_queues * sizeof(struct Vmxnet3_TxQueueDesc) +
		adapter->num_rx_queues * sizeof(struct Vmxnet3_RxQueueDesc));

	/* tx queue settings */
	devRead->misc.numTxQueues = adapter->num_tx_queues;
	for (i = 0; i < adapter->num_tx_queues; i++) {
		struct vmxnet3_tx_queue	*tq = &adapter->tx_queue[i];
		BUG_ON(adapter->tx_queue[i].tx_ring.base == NULL);
		tqc = &adapter->tqd_start[i].conf;
		tqc->txRingBasePA   = cpu_to_le64(tq->tx_ring.basePA);
		tqc->dataRingBasePA = cpu_to_le64(tq->data_ring.basePA);
		tqc->compRingBasePA = cpu_to_le64(tq->comp_ring.basePA);
		tqc->ddPA           = cpu_to_le64(tq->buf_info_pa);
		tqc->txRingSize     = cpu_to_le32(tq->tx_ring.size);
		tqc->dataRingSize   = cpu_to_le32(tq->data_ring.size);
		tqc->compRingSize   = cpu_to_le32(tq->comp_ring.size);
		tqc->ddLen          = cpu_to_le32(
					sizeof(struct vmxnet3_tx_buf_info) *
					tqc->txRingSize);
		tqc->intrIdx        = tq->comp_ring.intr_idx;
	}

	/* rx queue settings */
	devRead->misc.numRxQueues = adapter->num_rx_queues;
	for (i = 0; i < adapter->num_rx_queues; i++) {
		struct vmxnet3_rx_queue	*rq = &adapter->rx_queue[i];
		rqc = &adapter->rqd_start[i].conf;
		rqc->rxRingBasePA[0] = cpu_to_le64(rq->rx_ring[0].basePA);
		rqc->rxRingBasePA[1] = cpu_to_le64(rq->rx_ring[1].basePA);
		rqc->compRingBasePA  = cpu_to_le64(rq->comp_ring.basePA);
		rqc->ddPA            = cpu_to_le64(rq->buf_info_pa);
		rqc->rxRingSize[0]   = cpu_to_le32(rq->rx_ring[0].size);
		rqc->rxRingSize[1]   = cpu_to_le32(rq->rx_ring[1].size);
		rqc->compRingSize    = cpu_to_le32(rq->comp_ring.size);
		rqc->ddLen           = cpu_to_le32(
					sizeof(struct vmxnet3_rx_buf_info) *
					(rqc->rxRingSize[0] +
					 rqc->rxRingSize[1]));
		rqc->intrIdx         = rq->comp_ring.intr_idx;
	}

#ifdef VMXNET3_RSS
	memset(adapter->rss_conf, 0, sizeof(*adapter->rss_conf));

	if (adapter->rss) {
		struct UPT1_RSSConf *rssConf = adapter->rss_conf;

		devRead->misc.uptFeatures |= UPT1_F_RSS;
		devRead->misc.numRxQueues = adapter->num_rx_queues;
		rssConf->hashType = UPT1_RSS_HASH_TYPE_TCP_IPV4 |
				    UPT1_RSS_HASH_TYPE_IPV4 |
				    UPT1_RSS_HASH_TYPE_TCP_IPV6 |
				    UPT1_RSS_HASH_TYPE_IPV6;
		rssConf->hashFunc = UPT1_RSS_HASH_FUNC_TOEPLITZ;
		rssConf->hashKeySize = UPT1_RSS_MAX_KEY_SIZE;
		rssConf->indTableSize = VMXNET3_RSS_IND_TABLE_SIZE;
		netdev_rss_key_fill(rssConf->hashKey, sizeof(rssConf->hashKey));

		for (i = 0; i < rssConf->indTableSize; i++)
			rssConf->indTable[i] = ethtool_rxfh_indir_default(
				i, adapter->num_rx_queues);

		devRead->rssConfDesc.confVer = 1;
		devRead->rssConfDesc.confLen = cpu_to_le32(sizeof(*rssConf));
		devRead->rssConfDesc.confPA  =
			cpu_to_le64(adapter->rss_conf_pa);
	}

#endif /* VMXNET3_RSS */

	/* intr settings */
	devRead->intrConf.autoMask = adapter->intr.mask_mode ==
				     VMXNET3_IMM_AUTO;
	devRead->intrConf.numIntrs = adapter->intr.num_intrs;
	for (i = 0; i < adapter->intr.num_intrs; i++)
		devRead->intrConf.modLevels[i] = adapter->intr.mod_levels[i];

	devRead->intrConf.eventIntrIdx = adapter->intr.event_intr_idx;
	devRead->intrConf.intrCtrl |= cpu_to_le32(VMXNET3_IC_DISABLE_ALL);

	/* rx filter settings */
	devRead->rxFilterConf.rxMode = 0;
	vmxnet3_restore_vlan(adapter);
	vmxnet3_write_mac_addr(adapter, adapter->netdev->dev_addr);

	/* the rest are already zeroed */
}
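/*
 * Layout note, illustrative only: everything the device reads at activation
 * time lives in the single DMA-coherent Vmxnet3_DriverShared block filled in
 * above; the per-queue configuration is a separate array addressed by
 * devRead->misc.queueDescPA, whose size is
 *
 *	num_tx_queues * sizeof(struct Vmxnet3_TxQueueDesc) +
 *	num_rx_queues * sizeof(struct Vmxnet3_RxQueueDesc)
 *
 * which is exactly the queueDescLen value written by this function.
 */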
int
vmxnet3_activate_dev(struct vmxnet3_adapter *adapter)
{
	int err, i;
	u32 ret;
	unsigned long flags;

	netdev_dbg(adapter->netdev, "%s: skb_buf_size %d, rx_buf_per_pkt %d,"
		" ring sizes %u %u %u\n", adapter->netdev->name,
		adapter->skb_buf_size, adapter->rx_buf_per_pkt,
		adapter->tx_queue[0].tx_ring.size,
		adapter->rx_queue[0].rx_ring[0].size,
		adapter->rx_queue[0].rx_ring[1].size);

	vmxnet3_tq_init_all(adapter);
	err = vmxnet3_rq_init_all(adapter);
	if (err) {
		netdev_err(adapter->netdev,
			   "Failed to init rx queue error %d\n", err);
		goto rq_err;
	}

	err = vmxnet3_request_irqs(adapter);
	if (err) {
		netdev_err(adapter->netdev,
			   "Failed to setup irq for error %d\n", err);
		goto irq_err;
	}

	vmxnet3_setup_driver_shared(adapter);

	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_DSAL, VMXNET3_GET_ADDR_LO(
			       adapter->shared_pa));
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_DSAH, VMXNET3_GET_ADDR_HI(
			       adapter->shared_pa));
	spin_lock_irqsave(&adapter->cmd_lock, flags);
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD,
			       VMXNET3_CMD_ACTIVATE_DEV);
	ret = VMXNET3_READ_BAR1_REG(adapter, VMXNET3_REG_CMD);
	spin_unlock_irqrestore(&adapter->cmd_lock, flags);

	if (ret != 0) {
		netdev_err(adapter->netdev,
			   "Failed to activate dev: error %u\n", ret);
		err = -EINVAL;
		goto activate_err;
	}

	for (i = 0; i < adapter->num_rx_queues; i++) {
		VMXNET3_WRITE_BAR0_REG(adapter,
				VMXNET3_REG_RXPROD + i * VMXNET3_REG_ALIGN,
				adapter->rx_queue[i].rx_ring[0].next2fill);
		VMXNET3_WRITE_BAR0_REG(adapter, (VMXNET3_REG_RXPROD2 +
				(i * VMXNET3_REG_ALIGN)),
				adapter->rx_queue[i].rx_ring[1].next2fill);
	}

	/* Apply the rx filter settings last. */
	vmxnet3_set_mc(adapter->netdev);

	/*
	 * Check link state when first activating device. It will start the
	 * tx queue if the link is up.
	 */
	vmxnet3_check_link(adapter, true);
	for (i = 0; i < adapter->num_rx_queues; i++)
		napi_enable(&adapter->rx_queue[i].napi);
	vmxnet3_enable_all_intrs(adapter);
	clear_bit(VMXNET3_STATE_BIT_QUIESCED, &adapter->state);
	return 0;

activate_err:
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_DSAL, 0);
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_DSAH, 0);
	vmxnet3_free_irqs(adapter);
irq_err:
rq_err:
	/* free up buffers we allocated */
	vmxnet3_rq_cleanup_all(adapter);
	return err;
}
void
vmxnet3_reset_dev(struct vmxnet3_adapter *adapter)
{
	unsigned long flags;
	spin_lock_irqsave(&adapter->cmd_lock, flags);
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD, VMXNET3_CMD_RESET_DEV);
	spin_unlock_irqrestore(&adapter->cmd_lock, flags);
}
int
vmxnet3_quiesce_dev(struct vmxnet3_adapter *adapter)
{
	int i;
	unsigned long flags;
	if (test_and_set_bit(VMXNET3_STATE_BIT_QUIESCED, &adapter->state))
		return 0;

	spin_lock_irqsave(&adapter->cmd_lock, flags);
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD,
			       VMXNET3_CMD_QUIESCE_DEV);
	spin_unlock_irqrestore(&adapter->cmd_lock, flags);
	vmxnet3_disable_all_intrs(adapter);

	for (i = 0; i < adapter->num_rx_queues; i++)
		napi_disable(&adapter->rx_queue[i].napi);
	netif_tx_disable(adapter->netdev);
	adapter->link_speed = 0;
	netif_carrier_off(adapter->netdev);

	vmxnet3_tq_cleanup_all(adapter);
	vmxnet3_rq_cleanup_all(adapter);
	vmxnet3_free_irqs(adapter);
	return 0;
}
static void
vmxnet3_write_mac_addr(struct vmxnet3_adapter *adapter, u8 *mac)
{
	u32 tmp;

	tmp = *(u32 *)mac;
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_MACL, tmp);

	tmp = (mac[5] << 8) | mac[4];
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_MACH, tmp);
}
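/*
 * Illustrative note, not from the original source: the MAC is programmed as
 * two words.  Assuming a little-endian guest and the address
 * 00:11:22:33:44:55, MACL receives bytes 0-3 (0x33221100) and MACH receives
 * bytes 4-5 in its low 16 bits (0x5544), which is what the load and shifts
 * above produce.
 */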
static int
vmxnet3_set_mac_addr(struct net_device *netdev, void *p)
{
	struct sockaddr *addr = p;
	struct vmxnet3_adapter *adapter = netdev_priv(netdev);

	memcpy(netdev->dev_addr, addr->sa_data, netdev->addr_len);
	vmxnet3_write_mac_addr(adapter, addr->sa_data);

	return 0;
}
/* ==================== initialization and cleanup routines ============ */

static int
vmxnet3_alloc_pci_resources(struct vmxnet3_adapter *adapter, bool *dma64)
{
	int err;
	unsigned long mmio_start, mmio_len;
	struct pci_dev *pdev = adapter->pdev;

	err = pci_enable_device(pdev);
	if (err) {
		dev_err(&pdev->dev, "Failed to enable adapter: error %d\n", err);
		return err;
	}

	if (pci_set_dma_mask(pdev, DMA_BIT_MASK(64)) == 0) {
		if (pci_set_consistent_dma_mask(pdev, DMA_BIT_MASK(64)) != 0) {
			dev_err(&pdev->dev,
				"pci_set_consistent_dma_mask failed\n");
			err = -EIO;
			goto err_set_mask;
		}
		*dma64 = true;
	} else {
		if (pci_set_dma_mask(pdev, DMA_BIT_MASK(32)) != 0) {
			dev_err(&pdev->dev,
				"pci_set_dma_mask failed\n");
			err = -EIO;
			goto err_set_mask;
		}
		*dma64 = false;
	}

	err = pci_request_selected_regions(pdev, (1 << 2) - 1,
					   vmxnet3_driver_name);
	if (err) {
		dev_err(&pdev->dev,
			"Failed to request region for adapter: error %d\n", err);
		goto err_set_mask;
	}

	pci_set_master(pdev);

	mmio_start = pci_resource_start(pdev, 0);
	mmio_len = pci_resource_len(pdev, 0);
	adapter->hw_addr0 = ioremap(mmio_start, mmio_len);
	if (!adapter->hw_addr0) {
		dev_err(&pdev->dev, "Failed to map bar0\n");
		err = -EIO;
		goto err_ioremap;
	}

	mmio_start = pci_resource_start(pdev, 1);
	mmio_len = pci_resource_len(pdev, 1);
	adapter->hw_addr1 = ioremap(mmio_start, mmio_len);
	if (!adapter->hw_addr1) {
		dev_err(&pdev->dev, "Failed to map bar1\n");
		err = -EIO;
		goto err_bar1;
	}
	return 0;

err_bar1:
	iounmap(adapter->hw_addr0);
err_ioremap:
	pci_release_selected_regions(pdev, (1 << 2) - 1);
err_set_mask:
	pci_disable_device(pdev);
	return err;
}
static void
vmxnet3_free_pci_resources(struct vmxnet3_adapter *adapter)
{
	BUG_ON(!adapter->pdev);

	iounmap(adapter->hw_addr0);
	iounmap(adapter->hw_addr1);
	pci_release_selected_regions(adapter->pdev, (1 << 2) - 1);
	pci_disable_device(adapter->pdev);
}
static void
vmxnet3_adjust_rx_ring_size(struct vmxnet3_adapter *adapter)
{
	size_t sz, i, ring0_size, ring1_size, comp_size;
	struct vmxnet3_rx_queue	*rq = &adapter->rx_queue[0];

	if (adapter->netdev->mtu <= VMXNET3_MAX_SKB_BUF_SIZE -
				    VMXNET3_MAX_ETH_HDR_SIZE) {
		adapter->skb_buf_size = adapter->netdev->mtu +
					VMXNET3_MAX_ETH_HDR_SIZE;
		if (adapter->skb_buf_size < VMXNET3_MIN_T0_BUF_SIZE)
			adapter->skb_buf_size = VMXNET3_MIN_T0_BUF_SIZE;

		adapter->rx_buf_per_pkt = 1;
	} else {
		adapter->skb_buf_size = VMXNET3_MAX_SKB_BUF_SIZE;
		sz = adapter->netdev->mtu - VMXNET3_MAX_SKB_BUF_SIZE +
					    VMXNET3_MAX_ETH_HDR_SIZE;
		adapter->rx_buf_per_pkt = 1 + (sz + PAGE_SIZE - 1) / PAGE_SIZE;
	}

	/*
	 * for simplicity, force the ring0 size to be a multiple of
	 * rx_buf_per_pkt * VMXNET3_RING_SIZE_ALIGN
	 */
	sz = adapter->rx_buf_per_pkt * VMXNET3_RING_SIZE_ALIGN;
	ring0_size = adapter->rx_queue[0].rx_ring[0].size;
	ring0_size = (ring0_size + sz - 1) / sz * sz;
	ring0_size = min_t(u32, ring0_size, VMXNET3_RX_RING_MAX_SIZE /
			   sz * sz);
	ring1_size = adapter->rx_queue[0].rx_ring[1].size;
	ring1_size = (ring1_size + sz - 1) / sz * sz;
	ring1_size = min_t(u32, ring1_size, VMXNET3_RX_RING2_MAX_SIZE /
			   sz * sz);
	comp_size = ring0_size + ring1_size;

	for (i = 0; i < adapter->num_rx_queues; i++) {
		rq = &adapter->rx_queue[i];
		rq->rx_ring[0].size = ring0_size;
		rq->rx_ring[1].size = ring1_size;
		rq->comp_ring.size = comp_size;
	}
}
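/*
 * Worked example, illustrative only: assuming a 9000-byte (jumbo) MTU, which
 * exceeds VMXNET3_MAX_SKB_BUF_SIZE - VMXNET3_MAX_ETH_HDR_SIZE, the function
 * caps skb_buf_size at VMXNET3_MAX_SKB_BUF_SIZE and spreads the remainder
 * over page-sized buffers:
 *
 *	sz = 9000 - VMXNET3_MAX_SKB_BUF_SIZE + VMXNET3_MAX_ETH_HDR_SIZE;
 *	rx_buf_per_pkt = 1 + DIV_ROUND_UP(sz, PAGE_SIZE);
 *
 * ring0_size is then rounded to a multiple of
 * rx_buf_per_pkt * VMXNET3_RING_SIZE_ALIGN, so the ring always holds a whole
 * number of per-packet buffer groups.
 */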
int
vmxnet3_create_queues(struct vmxnet3_adapter *adapter, u32 tx_ring_size,
		      u32 rx_ring_size, u32 rx_ring2_size)
{
	int err = 0, i;

	for (i = 0; i < adapter->num_tx_queues; i++) {
		struct vmxnet3_tx_queue	*tq = &adapter->tx_queue[i];
		tq->tx_ring.size   = tx_ring_size;
		tq->data_ring.size = tx_ring_size;
		tq->comp_ring.size = tx_ring_size;
		tq->shared = &adapter->tqd_start[i].ctrl;
		tq->stopped = true;
		tq->adapter = adapter;
		tq->qid = i;
		err = vmxnet3_tq_create(tq, adapter);
		/*
		 * Too late to change num_tx_queues. We cannot do away with
		 * lesser number of queues than what we asked for
		 */
		if (err)
			goto queue_err;
	}

	adapter->rx_queue[0].rx_ring[0].size = rx_ring_size;
	adapter->rx_queue[0].rx_ring[1].size = rx_ring2_size;
	vmxnet3_adjust_rx_ring_size(adapter);
	for (i = 0; i < adapter->num_rx_queues; i++) {
		struct vmxnet3_rx_queue *rq = &adapter->rx_queue[i];
		/* qid and qid2 for rx queues will be assigned later when num
		 * of rx queues is finalized after allocating intrs */
		rq->shared = &adapter->rqd_start[i].ctrl;
		rq->adapter = adapter;
		err = vmxnet3_rq_create(rq, adapter);
		if (err) {
			if (i == 0) {
				netdev_err(adapter->netdev,
					   "Could not allocate any rx queues. "
					   "Aborting.\n");
				goto queue_err;
			} else {
				netdev_info(adapter->netdev,
					    "Number of rx queues changed "
					    "to : %d.\n", i);
				adapter->num_rx_queues = i;
				err = 0;
				break;
			}
		}
	}
	return err;
queue_err:
	vmxnet3_tq_destroy_all(adapter);
	return err;
}
static int
vmxnet3_open(struct net_device *netdev)
{
	struct vmxnet3_adapter *adapter;
	int err, i;

	adapter = netdev_priv(netdev);

	for (i = 0; i < adapter->num_tx_queues; i++)
		spin_lock_init(&adapter->tx_queue[i].tx_lock);

	err = vmxnet3_create_queues(adapter, adapter->tx_ring_size,
				    adapter->rx_ring_size,
				    adapter->rx_ring2_size);
	if (err)
		goto queue_err;

	err = vmxnet3_activate_dev(adapter);
	if (err)
		goto activate_err;

	return 0;

activate_err:
	vmxnet3_rq_destroy_all(adapter);
	vmxnet3_tq_destroy_all(adapter);
queue_err:
	return err;
}
static int
vmxnet3_close(struct net_device *netdev)
{
	struct vmxnet3_adapter *adapter = netdev_priv(netdev);

	/*
	 * Reset_work may be in the middle of resetting the device, wait for its
	 * completion.
	 */
	while (test_and_set_bit(VMXNET3_STATE_BIT_RESETTING, &adapter->state))
		msleep(1);

	vmxnet3_quiesce_dev(adapter);

	vmxnet3_rq_destroy_all(adapter);
	vmxnet3_tq_destroy_all(adapter);

	clear_bit(VMXNET3_STATE_BIT_RESETTING, &adapter->state);

	return 0;
}
void
vmxnet3_force_close(struct vmxnet3_adapter *adapter)
{
	int i;

	/*
	 * we must clear VMXNET3_STATE_BIT_RESETTING, otherwise
	 * vmxnet3_close() will deadlock.
	 */
	BUG_ON(test_bit(VMXNET3_STATE_BIT_RESETTING, &adapter->state));

	/* we need to enable NAPI, otherwise dev_close will deadlock */
	for (i = 0; i < adapter->num_rx_queues; i++)
		napi_enable(&adapter->rx_queue[i].napi);
	/*
	 * Need to clear the quiesce bit to ensure that vmxnet3_close
	 * can quiesce the device properly
	 */
	clear_bit(VMXNET3_STATE_BIT_QUIESCED, &adapter->state);
	dev_close(adapter->netdev);
}
static int
vmxnet3_change_mtu(struct net_device *netdev, int new_mtu)
{
	struct vmxnet3_adapter *adapter = netdev_priv(netdev);
	int err = 0;

	if (new_mtu < VMXNET3_MIN_MTU || new_mtu > VMXNET3_MAX_MTU)
		return -EINVAL;

	netdev->mtu = new_mtu;

	/*
	 * Reset_work may be in the middle of resetting the device, wait for its
	 * completion.
	 */
	while (test_and_set_bit(VMXNET3_STATE_BIT_RESETTING, &adapter->state))
		msleep(1);

	if (netif_running(netdev)) {
		vmxnet3_quiesce_dev(adapter);
		vmxnet3_reset_dev(adapter);

		/* we need to re-create the rx queue based on the new mtu */
		vmxnet3_rq_destroy_all(adapter);
		vmxnet3_adjust_rx_ring_size(adapter);
		err = vmxnet3_rq_create_all(adapter);
		if (err) {
			netdev_err(netdev,
				   "failed to re-create rx queues, "
				   " error %d. Closing it.\n", err);
			goto out;
		}

		err = vmxnet3_activate_dev(adapter);
		if (err) {
			netdev_err(netdev,
				   "failed to re-activate, error %d. "
				   "Closing it\n", err);
			goto out;
		}
	}

out:
	clear_bit(VMXNET3_STATE_BIT_RESETTING, &adapter->state);
	if (err)
		vmxnet3_force_close(adapter);

	return err;
}
static void
vmxnet3_declare_features(struct vmxnet3_adapter *adapter, bool dma64)
{
	struct net_device *netdev = adapter->netdev;

	netdev->hw_features = NETIF_F_SG | NETIF_F_RXCSUM |
		NETIF_F_HW_CSUM | NETIF_F_HW_VLAN_CTAG_TX |
		NETIF_F_HW_VLAN_CTAG_RX | NETIF_F_TSO | NETIF_F_TSO6 |
		NETIF_F_LRO;
	if (dma64)
		netdev->hw_features |= NETIF_F_HIGHDMA;
	netdev->vlan_features = netdev->hw_features &
				~(NETIF_F_HW_VLAN_CTAG_TX |
				  NETIF_F_HW_VLAN_CTAG_RX);
	netdev->features = netdev->hw_features | NETIF_F_HW_VLAN_CTAG_FILTER;
}
static void
vmxnet3_read_mac_addr(struct vmxnet3_adapter *adapter, u8 *mac)
{
	u32 tmp;

	tmp = VMXNET3_READ_BAR1_REG(adapter, VMXNET3_REG_MACL);
	*(u32 *)mac = tmp;

	tmp = VMXNET3_READ_BAR1_REG(adapter, VMXNET3_REG_MACH);
	mac[4] = tmp & 0xff;
	mac[5] = (tmp >> 8) & 0xff;
}
#ifdef CONFIG_PCI_MSI

/*
 * Enable MSIx vectors.
 * Returns :
 *	VMXNET3_LINUX_MIN_MSIX_VECT when only minimum number of vectors required
 *	 were enabled.
 *	number of vectors which were enabled otherwise (this number is greater
 *	 than VMXNET3_LINUX_MIN_MSIX_VECT)
 */

static int
vmxnet3_acquire_msix_vectors(struct vmxnet3_adapter *adapter, int nvec)
{
	int ret = pci_enable_msix_range(adapter->pdev,
					adapter->intr.msix_entries, nvec, nvec);

	if (ret == -ENOSPC && nvec > VMXNET3_LINUX_MIN_MSIX_VECT) {
		dev_err(&adapter->netdev->dev,
			"Failed to enable %d MSI-X, trying %d\n",
			nvec, VMXNET3_LINUX_MIN_MSIX_VECT);

		ret = pci_enable_msix_range(adapter->pdev,
					    adapter->intr.msix_entries,
					    VMXNET3_LINUX_MIN_MSIX_VECT,
					    VMXNET3_LINUX_MIN_MSIX_VECT);
	}

	if (ret < 0) {
		dev_err(&adapter->netdev->dev,
			"Failed to enable MSI-X, error: %d\n", ret);
	}

	return ret;
}


#endif /* CONFIG_PCI_MSI */
static void
vmxnet3_alloc_intr_resources(struct vmxnet3_adapter *adapter)
{
	u32 cfg;
	unsigned long flags;

	/* intr settings */
	spin_lock_irqsave(&adapter->cmd_lock, flags);
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD,
			       VMXNET3_CMD_GET_CONF_INTR);
	cfg = VMXNET3_READ_BAR1_REG(adapter, VMXNET3_REG_CMD);
	spin_unlock_irqrestore(&adapter->cmd_lock, flags);
	adapter->intr.type = cfg & 0x3;
	adapter->intr.mask_mode = (cfg >> 2) & 0x3;

	if (adapter->intr.type == VMXNET3_IT_AUTO) {
		adapter->intr.type = VMXNET3_IT_MSIX;
	}

#ifdef CONFIG_PCI_MSI
	if (adapter->intr.type == VMXNET3_IT_MSIX) {
		int i, nvec;

		nvec  = adapter->share_intr == VMXNET3_INTR_TXSHARE ?
			1 : adapter->num_tx_queues;
		nvec += adapter->share_intr == VMXNET3_INTR_BUDDYSHARE ?
			0 : adapter->num_rx_queues;
		nvec += 1;	/* for link event */
		nvec = nvec > VMXNET3_LINUX_MIN_MSIX_VECT ?
		       nvec : VMXNET3_LINUX_MIN_MSIX_VECT;

		for (i = 0; i < nvec; i++)
			adapter->intr.msix_entries[i].entry = i;

		nvec = vmxnet3_acquire_msix_vectors(adapter, nvec);
		if (nvec < 0)
			goto msix_err;

		/* If we cannot allocate one MSIx vector per queue
		 * then limit the number of rx queues to 1
		 */
		if (nvec == VMXNET3_LINUX_MIN_MSIX_VECT) {
			if (adapter->share_intr != VMXNET3_INTR_BUDDYSHARE
			    || adapter->num_rx_queues != 1) {
				adapter->share_intr = VMXNET3_INTR_TXSHARE;
				netdev_err(adapter->netdev,
					   "Number of rx queues : 1\n");
				adapter->num_rx_queues = 1;
			}
		}

		adapter->intr.num_intrs = nvec;
		return;

msix_err:
		/* If we cannot allocate MSIx vectors use only one rx queue */
		dev_info(&adapter->pdev->dev,
			 "Failed to enable MSI-X, error %d. "
			 "Limiting #rx queues to 1, try MSI.\n", nvec);

		adapter->intr.type = VMXNET3_IT_MSI;
	}

	if (adapter->intr.type == VMXNET3_IT_MSI) {
		if (!pci_enable_msi(adapter->pdev)) {
			adapter->num_rx_queues = 1;
			adapter->intr.num_intrs = 1;
			return;
		}
	}
#endif /* CONFIG_PCI_MSI */

	adapter->num_rx_queues = 1;
	dev_info(&adapter->netdev->dev,
		 "Using INTx interrupt, #Rx queues: 1.\n");
	adapter->intr.type = VMXNET3_IT_INTX;

	/* INT-X related setting */
	adapter->intr.num_intrs = 1;
}
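/*
 * Illustrative vector-count example, not from the original source: with
 * 4 tx queues, 4 rx queues and per-queue (non-shared) interrupts, the MSI-X
 * request above works out to
 *
 *	nvec = 4 (tx) + 4 (rx) + 1 (link event) = 9
 *
 * If the host grants only VMXNET3_LINUX_MIN_MSIX_VECT vectors, the driver
 * drops to a single rx queue with all tx queues sharing one vector
 * (VMXNET3_INTR_TXSHARE); if MSI-X fails entirely it retries with MSI and
 * finally falls back to legacy INTx.
 */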
static void
vmxnet3_free_intr_resources(struct vmxnet3_adapter *adapter)
{
	if (adapter->intr.type == VMXNET3_IT_MSIX)
		pci_disable_msix(adapter->pdev);
	else if (adapter->intr.type == VMXNET3_IT_MSI)
		pci_disable_msi(adapter->pdev);
	else
		BUG_ON(adapter->intr.type != VMXNET3_IT_INTX);
}
static void
vmxnet3_tx_timeout(struct net_device *netdev)
{
	struct vmxnet3_adapter *adapter = netdev_priv(netdev);
	adapter->tx_timeout_count++;

	netdev_err(adapter->netdev, "tx hang\n");
	schedule_work(&adapter->work);
	netif_wake_queue(adapter->netdev);
}
static void
vmxnet3_reset_work(struct work_struct *data)
{
	struct vmxnet3_adapter *adapter;

	adapter = container_of(data, struct vmxnet3_adapter, work);

	/* if another thread is resetting the device, no need to proceed */
	if (test_and_set_bit(VMXNET3_STATE_BIT_RESETTING, &adapter->state))
		return;

	/* if the device is closed, we must leave it alone */
	rtnl_lock();
	if (netif_running(adapter->netdev)) {
		netdev_notice(adapter->netdev, "resetting\n");
		vmxnet3_quiesce_dev(adapter);
		vmxnet3_reset_dev(adapter);
		vmxnet3_activate_dev(adapter);
	} else {
		netdev_info(adapter->netdev, "already closed\n");
	}
	rtnl_unlock();

	clear_bit(VMXNET3_STATE_BIT_RESETTING, &adapter->state);
}
static int
vmxnet3_probe_device(struct pci_dev *pdev,
		     const struct pci_device_id *id)
{
	static const struct net_device_ops vmxnet3_netdev_ops = {
		.ndo_open = vmxnet3_open,
		.ndo_stop = vmxnet3_close,
		.ndo_start_xmit = vmxnet3_xmit_frame,
		.ndo_set_mac_address = vmxnet3_set_mac_addr,
		.ndo_change_mtu = vmxnet3_change_mtu,
		.ndo_set_features = vmxnet3_set_features,
		.ndo_get_stats64 = vmxnet3_get_stats64,
		.ndo_tx_timeout = vmxnet3_tx_timeout,
		.ndo_set_rx_mode = vmxnet3_set_mc,
		.ndo_vlan_rx_add_vid = vmxnet3_vlan_rx_add_vid,
		.ndo_vlan_rx_kill_vid = vmxnet3_vlan_rx_kill_vid,
#ifdef CONFIG_NET_POLL_CONTROLLER
		.ndo_poll_controller = vmxnet3_netpoll,
#endif
	};
	int err;
	bool dma64 = false; /* stupid gcc */
	u32 ver;
	struct net_device *netdev;
	struct vmxnet3_adapter *adapter;
	u8 mac[ETH_ALEN];
	int size;
	int num_tx_queues;
	int num_rx_queues;

	if (!pci_msi_enabled())
		enable_mq = 0;

#ifdef VMXNET3_RSS
	if (enable_mq)
		num_rx_queues = min(VMXNET3_DEVICE_MAX_RX_QUEUES,
				    (int)num_online_cpus());
	else
#endif
		num_rx_queues = 1;
	num_rx_queues = rounddown_pow_of_two(num_rx_queues);

	if (enable_mq)
		num_tx_queues = min(VMXNET3_DEVICE_MAX_TX_QUEUES,
				    (int)num_online_cpus());
	else
		num_tx_queues = 1;

	num_tx_queues = rounddown_pow_of_two(num_tx_queues);
	netdev = alloc_etherdev_mq(sizeof(struct vmxnet3_adapter),
				   max(num_tx_queues, num_rx_queues));
	dev_info(&pdev->dev,
		 "# of Tx queues : %d, # of Rx queues : %d\n",
		 num_tx_queues, num_rx_queues);

	if (!netdev)
		return -ENOMEM;

	pci_set_drvdata(pdev, netdev);
	adapter = netdev_priv(netdev);
	adapter->netdev = netdev;
	adapter->pdev = pdev;

	adapter->tx_ring_size = VMXNET3_DEF_TX_RING_SIZE;
	adapter->rx_ring_size = VMXNET3_DEF_RX_RING_SIZE;
	adapter->rx_ring2_size = VMXNET3_DEF_RX_RING2_SIZE;

	spin_lock_init(&adapter->cmd_lock);
	adapter->adapter_pa = dma_map_single(&adapter->pdev->dev, adapter,
					     sizeof(struct vmxnet3_adapter),
					     PCI_DMA_TODEVICE);
	if (dma_mapping_error(&adapter->pdev->dev, adapter->adapter_pa)) {
		dev_err(&pdev->dev, "Failed to map dma\n");
		err = -EFAULT;
		goto err_dma_map;
	}
	adapter->shared = dma_alloc_coherent(
				&adapter->pdev->dev,
				sizeof(struct Vmxnet3_DriverShared),
				&adapter->shared_pa, GFP_KERNEL);
	if (!adapter->shared) {
		dev_err(&pdev->dev, "Failed to allocate memory\n");
		err = -ENOMEM;
		goto err_alloc_shared;
	}

	adapter->num_rx_queues = num_rx_queues;
	adapter->num_tx_queues = num_tx_queues;
	adapter->rx_buf_per_pkt = 1;

	size = sizeof(struct Vmxnet3_TxQueueDesc) * adapter->num_tx_queues;
	size += sizeof(struct Vmxnet3_RxQueueDesc) * adapter->num_rx_queues;
	adapter->tqd_start = dma_alloc_coherent(&adapter->pdev->dev, size,
						&adapter->queue_desc_pa,
						GFP_KERNEL);

	if (!adapter->tqd_start) {
		dev_err(&pdev->dev, "Failed to allocate memory\n");
		err = -ENOMEM;
		goto err_alloc_queue_desc;
	}
	adapter->rqd_start = (struct Vmxnet3_RxQueueDesc *)(adapter->tqd_start +
							    adapter->num_tx_queues);

	adapter->pm_conf = dma_alloc_coherent(&adapter->pdev->dev,
					      sizeof(struct Vmxnet3_PMConf),
					      &adapter->pm_conf_pa,
					      GFP_KERNEL);
	if (adapter->pm_conf == NULL) {
		err = -ENOMEM;
		goto err_alloc_pm;
	}

#ifdef VMXNET3_RSS

	adapter->rss_conf = dma_alloc_coherent(&adapter->pdev->dev,
					       sizeof(struct UPT1_RSSConf),
					       &adapter->rss_conf_pa,
					       GFP_KERNEL);
	if (adapter->rss_conf == NULL) {
		err = -ENOMEM;
		goto err_alloc_rss;
	}
#endif /* VMXNET3_RSS */

	err = vmxnet3_alloc_pci_resources(adapter, &dma64);
	if (err < 0)
		goto err_alloc_pci;

	ver = VMXNET3_READ_BAR1_REG(adapter, VMXNET3_REG_VRRS);
	if (ver & 2) {
		VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_VRRS, 2);
		adapter->version = 2;
	} else if (ver & 1) {
		VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_VRRS, 1);
		adapter->version = 1;
	} else {
		dev_err(&pdev->dev,
			"Incompatible h/w version (0x%x) for adapter\n", ver);
		err = -EBUSY;
		goto err_ver;
	}
	dev_dbg(&pdev->dev, "Using device version %d\n", adapter->version);

	ver = VMXNET3_READ_BAR1_REG(adapter, VMXNET3_REG_UVRS);
	if (ver & 1) {
		VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_UVRS, 1);
	} else {
		dev_err(&pdev->dev,
			"Incompatible upt version (0x%x) for adapter\n", ver);
		err = -EBUSY;
		goto err_ver;
	}

	SET_NETDEV_DEV(netdev, &pdev->dev);
	vmxnet3_declare_features(adapter, dma64);

	if (adapter->num_tx_queues == adapter->num_rx_queues)
		adapter->share_intr = VMXNET3_INTR_BUDDYSHARE;
	else
		adapter->share_intr = VMXNET3_INTR_DONTSHARE;

	vmxnet3_alloc_intr_resources(adapter);

#ifdef VMXNET3_RSS
	if (adapter->num_rx_queues > 1 &&
	    adapter->intr.type == VMXNET3_IT_MSIX) {
		adapter->rss = true;
		netdev->hw_features |= NETIF_F_RXHASH;
		netdev->features |= NETIF_F_RXHASH;
		dev_dbg(&pdev->dev, "RSS is enabled.\n");
	} else {
		adapter->rss = false;
	}
#endif

	vmxnet3_read_mac_addr(adapter, mac);
	memcpy(netdev->dev_addr, mac, netdev->addr_len);

	netdev->netdev_ops = &vmxnet3_netdev_ops;
	vmxnet3_set_ethtool_ops(netdev);
	netdev->watchdog_timeo = 5 * HZ;

	INIT_WORK(&adapter->work, vmxnet3_reset_work);
	set_bit(VMXNET3_STATE_BIT_QUIESCED, &adapter->state);

	if (adapter->intr.type == VMXNET3_IT_MSIX) {
		int i;
		for (i = 0; i < adapter->num_rx_queues; i++) {
			netif_napi_add(adapter->netdev,
				       &adapter->rx_queue[i].napi,
				       vmxnet3_poll_rx_only, 64);
		}
	} else {
		netif_napi_add(adapter->netdev, &adapter->rx_queue[0].napi,
			       vmxnet3_poll, 64);
	}

	netif_set_real_num_tx_queues(adapter->netdev, adapter->num_tx_queues);
	netif_set_real_num_rx_queues(adapter->netdev, adapter->num_rx_queues);

	netif_carrier_off(netdev);
	err = register_netdev(netdev);

	if (err) {
		dev_err(&pdev->dev, "Failed to register adapter\n");
		goto err_register;
	}

	vmxnet3_check_link(adapter, false);
	return 0;

err_register:
	vmxnet3_free_intr_resources(adapter);
err_ver:
	vmxnet3_free_pci_resources(adapter);
err_alloc_pci:
#ifdef VMXNET3_RSS
	dma_free_coherent(&adapter->pdev->dev, sizeof(struct UPT1_RSSConf),
			  adapter->rss_conf, adapter->rss_conf_pa);
err_alloc_rss:
#endif
	dma_free_coherent(&adapter->pdev->dev, sizeof(struct Vmxnet3_PMConf),
			  adapter->pm_conf, adapter->pm_conf_pa);
err_alloc_pm:
	dma_free_coherent(&adapter->pdev->dev, size, adapter->tqd_start,
			  adapter->queue_desc_pa);
err_alloc_queue_desc:
	dma_free_coherent(&adapter->pdev->dev,
			  sizeof(struct Vmxnet3_DriverShared),
			  adapter->shared, adapter->shared_pa);
err_alloc_shared:
	dma_unmap_single(&adapter->pdev->dev, adapter->adapter_pa,
			 sizeof(struct vmxnet3_adapter), PCI_DMA_TODEVICE);
err_dma_map:
	free_netdev(netdev);
	return err;
}
static void
vmxnet3_remove_device(struct pci_dev *pdev)
{
	struct net_device *netdev = pci_get_drvdata(pdev);
	struct vmxnet3_adapter *adapter = netdev_priv(netdev);
	int size = 0;
	int num_rx_queues;

#ifdef VMXNET3_RSS
	if (enable_mq)
		num_rx_queues = min(VMXNET3_DEVICE_MAX_RX_QUEUES,
				    (int)num_online_cpus());
	else
#endif
		num_rx_queues = 1;
	num_rx_queues = rounddown_pow_of_two(num_rx_queues);

	cancel_work_sync(&adapter->work);

	unregister_netdev(netdev);

	vmxnet3_free_intr_resources(adapter);
	vmxnet3_free_pci_resources(adapter);
#ifdef VMXNET3_RSS
	dma_free_coherent(&adapter->pdev->dev, sizeof(struct UPT1_RSSConf),
			  adapter->rss_conf, adapter->rss_conf_pa);
#endif
	dma_free_coherent(&adapter->pdev->dev, sizeof(struct Vmxnet3_PMConf),
			  adapter->pm_conf, adapter->pm_conf_pa);

	size = sizeof(struct Vmxnet3_TxQueueDesc) * adapter->num_tx_queues;
	size += sizeof(struct Vmxnet3_RxQueueDesc) * num_rx_queues;
	dma_free_coherent(&adapter->pdev->dev, size, adapter->tqd_start,
			  adapter->queue_desc_pa);
	dma_free_coherent(&adapter->pdev->dev,
			  sizeof(struct Vmxnet3_DriverShared),
			  adapter->shared, adapter->shared_pa);
	dma_unmap_single(&adapter->pdev->dev, adapter->adapter_pa,
			 sizeof(struct vmxnet3_adapter), PCI_DMA_TODEVICE);
	free_netdev(netdev);
}
static void vmxnet3_shutdown_device(struct pci_dev *pdev)
{
	struct net_device *netdev = pci_get_drvdata(pdev);
	struct vmxnet3_adapter *adapter = netdev_priv(netdev);
	unsigned long flags;

	/* Reset_work may be in the middle of resetting the device, wait for its
	 * completion.
	 */
	while (test_and_set_bit(VMXNET3_STATE_BIT_RESETTING, &adapter->state))
		msleep(1);

	if (test_and_set_bit(VMXNET3_STATE_BIT_QUIESCED,
			     &adapter->state)) {
		clear_bit(VMXNET3_STATE_BIT_RESETTING, &adapter->state);
		return;
	}
	spin_lock_irqsave(&adapter->cmd_lock, flags);
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD,
			       VMXNET3_CMD_QUIESCE_DEV);
	spin_unlock_irqrestore(&adapter->cmd_lock, flags);
	vmxnet3_disable_all_intrs(adapter);

	clear_bit(VMXNET3_STATE_BIT_RESETTING, &adapter->state);
}
#ifdef CONFIG_PM

static int
vmxnet3_suspend(struct device *device)
{
	struct pci_dev *pdev = to_pci_dev(device);
	struct net_device *netdev = pci_get_drvdata(pdev);
	struct vmxnet3_adapter *adapter = netdev_priv(netdev);
	struct Vmxnet3_PMConf *pmConf;
	struct ethhdr *ehdr;
	struct arphdr *ahdr;
	u8 *arpreq;
	struct in_device *in_dev;
	struct in_ifaddr *ifa;
	unsigned long flags;
	int i = 0;

	if (!netif_running(netdev))
		return 0;

	for (i = 0; i < adapter->num_rx_queues; i++)
		napi_disable(&adapter->rx_queue[i].napi);

	vmxnet3_disable_all_intrs(adapter);
	vmxnet3_free_irqs(adapter);
	vmxnet3_free_intr_resources(adapter);

	netif_device_detach(netdev);
	netif_tx_stop_all_queues(netdev);

	/* Create wake-up filters. */
	pmConf = adapter->pm_conf;
	memset(pmConf, 0, sizeof(*pmConf));

	if (adapter->wol & WAKE_UCAST) {
		pmConf->filters[i].patternSize = ETH_ALEN;
		pmConf->filters[i].maskSize = 1;
		memcpy(pmConf->filters[i].pattern, netdev->dev_addr, ETH_ALEN);
		pmConf->filters[i].mask[0] = 0x3F; /* LSB ETH_ALEN bits */

		pmConf->wakeUpEvents |= VMXNET3_PM_WAKEUP_FILTER;
		i++;
	}

	if (adapter->wol & WAKE_ARP) {
		in_dev = in_dev_get(netdev);
		if (!in_dev)
			goto skip_arp;

		ifa = (struct in_ifaddr *)in_dev->ifa_list;
		if (!ifa)
			goto skip_arp;

		pmConf->filters[i].patternSize = ETH_HLEN + /* Ethernet header*/
			sizeof(struct arphdr) +		/* ARP header */
			2 * ETH_ALEN +		/* 2 Ethernet addresses*/
			2 * sizeof(u32);	/*2 IPv4 addresses */
		pmConf->filters[i].maskSize =
			(pmConf->filters[i].patternSize - 1) / 8 + 1;

		/* ETH_P_ARP in Ethernet header. */
		ehdr = (struct ethhdr *)pmConf->filters[i].pattern;
		ehdr->h_proto = htons(ETH_P_ARP);

		/* ARPOP_REQUEST in ARP header. */
		ahdr = (struct arphdr *)&pmConf->filters[i].pattern[ETH_HLEN];
		ahdr->ar_op = htons(ARPOP_REQUEST);
		arpreq = (u8 *)(ahdr + 1);

		/* The Unicast IPv4 address in 'tip' field. */
		arpreq += 2 * ETH_ALEN + sizeof(u32);
		*(u32 *)arpreq = ifa->ifa_address;

		/* The mask for the relevant bits. */
		pmConf->filters[i].mask[0] = 0x00;
		pmConf->filters[i].mask[1] = 0x30; /* ETH_P_ARP */
		pmConf->filters[i].mask[2] = 0x30; /* ARPOP_REQUEST */
		pmConf->filters[i].mask[3] = 0x00;
		pmConf->filters[i].mask[4] = 0xC0; /* IPv4 TIP */
		pmConf->filters[i].mask[5] = 0x03; /* IPv4 TIP */
		in_dev_put(in_dev);

		pmConf->wakeUpEvents |= VMXNET3_PM_WAKEUP_FILTER;
		i++;
	}

skip_arp:
	if (adapter->wol & WAKE_MAGIC)
		pmConf->wakeUpEvents |= VMXNET3_PM_WAKEUP_MAGIC;

	pmConf->numFilters = i;

	adapter->shared->devRead.pmConfDesc.confVer = cpu_to_le32(1);
	adapter->shared->devRead.pmConfDesc.confLen = cpu_to_le32(sizeof(
								  *pmConf));
	adapter->shared->devRead.pmConfDesc.confPA =
		cpu_to_le64(adapter->pm_conf_pa);

	spin_lock_irqsave(&adapter->cmd_lock, flags);
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD,
			       VMXNET3_CMD_UPDATE_PMCFG);
	spin_unlock_irqrestore(&adapter->cmd_lock, flags);

	pci_save_state(pdev);
	pci_enable_wake(pdev, pci_choose_state(pdev, PMSG_SUSPEND),
			adapter->wol);
	pci_disable_device(pdev);
	pci_set_power_state(pdev, pci_choose_state(pdev, PMSG_SUSPEND));

	return 0;
}
static int
vmxnet3_resume(struct device *device)
{
	int err;
	unsigned long flags;
	struct pci_dev *pdev = to_pci_dev(device);
	struct net_device *netdev = pci_get_drvdata(pdev);
	struct vmxnet3_adapter *adapter = netdev_priv(netdev);

	if (!netif_running(netdev))
		return 0;

	pci_set_power_state(pdev, PCI_D0);
	pci_restore_state(pdev);
	err = pci_enable_device_mem(pdev);
	if (err != 0)
		return err;

	pci_enable_wake(pdev, PCI_D0, 0);

	vmxnet3_alloc_intr_resources(adapter);

	/* During hibernate and suspend, device has to be reinitialized as the
	 * device state need not be preserved.
	 */

	/* Need not check adapter state as other reset tasks cannot run during
	 * device resume.
	 */
	spin_lock_irqsave(&adapter->cmd_lock, flags);
	VMXNET3_WRITE_BAR1_REG(adapter, VMXNET3_REG_CMD,
			       VMXNET3_CMD_QUIESCE_DEV);
	spin_unlock_irqrestore(&adapter->cmd_lock, flags);
	vmxnet3_tq_cleanup_all(adapter);
	vmxnet3_rq_cleanup_all(adapter);

	vmxnet3_reset_dev(adapter);
	err = vmxnet3_activate_dev(adapter);
	if (err != 0) {
		netdev_err(netdev,
			   "failed to re-activate on resume, error: %d", err);
		vmxnet3_force_close(adapter);
		return err;
	}

	netif_device_attach(netdev);

	return 0;
}
static const struct dev_pm_ops vmxnet3_pm_ops = {
	.suspend = vmxnet3_suspend,
	.resume = vmxnet3_resume,
	.freeze = vmxnet3_suspend,
	.restore = vmxnet3_resume,
};
#endif /* CONFIG_PM */
static struct pci_driver vmxnet3_driver = {
	.name		= vmxnet3_driver_name,
	.id_table	= vmxnet3_pciid_table,
	.probe		= vmxnet3_probe_device,
	.remove		= vmxnet3_remove_device,
	.shutdown	= vmxnet3_shutdown_device,
#ifdef CONFIG_PM
	.driver.pm	= &vmxnet3_pm_ops,
#endif
};
static int __init
vmxnet3_init_module(void)
{
	pr_info("%s - version %s\n", VMXNET3_DRIVER_DESC,
		VMXNET3_DRIVER_VERSION_REPORT);
	return pci_register_driver(&vmxnet3_driver);
}

module_init(vmxnet3_init_module);
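/*
 * Usage note, illustrative only: the driver binds automatically to the
 * vmxnet3 PCI function (PCI_DEVICE_ID_VMWARE_VMXNET3) once loaded, e.g.
 *
 *	# modprobe vmxnet3
 *	# ethtool -i ens192
 *
 * The interface name (ens192 here) is hypothetical and depends on the
 * system's interface naming scheme.
 */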
static void
vmxnet3_exit_module(void)
{
	pci_unregister_driver(&vmxnet3_driver);
}

module_exit(vmxnet3_exit_module);
MODULE_AUTHOR("VMware, Inc.");
MODULE_DESCRIPTION(VMXNET3_DRIVER_DESC);
MODULE_LICENSE("GPL v2");
MODULE_VERSION(VMXNET3_DRIVER_VERSION_STRING);