Merge branch 'for-linus' of git://oss.sgi.com/xfs/xfs
[linux/fpc-iii.git] / drivers / net / enic / enic_main.c
blobbc7d6b96de3dec39ca96b369a6656ec22ab04a12
1 /*
2 * Copyright 2008 Cisco Systems, Inc. All rights reserved.
3 * Copyright 2007 Nuova Systems, Inc. All rights reserved.
5 * This program is free software; you may redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; version 2 of the License.
9 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
10 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
11 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
12 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
13 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
14 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
15 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
16 * SOFTWARE.
20 #include <linux/module.h>
21 #include <linux/kernel.h>
22 #include <linux/string.h>
23 #include <linux/errno.h>
24 #include <linux/types.h>
25 #include <linux/init.h>
26 #include <linux/workqueue.h>
27 #include <linux/pci.h>
28 #include <linux/netdevice.h>
29 #include <linux/etherdevice.h>
30 #include <linux/if_ether.h>
31 #include <linux/if_vlan.h>
32 #include <linux/if_link.h>
33 #include <linux/ethtool.h>
34 #include <linux/in.h>
35 #include <linux/ip.h>
36 #include <linux/ipv6.h>
37 #include <linux/tcp.h>
38 #include <net/ip6_checksum.h>
40 #include "cq_enet_desc.h"
41 #include "vnic_dev.h"
42 #include "vnic_intr.h"
43 #include "vnic_stats.h"
44 #include "vnic_vic.h"
45 #include "enic_res.h"
46 #include "enic.h"
48 #define ENIC_NOTIFY_TIMER_PERIOD (2 * HZ)
49 #define WQ_ENET_MAX_DESC_LEN (1 << WQ_ENET_LEN_BITS)
50 #define MAX_TSO (1 << 16)
51 #define ENIC_DESC_MAX_SPLITS (MAX_TSO / WQ_ENET_MAX_DESC_LEN + 1)
53 #define PCI_DEVICE_ID_CISCO_VIC_ENET 0x0043 /* ethernet vnic */
54 #define PCI_DEVICE_ID_CISCO_VIC_ENET_DYN 0x0044 /* enet dynamic vnic */
56 /* Supported devices */
57 static DEFINE_PCI_DEVICE_TABLE(enic_id_table) = {
58 { PCI_VDEVICE(CISCO, PCI_DEVICE_ID_CISCO_VIC_ENET) },
59 { PCI_VDEVICE(CISCO, PCI_DEVICE_ID_CISCO_VIC_ENET_DYN) },
60 { 0, } /* end of table */
63 MODULE_DESCRIPTION(DRV_DESCRIPTION);
64 MODULE_AUTHOR("Scott Feldman <scofeldm@cisco.com>");
65 MODULE_LICENSE("GPL");
66 MODULE_VERSION(DRV_VERSION);
67 MODULE_DEVICE_TABLE(pci, enic_id_table);
69 struct enic_stat {
70 char name[ETH_GSTRING_LEN];
71 unsigned int offset;
74 #define ENIC_TX_STAT(stat) \
75 { .name = #stat, .offset = offsetof(struct vnic_tx_stats, stat) / 8 }
76 #define ENIC_RX_STAT(stat) \
77 { .name = #stat, .offset = offsetof(struct vnic_rx_stats, stat) / 8 }
79 static const struct enic_stat enic_tx_stats[] = {
80 ENIC_TX_STAT(tx_frames_ok),
81 ENIC_TX_STAT(tx_unicast_frames_ok),
82 ENIC_TX_STAT(tx_multicast_frames_ok),
83 ENIC_TX_STAT(tx_broadcast_frames_ok),
84 ENIC_TX_STAT(tx_bytes_ok),
85 ENIC_TX_STAT(tx_unicast_bytes_ok),
86 ENIC_TX_STAT(tx_multicast_bytes_ok),
87 ENIC_TX_STAT(tx_broadcast_bytes_ok),
88 ENIC_TX_STAT(tx_drops),
89 ENIC_TX_STAT(tx_errors),
90 ENIC_TX_STAT(tx_tso),
93 static const struct enic_stat enic_rx_stats[] = {
94 ENIC_RX_STAT(rx_frames_ok),
95 ENIC_RX_STAT(rx_frames_total),
96 ENIC_RX_STAT(rx_unicast_frames_ok),
97 ENIC_RX_STAT(rx_multicast_frames_ok),
98 ENIC_RX_STAT(rx_broadcast_frames_ok),
99 ENIC_RX_STAT(rx_bytes_ok),
100 ENIC_RX_STAT(rx_unicast_bytes_ok),
101 ENIC_RX_STAT(rx_multicast_bytes_ok),
102 ENIC_RX_STAT(rx_broadcast_bytes_ok),
103 ENIC_RX_STAT(rx_drop),
104 ENIC_RX_STAT(rx_no_bufs),
105 ENIC_RX_STAT(rx_errors),
106 ENIC_RX_STAT(rx_rss),
107 ENIC_RX_STAT(rx_crc_errors),
108 ENIC_RX_STAT(rx_frames_64),
109 ENIC_RX_STAT(rx_frames_127),
110 ENIC_RX_STAT(rx_frames_255),
111 ENIC_RX_STAT(rx_frames_511),
112 ENIC_RX_STAT(rx_frames_1023),
113 ENIC_RX_STAT(rx_frames_1518),
114 ENIC_RX_STAT(rx_frames_to_max),
117 static const unsigned int enic_n_tx_stats = ARRAY_SIZE(enic_tx_stats);
118 static const unsigned int enic_n_rx_stats = ARRAY_SIZE(enic_rx_stats);
120 static int enic_is_dynamic(struct enic *enic)
122 return enic->pdev->device == PCI_DEVICE_ID_CISCO_VIC_ENET_DYN;
125 static int enic_get_settings(struct net_device *netdev,
126 struct ethtool_cmd *ecmd)
128 struct enic *enic = netdev_priv(netdev);
130 ecmd->supported = (SUPPORTED_10000baseT_Full | SUPPORTED_FIBRE);
131 ecmd->advertising = (ADVERTISED_10000baseT_Full | ADVERTISED_FIBRE);
132 ecmd->port = PORT_FIBRE;
133 ecmd->transceiver = XCVR_EXTERNAL;
135 if (netif_carrier_ok(netdev)) {
136 ecmd->speed = vnic_dev_port_speed(enic->vdev);
137 ecmd->duplex = DUPLEX_FULL;
138 } else {
139 ecmd->speed = -1;
140 ecmd->duplex = -1;
143 ecmd->autoneg = AUTONEG_DISABLE;
145 return 0;
148 static void enic_get_drvinfo(struct net_device *netdev,
149 struct ethtool_drvinfo *drvinfo)
151 struct enic *enic = netdev_priv(netdev);
152 struct vnic_devcmd_fw_info *fw_info;
154 spin_lock(&enic->devcmd_lock);
155 vnic_dev_fw_info(enic->vdev, &fw_info);
156 spin_unlock(&enic->devcmd_lock);
158 strncpy(drvinfo->driver, DRV_NAME, sizeof(drvinfo->driver));
159 strncpy(drvinfo->version, DRV_VERSION, sizeof(drvinfo->version));
160 strncpy(drvinfo->fw_version, fw_info->fw_version,
161 sizeof(drvinfo->fw_version));
162 strncpy(drvinfo->bus_info, pci_name(enic->pdev),
163 sizeof(drvinfo->bus_info));
166 static void enic_get_strings(struct net_device *netdev, u32 stringset, u8 *data)
168 unsigned int i;
170 switch (stringset) {
171 case ETH_SS_STATS:
172 for (i = 0; i < enic_n_tx_stats; i++) {
173 memcpy(data, enic_tx_stats[i].name, ETH_GSTRING_LEN);
174 data += ETH_GSTRING_LEN;
176 for (i = 0; i < enic_n_rx_stats; i++) {
177 memcpy(data, enic_rx_stats[i].name, ETH_GSTRING_LEN);
178 data += ETH_GSTRING_LEN;
180 break;
184 static int enic_get_sset_count(struct net_device *netdev, int sset)
186 switch (sset) {
187 case ETH_SS_STATS:
188 return enic_n_tx_stats + enic_n_rx_stats;
189 default:
190 return -EOPNOTSUPP;
194 static void enic_get_ethtool_stats(struct net_device *netdev,
195 struct ethtool_stats *stats, u64 *data)
197 struct enic *enic = netdev_priv(netdev);
198 struct vnic_stats *vstats;
199 unsigned int i;
201 spin_lock(&enic->devcmd_lock);
202 vnic_dev_stats_dump(enic->vdev, &vstats);
203 spin_unlock(&enic->devcmd_lock);
205 for (i = 0; i < enic_n_tx_stats; i++)
206 *(data++) = ((u64 *)&vstats->tx)[enic_tx_stats[i].offset];
207 for (i = 0; i < enic_n_rx_stats; i++)
208 *(data++) = ((u64 *)&vstats->rx)[enic_rx_stats[i].offset];
211 static u32 enic_get_rx_csum(struct net_device *netdev)
213 struct enic *enic = netdev_priv(netdev);
214 return enic->csum_rx_enabled;
217 static int enic_set_rx_csum(struct net_device *netdev, u32 data)
219 struct enic *enic = netdev_priv(netdev);
221 if (data && !ENIC_SETTING(enic, RXCSUM))
222 return -EINVAL;
224 enic->csum_rx_enabled = !!data;
226 return 0;
229 static int enic_set_tx_csum(struct net_device *netdev, u32 data)
231 struct enic *enic = netdev_priv(netdev);
233 if (data && !ENIC_SETTING(enic, TXCSUM))
234 return -EINVAL;
236 if (data)
237 netdev->features |= NETIF_F_HW_CSUM;
238 else
239 netdev->features &= ~NETIF_F_HW_CSUM;
241 return 0;
244 static int enic_set_tso(struct net_device *netdev, u32 data)
246 struct enic *enic = netdev_priv(netdev);
248 if (data && !ENIC_SETTING(enic, TSO))
249 return -EINVAL;
251 if (data)
252 netdev->features |=
253 NETIF_F_TSO | NETIF_F_TSO6 | NETIF_F_TSO_ECN;
254 else
255 netdev->features &=
256 ~(NETIF_F_TSO | NETIF_F_TSO6 | NETIF_F_TSO_ECN);
258 return 0;
261 static u32 enic_get_msglevel(struct net_device *netdev)
263 struct enic *enic = netdev_priv(netdev);
264 return enic->msg_enable;
267 static void enic_set_msglevel(struct net_device *netdev, u32 value)
269 struct enic *enic = netdev_priv(netdev);
270 enic->msg_enable = value;
273 static int enic_get_coalesce(struct net_device *netdev,
274 struct ethtool_coalesce *ecmd)
276 struct enic *enic = netdev_priv(netdev);
278 ecmd->tx_coalesce_usecs = enic->tx_coalesce_usecs;
279 ecmd->rx_coalesce_usecs = enic->rx_coalesce_usecs;
281 return 0;
284 static int enic_set_coalesce(struct net_device *netdev,
285 struct ethtool_coalesce *ecmd)
287 struct enic *enic = netdev_priv(netdev);
288 u32 tx_coalesce_usecs;
289 u32 rx_coalesce_usecs;
291 tx_coalesce_usecs = min_t(u32,
292 INTR_COALESCE_HW_TO_USEC(VNIC_INTR_TIMER_MAX),
293 ecmd->tx_coalesce_usecs);
294 rx_coalesce_usecs = min_t(u32,
295 INTR_COALESCE_HW_TO_USEC(VNIC_INTR_TIMER_MAX),
296 ecmd->rx_coalesce_usecs);
298 switch (vnic_dev_get_intr_mode(enic->vdev)) {
299 case VNIC_DEV_INTR_MODE_INTX:
300 if (tx_coalesce_usecs != rx_coalesce_usecs)
301 return -EINVAL;
303 vnic_intr_coalescing_timer_set(&enic->intr[ENIC_INTX_WQ_RQ],
304 INTR_COALESCE_USEC_TO_HW(tx_coalesce_usecs));
305 break;
306 case VNIC_DEV_INTR_MODE_MSI:
307 if (tx_coalesce_usecs != rx_coalesce_usecs)
308 return -EINVAL;
310 vnic_intr_coalescing_timer_set(&enic->intr[0],
311 INTR_COALESCE_USEC_TO_HW(tx_coalesce_usecs));
312 break;
313 case VNIC_DEV_INTR_MODE_MSIX:
314 vnic_intr_coalescing_timer_set(&enic->intr[ENIC_MSIX_WQ],
315 INTR_COALESCE_USEC_TO_HW(tx_coalesce_usecs));
316 vnic_intr_coalescing_timer_set(&enic->intr[ENIC_MSIX_RQ],
317 INTR_COALESCE_USEC_TO_HW(rx_coalesce_usecs));
318 break;
319 default:
320 break;
323 enic->tx_coalesce_usecs = tx_coalesce_usecs;
324 enic->rx_coalesce_usecs = rx_coalesce_usecs;
326 return 0;
329 static const struct ethtool_ops enic_ethtool_ops = {
330 .get_settings = enic_get_settings,
331 .get_drvinfo = enic_get_drvinfo,
332 .get_msglevel = enic_get_msglevel,
333 .set_msglevel = enic_set_msglevel,
334 .get_link = ethtool_op_get_link,
335 .get_strings = enic_get_strings,
336 .get_sset_count = enic_get_sset_count,
337 .get_ethtool_stats = enic_get_ethtool_stats,
338 .get_rx_csum = enic_get_rx_csum,
339 .set_rx_csum = enic_set_rx_csum,
340 .get_tx_csum = ethtool_op_get_tx_csum,
341 .set_tx_csum = enic_set_tx_csum,
342 .get_sg = ethtool_op_get_sg,
343 .set_sg = ethtool_op_set_sg,
344 .get_tso = ethtool_op_get_tso,
345 .set_tso = enic_set_tso,
346 .get_coalesce = enic_get_coalesce,
347 .set_coalesce = enic_set_coalesce,
348 .get_flags = ethtool_op_get_flags,
349 .set_flags = ethtool_op_set_flags,
352 static void enic_free_wq_buf(struct vnic_wq *wq, struct vnic_wq_buf *buf)
354 struct enic *enic = vnic_dev_priv(wq->vdev);
356 if (buf->sop)
357 pci_unmap_single(enic->pdev, buf->dma_addr,
358 buf->len, PCI_DMA_TODEVICE);
359 else
360 pci_unmap_page(enic->pdev, buf->dma_addr,
361 buf->len, PCI_DMA_TODEVICE);
363 if (buf->os_buf)
364 dev_kfree_skb_any(buf->os_buf);
367 static void enic_wq_free_buf(struct vnic_wq *wq,
368 struct cq_desc *cq_desc, struct vnic_wq_buf *buf, void *opaque)
370 enic_free_wq_buf(wq, buf);
373 static int enic_wq_service(struct vnic_dev *vdev, struct cq_desc *cq_desc,
374 u8 type, u16 q_number, u16 completed_index, void *opaque)
376 struct enic *enic = vnic_dev_priv(vdev);
378 spin_lock(&enic->wq_lock[q_number]);
380 vnic_wq_service(&enic->wq[q_number], cq_desc,
381 completed_index, enic_wq_free_buf,
382 opaque);
384 if (netif_queue_stopped(enic->netdev) &&
385 vnic_wq_desc_avail(&enic->wq[q_number]) >=
386 (MAX_SKB_FRAGS + ENIC_DESC_MAX_SPLITS))
387 netif_wake_queue(enic->netdev);
389 spin_unlock(&enic->wq_lock[q_number]);
391 return 0;
394 static void enic_log_q_error(struct enic *enic)
396 unsigned int i;
397 u32 error_status;
399 for (i = 0; i < enic->wq_count; i++) {
400 error_status = vnic_wq_error_status(&enic->wq[i]);
401 if (error_status)
402 printk(KERN_ERR PFX "%s: WQ[%d] error_status %d\n",
403 enic->netdev->name, i, error_status);
406 for (i = 0; i < enic->rq_count; i++) {
407 error_status = vnic_rq_error_status(&enic->rq[i]);
408 if (error_status)
409 printk(KERN_ERR PFX "%s: RQ[%d] error_status %d\n",
410 enic->netdev->name, i, error_status);
414 static void enic_link_check(struct enic *enic)
416 int link_status = vnic_dev_link_status(enic->vdev);
417 int carrier_ok = netif_carrier_ok(enic->netdev);
419 if (link_status && !carrier_ok) {
420 printk(KERN_INFO PFX "%s: Link UP\n", enic->netdev->name);
421 netif_carrier_on(enic->netdev);
422 } else if (!link_status && carrier_ok) {
423 printk(KERN_INFO PFX "%s: Link DOWN\n", enic->netdev->name);
424 netif_carrier_off(enic->netdev);
428 static void enic_mtu_check(struct enic *enic)
430 u32 mtu = vnic_dev_mtu(enic->vdev);
432 if (mtu && mtu != enic->port_mtu) {
433 enic->port_mtu = mtu;
434 if (mtu < enic->netdev->mtu)
435 printk(KERN_WARNING PFX
436 "%s: interface MTU (%d) set higher "
437 "than switch port MTU (%d)\n",
438 enic->netdev->name, enic->netdev->mtu, mtu);
442 static void enic_msglvl_check(struct enic *enic)
444 u32 msg_enable = vnic_dev_msg_lvl(enic->vdev);
446 if (msg_enable != enic->msg_enable) {
447 printk(KERN_INFO PFX "%s: msg lvl changed from 0x%x to 0x%x\n",
448 enic->netdev->name, enic->msg_enable, msg_enable);
449 enic->msg_enable = msg_enable;
453 static void enic_notify_check(struct enic *enic)
455 enic_msglvl_check(enic);
456 enic_mtu_check(enic);
457 enic_link_check(enic);
460 #define ENIC_TEST_INTR(pba, i) (pba & (1 << i))
462 static irqreturn_t enic_isr_legacy(int irq, void *data)
464 struct net_device *netdev = data;
465 struct enic *enic = netdev_priv(netdev);
466 u32 pba;
468 vnic_intr_mask(&enic->intr[ENIC_INTX_WQ_RQ]);
470 pba = vnic_intr_legacy_pba(enic->legacy_pba);
471 if (!pba) {
472 vnic_intr_unmask(&enic->intr[ENIC_INTX_WQ_RQ]);
473 return IRQ_NONE; /* not our interrupt */
476 if (ENIC_TEST_INTR(pba, ENIC_INTX_NOTIFY)) {
477 vnic_intr_return_all_credits(&enic->intr[ENIC_INTX_NOTIFY]);
478 enic_notify_check(enic);
481 if (ENIC_TEST_INTR(pba, ENIC_INTX_ERR)) {
482 vnic_intr_return_all_credits(&enic->intr[ENIC_INTX_ERR]);
483 enic_log_q_error(enic);
484 /* schedule recovery from WQ/RQ error */
485 schedule_work(&enic->reset);
486 return IRQ_HANDLED;
489 if (ENIC_TEST_INTR(pba, ENIC_INTX_WQ_RQ)) {
490 if (napi_schedule_prep(&enic->napi))
491 __napi_schedule(&enic->napi);
492 } else {
493 vnic_intr_unmask(&enic->intr[ENIC_INTX_WQ_RQ]);
496 return IRQ_HANDLED;
499 static irqreturn_t enic_isr_msi(int irq, void *data)
501 struct enic *enic = data;
503 /* With MSI, there is no sharing of interrupts, so this is
504 * our interrupt and there is no need to ack it. The device
505 * is not providing per-vector masking, so the OS will not
506 * write to PCI config space to mask/unmask the interrupt.
507 * We're using mask_on_assertion for MSI, so the device
508 * automatically masks the interrupt when the interrupt is
509 * generated. Later, when exiting polling, the interrupt
510 * will be unmasked (see enic_poll).
512 * Also, the device uses the same PCIe Traffic Class (TC)
513 * for Memory Write data and MSI, so there are no ordering
514 * issues; the MSI will always arrive at the Root Complex
515 * _after_ corresponding Memory Writes (i.e. descriptor
516 * writes).
519 napi_schedule(&enic->napi);
521 return IRQ_HANDLED;
524 static irqreturn_t enic_isr_msix_rq(int irq, void *data)
526 struct enic *enic = data;
528 /* schedule NAPI polling for RQ cleanup */
529 napi_schedule(&enic->napi);
531 return IRQ_HANDLED;
534 static irqreturn_t enic_isr_msix_wq(int irq, void *data)
536 struct enic *enic = data;
537 unsigned int wq_work_to_do = -1; /* no limit */
538 unsigned int wq_work_done;
540 wq_work_done = vnic_cq_service(&enic->cq[ENIC_CQ_WQ],
541 wq_work_to_do, enic_wq_service, NULL);
543 vnic_intr_return_credits(&enic->intr[ENIC_MSIX_WQ],
544 wq_work_done,
545 1 /* unmask intr */,
546 1 /* reset intr timer */);
548 return IRQ_HANDLED;
551 static irqreturn_t enic_isr_msix_err(int irq, void *data)
553 struct enic *enic = data;
555 vnic_intr_return_all_credits(&enic->intr[ENIC_MSIX_ERR]);
557 enic_log_q_error(enic);
559 /* schedule recovery from WQ/RQ error */
560 schedule_work(&enic->reset);
562 return IRQ_HANDLED;
565 static irqreturn_t enic_isr_msix_notify(int irq, void *data)
567 struct enic *enic = data;
569 vnic_intr_return_all_credits(&enic->intr[ENIC_MSIX_NOTIFY]);
570 enic_notify_check(enic);
572 return IRQ_HANDLED;
575 static inline void enic_queue_wq_skb_cont(struct enic *enic,
576 struct vnic_wq *wq, struct sk_buff *skb,
577 unsigned int len_left)
579 skb_frag_t *frag;
581 /* Queue additional data fragments */
582 for (frag = skb_shinfo(skb)->frags; len_left; frag++) {
583 len_left -= frag->size;
584 enic_queue_wq_desc_cont(wq, skb,
585 pci_map_page(enic->pdev, frag->page,
586 frag->page_offset, frag->size,
587 PCI_DMA_TODEVICE),
588 frag->size,
589 (len_left == 0)); /* EOP? */
593 static inline void enic_queue_wq_skb_vlan(struct enic *enic,
594 struct vnic_wq *wq, struct sk_buff *skb,
595 int vlan_tag_insert, unsigned int vlan_tag)
597 unsigned int head_len = skb_headlen(skb);
598 unsigned int len_left = skb->len - head_len;
599 int eop = (len_left == 0);
601 /* Queue the main skb fragment. The fragments are no larger
602 * than max MTU(9000)+ETH_HDR_LEN(14) bytes, which is less
603 * than WQ_ENET_MAX_DESC_LEN length. So only one descriptor
604 * per fragment is queued.
606 enic_queue_wq_desc(wq, skb,
607 pci_map_single(enic->pdev, skb->data,
608 head_len, PCI_DMA_TODEVICE),
609 head_len,
610 vlan_tag_insert, vlan_tag,
611 eop);
613 if (!eop)
614 enic_queue_wq_skb_cont(enic, wq, skb, len_left);
617 static inline void enic_queue_wq_skb_csum_l4(struct enic *enic,
618 struct vnic_wq *wq, struct sk_buff *skb,
619 int vlan_tag_insert, unsigned int vlan_tag)
621 unsigned int head_len = skb_headlen(skb);
622 unsigned int len_left = skb->len - head_len;
623 unsigned int hdr_len = skb_transport_offset(skb);
624 unsigned int csum_offset = hdr_len + skb->csum_offset;
625 int eop = (len_left == 0);
627 /* Queue the main skb fragment. The fragments are no larger
628 * than max MTU(9000)+ETH_HDR_LEN(14) bytes, which is less
629 * than WQ_ENET_MAX_DESC_LEN length. So only one descriptor
630 * per fragment is queued.
632 enic_queue_wq_desc_csum_l4(wq, skb,
633 pci_map_single(enic->pdev, skb->data,
634 head_len, PCI_DMA_TODEVICE),
635 head_len,
636 csum_offset,
637 hdr_len,
638 vlan_tag_insert, vlan_tag,
639 eop);
641 if (!eop)
642 enic_queue_wq_skb_cont(enic, wq, skb, len_left);
645 static inline void enic_queue_wq_skb_tso(struct enic *enic,
646 struct vnic_wq *wq, struct sk_buff *skb, unsigned int mss,
647 int vlan_tag_insert, unsigned int vlan_tag)
649 unsigned int frag_len_left = skb_headlen(skb);
650 unsigned int len_left = skb->len - frag_len_left;
651 unsigned int hdr_len = skb_transport_offset(skb) + tcp_hdrlen(skb);
652 int eop = (len_left == 0);
653 unsigned int len;
654 dma_addr_t dma_addr;
655 unsigned int offset = 0;
656 skb_frag_t *frag;
658 /* Preload TCP csum field with IP pseudo hdr calculated
659 * with IP length set to zero. HW will later add in length
660 * to each TCP segment resulting from the TSO.
663 if (skb->protocol == cpu_to_be16(ETH_P_IP)) {
664 ip_hdr(skb)->check = 0;
665 tcp_hdr(skb)->check = ~csum_tcpudp_magic(ip_hdr(skb)->saddr,
666 ip_hdr(skb)->daddr, 0, IPPROTO_TCP, 0);
667 } else if (skb->protocol == cpu_to_be16(ETH_P_IPV6)) {
668 tcp_hdr(skb)->check = ~csum_ipv6_magic(&ipv6_hdr(skb)->saddr,
669 &ipv6_hdr(skb)->daddr, 0, IPPROTO_TCP, 0);
672 /* Queue WQ_ENET_MAX_DESC_LEN length descriptors
673 * for the main skb fragment
675 while (frag_len_left) {
676 len = min(frag_len_left, (unsigned int)WQ_ENET_MAX_DESC_LEN);
677 dma_addr = pci_map_single(enic->pdev, skb->data + offset,
678 len, PCI_DMA_TODEVICE);
679 enic_queue_wq_desc_tso(wq, skb,
680 dma_addr,
681 len,
682 mss, hdr_len,
683 vlan_tag_insert, vlan_tag,
684 eop && (len == frag_len_left));
685 frag_len_left -= len;
686 offset += len;
689 if (eop)
690 return;
692 /* Queue WQ_ENET_MAX_DESC_LEN length descriptors
693 * for additional data fragments
695 for (frag = skb_shinfo(skb)->frags; len_left; frag++) {
696 len_left -= frag->size;
697 frag_len_left = frag->size;
698 offset = frag->page_offset;
700 while (frag_len_left) {
701 len = min(frag_len_left,
702 (unsigned int)WQ_ENET_MAX_DESC_LEN);
703 dma_addr = pci_map_page(enic->pdev, frag->page,
704 offset, len,
705 PCI_DMA_TODEVICE);
706 enic_queue_wq_desc_cont(wq, skb,
707 dma_addr,
708 len,
709 (len_left == 0) &&
710 (len == frag_len_left)); /* EOP? */
711 frag_len_left -= len;
712 offset += len;
717 static inline void enic_queue_wq_skb(struct enic *enic,
718 struct vnic_wq *wq, struct sk_buff *skb)
720 unsigned int mss = skb_shinfo(skb)->gso_size;
721 unsigned int vlan_tag = 0;
722 int vlan_tag_insert = 0;
724 if (enic->vlan_group && vlan_tx_tag_present(skb)) {
725 /* VLAN tag from trunking driver */
726 vlan_tag_insert = 1;
727 vlan_tag = vlan_tx_tag_get(skb);
730 if (mss)
731 enic_queue_wq_skb_tso(enic, wq, skb, mss,
732 vlan_tag_insert, vlan_tag);
733 else if (skb->ip_summed == CHECKSUM_PARTIAL)
734 enic_queue_wq_skb_csum_l4(enic, wq, skb,
735 vlan_tag_insert, vlan_tag);
736 else
737 enic_queue_wq_skb_vlan(enic, wq, skb,
738 vlan_tag_insert, vlan_tag);
741 /* netif_tx_lock held, process context with BHs disabled, or BH */
742 static netdev_tx_t enic_hard_start_xmit(struct sk_buff *skb,
743 struct net_device *netdev)
745 struct enic *enic = netdev_priv(netdev);
746 struct vnic_wq *wq = &enic->wq[0];
747 unsigned long flags;
749 if (skb->len <= 0) {
750 dev_kfree_skb(skb);
751 return NETDEV_TX_OK;
754 /* Non-TSO sends must fit within ENIC_NON_TSO_MAX_DESC descs,
755 * which is very likely. In the off chance it's going to take
756 * more than * ENIC_NON_TSO_MAX_DESC, linearize the skb.
759 if (skb_shinfo(skb)->gso_size == 0 &&
760 skb_shinfo(skb)->nr_frags + 1 > ENIC_NON_TSO_MAX_DESC &&
761 skb_linearize(skb)) {
762 dev_kfree_skb(skb);
763 return NETDEV_TX_OK;
766 spin_lock_irqsave(&enic->wq_lock[0], flags);
768 if (vnic_wq_desc_avail(wq) <
769 skb_shinfo(skb)->nr_frags + ENIC_DESC_MAX_SPLITS) {
770 netif_stop_queue(netdev);
771 /* This is a hard error, log it */
772 printk(KERN_ERR PFX "%s: BUG! Tx ring full when "
773 "queue awake!\n", netdev->name);
774 spin_unlock_irqrestore(&enic->wq_lock[0], flags);
775 return NETDEV_TX_BUSY;
778 enic_queue_wq_skb(enic, wq, skb);
780 if (vnic_wq_desc_avail(wq) < MAX_SKB_FRAGS + ENIC_DESC_MAX_SPLITS)
781 netif_stop_queue(netdev);
783 spin_unlock_irqrestore(&enic->wq_lock[0], flags);
785 return NETDEV_TX_OK;
788 /* dev_base_lock rwlock held, nominally process context */
789 static struct net_device_stats *enic_get_stats(struct net_device *netdev)
791 struct enic *enic = netdev_priv(netdev);
792 struct net_device_stats *net_stats = &netdev->stats;
793 struct vnic_stats *stats;
795 spin_lock(&enic->devcmd_lock);
796 vnic_dev_stats_dump(enic->vdev, &stats);
797 spin_unlock(&enic->devcmd_lock);
799 net_stats->tx_packets = stats->tx.tx_frames_ok;
800 net_stats->tx_bytes = stats->tx.tx_bytes_ok;
801 net_stats->tx_errors = stats->tx.tx_errors;
802 net_stats->tx_dropped = stats->tx.tx_drops;
804 net_stats->rx_packets = stats->rx.rx_frames_ok;
805 net_stats->rx_bytes = stats->rx.rx_bytes_ok;
806 net_stats->rx_errors = stats->rx.rx_errors;
807 net_stats->multicast = stats->rx.rx_multicast_frames_ok;
808 net_stats->rx_over_errors = enic->rq_truncated_pkts;
809 net_stats->rx_crc_errors = enic->rq_bad_fcs;
810 net_stats->rx_dropped = stats->rx.rx_no_bufs + stats->rx.rx_drop;
812 return net_stats;
815 static void enic_reset_mcaddrs(struct enic *enic)
817 enic->mc_count = 0;
820 static int enic_set_mac_addr(struct net_device *netdev, char *addr)
822 struct enic *enic = netdev_priv(netdev);
824 if (enic_is_dynamic(enic)) {
825 if (!is_valid_ether_addr(addr) && !is_zero_ether_addr(addr))
826 return -EADDRNOTAVAIL;
827 } else {
828 if (!is_valid_ether_addr(addr))
829 return -EADDRNOTAVAIL;
832 memcpy(netdev->dev_addr, addr, netdev->addr_len);
834 return 0;
837 static int enic_dev_add_station_addr(struct enic *enic)
839 int err = 0;
841 if (is_valid_ether_addr(enic->netdev->dev_addr)) {
842 spin_lock(&enic->devcmd_lock);
843 err = vnic_dev_add_addr(enic->vdev, enic->netdev->dev_addr);
844 spin_unlock(&enic->devcmd_lock);
847 return err;
850 static int enic_dev_del_station_addr(struct enic *enic)
852 int err = 0;
854 if (is_valid_ether_addr(enic->netdev->dev_addr)) {
855 spin_lock(&enic->devcmd_lock);
856 err = vnic_dev_del_addr(enic->vdev, enic->netdev->dev_addr);
857 spin_unlock(&enic->devcmd_lock);
860 return err;
863 static int enic_set_mac_address_dynamic(struct net_device *netdev, void *p)
865 struct enic *enic = netdev_priv(netdev);
866 struct sockaddr *saddr = p;
867 char *addr = saddr->sa_data;
868 int err;
870 if (netif_running(enic->netdev)) {
871 err = enic_dev_del_station_addr(enic);
872 if (err)
873 return err;
876 err = enic_set_mac_addr(netdev, addr);
877 if (err)
878 return err;
880 if (netif_running(enic->netdev)) {
881 err = enic_dev_add_station_addr(enic);
882 if (err)
883 return err;
886 return err;
889 static int enic_set_mac_address(struct net_device *netdev, void *p)
891 return -EOPNOTSUPP;
894 /* netif_tx_lock held, BHs disabled */
895 static void enic_set_multicast_list(struct net_device *netdev)
897 struct enic *enic = netdev_priv(netdev);
898 struct netdev_hw_addr *ha;
899 int directed = 1;
900 int multicast = (netdev->flags & IFF_MULTICAST) ? 1 : 0;
901 int broadcast = (netdev->flags & IFF_BROADCAST) ? 1 : 0;
902 int promisc = (netdev->flags & IFF_PROMISC) ? 1 : 0;
903 unsigned int mc_count = netdev_mc_count(netdev);
904 int allmulti = (netdev->flags & IFF_ALLMULTI) ||
905 mc_count > ENIC_MULTICAST_PERFECT_FILTERS;
906 unsigned int flags = netdev->flags | (allmulti ? IFF_ALLMULTI : 0);
907 u8 mc_addr[ENIC_MULTICAST_PERFECT_FILTERS][ETH_ALEN];
908 unsigned int i, j;
910 if (mc_count > ENIC_MULTICAST_PERFECT_FILTERS)
911 mc_count = ENIC_MULTICAST_PERFECT_FILTERS;
913 spin_lock(&enic->devcmd_lock);
915 if (enic->flags != flags) {
916 enic->flags = flags;
917 vnic_dev_packet_filter(enic->vdev, directed,
918 multicast, broadcast, promisc, allmulti);
921 /* Is there an easier way? Trying to minimize to
922 * calls to add/del multicast addrs. We keep the
923 * addrs from the last call in enic->mc_addr and
924 * look for changes to add/del.
927 i = 0;
928 netdev_for_each_mc_addr(ha, netdev) {
929 if (i == mc_count)
930 break;
931 memcpy(mc_addr[i++], ha->addr, ETH_ALEN);
934 for (i = 0; i < enic->mc_count; i++) {
935 for (j = 0; j < mc_count; j++)
936 if (compare_ether_addr(enic->mc_addr[i],
937 mc_addr[j]) == 0)
938 break;
939 if (j == mc_count)
940 enic_del_multicast_addr(enic, enic->mc_addr[i]);
943 for (i = 0; i < mc_count; i++) {
944 for (j = 0; j < enic->mc_count; j++)
945 if (compare_ether_addr(mc_addr[i],
946 enic->mc_addr[j]) == 0)
947 break;
948 if (j == enic->mc_count)
949 enic_add_multicast_addr(enic, mc_addr[i]);
952 /* Save the list to compare against next time
955 for (i = 0; i < mc_count; i++)
956 memcpy(enic->mc_addr[i], mc_addr[i], ETH_ALEN);
958 enic->mc_count = mc_count;
960 spin_unlock(&enic->devcmd_lock);
963 /* rtnl lock is held */
964 static void enic_vlan_rx_register(struct net_device *netdev,
965 struct vlan_group *vlan_group)
967 struct enic *enic = netdev_priv(netdev);
968 enic->vlan_group = vlan_group;
971 /* rtnl lock is held */
972 static void enic_vlan_rx_add_vid(struct net_device *netdev, u16 vid)
974 struct enic *enic = netdev_priv(netdev);
976 spin_lock(&enic->devcmd_lock);
977 enic_add_vlan(enic, vid);
978 spin_unlock(&enic->devcmd_lock);
981 /* rtnl lock is held */
982 static void enic_vlan_rx_kill_vid(struct net_device *netdev, u16 vid)
984 struct enic *enic = netdev_priv(netdev);
986 spin_lock(&enic->devcmd_lock);
987 enic_del_vlan(enic, vid);
988 spin_unlock(&enic->devcmd_lock);
991 /* netif_tx_lock held, BHs disabled */
992 static void enic_tx_timeout(struct net_device *netdev)
994 struct enic *enic = netdev_priv(netdev);
995 schedule_work(&enic->reset);
998 static int enic_vnic_dev_deinit(struct enic *enic)
1000 int err;
1002 spin_lock(&enic->devcmd_lock);
1003 err = vnic_dev_deinit(enic->vdev);
1004 spin_unlock(&enic->devcmd_lock);
1006 return err;
1009 static int enic_dev_init_prov(struct enic *enic, struct vic_provinfo *vp)
1011 int err;
1013 spin_lock(&enic->devcmd_lock);
1014 err = vnic_dev_init_prov(enic->vdev,
1015 (u8 *)vp, vic_provinfo_size(vp));
1016 spin_unlock(&enic->devcmd_lock);
1018 return err;
1021 static int enic_dev_init_done(struct enic *enic, int *done, int *error)
1023 int err;
1025 spin_lock(&enic->devcmd_lock);
1026 err = vnic_dev_init_done(enic->vdev, done, error);
1027 spin_unlock(&enic->devcmd_lock);
1029 return err;
1032 static int enic_set_port_profile(struct enic *enic, u8 *mac)
1034 struct vic_provinfo *vp;
1035 u8 oui[3] = VIC_PROVINFO_CISCO_OUI;
1036 u8 *uuid;
1037 char uuid_str[38];
1038 static char *uuid_fmt = "%02X%02X%02X%02X-%02X%02X-%02X%02X-"
1039 "%02X%02X-%02X%02X%02X%02X%0X%02X";
1040 int err;
1042 err = enic_vnic_dev_deinit(enic);
1043 if (err)
1044 return err;
1046 switch (enic->pp.request) {
1048 case PORT_REQUEST_ASSOCIATE:
1050 if (!(enic->pp.set & ENIC_SET_NAME) || !strlen(enic->pp.name))
1051 return -EINVAL;
1053 if (!is_valid_ether_addr(mac))
1054 return -EADDRNOTAVAIL;
1056 vp = vic_provinfo_alloc(GFP_KERNEL, oui,
1057 VIC_PROVINFO_LINUX_TYPE);
1058 if (!vp)
1059 return -ENOMEM;
1061 vic_provinfo_add_tlv(vp,
1062 VIC_LINUX_PROV_TLV_PORT_PROFILE_NAME_STR,
1063 strlen(enic->pp.name) + 1, enic->pp.name);
1065 vic_provinfo_add_tlv(vp,
1066 VIC_LINUX_PROV_TLV_CLIENT_MAC_ADDR,
1067 ETH_ALEN, mac);
1069 if (enic->pp.set & ENIC_SET_INSTANCE) {
1070 uuid = enic->pp.instance_uuid;
1071 sprintf(uuid_str, uuid_fmt,
1072 uuid[0], uuid[1], uuid[2], uuid[3],
1073 uuid[4], uuid[5], uuid[6], uuid[7],
1074 uuid[8], uuid[9], uuid[10], uuid[11],
1075 uuid[12], uuid[13], uuid[14], uuid[15]);
1076 vic_provinfo_add_tlv(vp,
1077 VIC_LINUX_PROV_TLV_CLIENT_UUID_STR,
1078 sizeof(uuid_str), uuid_str);
1081 if (enic->pp.set & ENIC_SET_HOST) {
1082 uuid = enic->pp.host_uuid;
1083 sprintf(uuid_str, uuid_fmt,
1084 uuid[0], uuid[1], uuid[2], uuid[3],
1085 uuid[4], uuid[5], uuid[6], uuid[7],
1086 uuid[8], uuid[9], uuid[10], uuid[11],
1087 uuid[12], uuid[13], uuid[14], uuid[15]);
1088 vic_provinfo_add_tlv(vp,
1089 VIC_LINUX_PROV_TLV_HOST_UUID_STR,
1090 sizeof(uuid_str), uuid_str);
1093 err = enic_dev_init_prov(enic, vp);
1094 vic_provinfo_free(vp);
1095 if (err)
1096 return err;
1097 break;
1099 case PORT_REQUEST_DISASSOCIATE:
1100 break;
1102 default:
1103 return -EINVAL;
1106 enic->pp.set |= ENIC_SET_APPLIED;
1107 return 0;
1110 static int enic_set_vf_port(struct net_device *netdev, int vf,
1111 struct nlattr *port[])
1113 struct enic *enic = netdev_priv(netdev);
1115 memset(&enic->pp, 0, sizeof(enic->pp));
1117 if (port[IFLA_PORT_REQUEST]) {
1118 enic->pp.set |= ENIC_SET_REQUEST;
1119 enic->pp.request = nla_get_u8(port[IFLA_PORT_REQUEST]);
1122 if (port[IFLA_PORT_PROFILE]) {
1123 enic->pp.set |= ENIC_SET_NAME;
1124 memcpy(enic->pp.name, nla_data(port[IFLA_PORT_PROFILE]),
1125 PORT_PROFILE_MAX);
1128 if (port[IFLA_PORT_INSTANCE_UUID]) {
1129 enic->pp.set |= ENIC_SET_INSTANCE;
1130 memcpy(enic->pp.instance_uuid,
1131 nla_data(port[IFLA_PORT_INSTANCE_UUID]), PORT_UUID_MAX);
1134 if (port[IFLA_PORT_HOST_UUID]) {
1135 enic->pp.set |= ENIC_SET_HOST;
1136 memcpy(enic->pp.host_uuid,
1137 nla_data(port[IFLA_PORT_HOST_UUID]), PORT_UUID_MAX);
1140 /* don't support VFs, yet */
1141 if (vf != PORT_SELF_VF)
1142 return -EOPNOTSUPP;
1144 if (!(enic->pp.set & ENIC_SET_REQUEST))
1145 return -EOPNOTSUPP;
1147 if (enic->pp.request == PORT_REQUEST_ASSOCIATE) {
1149 /* If the interface mac addr hasn't been assigned,
1150 * assign a random mac addr before setting port-
1151 * profile.
1154 if (is_zero_ether_addr(netdev->dev_addr))
1155 random_ether_addr(netdev->dev_addr);
1158 return enic_set_port_profile(enic, netdev->dev_addr);
1161 static int enic_get_vf_port(struct net_device *netdev, int vf,
1162 struct sk_buff *skb)
1164 struct enic *enic = netdev_priv(netdev);
1165 int err, error, done;
1166 u16 response = PORT_PROFILE_RESPONSE_SUCCESS;
1168 if (!(enic->pp.set & ENIC_SET_APPLIED))
1169 return -ENODATA;
1171 err = enic_dev_init_done(enic, &done, &error);
1172 if (err)
1173 error = err;
1175 switch (error) {
1176 case ERR_SUCCESS:
1177 if (!done)
1178 response = PORT_PROFILE_RESPONSE_INPROGRESS;
1179 break;
1180 case ERR_EINVAL:
1181 response = PORT_PROFILE_RESPONSE_INVALID;
1182 break;
1183 case ERR_EBADSTATE:
1184 response = PORT_PROFILE_RESPONSE_BADSTATE;
1185 break;
1186 case ERR_ENOMEM:
1187 response = PORT_PROFILE_RESPONSE_INSUFFICIENT_RESOURCES;
1188 break;
1189 default:
1190 response = PORT_PROFILE_RESPONSE_ERROR;
1191 break;
1194 NLA_PUT_U16(skb, IFLA_PORT_REQUEST, enic->pp.request);
1195 NLA_PUT_U16(skb, IFLA_PORT_RESPONSE, response);
1196 if (enic->pp.set & ENIC_SET_NAME)
1197 NLA_PUT(skb, IFLA_PORT_PROFILE, PORT_PROFILE_MAX,
1198 enic->pp.name);
1199 if (enic->pp.set & ENIC_SET_INSTANCE)
1200 NLA_PUT(skb, IFLA_PORT_INSTANCE_UUID, PORT_UUID_MAX,
1201 enic->pp.instance_uuid);
1202 if (enic->pp.set & ENIC_SET_HOST)
1203 NLA_PUT(skb, IFLA_PORT_HOST_UUID, PORT_UUID_MAX,
1204 enic->pp.host_uuid);
1206 return 0;
1208 nla_put_failure:
1209 return -EMSGSIZE;
1212 static void enic_free_rq_buf(struct vnic_rq *rq, struct vnic_rq_buf *buf)
1214 struct enic *enic = vnic_dev_priv(rq->vdev);
1216 if (!buf->os_buf)
1217 return;
1219 pci_unmap_single(enic->pdev, buf->dma_addr,
1220 buf->len, PCI_DMA_FROMDEVICE);
1221 dev_kfree_skb_any(buf->os_buf);
1224 static int enic_rq_alloc_buf(struct vnic_rq *rq)
1226 struct enic *enic = vnic_dev_priv(rq->vdev);
1227 struct net_device *netdev = enic->netdev;
1228 struct sk_buff *skb;
1229 unsigned int len = netdev->mtu + ETH_HLEN;
1230 unsigned int os_buf_index = 0;
1231 dma_addr_t dma_addr;
1233 skb = netdev_alloc_skb_ip_align(netdev, len);
1234 if (!skb)
1235 return -ENOMEM;
1237 dma_addr = pci_map_single(enic->pdev, skb->data,
1238 len, PCI_DMA_FROMDEVICE);
1240 enic_queue_rq_desc(rq, skb, os_buf_index,
1241 dma_addr, len);
1243 return 0;
1246 static int enic_rq_alloc_buf_a1(struct vnic_rq *rq)
1248 struct rq_enet_desc *desc = vnic_rq_next_desc(rq);
1250 if (vnic_rq_posting_soon(rq)) {
1252 /* SW workaround for A0 HW erratum: if we're just about
1253 * to write posted_index, insert a dummy desc
1254 * of type resvd
1257 rq_enet_desc_enc(desc, 0, RQ_ENET_TYPE_RESV2, 0);
1258 vnic_rq_post(rq, 0, 0, 0, 0);
1259 } else {
1260 return enic_rq_alloc_buf(rq);
1263 return 0;
1266 static int enic_set_rq_alloc_buf(struct enic *enic)
1268 enum vnic_dev_hw_version hw_ver;
1269 int err;
1271 err = vnic_dev_hw_version(enic->vdev, &hw_ver);
1272 if (err)
1273 return err;
1275 switch (hw_ver) {
1276 case VNIC_DEV_HW_VER_A1:
1277 enic->rq_alloc_buf = enic_rq_alloc_buf_a1;
1278 break;
1279 case VNIC_DEV_HW_VER_A2:
1280 case VNIC_DEV_HW_VER_UNKNOWN:
1281 enic->rq_alloc_buf = enic_rq_alloc_buf;
1282 break;
1283 default:
1284 return -ENODEV;
1287 return 0;
1290 static int enic_get_skb_header(struct sk_buff *skb, void **iphdr,
1291 void **tcph, u64 *hdr_flags, void *priv)
1293 struct cq_enet_rq_desc *cq_desc = priv;
1294 unsigned int ip_len;
1295 struct iphdr *iph;
1297 u8 type, color, eop, sop, ingress_port, vlan_stripped;
1298 u8 fcoe, fcoe_sof, fcoe_fc_crc_ok, fcoe_enc_error, fcoe_eof;
1299 u8 tcp_udp_csum_ok, udp, tcp, ipv4_csum_ok;
1300 u8 ipv6, ipv4, ipv4_fragment, fcs_ok, rss_type, csum_not_calc;
1301 u8 packet_error;
1302 u16 q_number, completed_index, bytes_written, vlan, checksum;
1303 u32 rss_hash;
1305 cq_enet_rq_desc_dec(cq_desc,
1306 &type, &color, &q_number, &completed_index,
1307 &ingress_port, &fcoe, &eop, &sop, &rss_type,
1308 &csum_not_calc, &rss_hash, &bytes_written,
1309 &packet_error, &vlan_stripped, &vlan, &checksum,
1310 &fcoe_sof, &fcoe_fc_crc_ok, &fcoe_enc_error,
1311 &fcoe_eof, &tcp_udp_csum_ok, &udp, &tcp,
1312 &ipv4_csum_ok, &ipv6, &ipv4, &ipv4_fragment,
1313 &fcs_ok);
1315 if (!(ipv4 && tcp && !ipv4_fragment))
1316 return -1;
1318 skb_reset_network_header(skb);
1319 iph = ip_hdr(skb);
1321 ip_len = ip_hdrlen(skb);
1322 skb_set_transport_header(skb, ip_len);
1324 /* check if ip header and tcp header are complete */
1325 if (ntohs(iph->tot_len) < ip_len + tcp_hdrlen(skb))
1326 return -1;
1328 *hdr_flags = LRO_IPV4 | LRO_TCP;
1329 *tcph = tcp_hdr(skb);
1330 *iphdr = iph;
1332 return 0;
1335 static void enic_rq_indicate_buf(struct vnic_rq *rq,
1336 struct cq_desc *cq_desc, struct vnic_rq_buf *buf,
1337 int skipped, void *opaque)
1339 struct enic *enic = vnic_dev_priv(rq->vdev);
1340 struct net_device *netdev = enic->netdev;
1341 struct sk_buff *skb;
1343 u8 type, color, eop, sop, ingress_port, vlan_stripped;
1344 u8 fcoe, fcoe_sof, fcoe_fc_crc_ok, fcoe_enc_error, fcoe_eof;
1345 u8 tcp_udp_csum_ok, udp, tcp, ipv4_csum_ok;
1346 u8 ipv6, ipv4, ipv4_fragment, fcs_ok, rss_type, csum_not_calc;
1347 u8 packet_error;
1348 u16 q_number, completed_index, bytes_written, vlan, checksum;
1349 u32 rss_hash;
1351 if (skipped)
1352 return;
1354 skb = buf->os_buf;
1355 prefetch(skb->data - NET_IP_ALIGN);
1356 pci_unmap_single(enic->pdev, buf->dma_addr,
1357 buf->len, PCI_DMA_FROMDEVICE);
1359 cq_enet_rq_desc_dec((struct cq_enet_rq_desc *)cq_desc,
1360 &type, &color, &q_number, &completed_index,
1361 &ingress_port, &fcoe, &eop, &sop, &rss_type,
1362 &csum_not_calc, &rss_hash, &bytes_written,
1363 &packet_error, &vlan_stripped, &vlan, &checksum,
1364 &fcoe_sof, &fcoe_fc_crc_ok, &fcoe_enc_error,
1365 &fcoe_eof, &tcp_udp_csum_ok, &udp, &tcp,
1366 &ipv4_csum_ok, &ipv6, &ipv4, &ipv4_fragment,
1367 &fcs_ok);
1369 if (packet_error) {
1371 if (!fcs_ok) {
1372 if (bytes_written > 0)
1373 enic->rq_bad_fcs++;
1374 else if (bytes_written == 0)
1375 enic->rq_truncated_pkts++;
1378 dev_kfree_skb_any(skb);
1380 return;
1383 if (eop && bytes_written > 0) {
1385 /* Good receive
1388 skb_put(skb, bytes_written);
1389 skb->protocol = eth_type_trans(skb, netdev);
1391 if (enic->csum_rx_enabled && !csum_not_calc) {
1392 skb->csum = htons(checksum);
1393 skb->ip_summed = CHECKSUM_COMPLETE;
1396 skb->dev = netdev;
1398 if (enic->vlan_group && vlan_stripped) {
1400 if ((netdev->features & NETIF_F_LRO) && ipv4)
1401 lro_vlan_hwaccel_receive_skb(&enic->lro_mgr,
1402 skb, enic->vlan_group,
1403 vlan, cq_desc);
1404 else
1405 vlan_hwaccel_receive_skb(skb,
1406 enic->vlan_group, vlan);
1408 } else {
1410 if ((netdev->features & NETIF_F_LRO) && ipv4)
1411 lro_receive_skb(&enic->lro_mgr, skb, cq_desc);
1412 else
1413 netif_receive_skb(skb);
1417 } else {
1419 /* Buffer overflow
1422 dev_kfree_skb_any(skb);
1426 static int enic_rq_service(struct vnic_dev *vdev, struct cq_desc *cq_desc,
1427 u8 type, u16 q_number, u16 completed_index, void *opaque)
1429 struct enic *enic = vnic_dev_priv(vdev);
1431 vnic_rq_service(&enic->rq[q_number], cq_desc,
1432 completed_index, VNIC_RQ_RETURN_DESC,
1433 enic_rq_indicate_buf, opaque);
1435 return 0;
1438 static int enic_poll(struct napi_struct *napi, int budget)
1440 struct enic *enic = container_of(napi, struct enic, napi);
1441 struct net_device *netdev = enic->netdev;
1442 unsigned int rq_work_to_do = budget;
1443 unsigned int wq_work_to_do = -1; /* no limit */
1444 unsigned int work_done, rq_work_done, wq_work_done;
1445 int err;
1447 /* Service RQ (first) and WQ
1450 rq_work_done = vnic_cq_service(&enic->cq[ENIC_CQ_RQ],
1451 rq_work_to_do, enic_rq_service, NULL);
1453 wq_work_done = vnic_cq_service(&enic->cq[ENIC_CQ_WQ],
1454 wq_work_to_do, enic_wq_service, NULL);
1456 /* Accumulate intr event credits for this polling
1457 * cycle. An intr event is the completion of a
1458 * a WQ or RQ packet.
1461 work_done = rq_work_done + wq_work_done;
1463 if (work_done > 0)
1464 vnic_intr_return_credits(&enic->intr[ENIC_INTX_WQ_RQ],
1465 work_done,
1466 0 /* don't unmask intr */,
1467 0 /* don't reset intr timer */);
1469 err = vnic_rq_fill(&enic->rq[0], enic->rq_alloc_buf);
1471 /* Buffer allocation failed. Stay in polling
1472 * mode so we can try to fill the ring again.
1475 if (err)
1476 rq_work_done = rq_work_to_do;
1478 if (rq_work_done < rq_work_to_do) {
1480 /* Some work done, but not enough to stay in polling,
1481 * flush all LROs and exit polling
1484 if (netdev->features & NETIF_F_LRO)
1485 lro_flush_all(&enic->lro_mgr);
1487 napi_complete(napi);
1488 vnic_intr_unmask(&enic->intr[ENIC_INTX_WQ_RQ]);
1491 return rq_work_done;
1494 static int enic_poll_msix(struct napi_struct *napi, int budget)
1496 struct enic *enic = container_of(napi, struct enic, napi);
1497 struct net_device *netdev = enic->netdev;
1498 unsigned int work_to_do = budget;
1499 unsigned int work_done;
1500 int err;
1502 /* Service RQ
1505 work_done = vnic_cq_service(&enic->cq[ENIC_CQ_RQ],
1506 work_to_do, enic_rq_service, NULL);
1508 /* Return intr event credits for this polling
1509 * cycle. An intr event is the completion of a
1510 * RQ packet.
1513 if (work_done > 0)
1514 vnic_intr_return_credits(&enic->intr[ENIC_MSIX_RQ],
1515 work_done,
1516 0 /* don't unmask intr */,
1517 0 /* don't reset intr timer */);
1519 err = vnic_rq_fill(&enic->rq[0], enic->rq_alloc_buf);
1521 /* Buffer allocation failed. Stay in polling mode
1522 * so we can try to fill the ring again.
1525 if (err)
1526 work_done = work_to_do;
1528 if (work_done < work_to_do) {
1530 /* Some work done, but not enough to stay in polling,
1531 * flush all LROs and exit polling
1534 if (netdev->features & NETIF_F_LRO)
1535 lro_flush_all(&enic->lro_mgr);
1537 napi_complete(napi);
1538 vnic_intr_unmask(&enic->intr[ENIC_MSIX_RQ]);
1541 return work_done;
1544 static void enic_notify_timer(unsigned long data)
1546 struct enic *enic = (struct enic *)data;
1548 enic_notify_check(enic);
1550 mod_timer(&enic->notify_timer,
1551 round_jiffies(jiffies + ENIC_NOTIFY_TIMER_PERIOD));
1554 static void enic_free_intr(struct enic *enic)
1556 struct net_device *netdev = enic->netdev;
1557 unsigned int i;
1559 switch (vnic_dev_get_intr_mode(enic->vdev)) {
1560 case VNIC_DEV_INTR_MODE_INTX:
1561 free_irq(enic->pdev->irq, netdev);
1562 break;
1563 case VNIC_DEV_INTR_MODE_MSI:
1564 free_irq(enic->pdev->irq, enic);
1565 break;
1566 case VNIC_DEV_INTR_MODE_MSIX:
1567 for (i = 0; i < ARRAY_SIZE(enic->msix); i++)
1568 if (enic->msix[i].requested)
1569 free_irq(enic->msix_entry[i].vector,
1570 enic->msix[i].devid);
1571 break;
1572 default:
1573 break;
1577 static int enic_request_intr(struct enic *enic)
1579 struct net_device *netdev = enic->netdev;
1580 unsigned int i;
1581 int err = 0;
1583 switch (vnic_dev_get_intr_mode(enic->vdev)) {
1585 case VNIC_DEV_INTR_MODE_INTX:
1587 err = request_irq(enic->pdev->irq, enic_isr_legacy,
1588 IRQF_SHARED, netdev->name, netdev);
1589 break;
1591 case VNIC_DEV_INTR_MODE_MSI:
1593 err = request_irq(enic->pdev->irq, enic_isr_msi,
1594 0, netdev->name, enic);
1595 break;
1597 case VNIC_DEV_INTR_MODE_MSIX:
1599 sprintf(enic->msix[ENIC_MSIX_RQ].devname,
1600 "%.11s-rx-0", netdev->name);
1601 enic->msix[ENIC_MSIX_RQ].isr = enic_isr_msix_rq;
1602 enic->msix[ENIC_MSIX_RQ].devid = enic;
1604 sprintf(enic->msix[ENIC_MSIX_WQ].devname,
1605 "%.11s-tx-0", netdev->name);
1606 enic->msix[ENIC_MSIX_WQ].isr = enic_isr_msix_wq;
1607 enic->msix[ENIC_MSIX_WQ].devid = enic;
1609 sprintf(enic->msix[ENIC_MSIX_ERR].devname,
1610 "%.11s-err", netdev->name);
1611 enic->msix[ENIC_MSIX_ERR].isr = enic_isr_msix_err;
1612 enic->msix[ENIC_MSIX_ERR].devid = enic;
1614 sprintf(enic->msix[ENIC_MSIX_NOTIFY].devname,
1615 "%.11s-notify", netdev->name);
1616 enic->msix[ENIC_MSIX_NOTIFY].isr = enic_isr_msix_notify;
1617 enic->msix[ENIC_MSIX_NOTIFY].devid = enic;
1619 for (i = 0; i < ARRAY_SIZE(enic->msix); i++) {
1620 err = request_irq(enic->msix_entry[i].vector,
1621 enic->msix[i].isr, 0,
1622 enic->msix[i].devname,
1623 enic->msix[i].devid);
1624 if (err) {
1625 enic_free_intr(enic);
1626 break;
1628 enic->msix[i].requested = 1;
1631 break;
1633 default:
1634 break;
1637 return err;
1640 static void enic_synchronize_irqs(struct enic *enic)
1642 unsigned int i;
1644 switch (vnic_dev_get_intr_mode(enic->vdev)) {
1645 case VNIC_DEV_INTR_MODE_INTX:
1646 case VNIC_DEV_INTR_MODE_MSI:
1647 synchronize_irq(enic->pdev->irq);
1648 break;
1649 case VNIC_DEV_INTR_MODE_MSIX:
1650 for (i = 0; i < enic->intr_count; i++)
1651 synchronize_irq(enic->msix_entry[i].vector);
1652 break;
1653 default:
1654 break;
1658 static int enic_notify_set(struct enic *enic)
1660 int err;
1662 spin_lock(&enic->devcmd_lock);
1663 switch (vnic_dev_get_intr_mode(enic->vdev)) {
1664 case VNIC_DEV_INTR_MODE_INTX:
1665 err = vnic_dev_notify_set(enic->vdev, ENIC_INTX_NOTIFY);
1666 break;
1667 case VNIC_DEV_INTR_MODE_MSIX:
1668 err = vnic_dev_notify_set(enic->vdev, ENIC_MSIX_NOTIFY);
1669 break;
1670 default:
1671 err = vnic_dev_notify_set(enic->vdev, -1 /* no intr */);
1672 break;
1674 spin_unlock(&enic->devcmd_lock);
1676 return err;
1679 static void enic_notify_timer_start(struct enic *enic)
1681 switch (vnic_dev_get_intr_mode(enic->vdev)) {
1682 case VNIC_DEV_INTR_MODE_MSI:
1683 mod_timer(&enic->notify_timer, jiffies);
1684 break;
1685 default:
1686 /* Using intr for notification for INTx/MSI-X */
1687 break;
1691 /* rtnl lock is held, process context */
1692 static int enic_open(struct net_device *netdev)
1694 struct enic *enic = netdev_priv(netdev);
1695 unsigned int i;
1696 int err;
1698 err = enic_request_intr(enic);
1699 if (err) {
1700 printk(KERN_ERR PFX "%s: Unable to request irq.\n",
1701 netdev->name);
1702 return err;
1705 err = enic_notify_set(enic);
1706 if (err) {
1707 printk(KERN_ERR PFX
1708 "%s: Failed to alloc notify buffer, aborting.\n",
1709 netdev->name);
1710 goto err_out_free_intr;
1713 for (i = 0; i < enic->rq_count; i++) {
1714 vnic_rq_fill(&enic->rq[i], enic->rq_alloc_buf);
1715 /* Need at least one buffer on ring to get going */
1716 if (vnic_rq_desc_used(&enic->rq[i]) == 0) {
1717 printk(KERN_ERR PFX
1718 "%s: Unable to alloc receive buffers.\n",
1719 netdev->name);
1720 err = -ENOMEM;
1721 goto err_out_notify_unset;
1725 for (i = 0; i < enic->wq_count; i++)
1726 vnic_wq_enable(&enic->wq[i]);
1727 for (i = 0; i < enic->rq_count; i++)
1728 vnic_rq_enable(&enic->rq[i]);
1730 enic_dev_add_station_addr(enic);
1731 enic_set_multicast_list(netdev);
1733 netif_wake_queue(netdev);
1734 napi_enable(&enic->napi);
1735 spin_lock(&enic->devcmd_lock);
1736 vnic_dev_enable(enic->vdev);
1737 spin_unlock(&enic->devcmd_lock);
1739 for (i = 0; i < enic->intr_count; i++)
1740 vnic_intr_unmask(&enic->intr[i]);
1742 enic_notify_timer_start(enic);
1744 return 0;
1746 err_out_notify_unset:
1747 spin_lock(&enic->devcmd_lock);
1748 vnic_dev_notify_unset(enic->vdev);
1749 spin_unlock(&enic->devcmd_lock);
1750 err_out_free_intr:
1751 enic_free_intr(enic);
1753 return err;
1756 /* rtnl lock is held, process context */
1757 static int enic_stop(struct net_device *netdev)
1759 struct enic *enic = netdev_priv(netdev);
1760 unsigned int i;
1761 int err;
1763 for (i = 0; i < enic->intr_count; i++)
1764 vnic_intr_mask(&enic->intr[i]);
1766 enic_synchronize_irqs(enic);
1768 del_timer_sync(&enic->notify_timer);
1770 spin_lock(&enic->devcmd_lock);
1771 vnic_dev_disable(enic->vdev);
1772 spin_unlock(&enic->devcmd_lock);
1773 napi_disable(&enic->napi);
1774 netif_carrier_off(netdev);
1775 netif_tx_disable(netdev);
1777 enic_dev_del_station_addr(enic);
1779 for (i = 0; i < enic->wq_count; i++) {
1780 err = vnic_wq_disable(&enic->wq[i]);
1781 if (err)
1782 return err;
1784 for (i = 0; i < enic->rq_count; i++) {
1785 err = vnic_rq_disable(&enic->rq[i]);
1786 if (err)
1787 return err;
1790 spin_lock(&enic->devcmd_lock);
1791 vnic_dev_notify_unset(enic->vdev);
1792 spin_unlock(&enic->devcmd_lock);
1793 enic_free_intr(enic);
1795 for (i = 0; i < enic->wq_count; i++)
1796 vnic_wq_clean(&enic->wq[i], enic_free_wq_buf);
1797 for (i = 0; i < enic->rq_count; i++)
1798 vnic_rq_clean(&enic->rq[i], enic_free_rq_buf);
1799 for (i = 0; i < enic->cq_count; i++)
1800 vnic_cq_clean(&enic->cq[i]);
1801 for (i = 0; i < enic->intr_count; i++)
1802 vnic_intr_clean(&enic->intr[i]);
1804 return 0;
1807 static int enic_change_mtu(struct net_device *netdev, int new_mtu)
1809 struct enic *enic = netdev_priv(netdev);
1810 int running = netif_running(netdev);
1812 if (new_mtu < ENIC_MIN_MTU || new_mtu > ENIC_MAX_MTU)
1813 return -EINVAL;
1815 if (running)
1816 enic_stop(netdev);
1818 netdev->mtu = new_mtu;
1820 if (netdev->mtu > enic->port_mtu)
1821 printk(KERN_WARNING PFX
1822 "%s: interface MTU (%d) set higher "
1823 "than port MTU (%d)\n",
1824 netdev->name, netdev->mtu, enic->port_mtu);
1826 if (running)
1827 enic_open(netdev);
1829 return 0;
1832 #ifdef CONFIG_NET_POLL_CONTROLLER
1833 static void enic_poll_controller(struct net_device *netdev)
1835 struct enic *enic = netdev_priv(netdev);
1836 struct vnic_dev *vdev = enic->vdev;
1838 switch (vnic_dev_get_intr_mode(vdev)) {
1839 case VNIC_DEV_INTR_MODE_MSIX:
1840 enic_isr_msix_rq(enic->pdev->irq, enic);
1841 enic_isr_msix_wq(enic->pdev->irq, enic);
1842 break;
1843 case VNIC_DEV_INTR_MODE_MSI:
1844 enic_isr_msi(enic->pdev->irq, enic);
1845 break;
1846 case VNIC_DEV_INTR_MODE_INTX:
1847 enic_isr_legacy(enic->pdev->irq, netdev);
1848 break;
1849 default:
1850 break;
1853 #endif
1855 static int enic_dev_wait(struct vnic_dev *vdev,
1856 int (*start)(struct vnic_dev *, int),
1857 int (*finished)(struct vnic_dev *, int *),
1858 int arg)
1860 unsigned long time;
1861 int done;
1862 int err;
1864 BUG_ON(in_interrupt());
1866 err = start(vdev, arg);
1867 if (err)
1868 return err;
1870 /* Wait for func to complete...2 seconds max
1873 time = jiffies + (HZ * 2);
1874 do {
1876 err = finished(vdev, &done);
1877 if (err)
1878 return err;
1880 if (done)
1881 return 0;
1883 schedule_timeout_uninterruptible(HZ / 10);
1885 } while (time_after(time, jiffies));
1887 return -ETIMEDOUT;
1890 static int enic_dev_open(struct enic *enic)
1892 int err;
1894 err = enic_dev_wait(enic->vdev, vnic_dev_open,
1895 vnic_dev_open_done, 0);
1896 if (err)
1897 printk(KERN_ERR PFX
1898 "vNIC device open failed, err %d.\n", err);
1900 return err;
1903 static int enic_dev_soft_reset(struct enic *enic)
1905 int err;
1907 err = enic_dev_wait(enic->vdev, vnic_dev_soft_reset,
1908 vnic_dev_soft_reset_done, 0);
1909 if (err)
1910 printk(KERN_ERR PFX
1911 "vNIC soft reset failed, err %d.\n", err);
1913 return err;
1916 static int enic_set_niccfg(struct enic *enic)
1918 const u8 rss_default_cpu = 0;
1919 const u8 rss_hash_type = 0;
1920 const u8 rss_hash_bits = 0;
1921 const u8 rss_base_cpu = 0;
1922 const u8 rss_enable = 0;
1923 const u8 tso_ipid_split_en = 0;
1924 const u8 ig_vlan_strip_en = 1;
1926 /* Enable VLAN tag stripping. RSS not enabled (yet).
1929 return enic_set_nic_cfg(enic,
1930 rss_default_cpu, rss_hash_type,
1931 rss_hash_bits, rss_base_cpu,
1932 rss_enable, tso_ipid_split_en,
1933 ig_vlan_strip_en);
1936 static void enic_reset(struct work_struct *work)
1938 struct enic *enic = container_of(work, struct enic, reset);
1940 if (!netif_running(enic->netdev))
1941 return;
1943 rtnl_lock();
1945 spin_lock(&enic->devcmd_lock);
1946 vnic_dev_hang_notify(enic->vdev);
1947 spin_unlock(&enic->devcmd_lock);
1949 enic_stop(enic->netdev);
1950 enic_dev_soft_reset(enic);
1951 vnic_dev_init(enic->vdev, 0);
1952 enic_reset_mcaddrs(enic);
1953 enic_init_vnic_resources(enic);
1954 enic_set_niccfg(enic);
1955 enic_open(enic->netdev);
1957 rtnl_unlock();
1960 static int enic_set_intr_mode(struct enic *enic)
1962 unsigned int n = 1;
1963 unsigned int m = 1;
1964 unsigned int i;
1966 /* Set interrupt mode (INTx, MSI, MSI-X) depending
1967 * system capabilities.
1969 * Try MSI-X first
1971 * We need n RQs, m WQs, n+m CQs, and n+m+2 INTRs
1972 * (the second to last INTR is used for WQ/RQ errors)
1973 * (the last INTR is used for notifications)
1976 BUG_ON(ARRAY_SIZE(enic->msix_entry) < n + m + 2);
1977 for (i = 0; i < n + m + 2; i++)
1978 enic->msix_entry[i].entry = i;
1980 if (enic->config.intr_mode < 1 &&
1981 enic->rq_count >= n &&
1982 enic->wq_count >= m &&
1983 enic->cq_count >= n + m &&
1984 enic->intr_count >= n + m + 2 &&
1985 !pci_enable_msix(enic->pdev, enic->msix_entry, n + m + 2)) {
1987 enic->rq_count = n;
1988 enic->wq_count = m;
1989 enic->cq_count = n + m;
1990 enic->intr_count = n + m + 2;
1992 vnic_dev_set_intr_mode(enic->vdev, VNIC_DEV_INTR_MODE_MSIX);
1994 return 0;
1997 /* Next try MSI
1999 * We need 1 RQ, 1 WQ, 2 CQs, and 1 INTR
2002 if (enic->config.intr_mode < 2 &&
2003 enic->rq_count >= 1 &&
2004 enic->wq_count >= 1 &&
2005 enic->cq_count >= 2 &&
2006 enic->intr_count >= 1 &&
2007 !pci_enable_msi(enic->pdev)) {
2009 enic->rq_count = 1;
2010 enic->wq_count = 1;
2011 enic->cq_count = 2;
2012 enic->intr_count = 1;
2014 vnic_dev_set_intr_mode(enic->vdev, VNIC_DEV_INTR_MODE_MSI);
2016 return 0;
2019 /* Next try INTx
2021 * We need 1 RQ, 1 WQ, 2 CQs, and 3 INTRs
2022 * (the first INTR is used for WQ/RQ)
2023 * (the second INTR is used for WQ/RQ errors)
2024 * (the last INTR is used for notifications)
2027 if (enic->config.intr_mode < 3 &&
2028 enic->rq_count >= 1 &&
2029 enic->wq_count >= 1 &&
2030 enic->cq_count >= 2 &&
2031 enic->intr_count >= 3) {
2033 enic->rq_count = 1;
2034 enic->wq_count = 1;
2035 enic->cq_count = 2;
2036 enic->intr_count = 3;
2038 vnic_dev_set_intr_mode(enic->vdev, VNIC_DEV_INTR_MODE_INTX);
2040 return 0;
2043 vnic_dev_set_intr_mode(enic->vdev, VNIC_DEV_INTR_MODE_UNKNOWN);
2045 return -EINVAL;
2048 static void enic_clear_intr_mode(struct enic *enic)
2050 switch (vnic_dev_get_intr_mode(enic->vdev)) {
2051 case VNIC_DEV_INTR_MODE_MSIX:
2052 pci_disable_msix(enic->pdev);
2053 break;
2054 case VNIC_DEV_INTR_MODE_MSI:
2055 pci_disable_msi(enic->pdev);
2056 break;
2057 default:
2058 break;
2061 vnic_dev_set_intr_mode(enic->vdev, VNIC_DEV_INTR_MODE_UNKNOWN);
2064 static const struct net_device_ops enic_netdev_dynamic_ops = {
2065 .ndo_open = enic_open,
2066 .ndo_stop = enic_stop,
2067 .ndo_start_xmit = enic_hard_start_xmit,
2068 .ndo_get_stats = enic_get_stats,
2069 .ndo_validate_addr = eth_validate_addr,
2070 .ndo_set_multicast_list = enic_set_multicast_list,
2071 .ndo_set_mac_address = enic_set_mac_address_dynamic,
2072 .ndo_change_mtu = enic_change_mtu,
2073 .ndo_vlan_rx_register = enic_vlan_rx_register,
2074 .ndo_vlan_rx_add_vid = enic_vlan_rx_add_vid,
2075 .ndo_vlan_rx_kill_vid = enic_vlan_rx_kill_vid,
2076 .ndo_tx_timeout = enic_tx_timeout,
2077 .ndo_set_vf_port = enic_set_vf_port,
2078 .ndo_get_vf_port = enic_get_vf_port,
2079 #ifdef CONFIG_NET_POLL_CONTROLLER
2080 .ndo_poll_controller = enic_poll_controller,
2081 #endif
2084 static const struct net_device_ops enic_netdev_ops = {
2085 .ndo_open = enic_open,
2086 .ndo_stop = enic_stop,
2087 .ndo_start_xmit = enic_hard_start_xmit,
2088 .ndo_get_stats = enic_get_stats,
2089 .ndo_validate_addr = eth_validate_addr,
2090 .ndo_set_multicast_list = enic_set_multicast_list,
2091 .ndo_set_mac_address = enic_set_mac_address,
2092 .ndo_change_mtu = enic_change_mtu,
2093 .ndo_vlan_rx_register = enic_vlan_rx_register,
2094 .ndo_vlan_rx_add_vid = enic_vlan_rx_add_vid,
2095 .ndo_vlan_rx_kill_vid = enic_vlan_rx_kill_vid,
2096 .ndo_tx_timeout = enic_tx_timeout,
2097 #ifdef CONFIG_NET_POLL_CONTROLLER
2098 .ndo_poll_controller = enic_poll_controller,
2099 #endif
2102 void enic_dev_deinit(struct enic *enic)
2104 netif_napi_del(&enic->napi);
2105 enic_free_vnic_resources(enic);
2106 enic_clear_intr_mode(enic);
2109 int enic_dev_init(struct enic *enic)
2111 struct net_device *netdev = enic->netdev;
2112 int err;
2114 /* Get vNIC configuration
2117 err = enic_get_vnic_config(enic);
2118 if (err) {
2119 printk(KERN_ERR PFX
2120 "Get vNIC configuration failed, aborting.\n");
2121 return err;
2124 /* Get available resource counts
2127 enic_get_res_counts(enic);
2129 /* Set interrupt mode based on resource counts and system
2130 * capabilities
2133 err = enic_set_intr_mode(enic);
2134 if (err) {
2135 printk(KERN_ERR PFX
2136 "Failed to set intr mode based on resource "
2137 "counts and system capabilities, aborting.\n");
2138 return err;
2141 /* Allocate and configure vNIC resources
2144 err = enic_alloc_vnic_resources(enic);
2145 if (err) {
2146 printk(KERN_ERR PFX
2147 "Failed to alloc vNIC resources, aborting.\n");
2148 goto err_out_free_vnic_resources;
2151 enic_init_vnic_resources(enic);
2153 err = enic_set_rq_alloc_buf(enic);
2154 if (err) {
2155 printk(KERN_ERR PFX
2156 "Failed to set RQ buffer allocator, aborting.\n");
2157 goto err_out_free_vnic_resources;
2160 err = enic_set_niccfg(enic);
2161 if (err) {
2162 printk(KERN_ERR PFX
2163 "Failed to config nic, aborting.\n");
2164 goto err_out_free_vnic_resources;
2167 switch (vnic_dev_get_intr_mode(enic->vdev)) {
2168 default:
2169 netif_napi_add(netdev, &enic->napi, enic_poll, 64);
2170 break;
2171 case VNIC_DEV_INTR_MODE_MSIX:
2172 netif_napi_add(netdev, &enic->napi, enic_poll_msix, 64);
2173 break;
2176 return 0;
2178 err_out_free_vnic_resources:
2179 enic_clear_intr_mode(enic);
2180 enic_free_vnic_resources(enic);
2182 return err;
2185 static void enic_iounmap(struct enic *enic)
2187 unsigned int i;
2189 for (i = 0; i < ARRAY_SIZE(enic->bar); i++)
2190 if (enic->bar[i].vaddr)
2191 iounmap(enic->bar[i].vaddr);
2194 static int __devinit enic_probe(struct pci_dev *pdev,
2195 const struct pci_device_id *ent)
2197 struct net_device *netdev;
2198 struct enic *enic;
2199 int using_dac = 0;
2200 unsigned int i;
2201 int err;
2203 /* Allocate net device structure and initialize. Private
2204 * instance data is initialized to zero.
2207 netdev = alloc_etherdev(sizeof(struct enic));
2208 if (!netdev) {
2209 printk(KERN_ERR PFX "Etherdev alloc failed, aborting.\n");
2210 return -ENOMEM;
2213 pci_set_drvdata(pdev, netdev);
2215 SET_NETDEV_DEV(netdev, &pdev->dev);
2217 enic = netdev_priv(netdev);
2218 enic->netdev = netdev;
2219 enic->pdev = pdev;
2221 /* Setup PCI resources
2224 err = pci_enable_device(pdev);
2225 if (err) {
2226 printk(KERN_ERR PFX
2227 "Cannot enable PCI device, aborting.\n");
2228 goto err_out_free_netdev;
2231 err = pci_request_regions(pdev, DRV_NAME);
2232 if (err) {
2233 printk(KERN_ERR PFX
2234 "Cannot request PCI regions, aborting.\n");
2235 goto err_out_disable_device;
2238 pci_set_master(pdev);
2240 /* Query PCI controller on system for DMA addressing
2241 * limitation for the device. Try 40-bit first, and
2242 * fail to 32-bit.
2245 err = pci_set_dma_mask(pdev, DMA_BIT_MASK(40));
2246 if (err) {
2247 err = pci_set_dma_mask(pdev, DMA_BIT_MASK(32));
2248 if (err) {
2249 printk(KERN_ERR PFX
2250 "No usable DMA configuration, aborting.\n");
2251 goto err_out_release_regions;
2253 err = pci_set_consistent_dma_mask(pdev, DMA_BIT_MASK(32));
2254 if (err) {
2255 printk(KERN_ERR PFX
2256 "Unable to obtain 32-bit DMA "
2257 "for consistent allocations, aborting.\n");
2258 goto err_out_release_regions;
2260 } else {
2261 err = pci_set_consistent_dma_mask(pdev, DMA_BIT_MASK(40));
2262 if (err) {
2263 printk(KERN_ERR PFX
2264 "Unable to obtain 40-bit DMA "
2265 "for consistent allocations, aborting.\n");
2266 goto err_out_release_regions;
2268 using_dac = 1;
2271 /* Map vNIC resources from BAR0-5
2274 for (i = 0; i < ARRAY_SIZE(enic->bar); i++) {
2275 if (!(pci_resource_flags(pdev, i) & IORESOURCE_MEM))
2276 continue;
2277 enic->bar[i].len = pci_resource_len(pdev, i);
2278 enic->bar[i].vaddr = pci_iomap(pdev, i, enic->bar[i].len);
2279 if (!enic->bar[i].vaddr) {
2280 printk(KERN_ERR PFX
2281 "Cannot memory-map BAR %d, aborting.\n", i);
2282 err = -ENODEV;
2283 goto err_out_iounmap;
2285 enic->bar[i].bus_addr = pci_resource_start(pdev, i);
2288 /* Register vNIC device
2291 enic->vdev = vnic_dev_register(NULL, enic, pdev, enic->bar,
2292 ARRAY_SIZE(enic->bar));
2293 if (!enic->vdev) {
2294 printk(KERN_ERR PFX
2295 "vNIC registration failed, aborting.\n");
2296 err = -ENODEV;
2297 goto err_out_iounmap;
2300 /* Issue device open to get device in known state
2303 err = enic_dev_open(enic);
2304 if (err) {
2305 printk(KERN_ERR PFX
2306 "vNIC dev open failed, aborting.\n");
2307 goto err_out_vnic_unregister;
2310 /* Issue device init to initialize the vnic-to-switch link.
2311 * We'll start with carrier off and wait for link UP
2312 * notification later to turn on carrier. We don't need
2313 * to wait here for the vnic-to-switch link initialization
2314 * to complete; link UP notification is the indication that
2315 * the process is complete.
2318 netif_carrier_off(netdev);
2320 if (!enic_is_dynamic(enic)) {
2321 err = vnic_dev_init(enic->vdev, 0);
2322 if (err) {
2323 printk(KERN_ERR PFX
2324 "vNIC dev init failed, aborting.\n");
2325 goto err_out_dev_close;
2329 err = enic_dev_init(enic);
2330 if (err) {
2331 printk(KERN_ERR PFX
2332 "Device initialization failed, aborting.\n");
2333 goto err_out_dev_close;
2336 /* Setup notification timer, HW reset task, and locks
2339 init_timer(&enic->notify_timer);
2340 enic->notify_timer.function = enic_notify_timer;
2341 enic->notify_timer.data = (unsigned long)enic;
2343 INIT_WORK(&enic->reset, enic_reset);
2345 for (i = 0; i < enic->wq_count; i++)
2346 spin_lock_init(&enic->wq_lock[i]);
2348 spin_lock_init(&enic->devcmd_lock);
2350 /* Register net device
2353 enic->port_mtu = enic->config.mtu;
2354 (void)enic_change_mtu(netdev, enic->port_mtu);
2356 err = enic_set_mac_addr(netdev, enic->mac_addr);
2357 if (err) {
2358 printk(KERN_ERR PFX
2359 "Invalid MAC address, aborting.\n");
2360 goto err_out_dev_deinit;
2363 enic->tx_coalesce_usecs = enic->config.intr_timer_usec;
2364 enic->rx_coalesce_usecs = enic->tx_coalesce_usecs;
2366 if (enic_is_dynamic(enic))
2367 netdev->netdev_ops = &enic_netdev_dynamic_ops;
2368 else
2369 netdev->netdev_ops = &enic_netdev_ops;
2371 netdev->watchdog_timeo = 2 * HZ;
2372 netdev->ethtool_ops = &enic_ethtool_ops;
2374 netdev->features |= NETIF_F_HW_VLAN_TX | NETIF_F_HW_VLAN_RX;
2375 if (ENIC_SETTING(enic, TXCSUM))
2376 netdev->features |= NETIF_F_SG | NETIF_F_HW_CSUM;
2377 if (ENIC_SETTING(enic, TSO))
2378 netdev->features |= NETIF_F_TSO |
2379 NETIF_F_TSO6 | NETIF_F_TSO_ECN;
2380 if (ENIC_SETTING(enic, LRO))
2381 netdev->features |= NETIF_F_LRO;
2382 if (using_dac)
2383 netdev->features |= NETIF_F_HIGHDMA;
2385 enic->csum_rx_enabled = ENIC_SETTING(enic, RXCSUM);
2387 enic->lro_mgr.max_aggr = ENIC_LRO_MAX_AGGR;
2388 enic->lro_mgr.max_desc = ENIC_LRO_MAX_DESC;
2389 enic->lro_mgr.lro_arr = enic->lro_desc;
2390 enic->lro_mgr.get_skb_header = enic_get_skb_header;
2391 enic->lro_mgr.features = LRO_F_NAPI | LRO_F_EXTRACT_VLAN_ID;
2392 enic->lro_mgr.dev = netdev;
2393 enic->lro_mgr.ip_summed = CHECKSUM_COMPLETE;
2394 enic->lro_mgr.ip_summed_aggr = CHECKSUM_UNNECESSARY;
2396 err = register_netdev(netdev);
2397 if (err) {
2398 printk(KERN_ERR PFX
2399 "Cannot register net device, aborting.\n");
2400 goto err_out_dev_deinit;
2403 return 0;
2405 err_out_dev_deinit:
2406 enic_dev_deinit(enic);
2407 err_out_dev_close:
2408 vnic_dev_close(enic->vdev);
2409 err_out_vnic_unregister:
2410 vnic_dev_unregister(enic->vdev);
2411 err_out_iounmap:
2412 enic_iounmap(enic);
2413 err_out_release_regions:
2414 pci_release_regions(pdev);
2415 err_out_disable_device:
2416 pci_disable_device(pdev);
2417 err_out_free_netdev:
2418 pci_set_drvdata(pdev, NULL);
2419 free_netdev(netdev);
2421 return err;
2424 static void __devexit enic_remove(struct pci_dev *pdev)
2426 struct net_device *netdev = pci_get_drvdata(pdev);
2428 if (netdev) {
2429 struct enic *enic = netdev_priv(netdev);
2431 flush_scheduled_work();
2432 unregister_netdev(netdev);
2433 enic_dev_deinit(enic);
2434 vnic_dev_close(enic->vdev);
2435 vnic_dev_unregister(enic->vdev);
2436 enic_iounmap(enic);
2437 pci_release_regions(pdev);
2438 pci_disable_device(pdev);
2439 pci_set_drvdata(pdev, NULL);
2440 free_netdev(netdev);
2444 static struct pci_driver enic_driver = {
2445 .name = DRV_NAME,
2446 .id_table = enic_id_table,
2447 .probe = enic_probe,
2448 .remove = __devexit_p(enic_remove),
2451 static int __init enic_init_module(void)
2453 printk(KERN_INFO PFX "%s, ver %s\n", DRV_DESCRIPTION, DRV_VERSION);
2455 return pci_register_driver(&enic_driver);
2458 static void __exit enic_cleanup_module(void)
2460 pci_unregister_driver(&enic_driver);
2463 module_init(enic_init_module);
2464 module_exit(enic_cleanup_module);