1 /* SPDX-License-Identifier: GPL-2.0 OR Linux-OpenIB */
3 * Copyright 2015-2020 Amazon.com, Inc. or its affiliates. All rights reserved.
9 #include <linux/bitops.h>
10 #include <linux/dim.h>
11 #include <linux/etherdevice.h>
12 #include <linux/if_vlan.h>
13 #include <linux/inetdevice.h>
14 #include <linux/interrupt.h>
15 #include <linux/netdevice.h>
16 #include <linux/skbuff.h>
19 #include "ena_eth_com.h"
21 #define DRV_MODULE_GEN_MAJOR 2
22 #define DRV_MODULE_GEN_MINOR 1
23 #define DRV_MODULE_GEN_SUBMINOR 0
25 #define DRV_MODULE_NAME "ena"
27 #define DEVICE_NAME "Elastic Network Adapter (ENA)"
29 /* 1 for AENQ + ADMIN */
30 #define ENA_ADMIN_MSIX_VEC 1
31 #define ENA_MAX_MSIX_VEC(io_queues) (ENA_ADMIN_MSIX_VEC + (io_queues))
33 /* The ENA buffer length fields is 16 bit long. So when PAGE_SIZE == 64kB the
35 * Since the max packet size the ENA handles is ~9kB limit the buffer length to
38 #if PAGE_SIZE > SZ_16K
39 #define ENA_PAGE_SIZE (_AC(SZ_16K, UL))
41 #define ENA_PAGE_SIZE PAGE_SIZE
44 #define ENA_MIN_MSIX_VEC 2
48 #define ENA_BAR_MASK (BIT(ENA_REG_BAR) | BIT(ENA_MEM_BAR))
50 #define ENA_DEFAULT_RING_SIZE (1024)
51 #define ENA_MIN_RING_SIZE (256)
53 #define ENA_MIN_NUM_IO_QUEUES (1)
55 #define ENA_TX_WAKEUP_THRESH (MAX_SKB_FRAGS + 2)
56 #define ENA_DEFAULT_RX_COPYBREAK (256 - NET_IP_ALIGN)
58 /* limit the buffer size to 600 bytes to handle MTU changes from very
59 * small to very large, in which case the number of buffers per packet
60 * could exceed ENA_PKT_MAX_BUFS
62 #define ENA_DEFAULT_MIN_RX_BUFF_ALLOC_SIZE 600
64 #define ENA_MIN_MTU 128
66 #define ENA_NAME_MAX_LEN 20
67 #define ENA_IRQNAME_SIZE 40
69 #define ENA_PKT_MAX_BUFS 19
71 #define ENA_RX_RSS_TABLE_LOG_SIZE 7
72 #define ENA_RX_RSS_TABLE_SIZE (1 << ENA_RX_RSS_TABLE_LOG_SIZE)
74 /* The number of tx packet completions that will be handled each NAPI poll
75 * cycle is ring_size / ENA_TX_POLL_BUDGET_DIVIDER.
77 #define ENA_TX_POLL_BUDGET_DIVIDER 4
79 /* Refill Rx queue when number of required descriptors is above
80 * QUEUE_SIZE / ENA_RX_REFILL_THRESH_DIVIDER or ENA_RX_REFILL_THRESH_PACKET
82 #define ENA_RX_REFILL_THRESH_DIVIDER 8
83 #define ENA_RX_REFILL_THRESH_PACKET 256
85 /* Number of queues to check for missing queues per timer service */
86 #define ENA_MONITORED_TX_QUEUES 4
87 /* Max timeout packets before device reset */
88 #define MAX_NUM_OF_TIMEOUTED_PACKETS 128
90 #define ENA_TX_RING_IDX_NEXT(idx, ring_size) (((idx) + 1) & ((ring_size) - 1))
92 #define ENA_RX_RING_IDX_NEXT(idx, ring_size) (((idx) + 1) & ((ring_size) - 1))
93 #define ENA_RX_RING_IDX_ADD(idx, n, ring_size) \
94 (((idx) + (n)) & ((ring_size) - 1))
96 #define ENA_IO_TXQ_IDX(q) (2 * (q))
97 #define ENA_IO_RXQ_IDX(q) (2 * (q) + 1)
98 #define ENA_IO_TXQ_IDX_TO_COMBINED_IDX(q) ((q) / 2)
99 #define ENA_IO_RXQ_IDX_TO_COMBINED_IDX(q) (((q) - 1) / 2)
101 #define ENA_MGMNT_IRQ_IDX 0
102 #define ENA_IO_IRQ_FIRST_IDX 1
103 #define ENA_IO_IRQ_IDX(q) (ENA_IO_IRQ_FIRST_IDX + (q))
105 #define ENA_ADMIN_POLL_DELAY_US 100
107 /* ENA device should send keep alive msg every 1 sec.
108 * We wait for 6 sec just to be on the safe side.
110 #define ENA_DEVICE_KALIVE_TIMEOUT (6 * HZ)
111 #define ENA_MAX_NO_INTERRUPT_ITERATIONS 3
113 #define ENA_MMIO_DISABLE_REG_READ BIT(0)
115 /* The max MTU size is configured to be the ethernet frame size without
116 * the overhead of the ethernet header, which can have a VLAN header, and
117 * a frame check sequence (FCS).
118 * The buffer size we share with the device is defined to be ENA_PAGE_SIZE
121 #define ENA_XDP_MAX_MTU (ENA_PAGE_SIZE - ETH_HLEN - ETH_FCS_LEN - \
122 VLAN_HLEN - XDP_PACKET_HEADROOM - \
123 SKB_DATA_ALIGN(sizeof(struct skb_shared_info)))
125 #define ENA_IS_XDP_INDEX(adapter, index) (((index) >= (adapter)->xdp_first_ring) && \
126 ((index) < (adapter)->xdp_first_ring + (adapter)->xdp_num_queues))
129 irq_handler_t handler
;
133 cpumask_t affinity_hint_mask
;
134 char name
[ENA_IRQNAME_SIZE
];
138 struct napi_struct napi ____cacheline_aligned
;
139 struct ena_ring
*tx_ring
;
140 struct ena_ring
*rx_ring
;
141 struct ena_ring
*xdp_ring
;
142 bool first_interrupt
;
143 bool interrupts_masked
;
148 struct ena_calc_queue_size_ctx
{
149 struct ena_com_dev_get_features_ctx
*get_feat_ctx
;
150 struct ena_com_dev
*ena_dev
;
151 struct pci_dev
*pdev
;
154 u32 max_tx_queue_size
;
155 u32 max_rx_queue_size
;
160 struct ena_tx_buffer
{
162 /* num of ena desc for this specific skb
163 * (includes data desc and metadata desc)
166 /* num of buffers used by this skb */
169 /* XDP buffer structure which is used for sending packets in
172 struct xdp_frame
*xdpf
;
174 /* Indicate if bufs[0] map the linear data of the skb. */
177 /* Used for detect missing tx packets to limit the number of prints */
179 /* Save the last jiffies to detect missing tx packets
181 * sets to non zero value on ena_start_xmit and set to zero on
182 * napi and timer_Service_routine.
184 * while this value is not protected by lock,
185 * a given packet is not expected to be handled by ena_start_xmit
186 * and by napi/timer_service at the same time.
188 unsigned long last_jiffies
;
189 struct ena_com_buf bufs
[ENA_PKT_MAX_BUFS
];
190 } ____cacheline_aligned
;
192 struct ena_rx_buffer
{
196 struct ena_com_buf ena_buf
;
197 } ____cacheline_aligned
;
199 struct ena_stats_tx
{
207 u64 linearize_failed
;
214 u64 unmask_interrupt
;
217 struct ena_stats_rx
{
220 u64 rx_copybreak_pkt
;
240 /* Holds the empty requests for TX/RX
241 * out of order completions
246 struct ena_tx_buffer
*tx_buffer_info
;
247 struct ena_rx_buffer
*rx_buffer_info
;
250 /* cache ptr to avoid using the adapter */
252 struct pci_dev
*pdev
;
253 struct napi_struct
*napi
;
254 struct net_device
*netdev
;
255 struct ena_com_dev
*ena_dev
;
256 struct ena_adapter
*adapter
;
257 struct ena_com_io_cq
*ena_com_io_cq
;
258 struct ena_com_io_sq
*ena_com_io_sq
;
259 struct bpf_prog
*xdp_bpf_prog
;
260 struct xdp_rxq_info xdp_rxq
;
261 spinlock_t xdp_tx_lock
; /* synchronize XDP TX/Redirect traffic */
271 /* The maximum header length the device can handle */
272 u8 tx_max_header_size
;
274 bool first_interrupt
;
275 bool disable_meta_caching
;
276 u16 no_interrupt_event_cnt
;
280 /* number of tx/rx_buffer_info's entries */
283 enum ena_admin_placement_policy_type tx_mem_queue_type
;
285 struct ena_com_rx_buf_info ena_bufs
[ENA_PKT_MAX_BUFS
];
286 u32 smoothed_interval
;
287 u32 per_napi_packets
;
288 u16 non_empty_napi_events
;
289 struct u64_stats_sync syncp
;
291 struct ena_stats_tx tx_stats
;
292 struct ena_stats_rx rx_stats
;
295 u8
*push_buf_intermediate_buf
;
297 } ____cacheline_aligned
;
299 struct ena_stats_dev
{
312 ENA_FLAG_DEVICE_RUNNING
,
315 ENA_FLAG_MSIX_ENABLED
,
316 ENA_FLAG_TRIGGER_RESET
,
317 ENA_FLAG_ONGOING_RESET
320 /* adapter specific private data structure */
322 struct ena_com_dev
*ena_dev
;
323 /* OS defined structs */
324 struct net_device
*netdev
;
325 struct pci_dev
*pdev
;
327 /* rx packets that shorter that this len will be copied to the skb
334 u32 max_num_io_queues
;
338 u32 missing_tx_completion_threshold
;
340 u32 requested_tx_ring_size
;
341 u32 requested_rx_ring_size
;
343 u32 max_tx_ring_size
;
344 u32 max_rx_ring_size
;
351 u8 mac_addr
[ETH_ALEN
];
353 unsigned long keep_alive_timeout
;
354 unsigned long missing_tx_completion_to
;
356 char name
[ENA_NAME_MAX_LEN
];
360 struct ena_ring tx_ring
[ENA_MAX_NUM_IO_QUEUES
]
361 ____cacheline_aligned_in_smp
;
364 struct ena_ring rx_ring
[ENA_MAX_NUM_IO_QUEUES
]
365 ____cacheline_aligned_in_smp
;
367 struct ena_napi ena_napi
[ENA_MAX_NUM_IO_QUEUES
];
369 struct ena_irq irq_tbl
[ENA_MAX_MSIX_VEC(ENA_MAX_NUM_IO_QUEUES
)];
372 struct work_struct reset_task
;
373 struct timer_list timer_service
;
376 bool dev_up_before_reset
;
377 bool disable_meta_caching
;
378 unsigned long last_keep_alive_jiffies
;
380 struct u64_stats_sync syncp
;
381 struct ena_stats_dev dev_stats
;
382 struct ena_admin_eni_stats eni_stats
;
383 bool eni_stats_supported
;
385 /* last queue index that was checked for uncompleted tx packets */
386 u32 last_monitored_tx_qid
;
388 enum ena_regs_reset_reason_types reset_reason
;
390 struct bpf_prog
*xdp_bpf_prog
;
395 void ena_set_ethtool_ops(struct net_device
*netdev
);
397 void ena_dump_stats_to_dmesg(struct ena_adapter
*adapter
);
399 void ena_dump_stats_to_buf(struct ena_adapter
*adapter
, u8
*buf
);
401 int ena_update_hw_stats(struct ena_adapter
*adapter
);
403 int ena_update_queue_sizes(struct ena_adapter
*adapter
,
407 int ena_update_queue_count(struct ena_adapter
*adapter
, u32 new_channel_count
);
409 int ena_get_sset_count(struct net_device
*netdev
, int sset
);
411 enum ena_xdp_errors_t
{
413 ENA_XDP_CURRENT_MTU_TOO_LARGE
,
414 ENA_XDP_NO_ENOUGH_QUEUES
,
417 static inline bool ena_xdp_queues_present(struct ena_adapter
*adapter
)
419 return adapter
->xdp_first_ring
!= 0;
422 static inline bool ena_xdp_present(struct ena_adapter
*adapter
)
424 return !!adapter
->xdp_bpf_prog
;
427 static inline bool ena_xdp_present_ring(struct ena_ring
*ring
)
429 return !!ring
->xdp_bpf_prog
;
432 static inline bool ena_xdp_legal_queue_count(struct ena_adapter
*adapter
,
435 return 2 * queues
<= adapter
->max_num_io_queues
;
438 static inline enum ena_xdp_errors_t
ena_xdp_allowed(struct ena_adapter
*adapter
)
440 enum ena_xdp_errors_t rc
= ENA_XDP_ALLOWED
;
442 if (adapter
->netdev
->mtu
> ENA_XDP_MAX_MTU
)
443 rc
= ENA_XDP_CURRENT_MTU_TOO_LARGE
;
444 else if (!ena_xdp_legal_queue_count(adapter
, adapter
->num_io_queues
))
445 rc
= ENA_XDP_NO_ENOUGH_QUEUES
;
450 #endif /* !(ENA_H) */