1 /* SPDX-License-Identifier: GPL-2.0 */
2 #ifndef _LINUX_NET_QUEUES_H
3 #define _LINUX_NET_QUEUES_H
5 #include <linux/netdevice.h>
7 /* See the netdev.yaml spec for definition of each statistic */
8 struct netdev_queue_stats_rx
{
22 u64 hw_gro_wire_packets
;
23 u64 hw_gro_wire_bytes
;
25 u64 hw_drop_ratelimits
;
28 struct netdev_queue_stats_tx
{
40 u64 hw_gso_wire_packets
;
41 u64 hw_gso_wire_bytes
;
43 u64 hw_drop_ratelimits
;
50 * struct netdev_stat_ops - netdev ops for fine grained stats
51 * @get_queue_stats_rx: get stats for a given Rx queue
52 * @get_queue_stats_tx: get stats for a given Tx queue
53 * @get_base_stats: get base stats (not belonging to any live instance)
55 * Query stats for a given object. The values of the statistics are undefined
56 * on entry (specifically they are *not* zero-initialized). Drivers should
57 * assign values only to the statistics they collect. Statistics which are not
58 * collected must be left undefined.
60 * Queue objects are not necessarily persistent, and only currently active
61 * queues are queried by the per-queue callbacks. This means that per-queue
62 * statistics will not generally add up to the total number of events for
63 * the device. The @get_base_stats callback allows filling in the delta
64 * between events for currently live queues and overall device history.
65 * @get_base_stats can also be used to report any miscellaneous packets
66 * transferred outside of the main set of queues used by the networking stack.
67 * When the statistics for the entire device are queried, first @get_base_stats
68 * is issued to collect the delta, and then a series of per-queue callbacks.
69 * Only statistics which are set in @get_base_stats will be reported
70 * at the device level, meaning that unlike in queue callbacks, setting
71 * a statistic to zero in @get_base_stats is a legitimate thing to do.
72 * This is because @get_base_stats has a second function of designating which
73 * statistics are in fact correct for the entire device (e.g. when history
74 * for some of the events is not maintained, and reliable "total" cannot
77 * Device drivers can assume that when collecting total device stats,
78 * the @get_base_stats and subsequent per-queue calls are performed
79 * "atomically" (without releasing the rtnl_lock).
81 * Device drivers are encouraged to reset the per-queue statistics when
82 * number of queues change. This is because the primary use case for
83 * per-queue statistics is currently to detect traffic imbalance.
85 struct netdev_stat_ops
{
86 void (*get_queue_stats_rx
)(struct net_device
*dev
, int idx
,
87 struct netdev_queue_stats_rx
*stats
);
88 void (*get_queue_stats_tx
)(struct net_device
*dev
, int idx
,
89 struct netdev_queue_stats_tx
*stats
);
90 void (*get_base_stats
)(struct net_device
*dev
,
91 struct netdev_queue_stats_rx
*rx
,
92 struct netdev_queue_stats_tx
*tx
);
96 * struct netdev_queue_mgmt_ops - netdev ops for queue management
98 * @ndo_queue_mem_size: Size of the struct that describes a queue's memory.
100 * @ndo_queue_mem_alloc: Allocate memory for an RX queue at the specified index.
101 * The new memory is written at the specified address.
103 * @ndo_queue_mem_free: Free memory from an RX queue.
105 * @ndo_queue_start: Start an RX queue with the specified memory and at the
108 * @ndo_queue_stop: Stop the RX queue at the specified index. The stopped
109 * queue's memory is written at the specified address.
111 struct netdev_queue_mgmt_ops
{
112 size_t ndo_queue_mem_size
;
113 int (*ndo_queue_mem_alloc
)(struct net_device
*dev
,
116 void (*ndo_queue_mem_free
)(struct net_device
*dev
,
117 void *per_queue_mem
);
118 int (*ndo_queue_start
)(struct net_device
*dev
,
121 int (*ndo_queue_stop
)(struct net_device
*dev
,
127 * DOC: Lockless queue stopping / waking helpers.
129 * The netif_txq_maybe_stop() and __netif_txq_completed_wake()
130 * macros are designed to safely implement stopping
131 * and waking netdev queues without full lock protection.
133 * We assume that there can be no concurrent stop attempts and no concurrent
134 * wake attempts. The try-stop should happen from the xmit handler,
135 * while wake up should be triggered from NAPI poll context.
136 * The two may run concurrently (single producer, single consumer).
138 * The try-stop side is expected to run from the xmit handler and therefore
139 * it does not reschedule Tx (netif_tx_start_queue() instead of
140 * netif_tx_wake_queue()). Uses of the ``stop`` macros outside of the xmit
141 * handler may lead to xmit queue being enabled but not run.
142 * The waking side does not have similar context restrictions.
144 * The macros guarantee that rings will not remain stopped if there's
145 * space available, but they do *not* prevent false wake ups when
146 * the ring is full! Drivers should check for ring full at the start
147 * for the xmit handler.
149 * All descriptor ring indexes (and other relevant shared state) must
150 * be updated before invoking the macros.
153 #define netif_txq_try_stop(txq, get_desc, start_thrs) \
157 netif_tx_stop_queue(txq); \
158 /* Producer index and stop bit must be visible \
159 * to consumer before we recheck. \
160 * Pairs with a barrier in __netif_txq_completed_wake(). \
162 smp_mb__after_atomic(); \
164 /* We need to check again in a case another \
165 * CPU has just made room available. \
168 if (unlikely(get_desc >= start_thrs)) { \
169 netif_tx_start_queue(txq); \
176 * netif_txq_maybe_stop() - locklessly stop a Tx queue, if needed
177 * @txq: struct netdev_queue to stop/start
178 * @get_desc: get current number of free descriptors (see requirements below!)
179 * @stop_thrs: minimal number of available descriptors for queue to be left
181 * @start_thrs: minimal number of descriptors to re-enable the queue, can be
182 * equal to @stop_thrs or higher to avoid frequent waking
184 * All arguments may be evaluated multiple times, beware of side effects.
185 * @get_desc must be a formula or a function call, it must always
186 * return up-to-date information when evaluated!
187 * Expected to be used from ndo_start_xmit, see the comment on top of the file.
190 * 0 if the queue was stopped
191 * 1 if the queue was left enabled
192 * -1 if the queue was re-enabled (raced with waking)
194 #define netif_txq_maybe_stop(txq, get_desc, stop_thrs, start_thrs) \
199 if (unlikely(get_desc < stop_thrs)) \
200 _res = netif_txq_try_stop(txq, get_desc, start_thrs); \
204 /* Variant of netdev_tx_completed_queue() which guarantees smp_mb() if
205 * @bytes != 0, regardless of kernel config.
208 netdev_txq_completed_mb(struct netdev_queue
*dev_queue
,
209 unsigned int pkts
, unsigned int bytes
)
211 if (IS_ENABLED(CONFIG_BQL
))
212 netdev_tx_completed_queue(dev_queue
, pkts
, bytes
);
218 * __netif_txq_completed_wake() - locklessly wake a Tx queue, if needed
219 * @txq: struct netdev_queue to stop/start
220 * @pkts: number of packets completed
221 * @bytes: number of bytes completed
222 * @get_desc: get current number of free descriptors (see requirements below!)
223 * @start_thrs: minimal number of descriptors to re-enable the queue
224 * @down_cond: down condition, predicate indicating that the queue should
225 * not be woken up even if descriptors are available
227 * All arguments may be evaluated multiple times.
228 * @get_desc must be a formula or a function call, it must always
229 * return up-to-date information when evaluated!
230 * Reports completed pkts/bytes to BQL.
233 * 0 if the queue was woken up
234 * 1 if the queue was already enabled (or disabled but @down_cond is true)
235 * -1 if the queue was left unchanged (@start_thrs not reached)
237 #define __netif_txq_completed_wake(txq, pkts, bytes, \
238 get_desc, start_thrs, down_cond) \
242 /* Report to BQL and piggy back on its barrier. \
243 * Barrier makes sure that anybody stopping the queue \
244 * after this point sees the new consumer index. \
245 * Pairs with barrier in netif_txq_try_stop(). \
247 netdev_txq_completed_mb(txq, pkts, bytes); \
250 if (pkts && likely(get_desc >= start_thrs)) { \
252 if (unlikely(netif_tx_queue_stopped(txq)) && \
254 netif_tx_wake_queue(txq); \
261 #define netif_txq_completed_wake(txq, pkts, bytes, get_desc, start_thrs) \
262 __netif_txq_completed_wake(txq, pkts, bytes, get_desc, start_thrs, false)
264 /* subqueue variants follow */
266 #define netif_subqueue_try_stop(dev, idx, get_desc, start_thrs) \
268 struct netdev_queue *txq; \
270 txq = netdev_get_tx_queue(dev, idx); \
271 netif_txq_try_stop(txq, get_desc, start_thrs); \
274 #define netif_subqueue_maybe_stop(dev, idx, get_desc, stop_thrs, start_thrs) \
276 struct netdev_queue *txq; \
278 txq = netdev_get_tx_queue(dev, idx); \
279 netif_txq_maybe_stop(txq, get_desc, stop_thrs, start_thrs); \
282 #define netif_subqueue_completed_wake(dev, idx, pkts, bytes, \
283 get_desc, start_thrs) \
285 struct netdev_queue *txq; \
287 txq = netdev_get_tx_queue(dev, idx); \
288 netif_txq_completed_wake(txq, pkts, bytes, \
289 get_desc, start_thrs); \