/* SPDX-License-Identifier: GPL-2.0 */
#ifndef __NET_SCHED_GENERIC_H
#define __NET_SCHED_GENERIC_H

#include <linux/netdevice.h>
#include <linux/types.h>
#include <linux/rcupdate.h>
#include <linux/pkt_sched.h>
#include <linux/pkt_cls.h>
#include <linux/percpu.h>
#include <linux/dynamic_queue_limits.h>
#include <linux/list.h>
#include <linux/refcount.h>
#include <linux/workqueue.h>
#include <linux/mutex.h>
#include <linux/rwsem.h>
#include <linux/atomic.h>
#include <linux/hashtable.h>
#include <net/gen_stats.h>
#include <net/rtnetlink.h>
#include <net/flow_offload.h>
struct qdisc_rate_table {
	struct tc_ratespec	rate;
	u32			data[256];
	struct qdisc_rate_table	*next;
	int			refcnt;
};

enum qdisc_state_t {
	__QDISC_STATE_SCHED,
	__QDISC_STATE_DEACTIVATED,
};

struct qdisc_size_table {
	struct rcu_head		rcu;
	struct list_head	list;
	struct tc_sizespec	szopts;
	int			refcnt;
	u16			data[];
};
/* similar to sk_buff_head, but skb->prev pointer is undefined. */
struct qdisc_skb_head {
	struct sk_buff	*head;
	struct sk_buff	*tail;
	__u32		qlen;
	spinlock_t	lock;
};

struct Qdisc {
	int 			(*enqueue)(struct sk_buff *skb,
					   struct Qdisc *sch,
					   struct sk_buff **to_free);
	struct sk_buff *	(*dequeue)(struct Qdisc *sch);
	unsigned int		flags;
#define TCQ_F_BUILTIN		1
#define TCQ_F_INGRESS		2
#define TCQ_F_CAN_BYPASS	4
#define TCQ_F_MQROOT		8
#define TCQ_F_ONETXQUEUE	0x10 /* dequeue_skb() can assume all skbs are for
				      * q->dev_queue : It can test
				      * netif_xmit_frozen_or_stopped() before
				      * dequeueing next packet.
				      * It is true for MQ/MQPRIO slaves, or
				      * non-multiqueue devices.
				      */
#define TCQ_F_WARN_NONWC	(1 << 16)
#define TCQ_F_CPUSTATS		0x20 /* run using percpu statistics */
#define TCQ_F_NOPARENT		0x40 /* root of its hierarchy :
				      * qdisc_tree_decrease_qlen() should stop.
				      */
#define TCQ_F_INVISIBLE		0x80 /* invisible by default in dump */
#define TCQ_F_NOLOCK		0x100 /* qdisc does not require locking */
#define TCQ_F_OFFLOADED		0x200 /* qdisc is offloaded to HW */
	u32			limit;
	const struct Qdisc_ops	*ops;
	struct qdisc_size_table	__rcu *stab;
	struct hlist_node	hash;

	struct netdev_queue	*dev_queue;

	struct net_rate_estimator __rcu *rate_est;
	struct gnet_stats_basic_cpu __percpu *cpu_bstats;
	struct gnet_stats_queue	__percpu *cpu_qstats;
	refcount_t		refcnt;

	/*
	 * For performance sake on SMP, we put highly modified fields at the end
	 */
	struct sk_buff_head	gso_skb ____cacheline_aligned_in_smp;
	struct qdisc_skb_head	q;
	struct gnet_stats_basic_packed bstats;
	seqcount_t		running;
	struct gnet_stats_queue	qstats;
	struct Qdisc		*next_sched;
	struct sk_buff_head	skb_bad_txq;

	spinlock_t		busylock ____cacheline_aligned_in_smp;
	spinlock_t		seqlock;

	/* for NOLOCK qdisc, true if there are no enqueued skbs */
	bool			empty;
};
static inline void qdisc_refcount_inc(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_BUILTIN)
		return;
	refcount_inc(&qdisc->refcnt);
}

/* Intended to be used by unlocked users, when concurrent qdisc release is
 * possible.
 */
static inline struct Qdisc *qdisc_refcount_inc_nz(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_BUILTIN)
		return qdisc;
	if (refcount_inc_not_zero(&qdisc->refcnt))
		return qdisc;
	return NULL;
}
static inline bool qdisc_is_running(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_NOLOCK)
		return spin_is_locked(&qdisc->seqlock);
	return (raw_read_seqcount(&qdisc->running) & 1) ? true : false;
}

static inline bool qdisc_is_percpu_stats(const struct Qdisc *q)
{
	return q->flags & TCQ_F_CPUSTATS;
}

static inline bool qdisc_is_empty(const struct Qdisc *qdisc)
{
	if (qdisc_is_percpu_stats(qdisc))
		return READ_ONCE(qdisc->empty);
	return !READ_ONCE(qdisc->q.qlen);
}
static inline bool qdisc_run_begin(struct Qdisc *qdisc)
{
	if (qdisc->flags & TCQ_F_NOLOCK) {
		if (!spin_trylock(&qdisc->seqlock))
			return false;
		WRITE_ONCE(qdisc->empty, false);
	} else if (qdisc_is_running(qdisc)) {
		return false;
	}
	/* Variant of write_seqcount_begin() telling lockdep a trylock
	 * was attempted.
	 */
	raw_write_seqcount_begin(&qdisc->running);
	seqcount_acquire(&qdisc->running.dep_map, 0, 1, _RET_IP_);
	return true;
}
static inline void qdisc_run_end(struct Qdisc *qdisc)
{
	write_seqcount_end(&qdisc->running);
	if (qdisc->flags & TCQ_F_NOLOCK)
		spin_unlock(&qdisc->seqlock);
}
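
/*
 * Illustrative sketch (not part of this header): callers are expected to
 * bracket dequeue work with qdisc_run_begin()/qdisc_run_end(), which either
 * take ->seqlock (TCQ_F_NOLOCK) or mark ->running busy:
 *
 *	if (qdisc_run_begin(q)) {
 *		... dequeue and transmit packets ...
 *		qdisc_run_end(q);
 *	}
 *
 * If qdisc_run_begin() returns false, another CPU already owns the qdisc
 * and will flush the queue.
 */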
static inline bool qdisc_may_bulk(const struct Qdisc *qdisc)
{
	return qdisc->flags & TCQ_F_ONETXQUEUE;
}

static inline int qdisc_avail_bulklimit(const struct netdev_queue *txq)
{
#ifdef CONFIG_BQL
	/* Non-BQL migrated drivers will return 0, too. */
	return dql_avail(&txq->dql);
#else
	return 0;
#endif
}
struct Qdisc_class_ops {
	unsigned int		flags;
	/* Child qdisc manipulation */
	struct netdev_queue *	(*select_queue)(struct Qdisc *, struct tcmsg *);
	int			(*graft)(struct Qdisc *, unsigned long cl,
					struct Qdisc *, struct Qdisc **,
					struct netlink_ext_ack *extack);
	struct Qdisc *		(*leaf)(struct Qdisc *, unsigned long cl);
	void			(*qlen_notify)(struct Qdisc *, unsigned long);

	/* Class manipulation routines */
	unsigned long		(*find)(struct Qdisc *, u32 classid);
	int			(*change)(struct Qdisc *, u32, u32,
					struct nlattr **, unsigned long *,
					struct netlink_ext_ack *);
	int			(*delete)(struct Qdisc *, unsigned long);
	void			(*walk)(struct Qdisc *, struct qdisc_walker *arg);

	/* Filter manipulation */
	struct tcf_block *	(*tcf_block)(struct Qdisc *sch,
					     unsigned long arg,
					     struct netlink_ext_ack *extack);
	unsigned long		(*bind_tcf)(struct Qdisc *, unsigned long,
					u32 classid);
	void			(*unbind_tcf)(struct Qdisc *, unsigned long);

	/* rtnetlink specific */
	int			(*dump)(struct Qdisc *, unsigned long,
					struct sk_buff *skb, struct tcmsg *);
	int			(*dump_stats)(struct Qdisc *, unsigned long,
					struct gnet_dump *);
};

/* Qdisc_class_ops flag values */

/* Implements API that doesn't require rtnl lock */
enum qdisc_class_ops_flags {
	QDISC_CLASS_OPS_DOIT_UNLOCKED = 1,
};
struct Qdisc_ops {
	struct Qdisc_ops	*next;
	const struct Qdisc_class_ops	*cl_ops;
	char			id[IFNAMSIZ];
	int			priv_size;
	unsigned int		static_flags;

	int 			(*enqueue)(struct sk_buff *skb,
					   struct Qdisc *sch,
					   struct sk_buff **to_free);
	struct sk_buff *	(*dequeue)(struct Qdisc *);
	struct sk_buff *	(*peek)(struct Qdisc *);

	int			(*init)(struct Qdisc *sch, struct nlattr *arg,
					struct netlink_ext_ack *extack);
	void			(*reset)(struct Qdisc *);
	void			(*destroy)(struct Qdisc *);
	int			(*change)(struct Qdisc *sch,
					  struct nlattr *arg,
					  struct netlink_ext_ack *extack);
	void			(*attach)(struct Qdisc *sch);
	int			(*change_tx_queue_len)(struct Qdisc *, unsigned int);

	int			(*dump)(struct Qdisc *, struct sk_buff *);
	int			(*dump_stats)(struct Qdisc *, struct gnet_dump *);

	void			(*ingress_block_set)(struct Qdisc *sch,
						     u32 block_index);
	void			(*egress_block_set)(struct Qdisc *sch,
						    u32 block_index);
	u32			(*ingress_block_get)(struct Qdisc *sch);
	u32			(*egress_block_get)(struct Qdisc *sch);

	struct module		*owner;
};
struct tcf_result {
	union {
		struct {
			unsigned long	class;
			u32		classid;
		};
		const struct tcf_proto *goto_tp;
		/* used in the skb_tc_reinsert function */
		struct {
			bool		ingress;
			struct gnet_stats_queue *qstats;
		};
	};
};
struct tcf_proto_ops {
	struct list_head	head;
	char			kind[IFNAMSIZ];

	int			(*classify)(struct sk_buff *,
					    const struct tcf_proto *,
					    struct tcf_result *);
	int			(*init)(struct tcf_proto *);
	void			(*destroy)(struct tcf_proto *tp, bool rtnl_held,
					   struct netlink_ext_ack *extack);

	void *			(*get)(struct tcf_proto *, u32 handle);
	void			(*put)(struct tcf_proto *tp, void *f);
	int			(*change)(struct net *net, struct sk_buff *,
					struct tcf_proto *, unsigned long,
					u32 handle, struct nlattr **,
					void **, bool, bool,
					struct netlink_ext_ack *);
	int			(*delete)(struct tcf_proto *tp, void *arg,
					  bool *last, bool rtnl_held,
					  struct netlink_ext_ack *);
	bool			(*delete_empty)(struct tcf_proto *tp);
	void			(*walk)(struct tcf_proto *tp,
					struct tcf_walker *arg, bool rtnl_held);
	int			(*reoffload)(struct tcf_proto *tp, bool add,
					     flow_setup_cb_t *cb, void *cb_priv,
					     struct netlink_ext_ack *extack);
	void			(*hw_add)(struct tcf_proto *tp,
					  void *type_data);
	void			(*hw_del)(struct tcf_proto *tp,
					  void *type_data);
	void			(*bind_class)(void *, u32, unsigned long,
					      void *, unsigned long);
	void *			(*tmplt_create)(struct net *net,
						struct tcf_chain *chain,
						struct nlattr **tca,
						struct netlink_ext_ack *extack);
	void			(*tmplt_destroy)(void *tmplt_priv);

	/* rtnetlink specific */
	int			(*dump)(struct net *, struct tcf_proto *, void *,
					struct sk_buff *skb, struct tcmsg *,
					bool);
	int			(*tmplt_dump)(struct sk_buff *skb,
					      struct net *net,
					      void *tmplt_priv);

	struct module		*owner;
	int			flags;
};

/* Classifiers setting TCF_PROTO_OPS_DOIT_UNLOCKED in tcf_proto_ops->flags
 * are expected to implement tcf_proto_ops->delete_empty(), otherwise race
 * conditions can occur when filters are inserted/deleted simultaneously.
 */
enum tcf_proto_ops_flags {
	TCF_PROTO_OPS_DOIT_UNLOCKED = 1,
};
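
/*
 * Illustrative sketch (not part of this header): an unlocked classifier
 * advertises the flag and provides ->delete_empty() in its ops (names are
 * hypothetical):
 *
 *	static struct tcf_proto_ops cls_foo_ops __read_mostly = {
 *		.kind		= "foo",
 *		.flags		= TCF_PROTO_OPS_DOIT_UNLOCKED,
 *		.delete_empty	= foo_delete_empty,
 *		...
 *	};
 */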
struct tcf_proto {
	/* Fast access part */
	struct tcf_proto __rcu	*next;

	/* called under RCU BH lock */
	int			(*classify)(struct sk_buff *,
					    const struct tcf_proto *,
					    struct tcf_result *);

	const struct tcf_proto_ops	*ops;
	struct tcf_chain	*chain;
	/* Lock protects tcf_proto shared state and can be used by unlocked
	 * classifiers to protect their private data.
	 */
	spinlock_t		lock;
	struct hlist_node	destroy_ht_node;
};
struct qdisc_skb_cb {
	struct {
		unsigned int		pkt_len;
		u16			slave_dev_queue_mapping;
	};
#define QDISC_CB_PRIV_LEN 20
	unsigned char		data[QDISC_CB_PRIV_LEN];
};

typedef void tcf_chain_head_change_t(struct tcf_proto *tp_head, void *priv);
struct tcf_chain {
	/* Protects filter_chain. */
	struct mutex filter_chain_lock;
	struct tcf_proto __rcu *filter_chain;
	struct list_head list;
	struct tcf_block *block;
	u32 index; /* chain index */
	unsigned int refcnt;
	unsigned int action_refcnt;
	bool explicitly_created;
	const struct tcf_proto_ops *tmplt_ops;
};
struct tcf_block {
	/* Lock protects tcf_block and lifetime-management data of chains
	 * attached to the block (refcnt, action_refcnt, explicitly_created).
	 */
	struct mutex lock;
	struct list_head chain_list;
	u32 index; /* block index for shared blocks */
	u32 classid; /* which class this block belongs to */
	struct rw_semaphore cb_lock; /* protects cb_list and offload counters */
	struct flow_block flow_block;
	struct list_head owner_list;
	atomic_t offloadcnt; /* Number of offloaded filters */
	unsigned int nooffloaddevcnt; /* Number of devs unable to do offload */
	unsigned int lockeddevcnt; /* Number of devs that require rtnl lock. */
	struct {
		struct tcf_chain *chain;
		struct list_head filter_chain_list;
	} chain0;
	DECLARE_HASHTABLE(proto_destroy_ht, 7);
	struct mutex proto_destroy_lock; /* Lock for proto_destroy hashtable. */
};
#ifdef CONFIG_PROVE_LOCKING
static inline bool lockdep_tcf_chain_is_locked(struct tcf_chain *chain)
{
	return lockdep_is_held(&chain->filter_chain_lock);
}

static inline bool lockdep_tcf_proto_is_locked(struct tcf_proto *tp)
{
	return lockdep_is_held(&tp->lock);
}
#else
static inline bool lockdep_tcf_chain_is_locked(struct tcf_block *chain)
{
	return true;
}

static inline bool lockdep_tcf_proto_is_locked(struct tcf_proto *tp)
{
	return true;
}
#endif /* #ifdef CONFIG_PROVE_LOCKING */

#define tcf_chain_dereference(p, chain) \
	rcu_dereference_protected(p, lockdep_tcf_chain_is_locked(chain))

#define tcf_proto_dereference(p, tp) \
	rcu_dereference_protected(p, lockdep_tcf_proto_is_locked(tp))
static inline void qdisc_cb_private_validate(const struct sk_buff *skb, int sz)
{
	struct qdisc_skb_cb *qcb;

	BUILD_BUG_ON(sizeof(skb->cb) < offsetof(struct qdisc_skb_cb, data) + sz);
	BUILD_BUG_ON(sizeof(qcb->data) < sz);
}
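
/*
 * Illustrative sketch (not part of this header): a qdisc needing private
 * per-skb state typically embeds struct qdisc_skb_cb first in its own cb
 * struct and validates its size at build time (names are hypothetical):
 *
 *	struct foo_skb_cb {
 *		struct qdisc_skb_cb qdisc_cb;
 *		u64		    time_to_send;
 *	};
 *
 *	static inline struct foo_skb_cb *foo_skb_cb(struct sk_buff *skb)
 *	{
 *		qdisc_cb_private_validate(skb, sizeof(struct foo_skb_cb));
 *		return (struct foo_skb_cb *)qdisc_skb_cb(skb);
 *	}
 */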
static inline int qdisc_qlen_cpu(const struct Qdisc *q)
{
	return this_cpu_ptr(q->cpu_qstats)->qlen;
}

static inline int qdisc_qlen(const struct Qdisc *q)
{
	return q->q.qlen;
}

static inline int qdisc_qlen_sum(const struct Qdisc *q)
{
	__u32 qlen = q->qstats.qlen;
	int i;

	if (qdisc_is_percpu_stats(q)) {
		for_each_possible_cpu(i)
			qlen += per_cpu_ptr(q->cpu_qstats, i)->qlen;
	} else {
		qlen += q->q.qlen;
	}

	return qlen;
}
static inline struct qdisc_skb_cb *qdisc_skb_cb(const struct sk_buff *skb)
{
	return (struct qdisc_skb_cb *)skb->cb;
}

static inline spinlock_t *qdisc_lock(struct Qdisc *qdisc)
{
	return &qdisc->q.lock;
}

static inline struct Qdisc *qdisc_root(const struct Qdisc *qdisc)
{
	struct Qdisc *q = rcu_dereference_rtnl(qdisc->dev_queue->qdisc);

	return q;
}

static inline struct Qdisc *qdisc_root_bh(const struct Qdisc *qdisc)
{
	return rcu_dereference_bh(qdisc->dev_queue->qdisc);
}

static inline struct Qdisc *qdisc_root_sleeping(const struct Qdisc *qdisc)
{
	return qdisc->dev_queue->qdisc_sleeping;
}
/* The qdisc root lock is a mechanism by which the top level
 * of a qdisc tree can be locked from any qdisc node in the
 * forest.  This allows changing the configuration of some
 * aspect of the qdisc tree while blocking out asynchronous
 * qdisc access in the packet processing paths.
 *
 * It is only legal to do this when the root will not change
 * on us.  Otherwise we'll potentially lock the wrong qdisc
 * root.  This is enforced by holding the RTNL semaphore, which
 * all users of this lock accessor must do.
 */
static inline spinlock_t *qdisc_root_lock(const struct Qdisc *qdisc)
{
	struct Qdisc *root = qdisc_root(qdisc);

	ASSERT_RTNL();
	return qdisc_lock(root);
}
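
/*
 * Illustrative sketch (not part of this header): a control-path user first
 * takes the RTNL semaphore and only then serializes against the data path
 * through the root lock:
 *
 *	rtnl_lock();
 *	spin_lock_bh(qdisc_root_lock(sch));
 *	... reconfigure the tree ...
 *	spin_unlock_bh(qdisc_root_lock(sch));
 *	rtnl_unlock();
 *
 * sch_tree_lock()/sch_tree_unlock() below wrap the same pattern around the
 * sleeping root's lock.
 */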
static inline spinlock_t *qdisc_root_sleeping_lock(const struct Qdisc *qdisc)
{
	struct Qdisc *root = qdisc_root_sleeping(qdisc);

	ASSERT_RTNL();
	return qdisc_lock(root);
}

static inline seqcount_t *qdisc_root_sleeping_running(const struct Qdisc *qdisc)
{
	struct Qdisc *root = qdisc_root_sleeping(qdisc);

	ASSERT_RTNL();
	return &root->running;
}

static inline struct net_device *qdisc_dev(const struct Qdisc *qdisc)
{
	return qdisc->dev_queue->dev;
}

static inline void sch_tree_lock(const struct Qdisc *q)
{
	spin_lock_bh(qdisc_root_sleeping_lock(q));
}

static inline void sch_tree_unlock(const struct Qdisc *q)
{
	spin_unlock_bh(qdisc_root_sleeping_lock(q));
}
extern struct Qdisc noop_qdisc;
extern struct Qdisc_ops noop_qdisc_ops;
extern struct Qdisc_ops pfifo_fast_ops;
extern struct Qdisc_ops mq_qdisc_ops;
extern struct Qdisc_ops noqueue_qdisc_ops;
extern const struct Qdisc_ops *default_qdisc_ops;
static inline const struct Qdisc_ops *
get_default_qdisc_ops(const struct net_device *dev, int ntx)
{
	return ntx < dev->real_num_tx_queues ?
			default_qdisc_ops : &pfifo_fast_ops;
}
struct Qdisc_class_common {
	u32			classid;
	struct hlist_node	hnode;
};

struct Qdisc_class_hash {
	struct hlist_head	*hash;
	unsigned int		hashsize;
	unsigned int		hashmask;
	unsigned int		hashelems;
};

static inline unsigned int qdisc_class_hash(u32 id, u32 mask)
{
	id ^= id >> 8;
	id ^= id >> 4;
	return id & mask;
}
static inline struct Qdisc_class_common *
qdisc_class_find(const struct Qdisc_class_hash *hash, u32 id)
{
	struct Qdisc_class_common *cl;
	unsigned int h;

	if (!id)
		return NULL;

	h = qdisc_class_hash(id, hash->hashmask);
	hlist_for_each_entry(cl, &hash->hash[h], hnode) {
		if (cl->classid == id)
			return cl;
	}
	return NULL;
}
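
/*
 * Illustrative sketch (not part of this header): a classful qdisc usually
 * places struct Qdisc_class_common first in its per-class structure and
 * resolves classids in its ->find() callback (names are hypothetical; the
 * cast is valid because the common part is the first member):
 *
 *	struct foo_class {
 *		struct Qdisc_class_common common;
 *		...
 *	};
 *
 *	static unsigned long foo_find(struct Qdisc *sch, u32 classid)
 *	{
 *		struct foo_sched_data *q = qdisc_priv(sch);
 *
 *		return (unsigned long)qdisc_class_find(&q->clhash, classid);
 *	}
 */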
static inline int tc_classid_to_hwtc(struct net_device *dev, u32 classid)
{
	u32 hwtc = TC_H_MIN(classid) - TC_H_MIN_PRIORITY;

	return (hwtc < netdev_get_num_tc(dev)) ? hwtc : -EINVAL;
}

int qdisc_class_hash_init(struct Qdisc_class_hash *);
void qdisc_class_hash_insert(struct Qdisc_class_hash *,
			     struct Qdisc_class_common *);
void qdisc_class_hash_remove(struct Qdisc_class_hash *,
			     struct Qdisc_class_common *);
void qdisc_class_hash_grow(struct Qdisc *, struct Qdisc_class_hash *);
void qdisc_class_hash_destroy(struct Qdisc_class_hash *);

int dev_qdisc_change_tx_queue_len(struct net_device *dev);
void dev_init_scheduler(struct net_device *dev);
void dev_shutdown(struct net_device *dev);
void dev_activate(struct net_device *dev);
void dev_deactivate(struct net_device *dev);
void dev_deactivate_many(struct list_head *head);
struct Qdisc *dev_graft_qdisc(struct netdev_queue *dev_queue,
			      struct Qdisc *qdisc);
void qdisc_reset(struct Qdisc *qdisc);
void qdisc_put(struct Qdisc *qdisc);
void qdisc_put_unlocked(struct Qdisc *qdisc);
void qdisc_tree_reduce_backlog(struct Qdisc *qdisc, int n, int len);
#ifdef CONFIG_NET_SCHED
int qdisc_offload_dump_helper(struct Qdisc *q, enum tc_setup_type type,
			      void *type_data);
void qdisc_offload_graft_helper(struct net_device *dev, struct Qdisc *sch,
				struct Qdisc *new, struct Qdisc *old,
				enum tc_setup_type type, void *type_data,
				struct netlink_ext_ack *extack);
#else
static inline int
qdisc_offload_dump_helper(struct Qdisc *q, enum tc_setup_type type,
			  void *type_data)
{
	q->flags &= ~TCQ_F_OFFLOADED;
	return 0;
}

static inline void
qdisc_offload_graft_helper(struct net_device *dev, struct Qdisc *sch,
			   struct Qdisc *new, struct Qdisc *old,
			   enum tc_setup_type type, void *type_data,
			   struct netlink_ext_ack *extack)
{
}
#endif
struct Qdisc *qdisc_alloc(struct netdev_queue *dev_queue,
			  const struct Qdisc_ops *ops,
			  struct netlink_ext_ack *extack);
void qdisc_free(struct Qdisc *qdisc);
struct Qdisc *qdisc_create_dflt(struct netdev_queue *dev_queue,
				const struct Qdisc_ops *ops, u32 parentid,
				struct netlink_ext_ack *extack);
void __qdisc_calculate_pkt_len(struct sk_buff *skb,
			       const struct qdisc_size_table *stab);
int skb_do_redirect(struct sk_buff *);
static inline bool skb_at_tc_ingress(const struct sk_buff *skb)
{
#ifdef CONFIG_NET_CLS_ACT
	return skb->tc_at_ingress;
#else
	return false;
#endif
}

static inline bool skb_skip_tc_classify(struct sk_buff *skb)
{
#ifdef CONFIG_NET_CLS_ACT
	if (skb->tc_skip_classify) {
		skb->tc_skip_classify = 0;
		return true;
	}
#endif
	return false;
}
/* Reset all TX qdiscs greater than index of a device.  */
static inline void qdisc_reset_all_tx_gt(struct net_device *dev, unsigned int i)
{
	struct Qdisc *qdisc;

	for (; i < dev->num_tx_queues; i++) {
		qdisc = rtnl_dereference(netdev_get_tx_queue(dev, i)->qdisc);
		if (qdisc) {
			spin_lock_bh(qdisc_lock(qdisc));
			qdisc_reset(qdisc);
			spin_unlock_bh(qdisc_lock(qdisc));
		}
	}
}

static inline void qdisc_reset_all_tx(struct net_device *dev)
{
	qdisc_reset_all_tx_gt(dev, 0);
}

/* Are all TX queues of the device empty?  */
static inline bool qdisc_all_tx_empty(const struct net_device *dev)
{
	unsigned int i;

	rcu_read_lock();
	for (i = 0; i < dev->num_tx_queues; i++) {
		struct netdev_queue *txq = netdev_get_tx_queue(dev, i);
		const struct Qdisc *q = rcu_dereference(txq->qdisc);

		if (!qdisc_is_empty(q)) {
			rcu_read_unlock();
			return false;
		}
	}
	rcu_read_unlock();
	return true;
}

/* Are any of the TX qdiscs changing?  */
static inline bool qdisc_tx_changing(const struct net_device *dev)
{
	unsigned int i;

	for (i = 0; i < dev->num_tx_queues; i++) {
		struct netdev_queue *txq = netdev_get_tx_queue(dev, i);
		if (rcu_access_pointer(txq->qdisc) != txq->qdisc_sleeping)
			return true;
	}
	return false;
}

/* Is the device using the noop qdisc on all queues?  */
static inline bool qdisc_tx_is_noop(const struct net_device *dev)
{
	unsigned int i;

	for (i = 0; i < dev->num_tx_queues; i++) {
		struct netdev_queue *txq = netdev_get_tx_queue(dev, i);
		if (rcu_access_pointer(txq->qdisc) != &noop_qdisc)
			return false;
	}
	return true;
}
static inline unsigned int qdisc_pkt_len(const struct sk_buff *skb)
{
	return qdisc_skb_cb(skb)->pkt_len;
}

/* additional qdisc xmit flags (NET_XMIT_MASK in linux/netdevice.h) */
enum net_xmit_qdisc_t {
	__NET_XMIT_STOLEN = 0x00010000,
	__NET_XMIT_BYPASS = 0x00020000,
};

#ifdef CONFIG_NET_CLS_ACT
#define net_xmit_drop_count(e)	((e) & __NET_XMIT_STOLEN ? 0 : 1)
#else
#define net_xmit_drop_count(e)	(1)
#endif
static inline void qdisc_calculate_pkt_len(struct sk_buff *skb,
					   const struct Qdisc *sch)
{
#ifdef CONFIG_NET_SCHED
	struct qdisc_size_table *stab = rcu_dereference_bh(sch->stab);

	if (stab)
		__qdisc_calculate_pkt_len(skb, stab);
#endif
}

static inline int qdisc_enqueue(struct sk_buff *skb, struct Qdisc *sch,
				struct sk_buff **to_free)
{
	qdisc_calculate_pkt_len(skb, sch);
	return sch->enqueue(skb, sch, to_free);
}
static inline void _bstats_update(struct gnet_stats_basic_packed *bstats,
				  __u64 bytes, __u32 packets)
{
	bstats->bytes += bytes;
	bstats->packets += packets;
}

static inline void bstats_update(struct gnet_stats_basic_packed *bstats,
				 const struct sk_buff *skb)
{
	_bstats_update(bstats,
		       qdisc_pkt_len(skb),
		       skb_is_gso(skb) ? skb_shinfo(skb)->gso_segs : 1);
}

static inline void _bstats_cpu_update(struct gnet_stats_basic_cpu *bstats,
				      __u64 bytes, __u32 packets)
{
	u64_stats_update_begin(&bstats->syncp);
	_bstats_update(&bstats->bstats, bytes, packets);
	u64_stats_update_end(&bstats->syncp);
}

static inline void bstats_cpu_update(struct gnet_stats_basic_cpu *bstats,
				     const struct sk_buff *skb)
{
	u64_stats_update_begin(&bstats->syncp);
	bstats_update(&bstats->bstats, skb);
	u64_stats_update_end(&bstats->syncp);
}

static inline void qdisc_bstats_cpu_update(struct Qdisc *sch,
					   const struct sk_buff *skb)
{
	bstats_cpu_update(this_cpu_ptr(sch->cpu_bstats), skb);
}

static inline void qdisc_bstats_update(struct Qdisc *sch,
				       const struct sk_buff *skb)
{
	bstats_update(&sch->bstats, skb);
}

static inline void qdisc_qstats_backlog_dec(struct Qdisc *sch,
					    const struct sk_buff *skb)
{
	sch->qstats.backlog -= qdisc_pkt_len(skb);
}

static inline void qdisc_qstats_cpu_backlog_dec(struct Qdisc *sch,
						const struct sk_buff *skb)
{
	this_cpu_sub(sch->cpu_qstats->backlog, qdisc_pkt_len(skb));
}

static inline void qdisc_qstats_backlog_inc(struct Qdisc *sch,
					    const struct sk_buff *skb)
{
	sch->qstats.backlog += qdisc_pkt_len(skb);
}

static inline void qdisc_qstats_cpu_backlog_inc(struct Qdisc *sch,
						const struct sk_buff *skb)
{
	this_cpu_add(sch->cpu_qstats->backlog, qdisc_pkt_len(skb));
}

static inline void qdisc_qstats_cpu_qlen_inc(struct Qdisc *sch)
{
	this_cpu_inc(sch->cpu_qstats->qlen);
}

static inline void qdisc_qstats_cpu_qlen_dec(struct Qdisc *sch)
{
	this_cpu_dec(sch->cpu_qstats->qlen);
}

static inline void qdisc_qstats_cpu_requeues_inc(struct Qdisc *sch)
{
	this_cpu_inc(sch->cpu_qstats->requeues);
}

static inline void __qdisc_qstats_drop(struct Qdisc *sch, int count)
{
	sch->qstats.drops += count;
}

static inline void qstats_drop_inc(struct gnet_stats_queue *qstats)
{
	qstats->drops++;
}

static inline void qstats_overlimit_inc(struct gnet_stats_queue *qstats)
{
	qstats->overlimits++;
}

static inline void qdisc_qstats_drop(struct Qdisc *sch)
{
	qstats_drop_inc(&sch->qstats);
}

static inline void qdisc_qstats_cpu_drop(struct Qdisc *sch)
{
	this_cpu_inc(sch->cpu_qstats->drops);
}

static inline void qdisc_qstats_overlimit(struct Qdisc *sch)
{
	sch->qstats.overlimits++;
}

static inline int qdisc_qstats_copy(struct gnet_dump *d, struct Qdisc *sch)
{
	__u32 qlen = qdisc_qlen_sum(sch);

	return gnet_stats_copy_queue(d, sch->cpu_qstats, &sch->qstats, qlen);
}
static inline void qdisc_qstats_qlen_backlog(struct Qdisc *sch, __u32 *qlen,
					     __u32 *backlog)
{
	struct gnet_stats_queue qstats = { 0 };
	__u32 len = qdisc_qlen_sum(sch);

	__gnet_stats_copy_queue(&qstats, sch->cpu_qstats, &sch->qstats, len);
	*qlen = qstats.qlen;
	*backlog = qstats.backlog;
}

static inline void qdisc_tree_flush_backlog(struct Qdisc *sch)
{
	__u32 qlen, backlog;

	qdisc_qstats_qlen_backlog(sch, &qlen, &backlog);
	qdisc_tree_reduce_backlog(sch, qlen, backlog);
}

static inline void qdisc_purge_queue(struct Qdisc *sch)
{
	__u32 qlen, backlog;

	qdisc_qstats_qlen_backlog(sch, &qlen, &backlog);
	qdisc_reset(sch);
	qdisc_tree_reduce_backlog(sch, qlen, backlog);
}

static inline void qdisc_skb_head_init(struct qdisc_skb_head *qh)
{
	qh->head = NULL;
	qh->tail = NULL;
	qh->qlen = 0;
}
static inline void __qdisc_enqueue_tail(struct sk_buff *skb,
					struct qdisc_skb_head *qh)
{
	struct sk_buff *last = qh->tail;

	if (last) {
		skb->next = NULL;
		last->next = skb;
		qh->tail = skb;
	} else {
		qh->tail = skb;
		qh->head = skb;
	}
	qh->qlen++;
}

static inline int qdisc_enqueue_tail(struct sk_buff *skb, struct Qdisc *sch)
{
	__qdisc_enqueue_tail(skb, &sch->q);
	qdisc_qstats_backlog_inc(sch, skb);
	return NET_XMIT_SUCCESS;
}

static inline void __qdisc_enqueue_head(struct sk_buff *skb,
					struct qdisc_skb_head *qh)
{
	skb->next = qh->head;

	if (!qh->head)
		qh->tail = skb;
	qh->head = skb;
	qh->qlen++;
}

static inline struct sk_buff *__qdisc_dequeue_head(struct qdisc_skb_head *qh)
{
	struct sk_buff *skb = qh->head;

	if (likely(skb != NULL)) {
		qh->head = skb->next;
		qh->qlen--;
		if (qh->head == NULL)
			qh->tail = NULL;
		skb->next = NULL;
	}

	return skb;
}
static inline struct sk_buff *qdisc_dequeue_head(struct Qdisc *sch)
{
	struct sk_buff *skb = __qdisc_dequeue_head(&sch->q);

	if (likely(skb != NULL)) {
		qdisc_qstats_backlog_dec(sch, skb);
		qdisc_bstats_update(sch, skb);
	}

	return skb;
}

/* Instead of calling kfree_skb() while root qdisc lock is held,
 * queue the skb for future freeing at end of __dev_xmit_skb()
 */
static inline void __qdisc_drop(struct sk_buff *skb, struct sk_buff **to_free)
{
	skb->next = *to_free;
	*to_free = skb;
}
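
/*
 * Illustrative sketch (not part of this header): an ->enqueue() callback
 * that hits its limit defers freeing through the to_free list instead of
 * calling kfree_skb() under the root lock (hypothetical example):
 *
 *	static int foo_enqueue(struct sk_buff *skb, struct Qdisc *sch,
 *			       struct sk_buff **to_free)
 *	{
 *		if (unlikely(qdisc_qlen(sch) >= sch->limit))
 *			return qdisc_drop(skb, sch, to_free);
 *
 *		return qdisc_enqueue_tail(skb, sch);
 *	}
 *
 * The skbs chained onto *to_free are released by the caller once the root
 * lock has been dropped.
 */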
static inline void __qdisc_drop_all(struct sk_buff *skb,
				    struct sk_buff **to_free)
{
	if (skb->prev)
		skb->prev->next = *to_free;
	else
		skb->next = *to_free;
	*to_free = skb;
}

static inline unsigned int __qdisc_queue_drop_head(struct Qdisc *sch,
						   struct qdisc_skb_head *qh,
						   struct sk_buff **to_free)
{
	struct sk_buff *skb = __qdisc_dequeue_head(qh);

	if (likely(skb != NULL)) {
		unsigned int len = qdisc_pkt_len(skb);

		qdisc_qstats_backlog_dec(sch, skb);
		__qdisc_drop(skb, to_free);
		return len;
	}

	return 0;
}

static inline unsigned int qdisc_queue_drop_head(struct Qdisc *sch,
						 struct sk_buff **to_free)
{
	return __qdisc_queue_drop_head(sch, &sch->q, to_free);
}

static inline struct sk_buff *qdisc_peek_head(struct Qdisc *sch)
{
	const struct qdisc_skb_head *qh = &sch->q;

	return qh->head;
}
/* generic pseudo peek method for non-work-conserving qdisc */
static inline struct sk_buff *qdisc_peek_dequeued(struct Qdisc *sch)
{
	struct sk_buff *skb = skb_peek(&sch->gso_skb);

	/* we can reuse ->gso_skb because peek isn't called for root qdiscs */
	if (!skb) {
		skb = sch->dequeue(sch);

		if (skb) {
			__skb_queue_head(&sch->gso_skb, skb);
			/* it's still part of the queue */
			qdisc_qstats_backlog_inc(sch, skb);
			sch->q.qlen++;
		}
	}

	return skb;
}
static inline void qdisc_update_stats_at_dequeue(struct Qdisc *sch,
						 struct sk_buff *skb)
{
	if (qdisc_is_percpu_stats(sch)) {
		qdisc_qstats_cpu_backlog_dec(sch, skb);
		qdisc_bstats_cpu_update(sch, skb);
		qdisc_qstats_cpu_qlen_dec(sch);
	} else {
		qdisc_qstats_backlog_dec(sch, skb);
		qdisc_bstats_update(sch, skb);
		sch->q.qlen--;
	}
}

static inline void qdisc_update_stats_at_enqueue(struct Qdisc *sch,
						 unsigned int pkt_len)
{
	if (qdisc_is_percpu_stats(sch)) {
		qdisc_qstats_cpu_qlen_inc(sch);
		this_cpu_add(sch->cpu_qstats->backlog, pkt_len);
	} else {
		sch->qstats.backlog += pkt_len;
		sch->q.qlen++;
	}
}
/* use instead of qdisc->dequeue() for all qdiscs queried with ->peek() */
static inline struct sk_buff *qdisc_dequeue_peeked(struct Qdisc *sch)
{
	struct sk_buff *skb = skb_peek(&sch->gso_skb);

	if (skb) {
		skb = __skb_dequeue(&sch->gso_skb);
		if (qdisc_is_percpu_stats(sch)) {
			qdisc_qstats_cpu_backlog_dec(sch, skb);
			qdisc_qstats_cpu_qlen_dec(sch);
		} else {
			qdisc_qstats_backlog_dec(sch, skb);
			sch->q.qlen--;
		}
	} else {
		skb = sch->dequeue(sch);
	}

	return skb;
}
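
/*
 * Illustrative sketch (not part of this header): a non-work-conserving qdisc
 * typically sets .peek = qdisc_peek_dequeued in its Qdisc_ops; a parent that
 * peeked such a child must then pull the packet with qdisc_dequeue_peeked()
 * rather than calling ->dequeue() again (the policy check is hypothetical):
 *
 *	skb = child->ops->peek(child);
 *	if (skb && tokens_available(skb))
 *		skb = qdisc_dequeue_peeked(child);
 */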
static inline void __qdisc_reset_queue(struct qdisc_skb_head *qh)
{
	/*
	 * We do not know the backlog in bytes of this list, it
	 * is up to the caller to correct it
	 */
	ASSERT_RTNL();
	if (qh->qlen) {
		rtnl_kfree_skbs(qh->head, qh->tail);

		qh->head = NULL;
		qh->tail = NULL;
		qh->qlen = 0;
	}
}

static inline void qdisc_reset_queue(struct Qdisc *sch)
{
	__qdisc_reset_queue(&sch->q);
	sch->qstats.backlog = 0;
}

static inline struct Qdisc *qdisc_replace(struct Qdisc *sch, struct Qdisc *new,
					  struct Qdisc **pold)
{
	struct Qdisc *old;

	sch_tree_lock(sch);
	old = *pold;
	rcu_assign_pointer(*pold, new);
	if (old)
		qdisc_tree_flush_backlog(old);
	sch_tree_unlock(sch);

	return old;
}
static inline void rtnl_qdisc_drop(struct sk_buff *skb, struct Qdisc *sch)
{
	rtnl_kfree_skbs(skb, skb);
	qdisc_qstats_drop(sch);
}

static inline int qdisc_drop_cpu(struct sk_buff *skb, struct Qdisc *sch,
				 struct sk_buff **to_free)
{
	__qdisc_drop(skb, to_free);
	qdisc_qstats_cpu_drop(sch);

	return NET_XMIT_DROP;
}

static inline int qdisc_drop(struct sk_buff *skb, struct Qdisc *sch,
			     struct sk_buff **to_free)
{
	__qdisc_drop(skb, to_free);
	qdisc_qstats_drop(sch);

	return NET_XMIT_DROP;
}

static inline int qdisc_drop_all(struct sk_buff *skb, struct Qdisc *sch,
				 struct sk_buff **to_free)
{
	__qdisc_drop_all(skb, to_free);
	qdisc_qstats_drop(sch);

	return NET_XMIT_DROP;
}
/* Length to Time (L2T) lookup in a qdisc_rate_table, to determine how
 * long it will take to send a packet given its size.
 */
static inline u32 qdisc_l2t(struct qdisc_rate_table *rtab, unsigned int pktlen)
{
	int slot = pktlen + rtab->rate.cell_align + rtab->rate.overhead;

	if (slot < 0)
		slot = 0;
	slot >>= rtab->rate.cell_log;
	if (slot > 255)
		return rtab->data[255] * (slot >> 8) + rtab->data[slot & 0xFF];
	return rtab->data[slot];
}
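
/*
 * Worked example (illustrative, values are hypothetical): with cell_log = 3
 * and cell_align = overhead = 0, a 100 byte packet maps to slot
 * (100 + 0 + 0) >> 3 = 12, so its transmission time is rtab->data[12] ticks;
 * a packet whose slot exceeds 255 falls back to the scaled data[255] estimate.
 */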
struct psched_ratecfg {
	u64	rate_bytes_ps; /* bytes per second */
	u32	mult;
	u16	overhead;
	u8	linklayer;
	u8	shift;
};

static inline u64 psched_l2t_ns(const struct psched_ratecfg *r,
				unsigned int len)
{
	len += r->overhead;

	if (unlikely(r->linklayer == TC_LINKLAYER_ATM))
		return ((u64)(DIV_ROUND_UP(len, 48) * 53) * r->mult) >> r->shift;

	return ((u64)len * r->mult) >> r->shift;
}

void psched_ratecfg_precompute(struct psched_ratecfg *r,
			       const struct tc_ratespec *conf,
			       u64 rate64);
static inline void psched_ratecfg_getrate(struct tc_ratespec *res,
					  const struct psched_ratecfg *r)
{
	memset(res, 0, sizeof(*res));

	/* legacy struct tc_ratespec has a 32bit @rate field
	 * Qdisc using 64bit rate should add new attributes
	 * in order to maintain compatibility.
	 */
	res->rate = min_t(u64, r->rate_bytes_ps, ~0U);

	res->overhead = r->overhead;
	res->linklayer = (r->linklayer & TC_LINKLAYER_MASK);
}
/* Mini Qdisc serves for specific needs of ingress/clsact Qdisc.
 * The fast path only needs to access filter list and to update stats
 */
struct mini_Qdisc {
	struct tcf_proto *filter_list;
	struct tcf_block *block;
	struct gnet_stats_basic_cpu __percpu *cpu_bstats;
	struct gnet_stats_queue	__percpu *cpu_qstats;
	struct rcu_head rcu;
};

static inline void mini_qdisc_bstats_cpu_update(struct mini_Qdisc *miniq,
						const struct sk_buff *skb)
{
	bstats_cpu_update(this_cpu_ptr(miniq->cpu_bstats), skb);
}

static inline void mini_qdisc_qstats_cpu_drop(struct mini_Qdisc *miniq)
{
	this_cpu_inc(miniq->cpu_qstats->drops);
}

struct mini_Qdisc_pair {
	struct mini_Qdisc miniq1;
	struct mini_Qdisc miniq2;
	struct mini_Qdisc __rcu **p_miniq;
};
void mini_qdisc_pair_swap(struct mini_Qdisc_pair *miniqp,
			  struct tcf_proto *tp_head);
void mini_qdisc_pair_init(struct mini_Qdisc_pair *miniqp, struct Qdisc *qdisc,
			  struct mini_Qdisc __rcu **p_miniq);
void mini_qdisc_pair_block_init(struct mini_Qdisc_pair *miniqp,
				struct tcf_block *block);
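
/*
 * Illustrative sketch (not part of this header): the ingress/clsact qdiscs
 * keep a mini_Qdisc_pair in their private data and flip the device's
 * fast-path pointer whenever the filter chain head changes (field and
 * variable names follow the ingress qdisc but are shown only as an example):
 *
 *	mini_qdisc_pair_init(&q->miniqp, sch, &dev->miniq_ingress);
 *	...
 *	mini_qdisc_pair_swap(&q->miniqp, tp_head);
 *
 * where the swap is done from the tcf_chain_head_change_t callback.
 */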
static inline int skb_tc_reinsert(struct sk_buff *skb, struct tcf_result *res)
{
	return res->ingress ? netif_receive_skb(skb) : dev_queue_xmit(skb);
}

#endif