1 /* SPDX-License-Identifier: GPL-2.0 */
2 #ifndef __NET_SCHED_GENERIC_H
3 #define __NET_SCHED_GENERIC_H
5 #include <linux/netdevice.h>
6 #include <linux/types.h>
7 #include <linux/rcupdate.h>
8 #include <linux/pkt_sched.h>
9 #include <linux/pkt_cls.h>
10 #include <linux/percpu.h>
11 #include <linux/dynamic_queue_limits.h>
12 #include <linux/list.h>
13 #include <linux/refcount.h>
14 #include <linux/workqueue.h>
15 #include <linux/mutex.h>
16 #include <linux/rwsem.h>
17 #include <linux/atomic.h>
18 #include <linux/hashtable.h>
19 #include <net/gen_stats.h>
20 #include <net/rtnetlink.h>
21 #include <net/flow_offload.h>
29 struct qdisc_rate_table
{
30 struct tc_ratespec rate
;
32 struct qdisc_rate_table
*next
;
38 __QDISC_STATE_DEACTIVATED
,
41 struct qdisc_size_table
{
43 struct list_head list
;
44 struct tc_sizespec szopts
;
49 /* similar to sk_buff_head, but skb->prev pointer is undefined. */
50 struct qdisc_skb_head
{
58 int (*enqueue
)(struct sk_buff
*skb
,
60 struct sk_buff
**to_free
);
61 struct sk_buff
* (*dequeue
)(struct Qdisc
*sch
);
63 #define TCQ_F_BUILTIN 1
64 #define TCQ_F_INGRESS 2
65 #define TCQ_F_CAN_BYPASS 4
66 #define TCQ_F_MQROOT 8
67 #define TCQ_F_ONETXQUEUE 0x10 /* dequeue_skb() can assume all skbs are for
68 * q->dev_queue : It can test
69 * netif_xmit_frozen_or_stopped() before
70 * dequeueing next packet.
71 * It's true for MQ/MQPRIO slaves, or non
74 #define TCQ_F_WARN_NONWC (1 << 16)
75 #define TCQ_F_CPUSTATS 0x20 /* run using percpu statistics */
76 #define TCQ_F_NOPARENT 0x40 /* root of its hierarchy :
77 * qdisc_tree_decrease_qlen() should stop.
79 #define TCQ_F_INVISIBLE 0x80 /* invisible by default in dump */
80 #define TCQ_F_NOLOCK 0x100 /* qdisc does not require locking */
81 #define TCQ_F_OFFLOADED 0x200 /* qdisc is offloaded to HW */
83 const struct Qdisc_ops
*ops
;
84 struct qdisc_size_table __rcu
*stab
;
85 struct hlist_node hash
;
89 struct netdev_queue
*dev_queue
;
91 struct net_rate_estimator __rcu
*rate_est
;
92 struct gnet_stats_basic_cpu __percpu
*cpu_bstats
;
93 struct gnet_stats_queue __percpu
*cpu_qstats
;
98 * For performance sake on SMP, we put highly modified fields at the end
100 struct sk_buff_head gso_skb ____cacheline_aligned_in_smp
;
101 struct qdisc_skb_head q
;
102 struct gnet_stats_basic_packed bstats
;
104 struct gnet_stats_queue qstats
;
106 struct Qdisc
*next_sched
;
107 struct sk_buff_head skb_bad_txq
;
109 spinlock_t busylock ____cacheline_aligned_in_smp
;
112 /* for NOLOCK qdisc, true if there are no enqueued skbs */
117 static inline void qdisc_refcount_inc(struct Qdisc
*qdisc
)
119 if (qdisc
->flags
& TCQ_F_BUILTIN
)
121 refcount_inc(&qdisc
->refcnt
);
124 /* Intended to be used by unlocked users, when concurrent qdisc release is
128 static inline struct Qdisc
*qdisc_refcount_inc_nz(struct Qdisc
*qdisc
)
130 if (qdisc
->flags
& TCQ_F_BUILTIN
)
132 if (refcount_inc_not_zero(&qdisc
->refcnt
))
137 static inline bool qdisc_is_running(struct Qdisc
*qdisc
)
139 if (qdisc
->flags
& TCQ_F_NOLOCK
)
140 return spin_is_locked(&qdisc
->seqlock
);
141 return (raw_read_seqcount(&qdisc
->running
) & 1) ? true : false;
144 static inline bool qdisc_is_percpu_stats(const struct Qdisc
*q
)
146 return q
->flags
& TCQ_F_CPUSTATS
;
149 static inline bool qdisc_is_empty(const struct Qdisc
*qdisc
)
151 if (qdisc_is_percpu_stats(qdisc
))
152 return READ_ONCE(qdisc
->empty
);
153 return !READ_ONCE(qdisc
->q
.qlen
);
156 static inline bool qdisc_run_begin(struct Qdisc
*qdisc
)
158 if (qdisc
->flags
& TCQ_F_NOLOCK
) {
159 if (!spin_trylock(&qdisc
->seqlock
))
161 WRITE_ONCE(qdisc
->empty
, false);
162 } else if (qdisc_is_running(qdisc
)) {
165 /* Variant of write_seqcount_begin() telling lockdep a trylock
168 raw_write_seqcount_begin(&qdisc
->running
);
169 seqcount_acquire(&qdisc
->running
.dep_map
, 0, 1, _RET_IP_
);
173 static inline void qdisc_run_end(struct Qdisc
*qdisc
)
175 write_seqcount_end(&qdisc
->running
);
176 if (qdisc
->flags
& TCQ_F_NOLOCK
)
177 spin_unlock(&qdisc
->seqlock
);
180 static inline bool qdisc_may_bulk(const struct Qdisc
*qdisc
)
182 return qdisc
->flags
& TCQ_F_ONETXQUEUE
;
185 static inline int qdisc_avail_bulklimit(const struct netdev_queue
*txq
)
188 /* Non-BQL migrated drivers will return 0, too. */
189 return dql_avail(&txq
->dql
);
195 struct Qdisc_class_ops
{
197 /* Child qdisc manipulation */
198 struct netdev_queue
* (*select_queue
)(struct Qdisc
*, struct tcmsg
*);
199 int (*graft
)(struct Qdisc
*, unsigned long cl
,
200 struct Qdisc
*, struct Qdisc
**,
201 struct netlink_ext_ack
*extack
);
202 struct Qdisc
* (*leaf
)(struct Qdisc
*, unsigned long cl
);
203 void (*qlen_notify
)(struct Qdisc
*, unsigned long);
205 /* Class manipulation routines */
206 unsigned long (*find
)(struct Qdisc
*, u32 classid
);
207 int (*change
)(struct Qdisc
*, u32
, u32
,
208 struct nlattr
**, unsigned long *,
209 struct netlink_ext_ack
*);
210 int (*delete)(struct Qdisc
*, unsigned long);
211 void (*walk
)(struct Qdisc
*, struct qdisc_walker
* arg
);
213 /* Filter manipulation */
214 struct tcf_block
* (*tcf_block
)(struct Qdisc
*sch
,
216 struct netlink_ext_ack
*extack
);
217 unsigned long (*bind_tcf
)(struct Qdisc
*, unsigned long,
219 void (*unbind_tcf
)(struct Qdisc
*, unsigned long);
221 /* rtnetlink specific */
222 int (*dump
)(struct Qdisc
*, unsigned long,
223 struct sk_buff
*skb
, struct tcmsg
*);
224 int (*dump_stats
)(struct Qdisc
*, unsigned long,
228 /* Qdisc_class_ops flag values */
230 /* Implements API that doesn't require rtnl lock */
231 enum qdisc_class_ops_flags
{
232 QDISC_CLASS_OPS_DOIT_UNLOCKED
= 1,
236 struct Qdisc_ops
*next
;
237 const struct Qdisc_class_ops
*cl_ops
;
240 unsigned int static_flags
;
242 int (*enqueue
)(struct sk_buff
*skb
,
244 struct sk_buff
**to_free
);
245 struct sk_buff
* (*dequeue
)(struct Qdisc
*);
246 struct sk_buff
* (*peek
)(struct Qdisc
*);
248 int (*init
)(struct Qdisc
*sch
, struct nlattr
*arg
,
249 struct netlink_ext_ack
*extack
);
250 void (*reset
)(struct Qdisc
*);
251 void (*destroy
)(struct Qdisc
*);
252 int (*change
)(struct Qdisc
*sch
,
254 struct netlink_ext_ack
*extack
);
255 void (*attach
)(struct Qdisc
*sch
);
256 int (*change_tx_queue_len
)(struct Qdisc
*, unsigned int);
258 int (*dump
)(struct Qdisc
*, struct sk_buff
*);
259 int (*dump_stats
)(struct Qdisc
*, struct gnet_dump
*);
261 void (*ingress_block_set
)(struct Qdisc
*sch
,
263 void (*egress_block_set
)(struct Qdisc
*sch
,
265 u32 (*ingress_block_get
)(struct Qdisc
*sch
);
266 u32 (*egress_block_get
)(struct Qdisc
*sch
);
268 struct module
*owner
;
278 const struct tcf_proto
*goto_tp
;
280 /* used in the skb_tc_reinsert function */
283 struct gnet_stats_queue
*qstats
;
290 struct tcf_proto_ops
{
291 struct list_head head
;
294 int (*classify
)(struct sk_buff
*,
295 const struct tcf_proto
*,
296 struct tcf_result
*);
297 int (*init
)(struct tcf_proto
*);
298 void (*destroy
)(struct tcf_proto
*tp
, bool rtnl_held
,
299 struct netlink_ext_ack
*extack
);
301 void* (*get
)(struct tcf_proto
*, u32 handle
);
302 void (*put
)(struct tcf_proto
*tp
, void *f
);
303 int (*change
)(struct net
*net
, struct sk_buff
*,
304 struct tcf_proto
*, unsigned long,
305 u32 handle
, struct nlattr
**,
307 struct netlink_ext_ack
*);
308 int (*delete)(struct tcf_proto
*tp
, void *arg
,
309 bool *last
, bool rtnl_held
,
310 struct netlink_ext_ack
*);
311 bool (*delete_empty
)(struct tcf_proto
*tp
);
312 void (*walk
)(struct tcf_proto
*tp
,
313 struct tcf_walker
*arg
, bool rtnl_held
);
314 int (*reoffload
)(struct tcf_proto
*tp
, bool add
,
315 flow_setup_cb_t
*cb
, void *cb_priv
,
316 struct netlink_ext_ack
*extack
);
317 void (*hw_add
)(struct tcf_proto
*tp
,
319 void (*hw_del
)(struct tcf_proto
*tp
,
321 void (*bind_class
)(void *, u32
, unsigned long,
322 void *, unsigned long);
323 void * (*tmplt_create
)(struct net
*net
,
324 struct tcf_chain
*chain
,
326 struct netlink_ext_ack
*extack
);
327 void (*tmplt_destroy
)(void *tmplt_priv
);
329 /* rtnetlink specific */
330 int (*dump
)(struct net
*, struct tcf_proto
*, void *,
331 struct sk_buff
*skb
, struct tcmsg
*,
333 int (*tmplt_dump
)(struct sk_buff
*skb
,
337 struct module
*owner
;
341 /* Classifiers setting TCF_PROTO_OPS_DOIT_UNLOCKED in tcf_proto_ops->flags
342 * are expected to implement tcf_proto_ops->delete_empty(), otherwise race
343 * conditions can occur when filters are inserted/deleted simultaneously.
345 enum tcf_proto_ops_flags
{
346 TCF_PROTO_OPS_DOIT_UNLOCKED
= 1,
350 /* Fast access part */
351 struct tcf_proto __rcu
*next
;
354 /* called under RCU BH lock*/
355 int (*classify
)(struct sk_buff
*,
356 const struct tcf_proto
*,
357 struct tcf_result
*);
363 const struct tcf_proto_ops
*ops
;
364 struct tcf_chain
*chain
;
365 /* Lock protects tcf_proto shared state and can be used by unlocked
366 * classifiers to protect their private data.
372 struct hlist_node destroy_ht_node
;
375 struct qdisc_skb_cb
{
377 unsigned int pkt_len
;
378 u16 slave_dev_queue_mapping
;
381 #define QDISC_CB_PRIV_LEN 20
382 unsigned char data
[QDISC_CB_PRIV_LEN
];
385 typedef void tcf_chain_head_change_t(struct tcf_proto
*tp_head
, void *priv
);
388 /* Protects filter_chain. */
389 struct mutex filter_chain_lock
;
390 struct tcf_proto __rcu
*filter_chain
;
391 struct list_head list
;
392 struct tcf_block
*block
;
393 u32 index
; /* chain index */
395 unsigned int action_refcnt
;
396 bool explicitly_created
;
398 const struct tcf_proto_ops
*tmplt_ops
;
404 /* Lock protects tcf_block and lifetime-management data of chains
405 * attached to the block (refcnt, action_refcnt, explicitly_created).
408 struct list_head chain_list
;
409 u32 index
; /* block index for shared blocks */
413 struct rw_semaphore cb_lock
; /* protects cb_list and offload counters */
414 struct flow_block flow_block
;
415 struct list_head owner_list
;
417 atomic_t offloadcnt
; /* Number of offloaded filters */
418 unsigned int nooffloaddevcnt
; /* Number of devs unable to do offload */
419 unsigned int lockeddevcnt
; /* Number of devs that require rtnl lock. */
421 struct tcf_chain
*chain
;
422 struct list_head filter_chain_list
;
425 DECLARE_HASHTABLE(proto_destroy_ht
, 7);
426 struct mutex proto_destroy_lock
; /* Lock for proto_destroy hashtable. */
429 #ifdef CONFIG_PROVE_LOCKING
430 static inline bool lockdep_tcf_chain_is_locked(struct tcf_chain
*chain
)
432 return lockdep_is_held(&chain
->filter_chain_lock
);
435 static inline bool lockdep_tcf_proto_is_locked(struct tcf_proto
*tp
)
437 return lockdep_is_held(&tp
->lock
);
/* Second definition of lockdep_tcf_chain_is_locked() inside the
 * CONFIG_PROVE_LOCKING conditional (presumably the #else stub; the directive
 * itself is not visible here). The parameter is a struct tcf_chain pointer,
 * matching the first variant, so that tcf_chain_dereference() hands the same
 * argument type to whichever definition is compiled in.
 */
440 static inline bool lockdep_tcf_chain_is_locked(struct tcf_chain
*chain
)
445 static inline bool lockdep_tcf_proto_is_locked(struct tcf_proto
*tp
)
449 #endif /* #ifdef CONFIG_PROVE_LOCKING */
451 #define tcf_chain_dereference(p, chain) \
452 rcu_dereference_protected(p, lockdep_tcf_chain_is_locked(chain))
454 #define tcf_proto_dereference(p, tp) \
455 rcu_dereference_protected(p, lockdep_tcf_proto_is_locked(tp))
457 static inline void qdisc_cb_private_validate(const struct sk_buff
*skb
, int sz
)
459 struct qdisc_skb_cb
*qcb
;
461 BUILD_BUG_ON(sizeof(skb
->cb
) < offsetof(struct qdisc_skb_cb
, data
) + sz
);
462 BUILD_BUG_ON(sizeof(qcb
->data
) < sz
);
465 static inline int qdisc_qlen_cpu(const struct Qdisc
*q
)
467 return this_cpu_ptr(q
->cpu_qstats
)->qlen
;
470 static inline int qdisc_qlen(const struct Qdisc
*q
)
475 static inline int qdisc_qlen_sum(const struct Qdisc
*q
)
477 __u32 qlen
= q
->qstats
.qlen
;
480 if (qdisc_is_percpu_stats(q
)) {
481 for_each_possible_cpu(i
)
482 qlen
+= per_cpu_ptr(q
->cpu_qstats
, i
)->qlen
;
490 static inline struct qdisc_skb_cb
*qdisc_skb_cb(const struct sk_buff
*skb
)
492 return (struct qdisc_skb_cb
*)skb
->cb
;
495 static inline spinlock_t
*qdisc_lock(struct Qdisc
*qdisc
)
497 return &qdisc
->q
.lock
;
500 static inline struct Qdisc
*qdisc_root(const struct Qdisc
*qdisc
)
502 struct Qdisc
*q
= rcu_dereference_rtnl(qdisc
->dev_queue
->qdisc
);
507 static inline struct Qdisc
*qdisc_root_bh(const struct Qdisc
*qdisc
)
509 return rcu_dereference_bh(qdisc
->dev_queue
->qdisc
);
512 static inline struct Qdisc
*qdisc_root_sleeping(const struct Qdisc
*qdisc
)
514 return qdisc
->dev_queue
->qdisc_sleeping
;
517 /* The qdisc root lock is a mechanism by which the top level
518 * of a qdisc tree can be locked from any qdisc node in the
519 * forest. This allows changing the configuration of some
520 * aspect of the qdisc tree while blocking out asynchronous
521 * qdisc access in the packet processing paths.
523 * It is only legal to do this when the root will not change
524 * on us. Otherwise we'll potentially lock the wrong qdisc
525 * root. This is enforced by holding the RTNL semaphore, which
526 * all users of this lock accessor must do.
528 static inline spinlock_t
*qdisc_root_lock(const struct Qdisc
*qdisc
)
530 struct Qdisc
*root
= qdisc_root(qdisc
);
533 return qdisc_lock(root
);
536 static inline spinlock_t
*qdisc_root_sleeping_lock(const struct Qdisc
*qdisc
)
538 struct Qdisc
*root
= qdisc_root_sleeping(qdisc
);
541 return qdisc_lock(root
);
544 static inline seqcount_t
*qdisc_root_sleeping_running(const struct Qdisc
*qdisc
)
546 struct Qdisc
*root
= qdisc_root_sleeping(qdisc
);
549 return &root
->running
;
552 static inline struct net_device
*qdisc_dev(const struct Qdisc
*qdisc
)
554 return qdisc
->dev_queue
->dev
;
557 static inline void sch_tree_lock(const struct Qdisc
*q
)
559 spin_lock_bh(qdisc_root_sleeping_lock(q
));
562 static inline void sch_tree_unlock(const struct Qdisc
*q
)
564 spin_unlock_bh(qdisc_root_sleeping_lock(q
));
567 extern struct Qdisc noop_qdisc
;
568 extern struct Qdisc_ops noop_qdisc_ops
;
569 extern struct Qdisc_ops pfifo_fast_ops
;
570 extern struct Qdisc_ops mq_qdisc_ops
;
571 extern struct Qdisc_ops noqueue_qdisc_ops
;
572 extern const struct Qdisc_ops
*default_qdisc_ops
;
573 static inline const struct Qdisc_ops
*
574 get_default_qdisc_ops(const struct net_device
*dev
, int ntx
)
576 return ntx
< dev
->real_num_tx_queues
?
577 default_qdisc_ops
: &pfifo_fast_ops
;
580 struct Qdisc_class_common
{
582 struct hlist_node hnode
;
585 struct Qdisc_class_hash
{
586 struct hlist_head
*hash
;
587 unsigned int hashsize
;
588 unsigned int hashmask
;
589 unsigned int hashelems
;
592 static inline unsigned int qdisc_class_hash(u32 id
, u32 mask
)
599 static inline struct Qdisc_class_common
*
600 qdisc_class_find(const struct Qdisc_class_hash
*hash
, u32 id
)
602 struct Qdisc_class_common
*cl
;
608 h
= qdisc_class_hash(id
, hash
->hashmask
);
609 hlist_for_each_entry(cl
, &hash
->hash
[h
], hnode
) {
610 if (cl
->classid
== id
)
616 static inline int tc_classid_to_hwtc(struct net_device
*dev
, u32 classid
)
618 u32 hwtc
= TC_H_MIN(classid
) - TC_H_MIN_PRIORITY
;
620 return (hwtc
< netdev_get_num_tc(dev
)) ? hwtc
: -EINVAL
;
623 int qdisc_class_hash_init(struct Qdisc_class_hash
*);
624 void qdisc_class_hash_insert(struct Qdisc_class_hash
*,
625 struct Qdisc_class_common
*);
626 void qdisc_class_hash_remove(struct Qdisc_class_hash
*,
627 struct Qdisc_class_common
*);
628 void qdisc_class_hash_grow(struct Qdisc
*, struct Qdisc_class_hash
*);
629 void qdisc_class_hash_destroy(struct Qdisc_class_hash
*);
631 int dev_qdisc_change_tx_queue_len(struct net_device
*dev
);
632 void dev_init_scheduler(struct net_device
*dev
);
633 void dev_shutdown(struct net_device
*dev
);
634 void dev_activate(struct net_device
*dev
);
635 void dev_deactivate(struct net_device
*dev
);
636 void dev_deactivate_many(struct list_head
*head
);
637 struct Qdisc
*dev_graft_qdisc(struct netdev_queue
*dev_queue
,
638 struct Qdisc
*qdisc
);
639 void qdisc_reset(struct Qdisc
*qdisc
);
640 void qdisc_put(struct Qdisc
*qdisc
);
641 void qdisc_put_unlocked(struct Qdisc
*qdisc
);
642 void qdisc_tree_reduce_backlog(struct Qdisc
*qdisc
, int n
, int len
);
643 #ifdef CONFIG_NET_SCHED
644 int qdisc_offload_dump_helper(struct Qdisc
*q
, enum tc_setup_type type
,
646 void qdisc_offload_graft_helper(struct net_device
*dev
, struct Qdisc
*sch
,
647 struct Qdisc
*new, struct Qdisc
*old
,
648 enum tc_setup_type type
, void *type_data
,
649 struct netlink_ext_ack
*extack
);
652 qdisc_offload_dump_helper(struct Qdisc
*q
, enum tc_setup_type type
,
655 q
->flags
&= ~TCQ_F_OFFLOADED
;
660 qdisc_offload_graft_helper(struct net_device
*dev
, struct Qdisc
*sch
,
661 struct Qdisc
*new, struct Qdisc
*old
,
662 enum tc_setup_type type
, void *type_data
,
663 struct netlink_ext_ack
*extack
)
667 struct Qdisc
*qdisc_alloc(struct netdev_queue
*dev_queue
,
668 const struct Qdisc_ops
*ops
,
669 struct netlink_ext_ack
*extack
);
670 void qdisc_free(struct Qdisc
*qdisc
);
671 struct Qdisc
*qdisc_create_dflt(struct netdev_queue
*dev_queue
,
672 const struct Qdisc_ops
*ops
, u32 parentid
,
673 struct netlink_ext_ack
*extack
);
674 void __qdisc_calculate_pkt_len(struct sk_buff
*skb
,
675 const struct qdisc_size_table
*stab
);
676 int skb_do_redirect(struct sk_buff
*);
678 static inline void skb_reset_tc(struct sk_buff
*skb
)
680 #ifdef CONFIG_NET_CLS_ACT
681 skb
->tc_redirected
= 0;
685 static inline bool skb_is_tc_redirected(const struct sk_buff
*skb
)
687 #ifdef CONFIG_NET_CLS_ACT
688 return skb
->tc_redirected
;
694 static inline bool skb_at_tc_ingress(const struct sk_buff
*skb
)
696 #ifdef CONFIG_NET_CLS_ACT
697 return skb
->tc_at_ingress
;
703 static inline bool skb_skip_tc_classify(struct sk_buff
*skb
)
705 #ifdef CONFIG_NET_CLS_ACT
706 if (skb
->tc_skip_classify
) {
707 skb
->tc_skip_classify
= 0;
714 /* Reset all TX qdiscs of a device whose queue index is >= i. */
715 static inline void qdisc_reset_all_tx_gt(struct net_device
*dev
, unsigned int i
)
719 for (; i
< dev
->num_tx_queues
; i
++) {
720 qdisc
= rtnl_dereference(netdev_get_tx_queue(dev
, i
)->qdisc
);
722 spin_lock_bh(qdisc_lock(qdisc
));
724 spin_unlock_bh(qdisc_lock(qdisc
));
729 static inline void qdisc_reset_all_tx(struct net_device
*dev
)
731 qdisc_reset_all_tx_gt(dev
, 0);
734 /* Are all TX queues of the device empty? */
735 static inline bool qdisc_all_tx_empty(const struct net_device
*dev
)
740 for (i
= 0; i
< dev
->num_tx_queues
; i
++) {
741 struct netdev_queue
*txq
= netdev_get_tx_queue(dev
, i
);
742 const struct Qdisc
*q
= rcu_dereference(txq
->qdisc
);
744 if (!qdisc_is_empty(q
)) {
753 /* Are any of the TX qdiscs changing? */
754 static inline bool qdisc_tx_changing(const struct net_device
*dev
)
758 for (i
= 0; i
< dev
->num_tx_queues
; i
++) {
759 struct netdev_queue
*txq
= netdev_get_tx_queue(dev
, i
);
760 if (rcu_access_pointer(txq
->qdisc
) != txq
->qdisc_sleeping
)
766 /* Is the device using the noop qdisc on all queues? */
767 static inline bool qdisc_tx_is_noop(const struct net_device
*dev
)
771 for (i
= 0; i
< dev
->num_tx_queues
; i
++) {
772 struct netdev_queue
*txq
= netdev_get_tx_queue(dev
, i
);
773 if (rcu_access_pointer(txq
->qdisc
) != &noop_qdisc
)
779 static inline unsigned int qdisc_pkt_len(const struct sk_buff
*skb
)
781 return qdisc_skb_cb(skb
)->pkt_len
;
784 /* additional qdisc xmit flags (NET_XMIT_MASK in linux/netdevice.h) */
785 enum net_xmit_qdisc_t
{
786 __NET_XMIT_STOLEN
= 0x00010000,
787 __NET_XMIT_BYPASS
= 0x00020000,
790 #ifdef CONFIG_NET_CLS_ACT
791 #define net_xmit_drop_count(e) ((e) & __NET_XMIT_STOLEN ? 0 : 1)
793 #define net_xmit_drop_count(e) (1)
796 static inline void qdisc_calculate_pkt_len(struct sk_buff
*skb
,
797 const struct Qdisc
*sch
)
799 #ifdef CONFIG_NET_SCHED
800 struct qdisc_size_table
*stab
= rcu_dereference_bh(sch
->stab
);
803 __qdisc_calculate_pkt_len(skb
, stab
);
807 static inline int qdisc_enqueue(struct sk_buff
*skb
, struct Qdisc
*sch
,
808 struct sk_buff
**to_free
)
810 qdisc_calculate_pkt_len(skb
, sch
);
811 return sch
->enqueue(skb
, sch
, to_free
);
814 static inline void _bstats_update(struct gnet_stats_basic_packed
*bstats
,
815 __u64 bytes
, __u32 packets
)
817 bstats
->bytes
+= bytes
;
818 bstats
->packets
+= packets
;
821 static inline void bstats_update(struct gnet_stats_basic_packed
*bstats
,
822 const struct sk_buff
*skb
)
824 _bstats_update(bstats
,
826 skb_is_gso(skb
) ? skb_shinfo(skb
)->gso_segs
: 1);
829 static inline void _bstats_cpu_update(struct gnet_stats_basic_cpu
*bstats
,
830 __u64 bytes
, __u32 packets
)
832 u64_stats_update_begin(&bstats
->syncp
);
833 _bstats_update(&bstats
->bstats
, bytes
, packets
);
834 u64_stats_update_end(&bstats
->syncp
);
837 static inline void bstats_cpu_update(struct gnet_stats_basic_cpu
*bstats
,
838 const struct sk_buff
*skb
)
840 u64_stats_update_begin(&bstats
->syncp
);
841 bstats_update(&bstats
->bstats
, skb
);
842 u64_stats_update_end(&bstats
->syncp
);
845 static inline void qdisc_bstats_cpu_update(struct Qdisc
*sch
,
846 const struct sk_buff
*skb
)
848 bstats_cpu_update(this_cpu_ptr(sch
->cpu_bstats
), skb
);
851 static inline void qdisc_bstats_update(struct Qdisc
*sch
,
852 const struct sk_buff
*skb
)
854 bstats_update(&sch
->bstats
, skb
);
857 static inline void qdisc_qstats_backlog_dec(struct Qdisc
*sch
,
858 const struct sk_buff
*skb
)
860 sch
->qstats
.backlog
-= qdisc_pkt_len(skb
);
863 static inline void qdisc_qstats_cpu_backlog_dec(struct Qdisc
*sch
,
864 const struct sk_buff
*skb
)
866 this_cpu_sub(sch
->cpu_qstats
->backlog
, qdisc_pkt_len(skb
));
869 static inline void qdisc_qstats_backlog_inc(struct Qdisc
*sch
,
870 const struct sk_buff
*skb
)
872 sch
->qstats
.backlog
+= qdisc_pkt_len(skb
);
875 static inline void qdisc_qstats_cpu_backlog_inc(struct Qdisc
*sch
,
876 const struct sk_buff
*skb
)
878 this_cpu_add(sch
->cpu_qstats
->backlog
, qdisc_pkt_len(skb
));
881 static inline void qdisc_qstats_cpu_qlen_inc(struct Qdisc
*sch
)
883 this_cpu_inc(sch
->cpu_qstats
->qlen
);
886 static inline void qdisc_qstats_cpu_qlen_dec(struct Qdisc
*sch
)
888 this_cpu_dec(sch
->cpu_qstats
->qlen
);
891 static inline void qdisc_qstats_cpu_requeues_inc(struct Qdisc
*sch
)
893 this_cpu_inc(sch
->cpu_qstats
->requeues
);
896 static inline void __qdisc_qstats_drop(struct Qdisc
*sch
, int count
)
898 sch
->qstats
.drops
+= count
;
901 static inline void qstats_drop_inc(struct gnet_stats_queue
*qstats
)
906 static inline void qstats_overlimit_inc(struct gnet_stats_queue
*qstats
)
908 qstats
->overlimits
++;
911 static inline void qdisc_qstats_drop(struct Qdisc
*sch
)
913 qstats_drop_inc(&sch
->qstats
);
916 static inline void qdisc_qstats_cpu_drop(struct Qdisc
*sch
)
918 this_cpu_inc(sch
->cpu_qstats
->drops
);
921 static inline void qdisc_qstats_overlimit(struct Qdisc
*sch
)
923 sch
->qstats
.overlimits
++;
926 static inline int qdisc_qstats_copy(struct gnet_dump
*d
, struct Qdisc
*sch
)
928 __u32 qlen
= qdisc_qlen_sum(sch
);
930 return gnet_stats_copy_queue(d
, sch
->cpu_qstats
, &sch
->qstats
, qlen
);
933 static inline void qdisc_qstats_qlen_backlog(struct Qdisc
*sch
, __u32
*qlen
,
936 struct gnet_stats_queue qstats
= { 0 };
937 __u32 len
= qdisc_qlen_sum(sch
);
939 __gnet_stats_copy_queue(&qstats
, sch
->cpu_qstats
, &sch
->qstats
, len
);
941 *backlog
= qstats
.backlog
;
944 static inline void qdisc_tree_flush_backlog(struct Qdisc
*sch
)
948 qdisc_qstats_qlen_backlog(sch
, &qlen
, &backlog
);
949 qdisc_tree_reduce_backlog(sch
, qlen
, backlog
);
952 static inline void qdisc_purge_queue(struct Qdisc
*sch
)
956 qdisc_qstats_qlen_backlog(sch
, &qlen
, &backlog
);
958 qdisc_tree_reduce_backlog(sch
, qlen
, backlog
);
961 static inline void qdisc_skb_head_init(struct qdisc_skb_head
*qh
)
968 static inline void __qdisc_enqueue_tail(struct sk_buff
*skb
,
969 struct qdisc_skb_head
*qh
)
971 struct sk_buff
*last
= qh
->tail
;
984 static inline int qdisc_enqueue_tail(struct sk_buff
*skb
, struct Qdisc
*sch
)
986 __qdisc_enqueue_tail(skb
, &sch
->q
);
987 qdisc_qstats_backlog_inc(sch
, skb
);
988 return NET_XMIT_SUCCESS
;
991 static inline void __qdisc_enqueue_head(struct sk_buff
*skb
,
992 struct qdisc_skb_head
*qh
)
994 skb
->next
= qh
->head
;
1002 static inline struct sk_buff
*__qdisc_dequeue_head(struct qdisc_skb_head
*qh
)
1004 struct sk_buff
*skb
= qh
->head
;
1006 if (likely(skb
!= NULL
)) {
1007 qh
->head
= skb
->next
;
1009 if (qh
->head
== NULL
)
1017 static inline struct sk_buff
*qdisc_dequeue_head(struct Qdisc
*sch
)
1019 struct sk_buff
*skb
= __qdisc_dequeue_head(&sch
->q
);
1021 if (likely(skb
!= NULL
)) {
1022 qdisc_qstats_backlog_dec(sch
, skb
);
1023 qdisc_bstats_update(sch
, skb
);
1029 /* Instead of calling kfree_skb() while root qdisc lock is held,
1030 * queue the skb for future freeing at end of __dev_xmit_skb()
1032 static inline void __qdisc_drop(struct sk_buff
*skb
, struct sk_buff
**to_free
)
1034 skb
->next
= *to_free
;
1038 static inline void __qdisc_drop_all(struct sk_buff
*skb
,
1039 struct sk_buff
**to_free
)
1042 skb
->prev
->next
= *to_free
;
1044 skb
->next
= *to_free
;
1048 static inline unsigned int __qdisc_queue_drop_head(struct Qdisc
*sch
,
1049 struct qdisc_skb_head
*qh
,
1050 struct sk_buff
**to_free
)
1052 struct sk_buff
*skb
= __qdisc_dequeue_head(qh
);
1054 if (likely(skb
!= NULL
)) {
1055 unsigned int len
= qdisc_pkt_len(skb
);
1057 qdisc_qstats_backlog_dec(sch
, skb
);
1058 __qdisc_drop(skb
, to_free
);
1065 static inline unsigned int qdisc_queue_drop_head(struct Qdisc
*sch
,
1066 struct sk_buff
**to_free
)
1068 return __qdisc_queue_drop_head(sch
, &sch
->q
, to_free
);
1071 static inline struct sk_buff
*qdisc_peek_head(struct Qdisc
*sch
)
1073 const struct qdisc_skb_head
*qh
= &sch
->q
;
1078 /* generic pseudo peek method for non-work-conserving qdisc */
1079 static inline struct sk_buff
*qdisc_peek_dequeued(struct Qdisc
*sch
)
1081 struct sk_buff
*skb
= skb_peek(&sch
->gso_skb
);
1083 /* we can reuse ->gso_skb because peek isn't called for root qdiscs */
1085 skb
= sch
->dequeue(sch
);
1088 __skb_queue_head(&sch
->gso_skb
, skb
);
1089 /* it's still part of the queue */
1090 qdisc_qstats_backlog_inc(sch
, skb
);
1098 static inline void qdisc_update_stats_at_dequeue(struct Qdisc
*sch
,
1099 struct sk_buff
*skb
)
1101 if (qdisc_is_percpu_stats(sch
)) {
1102 qdisc_qstats_cpu_backlog_dec(sch
, skb
);
1103 qdisc_bstats_cpu_update(sch
, skb
);
1104 qdisc_qstats_cpu_qlen_dec(sch
);
1106 qdisc_qstats_backlog_dec(sch
, skb
);
1107 qdisc_bstats_update(sch
, skb
);
1112 static inline void qdisc_update_stats_at_enqueue(struct Qdisc
*sch
,
1113 unsigned int pkt_len
)
1115 if (qdisc_is_percpu_stats(sch
)) {
1116 qdisc_qstats_cpu_qlen_inc(sch
);
1117 this_cpu_add(sch
->cpu_qstats
->backlog
, pkt_len
);
1119 sch
->qstats
.backlog
+= pkt_len
;
1124 /* use instead of qdisc->dequeue() for all qdiscs queried with ->peek() */
1125 static inline struct sk_buff
*qdisc_dequeue_peeked(struct Qdisc
*sch
)
1127 struct sk_buff
*skb
= skb_peek(&sch
->gso_skb
);
1130 skb
= __skb_dequeue(&sch
->gso_skb
);
1131 if (qdisc_is_percpu_stats(sch
)) {
1132 qdisc_qstats_cpu_backlog_dec(sch
, skb
);
1133 qdisc_qstats_cpu_qlen_dec(sch
);
1135 qdisc_qstats_backlog_dec(sch
, skb
);
1139 skb
= sch
->dequeue(sch
);
1145 static inline void __qdisc_reset_queue(struct qdisc_skb_head
*qh
)
1148 * We do not know the backlog in bytes of this list, it
1149 * is up to the caller to correct it
1153 rtnl_kfree_skbs(qh
->head
, qh
->tail
);
1161 static inline void qdisc_reset_queue(struct Qdisc
*sch
)
1163 __qdisc_reset_queue(&sch
->q
);
1164 sch
->qstats
.backlog
= 0;
1167 static inline struct Qdisc
*qdisc_replace(struct Qdisc
*sch
, struct Qdisc
*new,
1168 struct Qdisc
**pold
)
1176 qdisc_tree_flush_backlog(old
);
1177 sch_tree_unlock(sch
);
1182 static inline void rtnl_qdisc_drop(struct sk_buff
*skb
, struct Qdisc
*sch
)
1184 rtnl_kfree_skbs(skb
, skb
);
1185 qdisc_qstats_drop(sch
);
1188 static inline int qdisc_drop_cpu(struct sk_buff
*skb
, struct Qdisc
*sch
,
1189 struct sk_buff
**to_free
)
1191 __qdisc_drop(skb
, to_free
);
1192 qdisc_qstats_cpu_drop(sch
);
1194 return NET_XMIT_DROP
;
1197 static inline int qdisc_drop(struct sk_buff
*skb
, struct Qdisc
*sch
,
1198 struct sk_buff
**to_free
)
1200 __qdisc_drop(skb
, to_free
);
1201 qdisc_qstats_drop(sch
);
1203 return NET_XMIT_DROP
;
1206 static inline int qdisc_drop_all(struct sk_buff
*skb
, struct Qdisc
*sch
,
1207 struct sk_buff
**to_free
)
1209 __qdisc_drop_all(skb
, to_free
);
1210 qdisc_qstats_drop(sch
);
1212 return NET_XMIT_DROP
;
1215 /* Length to Time (L2T) lookup in a qdisc_rate_table, to determine how
1216 long it will take to send a packet given its size.
1218 static inline u32
qdisc_l2t(struct qdisc_rate_table
* rtab
, unsigned int pktlen
)
1220 int slot
= pktlen
+ rtab
->rate
.cell_align
+ rtab
->rate
.overhead
;
1223 slot
>>= rtab
->rate
.cell_log
;
1225 return rtab
->data
[255]*(slot
>> 8) + rtab
->data
[slot
& 0xFF];
1226 return rtab
->data
[slot
];
1229 struct psched_ratecfg
{
1230 u64 rate_bytes_ps
; /* bytes per second */
1237 static inline u64
psched_l2t_ns(const struct psched_ratecfg
*r
,
1242 if (unlikely(r
->linklayer
== TC_LINKLAYER_ATM
))
1243 return ((u64
)(DIV_ROUND_UP(len
,48)*53) * r
->mult
) >> r
->shift
;
1245 return ((u64
)len
* r
->mult
) >> r
->shift
;
1248 void psched_ratecfg_precompute(struct psched_ratecfg
*r
,
1249 const struct tc_ratespec
*conf
,
1252 static inline void psched_ratecfg_getrate(struct tc_ratespec
*res
,
1253 const struct psched_ratecfg
*r
)
1255 memset(res
, 0, sizeof(*res
));
1257 /* legacy struct tc_ratespec has a 32bit @rate field
1258 * Qdisc using 64bit rate should add new attributes
1259 * in order to maintain compatibility.
1261 res
->rate
= min_t(u64
, r
->rate_bytes_ps
, ~0U);
1263 res
->overhead
= r
->overhead
;
1264 res
->linklayer
= (r
->linklayer
& TC_LINKLAYER_MASK
);
1267 /* Mini Qdisc serves for specific needs of ingress/clsact Qdisc.
1268 * The fast path only needs to access filter list and to update stats
1271 struct tcf_proto
*filter_list
;
1272 struct gnet_stats_basic_cpu __percpu
*cpu_bstats
;
1273 struct gnet_stats_queue __percpu
*cpu_qstats
;
1274 struct rcu_head rcu
;
1277 static inline void mini_qdisc_bstats_cpu_update(struct mini_Qdisc
*miniq
,
1278 const struct sk_buff
*skb
)
1280 bstats_cpu_update(this_cpu_ptr(miniq
->cpu_bstats
), skb
);
1283 static inline void mini_qdisc_qstats_cpu_drop(struct mini_Qdisc
*miniq
)
1285 this_cpu_inc(miniq
->cpu_qstats
->drops
);
1288 struct mini_Qdisc_pair
{
1289 struct mini_Qdisc miniq1
;
1290 struct mini_Qdisc miniq2
;
1291 struct mini_Qdisc __rcu
**p_miniq
;
1294 void mini_qdisc_pair_swap(struct mini_Qdisc_pair
*miniqp
,
1295 struct tcf_proto
*tp_head
);
1296 void mini_qdisc_pair_init(struct mini_Qdisc_pair
*miniqp
, struct Qdisc
*qdisc
,
1297 struct mini_Qdisc __rcu
**p_miniq
);
1299 static inline int skb_tc_reinsert(struct sk_buff
*skb
, struct tcf_result
*res
)
1301 return res
->ingress
? netif_receive_skb(skb
) : dev_queue_xmit(skb
);