2 * Copyright (c) 2008, Intel Corporation.
4 * This program is free software; you can redistribute it and/or modify it
5 * under the terms and conditions of the GNU General Public License,
6 * version 2, as published by the Free Software Foundation.
8 * This program is distributed in the hope it will be useful, but WITHOUT
9 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
13 * You should have received a copy of the GNU General Public License along with
14 * this program; if not, see <http://www.gnu.org/licenses/>.
16 * Author: Alexander Duyck <alexander.h.duyck@intel.com>
19 #include <linux/module.h>
20 #include <linux/slab.h>
21 #include <linux/types.h>
22 #include <linux/kernel.h>
23 #include <linux/string.h>
24 #include <linux/errno.h>
25 #include <linux/skbuff.h>
26 #include <net/netlink.h>
27 #include <net/pkt_sched.h>
28 #include <net/pkt_cls.h>
30 struct multiq_sched_data
{
34 struct tcf_proto __rcu
*filter_list
;
35 struct tcf_block
*block
;
36 struct Qdisc
**queues
;
41 multiq_classify(struct sk_buff
*skb
, struct Qdisc
*sch
, int *qerr
)
43 struct multiq_sched_data
*q
= qdisc_priv(sch
);
45 struct tcf_result res
;
46 struct tcf_proto
*fl
= rcu_dereference_bh(q
->filter_list
);
49 *qerr
= NET_XMIT_SUCCESS
| __NET_XMIT_BYPASS
;
50 err
= tcf_classify(skb
, fl
, &res
, false);
51 #ifdef CONFIG_NET_CLS_ACT
56 *qerr
= NET_XMIT_SUCCESS
| __NET_XMIT_STOLEN
;
62 band
= skb_get_queue_mapping(skb
);
67 return q
->queues
[band
];
71 multiq_enqueue(struct sk_buff
*skb
, struct Qdisc
*sch
,
72 struct sk_buff
**to_free
)
77 qdisc
= multiq_classify(skb
, sch
, &ret
);
78 #ifdef CONFIG_NET_CLS_ACT
81 if (ret
& __NET_XMIT_BYPASS
)
82 qdisc_qstats_drop(sch
);
83 __qdisc_drop(skb
, to_free
);
88 ret
= qdisc_enqueue(skb
, qdisc
, to_free
);
89 if (ret
== NET_XMIT_SUCCESS
) {
91 return NET_XMIT_SUCCESS
;
93 if (net_xmit_drop_count(ret
))
94 qdisc_qstats_drop(sch
);
98 static struct sk_buff
*multiq_dequeue(struct Qdisc
*sch
)
100 struct multiq_sched_data
*q
= qdisc_priv(sch
);
105 for (band
= 0; band
< q
->bands
; band
++) {
106 /* cycle through bands to ensure fairness */
108 if (q
->curband
>= q
->bands
)
111 /* Check that target subqueue is available before
112 * pulling an skb to avoid head-of-line blocking.
114 if (!netif_xmit_stopped(
115 netdev_get_tx_queue(qdisc_dev(sch
), q
->curband
))) {
116 qdisc
= q
->queues
[q
->curband
];
117 skb
= qdisc
->dequeue(qdisc
);
119 qdisc_bstats_update(sch
, skb
);
129 static struct sk_buff
*multiq_peek(struct Qdisc
*sch
)
131 struct multiq_sched_data
*q
= qdisc_priv(sch
);
132 unsigned int curband
= q
->curband
;
137 for (band
= 0; band
< q
->bands
; band
++) {
138 /* cycle through bands to ensure fairness */
140 if (curband
>= q
->bands
)
143 /* Check that target subqueue is available before
144 * pulling an skb to avoid head-of-line blocking.
146 if (!netif_xmit_stopped(
147 netdev_get_tx_queue(qdisc_dev(sch
), curband
))) {
148 qdisc
= q
->queues
[curband
];
149 skb
= qdisc
->ops
->peek(qdisc
);
159 multiq_reset(struct Qdisc
*sch
)
162 struct multiq_sched_data
*q
= qdisc_priv(sch
);
164 for (band
= 0; band
< q
->bands
; band
++)
165 qdisc_reset(q
->queues
[band
]);
171 multiq_destroy(struct Qdisc
*sch
)
174 struct multiq_sched_data
*q
= qdisc_priv(sch
);
176 tcf_block_put(q
->block
);
177 for (band
= 0; band
< q
->bands
; band
++)
178 qdisc_destroy(q
->queues
[band
]);
183 static int multiq_tune(struct Qdisc
*sch
, struct nlattr
*opt
,
184 struct netlink_ext_ack
*extack
)
186 struct multiq_sched_data
*q
= qdisc_priv(sch
);
187 struct tc_multiq_qopt
*qopt
;
190 if (!netif_is_multiqueue(qdisc_dev(sch
)))
192 if (nla_len(opt
) < sizeof(*qopt
))
195 qopt
= nla_data(opt
);
197 qopt
->bands
= qdisc_dev(sch
)->real_num_tx_queues
;
200 q
->bands
= qopt
->bands
;
201 for (i
= q
->bands
; i
< q
->max_bands
; i
++) {
202 if (q
->queues
[i
] != &noop_qdisc
) {
203 struct Qdisc
*child
= q
->queues
[i
];
204 q
->queues
[i
] = &noop_qdisc
;
205 qdisc_tree_reduce_backlog(child
, child
->q
.qlen
,
206 child
->qstats
.backlog
);
207 qdisc_destroy(child
);
211 sch_tree_unlock(sch
);
213 for (i
= 0; i
< q
->bands
; i
++) {
214 if (q
->queues
[i
] == &noop_qdisc
) {
215 struct Qdisc
*child
, *old
;
216 child
= qdisc_create_dflt(sch
->dev_queue
,
218 TC_H_MAKE(sch
->handle
,
223 q
->queues
[i
] = child
;
224 if (child
!= &noop_qdisc
)
225 qdisc_hash_add(child
, true);
227 if (old
!= &noop_qdisc
) {
228 qdisc_tree_reduce_backlog(old
,
230 old
->qstats
.backlog
);
233 sch_tree_unlock(sch
);
240 static int multiq_init(struct Qdisc
*sch
, struct nlattr
*opt
,
241 struct netlink_ext_ack
*extack
)
243 struct multiq_sched_data
*q
= qdisc_priv(sch
);
251 err
= tcf_block_get(&q
->block
, &q
->filter_list
, sch
, extack
);
255 q
->max_bands
= qdisc_dev(sch
)->num_tx_queues
;
257 q
->queues
= kcalloc(q
->max_bands
, sizeof(struct Qdisc
*), GFP_KERNEL
);
260 for (i
= 0; i
< q
->max_bands
; i
++)
261 q
->queues
[i
] = &noop_qdisc
;
263 return multiq_tune(sch
, opt
, extack
);
266 static int multiq_dump(struct Qdisc
*sch
, struct sk_buff
*skb
)
268 struct multiq_sched_data
*q
= qdisc_priv(sch
);
269 unsigned char *b
= skb_tail_pointer(skb
);
270 struct tc_multiq_qopt opt
;
272 opt
.bands
= q
->bands
;
273 opt
.max_bands
= q
->max_bands
;
275 if (nla_put(skb
, TCA_OPTIONS
, sizeof(opt
), &opt
))
276 goto nla_put_failure
;
285 static int multiq_graft(struct Qdisc
*sch
, unsigned long arg
, struct Qdisc
*new,
286 struct Qdisc
**old
, struct netlink_ext_ack
*extack
)
288 struct multiq_sched_data
*q
= qdisc_priv(sch
);
289 unsigned long band
= arg
- 1;
294 *old
= qdisc_replace(sch
, new, &q
->queues
[band
]);
298 static struct Qdisc
*
299 multiq_leaf(struct Qdisc
*sch
, unsigned long arg
)
301 struct multiq_sched_data
*q
= qdisc_priv(sch
);
302 unsigned long band
= arg
- 1;
304 return q
->queues
[band
];
307 static unsigned long multiq_find(struct Qdisc
*sch
, u32 classid
)
309 struct multiq_sched_data
*q
= qdisc_priv(sch
);
310 unsigned long band
= TC_H_MIN(classid
);
312 if (band
- 1 >= q
->bands
)
317 static unsigned long multiq_bind(struct Qdisc
*sch
, unsigned long parent
,
320 return multiq_find(sch
, classid
);
324 static void multiq_unbind(struct Qdisc
*q
, unsigned long cl
)
328 static int multiq_dump_class(struct Qdisc
*sch
, unsigned long cl
,
329 struct sk_buff
*skb
, struct tcmsg
*tcm
)
331 struct multiq_sched_data
*q
= qdisc_priv(sch
);
333 tcm
->tcm_handle
|= TC_H_MIN(cl
);
334 tcm
->tcm_info
= q
->queues
[cl
- 1]->handle
;
338 static int multiq_dump_class_stats(struct Qdisc
*sch
, unsigned long cl
,
341 struct multiq_sched_data
*q
= qdisc_priv(sch
);
344 cl_q
= q
->queues
[cl
- 1];
345 if (gnet_stats_copy_basic(qdisc_root_sleeping_running(sch
),
346 d
, NULL
, &cl_q
->bstats
) < 0 ||
347 gnet_stats_copy_queue(d
, NULL
, &cl_q
->qstats
, cl_q
->q
.qlen
) < 0)
353 static void multiq_walk(struct Qdisc
*sch
, struct qdisc_walker
*arg
)
355 struct multiq_sched_data
*q
= qdisc_priv(sch
);
361 for (band
= 0; band
< q
->bands
; band
++) {
362 if (arg
->count
< arg
->skip
) {
366 if (arg
->fn(sch
, band
+ 1, arg
) < 0) {
374 static struct tcf_block
*multiq_tcf_block(struct Qdisc
*sch
, unsigned long cl
,
375 struct netlink_ext_ack
*extack
)
377 struct multiq_sched_data
*q
= qdisc_priv(sch
);
384 static const struct Qdisc_class_ops multiq_class_ops
= {
385 .graft
= multiq_graft
,
389 .tcf_block
= multiq_tcf_block
,
390 .bind_tcf
= multiq_bind
,
391 .unbind_tcf
= multiq_unbind
,
392 .dump
= multiq_dump_class
,
393 .dump_stats
= multiq_dump_class_stats
,
396 static struct Qdisc_ops multiq_qdisc_ops __read_mostly
= {
398 .cl_ops
= &multiq_class_ops
,
400 .priv_size
= sizeof(struct multiq_sched_data
),
401 .enqueue
= multiq_enqueue
,
402 .dequeue
= multiq_dequeue
,
405 .reset
= multiq_reset
,
406 .destroy
= multiq_destroy
,
407 .change
= multiq_tune
,
409 .owner
= THIS_MODULE
,
412 static int __init
multiq_module_init(void)
414 return register_qdisc(&multiq_qdisc_ops
);
417 static void __exit
multiq_module_exit(void)
419 unregister_qdisc(&multiq_qdisc_ops
);
422 module_init(multiq_module_init
)
423 module_exit(multiq_module_exit
)
425 MODULE_LICENSE("GPL");