2 * net/sched/act_api.c Packet action API.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
9 * Author: Jamal Hadi Salim
14 #include <asm/uaccess.h>
15 #include <asm/system.h>
16 #include <linux/bitops.h>
17 #include <linux/config.h>
18 #include <linux/types.h>
19 #include <linux/kernel.h>
20 #include <linux/sched.h>
21 #include <linux/string.h>
23 #include <linux/socket.h>
24 #include <linux/sockios.h>
26 #include <linux/errno.h>
27 #include <linux/interrupt.h>
28 #include <linux/netdevice.h>
29 #include <linux/skbuff.h>
30 #include <linux/rtnetlink.h>
31 #include <linux/init.h>
32 #include <linux/kmod.h>
34 #include <net/sch_generic.h>
35 #include <net/act_api.h>
38 #define DPRINTK(format, args...) printk(KERN_DEBUG format, ##args)
40 #define DPRINTK(format, args...)
43 #define D2PRINTK(format, args...) printk(KERN_DEBUG format, ##args)
45 #define D2PRINTK(format, args...)
48 static struct tc_action_ops
*act_base
= NULL
;
49 static DEFINE_RWLOCK(act_mod_lock
);
51 int tcf_register_action(struct tc_action_ops
*act
)
53 struct tc_action_ops
*a
, **ap
;
55 write_lock(&act_mod_lock
);
56 for (ap
= &act_base
; (a
= *ap
) != NULL
; ap
= &a
->next
) {
57 if (act
->type
== a
->type
|| (strcmp(act
->kind
, a
->kind
) == 0)) {
58 write_unlock(&act_mod_lock
);
64 write_unlock(&act_mod_lock
);
68 int tcf_unregister_action(struct tc_action_ops
*act
)
70 struct tc_action_ops
*a
, **ap
;
73 write_lock(&act_mod_lock
);
74 for (ap
= &act_base
; (a
= *ap
) != NULL
; ap
= &a
->next
)
82 write_unlock(&act_mod_lock
);
87 static struct tc_action_ops
*tc_lookup_action_n(char *kind
)
89 struct tc_action_ops
*a
= NULL
;
92 read_lock(&act_mod_lock
);
93 for (a
= act_base
; a
; a
= a
->next
) {
94 if (strcmp(kind
, a
->kind
) == 0) {
95 if (!try_module_get(a
->owner
)) {
96 read_unlock(&act_mod_lock
);
102 read_unlock(&act_mod_lock
);
107 /* lookup by rtattr */
108 static struct tc_action_ops
*tc_lookup_action(struct rtattr
*kind
)
110 struct tc_action_ops
*a
= NULL
;
113 read_lock(&act_mod_lock
);
114 for (a
= act_base
; a
; a
= a
->next
) {
115 if (rtattr_strcmp(kind
, a
->kind
) == 0) {
116 if (!try_module_get(a
->owner
)) {
117 read_unlock(&act_mod_lock
);
123 read_unlock(&act_mod_lock
);
130 static struct tc_action_ops
*tc_lookup_action_id(u32 type
)
132 struct tc_action_ops
*a
= NULL
;
135 read_lock(&act_mod_lock
);
136 for (a
= act_base
; a
; a
= a
->next
) {
137 if (a
->type
== type
) {
138 if (!try_module_get(a
->owner
)) {
139 read_unlock(&act_mod_lock
);
145 read_unlock(&act_mod_lock
);
151 int tcf_action_exec(struct sk_buff
*skb
, struct tc_action
*act
,
152 struct tcf_result
*res
)
157 if (skb
->tc_verd
& TC_NCLS
) {
158 skb
->tc_verd
= CLR_TC_NCLS(skb
->tc_verd
);
159 D2PRINTK("(%p)tcf_action_exec: cleared TC_NCLS in %s out %s\n",
160 skb
, skb
->input_dev
? skb
->input_dev
->name
: "xxx",
165 while ((a
= act
) != NULL
) {
167 if (a
->ops
&& a
->ops
->act
) {
168 ret
= a
->ops
->act(skb
, a
, res
);
169 if (TC_MUNGED
& skb
->tc_verd
) {
170 /* copied already, allow trampling */
171 skb
->tc_verd
= SET_TC_OK2MUNGE(skb
->tc_verd
);
172 skb
->tc_verd
= CLR_TC_MUNGED(skb
->tc_verd
);
174 if (ret
== TC_ACT_REPEAT
)
175 goto repeat
; /* we need a ttl - JHS */
176 if (ret
!= TC_ACT_PIPE
)
185 void tcf_action_destroy(struct tc_action
*act
, int bind
)
189 for (a
= act
; a
; a
= act
) {
190 if (a
->ops
&& a
->ops
->cleanup
) {
191 DPRINTK("tcf_action_destroy destroying %p next %p\n",
193 if (a
->ops
->cleanup(a
, bind
) == ACT_P_DELETED
)
194 module_put(a
->ops
->owner
);
197 } else { /*FIXME: Remove later - catch insertion bugs*/
198 printk("tcf_action_destroy: BUG? destroying NULL ops\n");
206 tcf_action_dump_old(struct sk_buff
*skb
, struct tc_action
*a
, int bind
, int ref
)
210 if (a
->ops
== NULL
|| a
->ops
->dump
== NULL
)
212 return a
->ops
->dump(skb
, a
, bind
, ref
);
216 tcf_action_dump_1(struct sk_buff
*skb
, struct tc_action
*a
, int bind
, int ref
)
219 unsigned char *b
= skb
->tail
;
222 if (a
->ops
== NULL
|| a
->ops
->dump
== NULL
)
225 RTA_PUT(skb
, TCA_KIND
, IFNAMSIZ
, a
->ops
->kind
);
226 if (tcf_action_copy_stats(skb
, a
, 0))
228 r
= (struct rtattr
*) skb
->tail
;
229 RTA_PUT(skb
, TCA_OPTIONS
, 0, NULL
);
230 if ((err
= tcf_action_dump_old(skb
, a
, bind
, ref
)) > 0) {
231 r
->rta_len
= skb
->tail
- (u8
*)r
;
236 skb_trim(skb
, b
- skb
->data
);
241 tcf_action_dump(struct sk_buff
*skb
, struct tc_action
*act
, int bind
, int ref
)
245 unsigned char *b
= skb
->tail
;
248 while ((a
= act
) != NULL
) {
249 r
= (struct rtattr
*) skb
->tail
;
251 RTA_PUT(skb
, a
->order
, 0, NULL
);
252 err
= tcf_action_dump_1(skb
, a
, bind
, ref
);
255 r
->rta_len
= skb
->tail
- (u8
*)r
;
263 skb_trim(skb
, b
- skb
->data
);
267 struct tc_action
*tcf_action_init_1(struct rtattr
*rta
, struct rtattr
*est
,
268 char *name
, int ovr
, int bind
, int *err
)
271 struct tc_action_ops
*a_o
;
272 char act_name
[IFNAMSIZ
];
273 struct rtattr
*tb
[TCA_ACT_MAX
+1];
279 if (rtattr_parse_nested(tb
, TCA_ACT_MAX
, rta
) < 0)
281 kind
= tb
[TCA_ACT_KIND
-1];
284 if (rtattr_strlcpy(act_name
, kind
, IFNAMSIZ
) >= IFNAMSIZ
)
287 if (strlcpy(act_name
, name
, IFNAMSIZ
) >= IFNAMSIZ
)
291 a_o
= tc_lookup_action_n(act_name
);
295 request_module("act_%s", act_name
);
298 a_o
= tc_lookup_action_n(act_name
);
300 /* We dropped the RTNL semaphore in order to
301 * perform the module load. So, even if we
302 * succeeded in loading the module we have to
303 * tell the caller to replay the request. We
304 * indicate this using -EAGAIN.
316 a
= kmalloc(sizeof(*a
), GFP_KERNEL
);
319 memset(a
, 0, sizeof(*a
));
321 /* backward compatibility for policer */
323 *err
= a_o
->init(tb
[TCA_ACT_OPTIONS
-1], est
, a
, ovr
, bind
);
325 *err
= a_o
->init(rta
, est
, a
, ovr
, bind
);
329 /* module count goes up only when a brand new policy is created;
330 if it already exists and is only bound to in a_o->init() then
331 ACT_P_CREATED is not returned (a zero is).
333 if (*err
!= ACT_P_CREATED
)
334 module_put(a_o
->owner
);
336 DPRINTK("tcf_action_init_1: successfull %s\n", act_name
);
344 module_put(a_o
->owner
);
349 struct tc_action
*tcf_action_init(struct rtattr
*rta
, struct rtattr
*est
,
350 char *name
, int ovr
, int bind
, int *err
)
352 struct rtattr
*tb
[TCA_ACT_MAX_PRIO
+1];
353 struct tc_action
*head
= NULL
, *act
, *act_prev
= NULL
;
356 if (rtattr_parse_nested(tb
, TCA_ACT_MAX_PRIO
, rta
) < 0) {
361 for (i
=0; i
< TCA_ACT_MAX_PRIO
&& tb
[i
]; i
++) {
362 act
= tcf_action_init_1(tb
[i
], est
, name
, ovr
, bind
, err
);
370 act_prev
->next
= act
;
377 tcf_action_destroy(head
, bind
);
381 int tcf_action_copy_stats(struct sk_buff
*skb
, struct tc_action
*a
,
386 struct tcf_act_hdr
*h
= a
->priv
;
391 /* compat_mode being true specifies a call that is supposed
392 * to add additional backward compatibility statistic TLVs.
395 if (a
->type
== TCA_OLD_COMPAT
)
396 err
= gnet_stats_start_copy_compat(skb
, 0,
397 TCA_STATS
, TCA_XSTATS
, h
->stats_lock
, &d
);
401 err
= gnet_stats_start_copy(skb
, TCA_ACT_STATS
,
407 if (a
->ops
!= NULL
&& a
->ops
->get_stats
!= NULL
)
408 if (a
->ops
->get_stats(skb
, a
) < 0)
411 if (gnet_stats_copy_basic(&d
, &h
->bstats
) < 0 ||
412 #ifdef CONFIG_NET_ESTIMATOR
413 gnet_stats_copy_rate_est(&d
, &h
->rate_est
) < 0 ||
415 gnet_stats_copy_queue(&d
, &h
->qstats
) < 0)
418 if (gnet_stats_finish_copy(&d
) < 0)
428 tca_get_fill(struct sk_buff
*skb
, struct tc_action
*a
, u32 pid
, u32 seq
,
429 u16 flags
, int event
, int bind
, int ref
)
432 struct nlmsghdr
*nlh
;
433 unsigned char *b
= skb
->tail
;
436 nlh
= NLMSG_NEW(skb
, pid
, seq
, event
, sizeof(*t
), flags
);
439 t
->tca_family
= AF_UNSPEC
;
443 x
= (struct rtattr
*) skb
->tail
;
444 RTA_PUT(skb
, TCA_ACT_TAB
, 0, NULL
);
446 if (tcf_action_dump(skb
, a
, bind
, ref
) < 0)
449 x
->rta_len
= skb
->tail
- (u8
*)x
;
451 nlh
->nlmsg_len
= skb
->tail
- b
;
456 skb_trim(skb
, b
- skb
->data
);
461 act_get_notify(u32 pid
, struct nlmsghdr
*n
, struct tc_action
*a
, int event
)
466 skb
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
469 if (tca_get_fill(skb
, a
, pid
, n
->nlmsg_seq
, 0, event
, 0, 0) <= 0) {
473 err
= netlink_unicast(rtnl
, skb
, pid
, MSG_DONTWAIT
);
479 static struct tc_action
*
480 tcf_action_get_1(struct rtattr
*rta
, struct nlmsghdr
*n
, u32 pid
, int *err
)
482 struct rtattr
*tb
[TCA_ACT_MAX
+1];
487 if (rtattr_parse_nested(tb
, TCA_ACT_MAX
, rta
) < 0)
490 if (tb
[TCA_ACT_INDEX
- 1] == NULL
||
491 RTA_PAYLOAD(tb
[TCA_ACT_INDEX
- 1]) < sizeof(index
))
493 index
= *(int *)RTA_DATA(tb
[TCA_ACT_INDEX
- 1]);
496 a
= kmalloc(sizeof(struct tc_action
), GFP_KERNEL
);
499 memset(a
, 0, sizeof(struct tc_action
));
502 a
->ops
= tc_lookup_action(tb
[TCA_ACT_KIND
- 1]);
505 if (a
->ops
->lookup
== NULL
)
508 if (a
->ops
->lookup(a
, index
) == 0)
511 module_put(a
->ops
->owner
);
515 module_put(a
->ops
->owner
);
521 static void cleanup_a(struct tc_action
*act
)
525 for (a
= act
; a
; a
= act
) {
531 static struct tc_action
*create_a(int i
)
533 struct tc_action
*act
;
535 act
= kmalloc(sizeof(*act
), GFP_KERNEL
);
537 printk("create_a: failed to alloc!\n");
540 memset(act
, 0, sizeof(*act
));
545 static int tca_action_flush(struct rtattr
*rta
, struct nlmsghdr
*n
, u32 pid
)
549 struct nlmsghdr
*nlh
;
551 struct netlink_callback dcb
;
553 struct rtattr
*tb
[TCA_ACT_MAX
+1];
555 struct tc_action
*a
= create_a(0);
559 printk("tca_action_flush: couldnt create tc_action\n");
563 skb
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
565 printk("tca_action_flush: failed skb alloc\n");
570 b
= (unsigned char *)skb
->tail
;
572 if (rtattr_parse_nested(tb
, TCA_ACT_MAX
, rta
) < 0)
575 kind
= tb
[TCA_ACT_KIND
-1];
576 a
->ops
= tc_lookup_action(kind
);
580 nlh
= NLMSG_PUT(skb
, pid
, n
->nlmsg_seq
, RTM_DELACTION
, sizeof(*t
));
582 t
->tca_family
= AF_UNSPEC
;
586 x
= (struct rtattr
*) skb
->tail
;
587 RTA_PUT(skb
, TCA_ACT_TAB
, 0, NULL
);
589 err
= a
->ops
->walk(skb
, &dcb
, RTM_DELACTION
, a
);
593 x
->rta_len
= skb
->tail
- (u8
*) x
;
595 nlh
->nlmsg_len
= skb
->tail
- b
;
596 nlh
->nlmsg_flags
|= NLM_F_ROOT
;
597 module_put(a
->ops
->owner
);
599 err
= rtnetlink_send(skb
, pid
, RTNLGRP_TC
, n
->nlmsg_flags
&NLM_F_ECHO
);
607 module_put(a
->ops
->owner
);
615 tca_action_gd(struct rtattr
*rta
, struct nlmsghdr
*n
, u32 pid
, int event
)
618 struct rtattr
*tb
[TCA_ACT_MAX_PRIO
+1];
619 struct tc_action
*head
= NULL
, *act
, *act_prev
= NULL
;
621 if (rtattr_parse_nested(tb
, TCA_ACT_MAX_PRIO
, rta
) < 0)
624 if (event
== RTM_DELACTION
&& n
->nlmsg_flags
&NLM_F_ROOT
) {
625 if (tb
[0] != NULL
&& tb
[1] == NULL
)
626 return tca_action_flush(tb
[0], n
, pid
);
629 for (i
=0; i
< TCA_ACT_MAX_PRIO
&& tb
[i
]; i
++) {
630 act
= tcf_action_get_1(tb
[i
], n
, pid
, &ret
);
638 act_prev
->next
= act
;
642 if (event
== RTM_GETACTION
)
643 ret
= act_get_notify(pid
, n
, head
, event
);
647 skb
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
653 if (tca_get_fill(skb
, head
, pid
, n
->nlmsg_seq
, 0, event
,
660 /* now do the delete */
661 tcf_action_destroy(head
, 0);
662 ret
= rtnetlink_send(skb
, pid
, RTNLGRP_TC
,
663 n
->nlmsg_flags
&NLM_F_ECHO
);
673 static int tcf_add_notify(struct tc_action
*a
, u32 pid
, u32 seq
, int event
,
677 struct nlmsghdr
*nlh
;
683 skb
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
687 b
= (unsigned char *)skb
->tail
;
689 nlh
= NLMSG_NEW(skb
, pid
, seq
, event
, sizeof(*t
), flags
);
691 t
->tca_family
= AF_UNSPEC
;
695 x
= (struct rtattr
*) skb
->tail
;
696 RTA_PUT(skb
, TCA_ACT_TAB
, 0, NULL
);
698 if (tcf_action_dump(skb
, a
, 0, 0) < 0)
701 x
->rta_len
= skb
->tail
- (u8
*)x
;
703 nlh
->nlmsg_len
= skb
->tail
- b
;
704 NETLINK_CB(skb
).dst_group
= RTNLGRP_TC
;
706 err
= rtnetlink_send(skb
, pid
, RTNLGRP_TC
, flags
&NLM_F_ECHO
);
719 tcf_action_add(struct rtattr
*rta
, struct nlmsghdr
*n
, u32 pid
, int ovr
)
722 struct tc_action
*act
;
724 u32 seq
= n
->nlmsg_seq
;
726 act
= tcf_action_init(rta
, NULL
, NULL
, ovr
, 0, &ret
);
730 /* dump then free all the actions after update; inserted policy
733 ret
= tcf_add_notify(act
, pid
, seq
, RTM_NEWACTION
, n
->nlmsg_flags
);
734 for (a
= act
; a
; a
= act
) {
742 static int tc_ctl_action(struct sk_buff
*skb
, struct nlmsghdr
*n
, void *arg
)
744 struct rtattr
**tca
= arg
;
745 u32 pid
= skb
? NETLINK_CB(skb
).pid
: 0;
746 int ret
= 0, ovr
= 0;
748 if (tca
[TCA_ACT_TAB
-1] == NULL
) {
749 printk("tc_ctl_action: received NO action attribs\n");
753 /* n->nlmsg_flags&NLM_F_CREATE
755 switch (n
->nlmsg_type
) {
757 /* we are going to assume all other flags
758 * imply create only if it doesn't exist
759 * Note that CREATE | EXCL implies that
760 * but since we want to avoid ambiguity (e.g. when flags
761 * is zero) then just set this
763 if (n
->nlmsg_flags
&NLM_F_REPLACE
)
766 ret
= tcf_action_add(tca
[TCA_ACT_TAB
-1], n
, pid
, ovr
);
771 ret
= tca_action_gd(tca
[TCA_ACT_TAB
-1], n
, pid
, RTM_DELACTION
);
774 ret
= tca_action_gd(tca
[TCA_ACT_TAB
-1], n
, pid
, RTM_GETACTION
);
783 static struct rtattr
*
784 find_dump_kind(struct nlmsghdr
*n
)
786 struct rtattr
*tb1
, *tb2
[TCA_ACT_MAX
+1];
787 struct rtattr
*tb
[TCA_ACT_MAX_PRIO
+ 1];
788 struct rtattr
*rta
[TCAA_MAX
+ 1];
790 int min_len
= NLMSG_LENGTH(sizeof(struct tcamsg
));
791 int attrlen
= n
->nlmsg_len
- NLMSG_ALIGN(min_len
);
792 struct rtattr
*attr
= (void *) n
+ NLMSG_ALIGN(min_len
);
794 if (rtattr_parse(rta
, TCAA_MAX
, attr
, attrlen
) < 0)
796 tb1
= rta
[TCA_ACT_TAB
- 1];
800 if (rtattr_parse(tb
, TCA_ACT_MAX_PRIO
, RTA_DATA(tb1
),
801 NLMSG_ALIGN(RTA_PAYLOAD(tb1
))) < 0)
806 if (rtattr_parse(tb2
, TCA_ACT_MAX
, RTA_DATA(tb
[0]),
807 RTA_PAYLOAD(tb
[0])) < 0)
809 kind
= tb2
[TCA_ACT_KIND
-1];
815 tc_dump_action(struct sk_buff
*skb
, struct netlink_callback
*cb
)
817 struct nlmsghdr
*nlh
;
818 unsigned char *b
= skb
->tail
;
820 struct tc_action_ops
*a_o
;
823 struct tcamsg
*t
= (struct tcamsg
*) NLMSG_DATA(cb
->nlh
);
824 struct rtattr
*kind
= find_dump_kind(cb
->nlh
);
827 printk("tc_dump_action: action bad kind\n");
831 a_o
= tc_lookup_action(kind
);
836 memset(&a
, 0, sizeof(struct tc_action
));
839 if (a_o
->walk
== NULL
) {
840 printk("tc_dump_action: %s !capable of dumping table\n", a_o
->kind
);
844 nlh
= NLMSG_PUT(skb
, NETLINK_CB(cb
->skb
).pid
, cb
->nlh
->nlmsg_seq
,
845 cb
->nlh
->nlmsg_type
, sizeof(*t
));
847 t
->tca_family
= AF_UNSPEC
;
851 x
= (struct rtattr
*) skb
->tail
;
852 RTA_PUT(skb
, TCA_ACT_TAB
, 0, NULL
);
854 ret
= a_o
->walk(skb
, cb
, RTM_GETACTION
, &a
);
859 x
->rta_len
= skb
->tail
- (u8
*) x
;
862 skb_trim(skb
, (u8
*)x
- skb
->data
);
864 nlh
->nlmsg_len
= skb
->tail
- b
;
865 if (NETLINK_CB(cb
->skb
).pid
&& ret
)
866 nlh
->nlmsg_flags
|= NLM_F_MULTI
;
867 module_put(a_o
->owner
);
872 module_put(a_o
->owner
);
873 skb_trim(skb
, b
- skb
->data
);
877 static int __init
tc_action_init(void)
879 struct rtnetlink_link
*link_p
= rtnetlink_links
[PF_UNSPEC
];
882 link_p
[RTM_NEWACTION
-RTM_BASE
].doit
= tc_ctl_action
;
883 link_p
[RTM_DELACTION
-RTM_BASE
].doit
= tc_ctl_action
;
884 link_p
[RTM_GETACTION
-RTM_BASE
].doit
= tc_ctl_action
;
885 link_p
[RTM_GETACTION
-RTM_BASE
].dumpit
= tc_dump_action
;
891 subsys_initcall(tc_action_init
);
893 EXPORT_SYMBOL(tcf_register_action
);
894 EXPORT_SYMBOL(tcf_unregister_action
);
895 EXPORT_SYMBOL(tcf_action_exec
);
896 EXPORT_SYMBOL(tcf_action_dump_1
);