2 * net/sched/act_api.c Packet action API.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
9 * Author: Jamal Hadi Salim
14 #include <asm/uaccess.h>
15 #include <asm/system.h>
16 #include <linux/bitops.h>
17 #include <linux/config.h>
18 #include <linux/types.h>
19 #include <linux/kernel.h>
20 #include <linux/sched.h>
21 #include <linux/string.h>
23 #include <linux/socket.h>
24 #include <linux/sockios.h>
26 #include <linux/errno.h>
27 #include <linux/interrupt.h>
28 #include <linux/netdevice.h>
29 #include <linux/skbuff.h>
30 #include <linux/rtnetlink.h>
31 #include <linux/init.h>
32 #include <linux/kmod.h>
34 #include <net/sch_generic.h>
35 #include <net/act_api.h>
38 #define DPRINTK(format, args...) printk(KERN_DEBUG format, ##args)
40 #define DPRINTK(format, args...)
43 #define D2PRINTK(format, args...) printk(KERN_DEBUG format, ##args)
45 #define D2PRINTK(format, args...)
48 static struct tc_action_ops
*act_base
= NULL
;
49 static DEFINE_RWLOCK(act_mod_lock
);
51 int tcf_register_action(struct tc_action_ops
*act
)
53 struct tc_action_ops
*a
, **ap
;
55 write_lock(&act_mod_lock
);
56 for (ap
= &act_base
; (a
= *ap
) != NULL
; ap
= &a
->next
) {
57 if (act
->type
== a
->type
|| (strcmp(act
->kind
, a
->kind
) == 0)) {
58 write_unlock(&act_mod_lock
);
64 write_unlock(&act_mod_lock
);
68 int tcf_unregister_action(struct tc_action_ops
*act
)
70 struct tc_action_ops
*a
, **ap
;
73 write_lock(&act_mod_lock
);
74 for (ap
= &act_base
; (a
= *ap
) != NULL
; ap
= &a
->next
)
82 write_unlock(&act_mod_lock
);
87 static struct tc_action_ops
*tc_lookup_action_n(char *kind
)
89 struct tc_action_ops
*a
= NULL
;
92 read_lock(&act_mod_lock
);
93 for (a
= act_base
; a
; a
= a
->next
) {
94 if (strcmp(kind
, a
->kind
) == 0) {
95 if (!try_module_get(a
->owner
)) {
96 read_unlock(&act_mod_lock
);
102 read_unlock(&act_mod_lock
);
107 /* lookup by rtattr */
108 static struct tc_action_ops
*tc_lookup_action(struct rtattr
*kind
)
110 struct tc_action_ops
*a
= NULL
;
113 read_lock(&act_mod_lock
);
114 for (a
= act_base
; a
; a
= a
->next
) {
115 if (rtattr_strcmp(kind
, a
->kind
) == 0) {
116 if (!try_module_get(a
->owner
)) {
117 read_unlock(&act_mod_lock
);
123 read_unlock(&act_mod_lock
);
130 static struct tc_action_ops
*tc_lookup_action_id(u32 type
)
132 struct tc_action_ops
*a
= NULL
;
135 read_lock(&act_mod_lock
);
136 for (a
= act_base
; a
; a
= a
->next
) {
137 if (a
->type
== type
) {
138 if (!try_module_get(a
->owner
)) {
139 read_unlock(&act_mod_lock
);
145 read_unlock(&act_mod_lock
);
151 int tcf_action_exec(struct sk_buff
*skb
, struct tc_action
*act
,
152 struct tcf_result
*res
)
157 if (skb
->tc_verd
& TC_NCLS
) {
158 skb
->tc_verd
= CLR_TC_NCLS(skb
->tc_verd
);
159 D2PRINTK("(%p)tcf_action_exec: cleared TC_NCLS in %s out %s\n",
160 skb
, skb
->input_dev
? skb
->input_dev
->name
: "xxx",
165 while ((a
= act
) != NULL
) {
167 if (a
->ops
&& a
->ops
->act
) {
168 ret
= a
->ops
->act(&skb
, a
);
169 if (TC_MUNGED
& skb
->tc_verd
) {
170 /* copied already, allow trampling */
171 skb
->tc_verd
= SET_TC_OK2MUNGE(skb
->tc_verd
);
172 skb
->tc_verd
= CLR_TC_MUNGED(skb
->tc_verd
);
174 if (ret
== TC_ACT_REPEAT
)
175 goto repeat
; /* we need a ttl - JHS */
176 if (ret
!= TC_ACT_PIPE
)
182 if (skb
->tc_classid
> 0) {
183 res
->classid
= skb
->tc_classid
;
190 void tcf_action_destroy(struct tc_action
*act
, int bind
)
194 for (a
= act
; a
; a
= act
) {
195 if (a
->ops
&& a
->ops
->cleanup
) {
196 DPRINTK("tcf_action_destroy destroying %p next %p\n",
198 if (a
->ops
->cleanup(a
, bind
) == ACT_P_DELETED
)
199 module_put(a
->ops
->owner
);
202 } else { /*FIXME: Remove later - catch insertion bugs*/
203 printk("tcf_action_destroy: BUG? destroying NULL ops\n");
211 tcf_action_dump_old(struct sk_buff
*skb
, struct tc_action
*a
, int bind
, int ref
)
215 if (a
->ops
== NULL
|| a
->ops
->dump
== NULL
)
217 return a
->ops
->dump(skb
, a
, bind
, ref
);
221 tcf_action_dump_1(struct sk_buff
*skb
, struct tc_action
*a
, int bind
, int ref
)
224 unsigned char *b
= skb
->tail
;
227 if (a
->ops
== NULL
|| a
->ops
->dump
== NULL
)
230 RTA_PUT(skb
, TCA_KIND
, IFNAMSIZ
, a
->ops
->kind
);
231 if (tcf_action_copy_stats(skb
, a
, 0))
233 r
= (struct rtattr
*) skb
->tail
;
234 RTA_PUT(skb
, TCA_OPTIONS
, 0, NULL
);
235 if ((err
= tcf_action_dump_old(skb
, a
, bind
, ref
)) > 0) {
236 r
->rta_len
= skb
->tail
- (u8
*)r
;
241 skb_trim(skb
, b
- skb
->data
);
246 tcf_action_dump(struct sk_buff
*skb
, struct tc_action
*act
, int bind
, int ref
)
250 unsigned char *b
= skb
->tail
;
253 while ((a
= act
) != NULL
) {
254 r
= (struct rtattr
*) skb
->tail
;
256 RTA_PUT(skb
, a
->order
, 0, NULL
);
257 err
= tcf_action_dump_1(skb
, a
, bind
, ref
);
260 r
->rta_len
= skb
->tail
- (u8
*)r
;
266 skb_trim(skb
, b
- skb
->data
);
270 struct tc_action
*tcf_action_init_1(struct rtattr
*rta
, struct rtattr
*est
,
271 char *name
, int ovr
, int bind
, int *err
)
274 struct tc_action_ops
*a_o
;
275 char act_name
[IFNAMSIZ
];
276 struct rtattr
*tb
[TCA_ACT_MAX
+1];
282 if (rtattr_parse_nested(tb
, TCA_ACT_MAX
, rta
) < 0)
284 kind
= tb
[TCA_ACT_KIND
-1];
287 if (rtattr_strlcpy(act_name
, kind
, IFNAMSIZ
) >= IFNAMSIZ
)
290 if (strlcpy(act_name
, name
, IFNAMSIZ
) >= IFNAMSIZ
)
294 a_o
= tc_lookup_action_n(act_name
);
298 request_module(act_name
);
301 a_o
= tc_lookup_action_n(act_name
);
303 /* We dropped the RTNL semaphore in order to
304 * perform the module load. So, even if we
305 * succeeded in loading the module we have to
306 * tell the caller to replay the request. We
307 * indicate this using -EAGAIN.
318 a
= kmalloc(sizeof(*a
), GFP_KERNEL
);
321 memset(a
, 0, sizeof(*a
));
323 /* backward compatibility for policer */
325 *err
= a_o
->init(tb
[TCA_ACT_OPTIONS
-1], est
, a
, ovr
, bind
);
327 *err
= a_o
->init(rta
, est
, a
, ovr
, bind
);
331 /* module count goes up only when a brand new policy is created;
332 if it already exists and is only bound to in a_o->init() then
333 ACT_P_CREATED is not returned (a zero is).
335 if (*err
!= ACT_P_CREATED
)
336 module_put(a_o
->owner
);
338 DPRINTK("tcf_action_init_1: successfull %s\n", act_name
);
346 module_put(a_o
->owner
);
351 struct tc_action
*tcf_action_init(struct rtattr
*rta
, struct rtattr
*est
,
352 char *name
, int ovr
, int bind
, int *err
)
354 struct rtattr
*tb
[TCA_ACT_MAX_PRIO
+1];
355 struct tc_action
*head
= NULL
, *act
, *act_prev
= NULL
;
358 if (rtattr_parse_nested(tb
, TCA_ACT_MAX_PRIO
, rta
) < 0) {
363 for (i
=0; i
< TCA_ACT_MAX_PRIO
&& tb
[i
]; i
++) {
364 act
= tcf_action_init_1(tb
[i
], est
, name
, ovr
, bind
, err
);
372 act_prev
->next
= act
;
379 tcf_action_destroy(head
, bind
);
383 int tcf_action_copy_stats(struct sk_buff
*skb
, struct tc_action
*a
,
388 struct tcf_act_hdr
*h
= a
->priv
;
393 /* compat_mode being true specifies a call that is supposed
394 * to add additional backward compatibility statistic TLVs.
397 if (a
->type
== TCA_OLD_COMPAT
)
398 err
= gnet_stats_start_copy_compat(skb
, 0,
399 TCA_STATS
, TCA_XSTATS
, h
->stats_lock
, &d
);
403 err
= gnet_stats_start_copy(skb
, TCA_ACT_STATS
,
409 if (a
->ops
!= NULL
&& a
->ops
->get_stats
!= NULL
)
410 if (a
->ops
->get_stats(skb
, a
) < 0)
413 if (gnet_stats_copy_basic(&d
, &h
->bstats
) < 0 ||
414 #ifdef CONFIG_NET_ESTIMATOR
415 gnet_stats_copy_rate_est(&d
, &h
->rate_est
) < 0 ||
417 gnet_stats_copy_queue(&d
, &h
->qstats
) < 0)
420 if (gnet_stats_finish_copy(&d
) < 0)
430 tca_get_fill(struct sk_buff
*skb
, struct tc_action
*a
, u32 pid
, u32 seq
,
431 u16 flags
, int event
, int bind
, int ref
)
434 struct nlmsghdr
*nlh
;
435 unsigned char *b
= skb
->tail
;
438 nlh
= NLMSG_NEW(skb
, pid
, seq
, event
, sizeof(*t
), flags
);
441 t
->tca_family
= AF_UNSPEC
;
445 x
= (struct rtattr
*) skb
->tail
;
446 RTA_PUT(skb
, TCA_ACT_TAB
, 0, NULL
);
448 if (tcf_action_dump(skb
, a
, bind
, ref
) < 0)
451 x
->rta_len
= skb
->tail
- (u8
*)x
;
453 nlh
->nlmsg_len
= skb
->tail
- b
;
458 skb_trim(skb
, b
- skb
->data
);
463 act_get_notify(u32 pid
, struct nlmsghdr
*n
, struct tc_action
*a
, int event
)
468 skb
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
471 if (tca_get_fill(skb
, a
, pid
, n
->nlmsg_seq
, 0, event
, 0, 0) <= 0) {
475 err
= netlink_unicast(rtnl
, skb
, pid
, MSG_DONTWAIT
);
481 static struct tc_action
*
482 tcf_action_get_1(struct rtattr
*rta
, struct nlmsghdr
*n
, u32 pid
, int *err
)
484 struct rtattr
*tb
[TCA_ACT_MAX
+1];
489 if (rtattr_parse_nested(tb
, TCA_ACT_MAX
, rta
) < 0)
492 if (tb
[TCA_ACT_INDEX
- 1] == NULL
||
493 RTA_PAYLOAD(tb
[TCA_ACT_INDEX
- 1]) < sizeof(index
))
495 index
= *(int *)RTA_DATA(tb
[TCA_ACT_INDEX
- 1]);
498 a
= kmalloc(sizeof(struct tc_action
), GFP_KERNEL
);
501 memset(a
, 0, sizeof(struct tc_action
));
504 a
->ops
= tc_lookup_action(tb
[TCA_ACT_KIND
- 1]);
507 if (a
->ops
->lookup
== NULL
)
510 if (a
->ops
->lookup(a
, index
) == 0)
513 module_put(a
->ops
->owner
);
517 module_put(a
->ops
->owner
);
523 static void cleanup_a(struct tc_action
*act
)
527 for (a
= act
; a
; a
= act
) {
533 static struct tc_action
*create_a(int i
)
535 struct tc_action
*act
;
537 act
= kmalloc(sizeof(*act
), GFP_KERNEL
);
539 printk("create_a: failed to alloc!\n");
542 memset(act
, 0, sizeof(*act
));
547 static int tca_action_flush(struct rtattr
*rta
, struct nlmsghdr
*n
, u32 pid
)
551 struct nlmsghdr
*nlh
;
553 struct netlink_callback dcb
;
555 struct rtattr
*tb
[TCA_ACT_MAX
+1];
557 struct tc_action
*a
= create_a(0);
561 printk("tca_action_flush: couldnt create tc_action\n");
565 skb
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
567 printk("tca_action_flush: failed skb alloc\n");
572 b
= (unsigned char *)skb
->tail
;
574 if (rtattr_parse_nested(tb
, TCA_ACT_MAX
, rta
) < 0)
577 kind
= tb
[TCA_ACT_KIND
-1];
578 a
->ops
= tc_lookup_action(kind
);
582 nlh
= NLMSG_PUT(skb
, pid
, n
->nlmsg_seq
, RTM_DELACTION
, sizeof(*t
));
584 t
->tca_family
= AF_UNSPEC
;
588 x
= (struct rtattr
*) skb
->tail
;
589 RTA_PUT(skb
, TCA_ACT_TAB
, 0, NULL
);
591 err
= a
->ops
->walk(skb
, &dcb
, RTM_DELACTION
, a
);
595 x
->rta_len
= skb
->tail
- (u8
*) x
;
597 nlh
->nlmsg_len
= skb
->tail
- b
;
598 nlh
->nlmsg_flags
|= NLM_F_ROOT
;
599 module_put(a
->ops
->owner
);
601 err
= rtnetlink_send(skb
, pid
, RTMGRP_TC
, n
->nlmsg_flags
&NLM_F_ECHO
);
608 module_put(a
->ops
->owner
);
617 tca_action_gd(struct rtattr
*rta
, struct nlmsghdr
*n
, u32 pid
, int event
)
620 struct rtattr
*tb
[TCA_ACT_MAX_PRIO
+1];
621 struct tc_action
*head
= NULL
, *act
, *act_prev
= NULL
;
623 if (rtattr_parse_nested(tb
, TCA_ACT_MAX_PRIO
, rta
) < 0)
626 if (event
== RTM_DELACTION
&& n
->nlmsg_flags
&NLM_F_ROOT
) {
627 if (tb
[0] != NULL
&& tb
[1] == NULL
)
628 return tca_action_flush(tb
[0], n
, pid
);
631 for (i
=0; i
< TCA_ACT_MAX_PRIO
&& tb
[i
]; i
++) {
632 act
= tcf_action_get_1(tb
[i
], n
, pid
, &ret
);
640 act_prev
->next
= act
;
644 if (event
== RTM_GETACTION
)
645 ret
= act_get_notify(pid
, n
, head
, event
);
649 skb
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
655 if (tca_get_fill(skb
, head
, pid
, n
->nlmsg_seq
, 0, event
,
662 /* now do the delete */
663 tcf_action_destroy(head
, 0);
664 ret
= rtnetlink_send(skb
, pid
, RTMGRP_TC
,
665 n
->nlmsg_flags
&NLM_F_ECHO
);
675 static int tcf_add_notify(struct tc_action
*a
, u32 pid
, u32 seq
, int event
,
679 struct nlmsghdr
*nlh
;
685 skb
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
689 b
= (unsigned char *)skb
->tail
;
691 nlh
= NLMSG_NEW(skb
, pid
, seq
, event
, sizeof(*t
), flags
);
693 t
->tca_family
= AF_UNSPEC
;
697 x
= (struct rtattr
*) skb
->tail
;
698 RTA_PUT(skb
, TCA_ACT_TAB
, 0, NULL
);
700 if (tcf_action_dump(skb
, a
, 0, 0) < 0)
703 x
->rta_len
= skb
->tail
- (u8
*)x
;
705 nlh
->nlmsg_len
= skb
->tail
- b
;
706 NETLINK_CB(skb
).dst_groups
= RTMGRP_TC
;
708 err
= rtnetlink_send(skb
, pid
, RTMGRP_TC
, flags
&NLM_F_ECHO
);
715 skb_trim(skb
, b
- skb
->data
);
721 tcf_action_add(struct rtattr
*rta
, struct nlmsghdr
*n
, u32 pid
, int ovr
)
724 struct tc_action
*act
;
726 u32 seq
= n
->nlmsg_seq
;
728 act
= tcf_action_init(rta
, NULL
, NULL
, ovr
, 0, &ret
);
732 /* dump then free all the actions after update; inserted policy
735 ret
= tcf_add_notify(act
, pid
, seq
, RTM_NEWACTION
, n
->nlmsg_flags
);
736 for (a
= act
; a
; a
= act
) {
744 static int tc_ctl_action(struct sk_buff
*skb
, struct nlmsghdr
*n
, void *arg
)
746 struct rtattr
**tca
= arg
;
747 u32 pid
= skb
? NETLINK_CB(skb
).pid
: 0;
748 int ret
= 0, ovr
= 0;
750 if (tca
[TCA_ACT_TAB
-1] == NULL
) {
751 printk("tc_ctl_action: received NO action attribs\n");
755 /* n->nlmsg_flags&NLM_F_CREATE
757 switch (n
->nlmsg_type
) {
759 /* we are going to assume all other flags
760 * imply create only if it doesn't exist.
761 * Note that CREATE | EXCL implies that,
762 * but since we want to avoid ambiguity (e.g. when flags
763 * is zero) we just set this
765 if (n
->nlmsg_flags
&NLM_F_REPLACE
)
768 ret
= tcf_action_add(tca
[TCA_ACT_TAB
-1], n
, pid
, ovr
);
773 ret
= tca_action_gd(tca
[TCA_ACT_TAB
-1], n
, pid
, RTM_DELACTION
);
776 ret
= tca_action_gd(tca
[TCA_ACT_TAB
-1], n
, pid
, RTM_GETACTION
);
786 find_dump_kind(struct nlmsghdr
*n
)
788 struct rtattr
*tb1
, *tb2
[TCA_ACT_MAX
+1];
789 struct rtattr
*tb
[TCA_ACT_MAX_PRIO
+ 1];
790 struct rtattr
*rta
[TCAA_MAX
+ 1];
792 int min_len
= NLMSG_LENGTH(sizeof(struct tcamsg
));
793 int attrlen
= n
->nlmsg_len
- NLMSG_ALIGN(min_len
);
794 struct rtattr
*attr
= (void *) n
+ NLMSG_ALIGN(min_len
);
796 if (rtattr_parse(rta
, TCAA_MAX
, attr
, attrlen
) < 0)
798 tb1
= rta
[TCA_ACT_TAB
- 1];
802 if (rtattr_parse(tb
, TCA_ACT_MAX_PRIO
, RTA_DATA(tb1
),
803 NLMSG_ALIGN(RTA_PAYLOAD(tb1
))) < 0)
808 if (rtattr_parse(tb2
, TCA_ACT_MAX
, RTA_DATA(tb
[0]),
809 RTA_PAYLOAD(tb
[0])) < 0)
811 kind
= tb2
[TCA_ACT_KIND
-1];
813 return (char *) RTA_DATA(kind
);
817 tc_dump_action(struct sk_buff
*skb
, struct netlink_callback
*cb
)
819 struct nlmsghdr
*nlh
;
820 unsigned char *b
= skb
->tail
;
822 struct tc_action_ops
*a_o
;
825 struct tcamsg
*t
= (struct tcamsg
*) NLMSG_DATA(cb
->nlh
);
826 char *kind
= find_dump_kind(cb
->nlh
);
829 printk("tc_dump_action: action bad kind\n");
833 a_o
= tc_lookup_action_n(kind
);
835 printk("failed to find %s\n", kind
);
839 memset(&a
, 0, sizeof(struct tc_action
));
842 if (a_o
->walk
== NULL
) {
843 printk("tc_dump_action: %s !capable of dumping table\n", kind
);
847 nlh
= NLMSG_PUT(skb
, NETLINK_CB(cb
->skb
).pid
, cb
->nlh
->nlmsg_seq
,
848 cb
->nlh
->nlmsg_type
, sizeof(*t
));
850 t
->tca_family
= AF_UNSPEC
;
854 x
= (struct rtattr
*) skb
->tail
;
855 RTA_PUT(skb
, TCA_ACT_TAB
, 0, NULL
);
857 ret
= a_o
->walk(skb
, cb
, RTM_GETACTION
, &a
);
862 x
->rta_len
= skb
->tail
- (u8
*) x
;
865 skb_trim(skb
, (u8
*)x
- skb
->data
);
867 nlh
->nlmsg_len
= skb
->tail
- b
;
868 if (NETLINK_CB(cb
->skb
).pid
&& ret
)
869 nlh
->nlmsg_flags
|= NLM_F_MULTI
;
870 module_put(a_o
->owner
);
875 module_put(a_o
->owner
);
876 skb_trim(skb
, b
- skb
->data
);
880 static int __init
tc_action_init(void)
882 struct rtnetlink_link
*link_p
= rtnetlink_links
[PF_UNSPEC
];
885 link_p
[RTM_NEWACTION
-RTM_BASE
].doit
= tc_ctl_action
;
886 link_p
[RTM_DELACTION
-RTM_BASE
].doit
= tc_ctl_action
;
887 link_p
[RTM_GETACTION
-RTM_BASE
].doit
= tc_ctl_action
;
888 link_p
[RTM_GETACTION
-RTM_BASE
].dumpit
= tc_dump_action
;
891 printk("TC classifier action (bugs to netdev@vger.kernel.org cc "
892 "hadi@cyberus.ca)\n");
896 subsys_initcall(tc_action_init
);
898 EXPORT_SYMBOL(tcf_register_action
);
899 EXPORT_SYMBOL(tcf_unregister_action
);
900 EXPORT_SYMBOL(tcf_action_exec
);
901 EXPORT_SYMBOL(tcf_action_dump_1
);