1 // SPDX-License-Identifier: GPL-2.0-or-later
3 * net/sched/act_api.c Packet action API.
5 * Author: Jamal Hadi Salim
8 #include <linux/types.h>
9 #include <linux/kernel.h>
10 #include <linux/string.h>
11 #include <linux/errno.h>
12 #include <linux/slab.h>
13 #include <linux/skbuff.h>
14 #include <linux/init.h>
15 #include <linux/kmod.h>
16 #include <linux/err.h>
17 #include <linux/module.h>
18 #include <net/net_namespace.h>
20 #include <net/sch_generic.h>
21 #include <net/pkt_cls.h>
22 #include <net/act_api.h>
23 #include <net/netlink.h>
25 static void tcf_action_goto_chain_exec(const struct tc_action
*a
,
26 struct tcf_result
*res
)
28 const struct tcf_chain
*chain
= rcu_dereference_bh(a
->goto_chain
);
30 res
->goto_tp
= rcu_dereference_bh(chain
->filter_chain
);
33 static void tcf_free_cookie_rcu(struct rcu_head
*p
)
35 struct tc_cookie
*cookie
= container_of(p
, struct tc_cookie
, rcu
);
41 static void tcf_set_action_cookie(struct tc_cookie __rcu
**old_cookie
,
42 struct tc_cookie
*new_cookie
)
44 struct tc_cookie
*old
;
46 old
= xchg((__force
struct tc_cookie
**)old_cookie
, new_cookie
);
48 call_rcu(&old
->rcu
, tcf_free_cookie_rcu
);
51 int tcf_action_check_ctrlact(int action
, struct tcf_proto
*tp
,
52 struct tcf_chain
**newchain
,
53 struct netlink_ext_ack
*extack
)
55 int opcode
= TC_ACT_EXT_OPCODE(action
), ret
= -EINVAL
;
59 ret
= action
> TC_ACT_VALUE_MAX
? -EINVAL
: 0;
60 else if (opcode
<= TC_ACT_EXT_OPCODE_MAX
|| action
== TC_ACT_UNSPEC
)
63 NL_SET_ERR_MSG(extack
, "invalid control action");
67 if (TC_ACT_EXT_CMP(action
, TC_ACT_GOTO_CHAIN
)) {
68 chain_index
= action
& TC_ACT_EXT_VAL_MASK
;
69 if (!tp
|| !newchain
) {
71 NL_SET_ERR_MSG(extack
,
72 "can't goto NULL proto/chain");
75 *newchain
= tcf_chain_get_by_act(tp
->chain
->block
, chain_index
);
78 NL_SET_ERR_MSG(extack
,
79 "can't allocate goto_chain");
85 EXPORT_SYMBOL(tcf_action_check_ctrlact
);
87 struct tcf_chain
*tcf_action_set_ctrlact(struct tc_action
*a
, int action
,
88 struct tcf_chain
*goto_chain
)
90 a
->tcfa_action
= action
;
91 goto_chain
= rcu_replace_pointer(a
->goto_chain
, goto_chain
, 1);
94 EXPORT_SYMBOL(tcf_action_set_ctrlact
);
96 /* XXX: For standalone actions, we don't need a RCU grace period either, because
97 * actions are always connected to filters and filters are already destroyed in
98 * RCU callbacks, so after a RCU grace period actions are already disconnected
99 * from filters. Readers later can not find us.
101 static void free_tcf(struct tc_action
*p
)
103 struct tcf_chain
*chain
= rcu_dereference_protected(p
->goto_chain
, 1);
105 free_percpu(p
->cpu_bstats
);
106 free_percpu(p
->cpu_bstats_hw
);
107 free_percpu(p
->cpu_qstats
);
109 tcf_set_action_cookie(&p
->act_cookie
, NULL
);
111 tcf_chain_put_by_act(chain
);
116 static void tcf_action_cleanup(struct tc_action
*p
)
121 gen_kill_estimator(&p
->tcfa_rate_est
);
125 static int __tcf_action_put(struct tc_action
*p
, bool bind
)
127 struct tcf_idrinfo
*idrinfo
= p
->idrinfo
;
129 if (refcount_dec_and_mutex_lock(&p
->tcfa_refcnt
, &idrinfo
->lock
)) {
131 atomic_dec(&p
->tcfa_bindcnt
);
132 idr_remove(&idrinfo
->action_idr
, p
->tcfa_index
);
133 mutex_unlock(&idrinfo
->lock
);
135 tcf_action_cleanup(p
);
140 atomic_dec(&p
->tcfa_bindcnt
);
145 int __tcf_idr_release(struct tc_action
*p
, bool bind
, bool strict
)
149 /* Release with strict==1 and bind==0 is only called through act API
150 * interface (classifiers always bind). Only case when action with
151 * positive reference count and zero bind count can exist is when it was
152 * also created with act API (unbinding last classifier will destroy the
153 * action if it was created by classifier). So only case when bind count
154 * can be changed after initial check is when unbound action is
155 * destroyed by act API while classifier binds to action with same id
156 * concurrently. This result either creation of new action(same behavior
157 * as before), or reusing existing action if concurrent process
158 * increments reference count before action is deleted. Both scenarios
162 if (!bind
&& strict
&& atomic_read(&p
->tcfa_bindcnt
) > 0)
165 if (__tcf_action_put(p
, bind
))
171 EXPORT_SYMBOL(__tcf_idr_release
);
173 static size_t tcf_action_shared_attrs_size(const struct tc_action
*act
)
175 struct tc_cookie
*act_cookie
;
179 act_cookie
= rcu_dereference(act
->act_cookie
);
182 cookie_len
= nla_total_size(act_cookie
->len
);
185 return nla_total_size(0) /* action number nested */
186 + nla_total_size(IFNAMSIZ
) /* TCA_ACT_KIND */
187 + cookie_len
/* TCA_ACT_COOKIE */
188 + nla_total_size(sizeof(struct nla_bitfield32
)) /* TCA_ACT_HW_STATS */
189 + nla_total_size(0) /* TCA_ACT_STATS nested */
190 + nla_total_size(sizeof(struct nla_bitfield32
)) /* TCA_ACT_FLAGS */
191 /* TCA_STATS_BASIC */
192 + nla_total_size_64bit(sizeof(struct gnet_stats_basic
))
193 /* TCA_STATS_PKT64 */
194 + nla_total_size_64bit(sizeof(u64
))
195 /* TCA_STATS_QUEUE */
196 + nla_total_size_64bit(sizeof(struct gnet_stats_queue
))
197 + nla_total_size(0) /* TCA_OPTIONS nested */
198 + nla_total_size(sizeof(struct tcf_t
)); /* TCA_GACT_TM */
201 static size_t tcf_action_full_attrs_size(size_t sz
)
203 return NLMSG_HDRLEN
/* struct nlmsghdr */
204 + sizeof(struct tcamsg
)
205 + nla_total_size(0) /* TCA_ACT_TAB nested */
209 static size_t tcf_action_fill_size(const struct tc_action
*act
)
211 size_t sz
= tcf_action_shared_attrs_size(act
);
213 if (act
->ops
->get_fill_size
)
214 return act
->ops
->get_fill_size(act
) + sz
;
218 static int tcf_dump_walker(struct tcf_idrinfo
*idrinfo
, struct sk_buff
*skb
,
219 struct netlink_callback
*cb
)
221 int err
= 0, index
= -1, s_i
= 0, n_i
= 0;
222 u32 act_flags
= cb
->args
[2];
223 unsigned long jiffy_since
= cb
->args
[3];
225 struct idr
*idr
= &idrinfo
->action_idr
;
227 unsigned long id
= 1;
230 mutex_lock(&idrinfo
->lock
);
234 idr_for_each_entry_ul(idr
, p
, tmp
, id
) {
240 time_after(jiffy_since
,
241 (unsigned long)p
->tcfa_tm
.lastuse
))
244 nest
= nla_nest_start_noflag(skb
, n_i
);
247 goto nla_put_failure
;
249 err
= tcf_action_dump_1(skb
, p
, 0, 0);
252 nlmsg_trim(skb
, nest
);
255 nla_nest_end(skb
, nest
);
257 if (!(act_flags
& TCA_FLAG_LARGE_DUMP_ON
) &&
258 n_i
>= TCA_ACT_MAX_PRIO
)
263 cb
->args
[0] = index
+ 1;
265 mutex_unlock(&idrinfo
->lock
);
267 if (act_flags
& TCA_FLAG_LARGE_DUMP_ON
)
273 nla_nest_cancel(skb
, nest
);
277 static int tcf_idr_release_unsafe(struct tc_action
*p
)
279 if (atomic_read(&p
->tcfa_bindcnt
) > 0)
282 if (refcount_dec_and_test(&p
->tcfa_refcnt
)) {
283 idr_remove(&p
->idrinfo
->action_idr
, p
->tcfa_index
);
284 tcf_action_cleanup(p
);
285 return ACT_P_DELETED
;
291 static int tcf_del_walker(struct tcf_idrinfo
*idrinfo
, struct sk_buff
*skb
,
292 const struct tc_action_ops
*ops
)
297 struct idr
*idr
= &idrinfo
->action_idr
;
299 unsigned long id
= 1;
302 nest
= nla_nest_start_noflag(skb
, 0);
304 goto nla_put_failure
;
305 if (nla_put_string(skb
, TCA_KIND
, ops
->kind
))
306 goto nla_put_failure
;
308 mutex_lock(&idrinfo
->lock
);
309 idr_for_each_entry_ul(idr
, p
, tmp
, id
) {
310 ret
= tcf_idr_release_unsafe(p
);
311 if (ret
== ACT_P_DELETED
) {
312 module_put(ops
->owner
);
314 } else if (ret
< 0) {
315 mutex_unlock(&idrinfo
->lock
);
316 goto nla_put_failure
;
319 mutex_unlock(&idrinfo
->lock
);
321 if (nla_put_u32(skb
, TCA_FCNT
, n_i
))
322 goto nla_put_failure
;
323 nla_nest_end(skb
, nest
);
327 nla_nest_cancel(skb
, nest
);
331 int tcf_generic_walker(struct tc_action_net
*tn
, struct sk_buff
*skb
,
332 struct netlink_callback
*cb
, int type
,
333 const struct tc_action_ops
*ops
,
334 struct netlink_ext_ack
*extack
)
336 struct tcf_idrinfo
*idrinfo
= tn
->idrinfo
;
338 if (type
== RTM_DELACTION
) {
339 return tcf_del_walker(idrinfo
, skb
, ops
);
340 } else if (type
== RTM_GETACTION
) {
341 return tcf_dump_walker(idrinfo
, skb
, cb
);
343 WARN(1, "tcf_generic_walker: unknown command %d\n", type
);
344 NL_SET_ERR_MSG(extack
, "tcf_generic_walker: unknown command");
348 EXPORT_SYMBOL(tcf_generic_walker
);
350 int tcf_idr_search(struct tc_action_net
*tn
, struct tc_action
**a
, u32 index
)
352 struct tcf_idrinfo
*idrinfo
= tn
->idrinfo
;
355 mutex_lock(&idrinfo
->lock
);
356 p
= idr_find(&idrinfo
->action_idr
, index
);
360 refcount_inc(&p
->tcfa_refcnt
);
361 mutex_unlock(&idrinfo
->lock
);
369 EXPORT_SYMBOL(tcf_idr_search
);
371 static int tcf_idr_delete_index(struct tcf_idrinfo
*idrinfo
, u32 index
)
376 mutex_lock(&idrinfo
->lock
);
377 p
= idr_find(&idrinfo
->action_idr
, index
);
379 mutex_unlock(&idrinfo
->lock
);
383 if (!atomic_read(&p
->tcfa_bindcnt
)) {
384 if (refcount_dec_and_test(&p
->tcfa_refcnt
)) {
385 struct module
*owner
= p
->ops
->owner
;
387 WARN_ON(p
!= idr_remove(&idrinfo
->action_idr
,
389 mutex_unlock(&idrinfo
->lock
);
391 tcf_action_cleanup(p
);
400 mutex_unlock(&idrinfo
->lock
);
404 int tcf_idr_create(struct tc_action_net
*tn
, u32 index
, struct nlattr
*est
,
405 struct tc_action
**a
, const struct tc_action_ops
*ops
,
406 int bind
, bool cpustats
, u32 flags
)
408 struct tc_action
*p
= kzalloc(ops
->size
, GFP_KERNEL
);
409 struct tcf_idrinfo
*idrinfo
= tn
->idrinfo
;
414 refcount_set(&p
->tcfa_refcnt
, 1);
416 atomic_set(&p
->tcfa_bindcnt
, 1);
419 p
->cpu_bstats
= netdev_alloc_pcpu_stats(struct gnet_stats_basic_cpu
);
422 p
->cpu_bstats_hw
= netdev_alloc_pcpu_stats(struct gnet_stats_basic_cpu
);
423 if (!p
->cpu_bstats_hw
)
425 p
->cpu_qstats
= alloc_percpu(struct gnet_stats_queue
);
429 spin_lock_init(&p
->tcfa_lock
);
430 p
->tcfa_index
= index
;
431 p
->tcfa_tm
.install
= jiffies
;
432 p
->tcfa_tm
.lastuse
= jiffies
;
433 p
->tcfa_tm
.firstuse
= 0;
434 p
->tcfa_flags
= flags
;
436 err
= gen_new_estimator(&p
->tcfa_bstats
, p
->cpu_bstats
,
438 &p
->tcfa_lock
, NULL
, est
);
443 p
->idrinfo
= idrinfo
;
448 free_percpu(p
->cpu_qstats
);
450 free_percpu(p
->cpu_bstats_hw
);
452 free_percpu(p
->cpu_bstats
);
457 EXPORT_SYMBOL(tcf_idr_create
);
459 int tcf_idr_create_from_flags(struct tc_action_net
*tn
, u32 index
,
460 struct nlattr
*est
, struct tc_action
**a
,
461 const struct tc_action_ops
*ops
, int bind
,
464 /* Set cpustats according to actions flags. */
465 return tcf_idr_create(tn
, index
, est
, a
, ops
, bind
,
466 !(flags
& TCA_ACT_FLAGS_NO_PERCPU_STATS
), flags
);
468 EXPORT_SYMBOL(tcf_idr_create_from_flags
);
470 void tcf_idr_insert(struct tc_action_net
*tn
, struct tc_action
*a
)
472 struct tcf_idrinfo
*idrinfo
= tn
->idrinfo
;
474 mutex_lock(&idrinfo
->lock
);
475 /* Replace ERR_PTR(-EBUSY) allocated by tcf_idr_check_alloc */
476 WARN_ON(!IS_ERR(idr_replace(&idrinfo
->action_idr
, a
, a
->tcfa_index
)));
477 mutex_unlock(&idrinfo
->lock
);
479 EXPORT_SYMBOL(tcf_idr_insert
);
481 /* Cleanup idr index that was allocated but not initialized. */
483 void tcf_idr_cleanup(struct tc_action_net
*tn
, u32 index
)
485 struct tcf_idrinfo
*idrinfo
= tn
->idrinfo
;
487 mutex_lock(&idrinfo
->lock
);
488 /* Remove ERR_PTR(-EBUSY) allocated by tcf_idr_check_alloc */
489 WARN_ON(!IS_ERR(idr_remove(&idrinfo
->action_idr
, index
)));
490 mutex_unlock(&idrinfo
->lock
);
492 EXPORT_SYMBOL(tcf_idr_cleanup
);
494 /* Check if action with specified index exists. If actions is found, increments
495 * its reference and bind counters, and return 1. Otherwise insert temporary
496 * error pointer (to prevent concurrent users from inserting actions with same
497 * index) and return 0.
500 int tcf_idr_check_alloc(struct tc_action_net
*tn
, u32
*index
,
501 struct tc_action
**a
, int bind
)
503 struct tcf_idrinfo
*idrinfo
= tn
->idrinfo
;
508 mutex_lock(&idrinfo
->lock
);
510 p
= idr_find(&idrinfo
->action_idr
, *index
);
512 /* This means that another process allocated
513 * index but did not assign the pointer yet.
515 mutex_unlock(&idrinfo
->lock
);
520 refcount_inc(&p
->tcfa_refcnt
);
522 atomic_inc(&p
->tcfa_bindcnt
);
527 ret
= idr_alloc_u32(&idrinfo
->action_idr
, NULL
, index
,
530 idr_replace(&idrinfo
->action_idr
,
531 ERR_PTR(-EBUSY
), *index
);
536 ret
= idr_alloc_u32(&idrinfo
->action_idr
, NULL
, index
,
537 UINT_MAX
, GFP_KERNEL
);
539 idr_replace(&idrinfo
->action_idr
, ERR_PTR(-EBUSY
),
542 mutex_unlock(&idrinfo
->lock
);
545 EXPORT_SYMBOL(tcf_idr_check_alloc
);
547 void tcf_idrinfo_destroy(const struct tc_action_ops
*ops
,
548 struct tcf_idrinfo
*idrinfo
)
550 struct idr
*idr
= &idrinfo
->action_idr
;
553 unsigned long id
= 1;
556 idr_for_each_entry_ul(idr
, p
, tmp
, id
) {
557 ret
= __tcf_idr_release(p
, false, true);
558 if (ret
== ACT_P_DELETED
)
559 module_put(ops
->owner
);
563 idr_destroy(&idrinfo
->action_idr
);
565 EXPORT_SYMBOL(tcf_idrinfo_destroy
);
567 static LIST_HEAD(act_base
);
568 static DEFINE_RWLOCK(act_mod_lock
);
570 int tcf_register_action(struct tc_action_ops
*act
,
571 struct pernet_operations
*ops
)
573 struct tc_action_ops
*a
;
576 if (!act
->act
|| !act
->dump
|| !act
->init
|| !act
->walk
|| !act
->lookup
)
579 /* We have to register pernet ops before making the action ops visible,
580 * otherwise tcf_action_init_1() could get a partially initialized
583 ret
= register_pernet_subsys(ops
);
587 write_lock(&act_mod_lock
);
588 list_for_each_entry(a
, &act_base
, head
) {
589 if (act
->id
== a
->id
|| (strcmp(act
->kind
, a
->kind
) == 0)) {
590 write_unlock(&act_mod_lock
);
591 unregister_pernet_subsys(ops
);
595 list_add_tail(&act
->head
, &act_base
);
596 write_unlock(&act_mod_lock
);
600 EXPORT_SYMBOL(tcf_register_action
);
602 int tcf_unregister_action(struct tc_action_ops
*act
,
603 struct pernet_operations
*ops
)
605 struct tc_action_ops
*a
;
608 write_lock(&act_mod_lock
);
609 list_for_each_entry(a
, &act_base
, head
) {
611 list_del(&act
->head
);
616 write_unlock(&act_mod_lock
);
618 unregister_pernet_subsys(ops
);
621 EXPORT_SYMBOL(tcf_unregister_action
);
624 static struct tc_action_ops
*tc_lookup_action_n(char *kind
)
626 struct tc_action_ops
*a
, *res
= NULL
;
629 read_lock(&act_mod_lock
);
630 list_for_each_entry(a
, &act_base
, head
) {
631 if (strcmp(kind
, a
->kind
) == 0) {
632 if (try_module_get(a
->owner
))
637 read_unlock(&act_mod_lock
);
642 /* lookup by nlattr */
643 static struct tc_action_ops
*tc_lookup_action(struct nlattr
*kind
)
645 struct tc_action_ops
*a
, *res
= NULL
;
648 read_lock(&act_mod_lock
);
649 list_for_each_entry(a
, &act_base
, head
) {
650 if (nla_strcmp(kind
, a
->kind
) == 0) {
651 if (try_module_get(a
->owner
))
656 read_unlock(&act_mod_lock
);
661 /*TCA_ACT_MAX_PRIO is 32, there count upto 32 */
662 #define TCA_ACT_MAX_PRIO_MASK 0x1FF
663 int tcf_action_exec(struct sk_buff
*skb
, struct tc_action
**actions
,
664 int nr_actions
, struct tcf_result
*res
)
667 u32 jmp_ttl
= TCA_ACT_MAX_PRIO
; /*matches actions per filter */
671 if (skb_skip_tc_classify(skb
))
675 for (i
= 0; i
< nr_actions
; i
++) {
676 const struct tc_action
*a
= actions
[i
];
678 if (jmp_prgcnt
> 0) {
683 ret
= a
->ops
->act(skb
, a
, res
);
684 if (ret
== TC_ACT_REPEAT
)
685 goto repeat
; /* we need a ttl - JHS */
687 if (TC_ACT_EXT_CMP(ret
, TC_ACT_JUMP
)) {
688 jmp_prgcnt
= ret
& TCA_ACT_MAX_PRIO_MASK
;
689 if (!jmp_prgcnt
|| (jmp_prgcnt
> nr_actions
)) {
690 /* faulty opcode, stop pipeline */
695 goto restart_act_graph
;
696 else /* faulty graph, stop pipeline */
699 } else if (TC_ACT_EXT_CMP(ret
, TC_ACT_GOTO_CHAIN
)) {
700 if (unlikely(!rcu_access_pointer(a
->goto_chain
))) {
701 net_warn_ratelimited("can't go to NULL chain!\n");
704 tcf_action_goto_chain_exec(a
, res
);
707 if (ret
!= TC_ACT_PIPE
)
713 EXPORT_SYMBOL(tcf_action_exec
);
715 int tcf_action_destroy(struct tc_action
*actions
[], int bind
)
717 const struct tc_action_ops
*ops
;
721 for (i
= 0; i
< TCA_ACT_MAX_PRIO
&& actions
[i
]; i
++) {
725 ret
= __tcf_idr_release(a
, bind
, true);
726 if (ret
== ACT_P_DELETED
)
727 module_put(ops
->owner
);
734 static int tcf_action_destroy_1(struct tc_action
*a
, int bind
)
736 struct tc_action
*actions
[] = { a
, NULL
};
738 return tcf_action_destroy(actions
, bind
);
741 static int tcf_action_put(struct tc_action
*p
)
743 return __tcf_action_put(p
, false);
746 /* Put all actions in this array, skip those NULL's. */
747 static void tcf_action_put_many(struct tc_action
*actions
[])
751 for (i
= 0; i
< TCA_ACT_MAX_PRIO
; i
++) {
752 struct tc_action
*a
= actions
[i
];
753 const struct tc_action_ops
*ops
;
758 if (tcf_action_put(a
))
759 module_put(ops
->owner
);
764 tcf_action_dump_old(struct sk_buff
*skb
, struct tc_action
*a
, int bind
, int ref
)
766 return a
->ops
->dump(skb
, a
, bind
, ref
);
770 tcf_action_dump_1(struct sk_buff
*skb
, struct tc_action
*a
, int bind
, int ref
)
773 unsigned char *b
= skb_tail_pointer(skb
);
775 struct tc_cookie
*cookie
;
777 if (nla_put_string(skb
, TCA_KIND
, a
->ops
->kind
))
778 goto nla_put_failure
;
779 if (tcf_action_copy_stats(skb
, a
, 0))
780 goto nla_put_failure
;
783 cookie
= rcu_dereference(a
->act_cookie
);
785 if (nla_put(skb
, TCA_ACT_COOKIE
, cookie
->len
, cookie
->data
)) {
787 goto nla_put_failure
;
792 if (a
->hw_stats
!= TCA_ACT_HW_STATS_ANY
&&
793 nla_put_bitfield32(skb
, TCA_ACT_HW_STATS
,
794 a
->hw_stats
, TCA_ACT_HW_STATS_ANY
))
795 goto nla_put_failure
;
797 if (a
->used_hw_stats_valid
&&
798 nla_put_bitfield32(skb
, TCA_ACT_USED_HW_STATS
,
799 a
->used_hw_stats
, TCA_ACT_HW_STATS_ANY
))
800 goto nla_put_failure
;
803 nla_put_bitfield32(skb
, TCA_ACT_FLAGS
,
804 a
->tcfa_flags
, a
->tcfa_flags
))
805 goto nla_put_failure
;
807 nest
= nla_nest_start_noflag(skb
, TCA_OPTIONS
);
809 goto nla_put_failure
;
810 err
= tcf_action_dump_old(skb
, a
, bind
, ref
);
812 nla_nest_end(skb
, nest
);
820 EXPORT_SYMBOL(tcf_action_dump_1
);
822 int tcf_action_dump(struct sk_buff
*skb
, struct tc_action
*actions
[],
826 int err
= -EINVAL
, i
;
829 for (i
= 0; i
< TCA_ACT_MAX_PRIO
&& actions
[i
]; i
++) {
831 nest
= nla_nest_start_noflag(skb
, i
+ 1);
833 goto nla_put_failure
;
834 err
= tcf_action_dump_1(skb
, a
, bind
, ref
);
837 nla_nest_end(skb
, nest
);
845 nla_nest_cancel(skb
, nest
);
849 static struct tc_cookie
*nla_memdup_cookie(struct nlattr
**tb
)
851 struct tc_cookie
*c
= kzalloc(sizeof(*c
), GFP_KERNEL
);
855 c
->data
= nla_memdup(tb
[TCA_ACT_COOKIE
], GFP_KERNEL
);
860 c
->len
= nla_len(tb
[TCA_ACT_COOKIE
]);
865 static u8
tcf_action_hw_stats_get(struct nlattr
*hw_stats_attr
)
867 struct nla_bitfield32 hw_stats_bf
;
869 /* If the user did not pass the attr, that means he does
870 * not care about the type. Return "any" in that case
871 * which is setting on all supported types.
874 return TCA_ACT_HW_STATS_ANY
;
875 hw_stats_bf
= nla_get_bitfield32(hw_stats_attr
);
876 return hw_stats_bf
.value
;
879 static const struct nla_policy tcf_action_policy
[TCA_ACT_MAX
+ 1] = {
880 [TCA_ACT_KIND
] = { .type
= NLA_STRING
},
881 [TCA_ACT_INDEX
] = { .type
= NLA_U32
},
882 [TCA_ACT_COOKIE
] = { .type
= NLA_BINARY
,
883 .len
= TC_COOKIE_MAX_SIZE
},
884 [TCA_ACT_OPTIONS
] = { .type
= NLA_NESTED
},
885 [TCA_ACT_FLAGS
] = NLA_POLICY_BITFIELD32(TCA_ACT_FLAGS_NO_PERCPU_STATS
),
886 [TCA_ACT_HW_STATS
] = NLA_POLICY_BITFIELD32(TCA_ACT_HW_STATS_ANY
),
889 struct tc_action
*tcf_action_init_1(struct net
*net
, struct tcf_proto
*tp
,
890 struct nlattr
*nla
, struct nlattr
*est
,
891 char *name
, int ovr
, int bind
,
893 struct netlink_ext_ack
*extack
)
895 struct nla_bitfield32 flags
= { 0, 0 };
896 u8 hw_stats
= TCA_ACT_HW_STATS_ANY
;
898 struct tc_action_ops
*a_o
;
899 struct tc_cookie
*cookie
= NULL
;
900 char act_name
[IFNAMSIZ
];
901 struct nlattr
*tb
[TCA_ACT_MAX
+ 1];
906 err
= nla_parse_nested_deprecated(tb
, TCA_ACT_MAX
, nla
,
907 tcf_action_policy
, extack
);
911 kind
= tb
[TCA_ACT_KIND
];
913 NL_SET_ERR_MSG(extack
, "TC action kind must be specified");
916 if (nla_strlcpy(act_name
, kind
, IFNAMSIZ
) >= IFNAMSIZ
) {
917 NL_SET_ERR_MSG(extack
, "TC action name too long");
920 if (tb
[TCA_ACT_COOKIE
]) {
921 cookie
= nla_memdup_cookie(tb
);
923 NL_SET_ERR_MSG(extack
, "No memory to generate TC cookie");
928 hw_stats
= tcf_action_hw_stats_get(tb
[TCA_ACT_HW_STATS
]);
929 if (tb
[TCA_ACT_FLAGS
])
930 flags
= nla_get_bitfield32(tb
[TCA_ACT_FLAGS
]);
932 if (strlcpy(act_name
, name
, IFNAMSIZ
) >= IFNAMSIZ
) {
933 NL_SET_ERR_MSG(extack
, "TC action name too long");
939 a_o
= tc_lookup_action_n(act_name
);
941 #ifdef CONFIG_MODULES
944 request_module("act_%s", act_name
);
948 a_o
= tc_lookup_action_n(act_name
);
950 /* We dropped the RTNL semaphore in order to
951 * perform the module load. So, even if we
952 * succeeded in loading the module we have to
953 * tell the caller to replay the request. We
954 * indicate this using -EAGAIN.
961 NL_SET_ERR_MSG(extack
, "Failed to load TC action module");
966 /* backward compatibility for policer */
968 err
= a_o
->init(net
, tb
[TCA_ACT_OPTIONS
], est
, &a
, ovr
, bind
,
969 rtnl_held
, tp
, flags
.value
, extack
);
971 err
= a_o
->init(net
, nla
, est
, &a
, ovr
, bind
, rtnl_held
,
972 tp
, flags
.value
, extack
);
976 if (!name
&& tb
[TCA_ACT_COOKIE
])
977 tcf_set_action_cookie(&a
->act_cookie
, cookie
);
980 a
->hw_stats
= hw_stats
;
982 /* module count goes up only when brand new policy is created
983 * if it exists and is only bound to in a_o->init() then
984 * ACT_P_CREATED is not returned (a zero is).
986 if (err
!= ACT_P_CREATED
)
987 module_put(a_o
->owner
);
989 if (TC_ACT_EXT_CMP(a
->tcfa_action
, TC_ACT_GOTO_CHAIN
) &&
990 !rcu_access_pointer(a
->goto_chain
)) {
991 tcf_action_destroy_1(a
, bind
);
992 NL_SET_ERR_MSG(extack
, "can't use goto chain with NULL chain");
993 return ERR_PTR(-EINVAL
);
999 module_put(a_o
->owner
);
1002 kfree(cookie
->data
);
1005 return ERR_PTR(err
);
1008 /* Returns numbers of initialized actions or negative error. */
1010 int tcf_action_init(struct net
*net
, struct tcf_proto
*tp
, struct nlattr
*nla
,
1011 struct nlattr
*est
, char *name
, int ovr
, int bind
,
1012 struct tc_action
*actions
[], size_t *attr_size
,
1013 bool rtnl_held
, struct netlink_ext_ack
*extack
)
1015 struct nlattr
*tb
[TCA_ACT_MAX_PRIO
+ 1];
1016 struct tc_action
*act
;
1021 err
= nla_parse_nested_deprecated(tb
, TCA_ACT_MAX_PRIO
, nla
, NULL
,
1026 for (i
= 1; i
<= TCA_ACT_MAX_PRIO
&& tb
[i
]; i
++) {
1027 act
= tcf_action_init_1(net
, tp
, tb
[i
], est
, name
, ovr
, bind
,
1033 sz
+= tcf_action_fill_size(act
);
1034 /* Start from index 0 */
1035 actions
[i
- 1] = act
;
1038 *attr_size
= tcf_action_full_attrs_size(sz
);
1042 tcf_action_destroy(actions
, bind
);
1046 void tcf_action_update_stats(struct tc_action
*a
, u64 bytes
, u32 packets
,
1049 if (a
->cpu_bstats
) {
1050 _bstats_cpu_update(this_cpu_ptr(a
->cpu_bstats
), bytes
, packets
);
1053 this_cpu_ptr(a
->cpu_qstats
)->drops
+= packets
;
1056 _bstats_cpu_update(this_cpu_ptr(a
->cpu_bstats_hw
),
1061 _bstats_update(&a
->tcfa_bstats
, bytes
, packets
);
1063 a
->tcfa_qstats
.drops
+= packets
;
1065 _bstats_update(&a
->tcfa_bstats_hw
, bytes
, packets
);
1067 EXPORT_SYMBOL(tcf_action_update_stats
);
1069 int tcf_action_copy_stats(struct sk_buff
*skb
, struct tc_action
*p
,
1078 /* compat_mode being true specifies a call that is supposed
1079 * to add additional backward compatibility statistic TLVs.
1082 if (p
->type
== TCA_OLD_COMPAT
)
1083 err
= gnet_stats_start_copy_compat(skb
, 0,
1091 err
= gnet_stats_start_copy(skb
, TCA_ACT_STATS
,
1092 &p
->tcfa_lock
, &d
, TCA_ACT_PAD
);
1097 if (gnet_stats_copy_basic(NULL
, &d
, p
->cpu_bstats
, &p
->tcfa_bstats
) < 0 ||
1098 gnet_stats_copy_basic_hw(NULL
, &d
, p
->cpu_bstats_hw
,
1099 &p
->tcfa_bstats_hw
) < 0 ||
1100 gnet_stats_copy_rate_est(&d
, &p
->tcfa_rate_est
) < 0 ||
1101 gnet_stats_copy_queue(&d
, p
->cpu_qstats
,
1103 p
->tcfa_qstats
.qlen
) < 0)
1106 if (gnet_stats_finish_copy(&d
) < 0)
1115 static int tca_get_fill(struct sk_buff
*skb
, struct tc_action
*actions
[],
1116 u32 portid
, u32 seq
, u16 flags
, int event
, int bind
,
1120 struct nlmsghdr
*nlh
;
1121 unsigned char *b
= skb_tail_pointer(skb
);
1122 struct nlattr
*nest
;
1124 nlh
= nlmsg_put(skb
, portid
, seq
, event
, sizeof(*t
), flags
);
1126 goto out_nlmsg_trim
;
1127 t
= nlmsg_data(nlh
);
1128 t
->tca_family
= AF_UNSPEC
;
1132 nest
= nla_nest_start_noflag(skb
, TCA_ACT_TAB
);
1134 goto out_nlmsg_trim
;
1136 if (tcf_action_dump(skb
, actions
, bind
, ref
) < 0)
1137 goto out_nlmsg_trim
;
1139 nla_nest_end(skb
, nest
);
1141 nlh
->nlmsg_len
= skb_tail_pointer(skb
) - b
;
1150 tcf_get_notify(struct net
*net
, u32 portid
, struct nlmsghdr
*n
,
1151 struct tc_action
*actions
[], int event
,
1152 struct netlink_ext_ack
*extack
)
1154 struct sk_buff
*skb
;
1156 skb
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
1159 if (tca_get_fill(skb
, actions
, portid
, n
->nlmsg_seq
, 0, event
,
1161 NL_SET_ERR_MSG(extack
, "Failed to fill netlink attributes while adding TC action");
1166 return rtnl_unicast(skb
, net
, portid
);
1169 static struct tc_action
*tcf_action_get_1(struct net
*net
, struct nlattr
*nla
,
1170 struct nlmsghdr
*n
, u32 portid
,
1171 struct netlink_ext_ack
*extack
)
1173 struct nlattr
*tb
[TCA_ACT_MAX
+ 1];
1174 const struct tc_action_ops
*ops
;
1175 struct tc_action
*a
;
1179 err
= nla_parse_nested_deprecated(tb
, TCA_ACT_MAX
, nla
,
1180 tcf_action_policy
, extack
);
1185 if (tb
[TCA_ACT_INDEX
] == NULL
||
1186 nla_len(tb
[TCA_ACT_INDEX
]) < sizeof(index
)) {
1187 NL_SET_ERR_MSG(extack
, "Invalid TC action index value");
1190 index
= nla_get_u32(tb
[TCA_ACT_INDEX
]);
1193 ops
= tc_lookup_action(tb
[TCA_ACT_KIND
]);
1194 if (!ops
) { /* could happen in batch of actions */
1195 NL_SET_ERR_MSG(extack
, "Specified TC action kind not found");
1199 if (ops
->lookup(net
, &a
, index
) == 0) {
1200 NL_SET_ERR_MSG(extack
, "TC action with specified index not found");
1204 module_put(ops
->owner
);
1208 module_put(ops
->owner
);
1210 return ERR_PTR(err
);
1213 static int tca_action_flush(struct net
*net
, struct nlattr
*nla
,
1214 struct nlmsghdr
*n
, u32 portid
,
1215 struct netlink_ext_ack
*extack
)
1217 struct sk_buff
*skb
;
1219 struct nlmsghdr
*nlh
;
1221 struct netlink_callback dcb
;
1222 struct nlattr
*nest
;
1223 struct nlattr
*tb
[TCA_ACT_MAX
+ 1];
1224 const struct tc_action_ops
*ops
;
1225 struct nlattr
*kind
;
1228 skb
= alloc_skb(NLMSG_GOODSIZE
, GFP_KERNEL
);
1232 b
= skb_tail_pointer(skb
);
1234 err
= nla_parse_nested_deprecated(tb
, TCA_ACT_MAX
, nla
,
1235 tcf_action_policy
, extack
);
1240 kind
= tb
[TCA_ACT_KIND
];
1241 ops
= tc_lookup_action(kind
);
1242 if (!ops
) { /*some idjot trying to flush unknown action */
1243 NL_SET_ERR_MSG(extack
, "Cannot flush unknown TC action");
1247 nlh
= nlmsg_put(skb
, portid
, n
->nlmsg_seq
, RTM_DELACTION
,
1250 NL_SET_ERR_MSG(extack
, "Failed to create TC action flush notification");
1251 goto out_module_put
;
1253 t
= nlmsg_data(nlh
);
1254 t
->tca_family
= AF_UNSPEC
;
1258 nest
= nla_nest_start_noflag(skb
, TCA_ACT_TAB
);
1260 NL_SET_ERR_MSG(extack
, "Failed to add new netlink message");
1261 goto out_module_put
;
1264 err
= ops
->walk(net
, skb
, &dcb
, RTM_DELACTION
, ops
, extack
);
1266 nla_nest_cancel(skb
, nest
);
1267 goto out_module_put
;
1270 nla_nest_end(skb
, nest
);
1272 nlh
->nlmsg_len
= skb_tail_pointer(skb
) - b
;
1273 nlh
->nlmsg_flags
|= NLM_F_ROOT
;
1274 module_put(ops
->owner
);
1275 err
= rtnetlink_send(skb
, net
, portid
, RTNLGRP_TC
,
1276 n
->nlmsg_flags
& NLM_F_ECHO
);
1280 NL_SET_ERR_MSG(extack
, "Failed to send TC action flush notification");
1285 module_put(ops
->owner
);
1291 static int tcf_action_delete(struct net
*net
, struct tc_action
*actions
[])
1295 for (i
= 0; i
< TCA_ACT_MAX_PRIO
&& actions
[i
]; i
++) {
1296 struct tc_action
*a
= actions
[i
];
1297 const struct tc_action_ops
*ops
= a
->ops
;
1298 /* Actions can be deleted concurrently so we must save their
1299 * type and id to search again after reference is released.
1301 struct tcf_idrinfo
*idrinfo
= a
->idrinfo
;
1302 u32 act_index
= a
->tcfa_index
;
1305 if (tcf_action_put(a
)) {
1306 /* last reference, action was deleted concurrently */
1307 module_put(ops
->owner
);
1311 /* now do the delete */
1312 ret
= tcf_idr_delete_index(idrinfo
, act_index
);
1321 tcf_del_notify(struct net
*net
, struct nlmsghdr
*n
, struct tc_action
*actions
[],
1322 u32 portid
, size_t attr_size
, struct netlink_ext_ack
*extack
)
1325 struct sk_buff
*skb
;
1327 skb
= alloc_skb(attr_size
<= NLMSG_GOODSIZE
? NLMSG_GOODSIZE
: attr_size
,
1332 if (tca_get_fill(skb
, actions
, portid
, n
->nlmsg_seq
, 0, RTM_DELACTION
,
1334 NL_SET_ERR_MSG(extack
, "Failed to fill netlink TC action attributes");
1339 /* now do the delete */
1340 ret
= tcf_action_delete(net
, actions
);
1342 NL_SET_ERR_MSG(extack
, "Failed to delete TC action");
1347 ret
= rtnetlink_send(skb
, net
, portid
, RTNLGRP_TC
,
1348 n
->nlmsg_flags
& NLM_F_ECHO
);
1355 tca_action_gd(struct net
*net
, struct nlattr
*nla
, struct nlmsghdr
*n
,
1356 u32 portid
, int event
, struct netlink_ext_ack
*extack
)
1359 struct nlattr
*tb
[TCA_ACT_MAX_PRIO
+ 1];
1360 struct tc_action
*act
;
1361 size_t attr_size
= 0;
1362 struct tc_action
*actions
[TCA_ACT_MAX_PRIO
] = {};
1364 ret
= nla_parse_nested_deprecated(tb
, TCA_ACT_MAX_PRIO
, nla
, NULL
,
1369 if (event
== RTM_DELACTION
&& n
->nlmsg_flags
& NLM_F_ROOT
) {
1371 return tca_action_flush(net
, tb
[1], n
, portid
, extack
);
1373 NL_SET_ERR_MSG(extack
, "Invalid netlink attributes while flushing TC action");
1377 for (i
= 1; i
<= TCA_ACT_MAX_PRIO
&& tb
[i
]; i
++) {
1378 act
= tcf_action_get_1(net
, tb
[i
], n
, portid
, extack
);
1383 attr_size
+= tcf_action_fill_size(act
);
1384 actions
[i
- 1] = act
;
1387 attr_size
= tcf_action_full_attrs_size(attr_size
);
1389 if (event
== RTM_GETACTION
)
1390 ret
= tcf_get_notify(net
, portid
, n
, actions
, event
, extack
);
1392 ret
= tcf_del_notify(net
, n
, actions
, portid
, attr_size
, extack
);
1398 tcf_action_put_many(actions
);
1403 tcf_add_notify(struct net
*net
, struct nlmsghdr
*n
, struct tc_action
*actions
[],
1404 u32 portid
, size_t attr_size
, struct netlink_ext_ack
*extack
)
1406 struct sk_buff
*skb
;
1409 skb
= alloc_skb(attr_size
<= NLMSG_GOODSIZE
? NLMSG_GOODSIZE
: attr_size
,
1414 if (tca_get_fill(skb
, actions
, portid
, n
->nlmsg_seq
, n
->nlmsg_flags
,
1415 RTM_NEWACTION
, 0, 0) <= 0) {
1416 NL_SET_ERR_MSG(extack
, "Failed to fill netlink attributes while adding TC action");
1421 err
= rtnetlink_send(skb
, net
, portid
, RTNLGRP_TC
,
1422 n
->nlmsg_flags
& NLM_F_ECHO
);
1428 static int tcf_action_add(struct net
*net
, struct nlattr
*nla
,
1429 struct nlmsghdr
*n
, u32 portid
, int ovr
,
1430 struct netlink_ext_ack
*extack
)
1432 size_t attr_size
= 0;
1434 struct tc_action
*actions
[TCA_ACT_MAX_PRIO
] = {};
1436 for (loop
= 0; loop
< 10; loop
++) {
1437 ret
= tcf_action_init(net
, NULL
, nla
, NULL
, NULL
, ovr
, 0,
1438 actions
, &attr_size
, true, extack
);
1445 ret
= tcf_add_notify(net
, n
, actions
, portid
, attr_size
, extack
);
1447 tcf_action_put_many(actions
);
1452 static const struct nla_policy tcaa_policy
[TCA_ROOT_MAX
+ 1] = {
1453 [TCA_ROOT_FLAGS
] = NLA_POLICY_BITFIELD32(TCA_FLAG_LARGE_DUMP_ON
),
1454 [TCA_ROOT_TIME_DELTA
] = { .type
= NLA_U32
},
1457 static int tc_ctl_action(struct sk_buff
*skb
, struct nlmsghdr
*n
,
1458 struct netlink_ext_ack
*extack
)
1460 struct net
*net
= sock_net(skb
->sk
);
1461 struct nlattr
*tca
[TCA_ROOT_MAX
+ 1];
1462 u32 portid
= skb
? NETLINK_CB(skb
).portid
: 0;
1463 int ret
= 0, ovr
= 0;
1465 if ((n
->nlmsg_type
!= RTM_GETACTION
) &&
1466 !netlink_capable(skb
, CAP_NET_ADMIN
))
1469 ret
= nlmsg_parse_deprecated(n
, sizeof(struct tcamsg
), tca
,
1470 TCA_ROOT_MAX
, NULL
, extack
);
1474 if (tca
[TCA_ACT_TAB
] == NULL
) {
1475 NL_SET_ERR_MSG(extack
, "Netlink action attributes missing");
1479 /* n->nlmsg_flags & NLM_F_CREATE */
1480 switch (n
->nlmsg_type
) {
1482 /* we are going to assume all other flags
1483 * imply create only if it doesn't exist
1484 * Note that CREATE | EXCL implies that
1485 * but since we want avoid ambiguity (eg when flags
1486 * is zero) then just set this
1488 if (n
->nlmsg_flags
& NLM_F_REPLACE
)
1490 ret
= tcf_action_add(net
, tca
[TCA_ACT_TAB
], n
, portid
, ovr
,
1494 ret
= tca_action_gd(net
, tca
[TCA_ACT_TAB
], n
,
1495 portid
, RTM_DELACTION
, extack
);
1498 ret
= tca_action_gd(net
, tca
[TCA_ACT_TAB
], n
,
1499 portid
, RTM_GETACTION
, extack
);
1508 static struct nlattr
*find_dump_kind(struct nlattr
**nla
)
1510 struct nlattr
*tb1
, *tb2
[TCA_ACT_MAX
+ 1];
1511 struct nlattr
*tb
[TCA_ACT_MAX_PRIO
+ 1];
1512 struct nlattr
*kind
;
1514 tb1
= nla
[TCA_ACT_TAB
];
1518 if (nla_parse_deprecated(tb
, TCA_ACT_MAX_PRIO
, nla_data(tb1
), NLMSG_ALIGN(nla_len(tb1
)), NULL
, NULL
) < 0)
1523 if (nla_parse_nested_deprecated(tb2
, TCA_ACT_MAX
, tb
[1], tcf_action_policy
, NULL
) < 0)
1525 kind
= tb2
[TCA_ACT_KIND
];
1530 static int tc_dump_action(struct sk_buff
*skb
, struct netlink_callback
*cb
)
1532 struct net
*net
= sock_net(skb
->sk
);
1533 struct nlmsghdr
*nlh
;
1534 unsigned char *b
= skb_tail_pointer(skb
);
1535 struct nlattr
*nest
;
1536 struct tc_action_ops
*a_o
;
1538 struct tcamsg
*t
= (struct tcamsg
*) nlmsg_data(cb
->nlh
);
1539 struct nlattr
*tb
[TCA_ROOT_MAX
+ 1];
1540 struct nlattr
*count_attr
= NULL
;
1541 unsigned long jiffy_since
= 0;
1542 struct nlattr
*kind
= NULL
;
1543 struct nla_bitfield32 bf
;
1544 u32 msecs_since
= 0;
1547 ret
= nlmsg_parse_deprecated(cb
->nlh
, sizeof(struct tcamsg
), tb
,
1548 TCA_ROOT_MAX
, tcaa_policy
, cb
->extack
);
1552 kind
= find_dump_kind(tb
);
1554 pr_info("tc_dump_action: action bad kind\n");
1558 a_o
= tc_lookup_action(kind
);
1563 if (tb
[TCA_ROOT_FLAGS
]) {
1564 bf
= nla_get_bitfield32(tb
[TCA_ROOT_FLAGS
]);
1565 cb
->args
[2] = bf
.value
;
1568 if (tb
[TCA_ROOT_TIME_DELTA
]) {
1569 msecs_since
= nla_get_u32(tb
[TCA_ROOT_TIME_DELTA
]);
1572 nlh
= nlmsg_put(skb
, NETLINK_CB(cb
->skb
).portid
, cb
->nlh
->nlmsg_seq
,
1573 cb
->nlh
->nlmsg_type
, sizeof(*t
), 0);
1575 goto out_module_put
;
1578 jiffy_since
= jiffies
- msecs_to_jiffies(msecs_since
);
1580 t
= nlmsg_data(nlh
);
1581 t
->tca_family
= AF_UNSPEC
;
1584 cb
->args
[3] = jiffy_since
;
1585 count_attr
= nla_reserve(skb
, TCA_ROOT_COUNT
, sizeof(u32
));
1587 goto out_module_put
;
1589 nest
= nla_nest_start_noflag(skb
, TCA_ACT_TAB
);
1591 goto out_module_put
;
1593 ret
= a_o
->walk(net
, skb
, cb
, RTM_GETACTION
, a_o
, NULL
);
1595 goto out_module_put
;
1598 nla_nest_end(skb
, nest
);
1600 act_count
= cb
->args
[1];
1601 memcpy(nla_data(count_attr
), &act_count
, sizeof(u32
));
1606 nlh
->nlmsg_len
= skb_tail_pointer(skb
) - b
;
1607 if (NETLINK_CB(cb
->skb
).portid
&& ret
)
1608 nlh
->nlmsg_flags
|= NLM_F_MULTI
;
1609 module_put(a_o
->owner
);
1613 module_put(a_o
->owner
);
1618 static int __init
tc_action_init(void)
1620 rtnl_register(PF_UNSPEC
, RTM_NEWACTION
, tc_ctl_action
, NULL
, 0);
1621 rtnl_register(PF_UNSPEC
, RTM_DELACTION
, tc_ctl_action
, NULL
, 0);
1622 rtnl_register(PF_UNSPEC
, RTM_GETACTION
, tc_ctl_action
, tc_dump_action
,
1628 subsys_initcall(tc_action_init
);