1 // SPDX-License-Identifier: GPL-2.0-or-later
3 * Checksum updating actions
5 * Copyright (c) 2010 Gregoire Baron <baronchon@n7mm.org>
8 #include <linux/types.h>
9 #include <linux/init.h>
10 #include <linux/kernel.h>
11 #include <linux/module.h>
12 #include <linux/spinlock.h>
14 #include <linux/netlink.h>
15 #include <net/netlink.h>
16 #include <linux/rtnetlink.h>
18 #include <linux/skbuff.h>
23 #include <linux/icmpv6.h>
24 #include <linux/igmp.h>
27 #include <net/ip6_checksum.h>
28 #include <net/sctp/checksum.h>
30 #include <net/act_api.h>
31 #include <net/pkt_cls.h>
33 #include <linux/tc_act/tc_csum.h>
34 #include <net/tc_act/tc_csum.h>
35 #include <net/tc_wrapper.h>
37 static const struct nla_policy csum_policy
[TCA_CSUM_MAX
+ 1] = {
38 [TCA_CSUM_PARMS
] = { .len
= sizeof(struct tc_csum
), },
41 static struct tc_action_ops act_csum_ops
;
43 static int tcf_csum_init(struct net
*net
, struct nlattr
*nla
,
44 struct nlattr
*est
, struct tc_action
**a
,
46 u32 flags
, struct netlink_ext_ack
*extack
)
48 struct tc_action_net
*tn
= net_generic(net
, act_csum_ops
.net_id
);
49 bool bind
= flags
& TCA_ACT_FLAGS_BIND
;
50 struct tcf_csum_params
*params_new
;
51 struct nlattr
*tb
[TCA_CSUM_MAX
+ 1];
52 struct tcf_chain
*goto_ch
= NULL
;
61 err
= nla_parse_nested_deprecated(tb
, TCA_CSUM_MAX
, nla
, csum_policy
,
66 if (tb
[TCA_CSUM_PARMS
] == NULL
)
68 parm
= nla_data(tb
[TCA_CSUM_PARMS
]);
70 err
= tcf_idr_check_alloc(tn
, &index
, a
, bind
);
72 ret
= tcf_idr_create_from_flags(tn
, index
, est
, a
,
73 &act_csum_ops
, bind
, flags
);
75 tcf_idr_cleanup(tn
, index
);
80 if (bind
) /* dont override defaults */
82 if (!(flags
& TCA_ACT_FLAGS_REPLACE
)) {
83 tcf_idr_release(*a
, bind
);
90 err
= tcf_action_check_ctrlact(parm
->action
, tp
, &goto_ch
, extack
);
96 params_new
= kzalloc(sizeof(*params_new
), GFP_KERNEL
);
97 if (unlikely(!params_new
)) {
101 params_new
->update_flags
= parm
->update_flags
;
103 spin_lock_bh(&p
->tcf_lock
);
104 goto_ch
= tcf_action_set_ctrlact(*a
, parm
->action
, goto_ch
);
105 params_new
= rcu_replace_pointer(p
->params
, params_new
,
106 lockdep_is_held(&p
->tcf_lock
));
107 spin_unlock_bh(&p
->tcf_lock
);
110 tcf_chain_put_by_act(goto_ch
);
112 kfree_rcu(params_new
, rcu
);
117 tcf_chain_put_by_act(goto_ch
);
119 tcf_idr_release(*a
, bind
);
124 * tcf_csum_skb_nextlayer - Get next layer pointer
125 * @skb: sk_buff to use
126 * @ihl: previous summed headers length
127 * @ipl: complete packet length
128 * @jhl: next header length
130 * Check the expected next layer availability in the specified sk_buff.
131 * Return the next layer pointer if pass, NULL otherwise.
133 static void *tcf_csum_skb_nextlayer(struct sk_buff
*skb
,
134 unsigned int ihl
, unsigned int ipl
,
137 int ntkoff
= skb_network_offset(skb
);
140 if (!pskb_may_pull(skb
, ipl
+ ntkoff
) || (ipl
< hl
) ||
141 skb_try_make_writable(skb
, hl
+ ntkoff
))
144 return (void *)(skb_network_header(skb
) + ihl
);
147 static int tcf_csum_ipv4_icmp(struct sk_buff
*skb
, unsigned int ihl
,
150 struct icmphdr
*icmph
;
152 icmph
= tcf_csum_skb_nextlayer(skb
, ihl
, ipl
, sizeof(*icmph
));
157 skb
->csum
= csum_partial(icmph
, ipl
- ihl
, 0);
158 icmph
->checksum
= csum_fold(skb
->csum
);
160 skb
->ip_summed
= CHECKSUM_NONE
;
165 static int tcf_csum_ipv4_igmp(struct sk_buff
*skb
,
166 unsigned int ihl
, unsigned int ipl
)
168 struct igmphdr
*igmph
;
170 igmph
= tcf_csum_skb_nextlayer(skb
, ihl
, ipl
, sizeof(*igmph
));
175 skb
->csum
= csum_partial(igmph
, ipl
- ihl
, 0);
176 igmph
->csum
= csum_fold(skb
->csum
);
178 skb
->ip_summed
= CHECKSUM_NONE
;
183 static int tcf_csum_ipv6_icmp(struct sk_buff
*skb
, unsigned int ihl
,
186 struct icmp6hdr
*icmp6h
;
187 const struct ipv6hdr
*ip6h
;
189 icmp6h
= tcf_csum_skb_nextlayer(skb
, ihl
, ipl
, sizeof(*icmp6h
));
193 ip6h
= ipv6_hdr(skb
);
194 icmp6h
->icmp6_cksum
= 0;
195 skb
->csum
= csum_partial(icmp6h
, ipl
- ihl
, 0);
196 icmp6h
->icmp6_cksum
= csum_ipv6_magic(&ip6h
->saddr
, &ip6h
->daddr
,
197 ipl
- ihl
, IPPROTO_ICMPV6
,
200 skb
->ip_summed
= CHECKSUM_NONE
;
205 static int tcf_csum_ipv4_tcp(struct sk_buff
*skb
, unsigned int ihl
,
209 const struct iphdr
*iph
;
211 if (skb_is_gso(skb
) && skb_shinfo(skb
)->gso_type
& SKB_GSO_TCPV4
)
214 tcph
= tcf_csum_skb_nextlayer(skb
, ihl
, ipl
, sizeof(*tcph
));
220 skb
->csum
= csum_partial(tcph
, ipl
- ihl
, 0);
221 tcph
->check
= tcp_v4_check(ipl
- ihl
,
222 iph
->saddr
, iph
->daddr
, skb
->csum
);
224 skb
->ip_summed
= CHECKSUM_NONE
;
229 static int tcf_csum_ipv6_tcp(struct sk_buff
*skb
, unsigned int ihl
,
233 const struct ipv6hdr
*ip6h
;
235 if (skb_is_gso(skb
) && skb_shinfo(skb
)->gso_type
& SKB_GSO_TCPV6
)
238 tcph
= tcf_csum_skb_nextlayer(skb
, ihl
, ipl
, sizeof(*tcph
));
242 ip6h
= ipv6_hdr(skb
);
244 skb
->csum
= csum_partial(tcph
, ipl
- ihl
, 0);
245 tcph
->check
= csum_ipv6_magic(&ip6h
->saddr
, &ip6h
->daddr
,
246 ipl
- ihl
, IPPROTO_TCP
,
249 skb
->ip_summed
= CHECKSUM_NONE
;
254 static int tcf_csum_ipv4_udp(struct sk_buff
*skb
, unsigned int ihl
,
255 unsigned int ipl
, int udplite
)
258 const struct iphdr
*iph
;
261 if (skb_is_gso(skb
) && skb_shinfo(skb
)->gso_type
& SKB_GSO_UDP
)
265 * Support both UDP and UDPLITE checksum algorithms, Don't use
266 * udph->len to get the real length without any protocol check,
267 * UDPLITE uses udph->len for another thing,
268 * Use iph->tot_len, or just ipl.
271 udph
= tcf_csum_skb_nextlayer(skb
, ihl
, ipl
, sizeof(*udph
));
276 ul
= ntohs(udph
->len
);
278 if (udplite
|| udph
->check
) {
284 skb
->csum
= csum_partial(udph
, ipl
- ihl
, 0);
285 else if ((ul
>= sizeof(*udph
)) && (ul
<= ipl
- ihl
))
286 skb
->csum
= csum_partial(udph
, ul
, 0);
288 goto ignore_obscure_skb
;
291 goto ignore_obscure_skb
;
293 skb
->csum
= csum_partial(udph
, ul
, 0);
296 udph
->check
= csum_tcpudp_magic(iph
->saddr
, iph
->daddr
,
301 udph
->check
= CSUM_MANGLED_0
;
304 skb
->ip_summed
= CHECKSUM_NONE
;
310 static int tcf_csum_ipv6_udp(struct sk_buff
*skb
, unsigned int ihl
,
311 unsigned int ipl
, int udplite
)
314 const struct ipv6hdr
*ip6h
;
317 if (skb_is_gso(skb
) && skb_shinfo(skb
)->gso_type
& SKB_GSO_UDP
)
321 * Support both UDP and UDPLITE checksum algorithms, Don't use
322 * udph->len to get the real length without any protocol check,
323 * UDPLITE uses udph->len for another thing,
324 * Use ip6h->payload_len + sizeof(*ip6h) ... , or just ipl.
327 udph
= tcf_csum_skb_nextlayer(skb
, ihl
, ipl
, sizeof(*udph
));
331 ip6h
= ipv6_hdr(skb
);
332 ul
= ntohs(udph
->len
);
338 skb
->csum
= csum_partial(udph
, ipl
- ihl
, 0);
340 else if ((ul
>= sizeof(*udph
)) && (ul
<= ipl
- ihl
))
341 skb
->csum
= csum_partial(udph
, ul
, 0);
344 goto ignore_obscure_skb
;
347 goto ignore_obscure_skb
;
349 skb
->csum
= csum_partial(udph
, ul
, 0);
352 udph
->check
= csum_ipv6_magic(&ip6h
->saddr
, &ip6h
->daddr
, ul
,
353 udplite
? IPPROTO_UDPLITE
: IPPROTO_UDP
,
357 udph
->check
= CSUM_MANGLED_0
;
359 skb
->ip_summed
= CHECKSUM_NONE
;
365 static int tcf_csum_sctp(struct sk_buff
*skb
, unsigned int ihl
,
368 struct sctphdr
*sctph
;
370 if (skb_is_gso(skb
) && skb_is_gso_sctp(skb
))
373 sctph
= tcf_csum_skb_nextlayer(skb
, ihl
, ipl
, sizeof(*sctph
));
377 sctph
->checksum
= sctp_compute_cksum(skb
,
378 skb_network_offset(skb
) + ihl
);
379 skb_reset_csum_not_inet(skb
);
384 static int tcf_csum_ipv4(struct sk_buff
*skb
, u32 update_flags
)
386 const struct iphdr
*iph
;
389 ntkoff
= skb_network_offset(skb
);
391 if (!pskb_may_pull(skb
, sizeof(*iph
) + ntkoff
))
396 switch (iph
->frag_off
& htons(IP_OFFSET
) ? 0 : iph
->protocol
) {
398 if (update_flags
& TCA_CSUM_UPDATE_FLAG_ICMP
)
399 if (!tcf_csum_ipv4_icmp(skb
, iph
->ihl
* 4,
400 ntohs(iph
->tot_len
)))
404 if (update_flags
& TCA_CSUM_UPDATE_FLAG_IGMP
)
405 if (!tcf_csum_ipv4_igmp(skb
, iph
->ihl
* 4,
406 ntohs(iph
->tot_len
)))
410 if (update_flags
& TCA_CSUM_UPDATE_FLAG_TCP
)
411 if (!tcf_csum_ipv4_tcp(skb
, iph
->ihl
* 4,
412 ntohs(iph
->tot_len
)))
416 if (update_flags
& TCA_CSUM_UPDATE_FLAG_UDP
)
417 if (!tcf_csum_ipv4_udp(skb
, iph
->ihl
* 4,
418 ntohs(iph
->tot_len
), 0))
421 case IPPROTO_UDPLITE
:
422 if (update_flags
& TCA_CSUM_UPDATE_FLAG_UDPLITE
)
423 if (!tcf_csum_ipv4_udp(skb
, iph
->ihl
* 4,
424 ntohs(iph
->tot_len
), 1))
428 if ((update_flags
& TCA_CSUM_UPDATE_FLAG_SCTP
) &&
429 !tcf_csum_sctp(skb
, iph
->ihl
* 4, ntohs(iph
->tot_len
)))
434 if (update_flags
& TCA_CSUM_UPDATE_FLAG_IPV4HDR
) {
435 if (skb_try_make_writable(skb
, sizeof(*iph
) + ntkoff
))
438 ip_send_check(ip_hdr(skb
));
447 static int tcf_csum_ipv6_hopopts(struct ipv6_opt_hdr
*ip6xh
, unsigned int ixhl
,
450 int off
, len
, optlen
;
451 unsigned char *xh
= (void *)ip6xh
;
453 off
= sizeof(*ip6xh
);
462 optlen
= xh
[off
+ 1] + 2;
463 if (optlen
!= 6 || len
< 6 || (off
& 3) != 2)
464 /* wrong jumbo option length/alignment */
466 *pl
= ntohl(*(__be32
*)(xh
+ off
+ 2));
469 optlen
= xh
[off
+ 1] + 2;
471 /* ignore obscure options */
483 static int tcf_csum_ipv6(struct sk_buff
*skb
, u32 update_flags
)
485 struct ipv6hdr
*ip6h
;
486 struct ipv6_opt_hdr
*ip6xh
;
487 unsigned int hl
, ixhl
;
492 ntkoff
= skb_network_offset(skb
);
496 if (!pskb_may_pull(skb
, hl
+ ntkoff
))
499 ip6h
= ipv6_hdr(skb
);
501 pl
= ntohs(ip6h
->payload_len
);
502 nexthdr
= ip6h
->nexthdr
;
506 case NEXTHDR_FRAGMENT
:
508 case NEXTHDR_ROUTING
:
511 if (!pskb_may_pull(skb
, hl
+ sizeof(*ip6xh
) + ntkoff
))
513 ip6xh
= (void *)(skb_network_header(skb
) + hl
);
514 ixhl
= ipv6_optlen(ip6xh
);
515 if (!pskb_may_pull(skb
, hl
+ ixhl
+ ntkoff
))
517 ip6xh
= (void *)(skb_network_header(skb
) + hl
);
518 if ((nexthdr
== NEXTHDR_HOP
) &&
519 !(tcf_csum_ipv6_hopopts(ip6xh
, ixhl
, &pl
)))
521 nexthdr
= ip6xh
->nexthdr
;
525 if (update_flags
& TCA_CSUM_UPDATE_FLAG_ICMP
)
526 if (!tcf_csum_ipv6_icmp(skb
,
527 hl
, pl
+ sizeof(*ip6h
)))
531 if (update_flags
& TCA_CSUM_UPDATE_FLAG_TCP
)
532 if (!tcf_csum_ipv6_tcp(skb
,
533 hl
, pl
+ sizeof(*ip6h
)))
537 if (update_flags
& TCA_CSUM_UPDATE_FLAG_UDP
)
538 if (!tcf_csum_ipv6_udp(skb
, hl
,
539 pl
+ sizeof(*ip6h
), 0))
542 case IPPROTO_UDPLITE
:
543 if (update_flags
& TCA_CSUM_UPDATE_FLAG_UDPLITE
)
544 if (!tcf_csum_ipv6_udp(skb
, hl
,
545 pl
+ sizeof(*ip6h
), 1))
549 if ((update_flags
& TCA_CSUM_UPDATE_FLAG_SCTP
) &&
550 !tcf_csum_sctp(skb
, hl
, pl
+ sizeof(*ip6h
)))
556 } while (pskb_may_pull(skb
, hl
+ 1 + ntkoff
));
566 TC_INDIRECT_SCOPE
int tcf_csum_act(struct sk_buff
*skb
,
567 const struct tc_action
*a
,
568 struct tcf_result
*res
)
570 struct tcf_csum
*p
= to_tcf_csum(a
);
571 bool orig_vlan_tag_present
= false;
572 unsigned int vlan_hdr_count
= 0;
573 struct tcf_csum_params
*params
;
578 params
= rcu_dereference_bh(p
->params
);
580 tcf_lastuse_update(&p
->tcf_tm
);
581 tcf_action_update_bstats(&p
->common
, skb
);
583 action
= READ_ONCE(p
->tcf_action
);
584 if (unlikely(action
== TC_ACT_SHOT
))
587 update_flags
= params
->update_flags
;
588 protocol
= skb_protocol(skb
, false);
591 case cpu_to_be16(ETH_P_IP
):
592 if (!tcf_csum_ipv4(skb
, update_flags
))
595 case cpu_to_be16(ETH_P_IPV6
):
596 if (!tcf_csum_ipv6(skb
, update_flags
))
599 case cpu_to_be16(ETH_P_8021AD
):
601 case cpu_to_be16(ETH_P_8021Q
):
602 if (skb_vlan_tag_present(skb
) && !orig_vlan_tag_present
) {
603 protocol
= skb
->protocol
;
604 orig_vlan_tag_present
= true;
606 struct vlan_hdr
*vlan
= (struct vlan_hdr
*)skb
->data
;
608 protocol
= vlan
->h_vlan_encapsulated_proto
;
609 skb_pull(skb
, VLAN_HLEN
);
610 skb_reset_network_header(skb
);
617 /* Restore the skb for the pulled VLAN tags */
618 while (vlan_hdr_count
--) {
619 skb_push(skb
, VLAN_HLEN
);
620 skb_reset_network_header(skb
);
626 tcf_action_inc_drop_qstats(&p
->common
);
627 action
= TC_ACT_SHOT
;
631 static int tcf_csum_dump(struct sk_buff
*skb
, struct tc_action
*a
, int bind
,
634 unsigned char *b
= skb_tail_pointer(skb
);
635 struct tcf_csum
*p
= to_tcf_csum(a
);
636 struct tcf_csum_params
*params
;
637 struct tc_csum opt
= {
638 .index
= p
->tcf_index
,
639 .refcnt
= refcount_read(&p
->tcf_refcnt
) - ref
,
640 .bindcnt
= atomic_read(&p
->tcf_bindcnt
) - bind
,
644 spin_lock_bh(&p
->tcf_lock
);
645 params
= rcu_dereference_protected(p
->params
,
646 lockdep_is_held(&p
->tcf_lock
));
647 opt
.action
= p
->tcf_action
;
648 opt
.update_flags
= params
->update_flags
;
650 if (nla_put(skb
, TCA_CSUM_PARMS
, sizeof(opt
), &opt
))
651 goto nla_put_failure
;
653 tcf_tm_dump(&t
, &p
->tcf_tm
);
654 if (nla_put_64bit(skb
, TCA_CSUM_TM
, sizeof(t
), &t
, TCA_CSUM_PAD
))
655 goto nla_put_failure
;
656 spin_unlock_bh(&p
->tcf_lock
);
661 spin_unlock_bh(&p
->tcf_lock
);
666 static void tcf_csum_cleanup(struct tc_action
*a
)
668 struct tcf_csum
*p
= to_tcf_csum(a
);
669 struct tcf_csum_params
*params
;
671 params
= rcu_dereference_protected(p
->params
, 1);
673 kfree_rcu(params
, rcu
);
676 static size_t tcf_csum_get_fill_size(const struct tc_action
*act
)
678 return nla_total_size(sizeof(struct tc_csum
));
681 static int tcf_csum_offload_act_setup(struct tc_action
*act
, void *entry_data
,
682 u32
*index_inc
, bool bind
,
683 struct netlink_ext_ack
*extack
)
686 struct flow_action_entry
*entry
= entry_data
;
688 entry
->id
= FLOW_ACTION_CSUM
;
689 entry
->csum_flags
= tcf_csum_update_flags(act
);
692 struct flow_offload_action
*fl_action
= entry_data
;
694 fl_action
->id
= FLOW_ACTION_CSUM
;
700 static struct tc_action_ops act_csum_ops
= {
703 .owner
= THIS_MODULE
,
705 .dump
= tcf_csum_dump
,
706 .init
= tcf_csum_init
,
707 .cleanup
= tcf_csum_cleanup
,
708 .get_fill_size
= tcf_csum_get_fill_size
,
709 .offload_act_setup
= tcf_csum_offload_act_setup
,
710 .size
= sizeof(struct tcf_csum
),
712 MODULE_ALIAS_NET_ACT("csum");
714 static __net_init
int csum_init_net(struct net
*net
)
716 struct tc_action_net
*tn
= net_generic(net
, act_csum_ops
.net_id
);
718 return tc_action_net_init(net
, tn
, &act_csum_ops
);
721 static void __net_exit
csum_exit_net(struct list_head
*net_list
)
723 tc_action_net_exit(net_list
, act_csum_ops
.net_id
);
726 static struct pernet_operations csum_net_ops
= {
727 .init
= csum_init_net
,
728 .exit_batch
= csum_exit_net
,
729 .id
= &act_csum_ops
.net_id
,
730 .size
= sizeof(struct tc_action_net
),
733 MODULE_DESCRIPTION("Checksum updating actions");
734 MODULE_LICENSE("GPL");
736 static int __init
csum_init_module(void)
738 return tcf_register_action(&act_csum_ops
, &csum_net_ops
);
741 static void __exit
csum_cleanup_module(void)
743 tcf_unregister_action(&act_csum_ops
, &csum_net_ops
);
746 module_init(csum_init_module
);
747 module_exit(csum_cleanup_module
);