target/cxgbit: Use T6 specific macros to get ETH/IP hdr len
[linux/fpc-iii.git] / net / ipv6 / exthdrs.c
blobe4198502fd98ce55c1ab6d4d9767b8506b2cf707
1 /*
2 * Extension Header handling for IPv6
3 * Linux INET6 implementation
5 * Authors:
6 * Pedro Roque <roque@di.fc.ul.pt>
7 * Andi Kleen <ak@muc.de>
8 * Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
10 * This program is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU General Public License
12 * as published by the Free Software Foundation; either version
13 * 2 of the License, or (at your option) any later version.
16 /* Changes:
17 * yoshfuji : ensure not to overrun while parsing
18 * tlv options.
19 * Mitsuru KANDA @USAGI and: Remove ipv6_parse_exthdrs().
20 * YOSHIFUJI Hideaki @USAGI Register inbound extension header
21 * handlers as inet6_protocol{}.
24 #include <linux/errno.h>
25 #include <linux/types.h>
26 #include <linux/socket.h>
27 #include <linux/sockios.h>
28 #include <linux/net.h>
29 #include <linux/netdevice.h>
30 #include <linux/in6.h>
31 #include <linux/icmpv6.h>
32 #include <linux/slab.h>
33 #include <linux/export.h>
35 #include <net/dst.h>
36 #include <net/sock.h>
37 #include <net/snmp.h>
39 #include <net/ipv6.h>
40 #include <net/protocol.h>
41 #include <net/transp_v6.h>
42 #include <net/rawv6.h>
43 #include <net/ndisc.h>
44 #include <net/ip6_route.h>
45 #include <net/addrconf.h>
46 #include <net/calipso.h>
47 #if IS_ENABLED(CONFIG_IPV6_MIP6)
48 #include <net/xfrm.h>
49 #endif
50 #include <linux/seg6.h>
51 #include <net/seg6.h>
52 #ifdef CONFIG_IPV6_SEG6_HMAC
53 #include <net/seg6_hmac.h>
54 #endif
56 #include <linux/uaccess.h>
59 * Parsing tlv encoded headers.
61 * Parsing function "func" returns true, if parsing succeed
62 * and false, if it failed.
63 * It MUST NOT touch skb->h.
66 struct tlvtype_proc {
67 int type;
68 bool (*func)(struct sk_buff *skb, int offset);
71 /*********************
72 Generic functions
73 *********************/
75 /* An unknown option is detected, decide what to do */
77 static bool ip6_tlvopt_unknown(struct sk_buff *skb, int optoff)
79 switch ((skb_network_header(skb)[optoff] & 0xC0) >> 6) {
80 case 0: /* ignore */
81 return true;
83 case 1: /* drop packet */
84 break;
86 case 3: /* Send ICMP if not a multicast address and drop packet */
87 /* Actually, it is redundant check. icmp_send
88 will recheck in any case.
90 if (ipv6_addr_is_multicast(&ipv6_hdr(skb)->daddr))
91 break;
92 case 2: /* send ICMP PARM PROB regardless and drop packet */
93 icmpv6_param_prob(skb, ICMPV6_UNK_OPTION, optoff);
94 return false;
97 kfree_skb(skb);
98 return false;
101 /* Parse tlv encoded option header (hop-by-hop or destination) */
103 static bool ip6_parse_tlv(const struct tlvtype_proc *procs, struct sk_buff *skb)
105 const struct tlvtype_proc *curr;
106 const unsigned char *nh = skb_network_header(skb);
107 int off = skb_network_header_len(skb);
108 int len = (skb_transport_header(skb)[1] + 1) << 3;
109 int padlen = 0;
111 if (skb_transport_offset(skb) + len > skb_headlen(skb))
112 goto bad;
114 off += 2;
115 len -= 2;
117 while (len > 0) {
118 int optlen = nh[off + 1] + 2;
119 int i;
121 switch (nh[off]) {
122 case IPV6_TLV_PAD1:
123 optlen = 1;
124 padlen++;
125 if (padlen > 7)
126 goto bad;
127 break;
129 case IPV6_TLV_PADN:
130 /* RFC 2460 states that the purpose of PadN is
131 * to align the containing header to multiples
132 * of 8. 7 is therefore the highest valid value.
133 * See also RFC 4942, Section 2.1.9.5.
135 padlen += optlen;
136 if (padlen > 7)
137 goto bad;
138 /* RFC 4942 recommends receiving hosts to
139 * actively check PadN payload to contain
140 * only zeroes.
142 for (i = 2; i < optlen; i++) {
143 if (nh[off + i] != 0)
144 goto bad;
146 break;
148 default: /* Other TLV code so scan list */
149 if (optlen > len)
150 goto bad;
151 for (curr = procs; curr->type >= 0; curr++) {
152 if (curr->type == nh[off]) {
153 /* type specific length/alignment
154 checks will be performed in the
155 func(). */
156 if (curr->func(skb, off) == false)
157 return false;
158 break;
161 if (curr->type < 0) {
162 if (ip6_tlvopt_unknown(skb, off) == 0)
163 return false;
165 padlen = 0;
166 break;
168 off += optlen;
169 len -= optlen;
172 if (len == 0)
173 return true;
174 bad:
175 kfree_skb(skb);
176 return false;
179 /*****************************
180 Destination options header.
181 *****************************/
183 #if IS_ENABLED(CONFIG_IPV6_MIP6)
184 static bool ipv6_dest_hao(struct sk_buff *skb, int optoff)
186 struct ipv6_destopt_hao *hao;
187 struct inet6_skb_parm *opt = IP6CB(skb);
188 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
189 struct in6_addr tmp_addr;
190 int ret;
192 if (opt->dsthao) {
193 net_dbg_ratelimited("hao duplicated\n");
194 goto discard;
196 opt->dsthao = opt->dst1;
197 opt->dst1 = 0;
199 hao = (struct ipv6_destopt_hao *)(skb_network_header(skb) + optoff);
201 if (hao->length != 16) {
202 net_dbg_ratelimited("hao invalid option length = %d\n",
203 hao->length);
204 goto discard;
207 if (!(ipv6_addr_type(&hao->addr) & IPV6_ADDR_UNICAST)) {
208 net_dbg_ratelimited("hao is not an unicast addr: %pI6\n",
209 &hao->addr);
210 goto discard;
213 ret = xfrm6_input_addr(skb, (xfrm_address_t *)&ipv6h->daddr,
214 (xfrm_address_t *)&hao->addr, IPPROTO_DSTOPTS);
215 if (unlikely(ret < 0))
216 goto discard;
218 if (skb_cloned(skb)) {
219 if (pskb_expand_head(skb, 0, 0, GFP_ATOMIC))
220 goto discard;
222 /* update all variable using below by copied skbuff */
223 hao = (struct ipv6_destopt_hao *)(skb_network_header(skb) +
224 optoff);
225 ipv6h = ipv6_hdr(skb);
228 if (skb->ip_summed == CHECKSUM_COMPLETE)
229 skb->ip_summed = CHECKSUM_NONE;
231 tmp_addr = ipv6h->saddr;
232 ipv6h->saddr = hao->addr;
233 hao->addr = tmp_addr;
235 if (skb->tstamp == 0)
236 __net_timestamp(skb);
238 return true;
240 discard:
241 kfree_skb(skb);
242 return false;
244 #endif
246 static const struct tlvtype_proc tlvprocdestopt_lst[] = {
247 #if IS_ENABLED(CONFIG_IPV6_MIP6)
249 .type = IPV6_TLV_HAO,
250 .func = ipv6_dest_hao,
252 #endif
253 {-1, NULL}
256 static int ipv6_destopt_rcv(struct sk_buff *skb)
258 struct inet6_skb_parm *opt = IP6CB(skb);
259 #if IS_ENABLED(CONFIG_IPV6_MIP6)
260 __u16 dstbuf;
261 #endif
262 struct dst_entry *dst = skb_dst(skb);
264 if (!pskb_may_pull(skb, skb_transport_offset(skb) + 8) ||
265 !pskb_may_pull(skb, (skb_transport_offset(skb) +
266 ((skb_transport_header(skb)[1] + 1) << 3)))) {
267 __IP6_INC_STATS(dev_net(dst->dev), ip6_dst_idev(dst),
268 IPSTATS_MIB_INHDRERRORS);
269 kfree_skb(skb);
270 return -1;
273 opt->lastopt = opt->dst1 = skb_network_header_len(skb);
274 #if IS_ENABLED(CONFIG_IPV6_MIP6)
275 dstbuf = opt->dst1;
276 #endif
278 if (ip6_parse_tlv(tlvprocdestopt_lst, skb)) {
279 skb->transport_header += (skb_transport_header(skb)[1] + 1) << 3;
280 opt = IP6CB(skb);
281 #if IS_ENABLED(CONFIG_IPV6_MIP6)
282 opt->nhoff = dstbuf;
283 #else
284 opt->nhoff = opt->dst1;
285 #endif
286 return 1;
289 __IP6_INC_STATS(dev_net(dst->dev),
290 ip6_dst_idev(dst), IPSTATS_MIB_INHDRERRORS);
291 return -1;
294 static void seg6_update_csum(struct sk_buff *skb)
296 struct ipv6_sr_hdr *hdr;
297 struct in6_addr *addr;
298 __be32 from, to;
300 /* srh is at transport offset and seg_left is already decremented
301 * but daddr is not yet updated with next segment
304 hdr = (struct ipv6_sr_hdr *)skb_transport_header(skb);
305 addr = hdr->segments + hdr->segments_left;
307 hdr->segments_left++;
308 from = *(__be32 *)hdr;
310 hdr->segments_left--;
311 to = *(__be32 *)hdr;
313 /* update skb csum with diff resulting from seg_left decrement */
315 update_csum_diff4(skb, from, to);
317 /* compute csum diff between current and next segment and update */
319 update_csum_diff16(skb, (__be32 *)(&ipv6_hdr(skb)->daddr),
320 (__be32 *)addr);
323 static int ipv6_srh_rcv(struct sk_buff *skb)
325 struct inet6_skb_parm *opt = IP6CB(skb);
326 struct net *net = dev_net(skb->dev);
327 struct ipv6_sr_hdr *hdr;
328 struct inet6_dev *idev;
329 struct in6_addr *addr;
330 bool cleanup = false;
331 int accept_seg6;
333 hdr = (struct ipv6_sr_hdr *)skb_transport_header(skb);
335 idev = __in6_dev_get(skb->dev);
337 accept_seg6 = net->ipv6.devconf_all->seg6_enabled;
338 if (accept_seg6 > idev->cnf.seg6_enabled)
339 accept_seg6 = idev->cnf.seg6_enabled;
341 if (!accept_seg6) {
342 kfree_skb(skb);
343 return -1;
346 #ifdef CONFIG_IPV6_SEG6_HMAC
347 if (!seg6_hmac_validate_skb(skb)) {
348 kfree_skb(skb);
349 return -1;
351 #endif
353 looped_back:
354 if (hdr->segments_left > 0) {
355 if (hdr->nexthdr != NEXTHDR_IPV6 && hdr->segments_left == 1 &&
356 sr_has_cleanup(hdr))
357 cleanup = true;
358 } else {
359 if (hdr->nexthdr == NEXTHDR_IPV6) {
360 int offset = (hdr->hdrlen + 1) << 3;
362 skb_postpull_rcsum(skb, skb_network_header(skb),
363 skb_network_header_len(skb));
365 if (!pskb_pull(skb, offset)) {
366 kfree_skb(skb);
367 return -1;
369 skb_postpull_rcsum(skb, skb_transport_header(skb),
370 offset);
372 skb_reset_network_header(skb);
373 skb_reset_transport_header(skb);
374 skb->encapsulation = 0;
376 __skb_tunnel_rx(skb, skb->dev, net);
378 netif_rx(skb);
379 return -1;
382 opt->srcrt = skb_network_header_len(skb);
383 opt->lastopt = opt->srcrt;
384 skb->transport_header += (hdr->hdrlen + 1) << 3;
385 opt->nhoff = (&hdr->nexthdr) - skb_network_header(skb);
387 return 1;
390 if (hdr->segments_left >= (hdr->hdrlen >> 1)) {
391 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
392 IPSTATS_MIB_INHDRERRORS);
393 icmpv6_param_prob(skb, ICMPV6_HDR_FIELD,
394 ((&hdr->segments_left) -
395 skb_network_header(skb)));
396 kfree_skb(skb);
397 return -1;
400 if (skb_cloned(skb)) {
401 if (pskb_expand_head(skb, 0, 0, GFP_ATOMIC)) {
402 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
403 IPSTATS_MIB_OUTDISCARDS);
404 kfree_skb(skb);
405 return -1;
409 hdr = (struct ipv6_sr_hdr *)skb_transport_header(skb);
411 hdr->segments_left--;
412 addr = hdr->segments + hdr->segments_left;
414 skb_push(skb, sizeof(struct ipv6hdr));
416 if (skb->ip_summed == CHECKSUM_COMPLETE)
417 seg6_update_csum(skb);
419 ipv6_hdr(skb)->daddr = *addr;
421 if (cleanup) {
422 int srhlen = (hdr->hdrlen + 1) << 3;
423 int nh = hdr->nexthdr;
425 skb_pull_rcsum(skb, sizeof(struct ipv6hdr) + srhlen);
426 memmove(skb_network_header(skb) + srhlen,
427 skb_network_header(skb),
428 (unsigned char *)hdr - skb_network_header(skb));
429 skb->network_header += srhlen;
430 ipv6_hdr(skb)->nexthdr = nh;
431 ipv6_hdr(skb)->payload_len = htons(skb->len -
432 sizeof(struct ipv6hdr));
433 skb_push_rcsum(skb, sizeof(struct ipv6hdr));
436 skb_dst_drop(skb);
438 ip6_route_input(skb);
440 if (skb_dst(skb)->error) {
441 dst_input(skb);
442 return -1;
445 if (skb_dst(skb)->dev->flags & IFF_LOOPBACK) {
446 if (ipv6_hdr(skb)->hop_limit <= 1) {
447 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
448 IPSTATS_MIB_INHDRERRORS);
449 icmpv6_send(skb, ICMPV6_TIME_EXCEED,
450 ICMPV6_EXC_HOPLIMIT, 0);
451 kfree_skb(skb);
452 return -1;
454 ipv6_hdr(skb)->hop_limit--;
456 /* be sure that srh is still present before reinjecting */
457 if (!cleanup) {
458 skb_pull(skb, sizeof(struct ipv6hdr));
459 goto looped_back;
461 skb_set_transport_header(skb, sizeof(struct ipv6hdr));
462 IP6CB(skb)->nhoff = offsetof(struct ipv6hdr, nexthdr);
465 dst_input(skb);
467 return -1;
470 /********************************
471 Routing header.
472 ********************************/
474 /* called with rcu_read_lock() */
475 static int ipv6_rthdr_rcv(struct sk_buff *skb)
477 struct inet6_skb_parm *opt = IP6CB(skb);
478 struct in6_addr *addr = NULL;
479 struct in6_addr daddr;
480 struct inet6_dev *idev;
481 int n, i;
482 struct ipv6_rt_hdr *hdr;
483 struct rt0_hdr *rthdr;
484 struct net *net = dev_net(skb->dev);
485 int accept_source_route = net->ipv6.devconf_all->accept_source_route;
487 idev = __in6_dev_get(skb->dev);
488 if (idev && accept_source_route > idev->cnf.accept_source_route)
489 accept_source_route = idev->cnf.accept_source_route;
491 if (!pskb_may_pull(skb, skb_transport_offset(skb) + 8) ||
492 !pskb_may_pull(skb, (skb_transport_offset(skb) +
493 ((skb_transport_header(skb)[1] + 1) << 3)))) {
494 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
495 IPSTATS_MIB_INHDRERRORS);
496 kfree_skb(skb);
497 return -1;
500 hdr = (struct ipv6_rt_hdr *)skb_transport_header(skb);
502 if (ipv6_addr_is_multicast(&ipv6_hdr(skb)->daddr) ||
503 skb->pkt_type != PACKET_HOST) {
504 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
505 IPSTATS_MIB_INADDRERRORS);
506 kfree_skb(skb);
507 return -1;
510 /* segment routing */
511 if (hdr->type == IPV6_SRCRT_TYPE_4)
512 return ipv6_srh_rcv(skb);
514 looped_back:
515 if (hdr->segments_left == 0) {
516 switch (hdr->type) {
517 #if IS_ENABLED(CONFIG_IPV6_MIP6)
518 case IPV6_SRCRT_TYPE_2:
519 /* Silently discard type 2 header unless it was
520 * processed by own
522 if (!addr) {
523 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
524 IPSTATS_MIB_INADDRERRORS);
525 kfree_skb(skb);
526 return -1;
528 break;
529 #endif
530 default:
531 break;
534 opt->lastopt = opt->srcrt = skb_network_header_len(skb);
535 skb->transport_header += (hdr->hdrlen + 1) << 3;
536 opt->dst0 = opt->dst1;
537 opt->dst1 = 0;
538 opt->nhoff = (&hdr->nexthdr) - skb_network_header(skb);
539 return 1;
542 switch (hdr->type) {
543 #if IS_ENABLED(CONFIG_IPV6_MIP6)
544 case IPV6_SRCRT_TYPE_2:
545 if (accept_source_route < 0)
546 goto unknown_rh;
547 /* Silently discard invalid RTH type 2 */
548 if (hdr->hdrlen != 2 || hdr->segments_left != 1) {
549 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
550 IPSTATS_MIB_INHDRERRORS);
551 kfree_skb(skb);
552 return -1;
554 break;
555 #endif
556 default:
557 goto unknown_rh;
561 * This is the routing header forwarding algorithm from
562 * RFC 2460, page 16.
565 n = hdr->hdrlen >> 1;
567 if (hdr->segments_left > n) {
568 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
569 IPSTATS_MIB_INHDRERRORS);
570 icmpv6_param_prob(skb, ICMPV6_HDR_FIELD,
571 ((&hdr->segments_left) -
572 skb_network_header(skb)));
573 return -1;
576 /* We are about to mangle packet header. Be careful!
577 Do not damage packets queued somewhere.
579 if (skb_cloned(skb)) {
580 /* the copy is a forwarded packet */
581 if (pskb_expand_head(skb, 0, 0, GFP_ATOMIC)) {
582 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
583 IPSTATS_MIB_OUTDISCARDS);
584 kfree_skb(skb);
585 return -1;
587 hdr = (struct ipv6_rt_hdr *)skb_transport_header(skb);
590 if (skb->ip_summed == CHECKSUM_COMPLETE)
591 skb->ip_summed = CHECKSUM_NONE;
593 i = n - --hdr->segments_left;
595 rthdr = (struct rt0_hdr *) hdr;
596 addr = rthdr->addr;
597 addr += i - 1;
599 switch (hdr->type) {
600 #if IS_ENABLED(CONFIG_IPV6_MIP6)
601 case IPV6_SRCRT_TYPE_2:
602 if (xfrm6_input_addr(skb, (xfrm_address_t *)addr,
603 (xfrm_address_t *)&ipv6_hdr(skb)->saddr,
604 IPPROTO_ROUTING) < 0) {
605 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
606 IPSTATS_MIB_INADDRERRORS);
607 kfree_skb(skb);
608 return -1;
610 if (!ipv6_chk_home_addr(dev_net(skb_dst(skb)->dev), addr)) {
611 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
612 IPSTATS_MIB_INADDRERRORS);
613 kfree_skb(skb);
614 return -1;
616 break;
617 #endif
618 default:
619 break;
622 if (ipv6_addr_is_multicast(addr)) {
623 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
624 IPSTATS_MIB_INADDRERRORS);
625 kfree_skb(skb);
626 return -1;
629 daddr = *addr;
630 *addr = ipv6_hdr(skb)->daddr;
631 ipv6_hdr(skb)->daddr = daddr;
633 skb_dst_drop(skb);
634 ip6_route_input(skb);
635 if (skb_dst(skb)->error) {
636 skb_push(skb, skb->data - skb_network_header(skb));
637 dst_input(skb);
638 return -1;
641 if (skb_dst(skb)->dev->flags&IFF_LOOPBACK) {
642 if (ipv6_hdr(skb)->hop_limit <= 1) {
643 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
644 IPSTATS_MIB_INHDRERRORS);
645 icmpv6_send(skb, ICMPV6_TIME_EXCEED, ICMPV6_EXC_HOPLIMIT,
647 kfree_skb(skb);
648 return -1;
650 ipv6_hdr(skb)->hop_limit--;
651 goto looped_back;
654 skb_push(skb, skb->data - skb_network_header(skb));
655 dst_input(skb);
656 return -1;
658 unknown_rh:
659 __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)), IPSTATS_MIB_INHDRERRORS);
660 icmpv6_param_prob(skb, ICMPV6_HDR_FIELD,
661 (&hdr->type) - skb_network_header(skb));
662 return -1;
665 static const struct inet6_protocol rthdr_protocol = {
666 .handler = ipv6_rthdr_rcv,
667 .flags = INET6_PROTO_NOPOLICY,
670 static const struct inet6_protocol destopt_protocol = {
671 .handler = ipv6_destopt_rcv,
672 .flags = INET6_PROTO_NOPOLICY,
675 static const struct inet6_protocol nodata_protocol = {
676 .handler = dst_discard,
677 .flags = INET6_PROTO_NOPOLICY,
680 int __init ipv6_exthdrs_init(void)
682 int ret;
684 ret = inet6_add_protocol(&rthdr_protocol, IPPROTO_ROUTING);
685 if (ret)
686 goto out;
688 ret = inet6_add_protocol(&destopt_protocol, IPPROTO_DSTOPTS);
689 if (ret)
690 goto out_rthdr;
692 ret = inet6_add_protocol(&nodata_protocol, IPPROTO_NONE);
693 if (ret)
694 goto out_destopt;
696 out:
697 return ret;
698 out_destopt:
699 inet6_del_protocol(&destopt_protocol, IPPROTO_DSTOPTS);
700 out_rthdr:
701 inet6_del_protocol(&rthdr_protocol, IPPROTO_ROUTING);
702 goto out;
705 void ipv6_exthdrs_exit(void)
707 inet6_del_protocol(&nodata_protocol, IPPROTO_NONE);
708 inet6_del_protocol(&destopt_protocol, IPPROTO_DSTOPTS);
709 inet6_del_protocol(&rthdr_protocol, IPPROTO_ROUTING);
712 /**********************************
713 Hop-by-hop options.
714 **********************************/
717 * Note: we cannot rely on skb_dst(skb) before we assign it in ip6_route_input().
719 static inline struct inet6_dev *ipv6_skb_idev(struct sk_buff *skb)
721 return skb_dst(skb) ? ip6_dst_idev(skb_dst(skb)) : __in6_dev_get(skb->dev);
724 static inline struct net *ipv6_skb_net(struct sk_buff *skb)
726 return skb_dst(skb) ? dev_net(skb_dst(skb)->dev) : dev_net(skb->dev);
729 /* Router Alert as of RFC 2711 */
731 static bool ipv6_hop_ra(struct sk_buff *skb, int optoff)
733 const unsigned char *nh = skb_network_header(skb);
735 if (nh[optoff + 1] == 2) {
736 IP6CB(skb)->flags |= IP6SKB_ROUTERALERT;
737 memcpy(&IP6CB(skb)->ra, nh + optoff + 2, sizeof(IP6CB(skb)->ra));
738 return true;
740 net_dbg_ratelimited("ipv6_hop_ra: wrong RA length %d\n",
741 nh[optoff + 1]);
742 kfree_skb(skb);
743 return false;
746 /* Jumbo payload */
748 static bool ipv6_hop_jumbo(struct sk_buff *skb, int optoff)
750 const unsigned char *nh = skb_network_header(skb);
751 struct net *net = ipv6_skb_net(skb);
752 u32 pkt_len;
754 if (nh[optoff + 1] != 4 || (optoff & 3) != 2) {
755 net_dbg_ratelimited("ipv6_hop_jumbo: wrong jumbo opt length/alignment %d\n",
756 nh[optoff+1]);
757 __IP6_INC_STATS(net, ipv6_skb_idev(skb),
758 IPSTATS_MIB_INHDRERRORS);
759 goto drop;
762 pkt_len = ntohl(*(__be32 *)(nh + optoff + 2));
763 if (pkt_len <= IPV6_MAXPLEN) {
764 __IP6_INC_STATS(net, ipv6_skb_idev(skb),
765 IPSTATS_MIB_INHDRERRORS);
766 icmpv6_param_prob(skb, ICMPV6_HDR_FIELD, optoff+2);
767 return false;
769 if (ipv6_hdr(skb)->payload_len) {
770 __IP6_INC_STATS(net, ipv6_skb_idev(skb),
771 IPSTATS_MIB_INHDRERRORS);
772 icmpv6_param_prob(skb, ICMPV6_HDR_FIELD, optoff);
773 return false;
776 if (pkt_len > skb->len - sizeof(struct ipv6hdr)) {
777 __IP6_INC_STATS(net, ipv6_skb_idev(skb),
778 IPSTATS_MIB_INTRUNCATEDPKTS);
779 goto drop;
782 if (pskb_trim_rcsum(skb, pkt_len + sizeof(struct ipv6hdr)))
783 goto drop;
785 return true;
787 drop:
788 kfree_skb(skb);
789 return false;
792 /* CALIPSO RFC 5570 */
794 static bool ipv6_hop_calipso(struct sk_buff *skb, int optoff)
796 const unsigned char *nh = skb_network_header(skb);
798 if (nh[optoff + 1] < 8)
799 goto drop;
801 if (nh[optoff + 6] * 4 + 8 > nh[optoff + 1])
802 goto drop;
804 if (!calipso_validate(skb, nh + optoff))
805 goto drop;
807 return true;
809 drop:
810 kfree_skb(skb);
811 return false;
814 static const struct tlvtype_proc tlvprochopopt_lst[] = {
816 .type = IPV6_TLV_ROUTERALERT,
817 .func = ipv6_hop_ra,
820 .type = IPV6_TLV_JUMBO,
821 .func = ipv6_hop_jumbo,
824 .type = IPV6_TLV_CALIPSO,
825 .func = ipv6_hop_calipso,
827 { -1, }
830 int ipv6_parse_hopopts(struct sk_buff *skb)
832 struct inet6_skb_parm *opt = IP6CB(skb);
835 * skb_network_header(skb) is equal to skb->data, and
836 * skb_network_header_len(skb) is always equal to
837 * sizeof(struct ipv6hdr) by definition of
838 * hop-by-hop options.
840 if (!pskb_may_pull(skb, sizeof(struct ipv6hdr) + 8) ||
841 !pskb_may_pull(skb, (sizeof(struct ipv6hdr) +
842 ((skb_transport_header(skb)[1] + 1) << 3)))) {
843 kfree_skb(skb);
844 return -1;
847 opt->flags |= IP6SKB_HOPBYHOP;
848 if (ip6_parse_tlv(tlvprochopopt_lst, skb)) {
849 skb->transport_header += (skb_transport_header(skb)[1] + 1) << 3;
850 opt = IP6CB(skb);
851 opt->nhoff = sizeof(struct ipv6hdr);
852 return 1;
854 return -1;
858 * Creating outbound headers.
860 * "build" functions work when skb is filled from head to tail (datagram)
861 * "push" functions work when headers are added from tail to head (tcp)
863 * In both cases we assume, that caller reserved enough room
864 * for headers.
867 static void ipv6_push_rthdr0(struct sk_buff *skb, u8 *proto,
868 struct ipv6_rt_hdr *opt,
869 struct in6_addr **addr_p, struct in6_addr *saddr)
871 struct rt0_hdr *phdr, *ihdr;
872 int hops;
874 ihdr = (struct rt0_hdr *) opt;
876 phdr = (struct rt0_hdr *) skb_push(skb, (ihdr->rt_hdr.hdrlen + 1) << 3);
877 memcpy(phdr, ihdr, sizeof(struct rt0_hdr));
879 hops = ihdr->rt_hdr.hdrlen >> 1;
881 if (hops > 1)
882 memcpy(phdr->addr, ihdr->addr + 1,
883 (hops - 1) * sizeof(struct in6_addr));
885 phdr->addr[hops - 1] = **addr_p;
886 *addr_p = ihdr->addr;
888 phdr->rt_hdr.nexthdr = *proto;
889 *proto = NEXTHDR_ROUTING;
892 static void ipv6_push_rthdr4(struct sk_buff *skb, u8 *proto,
893 struct ipv6_rt_hdr *opt,
894 struct in6_addr **addr_p, struct in6_addr *saddr)
896 struct ipv6_sr_hdr *sr_phdr, *sr_ihdr;
897 int plen, hops;
899 sr_ihdr = (struct ipv6_sr_hdr *)opt;
900 plen = (sr_ihdr->hdrlen + 1) << 3;
902 sr_phdr = (struct ipv6_sr_hdr *)skb_push(skb, plen);
903 memcpy(sr_phdr, sr_ihdr, sizeof(struct ipv6_sr_hdr));
905 hops = sr_ihdr->first_segment + 1;
906 memcpy(sr_phdr->segments + 1, sr_ihdr->segments + 1,
907 (hops - 1) * sizeof(struct in6_addr));
909 sr_phdr->segments[0] = **addr_p;
910 *addr_p = &sr_ihdr->segments[hops - 1];
912 #ifdef CONFIG_IPV6_SEG6_HMAC
913 if (sr_has_hmac(sr_phdr)) {
914 struct net *net = NULL;
916 if (skb->dev)
917 net = dev_net(skb->dev);
918 else if (skb->sk)
919 net = sock_net(skb->sk);
921 WARN_ON(!net);
923 if (net)
924 seg6_push_hmac(net, saddr, sr_phdr);
926 #endif
928 sr_phdr->nexthdr = *proto;
929 *proto = NEXTHDR_ROUTING;
932 static void ipv6_push_rthdr(struct sk_buff *skb, u8 *proto,
933 struct ipv6_rt_hdr *opt,
934 struct in6_addr **addr_p, struct in6_addr *saddr)
936 switch (opt->type) {
937 case IPV6_SRCRT_TYPE_0:
938 ipv6_push_rthdr0(skb, proto, opt, addr_p, saddr);
939 break;
940 case IPV6_SRCRT_TYPE_4:
941 ipv6_push_rthdr4(skb, proto, opt, addr_p, saddr);
942 break;
943 default:
944 break;
948 static void ipv6_push_exthdr(struct sk_buff *skb, u8 *proto, u8 type, struct ipv6_opt_hdr *opt)
950 struct ipv6_opt_hdr *h = (struct ipv6_opt_hdr *)skb_push(skb, ipv6_optlen(opt));
952 memcpy(h, opt, ipv6_optlen(opt));
953 h->nexthdr = *proto;
954 *proto = type;
957 void ipv6_push_nfrag_opts(struct sk_buff *skb, struct ipv6_txoptions *opt,
958 u8 *proto,
959 struct in6_addr **daddr, struct in6_addr *saddr)
961 if (opt->srcrt) {
962 ipv6_push_rthdr(skb, proto, opt->srcrt, daddr, saddr);
964 * IPV6_RTHDRDSTOPTS is ignored
965 * unless IPV6_RTHDR is set (RFC3542).
967 if (opt->dst0opt)
968 ipv6_push_exthdr(skb, proto, NEXTHDR_DEST, opt->dst0opt);
970 if (opt->hopopt)
971 ipv6_push_exthdr(skb, proto, NEXTHDR_HOP, opt->hopopt);
973 EXPORT_SYMBOL(ipv6_push_nfrag_opts);
975 void ipv6_push_frag_opts(struct sk_buff *skb, struct ipv6_txoptions *opt, u8 *proto)
977 if (opt->dst1opt)
978 ipv6_push_exthdr(skb, proto, NEXTHDR_DEST, opt->dst1opt);
981 struct ipv6_txoptions *
982 ipv6_dup_options(struct sock *sk, struct ipv6_txoptions *opt)
984 struct ipv6_txoptions *opt2;
986 opt2 = sock_kmalloc(sk, opt->tot_len, GFP_ATOMIC);
987 if (opt2) {
988 long dif = (char *)opt2 - (char *)opt;
989 memcpy(opt2, opt, opt->tot_len);
990 if (opt2->hopopt)
991 *((char **)&opt2->hopopt) += dif;
992 if (opt2->dst0opt)
993 *((char **)&opt2->dst0opt) += dif;
994 if (opt2->dst1opt)
995 *((char **)&opt2->dst1opt) += dif;
996 if (opt2->srcrt)
997 *((char **)&opt2->srcrt) += dif;
998 atomic_set(&opt2->refcnt, 1);
1000 return opt2;
1002 EXPORT_SYMBOL_GPL(ipv6_dup_options);
1004 static int ipv6_renew_option(void *ohdr,
1005 struct ipv6_opt_hdr __user *newopt, int newoptlen,
1006 int inherit,
1007 struct ipv6_opt_hdr **hdr,
1008 char **p)
1010 if (inherit) {
1011 if (ohdr) {
1012 memcpy(*p, ohdr, ipv6_optlen((struct ipv6_opt_hdr *)ohdr));
1013 *hdr = (struct ipv6_opt_hdr *)*p;
1014 *p += CMSG_ALIGN(ipv6_optlen(*hdr));
1016 } else {
1017 if (newopt) {
1018 if (copy_from_user(*p, newopt, newoptlen))
1019 return -EFAULT;
1020 *hdr = (struct ipv6_opt_hdr *)*p;
1021 if (ipv6_optlen(*hdr) > newoptlen)
1022 return -EINVAL;
1023 *p += CMSG_ALIGN(newoptlen);
1026 return 0;
1030 * ipv6_renew_options - replace a specific ext hdr with a new one.
1032 * @sk: sock from which to allocate memory
1033 * @opt: original options
1034 * @newtype: option type to replace in @opt
1035 * @newopt: new option of type @newtype to replace (user-mem)
1036 * @newoptlen: length of @newopt
1038 * Returns a new set of options which is a copy of @opt with the
1039 * option type @newtype replaced with @newopt.
1041 * @opt may be NULL, in which case a new set of options is returned
1042 * containing just @newopt.
1044 * @newopt may be NULL, in which case the specified option type is
1045 * not copied into the new set of options.
1047 * The new set of options is allocated from the socket option memory
1048 * buffer of @sk.
1050 struct ipv6_txoptions *
1051 ipv6_renew_options(struct sock *sk, struct ipv6_txoptions *opt,
1052 int newtype,
1053 struct ipv6_opt_hdr __user *newopt, int newoptlen)
1055 int tot_len = 0;
1056 char *p;
1057 struct ipv6_txoptions *opt2;
1058 int err;
1060 if (opt) {
1061 if (newtype != IPV6_HOPOPTS && opt->hopopt)
1062 tot_len += CMSG_ALIGN(ipv6_optlen(opt->hopopt));
1063 if (newtype != IPV6_RTHDRDSTOPTS && opt->dst0opt)
1064 tot_len += CMSG_ALIGN(ipv6_optlen(opt->dst0opt));
1065 if (newtype != IPV6_RTHDR && opt->srcrt)
1066 tot_len += CMSG_ALIGN(ipv6_optlen(opt->srcrt));
1067 if (newtype != IPV6_DSTOPTS && opt->dst1opt)
1068 tot_len += CMSG_ALIGN(ipv6_optlen(opt->dst1opt));
1071 if (newopt && newoptlen)
1072 tot_len += CMSG_ALIGN(newoptlen);
1074 if (!tot_len)
1075 return NULL;
1077 tot_len += sizeof(*opt2);
1078 opt2 = sock_kmalloc(sk, tot_len, GFP_ATOMIC);
1079 if (!opt2)
1080 return ERR_PTR(-ENOBUFS);
1082 memset(opt2, 0, tot_len);
1083 atomic_set(&opt2->refcnt, 1);
1084 opt2->tot_len = tot_len;
1085 p = (char *)(opt2 + 1);
1087 err = ipv6_renew_option(opt ? opt->hopopt : NULL, newopt, newoptlen,
1088 newtype != IPV6_HOPOPTS,
1089 &opt2->hopopt, &p);
1090 if (err)
1091 goto out;
1093 err = ipv6_renew_option(opt ? opt->dst0opt : NULL, newopt, newoptlen,
1094 newtype != IPV6_RTHDRDSTOPTS,
1095 &opt2->dst0opt, &p);
1096 if (err)
1097 goto out;
1099 err = ipv6_renew_option(opt ? opt->srcrt : NULL, newopt, newoptlen,
1100 newtype != IPV6_RTHDR,
1101 (struct ipv6_opt_hdr **)&opt2->srcrt, &p);
1102 if (err)
1103 goto out;
1105 err = ipv6_renew_option(opt ? opt->dst1opt : NULL, newopt, newoptlen,
1106 newtype != IPV6_DSTOPTS,
1107 &opt2->dst1opt, &p);
1108 if (err)
1109 goto out;
1111 opt2->opt_nflen = (opt2->hopopt ? ipv6_optlen(opt2->hopopt) : 0) +
1112 (opt2->dst0opt ? ipv6_optlen(opt2->dst0opt) : 0) +
1113 (opt2->srcrt ? ipv6_optlen(opt2->srcrt) : 0);
1114 opt2->opt_flen = (opt2->dst1opt ? ipv6_optlen(opt2->dst1opt) : 0);
1116 return opt2;
1117 out:
1118 sock_kfree_s(sk, opt2, opt2->tot_len);
1119 return ERR_PTR(err);
1123 * ipv6_renew_options_kern - replace a specific ext hdr with a new one.
1125 * @sk: sock from which to allocate memory
1126 * @opt: original options
1127 * @newtype: option type to replace in @opt
1128 * @newopt: new option of type @newtype to replace (kernel-mem)
1129 * @newoptlen: length of @newopt
1131 * See ipv6_renew_options(). The difference is that @newopt is
1132 * kernel memory, rather than user memory.
1134 struct ipv6_txoptions *
1135 ipv6_renew_options_kern(struct sock *sk, struct ipv6_txoptions *opt,
1136 int newtype, struct ipv6_opt_hdr *newopt,
1137 int newoptlen)
1139 struct ipv6_txoptions *ret_val;
1140 const mm_segment_t old_fs = get_fs();
1142 set_fs(KERNEL_DS);
1143 ret_val = ipv6_renew_options(sk, opt, newtype,
1144 (struct ipv6_opt_hdr __user *)newopt,
1145 newoptlen);
1146 set_fs(old_fs);
1147 return ret_val;
1150 struct ipv6_txoptions *ipv6_fixup_options(struct ipv6_txoptions *opt_space,
1151 struct ipv6_txoptions *opt)
1154 * ignore the dest before srcrt unless srcrt is being included.
1155 * --yoshfuji
1157 if (opt && opt->dst0opt && !opt->srcrt) {
1158 if (opt_space != opt) {
1159 memcpy(opt_space, opt, sizeof(*opt_space));
1160 opt = opt_space;
1162 opt->opt_nflen -= ipv6_optlen(opt->dst0opt);
1163 opt->dst0opt = NULL;
1166 return opt;
1168 EXPORT_SYMBOL_GPL(ipv6_fixup_options);
1171 * fl6_update_dst - update flowi destination address with info given
1172 * by srcrt option, if any.
1174 * @fl6: flowi6 for which daddr is to be updated
1175 * @opt: struct ipv6_txoptions in which to look for srcrt opt
1176 * @orig: copy of original daddr address if modified
1178 * Returns NULL if no txoptions or no srcrt, otherwise returns orig
1179 * and initial value of fl6->daddr set in orig
1181 struct in6_addr *fl6_update_dst(struct flowi6 *fl6,
1182 const struct ipv6_txoptions *opt,
1183 struct in6_addr *orig)
1185 if (!opt || !opt->srcrt)
1186 return NULL;
1188 *orig = fl6->daddr;
1190 switch (opt->srcrt->type) {
1191 case IPV6_SRCRT_TYPE_0:
1192 fl6->daddr = *((struct rt0_hdr *)opt->srcrt)->addr;
1193 break;
1194 case IPV6_SRCRT_TYPE_4:
1196 struct ipv6_sr_hdr *srh = (struct ipv6_sr_hdr *)opt->srcrt;
1198 fl6->daddr = srh->segments[srh->first_segment];
1199 break;
1201 default:
1202 return NULL;
1205 return orig;
1207 EXPORT_SYMBOL_GPL(fl6_update_dst);