2 * Internet Control Message Protocol (ICMPv6)
3 * Linux INET6 implementation
6 * Pedro Roque <roque@di.fc.ul.pt>
8 * Based on net/ipv4/icmp.c
12 * This program is free software; you can redistribute it and/or
13 * modify it under the terms of the GNU General Public License
14 * as published by the Free Software Foundation; either version
15 * 2 of the License, or (at your option) any later version.
21 * Andi Kleen : exception handling
22 * Andi Kleen add rate limits. never reply to a icmp.
23 * add more length checks and other fixes.
24 * yoshfuji : ensure to sent parameter problem for
26 * YOSHIFUJI Hideaki @USAGI: added sysctl for icmp rate limit.
28 * YOSHIFUJI Hideaki @USAGI: Per-interface statistics support
29 * Kazunori MIYAZAWA @USAGI: change output process to use ip6_append_data
32 #define pr_fmt(fmt) "IPv6: " fmt
34 #include <linux/module.h>
35 #include <linux/errno.h>
36 #include <linux/types.h>
37 #include <linux/socket.h>
39 #include <linux/kernel.h>
40 #include <linux/sockios.h>
41 #include <linux/net.h>
42 #include <linux/skbuff.h>
43 #include <linux/init.h>
44 #include <linux/netfilter.h>
45 #include <linux/slab.h>
48 #include <linux/sysctl.h>
51 #include <linux/inet.h>
52 #include <linux/netdevice.h>
53 #include <linux/icmpv6.h>
59 #include <net/ip6_checksum.h>
61 #include <net/protocol.h>
63 #include <net/rawv6.h>
64 #include <net/transp_v6.h>
65 #include <net/ip6_route.h>
66 #include <net/addrconf.h>
69 #include <net/inet_common.h>
70 #include <net/dsfield.h>
71 #include <net/l3mdev.h>
73 #include <linux/uaccess.h>
/*
 *	The ICMP socket(s). This is the most convenient way to flow control
 *	our ICMP output as well as maintain a clean interface throughout
 *	all layers. All socketless IP sends will soon be gone.
 *
 *	On SMP we have one ICMP socket per CPU.
 */
82 static inline struct sock
*icmpv6_sk(struct net
*net
)
84 return net
->ipv6
.icmp_sk
[smp_processor_id()];
87 static void icmpv6_err(struct sk_buff
*skb
, struct inet6_skb_parm
*opt
,
88 u8 type
, u8 code
, int offset
, __be32 info
)
90 /* icmpv6_notify checks 8 bytes can be pulled, icmp6hdr is 8 bytes */
91 struct icmp6hdr
*icmp6
= (struct icmp6hdr
*) (skb
->data
+ offset
);
92 struct net
*net
= dev_net(skb
->dev
);
94 if (type
== ICMPV6_PKT_TOOBIG
)
95 ip6_update_pmtu(skb
, net
, info
, skb
->dev
->ifindex
, 0, sock_net_uid(net
, NULL
));
96 else if (type
== NDISC_REDIRECT
)
97 ip6_redirect(skb
, net
, skb
->dev
->ifindex
, 0,
98 sock_net_uid(net
, NULL
));
100 if (!(type
& ICMPV6_INFOMSG_MASK
))
101 if (icmp6
->icmp6_type
== ICMPV6_ECHO_REQUEST
)
102 ping_err(skb
, offset
, ntohl(info
));
105 static int icmpv6_rcv(struct sk_buff
*skb
);
107 static const struct inet6_protocol icmpv6_protocol
= {
108 .handler
= icmpv6_rcv
,
109 .err_handler
= icmpv6_err
,
110 .flags
= INET6_PROTO_NOPOLICY
|INET6_PROTO_FINAL
,
113 /* Called with BH disabled */
114 static __inline__
struct sock
*icmpv6_xmit_lock(struct net
*net
)
119 if (unlikely(!spin_trylock(&sk
->sk_lock
.slock
))) {
120 /* This can happen if the output path (f.e. SIT or
121 * ip6ip6 tunnel) signals dst_link_failure() for an
122 * outgoing ICMP6 packet.
129 static __inline__
void icmpv6_xmit_unlock(struct sock
*sk
)
131 spin_unlock(&sk
->sk_lock
.slock
);
135 * Figure out, may we reply to this packet with icmp error.
137 * We do not reply, if:
138 * - it was icmp error message.
139 * - it is truncated, so that it is known, that protocol is ICMPV6
140 * (i.e. in the middle of some exthdr)
145 static bool is_ineligible(const struct sk_buff
*skb
)
147 int ptr
= (u8
*)(ipv6_hdr(skb
) + 1) - skb
->data
;
148 int len
= skb
->len
- ptr
;
149 __u8 nexthdr
= ipv6_hdr(skb
)->nexthdr
;
155 ptr
= ipv6_skip_exthdr(skb
, ptr
, &nexthdr
, &frag_off
);
158 if (nexthdr
== IPPROTO_ICMPV6
) {
160 tp
= skb_header_pointer(skb
,
161 ptr
+offsetof(struct icmp6hdr
, icmp6_type
),
162 sizeof(_type
), &_type
);
163 if (!tp
|| !(*tp
& ICMPV6_INFOMSG_MASK
))
169 static bool icmpv6_mask_allow(int type
)
171 /* Informational messages are not limited. */
172 if (type
& ICMPV6_INFOMSG_MASK
)
175 /* Do not limit pmtu discovery, it would break it. */
176 if (type
== ICMPV6_PKT_TOOBIG
)
182 static bool icmpv6_global_allow(int type
)
184 if (icmpv6_mask_allow(type
))
187 if (icmp_global_allow())
194 * Check the ICMP output rate limit
196 static bool icmpv6_xrlim_allow(struct sock
*sk
, u8 type
,
199 struct net
*net
= sock_net(sk
);
200 struct dst_entry
*dst
;
203 if (icmpv6_mask_allow(type
))
207 * Look up the output route.
208 * XXX: perhaps the expire for routing entries cloned by
209 * this lookup should be more aggressive (not longer than timeout).
211 dst
= ip6_route_output(net
, sk
, fl6
);
213 IP6_INC_STATS(net
, ip6_dst_idev(dst
),
214 IPSTATS_MIB_OUTNOROUTES
);
215 } else if (dst
->dev
&& (dst
->dev
->flags
&IFF_LOOPBACK
)) {
218 struct rt6_info
*rt
= (struct rt6_info
*)dst
;
219 int tmo
= net
->ipv6
.sysctl
.icmpv6_time
;
220 struct inet_peer
*peer
;
222 /* Give more bandwidth to wider prefixes. */
223 if (rt
->rt6i_dst
.plen
< 128)
224 tmo
>>= ((128 - rt
->rt6i_dst
.plen
)>>5);
226 peer
= inet_getpeer_v6(net
->ipv6
.peers
, &fl6
->daddr
, 1);
227 res
= inet_peer_xrlim_allow(peer
, tmo
);
236 * an inline helper for the "simple" if statement below
237 * checks if parameter problem report is caused by an
238 * unrecognized IPv6 option that has the Option Type
239 * highest-order two bits set to 10
242 static bool opt_unrec(struct sk_buff
*skb
, __u32 offset
)
246 offset
+= skb_network_offset(skb
);
247 op
= skb_header_pointer(skb
, offset
, sizeof(_optval
), &_optval
);
250 return (*op
& 0xC0) == 0x80;
253 void icmpv6_push_pending_frames(struct sock
*sk
, struct flowi6
*fl6
,
254 struct icmp6hdr
*thdr
, int len
)
257 struct icmp6hdr
*icmp6h
;
259 skb
= skb_peek(&sk
->sk_write_queue
);
263 icmp6h
= icmp6_hdr(skb
);
264 memcpy(icmp6h
, thdr
, sizeof(struct icmp6hdr
));
265 icmp6h
->icmp6_cksum
= 0;
267 if (skb_queue_len(&sk
->sk_write_queue
) == 1) {
268 skb
->csum
= csum_partial(icmp6h
,
269 sizeof(struct icmp6hdr
), skb
->csum
);
270 icmp6h
->icmp6_cksum
= csum_ipv6_magic(&fl6
->saddr
,
272 len
, fl6
->flowi6_proto
,
277 skb_queue_walk(&sk
->sk_write_queue
, skb
) {
278 tmp_csum
= csum_add(tmp_csum
, skb
->csum
);
281 tmp_csum
= csum_partial(icmp6h
,
282 sizeof(struct icmp6hdr
), tmp_csum
);
283 icmp6h
->icmp6_cksum
= csum_ipv6_magic(&fl6
->saddr
,
285 len
, fl6
->flowi6_proto
,
288 ip6_push_pending_frames(sk
);
297 static int icmpv6_getfrag(void *from
, char *to
, int offset
, int len
, int odd
, struct sk_buff
*skb
)
299 struct icmpv6_msg
*msg
= (struct icmpv6_msg
*) from
;
300 struct sk_buff
*org_skb
= msg
->skb
;
303 csum
= skb_copy_and_csum_bits(org_skb
, msg
->offset
+ offset
,
305 skb
->csum
= csum_block_add(skb
->csum
, csum
, odd
);
306 if (!(msg
->type
& ICMPV6_INFOMSG_MASK
))
307 nf_ct_attach(skb
, org_skb
);
311 #if IS_ENABLED(CONFIG_IPV6_MIP6)
312 static void mip6_addr_swap(struct sk_buff
*skb
)
314 struct ipv6hdr
*iph
= ipv6_hdr(skb
);
315 struct inet6_skb_parm
*opt
= IP6CB(skb
);
316 struct ipv6_destopt_hao
*hao
;
321 off
= ipv6_find_tlv(skb
, opt
->dsthao
, IPV6_TLV_HAO
);
322 if (likely(off
>= 0)) {
323 hao
= (struct ipv6_destopt_hao
*)
324 (skb_network_header(skb
) + off
);
326 iph
->saddr
= hao
->addr
;
332 static inline void mip6_addr_swap(struct sk_buff
*skb
) {}
335 static struct dst_entry
*icmpv6_route_lookup(struct net
*net
,
340 struct dst_entry
*dst
, *dst2
;
344 err
= ip6_dst_lookup(net
, sk
, &dst
, fl6
);
349 * We won't send icmp if the destination is known
352 if (ipv6_anycast_destination(dst
, &fl6
->daddr
)) {
353 net_dbg_ratelimited("icmp6_send: acast source\n");
355 return ERR_PTR(-EINVAL
);
358 /* No need to clone since we're just using its address. */
361 dst
= xfrm_lookup(net
, dst
, flowi6_to_flowi(fl6
), sk
, 0);
366 if (PTR_ERR(dst
) == -EPERM
)
372 err
= xfrm_decode_session_reverse(skb
, flowi6_to_flowi(&fl2
), AF_INET6
);
374 goto relookup_failed
;
376 err
= ip6_dst_lookup(net
, sk
, &dst2
, &fl2
);
378 goto relookup_failed
;
380 dst2
= xfrm_lookup(net
, dst2
, flowi6_to_flowi(&fl2
), sk
, XFRM_LOOKUP_ICMP
);
390 goto relookup_failed
;
399 static int icmp6_iif(const struct sk_buff
*skb
)
401 int iif
= skb
->dev
->ifindex
;
403 /* for local traffic to local address, skb dev is the loopback
404 * device. Check if there is a dst attached to the skb and if so
405 * get the real device index. Same is needed for replies to a link
406 * local address on a device enslaved to an L3 master device
408 if (unlikely(iif
== LOOPBACK_IFINDEX
|| netif_is_l3_master(skb
->dev
))) {
409 const struct rt6_info
*rt6
= skb_rt6_info(skb
);
412 iif
= rt6
->rt6i_idev
->dev
->ifindex
;
419 * Send an ICMP message in response to a packet in error
421 static void icmp6_send(struct sk_buff
*skb
, u8 type
, u8 code
, __u32 info
,
422 const struct in6_addr
*force_saddr
)
424 struct inet6_dev
*idev
= NULL
;
425 struct ipv6hdr
*hdr
= ipv6_hdr(skb
);
428 struct ipv6_pinfo
*np
;
429 const struct in6_addr
*saddr
= NULL
;
430 struct dst_entry
*dst
;
431 struct icmp6hdr tmp_hdr
;
433 struct icmpv6_msg msg
;
434 struct ipcm6_cookie ipc6
;
440 if ((u8
*)hdr
< skb
->head
||
441 (skb_network_header(skb
) + sizeof(*hdr
)) > skb_tail_pointer(skb
))
446 net
= dev_net(skb
->dev
);
447 mark
= IP6_REPLY_MARK(net
, skb
->mark
);
449 * Make sure we respect the rules
450 * i.e. RFC 1885 2.4(e)
451 * Rule (e.1) is enforced by not using icmp6_send
452 * in any code that processes icmp errors.
454 addr_type
= ipv6_addr_type(&hdr
->daddr
);
456 if (ipv6_chk_addr(net
, &hdr
->daddr
, skb
->dev
, 0) ||
457 ipv6_chk_acast_addr_src(net
, skb
->dev
, &hdr
->daddr
))
464 if (addr_type
& IPV6_ADDR_MULTICAST
|| skb
->pkt_type
!= PACKET_HOST
) {
465 if (type
!= ICMPV6_PKT_TOOBIG
&&
466 !(type
== ICMPV6_PARAMPROB
&&
467 code
== ICMPV6_UNK_OPTION
&&
468 (opt_unrec(skb
, info
))))
474 addr_type
= ipv6_addr_type(&hdr
->saddr
);
480 if (__ipv6_addr_needs_scope_id(addr_type
)) {
481 iif
= icmp6_iif(skb
);
484 iif
= l3mdev_master_ifindex(dst
? dst
->dev
: skb
->dev
);
488 * Must not send error if the source does not uniquely
489 * identify a single node (RFC2463 Section 2.4).
490 * We check unspecified / multicast addresses here,
491 * and anycast addresses will be checked later.
493 if ((addr_type
== IPV6_ADDR_ANY
) || (addr_type
& IPV6_ADDR_MULTICAST
)) {
494 net_dbg_ratelimited("icmp6_send: addr_any/mcast source [%pI6c > %pI6c]\n",
495 &hdr
->saddr
, &hdr
->daddr
);
500 * Never answer to a ICMP packet.
502 if (is_ineligible(skb
)) {
503 net_dbg_ratelimited("icmp6_send: no reply to icmp error [%pI6c > %pI6c]\n",
504 &hdr
->saddr
, &hdr
->daddr
);
508 /* Needed by both icmp_global_allow and icmpv6_xmit_lock */
511 /* Check global sysctl_icmp_msgs_per_sec ratelimit */
512 if (!(skb
->dev
->flags
&IFF_LOOPBACK
) && !icmpv6_global_allow(type
))
517 memset(&fl6
, 0, sizeof(fl6
));
518 fl6
.flowi6_proto
= IPPROTO_ICMPV6
;
519 fl6
.daddr
= hdr
->saddr
;
524 fl6
.flowi6_mark
= mark
;
525 fl6
.flowi6_oif
= iif
;
526 fl6
.fl6_icmp_type
= type
;
527 fl6
.fl6_icmp_code
= code
;
528 fl6
.flowi6_uid
= sock_net_uid(net
, NULL
);
529 fl6
.mp_hash
= rt6_multipath_hash(net
, &fl6
, skb
, NULL
);
530 security_skb_classify_flow(skb
, flowi6_to_flowi(&fl6
));
532 sk
= icmpv6_xmit_lock(net
);
539 if (!icmpv6_xrlim_allow(sk
, type
, &fl6
))
542 tmp_hdr
.icmp6_type
= type
;
543 tmp_hdr
.icmp6_code
= code
;
544 tmp_hdr
.icmp6_cksum
= 0;
545 tmp_hdr
.icmp6_pointer
= htonl(info
);
547 if (!fl6
.flowi6_oif
&& ipv6_addr_is_multicast(&fl6
.daddr
))
548 fl6
.flowi6_oif
= np
->mcast_oif
;
549 else if (!fl6
.flowi6_oif
)
550 fl6
.flowi6_oif
= np
->ucast_oif
;
552 ipcm6_init_sk(&ipc6
, np
);
553 fl6
.flowlabel
= ip6_make_flowinfo(ipc6
.tclass
, fl6
.flowlabel
);
555 dst
= icmpv6_route_lookup(net
, skb
, sk
, &fl6
);
559 ipc6
.hlimit
= ip6_sk_dst_hoplimit(np
, &fl6
, dst
);
562 msg
.offset
= skb_network_offset(skb
);
565 len
= skb
->len
- msg
.offset
;
566 len
= min_t(unsigned int, len
, IPV6_MIN_MTU
- sizeof(struct ipv6hdr
) - sizeof(struct icmp6hdr
));
568 net_dbg_ratelimited("icmp: len problem [%pI6c > %pI6c]\n",
569 &hdr
->saddr
, &hdr
->daddr
);
570 goto out_dst_release
;
574 idev
= __in6_dev_get(skb
->dev
);
576 if (ip6_append_data(sk
, icmpv6_getfrag
, &msg
,
577 len
+ sizeof(struct icmp6hdr
),
578 sizeof(struct icmp6hdr
),
579 &ipc6
, &fl6
, (struct rt6_info
*)dst
,
581 ICMP6_INC_STATS(net
, idev
, ICMP6_MIB_OUTERRORS
);
582 ip6_flush_pending_frames(sk
);
584 icmpv6_push_pending_frames(sk
, &fl6
, &tmp_hdr
,
585 len
+ sizeof(struct icmp6hdr
));
591 icmpv6_xmit_unlock(sk
);
596 /* Slightly more convenient version of icmp6_send.
598 void icmpv6_param_prob(struct sk_buff
*skb
, u8 code
, int pos
)
600 icmp6_send(skb
, ICMPV6_PARAMPROB
, code
, pos
, NULL
);
604 /* Generate icmpv6 with type/code ICMPV6_DEST_UNREACH/ICMPV6_ADDR_UNREACH
605 * if sufficient data bytes are available
606 * @nhs is the size of the tunnel header(s) :
607 * Either an IPv4 header for SIT encap
608 * an IPv4 header + GRE header for GRE encap
610 int ip6_err_gen_icmpv6_unreach(struct sk_buff
*skb
, int nhs
, int type
,
611 unsigned int data_len
)
613 struct in6_addr temp_saddr
;
615 struct sk_buff
*skb2
;
618 if (!pskb_may_pull(skb
, nhs
+ sizeof(struct ipv6hdr
) + 8))
621 /* RFC 4884 (partial) support for ICMP extensions */
622 if (data_len
< 128 || (data_len
& 7) || skb
->len
< data_len
)
625 skb2
= data_len
? skb_copy(skb
, GFP_ATOMIC
) : skb_clone(skb
, GFP_ATOMIC
);
632 skb_reset_network_header(skb2
);
634 rt
= rt6_lookup(dev_net(skb
->dev
), &ipv6_hdr(skb2
)->saddr
, NULL
, 0,
637 if (rt
&& rt
->dst
.dev
)
638 skb2
->dev
= rt
->dst
.dev
;
640 ipv6_addr_set_v4mapped(ip_hdr(skb
)->saddr
, &temp_saddr
);
643 /* RFC 4884 (partial) support :
644 * insert 0 padding at the end, before the extensions
646 __skb_push(skb2
, nhs
);
647 skb_reset_network_header(skb2
);
648 memmove(skb2
->data
, skb2
->data
+ nhs
, data_len
- nhs
);
649 memset(skb2
->data
+ data_len
- nhs
, 0, nhs
);
650 /* RFC 4884 4.5 : Length is measured in 64-bit words,
651 * and stored in reserved[0]
653 info
= (data_len
/8) << 24;
655 if (type
== ICMP_TIME_EXCEEDED
)
656 icmp6_send(skb2
, ICMPV6_TIME_EXCEED
, ICMPV6_EXC_HOPLIMIT
,
659 icmp6_send(skb2
, ICMPV6_DEST_UNREACH
, ICMPV6_ADDR_UNREACH
,
668 EXPORT_SYMBOL(ip6_err_gen_icmpv6_unreach
);
670 static void icmpv6_echo_reply(struct sk_buff
*skb
)
672 struct net
*net
= dev_net(skb
->dev
);
674 struct inet6_dev
*idev
;
675 struct ipv6_pinfo
*np
;
676 const struct in6_addr
*saddr
= NULL
;
677 struct icmp6hdr
*icmph
= icmp6_hdr(skb
);
678 struct icmp6hdr tmp_hdr
;
680 struct icmpv6_msg msg
;
681 struct dst_entry
*dst
;
682 struct ipcm6_cookie ipc6
;
683 u32 mark
= IP6_REPLY_MARK(net
, skb
->mark
);
685 saddr
= &ipv6_hdr(skb
)->daddr
;
687 if (!ipv6_unicast_destination(skb
) &&
688 !(net
->ipv6
.sysctl
.anycast_src_echo_reply
&&
689 ipv6_anycast_destination(skb_dst(skb
), saddr
)))
692 memcpy(&tmp_hdr
, icmph
, sizeof(tmp_hdr
));
693 tmp_hdr
.icmp6_type
= ICMPV6_ECHO_REPLY
;
695 memset(&fl6
, 0, sizeof(fl6
));
696 fl6
.flowi6_proto
= IPPROTO_ICMPV6
;
697 fl6
.daddr
= ipv6_hdr(skb
)->saddr
;
700 fl6
.flowi6_oif
= icmp6_iif(skb
);
701 fl6
.fl6_icmp_type
= ICMPV6_ECHO_REPLY
;
702 fl6
.flowi6_mark
= mark
;
703 fl6
.flowi6_uid
= sock_net_uid(net
, NULL
);
704 security_skb_classify_flow(skb
, flowi6_to_flowi(&fl6
));
707 sk
= icmpv6_xmit_lock(net
);
713 if (!fl6
.flowi6_oif
&& ipv6_addr_is_multicast(&fl6
.daddr
))
714 fl6
.flowi6_oif
= np
->mcast_oif
;
715 else if (!fl6
.flowi6_oif
)
716 fl6
.flowi6_oif
= np
->ucast_oif
;
718 if (ip6_dst_lookup(net
, sk
, &dst
, &fl6
))
720 dst
= xfrm_lookup(net
, dst
, flowi6_to_flowi(&fl6
), sk
, 0);
724 idev
= __in6_dev_get(skb
->dev
);
728 msg
.type
= ICMPV6_ECHO_REPLY
;
730 ipcm6_init_sk(&ipc6
, np
);
731 ipc6
.hlimit
= ip6_sk_dst_hoplimit(np
, &fl6
, dst
);
732 ipc6
.tclass
= ipv6_get_dsfield(ipv6_hdr(skb
));
734 if (ip6_append_data(sk
, icmpv6_getfrag
, &msg
,
735 skb
->len
+ sizeof(struct icmp6hdr
),
736 sizeof(struct icmp6hdr
), &ipc6
, &fl6
,
737 (struct rt6_info
*)dst
, MSG_DONTWAIT
)) {
738 __ICMP6_INC_STATS(net
, idev
, ICMP6_MIB_OUTERRORS
);
739 ip6_flush_pending_frames(sk
);
741 icmpv6_push_pending_frames(sk
, &fl6
, &tmp_hdr
,
742 skb
->len
+ sizeof(struct icmp6hdr
));
746 icmpv6_xmit_unlock(sk
);
751 void icmpv6_notify(struct sk_buff
*skb
, u8 type
, u8 code
, __be32 info
)
753 const struct inet6_protocol
*ipprot
;
757 struct net
*net
= dev_net(skb
->dev
);
759 if (!pskb_may_pull(skb
, sizeof(struct ipv6hdr
)))
762 nexthdr
= ((struct ipv6hdr
*)skb
->data
)->nexthdr
;
763 if (ipv6_ext_hdr(nexthdr
)) {
764 /* now skip over extension headers */
765 inner_offset
= ipv6_skip_exthdr(skb
, sizeof(struct ipv6hdr
),
766 &nexthdr
, &frag_off
);
767 if (inner_offset
< 0)
770 inner_offset
= sizeof(struct ipv6hdr
);
773 /* Checkin header including 8 bytes of inner protocol header. */
774 if (!pskb_may_pull(skb
, inner_offset
+8))
777 /* BUGGG_FUTURE: we should try to parse exthdrs in this packet.
778 Without this we will not able f.e. to make source routed
780 Corresponding argument (opt) to notifiers is already added.
784 ipprot
= rcu_dereference(inet6_protos
[nexthdr
]);
785 if (ipprot
&& ipprot
->err_handler
)
786 ipprot
->err_handler(skb
, NULL
, type
, code
, inner_offset
, info
);
788 raw6_icmp_error(skb
, nexthdr
, type
, code
, inner_offset
, info
);
792 __ICMP6_INC_STATS(net
, __in6_dev_get(skb
->dev
), ICMP6_MIB_INERRORS
);
796 * Handle icmp messages
799 static int icmpv6_rcv(struct sk_buff
*skb
)
801 struct net
*net
= dev_net(skb
->dev
);
802 struct net_device
*dev
= skb
->dev
;
803 struct inet6_dev
*idev
= __in6_dev_get(dev
);
804 const struct in6_addr
*saddr
, *daddr
;
805 struct icmp6hdr
*hdr
;
807 bool success
= false;
809 if (!xfrm6_policy_check(NULL
, XFRM_POLICY_IN
, skb
)) {
810 struct sec_path
*sp
= skb_sec_path(skb
);
813 if (!(sp
&& sp
->xvec
[sp
->len
- 1]->props
.flags
&
817 if (!pskb_may_pull(skb
, sizeof(*hdr
) + sizeof(struct ipv6hdr
)))
820 nh
= skb_network_offset(skb
);
821 skb_set_network_header(skb
, sizeof(*hdr
));
823 if (!xfrm6_policy_check_reverse(NULL
, XFRM_POLICY_IN
, skb
))
826 skb_set_network_header(skb
, nh
);
829 __ICMP6_INC_STATS(dev_net(dev
), idev
, ICMP6_MIB_INMSGS
);
831 saddr
= &ipv6_hdr(skb
)->saddr
;
832 daddr
= &ipv6_hdr(skb
)->daddr
;
834 if (skb_checksum_validate(skb
, IPPROTO_ICMPV6
, ip6_compute_pseudo
)) {
835 net_dbg_ratelimited("ICMPv6 checksum failed [%pI6c > %pI6c]\n",
840 if (!pskb_pull(skb
, sizeof(*hdr
)))
843 hdr
= icmp6_hdr(skb
);
845 type
= hdr
->icmp6_type
;
847 ICMP6MSGIN_INC_STATS(dev_net(dev
), idev
, type
);
850 case ICMPV6_ECHO_REQUEST
:
851 if (!net
->ipv6
.sysctl
.icmpv6_echo_ignore_all
)
852 icmpv6_echo_reply(skb
);
855 case ICMPV6_ECHO_REPLY
:
856 success
= ping_rcv(skb
);
859 case ICMPV6_PKT_TOOBIG
:
860 /* BUGGG_FUTURE: if packet contains rthdr, we cannot update
861 standard destination cache. Seems, only "advanced"
862 destination cache will allow to solve this problem
865 if (!pskb_may_pull(skb
, sizeof(struct ipv6hdr
)))
867 hdr
= icmp6_hdr(skb
);
871 case ICMPV6_DEST_UNREACH
:
872 case ICMPV6_TIME_EXCEED
:
873 case ICMPV6_PARAMPROB
:
874 icmpv6_notify(skb
, type
, hdr
->icmp6_code
, hdr
->icmp6_mtu
);
877 case NDISC_ROUTER_SOLICITATION
:
878 case NDISC_ROUTER_ADVERTISEMENT
:
879 case NDISC_NEIGHBOUR_SOLICITATION
:
880 case NDISC_NEIGHBOUR_ADVERTISEMENT
:
885 case ICMPV6_MGM_QUERY
:
886 igmp6_event_query(skb
);
889 case ICMPV6_MGM_REPORT
:
890 igmp6_event_report(skb
);
893 case ICMPV6_MGM_REDUCTION
:
894 case ICMPV6_NI_QUERY
:
895 case ICMPV6_NI_REPLY
:
896 case ICMPV6_MLD2_REPORT
:
897 case ICMPV6_DHAAD_REQUEST
:
898 case ICMPV6_DHAAD_REPLY
:
899 case ICMPV6_MOBILE_PREFIX_SOL
:
900 case ICMPV6_MOBILE_PREFIX_ADV
:
905 if (type
& ICMPV6_INFOMSG_MASK
)
908 net_dbg_ratelimited("icmpv6: msg of unknown type [%pI6c > %pI6c]\n",
912 * error of unknown type.
913 * must pass to upper level
916 icmpv6_notify(skb
, type
, hdr
->icmp6_code
, hdr
->icmp6_mtu
);
919 /* until the v6 path can be better sorted assume failure and
920 * preserve the status quo behaviour for the rest of the paths to here
930 __ICMP6_INC_STATS(dev_net(dev
), idev
, ICMP6_MIB_CSUMERRORS
);
932 __ICMP6_INC_STATS(dev_net(dev
), idev
, ICMP6_MIB_INERRORS
);
938 void icmpv6_flow_init(struct sock
*sk
, struct flowi6
*fl6
,
940 const struct in6_addr
*saddr
,
941 const struct in6_addr
*daddr
,
944 memset(fl6
, 0, sizeof(*fl6
));
947 fl6
->flowi6_proto
= IPPROTO_ICMPV6
;
948 fl6
->fl6_icmp_type
= type
;
949 fl6
->fl6_icmp_code
= 0;
950 fl6
->flowi6_oif
= oif
;
951 security_sk_classify_flow(sk
, flowi6_to_flowi(fl6
));
954 static int __net_init
icmpv6_sk_init(struct net
*net
)
960 kcalloc(nr_cpu_ids
, sizeof(struct sock
*), GFP_KERNEL
);
961 if (!net
->ipv6
.icmp_sk
)
964 for_each_possible_cpu(i
) {
965 err
= inet_ctl_sock_create(&sk
, PF_INET6
,
966 SOCK_RAW
, IPPROTO_ICMPV6
, net
);
968 pr_err("Failed to initialize the ICMP6 control socket (err %d)\n",
973 net
->ipv6
.icmp_sk
[i
] = sk
;
975 /* Enough space for 2 64K ICMP packets, including
976 * sk_buff struct overhead.
978 sk
->sk_sndbuf
= 2 * SKB_TRUESIZE(64 * 1024);
983 for (j
= 0; j
< i
; j
++)
984 inet_ctl_sock_destroy(net
->ipv6
.icmp_sk
[j
]);
985 kfree(net
->ipv6
.icmp_sk
);
989 static void __net_exit
icmpv6_sk_exit(struct net
*net
)
993 for_each_possible_cpu(i
) {
994 inet_ctl_sock_destroy(net
->ipv6
.icmp_sk
[i
]);
996 kfree(net
->ipv6
.icmp_sk
);
999 static struct pernet_operations icmpv6_sk_ops
= {
1000 .init
= icmpv6_sk_init
,
1001 .exit
= icmpv6_sk_exit
,
1004 int __init
icmpv6_init(void)
1008 err
= register_pernet_subsys(&icmpv6_sk_ops
);
1013 if (inet6_add_protocol(&icmpv6_protocol
, IPPROTO_ICMPV6
) < 0)
1016 err
= inet6_register_icmp_sender(icmp6_send
);
1018 goto sender_reg_err
;
1022 inet6_del_protocol(&icmpv6_protocol
, IPPROTO_ICMPV6
);
1024 pr_err("Failed to register ICMP6 protocol\n");
1025 unregister_pernet_subsys(&icmpv6_sk_ops
);
1029 void icmpv6_cleanup(void)
1031 inet6_unregister_icmp_sender(icmp6_send
);
1032 unregister_pernet_subsys(&icmpv6_sk_ops
);
1033 inet6_del_protocol(&icmpv6_protocol
, IPPROTO_ICMPV6
);
1037 static const struct icmp6_err
{
1045 { /* ADM_PROHIBITED */
1049 { /* Was NOT_NEIGHBOUR, now reserved */
1050 .err
= EHOSTUNREACH
,
1053 { /* ADDR_UNREACH */
1054 .err
= EHOSTUNREACH
,
1057 { /* PORT_UNREACH */
1058 .err
= ECONNREFUSED
,
1065 { /* REJECT_ROUTE */
1071 int icmpv6_err_convert(u8 type
, u8 code
, int *err
)
1078 case ICMPV6_DEST_UNREACH
:
1080 if (code
< ARRAY_SIZE(tab_unreach
)) {
1081 *err
= tab_unreach
[code
].err
;
1082 fatal
= tab_unreach
[code
].fatal
;
1086 case ICMPV6_PKT_TOOBIG
:
1090 case ICMPV6_PARAMPROB
:
1095 case ICMPV6_TIME_EXCEED
:
1096 *err
= EHOSTUNREACH
;
1102 EXPORT_SYMBOL(icmpv6_err_convert
);
1104 #ifdef CONFIG_SYSCTL
1105 static struct ctl_table ipv6_icmp_table_template
[] = {
1107 .procname
= "ratelimit",
1108 .data
= &init_net
.ipv6
.sysctl
.icmpv6_time
,
1109 .maxlen
= sizeof(int),
1111 .proc_handler
= proc_dointvec_ms_jiffies
,
1114 .procname
= "echo_ignore_all",
1115 .data
= &init_net
.ipv6
.sysctl
.icmpv6_echo_ignore_all
,
1116 .maxlen
= sizeof(int),
1118 .proc_handler
= proc_dointvec
,
1123 struct ctl_table
* __net_init
ipv6_icmp_sysctl_init(struct net
*net
)
1125 struct ctl_table
*table
;
1127 table
= kmemdup(ipv6_icmp_table_template
,
1128 sizeof(ipv6_icmp_table_template
),
1132 table
[0].data
= &net
->ipv6
.sysctl
.icmpv6_time
;
1133 table
[1].data
= &net
->ipv6
.sysctl
.icmpv6_echo_ignore_all
;