mm-only debug patch...
[mmotm.git] / net / ipv6 / icmp.c
blobf23ebbec0631792407f6ea82827a572027050401
1 /*
2 * Internet Control Message Protocol (ICMPv6)
3 * Linux INET6 implementation
5 * Authors:
6 * Pedro Roque <roque@di.fc.ul.pt>
8 * Based on net/ipv4/icmp.c
10 * RFC 1885
12 * This program is free software; you can redistribute it and/or
13 * modify it under the terms of the GNU General Public License
14 * as published by the Free Software Foundation; either version
15 * 2 of the License, or (at your option) any later version.
19 * Changes:
21 * Andi Kleen : exception handling
22 * Andi Kleen add rate limits. never reply to a icmp.
23 * add more length checks and other fixes.
24 * yoshfuji : ensure to sent parameter problem for
25 * fragments.
26 * YOSHIFUJI Hideaki @USAGI: added sysctl for icmp rate limit.
27 * Randy Dunlap and
28 * YOSHIFUJI Hideaki @USAGI: Per-interface statistics support
29 * Kazunori MIYAZAWA @USAGI: change output process to use ip6_append_data
32 #include <linux/module.h>
33 #include <linux/errno.h>
34 #include <linux/types.h>
35 #include <linux/socket.h>
36 #include <linux/in.h>
37 #include <linux/kernel.h>
38 #include <linux/sockios.h>
39 #include <linux/net.h>
40 #include <linux/skbuff.h>
41 #include <linux/init.h>
42 #include <linux/netfilter.h>
44 #ifdef CONFIG_SYSCTL
45 #include <linux/sysctl.h>
46 #endif
48 #include <linux/inet.h>
49 #include <linux/netdevice.h>
50 #include <linux/icmpv6.h>
52 #include <net/ip.h>
53 #include <net/sock.h>
55 #include <net/ipv6.h>
56 #include <net/ip6_checksum.h>
57 #include <net/protocol.h>
58 #include <net/raw.h>
59 #include <net/rawv6.h>
60 #include <net/transp_v6.h>
61 #include <net/ip6_route.h>
62 #include <net/addrconf.h>
63 #include <net/icmp.h>
64 #include <net/xfrm.h>
65 #include <net/inet_common.h>
67 #include <asm/uaccess.h>
68 #include <asm/system.h>
70 DEFINE_SNMP_STAT(struct icmpv6_mib, icmpv6_statistics) __read_mostly;
71 EXPORT_SYMBOL(icmpv6_statistics);
72 DEFINE_SNMP_STAT(struct icmpv6msg_mib, icmpv6msg_statistics) __read_mostly;
73 EXPORT_SYMBOL(icmpv6msg_statistics);
76 * The ICMP socket(s). This is the most convenient way to flow control
77 * our ICMP output as well as maintain a clean interface throughout
78 * all layers. All Socketless IP sends will soon be gone.
80 * On SMP we have one ICMP socket per-cpu.
82 static inline struct sock *icmpv6_sk(struct net *net)
84 return net->ipv6.icmp_sk[smp_processor_id()];
87 static int icmpv6_rcv(struct sk_buff *skb);
89 static const struct inet6_protocol icmpv6_protocol = {
90 .handler = icmpv6_rcv,
91 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
94 static __inline__ struct sock *icmpv6_xmit_lock(struct net *net)
96 struct sock *sk;
98 local_bh_disable();
100 sk = icmpv6_sk(net);
101 if (unlikely(!spin_trylock(&sk->sk_lock.slock))) {
102 /* This can happen if the output path (f.e. SIT or
103 * ip6ip6 tunnel) signals dst_link_failure() for an
104 * outgoing ICMP6 packet.
106 local_bh_enable();
107 return NULL;
109 return sk;
112 static __inline__ void icmpv6_xmit_unlock(struct sock *sk)
114 spin_unlock_bh(&sk->sk_lock.slock);
118 * Slightly more convenient version of icmpv6_send.
120 void icmpv6_param_prob(struct sk_buff *skb, u8 code, int pos)
122 icmpv6_send(skb, ICMPV6_PARAMPROB, code, pos, skb->dev);
123 kfree_skb(skb);
127 * Figure out, may we reply to this packet with icmp error.
129 * We do not reply, if:
130 * - it was icmp error message.
131 * - it is truncated, so that it is known, that protocol is ICMPV6
132 * (i.e. in the middle of some exthdr)
134 * --ANK (980726)
137 static int is_ineligible(struct sk_buff *skb)
139 int ptr = (u8 *)(ipv6_hdr(skb) + 1) - skb->data;
140 int len = skb->len - ptr;
141 __u8 nexthdr = ipv6_hdr(skb)->nexthdr;
143 if (len < 0)
144 return 1;
146 ptr = ipv6_skip_exthdr(skb, ptr, &nexthdr);
147 if (ptr < 0)
148 return 0;
149 if (nexthdr == IPPROTO_ICMPV6) {
150 u8 _type, *tp;
151 tp = skb_header_pointer(skb,
152 ptr+offsetof(struct icmp6hdr, icmp6_type),
153 sizeof(_type), &_type);
154 if (tp == NULL ||
155 !(*tp & ICMPV6_INFOMSG_MASK))
156 return 1;
158 return 0;
162 * Check the ICMP output rate limit
164 static inline int icmpv6_xrlim_allow(struct sock *sk, u8 type,
165 struct flowi *fl)
167 struct dst_entry *dst;
168 struct net *net = sock_net(sk);
169 int res = 0;
171 /* Informational messages are not limited. */
172 if (type & ICMPV6_INFOMSG_MASK)
173 return 1;
175 /* Do not limit pmtu discovery, it would break it. */
176 if (type == ICMPV6_PKT_TOOBIG)
177 return 1;
180 * Look up the output route.
181 * XXX: perhaps the expire for routing entries cloned by
182 * this lookup should be more aggressive (not longer than timeout).
184 dst = ip6_route_output(net, sk, fl);
185 if (dst->error) {
186 IP6_INC_STATS(net, ip6_dst_idev(dst),
187 IPSTATS_MIB_OUTNOROUTES);
188 } else if (dst->dev && (dst->dev->flags&IFF_LOOPBACK)) {
189 res = 1;
190 } else {
191 struct rt6_info *rt = (struct rt6_info *)dst;
192 int tmo = net->ipv6.sysctl.icmpv6_time;
194 /* Give more bandwidth to wider prefixes. */
195 if (rt->rt6i_dst.plen < 128)
196 tmo >>= ((128 - rt->rt6i_dst.plen)>>5);
198 res = xrlim_allow(dst, tmo);
200 dst_release(dst);
201 return res;
205 * an inline helper for the "simple" if statement below
206 * checks if parameter problem report is caused by an
207 * unrecognized IPv6 option that has the Option Type
208 * highest-order two bits set to 10
211 static __inline__ int opt_unrec(struct sk_buff *skb, __u32 offset)
213 u8 _optval, *op;
215 offset += skb_network_offset(skb);
216 op = skb_header_pointer(skb, offset, sizeof(_optval), &_optval);
217 if (op == NULL)
218 return 1;
219 return (*op & 0xC0) == 0x80;
222 static int icmpv6_push_pending_frames(struct sock *sk, struct flowi *fl, struct icmp6hdr *thdr, int len)
224 struct sk_buff *skb;
225 struct icmp6hdr *icmp6h;
226 int err = 0;
228 if ((skb = skb_peek(&sk->sk_write_queue)) == NULL)
229 goto out;
231 icmp6h = icmp6_hdr(skb);
232 memcpy(icmp6h, thdr, sizeof(struct icmp6hdr));
233 icmp6h->icmp6_cksum = 0;
235 if (skb_queue_len(&sk->sk_write_queue) == 1) {
236 skb->csum = csum_partial(icmp6h,
237 sizeof(struct icmp6hdr), skb->csum);
238 icmp6h->icmp6_cksum = csum_ipv6_magic(&fl->fl6_src,
239 &fl->fl6_dst,
240 len, fl->proto,
241 skb->csum);
242 } else {
243 __wsum tmp_csum = 0;
245 skb_queue_walk(&sk->sk_write_queue, skb) {
246 tmp_csum = csum_add(tmp_csum, skb->csum);
249 tmp_csum = csum_partial(icmp6h,
250 sizeof(struct icmp6hdr), tmp_csum);
251 icmp6h->icmp6_cksum = csum_ipv6_magic(&fl->fl6_src,
252 &fl->fl6_dst,
253 len, fl->proto,
254 tmp_csum);
256 ip6_push_pending_frames(sk);
257 out:
258 return err;
/* Copy-source description handed to icmpv6_getfrag() as its @from argument. */
struct icmpv6_msg {
	struct sk_buff	*skb;		/* packet the payload bytes are copied from */
	int		offset;		/* base offset into skb where copying starts */
	uint8_t		type;		/* ICMPv6 type of the message being built */
};
267 static int icmpv6_getfrag(void *from, char *to, int offset, int len, int odd, struct sk_buff *skb)
269 struct icmpv6_msg *msg = (struct icmpv6_msg *) from;
270 struct sk_buff *org_skb = msg->skb;
271 __wsum csum = 0;
273 csum = skb_copy_and_csum_bits(org_skb, msg->offset + offset,
274 to, len, csum);
275 skb->csum = csum_block_add(skb->csum, csum, odd);
276 if (!(msg->type & ICMPV6_INFOMSG_MASK))
277 nf_ct_attach(skb, org_skb);
278 return 0;
#if defined(CONFIG_IPV6_MIP6) || defined(CONFIG_IPV6_MIP6_MODULE)
/*
 * If the packet has a recorded Home Address option (IP6CB(skb)->dsthao),
 * exchange the IPv6 source address with the address stored in that
 * option.  Does nothing when there is no such option or it is not found.
 */
static void mip6_addr_swap(struct sk_buff *skb)
{
	struct inet6_skb_parm *cb = IP6CB(skb);
	struct ipv6hdr *ip6h = ipv6_hdr(skb);
	struct ipv6_destopt_hao *hao;
	struct in6_addr saved;
	int tlv_off;

	if (!cb->dsthao)
		return;

	tlv_off = ipv6_find_tlv(skb, cb->dsthao, IPV6_TLV_HAO);
	if (unlikely(tlv_off < 0))
		return;

	hao = (struct ipv6_destopt_hao *)(skb_network_header(skb) + tlv_off);

	ipv6_addr_copy(&saved, &ip6h->saddr);
	ipv6_addr_copy(&ip6h->saddr, &hao->addr);
	ipv6_addr_copy(&hao->addr, &saved);
}
#else
/* Without Mobile IPv6 support there is nothing to swap. */
static inline void mip6_addr_swap(struct sk_buff *skb) {}
#endif
306 * Send an ICMP message in response to a packet in error
308 void icmpv6_send(struct sk_buff *skb, u8 type, u8 code, __u32 info,
309 struct net_device *dev)
311 struct net *net = dev_net(skb->dev);
312 struct inet6_dev *idev = NULL;
313 struct ipv6hdr *hdr = ipv6_hdr(skb);
314 struct sock *sk;
315 struct ipv6_pinfo *np;
316 struct in6_addr *saddr = NULL;
317 struct dst_entry *dst;
318 struct dst_entry *dst2;
319 struct icmp6hdr tmp_hdr;
320 struct flowi fl;
321 struct flowi fl2;
322 struct icmpv6_msg msg;
323 int iif = 0;
324 int addr_type = 0;
325 int len;
326 int hlimit;
327 int err = 0;
329 if ((u8 *)hdr < skb->head ||
330 (skb->network_header + sizeof(*hdr)) > skb->tail)
331 return;
334 * Make sure we respect the rules
335 * i.e. RFC 1885 2.4(e)
336 * Rule (e.1) is enforced by not using icmpv6_send
337 * in any code that processes icmp errors.
339 addr_type = ipv6_addr_type(&hdr->daddr);
341 if (ipv6_chk_addr(net, &hdr->daddr, skb->dev, 0))
342 saddr = &hdr->daddr;
345 * Dest addr check
348 if ((addr_type & IPV6_ADDR_MULTICAST || skb->pkt_type != PACKET_HOST)) {
349 if (type != ICMPV6_PKT_TOOBIG &&
350 !(type == ICMPV6_PARAMPROB &&
351 code == ICMPV6_UNK_OPTION &&
352 (opt_unrec(skb, info))))
353 return;
355 saddr = NULL;
358 addr_type = ipv6_addr_type(&hdr->saddr);
361 * Source addr check
364 if (addr_type & IPV6_ADDR_LINKLOCAL)
365 iif = skb->dev->ifindex;
368 * Must not send error if the source does not uniquely
369 * identify a single node (RFC2463 Section 2.4).
370 * We check unspecified / multicast addresses here,
371 * and anycast addresses will be checked later.
373 if ((addr_type == IPV6_ADDR_ANY) || (addr_type & IPV6_ADDR_MULTICAST)) {
374 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: addr_any/mcast source\n");
375 return;
379 * Never answer to a ICMP packet.
381 if (is_ineligible(skb)) {
382 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: no reply to icmp error\n");
383 return;
386 mip6_addr_swap(skb);
388 memset(&fl, 0, sizeof(fl));
389 fl.proto = IPPROTO_ICMPV6;
390 ipv6_addr_copy(&fl.fl6_dst, &hdr->saddr);
391 if (saddr)
392 ipv6_addr_copy(&fl.fl6_src, saddr);
393 fl.oif = iif;
394 fl.fl_icmp_type = type;
395 fl.fl_icmp_code = code;
396 security_skb_classify_flow(skb, &fl);
398 sk = icmpv6_xmit_lock(net);
399 if (sk == NULL)
400 return;
401 np = inet6_sk(sk);
403 if (!icmpv6_xrlim_allow(sk, type, &fl))
404 goto out;
406 tmp_hdr.icmp6_type = type;
407 tmp_hdr.icmp6_code = code;
408 tmp_hdr.icmp6_cksum = 0;
409 tmp_hdr.icmp6_pointer = htonl(info);
411 if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
412 fl.oif = np->mcast_oif;
414 err = ip6_dst_lookup(sk, &dst, &fl);
415 if (err)
416 goto out;
419 * We won't send icmp if the destination is known
420 * anycast.
422 if (((struct rt6_info *)dst)->rt6i_flags & RTF_ANYCAST) {
423 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: acast source\n");
424 goto out_dst_release;
427 /* No need to clone since we're just using its address. */
428 dst2 = dst;
430 err = xfrm_lookup(net, &dst, &fl, sk, 0);
431 switch (err) {
432 case 0:
433 if (dst != dst2)
434 goto route_done;
435 break;
436 case -EPERM:
437 dst = NULL;
438 break;
439 default:
440 goto out;
443 if (xfrm_decode_session_reverse(skb, &fl2, AF_INET6))
444 goto relookup_failed;
446 if (ip6_dst_lookup(sk, &dst2, &fl2))
447 goto relookup_failed;
449 err = xfrm_lookup(net, &dst2, &fl2, sk, XFRM_LOOKUP_ICMP);
450 switch (err) {
451 case 0:
452 dst_release(dst);
453 dst = dst2;
454 break;
455 case -EPERM:
456 goto out_dst_release;
457 default:
458 relookup_failed:
459 if (!dst)
460 goto out;
461 break;
464 route_done:
465 if (ipv6_addr_is_multicast(&fl.fl6_dst))
466 hlimit = np->mcast_hops;
467 else
468 hlimit = np->hop_limit;
469 if (hlimit < 0)
470 hlimit = ip6_dst_hoplimit(dst);
472 msg.skb = skb;
473 msg.offset = skb_network_offset(skb);
474 msg.type = type;
476 len = skb->len - msg.offset;
477 len = min_t(unsigned int, len, IPV6_MIN_MTU - sizeof(struct ipv6hdr) -sizeof(struct icmp6hdr));
478 if (len < 0) {
479 LIMIT_NETDEBUG(KERN_DEBUG "icmp: len problem\n");
480 goto out_dst_release;
483 idev = in6_dev_get(skb->dev);
485 err = ip6_append_data(sk, icmpv6_getfrag, &msg,
486 len + sizeof(struct icmp6hdr),
487 sizeof(struct icmp6hdr), hlimit,
488 np->tclass, NULL, &fl, (struct rt6_info*)dst,
489 MSG_DONTWAIT);
490 if (err) {
491 ip6_flush_pending_frames(sk);
492 goto out_put;
494 err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, len + sizeof(struct icmp6hdr));
496 out_put:
497 if (likely(idev != NULL))
498 in6_dev_put(idev);
499 out_dst_release:
500 dst_release(dst);
501 out:
502 icmpv6_xmit_unlock(sk);
505 EXPORT_SYMBOL(icmpv6_send);
507 static void icmpv6_echo_reply(struct sk_buff *skb)
509 struct net *net = dev_net(skb->dev);
510 struct sock *sk;
511 struct inet6_dev *idev;
512 struct ipv6_pinfo *np;
513 struct in6_addr *saddr = NULL;
514 struct icmp6hdr *icmph = icmp6_hdr(skb);
515 struct icmp6hdr tmp_hdr;
516 struct flowi fl;
517 struct icmpv6_msg msg;
518 struct dst_entry *dst;
519 int err = 0;
520 int hlimit;
522 saddr = &ipv6_hdr(skb)->daddr;
524 if (!ipv6_unicast_destination(skb))
525 saddr = NULL;
527 memcpy(&tmp_hdr, icmph, sizeof(tmp_hdr));
528 tmp_hdr.icmp6_type = ICMPV6_ECHO_REPLY;
530 memset(&fl, 0, sizeof(fl));
531 fl.proto = IPPROTO_ICMPV6;
532 ipv6_addr_copy(&fl.fl6_dst, &ipv6_hdr(skb)->saddr);
533 if (saddr)
534 ipv6_addr_copy(&fl.fl6_src, saddr);
535 fl.oif = skb->dev->ifindex;
536 fl.fl_icmp_type = ICMPV6_ECHO_REPLY;
537 security_skb_classify_flow(skb, &fl);
539 sk = icmpv6_xmit_lock(net);
540 if (sk == NULL)
541 return;
542 np = inet6_sk(sk);
544 if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
545 fl.oif = np->mcast_oif;
547 err = ip6_dst_lookup(sk, &dst, &fl);
548 if (err)
549 goto out;
550 if ((err = xfrm_lookup(net, &dst, &fl, sk, 0)) < 0)
551 goto out;
553 if (ipv6_addr_is_multicast(&fl.fl6_dst))
554 hlimit = np->mcast_hops;
555 else
556 hlimit = np->hop_limit;
557 if (hlimit < 0)
558 hlimit = ip6_dst_hoplimit(dst);
560 idev = in6_dev_get(skb->dev);
562 msg.skb = skb;
563 msg.offset = 0;
564 msg.type = ICMPV6_ECHO_REPLY;
566 err = ip6_append_data(sk, icmpv6_getfrag, &msg, skb->len + sizeof(struct icmp6hdr),
567 sizeof(struct icmp6hdr), hlimit, np->tclass, NULL, &fl,
568 (struct rt6_info*)dst, MSG_DONTWAIT);
570 if (err) {
571 ip6_flush_pending_frames(sk);
572 goto out_put;
574 err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, skb->len + sizeof(struct icmp6hdr));
576 out_put:
577 if (likely(idev != NULL))
578 in6_dev_put(idev);
579 dst_release(dst);
580 out:
581 icmpv6_xmit_unlock(sk);
584 static void icmpv6_notify(struct sk_buff *skb, u8 type, u8 code, __be32 info)
586 const struct inet6_protocol *ipprot;
587 int inner_offset;
588 int hash;
589 u8 nexthdr;
591 if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
592 return;
594 nexthdr = ((struct ipv6hdr *)skb->data)->nexthdr;
595 if (ipv6_ext_hdr(nexthdr)) {
596 /* now skip over extension headers */
597 inner_offset = ipv6_skip_exthdr(skb, sizeof(struct ipv6hdr), &nexthdr);
598 if (inner_offset<0)
599 return;
600 } else {
601 inner_offset = sizeof(struct ipv6hdr);
604 /* Checkin header including 8 bytes of inner protocol header. */
605 if (!pskb_may_pull(skb, inner_offset+8))
606 return;
608 /* BUGGG_FUTURE: we should try to parse exthdrs in this packet.
609 Without this we will not able f.e. to make source routed
610 pmtu discovery.
611 Corresponding argument (opt) to notifiers is already added.
612 --ANK (980726)
615 hash = nexthdr & (MAX_INET_PROTOS - 1);
617 rcu_read_lock();
618 ipprot = rcu_dereference(inet6_protos[hash]);
619 if (ipprot && ipprot->err_handler)
620 ipprot->err_handler(skb, NULL, type, code, inner_offset, info);
621 rcu_read_unlock();
623 raw6_icmp_error(skb, nexthdr, type, code, inner_offset, info);
627 * Handle icmp messages
630 static int icmpv6_rcv(struct sk_buff *skb)
632 struct net_device *dev = skb->dev;
633 struct inet6_dev *idev = __in6_dev_get(dev);
634 struct in6_addr *saddr, *daddr;
635 struct ipv6hdr *orig_hdr;
636 struct icmp6hdr *hdr;
637 u8 type;
639 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
640 struct sec_path *sp = skb_sec_path(skb);
641 int nh;
643 if (!(sp && sp->xvec[sp->len - 1]->props.flags &
644 XFRM_STATE_ICMP))
645 goto drop_no_count;
647 if (!pskb_may_pull(skb, sizeof(*hdr) + sizeof(*orig_hdr)))
648 goto drop_no_count;
650 nh = skb_network_offset(skb);
651 skb_set_network_header(skb, sizeof(*hdr));
653 if (!xfrm6_policy_check_reverse(NULL, XFRM_POLICY_IN, skb))
654 goto drop_no_count;
656 skb_set_network_header(skb, nh);
659 ICMP6_INC_STATS_BH(dev_net(dev), idev, ICMP6_MIB_INMSGS);
661 saddr = &ipv6_hdr(skb)->saddr;
662 daddr = &ipv6_hdr(skb)->daddr;
664 /* Perform checksum. */
665 switch (skb->ip_summed) {
666 case CHECKSUM_COMPLETE:
667 if (!csum_ipv6_magic(saddr, daddr, skb->len, IPPROTO_ICMPV6,
668 skb->csum))
669 break;
670 /* fall through */
671 case CHECKSUM_NONE:
672 skb->csum = ~csum_unfold(csum_ipv6_magic(saddr, daddr, skb->len,
673 IPPROTO_ICMPV6, 0));
674 if (__skb_checksum_complete(skb)) {
675 LIMIT_NETDEBUG(KERN_DEBUG "ICMPv6 checksum failed [%pI6 > %pI6]\n",
676 saddr, daddr);
677 goto discard_it;
681 if (!pskb_pull(skb, sizeof(*hdr)))
682 goto discard_it;
684 hdr = icmp6_hdr(skb);
686 type = hdr->icmp6_type;
688 ICMP6MSGIN_INC_STATS_BH(dev_net(dev), idev, type);
690 switch (type) {
691 case ICMPV6_ECHO_REQUEST:
692 icmpv6_echo_reply(skb);
693 break;
695 case ICMPV6_ECHO_REPLY:
696 /* we couldn't care less */
697 break;
699 case ICMPV6_PKT_TOOBIG:
700 /* BUGGG_FUTURE: if packet contains rthdr, we cannot update
701 standard destination cache. Seems, only "advanced"
702 destination cache will allow to solve this problem
703 --ANK (980726)
705 if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
706 goto discard_it;
707 hdr = icmp6_hdr(skb);
708 orig_hdr = (struct ipv6hdr *) (hdr + 1);
709 rt6_pmtu_discovery(&orig_hdr->daddr, &orig_hdr->saddr, dev,
710 ntohl(hdr->icmp6_mtu));
713 * Drop through to notify
716 case ICMPV6_DEST_UNREACH:
717 case ICMPV6_TIME_EXCEED:
718 case ICMPV6_PARAMPROB:
719 icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
720 break;
722 case NDISC_ROUTER_SOLICITATION:
723 case NDISC_ROUTER_ADVERTISEMENT:
724 case NDISC_NEIGHBOUR_SOLICITATION:
725 case NDISC_NEIGHBOUR_ADVERTISEMENT:
726 case NDISC_REDIRECT:
727 ndisc_rcv(skb);
728 break;
730 case ICMPV6_MGM_QUERY:
731 igmp6_event_query(skb);
732 break;
734 case ICMPV6_MGM_REPORT:
735 igmp6_event_report(skb);
736 break;
738 case ICMPV6_MGM_REDUCTION:
739 case ICMPV6_NI_QUERY:
740 case ICMPV6_NI_REPLY:
741 case ICMPV6_MLD2_REPORT:
742 case ICMPV6_DHAAD_REQUEST:
743 case ICMPV6_DHAAD_REPLY:
744 case ICMPV6_MOBILE_PREFIX_SOL:
745 case ICMPV6_MOBILE_PREFIX_ADV:
746 break;
748 default:
749 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6: msg of unknown type\n");
751 /* informational */
752 if (type & ICMPV6_INFOMSG_MASK)
753 break;
756 * error of unknown type.
757 * must pass to upper level
760 icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
763 kfree_skb(skb);
764 return 0;
766 discard_it:
767 ICMP6_INC_STATS_BH(dev_net(dev), idev, ICMP6_MIB_INERRORS);
768 drop_no_count:
769 kfree_skb(skb);
770 return 0;
773 void icmpv6_flow_init(struct sock *sk, struct flowi *fl,
774 u8 type,
775 const struct in6_addr *saddr,
776 const struct in6_addr *daddr,
777 int oif)
779 memset(fl, 0, sizeof(*fl));
780 ipv6_addr_copy(&fl->fl6_src, saddr);
781 ipv6_addr_copy(&fl->fl6_dst, daddr);
782 fl->proto = IPPROTO_ICMPV6;
783 fl->fl_icmp_type = type;
784 fl->fl_icmp_code = 0;
785 fl->oif = oif;
786 security_sk_classify_flow(sk, fl);
790 * Special lock-class for __icmpv6_sk:
792 static struct lock_class_key icmpv6_socket_sk_dst_lock_key;
794 static int __net_init icmpv6_sk_init(struct net *net)
796 struct sock *sk;
797 int err, i, j;
799 net->ipv6.icmp_sk =
800 kzalloc(nr_cpu_ids * sizeof(struct sock *), GFP_KERNEL);
801 if (net->ipv6.icmp_sk == NULL)
802 return -ENOMEM;
804 for_each_possible_cpu(i) {
805 err = inet_ctl_sock_create(&sk, PF_INET6,
806 SOCK_RAW, IPPROTO_ICMPV6, net);
807 if (err < 0) {
808 printk(KERN_ERR
809 "Failed to initialize the ICMP6 control socket "
810 "(err %d).\n",
811 err);
812 goto fail;
815 net->ipv6.icmp_sk[i] = sk;
818 * Split off their lock-class, because sk->sk_dst_lock
819 * gets used from softirqs, which is safe for
820 * __icmpv6_sk (because those never get directly used
821 * via userspace syscalls), but unsafe for normal sockets.
823 lockdep_set_class(&sk->sk_dst_lock,
824 &icmpv6_socket_sk_dst_lock_key);
826 /* Enough space for 2 64K ICMP packets, including
827 * sk_buff struct overhead.
829 sk->sk_sndbuf =
830 (2 * ((64 * 1024) + sizeof(struct sk_buff)));
832 return 0;
834 fail:
835 for (j = 0; j < i; j++)
836 inet_ctl_sock_destroy(net->ipv6.icmp_sk[j]);
837 kfree(net->ipv6.icmp_sk);
838 return err;
841 static void __net_exit icmpv6_sk_exit(struct net *net)
843 int i;
845 for_each_possible_cpu(i) {
846 inet_ctl_sock_destroy(net->ipv6.icmp_sk[i]);
848 kfree(net->ipv6.icmp_sk);
851 static struct pernet_operations icmpv6_sk_ops = {
852 .init = icmpv6_sk_init,
853 .exit = icmpv6_sk_exit,
856 int __init icmpv6_init(void)
858 int err;
860 err = register_pernet_subsys(&icmpv6_sk_ops);
861 if (err < 0)
862 return err;
864 err = -EAGAIN;
865 if (inet6_add_protocol(&icmpv6_protocol, IPPROTO_ICMPV6) < 0)
866 goto fail;
867 return 0;
869 fail:
870 printk(KERN_ERR "Failed to register ICMP6 protocol\n");
871 unregister_pernet_subsys(&icmpv6_sk_ops);
872 return err;
875 void icmpv6_cleanup(void)
877 unregister_pernet_subsys(&icmpv6_sk_ops);
878 inet6_del_protocol(&icmpv6_protocol, IPPROTO_ICMPV6);
/*
 * Destination Unreachable translation table, indexed by ICMPv6 code:
 * the errno to report and whether the error is fatal.  Used by
 * icmpv6_err_convert() for codes up to ICMPV6_PORT_UNREACH.
 */
static const struct icmp6_err {
	int err;
	int fatal;
} tab_unreach[] = {
	{ ENETUNREACH,	0 },	/* NOROUTE */
	{ EACCES,	1 },	/* ADM_PROHIBITED */
	{ EHOSTUNREACH,	0 },	/* Was NOT_NEIGHBOUR, now reserved */
	{ EHOSTUNREACH,	0 },	/* ADDR_UNREACH */
	{ ECONNREFUSED,	1 },	/* PORT_UNREACH */
};
908 int icmpv6_err_convert(u8 type, u8 code, int *err)
910 int fatal = 0;
912 *err = EPROTO;
914 switch (type) {
915 case ICMPV6_DEST_UNREACH:
916 fatal = 1;
917 if (code <= ICMPV6_PORT_UNREACH) {
918 *err = tab_unreach[code].err;
919 fatal = tab_unreach[code].fatal;
921 break;
923 case ICMPV6_PKT_TOOBIG:
924 *err = EMSGSIZE;
925 break;
927 case ICMPV6_PARAMPROB:
928 *err = EPROTO;
929 fatal = 1;
930 break;
932 case ICMPV6_TIME_EXCEED:
933 *err = EHOSTUNREACH;
934 break;
937 return fatal;
940 EXPORT_SYMBOL(icmpv6_err_convert);
942 #ifdef CONFIG_SYSCTL
943 ctl_table ipv6_icmp_table_template[] = {
945 .ctl_name = NET_IPV6_ICMP_RATELIMIT,
946 .procname = "ratelimit",
947 .data = &init_net.ipv6.sysctl.icmpv6_time,
948 .maxlen = sizeof(int),
949 .mode = 0644,
950 .proc_handler = proc_dointvec_ms_jiffies,
951 .strategy = sysctl_ms_jiffies
953 { .ctl_name = 0 },
956 struct ctl_table *ipv6_icmp_sysctl_init(struct net *net)
958 struct ctl_table *table;
960 table = kmemdup(ipv6_icmp_table_template,
961 sizeof(ipv6_icmp_table_template),
962 GFP_KERNEL);
964 if (table)
965 table[0].data = &net->ipv6.sysctl.icmpv6_time;
967 return table;
969 #endif