1 // SPDX-License-Identifier: GPL-2.0-or-later
3 * Neighbour Discovery for IPv6
4 * Linux INET6 implementation
7 * Pedro Roque <roque@di.fc.ul.pt>
8 * Mike Shaver <shaver@ingenia.com>
14 * Alexey I. Froloff : RFC6106 (DNSSL) support
15 * Pierre Ynard : export userland ND options
16 * through netlink (RDNSS support)
17 * Lars Fenneberg : fixed MTU setting on receipt
19 * Janos Farkas : kmalloc failure checks
20 * Alexey Kuznetsov : state machine reworked
21 * and moved to net/core.
22 * Pekka Savola : RFC2461 validation
23 * YOSHIFUJI Hideaki @USAGI : Verify ND options properly
26 #define pr_fmt(fmt) "ICMPv6: " fmt
28 #include <linux/module.h>
29 #include <linux/errno.h>
30 #include <linux/types.h>
31 #include <linux/socket.h>
32 #include <linux/sockios.h>
33 #include <linux/sched.h>
34 #include <linux/net.h>
35 #include <linux/in6.h>
36 #include <linux/route.h>
37 #include <linux/init.h>
38 #include <linux/rcupdate.h>
39 #include <linux/slab.h>
41 #include <linux/sysctl.h>
44 #include <linux/if_addr.h>
45 #include <linux/if_ether.h>
46 #include <linux/if_arp.h>
47 #include <linux/ipv6.h>
48 #include <linux/icmpv6.h>
49 #include <linux/jhash.h>
55 #include <net/protocol.h>
56 #include <net/ndisc.h>
57 #include <net/ip6_route.h>
58 #include <net/addrconf.h>
61 #include <net/netlink.h>
62 #include <linux/rtnetlink.h>
65 #include <net/ip6_checksum.h>
66 #include <net/inet_common.h>
67 #include <linux/proc_fs.h>
69 #include <linux/netfilter.h>
70 #include <linux/netfilter_ipv6.h>
72 static u32
ndisc_hash(const void *pkey
,
73 const struct net_device
*dev
,
75 static bool ndisc_key_eq(const struct neighbour
*neigh
, const void *pkey
);
76 static bool ndisc_allow_add(const struct net_device
*dev
,
77 struct netlink_ext_ack
*extack
);
78 static int ndisc_constructor(struct neighbour
*neigh
);
79 static void ndisc_solicit(struct neighbour
*neigh
, struct sk_buff
*skb
);
80 static void ndisc_error_report(struct neighbour
*neigh
, struct sk_buff
*skb
);
81 static int pndisc_constructor(struct pneigh_entry
*n
);
82 static void pndisc_destructor(struct pneigh_entry
*n
);
83 static void pndisc_redo(struct sk_buff
*skb
);
84 static int ndisc_is_multicast(const void *pkey
);
86 static const struct neigh_ops ndisc_generic_ops
= {
88 .solicit
= ndisc_solicit
,
89 .error_report
= ndisc_error_report
,
90 .output
= neigh_resolve_output
,
91 .connected_output
= neigh_connected_output
,
94 static const struct neigh_ops ndisc_hh_ops
= {
96 .solicit
= ndisc_solicit
,
97 .error_report
= ndisc_error_report
,
98 .output
= neigh_resolve_output
,
99 .connected_output
= neigh_resolve_output
,
103 static const struct neigh_ops ndisc_direct_ops
= {
105 .output
= neigh_direct_output
,
106 .connected_output
= neigh_direct_output
,
109 struct neigh_table nd_tbl
= {
111 .key_len
= sizeof(struct in6_addr
),
112 .protocol
= cpu_to_be16(ETH_P_IPV6
),
114 .key_eq
= ndisc_key_eq
,
115 .constructor
= ndisc_constructor
,
116 .pconstructor
= pndisc_constructor
,
117 .pdestructor
= pndisc_destructor
,
118 .proxy_redo
= pndisc_redo
,
119 .is_multicast
= ndisc_is_multicast
,
120 .allow_add
= ndisc_allow_add
,
124 .reachable_time
= ND_REACHABLE_TIME
,
126 [NEIGH_VAR_MCAST_PROBES
] = 3,
127 [NEIGH_VAR_UCAST_PROBES
] = 3,
128 [NEIGH_VAR_RETRANS_TIME
] = ND_RETRANS_TIMER
,
129 [NEIGH_VAR_BASE_REACHABLE_TIME
] = ND_REACHABLE_TIME
,
130 [NEIGH_VAR_DELAY_PROBE_TIME
] = 5 * HZ
,
131 [NEIGH_VAR_INTERVAL_PROBE_TIME_MS
] = 5 * HZ
,
132 [NEIGH_VAR_GC_STALETIME
] = 60 * HZ
,
133 [NEIGH_VAR_QUEUE_LEN_BYTES
] = SK_WMEM_MAX
,
134 [NEIGH_VAR_PROXY_QLEN
] = 64,
135 [NEIGH_VAR_ANYCAST_DELAY
] = 1 * HZ
,
136 [NEIGH_VAR_PROXY_DELAY
] = (8 * HZ
) / 10,
139 .gc_interval
= 30 * HZ
,
144 EXPORT_SYMBOL_GPL(nd_tbl
);
146 void __ndisc_fill_addr_option(struct sk_buff
*skb
, int type
, const void *data
,
147 int data_len
, int pad
)
149 int space
= __ndisc_opt_addr_space(data_len
, pad
);
150 u8
*opt
= skb_put(skb
, space
);
155 memset(opt
+ 2, 0, pad
);
159 memcpy(opt
+2, data
, data_len
);
164 memset(opt
, 0, space
);
166 EXPORT_SYMBOL_GPL(__ndisc_fill_addr_option
);
168 static inline void ndisc_fill_addr_option(struct sk_buff
*skb
, int type
,
169 const void *data
, u8 icmp6_type
)
171 __ndisc_fill_addr_option(skb
, type
, data
, skb
->dev
->addr_len
,
172 ndisc_addr_option_pad(skb
->dev
->type
));
173 ndisc_ops_fill_addr_option(skb
->dev
, skb
, icmp6_type
);
176 static inline void ndisc_fill_redirect_addr_option(struct sk_buff
*skb
,
180 ndisc_fill_addr_option(skb
, ND_OPT_TARGET_LL_ADDR
, ha
, NDISC_REDIRECT
);
181 ndisc_ops_fill_redirect_addr_option(skb
->dev
, skb
, ops_data
);
184 static struct nd_opt_hdr
*ndisc_next_option(struct nd_opt_hdr
*cur
,
185 struct nd_opt_hdr
*end
)
188 if (!cur
|| !end
|| cur
>= end
)
190 type
= cur
->nd_opt_type
;
192 cur
= ((void *)cur
) + (cur
->nd_opt_len
<< 3);
193 } while (cur
< end
&& cur
->nd_opt_type
!= type
);
194 return cur
<= end
&& cur
->nd_opt_type
== type
? cur
: NULL
;
197 static inline int ndisc_is_useropt(const struct net_device
*dev
,
198 struct nd_opt_hdr
*opt
)
200 return opt
->nd_opt_type
== ND_OPT_PREFIX_INFO
||
201 opt
->nd_opt_type
== ND_OPT_RDNSS
||
202 opt
->nd_opt_type
== ND_OPT_DNSSL
||
203 opt
->nd_opt_type
== ND_OPT_6CO
||
204 opt
->nd_opt_type
== ND_OPT_CAPTIVE_PORTAL
||
205 opt
->nd_opt_type
== ND_OPT_PREF64
;
208 static struct nd_opt_hdr
*ndisc_next_useropt(const struct net_device
*dev
,
209 struct nd_opt_hdr
*cur
,
210 struct nd_opt_hdr
*end
)
212 if (!cur
|| !end
|| cur
>= end
)
215 cur
= ((void *)cur
) + (cur
->nd_opt_len
<< 3);
216 } while (cur
< end
&& !ndisc_is_useropt(dev
, cur
));
217 return cur
<= end
&& ndisc_is_useropt(dev
, cur
) ? cur
: NULL
;
220 struct ndisc_options
*ndisc_parse_options(const struct net_device
*dev
,
221 u8
*opt
, int opt_len
,
222 struct ndisc_options
*ndopts
)
224 struct nd_opt_hdr
*nd_opt
= (struct nd_opt_hdr
*)opt
;
226 if (!nd_opt
|| opt_len
< 0 || !ndopts
)
228 memset(ndopts
, 0, sizeof(*ndopts
));
230 bool unknown
= false;
232 if (opt_len
< sizeof(struct nd_opt_hdr
))
234 l
= nd_opt
->nd_opt_len
<< 3;
235 if (opt_len
< l
|| l
== 0)
237 if (ndisc_ops_parse_options(dev
, nd_opt
, ndopts
))
239 switch (nd_opt
->nd_opt_type
) {
240 case ND_OPT_SOURCE_LL_ADDR
:
241 case ND_OPT_TARGET_LL_ADDR
:
244 case ND_OPT_REDIRECT_HDR
:
245 if (ndopts
->nd_opt_array
[nd_opt
->nd_opt_type
]) {
247 "%s: duplicated ND6 option found: type=%d\n",
248 __func__
, nd_opt
->nd_opt_type
);
250 ndopts
->nd_opt_array
[nd_opt
->nd_opt_type
] = nd_opt
;
253 case ND_OPT_PREFIX_INFO
:
254 ndopts
->nd_opts_pi_end
= nd_opt
;
255 if (!ndopts
->nd_opt_array
[nd_opt
->nd_opt_type
])
256 ndopts
->nd_opt_array
[nd_opt
->nd_opt_type
] = nd_opt
;
258 #ifdef CONFIG_IPV6_ROUTE_INFO
259 case ND_OPT_ROUTE_INFO
:
260 ndopts
->nd_opts_ri_end
= nd_opt
;
261 if (!ndopts
->nd_opts_ri
)
262 ndopts
->nd_opts_ri
= nd_opt
;
268 if (ndisc_is_useropt(dev
, nd_opt
)) {
269 ndopts
->nd_useropts_end
= nd_opt
;
270 if (!ndopts
->nd_useropts
)
271 ndopts
->nd_useropts
= nd_opt
;
272 } else if (unknown
) {
274 * Unknown options must be silently ignored,
275 * to accommodate future extension to the
279 "%s: ignored unsupported option; type=%d, len=%d\n",
286 nd_opt
= ((void *)nd_opt
) + l
;
291 int ndisc_mc_map(const struct in6_addr
*addr
, char *buf
, struct net_device
*dev
, int dir
)
295 case ARPHRD_IEEE802
: /* Not sure. Check it later. --ANK */
297 ipv6_eth_mc_map(addr
, buf
);
300 ipv6_arcnet_mc_map(addr
, buf
);
302 case ARPHRD_INFINIBAND
:
303 ipv6_ib_mc_map(addr
, dev
->broadcast
, buf
);
306 return ipv6_ipgre_mc_map(addr
, dev
->broadcast
, buf
);
309 memcpy(buf
, dev
->broadcast
, dev
->addr_len
);
315 EXPORT_SYMBOL(ndisc_mc_map
);
317 static u32
ndisc_hash(const void *pkey
,
318 const struct net_device
*dev
,
321 return ndisc_hashfn(pkey
, dev
, hash_rnd
);
324 static bool ndisc_key_eq(const struct neighbour
*n
, const void *pkey
)
326 return neigh_key_eq128(n
, pkey
);
329 static int ndisc_constructor(struct neighbour
*neigh
)
331 struct in6_addr
*addr
= (struct in6_addr
*)&neigh
->primary_key
;
332 struct net_device
*dev
= neigh
->dev
;
333 struct inet6_dev
*in6_dev
;
334 struct neigh_parms
*parms
;
335 bool is_multicast
= ipv6_addr_is_multicast(addr
);
337 in6_dev
= in6_dev_get(dev
);
342 parms
= in6_dev
->nd_parms
;
343 __neigh_parms_put(neigh
->parms
);
344 neigh
->parms
= neigh_parms_clone(parms
);
346 neigh
->type
= is_multicast
? RTN_MULTICAST
: RTN_UNICAST
;
347 if (!dev
->header_ops
) {
348 neigh
->nud_state
= NUD_NOARP
;
349 neigh
->ops
= &ndisc_direct_ops
;
350 neigh
->output
= neigh_direct_output
;
353 neigh
->nud_state
= NUD_NOARP
;
354 ndisc_mc_map(addr
, neigh
->ha
, dev
, 1);
355 } else if (dev
->flags
&(IFF_NOARP
|IFF_LOOPBACK
)) {
356 neigh
->nud_state
= NUD_NOARP
;
357 memcpy(neigh
->ha
, dev
->dev_addr
, dev
->addr_len
);
358 if (dev
->flags
&IFF_LOOPBACK
)
359 neigh
->type
= RTN_LOCAL
;
360 } else if (dev
->flags
&IFF_POINTOPOINT
) {
361 neigh
->nud_state
= NUD_NOARP
;
362 memcpy(neigh
->ha
, dev
->broadcast
, dev
->addr_len
);
364 if (dev
->header_ops
->cache
)
365 neigh
->ops
= &ndisc_hh_ops
;
367 neigh
->ops
= &ndisc_generic_ops
;
368 if (neigh
->nud_state
&NUD_VALID
)
369 neigh
->output
= neigh
->ops
->connected_output
;
371 neigh
->output
= neigh
->ops
->output
;
373 in6_dev_put(in6_dev
);
377 static int pndisc_constructor(struct pneigh_entry
*n
)
379 struct in6_addr
*addr
= (struct in6_addr
*)&n
->key
;
380 struct in6_addr maddr
;
381 struct net_device
*dev
= n
->dev
;
383 if (!dev
|| !__in6_dev_get(dev
))
385 addrconf_addr_solict_mult(addr
, &maddr
);
386 ipv6_dev_mc_inc(dev
, &maddr
);
390 static void pndisc_destructor(struct pneigh_entry
*n
)
392 struct in6_addr
*addr
= (struct in6_addr
*)&n
->key
;
393 struct in6_addr maddr
;
394 struct net_device
*dev
= n
->dev
;
396 if (!dev
|| !__in6_dev_get(dev
))
398 addrconf_addr_solict_mult(addr
, &maddr
);
399 ipv6_dev_mc_dec(dev
, &maddr
);
402 /* called with rtnl held */
403 static bool ndisc_allow_add(const struct net_device
*dev
,
404 struct netlink_ext_ack
*extack
)
406 struct inet6_dev
*idev
= __in6_dev_get(dev
);
408 if (!idev
|| idev
->cnf
.disable_ipv6
) {
409 NL_SET_ERR_MSG(extack
, "IPv6 is disabled on this device");
416 static struct sk_buff
*ndisc_alloc_skb(struct net_device
*dev
,
419 int hlen
= LL_RESERVED_SPACE(dev
);
420 int tlen
= dev
->needed_tailroom
;
421 struct sock
*sk
= dev_net(dev
)->ipv6
.ndisc_sk
;
424 skb
= alloc_skb(hlen
+ sizeof(struct ipv6hdr
) + len
+ tlen
, GFP_ATOMIC
);
426 ND_PRINTK(0, err
, "ndisc: %s failed to allocate an skb\n",
431 skb
->protocol
= htons(ETH_P_IPV6
);
434 skb_reserve(skb
, hlen
+ sizeof(struct ipv6hdr
));
435 skb_reset_transport_header(skb
);
437 /* Manually assign socket ownership as we avoid calling
438 * sock_alloc_send_pskb() to bypass wmem buffer limits
440 skb_set_owner_w(skb
, sk
);
445 static void ip6_nd_hdr(struct sk_buff
*skb
,
446 const struct in6_addr
*saddr
,
447 const struct in6_addr
*daddr
,
448 int hop_limit
, int len
)
451 struct inet6_dev
*idev
;
455 idev
= __in6_dev_get(skb
->dev
);
456 tclass
= idev
? READ_ONCE(idev
->cnf
.ndisc_tclass
) : 0;
459 skb_push(skb
, sizeof(*hdr
));
460 skb_reset_network_header(skb
);
463 ip6_flow_hdr(hdr
, tclass
, 0);
465 hdr
->payload_len
= htons(len
);
466 hdr
->nexthdr
= IPPROTO_ICMPV6
;
467 hdr
->hop_limit
= hop_limit
;
473 void ndisc_send_skb(struct sk_buff
*skb
, const struct in6_addr
*daddr
,
474 const struct in6_addr
*saddr
)
476 struct dst_entry
*dst
= skb_dst(skb
);
477 struct net
*net
= dev_net(skb
->dev
);
478 struct sock
*sk
= net
->ipv6
.ndisc_sk
;
479 struct inet6_dev
*idev
;
481 struct icmp6hdr
*icmp6h
= icmp6_hdr(skb
);
484 type
= icmp6h
->icmp6_type
;
488 int oif
= skb
->dev
->ifindex
;
490 icmpv6_flow_init(sk
, &fl6
, type
, saddr
, daddr
, oif
);
491 dst
= icmp6_dst_alloc(skb
->dev
, &fl6
);
497 skb_dst_set(skb
, dst
);
500 icmp6h
->icmp6_cksum
= csum_ipv6_magic(saddr
, daddr
, skb
->len
,
505 ip6_nd_hdr(skb
, saddr
, daddr
, READ_ONCE(inet6_sk(sk
)->hop_limit
), skb
->len
);
508 idev
= __in6_dev_get(dst
->dev
);
509 IP6_INC_STATS(net
, idev
, IPSTATS_MIB_OUTREQUESTS
);
511 err
= NF_HOOK(NFPROTO_IPV6
, NF_INET_LOCAL_OUT
,
512 net
, sk
, skb
, NULL
, dst
->dev
,
515 ICMP6MSGOUT_INC_STATS(net
, idev
, type
);
516 ICMP6_INC_STATS(net
, idev
, ICMP6_MIB_OUTMSGS
);
521 EXPORT_SYMBOL(ndisc_send_skb
);
523 void ndisc_send_na(struct net_device
*dev
, const struct in6_addr
*daddr
,
524 const struct in6_addr
*solicited_addr
,
525 bool router
, bool solicited
, bool override
, bool inc_opt
)
528 struct in6_addr tmpaddr
;
529 struct inet6_ifaddr
*ifp
;
530 const struct in6_addr
*src_addr
;
534 /* for anycast or proxy, solicited_addr != src_addr */
535 ifp
= ipv6_get_ifaddr(dev_net(dev
), solicited_addr
, dev
, 1);
537 src_addr
= solicited_addr
;
538 if (ifp
->flags
& IFA_F_OPTIMISTIC
)
540 inc_opt
|= READ_ONCE(ifp
->idev
->cnf
.force_tllao
);
543 if (ipv6_dev_get_saddr(dev_net(dev
), dev
, daddr
,
544 inet6_sk(dev_net(dev
)->ipv6
.ndisc_sk
)->srcprefs
,
553 optlen
+= ndisc_opt_addr_space(dev
,
554 NDISC_NEIGHBOUR_ADVERTISEMENT
);
556 skb
= ndisc_alloc_skb(dev
, sizeof(*msg
) + optlen
);
560 msg
= skb_put(skb
, sizeof(*msg
));
561 *msg
= (struct nd_msg
) {
563 .icmp6_type
= NDISC_NEIGHBOUR_ADVERTISEMENT
,
564 .icmp6_router
= router
,
565 .icmp6_solicited
= solicited
,
566 .icmp6_override
= override
,
568 .target
= *solicited_addr
,
572 ndisc_fill_addr_option(skb
, ND_OPT_TARGET_LL_ADDR
,
574 NDISC_NEIGHBOUR_ADVERTISEMENT
);
576 ndisc_send_skb(skb
, daddr
, src_addr
);
579 static void ndisc_send_unsol_na(struct net_device
*dev
)
581 struct inet6_dev
*idev
;
582 struct inet6_ifaddr
*ifa
;
584 idev
= in6_dev_get(dev
);
588 read_lock_bh(&idev
->lock
);
589 list_for_each_entry(ifa
, &idev
->addr_list
, if_list
) {
590 /* skip tentative addresses until dad completes */
591 if (ifa
->flags
& IFA_F_TENTATIVE
&&
592 !(ifa
->flags
& IFA_F_OPTIMISTIC
))
595 ndisc_send_na(dev
, &in6addr_linklocal_allnodes
, &ifa
->addr
,
596 /*router=*/ !!idev
->cnf
.forwarding
,
597 /*solicited=*/ false, /*override=*/ true,
600 read_unlock_bh(&idev
->lock
);
605 struct sk_buff
*ndisc_ns_create(struct net_device
*dev
, const struct in6_addr
*solicit
,
606 const struct in6_addr
*saddr
, u64 nonce
)
608 int inc_opt
= dev
->addr_len
;
616 if (ipv6_addr_any(saddr
))
619 optlen
+= ndisc_opt_addr_space(dev
,
620 NDISC_NEIGHBOUR_SOLICITATION
);
624 skb
= ndisc_alloc_skb(dev
, sizeof(*msg
) + optlen
);
628 msg
= skb_put(skb
, sizeof(*msg
));
629 *msg
= (struct nd_msg
) {
631 .icmp6_type
= NDISC_NEIGHBOUR_SOLICITATION
,
637 ndisc_fill_addr_option(skb
, ND_OPT_SOURCE_LL_ADDR
,
639 NDISC_NEIGHBOUR_SOLICITATION
);
641 u8
*opt
= skb_put(skb
, 8);
643 opt
[0] = ND_OPT_NONCE
;
645 memcpy(opt
+ 2, &nonce
, 6);
650 EXPORT_SYMBOL(ndisc_ns_create
);
652 void ndisc_send_ns(struct net_device
*dev
, const struct in6_addr
*solicit
,
653 const struct in6_addr
*daddr
, const struct in6_addr
*saddr
,
656 struct in6_addr addr_buf
;
660 if (ipv6_get_lladdr(dev
, &addr_buf
,
661 (IFA_F_TENTATIVE
| IFA_F_OPTIMISTIC
)))
666 skb
= ndisc_ns_create(dev
, solicit
, saddr
, nonce
);
669 ndisc_send_skb(skb
, daddr
, saddr
);
672 void ndisc_send_rs(struct net_device
*dev
, const struct in6_addr
*saddr
,
673 const struct in6_addr
*daddr
)
677 int send_sllao
= dev
->addr_len
;
680 #ifdef CONFIG_IPV6_OPTIMISTIC_DAD
682 * According to section 2.2 of RFC 4429, we must not
683 * send router solicitations with a sllao from
684 * optimistic addresses, but we may send the solicitation
685 * if we don't include the sllao. So here we check
686 * if our address is optimistic, and if so, we
687 * suppress the inclusion of the sllao.
690 struct inet6_ifaddr
*ifp
= ipv6_get_ifaddr(dev_net(dev
), saddr
,
693 if (ifp
->flags
& IFA_F_OPTIMISTIC
) {
703 optlen
+= ndisc_opt_addr_space(dev
, NDISC_ROUTER_SOLICITATION
);
705 skb
= ndisc_alloc_skb(dev
, sizeof(*msg
) + optlen
);
709 msg
= skb_put(skb
, sizeof(*msg
));
710 *msg
= (struct rs_msg
) {
712 .icmp6_type
= NDISC_ROUTER_SOLICITATION
,
717 ndisc_fill_addr_option(skb
, ND_OPT_SOURCE_LL_ADDR
,
719 NDISC_ROUTER_SOLICITATION
);
721 ndisc_send_skb(skb
, daddr
, saddr
);
725 static void ndisc_error_report(struct neighbour
*neigh
, struct sk_buff
*skb
)
728 * "The sender MUST return an ICMP
729 * destination unreachable"
731 dst_link_failure(skb
);
735 /* Called with locked neigh: either read or both */
737 static void ndisc_solicit(struct neighbour
*neigh
, struct sk_buff
*skb
)
739 struct in6_addr
*saddr
= NULL
;
740 struct in6_addr mcaddr
;
741 struct net_device
*dev
= neigh
->dev
;
742 struct in6_addr
*target
= (struct in6_addr
*)&neigh
->primary_key
;
743 int probes
= atomic_read(&neigh
->probes
);
745 if (skb
&& ipv6_chk_addr_and_flags(dev_net(dev
), &ipv6_hdr(skb
)->saddr
,
747 IFA_F_TENTATIVE
|IFA_F_OPTIMISTIC
))
748 saddr
= &ipv6_hdr(skb
)->saddr
;
749 probes
-= NEIGH_VAR(neigh
->parms
, UCAST_PROBES
);
751 if (!(READ_ONCE(neigh
->nud_state
) & NUD_VALID
)) {
753 "%s: trying to ucast probe in NUD_INVALID: %pI6\n",
756 ndisc_send_ns(dev
, target
, target
, saddr
, 0);
757 } else if ((probes
-= NEIGH_VAR(neigh
->parms
, APP_PROBES
)) < 0) {
760 addrconf_addr_solict_mult(target
, &mcaddr
);
761 ndisc_send_ns(dev
, target
, &mcaddr
, saddr
, 0);
765 static int pndisc_is_router(const void *pkey
,
766 struct net_device
*dev
)
768 struct pneigh_entry
*n
;
771 read_lock_bh(&nd_tbl
.lock
);
772 n
= __pneigh_lookup(&nd_tbl
, dev_net(dev
), pkey
, dev
);
774 ret
= !!(n
->flags
& NTF_ROUTER
);
775 read_unlock_bh(&nd_tbl
.lock
);
780 void ndisc_update(const struct net_device
*dev
, struct neighbour
*neigh
,
781 const u8
*lladdr
, u8
new, u32 flags
, u8 icmp6_type
,
782 struct ndisc_options
*ndopts
)
784 neigh_update(neigh
, lladdr
, new, flags
, 0);
785 /* report ndisc ops about neighbour update */
786 ndisc_ops_update(dev
, neigh
, flags
, icmp6_type
, ndopts
);
789 static enum skb_drop_reason
ndisc_recv_ns(struct sk_buff
*skb
)
791 struct nd_msg
*msg
= (struct nd_msg
*)skb_transport_header(skb
);
792 const struct in6_addr
*saddr
= &ipv6_hdr(skb
)->saddr
;
793 const struct in6_addr
*daddr
= &ipv6_hdr(skb
)->daddr
;
795 u32 ndoptlen
= skb_tail_pointer(skb
) - (skb_transport_header(skb
) +
796 offsetof(struct nd_msg
, opt
));
797 struct ndisc_options ndopts
;
798 struct net_device
*dev
= skb
->dev
;
799 struct inet6_ifaddr
*ifp
;
800 struct inet6_dev
*idev
= NULL
;
801 struct neighbour
*neigh
;
802 int dad
= ipv6_addr_any(saddr
);
808 if (skb
->len
< sizeof(struct nd_msg
))
809 return SKB_DROP_REASON_PKT_TOO_SMALL
;
811 if (ipv6_addr_is_multicast(&msg
->target
)) {
812 ND_PRINTK(2, warn
, "NS: multicast target address\n");
818 * DAD has to be destined for solicited node multicast address.
820 if (dad
&& !ipv6_addr_is_solict_mult(daddr
)) {
821 ND_PRINTK(2, warn
, "NS: bad DAD packet (wrong destination)\n");
825 if (!ndisc_parse_options(dev
, msg
->opt
, ndoptlen
, &ndopts
))
826 return SKB_DROP_REASON_IPV6_NDISC_BAD_OPTIONS
;
828 if (ndopts
.nd_opts_src_lladdr
) {
829 lladdr
= ndisc_opt_addr_data(ndopts
.nd_opts_src_lladdr
, dev
);
832 "NS: invalid link-layer address length\n");
837 * If the IP source address is the unspecified address,
838 * there MUST NOT be source link-layer address option
843 "NS: bad DAD packet (link-layer address option)\n");
847 if (ndopts
.nd_opts_nonce
&& ndopts
.nd_opts_nonce
->nd_opt_len
== 1)
848 memcpy(&nonce
, (u8
*)(ndopts
.nd_opts_nonce
+ 1), 6);
850 inc
= ipv6_addr_is_multicast(daddr
);
852 ifp
= ipv6_get_ifaddr(dev_net(dev
), &msg
->target
, dev
, 1);
855 if (ifp
->flags
& (IFA_F_TENTATIVE
|IFA_F_OPTIMISTIC
)) {
857 if (nonce
!= 0 && ifp
->dad_nonce
== nonce
) {
858 u8
*np
= (u8
*)&nonce
;
859 /* Matching nonce if looped back */
861 "%s: IPv6 DAD loopback for address %pI6c nonce %pM ignored\n",
862 ifp
->idev
->dev
->name
,
867 * We are colliding with another node
869 * so fail our DAD process
871 addrconf_dad_failure(skb
, ifp
);
875 * This is not a dad solicitation.
876 * If we are an optimistic node,
878 * Otherwise, we should ignore it.
880 if (!(ifp
->flags
& IFA_F_OPTIMISTIC
))
887 struct net
*net
= dev_net(dev
);
889 /* perhaps an address on the master device */
890 if (netif_is_l3_slave(dev
)) {
891 struct net_device
*mdev
;
893 mdev
= netdev_master_upper_dev_get_rcu(dev
);
895 ifp
= ipv6_get_ifaddr(net
, &msg
->target
, mdev
, 1);
901 idev
= in6_dev_get(dev
);
903 /* XXX: count this drop? */
907 if (ipv6_chk_acast_addr(net
, dev
, &msg
->target
) ||
908 (READ_ONCE(idev
->cnf
.forwarding
) &&
909 (READ_ONCE(net
->ipv6
.devconf_all
->proxy_ndp
) ||
910 READ_ONCE(idev
->cnf
.proxy_ndp
)) &&
911 (is_router
= pndisc_is_router(&msg
->target
, dev
)) >= 0)) {
912 if (!(NEIGH_CB(skb
)->flags
& LOCALLY_ENQUEUED
) &&
913 skb
->pkt_type
!= PACKET_HOST
&&
915 NEIGH_VAR(idev
->nd_parms
, PROXY_DELAY
) != 0) {
917 * for anycast or proxy,
918 * sender should delay its response
919 * by a random time between 0 and
920 * MAX_ANYCAST_DELAY_TIME seconds.
921 * (RFC2461) -- yoshfuji
923 struct sk_buff
*n
= skb_clone(skb
, GFP_ATOMIC
);
925 pneigh_enqueue(&nd_tbl
, idev
->nd_parms
, n
);
929 SKB_DR_SET(reason
, IPV6_NDISC_NS_OTHERHOST
);
935 is_router
= READ_ONCE(idev
->cnf
.forwarding
);
938 ndisc_send_na(dev
, &in6addr_linklocal_allnodes
, &msg
->target
,
939 !!is_router
, false, (ifp
!= NULL
), true);
944 NEIGH_CACHE_STAT_INC(&nd_tbl
, rcv_probes_mcast
);
946 NEIGH_CACHE_STAT_INC(&nd_tbl
, rcv_probes_ucast
);
949 * update / create cache entry
950 * for the source address
952 neigh
= __neigh_lookup(&nd_tbl
, saddr
, dev
,
953 !inc
|| lladdr
|| !dev
->addr_len
);
955 ndisc_update(dev
, neigh
, lladdr
, NUD_STALE
,
956 NEIGH_UPDATE_F_WEAK_OVERRIDE
|
957 NEIGH_UPDATE_F_OVERRIDE
,
958 NDISC_NEIGHBOUR_SOLICITATION
, &ndopts
);
959 if (neigh
|| !dev
->header_ops
) {
960 ndisc_send_na(dev
, saddr
, &msg
->target
, !!is_router
,
961 true, (ifp
!= NULL
&& inc
), inc
);
963 neigh_release(neigh
);
964 reason
= SKB_CONSUMED
;
975 static int accept_untracked_na(struct net_device
*dev
, struct in6_addr
*saddr
)
977 struct inet6_dev
*idev
= __in6_dev_get(dev
);
979 switch (READ_ONCE(idev
->cnf
.accept_untracked_na
)) {
980 case 0: /* Don't accept untracked na (absent in neighbor cache) */
982 case 1: /* Create new entries from na if currently untracked */
984 case 2: /* Create new entries from untracked na only if saddr is in the
985 * same subnet as an address configured on the interface that
988 return !!ipv6_chk_prefix(saddr
, dev
);
994 static enum skb_drop_reason
ndisc_recv_na(struct sk_buff
*skb
)
996 struct nd_msg
*msg
= (struct nd_msg
*)skb_transport_header(skb
);
997 struct in6_addr
*saddr
= &ipv6_hdr(skb
)->saddr
;
998 const struct in6_addr
*daddr
= &ipv6_hdr(skb
)->daddr
;
1000 u32 ndoptlen
= skb_tail_pointer(skb
) - (skb_transport_header(skb
) +
1001 offsetof(struct nd_msg
, opt
));
1002 struct ndisc_options ndopts
;
1003 struct net_device
*dev
= skb
->dev
;
1004 struct inet6_dev
*idev
= __in6_dev_get(dev
);
1005 struct inet6_ifaddr
*ifp
;
1006 struct neighbour
*neigh
;
1010 if (skb
->len
< sizeof(struct nd_msg
))
1011 return SKB_DROP_REASON_PKT_TOO_SMALL
;
1013 if (ipv6_addr_is_multicast(&msg
->target
)) {
1014 ND_PRINTK(2, warn
, "NA: target address is multicast\n");
1018 if (ipv6_addr_is_multicast(daddr
) &&
1019 msg
->icmph
.icmp6_solicited
) {
1020 ND_PRINTK(2, warn
, "NA: solicited NA is multicasted\n");
1024 /* For some 802.11 wireless deployments (and possibly other networks),
1025 * there will be a NA proxy and unsolicitd packets are attacks
1026 * and thus should not be accepted.
1027 * drop_unsolicited_na takes precedence over accept_untracked_na
1029 if (!msg
->icmph
.icmp6_solicited
&& idev
&&
1030 READ_ONCE(idev
->cnf
.drop_unsolicited_na
))
1033 if (!ndisc_parse_options(dev
, msg
->opt
, ndoptlen
, &ndopts
))
1034 return SKB_DROP_REASON_IPV6_NDISC_BAD_OPTIONS
;
1036 if (ndopts
.nd_opts_tgt_lladdr
) {
1037 lladdr
= ndisc_opt_addr_data(ndopts
.nd_opts_tgt_lladdr
, dev
);
1040 "NA: invalid link-layer address length\n");
1044 ifp
= ipv6_get_ifaddr(dev_net(dev
), &msg
->target
, dev
, 1);
1046 if (skb
->pkt_type
!= PACKET_LOOPBACK
1047 && (ifp
->flags
& IFA_F_TENTATIVE
)) {
1048 addrconf_dad_failure(skb
, ifp
);
1051 /* What should we make now? The advertisement
1052 is invalid, but ndisc specs say nothing
1053 about it. It could be misconfiguration, or
1054 an smart proxy agent tries to help us :-)
1056 We should not print the error if NA has been
1057 received from loopback - it is just our own
1058 unsolicited advertisement.
1060 if (skb
->pkt_type
!= PACKET_LOOPBACK
)
1062 "NA: %pM advertised our address %pI6c on %s!\n",
1063 eth_hdr(skb
)->h_source
, &ifp
->addr
, ifp
->idev
->dev
->name
);
1068 neigh
= neigh_lookup(&nd_tbl
, &msg
->target
, dev
);
1070 /* RFC 9131 updates original Neighbour Discovery RFC 4861.
1071 * NAs with Target LL Address option without a corresponding
1072 * entry in the neighbour cache can now create a STALE neighbour
1073 * cache entry on routers.
1075 * entry accept fwding solicited behaviour
1076 * ------- ------ ------ --------- ----------------------
1077 * present X X 0 Set state to STALE
1078 * present X X 1 Set state to REACHABLE
1079 * absent 0 X X Do nothing
1080 * absent 1 0 X Do nothing
1081 * absent 1 1 X Add a new STALE entry
1083 * Note that we don't do a (daddr == all-routers-mcast) check.
1085 new_state
= msg
->icmph
.icmp6_solicited
? NUD_REACHABLE
: NUD_STALE
;
1086 if (!neigh
&& lladdr
&& idev
&& READ_ONCE(idev
->cnf
.forwarding
)) {
1087 if (accept_untracked_na(dev
, saddr
)) {
1088 neigh
= neigh_create(&nd_tbl
, &msg
->target
, dev
);
1089 new_state
= NUD_STALE
;
1093 if (neigh
&& !IS_ERR(neigh
)) {
1094 u8 old_flags
= neigh
->flags
;
1095 struct net
*net
= dev_net(dev
);
1097 if (READ_ONCE(neigh
->nud_state
) & NUD_FAILED
)
1101 * Don't update the neighbor cache entry on a proxy NA from
1102 * ourselves because either the proxied node is off link or it
1103 * has already sent a NA to us.
1105 if (lladdr
&& !memcmp(lladdr
, dev
->dev_addr
, dev
->addr_len
) &&
1106 READ_ONCE(net
->ipv6
.devconf_all
->forwarding
) &&
1107 READ_ONCE(net
->ipv6
.devconf_all
->proxy_ndp
) &&
1108 pneigh_lookup(&nd_tbl
, net
, &msg
->target
, dev
, 0)) {
1109 /* XXX: idev->cnf.proxy_ndp */
1113 ndisc_update(dev
, neigh
, lladdr
,
1115 NEIGH_UPDATE_F_WEAK_OVERRIDE
|
1116 (msg
->icmph
.icmp6_override
? NEIGH_UPDATE_F_OVERRIDE
: 0)|
1117 NEIGH_UPDATE_F_OVERRIDE_ISROUTER
|
1118 (msg
->icmph
.icmp6_router
? NEIGH_UPDATE_F_ISROUTER
: 0),
1119 NDISC_NEIGHBOUR_ADVERTISEMENT
, &ndopts
);
1121 if ((old_flags
& ~neigh
->flags
) & NTF_ROUTER
) {
1123 * Change: router to host
1125 rt6_clean_tohost(dev_net(dev
), saddr
);
1127 reason
= SKB_CONSUMED
;
1129 neigh_release(neigh
);
1134 static enum skb_drop_reason
ndisc_recv_rs(struct sk_buff
*skb
)
1136 struct rs_msg
*rs_msg
= (struct rs_msg
*)skb_transport_header(skb
);
1137 unsigned long ndoptlen
= skb
->len
- sizeof(*rs_msg
);
1138 struct neighbour
*neigh
;
1139 struct inet6_dev
*idev
;
1140 const struct in6_addr
*saddr
= &ipv6_hdr(skb
)->saddr
;
1141 struct ndisc_options ndopts
;
1145 if (skb
->len
< sizeof(*rs_msg
))
1146 return SKB_DROP_REASON_PKT_TOO_SMALL
;
1148 idev
= __in6_dev_get(skb
->dev
);
1150 ND_PRINTK(1, err
, "RS: can't find in6 device\n");
1154 /* Don't accept RS if we're not in router mode */
1155 if (!READ_ONCE(idev
->cnf
.forwarding
))
1159 * Don't update NCE if src = ::;
1160 * this implies that the source node has no ip address assigned yet.
1162 if (ipv6_addr_any(saddr
))
1165 /* Parse ND options */
1166 if (!ndisc_parse_options(skb
->dev
, rs_msg
->opt
, ndoptlen
, &ndopts
))
1167 return SKB_DROP_REASON_IPV6_NDISC_BAD_OPTIONS
;
1169 if (ndopts
.nd_opts_src_lladdr
) {
1170 lladdr
= ndisc_opt_addr_data(ndopts
.nd_opts_src_lladdr
,
1176 neigh
= __neigh_lookup(&nd_tbl
, saddr
, skb
->dev
, 1);
1178 ndisc_update(skb
->dev
, neigh
, lladdr
, NUD_STALE
,
1179 NEIGH_UPDATE_F_WEAK_OVERRIDE
|
1180 NEIGH_UPDATE_F_OVERRIDE
|
1181 NEIGH_UPDATE_F_OVERRIDE_ISROUTER
,
1182 NDISC_ROUTER_SOLICITATION
, &ndopts
);
1183 neigh_release(neigh
);
1184 reason
= SKB_CONSUMED
;
1190 static void ndisc_ra_useropt(struct sk_buff
*ra
, struct nd_opt_hdr
*opt
)
1192 struct icmp6hdr
*icmp6h
= (struct icmp6hdr
*)skb_transport_header(ra
);
1193 struct sk_buff
*skb
;
1194 struct nlmsghdr
*nlh
;
1195 struct nduseroptmsg
*ndmsg
;
1196 struct net
*net
= dev_net(ra
->dev
);
1198 int base_size
= NLMSG_ALIGN(sizeof(struct nduseroptmsg
)
1199 + (opt
->nd_opt_len
<< 3));
1200 size_t msg_size
= base_size
+ nla_total_size(sizeof(struct in6_addr
));
1202 skb
= nlmsg_new(msg_size
, GFP_ATOMIC
);
1208 nlh
= nlmsg_put(skb
, 0, 0, RTM_NEWNDUSEROPT
, base_size
, 0);
1210 goto nla_put_failure
;
1213 ndmsg
= nlmsg_data(nlh
);
1214 ndmsg
->nduseropt_family
= AF_INET6
;
1215 ndmsg
->nduseropt_ifindex
= ra
->dev
->ifindex
;
1216 ndmsg
->nduseropt_icmp_type
= icmp6h
->icmp6_type
;
1217 ndmsg
->nduseropt_icmp_code
= icmp6h
->icmp6_code
;
1218 ndmsg
->nduseropt_opts_len
= opt
->nd_opt_len
<< 3;
1220 memcpy(ndmsg
+ 1, opt
, opt
->nd_opt_len
<< 3);
1222 if (nla_put_in6_addr(skb
, NDUSEROPT_SRCADDR
, &ipv6_hdr(ra
)->saddr
))
1223 goto nla_put_failure
;
1224 nlmsg_end(skb
, nlh
);
1226 rtnl_notify(skb
, net
, 0, RTNLGRP_ND_USEROPT
, NULL
, GFP_ATOMIC
);
1233 rtnl_set_sk_err(net
, RTNLGRP_ND_USEROPT
, err
);
1236 static enum skb_drop_reason
ndisc_router_discovery(struct sk_buff
*skb
)
1238 struct ra_msg
*ra_msg
= (struct ra_msg
*)skb_transport_header(skb
);
1239 bool send_ifinfo_notify
= false;
1240 struct neighbour
*neigh
= NULL
;
1241 struct ndisc_options ndopts
;
1242 struct fib6_info
*rt
= NULL
;
1243 struct inet6_dev
*in6_dev
;
1244 struct fib6_table
*table
;
1245 u32 defrtr_usr_metric
;
1246 unsigned int pref
= 0;
1253 __u8
*opt
= (__u8
*)(ra_msg
+ 1);
1255 optlen
= (skb_tail_pointer(skb
) - skb_transport_header(skb
)) -
1256 sizeof(struct ra_msg
);
1259 "RA: %s, dev: %s\n",
1260 __func__
, skb
->dev
->name
);
1261 if (!(ipv6_addr_type(&ipv6_hdr(skb
)->saddr
) & IPV6_ADDR_LINKLOCAL
)) {
1262 ND_PRINTK(2, warn
, "RA: source address is not link-local\n");
1266 return SKB_DROP_REASON_PKT_TOO_SMALL
;
1268 #ifdef CONFIG_IPV6_NDISC_NODETYPE
1269 if (skb
->ndisc_nodetype
== NDISC_NODETYPE_HOST
) {
1270 ND_PRINTK(2, warn
, "RA: from host or unauthorized router\n");
1275 in6_dev
= __in6_dev_get(skb
->dev
);
1277 ND_PRINTK(0, err
, "RA: can't find inet6 device for %s\n",
1282 if (!ndisc_parse_options(skb
->dev
, opt
, optlen
, &ndopts
))
1283 return SKB_DROP_REASON_IPV6_NDISC_BAD_OPTIONS
;
1285 if (!ipv6_accept_ra(in6_dev
)) {
1287 "RA: %s, did not accept ra for dev: %s\n",
1288 __func__
, skb
->dev
->name
);
1289 goto skip_linkparms
;
1292 #ifdef CONFIG_IPV6_NDISC_NODETYPE
1293 /* skip link-specific parameters from interior routers */
1294 if (skb
->ndisc_nodetype
== NDISC_NODETYPE_NODEFAULT
) {
1296 "RA: %s, nodetype is NODEFAULT, dev: %s\n",
1297 __func__
, skb
->dev
->name
);
1298 goto skip_linkparms
;
1302 if (in6_dev
->if_flags
& IF_RS_SENT
) {
1304 * flag that an RA was received after an RS was sent
1305 * out on this interface.
1307 in6_dev
->if_flags
|= IF_RA_RCVD
;
1311 * Remember the managed/otherconf flags from most recently
1312 * received RA message (RFC 2462) -- yoshfuji
1314 old_if_flags
= in6_dev
->if_flags
;
1315 in6_dev
->if_flags
= (in6_dev
->if_flags
& ~(IF_RA_MANAGED
|
1317 (ra_msg
->icmph
.icmp6_addrconf_managed
?
1318 IF_RA_MANAGED
: 0) |
1319 (ra_msg
->icmph
.icmp6_addrconf_other
?
1320 IF_RA_OTHERCONF
: 0);
1322 if (old_if_flags
!= in6_dev
->if_flags
)
1323 send_ifinfo_notify
= true;
1325 if (!READ_ONCE(in6_dev
->cnf
.accept_ra_defrtr
)) {
1327 "RA: %s, defrtr is false for dev: %s\n",
1328 __func__
, skb
->dev
->name
);
1332 lifetime
= ntohs(ra_msg
->icmph
.icmp6_rt_lifetime
);
1333 if (lifetime
!= 0 &&
1334 lifetime
< READ_ONCE(in6_dev
->cnf
.accept_ra_min_lft
)) {
1336 "RA: router lifetime (%ds) is too short: %s\n",
1337 lifetime
, skb
->dev
->name
);
1341 /* Do not accept RA with source-addr found on local machine unless
1342 * accept_ra_from_local is set to true.
1344 net
= dev_net(in6_dev
->dev
);
1345 if (!READ_ONCE(in6_dev
->cnf
.accept_ra_from_local
) &&
1346 ipv6_chk_addr(net
, &ipv6_hdr(skb
)->saddr
, in6_dev
->dev
, 0)) {
1348 "RA from local address detected on dev: %s: default router ignored\n",
1353 #ifdef CONFIG_IPV6_ROUTER_PREF
1354 pref
= ra_msg
->icmph
.icmp6_router_pref
;
1355 /* 10b is handled as if it were 00b (medium) */
1356 if (pref
== ICMPV6_ROUTER_PREF_INVALID
||
1357 !READ_ONCE(in6_dev
->cnf
.accept_ra_rtr_pref
))
1358 pref
= ICMPV6_ROUTER_PREF_MEDIUM
;
1360 /* routes added from RAs do not use nexthop objects */
1361 rt
= rt6_get_dflt_router(net
, &ipv6_hdr(skb
)->saddr
, skb
->dev
);
1363 neigh
= ip6_neigh_lookup(&rt
->fib6_nh
->fib_nh_gw6
,
1364 rt
->fib6_nh
->fib_nh_dev
, NULL
,
1365 &ipv6_hdr(skb
)->saddr
);
1368 "RA: %s got default router without neighbour\n",
1370 fib6_info_release(rt
);
1374 /* Set default route metric as specified by user */
1375 defrtr_usr_metric
= in6_dev
->cnf
.ra_defrtr_metric
;
1376 /* delete the route if lifetime is 0 or if metric needs change */
1377 if (rt
&& (lifetime
== 0 || rt
->fib6_metric
!= defrtr_usr_metric
)) {
1378 ip6_del_rt(net
, rt
, false);
1382 ND_PRINTK(3, info
, "RA: rt: %p lifetime: %d, metric: %d, for dev: %s\n",
1383 rt
, lifetime
, defrtr_usr_metric
, skb
->dev
->name
);
1384 if (!rt
&& lifetime
) {
1385 ND_PRINTK(3, info
, "RA: adding default router\n");
1388 neigh_release(neigh
);
1390 rt
= rt6_add_dflt_router(net
, &ipv6_hdr(skb
)->saddr
,
1391 skb
->dev
, pref
, defrtr_usr_metric
,
1395 "RA: %s failed to add default route\n",
1400 neigh
= ip6_neigh_lookup(&rt
->fib6_nh
->fib_nh_gw6
,
1401 rt
->fib6_nh
->fib_nh_dev
, NULL
,
1402 &ipv6_hdr(skb
)->saddr
);
1405 "RA: %s got default router without neighbour\n",
1407 fib6_info_release(rt
);
1410 neigh
->flags
|= NTF_ROUTER
;
1411 } else if (rt
&& IPV6_EXTRACT_PREF(rt
->fib6_flags
) != pref
) {
1412 struct nl_info nlinfo
= {
1415 rt
->fib6_flags
= (rt
->fib6_flags
& ~RTF_PREF_MASK
) | RTF_PREF(pref
);
1416 inet6_rt_notify(RTM_NEWROUTE
, rt
, &nlinfo
, NLM_F_REPLACE
);
1420 table
= rt
->fib6_table
;
1421 spin_lock_bh(&table
->tb6_lock
);
1423 fib6_set_expires(rt
, jiffies
+ (HZ
* lifetime
));
1424 fib6_add_gc_list(rt
);
1426 spin_unlock_bh(&table
->tb6_lock
);
1428 if (READ_ONCE(in6_dev
->cnf
.accept_ra_min_hop_limit
) < 256 &&
1429 ra_msg
->icmph
.icmp6_hop_limit
) {
1430 if (READ_ONCE(in6_dev
->cnf
.accept_ra_min_hop_limit
) <=
1431 ra_msg
->icmph
.icmp6_hop_limit
) {
1432 WRITE_ONCE(in6_dev
->cnf
.hop_limit
,
1433 ra_msg
->icmph
.icmp6_hop_limit
);
1434 fib6_metric_set(rt
, RTAX_HOPLIMIT
,
1435 ra_msg
->icmph
.icmp6_hop_limit
);
1437 ND_PRINTK(2, warn
, "RA: Got route advertisement with lower hop_limit than minimum\n");
1444 * Update Reachable Time and Retrans Timer
1447 if (in6_dev
->nd_parms
) {
1448 unsigned long rtime
= ntohl(ra_msg
->retrans_timer
);
1450 if (rtime
&& rtime
/1000 < MAX_SCHEDULE_TIMEOUT
/HZ
) {
1451 rtime
= (rtime
*HZ
)/1000;
1454 NEIGH_VAR_SET(in6_dev
->nd_parms
, RETRANS_TIME
, rtime
);
1455 in6_dev
->tstamp
= jiffies
;
1456 send_ifinfo_notify
= true;
1459 rtime
= ntohl(ra_msg
->reachable_time
);
1460 if (rtime
&& rtime
/1000 < MAX_SCHEDULE_TIMEOUT
/(3*HZ
)) {
1461 rtime
= (rtime
*HZ
)/1000;
1466 if (rtime
!= NEIGH_VAR(in6_dev
->nd_parms
, BASE_REACHABLE_TIME
)) {
1467 NEIGH_VAR_SET(in6_dev
->nd_parms
,
1468 BASE_REACHABLE_TIME
, rtime
);
1469 NEIGH_VAR_SET(in6_dev
->nd_parms
,
1470 GC_STALETIME
, 3 * rtime
);
1471 in6_dev
->nd_parms
->reachable_time
= neigh_rand_reach_time(rtime
);
1472 in6_dev
->tstamp
= jiffies
;
1473 send_ifinfo_notify
= true;
1485 neigh
= __neigh_lookup(&nd_tbl
, &ipv6_hdr(skb
)->saddr
,
1489 if (ndopts
.nd_opts_src_lladdr
) {
1490 lladdr
= ndisc_opt_addr_data(ndopts
.nd_opts_src_lladdr
,
1494 "RA: invalid link-layer address length\n");
1498 ndisc_update(skb
->dev
, neigh
, lladdr
, NUD_STALE
,
1499 NEIGH_UPDATE_F_WEAK_OVERRIDE
|
1500 NEIGH_UPDATE_F_OVERRIDE
|
1501 NEIGH_UPDATE_F_OVERRIDE_ISROUTER
|
1502 NEIGH_UPDATE_F_ISROUTER
,
1503 NDISC_ROUTER_ADVERTISEMENT
, &ndopts
);
1504 reason
= SKB_CONSUMED
;
1507 if (!ipv6_accept_ra(in6_dev
)) {
1509 "RA: %s, accept_ra is false for dev: %s\n",
1510 __func__
, skb
->dev
->name
);
1514 #ifdef CONFIG_IPV6_ROUTE_INFO
1515 if (!READ_ONCE(in6_dev
->cnf
.accept_ra_from_local
) &&
1516 ipv6_chk_addr(dev_net(in6_dev
->dev
), &ipv6_hdr(skb
)->saddr
,
1519 "RA from local address detected on dev: %s: router info ignored.\n",
1521 goto skip_routeinfo
;
1524 if (READ_ONCE(in6_dev
->cnf
.accept_ra_rtr_pref
) && ndopts
.nd_opts_ri
) {
1525 struct nd_opt_hdr
*p
;
1526 for (p
= ndopts
.nd_opts_ri
;
1528 p
= ndisc_next_option(p
, ndopts
.nd_opts_ri_end
)) {
1529 struct route_info
*ri
= (struct route_info
*)p
;
1530 #ifdef CONFIG_IPV6_NDISC_NODETYPE
1531 if (skb
->ndisc_nodetype
== NDISC_NODETYPE_NODEFAULT
&&
1532 ri
->prefix_len
== 0)
1535 if (ri
->prefix_len
== 0 &&
1536 !READ_ONCE(in6_dev
->cnf
.accept_ra_defrtr
))
1538 if (ri
->lifetime
!= 0 &&
1539 ntohl(ri
->lifetime
) < READ_ONCE(in6_dev
->cnf
.accept_ra_min_lft
))
1541 if (ri
->prefix_len
< READ_ONCE(in6_dev
->cnf
.accept_ra_rt_info_min_plen
))
1543 if (ri
->prefix_len
> READ_ONCE(in6_dev
->cnf
.accept_ra_rt_info_max_plen
))
1545 rt6_route_rcv(skb
->dev
, (u8
*)p
, (p
->nd_opt_len
) << 3,
1546 &ipv6_hdr(skb
)->saddr
);
1553 #ifdef CONFIG_IPV6_NDISC_NODETYPE
1554 /* skip link-specific ndopts from interior routers */
1555 if (skb
->ndisc_nodetype
== NDISC_NODETYPE_NODEFAULT
) {
1557 "RA: %s, nodetype is NODEFAULT (interior routes), dev: %s\n",
1558 __func__
, skb
->dev
->name
);
1563 if (READ_ONCE(in6_dev
->cnf
.accept_ra_pinfo
) && ndopts
.nd_opts_pi
) {
1564 struct nd_opt_hdr
*p
;
1565 for (p
= ndopts
.nd_opts_pi
;
1567 p
= ndisc_next_option(p
, ndopts
.nd_opts_pi_end
)) {
1568 addrconf_prefix_rcv(skb
->dev
, (u8
*)p
,
1569 (p
->nd_opt_len
) << 3,
1570 ndopts
.nd_opts_src_lladdr
!= NULL
);
1574 if (ndopts
.nd_opts_mtu
&& READ_ONCE(in6_dev
->cnf
.accept_ra_mtu
)) {
1578 memcpy(&n
, ((u8
*)(ndopts
.nd_opts_mtu
+1))+2, sizeof(mtu
));
1581 if (in6_dev
->ra_mtu
!= mtu
) {
1582 in6_dev
->ra_mtu
= mtu
;
1583 send_ifinfo_notify
= true;
1586 if (mtu
< IPV6_MIN_MTU
|| mtu
> skb
->dev
->mtu
) {
1587 ND_PRINTK(2, warn
, "RA: invalid mtu: %d\n", mtu
);
1588 } else if (READ_ONCE(in6_dev
->cnf
.mtu6
) != mtu
) {
1589 WRITE_ONCE(in6_dev
->cnf
.mtu6
, mtu
);
1590 fib6_metric_set(rt
, RTAX_MTU
, mtu
);
1591 rt6_mtu_change(skb
->dev
, mtu
);
1595 if (ndopts
.nd_useropts
) {
1596 struct nd_opt_hdr
*p
;
1597 for (p
= ndopts
.nd_useropts
;
1599 p
= ndisc_next_useropt(skb
->dev
, p
,
1600 ndopts
.nd_useropts_end
)) {
1601 ndisc_ra_useropt(skb
, p
);
1605 if (ndopts
.nd_opts_tgt_lladdr
|| ndopts
.nd_opts_rh
) {
1606 ND_PRINTK(2, warn
, "RA: invalid RA options\n");
1609 /* Send a notify if RA changed managed/otherconf flags or
1610 * timer settings or ra_mtu value
1612 if (send_ifinfo_notify
)
1613 inet6_ifinfo_notify(RTM_NEWLINK
, in6_dev
);
1615 fib6_info_release(rt
);
1617 neigh_release(neigh
);
1621 static enum skb_drop_reason
ndisc_redirect_rcv(struct sk_buff
*skb
)
1623 struct rd_msg
*msg
= (struct rd_msg
*)skb_transport_header(skb
);
1624 u32 ndoptlen
= skb_tail_pointer(skb
) - (skb_transport_header(skb
) +
1625 offsetof(struct rd_msg
, opt
));
1626 struct ndisc_options ndopts
;
1630 #ifdef CONFIG_IPV6_NDISC_NODETYPE
1631 switch (skb
->ndisc_nodetype
) {
1632 case NDISC_NODETYPE_HOST
:
1633 case NDISC_NODETYPE_NODEFAULT
:
1635 "Redirect: from host or unauthorized router\n");
1640 if (!(ipv6_addr_type(&ipv6_hdr(skb
)->saddr
) & IPV6_ADDR_LINKLOCAL
)) {
1642 "Redirect: source address is not link-local\n");
1646 if (!ndisc_parse_options(skb
->dev
, msg
->opt
, ndoptlen
, &ndopts
))
1647 return SKB_DROP_REASON_IPV6_NDISC_BAD_OPTIONS
;
1649 if (!ndopts
.nd_opts_rh
) {
1650 ip6_redirect_no_header(skb
, dev_net(skb
->dev
),
1655 hdr
= (u8
*)ndopts
.nd_opts_rh
;
1657 if (!pskb_pull(skb
, hdr
- skb_transport_header(skb
)))
1658 return SKB_DROP_REASON_PKT_TOO_SMALL
;
1660 return icmpv6_notify(skb
, NDISC_REDIRECT
, 0, 0);
1663 static void ndisc_fill_redirect_hdr_option(struct sk_buff
*skb
,
1664 struct sk_buff
*orig_skb
,
1667 u8
*opt
= skb_put(skb
, rd_len
);
1670 *(opt
++) = ND_OPT_REDIRECT_HDR
;
1671 *(opt
++) = (rd_len
>> 3);
1674 skb_copy_bits(orig_skb
, skb_network_offset(orig_skb
), opt
,
1678 void ndisc_send_redirect(struct sk_buff
*skb
, const struct in6_addr
*target
)
1680 struct net_device
*dev
= skb
->dev
;
1681 struct net
*net
= dev_net(dev
);
1682 struct sock
*sk
= net
->ipv6
.ndisc_sk
;
1684 struct inet_peer
*peer
;
1685 struct sk_buff
*buff
;
1687 struct in6_addr saddr_buf
;
1688 struct rt6_info
*rt
;
1689 struct dst_entry
*dst
;
1692 u8 ha_buf
[MAX_ADDR_LEN
], *ha
= NULL
,
1693 ops_data_buf
[NDISC_OPS_REDIRECT_DATA_SPACE
], *ops_data
= NULL
;
1696 if (netif_is_l3_master(skb
->dev
)) {
1697 dev
= __dev_get_by_index(dev_net(skb
->dev
), IPCB(skb
)->iif
);
1702 if (ipv6_get_lladdr(dev
, &saddr_buf
, IFA_F_TENTATIVE
)) {
1703 ND_PRINTK(2, warn
, "Redirect: no link-local address on %s\n",
1708 if (!ipv6_addr_equal(&ipv6_hdr(skb
)->daddr
, target
) &&
1709 ipv6_addr_type(target
) != (IPV6_ADDR_UNICAST
|IPV6_ADDR_LINKLOCAL
)) {
1711 "Redirect: target address is not link-local unicast\n");
1715 icmpv6_flow_init(sk
, &fl6
, NDISC_REDIRECT
,
1716 &saddr_buf
, &ipv6_hdr(skb
)->saddr
, dev
->ifindex
);
1718 dst
= ip6_route_output(net
, NULL
, &fl6
);
1723 dst
= xfrm_lookup(net
, dst
, flowi6_to_flowi(&fl6
), NULL
, 0);
1727 rt
= dst_rt6_info(dst
);
1729 if (rt
->rt6i_flags
& RTF_GATEWAY
) {
1731 "Redirect: destination is not a neighbour\n");
1734 peer
= inet_getpeer_v6(net
->ipv6
.peers
, &ipv6_hdr(skb
)->saddr
, 1);
1735 ret
= inet_peer_xrlim_allow(peer
, 1*HZ
);
1741 if (dev
->addr_len
) {
1742 struct neighbour
*neigh
= dst_neigh_lookup(skb_dst(skb
), target
);
1745 "Redirect: no neigh for target address\n");
1749 read_lock_bh(&neigh
->lock
);
1750 if (neigh
->nud_state
& NUD_VALID
) {
1751 memcpy(ha_buf
, neigh
->ha
, dev
->addr_len
);
1752 read_unlock_bh(&neigh
->lock
);
1754 optlen
+= ndisc_redirect_opt_addr_space(dev
, neigh
,
1758 read_unlock_bh(&neigh
->lock
);
1760 neigh_release(neigh
);
1763 rd_len
= min_t(unsigned int,
1764 IPV6_MIN_MTU
- sizeof(struct ipv6hdr
) - sizeof(*msg
) - optlen
,
1769 buff
= ndisc_alloc_skb(dev
, sizeof(*msg
) + optlen
);
1773 msg
= skb_put(buff
, sizeof(*msg
));
1774 *msg
= (struct rd_msg
) {
1776 .icmp6_type
= NDISC_REDIRECT
,
1779 .dest
= ipv6_hdr(skb
)->daddr
,
1783 * include target_address option
1787 ndisc_fill_redirect_addr_option(buff
, ha
, ops_data
);
1790 * build redirect option and copy skb over to the new packet.
1794 ndisc_fill_redirect_hdr_option(buff
, skb
, rd_len
);
1796 skb_dst_set(buff
, dst
);
1797 ndisc_send_skb(buff
, &ipv6_hdr(skb
)->saddr
, &saddr_buf
);
1804 static void pndisc_redo(struct sk_buff
*skb
)
1806 enum skb_drop_reason reason
= ndisc_recv_ns(skb
);
1808 kfree_skb_reason(skb
, reason
);
1811 static int ndisc_is_multicast(const void *pkey
)
1813 return ipv6_addr_is_multicast((struct in6_addr
*)pkey
);
1816 static bool ndisc_suppress_frag_ndisc(struct sk_buff
*skb
)
1818 struct inet6_dev
*idev
= __in6_dev_get(skb
->dev
);
1822 if (IP6CB(skb
)->flags
& IP6SKB_FRAGMENTED
&&
1823 READ_ONCE(idev
->cnf
.suppress_frag_ndisc
)) {
1824 net_warn_ratelimited("Received fragmented ndisc packet. Carefully consider disabling suppress_frag_ndisc.\n");
1830 enum skb_drop_reason
ndisc_rcv(struct sk_buff
*skb
)
1835 if (ndisc_suppress_frag_ndisc(skb
))
1836 return SKB_DROP_REASON_IPV6_NDISC_FRAG
;
1838 if (skb_linearize(skb
))
1839 return SKB_DROP_REASON_NOMEM
;
1841 msg
= (struct nd_msg
*)skb_transport_header(skb
);
1843 __skb_push(skb
, skb
->data
- skb_transport_header(skb
));
1845 if (ipv6_hdr(skb
)->hop_limit
!= 255) {
1846 ND_PRINTK(2, warn
, "NDISC: invalid hop-limit: %d\n",
1847 ipv6_hdr(skb
)->hop_limit
);
1848 return SKB_DROP_REASON_IPV6_NDISC_HOP_LIMIT
;
1851 if (msg
->icmph
.icmp6_code
!= 0) {
1852 ND_PRINTK(2, warn
, "NDISC: invalid ICMPv6 code: %d\n",
1853 msg
->icmph
.icmp6_code
);
1854 return SKB_DROP_REASON_IPV6_NDISC_BAD_CODE
;
1857 switch (msg
->icmph
.icmp6_type
) {
1858 case NDISC_NEIGHBOUR_SOLICITATION
:
1859 memset(NEIGH_CB(skb
), 0, sizeof(struct neighbour_cb
));
1860 reason
= ndisc_recv_ns(skb
);
1863 case NDISC_NEIGHBOUR_ADVERTISEMENT
:
1864 reason
= ndisc_recv_na(skb
);
1867 case NDISC_ROUTER_SOLICITATION
:
1868 reason
= ndisc_recv_rs(skb
);
1871 case NDISC_ROUTER_ADVERTISEMENT
:
1872 reason
= ndisc_router_discovery(skb
);
1875 case NDISC_REDIRECT
:
1876 reason
= ndisc_redirect_rcv(skb
);
1883 static int ndisc_netdev_event(struct notifier_block
*this, unsigned long event
, void *ptr
)
1885 struct net_device
*dev
= netdev_notifier_info_to_dev(ptr
);
1886 struct netdev_notifier_change_info
*change_info
;
1887 struct net
*net
= dev_net(dev
);
1888 struct inet6_dev
*idev
;
1889 bool evict_nocarrier
;
1892 case NETDEV_CHANGEADDR
:
1893 neigh_changeaddr(&nd_tbl
, dev
);
1894 fib6_run_gc(0, net
, false);
1897 idev
= in6_dev_get(dev
);
1900 if (READ_ONCE(idev
->cnf
.ndisc_notify
) ||
1901 READ_ONCE(net
->ipv6
.devconf_all
->ndisc_notify
))
1902 ndisc_send_unsol_na(dev
);
1906 idev
= in6_dev_get(dev
);
1908 evict_nocarrier
= true;
1910 evict_nocarrier
= READ_ONCE(idev
->cnf
.ndisc_evict_nocarrier
) &&
1911 READ_ONCE(net
->ipv6
.devconf_all
->ndisc_evict_nocarrier
);
1916 if (change_info
->flags_changed
& IFF_NOARP
)
1917 neigh_changeaddr(&nd_tbl
, dev
);
1918 if (evict_nocarrier
&& !netif_carrier_ok(dev
))
1919 neigh_carrier_down(&nd_tbl
, dev
);
1922 neigh_ifdown(&nd_tbl
, dev
);
1923 fib6_run_gc(0, net
, false);
1925 case NETDEV_NOTIFY_PEERS
:
1926 ndisc_send_unsol_na(dev
);
1935 static struct notifier_block ndisc_netdev_notifier
= {
1936 .notifier_call
= ndisc_netdev_event
,
1937 .priority
= ADDRCONF_NOTIFY_PRIORITY
- 5,
1940 #ifdef CONFIG_SYSCTL
1941 static void ndisc_warn_deprecated_sysctl(const struct ctl_table
*ctl
,
1942 const char *func
, const char *dev_name
)
1944 static char warncomm
[TASK_COMM_LEN
];
1946 if (strcmp(warncomm
, current
->comm
) && warned
< 5) {
1947 strscpy(warncomm
, current
->comm
);
1948 pr_warn("process `%s' is using deprecated sysctl (%s) net.ipv6.neigh.%s.%s - use net.ipv6.neigh.%s.%s_ms instead\n",
1950 dev_name
, ctl
->procname
,
1951 dev_name
, ctl
->procname
);
1956 int ndisc_ifinfo_sysctl_change(const struct ctl_table
*ctl
, int write
, void *buffer
,
1957 size_t *lenp
, loff_t
*ppos
)
1959 struct net_device
*dev
= ctl
->extra1
;
1960 struct inet6_dev
*idev
;
1963 if ((strcmp(ctl
->procname
, "retrans_time") == 0) ||
1964 (strcmp(ctl
->procname
, "base_reachable_time") == 0))
1965 ndisc_warn_deprecated_sysctl(ctl
, "syscall", dev
? dev
->name
: "default");
1967 if (strcmp(ctl
->procname
, "retrans_time") == 0)
1968 ret
= neigh_proc_dointvec(ctl
, write
, buffer
, lenp
, ppos
);
1970 else if (strcmp(ctl
->procname
, "base_reachable_time") == 0)
1971 ret
= neigh_proc_dointvec_jiffies(ctl
, write
,
1972 buffer
, lenp
, ppos
);
1974 else if ((strcmp(ctl
->procname
, "retrans_time_ms") == 0) ||
1975 (strcmp(ctl
->procname
, "base_reachable_time_ms") == 0))
1976 ret
= neigh_proc_dointvec_ms_jiffies(ctl
, write
,
1977 buffer
, lenp
, ppos
);
1981 if (write
&& ret
== 0 && dev
&& (idev
= in6_dev_get(dev
)) != NULL
) {
1982 if (ctl
->data
== &NEIGH_VAR(idev
->nd_parms
, BASE_REACHABLE_TIME
))
1983 idev
->nd_parms
->reachable_time
=
1984 neigh_rand_reach_time(NEIGH_VAR(idev
->nd_parms
, BASE_REACHABLE_TIME
));
1985 WRITE_ONCE(idev
->tstamp
, jiffies
);
1986 inet6_ifinfo_notify(RTM_NEWLINK
, idev
);
1995 static int __net_init
ndisc_net_init(struct net
*net
)
1997 struct ipv6_pinfo
*np
;
2001 err
= inet_ctl_sock_create(&sk
, PF_INET6
,
2002 SOCK_RAW
, IPPROTO_ICMPV6
, net
);
2005 "NDISC: Failed to initialize the control socket (err %d)\n",
2010 net
->ipv6
.ndisc_sk
= sk
;
2013 np
->hop_limit
= 255;
2014 /* Do not loopback ndisc messages */
2015 inet6_clear_bit(MC6_LOOP
, sk
);
2020 static void __net_exit
ndisc_net_exit(struct net
*net
)
2022 inet_ctl_sock_destroy(net
->ipv6
.ndisc_sk
);
2025 static struct pernet_operations ndisc_net_ops
= {
2026 .init
= ndisc_net_init
,
2027 .exit
= ndisc_net_exit
,
2030 int __init
ndisc_init(void)
2034 err
= register_pernet_subsys(&ndisc_net_ops
);
2038 * Initialize the neighbour table
2040 neigh_table_init(NEIGH_ND_TABLE
, &nd_tbl
);
2042 #ifdef CONFIG_SYSCTL
2043 err
= neigh_sysctl_register(NULL
, &nd_tbl
.parms
,
2044 ndisc_ifinfo_sysctl_change
);
2046 goto out_unregister_pernet
;
2051 #ifdef CONFIG_SYSCTL
2052 out_unregister_pernet
:
2053 unregister_pernet_subsys(&ndisc_net_ops
);
2058 int __init
ndisc_late_init(void)
2060 return register_netdevice_notifier(&ndisc_netdev_notifier
);
2063 void ndisc_late_cleanup(void)
2065 unregister_netdevice_notifier(&ndisc_netdev_notifier
);
2068 void ndisc_cleanup(void)
2070 #ifdef CONFIG_SYSCTL
2071 neigh_sysctl_unregister(&nd_tbl
.parms
);
2073 neigh_table_clear(NEIGH_ND_TABLE
, &nd_tbl
);
2074 unregister_pernet_subsys(&ndisc_net_ops
);