Merge tag 'for_linus' of git://git.kernel.org/pub/scm/linux/kernel/git/mst/vhost
[cris-mirror.git] / net / ipv6 / mcast.c
blob9b9d2ff01b3554cbf5f176e642484d1efde6a547
/*
 *	Multicast support for IPv6
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *
 *	Based on linux/ipv4/igmp.c and linux/ipv4/ip_sockglue.c
 *
 *	This program is free software; you can redistribute it and/or
 *	modify it under the terms of the GNU General Public License
 *	as published by the Free Software Foundation; either version
 *	2 of the License, or (at your option) any later version.
 */
/* Changes:
 *
 *	yoshfuji	: fix format of router-alert option
 *	YOSHIFUJI Hideaki @USAGI:
 *		Fixed source address for MLD message based on
 *		<draft-ietf-magma-mld-source-05.txt>.
 *	YOSHIFUJI Hideaki @USAGI:
 *		- Ignore Queries for invalid addresses.
 *		- MLD for link-local addresses.
 *	David L Stevens <dlstevens@us.ibm.com>:
 *		- MLDv2 support
 */
29 #include <linux/module.h>
30 #include <linux/errno.h>
31 #include <linux/types.h>
32 #include <linux/string.h>
33 #include <linux/socket.h>
34 #include <linux/sockios.h>
35 #include <linux/jiffies.h>
36 #include <linux/times.h>
37 #include <linux/net.h>
38 #include <linux/in.h>
39 #include <linux/in6.h>
40 #include <linux/netdevice.h>
41 #include <linux/if_arp.h>
42 #include <linux/route.h>
43 #include <linux/init.h>
44 #include <linux/proc_fs.h>
45 #include <linux/seq_file.h>
46 #include <linux/slab.h>
47 #include <linux/pkt_sched.h>
48 #include <net/mld.h>
50 #include <linux/netfilter.h>
51 #include <linux/netfilter_ipv6.h>
53 #include <net/net_namespace.h>
54 #include <net/sock.h>
55 #include <net/snmp.h>
57 #include <net/ipv6.h>
58 #include <net/protocol.h>
59 #include <net/if_inet6.h>
60 #include <net/ndisc.h>
61 #include <net/addrconf.h>
62 #include <net/ip6_route.h>
63 #include <net/inet_common.h>
65 #include <net/ip6_checksum.h>
67 /* Ensure that we have struct in6_addr aligned on 32bit word. */
68 static int __mld2_query_bugs[] __attribute__((__unused__)) = {
69 BUILD_BUG_ON_ZERO(offsetof(struct mld2_query, mld2q_srcs) % 4),
70 BUILD_BUG_ON_ZERO(offsetof(struct mld2_report, mld2r_grec) % 4),
71 BUILD_BUG_ON_ZERO(offsetof(struct mld2_grec, grec_mca) % 4)
74 static struct in6_addr mld2_all_mcr = MLD2_ALL_MCR_INIT;
76 static void igmp6_join_group(struct ifmcaddr6 *ma);
77 static void igmp6_leave_group(struct ifmcaddr6 *ma);
78 static void igmp6_timer_handler(struct timer_list *t);
80 static void mld_gq_timer_expire(struct timer_list *t);
81 static void mld_ifc_timer_expire(struct timer_list *t);
82 static void mld_ifc_event(struct inet6_dev *idev);
83 static void mld_add_delrec(struct inet6_dev *idev, struct ifmcaddr6 *pmc);
84 static void mld_del_delrec(struct inet6_dev *idev, struct ifmcaddr6 *pmc);
85 static void mld_clear_delrec(struct inet6_dev *idev);
86 static bool mld_in_v1_mode(const struct inet6_dev *idev);
87 static int sf_setstate(struct ifmcaddr6 *pmc);
88 static void sf_markstate(struct ifmcaddr6 *pmc);
89 static void ip6_mc_clear_src(struct ifmcaddr6 *pmc);
90 static int ip6_mc_del_src(struct inet6_dev *idev, const struct in6_addr *pmca,
91 int sfmode, int sfcount, const struct in6_addr *psfsrc,
92 int delta);
93 static int ip6_mc_add_src(struct inet6_dev *idev, const struct in6_addr *pmca,
94 int sfmode, int sfcount, const struct in6_addr *psfsrc,
95 int delta);
96 static int ip6_mc_leave_src(struct sock *sk, struct ipv6_mc_socklist *iml,
97 struct inet6_dev *idev);
99 #define MLD_QRV_DEFAULT 2
100 /* RFC3810, 9.2. Query Interval */
101 #define MLD_QI_DEFAULT (125 * HZ)
102 /* RFC3810, 9.3. Query Response Interval */
103 #define MLD_QRI_DEFAULT (10 * HZ)
105 /* RFC3810, 8.1 Query Version Distinctions */
106 #define MLD_V1_QUERY_LEN 24
107 #define MLD_V2_QUERY_LEN_MIN 28
109 #define IPV6_MLD_MAX_MSF 64
111 int sysctl_mld_max_msf __read_mostly = IPV6_MLD_MAX_MSF;
112 int sysctl_mld_qrv __read_mostly = MLD_QRV_DEFAULT;
/*
 *	socket join on multicast group
 */
/* Walk the per-socket multicast membership list hanging off @np.
 *
 * @np:  pointer to the object owning the ->ipv6_mc_list head
 * @pmc: cursor variable; it is NULL once the loop has run to completion and
 *       still points at the current entry if the body breaks out early
 *
 * Both the head and every ->next link are fetched with rcu_dereference().
 * The macro arguments are parenthesized so that expressions such as
 * "&obj" can be passed for @np without operator-precedence surprises.
 */
#define for_each_pmc_rcu(np, pmc)				\
	for ((pmc) = rcu_dereference((np)->ipv6_mc_list);	\
	     (pmc) != NULL;					\
	     (pmc) = rcu_dereference((pmc)->next))
123 static int unsolicited_report_interval(struct inet6_dev *idev)
125 int iv;
127 if (mld_in_v1_mode(idev))
128 iv = idev->cnf.mldv1_unsolicited_report_interval;
129 else
130 iv = idev->cnf.mldv2_unsolicited_report_interval;
132 return iv > 0 ? iv : 1;
135 int ipv6_sock_mc_join(struct sock *sk, int ifindex, const struct in6_addr *addr)
137 struct net_device *dev = NULL;
138 struct ipv6_mc_socklist *mc_lst;
139 struct ipv6_pinfo *np = inet6_sk(sk);
140 struct net *net = sock_net(sk);
141 int err;
143 ASSERT_RTNL();
145 if (!ipv6_addr_is_multicast(addr))
146 return -EINVAL;
148 rcu_read_lock();
149 for_each_pmc_rcu(np, mc_lst) {
150 if ((ifindex == 0 || mc_lst->ifindex == ifindex) &&
151 ipv6_addr_equal(&mc_lst->addr, addr)) {
152 rcu_read_unlock();
153 return -EADDRINUSE;
156 rcu_read_unlock();
158 mc_lst = sock_kmalloc(sk, sizeof(struct ipv6_mc_socklist), GFP_KERNEL);
160 if (!mc_lst)
161 return -ENOMEM;
163 mc_lst->next = NULL;
164 mc_lst->addr = *addr;
166 if (ifindex == 0) {
167 struct rt6_info *rt;
168 rt = rt6_lookup(net, addr, NULL, 0, 0);
169 if (rt) {
170 dev = rt->dst.dev;
171 ip6_rt_put(rt);
173 } else
174 dev = __dev_get_by_index(net, ifindex);
176 if (!dev) {
177 sock_kfree_s(sk, mc_lst, sizeof(*mc_lst));
178 return -ENODEV;
181 mc_lst->ifindex = dev->ifindex;
182 mc_lst->sfmode = MCAST_EXCLUDE;
183 rwlock_init(&mc_lst->sflock);
184 mc_lst->sflist = NULL;
187 * now add/increase the group membership on the device
190 err = ipv6_dev_mc_inc(dev, addr);
192 if (err) {
193 sock_kfree_s(sk, mc_lst, sizeof(*mc_lst));
194 return err;
197 mc_lst->next = np->ipv6_mc_list;
198 rcu_assign_pointer(np->ipv6_mc_list, mc_lst);
200 return 0;
202 EXPORT_SYMBOL(ipv6_sock_mc_join);
205 * socket leave on multicast group
207 int ipv6_sock_mc_drop(struct sock *sk, int ifindex, const struct in6_addr *addr)
209 struct ipv6_pinfo *np = inet6_sk(sk);
210 struct ipv6_mc_socklist *mc_lst;
211 struct ipv6_mc_socklist __rcu **lnk;
212 struct net *net = sock_net(sk);
214 ASSERT_RTNL();
216 if (!ipv6_addr_is_multicast(addr))
217 return -EINVAL;
219 for (lnk = &np->ipv6_mc_list;
220 (mc_lst = rtnl_dereference(*lnk)) != NULL;
221 lnk = &mc_lst->next) {
222 if ((ifindex == 0 || mc_lst->ifindex == ifindex) &&
223 ipv6_addr_equal(&mc_lst->addr, addr)) {
224 struct net_device *dev;
226 *lnk = mc_lst->next;
228 dev = __dev_get_by_index(net, mc_lst->ifindex);
229 if (dev) {
230 struct inet6_dev *idev = __in6_dev_get(dev);
232 (void) ip6_mc_leave_src(sk, mc_lst, idev);
233 if (idev)
234 __ipv6_dev_mc_dec(idev, &mc_lst->addr);
235 } else
236 (void) ip6_mc_leave_src(sk, mc_lst, NULL);
238 atomic_sub(sizeof(*mc_lst), &sk->sk_omem_alloc);
239 kfree_rcu(mc_lst, rcu);
240 return 0;
244 return -EADDRNOTAVAIL;
246 EXPORT_SYMBOL(ipv6_sock_mc_drop);
248 /* called with rcu_read_lock() */
249 static struct inet6_dev *ip6_mc_find_dev_rcu(struct net *net,
250 const struct in6_addr *group,
251 int ifindex)
253 struct net_device *dev = NULL;
254 struct inet6_dev *idev = NULL;
256 if (ifindex == 0) {
257 struct rt6_info *rt = rt6_lookup(net, group, NULL, 0, 0);
259 if (rt) {
260 dev = rt->dst.dev;
261 ip6_rt_put(rt);
263 } else
264 dev = dev_get_by_index_rcu(net, ifindex);
266 if (!dev)
267 return NULL;
268 idev = __in6_dev_get(dev);
269 if (!idev)
270 return NULL;
271 read_lock_bh(&idev->lock);
272 if (idev->dead) {
273 read_unlock_bh(&idev->lock);
274 return NULL;
276 return idev;
279 void __ipv6_sock_mc_close(struct sock *sk)
281 struct ipv6_pinfo *np = inet6_sk(sk);
282 struct ipv6_mc_socklist *mc_lst;
283 struct net *net = sock_net(sk);
285 ASSERT_RTNL();
287 while ((mc_lst = rtnl_dereference(np->ipv6_mc_list)) != NULL) {
288 struct net_device *dev;
290 np->ipv6_mc_list = mc_lst->next;
292 dev = __dev_get_by_index(net, mc_lst->ifindex);
293 if (dev) {
294 struct inet6_dev *idev = __in6_dev_get(dev);
296 (void) ip6_mc_leave_src(sk, mc_lst, idev);
297 if (idev)
298 __ipv6_dev_mc_dec(idev, &mc_lst->addr);
299 } else
300 (void) ip6_mc_leave_src(sk, mc_lst, NULL);
302 atomic_sub(sizeof(*mc_lst), &sk->sk_omem_alloc);
303 kfree_rcu(mc_lst, rcu);
307 void ipv6_sock_mc_close(struct sock *sk)
309 struct ipv6_pinfo *np = inet6_sk(sk);
311 if (!rcu_access_pointer(np->ipv6_mc_list))
312 return;
313 rtnl_lock();
314 __ipv6_sock_mc_close(sk);
315 rtnl_unlock();
318 int ip6_mc_source(int add, int omode, struct sock *sk,
319 struct group_source_req *pgsr)
321 struct in6_addr *source, *group;
322 struct ipv6_mc_socklist *pmc;
323 struct inet6_dev *idev;
324 struct ipv6_pinfo *inet6 = inet6_sk(sk);
325 struct ip6_sf_socklist *psl;
326 struct net *net = sock_net(sk);
327 int i, j, rv;
328 int leavegroup = 0;
329 int pmclocked = 0;
330 int err;
332 source = &((struct sockaddr_in6 *)&pgsr->gsr_source)->sin6_addr;
333 group = &((struct sockaddr_in6 *)&pgsr->gsr_group)->sin6_addr;
335 if (!ipv6_addr_is_multicast(group))
336 return -EINVAL;
338 rcu_read_lock();
339 idev = ip6_mc_find_dev_rcu(net, group, pgsr->gsr_interface);
340 if (!idev) {
341 rcu_read_unlock();
342 return -ENODEV;
345 err = -EADDRNOTAVAIL;
347 for_each_pmc_rcu(inet6, pmc) {
348 if (pgsr->gsr_interface && pmc->ifindex != pgsr->gsr_interface)
349 continue;
350 if (ipv6_addr_equal(&pmc->addr, group))
351 break;
353 if (!pmc) { /* must have a prior join */
354 err = -EINVAL;
355 goto done;
357 /* if a source filter was set, must be the same mode as before */
358 if (pmc->sflist) {
359 if (pmc->sfmode != omode) {
360 err = -EINVAL;
361 goto done;
363 } else if (pmc->sfmode != omode) {
364 /* allow mode switches for empty-set filters */
365 ip6_mc_add_src(idev, group, omode, 0, NULL, 0);
366 ip6_mc_del_src(idev, group, pmc->sfmode, 0, NULL, 0);
367 pmc->sfmode = omode;
370 write_lock(&pmc->sflock);
371 pmclocked = 1;
373 psl = pmc->sflist;
374 if (!add) {
375 if (!psl)
376 goto done; /* err = -EADDRNOTAVAIL */
377 rv = !0;
378 for (i = 0; i < psl->sl_count; i++) {
379 rv = !ipv6_addr_equal(&psl->sl_addr[i], source);
380 if (rv == 0)
381 break;
383 if (rv) /* source not found */
384 goto done; /* err = -EADDRNOTAVAIL */
386 /* special case - (INCLUDE, empty) == LEAVE_GROUP */
387 if (psl->sl_count == 1 && omode == MCAST_INCLUDE) {
388 leavegroup = 1;
389 goto done;
392 /* update the interface filter */
393 ip6_mc_del_src(idev, group, omode, 1, source, 1);
395 for (j = i+1; j < psl->sl_count; j++)
396 psl->sl_addr[j-1] = psl->sl_addr[j];
397 psl->sl_count--;
398 err = 0;
399 goto done;
401 /* else, add a new source to the filter */
403 if (psl && psl->sl_count >= sysctl_mld_max_msf) {
404 err = -ENOBUFS;
405 goto done;
407 if (!psl || psl->sl_count == psl->sl_max) {
408 struct ip6_sf_socklist *newpsl;
409 int count = IP6_SFBLOCK;
411 if (psl)
412 count += psl->sl_max;
413 newpsl = sock_kmalloc(sk, IP6_SFLSIZE(count), GFP_ATOMIC);
414 if (!newpsl) {
415 err = -ENOBUFS;
416 goto done;
418 newpsl->sl_max = count;
419 newpsl->sl_count = count - IP6_SFBLOCK;
420 if (psl) {
421 for (i = 0; i < psl->sl_count; i++)
422 newpsl->sl_addr[i] = psl->sl_addr[i];
423 sock_kfree_s(sk, psl, IP6_SFLSIZE(psl->sl_max));
425 pmc->sflist = psl = newpsl;
427 rv = 1; /* > 0 for insert logic below if sl_count is 0 */
428 for (i = 0; i < psl->sl_count; i++) {
429 rv = !ipv6_addr_equal(&psl->sl_addr[i], source);
430 if (rv == 0) /* There is an error in the address. */
431 goto done;
433 for (j = psl->sl_count-1; j >= i; j--)
434 psl->sl_addr[j+1] = psl->sl_addr[j];
435 psl->sl_addr[i] = *source;
436 psl->sl_count++;
437 err = 0;
438 /* update the interface list */
439 ip6_mc_add_src(idev, group, omode, 1, source, 1);
440 done:
441 if (pmclocked)
442 write_unlock(&pmc->sflock);
443 read_unlock_bh(&idev->lock);
444 rcu_read_unlock();
445 if (leavegroup)
446 err = ipv6_sock_mc_drop(sk, pgsr->gsr_interface, group);
447 return err;
450 int ip6_mc_msfilter(struct sock *sk, struct group_filter *gsf)
452 const struct in6_addr *group;
453 struct ipv6_mc_socklist *pmc;
454 struct inet6_dev *idev;
455 struct ipv6_pinfo *inet6 = inet6_sk(sk);
456 struct ip6_sf_socklist *newpsl, *psl;
457 struct net *net = sock_net(sk);
458 int leavegroup = 0;
459 int i, err;
461 group = &((struct sockaddr_in6 *)&gsf->gf_group)->sin6_addr;
463 if (!ipv6_addr_is_multicast(group))
464 return -EINVAL;
465 if (gsf->gf_fmode != MCAST_INCLUDE &&
466 gsf->gf_fmode != MCAST_EXCLUDE)
467 return -EINVAL;
469 rcu_read_lock();
470 idev = ip6_mc_find_dev_rcu(net, group, gsf->gf_interface);
472 if (!idev) {
473 rcu_read_unlock();
474 return -ENODEV;
477 err = 0;
479 if (gsf->gf_fmode == MCAST_INCLUDE && gsf->gf_numsrc == 0) {
480 leavegroup = 1;
481 goto done;
484 for_each_pmc_rcu(inet6, pmc) {
485 if (pmc->ifindex != gsf->gf_interface)
486 continue;
487 if (ipv6_addr_equal(&pmc->addr, group))
488 break;
490 if (!pmc) { /* must have a prior join */
491 err = -EINVAL;
492 goto done;
494 if (gsf->gf_numsrc) {
495 newpsl = sock_kmalloc(sk, IP6_SFLSIZE(gsf->gf_numsrc),
496 GFP_ATOMIC);
497 if (!newpsl) {
498 err = -ENOBUFS;
499 goto done;
501 newpsl->sl_max = newpsl->sl_count = gsf->gf_numsrc;
502 for (i = 0; i < newpsl->sl_count; ++i) {
503 struct sockaddr_in6 *psin6;
505 psin6 = (struct sockaddr_in6 *)&gsf->gf_slist[i];
506 newpsl->sl_addr[i] = psin6->sin6_addr;
508 err = ip6_mc_add_src(idev, group, gsf->gf_fmode,
509 newpsl->sl_count, newpsl->sl_addr, 0);
510 if (err) {
511 sock_kfree_s(sk, newpsl, IP6_SFLSIZE(newpsl->sl_max));
512 goto done;
514 } else {
515 newpsl = NULL;
516 (void) ip6_mc_add_src(idev, group, gsf->gf_fmode, 0, NULL, 0);
519 write_lock(&pmc->sflock);
520 psl = pmc->sflist;
521 if (psl) {
522 (void) ip6_mc_del_src(idev, group, pmc->sfmode,
523 psl->sl_count, psl->sl_addr, 0);
524 sock_kfree_s(sk, psl, IP6_SFLSIZE(psl->sl_max));
525 } else
526 (void) ip6_mc_del_src(idev, group, pmc->sfmode, 0, NULL, 0);
527 pmc->sflist = newpsl;
528 pmc->sfmode = gsf->gf_fmode;
529 write_unlock(&pmc->sflock);
530 err = 0;
531 done:
532 read_unlock_bh(&idev->lock);
533 rcu_read_unlock();
534 if (leavegroup)
535 err = ipv6_sock_mc_drop(sk, gsf->gf_interface, group);
536 return err;
539 int ip6_mc_msfget(struct sock *sk, struct group_filter *gsf,
540 struct group_filter __user *optval, int __user *optlen)
542 int err, i, count, copycount;
543 const struct in6_addr *group;
544 struct ipv6_mc_socklist *pmc;
545 struct inet6_dev *idev;
546 struct ipv6_pinfo *inet6 = inet6_sk(sk);
547 struct ip6_sf_socklist *psl;
548 struct net *net = sock_net(sk);
550 group = &((struct sockaddr_in6 *)&gsf->gf_group)->sin6_addr;
552 if (!ipv6_addr_is_multicast(group))
553 return -EINVAL;
555 rcu_read_lock();
556 idev = ip6_mc_find_dev_rcu(net, group, gsf->gf_interface);
558 if (!idev) {
559 rcu_read_unlock();
560 return -ENODEV;
563 err = -EADDRNOTAVAIL;
564 /* changes to the ipv6_mc_list require the socket lock and
565 * rtnl lock. We have the socket lock and rcu read lock,
566 * so reading the list is safe.
569 for_each_pmc_rcu(inet6, pmc) {
570 if (pmc->ifindex != gsf->gf_interface)
571 continue;
572 if (ipv6_addr_equal(group, &pmc->addr))
573 break;
575 if (!pmc) /* must have a prior join */
576 goto done;
577 gsf->gf_fmode = pmc->sfmode;
578 psl = pmc->sflist;
579 count = psl ? psl->sl_count : 0;
580 read_unlock_bh(&idev->lock);
581 rcu_read_unlock();
583 copycount = count < gsf->gf_numsrc ? count : gsf->gf_numsrc;
584 gsf->gf_numsrc = count;
585 if (put_user(GROUP_FILTER_SIZE(copycount), optlen) ||
586 copy_to_user(optval, gsf, GROUP_FILTER_SIZE(0))) {
587 return -EFAULT;
589 /* changes to psl require the socket lock, and a write lock
590 * on pmc->sflock. We have the socket lock so reading here is safe.
592 for (i = 0; i < copycount; i++) {
593 struct sockaddr_in6 *psin6;
594 struct sockaddr_storage ss;
596 psin6 = (struct sockaddr_in6 *)&ss;
597 memset(&ss, 0, sizeof(ss));
598 psin6->sin6_family = AF_INET6;
599 psin6->sin6_addr = psl->sl_addr[i];
600 if (copy_to_user(&optval->gf_slist[i], &ss, sizeof(ss)))
601 return -EFAULT;
603 return 0;
604 done:
605 read_unlock_bh(&idev->lock);
606 rcu_read_unlock();
607 return err;
610 bool inet6_mc_check(struct sock *sk, const struct in6_addr *mc_addr,
611 const struct in6_addr *src_addr)
613 struct ipv6_pinfo *np = inet6_sk(sk);
614 struct ipv6_mc_socklist *mc;
615 struct ip6_sf_socklist *psl;
616 bool rv = true;
618 rcu_read_lock();
619 for_each_pmc_rcu(np, mc) {
620 if (ipv6_addr_equal(&mc->addr, mc_addr))
621 break;
623 if (!mc) {
624 rcu_read_unlock();
625 return true;
627 read_lock(&mc->sflock);
628 psl = mc->sflist;
629 if (!psl) {
630 rv = mc->sfmode == MCAST_EXCLUDE;
631 } else {
632 int i;
634 for (i = 0; i < psl->sl_count; i++) {
635 if (ipv6_addr_equal(&psl->sl_addr[i], src_addr))
636 break;
638 if (mc->sfmode == MCAST_INCLUDE && i >= psl->sl_count)
639 rv = false;
640 if (mc->sfmode == MCAST_EXCLUDE && i < psl->sl_count)
641 rv = false;
643 read_unlock(&mc->sflock);
644 rcu_read_unlock();
646 return rv;
649 static void igmp6_group_added(struct ifmcaddr6 *mc)
651 struct net_device *dev = mc->idev->dev;
652 char buf[MAX_ADDR_LEN];
654 if (IPV6_ADDR_MC_SCOPE(&mc->mca_addr) <
655 IPV6_ADDR_SCOPE_LINKLOCAL)
656 return;
658 spin_lock_bh(&mc->mca_lock);
659 if (!(mc->mca_flags&MAF_LOADED)) {
660 mc->mca_flags |= MAF_LOADED;
661 if (ndisc_mc_map(&mc->mca_addr, buf, dev, 0) == 0)
662 dev_mc_add(dev, buf);
664 spin_unlock_bh(&mc->mca_lock);
666 if (!(dev->flags & IFF_UP) || (mc->mca_flags & MAF_NOREPORT))
667 return;
669 if (mld_in_v1_mode(mc->idev)) {
670 igmp6_join_group(mc);
671 return;
673 /* else v2 */
675 mc->mca_crcount = mc->idev->mc_qrv;
676 mld_ifc_event(mc->idev);
679 static void igmp6_group_dropped(struct ifmcaddr6 *mc)
681 struct net_device *dev = mc->idev->dev;
682 char buf[MAX_ADDR_LEN];
684 if (IPV6_ADDR_MC_SCOPE(&mc->mca_addr) <
685 IPV6_ADDR_SCOPE_LINKLOCAL)
686 return;
688 spin_lock_bh(&mc->mca_lock);
689 if (mc->mca_flags&MAF_LOADED) {
690 mc->mca_flags &= ~MAF_LOADED;
691 if (ndisc_mc_map(&mc->mca_addr, buf, dev, 0) == 0)
692 dev_mc_del(dev, buf);
695 spin_unlock_bh(&mc->mca_lock);
696 if (mc->mca_flags & MAF_NOREPORT)
697 return;
699 if (!mc->idev->dead)
700 igmp6_leave_group(mc);
702 spin_lock_bh(&mc->mca_lock);
703 if (del_timer(&mc->mca_timer))
704 refcount_dec(&mc->mca_refcnt);
705 spin_unlock_bh(&mc->mca_lock);
/*
 *	deleted ifmcaddr6 manipulation
 */
711 static void mld_add_delrec(struct inet6_dev *idev, struct ifmcaddr6 *im)
713 struct ifmcaddr6 *pmc;
715 /* this is an "ifmcaddr6" for convenience; only the fields below
716 * are actually used. In particular, the refcnt and users are not
717 * used for management of the delete list. Using the same structure
718 * for deleted items allows change reports to use common code with
719 * non-deleted or query-response MCA's.
721 pmc = kzalloc(sizeof(*pmc), GFP_ATOMIC);
722 if (!pmc)
723 return;
725 spin_lock_bh(&im->mca_lock);
726 spin_lock_init(&pmc->mca_lock);
727 pmc->idev = im->idev;
728 in6_dev_hold(idev);
729 pmc->mca_addr = im->mca_addr;
730 pmc->mca_crcount = idev->mc_qrv;
731 pmc->mca_sfmode = im->mca_sfmode;
732 if (pmc->mca_sfmode == MCAST_INCLUDE) {
733 struct ip6_sf_list *psf;
735 pmc->mca_tomb = im->mca_tomb;
736 pmc->mca_sources = im->mca_sources;
737 im->mca_tomb = im->mca_sources = NULL;
738 for (psf = pmc->mca_sources; psf; psf = psf->sf_next)
739 psf->sf_crcount = pmc->mca_crcount;
741 spin_unlock_bh(&im->mca_lock);
743 spin_lock_bh(&idev->mc_lock);
744 pmc->next = idev->mc_tomb;
745 idev->mc_tomb = pmc;
746 spin_unlock_bh(&idev->mc_lock);
749 static void mld_del_delrec(struct inet6_dev *idev, struct ifmcaddr6 *im)
751 struct ifmcaddr6 *pmc, *pmc_prev;
752 struct ip6_sf_list *psf;
753 struct in6_addr *pmca = &im->mca_addr;
755 spin_lock_bh(&idev->mc_lock);
756 pmc_prev = NULL;
757 for (pmc = idev->mc_tomb; pmc; pmc = pmc->next) {
758 if (ipv6_addr_equal(&pmc->mca_addr, pmca))
759 break;
760 pmc_prev = pmc;
762 if (pmc) {
763 if (pmc_prev)
764 pmc_prev->next = pmc->next;
765 else
766 idev->mc_tomb = pmc->next;
768 spin_unlock_bh(&idev->mc_lock);
770 spin_lock_bh(&im->mca_lock);
771 if (pmc) {
772 im->idev = pmc->idev;
773 im->mca_crcount = idev->mc_qrv;
774 im->mca_sfmode = pmc->mca_sfmode;
775 if (pmc->mca_sfmode == MCAST_INCLUDE) {
776 im->mca_tomb = pmc->mca_tomb;
777 im->mca_sources = pmc->mca_sources;
778 for (psf = im->mca_sources; psf; psf = psf->sf_next)
779 psf->sf_crcount = im->mca_crcount;
781 in6_dev_put(pmc->idev);
782 kfree(pmc);
784 spin_unlock_bh(&im->mca_lock);
787 static void mld_clear_delrec(struct inet6_dev *idev)
789 struct ifmcaddr6 *pmc, *nextpmc;
791 spin_lock_bh(&idev->mc_lock);
792 pmc = idev->mc_tomb;
793 idev->mc_tomb = NULL;
794 spin_unlock_bh(&idev->mc_lock);
796 for (; pmc; pmc = nextpmc) {
797 nextpmc = pmc->next;
798 ip6_mc_clear_src(pmc);
799 in6_dev_put(pmc->idev);
800 kfree(pmc);
803 /* clear dead sources, too */
804 read_lock_bh(&idev->lock);
805 for (pmc = idev->mc_list; pmc; pmc = pmc->next) {
806 struct ip6_sf_list *psf, *psf_next;
808 spin_lock_bh(&pmc->mca_lock);
809 psf = pmc->mca_tomb;
810 pmc->mca_tomb = NULL;
811 spin_unlock_bh(&pmc->mca_lock);
812 for (; psf; psf = psf_next) {
813 psf_next = psf->sf_next;
814 kfree(psf);
817 read_unlock_bh(&idev->lock);
820 static void mca_get(struct ifmcaddr6 *mc)
822 refcount_inc(&mc->mca_refcnt);
825 static void ma_put(struct ifmcaddr6 *mc)
827 if (refcount_dec_and_test(&mc->mca_refcnt)) {
828 in6_dev_put(mc->idev);
829 kfree(mc);
833 static struct ifmcaddr6 *mca_alloc(struct inet6_dev *idev,
834 const struct in6_addr *addr)
836 struct ifmcaddr6 *mc;
838 mc = kzalloc(sizeof(*mc), GFP_ATOMIC);
839 if (!mc)
840 return NULL;
842 timer_setup(&mc->mca_timer, igmp6_timer_handler, 0);
844 mc->mca_addr = *addr;
845 mc->idev = idev; /* reference taken by caller */
846 mc->mca_users = 1;
847 /* mca_stamp should be updated upon changes */
848 mc->mca_cstamp = mc->mca_tstamp = jiffies;
849 refcount_set(&mc->mca_refcnt, 1);
850 spin_lock_init(&mc->mca_lock);
852 /* initial mode is (EX, empty) */
853 mc->mca_sfmode = MCAST_EXCLUDE;
854 mc->mca_sfcount[MCAST_EXCLUDE] = 1;
856 if (ipv6_addr_is_ll_all_nodes(&mc->mca_addr) ||
857 IPV6_ADDR_MC_SCOPE(&mc->mca_addr) < IPV6_ADDR_SCOPE_LINKLOCAL)
858 mc->mca_flags |= MAF_NOREPORT;
860 return mc;
864 * device multicast group inc (add if not found)
866 int ipv6_dev_mc_inc(struct net_device *dev, const struct in6_addr *addr)
868 struct ifmcaddr6 *mc;
869 struct inet6_dev *idev;
871 ASSERT_RTNL();
873 /* we need to take a reference on idev */
874 idev = in6_dev_get(dev);
876 if (!idev)
877 return -EINVAL;
879 write_lock_bh(&idev->lock);
880 if (idev->dead) {
881 write_unlock_bh(&idev->lock);
882 in6_dev_put(idev);
883 return -ENODEV;
886 for (mc = idev->mc_list; mc; mc = mc->next) {
887 if (ipv6_addr_equal(&mc->mca_addr, addr)) {
888 mc->mca_users++;
889 write_unlock_bh(&idev->lock);
890 ip6_mc_add_src(idev, &mc->mca_addr, MCAST_EXCLUDE, 0,
891 NULL, 0);
892 in6_dev_put(idev);
893 return 0;
897 mc = mca_alloc(idev, addr);
898 if (!mc) {
899 write_unlock_bh(&idev->lock);
900 in6_dev_put(idev);
901 return -ENOMEM;
904 mc->next = idev->mc_list;
905 idev->mc_list = mc;
907 /* Hold this for the code below before we unlock,
908 * it is already exposed via idev->mc_list.
910 mca_get(mc);
911 write_unlock_bh(&idev->lock);
913 mld_del_delrec(idev, mc);
914 igmp6_group_added(mc);
915 ma_put(mc);
916 return 0;
920 * device multicast group del
922 int __ipv6_dev_mc_dec(struct inet6_dev *idev, const struct in6_addr *addr)
924 struct ifmcaddr6 *ma, **map;
926 ASSERT_RTNL();
928 write_lock_bh(&idev->lock);
929 for (map = &idev->mc_list; (ma = *map) != NULL; map = &ma->next) {
930 if (ipv6_addr_equal(&ma->mca_addr, addr)) {
931 if (--ma->mca_users == 0) {
932 *map = ma->next;
933 write_unlock_bh(&idev->lock);
935 igmp6_group_dropped(ma);
936 ip6_mc_clear_src(ma);
938 ma_put(ma);
939 return 0;
941 write_unlock_bh(&idev->lock);
942 return 0;
945 write_unlock_bh(&idev->lock);
947 return -ENOENT;
950 int ipv6_dev_mc_dec(struct net_device *dev, const struct in6_addr *addr)
952 struct inet6_dev *idev;
953 int err;
955 ASSERT_RTNL();
957 idev = __in6_dev_get(dev);
958 if (!idev)
959 err = -ENODEV;
960 else
961 err = __ipv6_dev_mc_dec(idev, addr);
963 return err;
967 * check if the interface/address pair is valid
969 bool ipv6_chk_mcast_addr(struct net_device *dev, const struct in6_addr *group,
970 const struct in6_addr *src_addr)
972 struct inet6_dev *idev;
973 struct ifmcaddr6 *mc;
974 bool rv = false;
976 rcu_read_lock();
977 idev = __in6_dev_get(dev);
978 if (idev) {
979 read_lock_bh(&idev->lock);
980 for (mc = idev->mc_list; mc; mc = mc->next) {
981 if (ipv6_addr_equal(&mc->mca_addr, group))
982 break;
984 if (mc) {
985 if (src_addr && !ipv6_addr_any(src_addr)) {
986 struct ip6_sf_list *psf;
988 spin_lock_bh(&mc->mca_lock);
989 for (psf = mc->mca_sources; psf; psf = psf->sf_next) {
990 if (ipv6_addr_equal(&psf->sf_addr, src_addr))
991 break;
993 if (psf)
994 rv = psf->sf_count[MCAST_INCLUDE] ||
995 psf->sf_count[MCAST_EXCLUDE] !=
996 mc->mca_sfcount[MCAST_EXCLUDE];
997 else
998 rv = mc->mca_sfcount[MCAST_EXCLUDE] != 0;
999 spin_unlock_bh(&mc->mca_lock);
1000 } else
1001 rv = true; /* don't filter unspecified source */
1003 read_unlock_bh(&idev->lock);
1005 rcu_read_unlock();
1006 return rv;
1009 static void mld_gq_start_timer(struct inet6_dev *idev)
1011 unsigned long tv = prandom_u32() % idev->mc_maxdelay;
1013 idev->mc_gq_running = 1;
1014 if (!mod_timer(&idev->mc_gq_timer, jiffies+tv+2))
1015 in6_dev_hold(idev);
1018 static void mld_gq_stop_timer(struct inet6_dev *idev)
1020 idev->mc_gq_running = 0;
1021 if (del_timer(&idev->mc_gq_timer))
1022 __in6_dev_put(idev);
1025 static void mld_ifc_start_timer(struct inet6_dev *idev, unsigned long delay)
1027 unsigned long tv = prandom_u32() % delay;
1029 if (!mod_timer(&idev->mc_ifc_timer, jiffies+tv+2))
1030 in6_dev_hold(idev);
1033 static void mld_ifc_stop_timer(struct inet6_dev *idev)
1035 idev->mc_ifc_count = 0;
1036 if (del_timer(&idev->mc_ifc_timer))
1037 __in6_dev_put(idev);
1040 static void mld_dad_start_timer(struct inet6_dev *idev, unsigned long delay)
1042 unsigned long tv = prandom_u32() % delay;
1044 if (!mod_timer(&idev->mc_dad_timer, jiffies+tv+2))
1045 in6_dev_hold(idev);
1048 static void mld_dad_stop_timer(struct inet6_dev *idev)
1050 if (del_timer(&idev->mc_dad_timer))
1051 __in6_dev_put(idev);
/*
 *	IGMP handling (alias multicast ICMPv6 messages)
 */
1058 static void igmp6_group_queried(struct ifmcaddr6 *ma, unsigned long resptime)
1060 unsigned long delay = resptime;
1062 /* Do not start timer for these addresses */
1063 if (ipv6_addr_is_ll_all_nodes(&ma->mca_addr) ||
1064 IPV6_ADDR_MC_SCOPE(&ma->mca_addr) < IPV6_ADDR_SCOPE_LINKLOCAL)
1065 return;
1067 if (del_timer(&ma->mca_timer)) {
1068 refcount_dec(&ma->mca_refcnt);
1069 delay = ma->mca_timer.expires - jiffies;
1072 if (delay >= resptime)
1073 delay = prandom_u32() % resptime;
1075 ma->mca_timer.expires = jiffies + delay;
1076 if (!mod_timer(&ma->mca_timer, jiffies + delay))
1077 refcount_inc(&ma->mca_refcnt);
1078 ma->mca_flags |= MAF_TIMER_RUNNING;
1081 /* mark EXCLUDE-mode sources */
1082 static bool mld_xmarksources(struct ifmcaddr6 *pmc, int nsrcs,
1083 const struct in6_addr *srcs)
1085 struct ip6_sf_list *psf;
1086 int i, scount;
1088 scount = 0;
1089 for (psf = pmc->mca_sources; psf; psf = psf->sf_next) {
1090 if (scount == nsrcs)
1091 break;
1092 for (i = 0; i < nsrcs; i++) {
1093 /* skip inactive filters */
1094 if (psf->sf_count[MCAST_INCLUDE] ||
1095 pmc->mca_sfcount[MCAST_EXCLUDE] !=
1096 psf->sf_count[MCAST_EXCLUDE])
1097 break;
1098 if (ipv6_addr_equal(&srcs[i], &psf->sf_addr)) {
1099 scount++;
1100 break;
1104 pmc->mca_flags &= ~MAF_GSQUERY;
1105 if (scount == nsrcs) /* all sources excluded */
1106 return false;
1107 return true;
1110 static bool mld_marksources(struct ifmcaddr6 *pmc, int nsrcs,
1111 const struct in6_addr *srcs)
1113 struct ip6_sf_list *psf;
1114 int i, scount;
1116 if (pmc->mca_sfmode == MCAST_EXCLUDE)
1117 return mld_xmarksources(pmc, nsrcs, srcs);
1119 /* mark INCLUDE-mode sources */
1121 scount = 0;
1122 for (psf = pmc->mca_sources; psf; psf = psf->sf_next) {
1123 if (scount == nsrcs)
1124 break;
1125 for (i = 0; i < nsrcs; i++) {
1126 if (ipv6_addr_equal(&srcs[i], &psf->sf_addr)) {
1127 psf->sf_gsresp = 1;
1128 scount++;
1129 break;
1133 if (!scount) {
1134 pmc->mca_flags &= ~MAF_GSQUERY;
1135 return false;
1137 pmc->mca_flags |= MAF_GSQUERY;
1138 return true;
1141 static int mld_force_mld_version(const struct inet6_dev *idev)
1143 /* Normally, both are 0 here. If enforcement to a particular is
1144 * being used, individual device enforcement will have a lower
1145 * precedence over 'all' device (.../conf/all/force_mld_version).
1148 if (dev_net(idev->dev)->ipv6.devconf_all->force_mld_version != 0)
1149 return dev_net(idev->dev)->ipv6.devconf_all->force_mld_version;
1150 else
1151 return idev->cnf.force_mld_version;
1154 static bool mld_in_v2_mode_only(const struct inet6_dev *idev)
1156 return mld_force_mld_version(idev) == 2;
1159 static bool mld_in_v1_mode_only(const struct inet6_dev *idev)
1161 return mld_force_mld_version(idev) == 1;
1164 static bool mld_in_v1_mode(const struct inet6_dev *idev)
1166 if (mld_in_v2_mode_only(idev))
1167 return false;
1168 if (mld_in_v1_mode_only(idev))
1169 return true;
1170 if (idev->mc_v1_seen && time_before(jiffies, idev->mc_v1_seen))
1171 return true;
1173 return false;
1176 static void mld_set_v1_mode(struct inet6_dev *idev)
1178 /* RFC3810, relevant sections:
1179 * - 9.1. Robustness Variable
1180 * - 9.2. Query Interval
1181 * - 9.3. Query Response Interval
1182 * - 9.12. Older Version Querier Present Timeout
1184 unsigned long switchback;
1186 switchback = (idev->mc_qrv * idev->mc_qi) + idev->mc_qri;
1188 idev->mc_v1_seen = jiffies + switchback;
1191 static void mld_update_qrv(struct inet6_dev *idev,
1192 const struct mld2_query *mlh2)
1194 /* RFC3810, relevant sections:
1195 * - 5.1.8. QRV (Querier's Robustness Variable)
1196 * - 9.1. Robustness Variable
1199 /* The value of the Robustness Variable MUST NOT be zero,
1200 * and SHOULD NOT be one. Catch this here if we ever run
1201 * into such a case in future.
1203 const int min_qrv = min(MLD_QRV_DEFAULT, sysctl_mld_qrv);
1204 WARN_ON(idev->mc_qrv == 0);
1206 if (mlh2->mld2q_qrv > 0)
1207 idev->mc_qrv = mlh2->mld2q_qrv;
1209 if (unlikely(idev->mc_qrv < min_qrv)) {
1210 net_warn_ratelimited("IPv6: MLD: clamping QRV from %u to %u!\n",
1211 idev->mc_qrv, min_qrv);
1212 idev->mc_qrv = min_qrv;
1216 static void mld_update_qi(struct inet6_dev *idev,
1217 const struct mld2_query *mlh2)
1219 /* RFC3810, relevant sections:
1220 * - 5.1.9. QQIC (Querier's Query Interval Code)
1221 * - 9.2. Query Interval
1222 * - 9.12. Older Version Querier Present Timeout
1223 * (the [Query Interval] in the last Query received)
1225 unsigned long mc_qqi;
1227 if (mlh2->mld2q_qqic < 128) {
1228 mc_qqi = mlh2->mld2q_qqic;
1229 } else {
1230 unsigned long mc_man, mc_exp;
1232 mc_exp = MLDV2_QQIC_EXP(mlh2->mld2q_qqic);
1233 mc_man = MLDV2_QQIC_MAN(mlh2->mld2q_qqic);
1235 mc_qqi = (mc_man | 0x10) << (mc_exp + 3);
1238 idev->mc_qi = mc_qqi * HZ;
1241 static void mld_update_qri(struct inet6_dev *idev,
1242 const struct mld2_query *mlh2)
1244 /* RFC3810, relevant sections:
1245 * - 5.1.3. Maximum Response Code
1246 * - 9.3. Query Response Interval
1248 idev->mc_qri = msecs_to_jiffies(mldv2_mrc(mlh2));
1251 static int mld_process_v1(struct inet6_dev *idev, struct mld_msg *mld,
1252 unsigned long *max_delay, bool v1_query)
1254 unsigned long mldv1_md;
1256 /* Ignore v1 queries */
1257 if (mld_in_v2_mode_only(idev))
1258 return -EINVAL;
1260 mldv1_md = ntohs(mld->mld_maxdelay);
1262 /* When in MLDv1 fallback and a MLDv2 router start-up being
1263 * unaware of current MLDv1 operation, the MRC == MRD mapping
1264 * only works when the exponential algorithm is not being
1265 * used (as MLDv1 is unaware of such things).
1267 * According to the RFC author, the MLDv2 implementations
1268 * he's aware of all use a MRC < 32768 on start up queries.
1270 * Thus, should we *ever* encounter something else larger
1271 * than that, just assume the maximum possible within our
1272 * reach.
1274 if (!v1_query)
1275 mldv1_md = min(mldv1_md, MLDV1_MRD_MAX_COMPAT);
1277 *max_delay = max(msecs_to_jiffies(mldv1_md), 1UL);
1279 /* MLDv1 router present: we need to go into v1 mode *only*
1280 * when an MLDv1 query is received as per section 9.12. of
1281 * RFC3810! And we know from RFC2710 section 3.7 that MLDv1
1282 * queries MUST be of exactly 24 octets.
1284 if (v1_query)
1285 mld_set_v1_mode(idev);
1287 /* cancel MLDv2 report timer */
1288 mld_gq_stop_timer(idev);
1289 /* cancel the interface change timer */
1290 mld_ifc_stop_timer(idev);
1291 /* clear deleted report items */
1292 mld_clear_delrec(idev);
1294 return 0;
1297 static int mld_process_v2(struct inet6_dev *idev, struct mld2_query *mld,
1298 unsigned long *max_delay)
1300 *max_delay = max(msecs_to_jiffies(mldv2_mrc(mld)), 1UL);
1302 mld_update_qrv(idev, mld);
1303 mld_update_qi(idev, mld);
1304 mld_update_qri(idev, mld);
1306 idev->mc_maxdelay = *max_delay;
1308 return 0;
1311 /* called with rcu_read_lock() */
1312 int igmp6_event_query(struct sk_buff *skb)
1314 struct mld2_query *mlh2 = NULL;
1315 struct ifmcaddr6 *ma;
1316 const struct in6_addr *group;
1317 unsigned long max_delay;
1318 struct inet6_dev *idev;
1319 struct mld_msg *mld;
1320 int group_type;
1321 int mark = 0;
1322 int len, err;
1324 if (!pskb_may_pull(skb, sizeof(struct in6_addr)))
1325 return -EINVAL;
1327 /* compute payload length excluding extension headers */
1328 len = ntohs(ipv6_hdr(skb)->payload_len) + sizeof(struct ipv6hdr);
1329 len -= skb_network_header_len(skb);
1331 /* RFC3810 6.2
1332 * Upon reception of an MLD message that contains a Query, the node
1333 * checks if the source address of the message is a valid link-local
1334 * address, if the Hop Limit is set to 1, and if the Router Alert
1335 * option is present in the Hop-By-Hop Options header of the IPv6
1336 * packet. If any of these checks fails, the packet is dropped.
1338 if (!(ipv6_addr_type(&ipv6_hdr(skb)->saddr) & IPV6_ADDR_LINKLOCAL) ||
1339 ipv6_hdr(skb)->hop_limit != 1 ||
1340 !(IP6CB(skb)->flags & IP6SKB_ROUTERALERT) ||
1341 IP6CB(skb)->ra != htons(IPV6_OPT_ROUTERALERT_MLD))
1342 return -EINVAL;
1344 idev = __in6_dev_get(skb->dev);
1345 if (!idev)
1346 return 0;
1348 mld = (struct mld_msg *)icmp6_hdr(skb);
1349 group = &mld->mld_mca;
1350 group_type = ipv6_addr_type(group);
1352 if (group_type != IPV6_ADDR_ANY &&
1353 !(group_type&IPV6_ADDR_MULTICAST))
1354 return -EINVAL;
1356 if (len < MLD_V1_QUERY_LEN) {
1357 return -EINVAL;
1358 } else if (len == MLD_V1_QUERY_LEN || mld_in_v1_mode(idev)) {
1359 err = mld_process_v1(idev, mld, &max_delay,
1360 len == MLD_V1_QUERY_LEN);
1361 if (err < 0)
1362 return err;
1363 } else if (len >= MLD_V2_QUERY_LEN_MIN) {
1364 int srcs_offset = sizeof(struct mld2_query) -
1365 sizeof(struct icmp6hdr);
1367 if (!pskb_may_pull(skb, srcs_offset))
1368 return -EINVAL;
1370 mlh2 = (struct mld2_query *)skb_transport_header(skb);
1372 err = mld_process_v2(idev, mlh2, &max_delay);
1373 if (err < 0)
1374 return err;
1376 if (group_type == IPV6_ADDR_ANY) { /* general query */
1377 if (mlh2->mld2q_nsrcs)
1378 return -EINVAL; /* no sources allowed */
1380 mld_gq_start_timer(idev);
1381 return 0;
1383 /* mark sources to include, if group & source-specific */
1384 if (mlh2->mld2q_nsrcs != 0) {
1385 if (!pskb_may_pull(skb, srcs_offset +
1386 ntohs(mlh2->mld2q_nsrcs) * sizeof(struct in6_addr)))
1387 return -EINVAL;
1389 mlh2 = (struct mld2_query *)skb_transport_header(skb);
1390 mark = 1;
1392 } else {
1393 return -EINVAL;
1396 read_lock_bh(&idev->lock);
1397 if (group_type == IPV6_ADDR_ANY) {
1398 for (ma = idev->mc_list; ma; ma = ma->next) {
1399 spin_lock_bh(&ma->mca_lock);
1400 igmp6_group_queried(ma, max_delay);
1401 spin_unlock_bh(&ma->mca_lock);
1403 } else {
1404 for (ma = idev->mc_list; ma; ma = ma->next) {
1405 if (!ipv6_addr_equal(group, &ma->mca_addr))
1406 continue;
1407 spin_lock_bh(&ma->mca_lock);
1408 if (ma->mca_flags & MAF_TIMER_RUNNING) {
1409 /* gsquery <- gsquery && mark */
1410 if (!mark)
1411 ma->mca_flags &= ~MAF_GSQUERY;
1412 } else {
1413 /* gsquery <- mark */
1414 if (mark)
1415 ma->mca_flags |= MAF_GSQUERY;
1416 else
1417 ma->mca_flags &= ~MAF_GSQUERY;
1419 if (!(ma->mca_flags & MAF_GSQUERY) ||
1420 mld_marksources(ma, ntohs(mlh2->mld2q_nsrcs), mlh2->mld2q_srcs))
1421 igmp6_group_queried(ma, max_delay);
1422 spin_unlock_bh(&ma->mca_lock);
1423 break;
1426 read_unlock_bh(&idev->lock);
1428 return 0;
1431 /* called with rcu_read_lock() */
1432 int igmp6_event_report(struct sk_buff *skb)
1434 struct ifmcaddr6 *ma;
1435 struct inet6_dev *idev;
1436 struct mld_msg *mld;
1437 int addr_type;
1439 /* Our own report looped back. Ignore it. */
1440 if (skb->pkt_type == PACKET_LOOPBACK)
1441 return 0;
1443 /* send our report if the MC router may not have heard this report */
1444 if (skb->pkt_type != PACKET_MULTICAST &&
1445 skb->pkt_type != PACKET_BROADCAST)
1446 return 0;
1448 if (!pskb_may_pull(skb, sizeof(*mld) - sizeof(struct icmp6hdr)))
1449 return -EINVAL;
1451 mld = (struct mld_msg *)icmp6_hdr(skb);
1453 /* Drop reports with not link local source */
1454 addr_type = ipv6_addr_type(&ipv6_hdr(skb)->saddr);
1455 if (addr_type != IPV6_ADDR_ANY &&
1456 !(addr_type&IPV6_ADDR_LINKLOCAL))
1457 return -EINVAL;
1459 idev = __in6_dev_get(skb->dev);
1460 if (!idev)
1461 return -ENODEV;
1464 * Cancel the timer for this group
1467 read_lock_bh(&idev->lock);
1468 for (ma = idev->mc_list; ma; ma = ma->next) {
1469 if (ipv6_addr_equal(&ma->mca_addr, &mld->mld_mca)) {
1470 spin_lock(&ma->mca_lock);
1471 if (del_timer(&ma->mca_timer))
1472 refcount_dec(&ma->mca_refcnt);
1473 ma->mca_flags &= ~(MAF_LAST_REPORTER|MAF_TIMER_RUNNING);
1474 spin_unlock(&ma->mca_lock);
1475 break;
1478 read_unlock_bh(&idev->lock);
1479 return 0;
1482 static bool is_in(struct ifmcaddr6 *pmc, struct ip6_sf_list *psf, int type,
1483 int gdeleted, int sdeleted)
1485 switch (type) {
1486 case MLD2_MODE_IS_INCLUDE:
1487 case MLD2_MODE_IS_EXCLUDE:
1488 if (gdeleted || sdeleted)
1489 return false;
1490 if (!((pmc->mca_flags & MAF_GSQUERY) && !psf->sf_gsresp)) {
1491 if (pmc->mca_sfmode == MCAST_INCLUDE)
1492 return true;
1493 /* don't include if this source is excluded
1494 * in all filters
1496 if (psf->sf_count[MCAST_INCLUDE])
1497 return type == MLD2_MODE_IS_INCLUDE;
1498 return pmc->mca_sfcount[MCAST_EXCLUDE] ==
1499 psf->sf_count[MCAST_EXCLUDE];
1501 return false;
1502 case MLD2_CHANGE_TO_INCLUDE:
1503 if (gdeleted || sdeleted)
1504 return false;
1505 return psf->sf_count[MCAST_INCLUDE] != 0;
1506 case MLD2_CHANGE_TO_EXCLUDE:
1507 if (gdeleted || sdeleted)
1508 return false;
1509 if (pmc->mca_sfcount[MCAST_EXCLUDE] == 0 ||
1510 psf->sf_count[MCAST_INCLUDE])
1511 return false;
1512 return pmc->mca_sfcount[MCAST_EXCLUDE] ==
1513 psf->sf_count[MCAST_EXCLUDE];
1514 case MLD2_ALLOW_NEW_SOURCES:
1515 if (gdeleted || !psf->sf_crcount)
1516 return false;
1517 return (pmc->mca_sfmode == MCAST_INCLUDE) ^ sdeleted;
1518 case MLD2_BLOCK_OLD_SOURCES:
1519 if (pmc->mca_sfmode == MCAST_INCLUDE)
1520 return gdeleted || (psf->sf_crcount && sdeleted);
1521 return psf->sf_crcount && !gdeleted && !sdeleted;
1523 return false;
1526 static int
1527 mld_scount(struct ifmcaddr6 *pmc, int type, int gdeleted, int sdeleted)
1529 struct ip6_sf_list *psf;
1530 int scount = 0;
1532 for (psf = pmc->mca_sources; psf; psf = psf->sf_next) {
1533 if (!is_in(pmc, psf, type, gdeleted, sdeleted))
1534 continue;
1535 scount++;
1537 return scount;
1540 static void ip6_mc_hdr(struct sock *sk, struct sk_buff *skb,
1541 struct net_device *dev,
1542 const struct in6_addr *saddr,
1543 const struct in6_addr *daddr,
1544 int proto, int len)
1546 struct ipv6hdr *hdr;
1548 skb->protocol = htons(ETH_P_IPV6);
1549 skb->dev = dev;
1551 skb_reset_network_header(skb);
1552 skb_put(skb, sizeof(struct ipv6hdr));
1553 hdr = ipv6_hdr(skb);
1555 ip6_flow_hdr(hdr, 0, 0);
1557 hdr->payload_len = htons(len);
1558 hdr->nexthdr = proto;
1559 hdr->hop_limit = inet6_sk(sk)->hop_limit;
1561 hdr->saddr = *saddr;
1562 hdr->daddr = *daddr;
1565 static struct sk_buff *mld_newpack(struct inet6_dev *idev, unsigned int mtu)
1567 struct net_device *dev = idev->dev;
1568 struct net *net = dev_net(dev);
1569 struct sock *sk = net->ipv6.igmp_sk;
1570 struct sk_buff *skb;
1571 struct mld2_report *pmr;
1572 struct in6_addr addr_buf;
1573 const struct in6_addr *saddr;
1574 int hlen = LL_RESERVED_SPACE(dev);
1575 int tlen = dev->needed_tailroom;
1576 unsigned int size = mtu + hlen + tlen;
1577 int err;
1578 u8 ra[8] = { IPPROTO_ICMPV6, 0,
1579 IPV6_TLV_ROUTERALERT, 2, 0, 0,
1580 IPV6_TLV_PADN, 0 };
1582 /* we assume size > sizeof(ra) here */
1583 /* limit our allocations to order-0 page */
1584 size = min_t(int, size, SKB_MAX_ORDER(0, 0));
1585 skb = sock_alloc_send_skb(sk, size, 1, &err);
1587 if (!skb)
1588 return NULL;
1590 skb->priority = TC_PRIO_CONTROL;
1591 skb_reserve(skb, hlen);
1592 skb_tailroom_reserve(skb, mtu, tlen);
1594 if (__ipv6_get_lladdr(idev, &addr_buf, IFA_F_TENTATIVE)) {
1595 /* <draft-ietf-magma-mld-source-05.txt>:
1596 * use unspecified address as the source address
1597 * when a valid link-local address is not available.
1599 saddr = &in6addr_any;
1600 } else
1601 saddr = &addr_buf;
1603 ip6_mc_hdr(sk, skb, dev, saddr, &mld2_all_mcr, NEXTHDR_HOP, 0);
1605 skb_put_data(skb, ra, sizeof(ra));
1607 skb_set_transport_header(skb, skb_tail_pointer(skb) - skb->data);
1608 skb_put(skb, sizeof(*pmr));
1609 pmr = (struct mld2_report *)skb_transport_header(skb);
1610 pmr->mld2r_type = ICMPV6_MLD2_REPORT;
1611 pmr->mld2r_resv1 = 0;
1612 pmr->mld2r_cksum = 0;
1613 pmr->mld2r_resv2 = 0;
1614 pmr->mld2r_ngrec = 0;
1615 return skb;
1618 static void mld_sendpack(struct sk_buff *skb)
1620 struct ipv6hdr *pip6 = ipv6_hdr(skb);
1621 struct mld2_report *pmr =
1622 (struct mld2_report *)skb_transport_header(skb);
1623 int payload_len, mldlen;
1624 struct inet6_dev *idev;
1625 struct net *net = dev_net(skb->dev);
1626 int err;
1627 struct flowi6 fl6;
1628 struct dst_entry *dst;
1630 rcu_read_lock();
1631 idev = __in6_dev_get(skb->dev);
1632 IP6_UPD_PO_STATS(net, idev, IPSTATS_MIB_OUT, skb->len);
1634 payload_len = (skb_tail_pointer(skb) - skb_network_header(skb)) -
1635 sizeof(*pip6);
1636 mldlen = skb_tail_pointer(skb) - skb_transport_header(skb);
1637 pip6->payload_len = htons(payload_len);
1639 pmr->mld2r_cksum = csum_ipv6_magic(&pip6->saddr, &pip6->daddr, mldlen,
1640 IPPROTO_ICMPV6,
1641 csum_partial(skb_transport_header(skb),
1642 mldlen, 0));
1644 icmpv6_flow_init(net->ipv6.igmp_sk, &fl6, ICMPV6_MLD2_REPORT,
1645 &ipv6_hdr(skb)->saddr, &ipv6_hdr(skb)->daddr,
1646 skb->dev->ifindex);
1647 dst = icmp6_dst_alloc(skb->dev, &fl6);
1649 err = 0;
1650 if (IS_ERR(dst)) {
1651 err = PTR_ERR(dst);
1652 dst = NULL;
1654 skb_dst_set(skb, dst);
1655 if (err)
1656 goto err_out;
1658 err = NF_HOOK(NFPROTO_IPV6, NF_INET_LOCAL_OUT,
1659 net, net->ipv6.igmp_sk, skb, NULL, skb->dev,
1660 dst_output);
1661 out:
1662 if (!err) {
1663 ICMP6MSGOUT_INC_STATS(net, idev, ICMPV6_MLD2_REPORT);
1664 ICMP6_INC_STATS(net, idev, ICMP6_MIB_OUTMSGS);
1665 } else {
1666 IP6_INC_STATS(net, idev, IPSTATS_MIB_OUTDISCARDS);
1669 rcu_read_unlock();
1670 return;
1672 err_out:
1673 kfree_skb(skb);
1674 goto out;
1677 static int grec_size(struct ifmcaddr6 *pmc, int type, int gdel, int sdel)
1679 return sizeof(struct mld2_grec) + 16 * mld_scount(pmc,type,gdel,sdel);
1682 static struct sk_buff *add_grhead(struct sk_buff *skb, struct ifmcaddr6 *pmc,
1683 int type, struct mld2_grec **ppgr, unsigned int mtu)
1685 struct mld2_report *pmr;
1686 struct mld2_grec *pgr;
1688 if (!skb) {
1689 skb = mld_newpack(pmc->idev, mtu);
1690 if (!skb)
1691 return NULL;
1693 pgr = skb_put(skb, sizeof(struct mld2_grec));
1694 pgr->grec_type = type;
1695 pgr->grec_auxwords = 0;
1696 pgr->grec_nsrcs = 0;
1697 pgr->grec_mca = pmc->mca_addr; /* structure copy */
1698 pmr = (struct mld2_report *)skb_transport_header(skb);
1699 pmr->mld2r_ngrec = htons(ntohs(pmr->mld2r_ngrec)+1);
1700 *ppgr = pgr;
1701 return skb;
1704 #define AVAILABLE(skb) ((skb) ? skb_availroom(skb) : 0)
1706 static struct sk_buff *add_grec(struct sk_buff *skb, struct ifmcaddr6 *pmc,
1707 int type, int gdeleted, int sdeleted, int crsend)
1709 struct inet6_dev *idev = pmc->idev;
1710 struct net_device *dev = idev->dev;
1711 struct mld2_report *pmr;
1712 struct mld2_grec *pgr = NULL;
1713 struct ip6_sf_list *psf, *psf_next, *psf_prev, **psf_list;
1714 int scount, stotal, first, isquery, truncate;
1715 unsigned int mtu;
1717 if (pmc->mca_flags & MAF_NOREPORT)
1718 return skb;
1720 mtu = READ_ONCE(dev->mtu);
1721 if (mtu < IPV6_MIN_MTU)
1722 return skb;
1724 isquery = type == MLD2_MODE_IS_INCLUDE ||
1725 type == MLD2_MODE_IS_EXCLUDE;
1726 truncate = type == MLD2_MODE_IS_EXCLUDE ||
1727 type == MLD2_CHANGE_TO_EXCLUDE;
1729 stotal = scount = 0;
1731 psf_list = sdeleted ? &pmc->mca_tomb : &pmc->mca_sources;
1733 if (!*psf_list)
1734 goto empty_source;
1736 pmr = skb ? (struct mld2_report *)skb_transport_header(skb) : NULL;
1738 /* EX and TO_EX get a fresh packet, if needed */
1739 if (truncate) {
1740 if (pmr && pmr->mld2r_ngrec &&
1741 AVAILABLE(skb) < grec_size(pmc, type, gdeleted, sdeleted)) {
1742 if (skb)
1743 mld_sendpack(skb);
1744 skb = mld_newpack(idev, mtu);
1747 first = 1;
1748 psf_prev = NULL;
1749 for (psf = *psf_list; psf; psf = psf_next) {
1750 struct in6_addr *psrc;
1752 psf_next = psf->sf_next;
1754 if (!is_in(pmc, psf, type, gdeleted, sdeleted)) {
1755 psf_prev = psf;
1756 continue;
1759 /* Based on RFC3810 6.1. Should not send source-list change
1760 * records when there is a filter mode change.
1762 if (((gdeleted && pmc->mca_sfmode == MCAST_EXCLUDE) ||
1763 (!gdeleted && pmc->mca_crcount)) &&
1764 (type == MLD2_ALLOW_NEW_SOURCES ||
1765 type == MLD2_BLOCK_OLD_SOURCES) && psf->sf_crcount)
1766 goto decrease_sf_crcount;
1768 /* clear marks on query responses */
1769 if (isquery)
1770 psf->sf_gsresp = 0;
1772 if (AVAILABLE(skb) < sizeof(*psrc) +
1773 first*sizeof(struct mld2_grec)) {
1774 if (truncate && !first)
1775 break; /* truncate these */
1776 if (pgr)
1777 pgr->grec_nsrcs = htons(scount);
1778 if (skb)
1779 mld_sendpack(skb);
1780 skb = mld_newpack(idev, mtu);
1781 first = 1;
1782 scount = 0;
1784 if (first) {
1785 skb = add_grhead(skb, pmc, type, &pgr, mtu);
1786 first = 0;
1788 if (!skb)
1789 return NULL;
1790 psrc = skb_put(skb, sizeof(*psrc));
1791 *psrc = psf->sf_addr;
1792 scount++; stotal++;
1793 if ((type == MLD2_ALLOW_NEW_SOURCES ||
1794 type == MLD2_BLOCK_OLD_SOURCES) && psf->sf_crcount) {
1795 decrease_sf_crcount:
1796 psf->sf_crcount--;
1797 if ((sdeleted || gdeleted) && psf->sf_crcount == 0) {
1798 if (psf_prev)
1799 psf_prev->sf_next = psf->sf_next;
1800 else
1801 *psf_list = psf->sf_next;
1802 kfree(psf);
1803 continue;
1806 psf_prev = psf;
1809 empty_source:
1810 if (!stotal) {
1811 if (type == MLD2_ALLOW_NEW_SOURCES ||
1812 type == MLD2_BLOCK_OLD_SOURCES)
1813 return skb;
1814 if (pmc->mca_crcount || isquery || crsend) {
1815 /* make sure we have room for group header */
1816 if (skb && AVAILABLE(skb) < sizeof(struct mld2_grec)) {
1817 mld_sendpack(skb);
1818 skb = NULL; /* add_grhead will get a new one */
1820 skb = add_grhead(skb, pmc, type, &pgr, mtu);
1823 if (pgr)
1824 pgr->grec_nsrcs = htons(scount);
1826 if (isquery)
1827 pmc->mca_flags &= ~MAF_GSQUERY; /* clear query state */
1828 return skb;
1831 static void mld_send_report(struct inet6_dev *idev, struct ifmcaddr6 *pmc)
1833 struct sk_buff *skb = NULL;
1834 int type;
1836 read_lock_bh(&idev->lock);
1837 if (!pmc) {
1838 for (pmc = idev->mc_list; pmc; pmc = pmc->next) {
1839 if (pmc->mca_flags & MAF_NOREPORT)
1840 continue;
1841 spin_lock_bh(&pmc->mca_lock);
1842 if (pmc->mca_sfcount[MCAST_EXCLUDE])
1843 type = MLD2_MODE_IS_EXCLUDE;
1844 else
1845 type = MLD2_MODE_IS_INCLUDE;
1846 skb = add_grec(skb, pmc, type, 0, 0, 0);
1847 spin_unlock_bh(&pmc->mca_lock);
1849 } else {
1850 spin_lock_bh(&pmc->mca_lock);
1851 if (pmc->mca_sfcount[MCAST_EXCLUDE])
1852 type = MLD2_MODE_IS_EXCLUDE;
1853 else
1854 type = MLD2_MODE_IS_INCLUDE;
1855 skb = add_grec(skb, pmc, type, 0, 0, 0);
1856 spin_unlock_bh(&pmc->mca_lock);
1858 read_unlock_bh(&idev->lock);
1859 if (skb)
1860 mld_sendpack(skb);
1864 * remove zero-count source records from a source filter list
1866 static void mld_clear_zeros(struct ip6_sf_list **ppsf)
1868 struct ip6_sf_list *psf_prev, *psf_next, *psf;
1870 psf_prev = NULL;
1871 for (psf = *ppsf; psf; psf = psf_next) {
1872 psf_next = psf->sf_next;
1873 if (psf->sf_crcount == 0) {
1874 if (psf_prev)
1875 psf_prev->sf_next = psf->sf_next;
1876 else
1877 *ppsf = psf->sf_next;
1878 kfree(psf);
1879 } else
1880 psf_prev = psf;
1884 static void mld_send_cr(struct inet6_dev *idev)
1886 struct ifmcaddr6 *pmc, *pmc_prev, *pmc_next;
1887 struct sk_buff *skb = NULL;
1888 int type, dtype;
1890 read_lock_bh(&idev->lock);
1891 spin_lock(&idev->mc_lock);
1893 /* deleted MCA's */
1894 pmc_prev = NULL;
1895 for (pmc = idev->mc_tomb; pmc; pmc = pmc_next) {
1896 pmc_next = pmc->next;
1897 if (pmc->mca_sfmode == MCAST_INCLUDE) {
1898 type = MLD2_BLOCK_OLD_SOURCES;
1899 dtype = MLD2_BLOCK_OLD_SOURCES;
1900 skb = add_grec(skb, pmc, type, 1, 0, 0);
1901 skb = add_grec(skb, pmc, dtype, 1, 1, 0);
1903 if (pmc->mca_crcount) {
1904 if (pmc->mca_sfmode == MCAST_EXCLUDE) {
1905 type = MLD2_CHANGE_TO_INCLUDE;
1906 skb = add_grec(skb, pmc, type, 1, 0, 0);
1908 pmc->mca_crcount--;
1909 if (pmc->mca_crcount == 0) {
1910 mld_clear_zeros(&pmc->mca_tomb);
1911 mld_clear_zeros(&pmc->mca_sources);
1914 if (pmc->mca_crcount == 0 && !pmc->mca_tomb &&
1915 !pmc->mca_sources) {
1916 if (pmc_prev)
1917 pmc_prev->next = pmc_next;
1918 else
1919 idev->mc_tomb = pmc_next;
1920 in6_dev_put(pmc->idev);
1921 kfree(pmc);
1922 } else
1923 pmc_prev = pmc;
1925 spin_unlock(&idev->mc_lock);
1927 /* change recs */
1928 for (pmc = idev->mc_list; pmc; pmc = pmc->next) {
1929 spin_lock_bh(&pmc->mca_lock);
1930 if (pmc->mca_sfcount[MCAST_EXCLUDE]) {
1931 type = MLD2_BLOCK_OLD_SOURCES;
1932 dtype = MLD2_ALLOW_NEW_SOURCES;
1933 } else {
1934 type = MLD2_ALLOW_NEW_SOURCES;
1935 dtype = MLD2_BLOCK_OLD_SOURCES;
1937 skb = add_grec(skb, pmc, type, 0, 0, 0);
1938 skb = add_grec(skb, pmc, dtype, 0, 1, 0); /* deleted sources */
1940 /* filter mode changes */
1941 if (pmc->mca_crcount) {
1942 if (pmc->mca_sfmode == MCAST_EXCLUDE)
1943 type = MLD2_CHANGE_TO_EXCLUDE;
1944 else
1945 type = MLD2_CHANGE_TO_INCLUDE;
1946 skb = add_grec(skb, pmc, type, 0, 0, 0);
1947 pmc->mca_crcount--;
1949 spin_unlock_bh(&pmc->mca_lock);
1951 read_unlock_bh(&idev->lock);
1952 if (!skb)
1953 return;
1954 (void) mld_sendpack(skb);
1957 static void igmp6_send(struct in6_addr *addr, struct net_device *dev, int type)
1959 struct net *net = dev_net(dev);
1960 struct sock *sk = net->ipv6.igmp_sk;
1961 struct inet6_dev *idev;
1962 struct sk_buff *skb;
1963 struct mld_msg *hdr;
1964 const struct in6_addr *snd_addr, *saddr;
1965 struct in6_addr addr_buf;
1966 int hlen = LL_RESERVED_SPACE(dev);
1967 int tlen = dev->needed_tailroom;
1968 int err, len, payload_len, full_len;
1969 u8 ra[8] = { IPPROTO_ICMPV6, 0,
1970 IPV6_TLV_ROUTERALERT, 2, 0, 0,
1971 IPV6_TLV_PADN, 0 };
1972 struct flowi6 fl6;
1973 struct dst_entry *dst;
1975 if (type == ICMPV6_MGM_REDUCTION)
1976 snd_addr = &in6addr_linklocal_allrouters;
1977 else
1978 snd_addr = addr;
1980 len = sizeof(struct icmp6hdr) + sizeof(struct in6_addr);
1981 payload_len = len + sizeof(ra);
1982 full_len = sizeof(struct ipv6hdr) + payload_len;
1984 rcu_read_lock();
1985 IP6_UPD_PO_STATS(net, __in6_dev_get(dev),
1986 IPSTATS_MIB_OUT, full_len);
1987 rcu_read_unlock();
1989 skb = sock_alloc_send_skb(sk, hlen + tlen + full_len, 1, &err);
1991 if (!skb) {
1992 rcu_read_lock();
1993 IP6_INC_STATS(net, __in6_dev_get(dev),
1994 IPSTATS_MIB_OUTDISCARDS);
1995 rcu_read_unlock();
1996 return;
1998 skb->priority = TC_PRIO_CONTROL;
1999 skb_reserve(skb, hlen);
2001 if (ipv6_get_lladdr(dev, &addr_buf, IFA_F_TENTATIVE)) {
2002 /* <draft-ietf-magma-mld-source-05.txt>:
2003 * use unspecified address as the source address
2004 * when a valid link-local address is not available.
2006 saddr = &in6addr_any;
2007 } else
2008 saddr = &addr_buf;
2010 ip6_mc_hdr(sk, skb, dev, saddr, snd_addr, NEXTHDR_HOP, payload_len);
2012 skb_put_data(skb, ra, sizeof(ra));
2014 hdr = skb_put_zero(skb, sizeof(struct mld_msg));
2015 hdr->mld_type = type;
2016 hdr->mld_mca = *addr;
2018 hdr->mld_cksum = csum_ipv6_magic(saddr, snd_addr, len,
2019 IPPROTO_ICMPV6,
2020 csum_partial(hdr, len, 0));
2022 rcu_read_lock();
2023 idev = __in6_dev_get(skb->dev);
2025 icmpv6_flow_init(sk, &fl6, type,
2026 &ipv6_hdr(skb)->saddr, &ipv6_hdr(skb)->daddr,
2027 skb->dev->ifindex);
2028 dst = icmp6_dst_alloc(skb->dev, &fl6);
2029 if (IS_ERR(dst)) {
2030 err = PTR_ERR(dst);
2031 goto err_out;
2034 skb_dst_set(skb, dst);
2035 err = NF_HOOK(NFPROTO_IPV6, NF_INET_LOCAL_OUT,
2036 net, sk, skb, NULL, skb->dev,
2037 dst_output);
2038 out:
2039 if (!err) {
2040 ICMP6MSGOUT_INC_STATS(net, idev, type);
2041 ICMP6_INC_STATS(net, idev, ICMP6_MIB_OUTMSGS);
2042 } else
2043 IP6_INC_STATS(net, idev, IPSTATS_MIB_OUTDISCARDS);
2045 rcu_read_unlock();
2046 return;
2048 err_out:
2049 kfree_skb(skb);
2050 goto out;
2053 static void mld_send_initial_cr(struct inet6_dev *idev)
2055 struct sk_buff *skb;
2056 struct ifmcaddr6 *pmc;
2057 int type;
2059 if (mld_in_v1_mode(idev))
2060 return;
2062 skb = NULL;
2063 read_lock_bh(&idev->lock);
2064 for (pmc = idev->mc_list; pmc; pmc = pmc->next) {
2065 spin_lock_bh(&pmc->mca_lock);
2066 if (pmc->mca_sfcount[MCAST_EXCLUDE])
2067 type = MLD2_CHANGE_TO_EXCLUDE;
2068 else
2069 type = MLD2_CHANGE_TO_INCLUDE;
2070 skb = add_grec(skb, pmc, type, 0, 0, 1);
2071 spin_unlock_bh(&pmc->mca_lock);
2073 read_unlock_bh(&idev->lock);
2074 if (skb)
2075 mld_sendpack(skb);
2078 void ipv6_mc_dad_complete(struct inet6_dev *idev)
2080 idev->mc_dad_count = idev->mc_qrv;
2081 if (idev->mc_dad_count) {
2082 mld_send_initial_cr(idev);
2083 idev->mc_dad_count--;
2084 if (idev->mc_dad_count)
2085 mld_dad_start_timer(idev, idev->mc_maxdelay);
2089 static void mld_dad_timer_expire(struct timer_list *t)
2091 struct inet6_dev *idev = from_timer(idev, t, mc_dad_timer);
2093 mld_send_initial_cr(idev);
2094 if (idev->mc_dad_count) {
2095 idev->mc_dad_count--;
2096 if (idev->mc_dad_count)
2097 mld_dad_start_timer(idev, idev->mc_maxdelay);
2099 in6_dev_put(idev);
2102 static int ip6_mc_del1_src(struct ifmcaddr6 *pmc, int sfmode,
2103 const struct in6_addr *psfsrc)
2105 struct ip6_sf_list *psf, *psf_prev;
2106 int rv = 0;
2108 psf_prev = NULL;
2109 for (psf = pmc->mca_sources; psf; psf = psf->sf_next) {
2110 if (ipv6_addr_equal(&psf->sf_addr, psfsrc))
2111 break;
2112 psf_prev = psf;
2114 if (!psf || psf->sf_count[sfmode] == 0) {
2115 /* source filter not found, or count wrong => bug */
2116 return -ESRCH;
2118 psf->sf_count[sfmode]--;
2119 if (!psf->sf_count[MCAST_INCLUDE] && !psf->sf_count[MCAST_EXCLUDE]) {
2120 struct inet6_dev *idev = pmc->idev;
2122 /* no more filters for this source */
2123 if (psf_prev)
2124 psf_prev->sf_next = psf->sf_next;
2125 else
2126 pmc->mca_sources = psf->sf_next;
2127 if (psf->sf_oldin && !(pmc->mca_flags & MAF_NOREPORT) &&
2128 !mld_in_v1_mode(idev)) {
2129 psf->sf_crcount = idev->mc_qrv;
2130 psf->sf_next = pmc->mca_tomb;
2131 pmc->mca_tomb = psf;
2132 rv = 1;
2133 } else
2134 kfree(psf);
2136 return rv;
2139 static int ip6_mc_del_src(struct inet6_dev *idev, const struct in6_addr *pmca,
2140 int sfmode, int sfcount, const struct in6_addr *psfsrc,
2141 int delta)
2143 struct ifmcaddr6 *pmc;
2144 int changerec = 0;
2145 int i, err;
2147 if (!idev)
2148 return -ENODEV;
2149 read_lock_bh(&idev->lock);
2150 for (pmc = idev->mc_list; pmc; pmc = pmc->next) {
2151 if (ipv6_addr_equal(pmca, &pmc->mca_addr))
2152 break;
2154 if (!pmc) {
2155 /* MCA not found?? bug */
2156 read_unlock_bh(&idev->lock);
2157 return -ESRCH;
2159 spin_lock_bh(&pmc->mca_lock);
2160 sf_markstate(pmc);
2161 if (!delta) {
2162 if (!pmc->mca_sfcount[sfmode]) {
2163 spin_unlock_bh(&pmc->mca_lock);
2164 read_unlock_bh(&idev->lock);
2165 return -EINVAL;
2167 pmc->mca_sfcount[sfmode]--;
2169 err = 0;
2170 for (i = 0; i < sfcount; i++) {
2171 int rv = ip6_mc_del1_src(pmc, sfmode, &psfsrc[i]);
2173 changerec |= rv > 0;
2174 if (!err && rv < 0)
2175 err = rv;
2177 if (pmc->mca_sfmode == MCAST_EXCLUDE &&
2178 pmc->mca_sfcount[MCAST_EXCLUDE] == 0 &&
2179 pmc->mca_sfcount[MCAST_INCLUDE]) {
2180 struct ip6_sf_list *psf;
2182 /* filter mode change */
2183 pmc->mca_sfmode = MCAST_INCLUDE;
2184 pmc->mca_crcount = idev->mc_qrv;
2185 idev->mc_ifc_count = pmc->mca_crcount;
2186 for (psf = pmc->mca_sources; psf; psf = psf->sf_next)
2187 psf->sf_crcount = 0;
2188 mld_ifc_event(pmc->idev);
2189 } else if (sf_setstate(pmc) || changerec)
2190 mld_ifc_event(pmc->idev);
2191 spin_unlock_bh(&pmc->mca_lock);
2192 read_unlock_bh(&idev->lock);
2193 return err;
2197 * Add multicast single-source filter to the interface list
2199 static int ip6_mc_add1_src(struct ifmcaddr6 *pmc, int sfmode,
2200 const struct in6_addr *psfsrc)
2202 struct ip6_sf_list *psf, *psf_prev;
2204 psf_prev = NULL;
2205 for (psf = pmc->mca_sources; psf; psf = psf->sf_next) {
2206 if (ipv6_addr_equal(&psf->sf_addr, psfsrc))
2207 break;
2208 psf_prev = psf;
2210 if (!psf) {
2211 psf = kzalloc(sizeof(*psf), GFP_ATOMIC);
2212 if (!psf)
2213 return -ENOBUFS;
2215 psf->sf_addr = *psfsrc;
2216 if (psf_prev) {
2217 psf_prev->sf_next = psf;
2218 } else
2219 pmc->mca_sources = psf;
2221 psf->sf_count[sfmode]++;
2222 return 0;
2225 static void sf_markstate(struct ifmcaddr6 *pmc)
2227 struct ip6_sf_list *psf;
2228 int mca_xcount = pmc->mca_sfcount[MCAST_EXCLUDE];
2230 for (psf = pmc->mca_sources; psf; psf = psf->sf_next)
2231 if (pmc->mca_sfcount[MCAST_EXCLUDE]) {
2232 psf->sf_oldin = mca_xcount ==
2233 psf->sf_count[MCAST_EXCLUDE] &&
2234 !psf->sf_count[MCAST_INCLUDE];
2235 } else
2236 psf->sf_oldin = psf->sf_count[MCAST_INCLUDE] != 0;
2239 static int sf_setstate(struct ifmcaddr6 *pmc)
2241 struct ip6_sf_list *psf, *dpsf;
2242 int mca_xcount = pmc->mca_sfcount[MCAST_EXCLUDE];
2243 int qrv = pmc->idev->mc_qrv;
2244 int new_in, rv;
2246 rv = 0;
2247 for (psf = pmc->mca_sources; psf; psf = psf->sf_next) {
2248 if (pmc->mca_sfcount[MCAST_EXCLUDE]) {
2249 new_in = mca_xcount == psf->sf_count[MCAST_EXCLUDE] &&
2250 !psf->sf_count[MCAST_INCLUDE];
2251 } else
2252 new_in = psf->sf_count[MCAST_INCLUDE] != 0;
2253 if (new_in) {
2254 if (!psf->sf_oldin) {
2255 struct ip6_sf_list *prev = NULL;
2257 for (dpsf = pmc->mca_tomb; dpsf;
2258 dpsf = dpsf->sf_next) {
2259 if (ipv6_addr_equal(&dpsf->sf_addr,
2260 &psf->sf_addr))
2261 break;
2262 prev = dpsf;
2264 if (dpsf) {
2265 if (prev)
2266 prev->sf_next = dpsf->sf_next;
2267 else
2268 pmc->mca_tomb = dpsf->sf_next;
2269 kfree(dpsf);
2271 psf->sf_crcount = qrv;
2272 rv++;
2274 } else if (psf->sf_oldin) {
2275 psf->sf_crcount = 0;
2277 * add or update "delete" records if an active filter
2278 * is now inactive
2280 for (dpsf = pmc->mca_tomb; dpsf; dpsf = dpsf->sf_next)
2281 if (ipv6_addr_equal(&dpsf->sf_addr,
2282 &psf->sf_addr))
2283 break;
2284 if (!dpsf) {
2285 dpsf = kmalloc(sizeof(*dpsf), GFP_ATOMIC);
2286 if (!dpsf)
2287 continue;
2288 *dpsf = *psf;
2289 /* pmc->mca_lock held by callers */
2290 dpsf->sf_next = pmc->mca_tomb;
2291 pmc->mca_tomb = dpsf;
2293 dpsf->sf_crcount = qrv;
2294 rv++;
2297 return rv;
2301 * Add multicast source filter list to the interface list
2303 static int ip6_mc_add_src(struct inet6_dev *idev, const struct in6_addr *pmca,
2304 int sfmode, int sfcount, const struct in6_addr *psfsrc,
2305 int delta)
2307 struct ifmcaddr6 *pmc;
2308 int isexclude;
2309 int i, err;
2311 if (!idev)
2312 return -ENODEV;
2313 read_lock_bh(&idev->lock);
2314 for (pmc = idev->mc_list; pmc; pmc = pmc->next) {
2315 if (ipv6_addr_equal(pmca, &pmc->mca_addr))
2316 break;
2318 if (!pmc) {
2319 /* MCA not found?? bug */
2320 read_unlock_bh(&idev->lock);
2321 return -ESRCH;
2323 spin_lock_bh(&pmc->mca_lock);
2325 sf_markstate(pmc);
2326 isexclude = pmc->mca_sfmode == MCAST_EXCLUDE;
2327 if (!delta)
2328 pmc->mca_sfcount[sfmode]++;
2329 err = 0;
2330 for (i = 0; i < sfcount; i++) {
2331 err = ip6_mc_add1_src(pmc, sfmode, &psfsrc[i]);
2332 if (err)
2333 break;
2335 if (err) {
2336 int j;
2338 if (!delta)
2339 pmc->mca_sfcount[sfmode]--;
2340 for (j = 0; j < i; j++)
2341 ip6_mc_del1_src(pmc, sfmode, &psfsrc[j]);
2342 } else if (isexclude != (pmc->mca_sfcount[MCAST_EXCLUDE] != 0)) {
2343 struct ip6_sf_list *psf;
2345 /* filter mode change */
2346 if (pmc->mca_sfcount[MCAST_EXCLUDE])
2347 pmc->mca_sfmode = MCAST_EXCLUDE;
2348 else if (pmc->mca_sfcount[MCAST_INCLUDE])
2349 pmc->mca_sfmode = MCAST_INCLUDE;
2350 /* else no filters; keep old mode for reports */
2352 pmc->mca_crcount = idev->mc_qrv;
2353 idev->mc_ifc_count = pmc->mca_crcount;
2354 for (psf = pmc->mca_sources; psf; psf = psf->sf_next)
2355 psf->sf_crcount = 0;
2356 mld_ifc_event(idev);
2357 } else if (sf_setstate(pmc))
2358 mld_ifc_event(idev);
2359 spin_unlock_bh(&pmc->mca_lock);
2360 read_unlock_bh(&idev->lock);
2361 return err;
2364 static void ip6_mc_clear_src(struct ifmcaddr6 *pmc)
2366 struct ip6_sf_list *psf, *nextpsf;
2368 for (psf = pmc->mca_tomb; psf; psf = nextpsf) {
2369 nextpsf = psf->sf_next;
2370 kfree(psf);
2372 pmc->mca_tomb = NULL;
2373 for (psf = pmc->mca_sources; psf; psf = nextpsf) {
2374 nextpsf = psf->sf_next;
2375 kfree(psf);
2377 pmc->mca_sources = NULL;
2378 pmc->mca_sfmode = MCAST_EXCLUDE;
2379 pmc->mca_sfcount[MCAST_INCLUDE] = 0;
2380 pmc->mca_sfcount[MCAST_EXCLUDE] = 1;
2384 static void igmp6_join_group(struct ifmcaddr6 *ma)
2386 unsigned long delay;
2388 if (ma->mca_flags & MAF_NOREPORT)
2389 return;
2391 igmp6_send(&ma->mca_addr, ma->idev->dev, ICMPV6_MGM_REPORT);
2393 delay = prandom_u32() % unsolicited_report_interval(ma->idev);
2395 spin_lock_bh(&ma->mca_lock);
2396 if (del_timer(&ma->mca_timer)) {
2397 refcount_dec(&ma->mca_refcnt);
2398 delay = ma->mca_timer.expires - jiffies;
2401 if (!mod_timer(&ma->mca_timer, jiffies + delay))
2402 refcount_inc(&ma->mca_refcnt);
2403 ma->mca_flags |= MAF_TIMER_RUNNING | MAF_LAST_REPORTER;
2404 spin_unlock_bh(&ma->mca_lock);
2407 static int ip6_mc_leave_src(struct sock *sk, struct ipv6_mc_socklist *iml,
2408 struct inet6_dev *idev)
2410 int err;
2412 /* callers have the socket lock and rtnl lock
2413 * so no other readers or writers of iml or its sflist
2415 if (!iml->sflist) {
2416 /* any-source empty exclude case */
2417 return ip6_mc_del_src(idev, &iml->addr, iml->sfmode, 0, NULL, 0);
2419 err = ip6_mc_del_src(idev, &iml->addr, iml->sfmode,
2420 iml->sflist->sl_count, iml->sflist->sl_addr, 0);
2421 sock_kfree_s(sk, iml->sflist, IP6_SFLSIZE(iml->sflist->sl_max));
2422 iml->sflist = NULL;
2423 return err;
2426 static void igmp6_leave_group(struct ifmcaddr6 *ma)
2428 if (mld_in_v1_mode(ma->idev)) {
2429 if (ma->mca_flags & MAF_LAST_REPORTER)
2430 igmp6_send(&ma->mca_addr, ma->idev->dev,
2431 ICMPV6_MGM_REDUCTION);
2432 } else {
2433 mld_add_delrec(ma->idev, ma);
2434 mld_ifc_event(ma->idev);
2438 static void mld_gq_timer_expire(struct timer_list *t)
2440 struct inet6_dev *idev = from_timer(idev, t, mc_gq_timer);
2442 idev->mc_gq_running = 0;
2443 mld_send_report(idev, NULL);
2444 in6_dev_put(idev);
2447 static void mld_ifc_timer_expire(struct timer_list *t)
2449 struct inet6_dev *idev = from_timer(idev, t, mc_ifc_timer);
2451 mld_send_cr(idev);
2452 if (idev->mc_ifc_count) {
2453 idev->mc_ifc_count--;
2454 if (idev->mc_ifc_count)
2455 mld_ifc_start_timer(idev, idev->mc_maxdelay);
2457 in6_dev_put(idev);
2460 static void mld_ifc_event(struct inet6_dev *idev)
2462 if (mld_in_v1_mode(idev))
2463 return;
2464 idev->mc_ifc_count = idev->mc_qrv;
2465 mld_ifc_start_timer(idev, 1);
2468 static void igmp6_timer_handler(struct timer_list *t)
2470 struct ifmcaddr6 *ma = from_timer(ma, t, mca_timer);
2472 if (mld_in_v1_mode(ma->idev))
2473 igmp6_send(&ma->mca_addr, ma->idev->dev, ICMPV6_MGM_REPORT);
2474 else
2475 mld_send_report(ma->idev, ma);
2477 spin_lock(&ma->mca_lock);
2478 ma->mca_flags |= MAF_LAST_REPORTER;
2479 ma->mca_flags &= ~MAF_TIMER_RUNNING;
2480 spin_unlock(&ma->mca_lock);
2481 ma_put(ma);
2484 /* Device changing type */
2486 void ipv6_mc_unmap(struct inet6_dev *idev)
2488 struct ifmcaddr6 *i;
2490 /* Install multicast list, except for all-nodes (already installed) */
2492 read_lock_bh(&idev->lock);
2493 for (i = idev->mc_list; i; i = i->next)
2494 igmp6_group_dropped(i);
2495 read_unlock_bh(&idev->lock);
/*
 * Counterpart of ipv6_mc_unmap(): simply delegates to ipv6_mc_up().
 */
void ipv6_mc_remap(struct inet6_dev *idev)
{
	ipv6_mc_up(idev);
}
2503 /* Device going down */
2505 void ipv6_mc_down(struct inet6_dev *idev)
2507 struct ifmcaddr6 *i;
2509 /* Withdraw multicast list */
2511 read_lock_bh(&idev->lock);
2513 for (i = idev->mc_list; i; i = i->next)
2514 igmp6_group_dropped(i);
2516 /* Should stop timer after group drop. or we will
2517 * start timer again in mld_ifc_event()
2519 mld_ifc_stop_timer(idev);
2520 mld_gq_stop_timer(idev);
2521 mld_dad_stop_timer(idev);
2522 read_unlock_bh(&idev->lock);
2525 static void ipv6_mc_reset(struct inet6_dev *idev)
2527 idev->mc_qrv = sysctl_mld_qrv;
2528 idev->mc_qi = MLD_QI_DEFAULT;
2529 idev->mc_qri = MLD_QRI_DEFAULT;
2530 idev->mc_v1_seen = 0;
2531 idev->mc_maxdelay = unsolicited_report_interval(idev);
2534 /* Device going up */
2536 void ipv6_mc_up(struct inet6_dev *idev)
2538 struct ifmcaddr6 *i;
2540 /* Install multicast list, except for all-nodes (already installed) */
2542 read_lock_bh(&idev->lock);
2543 ipv6_mc_reset(idev);
2544 for (i = idev->mc_list; i; i = i->next) {
2545 mld_del_delrec(idev, i);
2546 igmp6_group_added(i);
2548 read_unlock_bh(&idev->lock);
2551 /* IPv6 device initialization. */
2553 void ipv6_mc_init_dev(struct inet6_dev *idev)
2555 write_lock_bh(&idev->lock);
2556 spin_lock_init(&idev->mc_lock);
2557 idev->mc_gq_running = 0;
2558 timer_setup(&idev->mc_gq_timer, mld_gq_timer_expire, 0);
2559 idev->mc_tomb = NULL;
2560 idev->mc_ifc_count = 0;
2561 timer_setup(&idev->mc_ifc_timer, mld_ifc_timer_expire, 0);
2562 timer_setup(&idev->mc_dad_timer, mld_dad_timer_expire, 0);
2563 ipv6_mc_reset(idev);
2564 write_unlock_bh(&idev->lock);
2568 * Device is about to be destroyed: clean up.
2571 void ipv6_mc_destroy_dev(struct inet6_dev *idev)
2573 struct ifmcaddr6 *i;
2575 /* Deactivate timers */
2576 ipv6_mc_down(idev);
2577 mld_clear_delrec(idev);
2579 /* Delete all-nodes address. */
2580 /* We cannot call ipv6_dev_mc_dec() directly, our caller in
2581 * addrconf.c has NULL'd out dev->ip6_ptr so in6_dev_get() will
2582 * fail.
2584 __ipv6_dev_mc_dec(idev, &in6addr_linklocal_allnodes);
2586 if (idev->cnf.forwarding)
2587 __ipv6_dev_mc_dec(idev, &in6addr_linklocal_allrouters);
2589 write_lock_bh(&idev->lock);
2590 while ((i = idev->mc_list) != NULL) {
2591 idev->mc_list = i->next;
2593 write_unlock_bh(&idev->lock);
2594 ma_put(i);
2595 write_lock_bh(&idev->lock);
2597 write_unlock_bh(&idev->lock);
2600 static void ipv6_mc_rejoin_groups(struct inet6_dev *idev)
2602 struct ifmcaddr6 *pmc;
2604 ASSERT_RTNL();
2606 if (mld_in_v1_mode(idev)) {
2607 read_lock_bh(&idev->lock);
2608 for (pmc = idev->mc_list; pmc; pmc = pmc->next)
2609 igmp6_join_group(pmc);
2610 read_unlock_bh(&idev->lock);
2611 } else
2612 mld_send_report(idev, NULL);
2615 static int ipv6_mc_netdev_event(struct notifier_block *this,
2616 unsigned long event,
2617 void *ptr)
2619 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
2620 struct inet6_dev *idev = __in6_dev_get(dev);
2622 switch (event) {
2623 case NETDEV_RESEND_IGMP:
2624 if (idev)
2625 ipv6_mc_rejoin_groups(idev);
2626 break;
2627 default:
2628 break;
2631 return NOTIFY_DONE;
2634 static struct notifier_block igmp6_netdev_notifier = {
2635 .notifier_call = ipv6_mc_netdev_event,
2638 #ifdef CONFIG_PROC_FS
2639 struct igmp6_mc_iter_state {
2640 struct seq_net_private p;
2641 struct net_device *dev;
2642 struct inet6_dev *idev;
2645 #define igmp6_mc_seq_private(seq) ((struct igmp6_mc_iter_state *)(seq)->private)
2647 static inline struct ifmcaddr6 *igmp6_mc_get_first(struct seq_file *seq)
2649 struct ifmcaddr6 *im = NULL;
2650 struct igmp6_mc_iter_state *state = igmp6_mc_seq_private(seq);
2651 struct net *net = seq_file_net(seq);
2653 state->idev = NULL;
2654 for_each_netdev_rcu(net, state->dev) {
2655 struct inet6_dev *idev;
2656 idev = __in6_dev_get(state->dev);
2657 if (!idev)
2658 continue;
2659 read_lock_bh(&idev->lock);
2660 im = idev->mc_list;
2661 if (im) {
2662 state->idev = idev;
2663 break;
2665 read_unlock_bh(&idev->lock);
2667 return im;
2670 static struct ifmcaddr6 *igmp6_mc_get_next(struct seq_file *seq, struct ifmcaddr6 *im)
2672 struct igmp6_mc_iter_state *state = igmp6_mc_seq_private(seq);
2674 im = im->next;
2675 while (!im) {
2676 if (likely(state->idev))
2677 read_unlock_bh(&state->idev->lock);
2679 state->dev = next_net_device_rcu(state->dev);
2680 if (!state->dev) {
2681 state->idev = NULL;
2682 break;
2684 state->idev = __in6_dev_get(state->dev);
2685 if (!state->idev)
2686 continue;
2687 read_lock_bh(&state->idev->lock);
2688 im = state->idev->mc_list;
2690 return im;
2693 static struct ifmcaddr6 *igmp6_mc_get_idx(struct seq_file *seq, loff_t pos)
2695 struct ifmcaddr6 *im = igmp6_mc_get_first(seq);
2696 if (im)
2697 while (pos && (im = igmp6_mc_get_next(seq, im)) != NULL)
2698 --pos;
2699 return pos ? NULL : im;
2702 static void *igmp6_mc_seq_start(struct seq_file *seq, loff_t *pos)
2703 __acquires(RCU)
2705 rcu_read_lock();
2706 return igmp6_mc_get_idx(seq, *pos);
2709 static void *igmp6_mc_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2711 struct ifmcaddr6 *im = igmp6_mc_get_next(seq, v);
2713 ++*pos;
2714 return im;
2717 static void igmp6_mc_seq_stop(struct seq_file *seq, void *v)
2718 __releases(RCU)
2720 struct igmp6_mc_iter_state *state = igmp6_mc_seq_private(seq);
2722 if (likely(state->idev)) {
2723 read_unlock_bh(&state->idev->lock);
2724 state->idev = NULL;
2726 state->dev = NULL;
2727 rcu_read_unlock();
2730 static int igmp6_mc_seq_show(struct seq_file *seq, void *v)
2732 struct ifmcaddr6 *im = (struct ifmcaddr6 *)v;
2733 struct igmp6_mc_iter_state *state = igmp6_mc_seq_private(seq);
2735 seq_printf(seq,
2736 "%-4d %-15s %pi6 %5d %08X %ld\n",
2737 state->dev->ifindex, state->dev->name,
2738 &im->mca_addr,
2739 im->mca_users, im->mca_flags,
2740 (im->mca_flags&MAF_TIMER_RUNNING) ?
2741 jiffies_to_clock_t(im->mca_timer.expires-jiffies) : 0);
2742 return 0;
2745 static const struct seq_operations igmp6_mc_seq_ops = {
2746 .start = igmp6_mc_seq_start,
2747 .next = igmp6_mc_seq_next,
2748 .stop = igmp6_mc_seq_stop,
2749 .show = igmp6_mc_seq_show,
2752 static int igmp6_mc_seq_open(struct inode *inode, struct file *file)
2754 return seq_open_net(inode, file, &igmp6_mc_seq_ops,
2755 sizeof(struct igmp6_mc_iter_state));
2758 static const struct file_operations igmp6_mc_seq_fops = {
2759 .open = igmp6_mc_seq_open,
2760 .read = seq_read,
2761 .llseek = seq_lseek,
2762 .release = seq_release_net,
2765 struct igmp6_mcf_iter_state {
2766 struct seq_net_private p;
2767 struct net_device *dev;
2768 struct inet6_dev *idev;
2769 struct ifmcaddr6 *im;
2772 #define igmp6_mcf_seq_private(seq) ((struct igmp6_mcf_iter_state *)(seq)->private)
2774 static inline struct ip6_sf_list *igmp6_mcf_get_first(struct seq_file *seq)
2776 struct ip6_sf_list *psf = NULL;
2777 struct ifmcaddr6 *im = NULL;
2778 struct igmp6_mcf_iter_state *state = igmp6_mcf_seq_private(seq);
2779 struct net *net = seq_file_net(seq);
2781 state->idev = NULL;
2782 state->im = NULL;
2783 for_each_netdev_rcu(net, state->dev) {
2784 struct inet6_dev *idev;
2785 idev = __in6_dev_get(state->dev);
2786 if (unlikely(idev == NULL))
2787 continue;
2788 read_lock_bh(&idev->lock);
2789 im = idev->mc_list;
2790 if (likely(im)) {
2791 spin_lock_bh(&im->mca_lock);
2792 psf = im->mca_sources;
2793 if (likely(psf)) {
2794 state->im = im;
2795 state->idev = idev;
2796 break;
2798 spin_unlock_bh(&im->mca_lock);
2800 read_unlock_bh(&idev->lock);
2802 return psf;
2805 static struct ip6_sf_list *igmp6_mcf_get_next(struct seq_file *seq, struct ip6_sf_list *psf)
2807 struct igmp6_mcf_iter_state *state = igmp6_mcf_seq_private(seq);
2809 psf = psf->sf_next;
2810 while (!psf) {
2811 spin_unlock_bh(&state->im->mca_lock);
2812 state->im = state->im->next;
2813 while (!state->im) {
2814 if (likely(state->idev))
2815 read_unlock_bh(&state->idev->lock);
2817 state->dev = next_net_device_rcu(state->dev);
2818 if (!state->dev) {
2819 state->idev = NULL;
2820 goto out;
2822 state->idev = __in6_dev_get(state->dev);
2823 if (!state->idev)
2824 continue;
2825 read_lock_bh(&state->idev->lock);
2826 state->im = state->idev->mc_list;
2828 if (!state->im)
2829 break;
2830 spin_lock_bh(&state->im->mca_lock);
2831 psf = state->im->mca_sources;
2833 out:
2834 return psf;
2837 static struct ip6_sf_list *igmp6_mcf_get_idx(struct seq_file *seq, loff_t pos)
2839 struct ip6_sf_list *psf = igmp6_mcf_get_first(seq);
2840 if (psf)
2841 while (pos && (psf = igmp6_mcf_get_next(seq, psf)) != NULL)
2842 --pos;
2843 return pos ? NULL : psf;
2846 static void *igmp6_mcf_seq_start(struct seq_file *seq, loff_t *pos)
2847 __acquires(RCU)
2849 rcu_read_lock();
2850 return *pos ? igmp6_mcf_get_idx(seq, *pos - 1) : SEQ_START_TOKEN;
2853 static void *igmp6_mcf_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2855 struct ip6_sf_list *psf;
2856 if (v == SEQ_START_TOKEN)
2857 psf = igmp6_mcf_get_first(seq);
2858 else
2859 psf = igmp6_mcf_get_next(seq, v);
2860 ++*pos;
2861 return psf;
2864 static void igmp6_mcf_seq_stop(struct seq_file *seq, void *v)
2865 __releases(RCU)
2867 struct igmp6_mcf_iter_state *state = igmp6_mcf_seq_private(seq);
2868 if (likely(state->im)) {
2869 spin_unlock_bh(&state->im->mca_lock);
2870 state->im = NULL;
2872 if (likely(state->idev)) {
2873 read_unlock_bh(&state->idev->lock);
2874 state->idev = NULL;
2876 state->dev = NULL;
2877 rcu_read_unlock();
2880 static int igmp6_mcf_seq_show(struct seq_file *seq, void *v)
2882 struct ip6_sf_list *psf = (struct ip6_sf_list *)v;
2883 struct igmp6_mcf_iter_state *state = igmp6_mcf_seq_private(seq);
2885 if (v == SEQ_START_TOKEN) {
2886 seq_puts(seq, "Idx Device Multicast Address Source Address INC EXC\n");
2887 } else {
2888 seq_printf(seq,
2889 "%3d %6.6s %pi6 %pi6 %6lu %6lu\n",
2890 state->dev->ifindex, state->dev->name,
2891 &state->im->mca_addr,
2892 &psf->sf_addr,
2893 psf->sf_count[MCAST_INCLUDE],
2894 psf->sf_count[MCAST_EXCLUDE]);
2896 return 0;
2899 static const struct seq_operations igmp6_mcf_seq_ops = {
2900 .start = igmp6_mcf_seq_start,
2901 .next = igmp6_mcf_seq_next,
2902 .stop = igmp6_mcf_seq_stop,
2903 .show = igmp6_mcf_seq_show,
2906 static int igmp6_mcf_seq_open(struct inode *inode, struct file *file)
2908 return seq_open_net(inode, file, &igmp6_mcf_seq_ops,
2909 sizeof(struct igmp6_mcf_iter_state));
2912 static const struct file_operations igmp6_mcf_seq_fops = {
2913 .open = igmp6_mcf_seq_open,
2914 .read = seq_read,
2915 .llseek = seq_lseek,
2916 .release = seq_release_net,
2919 static int __net_init igmp6_proc_init(struct net *net)
2921 int err;
2923 err = -ENOMEM;
2924 if (!proc_create("igmp6", S_IRUGO, net->proc_net, &igmp6_mc_seq_fops))
2925 goto out;
2926 if (!proc_create("mcfilter6", S_IRUGO, net->proc_net,
2927 &igmp6_mcf_seq_fops))
2928 goto out_proc_net_igmp6;
2930 err = 0;
2931 out:
2932 return err;
2934 out_proc_net_igmp6:
2935 remove_proc_entry("igmp6", net->proc_net);
2936 goto out;
2939 static void __net_exit igmp6_proc_exit(struct net *net)
2941 remove_proc_entry("mcfilter6", net->proc_net);
2942 remove_proc_entry("igmp6", net->proc_net);
2944 #else
/* Without CONFIG_PROC_FS there is nothing to create; report success. */
static inline int igmp6_proc_init(struct net *net)
{
	return 0;
}
/* Without CONFIG_PROC_FS there is nothing to remove. */
static inline void igmp6_proc_exit(struct net *net)
{
}
2952 #endif
2954 static int __net_init igmp6_net_init(struct net *net)
2956 int err;
2958 err = inet_ctl_sock_create(&net->ipv6.igmp_sk, PF_INET6,
2959 SOCK_RAW, IPPROTO_ICMPV6, net);
2960 if (err < 0) {
2961 pr_err("Failed to initialize the IGMP6 control socket (err %d)\n",
2962 err);
2963 goto out;
2966 inet6_sk(net->ipv6.igmp_sk)->hop_limit = 1;
2968 err = inet_ctl_sock_create(&net->ipv6.mc_autojoin_sk, PF_INET6,
2969 SOCK_RAW, IPPROTO_ICMPV6, net);
2970 if (err < 0) {
2971 pr_err("Failed to initialize the IGMP6 autojoin socket (err %d)\n",
2972 err);
2973 goto out_sock_create;
2976 err = igmp6_proc_init(net);
2977 if (err)
2978 goto out_sock_create_autojoin;
2980 return 0;
2982 out_sock_create_autojoin:
2983 inet_ctl_sock_destroy(net->ipv6.mc_autojoin_sk);
2984 out_sock_create:
2985 inet_ctl_sock_destroy(net->ipv6.igmp_sk);
2986 out:
2987 return err;
2990 static void __net_exit igmp6_net_exit(struct net *net)
2992 inet_ctl_sock_destroy(net->ipv6.igmp_sk);
2993 inet_ctl_sock_destroy(net->ipv6.mc_autojoin_sk);
2994 igmp6_proc_exit(net);
2997 static struct pernet_operations igmp6_net_ops = {
2998 .init = igmp6_net_init,
2999 .exit = igmp6_net_exit,
3002 int __init igmp6_init(void)
3004 return register_pernet_subsys(&igmp6_net_ops);
3007 int __init igmp6_late_init(void)
3009 return register_netdevice_notifier(&igmp6_netdev_notifier);
3012 void igmp6_cleanup(void)
3014 unregister_pernet_subsys(&igmp6_net_ops);
3017 void igmp6_late_cleanup(void)
3019 unregister_netdevice_notifier(&igmp6_netdev_notifier);