2 * Multicast support for IPv6
3 * Linux INET6 implementation
6 * Pedro Roque <roque@di.fc.ul.pt>
8 * Based on linux/ipv4/igmp.c and linux/ipv4/ip_sockglue.c
10 * This program is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU General Public License
12 * as published by the Free Software Foundation; either version
13 * 2 of the License, or (at your option) any later version.
18 * yoshfuji : fix format of router-alert option
19 * YOSHIFUJI Hideaki @USAGI:
20 * Fixed source address for MLD message based on
21 * <draft-ietf-magma-mld-source-05.txt>.
22 * YOSHIFUJI Hideaki @USAGI:
23 * - Ignore Queries for invalid addresses.
24 * - MLD for link-local addresses.
25 * David L Stevens <dlstevens@us.ibm.com>:
29 #include <linux/module.h>
30 #include <linux/errno.h>
31 #include <linux/types.h>
32 #include <linux/string.h>
33 #include <linux/socket.h>
34 #include <linux/sockios.h>
35 #include <linux/jiffies.h>
36 #include <linux/times.h>
37 #include <linux/net.h>
39 #include <linux/in6.h>
40 #include <linux/netdevice.h>
41 #include <linux/if_arp.h>
42 #include <linux/route.h>
43 #include <linux/init.h>
44 #include <linux/proc_fs.h>
45 #include <linux/seq_file.h>
46 #include <linux/slab.h>
47 #include <linux/pkt_sched.h>
50 #include <linux/netfilter.h>
51 #include <linux/netfilter_ipv6.h>
53 #include <net/net_namespace.h>
58 #include <net/protocol.h>
59 #include <net/if_inet6.h>
60 #include <net/ndisc.h>
61 #include <net/addrconf.h>
62 #include <net/ip6_route.h>
63 #include <net/inet_common.h>
65 #include <net/ip6_checksum.h>
/*
 * Compile-time layout checks: each array entry is a BUILD_BUG_ON_ZERO() over
 * an "offsetof(...) % 4" expression, covering mld2_query.mld2q_srcs,
 * mld2_report.mld2r_grec and mld2_grec.grec_mca.  The array itself is tagged
 * __unused__.
 */
67 /* Ensure that we have struct in6_addr aligned on 32bit word. */
68 static int __mld2_query_bugs[] __attribute__((__unused__)) = {
69 BUILD_BUG_ON_ZERO(offsetof(struct mld2_query, mld2q_srcs) % 4),
70 BUILD_BUG_ON_ZERO(offsetof(struct mld2_report, mld2r_grec) % 4),
71 BUILD_BUG_ON_ZERO(offsetof(struct mld2_grec, grec_mca) % 4)
/* File-local in6_addr initialised from MLD2_ALL_MCR_INIT. */
74 static struct in6_addr mld2_all_mcr = MLD2_ALL_MCR_INIT;
/*
 * Forward prototypes for file-local (static) helpers.
 * NOTE(review): some multi-line prototypes are missing their final line in
 * this listing (the embedded line numbers skip 92 and 95).
 */
76 static void igmp6_join_group(struct ifmcaddr6 *ma);
77 static void igmp6_leave_group(struct ifmcaddr6 *ma);
78 static void igmp6_timer_handler(struct timer_list *t);
80 static void mld_gq_timer_expire(struct timer_list *t);
81 static void mld_ifc_timer_expire(struct timer_list *t);
82 static void mld_ifc_event(struct inet6_dev *idev);
83 static void mld_add_delrec(struct inet6_dev *idev, struct ifmcaddr6 *pmc);
84 static void mld_del_delrec(struct inet6_dev *idev, struct ifmcaddr6 *pmc);
85 static void mld_clear_delrec(struct inet6_dev *idev);
86 static bool mld_in_v1_mode(const struct inet6_dev *idev);
87 static int sf_setstate(struct ifmcaddr6 *pmc);
88 static void sf_markstate(struct ifmcaddr6 *pmc);
89 static void ip6_mc_clear_src(struct ifmcaddr6 *pmc);
90 static int ip6_mc_del_src(struct inet6_dev *idev, const struct in6_addr *pmca,
91 int sfmode, int sfcount, const struct in6_addr *psfsrc,
93 static int ip6_mc_add_src(struct inet6_dev *idev, const struct in6_addr *pmca,
94 int sfmode, int sfcount, const struct in6_addr *psfsrc,
96 static int ip6_mc_leave_src(struct sock *sk, struct ipv6_mc_socklist *iml,
97 struct inet6_dev *idev);
/*
 * MLD protocol defaults and limits.  The intervals are expressed in jiffies
 * (multiples of HZ); the query lengths are plain byte counts compared against
 * the received payload length in igmp6_event_query().  The two sysctl_*
 * variables start out at IPV6_MLD_MAX_MSF and MLD_QRV_DEFAULT respectively.
 */
99 #define MLD_QRV_DEFAULT 2
100 /* RFC3810, 9.2. Query Interval */
101 #define MLD_QI_DEFAULT (125 * HZ)
102 /* RFC3810, 9.3. Query Response Interval */
103 #define MLD_QRI_DEFAULT (10 * HZ)
105 /* RFC3810, 8.1 Query Version Distinctions */
106 #define MLD_V1_QUERY_LEN 24
107 #define MLD_V2_QUERY_LEN_MIN 28
109 #define IPV6_MLD_MAX_MSF 64
111 int sysctl_mld_max_msf __read_mostly = IPV6_MLD_MAX_MSF;
112 int sysctl_mld_qrv __read_mostly = MLD_QRV_DEFAULT;
115 * socket join on multicast group
/*
 * Iterate @pmc over the list headed at np->ipv6_mc_list, loading the head and
 * every ->next link with rcu_dereference().
 * NOTE(review): the loop-condition line (embedded line 120) is missing from
 * this listing.
 */
118 #define for_each_pmc_rcu(np, pmc) \
119 for (pmc = rcu_dereference(np->ipv6_mc_list); \
121 pmc = rcu_dereference(pmc->next))
/*
 * Return the unsolicited-report interval for @idev: the MLDv1 or MLDv2 value
 * from idev->cnf, selected by mld_in_v1_mode(idev).  A non-positive
 * configured value is replaced by 1.
 */
123 static int unsolicited_report_interval(struct inet6_dev *idev)
127 if (mld_in_v1_mode(idev))
128 iv = idev->cnf.mldv1_unsolicited_report_interval;
130 iv = idev->cnf.mldv2_unsolicited_report_interval;
132 return iv > 0 ? iv : 1;
/*
 * Join socket @sk to multicast group @addr, optionally on interface @ifindex.
 *
 * Steps visible in this listing: check that @addr is multicast; scan the
 * socket's existing memberships for an entry with the same address (and same
 * ifindex unless @ifindex is 0); allocate a new ipv6_mc_socklist with
 * sock_kmalloc(); resolve the device (both rt6_lookup() and
 * __dev_get_by_index() appear); initialise the entry as MCAST_EXCLUDE with a
 * NULL source list; call ipv6_dev_mc_inc() on the device; and finally link
 * the entry at the head of np->ipv6_mc_list with rcu_assign_pointer().
 * The two sock_kfree_s() calls release the new entry, presumably on the
 * "no device" and "ipv6_dev_mc_inc() failed" paths.
 *
 * NOTE(review): the listing has gaps (embedded line numbers skip); return
 * values and branch conditions must be confirmed against the full source.
 */
135 int ipv6_sock_mc_join(struct sock *sk, int ifindex, const struct in6_addr *addr)
137 struct net_device *dev = NULL;
138 struct ipv6_mc_socklist *mc_lst;
139 struct ipv6_pinfo *np = inet6_sk(sk);
140 struct net *net = sock_net(sk);
145 if (!ipv6_addr_is_multicast(addr))
149 for_each_pmc_rcu(np, mc_lst) {
150 if ((ifindex == 0 || mc_lst->ifindex == ifindex) &&
151 ipv6_addr_equal(&mc_lst->addr, addr)) {
158 mc_lst = sock_kmalloc(sk, sizeof(struct ipv6_mc_socklist), GFP_KERNEL);
164 mc_lst->addr = *addr;
168 rt = rt6_lookup(net, addr, NULL, 0, NULL, 0);
174 dev = __dev_get_by_index(net, ifindex);
177 sock_kfree_s(sk, mc_lst, sizeof(*mc_lst));
181 mc_lst->ifindex = dev->ifindex;
182 mc_lst->sfmode = MCAST_EXCLUDE;
183 rwlock_init(&mc_lst->sflock);
184 mc_lst->sflist = NULL;
187 * now add/increase the group membership on the device
190 err = ipv6_dev_mc_inc(dev, addr);
193 sock_kfree_s(sk, mc_lst, sizeof(*mc_lst));
197 mc_lst->next = np->ipv6_mc_list;
198 rcu_assign_pointer(np->ipv6_mc_list, mc_lst);
202 EXPORT_SYMBOL(ipv6_sock_mc_join);
205 * socket leave on multicast group
/*
 * Remove socket @sk's membership of group @addr (on @ifindex, or on any
 * interface when @ifindex is 0).
 *
 * The list is walked through a pointer-to-link (@lnk) using
 * rtnl_dereference().  For the matching entry the device is looked up by the
 * stored ifindex; ip6_mc_leave_src() is called with the device's inet6_dev
 * followed by __ipv6_dev_mc_dec(), or with a NULL idev in the other visible
 * branch.  The entry's size is subtracted from sk->sk_omem_alloc and the
 * entry is freed with kfree_rcu().  -EADDRNOTAVAIL is the return value at the
 * end of the function, i.e. presumably when no entry matched.
 *
 * NOTE(review): the listing has gaps; the unlink statement and the success
 * return are not visible here.
 */
207 int ipv6_sock_mc_drop(struct sock *sk, int ifindex, const struct in6_addr *addr)
209 struct ipv6_pinfo *np = inet6_sk(sk);
210 struct ipv6_mc_socklist *mc_lst;
211 struct ipv6_mc_socklist __rcu **lnk;
212 struct net *net = sock_net(sk);
216 if (!ipv6_addr_is_multicast(addr))
219 for (lnk = &np->ipv6_mc_list;
220 (mc_lst = rtnl_dereference(*lnk)) != NULL;
221 lnk = &mc_lst->next) {
222 if ((ifindex == 0 || mc_lst->ifindex == ifindex) &&
223 ipv6_addr_equal(&mc_lst->addr, addr)) {
224 struct net_device *dev;
228 dev = __dev_get_by_index(net, mc_lst->ifindex);
230 struct inet6_dev *idev = __in6_dev_get(dev);
232 (void) ip6_mc_leave_src(sk, mc_lst, idev);
234 __ipv6_dev_mc_dec(idev, &mc_lst->addr);
236 (void) ip6_mc_leave_src(sk, mc_lst, NULL);
238 atomic_sub(sizeof(*mc_lst), &sk->sk_omem_alloc);
239 kfree_rcu(mc_lst, rcu);
244 return -EADDRNOTAVAIL;
246 EXPORT_SYMBOL(ipv6_sock_mc_drop);
/*
 * Find the inet6_dev to use for multicast group @group.
 *
 * Visible steps: a route lookup on @group via rt6_lookup(), a device lookup
 * via dev_get_by_index_rcu(), then __in6_dev_get(dev).  idev->lock is taken
 * with read_lock_bh(); the read_unlock_bh() that follows is presumably on a
 * failure path, because callers in this file call read_unlock_bh(&idev->lock)
 * themselves once they are done with the result.
 *
 * NOTE(review): the third parameter, the conditions and the return statements
 * are not visible in this listing.
 */
248 /* called with rcu_read_lock() */
249 static struct inet6_dev *ip6_mc_find_dev_rcu(struct net *net,
250 const struct in6_addr *group,
253 struct net_device *dev = NULL;
254 struct inet6_dev *idev = NULL;
257 struct rt6_info *rt = rt6_lookup(net, group, NULL, 0, NULL, 0);
264 dev = dev_get_by_index_rcu(net, ifindex);
268 idev = __in6_dev_get(dev);
271 read_lock_bh(&idev->lock);
273 read_unlock_bh(&idev->lock);
/*
 * Drop every multicast membership held by socket @sk.
 *
 * Repeatedly pops the head of np->ipv6_mc_list (read with
 * rtnl_dereference()).  For each entry the device is looked up by ifindex;
 * ip6_mc_leave_src() is called with the inet6_dev followed by
 * __ipv6_dev_mc_dec(), or with a NULL idev in the other visible branch.  The
 * entry's size is then subtracted from sk->sk_omem_alloc and the entry is
 * freed with kfree_rcu().
 *
 * NOTE(review): branch conditions are not visible in this listing.
 */
279 void __ipv6_sock_mc_close(struct sock *sk)
281 struct ipv6_pinfo *np = inet6_sk(sk);
282 struct ipv6_mc_socklist *mc_lst;
283 struct net *net = sock_net(sk);
287 while ((mc_lst = rtnl_dereference(np->ipv6_mc_list)) != NULL) {
288 struct net_device *dev;
290 np->ipv6_mc_list = mc_lst->next;
292 dev = __dev_get_by_index(net, mc_lst->ifindex);
294 struct inet6_dev *idev = __in6_dev_get(dev);
296 (void) ip6_mc_leave_src(sk, mc_lst, idev);
298 __ipv6_dev_mc_dec(idev, &mc_lst->addr);
300 (void) ip6_mc_leave_src(sk, mc_lst, NULL);
302 atomic_sub(sizeof(*mc_lst), &sk->sk_omem_alloc);
303 kfree_rcu(mc_lst, rcu);
/*
 * Wrapper around __ipv6_sock_mc_close(): first tests np->ipv6_mc_list with
 * rcu_access_pointer() (presumably returning early when it is empty), then
 * calls __ipv6_sock_mc_close(sk).
 * NOTE(review): any locking around the call is not visible in this listing.
 */
307 void ipv6_sock_mc_close(struct sock *sk)
309 struct ipv6_pinfo *np = inet6_sk(sk);
311 if (!rcu_access_pointer(np->ipv6_mc_list))
314 __ipv6_sock_mc_close(sk);
/*
 * Add or remove one source address in the per-socket source filter of a
 * multicast group, as described by @pgsr, using filter mode @omode.
 *
 * Steps visible in this listing:
 *  - the group must be multicast; the interface is found with
 *    ip6_mc_find_dev_rcu();
 *  - the socket's membership for the group is located (restricted to
 *    gsr_interface when that is non-zero); a prior join is required;
 *  - the filter mode is compared with @omode; with an empty filter a mode
 *    switch is applied to the interface via ip6_mc_add_src()/ip6_mc_del_src();
 *  - under write_lock(&pmc->sflock) the source is either removed from
 *    psl->sl_addr[] (later entries shifted down, interface filter updated with
 *    ip6_mc_del_src()) or inserted (list grown by IP6_SFBLOCK entries with
 *    sock_kmalloc(..., GFP_ATOMIC), capped by sysctl_mld_max_msf, interface
 *    filter updated with ip6_mc_add_src());
 *  - ipv6_sock_mc_drop() is called at the end, presumably for the
 *    "(INCLUDE, empty) == LEAVE_GROUP" special case noted below.
 *
 * err is preset to -EADDRNOTAVAIL before the lookup.
 *
 * NOTE(review): the listing has gaps (embedded line numbers skip); the exact
 * branch structure and other return codes must be confirmed in the full file.
 */
318 int ip6_mc_source(int add, int omode, struct sock *sk,
319 struct group_source_req *pgsr)
321 struct in6_addr *source, *group;
322 struct ipv6_mc_socklist *pmc;
323 struct inet6_dev *idev;
324 struct ipv6_pinfo *inet6 = inet6_sk(sk);
325 struct ip6_sf_socklist *psl;
326 struct net *net = sock_net(sk);
332 source = &((struct sockaddr_in6 *)&pgsr->gsr_source)->sin6_addr;
333 group = &((struct sockaddr_in6 *)&pgsr->gsr_group)->sin6_addr;
335 if (!ipv6_addr_is_multicast(group))
339 idev = ip6_mc_find_dev_rcu(net, group, pgsr->gsr_interface);
345 err = -EADDRNOTAVAIL;
347 for_each_pmc_rcu(inet6, pmc) {
348 if (pgsr->gsr_interface && pmc->ifindex != pgsr->gsr_interface)
350 if (ipv6_addr_equal(&pmc->addr, group))
353 if (!pmc) { /* must have a prior join */
357 /* if a source filter was set, must be the same mode as before */
359 if (pmc->sfmode != omode) {
363 } else if (pmc->sfmode != omode) {
364 /* allow mode switches for empty-set filters */
365 ip6_mc_add_src(idev, group, omode, 0, NULL, 0);
366 ip6_mc_del_src(idev, group, pmc->sfmode, 0, NULL, 0);
370 write_lock(&pmc->sflock);
376 goto done; /* err = -EADDRNOTAVAIL */
378 for (i = 0; i < psl->sl_count; i++) {
379 rv = !ipv6_addr_equal(&psl->sl_addr[i], source);
383 if (rv) /* source not found */
384 goto done; /* err = -EADDRNOTAVAIL */
386 /* special case - (INCLUDE, empty) == LEAVE_GROUP */
387 if (psl->sl_count == 1 && omode == MCAST_INCLUDE) {
392 /* update the interface filter */
393 ip6_mc_del_src(idev, group, omode, 1, source, 1);
395 for (j = i+1; j < psl->sl_count; j++)
396 psl->sl_addr[j-1] = psl->sl_addr[j];
401 /* else, add a new source to the filter */
403 if (psl && psl->sl_count >= sysctl_mld_max_msf) {
407 if (!psl || psl->sl_count == psl->sl_max) {
408 struct ip6_sf_socklist *newpsl;
409 int count = IP6_SFBLOCK;
412 count += psl->sl_max;
413 newpsl = sock_kmalloc(sk, IP6_SFLSIZE(count), GFP_ATOMIC);
418 newpsl->sl_max = count;
419 newpsl->sl_count = count - IP6_SFBLOCK;
421 for (i = 0; i < psl->sl_count; i++)
422 newpsl->sl_addr[i] = psl->sl_addr[i];
423 sock_kfree_s(sk, psl, IP6_SFLSIZE(psl->sl_max));
425 pmc->sflist = psl = newpsl;
427 rv = 1; /* > 0 for insert logic below if sl_count is 0 */
428 for (i = 0; i < psl->sl_count; i++) {
429 rv = !ipv6_addr_equal(&psl->sl_addr[i], source);
430 if (rv == 0) /* There is an error in the address. */
433 for (j = psl->sl_count-1; j >= i; j--)
434 psl->sl_addr[j+1] = psl->sl_addr[j];
435 psl->sl_addr[i] = *source;
438 /* update the interface list */
439 ip6_mc_add_src(idev, group, omode, 1, source, 1);
442 write_unlock(&pmc->sflock);
443 read_unlock_bh(&idev->lock);
446 err = ipv6_sock_mc_drop(sk, pgsr->gsr_interface, group);
/*
 * Replace the whole per-socket source filter of a multicast group with the
 * mode and source list supplied in @gsf.
 *
 * Steps visible in this listing:
 *  - the group must be multicast and gf_fmode must be MCAST_INCLUDE or
 *    MCAST_EXCLUDE;
 *  - the interface is found with ip6_mc_find_dev_rcu();
 *  - (INCLUDE, 0 sources) is tested separately; ipv6_sock_mc_drop() at the
 *    end is presumably the handling for that case;
 *  - the socket's membership on gf_interface is located (prior join needed);
 *  - when gf_numsrc is non-zero a new ip6_sf_socklist is allocated, filled
 *    from gf_slist[] and applied to the interface with ip6_mc_add_src(); it
 *    is freed again with sock_kfree_s(), presumably if that call fails.  With
 *    no sources, ip6_mc_add_src() is called with a NULL list;
 *  - under write_lock(&pmc->sflock) the old filter is removed from the
 *    interface with ip6_mc_del_src() and freed, then pmc->sflist and
 *    pmc->sfmode are switched to the new values.
 *
 * NOTE(review): the listing has gaps; return codes and branch structure must
 * be confirmed against the full source.
 */
450 int ip6_mc_msfilter(struct sock *sk, struct group_filter *gsf)
452 const struct in6_addr *group;
453 struct ipv6_mc_socklist *pmc;
454 struct inet6_dev *idev;
455 struct ipv6_pinfo *inet6 = inet6_sk(sk);
456 struct ip6_sf_socklist *newpsl, *psl;
457 struct net *net = sock_net(sk);
461 group = &((struct sockaddr_in6 *)&gsf->gf_group)->sin6_addr;
463 if (!ipv6_addr_is_multicast(group))
465 if (gsf->gf_fmode != MCAST_INCLUDE &&
466 gsf->gf_fmode != MCAST_EXCLUDE)
470 idev = ip6_mc_find_dev_rcu(net, group, gsf->gf_interface);
479 if (gsf->gf_fmode == MCAST_INCLUDE && gsf->gf_numsrc == 0) {
484 for_each_pmc_rcu(inet6, pmc) {
485 if (pmc->ifindex != gsf->gf_interface)
487 if (ipv6_addr_equal(&pmc->addr, group))
490 if (!pmc) { /* must have a prior join */
494 if (gsf->gf_numsrc) {
495 newpsl = sock_kmalloc(sk, IP6_SFLSIZE(gsf->gf_numsrc),
501 newpsl->sl_max = newpsl->sl_count = gsf->gf_numsrc;
502 for (i = 0; i < newpsl->sl_count; ++i) {
503 struct sockaddr_in6 *psin6;
505 psin6 = (struct sockaddr_in6 *)&gsf->gf_slist[i];
506 newpsl->sl_addr[i] = psin6->sin6_addr;
508 err = ip6_mc_add_src(idev, group, gsf->gf_fmode,
509 newpsl->sl_count, newpsl->sl_addr, 0);
511 sock_kfree_s(sk, newpsl, IP6_SFLSIZE(newpsl->sl_max));
516 (void) ip6_mc_add_src(idev, group, gsf->gf_fmode, 0, NULL, 0);
519 write_lock(&pmc->sflock);
522 (void) ip6_mc_del_src(idev, group, pmc->sfmode,
523 psl->sl_count, psl->sl_addr, 0);
524 sock_kfree_s(sk, psl, IP6_SFLSIZE(psl->sl_max));
526 (void) ip6_mc_del_src(idev, group, pmc->sfmode, 0, NULL, 0);
527 pmc->sflist = newpsl;
528 pmc->sfmode = gsf->gf_fmode;
529 write_unlock(&pmc->sflock);
532 read_unlock_bh(&idev->lock);
535 err = ipv6_sock_mc_drop(sk, gsf->gf_interface, group);
/*
 * Copy a socket's source filter for a multicast group out to user space.
 *
 * @gsf is the kernel copy of the request; @optval and @optlen are the user
 * buffers that receive the result.
 *
 * Steps visible in this listing: the group must be multicast; the interface
 * is found with ip6_mc_find_dev_rcu(); the membership on gf_interface is
 * located (err is preset to -EADDRNOTAVAIL; a prior join is required);
 * gf_fmode is set from pmc->sfmode; the number of sources copied is the
 * smaller of the stored count and the caller's gf_numsrc, while gf_numsrc is
 * overwritten with the stored count; the resulting size goes to @optlen with
 * put_user() and the fixed header to @optval with copy_to_user(); each source
 * is then written into optval->gf_slist[i] as a zeroed sockaddr_storage
 * holding an AF_INET6 sockaddr_in6.
 *
 * NOTE(review): the listing has gaps; error returns and the placement of the
 * two read_unlock_bh() calls must be confirmed against the full source.
 */
539 int ip6_mc_msfget(struct sock *sk, struct group_filter *gsf,
540 struct group_filter __user *optval, int __user *optlen)
542 int err, i, count, copycount;
543 const struct in6_addr *group;
544 struct ipv6_mc_socklist *pmc;
545 struct inet6_dev *idev;
546 struct ipv6_pinfo *inet6 = inet6_sk(sk);
547 struct ip6_sf_socklist *psl;
548 struct net *net = sock_net(sk);
550 group = &((struct sockaddr_in6 *)&gsf->gf_group)->sin6_addr;
552 if (!ipv6_addr_is_multicast(group))
556 idev = ip6_mc_find_dev_rcu(net, group, gsf->gf_interface);
563 err = -EADDRNOTAVAIL;
564 /* changes to the ipv6_mc_list require the socket lock and
565 * rtnl lock. We have the socket lock and rcu read lock,
566 * so reading the list is safe.
569 for_each_pmc_rcu(inet6, pmc) {
570 if (pmc->ifindex != gsf->gf_interface)
572 if (ipv6_addr_equal(group, &pmc->addr))
575 if (!pmc) /* must have a prior join */
577 gsf->gf_fmode = pmc->sfmode;
579 count = psl ? psl->sl_count : 0;
580 read_unlock_bh(&idev->lock);
583 copycount = count < gsf->gf_numsrc ? count : gsf->gf_numsrc;
584 gsf->gf_numsrc = count;
585 if (put_user(GROUP_FILTER_SIZE(copycount), optlen) ||
586 copy_to_user(optval, gsf, GROUP_FILTER_SIZE(0))) {
589 /* changes to psl require the socket lock, and a write lock
590 * on pmc->sflock. We have the socket lock so reading here is safe.
592 for (i = 0; i < copycount; i++) {
593 struct sockaddr_in6 *psin6;
594 struct sockaddr_storage ss;
596 psin6 = (struct sockaddr_in6 *)&ss;
597 memset(&ss, 0, sizeof(ss));
598 psin6->sin6_family = AF_INET6;
599 psin6->sin6_addr = psl->sl_addr[i];
600 if (copy_to_user(&optval->gf_slist[i], &ss, sizeof(ss)))
605 read_unlock_bh(&idev->lock);
/*
 * Decide whether socket @sk should accept traffic for multicast group
 * @mc_addr sent from @src_addr, based on the socket's membership and source
 * filter.
 *
 * Visible steps: the socket's membership list is searched for @mc_addr; under
 * read_lock(&mc->sflock) the result is "mode is EXCLUDE" in one branch
 * (presumably when there is no source list), otherwise the source list is
 * searched for @src_addr and the outcome is tested for both cases: an INCLUDE
 * filter where the source was not found, and an EXCLUDE filter where it was.
 *
 * NOTE(review): the assignments made in those two cases and the result when
 * no membership matches are not visible in this listing.
 */
610 bool inet6_mc_check(struct sock *sk, const struct in6_addr *mc_addr,
611 const struct in6_addr *src_addr)
613 struct ipv6_pinfo *np = inet6_sk(sk);
614 struct ipv6_mc_socklist *mc;
615 struct ip6_sf_socklist *psl;
619 for_each_pmc_rcu(np, mc) {
620 if (ipv6_addr_equal(&mc->addr, mc_addr))
627 read_lock(&mc->sflock);
630 rv = mc->sfmode == MCAST_EXCLUDE;
634 for (i = 0; i < psl->sl_count; i++) {
635 if (ipv6_addr_equal(&psl->sl_addr[i], src_addr))
638 if (mc->sfmode == MCAST_INCLUDE && i >= psl->sl_count)
640 if (mc->sfmode == MCAST_EXCLUDE && i < psl->sl_count)
643 read_unlock(&mc->sflock);
/*
 * Activate a newly added interface multicast address @mc.
 *
 * Addresses whose multicast scope is below link-local are tested first
 * (presumably skipped).  Under mc->mca_lock, if MAF_LOADED is not yet set it
 * is set and the link-layer address produced by ndisc_mc_map() is added to
 * the device with dev_mc_add().  Reporting is then gated on the device being
 * IFF_UP and MAF_NOREPORT being clear.  In MLDv1 mode igmp6_join_group() is
 * called; the remaining lines set mca_crcount to the interface's mc_qrv and
 * raise mld_ifc_event().
 *
 * NOTE(review): early-return statements are not visible in this listing.
 */
649 static void igmp6_group_added(struct ifmcaddr6 *mc)
651 struct net_device *dev = mc->idev->dev;
652 char buf[MAX_ADDR_LEN];
654 if (IPV6_ADDR_MC_SCOPE(&mc->mca_addr) <
655 IPV6_ADDR_SCOPE_LINKLOCAL)
658 spin_lock_bh(&mc->mca_lock);
659 if (!(mc->mca_flags&MAF_LOADED)) {
660 mc->mca_flags |= MAF_LOADED;
661 if (ndisc_mc_map(&mc->mca_addr, buf, dev, 0) == 0)
662 dev_mc_add(dev, buf);
664 spin_unlock_bh(&mc->mca_lock);
666 if (!(dev->flags & IFF_UP) || (mc->mca_flags & MAF_NOREPORT))
669 if (mld_in_v1_mode(mc->idev)) {
670 igmp6_join_group(mc);
675 mc->mca_crcount = mc->idev->mc_qrv;
676 mld_ifc_event(mc->idev);
/*
 * Deactivate interface multicast address @mc.
 *
 * Addresses whose multicast scope is below link-local are tested first
 * (presumably skipped).  Under mc->mca_lock, if MAF_LOADED is set it is
 * cleared and the mapped link-layer address is removed with dev_mc_del().
 * MAF_NOREPORT is then tested, igmp6_leave_group() is called, and finally,
 * under the lock again, a pending mca_timer is deleted and the reference
 * counted in mca_refcnt for it is dropped.
 *
 * NOTE(review): early returns and the condition guarding igmp6_leave_group()
 * are not visible in this listing.
 */
679 static void igmp6_group_dropped(struct ifmcaddr6 *mc)
681 struct net_device *dev = mc->idev->dev;
682 char buf[MAX_ADDR_LEN];
684 if (IPV6_ADDR_MC_SCOPE(&mc->mca_addr) <
685 IPV6_ADDR_SCOPE_LINKLOCAL)
688 spin_lock_bh(&mc->mca_lock);
689 if (mc->mca_flags&MAF_LOADED) {
690 mc->mca_flags &= ~MAF_LOADED;
691 if (ndisc_mc_map(&mc->mca_addr, buf, dev, 0) == 0)
692 dev_mc_del(dev, buf);
695 spin_unlock_bh(&mc->mca_lock);
696 if (mc->mca_flags & MAF_NOREPORT)
700 igmp6_leave_group(mc);
702 spin_lock_bh(&mc->mca_lock);
703 if (del_timer(&mc->mca_timer))
704 refcount_dec(&mc->mca_refcnt);
705 spin_unlock_bh(&mc->mca_lock);
709 * deleted ifmcaddr6 manipulation
/*
 * Create a "deleted record" for @im and push it on idev->mc_tomb.
 *
 * A zeroed ifmcaddr6 is allocated with GFP_ATOMIC.  Under im->mca_lock the
 * idev, address and filter mode are copied from @im, and mca_crcount is set
 * to idev->mc_qrv.  For an INCLUDE-mode group the source and tomb lists are
 * moved from @im to the record (the pointers in @im are set to NULL) and each
 * source's sf_crcount is set to the record's mca_crcount.  The record is then
 * linked in front of idev->mc_tomb under idev->mc_lock.
 *
 * NOTE(review): the allocation-failure check, the statement at embedded line
 * 728 and the store to idev->mc_tomb are not visible in this listing.
 */
711 static void mld_add_delrec(struct inet6_dev *idev, struct ifmcaddr6 *im)
713 struct ifmcaddr6 *pmc;
715 /* this is an "ifmcaddr6" for convenience; only the fields below
716 * are actually used. In particular, the refcnt and users are not
717 * used for management of the delete list. Using the same structure
718 * for deleted items allows change reports to use common code with
719 * non-deleted or query-response MCA's.
721 pmc = kzalloc(sizeof(*pmc), GFP_ATOMIC);
725 spin_lock_bh(&im->mca_lock);
726 spin_lock_init(&pmc->mca_lock);
727 pmc->idev = im->idev;
729 pmc->mca_addr = im->mca_addr;
730 pmc->mca_crcount = idev->mc_qrv;
731 pmc->mca_sfmode = im->mca_sfmode;
732 if (pmc->mca_sfmode == MCAST_INCLUDE) {
733 struct ip6_sf_list *psf;
735 pmc->mca_tomb = im->mca_tomb;
736 pmc->mca_sources = im->mca_sources;
737 im->mca_tomb = im->mca_sources = NULL;
738 for (psf = pmc->mca_sources; psf; psf = psf->sf_next)
739 psf->sf_crcount = pmc->mca_crcount;
741 spin_unlock_bh(&im->mca_lock);
743 spin_lock_bh(&idev->mc_lock);
744 pmc->next = idev->mc_tomb;
746 spin_unlock_bh(&idev->mc_lock);
/*
 * Remove the deleted record for @im's address from idev->mc_tomb, if any, and
 * restore its state into @im.
 *
 * Under idev->mc_lock the tomb list is searched for a record whose address
 * equals im->mca_addr, and that record is unlinked (either via the previous
 * record or by updating the list head).  Under im->mca_lock the idev and
 * filter mode are copied back and mca_crcount is set to idev->mc_qrv; for an
 * INCLUDE-mode record the tomb and source lists are handed back to @im and
 * each source's sf_crcount is reset.  The record's idev reference is dropped
 * with in6_dev_put().
 *
 * NOTE(review): the "record found" conditions and the freeing of the record
 * itself are not visible in this listing.
 */
749 static void mld_del_delrec(struct inet6_dev *idev, struct ifmcaddr6 *im)
751 struct ifmcaddr6 *pmc, *pmc_prev;
752 struct ip6_sf_list *psf;
753 struct in6_addr *pmca = &im->mca_addr;
755 spin_lock_bh(&idev->mc_lock);
757 for (pmc = idev->mc_tomb; pmc; pmc = pmc->next) {
758 if (ipv6_addr_equal(&pmc->mca_addr, pmca))
764 pmc_prev->next = pmc->next;
766 idev->mc_tomb = pmc->next;
768 spin_unlock_bh(&idev->mc_lock);
770 spin_lock_bh(&im->mca_lock);
772 im->idev = pmc->idev;
773 im->mca_crcount = idev->mc_qrv;
774 im->mca_sfmode = pmc->mca_sfmode;
775 if (pmc->mca_sfmode == MCAST_INCLUDE) {
776 im->mca_tomb = pmc->mca_tomb;
777 im->mca_sources = pmc->mca_sources;
778 for (psf = im->mca_sources; psf; psf = psf->sf_next)
779 psf->sf_crcount = im->mca_crcount;
781 in6_dev_put(pmc->idev);
784 spin_unlock_bh(&im->mca_lock);
/*
 * Discard all deleted records of @idev.
 *
 * idev->mc_tomb is reset to NULL under idev->mc_lock, and the records are
 * then processed outside that lock: ip6_mc_clear_src() and in6_dev_put() are
 * called for each.  Afterwards, with idev->lock read-held, every live group
 * on idev->mc_list has its mca_tomb reset to NULL under mca_lock and the
 * sources that were on it are walked.
 *
 * NOTE(review): the statements that capture the detached list heads and that
 * free the records and sources are not visible in this listing.
 */
787 static void mld_clear_delrec(struct inet6_dev *idev)
789 struct ifmcaddr6 *pmc, *nextpmc;
791 spin_lock_bh(&idev->mc_lock);
793 idev->mc_tomb = NULL;
794 spin_unlock_bh(&idev->mc_lock);
796 for (; pmc; pmc = nextpmc) {
798 ip6_mc_clear_src(pmc);
799 in6_dev_put(pmc->idev);
803 /* clear dead sources, too */
804 read_lock_bh(&idev->lock);
805 for (pmc = idev->mc_list; pmc; pmc = pmc->next) {
806 struct ip6_sf_list *psf, *psf_next;
808 spin_lock_bh(&pmc->mca_lock);
810 pmc->mca_tomb = NULL;
811 spin_unlock_bh(&pmc->mca_lock);
812 for (; psf; psf = psf_next) {
813 psf_next = psf->sf_next;
817 read_unlock_bh(&idev->lock);
/* Take one reference on @mc by incrementing mc->mca_refcnt. */
820 static void mca_get(struct ifmcaddr6 *mc)
822 refcount_inc(&mc->mca_refcnt);
/*
 * Drop one reference on @mc.  When mca_refcnt reaches zero the reference on
 * mc->idev is released with in6_dev_put().
 * NOTE(review): any freeing of @mc itself is not visible in this listing.
 */
825 static void ma_put(struct ifmcaddr6 *mc)
827 if (refcount_dec_and_test(&mc->mca_refcnt)) {
828 in6_dev_put(mc->idev);
/*
 * Allocate and initialise an ifmcaddr6 for @addr on @idev.
 *
 * The structure is zero-allocated with GFP_ATOMIC.  Its timer is bound to
 * igmp6_timer_handler(); the address and idev are stored (the idev reference
 * is the caller's, per the comment below); both timestamps are set to
 * jiffies; the refcount starts at 1; and the filter starts as (EXCLUDE,
 * empty) with mca_sfcount[MCAST_EXCLUDE] = 1.  MAF_NOREPORT is set for the
 * link-local all-nodes address and for scopes below link-local.
 *
 * NOTE(review): the allocation-failure check and the return statement are not
 * visible in this listing.
 */
833 static struct ifmcaddr6 *mca_alloc(struct inet6_dev *idev,
834 const struct in6_addr *addr)
836 struct ifmcaddr6 *mc;
838 mc = kzalloc(sizeof(*mc), GFP_ATOMIC);
842 timer_setup(&mc->mca_timer, igmp6_timer_handler, 0);
844 mc->mca_addr = *addr;
845 mc->idev = idev; /* reference taken by caller */
847 /* mca_stamp should be updated upon changes */
848 mc->mca_cstamp = mc->mca_tstamp = jiffies;
849 refcount_set(&mc->mca_refcnt, 1);
850 spin_lock_init(&mc->mca_lock);
852 /* initial mode is (EX, empty) */
853 mc->mca_sfmode = MCAST_EXCLUDE;
854 mc->mca_sfcount[MCAST_EXCLUDE] = 1;
856 if (ipv6_addr_is_ll_all_nodes(&mc->mca_addr) ||
857 IPV6_ADDR_MC_SCOPE(&mc->mca_addr) < IPV6_ADDR_SCOPE_LINKLOCAL)
858 mc->mca_flags |= MAF_NOREPORT;
864 * device multicast group inc (add if not found)
/*
 * Add device @dev to multicast group @addr, creating the group entry if it
 * does not exist yet.
 *
 * A reference on the device's inet6_dev is taken with in6_dev_get().  With
 * idev->lock write-held the existing mc_list is searched: for a match the
 * lock is dropped and ip6_mc_add_src() is called in MCAST_EXCLUDE mode with a
 * source count of 0.  Otherwise a new entry comes from mca_alloc(), is linked
 * at the head of idev->mc_list, the lock is released, and mld_del_delrec()
 * followed by igmp6_group_added() are called for it.
 *
 * NOTE(review): the listing has gaps; error paths, the user-count update, the
 * reference taken "for the code below" and the return values are not visible.
 */
866 int ipv6_dev_mc_inc(struct net_device *dev, const struct in6_addr *addr)
868 struct ifmcaddr6 *mc;
869 struct inet6_dev *idev;
873 /* we need to take a reference on idev */
874 idev = in6_dev_get(dev);
879 write_lock_bh(&idev->lock);
881 write_unlock_bh(&idev->lock);
886 for (mc = idev->mc_list; mc; mc = mc->next) {
887 if (ipv6_addr_equal(&mc->mca_addr, addr)) {
889 write_unlock_bh(&idev->lock);
890 ip6_mc_add_src(idev, &mc->mca_addr, MCAST_EXCLUDE, 0,
897 mc = mca_alloc(idev, addr);
899 write_unlock_bh(&idev->lock);
904 mc->next = idev->mc_list;
907 /* Hold this for the code below before we unlock,
908 * it is already exposed via idev->mc_list.
911 write_unlock_bh(&idev->lock);
913 mld_del_delrec(idev, mc);
914 igmp6_group_added(mc);
920 * device multicast group del
/*
 * Drop one user of multicast group @addr on @idev.
 *
 * With idev->lock write-held, mc_list is walked through a pointer-to-link.
 * For the matching entry mca_users is decremented; when it reaches zero the
 * lock is released and igmp6_group_dropped() and ip6_mc_clear_src() are
 * called for the entry.  The other two unlock sites are presumably the
 * "still has users" and "not found" exits.
 *
 * NOTE(review): the unlink statement, the final put and the return values are
 * not visible in this listing.
 */
922 int __ipv6_dev_mc_dec(struct inet6_dev *idev, const struct in6_addr *addr)
924 struct ifmcaddr6 *ma, **map;
928 write_lock_bh(&idev->lock);
929 for (map = &idev->mc_list; (ma = *map) != NULL; map = &ma->next) {
930 if (ipv6_addr_equal(&ma->mca_addr, addr)) {
931 if (--ma->mca_users == 0) {
933 write_unlock_bh(&idev->lock);
935 igmp6_group_dropped(ma);
936 ip6_mc_clear_src(ma);
941 write_unlock_bh(&idev->lock);
945 write_unlock_bh(&idev->lock);
/*
 * Device-level wrapper: obtains the inet6_dev of @dev with __in6_dev_get()
 * and forwards to __ipv6_dev_mc_dec(idev, addr).
 * NOTE(review): the missing-idev handling and the return statement are not
 * visible in this listing.
 */
950 int ipv6_dev_mc_dec(struct net_device *dev, const struct in6_addr *addr)
952 struct inet6_dev *idev;
957 idev = __in6_dev_get(dev);
961 err = __ipv6_dev_mc_dec(idev, addr);
967 * check if the interface/address pair is valid
/*
 * Check whether device @dev is a member of multicast group @group and, when
 * @src_addr is a specific (non-any) address, whether that source passes the
 * group's interface-level filter.
 *
 * With idev->lock read-held, mc_list is searched for @group.  For a specific
 * source, the group's source list is searched under mca_lock: if a source
 * entry is found, the result is true when it has INCLUDE users or when its
 * EXCLUDE count differs from the group's EXCLUDE count; otherwise the result
 * is whether the group has any EXCLUDE users.  With no source, or the
 * unspecified address, the result is true.
 *
 * NOTE(review): the branch conditions selecting between these results and the
 * return statement are not visible in this listing.
 */
969 bool ipv6_chk_mcast_addr(struct net_device *dev, const struct in6_addr *group,
970 const struct in6_addr *src_addr)
972 struct inet6_dev *idev;
973 struct ifmcaddr6 *mc;
977 idev = __in6_dev_get(dev);
979 read_lock_bh(&idev->lock);
980 for (mc = idev->mc_list; mc; mc = mc->next) {
981 if (ipv6_addr_equal(&mc->mca_addr, group))
985 if (src_addr && !ipv6_addr_any(src_addr)) {
986 struct ip6_sf_list *psf;
988 spin_lock_bh(&mc->mca_lock);
989 for (psf = mc->mca_sources; psf; psf = psf->sf_next) {
990 if (ipv6_addr_equal(&psf->sf_addr, src_addr))
994 rv = psf->sf_count[MCAST_INCLUDE] ||
995 psf->sf_count[MCAST_EXCLUDE] !=
996 mc->mca_sfcount[MCAST_EXCLUDE];
998 rv = mc->mca_sfcount[MCAST_EXCLUDE] != 0;
999 spin_unlock_bh(&mc->mca_lock);
1001 rv = true; /* don't filter unspecified source */
1003 read_unlock_bh(&idev->lock);
/*
 * Arm the general-query timer of @idev at jiffies + (random value below
 * idev->mc_maxdelay) + 2, and mark mc_gq_running.
 * NOTE(review): the statement guarded by !mod_timer(...) is not visible in
 * this listing.
 */
1009 static void mld_gq_start_timer(struct inet6_dev *idev)
1011 unsigned long tv = prandom_u32() % idev->mc_maxdelay;
1013 idev->mc_gq_running = 1;
1014 if (!mod_timer(&idev->mc_gq_timer, jiffies+tv+2))
/*
 * Clear mc_gq_running and delete the general-query timer; if del_timer()
 * reports that it removed a timer, drop an idev reference with
 * __in6_dev_put().
 */
1018 static void mld_gq_stop_timer(struct inet6_dev *idev)
1020 idev->mc_gq_running = 0;
1021 if (del_timer(&idev->mc_gq_timer))
1022 __in6_dev_put(idev);
/*
 * Arm the interface-change timer of @idev at jiffies + (random value below
 * @delay) + 2.  @delay is used as a modulus, so it must be non-zero.
 * NOTE(review): the statement guarded by !mod_timer(...) is not visible in
 * this listing.
 */
1025 static void mld_ifc_start_timer(struct inet6_dev *idev, unsigned long delay)
1027 unsigned long tv = prandom_u32() % delay;
1029 if (!mod_timer(&idev->mc_ifc_timer, jiffies+tv+2))
/*
 * Reset mc_ifc_count to 0 and delete the interface-change timer; if
 * del_timer() reports that it removed a timer, drop an idev reference with
 * __in6_dev_put().
 */
1033 static void mld_ifc_stop_timer(struct inet6_dev *idev)
1035 idev->mc_ifc_count = 0;
1036 if (del_timer(&idev->mc_ifc_timer))
1037 __in6_dev_put(idev);
/*
 * Arm idev->mc_dad_timer at jiffies + (random value below @delay) + 2.
 * @delay is used as a modulus, so it must be non-zero.
 * NOTE(review): the statement guarded by !mod_timer(...) is not visible in
 * this listing.
 */
1040 static void mld_dad_start_timer(struct inet6_dev *idev, unsigned long delay)
1042 unsigned long tv = prandom_u32() % delay;
1044 if (!mod_timer(&idev->mc_dad_timer, jiffies+tv+2))
/*
 * Delete idev->mc_dad_timer; if del_timer() reports that it removed a timer,
 * drop an idev reference with __in6_dev_put().
 */
1048 static void mld_dad_stop_timer(struct inet6_dev *idev)
1050 if (del_timer(&idev->mc_dad_timer))
1051 __in6_dev_put(idev);
1055 * IGMP handling (alias multicast ICMPv6 messages)
/*
 * Schedule a report for group @ma in response to a query with maximum
 * response time @resptime (in jiffies).
 *
 * The link-local all-nodes address and scopes below link-local are tested
 * first (per the comment, no timer is started for them).  If a timer was
 * already pending it is removed, its reference dropped, and the remaining
 * time becomes the candidate delay.  A candidate that is not shorter than
 * @resptime is replaced by a random value below @resptime.  The timer is then
 * re-armed, a reference is taken when mod_timer() returns 0, and
 * MAF_TIMER_RUNNING is set.
 *
 * Callers in this file hold ma->mca_lock around the call.
 */
1058 static void igmp6_group_queried(struct ifmcaddr6 *ma, unsigned long resptime)
1060 unsigned long delay = resptime;
1062 /* Do not start timer for these addresses */
1063 if (ipv6_addr_is_ll_all_nodes(&ma->mca_addr) ||
1064 IPV6_ADDR_MC_SCOPE(&ma->mca_addr) < IPV6_ADDR_SCOPE_LINKLOCAL)
1067 if (del_timer(&ma->mca_timer)) {
1068 refcount_dec(&ma->mca_refcnt);
1069 delay = ma->mca_timer.expires - jiffies;
1072 if (delay >= resptime)
1073 delay = prandom_u32() % resptime;
1075 ma->mca_timer.expires = jiffies + delay;
1076 if (!mod_timer(&ma->mca_timer, jiffies + delay))
1077 refcount_inc(&ma->mca_refcnt);
1078 ma->mca_flags |= MAF_TIMER_RUNNING;
/*
 * EXCLUDE-mode variant of source marking for a group-and-source query that
 * lists @nsrcs addresses in @srcs.
 *
 * Each source of @pmc is compared against the queried addresses until scount
 * reaches @nsrcs.  Sources that have INCLUDE users, or whose EXCLUDE count
 * differs from the group's, are treated as inactive filters.  MAF_GSQUERY is
 * cleared afterwards, and "scount == nsrcs" is commented as meaning that all
 * queried sources are excluded.
 *
 * NOTE(review): the statements inside the inner loop and the return values
 * are not visible in this listing.
 */
1081 /* mark EXCLUDE-mode sources */
1082 static bool mld_xmarksources(struct ifmcaddr6 *pmc, int nsrcs,
1083 const struct in6_addr *srcs)
1085 struct ip6_sf_list *psf;
1089 for (psf = pmc->mca_sources; psf; psf = psf->sf_next) {
1090 if (scount == nsrcs)
1092 for (i = 0; i < nsrcs; i++) {
1093 /* skip inactive filters */
1094 if (psf->sf_count[MCAST_INCLUDE] ||
1095 pmc->mca_sfcount[MCAST_EXCLUDE] !=
1096 psf->sf_count[MCAST_EXCLUDE])
1098 if (ipv6_addr_equal(&srcs[i], &psf->sf_addr)) {
1104 pmc->mca_flags &= ~MAF_GSQUERY;
1105 if (scount == nsrcs) /* all sources excluded */
/*
 * Mark the sources of @pmc that appear in a group-and-source query listing
 * @nsrcs addresses in @srcs.
 *
 * EXCLUDE-mode groups are delegated to mld_xmarksources().  For INCLUDE mode
 * each source of @pmc is compared against the queried addresses until scount
 * reaches @nsrcs.  MAF_GSQUERY is cleared in one outcome and set in the
 * other.
 *
 * NOTE(review): the per-match statements, the condition choosing between the
 * two MAF_GSQUERY updates and the return values are not visible here.
 */
1110 static bool mld_marksources(struct ifmcaddr6 *pmc, int nsrcs,
1111 const struct in6_addr *srcs)
1113 struct ip6_sf_list *psf;
1116 if (pmc->mca_sfmode == MCAST_EXCLUDE)
1117 return mld_xmarksources(pmc, nsrcs, srcs);
1119 /* mark INCLUDE-mode sources */
1122 for (psf = pmc->mca_sources; psf; psf = psf->sf_next) {
1123 if (scount == nsrcs)
1125 for (i = 0; i < nsrcs; i++) {
1126 if (ipv6_addr_equal(&srcs[i], &psf->sf_addr)) {
1134 pmc->mca_flags &= ~MAF_GSQUERY;
1137 pmc->mca_flags |= MAF_GSQUERY;
/*
 * Return the administratively forced MLD version for @idev: the
 * namespace-wide devconf_all->force_mld_version when that is non-zero,
 * otherwise the per-device idev->cnf.force_mld_version.
 */
1141 static int mld_force_mld_version(const struct inet6_dev *idev)
1143 /* Normally, both are 0 here. If enforcement to a particular is
1144 * being used, individual device enforcement will have a lower
1145 * precedence over 'all' device (.../conf/all/force_mld_version).
1148 if (dev_net(idev->dev)->ipv6.devconf_all->force_mld_version != 0)
1149 return dev_net(idev->dev)->ipv6.devconf_all->force_mld_version;
1151 return idev->cnf.force_mld_version;
/* True when the forced MLD version for @idev is 2. */
1154 static bool mld_in_v2_mode_only(const struct inet6_dev *idev)
1156 return mld_force_mld_version(idev) == 2;
/* True when the forced MLD version for @idev is 1. */
1159 static bool mld_in_v1_mode_only(const struct inet6_dev *idev)
1161 return mld_force_mld_version(idev) == 1;
/*
 * Decide whether @idev currently operates in MLDv1 mode.  The forced-version
 * helpers are consulted first (v2-only, then v1-only), followed by the
 * mc_v1_seen deadline: non-zero and still in the future per time_before().
 * NOTE(review): the return statement for each test is not visible in this
 * listing.
 */
1164 static bool mld_in_v1_mode(const struct inet6_dev *idev)
1166 if (mld_in_v2_mode_only(idev))
1168 if (mld_in_v1_mode_only(idev))
1170 if (idev->mc_v1_seen && time_before(jiffies, idev->mc_v1_seen))
/*
 * Record that an MLDv1 querier was seen: set idev->mc_v1_seen to
 * jiffies + (mc_qrv * mc_qi + mc_qri), the deadline that mld_in_v1_mode()
 * compares against.
 */
1176 static void mld_set_v1_mode(struct inet6_dev *idev)
1178 /* RFC3810, relevant sections:
1179 * - 9.1. Robustness Variable
1180 * - 9.2. Query Interval
1181 * - 9.3. Query Response Interval
1182 * - 9.12. Older Version Querier Present Timeout
1184 unsigned long switchback;
1186 switchback = (idev->mc_qrv * idev->mc_qi) + idev->mc_qri;
1188 idev->mc_v1_seen = jiffies + switchback;
/*
 * Update idev->mc_qrv from the QRV field of an MLDv2 query.
 *
 * A non-zero mld2q_qrv replaces the current value.  The result is then raised
 * to min(MLD_QRV_DEFAULT, sysctl_mld_qrv) if it is below that floor, with a
 * rate-limited warning.  WARN_ON() fires if mc_qrv was already 0 on entry.
 */
1191 static void mld_update_qrv(struct inet6_dev *idev,
1192 const struct mld2_query *mlh2)
1194 /* RFC3810, relevant sections:
1195 * - 5.1.8. QRV (Querier's Robustness Variable)
1196 * - 9.1. Robustness Variable
1199 /* The value of the Robustness Variable MUST NOT be zero,
1200 * and SHOULD NOT be one. Catch this here if we ever run
1201 * into such a case in future.
1203 const int min_qrv = min(MLD_QRV_DEFAULT, sysctl_mld_qrv);
1204 WARN_ON(idev->mc_qrv == 0);
1206 if (mlh2->mld2q_qrv > 0)
1207 idev->mc_qrv = mlh2->mld2q_qrv;
1209 if (unlikely(idev->mc_qrv < min_qrv)) {
1210 net_warn_ratelimited("IPv6: MLD: clamping QRV from %u to %u!\n",
1211 idev->mc_qrv, min_qrv);
1212 idev->mc_qrv = min_qrv;
/*
 * Update idev->mc_qi from the QQIC field of an MLDv2 query.
 *
 * QQIC values below 128 are taken literally.  The other visible branch
 * extracts the exponent and mantissa with MLDV2_QQIC_EXP()/MLDV2_QQIC_MAN()
 * and computes (mantissa | 0x10) << (exponent + 3).  The result is multiplied
 * by HZ before being stored.
 */
1216 static void mld_update_qi(struct inet6_dev *idev,
1217 const struct mld2_query *mlh2)
1219 /* RFC3810, relevant sections:
1220 * - 5.1.9. QQIC (Querier's Query Interval Code)
1221 * - 9.2. Query Interval
1222 * - 9.12. Older Version Querier Present Timeout
1223 * (the [Query Interval] in the last Query received)
1225 unsigned long mc_qqi;
1227 if (mlh2->mld2q_qqic < 128) {
1228 mc_qqi = mlh2->mld2q_qqic;
1230 unsigned long mc_man, mc_exp;
1232 mc_exp = MLDV2_QQIC_EXP(mlh2->mld2q_qqic);
1233 mc_man = MLDV2_QQIC_MAN(mlh2->mld2q_qqic);
1235 mc_qqi = (mc_man | 0x10) << (mc_exp + 3);
1238 idev->mc_qi = mc_qqi * HZ;
/*
 * Update idev->mc_qri from an MLDv2 query: the value returned by mldv2_mrc()
 * is converted with msecs_to_jiffies() and stored.
 */
1241 static void mld_update_qri(struct inet6_dev *idev,
1242 const struct mld2_query *mlh2)
1244 /* RFC3810, relevant sections:
1245 * - 5.1.3. Maximum Response Code
1246 * - 9.3. Query Response Interval
1248 idev->mc_qri = msecs_to_jiffies(mldv2_mrc(mlh2));
/*
 * Process a query using MLDv1 rules.
 *
 * The query is tested against forced v2-only mode first (per the comment, v1
 * queries are ignored there).  The maximum delay is read from mld_maxdelay in
 * network byte order, capped at MLDV1_MRD_MAX_COMPAT, converted with
 * msecs_to_jiffies() and stored in *@max_delay with a floor of 1 jiffy.
 * mld_set_v1_mode() is called (presumably only when @v1_query is true, per
 * the comment above it).  The general-query and interface-change timers are
 * then stopped and the deleted records cleared.
 *
 * NOTE(review): the return values and the condition on @v1_query are not
 * visible in this listing.
 */
1251 static int mld_process_v1(struct inet6_dev *idev, struct mld_msg *mld,
1252 unsigned long *max_delay, bool v1_query)
1254 unsigned long mldv1_md;
1256 /* Ignore v1 queries */
1257 if (mld_in_v2_mode_only(idev))
1260 mldv1_md = ntohs(mld->mld_maxdelay);
1262 /* When in MLDv1 fallback and a MLDv2 router start-up being
1263 * unaware of current MLDv1 operation, the MRC == MRD mapping
1264 * only works when the exponential algorithm is not being
1265 * used (as MLDv1 is unaware of such things).
1267 * According to the RFC author, the MLDv2 implementations
1268 * he's aware of all use a MRC < 32768 on start up queries.
1270 * Thus, should we *ever* encounter something else larger
1271 * than that, just assume the maximum possible within our
1275 mldv1_md = min(mldv1_md, MLDV1_MRD_MAX_COMPAT);
1277 *max_delay = max(msecs_to_jiffies(mldv1_md), 1UL);
1279 /* MLDv1 router present: we need to go into v1 mode *only*
1280 * when an MLDv1 query is received as per section 9.12. of
1281 * RFC3810! And we know from RFC2710 section 3.7 that MLDv1
1282 * queries MUST be of exactly 24 octets.
1285 mld_set_v1_mode(idev);
1287 /* cancel MLDv2 report timer */
1288 mld_gq_stop_timer(idev);
1289 /* cancel the interface change timer */
1290 mld_ifc_stop_timer(idev);
1291 /* clear deleted report items */
1292 mld_clear_delrec(idev);
/*
 * Process an MLDv2 query header.  *@max_delay is set to the converted Maximum
 * Response Code (msecs_to_jiffies(mldv2_mrc()), floor of 1 jiffy).  The
 * interface's QRV, QI and QRI are refreshed through the mld_update_*()
 * helpers, and idev->mc_maxdelay is set to the same delay.
 * NOTE(review): the return statement is not visible in this listing.
 */
1297 static int mld_process_v2(struct inet6_dev *idev, struct mld2_query *mld,
1298 unsigned long *max_delay)
1300 *max_delay = max(msecs_to_jiffies(mldv2_mrc(mld)), 1UL);
1302 mld_update_qrv(idev, mld);
1303 mld_update_qi(idev, mld);
1304 mld_update_qri(idev, mld);
1306 idev->mc_maxdelay = *max_delay;
/*
 * Handle a received MLD query carried in @skb.
 *
 * Steps visible in this listing:
 *  - pull enough data for the group address and compute the MLD payload
 *    length from the IPv6 payload length and the network header length;
 *  - validate the packet: link-local source, hop limit 1, Router Alert option
 *    present with the MLD value;
 *  - the queried group must be the unspecified address or a multicast one;
 *  - dispatch on length: shorter than MLD_V1_QUERY_LEN is its own branch;
 *    exactly MLD_V1_QUERY_LEN, or any length while in v1 mode, goes to
 *    mld_process_v1(); at least MLD_V2_QUERY_LEN_MIN goes to mld_process_v2()
 *    after pulling the v2 header.  A v2 general query must carry no sources
 *    (-EINVAL) and starts the general-query timer.  For a query with sources,
 *    the source array is pulled and the header pointer reloaded;
 *  - with idev->lock read-held, a general query calls igmp6_group_queried()
 *    for every group on the interface.  A specific query does so only for
 *    the matching group, subject to the MAF_GSQUERY bookkeeping and
 *    mld_marksources().
 *
 * NOTE(review): the listing has gaps (embedded line numbers skip); most
 * return statements and some branch bodies are not visible here.
 */
1311 /* called with rcu_read_lock() */
1312 int igmp6_event_query(struct sk_buff *skb)
1314 struct mld2_query *mlh2 = NULL;
1315 struct ifmcaddr6 *ma;
1316 const struct in6_addr *group;
1317 unsigned long max_delay;
1318 struct inet6_dev *idev;
1319 struct mld_msg *mld;
1324 if (!pskb_may_pull(skb, sizeof(struct in6_addr)))
1327 /* compute payload length excluding extension headers */
1328 len = ntohs(ipv6_hdr(skb)->payload_len) + sizeof(struct ipv6hdr);
1329 len -= skb_network_header_len(skb);
1332 * Upon reception of an MLD message that contains a Query, the node
1333 * checks if the source address of the message is a valid link-local
1334 * address, if the Hop Limit is set to 1, and if the Router Alert
1335 * option is present in the Hop-By-Hop Options header of the IPv6
1336 * packet. If any of these checks fails, the packet is dropped.
1338 if (!(ipv6_addr_type(&ipv6_hdr(skb)->saddr) & IPV6_ADDR_LINKLOCAL) ||
1339 ipv6_hdr(skb)->hop_limit != 1 ||
1340 !(IP6CB(skb)->flags & IP6SKB_ROUTERALERT) ||
1341 IP6CB(skb)->ra != htons(IPV6_OPT_ROUTERALERT_MLD))
1344 idev = __in6_dev_get(skb->dev);
1348 mld = (struct mld_msg *)icmp6_hdr(skb);
1349 group = &mld->mld_mca;
1350 group_type = ipv6_addr_type(group);
1352 if (group_type != IPV6_ADDR_ANY &&
1353 !(group_type&IPV6_ADDR_MULTICAST))
1356 if (len < MLD_V1_QUERY_LEN) {
1358 } else if (len == MLD_V1_QUERY_LEN || mld_in_v1_mode(idev)) {
1359 err = mld_process_v1(idev, mld, &max_delay,
1360 len == MLD_V1_QUERY_LEN);
1363 } else if (len >= MLD_V2_QUERY_LEN_MIN) {
1364 int srcs_offset = sizeof(struct mld2_query) -
1365 sizeof(struct icmp6hdr);
1367 if (!pskb_may_pull(skb, srcs_offset))
1370 mlh2 = (struct mld2_query *)skb_transport_header(skb);
1372 err = mld_process_v2(idev, mlh2, &max_delay);
1376 if (group_type == IPV6_ADDR_ANY) { /* general query */
1377 if (mlh2->mld2q_nsrcs)
1378 return -EINVAL; /* no sources allowed */
1380 mld_gq_start_timer(idev);
1383 /* mark sources to include, if group & source-specific */
1384 if (mlh2->mld2q_nsrcs != 0) {
1385 if (!pskb_may_pull(skb, srcs_offset +
1386 ntohs(mlh2->mld2q_nsrcs) * sizeof(struct in6_addr)))
1389 mlh2 = (struct mld2_query *)skb_transport_header(skb);
1396 read_lock_bh(&idev->lock);
1397 if (group_type == IPV6_ADDR_ANY) {
1398 for (ma = idev->mc_list; ma; ma = ma->next) {
1399 spin_lock_bh(&ma->mca_lock);
1400 igmp6_group_queried(ma, max_delay);
1401 spin_unlock_bh(&ma->mca_lock);
1404 for (ma = idev->mc_list; ma; ma = ma->next) {
1405 if (!ipv6_addr_equal(group, &ma->mca_addr))
1407 spin_lock_bh(&ma->mca_lock);
1408 if (ma->mca_flags & MAF_TIMER_RUNNING) {
1409 /* gsquery <- gsquery && mark */
1411 ma->mca_flags &= ~MAF_GSQUERY;
1413 /* gsquery <- mark */
1415 ma->mca_flags |= MAF_GSQUERY;
1417 ma->mca_flags &= ~MAF_GSQUERY;
1419 if (!(ma->mca_flags & MAF_GSQUERY) ||
1420 mld_marksources(ma, ntohs(mlh2->mld2q_nsrcs), mlh2->mld2q_srcs))
1421 igmp6_group_queried(ma, max_delay);
1422 spin_unlock_bh(&ma->mca_lock);
1426 read_unlock_bh(&idev->lock);
/*
 * Handle an MLD report received in @skb.
 *
 * Packets of type PACKET_LOOPBACK (our own report looped back), and packets
 * that are neither multicast nor broadcast, are tested first.  After pulling
 * the MLD message, the source address must be either unspecified or
 * link-local.  With idev->lock read-held, the group named in the report is
 * looked up on the receiving interface.  For a match, under mca_lock, any
 * pending mca_timer is deleted (dropping its reference) and
 * MAF_LAST_REPORTER and MAF_TIMER_RUNNING are cleared.
 *
 * NOTE(review): return statements are not visible in this listing.
 */
1431 /* called with rcu_read_lock() */
1432 int igmp6_event_report(struct sk_buff *skb)
1434 struct ifmcaddr6 *ma;
1435 struct inet6_dev *idev;
1436 struct mld_msg *mld;
1439 /* Our own report looped back. Ignore it. */
1440 if (skb->pkt_type == PACKET_LOOPBACK)
1443 /* send our report if the MC router may not have heard this report */
1444 if (skb->pkt_type != PACKET_MULTICAST &&
1445 skb->pkt_type != PACKET_BROADCAST)
1448 if (!pskb_may_pull(skb, sizeof(*mld) - sizeof(struct icmp6hdr)))
1451 mld = (struct mld_msg *)icmp6_hdr(skb);
1453 /* Drop reports with not link local source */
1454 addr_type = ipv6_addr_type(&ipv6_hdr(skb)->saddr);
1455 if (addr_type != IPV6_ADDR_ANY &&
1456 !(addr_type&IPV6_ADDR_LINKLOCAL))
1459 idev = __in6_dev_get(skb->dev);
1464 * Cancel the timer for this group
1467 read_lock_bh(&idev->lock);
1468 for (ma = idev->mc_list; ma; ma = ma->next) {
1469 if (ipv6_addr_equal(&ma->mca_addr, &mld->mld_mca)) {
1470 spin_lock(&ma->mca_lock);
1471 if (del_timer(&ma->mca_timer))
1472 refcount_dec(&ma->mca_refcnt);
1473 ma->mca_flags &= ~(MAF_LAST_REPORTER|MAF_TIMER_RUNNING);
1474 spin_unlock(&ma->mca_lock);
1478 read_unlock_bh(&idev->lock);
/*
 * is_in - decide whether source record @psf belongs in a group record of
 * MLDv2 record type @type for group @pmc.
 *
 * @gdeleted and @sdeleted say whether the group, respectively the source,
 * is being reported from a "deleted" list.  The visible cases are:
 *   MODE_IS_INCLUDE/EXCLUDE  - depends on MAF_GSQUERY / sf_gsresp, the
 *                              group filter mode and the per-mode counts;
 *   CHANGE_TO_INCLUDE        - source has a non-zero INCLUDE count;
 *   CHANGE_TO_EXCLUDE        - source is excluded by every EXCLUDE user
 *                              (its EXCLUDE count equals the group's);
 *   ALLOW_NEW_SOURCES        - (mca_sfmode == MCAST_INCLUDE) ^ sdeleted;
 *   BLOCK_OLD_SOURCES        - depends on mca_sfmode, sf_crcount and the
 *                              deleted flags.
 *
 * NOTE(review): the switch statement and the bare "return false/true"
 * lines are not visible in this listing.
 */
1482 static bool is_in(struct ifmcaddr6 *pmc, struct ip6_sf_list *psf, int type,
1483 int gdeleted, int sdeleted)
1486 case MLD2_MODE_IS_INCLUDE:
1487 case MLD2_MODE_IS_EXCLUDE:
1488 if (gdeleted || sdeleted)
1490 if (!((pmc->mca_flags & MAF_GSQUERY) && !psf->sf_gsresp)) {
1491 if (pmc->mca_sfmode == MCAST_INCLUDE)
1493 /* don't include if this source is excluded
1496 if (psf->sf_count[MCAST_INCLUDE])
1497 return type == MLD2_MODE_IS_INCLUDE;
1498 return pmc->mca_sfcount[MCAST_EXCLUDE] ==
1499 psf->sf_count[MCAST_EXCLUDE];
1502 case MLD2_CHANGE_TO_INCLUDE:
1503 if (gdeleted || sdeleted)
1505 return psf->sf_count[MCAST_INCLUDE] != 0;
1506 case MLD2_CHANGE_TO_EXCLUDE:
1507 if (gdeleted || sdeleted)
1509 if (pmc->mca_sfcount[MCAST_EXCLUDE] == 0 ||
1510 psf->sf_count[MCAST_INCLUDE])
1512 return pmc->mca_sfcount[MCAST_EXCLUDE] ==
1513 psf->sf_count[MCAST_EXCLUDE];
1514 case MLD2_ALLOW_NEW_SOURCES:
1515 if (gdeleted || !psf->sf_crcount)
1517 return (pmc->mca_sfmode == MCAST_INCLUDE) ^ sdeleted;
1518 case MLD2_BLOCK_OLD_SOURCES:
1519 if (pmc->mca_sfmode == MCAST_INCLUDE)
1520 return gdeleted || (psf->sf_crcount && sdeleted);
1521 return psf->sf_crcount && !gdeleted && !sdeleted;
/*
 * mld_scount - walk pmc->mca_sources and test every entry with is_in()
 * for the given record type and deleted flags.
 *
 * NOTE(review): the counter and return statement are not visible in this
 * listing; presumably the number of accepted sources is returned, since
 * grec_size() multiplies the result by the per-source size.
 */
1527 mld_scount(struct ifmcaddr6 *pmc, int type, int gdeleted, int sdeleted)
1529 struct ip6_sf_list *psf;
1532 for (psf = pmc->mca_sources; psf; psf = psf->sf_next) {
1533 if (!is_in(pmc, psf, type, gdeleted, sdeleted))
/*
 * ip6_mc_hdr - append and fill the IPv6 header of an outgoing MLD packet.
 *
 * Marks the skb as ETH_P_IPV6, resets the network header to the current
 * data position, reserves room for one struct ipv6hdr and fills it:
 * ip6_flow_hdr(hdr, 0, 0), payload length @len, next header @proto, hop
 * limit taken from the socket @sk, and the given source / destination
 * addresses.
 *
 * NOTE(review): the parameter line declaring proto and len is not
 * visible in this listing.
 */
1540 static void ip6_mc_hdr(struct sock *sk, struct sk_buff *skb,
1541 struct net_device *dev,
1542 const struct in6_addr *saddr,
1543 const struct in6_addr *daddr,
1546 struct ipv6hdr *hdr;
1548 skb->protocol = htons(ETH_P_IPV6);
1551 skb_reset_network_header(skb);
1552 skb_put(skb, sizeof(struct ipv6hdr));
1553 hdr = ipv6_hdr(skb);
1555 ip6_flow_hdr(hdr, 0, 0);
1557 hdr->payload_len = htons(len);
1558 hdr->nexthdr = proto;
1559 hdr->hop_limit = inet6_sk(sk)->hop_limit;
1561 hdr->saddr = *saddr;
1562 hdr->daddr = *daddr;
/*
 * mld_newpack - allocate and initialise an skb for an MLDv2 report.
 *
 * The buffer is sized mtu + link-layer headroom + device tailroom, capped
 * at SKB_MAX_ORDER(0, 0), and allocated from the per-namespace igmp_sk
 * socket.  The packet gets TC_PRIO_CONTROL priority, an IPv6 header
 * addressed to mld2_all_mcr with a hop-by-hop next header, the 8-byte
 * router-alert option block "ra", and an MLDv2 report header of type
 * ICMPV6_MLD2_REPORT whose reserved fields, checksum and record count
 * start at zero.  When __ipv6_get_lladdr() fails the unspecified address
 * is used as source.
 *
 * NOTE(review): allocation-failure handling and the return statement are
 * not visible in this listing.
 */
1565 static struct sk_buff *mld_newpack(struct inet6_dev *idev, unsigned int mtu)
1567 struct net_device *dev = idev->dev;
1568 struct net *net = dev_net(dev);
1569 struct sock *sk = net->ipv6.igmp_sk;
1570 struct sk_buff *skb;
1571 struct mld2_report *pmr;
1572 struct in6_addr addr_buf;
1573 const struct in6_addr *saddr;
1574 int hlen = LL_RESERVED_SPACE(dev);
1575 int tlen = dev->needed_tailroom;
1576 unsigned int size = mtu + hlen + tlen;
1578 u8 ra[8] = { IPPROTO_ICMPV6, 0,
1579 IPV6_TLV_ROUTERALERT, 2, 0, 0,
1582 /* we assume size > sizeof(ra) here */
1583 /* limit our allocations to order-0 page */
1584 size = min_t(int, size, SKB_MAX_ORDER(0, 0));
1585 skb = sock_alloc_send_skb(sk, size, 1, &err);
1590 skb->priority = TC_PRIO_CONTROL;
1591 skb_reserve(skb, hlen);
1592 skb_tailroom_reserve(skb, mtu, tlen);
1594 if (__ipv6_get_lladdr(idev, &addr_buf, IFA_F_TENTATIVE)) {
1595 /* <draft-ietf-magma-mld-source-05.txt>:
1596 * use unspecified address as the source address
1597 * when a valid link-local address is not available.
1599 saddr = &in6addr_any;
1603 ip6_mc_hdr(sk, skb, dev, saddr, &mld2_all_mcr, NEXTHDR_HOP, 0);
1605 skb_put_data(skb, ra, sizeof(ra));
1607 skb_set_transport_header(skb, skb_tail_pointer(skb) - skb->data);
1608 skb_put(skb, sizeof(*pmr));
1609 pmr = (struct mld2_report *)skb_transport_header(skb);
1610 pmr->mld2r_type = ICMPV6_MLD2_REPORT;
1611 pmr->mld2r_resv1 = 0;
1612 pmr->mld2r_cksum = 0;
1613 pmr->mld2r_resv2 = 0;
1614 pmr->mld2r_ngrec = 0;
/*
 * mld_sendpack - finalise and transmit an MLDv2 report built by
 * mld_newpack() / add_grec().
 *
 * Accounts the packet in the IP output statistics, derives the IPv6
 * payload length and the MLD message length from the skb tail pointer,
 * stores the payload length in the IPv6 header and computes the ICMPv6
 * checksum over the MLD message.  A route is obtained with
 * icmp6_dst_alloc() and attached to the skb, which is then passed through
 * the NF_INET_LOCAL_OUT netfilter hook.  ICMPv6 output counters are
 * bumped on one outcome and IPSTATS_MIB_OUTDISCARDS on the other.
 *
 * NOTE(review): the error-handling branches and labels are not visible
 * in this listing.
 */
1618 static void mld_sendpack(struct sk_buff *skb)
1620 struct ipv6hdr *pip6 = ipv6_hdr(skb);
1621 struct mld2_report *pmr =
1622 (struct mld2_report *)skb_transport_header(skb);
1623 int payload_len, mldlen;
1624 struct inet6_dev *idev;
1625 struct net *net = dev_net(skb->dev);
1628 struct dst_entry *dst;
1631 idev = __in6_dev_get(skb->dev);
1632 IP6_UPD_PO_STATS(net, idev, IPSTATS_MIB_OUT, skb->len);
1634 payload_len = (skb_tail_pointer(skb) - skb_network_header(skb)) -
1636 mldlen = skb_tail_pointer(skb) - skb_transport_header(skb);
1637 pip6->payload_len = htons(payload_len);
1639 pmr->mld2r_cksum = csum_ipv6_magic(&pip6->saddr, &pip6->daddr, mldlen,
1641 csum_partial(skb_transport_header(skb),
1644 icmpv6_flow_init(net->ipv6.igmp_sk, &fl6, ICMPV6_MLD2_REPORT,
1645 &ipv6_hdr(skb)->saddr, &ipv6_hdr(skb)->daddr,
1647 dst = icmp6_dst_alloc(skb->dev, &fl6);
1654 skb_dst_set(skb, dst);
1658 err = NF_HOOK(NFPROTO_IPV6, NF_INET_LOCAL_OUT,
1659 net, net->ipv6.igmp_sk, skb, NULL, skb->dev,
1663 ICMP6MSGOUT_INC_STATS(net, idev, ICMPV6_MLD2_REPORT);
1664 ICMP6_INC_STATS(net, idev, ICMP6_MIB_OUTMSGS);
1666 IP6_INC_STATS(net, idev, IPSTATS_MIB_OUTDISCARDS);
1677 static int grec_size(struct ifmcaddr6 *pmc, int type, int gdel, int sdel)
1679 return sizeof(struct mld2_grec) + 16 * mld_scount(pmc,type,gdel,sdel);
/*
 * add_grhead - append a group record header for @pmc to @skb.
 *
 * A packet may first be obtained from mld_newpack() (the guarding
 * condition is not visible here; presumably when @skb is NULL).  The new
 * struct mld2_grec gets record type @type, no auxiliary words, a zero
 * source count and the group address, and the report's record counter
 * mld2r_ngrec is incremented.
 *
 * NOTE(review): the store through @ppgr and the return statement are not
 * visible in this listing.
 */
1682 static struct sk_buff *add_grhead(struct sk_buff *skb, struct ifmcaddr6 *pmc,
1683 int type, struct mld2_grec **ppgr, unsigned int mtu)
1685 struct mld2_report *pmr;
1686 struct mld2_grec *pgr;
1689 skb = mld_newpack(pmc->idev, mtu);
1693 pgr = skb_put(skb, sizeof(struct mld2_grec));
1694 pgr->grec_type = type;
1695 pgr->grec_auxwords = 0;
1696 pgr->grec_nsrcs = 0;
1697 pgr->grec_mca = pmc->mca_addr; /* structure copy */
1698 pmr = (struct mld2_report *)skb_transport_header(skb);
1699 pmr->mld2r_ngrec = htons(ntohs(pmr->mld2r_ngrec)+1);
/* Room left in @skb as reported by skb_availroom(); 0 when @skb is NULL. */
1704 #define AVAILABLE(skb) ((skb) ? skb_availroom(skb) : 0)
/*
 * add_grec - add the group record of type @type for @pmc to a report.
 *
 * Sources come from pmc->mca_tomb when @sdeleted is set and from
 * pmc->mca_sources otherwise; only those accepted by is_in() are emitted.
 * Groups flagged MAF_NOREPORT and devices whose MTU is below
 * IPV6_MIN_MTU are special-cased up front.  When the current packet
 * cannot hold the next source (plus a record header for the first one),
 * the record is either cut short (EXCLUDE-type records, "truncate") or
 * the source count is written back and a new packet is started with
 * mld_newpack().  For ALLOW/BLOCK records the per-source sf_crcount is
 * handled at decrease_sf_crcount, and a source whose sf_crcount reached
 * zero is unlinked from the list when @sdeleted or @gdeleted is set.
 * If no source produced a header, one may still be added when the group
 * has a pending change count, the record answers a query, or @crsend is
 * set.  MAF_GSQUERY is cleared at the end.
 *
 * Callers assign the result back to their skb pointer.
 *
 * NOTE(review): many statements (packet sending, counter updates, frees,
 * returns) are not visible in this listing.
 */
1706 static struct sk_buff *add_grec(struct sk_buff *skb, struct ifmcaddr6 *pmc,
1707 int type, int gdeleted, int sdeleted, int crsend)
1709 struct inet6_dev *idev = pmc->idev;
1710 struct net_device *dev = idev->dev;
1711 struct mld2_report *pmr;
1712 struct mld2_grec *pgr = NULL;
1713 struct ip6_sf_list *psf, *psf_next, *psf_prev, **psf_list;
1714 int scount, stotal, first, isquery, truncate;
1717 if (pmc->mca_flags & MAF_NOREPORT)
1720 mtu = READ_ONCE(dev->mtu);
1721 if (mtu < IPV6_MIN_MTU)
1724 isquery = type == MLD2_MODE_IS_INCLUDE ||
1725 type == MLD2_MODE_IS_EXCLUDE;
1726 truncate = type == MLD2_MODE_IS_EXCLUDE ||
1727 type == MLD2_CHANGE_TO_EXCLUDE;
1729 stotal = scount = 0;
1731 psf_list = sdeleted ? &pmc->mca_tomb : &pmc->mca_sources;
1736 pmr = skb ? (struct mld2_report *)skb_transport_header(skb) : NULL;
1738 /* EX and TO_EX get a fresh packet, if needed */
1740 if (pmr && pmr->mld2r_ngrec &&
1741 AVAILABLE(skb) < grec_size(pmc, type, gdeleted, sdeleted)) {
1744 skb = mld_newpack(idev, mtu);
1749 for (psf = *psf_list; psf; psf = psf_next) {
1750 struct in6_addr *psrc;
1752 psf_next = psf->sf_next;
1754 if (!is_in(pmc, psf, type, gdeleted, sdeleted)) {
1759 /* Based on RFC3810 6.1. Should not send source-list change
1760 * records when there is a filter mode change.
1762 if (((gdeleted && pmc->mca_sfmode == MCAST_EXCLUDE) ||
1763 (!gdeleted && pmc->mca_crcount)) &&
1764 (type == MLD2_ALLOW_NEW_SOURCES ||
1765 type == MLD2_BLOCK_OLD_SOURCES) && psf->sf_crcount)
1766 goto decrease_sf_crcount;
1768 /* clear marks on query responses */
1772 if (AVAILABLE(skb) < sizeof(*psrc) +
1773 first*sizeof(struct mld2_grec)) {
1774 if (truncate && !first)
1775 break; /* truncate these */
1777 pgr->grec_nsrcs = htons(scount);
1780 skb = mld_newpack(idev, mtu);
1785 skb = add_grhead(skb, pmc, type, &pgr, mtu);
1790 psrc = skb_put(skb, sizeof(*psrc));
1791 *psrc = psf->sf_addr;
1793 if ((type == MLD2_ALLOW_NEW_SOURCES ||
1794 type == MLD2_BLOCK_OLD_SOURCES) && psf->sf_crcount) {
1795 decrease_sf_crcount:
1797 if ((sdeleted || gdeleted) && psf->sf_crcount == 0) {
1799 psf_prev->sf_next = psf->sf_next;
1801 *psf_list = psf->sf_next;
1811 if (type == MLD2_ALLOW_NEW_SOURCES ||
1812 type == MLD2_BLOCK_OLD_SOURCES)
1814 if (pmc->mca_crcount || isquery || crsend) {
1815 /* make sure we have room for group header */
1816 if (skb && AVAILABLE(skb) < sizeof(struct mld2_grec)) {
1818 skb = NULL; /* add_grhead will get a new one */
1820 skb = add_grhead(skb, pmc, type, &pgr, mtu);
1824 pgr->grec_nsrcs = htons(scount);
1827 pmc->mca_flags &= ~MAF_GSQUERY; /* clear query state */
/*
 * mld_send_report - build current-state records with add_grec().
 *
 * Two paths are visible, both under the idev read lock and the per-group
 * mca_lock: one walks every entry of idev->mc_list (skipping groups
 * flagged MAF_NOREPORT), the other handles the single group @pmc.  The
 * record type is MLD2_MODE_IS_EXCLUDE when the group has EXCLUDE users
 * and MLD2_MODE_IS_INCLUDE otherwise.
 *
 * NOTE(review): the test selecting between the two paths (presumably
 * pmc == NULL, as the general-query timer passes NULL) and the final
 * transmit call are not visible in this listing.
 */
1831 static void mld_send_report(struct inet6_dev *idev, struct ifmcaddr6 *pmc)
1833 struct sk_buff *skb = NULL;
1836 read_lock_bh(&idev->lock);
1838 for (pmc = idev->mc_list; pmc; pmc = pmc->next) {
1839 if (pmc->mca_flags & MAF_NOREPORT)
1841 spin_lock_bh(&pmc->mca_lock);
1842 if (pmc->mca_sfcount[MCAST_EXCLUDE])
1843 type = MLD2_MODE_IS_EXCLUDE;
1845 type = MLD2_MODE_IS_INCLUDE;
1846 skb = add_grec(skb, pmc, type, 0, 0, 0);
1847 spin_unlock_bh(&pmc->mca_lock);
1850 spin_lock_bh(&pmc->mca_lock);
1851 if (pmc->mca_sfcount[MCAST_EXCLUDE])
1852 type = MLD2_MODE_IS_EXCLUDE;
1854 type = MLD2_MODE_IS_INCLUDE;
1855 skb = add_grec(skb, pmc, type, 0, 0, 0);
1856 spin_unlock_bh(&pmc->mca_lock);
1858 read_unlock_bh(&idev->lock);
/*
 * mld_clear_zeros - unlink every entry whose sf_crcount is zero from the
 * singly linked source list headed by *ppsf, fixing up either the
 * previous entry's sf_next or the list head.
 *
 * NOTE(review): the psf_prev bookkeeping and the release of the unlinked
 * entry are not visible in this listing.
 */
1864 * remove zero-count source records from a source filter list
1866 static void mld_clear_zeros(struct ip6_sf_list **ppsf)
1868 struct ip6_sf_list *psf_prev, *psf_next, *psf;
1871 for (psf = *ppsf; psf; psf = psf_next) {
1872 psf_next = psf->sf_next;
1873 if (psf->sf_crcount == 0) {
1875 psf_prev->sf_next = psf->sf_next;
1877 *ppsf = psf->sf_next;
/*
 * mld_send_cr - build and send MLDv2 state-change records for @idev.
 *
 * First pass (idev->mc_tomb, under mc_lock): deleted groups in INCLUDE
 * mode get BLOCK_OLD_SOURCES records for live and deleted sources; a
 * deleted group with a pending change count in EXCLUDE mode gets a
 * CHANGE_TO_INCLUDE record.  Once a group's change count is zero its
 * zero-count sources are pruned, and a group with no remaining change
 * count and no sources is unlinked from mc_tomb and its idev reference
 * dropped.
 *
 * Second pass (idev->mc_list, each group under mca_lock): emits
 * ALLOW/BLOCK records for current and deleted sources - which of the two
 * types applies to which list depends on whether the group has EXCLUDE
 * users - followed by a CHANGE_TO_EXCLUDE/INCLUDE record while a filter
 * mode change is pending.
 *
 * The resulting packet is handed to mld_sendpack().
 *
 * NOTE(review): counter decrements, frees and the guard before the final
 * send are not visible in this listing.
 */
1884 static void mld_send_cr(struct inet6_dev *idev)
1886 struct ifmcaddr6 *pmc, *pmc_prev, *pmc_next;
1887 struct sk_buff *skb = NULL;
1890 read_lock_bh(&idev->lock);
1891 spin_lock(&idev->mc_lock);
1895 for (pmc = idev->mc_tomb; pmc; pmc = pmc_next) {
1896 pmc_next = pmc->next;
1897 if (pmc->mca_sfmode == MCAST_INCLUDE) {
1898 type = MLD2_BLOCK_OLD_SOURCES;
1899 dtype = MLD2_BLOCK_OLD_SOURCES;
1900 skb = add_grec(skb, pmc, type, 1, 0, 0);
1901 skb = add_grec(skb, pmc, dtype, 1, 1, 0);
1903 if (pmc->mca_crcount) {
1904 if (pmc->mca_sfmode == MCAST_EXCLUDE) {
1905 type = MLD2_CHANGE_TO_INCLUDE;
1906 skb = add_grec(skb, pmc, type, 1, 0, 0);
1909 if (pmc->mca_crcount == 0) {
1910 mld_clear_zeros(&pmc->mca_tomb);
1911 mld_clear_zeros(&pmc->mca_sources);
1914 if (pmc->mca_crcount == 0 && !pmc->mca_tomb &&
1915 !pmc->mca_sources) {
1917 pmc_prev->next = pmc_next;
1919 idev->mc_tomb = pmc_next;
1920 in6_dev_put(pmc->idev);
1925 spin_unlock(&idev->mc_lock);
1928 for (pmc = idev->mc_list; pmc; pmc = pmc->next) {
1929 spin_lock_bh(&pmc->mca_lock);
1930 if (pmc->mca_sfcount[MCAST_EXCLUDE]) {
1931 type = MLD2_BLOCK_OLD_SOURCES;
1932 dtype = MLD2_ALLOW_NEW_SOURCES;
1934 type = MLD2_ALLOW_NEW_SOURCES;
1935 dtype = MLD2_BLOCK_OLD_SOURCES;
1937 skb = add_grec(skb, pmc, type, 0, 0, 0);
1938 skb = add_grec(skb, pmc, dtype, 0, 1, 0); /* deleted sources */
1940 /* filter mode changes */
1941 if (pmc->mca_crcount) {
1942 if (pmc->mca_sfmode == MCAST_EXCLUDE)
1943 type = MLD2_CHANGE_TO_EXCLUDE;
1945 type = MLD2_CHANGE_TO_INCLUDE;
1946 skb = add_grec(skb, pmc, type, 0, 0, 0);
1949 spin_unlock_bh(&pmc->mca_lock);
1951 read_unlock_bh(&idev->lock);
1954 (void) mld_sendpack(skb);
/*
 * igmp6_send - build and transmit a single-group MLD message of ICMPv6
 * type @type for group @addr on @dev.
 *
 * ICMPV6_MGM_REDUCTION messages are addressed to the link-local
 * all-routers group (the destination for other types is chosen on a line
 * not visible here).  The packet consists of an IPv6 header with a
 * hop-by-hop next header, the 8-byte router-alert option block "ra" and a
 * zeroed struct mld_msg carrying the type and group address; the source
 * is the unspecified address when no usable link-local address exists.
 * After checksumming, a route is obtained with icmp6_dst_alloc() and the
 * skb is passed through the NF_INET_LOCAL_OUT hook.  Output statistics
 * are updated before allocation and after the send; allocation failure
 * is counted as IPSTATS_MIB_OUTDISCARDS.
 *
 * NOTE(review): several branches, labels and return statements are not
 * visible in this listing.
 */
1957 static void igmp6_send(struct in6_addr *addr, struct net_device *dev, int type)
1959 struct net *net = dev_net(dev);
1960 struct sock *sk = net->ipv6.igmp_sk;
1961 struct inet6_dev *idev;
1962 struct sk_buff *skb;
1963 struct mld_msg *hdr;
1964 const struct in6_addr *snd_addr, *saddr;
1965 struct in6_addr addr_buf;
1966 int hlen = LL_RESERVED_SPACE(dev);
1967 int tlen = dev->needed_tailroom;
1968 int err, len, payload_len, full_len;
1969 u8 ra[8] = { IPPROTO_ICMPV6, 0,
1970 IPV6_TLV_ROUTERALERT, 2, 0, 0,
1973 struct dst_entry *dst;
1975 if (type == ICMPV6_MGM_REDUCTION)
1976 snd_addr = &in6addr_linklocal_allrouters;
1980 len = sizeof(struct icmp6hdr) + sizeof(struct in6_addr);
1981 payload_len = len + sizeof(ra);
1982 full_len = sizeof(struct ipv6hdr) + payload_len;
1985 IP6_UPD_PO_STATS(net, __in6_dev_get(dev),
1986 IPSTATS_MIB_OUT, full_len);
1989 skb = sock_alloc_send_skb(sk, hlen + tlen + full_len, 1, &err);
1993 IP6_INC_STATS(net, __in6_dev_get(dev),
1994 IPSTATS_MIB_OUTDISCARDS);
1998 skb->priority = TC_PRIO_CONTROL;
1999 skb_reserve(skb, hlen);
2001 if (ipv6_get_lladdr(dev, &addr_buf, IFA_F_TENTATIVE)) {
2002 /* <draft-ietf-magma-mld-source-05.txt>:
2003 * use unspecified address as the source address
2004 * when a valid link-local address is not available.
2006 saddr = &in6addr_any;
2010 ip6_mc_hdr(sk, skb, dev, saddr, snd_addr, NEXTHDR_HOP, payload_len);
2012 skb_put_data(skb, ra, sizeof(ra));
2014 hdr = skb_put_zero(skb, sizeof(struct mld_msg));
2015 hdr->mld_type = type;
2016 hdr->mld_mca = *addr;
2018 hdr->mld_cksum = csum_ipv6_magic(saddr, snd_addr, len,
2020 csum_partial(hdr, len, 0));
2023 idev = __in6_dev_get(skb->dev);
2025 icmpv6_flow_init(sk, &fl6, type,
2026 &ipv6_hdr(skb)->saddr, &ipv6_hdr(skb)->daddr,
2028 dst = icmp6_dst_alloc(skb->dev, &fl6);
2034 skb_dst_set(skb, dst);
2035 err = NF_HOOK(NFPROTO_IPV6, NF_INET_LOCAL_OUT,
2036 net, sk, skb, NULL, skb->dev,
2040 ICMP6MSGOUT_INC_STATS(net, idev, type);
2041 ICMP6_INC_STATS(net, idev, ICMP6_MIB_OUTMSGS);
2043 IP6_INC_STATS(net, idev, IPSTATS_MIB_OUTDISCARDS);
/*
 * mld_send_initial_cr - build the initial filter-mode change records for
 * every group on @idev.
 *
 * MLDv1 mode is tested first.  Otherwise each group on idev->mc_list
 * gets, under its mca_lock, a CHANGE_TO_EXCLUDE record when it has
 * EXCLUDE users and a CHANGE_TO_INCLUDE record when it has none, with
 * add_grec()'s crsend argument set.
 *
 * NOTE(review): the v1-mode early exit, the skb initialisation and the
 * final transmit call are not visible in this listing.
 */
2053 static void mld_send_initial_cr(struct inet6_dev *idev)
2055 struct sk_buff *skb;
2056 struct ifmcaddr6 *pmc;
2059 if (mld_in_v1_mode(idev))
2063 read_lock_bh(&idev->lock);
2064 for (pmc = idev->mc_list; pmc; pmc = pmc->next) {
2065 spin_lock_bh(&pmc->mca_lock);
2066 if (pmc->mca_sfcount[MCAST_EXCLUDE])
2067 type = MLD2_CHANGE_TO_EXCLUDE;
2069 type = MLD2_CHANGE_TO_INCLUDE;
2070 skb = add_grec(skb, pmc, type, 0, 0, 1);
2071 spin_unlock_bh(&pmc->mca_lock);
2073 read_unlock_bh(&idev->lock);
2078 void ipv6_mc_dad_complete(struct inet6_dev *idev)
2080 idev->mc_dad_count = idev->mc_qrv;
2081 if (idev->mc_dad_count) {
2082 mld_send_initial_cr(idev);
2083 idev->mc_dad_count--;
2084 if (idev->mc_dad_count)
2085 mld_dad_start_timer(idev, idev->mc_maxdelay);
/*
 * mld_dad_timer_expire - callback of idev->mc_dad_timer.
 *
 * Sends another initial change report, then decrements mc_dad_count if
 * it is non-zero and re-arms the timer with mc_maxdelay while
 * transmissions remain.
 *
 * NOTE(review): any statement following the visible ones is not shown in
 * this listing.
 */
2089 static void mld_dad_timer_expire(struct timer_list *t)
2091 struct inet6_dev *idev = from_timer(idev, t, mc_dad_timer);
2093 mld_send_initial_cr(idev);
2094 if (idev->mc_dad_count) {
2095 idev->mc_dad_count--;
2096 if (idev->mc_dad_count)
2097 mld_dad_start_timer(idev, idev->mc_maxdelay);
/*
 * ip6_mc_del1_src - drop one @sfmode reference to source @psfsrc from
 * group @pmc.
 *
 * The source is looked up in pmc->mca_sources; a missing entry or a zero
 * count for @sfmode is treated as a bug.  After the decrement, an entry
 * with no INCLUDE and no EXCLUDE references left is unlinked from the
 * list.  If it was previously "in" (sf_oldin), the group is reportable
 * and the interface is not in MLDv1 mode, it is moved to pmc->mca_tomb
 * with sf_crcount set to mc_qrv.
 *
 * NOTE(review): return values and the alternative to the tomb path are
 * not visible in this listing; ip6_mc_del_src() treats a result > 0 as
 * "change record needed".
 */
2102 static int ip6_mc_del1_src(struct ifmcaddr6 *pmc, int sfmode,
2103 const struct in6_addr *psfsrc)
2105 struct ip6_sf_list *psf, *psf_prev;
2109 for (psf = pmc->mca_sources; psf; psf = psf->sf_next) {
2110 if (ipv6_addr_equal(&psf->sf_addr, psfsrc))
2114 if (!psf || psf->sf_count[sfmode] == 0) {
2115 /* source filter not found, or count wrong => bug */
2118 psf->sf_count[sfmode]--;
2119 if (!psf->sf_count[MCAST_INCLUDE] && !psf->sf_count[MCAST_EXCLUDE]) {
2120 struct inet6_dev *idev = pmc->idev;
2122 /* no more filters for this source */
2124 psf_prev->sf_next = psf->sf_next;
2126 pmc->mca_sources = psf->sf_next;
2127 if (psf->sf_oldin && !(pmc->mca_flags & MAF_NOREPORT) &&
2128 !mld_in_v1_mode(idev)) {
2129 psf->sf_crcount = idev->mc_qrv;
2130 psf->sf_next = pmc->mca_tomb;
2131 pmc->mca_tomb = psf;
/*
 * ip6_mc_del_src - remove a source filter list from group @pmca on
 * @idev.
 *
 * The group is looked up on idev->mc_list under the idev read lock; a
 * missing group is treated as a bug.  With the group's mca_lock held,
 * the per-mode user count mca_sfcount[@sfmode] is checked and
 * decremented and each of the @sfcount sources in @psfsrc is released
 * through ip6_mc_del1_src().  If the group was in EXCLUDE mode and now
 * has only INCLUDE users, it switches to INCLUDE mode, the change
 * counters are loaded from mc_qrv, per-source sf_crcount is reset and an
 * interface-change event is raised.  Otherwise an event is raised when
 * sf_setstate() or a single-source delete reports a change.
 *
 * NOTE(review): the last parameter, guards around some steps and the
 * return statements are not visible in this listing.
 */
2139 static int ip6_mc_del_src(struct inet6_dev *idev, const struct in6_addr *pmca,
2140 int sfmode, int sfcount, const struct in6_addr *psfsrc,
2143 struct ifmcaddr6 *pmc;
2149 read_lock_bh(&idev->lock);
2150 for (pmc = idev->mc_list; pmc; pmc = pmc->next) {
2151 if (ipv6_addr_equal(pmca, &pmc->mca_addr))
2155 /* MCA not found?? bug */
2156 read_unlock_bh(&idev->lock);
2159 spin_lock_bh(&pmc->mca_lock);
2162 if (!pmc->mca_sfcount[sfmode]) {
2163 spin_unlock_bh(&pmc->mca_lock);
2164 read_unlock_bh(&idev->lock);
2167 pmc->mca_sfcount[sfmode]--;
2170 for (i = 0; i < sfcount; i++) {
2171 int rv = ip6_mc_del1_src(pmc, sfmode, &psfsrc[i]);
2173 changerec |= rv > 0;
2177 if (pmc->mca_sfmode == MCAST_EXCLUDE &&
2178 pmc->mca_sfcount[MCAST_EXCLUDE] == 0 &&
2179 pmc->mca_sfcount[MCAST_INCLUDE]) {
2180 struct ip6_sf_list *psf;
2182 /* filter mode change */
2183 pmc->mca_sfmode = MCAST_INCLUDE;
2184 pmc->mca_crcount = idev->mc_qrv;
2185 idev->mc_ifc_count = pmc->mca_crcount;
2186 for (psf = pmc->mca_sources; psf; psf = psf->sf_next)
2187 psf->sf_crcount = 0;
2188 mld_ifc_event(pmc->idev);
2189 } else if (sf_setstate(pmc) || changerec)
2190 mld_ifc_event(pmc->idev);
2191 spin_unlock_bh(&pmc->mca_lock);
2192 read_unlock_bh(&idev->lock);
/*
 * ip6_mc_add1_src - take one @sfmode reference on source @psfsrc in
 * group @pmc.
 *
 * The source is searched for in pmc->mca_sources; a new zeroed entry is
 * allocated with GFP_ATOMIC and linked after the last entry (or as the
 * list head).  The count for @sfmode is then incremented.
 *
 * NOTE(review): the "not found" test, allocation-failure handling and
 * return statements are not visible in this listing.
 */
2197 * Add multicast single-source filter to the interface list
2199 static int ip6_mc_add1_src(struct ifmcaddr6 *pmc, int sfmode,
2200 const struct in6_addr *psfsrc)
2202 struct ip6_sf_list *psf, *psf_prev;
2205 for (psf = pmc->mca_sources; psf; psf = psf->sf_next) {
2206 if (ipv6_addr_equal(&psf->sf_addr, psfsrc))
2211 psf = kzalloc(sizeof(*psf), GFP_ATOMIC);
2215 psf->sf_addr = *psfsrc;
2217 psf_prev->sf_next = psf;
2219 pmc->mca_sources = psf;
2221 psf->sf_count[sfmode]++;
/*
 * sf_markstate - record in sf_oldin, for every source of @pmc, whether
 * the source is currently "in" the reported filter.
 *
 * Two formulas are visible: the source is excluded by every EXCLUDE user
 * and has no INCLUDE reference, or the source has at least one INCLUDE
 * reference.
 *
 * NOTE(review): the line joining the two branches is not visible;
 * presumably the second formula is the else branch used when the group
 * has no EXCLUDE users.
 */
2225 static void sf_markstate(struct ifmcaddr6 *pmc)
2227 struct ip6_sf_list *psf;
2228 int mca_xcount = pmc->mca_sfcount[MCAST_EXCLUDE];
2230 for (psf = pmc->mca_sources; psf; psf = psf->sf_next)
2231 if (pmc->mca_sfcount[MCAST_EXCLUDE]) {
2232 psf->sf_oldin = mca_xcount ==
2233 psf->sf_count[MCAST_EXCLUDE] &&
2234 !psf->sf_count[MCAST_INCLUDE];
2236 psf->sf_oldin = psf->sf_count[MCAST_INCLUDE] != 0;
/*
 * sf_setstate - compare each source's new "in" state with the sf_oldin
 * value and schedule change records accordingly.
 *
 * new_in is computed with the same two formulas sf_markstate() uses.  In
 * the branch for sources that were not "in" before, a matching entry is
 * looked up on pmc->mca_tomb and unlinked, and the source's sf_crcount
 * is set to mc_qrv.  In the branch for sources that were "in" before,
 * sf_crcount is cleared and a delete record is found on, or allocated
 * (GFP_ATOMIC) and pushed onto, pmc->mca_tomb with sf_crcount set to
 * mc_qrv.
 *
 * Callers treat a non-zero result as "an interface-change event is
 * needed".
 *
 * NOTE(review): the new_in tests, frees, the copy into the new delete
 * record and the return value bookkeeping are not visible in this
 * listing.
 */
2239 static int sf_setstate(struct ifmcaddr6 *pmc)
2241 struct ip6_sf_list *psf, *dpsf;
2242 int mca_xcount = pmc->mca_sfcount[MCAST_EXCLUDE];
2243 int qrv = pmc->idev->mc_qrv;
2247 for (psf = pmc->mca_sources; psf; psf = psf->sf_next) {
2248 if (pmc->mca_sfcount[MCAST_EXCLUDE]) {
2249 new_in = mca_xcount == psf->sf_count[MCAST_EXCLUDE] &&
2250 !psf->sf_count[MCAST_INCLUDE];
2252 new_in = psf->sf_count[MCAST_INCLUDE] != 0;
2254 if (!psf->sf_oldin) {
2255 struct ip6_sf_list *prev = NULL;
2257 for (dpsf = pmc->mca_tomb; dpsf;
2258 dpsf = dpsf->sf_next) {
2259 if (ipv6_addr_equal(&dpsf->sf_addr,
2266 prev->sf_next = dpsf->sf_next;
2268 pmc->mca_tomb = dpsf->sf_next;
2271 psf->sf_crcount = qrv;
2274 } else if (psf->sf_oldin) {
2275 psf->sf_crcount = 0;
2277 * add or update "delete" records if an active filter
2280 for (dpsf = pmc->mca_tomb; dpsf; dpsf = dpsf->sf_next)
2281 if (ipv6_addr_equal(&dpsf->sf_addr,
2285 dpsf = kmalloc(sizeof(*dpsf), GFP_ATOMIC);
2289 /* pmc->mca_lock held by callers */
2290 dpsf->sf_next = pmc->mca_tomb;
2291 pmc->mca_tomb = dpsf;
2293 dpsf->sf_crcount = qrv;
/*
 * ip6_mc_add_src - add a source filter list to group @pmca on @idev.
 *
 * The group is looked up on idev->mc_list under the idev read lock; a
 * missing group is treated as a bug.  With the group's mca_lock held,
 * the per-mode user count is incremented and every source in @psfsrc is
 * added through ip6_mc_add1_src().  On failure the user count is
 * restored and the sources added so far are removed again.  If the
 * group's EXCLUDE-ness changed, the filter mode is updated (kept as is
 * when no filters remain), the change counters are loaded from mc_qrv,
 * per-source sf_crcount is reset and an interface-change event is
 * raised.  Otherwise an event is raised when sf_setstate() reports a
 * change.
 *
 * NOTE(review): the last parameter, guards around some steps, the error
 * test and the return statement are not visible in this listing.
 */
2301 * Add multicast source filter list to the interface list
2303 static int ip6_mc_add_src(struct inet6_dev *idev, const struct in6_addr *pmca,
2304 int sfmode, int sfcount, const struct in6_addr *psfsrc,
2307 struct ifmcaddr6 *pmc;
2313 read_lock_bh(&idev->lock);
2314 for (pmc = idev->mc_list; pmc; pmc = pmc->next) {
2315 if (ipv6_addr_equal(pmca, &pmc->mca_addr))
2319 /* MCA not found?? bug */
2320 read_unlock_bh(&idev->lock);
2323 spin_lock_bh(&pmc->mca_lock);
2326 isexclude = pmc->mca_sfmode == MCAST_EXCLUDE;
2328 pmc->mca_sfcount[sfmode]++;
2330 for (i = 0; i < sfcount; i++) {
2331 err = ip6_mc_add1_src(pmc, sfmode, &psfsrc[i]);
2339 pmc->mca_sfcount[sfmode]--;
2340 for (j = 0; j < i; j++)
2341 ip6_mc_del1_src(pmc, sfmode, &psfsrc[j]);
2342 } else if (isexclude != (pmc->mca_sfcount[MCAST_EXCLUDE] != 0)) {
2343 struct ip6_sf_list *psf;
2345 /* filter mode change */
2346 if (pmc->mca_sfcount[MCAST_EXCLUDE])
2347 pmc->mca_sfmode = MCAST_EXCLUDE;
2348 else if (pmc->mca_sfcount[MCAST_INCLUDE])
2349 pmc->mca_sfmode = MCAST_INCLUDE;
2350 /* else no filters; keep old mode for reports */
2352 pmc->mca_crcount = idev->mc_qrv;
2353 idev->mc_ifc_count = pmc->mca_crcount;
2354 for (psf = pmc->mca_sources; psf; psf = psf->sf_next)
2355 psf->sf_crcount = 0;
2356 mld_ifc_event(idev);
2357 } else if (sf_setstate(pmc))
2358 mld_ifc_event(idev);
2359 spin_unlock_bh(&pmc->mca_lock);
2360 read_unlock_bh(&idev->lock);
/*
 * ip6_mc_clear_src - reset the source filter state of @pmc.
 *
 * Walks and empties both pmc->mca_tomb and pmc->mca_sources, then puts
 * the group back to EXCLUDE mode with zero INCLUDE users and one EXCLUDE
 * user.
 *
 * NOTE(review): the statement inside each walk (presumably freeing the
 * entry) is not visible in this listing.
 */
2364 static void ip6_mc_clear_src(struct ifmcaddr6 *pmc)
2366 struct ip6_sf_list *psf, *nextpsf;
2368 for (psf = pmc->mca_tomb; psf; psf = nextpsf) {
2369 nextpsf = psf->sf_next;
2372 pmc->mca_tomb = NULL;
2373 for (psf = pmc->mca_sources; psf; psf = nextpsf) {
2374 nextpsf = psf->sf_next;
2377 pmc->mca_sources = NULL;
2378 pmc->mca_sfmode = MCAST_EXCLUDE;
2379 pmc->mca_sfcount[MCAST_INCLUDE] = 0;
2380 pmc->mca_sfcount[MCAST_EXCLUDE] = 1;
/*
 * igmp6_join_group - send an MLDv1 report for @ma and (re)arm its report
 * timer.
 *
 * Groups flagged MAF_NOREPORT are special-cased first.  A report is sent
 * immediately, then the group timer is set to a random delay below the
 * unsolicited report interval.  If a timer was already pending it is
 * cancelled (dropping the reference it held) and its remaining time is
 * reused as the delay.  A reference is taken when mod_timer() reports
 * that the timer was not pending, and the group is flagged
 * MAF_TIMER_RUNNING | MAF_LAST_REPORTER.
 *
 * NOTE(review): the MAF_NOREPORT early exit is not visible in this
 * listing.
 */
2384 static void igmp6_join_group(struct ifmcaddr6 *ma)
2386 unsigned long delay;
2388 if (ma->mca_flags & MAF_NOREPORT)
2391 igmp6_send(&ma->mca_addr, ma->idev->dev, ICMPV6_MGM_REPORT);
2393 delay = prandom_u32() % unsolicited_report_interval(ma->idev);
2395 spin_lock_bh(&ma->mca_lock);
2396 if (del_timer(&ma->mca_timer)) {
2397 refcount_dec(&ma->mca_refcnt);
2398 delay = ma->mca_timer.expires - jiffies;
2401 if (!mod_timer(&ma->mca_timer, jiffies + delay))
2402 refcount_inc(&ma->mca_refcnt);
2403 ma->mca_flags |= MAF_TIMER_RUNNING | MAF_LAST_REPORTER;
2404 spin_unlock_bh(&ma->mca_lock);
/*
 * ip6_mc_leave_src - release the source filter state socket @sk holds
 * for membership @iml on @idev.
 *
 * Two paths are visible: the "any-source empty exclude" case drops a
 * single filter-mode reference with an empty source list; otherwise
 * every source in iml->sflist is removed and the list itself is freed
 * with sock_kfree_s().
 *
 * NOTE(review): the test choosing between the two paths (presumably
 * whether iml->sflist is set) and the final return are not visible in
 * this listing.
 */
2407 static int ip6_mc_leave_src(struct sock *sk, struct ipv6_mc_socklist *iml,
2408 struct inet6_dev *idev)
2412 /* callers have the socket lock and rtnl lock
2413 * so no other readers or writers of iml or its sflist
2416 /* any-source empty exclude case */
2417 return ip6_mc_del_src(idev, &iml->addr, iml->sfmode, 0, NULL, 0);
2419 err = ip6_mc_del_src(idev, &iml->addr, iml->sfmode,
2420 iml->sflist->sl_count, iml->sflist->sl_addr, 0);
2421 sock_kfree_s(sk, iml->sflist, IP6_SFLSIZE(iml->sflist->sl_max));
/*
 * igmp6_leave_group - announce that group @ma is being left.
 *
 * In MLDv1 mode a reduction (done) message is sent, but only if this
 * host was the last reporter for the group.  The other visible path
 * records a delete record for the group and raises an interface-change
 * event.
 *
 * NOTE(review): the line separating the two paths is not visible;
 * presumably the second path is the else branch for MLDv2 mode.
 */
2426 static void igmp6_leave_group(struct ifmcaddr6 *ma)
2428 if (mld_in_v1_mode(ma->idev)) {
2429 if (ma->mca_flags & MAF_LAST_REPORTER)
2430 igmp6_send(&ma->mca_addr, ma->idev->dev,
2431 ICMPV6_MGM_REDUCTION);
2433 mld_add_delrec(ma->idev, ma);
2434 mld_ifc_event(ma->idev);
/*
 * mld_gq_timer_expire - callback of idev->mc_gq_timer: clears the
 * "general query running" flag and sends a report covering all groups
 * (mld_send_report() with a NULL group).
 *
 * NOTE(review): any statement following the visible ones is not shown in
 * this listing.
 */
2438 static void mld_gq_timer_expire(struct timer_list *t)
2440 struct inet6_dev *idev = from_timer(idev, t, mc_gq_timer);
2442 idev->mc_gq_running = 0;
2443 mld_send_report(idev, NULL);
/*
 * mld_ifc_timer_expire - callback of idev->mc_ifc_timer.
 *
 * While mc_ifc_count is non-zero it is decremented, and the timer is
 * re-armed with mc_maxdelay if retransmissions remain.
 *
 * NOTE(review): the statement before the counter handling (presumably
 * sending the change report) and any trailing statement are not visible
 * in this listing.
 */
2447 static void mld_ifc_timer_expire(struct timer_list *t)
2449 struct inet6_dev *idev = from_timer(idev, t, mc_ifc_timer);
2452 if (idev->mc_ifc_count) {
2453 idev->mc_ifc_count--;
2454 if (idev->mc_ifc_count)
2455 mld_ifc_start_timer(idev, idev->mc_maxdelay);
/*
 * mld_ifc_event - note that the interface's multicast state changed:
 * load the retransmission counter mc_ifc_count from mc_qrv and start the
 * interface-change timer with a delay argument of 1.
 *
 * MLDv1 mode is tested first; NOTE(review): the statement taken in that
 * case (presumably an early return) is not visible in this listing.
 */
2460 static void mld_ifc_event(struct inet6_dev *idev)
2462 if (mld_in_v1_mode(idev))
2464 idev->mc_ifc_count = idev->mc_qrv;
2465 mld_ifc_start_timer(idev, 1);
/*
 * igmp6_timer_handler - callback of the per-group mca_timer.
 *
 * Sends a report for the group - an MLDv1 report in v1 mode, otherwise
 * (presumably the else branch) an MLDv2 report via mld_send_report() -
 * then, under mca_lock, marks this host as last reporter and clears
 * MAF_TIMER_RUNNING.
 *
 * NOTE(review): any statement following the visible ones is not shown in
 * this listing.
 */
2468 static void igmp6_timer_handler(struct timer_list *t)
2470 struct ifmcaddr6 *ma = from_timer(ma, t, mca_timer);
2472 if (mld_in_v1_mode(ma->idev))
2473 igmp6_send(&ma->mca_addr, ma->idev->dev, ICMPV6_MGM_REPORT);
2475 mld_send_report(ma->idev, ma);
2477 spin_lock(&ma->mca_lock);
2478 ma->mca_flags |= MAF_LAST_REPORTER;
2479 ma->mca_flags &= ~MAF_TIMER_RUNNING;
2480 spin_unlock(&ma->mca_lock);
2484 /* Device changing type */
2486 void ipv6_mc_unmap(struct inet6_dev *idev)
2488 struct ifmcaddr6 *i;
2490 /* Install multicast list, except for all-nodes (already installed) */
2492 read_lock_bh(&idev->lock);
2493 for (i = idev->mc_list; i; i = i->next)
2494 igmp6_group_dropped(i);
2495 read_unlock_bh(&idev->lock);
/*
 * ipv6_mc_remap - counterpart of ipv6_mc_unmap().
 *
 * NOTE(review): the body is not visible in this listing; confirm its
 * behaviour against the full source.
 */
2498 void ipv6_mc_remap(struct inet6_dev *idev)
2503 /* Device going down */
2505 void ipv6_mc_down(struct inet6_dev *idev)
2507 struct ifmcaddr6 *i;
2509 /* Withdraw multicast list */
2511 read_lock_bh(&idev->lock);
2513 for (i = idev->mc_list; i; i = i->next)
2514 igmp6_group_dropped(i);
2516 /* Should stop timer after group drop. or we will
2517 * start timer again in mld_ifc_event()
2519 mld_ifc_stop_timer(idev);
2520 mld_gq_stop_timer(idev);
2521 mld_dad_stop_timer(idev);
2522 read_unlock_bh(&idev->lock);
2525 static void ipv6_mc_reset(struct inet6_dev *idev)
2527 idev->mc_qrv = sysctl_mld_qrv;
2528 idev->mc_qi = MLD_QI_DEFAULT;
2529 idev->mc_qri = MLD_QRI_DEFAULT;
2530 idev->mc_v1_seen = 0;
2531 idev->mc_maxdelay = unsolicited_report_interval(idev);
2534 /* Device going up */
2536 void ipv6_mc_up(struct inet6_dev *idev)
2538 struct ifmcaddr6 *i;
2540 /* Install multicast list, except for all-nodes (already installed) */
2542 read_lock_bh(&idev->lock);
2543 ipv6_mc_reset(idev);
2544 for (i = idev->mc_list; i; i = i->next) {
2545 mld_del_delrec(idev, i);
2546 igmp6_group_added(i);
2548 read_unlock_bh(&idev->lock);
2551 /* IPv6 device initialization. */
2553 void ipv6_mc_init_dev(struct inet6_dev *idev)
2555 write_lock_bh(&idev->lock);
2556 spin_lock_init(&idev->mc_lock);
2557 idev->mc_gq_running = 0;
2558 timer_setup(&idev->mc_gq_timer, mld_gq_timer_expire, 0);
2559 idev->mc_tomb = NULL;
2560 idev->mc_ifc_count = 0;
2561 timer_setup(&idev->mc_ifc_timer, mld_ifc_timer_expire, 0);
2562 timer_setup(&idev->mc_dad_timer, mld_dad_timer_expire, 0);
2563 ipv6_mc_reset(idev);
2564 write_unlock_bh(&idev->lock);
/*
 * ipv6_mc_destroy_dev - release all multicast state of a device that is
 * being destroyed.
 *
 * Clears the delete records, drops the link-local all-nodes membership
 * and, when forwarding is enabled, the all-routers membership (using the
 * __ipv6_dev_mc_dec() variant that takes the idev directly), then pops
 * every remaining entry off idev->mc_list.  The write lock is released
 * and re-taken around the per-entry work.
 *
 * NOTE(review): the timer deactivation call and the per-entry teardown
 * statements are not visible in this listing.
 */
2568 * Device is about to be destroyed: clean up.
2571 void ipv6_mc_destroy_dev(struct inet6_dev *idev)
2573 struct ifmcaddr6 *i;
2575 /* Deactivate timers */
2577 mld_clear_delrec(idev);
2579 /* Delete all-nodes address. */
2580 /* We cannot call ipv6_dev_mc_dec() directly, our caller in
2581 * addrconf.c has NULL'd out dev->ip6_ptr so in6_dev_get() will
2584 __ipv6_dev_mc_dec(idev, &in6addr_linklocal_allnodes);
2586 if (idev->cnf.forwarding)
2587 __ipv6_dev_mc_dec(idev, &in6addr_linklocal_allrouters);
2589 write_lock_bh(&idev->lock);
2590 while ((i = idev->mc_list) != NULL) {
2591 idev->mc_list = i->next;
2593 write_unlock_bh(&idev->lock);
2595 write_lock_bh(&idev->lock);
2597 write_unlock_bh(&idev->lock);
/*
 * ipv6_mc_rejoin_groups - re-announce every group joined on @idev.
 *
 * In MLDv1 mode igmp6_join_group() is called for each entry of mc_list
 * under the idev read lock; the other visible path sends one report
 * covering all groups via mld_send_report().
 *
 * NOTE(review): the line separating the two paths (presumably an else)
 * is not visible in this listing.
 */
2600 static void ipv6_mc_rejoin_groups(struct inet6_dev *idev)
2602 struct ifmcaddr6 *pmc;
2606 if (mld_in_v1_mode(idev)) {
2607 read_lock_bh(&idev->lock);
2608 for (pmc = idev->mc_list; pmc; pmc = pmc->next)
2609 igmp6_join_group(pmc);
2610 read_unlock_bh(&idev->lock);
2612 mld_send_report(idev, NULL);
/*
 * ipv6_mc_netdev_event - netdevice notifier callback: on
 * NETDEV_RESEND_IGMP the groups of the affected device are rejoined.
 *
 * NOTE(review): the third parameter, the switch statement, any guard on
 * idev and the return value are not visible in this listing.
 */
2615 static int ipv6_mc_netdev_event(struct notifier_block *this,
2616 unsigned long event,
2619 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
2620 struct inet6_dev *idev = __in6_dev_get(dev);
2623 case NETDEV_RESEND_IGMP:
2625 ipv6_mc_rejoin_groups(idev);
/* Notifier block whose callback is ipv6_mc_netdev_event(); registered in igmp6_late_init(). */
2634 static struct notifier_block igmp6_netdev_notifier = {
2635 .notifier_call = ipv6_mc_netdev_event,
2638 #ifdef CONFIG_PROC_FS
/*
 * Iterator state of the "igmp6" seq_file: the per-namespace seq private
 * data followed by the device and inet6_dev currently being walked.
 * igmp6_mc_seq_private() casts seq->private to this type.
 */
2639 struct igmp6_mc_iter_state {
2640 struct seq_net_private p;
2641 struct net_device *dev;
2642 struct inet6_dev *idev;
2645 #define igmp6_mc_seq_private(seq) ((struct igmp6_mc_iter_state *)(seq)->private)
/*
 * igmp6_mc_get_first - position the "igmp6" iterator on the first
 * multicast address: walks the namespace's devices with
 * for_each_netdev_rcu() and inspects each device's inet6_dev under its
 * read lock.
 *
 * NOTE(review): the lines that pick the first list entry, store
 * state->idev and return are not visible in this listing.
 */
2647 static inline struct ifmcaddr6 *igmp6_mc_get_first(struct seq_file *seq)
2649 struct ifmcaddr6 *im = NULL;
2650 struct igmp6_mc_iter_state *state = igmp6_mc_seq_private(seq);
2651 struct net *net = seq_file_net(seq);
2654 for_each_netdev_rcu(net, state->dev) {
2655 struct inet6_dev *idev;
2656 idev = __in6_dev_get(state->dev);
2659 read_lock_bh(&idev->lock);
2665 read_unlock_bh(&idev->lock);
/*
 * igmp6_mc_get_next - advance the "igmp6" iterator.  When the current
 * device is exhausted its idev read lock is released, the next device is
 * fetched with next_net_device_rcu(), and that device's idev is locked
 * and its mc_list taken as the new position.
 *
 * NOTE(review): the step to im->next, the loop and end-of-list handling
 * are not visible in this listing.
 */
2670 static struct ifmcaddr6 *igmp6_mc_get_next(struct seq_file *seq, struct ifmcaddr6 *im)
2672 struct igmp6_mc_iter_state *state = igmp6_mc_seq_private(seq);
2676 if (likely(state->idev))
2677 read_unlock_bh(&state->idev->lock);
2679 state->dev = next_net_device_rcu(state->dev);
2684 state->idev = __in6_dev_get(state->dev);
2687 read_lock_bh(&state->idev->lock);
2688 im = state->idev->mc_list;
/*
 * igmp6_mc_get_idx - return the entry at position @pos, starting from
 * the first entry and stepping with igmp6_mc_get_next(); NULL when the
 * list is shorter than @pos.
 *
 * NOTE(review): the loop body that consumes @pos is not visible in this
 * listing.
 */
2693 static struct ifmcaddr6 *igmp6_mc_get_idx(struct seq_file *seq, loff_t pos)
2695 struct ifmcaddr6 *im = igmp6_mc_get_first(seq);
2697 while (pos && (im = igmp6_mc_get_next(seq, im)) != NULL)
2699 return pos ? NULL : im;
/*
 * seq_file ->start for "igmp6": returns the entry at *pos.
 * NOTE(review): locking performed before the lookup is not visible in
 * this listing.
 */
2702 static void *igmp6_mc_seq_start(struct seq_file *seq, loff_t *pos)
2706 return igmp6_mc_get_idx(seq, *pos);
/*
 * seq_file ->next for "igmp6": steps from @v to the following entry.
 * NOTE(review): the position update and return are not visible in this
 * listing.
 */
2709 static void *igmp6_mc_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2711 struct ifmcaddr6 *im = igmp6_mc_get_next(seq, v);
/*
 * seq_file ->stop for "igmp6": releases the read lock of the inet6_dev
 * the iterator still holds, if any.
 * NOTE(review): the remaining cleanup statements are not visible in this
 * listing.
 */
2717 static void igmp6_mc_seq_stop(struct seq_file *seq, void *v)
2720 struct igmp6_mc_iter_state *state = igmp6_mc_seq_private(seq);
2722 if (likely(state->idev)) {
2723 read_unlock_bh(&state->idev->lock);
/*
 * seq_file ->show for "igmp6": prints one line per multicast address
 * with interface index, interface name, the address, user count, flags
 * and - while MAF_TIMER_RUNNING is set - the time left on the group
 * timer converted with jiffies_to_clock_t() (0 otherwise).
 * NOTE(review): the print call itself, its address argument and the
 * return are not visible in this listing.
 */
2730 static int igmp6_mc_seq_show(struct seq_file *seq, void *v)
2732 struct ifmcaddr6 *im = (struct ifmcaddr6 *)v;
2733 struct igmp6_mc_iter_state *state = igmp6_mc_seq_private(seq);
2736 "%-4d %-15s %pi6 %5d %08X %ld\n",
2737 state->dev->ifindex, state->dev->name,
2739 im->mca_users, im->mca_flags,
2740 (im->mca_flags&MAF_TIMER_RUNNING) ?
2741 jiffies_to_clock_t(im->mca_timer.expires-jiffies) : 0);
/* seq_file operations backing the "igmp6" proc entry. */
2745 static const struct seq_operations igmp6_mc_seq_ops = {
2746 .start = igmp6_mc_seq_start,
2747 .next = igmp6_mc_seq_next,
2748 .stop = igmp6_mc_seq_stop,
2749 .show = igmp6_mc_seq_show,
/*
 * Iterator state of the "mcfilter6" seq_file: the per-namespace seq
 * private data followed by the device, inet6_dev and multicast address
 * whose source list is currently being walked.
 * igmp6_mcf_seq_private() casts seq->private to this type.
 */
2752 struct igmp6_mcf_iter_state {
2753 struct seq_net_private p;
2754 struct net_device *dev;
2755 struct inet6_dev *idev;
2756 struct ifmcaddr6 *im;
2759 #define igmp6_mcf_seq_private(seq) ((struct igmp6_mcf_iter_state *)(seq)->private)
/*
 * igmp6_mcf_get_first - position the "mcfilter6" iterator on the first
 * source filter entry: walks the namespace's devices with
 * for_each_netdev_rcu(), skips devices without an inet6_dev, and looks
 * at a group's mca_sources with the idev read lock and the group's
 * mca_lock held.
 *
 * NOTE(review): the lines choosing the group, recording the iterator
 * state and deciding when the locks stay held are not visible in this
 * listing.
 */
2761 static inline struct ip6_sf_list *igmp6_mcf_get_first(struct seq_file *seq)
2763 struct ip6_sf_list *psf = NULL;
2764 struct ifmcaddr6 *im = NULL;
2765 struct igmp6_mcf_iter_state *state = igmp6_mcf_seq_private(seq);
2766 struct net *net = seq_file_net(seq);
2770 for_each_netdev_rcu(net, state->dev) {
2771 struct inet6_dev *idev;
2772 idev = __in6_dev_get(state->dev);
2773 if (unlikely(idev == NULL))
2775 read_lock_bh(&idev->lock);
2778 spin_lock_bh(&im->mca_lock);
2779 psf = im->mca_sources;
2785 spin_unlock_bh(&im->mca_lock);
2787 read_unlock_bh(&idev->lock);
/*
 * igmp6_mcf_get_next - advance the "mcfilter6" iterator.  When a group's
 * source list is exhausted its mca_lock is dropped and the next group is
 * taken; when a device has no more groups its idev read lock is dropped
 * and the next device (next_net_device_rcu()) is locked and its mc_list
 * used.  The new group's mca_lock is then taken and its mca_sources
 * becomes the current position.
 *
 * NOTE(review): the step to psf->sf_next, the loops and end-of-list
 * handling are not visible in this listing.
 */
2792 static struct ip6_sf_list *igmp6_mcf_get_next(struct seq_file *seq, struct ip6_sf_list *psf)
2794 struct igmp6_mcf_iter_state *state = igmp6_mcf_seq_private(seq);
2798 spin_unlock_bh(&state->im->mca_lock);
2799 state->im = state->im->next;
2800 while (!state->im) {
2801 if (likely(state->idev))
2802 read_unlock_bh(&state->idev->lock);
2804 state->dev = next_net_device_rcu(state->dev);
2809 state->idev = __in6_dev_get(state->dev);
2812 read_lock_bh(&state->idev->lock);
2813 state->im = state->idev->mc_list;
2817 spin_lock_bh(&state->im->mca_lock);
2818 psf = state->im->mca_sources;
/*
 * igmp6_mcf_get_idx - return the source entry at position @pos, starting
 * from the first entry and stepping with igmp6_mcf_get_next(); NULL when
 * there are fewer entries than @pos.
 *
 * NOTE(review): the loop body that consumes @pos is not visible in this
 * listing.
 */
2824 static struct ip6_sf_list *igmp6_mcf_get_idx(struct seq_file *seq, loff_t pos)
2826 struct ip6_sf_list *psf = igmp6_mcf_get_first(seq);
2828 while (pos && (psf = igmp6_mcf_get_next(seq, psf)) != NULL)
2830 return pos ? NULL : psf;
/*
 * seq_file ->start for "mcfilter6": position 0 yields SEQ_START_TOKEN
 * (the header line), any other position the entry at *pos - 1.
 * NOTE(review): locking performed before the lookup is not visible in
 * this listing.
 */
2833 static void *igmp6_mcf_seq_start(struct seq_file *seq, loff_t *pos)
2837 return *pos ? igmp6_mcf_get_idx(seq, *pos - 1) : SEQ_START_TOKEN;
/*
 * seq_file ->next for "mcfilter6": after the header token the first
 * entry is fetched, otherwise the entry following @v.
 * NOTE(review): the else keyword, position update and return are not
 * visible in this listing.
 */
2840 static void *igmp6_mcf_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2842 struct ip6_sf_list *psf;
2843 if (v == SEQ_START_TOKEN)
2844 psf = igmp6_mcf_get_first(seq);
2846 psf = igmp6_mcf_get_next(seq, v);
/*
 * seq_file ->stop for "mcfilter6": releases the mca_lock of the group
 * and the read lock of the inet6_dev the iterator still holds, if any.
 * NOTE(review): the remaining cleanup statements are not visible in this
 * listing.
 */
2851 static void igmp6_mcf_seq_stop(struct seq_file *seq, void *v)
2854 struct igmp6_mcf_iter_state *state = igmp6_mcf_seq_private(seq);
2855 if (likely(state->im)) {
2856 spin_unlock_bh(&state->im->mca_lock);
2859 if (likely(state->idev)) {
2860 read_unlock_bh(&state->idev->lock);
/*
 * seq_file ->show for "mcfilter6": emits the column header for
 * SEQ_START_TOKEN; for a source entry prints interface index, interface
 * name, the group address, the source address and the source's INCLUDE
 * and EXCLUDE counts.
 * NOTE(review): the print call itself, its source-address argument and
 * the return are not visible in this listing.
 */
2867 static int igmp6_mcf_seq_show(struct seq_file *seq, void *v)
2869 struct ip6_sf_list *psf = (struct ip6_sf_list *)v;
2870 struct igmp6_mcf_iter_state *state = igmp6_mcf_seq_private(seq);
2872 if (v == SEQ_START_TOKEN) {
2873 seq_puts(seq, "Idx Device Multicast Address Source Address INC EXC\n");
2876 "%3d %6.6s %pi6 %pi6 %6lu %6lu\n",
2877 state->dev->ifindex, state->dev->name,
2878 &state->im->mca_addr,
2880 psf->sf_count[MCAST_INCLUDE],
2881 psf->sf_count[MCAST_EXCLUDE]);
/* seq_file operations backing the "mcfilter6" proc entry. */
2886 static const struct seq_operations igmp6_mcf_seq_ops = {
2887 .start = igmp6_mcf_seq_start,
2888 .next = igmp6_mcf_seq_next,
2889 .stop = igmp6_mcf_seq_stop,
2890 .show = igmp6_mcf_seq_show,
/*
 * igmp6_proc_init - create the read-only (0444) "igmp6" and "mcfilter6"
 * entries under net->proc_net for namespace @net.  If the second entry
 * cannot be created, control jumps to out_proc_net_igmp6; the visible
 * unwinding removes "igmp6" again.
 *
 * NOTE(review): the error code, labels and return statements are not
 * visible in this listing.
 */
2893 static int __net_init igmp6_proc_init(struct net *net)
2898 if (!proc_create_net("igmp6", 0444, net->proc_net, &igmp6_mc_seq_ops,
2899 sizeof(struct igmp6_mc_iter_state)))
2901 if (!proc_create_net("mcfilter6", 0444, net->proc_net,
2903 sizeof(struct igmp6_mcf_iter_state)))
2904 goto out_proc_net_igmp6;
2911 remove_proc_entry("igmp6", net->proc_net);
2915 static void __net_exit igmp6_proc_exit(struct net *net)
2917 remove_proc_entry("mcfilter6", net->proc_net);
2918 remove_proc_entry("igmp6", net->proc_net);
/*
 * Variant of igmp6_proc_init() used when CONFIG_PROC_FS is not set.
 * NOTE(review): the body is not visible in this listing.
 */
2921 static inline int igmp6_proc_init(struct net *net)
/*
 * Variant of igmp6_proc_exit() used when CONFIG_PROC_FS is not set.
 * NOTE(review): the body is not visible in this listing.
 */
2925 static inline void igmp6_proc_exit(struct net *net)
/*
 * igmp6_net_init - per-namespace setup of the MLD code.
 *
 * Creates the raw ICMPv6 control socket igmp_sk and sets its hop limit
 * to 1, creates a second raw ICMPv6 socket mc_autojoin_sk, and sets up
 * the proc entries.  Failures are logged for the sockets and unwound in
 * reverse order: a proc failure destroys the autojoin socket, and both
 * that path and an autojoin-socket failure destroy igmp_sk.
 *
 * NOTE(review): the error tests, the out_sock_create label line and the
 * return statements are not visible in this listing.
 */
2930 static int __net_init igmp6_net_init(struct net *net)
2934 err = inet_ctl_sock_create(&net->ipv6.igmp_sk, PF_INET6,
2935 SOCK_RAW, IPPROTO_ICMPV6, net);
2937 pr_err("Failed to initialize the IGMP6 control socket (err %d)\n",
2942 inet6_sk(net->ipv6.igmp_sk)->hop_limit = 1;
2944 err = inet_ctl_sock_create(&net->ipv6.mc_autojoin_sk, PF_INET6,
2945 SOCK_RAW, IPPROTO_ICMPV6, net);
2947 pr_err("Failed to initialize the IGMP6 autojoin socket (err %d)\n",
2949 goto out_sock_create;
2952 err = igmp6_proc_init(net);
2954 goto out_sock_create_autojoin;
2958 out_sock_create_autojoin:
2959 inet_ctl_sock_destroy(net->ipv6.mc_autojoin_sk);
2961 inet_ctl_sock_destroy(net->ipv6.igmp_sk);
2966 static void __net_exit igmp6_net_exit(struct net *net)
2968 inet_ctl_sock_destroy(net->ipv6.igmp_sk);
2969 inet_ctl_sock_destroy(net->ipv6.mc_autojoin_sk);
2970 igmp6_proc_exit(net);
/* Per-network-namespace init/exit hooks; registered in igmp6_init(). */
2973 static struct pernet_operations igmp6_net_ops = {
2974 .init = igmp6_net_init,
2975 .exit = igmp6_net_exit,
2978 int __init igmp6_init(void)
2980 return register_pernet_subsys(&igmp6_net_ops);
2983 int __init igmp6_late_init(void)
2985 return register_netdevice_notifier(&igmp6_netdev_notifier);
2988 void igmp6_cleanup(void)
2990 unregister_pernet_subsys(&igmp6_net_ops);
2993 void igmp6_late_cleanup(void)
2995 unregister_netdevice_notifier(&igmp6_netdev_notifier);