2 * Copyright (c) 2010-2016 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
29 * Copyright (c) 2009 Bruce Simpson.
30 * All rights reserved.
32 * Redistribution and use in source and binary forms, with or without
33 * modification, are permitted provided that the following conditions
35 * 1. Redistributions of source code must retain the above copyright
36 * notice, this list of conditions and the following disclaimer.
37 * 2. Redistributions in binary form must reproduce the above copyright
38 * notice, this list of conditions and the following disclaimer in the
39 * documentation and/or other materials provided with the distribution.
40 * 3. The name of the author may not be used to endorse or promote
41 * products derived from this software without specific prior written
44 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
45 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
46 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
47 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
48 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
49 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
50 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
51 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
52 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
53 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
58 * IPv6 multicast socket, group, and socket option processing module.
59 * Normative references: RFC 2292, RFC 3492, RFC 3542, RFC 3678, RFC 3810.
62 #include <sys/cdefs.h>
64 #include <sys/param.h>
65 #include <sys/systm.h>
66 #include <sys/kernel.h>
67 #include <sys/malloc.h>
69 #include <sys/protosw.h>
70 #include <sys/socket.h>
71 #include <sys/socketvar.h>
72 #include <sys/protosw.h>
73 #include <sys/sysctl.h>
75 #include <sys/mcache.h>
77 #include <kern/zalloc.h>
79 #include <pexpert/pexpert.h>
82 #include <net/if_dl.h>
83 #include <net/route.h>
85 #include <netinet/in.h>
86 #include <netinet/in_var.h>
87 #include <netinet6/in6_var.h>
88 #include <netinet/ip6.h>
89 #include <netinet/icmp6.h>
90 #include <netinet6/ip6_var.h>
91 #include <netinet/in_pcb.h>
92 #include <netinet/tcp.h>
93 #include <netinet/tcp_seq.h>
94 #include <netinet/tcp_var.h>
95 #include <netinet6/nd6.h>
96 #include <netinet6/mld6_var.h>
97 #include <netinet6/scope6_var.h>
99 #ifndef __SOCKUNION_DECLARED
101 struct sockaddr_storage ss
;
103 struct sockaddr_dl sdl
;
104 struct sockaddr_in6 sin6
;
106 typedef union sockunion sockunion_t
;
107 #define __SOCKUNION_DECLARED
108 #endif /* __SOCKUNION_DECLARED */
110 static void im6f_commit(struct in6_mfilter
*);
111 static int im6f_get_source(struct in6_mfilter
*imf
,
112 const struct sockaddr_in6
*psin
,
113 struct in6_msource
**);
114 static struct in6_msource
*
115 im6f_graft(struct in6_mfilter
*, const uint8_t,
116 const struct sockaddr_in6
*);
117 static int im6f_prune(struct in6_mfilter
*, const struct sockaddr_in6
*);
118 static void im6f_rollback(struct in6_mfilter
*);
119 static void im6f_reap(struct in6_mfilter
*);
120 static int im6o_grow(struct ip6_moptions
*, size_t);
121 static size_t im6o_match_group(const struct ip6_moptions
*,
122 const struct ifnet
*, const struct sockaddr
*);
123 static struct in6_msource
*
124 im6o_match_source(const struct ip6_moptions
*, const size_t,
125 const struct sockaddr
*);
126 static void im6s_merge(struct ip6_msource
*ims
,
127 const struct in6_msource
*lims
, const int rollback
);
128 static int in6_mc_get(struct ifnet
*, const struct in6_addr
*,
129 struct in6_multi
**);
130 static int in6m_get_source(struct in6_multi
*inm
,
131 const struct in6_addr
*addr
, const int noalloc
,
132 struct ip6_msource
**pims
);
133 static int in6m_is_ifp_detached(const struct in6_multi
*);
134 static int in6m_merge(struct in6_multi
*, /*const*/ struct in6_mfilter
*);
135 static void in6m_reap(struct in6_multi
*);
136 static struct ip6_moptions
*
137 in6p_findmoptions(struct inpcb
*);
138 static int in6p_get_source_filters(struct inpcb
*, struct sockopt
*);
139 static int in6p_lookup_v4addr(struct ipv6_mreq
*, struct ip_mreq
*);
140 static int in6p_join_group(struct inpcb
*, struct sockopt
*);
141 static int in6p_leave_group(struct inpcb
*, struct sockopt
*);
142 static struct ifnet
*
143 in6p_lookup_mcast_ifp(const struct inpcb
*,
144 const struct sockaddr_in6
*);
145 static int in6p_block_unblock_source(struct inpcb
*, struct sockopt
*);
146 static int in6p_set_multicast_if(struct inpcb
*, struct sockopt
*);
147 static int in6p_set_source_filters(struct inpcb
*, struct sockopt
*);
148 static int sysctl_ip6_mcast_filters SYSCTL_HANDLER_ARGS
;
149 static __inline__
int ip6_msource_cmp(const struct ip6_msource
*,
150 const struct ip6_msource
*);
152 SYSCTL_DECL(_net_inet6_ip6
); /* XXX Not in any common header. */
154 SYSCTL_NODE(_net_inet6_ip6
, OID_AUTO
, mcast
, CTLFLAG_RW
| CTLFLAG_LOCKED
, 0, "IPv6 multicast");
156 static unsigned long in6_mcast_maxgrpsrc
= IPV6_MAX_GROUP_SRC_FILTER
;
157 SYSCTL_LONG(_net_inet6_ip6_mcast
, OID_AUTO
, maxgrpsrc
,
158 CTLFLAG_RW
| CTLFLAG_LOCKED
, &in6_mcast_maxgrpsrc
,
159 "Max source filters per group");
161 static unsigned long in6_mcast_maxsocksrc
= IPV6_MAX_SOCK_SRC_FILTER
;
162 SYSCTL_LONG(_net_inet6_ip6_mcast
, OID_AUTO
, maxsocksrc
,
163 CTLFLAG_RW
| CTLFLAG_LOCKED
, &in6_mcast_maxsocksrc
,
164 "Max source filters per socket");
166 int in6_mcast_loop
= IPV6_DEFAULT_MULTICAST_LOOP
;
167 SYSCTL_INT(_net_inet6_ip6_mcast
, OID_AUTO
, loop
, CTLFLAG_RW
| CTLFLAG_LOCKED
,
168 &in6_mcast_loop
, 0, "Loopback multicast datagrams by default");
170 SYSCTL_NODE(_net_inet6_ip6_mcast
, OID_AUTO
, filters
,
171 CTLFLAG_RD
| CTLFLAG_LOCKED
, sysctl_ip6_mcast_filters
,
172 "Per-interface stack-wide source filters");
174 RB_GENERATE_PREV(ip6_msource_tree
, ip6_msource
, im6s_link
, ip6_msource_cmp
);
176 #define IN6M_TRACE_HIST_SIZE 32 /* size of trace history */
179 __private_extern__
unsigned int in6m_trace_hist_size
= IN6M_TRACE_HIST_SIZE
;
181 struct in6_multi_dbg
{
182 struct in6_multi in6m
; /* in6_multi */
183 u_int16_t in6m_refhold_cnt
; /* # of ref */
184 u_int16_t in6m_refrele_cnt
; /* # of rele */
186 * Circular lists of in6m_addref and in6m_remref callers.
188 ctrace_t in6m_refhold
[IN6M_TRACE_HIST_SIZE
];
189 ctrace_t in6m_refrele
[IN6M_TRACE_HIST_SIZE
];
193 TAILQ_ENTRY(in6_multi_dbg
) in6m_trash_link
;
196 /* List of trash in6_multi entries protected by in6m_trash_lock */
197 static TAILQ_HEAD(, in6_multi_dbg
) in6m_trash_head
;
198 static decl_lck_mtx_data(, in6m_trash_lock
);
201 static unsigned int in6m_debug
= 1; /* debugging (enabled) */
203 static unsigned int in6m_debug
; /* debugging (disabled) */
205 static unsigned int in6m_size
; /* size of zone element */
206 static struct zone
*in6m_zone
; /* zone for in6_multi */
208 #define IN6M_ZONE_MAX 64 /* maximum elements in zone */
209 #define IN6M_ZONE_NAME "in6_multi" /* zone name */
211 static unsigned int imm_size
; /* size of zone element */
212 static struct zone
*imm_zone
; /* zone for in6_multi_mship */
214 #define IMM_ZONE_MAX 64 /* maximum elements in zone */
215 #define IMM_ZONE_NAME "in6_multi_mship" /* zone name */
217 #define IP6MS_ZONE_MAX 64 /* maximum elements in zone */
218 #define IP6MS_ZONE_NAME "ip6_msource" /* zone name */
220 static unsigned int ip6ms_size
; /* size of zone element */
221 static struct zone
*ip6ms_zone
; /* zone for ip6_msource */
223 #define IN6MS_ZONE_MAX 64 /* maximum elements in zone */
224 #define IN6MS_ZONE_NAME "in6_msource" /* zone name */
226 static unsigned int in6ms_size
; /* size of zone element */
227 static struct zone
*in6ms_zone
; /* zone for in6_msource */
229 /* Lock group and attribute for in6_multihead_lock lock */
230 static lck_attr_t
*in6_multihead_lock_attr
;
231 static lck_grp_t
*in6_multihead_lock_grp
;
232 static lck_grp_attr_t
*in6_multihead_lock_grp_attr
;
234 static decl_lck_rw_data(, in6_multihead_lock
);
235 struct in6_multihead in6_multihead
;
237 static struct in6_multi
*in6_multi_alloc(int);
238 static void in6_multi_free(struct in6_multi
*);
239 static void in6_multi_attach(struct in6_multi
*);
240 static struct in6_multi_mship
*in6_multi_mship_alloc(int);
241 static void in6_multi_mship_free(struct in6_multi_mship
*);
242 static void in6m_trace(struct in6_multi
*, int);
244 static struct ip6_msource
*ip6ms_alloc(int);
245 static void ip6ms_free(struct ip6_msource
*);
246 static struct in6_msource
*in6ms_alloc(int);
247 static void in6ms_free(struct in6_msource
*);
250 * IPv6 source tree comparison function.
252 * An ordered predicate is necessary; bcmp() is not documented to return
253 * an indication of order, memcmp() is, and is an ISO C99 requirement.
256 ip6_msource_cmp(const struct ip6_msource
*a
, const struct ip6_msource
*b
)
258 return (memcmp(&a
->im6s_addr
, &b
->im6s_addr
, sizeof(struct in6_addr
)));
262 * Inline function which wraps assertions for a valid ifp.
264 static __inline__
int
265 in6m_is_ifp_detached(const struct in6_multi
*inm
)
267 VERIFY(inm
->in6m_ifma
!= NULL
);
268 VERIFY(inm
->in6m_ifp
== inm
->in6m_ifma
->ifma_ifp
);
270 return (!ifnet_is_attached(inm
->in6m_ifp
, 0));
274 * Initialize an in6_mfilter structure to a known state at t0, t1
275 * with an empty source filter list.
277 static __inline__
void
278 im6f_init(struct in6_mfilter
*imf
, const int st0
, const int st1
)
280 memset(imf
, 0, sizeof(struct in6_mfilter
));
281 RB_INIT(&imf
->im6f_sources
);
282 imf
->im6f_st
[0] = st0
;
283 imf
->im6f_st
[1] = st1
;
287 * Resize the ip6_moptions vector to the next power-of-two minus 1.
290 im6o_grow(struct ip6_moptions
*imo
, size_t newmax
)
292 struct in6_multi
**nmships
;
293 struct in6_multi
**omships
;
294 struct in6_mfilter
*nmfilters
;
295 struct in6_mfilter
*omfilters
;
299 IM6O_LOCK_ASSERT_HELD(imo
);
303 omships
= imo
->im6o_membership
;
304 omfilters
= imo
->im6o_mfilters
;
305 oldmax
= imo
->im6o_max_memberships
;
307 newmax
= ((oldmax
+ 1) * 2) - 1;
309 if (newmax
> IPV6_MAX_MEMBERSHIPS
)
310 return (ETOOMANYREFS
);
312 if ((nmships
= (struct in6_multi
**)_REALLOC(omships
,
313 sizeof (struct in6_multi
*) * newmax
, M_IP6MOPTS
,
314 M_WAITOK
| M_ZERO
)) == NULL
)
317 imo
->im6o_membership
= nmships
;
319 if ((nmfilters
= (struct in6_mfilter
*)_REALLOC(omfilters
,
320 sizeof (struct in6_mfilter
) * newmax
, M_IN6MFILTER
,
321 M_WAITOK
| M_ZERO
)) == NULL
)
324 imo
->im6o_mfilters
= nmfilters
;
326 /* Initialize newly allocated source filter heads. */
327 for (idx
= oldmax
; idx
< newmax
; idx
++)
328 im6f_init(&nmfilters
[idx
], MCAST_UNDEFINED
, MCAST_EXCLUDE
);
330 imo
->im6o_max_memberships
= newmax
;
336 * Find an IPv6 multicast group entry for this ip6_moptions instance
337 * which matches the specified group, and optionally an interface.
338 * Return its index into the array, or -1 if not found.
341 im6o_match_group(const struct ip6_moptions
*imo
, const struct ifnet
*ifp
,
342 const struct sockaddr
*group
)
344 const struct sockaddr_in6
*gsin6
;
345 struct in6_multi
*pinm
;
349 IM6O_LOCK_ASSERT_HELD(__DECONST(struct ip6_moptions
*, imo
));
351 gsin6
= (struct sockaddr_in6
*)(uintptr_t)(size_t)group
;
353 /* The im6o_membership array may be lazy allocated. */
354 if (imo
->im6o_membership
== NULL
|| imo
->im6o_num_memberships
== 0)
357 nmships
= imo
->im6o_num_memberships
;
358 for (idx
= 0; idx
< nmships
; idx
++) {
359 pinm
= imo
->im6o_membership
[idx
];
363 if ((ifp
== NULL
|| (pinm
->in6m_ifp
== ifp
)) &&
364 IN6_ARE_ADDR_EQUAL(&pinm
->in6m_addr
,
365 &gsin6
->sin6_addr
)) {
378 * Find an IPv6 multicast source entry for this imo which matches
379 * the given group index for this socket, and source address.
381 * XXX TODO: The scope ID, if present in src, is stripped before
382 * any comparison. We SHOULD enforce scope/zone checks where the source
383 * filter entry has a link scope.
385 * NOTE: This does not check if the entry is in-mode, merely if
386 * it exists, which may not be the desired behaviour.
388 static struct in6_msource
*
389 im6o_match_source(const struct ip6_moptions
*imo
, const size_t gidx
,
390 const struct sockaddr
*src
)
392 struct ip6_msource find
;
393 struct in6_mfilter
*imf
;
394 struct ip6_msource
*ims
;
395 const sockunion_t
*psa
;
397 IM6O_LOCK_ASSERT_HELD(__DECONST(struct ip6_moptions
*, imo
));
399 VERIFY(src
->sa_family
== AF_INET6
);
400 VERIFY(gidx
!= (size_t)-1 && gidx
< imo
->im6o_num_memberships
);
402 /* The im6o_mfilters array may be lazy allocated. */
403 if (imo
->im6o_mfilters
== NULL
)
405 imf
= &imo
->im6o_mfilters
[gidx
];
407 psa
= (sockunion_t
*)(uintptr_t)(size_t)src
;
408 find
.im6s_addr
= psa
->sin6
.sin6_addr
;
409 in6_clearscope(&find
.im6s_addr
); /* XXX */
410 ims
= RB_FIND(ip6_msource_tree
, &imf
->im6f_sources
, &find
);
412 return ((struct in6_msource
*)ims
);
416 * Perform filtering for multicast datagrams on a socket by group and source.
418 * Returns 0 if a datagram should be allowed through, or various error codes
419 * if the socket was not a member of the group, or the source was muted, etc.
422 im6o_mc_filter(const struct ip6_moptions
*imo
, const struct ifnet
*ifp
,
423 const struct sockaddr
*group
, const struct sockaddr
*src
)
426 struct in6_msource
*ims
;
429 IM6O_LOCK_ASSERT_HELD(__DECONST(struct ip6_moptions
*, imo
));
432 gidx
= im6o_match_group(imo
, ifp
, group
);
433 if (gidx
== (size_t)-1)
434 return (MCAST_NOTGMEMBER
);
437 * Check if the source was included in an (S,G) join.
438 * Allow reception on exclusive memberships by default,
439 * reject reception on inclusive memberships by default.
440 * Exclude source only if an in-mode exclude filter exists.
441 * Include source only if an in-mode include filter exists.
442 * NOTE: We are comparing group state here at MLD t1 (now)
443 * with socket-layer t0 (since last downcall).
445 mode
= imo
->im6o_mfilters
[gidx
].im6f_st
[1];
446 ims
= im6o_match_source(imo
, gidx
, src
);
448 if ((ims
== NULL
&& mode
== MCAST_INCLUDE
) ||
449 (ims
!= NULL
&& ims
->im6sl_st
[0] != mode
))
450 return (MCAST_NOTSMEMBER
);
456 * Find and return a reference to an in6_multi record for (ifp, group),
457 * and bump its reference count.
458 * If one does not exist, try to allocate it, and update link-layer multicast
459 * filters on ifp to listen for group.
460 * Assumes the IN6_MULTI lock is held across the call.
461 * Return 0 if successful, otherwise return an appropriate error code.
464 in6_mc_get(struct ifnet
*ifp
, const struct in6_addr
*group
,
465 struct in6_multi
**pinm
)
467 struct sockaddr_in6 gsin6
;
468 struct ifmultiaddr
*ifma
;
469 struct in6_multi
*inm
;
474 in6_multihead_lock_shared();
475 IN6_LOOKUP_MULTI(group
, ifp
, inm
);
478 VERIFY(inm
->in6m_reqcnt
>= 1);
480 VERIFY(inm
->in6m_reqcnt
!= 0);
483 in6_multihead_lock_done();
485 * We already joined this group; return the in6m
486 * with a refcount held (via lookup) for caller.
490 in6_multihead_lock_done();
492 memset(&gsin6
, 0, sizeof(gsin6
));
493 gsin6
.sin6_family
= AF_INET6
;
494 gsin6
.sin6_len
= sizeof(struct sockaddr_in6
);
495 gsin6
.sin6_addr
= *group
;
498 * Check if a link-layer group is already associated
499 * with this network-layer group on the given ifnet.
501 error
= if_addmulti(ifp
, (struct sockaddr
*)&gsin6
, &ifma
);
506 * See comments in in6m_remref() for access to ifma_protospec.
508 in6_multihead_lock_exclusive();
510 if ((inm
= ifma
->ifma_protospec
) != NULL
) {
511 VERIFY(ifma
->ifma_addr
!= NULL
);
512 VERIFY(ifma
->ifma_addr
->sa_family
== AF_INET6
);
513 IN6M_ADDREF(inm
); /* for caller */
516 VERIFY(inm
->in6m_ifma
== ifma
);
517 VERIFY(inm
->in6m_ifp
== ifp
);
518 VERIFY(IN6_ARE_ADDR_EQUAL(&inm
->in6m_addr
, group
));
519 if (inm
->in6m_debug
& IFD_ATTACHED
) {
520 VERIFY(inm
->in6m_reqcnt
>= 1);
522 VERIFY(inm
->in6m_reqcnt
!= 0);
525 in6_multihead_lock_done();
528 * We lost the race with another thread doing
529 * in6_mc_get(); since this group has already
530 * been joined; return the inm with a refcount
536 * We lost the race with another thread doing in6_delmulti();
537 * the inm referring to the ifma has been detached, thus we
538 * reattach it back to the in6_multihead list, and return the
539 * inm with a refcount held for the caller.
541 in6_multi_attach(inm
);
542 VERIFY((inm
->in6m_debug
&
543 (IFD_ATTACHED
| IFD_TRASHED
)) == IFD_ATTACHED
);
546 in6_multihead_lock_done();
553 * A new in6_multi record is needed; allocate and initialize it.
554 * We DO NOT perform an MLD join as the in6_ layer may need to
555 * push an initial source list down to MLD to support SSM.
557 * The initial source filter state is INCLUDE, {} as per the RFC.
558 * Pending state-changes per group are subject to a bounds check.
560 inm
= in6_multi_alloc(M_WAITOK
);
562 in6_multihead_lock_done();
567 inm
->in6m_addr
= *group
;
569 inm
->in6m_mli
= MLD_IFINFO(ifp
);
570 VERIFY(inm
->in6m_mli
!= NULL
);
571 MLI_ADDREF(inm
->in6m_mli
);
572 inm
->in6m_ifma
= ifma
; /* keep refcount from if_addmulti() */
573 inm
->in6m_state
= MLD_NOT_MEMBER
;
575 * Pending state-changes per group are subject to a bounds check.
577 inm
->in6m_scq
.ifq_maxlen
= MLD_MAX_STATE_CHANGES
;
578 inm
->in6m_st
[0].iss_fmode
= MCAST_UNDEFINED
;
579 inm
->in6m_st
[1].iss_fmode
= MCAST_UNDEFINED
;
580 RB_INIT(&inm
->in6m_srcs
);
582 in6_multi_attach(inm
);
583 VERIFY((inm
->in6m_debug
&
584 (IFD_ATTACHED
| IFD_TRASHED
)) == IFD_ATTACHED
);
585 IN6M_ADDREF_LOCKED(inm
); /* for caller */
589 VERIFY(ifma
->ifma_protospec
== NULL
);
590 ifma
->ifma_protospec
= inm
;
592 in6_multihead_lock_done();
598 * Clear recorded source entries for a group.
599 * Used by the MLD code. Caller must hold the IN6_MULTI lock.
600 * FIXME: Should reap.
603 in6m_clear_recorded(struct in6_multi
*inm
)
605 struct ip6_msource
*ims
;
607 IN6M_LOCK_ASSERT_HELD(inm
);
609 RB_FOREACH(ims
, ip6_msource_tree
, &inm
->in6m_srcs
) {
612 --inm
->in6m_st
[1].iss_rec
;
615 VERIFY(inm
->in6m_st
[1].iss_rec
== 0);
619 * Record a source as pending for a Source-Group MLDv2 query.
620 * This lives here as it modifies the shared tree.
622 * inm is the group descriptor.
623 * naddr is the address of the source to record in network-byte order.
625 * If the net.inet6.mld.sgalloc sysctl is non-zero, we will
626 * lazy-allocate a source node in response to an SG query.
627 * Otherwise, no allocation is performed. This saves some memory
628 * with the trade-off that the source will not be reported to the
629 * router if joined in the window between the query response and
630 * the group actually being joined on the local host.
632 * VIMAGE: XXX: Currently the mld_sgalloc feature has been removed.
633 * This turns off the allocation of a recorded source entry if
634 * the group has not been joined.
636 * Return 0 if the source didn't exist or was already marked as recorded.
637 * Return 1 if the source was marked as recorded by this function.
638 * Return <0 if any error occured (negated errno code).
641 in6m_record_source(struct in6_multi
*inm
, const struct in6_addr
*addr
)
643 struct ip6_msource find
;
644 struct ip6_msource
*ims
, *nims
;
646 IN6M_LOCK_ASSERT_HELD(inm
);
648 find
.im6s_addr
= *addr
;
649 ims
= RB_FIND(ip6_msource_tree
, &inm
->in6m_srcs
, &find
);
650 if (ims
&& ims
->im6s_stp
)
653 if (inm
->in6m_nsrc
== in6_mcast_maxgrpsrc
)
655 nims
= ip6ms_alloc(M_WAITOK
);
658 nims
->im6s_addr
= find
.im6s_addr
;
659 RB_INSERT(ip6_msource_tree
, &inm
->in6m_srcs
, nims
);
665 * Mark the source as recorded and update the recorded
669 ++inm
->in6m_st
[1].iss_rec
;
675 * Return a pointer to an in6_msource owned by an in6_mfilter,
676 * given its source address.
677 * Lazy-allocate if needed. If this is a new entry its filter state is
680 * imf is the filter set being modified.
681 * addr is the source address.
683 * Caller is expected to be holding im6o_lock.
686 im6f_get_source(struct in6_mfilter
*imf
, const struct sockaddr_in6
*psin
,
687 struct in6_msource
**plims
)
689 struct ip6_msource find
;
690 struct ip6_msource
*ims
;
691 struct in6_msource
*lims
;
698 find
.im6s_addr
= psin
->sin6_addr
;
699 ims
= RB_FIND(ip6_msource_tree
, &imf
->im6f_sources
, &find
);
700 lims
= (struct in6_msource
*)ims
;
702 if (imf
->im6f_nsrc
== in6_mcast_maxsocksrc
)
704 lims
= in6ms_alloc(M_WAITOK
);
707 lims
->im6s_addr
= find
.im6s_addr
;
708 lims
->im6sl_st
[0] = MCAST_UNDEFINED
;
709 RB_INSERT(ip6_msource_tree
, &imf
->im6f_sources
,
710 (struct ip6_msource
*)lims
);
720 * Graft a source entry into an existing socket-layer filter set,
721 * maintaining any required invariants and checking allocations.
723 * The source is marked as being in the new filter mode at t1.
725 * Return the pointer to the new node, otherwise return NULL.
727 * Caller is expected to be holding im6o_lock.
729 static struct in6_msource
*
730 im6f_graft(struct in6_mfilter
*imf
, const uint8_t st1
,
731 const struct sockaddr_in6
*psin
)
733 struct in6_msource
*lims
;
735 lims
= in6ms_alloc(M_WAITOK
);
738 lims
->im6s_addr
= psin
->sin6_addr
;
739 lims
->im6sl_st
[0] = MCAST_UNDEFINED
;
740 lims
->im6sl_st
[1] = st1
;
741 RB_INSERT(ip6_msource_tree
, &imf
->im6f_sources
,
742 (struct ip6_msource
*)lims
);
749 * Prune a source entry from an existing socket-layer filter set,
750 * maintaining any required invariants and checking allocations.
752 * The source is marked as being left at t1, it is not freed.
754 * Return 0 if no error occurred, otherwise return an errno value.
756 * Caller is expected to be holding im6o_lock.
759 im6f_prune(struct in6_mfilter
*imf
, const struct sockaddr_in6
*psin
)
761 struct ip6_msource find
;
762 struct ip6_msource
*ims
;
763 struct in6_msource
*lims
;
765 find
.im6s_addr
= psin
->sin6_addr
;
766 ims
= RB_FIND(ip6_msource_tree
, &imf
->im6f_sources
, &find
);
769 lims
= (struct in6_msource
*)ims
;
770 lims
->im6sl_st
[1] = MCAST_UNDEFINED
;
775 * Revert socket-layer filter set deltas at t1 to t0 state.
777 * Caller is expected to be holding im6o_lock.
780 im6f_rollback(struct in6_mfilter
*imf
)
782 struct ip6_msource
*ims
, *tims
;
783 struct in6_msource
*lims
;
785 RB_FOREACH_SAFE(ims
, ip6_msource_tree
, &imf
->im6f_sources
, tims
) {
786 lims
= (struct in6_msource
*)ims
;
787 if (lims
->im6sl_st
[0] == lims
->im6sl_st
[1]) {
788 /* no change at t1 */
790 } else if (lims
->im6sl_st
[0] != MCAST_UNDEFINED
) {
791 /* revert change to existing source at t1 */
792 lims
->im6sl_st
[1] = lims
->im6sl_st
[0];
794 /* revert source added t1 */
795 MLD_PRINTF(("%s: free in6ms 0x%llx\n", __func__
,
796 (uint64_t)VM_KERNEL_ADDRPERM(lims
)));
797 RB_REMOVE(ip6_msource_tree
, &imf
->im6f_sources
, ims
);
802 imf
->im6f_st
[1] = imf
->im6f_st
[0];
806 * Mark socket-layer filter set as INCLUDE {} at t1.
808 * Caller is expected to be holding im6o_lock.
811 im6f_leave(struct in6_mfilter
*imf
)
813 struct ip6_msource
*ims
;
814 struct in6_msource
*lims
;
816 RB_FOREACH(ims
, ip6_msource_tree
, &imf
->im6f_sources
) {
817 lims
= (struct in6_msource
*)ims
;
818 lims
->im6sl_st
[1] = MCAST_UNDEFINED
;
820 imf
->im6f_st
[1] = MCAST_INCLUDE
;
824 * Mark socket-layer filter set deltas as committed.
826 * Caller is expected to be holding im6o_lock.
829 im6f_commit(struct in6_mfilter
*imf
)
831 struct ip6_msource
*ims
;
832 struct in6_msource
*lims
;
834 RB_FOREACH(ims
, ip6_msource_tree
, &imf
->im6f_sources
) {
835 lims
= (struct in6_msource
*)ims
;
836 lims
->im6sl_st
[0] = lims
->im6sl_st
[1];
838 imf
->im6f_st
[0] = imf
->im6f_st
[1];
842 * Reap unreferenced sources from socket-layer filter set.
844 * Caller is expected to be holding im6o_lock.
847 im6f_reap(struct in6_mfilter
*imf
)
849 struct ip6_msource
*ims
, *tims
;
850 struct in6_msource
*lims
;
852 RB_FOREACH_SAFE(ims
, ip6_msource_tree
, &imf
->im6f_sources
, tims
) {
853 lims
= (struct in6_msource
*)ims
;
854 if ((lims
->im6sl_st
[0] == MCAST_UNDEFINED
) &&
855 (lims
->im6sl_st
[1] == MCAST_UNDEFINED
)) {
856 MLD_PRINTF(("%s: free in6ms 0x%llx\n", __func__
,
857 (uint64_t)VM_KERNEL_ADDRPERM(lims
)));
858 RB_REMOVE(ip6_msource_tree
, &imf
->im6f_sources
, ims
);
866 * Purge socket-layer filter set.
868 * Caller is expected to be holding im6o_lock.
871 im6f_purge(struct in6_mfilter
*imf
)
873 struct ip6_msource
*ims
, *tims
;
874 struct in6_msource
*lims
;
876 RB_FOREACH_SAFE(ims
, ip6_msource_tree
, &imf
->im6f_sources
, tims
) {
877 lims
= (struct in6_msource
*)ims
;
878 MLD_PRINTF(("%s: free in6ms 0x%llx\n", __func__
,
879 (uint64_t)VM_KERNEL_ADDRPERM(lims
)));
880 RB_REMOVE(ip6_msource_tree
, &imf
->im6f_sources
, ims
);
884 imf
->im6f_st
[0] = imf
->im6f_st
[1] = MCAST_UNDEFINED
;
885 VERIFY(RB_EMPTY(&imf
->im6f_sources
));
889 * Look up a source filter entry for a multicast group.
891 * inm is the group descriptor to work with.
892 * addr is the IPv6 address to look up.
893 * noalloc may be non-zero to suppress allocation of sources.
894 * *pims will be set to the address of the retrieved or allocated source.
896 * Return 0 if successful, otherwise return a non-zero error code.
899 in6m_get_source(struct in6_multi
*inm
, const struct in6_addr
*addr
,
900 const int noalloc
, struct ip6_msource
**pims
)
902 struct ip6_msource find
;
903 struct ip6_msource
*ims
, *nims
;
905 IN6M_LOCK_ASSERT_HELD(inm
);
907 find
.im6s_addr
= *addr
;
908 ims
= RB_FIND(ip6_msource_tree
, &inm
->in6m_srcs
, &find
);
909 if (ims
== NULL
&& !noalloc
) {
910 if (inm
->in6m_nsrc
== in6_mcast_maxgrpsrc
)
912 nims
= ip6ms_alloc(M_WAITOK
);
915 nims
->im6s_addr
= *addr
;
916 RB_INSERT(ip6_msource_tree
, &inm
->in6m_srcs
, nims
);
919 MLD_PRINTF(("%s: allocated %s as 0x%llx\n", __func__
,
920 ip6_sprintf(addr
), (uint64_t)VM_KERNEL_ADDRPERM(ims
)));
928 * Helper function to derive the filter mode on a source entry
929 * from its internal counters. Predicates are:
930 * A source is only excluded if all listeners exclude it.
931 * A source is only included if no listeners exclude it,
932 * and at least one listener includes it.
933 * May be used by ifmcstat(8).
936 im6s_get_mode(const struct in6_multi
*inm
, const struct ip6_msource
*ims
,
939 IN6M_LOCK_ASSERT_HELD(__DECONST(struct in6_multi
*, inm
));
942 if (inm
->in6m_st
[t
].iss_ex
> 0 &&
943 inm
->in6m_st
[t
].iss_ex
== ims
->im6s_st
[t
].ex
)
944 return (MCAST_EXCLUDE
);
945 else if (ims
->im6s_st
[t
].in
> 0 && ims
->im6s_st
[t
].ex
== 0)
946 return (MCAST_INCLUDE
);
947 return (MCAST_UNDEFINED
);
951 * Merge socket-layer source into MLD-layer source.
952 * If rollback is non-zero, perform the inverse of the merge.
955 im6s_merge(struct ip6_msource
*ims
, const struct in6_msource
*lims
,
958 int n
= rollback
? -1 : 1;
960 if (lims
->im6sl_st
[0] == MCAST_EXCLUDE
) {
961 MLD_PRINTF(("%s: t1 ex -= %d on %s\n", __func__
, n
,
962 ip6_sprintf(&lims
->im6s_addr
)));
963 ims
->im6s_st
[1].ex
-= n
;
964 } else if (lims
->im6sl_st
[0] == MCAST_INCLUDE
) {
965 MLD_PRINTF(("%s: t1 in -= %d on %s\n", __func__
, n
,
966 ip6_sprintf(&lims
->im6s_addr
)));
967 ims
->im6s_st
[1].in
-= n
;
970 if (lims
->im6sl_st
[1] == MCAST_EXCLUDE
) {
971 MLD_PRINTF(("%s: t1 ex += %d on %s\n", __func__
, n
,
972 ip6_sprintf(&lims
->im6s_addr
)));
973 ims
->im6s_st
[1].ex
+= n
;
974 } else if (lims
->im6sl_st
[1] == MCAST_INCLUDE
) {
975 MLD_PRINTF(("%s: t1 in += %d on %s\n", __func__
, n
,
976 ip6_sprintf(&lims
->im6s_addr
)));
977 ims
->im6s_st
[1].in
+= n
;
982 * Atomically update the global in6_multi state, when a membership's
983 * filter list is being updated in any way.
985 * imf is the per-inpcb-membership group filter pointer.
986 * A fake imf may be passed for in-kernel consumers.
988 * XXX This is a candidate for a set-symmetric-difference style loop
989 * which would eliminate the repeated lookup from root of ims nodes,
990 * as they share the same key space.
992 * If any error occurred this function will back out of refcounts
993 * and return a non-zero value.
996 in6m_merge(struct in6_multi
*inm
, /*const*/ struct in6_mfilter
*imf
)
998 struct ip6_msource
*ims
, *nims
;
999 struct in6_msource
*lims
;
1000 int schanged
, error
;
1003 IN6M_LOCK_ASSERT_HELD(inm
);
1010 * Update the source filters first, as this may fail.
1011 * Maintain count of in-mode filters at t0, t1. These are
1012 * used to work out if we transition into ASM mode or not.
1013 * Maintain a count of source filters whose state was
1014 * actually modified by this operation.
1016 RB_FOREACH(ims
, ip6_msource_tree
, &imf
->im6f_sources
) {
1017 lims
= (struct in6_msource
*)ims
;
1018 if (lims
->im6sl_st
[0] == imf
->im6f_st
[0]) nsrc0
++;
1019 if (lims
->im6sl_st
[1] == imf
->im6f_st
[1]) nsrc1
++;
1020 if (lims
->im6sl_st
[0] == lims
->im6sl_st
[1]) continue;
1021 error
= in6m_get_source(inm
, &lims
->im6s_addr
, 0, &nims
);
1025 im6s_merge(nims
, lims
, 0);
1028 struct ip6_msource
*bims
;
1030 RB_FOREACH_REVERSE_FROM(ims
, ip6_msource_tree
, nims
) {
1031 lims
= (struct in6_msource
*)ims
;
1032 if (lims
->im6sl_st
[0] == lims
->im6sl_st
[1])
1034 (void) in6m_get_source(inm
, &lims
->im6s_addr
, 1, &bims
);
1037 im6s_merge(bims
, lims
, 1);
1042 MLD_PRINTF(("%s: imf filters in-mode: %d at t0, %d at t1\n",
1043 __func__
, nsrc0
, nsrc1
));
1045 /* Handle transition between INCLUDE {n} and INCLUDE {} on socket. */
1046 if (imf
->im6f_st
[0] == imf
->im6f_st
[1] &&
1047 imf
->im6f_st
[1] == MCAST_INCLUDE
) {
1049 MLD_PRINTF(("%s: --in on inm at t1\n", __func__
));
1050 --inm
->in6m_st
[1].iss_in
;
1054 /* Handle filter mode transition on socket. */
1055 if (imf
->im6f_st
[0] != imf
->im6f_st
[1]) {
1056 MLD_PRINTF(("%s: imf transition %d to %d\n",
1057 __func__
, imf
->im6f_st
[0], imf
->im6f_st
[1]));
1059 if (imf
->im6f_st
[0] == MCAST_EXCLUDE
) {
1060 MLD_PRINTF(("%s: --ex on inm at t1\n", __func__
));
1061 --inm
->in6m_st
[1].iss_ex
;
1062 } else if (imf
->im6f_st
[0] == MCAST_INCLUDE
) {
1063 MLD_PRINTF(("%s: --in on inm at t1\n", __func__
));
1064 --inm
->in6m_st
[1].iss_in
;
1067 if (imf
->im6f_st
[1] == MCAST_EXCLUDE
) {
1068 MLD_PRINTF(("%s: ex++ on inm at t1\n", __func__
));
1069 inm
->in6m_st
[1].iss_ex
++;
1070 } else if (imf
->im6f_st
[1] == MCAST_INCLUDE
&& nsrc1
> 0) {
1071 MLD_PRINTF(("%s: in++ on inm at t1\n", __func__
));
1072 inm
->in6m_st
[1].iss_in
++;
1077 * Track inm filter state in terms of listener counts.
1078 * If there are any exclusive listeners, stack-wide
1079 * membership is exclusive.
1080 * Otherwise, if only inclusive listeners, stack-wide is inclusive.
1081 * If no listeners remain, state is undefined at t1,
1082 * and the MLD lifecycle for this group should finish.
1084 if (inm
->in6m_st
[1].iss_ex
> 0) {
1085 MLD_PRINTF(("%s: transition to EX\n", __func__
));
1086 inm
->in6m_st
[1].iss_fmode
= MCAST_EXCLUDE
;
1087 } else if (inm
->in6m_st
[1].iss_in
> 0) {
1088 MLD_PRINTF(("%s: transition to IN\n", __func__
));
1089 inm
->in6m_st
[1].iss_fmode
= MCAST_INCLUDE
;
1091 MLD_PRINTF(("%s: transition to UNDEF\n", __func__
));
1092 inm
->in6m_st
[1].iss_fmode
= MCAST_UNDEFINED
;
1095 /* Decrement ASM listener count on transition out of ASM mode. */
1096 if (imf
->im6f_st
[0] == MCAST_EXCLUDE
&& nsrc0
== 0) {
1097 if ((imf
->im6f_st
[1] != MCAST_EXCLUDE
) ||
1098 (imf
->im6f_st
[1] == MCAST_EXCLUDE
&& nsrc1
> 0)) {
1099 MLD_PRINTF(("%s: --asm on inm at t1\n", __func__
));
1100 --inm
->in6m_st
[1].iss_asm
;
1104 /* Increment ASM listener count on transition to ASM mode. */
1105 if (imf
->im6f_st
[1] == MCAST_EXCLUDE
&& nsrc1
== 0) {
1106 MLD_PRINTF(("%s: asm++ on inm at t1\n", __func__
));
1107 inm
->in6m_st
[1].iss_asm
++;
1110 MLD_PRINTF(("%s: merged imf 0x%llx to inm 0x%llx\n", __func__
,
1111 (uint64_t)VM_KERNEL_ADDRPERM(imf
),
1112 (uint64_t)VM_KERNEL_ADDRPERM(inm
)));
1117 MLD_PRINTF(("%s: sources changed; reaping\n", __func__
));
1124 * Mark an in6_multi's filter set deltas as committed.
1125 * Called by MLD after a state change has been enqueued.
1128 in6m_commit(struct in6_multi
*inm
)
1130 struct ip6_msource
*ims
;
1132 IN6M_LOCK_ASSERT_HELD(inm
);
1134 MLD_PRINTF(("%s: commit inm 0x%llx\n", __func__
,
1135 (uint64_t)VM_KERNEL_ADDRPERM(inm
)));
1136 MLD_PRINTF(("%s: pre commit:\n", __func__
));
1139 RB_FOREACH(ims
, ip6_msource_tree
, &inm
->in6m_srcs
) {
1140 ims
->im6s_st
[0] = ims
->im6s_st
[1];
1142 inm
->in6m_st
[0] = inm
->in6m_st
[1];
1146 * Reap unreferenced nodes from an in6_multi's filter set.
1149 in6m_reap(struct in6_multi
*inm
)
1151 struct ip6_msource
*ims
, *tims
;
1153 IN6M_LOCK_ASSERT_HELD(inm
);
1155 RB_FOREACH_SAFE(ims
, ip6_msource_tree
, &inm
->in6m_srcs
, tims
) {
1156 if (ims
->im6s_st
[0].ex
> 0 || ims
->im6s_st
[0].in
> 0 ||
1157 ims
->im6s_st
[1].ex
> 0 || ims
->im6s_st
[1].in
> 0 ||
1160 MLD_PRINTF(("%s: free ims 0x%llx\n", __func__
,
1161 (uint64_t)VM_KERNEL_ADDRPERM(ims
)));
1162 RB_REMOVE(ip6_msource_tree
, &inm
->in6m_srcs
, ims
);
1169 * Purge all source nodes from an in6_multi's filter set.
1172 in6m_purge(struct in6_multi
*inm
)
1174 struct ip6_msource
*ims
, *tims
;
1176 IN6M_LOCK_ASSERT_HELD(inm
);
1178 RB_FOREACH_SAFE(ims
, ip6_msource_tree
, &inm
->in6m_srcs
, tims
) {
1179 MLD_PRINTF(("%s: free ims 0x%llx\n", __func__
,
1180 (uint64_t)VM_KERNEL_ADDRPERM(ims
)));
1181 RB_REMOVE(ip6_msource_tree
, &inm
->in6m_srcs
, ims
);
1188 * Join a multicast address w/o sources.
1189 * KAME compatibility entry point.
1192 struct in6_multi_mship
*
1193 in6_joingroup(struct ifnet
*ifp
, struct in6_addr
*mcaddr
,
1194 int *errorp
, int delay
)
1196 struct in6_multi_mship
*imm
;
1201 imm
= in6_multi_mship_alloc(M_WAITOK
);
1207 error
= in6_mc_join(ifp
, mcaddr
, NULL
, &imm
->i6mm_maddr
, delay
);
1210 in6_multi_mship_free(imm
);
1218 * Leave a multicast address w/o sources.
1219 * KAME compatibility entry point.
1222 in6_leavegroup(struct in6_multi_mship
*imm
)
1224 if (imm
->i6mm_maddr
!= NULL
) {
1225 in6_mc_leave(imm
->i6mm_maddr
, NULL
);
1226 IN6M_REMREF(imm
->i6mm_maddr
);
1227 imm
->i6mm_maddr
= NULL
;
1229 in6_multi_mship_free(imm
);
1234 * Join a multicast group; real entry point.
1236 * Only preserves atomicity at inm level.
1237 * NOTE: imf argument cannot be const due to sys/tree.h limitations.
1239 * If the MLD downcall fails, the group is not joined, and an error
1243 in6_mc_join(struct ifnet
*ifp
, const struct in6_addr
*mcaddr
,
1244 /*const*/ struct in6_mfilter
*imf
, struct in6_multi
**pinm
,
1247 struct in6_mfilter timf
;
1248 struct in6_multi
*inm
= NULL
;
1250 struct mld_tparams mtp
;
1253 * Sanity: Check scope zone ID was set for ifp, if and
1254 * only if group is scoped to an interface.
1256 VERIFY(IN6_IS_ADDR_MULTICAST(mcaddr
));
1257 if (IN6_IS_ADDR_MC_LINKLOCAL(mcaddr
) ||
1258 IN6_IS_ADDR_MC_INTFACELOCAL(mcaddr
)) {
1259 VERIFY(mcaddr
->s6_addr16
[1] != 0);
1262 MLD_PRINTF(("%s: join %s on 0x%llx(%s))\n", __func__
,
1263 ip6_sprintf(mcaddr
), (uint64_t)VM_KERNEL_ADDRPERM(ifp
),
1266 bzero(&mtp
, sizeof (mtp
));
1270 * If no imf was specified (i.e. kernel consumer),
1271 * fake one up and assume it is an ASM join.
1274 im6f_init(&timf
, MCAST_UNDEFINED
, MCAST_EXCLUDE
);
1278 error
= in6_mc_get(ifp
, mcaddr
, &inm
);
1280 MLD_PRINTF(("%s: in6_mc_get() failure\n", __func__
));
1284 MLD_PRINTF(("%s: merge inm state\n", __func__
));
1287 error
= in6m_merge(inm
, imf
);
1289 MLD_PRINTF(("%s: failed to merge inm state\n", __func__
));
1290 goto out_in6m_release
;
1293 MLD_PRINTF(("%s: doing mld downcall\n", __func__
));
1294 error
= mld_change_state(inm
, &mtp
, delay
);
1296 MLD_PRINTF(("%s: failed to update source\n", __func__
));
1298 goto out_in6m_release
;
1303 MLD_PRINTF(("%s: dropping ref on 0x%llx\n", __func__
,
1304 (uint64_t)VM_KERNEL_ADDRPERM(inm
)));
1309 *pinm
= inm
; /* keep refcount from in6_mc_get() */
1312 /* schedule timer now that we've dropped the lock(s) */
1313 mld_set_timeout(&mtp
);
1319 * Leave a multicast group; real entry point.
1320 * All source filters will be expunged.
1322 * Only preserves atomicity at inm level.
1324 * Holding the write lock for the INP which contains imf
1325 * is highly advisable. We can't assert for it as imf does not
1326 * contain a back-pointer to the owning inp.
1328 * Note: This is not the same as in6m_release(*) as this function also
1329 * makes a state change downcall into MLD.
1332 in6_mc_leave(struct in6_multi
*inm
, /*const*/ struct in6_mfilter
*imf
)
1334 struct in6_mfilter timf
;
1336 struct mld_tparams mtp
;
1338 bzero(&mtp
, sizeof (mtp
));
1341 IN6M_LOCK_ASSERT_NOTHELD(inm
);
1343 in6_multihead_lock_exclusive();
1346 MLD_PRINTF(("%s: leave inm 0x%llx, %s/%s%d, imf 0x%llx\n", __func__
,
1347 (uint64_t)VM_KERNEL_ADDRPERM(inm
), ip6_sprintf(&inm
->in6m_addr
),
1348 (in6m_is_ifp_detached(inm
) ? "null" : inm
->in6m_ifp
->if_name
),
1349 inm
->in6m_ifp
->if_unit
, (uint64_t)VM_KERNEL_ADDRPERM(imf
)));
1352 * If no imf was specified (i.e. kernel consumer),
1353 * fake one up and assume it is an ASM join.
1356 im6f_init(&timf
, MCAST_EXCLUDE
, MCAST_UNDEFINED
);
1361 * Begin state merge transaction at MLD layer.
1363 * As this particular invocation should not cause any memory
1364 * to be allocated, and there is no opportunity to roll back
1365 * the transaction, it MUST NOT fail.
1367 MLD_PRINTF(("%s: merge inm state\n", __func__
));
1369 error
= in6m_merge(inm
, imf
);
1370 KASSERT(error
== 0, ("%s: failed to merge inm state\n", __func__
));
1372 MLD_PRINTF(("%s: doing mld downcall\n", __func__
));
1373 error
= mld_change_state(inm
, &mtp
, 0);
1376 MLD_PRINTF(("%s: failed mld downcall\n", __func__
));
1378 lastref
= in6_multi_detach(inm
);
1379 VERIFY(!lastref
|| (!(inm
->in6m_debug
& IFD_ATTACHED
) &&
1380 inm
->in6m_reqcnt
== 0));
1382 in6_multihead_lock_done();
1385 IN6M_REMREF(inm
); /* for in6_multihead list */
1387 /* schedule timer now that we've dropped the lock(s) */
1388 mld_set_timeout(&mtp
);
1394 * Block or unblock an ASM multicast source on an inpcb.
1395 * This implements the delta-based API described in RFC 3678.
1397 * The delta-based API applies only to exclusive-mode memberships.
1398 * An MLD downcall will be performed.
1400 * Return 0 if successful, otherwise return an appropriate error code.
1403 in6p_block_unblock_source(struct inpcb
*inp
, struct sockopt
*sopt
)
1405 struct group_source_req gsr
;
1406 sockunion_t
*gsa
, *ssa
;
1408 struct in6_mfilter
*imf
;
1409 struct ip6_moptions
*imo
;
1410 struct in6_msource
*ims
;
1411 struct in6_multi
*inm
;
1415 struct mld_tparams mtp
;
1417 bzero(&mtp
, sizeof (mtp
));
1422 memset(&gsr
, 0, sizeof(struct group_source_req
));
1423 gsa
= (sockunion_t
*)&gsr
.gsr_group
;
1424 ssa
= (sockunion_t
*)&gsr
.gsr_source
;
1426 switch (sopt
->sopt_name
) {
1427 case MCAST_BLOCK_SOURCE
:
1428 case MCAST_UNBLOCK_SOURCE
:
1429 error
= sooptcopyin(sopt
, &gsr
,
1430 sizeof(struct group_source_req
),
1431 sizeof(struct group_source_req
));
1435 if (gsa
->sin6
.sin6_family
!= AF_INET6
||
1436 gsa
->sin6
.sin6_len
!= sizeof(struct sockaddr_in6
))
1439 if (ssa
->sin6
.sin6_family
!= AF_INET6
||
1440 ssa
->sin6
.sin6_len
!= sizeof(struct sockaddr_in6
))
1443 ifnet_head_lock_shared();
1444 if (gsr
.gsr_interface
== 0 ||
1445 (u_int
)if_index
< gsr
.gsr_interface
) {
1447 return (EADDRNOTAVAIL
);
1450 ifp
= ifindex2ifnet
[gsr
.gsr_interface
];
1454 return (EADDRNOTAVAIL
);
1456 if (sopt
->sopt_name
== MCAST_BLOCK_SOURCE
)
1461 MLD_PRINTF(("%s: unknown sopt_name %d\n",
1462 __func__
, sopt
->sopt_name
));
1463 return (EOPNOTSUPP
);
1466 if (!IN6_IS_ADDR_MULTICAST(&gsa
->sin6
.sin6_addr
))
1469 (void) in6_setscope(&gsa
->sin6
.sin6_addr
, ifp
, NULL
);
1472 * Check if we are actually a member of this group.
1474 imo
= in6p_findmoptions(inp
);
1479 idx
= im6o_match_group(imo
, ifp
, &gsa
->sa
);
1480 if (idx
== (size_t)-1 || imo
->im6o_mfilters
== NULL
) {
1481 error
= EADDRNOTAVAIL
;
1482 goto out_imo_locked
;
1485 VERIFY(imo
->im6o_mfilters
!= NULL
);
1486 imf
= &imo
->im6o_mfilters
[idx
];
1487 inm
= imo
->im6o_membership
[idx
];
1490 * Attempting to use the delta-based API on an
1491 * non exclusive-mode membership is an error.
1493 fmode
= imf
->im6f_st
[0];
1494 if (fmode
!= MCAST_EXCLUDE
) {
1496 goto out_imo_locked
;
1500 * Deal with error cases up-front:
1501 * Asked to block, but already blocked; or
1502 * Asked to unblock, but nothing to unblock.
1503 * If adding a new block entry, allocate it.
1505 ims
= im6o_match_source(imo
, idx
, &ssa
->sa
);
1506 if ((ims
!= NULL
&& doblock
) || (ims
== NULL
&& !doblock
)) {
1507 MLD_PRINTF(("%s: source %s %spresent\n", __func__
,
1508 ip6_sprintf(&ssa
->sin6
.sin6_addr
),
1509 doblock
? "" : "not "));
1510 error
= EADDRNOTAVAIL
;
1511 goto out_imo_locked
;
1515 * Begin state merge transaction at socket layer.
1518 MLD_PRINTF(("%s: %s source\n", __func__
, "block"));
1519 ims
= im6f_graft(imf
, fmode
, &ssa
->sin6
);
1523 MLD_PRINTF(("%s: %s source\n", __func__
, "allow"));
1524 error
= im6f_prune(imf
, &ssa
->sin6
);
1528 MLD_PRINTF(("%s: merge imf state failed\n", __func__
));
1529 goto out_im6f_rollback
;
1533 * Begin state merge transaction at MLD layer.
1536 MLD_PRINTF(("%s: merge inm state\n", __func__
));
1537 error
= in6m_merge(inm
, imf
);
1539 MLD_PRINTF(("%s: failed to merge inm state\n", __func__
));
1541 goto out_im6f_rollback
;
1544 MLD_PRINTF(("%s: doing mld downcall\n", __func__
));
1545 error
= mld_change_state(inm
, &mtp
, 0);
1549 MLD_PRINTF(("%s: failed mld downcall\n", __func__
));
1562 IM6O_REMREF(imo
); /* from in6p_findmoptions() */
1564 /* schedule timer now that we've dropped the lock(s) */
1565 mld_set_timeout(&mtp
);
1571 * Given an inpcb, return its multicast options structure pointer. Accepts
1572 * an unlocked inpcb pointer, but will return it locked. May sleep.
1575 static struct ip6_moptions
*
1576 in6p_findmoptions(struct inpcb
*inp
)
1578 struct ip6_moptions
*imo
;
1579 struct in6_multi
**immp
;
1580 struct in6_mfilter
*imfp
;
1583 if ((imo
= inp
->in6p_moptions
) != NULL
) {
1584 IM6O_ADDREF(imo
); /* for caller */
1588 imo
= ip6_allocmoptions(M_WAITOK
);
1592 immp
= _MALLOC(sizeof (*immp
) * IPV6_MIN_MEMBERSHIPS
, M_IP6MOPTS
,
1599 imfp
= _MALLOC(sizeof (struct in6_mfilter
) * IPV6_MIN_MEMBERSHIPS
,
1600 M_IN6MFILTER
, M_WAITOK
| M_ZERO
);
1602 _FREE(immp
, M_IP6MOPTS
);
1607 imo
->im6o_multicast_ifp
= NULL
;
1608 imo
->im6o_multicast_hlim
= ip6_defmcasthlim
;
1609 imo
->im6o_multicast_loop
= in6_mcast_loop
;
1610 imo
->im6o_num_memberships
= 0;
1611 imo
->im6o_max_memberships
= IPV6_MIN_MEMBERSHIPS
;
1612 imo
->im6o_membership
= immp
;
1614 /* Initialize per-group source filters. */
1615 for (idx
= 0; idx
< IPV6_MIN_MEMBERSHIPS
; idx
++)
1616 im6f_init(&imfp
[idx
], MCAST_UNDEFINED
, MCAST_EXCLUDE
);
1618 imo
->im6o_mfilters
= imfp
;
1619 inp
->in6p_moptions
= imo
; /* keep reference from ip6_allocmoptions() */
1620 IM6O_ADDREF(imo
); /* for caller */
1626 * Atomically get source filters on a socket for an IPv6 multicast group.
1627 * Called with INP lock held; returns with lock released.
1630 in6p_get_source_filters(struct inpcb
*inp
, struct sockopt
*sopt
)
1632 struct __msfilterreq64 msfr
, msfr64
;
1633 struct __msfilterreq32 msfr32
;
1636 struct ip6_moptions
*imo
;
1637 struct in6_mfilter
*imf
;
1638 struct ip6_msource
*ims
;
1639 struct in6_msource
*lims
;
1640 struct sockaddr_in6
*psin
;
1641 struct sockaddr_storage
*ptss
;
1642 struct sockaddr_storage
*tss
;
1644 size_t idx
, nsrcs
, ncsrcs
;
1645 user_addr_t tmp_ptr
;
1647 imo
= inp
->in6p_moptions
;
1648 VERIFY(imo
!= NULL
);
1650 if (IS_64BIT_PROCESS(current_proc())) {
1651 error
= sooptcopyin(sopt
, &msfr64
,
1652 sizeof(struct __msfilterreq64
),
1653 sizeof(struct __msfilterreq64
));
1656 /* we never use msfr.msfr_srcs; */
1657 memcpy(&msfr
, &msfr64
, sizeof(msfr64
));
1659 error
= sooptcopyin(sopt
, &msfr32
,
1660 sizeof(struct __msfilterreq32
),
1661 sizeof(struct __msfilterreq32
));
1664 /* we never use msfr.msfr_srcs; */
1665 memcpy(&msfr
, &msfr32
, sizeof(msfr32
));
1668 if (msfr
.msfr_group
.ss_family
!= AF_INET6
||
1669 msfr
.msfr_group
.ss_len
!= sizeof(struct sockaddr_in6
))
1672 gsa
= (sockunion_t
*)&msfr
.msfr_group
;
1673 if (!IN6_IS_ADDR_MULTICAST(&gsa
->sin6
.sin6_addr
))
1676 ifnet_head_lock_shared();
1677 if (msfr
.msfr_ifindex
== 0 || (u_int
)if_index
< msfr
.msfr_ifindex
) {
1679 return (EADDRNOTAVAIL
);
1681 ifp
= ifindex2ifnet
[msfr
.msfr_ifindex
];
1685 return (EADDRNOTAVAIL
);
1687 if ((size_t) msfr
.msfr_nsrcs
>
1688 UINT32_MAX
/ sizeof(struct sockaddr_storage
))
1689 msfr
.msfr_nsrcs
= UINT32_MAX
/ sizeof(struct sockaddr_storage
);
1691 if (msfr
.msfr_nsrcs
> in6_mcast_maxsocksrc
)
1692 msfr
.msfr_nsrcs
= in6_mcast_maxsocksrc
;
1694 (void)in6_setscope(&gsa
->sin6
.sin6_addr
, ifp
, NULL
);
1698 * Lookup group on the socket.
1700 idx
= im6o_match_group(imo
, ifp
, &gsa
->sa
);
1701 if (idx
== (size_t)-1 || imo
->im6o_mfilters
== NULL
) {
1703 return (EADDRNOTAVAIL
);
1705 imf
= &imo
->im6o_mfilters
[idx
];
1708 * Ignore memberships which are in limbo.
1710 if (imf
->im6f_st
[1] == MCAST_UNDEFINED
) {
1714 msfr
.msfr_fmode
= imf
->im6f_st
[1];
1717 * If the user specified a buffer, copy out the source filter
1718 * entries to userland gracefully.
1719 * We only copy out the number of entries which userland
1720 * has asked for, but we always tell userland how big the
1721 * buffer really needs to be.
1725 if (IS_64BIT_PROCESS(current_proc()))
1726 tmp_ptr
= msfr64
.msfr_srcs
;
1728 tmp_ptr
= CAST_USER_ADDR_T(msfr32
.msfr_srcs
);
1730 if (tmp_ptr
!= USER_ADDR_NULL
&& msfr
.msfr_nsrcs
> 0) {
1731 tss
= _MALLOC((size_t) msfr
.msfr_nsrcs
* sizeof(*tss
),
1732 M_TEMP
, M_WAITOK
| M_ZERO
);
1740 * Count number of sources in-mode at t0.
1741 * If buffer space exists and remains, copy out source entries.
1743 nsrcs
= msfr
.msfr_nsrcs
;
1746 RB_FOREACH(ims
, ip6_msource_tree
, &imf
->im6f_sources
) {
1747 lims
= (struct in6_msource
*)ims
;
1748 if (lims
->im6sl_st
[0] == MCAST_UNDEFINED
||
1749 lims
->im6sl_st
[0] != imf
->im6f_st
[0])
1751 if (tss
!= NULL
&& nsrcs
> 0) {
1752 psin
= (struct sockaddr_in6
*)ptss
;
1753 psin
->sin6_family
= AF_INET6
;
1754 psin
->sin6_len
= sizeof(struct sockaddr_in6
);
1755 psin
->sin6_addr
= lims
->im6s_addr
;
1756 psin
->sin6_port
= 0;
1766 error
= copyout(tss
, tmp_ptr
, ncsrcs
* sizeof(*tss
));
1772 msfr
.msfr_nsrcs
= ncsrcs
;
1773 if (IS_64BIT_PROCESS(current_proc())) {
1774 msfr64
.msfr_ifindex
= msfr
.msfr_ifindex
;
1775 msfr64
.msfr_fmode
= msfr
.msfr_fmode
;
1776 msfr64
.msfr_nsrcs
= msfr
.msfr_nsrcs
;
1777 memcpy(&msfr64
.msfr_group
, &msfr
.msfr_group
,
1778 sizeof(struct sockaddr_storage
));
1779 error
= sooptcopyout(sopt
, &msfr64
,
1780 sizeof(struct __msfilterreq64
));
1782 msfr32
.msfr_ifindex
= msfr
.msfr_ifindex
;
1783 msfr32
.msfr_fmode
= msfr
.msfr_fmode
;
1784 msfr32
.msfr_nsrcs
= msfr
.msfr_nsrcs
;
1785 memcpy(&msfr32
.msfr_group
, &msfr
.msfr_group
,
1786 sizeof(struct sockaddr_storage
));
1787 error
= sooptcopyout(sopt
, &msfr32
,
1788 sizeof(struct __msfilterreq32
));
1795 * Return the IP multicast options in response to user getsockopt().
1798 ip6_getmoptions(struct inpcb
*inp
, struct sockopt
*sopt
)
1800 struct ip6_moptions
*im6o
;
1804 im6o
= inp
->in6p_moptions
;
1806 * If socket is neither of type SOCK_RAW or SOCK_DGRAM,
1807 * or is a divert socket, reject it.
1809 if (SOCK_PROTO(inp
->inp_socket
) == IPPROTO_DIVERT
||
1810 (SOCK_TYPE(inp
->inp_socket
) != SOCK_RAW
&&
1811 SOCK_TYPE(inp
->inp_socket
) != SOCK_DGRAM
)) {
1812 return (EOPNOTSUPP
);
1816 switch (sopt
->sopt_name
) {
1817 case IPV6_MULTICAST_IF
:
1820 if (im6o
== NULL
|| im6o
->im6o_multicast_ifp
== NULL
) {
1823 optval
= im6o
->im6o_multicast_ifp
->if_index
;
1827 error
= sooptcopyout(sopt
, &optval
, sizeof(u_int
));
1830 case IPV6_MULTICAST_HOPS
:
1832 optval
= ip6_defmcasthlim
;
1835 optval
= im6o
->im6o_multicast_hlim
;
1838 error
= sooptcopyout(sopt
, &optval
, sizeof(u_int
));
1841 case IPV6_MULTICAST_LOOP
:
1843 optval
= in6_mcast_loop
; /* XXX VIMAGE */
1846 optval
= im6o
->im6o_multicast_loop
;
1849 error
= sooptcopyout(sopt
, &optval
, sizeof(u_int
));
1854 error
= EADDRNOTAVAIL
;
1856 error
= in6p_get_source_filters(inp
, sopt
);
1861 error
= ENOPROTOOPT
;
1869 * Look up the ifnet to use for a multicast group membership,
1870 * given the address of an IPv6 group.
1872 * This routine exists to support legacy IPv6 multicast applications.
1874 * If inp is non-NULL and is bound to an interface, use this socket's
1875 * inp_boundif for any required routing table lookup.
1877 * If the route lookup fails, return NULL.
1879 * FUTURE: Support multiple forwarding tables for IPv6.
1881 * Returns NULL if no ifp could be found.
1883 static struct ifnet
*
1884 in6p_lookup_mcast_ifp(const struct inpcb
*in6p
,
1885 const struct sockaddr_in6
*gsin6
)
1887 struct route_in6 ro6
;
1889 unsigned int ifscope
= IFSCOPE_NONE
;
1891 VERIFY(in6p
== NULL
|| (in6p
->inp_vflag
& INP_IPV6
));
1892 VERIFY(gsin6
->sin6_family
== AF_INET6
);
1893 if (IN6_IS_ADDR_MULTICAST(&gsin6
->sin6_addr
) == 0)
1896 if (in6p
!= NULL
&& (in6p
->inp_flags
& INP_BOUND_IF
))
1897 ifscope
= in6p
->inp_boundifp
->if_index
;
1900 memset(&ro6
, 0, sizeof(struct route_in6
));
1901 memcpy(&ro6
.ro_dst
, gsin6
, sizeof(struct sockaddr_in6
));
1902 rtalloc_scoped_ign((struct route
*)&ro6
, 0, ifscope
);
1903 if (ro6
.ro_rt
!= NULL
) {
1904 ifp
= ro6
.ro_rt
->rt_ifp
;
1905 VERIFY(ifp
!= NULL
);
1907 ROUTE_RELEASE(&ro6
);
1913 * Since ipv6_mreq contains an ifindex and ip_mreq contains an AF_INET
1914 * address, we need to lookup the AF_INET address when translating an
1915 * ipv6_mreq structure into an ipmreq structure.
1916 * This is used when userland performs multicast setsockopt() on AF_INET6
1917 * sockets with AF_INET multicast addresses (IPv6 v4 mapped addresses).
1920 in6p_lookup_v4addr(struct ipv6_mreq
*mreq
, struct ip_mreq
*v4mreq
)
1924 struct sockaddr_in
*sin
;
1926 ifnet_head_lock_shared();
1927 if (mreq
->ipv6mr_interface
> (unsigned int)if_index
) {
1929 return (EADDRNOTAVAIL
);
1931 ifp
= ifindex2ifnet
[mreq
->ipv6mr_interface
];
1934 return (EADDRNOTAVAIL
);
1935 ifa
= ifa_ifpgetprimary(ifp
, AF_INET
);
1937 return (EADDRNOTAVAIL
);
1938 sin
= (struct sockaddr_in
*)(uintptr_t)(size_t)ifa
->ifa_addr
;
1939 v4mreq
->imr_interface
.s_addr
= sin
->sin_addr
.s_addr
;
1946 * Join an IPv6 multicast group, possibly with a source.
1948 * FIXME: The KAME use of the unspecified address (::)
1949 * to join *all* multicast groups is currently unsupported.
1952 in6p_join_group(struct inpcb
*inp
, struct sockopt
*sopt
)
1954 struct group_source_req gsr
;
1955 sockunion_t
*gsa
, *ssa
;
1957 struct in6_mfilter
*imf
;
1958 struct ip6_moptions
*imo
;
1959 struct in6_multi
*inm
= NULL
;
1960 struct in6_msource
*lims
= NULL
;
1963 uint32_t scopeid
= 0;
1964 struct mld_tparams mtp
;
1966 bzero(&mtp
, sizeof (mtp
));
1972 memset(&gsr
, 0, sizeof(struct group_source_req
));
1973 gsa
= (sockunion_t
*)&gsr
.gsr_group
;
1974 gsa
->ss
.ss_family
= AF_UNSPEC
;
1975 ssa
= (sockunion_t
*)&gsr
.gsr_source
;
1976 ssa
->ss
.ss_family
= AF_UNSPEC
;
1979 * Chew everything into struct group_source_req.
1980 * Overwrite the port field if present, as the sockaddr
1981 * being copied in may be matched with a binary comparison.
1982 * Ignore passed-in scope ID.
1984 switch (sopt
->sopt_name
) {
1985 case IPV6_JOIN_GROUP
: {
1986 struct ipv6_mreq mreq
;
1987 struct sockaddr_in6
*gsin6
;
1989 error
= sooptcopyin(sopt
, &mreq
, sizeof(struct ipv6_mreq
),
1990 sizeof(struct ipv6_mreq
));
1993 if (IN6_IS_ADDR_V4MAPPED(&mreq
.ipv6mr_multiaddr
)) {
1994 struct ip_mreq v4mreq
;
1995 struct sockopt v4sopt
;
1997 v4mreq
.imr_multiaddr
.s_addr
=
1998 mreq
.ipv6mr_multiaddr
.s6_addr32
[3];
1999 if (mreq
.ipv6mr_interface
== 0)
2000 v4mreq
.imr_interface
.s_addr
= INADDR_ANY
;
2002 error
= in6p_lookup_v4addr(&mreq
, &v4mreq
);
2005 v4sopt
.sopt_dir
= SOPT_SET
;
2006 v4sopt
.sopt_level
= sopt
->sopt_level
;
2007 v4sopt
.sopt_name
= IP_ADD_MEMBERSHIP
;
2008 v4sopt
.sopt_val
= CAST_USER_ADDR_T(&v4mreq
);
2009 v4sopt
.sopt_valsize
= sizeof(v4mreq
);
2010 v4sopt
.sopt_p
= kernproc
;
2012 return (inp_join_group(inp
, &v4sopt
));
2014 gsa
->sin6
.sin6_family
= AF_INET6
;
2015 gsa
->sin6
.sin6_len
= sizeof(struct sockaddr_in6
);
2016 gsa
->sin6
.sin6_addr
= mreq
.ipv6mr_multiaddr
;
2020 /* Only allow IPv6 multicast addresses */
2021 if (IN6_IS_ADDR_MULTICAST(&gsin6
->sin6_addr
) == 0) {
2025 if (mreq
.ipv6mr_interface
== 0) {
2026 ifp
= in6p_lookup_mcast_ifp(inp
, gsin6
);
2028 ifnet_head_lock_shared();
2029 if ((u_int
)if_index
< mreq
.ipv6mr_interface
) {
2031 return (EADDRNOTAVAIL
);
2033 ifp
= ifindex2ifnet
[mreq
.ipv6mr_interface
];
2036 MLD_PRINTF(("%s: ipv6mr_interface = %d, ifp = 0x%llx\n",
2037 __func__
, mreq
.ipv6mr_interface
,
2038 (uint64_t)VM_KERNEL_ADDRPERM(ifp
)));
2042 case MCAST_JOIN_GROUP
:
2043 case MCAST_JOIN_SOURCE_GROUP
:
2044 if (sopt
->sopt_name
== MCAST_JOIN_GROUP
) {
2045 error
= sooptcopyin(sopt
, &gsr
,
2046 sizeof(struct group_req
),
2047 sizeof(struct group_req
));
2048 } else if (sopt
->sopt_name
== MCAST_JOIN_SOURCE_GROUP
) {
2049 error
= sooptcopyin(sopt
, &gsr
,
2050 sizeof(struct group_source_req
),
2051 sizeof(struct group_source_req
));
2056 if (gsa
->sin6
.sin6_family
!= AF_INET6
||
2057 gsa
->sin6
.sin6_len
!= sizeof(struct sockaddr_in6
))
2060 if (sopt
->sopt_name
== MCAST_JOIN_SOURCE_GROUP
) {
2061 if (ssa
->sin6
.sin6_family
!= AF_INET6
||
2062 ssa
->sin6
.sin6_len
!= sizeof(struct sockaddr_in6
))
2064 if (IN6_IS_ADDR_MULTICAST(&ssa
->sin6
.sin6_addr
))
2067 * TODO: Validate embedded scope ID in source
2068 * list entry against passed-in ifp, if and only
2069 * if source list filter entry is iface or node local.
2071 in6_clearscope(&ssa
->sin6
.sin6_addr
);
2072 ssa
->sin6
.sin6_port
= 0;
2073 ssa
->sin6
.sin6_scope_id
= 0;
2076 ifnet_head_lock_shared();
2077 if (gsr
.gsr_interface
== 0 ||
2078 (u_int
)if_index
< gsr
.gsr_interface
) {
2080 return (EADDRNOTAVAIL
);
2082 ifp
= ifindex2ifnet
[gsr
.gsr_interface
];
2087 MLD_PRINTF(("%s: unknown sopt_name %d\n",
2088 __func__
, sopt
->sopt_name
));
2089 return (EOPNOTSUPP
);
2092 if (!IN6_IS_ADDR_MULTICAST(&gsa
->sin6
.sin6_addr
))
2095 if (ifp
== NULL
|| (ifp
->if_flags
& IFF_MULTICAST
) == 0)
2096 return (EADDRNOTAVAIL
);
2098 gsa
->sin6
.sin6_port
= 0;
2099 gsa
->sin6
.sin6_scope_id
= 0;
2102 * Always set the scope zone ID on memberships created from userland.
2103 * Use the passed-in ifp to do this.
2105 (void)in6_setscope(&gsa
->sin6
.sin6_addr
, ifp
, &scopeid
);
2107 * Some addresses are not valid without an embedded scopeid.
2108 * This check must be present because otherwise we will later hit
2109 * a VERIFY() in in6_mc_join().
2111 if ((IN6_IS_ADDR_MC_LINKLOCAL(&gsa
->sin6
.sin6_addr
) ||
2112 IN6_IS_ADDR_MC_INTFACELOCAL(&gsa
->sin6
.sin6_addr
)) &&
2113 (scopeid
== 0 || gsa
->sin6
.sin6_addr
.s6_addr16
[1] == 0))
2116 imo
= in6p_findmoptions(inp
);
2121 idx
= im6o_match_group(imo
, ifp
, &gsa
->sa
);
2122 if (idx
== (size_t)-1) {
2125 inm
= imo
->im6o_membership
[idx
];
2126 imf
= &imo
->im6o_mfilters
[idx
];
2127 if (ssa
->ss
.ss_family
!= AF_UNSPEC
) {
2129 * MCAST_JOIN_SOURCE_GROUP on an exclusive membership
2130 * is an error. On an existing inclusive membership,
2131 * it just adds the source to the filter list.
2133 if (imf
->im6f_st
[1] != MCAST_INCLUDE
) {
2135 goto out_imo_locked
;
2138 * Throw out duplicates.
2140 * XXX FIXME: This makes a naive assumption that
2141 * even if entries exist for *ssa in this imf,
2142 * they will be rejected as dupes, even if they
2143 * are not valid in the current mode (in-mode).
2145 * in6_msource is transactioned just as for anything
2146 * else in SSM -- but note naive use of in6m_graft()
2147 * below for allocating new filter entries.
2149 * This is only an issue if someone mixes the
2150 * full-state SSM API with the delta-based API,
2151 * which is discouraged in the relevant RFCs.
2153 lims
= im6o_match_source(imo
, idx
, &ssa
->sa
);
2154 if (lims
!= NULL
/*&&
2155 lims->im6sl_st[1] == MCAST_INCLUDE*/) {
2156 error
= EADDRNOTAVAIL
;
2157 goto out_imo_locked
;
2161 * MCAST_JOIN_GROUP on an existing exclusive
2162 * membership is an error; return EADDRINUSE
2163 * to preserve 4.4BSD API idempotence, and
2164 * avoid tedious detour to code below.
2165 * NOTE: This is bending RFC 3678 a bit.
2167 * On an existing inclusive membership, this is also
2168 * an error; if you want to change filter mode,
2169 * you must use the userland API setsourcefilter().
2170 * XXX We don't reject this for imf in UNDEFINED
2171 * state at t1, because allocation of a filter
2172 * is atomic with allocation of a membership.
2175 /* See comments above for EADDRINUSE */
2176 if (imf
->im6f_st
[1] == MCAST_EXCLUDE
)
2178 goto out_imo_locked
;
2183 * Begin state merge transaction at socket layer.
2187 if (imo
->im6o_num_memberships
== imo
->im6o_max_memberships
) {
2188 error
= im6o_grow(imo
, 0);
2190 goto out_imo_locked
;
2193 * Allocate the new slot upfront so we can deal with
2194 * grafting the new source filter in same code path
2195 * as for join-source on existing membership.
2197 idx
= imo
->im6o_num_memberships
;
2198 imo
->im6o_membership
[idx
] = NULL
;
2199 imo
->im6o_num_memberships
++;
2200 VERIFY(imo
->im6o_mfilters
!= NULL
);
2201 imf
= &imo
->im6o_mfilters
[idx
];
2202 VERIFY(RB_EMPTY(&imf
->im6f_sources
));
2206 * Graft new source into filter list for this inpcb's
2207 * membership of the group. The in6_multi may not have
2208 * been allocated yet if this is a new membership, however,
2209 * the in_mfilter slot will be allocated and must be initialized.
2211 * Note: Grafting of exclusive mode filters doesn't happen
2213 * XXX: Should check for non-NULL lims (node exists but may
2214 * not be in-mode) for interop with full-state API.
2216 if (ssa
->ss
.ss_family
!= AF_UNSPEC
) {
2217 /* Membership starts in IN mode */
2219 MLD_PRINTF(("%s: new join w/source\n", __func__
);
2220 im6f_init(imf
, MCAST_UNDEFINED
, MCAST_INCLUDE
));
2222 MLD_PRINTF(("%s: %s source\n", __func__
, "allow"));
2224 lims
= im6f_graft(imf
, MCAST_INCLUDE
, &ssa
->sin6
);
2226 MLD_PRINTF(("%s: merge imf state failed\n",
2232 /* No address specified; Membership starts in EX mode */
2234 MLD_PRINTF(("%s: new join w/o source", __func__
));
2235 im6f_init(imf
, MCAST_UNDEFINED
, MCAST_EXCLUDE
);
2240 * Begin state merge transaction at MLD layer.
2245 * See inp_join_group() for why we need to unlock
2247 IM6O_ADDREF_LOCKED(imo
);
2249 socket_unlock(inp
->inp_socket
, 0);
2251 VERIFY(inm
== NULL
);
2252 error
= in6_mc_join(ifp
, &gsa
->sin6
.sin6_addr
, imf
, &inm
, 0);
2253 VERIFY(inm
!= NULL
|| error
!= 0);
2255 socket_lock(inp
->inp_socket
, 0);
2261 imo
->im6o_membership
[idx
] = inm
; /* from in6_mc_join() */
2263 MLD_PRINTF(("%s: merge inm state\n", __func__
));
2265 error
= in6m_merge(inm
, imf
);
2267 MLD_PRINTF(("%s: failed to merge inm state\n",
2270 goto out_im6f_rollback
;
2272 MLD_PRINTF(("%s: doing mld downcall\n", __func__
));
2273 error
= mld_change_state(inm
, &mtp
, 0);
2276 MLD_PRINTF(("%s: failed mld downcall\n",
2278 goto out_im6f_rollback
;
2294 if (error
&& is_new
) {
2295 VERIFY(inm
== NULL
);
2296 imo
->im6o_membership
[idx
] = NULL
;
2297 --imo
->im6o_num_memberships
;
2302 IM6O_REMREF(imo
); /* from in6p_findmoptions() */
2304 /* schedule timer now that we've dropped the lock(s) */
2305 mld_set_timeout(&mtp
);
2311 * Leave an IPv6 multicast group on an inpcb, possibly with a source.
2314 in6p_leave_group(struct inpcb
*inp
, struct sockopt
*sopt
)
2316 struct ipv6_mreq mreq
;
2317 struct group_source_req gsr
;
2318 sockunion_t
*gsa
, *ssa
;
2320 struct in6_mfilter
*imf
;
2321 struct ip6_moptions
*imo
;
2322 struct in6_msource
*ims
;
2323 struct in6_multi
*inm
= NULL
;
2324 uint32_t ifindex
= 0;
2326 int error
, is_final
;
2327 struct mld_tparams mtp
;
2329 bzero(&mtp
, sizeof (mtp
));
2334 memset(&gsr
, 0, sizeof(struct group_source_req
));
2335 gsa
= (sockunion_t
*)&gsr
.gsr_group
;
2336 gsa
->ss
.ss_family
= AF_UNSPEC
;
2337 ssa
= (sockunion_t
*)&gsr
.gsr_source
;
2338 ssa
->ss
.ss_family
= AF_UNSPEC
;
2341 * Chew everything passed in up into a struct group_source_req
2342 * as that is easier to process.
2343 * Note: Any embedded scope ID in the multicast group passed
2344 * in by userland is ignored, the interface index is the recommended
2345 * mechanism to specify an interface; see below.
2347 switch (sopt
->sopt_name
) {
2348 case IPV6_LEAVE_GROUP
: {
2349 struct sockaddr_in6
*gsin6
;
2351 error
= sooptcopyin(sopt
, &mreq
, sizeof(struct ipv6_mreq
),
2352 sizeof(struct ipv6_mreq
));
2355 if (IN6_IS_ADDR_V4MAPPED(&mreq
.ipv6mr_multiaddr
)) {
2356 struct ip_mreq v4mreq
;
2357 struct sockopt v4sopt
;
2359 v4mreq
.imr_multiaddr
.s_addr
=
2360 mreq
.ipv6mr_multiaddr
.s6_addr32
[3];
2361 if (mreq
.ipv6mr_interface
== 0)
2362 v4mreq
.imr_interface
.s_addr
= INADDR_ANY
;
2364 error
= in6p_lookup_v4addr(&mreq
, &v4mreq
);
2367 v4sopt
.sopt_dir
= SOPT_SET
;
2368 v4sopt
.sopt_level
= sopt
->sopt_level
;
2369 v4sopt
.sopt_name
= IP_DROP_MEMBERSHIP
;
2370 v4sopt
.sopt_val
= CAST_USER_ADDR_T(&v4mreq
);
2371 v4sopt
.sopt_valsize
= sizeof(v4mreq
);
2372 v4sopt
.sopt_p
= kernproc
;
2374 return (inp_leave_group(inp
, &v4sopt
));
2376 gsa
->sin6
.sin6_family
= AF_INET6
;
2377 gsa
->sin6
.sin6_len
= sizeof(struct sockaddr_in6
);
2378 gsa
->sin6
.sin6_addr
= mreq
.ipv6mr_multiaddr
;
2379 gsa
->sin6
.sin6_port
= 0;
2380 gsa
->sin6
.sin6_scope_id
= 0;
2381 ifindex
= mreq
.ipv6mr_interface
;
2383 /* Only allow IPv6 multicast addresses */
2384 if (IN6_IS_ADDR_MULTICAST(&gsin6
->sin6_addr
) == 0) {
2390 case MCAST_LEAVE_GROUP
:
2391 case MCAST_LEAVE_SOURCE_GROUP
:
2392 if (sopt
->sopt_name
== MCAST_LEAVE_GROUP
) {
2393 error
= sooptcopyin(sopt
, &gsr
,
2394 sizeof(struct group_req
),
2395 sizeof(struct group_req
));
2396 } else if (sopt
->sopt_name
== MCAST_LEAVE_SOURCE_GROUP
) {
2397 error
= sooptcopyin(sopt
, &gsr
,
2398 sizeof(struct group_source_req
),
2399 sizeof(struct group_source_req
));
2404 if (gsa
->sin6
.sin6_family
!= AF_INET6
||
2405 gsa
->sin6
.sin6_len
!= sizeof(struct sockaddr_in6
))
2407 if (sopt
->sopt_name
== MCAST_LEAVE_SOURCE_GROUP
) {
2408 if (ssa
->sin6
.sin6_family
!= AF_INET6
||
2409 ssa
->sin6
.sin6_len
!= sizeof(struct sockaddr_in6
))
2411 if (IN6_IS_ADDR_MULTICAST(&ssa
->sin6
.sin6_addr
))
2414 * TODO: Validate embedded scope ID in source
2415 * list entry against passed-in ifp, if and only
2416 * if source list filter entry is iface or node local.
2418 in6_clearscope(&ssa
->sin6
.sin6_addr
);
2420 gsa
->sin6
.sin6_port
= 0;
2421 gsa
->sin6
.sin6_scope_id
= 0;
2422 ifindex
= gsr
.gsr_interface
;
2426 MLD_PRINTF(("%s: unknown sopt_name %d\n",
2427 __func__
, sopt
->sopt_name
));
2428 return (EOPNOTSUPP
);
2431 if (!IN6_IS_ADDR_MULTICAST(&gsa
->sin6
.sin6_addr
))
2435 * Validate interface index if provided. If no interface index
2436 * was provided separately, attempt to look the membership up
2437 * from the default scope as a last resort to disambiguate
2438 * the membership we are being asked to leave.
2439 * XXX SCOPE6 lock potentially taken here.
2442 ifnet_head_lock_shared();
2443 if ((u_int
)if_index
< ifindex
) {
2445 return (EADDRNOTAVAIL
);
2447 ifp
= ifindex2ifnet
[ifindex
];
2450 return (EADDRNOTAVAIL
);
2451 (void) in6_setscope(&gsa
->sin6
.sin6_addr
, ifp
, NULL
);
2453 error
= sa6_embedscope(&gsa
->sin6
, ip6_use_defzone
);
2455 return (EADDRNOTAVAIL
);
2457 * Some badly behaved applications don't pass an ifindex
2458 * or a scope ID, which is an API violation. In this case,
2459 * perform a lookup as per a v6 join.
2461 * XXX For now, stomp on zone ID for the corner case.
2462 * This is not the 'KAME way', but we need to see the ifp
2463 * directly until such time as this implementation is
2464 * refactored, assuming the scope IDs are the way to go.
2466 ifindex
= ntohs(gsa
->sin6
.sin6_addr
.s6_addr16
[1]);
2468 MLD_PRINTF(("%s: warning: no ifindex, looking up "
2469 "ifp for group %s.\n", __func__
,
2470 ip6_sprintf(&gsa
->sin6
.sin6_addr
)));
2471 ifp
= in6p_lookup_mcast_ifp(inp
, &gsa
->sin6
);
2473 if (!IF_INDEX_IN_RANGE(ifindex
))
2474 return (EADDRNOTAVAIL
);
2475 ifnet_head_lock_shared();
2476 ifp
= ifindex2ifnet
[ifindex
];
2480 return (EADDRNOTAVAIL
);
2483 VERIFY(ifp
!= NULL
);
2484 MLD_PRINTF(("%s: ifp = 0x%llx\n", __func__
,
2485 (uint64_t)VM_KERNEL_ADDRPERM(ifp
)));
2488 * Find the membership in the membership array.
2490 imo
= in6p_findmoptions(inp
);
2495 idx
= im6o_match_group(imo
, ifp
, &gsa
->sa
);
2496 if (idx
== (size_t)-1) {
2497 error
= EADDRNOTAVAIL
;
2500 inm
= imo
->im6o_membership
[idx
];
2501 imf
= &imo
->im6o_mfilters
[idx
];
2503 if (ssa
->ss
.ss_family
!= AF_UNSPEC
)
2507 * Begin state merge transaction at socket layer.
2511 * If we were instructed only to leave a given source, do so.
2512 * MCAST_LEAVE_SOURCE_GROUP is only valid for inclusive memberships.
2517 if (imf
->im6f_st
[0] == MCAST_EXCLUDE
) {
2518 error
= EADDRNOTAVAIL
;
2521 ims
= im6o_match_source(imo
, idx
, &ssa
->sa
);
2523 MLD_PRINTF(("%s: source %s %spresent\n", __func__
,
2524 ip6_sprintf(&ssa
->sin6
.sin6_addr
),
2526 error
= EADDRNOTAVAIL
;
2529 MLD_PRINTF(("%s: %s source\n", __func__
, "block"));
2530 error
= im6f_prune(imf
, &ssa
->sin6
);
2532 MLD_PRINTF(("%s: merge imf state failed\n",
2539 * Begin state merge transaction at MLD layer.
2544 * Give up the multicast address record to which
2545 * the membership points. Reference held in im6o
2546 * will be released below.
2548 (void) in6_mc_leave(inm
, imf
);
2550 MLD_PRINTF(("%s: merge inm state\n", __func__
));
2552 error
= in6m_merge(inm
, imf
);
2554 MLD_PRINTF(("%s: failed to merge inm state\n",
2557 goto out_im6f_rollback
;
2560 MLD_PRINTF(("%s: doing mld downcall\n", __func__
));
2561 error
= mld_change_state(inm
, &mtp
, 0);
2563 MLD_PRINTF(("%s: failed mld downcall\n", __func__
));
2577 /* Remove the gap in the membership array. */
2578 VERIFY(inm
== imo
->im6o_membership
[idx
]);
2579 imo
->im6o_membership
[idx
] = NULL
;
2582 * See inp_join_group() for why we need to unlock
2584 IM6O_ADDREF_LOCKED(imo
);
2586 socket_unlock(inp
->inp_socket
, 0);
2590 socket_lock(inp
->inp_socket
, 0);
2594 for (++idx
; idx
< imo
->im6o_num_memberships
; ++idx
) {
2595 imo
->im6o_membership
[idx
-1] = imo
->im6o_membership
[idx
];
2596 imo
->im6o_mfilters
[idx
-1] = imo
->im6o_mfilters
[idx
];
2598 imo
->im6o_num_memberships
--;
2603 IM6O_REMREF(imo
); /* from in6p_findmoptions() */
2605 /* schedule timer now that we've dropped the lock(s) */
2606 mld_set_timeout(&mtp
);
2612 * Select the interface for transmitting IPv6 multicast datagrams.
2614 * Either an instance of struct in6_addr or an instance of struct ipv6_mreqn
2615 * may be passed to this socket option. An address of in6addr_any or an
2616 * interface index of 0 is used to remove a previous selection.
2617 * When no interface is selected, one is chosen for every send.
2620 in6p_set_multicast_if(struct inpcb
*inp
, struct sockopt
*sopt
)
2623 struct ip6_moptions
*imo
;
2627 if (sopt
->sopt_valsize
!= sizeof(u_int
))
2630 error
= sooptcopyin(sopt
, &ifindex
, sizeof(u_int
), sizeof(u_int
));
2634 ifnet_head_lock_shared();
2635 if ((u_int
)if_index
< ifindex
) {
2640 ifp
= ifindex2ifnet
[ifindex
];
2642 if (ifp
== NULL
|| (ifp
->if_flags
& IFF_MULTICAST
) == 0)
2643 return (EADDRNOTAVAIL
);
2645 imo
= in6p_findmoptions(inp
);
2650 imo
->im6o_multicast_ifp
= ifp
;
2652 IM6O_REMREF(imo
); /* from in6p_findmoptions() */
2658 * Atomically set source filters on a socket for an IPv6 multicast group.
2662 in6p_set_source_filters(struct inpcb
*inp
, struct sockopt
*sopt
)
2664 struct __msfilterreq64 msfr
, msfr64
;
2665 struct __msfilterreq32 msfr32
;
2668 struct in6_mfilter
*imf
;
2669 struct ip6_moptions
*imo
;
2670 struct in6_multi
*inm
;
2673 user_addr_t tmp_ptr
;
2674 struct mld_tparams mtp
;
2676 bzero(&mtp
, sizeof (mtp
));
2678 if (IS_64BIT_PROCESS(current_proc())) {
2679 error
= sooptcopyin(sopt
, &msfr64
,
2680 sizeof(struct __msfilterreq64
),
2681 sizeof(struct __msfilterreq64
));
2684 /* we never use msfr.msfr_srcs; */
2685 memcpy(&msfr
, &msfr64
, sizeof(msfr
));
2687 error
= sooptcopyin(sopt
, &msfr32
,
2688 sizeof(struct __msfilterreq32
),
2689 sizeof(struct __msfilterreq32
));
2692 /* we never use msfr.msfr_srcs; */
2693 memcpy(&msfr
, &msfr32
, sizeof(msfr
));
2696 if ((size_t) msfr
.msfr_nsrcs
>
2697 UINT32_MAX
/ sizeof(struct sockaddr_storage
))
2698 msfr
.msfr_nsrcs
= UINT32_MAX
/ sizeof(struct sockaddr_storage
);
2700 if (msfr
.msfr_nsrcs
> in6_mcast_maxsocksrc
)
2703 if (msfr
.msfr_fmode
!= MCAST_EXCLUDE
&&
2704 msfr
.msfr_fmode
!= MCAST_INCLUDE
)
2707 if (msfr
.msfr_group
.ss_family
!= AF_INET6
||
2708 msfr
.msfr_group
.ss_len
!= sizeof(struct sockaddr_in6
))
2711 gsa
= (sockunion_t
*)&msfr
.msfr_group
;
2712 if (!IN6_IS_ADDR_MULTICAST(&gsa
->sin6
.sin6_addr
))
2715 gsa
->sin6
.sin6_port
= 0; /* ignore port */
2717 ifnet_head_lock_shared();
2718 if (msfr
.msfr_ifindex
== 0 || (u_int
)if_index
< msfr
.msfr_ifindex
) {
2720 return (EADDRNOTAVAIL
);
2722 ifp
= ifindex2ifnet
[msfr
.msfr_ifindex
];
2725 return (EADDRNOTAVAIL
);
2727 (void)in6_setscope(&gsa
->sin6
.sin6_addr
, ifp
, NULL
);
2730 * Take the INP write lock.
2731 * Check if this socket is a member of this group.
2733 imo
= in6p_findmoptions(inp
);
2738 idx
= im6o_match_group(imo
, ifp
, &gsa
->sa
);
2739 if (idx
== (size_t)-1 || imo
->im6o_mfilters
== NULL
) {
2740 error
= EADDRNOTAVAIL
;
2741 goto out_imo_locked
;
2743 inm
= imo
->im6o_membership
[idx
];
2744 imf
= &imo
->im6o_mfilters
[idx
];
2747 * Begin state merge transaction at socket layer.
2750 imf
->im6f_st
[1] = msfr
.msfr_fmode
;
2753 * Apply any new source filters, if present.
2754 * Make a copy of the user-space source vector so
2755 * that we may copy them with a single copyin. This
2756 * allows us to deal with page faults up-front.
2758 if (msfr
.msfr_nsrcs
> 0) {
2759 struct in6_msource
*lims
;
2760 struct sockaddr_in6
*psin
;
2761 struct sockaddr_storage
*kss
, *pkss
;
2764 if (IS_64BIT_PROCESS(current_proc()))
2765 tmp_ptr
= msfr64
.msfr_srcs
;
2767 tmp_ptr
= CAST_USER_ADDR_T(msfr32
.msfr_srcs
);
2769 MLD_PRINTF(("%s: loading %lu source list entries\n",
2770 __func__
, (unsigned long)msfr
.msfr_nsrcs
));
2771 kss
= _MALLOC((size_t) msfr
.msfr_nsrcs
* sizeof(*kss
),
2775 goto out_imo_locked
;
2778 error
= copyin(tmp_ptr
, kss
,
2779 (size_t) msfr
.msfr_nsrcs
* sizeof(*kss
));
2782 goto out_imo_locked
;
2786 * Mark all source filters as UNDEFINED at t1.
2787 * Restore new group filter mode, as im6f_leave()
2788 * will set it to INCLUDE.
2791 imf
->im6f_st
[1] = msfr
.msfr_fmode
;
2794 * Update socket layer filters at t1, lazy-allocating
2795 * new entries. This saves a bunch of memory at the
2796 * cost of one RB_FIND() per source entry; duplicate
2797 * entries in the msfr_nsrcs vector are ignored.
2798 * If we encounter an error, rollback transaction.
2800 * XXX This too could be replaced with a set-symmetric
2801 * difference like loop to avoid walking from root
2802 * every time, as the key space is common.
2804 for (i
= 0, pkss
= kss
; i
< msfr
.msfr_nsrcs
; i
++, pkss
++) {
2805 psin
= (struct sockaddr_in6
*)pkss
;
2806 if (psin
->sin6_family
!= AF_INET6
) {
2807 error
= EAFNOSUPPORT
;
2810 if (psin
->sin6_len
!= sizeof(struct sockaddr_in6
)) {
2814 if (IN6_IS_ADDR_MULTICAST(&psin
->sin6_addr
)) {
2819 * TODO: Validate embedded scope ID in source
2820 * list entry against passed-in ifp, if and only
2821 * if source list filter entry is iface or node local.
2823 in6_clearscope(&psin
->sin6_addr
);
2824 error
= im6f_get_source(imf
, psin
, &lims
);
2827 lims
->im6sl_st
[1] = imf
->im6f_st
[1];
2833 goto out_im6f_rollback
;
2836 * Begin state merge transaction at MLD layer.
2839 MLD_PRINTF(("%s: merge inm state\n", __func__
));
2840 error
= in6m_merge(inm
, imf
);
2842 MLD_PRINTF(("%s: failed to merge inm state\n", __func__
));
2844 goto out_im6f_rollback
;
2847 MLD_PRINTF(("%s: doing mld downcall\n", __func__
));
2848 error
= mld_change_state(inm
, &mtp
, 0);
2852 MLD_PRINTF(("%s: failed mld downcall\n", __func__
));
2865 IM6O_REMREF(imo
); /* from in6p_findmoptions() */
2867 /* schedule timer now that we've dropped the lock(s) */
2868 mld_set_timeout(&mtp
);
2874 * Set the IP multicast options in response to user setsockopt().
2876 * Many of the socket options handled in this function duplicate the
2877 * functionality of socket options in the regular unicast API. However,
2878 * it is not possible to merge the duplicate code, because the idempotence
2879 * of the IPv6 multicast part of the BSD Sockets API must be preserved;
2880 * the effects of these options must be treated as separate and distinct.
2884 ip6_setmoptions(struct inpcb
*inp
, struct sockopt
*sopt
)
2886 struct ip6_moptions
*im6o
;
2892 * If socket is neither of type SOCK_RAW or SOCK_DGRAM,
2893 * or is a divert socket, reject it.
2895 if (SOCK_PROTO(inp
->inp_socket
) == IPPROTO_DIVERT
||
2896 (SOCK_TYPE(inp
->inp_socket
) != SOCK_RAW
&&
2897 SOCK_TYPE(inp
->inp_socket
) != SOCK_DGRAM
))
2898 return (EOPNOTSUPP
);
2900 switch (sopt
->sopt_name
) {
2901 case IPV6_MULTICAST_IF
:
2902 error
= in6p_set_multicast_if(inp
, sopt
);
2905 case IPV6_MULTICAST_HOPS
: {
2908 if (sopt
->sopt_valsize
!= sizeof(int)) {
2912 error
= sooptcopyin(sopt
, &hlim
, sizeof(hlim
), sizeof(int));
2915 if (hlim
< -1 || hlim
> 255) {
2918 } else if (hlim
== -1) {
2919 hlim
= ip6_defmcasthlim
;
2921 im6o
= in6p_findmoptions(inp
);
2927 im6o
->im6o_multicast_hlim
= hlim
;
2929 IM6O_REMREF(im6o
); /* from in6p_findmoptions() */
2933 case IPV6_MULTICAST_LOOP
: {
2937 * Set the loopback flag for outgoing multicast packets.
2938 * Must be zero or one.
2940 if (sopt
->sopt_valsize
!= sizeof(u_int
)) {
2944 error
= sooptcopyin(sopt
, &loop
, sizeof(u_int
), sizeof(u_int
));
2951 im6o
= in6p_findmoptions(inp
);
2957 im6o
->im6o_multicast_loop
= loop
;
2959 IM6O_REMREF(im6o
); /* from in6p_findmoptions() */
2963 case IPV6_JOIN_GROUP
:
2964 case MCAST_JOIN_GROUP
:
2965 case MCAST_JOIN_SOURCE_GROUP
:
2966 error
= in6p_join_group(inp
, sopt
);
2969 case IPV6_LEAVE_GROUP
:
2970 case MCAST_LEAVE_GROUP
:
2971 case MCAST_LEAVE_SOURCE_GROUP
:
2972 error
= in6p_leave_group(inp
, sopt
);
2975 case MCAST_BLOCK_SOURCE
:
2976 case MCAST_UNBLOCK_SOURCE
:
2977 error
= in6p_block_unblock_source(inp
, sopt
);
2981 error
= in6p_set_source_filters(inp
, sopt
);
2992 * Expose MLD's multicast filter mode and source list(s) to userland,
2993 * keyed by (ifindex, group).
2994 * The filter mode is written out as a uint32_t, followed by
2995 * 0..n of struct in6_addr.
2996 * For use by ifmcstat(8).
2999 sysctl_ip6_mcast_filters SYSCTL_HANDLER_ARGS
3001 #pragma unused(oidp)
3003 struct in6_addr mcaddr
;
3004 struct in6_addr src
;
3006 struct in6_multi
*inm
;
3007 struct in6_multistep step
;
3008 struct ip6_msource
*ims
;
3012 uint32_t fmode
, ifindex
;
3017 if (req
->newptr
!= USER_ADDR_NULL
)
3020 /* int: ifindex + 4 * 32 bits of IPv6 address */
3025 ifnet_head_lock_shared();
3026 if (ifindex
<= 0 || ifindex
> (u_int
)if_index
) {
3027 MLD_PRINTF(("%s: ifindex %u out of range\n",
3028 __func__
, ifindex
));
3033 memcpy(&mcaddr
, &name
[1], sizeof(struct in6_addr
));
3034 if (!IN6_IS_ADDR_MULTICAST(&mcaddr
)) {
3035 MLD_PRINTF(("%s: group %s is not multicast\n",
3036 __func__
, ip6_sprintf(&mcaddr
)));
3041 ifp
= ifindex2ifnet
[ifindex
];
3044 MLD_PRINTF(("%s: no ifp for ifindex %u\n", __func__
, ifindex
));
3048 * Internal MLD lookups require that scope/zone ID is set.
3050 (void)in6_setscope(&mcaddr
, ifp
, NULL
);
3052 in6_multihead_lock_shared();
3053 IN6_FIRST_MULTI(step
, inm
);
3054 while (inm
!= NULL
) {
3056 if (inm
->in6m_ifp
!= ifp
)
3059 if (!IN6_ARE_ADDR_EQUAL(&inm
->in6m_addr
, &mcaddr
))
3062 fmode
= inm
->in6m_st
[1].iss_fmode
;
3063 retval
= SYSCTL_OUT(req
, &fmode
, sizeof(uint32_t));
3068 RB_FOREACH(ims
, ip6_msource_tree
, &inm
->in6m_srcs
) {
3069 MLD_PRINTF(("%s: visit node 0x%llx\n", __func__
,
3070 (uint64_t)VM_KERNEL_ADDRPERM(ims
)));
3072 * Only copy-out sources which are in-mode.
3074 if (fmode
!= im6s_get_mode(inm
, ims
, 1)) {
3075 MLD_PRINTF(("%s: skip non-in-mode\n",
3077 continue; /* process next source */
3079 src
= ims
->im6s_addr
;
3080 retval
= SYSCTL_OUT(req
, &src
, sizeof(struct in6_addr
));
3082 break; /* process next inm */
3086 IN6_NEXT_MULTI(step
, inm
);
3088 in6_multihead_lock_done();
3094 in6_multi_init(void)
3096 PE_parse_boot_argn("ifa_debug", &in6m_debug
, sizeof (in6m_debug
));
3098 /* Setup lock group and attribute for in6_multihead */
3099 in6_multihead_lock_grp_attr
= lck_grp_attr_alloc_init();
3100 in6_multihead_lock_grp
= lck_grp_alloc_init("in6_multihead",
3101 in6_multihead_lock_grp_attr
);
3102 in6_multihead_lock_attr
= lck_attr_alloc_init();
3103 lck_rw_init(&in6_multihead_lock
, in6_multihead_lock_grp
,
3104 in6_multihead_lock_attr
);
3106 lck_mtx_init(&in6m_trash_lock
, in6_multihead_lock_grp
,
3107 in6_multihead_lock_attr
);
3108 TAILQ_INIT(&in6m_trash_head
);
3110 in6m_size
= (in6m_debug
== 0) ? sizeof (struct in6_multi
) :
3111 sizeof (struct in6_multi_dbg
);
3112 in6m_zone
= zinit(in6m_size
, IN6M_ZONE_MAX
* in6m_size
,
3114 if (in6m_zone
== NULL
) {
3115 panic("%s: failed allocating %s", __func__
, IN6M_ZONE_NAME
);
3118 zone_change(in6m_zone
, Z_EXPAND
, TRUE
);
3120 imm_size
= sizeof (struct in6_multi_mship
);
3121 imm_zone
= zinit(imm_size
, IMM_ZONE_MAX
* imm_size
, 0, IMM_ZONE_NAME
);
3122 if (imm_zone
== NULL
) {
3123 panic("%s: failed allocating %s", __func__
, IMM_ZONE_NAME
);
3126 zone_change(imm_zone
, Z_EXPAND
, TRUE
);
3128 ip6ms_size
= sizeof (struct ip6_msource
);
3129 ip6ms_zone
= zinit(ip6ms_size
, IP6MS_ZONE_MAX
* ip6ms_size
,
3130 0, IP6MS_ZONE_NAME
);
3131 if (ip6ms_zone
== NULL
) {
3132 panic("%s: failed allocating %s", __func__
, IP6MS_ZONE_NAME
);
3135 zone_change(ip6ms_zone
, Z_EXPAND
, TRUE
);
3137 in6ms_size
= sizeof (struct in6_msource
);
3138 in6ms_zone
= zinit(in6ms_size
, IN6MS_ZONE_MAX
* in6ms_size
,
3139 0, IN6MS_ZONE_NAME
);
3140 if (in6ms_zone
== NULL
) {
3141 panic("%s: failed allocating %s", __func__
, IN6MS_ZONE_NAME
);
3144 zone_change(in6ms_zone
, Z_EXPAND
, TRUE
);
3147 static struct in6_multi
*
3148 in6_multi_alloc(int how
)
3150 struct in6_multi
*in6m
;
3152 in6m
= (how
== M_WAITOK
) ? zalloc(in6m_zone
) :
3153 zalloc_noblock(in6m_zone
);
3155 bzero(in6m
, in6m_size
);
3156 lck_mtx_init(&in6m
->in6m_lock
, in6_multihead_lock_grp
,
3157 in6_multihead_lock_attr
);
3158 in6m
->in6m_debug
|= IFD_ALLOC
;
3159 if (in6m_debug
!= 0) {
3160 in6m
->in6m_debug
|= IFD_DEBUG
;
3161 in6m
->in6m_trace
= in6m_trace
;
3168 in6_multi_free(struct in6_multi
*in6m
)
3171 if (in6m
->in6m_debug
& IFD_ATTACHED
) {
3172 panic("%s: attached in6m=%p is being freed", __func__
, in6m
);
3174 } else if (in6m
->in6m_ifma
!= NULL
) {
3175 panic("%s: ifma not NULL for in6m=%p", __func__
, in6m
);
3177 } else if (!(in6m
->in6m_debug
& IFD_ALLOC
)) {
3178 panic("%s: in6m %p cannot be freed", __func__
, in6m
);
3180 } else if (in6m
->in6m_refcount
!= 0) {
3181 panic("%s: non-zero refcount in6m=%p", __func__
, in6m
);
3183 } else if (in6m
->in6m_reqcnt
!= 0) {
3184 panic("%s: non-zero reqcnt in6m=%p", __func__
, in6m
);
3188 /* Free any pending MLDv2 state-change records */
3189 IF_DRAIN(&in6m
->in6m_scq
);
3191 in6m
->in6m_debug
&= ~IFD_ALLOC
;
3192 if ((in6m
->in6m_debug
& (IFD_DEBUG
| IFD_TRASHED
)) ==
3193 (IFD_DEBUG
| IFD_TRASHED
)) {
3194 lck_mtx_lock(&in6m_trash_lock
);
3195 TAILQ_REMOVE(&in6m_trash_head
, (struct in6_multi_dbg
*)in6m
,
3197 lck_mtx_unlock(&in6m_trash_lock
);
3198 in6m
->in6m_debug
&= ~IFD_TRASHED
;
3202 lck_mtx_destroy(&in6m
->in6m_lock
, in6_multihead_lock_grp
);
3203 zfree(in6m_zone
, in6m
);
3207 in6_multi_attach(struct in6_multi
*in6m
)
3209 in6_multihead_lock_assert(LCK_RW_ASSERT_EXCLUSIVE
);
3210 IN6M_LOCK_ASSERT_HELD(in6m
);
3212 if (in6m
->in6m_debug
& IFD_ATTACHED
) {
3213 panic("%s: Attempt to attach an already attached in6m=%p",
3218 in6m
->in6m_reqcnt
++;
3219 VERIFY(in6m
->in6m_reqcnt
== 1);
3220 IN6M_ADDREF_LOCKED(in6m
);
3221 in6m
->in6m_debug
|= IFD_ATTACHED
;
3223 * Reattach case: If debugging is enabled, take it
3224 * out of the trash list and clear IFD_TRASHED.
3226 if ((in6m
->in6m_debug
& (IFD_DEBUG
| IFD_TRASHED
)) ==
3227 (IFD_DEBUG
| IFD_TRASHED
)) {
3228 /* Become a regular mutex, just in case */
3229 IN6M_CONVERT_LOCK(in6m
);
3230 lck_mtx_lock(&in6m_trash_lock
);
3231 TAILQ_REMOVE(&in6m_trash_head
, (struct in6_multi_dbg
*)in6m
,
3233 lck_mtx_unlock(&in6m_trash_lock
);
3234 in6m
->in6m_debug
&= ~IFD_TRASHED
;
3237 LIST_INSERT_HEAD(&in6_multihead
, in6m
, in6m_entry
);
3241 in6_multi_detach(struct in6_multi
*in6m
)
3243 in6_multihead_lock_assert(LCK_RW_ASSERT_EXCLUSIVE
);
3244 IN6M_LOCK_ASSERT_HELD(in6m
);
3246 if (in6m
->in6m_reqcnt
== 0) {
3247 panic("%s: in6m=%p negative reqcnt", __func__
, in6m
);
3251 --in6m
->in6m_reqcnt
;
3252 if (in6m
->in6m_reqcnt
> 0)
3255 if (!(in6m
->in6m_debug
& IFD_ATTACHED
)) {
3256 panic("%s: Attempt to detach an unattached record in6m=%p",
3259 } else if (in6m
->in6m_debug
& IFD_TRASHED
) {
3260 panic("%s: in6m %p is already in trash list", __func__
, in6m
);
3265 * NOTE: Caller calls IFMA_REMREF
3267 in6m
->in6m_debug
&= ~IFD_ATTACHED
;
3268 LIST_REMOVE(in6m
, in6m_entry
);
3270 if (in6m
->in6m_debug
& IFD_DEBUG
) {
3271 /* Become a regular mutex, just in case */
3272 IN6M_CONVERT_LOCK(in6m
);
3273 lck_mtx_lock(&in6m_trash_lock
);
3274 TAILQ_INSERT_TAIL(&in6m_trash_head
,
3275 (struct in6_multi_dbg
*)in6m
, in6m_trash_link
);
3276 lck_mtx_unlock(&in6m_trash_lock
);
3277 in6m
->in6m_debug
|= IFD_TRASHED
;
3284 in6m_addref(struct in6_multi
*in6m
, int locked
)
3287 IN6M_LOCK_SPIN(in6m
);
3289 IN6M_LOCK_ASSERT_HELD(in6m
);
3291 if (++in6m
->in6m_refcount
== 0) {
3292 panic("%s: in6m=%p wraparound refcnt", __func__
, in6m
);
3294 } else if (in6m
->in6m_trace
!= NULL
) {
3295 (*in6m
->in6m_trace
)(in6m
, TRUE
);
3302 in6m_remref(struct in6_multi
*in6m
, int locked
)
3304 struct ifmultiaddr
*ifma
;
3305 struct mld_ifinfo
*mli
;
3308 IN6M_LOCK_SPIN(in6m
);
3310 IN6M_LOCK_ASSERT_HELD(in6m
);
3312 if (in6m
->in6m_refcount
== 0 || (in6m
->in6m_refcount
== 1 && locked
)) {
3313 panic("%s: in6m=%p negative refcnt", __func__
, in6m
);
3315 } else if (in6m
->in6m_trace
!= NULL
) {
3316 (*in6m
->in6m_trace
)(in6m
, FALSE
);
3319 --in6m
->in6m_refcount
;
3320 if (in6m
->in6m_refcount
> 0) {
3327 * Synchronization with in6_mc_get(). In the event the in6m has been
3328 * detached, the underlying ifma would still be in the if_multiaddrs
3329 * list, and thus can be looked up via if_addmulti(). At that point,
3330 * the only way to find this in6m is via ifma_protospec. To avoid
3331 * race conditions between the last in6m_remref() of that in6m and its
3332 * use via ifma_protospec, in6_multihead lock is used for serialization.
3333 * In order to avoid violating the lock order, we must drop in6m_lock
3334 * before acquiring in6_multihead lock. To prevent the in6m from being
3335 * freed prematurely, we hold an extra reference.
3337 ++in6m
->in6m_refcount
;
3339 in6_multihead_lock_shared();
3340 IN6M_LOCK_SPIN(in6m
);
3341 --in6m
->in6m_refcount
;
3342 if (in6m
->in6m_refcount
> 0) {
3343 /* We've lost the race, so abort since in6m is still in use */
3345 in6_multihead_lock_done();
3346 /* If it was locked, return it as such */
3352 ifma
= in6m
->in6m_ifma
;
3353 in6m
->in6m_ifma
= NULL
;
3354 in6m
->in6m_ifp
= NULL
;
3355 mli
= in6m
->in6m_mli
;
3356 in6m
->in6m_mli
= NULL
;
3358 IFMA_LOCK_SPIN(ifma
);
3359 ifma
->ifma_protospec
= NULL
;
3361 in6_multihead_lock_done();
3363 in6_multi_free(in6m
);
3364 if_delmulti_ifma(ifma
);
3365 /* Release reference held to the underlying ifmultiaddr */
3373 in6m_trace(struct in6_multi
*in6m
, int refhold
)
3375 struct in6_multi_dbg
*in6m_dbg
= (struct in6_multi_dbg
*)in6m
;
3380 if (!(in6m
->in6m_debug
& IFD_DEBUG
)) {
3381 panic("%s: in6m %p has no debug structure", __func__
, in6m
);
3385 cnt
= &in6m_dbg
->in6m_refhold_cnt
;
3386 tr
= in6m_dbg
->in6m_refhold
;
3388 cnt
= &in6m_dbg
->in6m_refrele_cnt
;
3389 tr
= in6m_dbg
->in6m_refrele
;
3392 idx
= atomic_add_16_ov(cnt
, 1) % IN6M_TRACE_HIST_SIZE
;
3393 ctrace_record(&tr
[idx
]);
3396 static struct in6_multi_mship
*
3397 in6_multi_mship_alloc(int how
)
3399 struct in6_multi_mship
*imm
;
3401 imm
= (how
== M_WAITOK
) ? zalloc(imm_zone
) : zalloc_noblock(imm_zone
);
3403 bzero(imm
, imm_size
);
3409 in6_multi_mship_free(struct in6_multi_mship
*imm
)
3411 if (imm
->i6mm_maddr
!= NULL
) {
3412 panic("%s: i6mm_maddr not NULL for imm=%p", __func__
, imm
);
3415 zfree(imm_zone
, imm
);
3419 in6_multihead_lock_exclusive(void)
3421 lck_rw_lock_exclusive(&in6_multihead_lock
);
3425 in6_multihead_lock_shared(void)
3427 lck_rw_lock_shared(&in6_multihead_lock
);
3431 in6_multihead_lock_assert(int what
)
3433 lck_rw_assert(&in6_multihead_lock
, what
);
3437 in6_multihead_lock_done(void)
3439 lck_rw_done(&in6_multihead_lock
);
3442 static struct ip6_msource
*
3443 ip6ms_alloc(int how
)
3445 struct ip6_msource
*i6ms
;
3447 i6ms
= (how
== M_WAITOK
) ? zalloc(ip6ms_zone
) :
3448 zalloc_noblock(ip6ms_zone
);
3450 bzero(i6ms
, ip6ms_size
);
3456 ip6ms_free(struct ip6_msource
*i6ms
)
3458 zfree(ip6ms_zone
, i6ms
);
3461 static struct in6_msource
*
3462 in6ms_alloc(int how
)
3464 struct in6_msource
*in6ms
;
3466 in6ms
= (how
== M_WAITOK
) ? zalloc(in6ms_zone
) :
3467 zalloc_noblock(in6ms_zone
);
3469 bzero(in6ms
, in6ms_size
);
3475 in6ms_free(struct in6_msource
*in6ms
)
3477 zfree(in6ms_zone
, in6ms
);
3482 static const char *in6m_modestrs
[] = { "un\n", "in", "ex" };
3485 in6m_mode_str(const int mode
)
3487 if (mode
>= MCAST_UNDEFINED
&& mode
<= MCAST_EXCLUDE
)
3488 return (in6m_modestrs
[mode
]);
3492 static const char *in6m_statestrs
[] = {
3501 "sg-query-pending\n",
3506 in6m_state_str(const int state
)
3508 if (state
>= MLD_NOT_MEMBER
&& state
<= MLD_LEAVING_MEMBER
)
3509 return (in6m_statestrs
[state
]);
3514 * Dump an in6_multi structure to the console.
3517 in6m_print(const struct in6_multi
*inm
)
3521 IN6M_LOCK_ASSERT_HELD(__DECONST(struct in6_multi
*, inm
));
3526 printf("%s: --- begin in6m 0x%llx ---\n", __func__
,
3527 (uint64_t)VM_KERNEL_ADDRPERM(inm
));
3528 printf("addr %s ifp 0x%llx(%s) ifma 0x%llx\n",
3529 ip6_sprintf(&inm
->in6m_addr
),
3530 (uint64_t)VM_KERNEL_ADDRPERM(inm
->in6m_ifp
),
3531 if_name(inm
->in6m_ifp
),
3532 (uint64_t)VM_KERNEL_ADDRPERM(inm
->in6m_ifma
));
3533 printf("timer %u state %s refcount %u scq.len %u\n",
3535 in6m_state_str(inm
->in6m_state
),
3537 inm
->in6m_scq
.ifq_len
);
3538 printf("mli 0x%llx nsrc %lu sctimer %u scrv %u\n",
3539 (uint64_t)VM_KERNEL_ADDRPERM(inm
->in6m_mli
),
3543 for (t
= 0; t
< 2; t
++) {
3544 printf("t%d: fmode %s asm %u ex %u in %u rec %u\n", t
,
3545 in6m_mode_str(inm
->in6m_st
[t
].iss_fmode
),
3546 inm
->in6m_st
[t
].iss_asm
,
3547 inm
->in6m_st
[t
].iss_ex
,
3548 inm
->in6m_st
[t
].iss_in
,
3549 inm
->in6m_st
[t
].iss_rec
);
3551 printf("%s: --- end in6m 0x%llx ---\n", __func__
,
3552 (uint64_t)VM_KERNEL_ADDRPERM(inm
));
3558 in6m_print(__unused
const struct in6_multi
*inm
)