-/* $FreeBSD: src/sys/netinet6/nd6_rtr.c,v 1.11 2002/04/19 04:46:23 suz Exp $ */
-/* $KAME: nd6_rtr.c,v 1.111 2001/04/27 01:37:15 jinmei Exp $ */
+/*
+ * Copyright (c) 2003-2020 Apple Inc. All rights reserved.
+ *
+ * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
+ *
+ * This file contains Original Code and/or Modifications of Original Code
+ * as defined in and that are subject to the Apple Public Source License
+ * Version 2.0 (the 'License'). You may not use this file except in
+ * compliance with the License. The rights granted to you under the License
+ * may not be used to create, or enable the creation or redistribution of,
+ * unlawful or unlicensed copies of an Apple operating system, or to
+ * circumvent, violate, or enable the circumvention or violation of, any
+ * terms of an Apple operating system software license agreement.
+ *
+ * Please obtain a copy of the License at
+ * http://www.opensource.apple.com/apsl/ and read it before using this file.
+ *
+ * The Original Code and all software distributed under the License are
+ * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
+ * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
+ * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
+ * Please see the License for the specific language governing rights and
+ * limitations under the License.
+ *
+ * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
+ */
/*
* Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*/
-
-
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/malloc.h>
#include <sys/errno.h>
#include <sys/syslog.h>
#include <sys/queue.h>
-#include <kern/lock.h>
+#include <sys/mcache.h>
+#include <sys/protosw.h>
+
+#include <dev/random/randomdev.h>
+
+#include <kern/locks.h>
+#include <kern/zalloc.h>
+#include <machine/machine_routines.h>
#include <net/if.h>
+#include <net/if_var.h>
#include <net/if_types.h>
#include <net/if_dl.h>
#include <net/route.h>
#include <net/net_osdep.h>
-#define SDL(s) ((struct sockaddr_dl *)s)
-
-static struct nd_defrouter *defrtrlist_update(struct nd_defrouter *);
-static struct in6_ifaddr *in6_ifadd(struct nd_prefix *,
- struct in6_addr *);
+static void defrouter_addreq(struct nd_defrouter *, struct nd_route_info *, boolean_t);
+static void defrouter_delreq(struct nd_defrouter *, struct nd_route_info *);
+static struct nd_defrouter *defrtrlist_update_common(struct nd_defrouter *,
+ struct nd_drhead *, boolean_t);
static struct nd_pfxrouter *pfxrtr_lookup(struct nd_prefix *,
- struct nd_defrouter *);
+ struct nd_defrouter *);
static void pfxrtr_add(struct nd_prefix *, struct nd_defrouter *);
-static void pfxrtr_del(struct nd_pfxrouter *);
+static void pfxrtr_del(struct nd_pfxrouter *, struct nd_prefix *);
static struct nd_pfxrouter *find_pfxlist_reachable_router(struct nd_prefix *);
-static void defrouter_addifreq(struct ifnet *);
-static void nd6_rtmsg(int, struct rtentry *);
+static void nd6_rtmsg(u_char, struct rtentry *);
-static void in6_init_address_ltimes(struct nd_prefix *ndpr,
- struct in6_addrlifetime *lt6);
+static int nd6_prefix_onlink_common(struct nd_prefix *, boolean_t,
+ unsigned int);
+static struct nd_prefix *nd6_prefix_equal_lookup(struct nd_prefix *, boolean_t);
+static void nd6_prefix_sync(struct ifnet *);
+
+static void in6_init_address_ltimes(struct nd_prefix *,
+ struct in6_addrlifetime *);
static int rt6_deleteroute(struct radix_node *, void *);
+static struct nd_defrouter *nddr_alloc(zalloc_flags_t);
+static void nddr_free(struct nd_defrouter *);
+static void nddr_trace(struct nd_defrouter *, int);
+
+static struct nd_prefix *ndpr_alloc(int);
+static void ndpr_free(struct nd_prefix *);
+static void ndpr_trace(struct nd_prefix *, int);
+
extern int nd6_recalc_reachtm_interval;
-static struct ifnet *nd6_defifp;
-int nd6_defifindex;
+static struct ifnet *nd6_defifp = NULL;
+int nd6_defifindex = 0;
+static unsigned int nd6_defrouter_genid;
+
+int ip6_use_tempaddr = IP6_USE_TMPADDR_DEFAULT; /* use temp addr by default for testing now */
-int ip6_use_tempaddr = 0;
+int nd6_accept_6to4 = 1;
int ip6_desync_factor;
u_int32_t ip6_temp_preferred_lifetime = DEF_TEMP_PREFERRED_LIFETIME;
u_int32_t ip6_temp_valid_lifetime = DEF_TEMP_VALID_LIFETIME;
/*
* shorter lifetimes for debugging purposes.
-int ip6_temp_preferred_lifetime = 800;
-static int ip6_temp_valid_lifetime = 1800;
-*/
+ * u_int32_t ip6_temp_preferred_lifetime = 800;
+ * static u_int32_t ip6_temp_valid_lifetime = 1800;
+ */
int ip6_temp_regen_advance = TEMPADDR_REGEN_ADVANCE;
-extern lck_mtx_t *rt_mtx;
extern lck_mtx_t *nd6_mutex;
+/* Serialization variables for single thread access to nd_prefix */
+static boolean_t nd_prefix_busy;
+static void *nd_prefix_waitchan = &nd_prefix_busy;
+static int nd_prefix_waiters = 0;
+
+/* Serialization variables for single thread access to nd_defrouter */
+static boolean_t nd_defrouter_busy;
+static void *nd_defrouter_waitchan = &nd_defrouter_busy;
+static int nd_defrouter_waiters = 0;
+
+#define equal(a1, a2) (bcmp((caddr_t)(a1), (caddr_t)(a2), (a1)->sa_len) == 0)
+/* RTPREF_MEDIUM has to be 0! */
+#define RTPREF_HIGH 1
+#define RTPREF_MEDIUM 0
+#define RTPREF_LOW (-1)
+#define RTPREF_RESERVED (-2)
+#define RTPREF_INVALID (-3) /* internal */
+
+#define NDPR_TRACE_HIST_SIZE 32 /* size of trace history */
+
+/* For gdb */
+__private_extern__ unsigned int ndpr_trace_hist_size = NDPR_TRACE_HIST_SIZE;
+
+struct nd_prefix_dbg {
+ struct nd_prefix ndpr_pr; /* nd_prefix */
+ u_int16_t ndpr_refhold_cnt; /* # of ref */
+ u_int16_t ndpr_refrele_cnt; /* # of rele */
+ /*
+ * Circular lists of ndpr_addref and ndpr_remref callers.
+ */
+ ctrace_t ndpr_refhold[NDPR_TRACE_HIST_SIZE];
+ ctrace_t ndpr_refrele[NDPR_TRACE_HIST_SIZE];
+};
+
+static unsigned int ndpr_debug; /* debug flags */
+static struct zone *ndpr_zone; /* zone for nd_prefix */
+#define NDPR_ZONE_NAME "nd6_prefix" /* zone name */
+
+#define NDDR_TRACE_HIST_SIZE 32 /* size of trace history */
+
+/* For gdb */
+__private_extern__ unsigned int nddr_trace_hist_size = NDDR_TRACE_HIST_SIZE;
+
+struct nd_defrouter_dbg {
+ struct nd_defrouter nddr_dr; /* nd_defrouter */
+ uint16_t nddr_refhold_cnt; /* # of ref */
+ uint16_t nddr_refrele_cnt; /* # of rele */
+ /*
+ * Circular lists of nddr_addref and nddr_remref callers.
+ */
+ ctrace_t nddr_refhold[NDDR_TRACE_HIST_SIZE];
+ ctrace_t nddr_refrele[NDDR_TRACE_HIST_SIZE];
+};
+
+static unsigned int nddr_debug; /* debug flags */
+static struct zone *nddr_zone; /* zone for nd_defrouter */
+#define NDDR_ZONE_NAME "nd6_defrouter" /* zone name */
+
+static ZONE_DECLARE(ndprtr_zone, "nd6_pfxrouter",
+ sizeof(struct nd_pfxrouter), ZC_NONE);
+
+#define TWOHOUR (120*60)
+extern int nd6_process_rti; /* Default to 0 for now */
+
+
+static void
+nd6_prefix_glb_init(void)
+{
+ PE_parse_boot_argn("ifa_debug", &ndpr_debug, sizeof(ndpr_debug));
+ vm_size_t ndpr_size = (ndpr_debug == 0) ? sizeof(struct nd_prefix) :
+ sizeof(struct nd_prefix_dbg);
+ ndpr_zone = zone_create(NDPR_ZONE_NAME, ndpr_size, ZC_ZFREE_CLEARMEM);
+}
+
+static void
+nd6_defrouter_glb_init(void)
+{
+ PE_parse_boot_argn("ifa_debug", &nddr_debug, sizeof(nddr_debug));
+ vm_size_t nddr_size = (nddr_debug == 0) ? sizeof(struct nd_defrouter) :
+ sizeof(struct nd_defrouter_dbg);
+ nddr_zone = zone_create(NDDR_ZONE_NAME, nddr_size, ZC_ZFREE_CLEARMEM);
+}
+
+void
+nd6_rtr_init(void)
+{
+ nd6_prefix_glb_init();
+ nd6_defrouter_glb_init();
+}
+
/*
* Receive Router Solicitation Message - just for routers.
* Router solicitation/advertisement is mostly managed by userland program
*/
void
nd6_rs_input(
- struct mbuf *m,
+ struct mbuf *m,
int off,
int icmp6len)
{
struct ifnet *ifp = m->m_pkthdr.rcvif;
struct ip6_hdr *ip6 = mtod(m, struct ip6_hdr *);
- struct nd_router_solicit *nd_rs;
+ struct nd_router_solicit *nd_rs = NULL;
struct in6_addr saddr6 = ip6->ip6_src;
-#if 0
- struct in6_addr daddr6 = ip6->ip6_dst;
-#endif
char *lladdr = NULL;
int lladdrlen = 0;
-#if 0
- struct sockaddr_dl *sdl = (struct sockaddr_dl *)NULL;
- struct llinfo_nd6 *ln = (struct llinfo_nd6 *)NULL;
- struct rtentry *rt = NULL;
- int is_newentry;
-#endif
- union nd_opts ndopts;
+ union nd_opts ndopts = {};
+
+ /* Expect 32-bit aligned data pointer on strict-align platforms */
+ MBUF_STRICT_DATA_ALIGNMENT_CHECK_32(m);
/* If I'm not a router, ignore it. */
- if (ip6_accept_rtadv != 0 || (ifp->if_eflags & IFEF_ACCEPT_RTADVD) || ip6_forwarding != 1)
+ if (!ip6_forwarding || ifp->if_ipv6_router_mode == IPV6_ROUTER_MODE_DISABLED) {
goto freeit;
+ }
/* Sanity checks */
- if (ip6->ip6_hlim != 255) {
- nd6log((LOG_ERR,
+ if (ip6->ip6_hlim != IPV6_MAXHLIM) {
+ nd6log(error,
"nd6_rs_input: invalid hlim (%d) from %s to %s on %s\n",
ip6->ip6_hlim, ip6_sprintf(&ip6->ip6_src),
- ip6_sprintf(&ip6->ip6_dst), if_name(ifp)));
+ ip6_sprintf(&ip6->ip6_dst), if_name(ifp));
goto bad;
}
/*
- * Don't update the neighbor cache, if src = ::.
- * This indicates that the src has no IP address assigned yet.
+ * Don't update the neighbor cache, if src = :: or a non-neighbor.
+ * The former case indicates that the src has no IP address assigned
+ * yet. See nd6_ns_input() for the latter case.
*/
- if (IN6_IS_ADDR_UNSPECIFIED(&saddr6))
+ if (IN6_IS_ADDR_UNSPECIFIED(&ip6->ip6_src)) {
goto freeit;
-
-#ifndef PULLDOWN_TEST
- IP6_EXTHDR_CHECK(m, off, icmp6len, return);
- nd_rs = (struct nd_router_solicit *)((caddr_t)ip6 + off);
-#else
- IP6_EXTHDR_GET(nd_rs, struct nd_router_solicit *, m, off, icmp6len);
- if (nd_rs == NULL) {
- icmp6stat.icp6s_tooshort++;
- return;
+ } else {
+ struct sockaddr_in6 src_sa6;
+
+ bzero(&src_sa6, sizeof(src_sa6));
+ src_sa6.sin6_family = AF_INET6;
+ src_sa6.sin6_len = sizeof(src_sa6);
+ src_sa6.sin6_addr = ip6->ip6_src;
+ if (!nd6_is_addr_neighbor(&src_sa6, ifp, 0)) {
+ nd6log(info, "nd6_rs_input: "
+ "RS packet from non-neighbor\n");
+ goto freeit;
+ }
}
-#endif
+ IP6_EXTHDR_CHECK(m, off, icmp6len, return );
+ ip6 = mtod(m, struct ip6_hdr *);
+ nd_rs = (struct nd_router_solicit *)((caddr_t)ip6 + off);
icmp6len -= sizeof(*nd_rs);
nd6_option_init(nd_rs + 1, icmp6len, &ndopts);
if (nd6_options(&ndopts) < 0) {
- nd6log((LOG_INFO,
- "nd6_rs_input: invalid ND option, ignored\n"));
+ nd6log(info,
+ "nd6_rs_input: invalid ND option, ignored\n");
/* nd6_options have incremented stats */
goto freeit;
}
}
if (lladdr && ((ifp->if_addrlen + 2 + 7) & ~7) != lladdrlen) {
- nd6log((LOG_INFO,
+ nd6log(info,
"nd6_rs_input: lladdrlen mismatch for %s "
"(if %d, RS packet %d)\n",
- ip6_sprintf(&saddr6), ifp->if_addrlen, lladdrlen - 2));
+ ip6_sprintf(&saddr6), ifp->if_addrlen, lladdrlen - 2);
goto bad;
}
nd6_cache_lladdr(ifp, &saddr6, lladdr, lladdrlen, ND_ROUTER_SOLICIT, 0);
- freeit:
+freeit:
m_freem(m);
return;
- bad:
+bad:
icmp6stat.icp6s_badrs++;
m_freem(m);
}
+#define ND_OPT_LEN_TO_BYTE_SCALE 3 /* ND opt len is in units of 8 octets */
+
+#define ND_OPT_LEN_RTI_MIN 1
+#define ND_OPT_LEN_RTI_MAX 3
+#define ND_OPT_RTI_PFXLEN_MAX 128
/*
* Receive Router Advertisement Message.
*
*/
void
nd6_ra_input(
- struct mbuf *m,
- int off,
+ struct mbuf *m,
+ int off,
int icmp6len)
{
struct ifnet *ifp = m->m_pkthdr.rcvif;
- struct nd_ifinfo *ndi = &nd_ifinfo[ifp->if_index];
+ struct nd_ifinfo *ndi = NULL;
struct ip6_hdr *ip6 = mtod(m, struct ip6_hdr *);
struct nd_router_advert *nd_ra;
struct in6_addr saddr6 = ip6->ip6_src;
-#if 0
- struct in6_addr daddr6 = ip6->ip6_dst;
- int flags; /* = nd_ra->nd_ra_flags_reserved; */
- int is_managed = ((flags & ND_RA_FLAG_MANAGED) != 0);
- int is_other = ((flags & ND_RA_FLAG_OTHER) != 0);
-#endif
+ int mcast = 0;
union nd_opts ndopts;
- struct nd_defrouter *dr;
- struct timeval timenow;
-
- getmicrotime(&timenow);
+ struct nd_defrouter *dr = NULL;
+ u_int32_t mtu = 0;
+ char *lladdr = NULL;
+ u_int32_t lladdrlen = 0;
+ struct nd_prefix_list *nd_prefix_list_head = NULL;
+ u_int32_t nd_prefix_list_length = 0;
+ struct in6_ifaddr *ia6 = NULL;
+ struct nd_prefix_list *prfl;
+ struct nd_defrouter dr0;
+ u_int32_t advreachable;
+ boolean_t rti_defrtr_processed = FALSE;
- if (ip6_accept_rtadv == 0 && ((ifp->if_eflags & IFEF_ACCEPT_RTADVD) == 0))
+#if (DEVELOPMENT || DEBUG)
+ if (ip6_accept_rtadv == 0) {
goto freeit;
+ }
+#endif /* (DEVELOPMENT || DEBUG) */
+ /* Expect 32-bit aligned data pointer on strict-align platforms */
+ MBUF_STRICT_DATA_ALIGNMENT_CHECK_32(m);
+
+ /*
+ * Accept the RA if IFEF_ACCEPT_RTADV is set, or when
+ * we're acting as a router and the RA is locally generated.
+ * For convenience, we allow locally generated (rtadvd)
+ * RAs to be processed on the advertising interface, as a router.
+ *
+ * Note that we don't test against ip6_forwarding as we could be
+ * both a host and a router on different interfaces, hence the
+ * check against the per-interface flags.
+ */
+ if ((ifp->if_eflags & IFEF_ACCEPT_RTADV) == 0) {
+ if (ifp->if_ipv6_router_mode == IPV6_ROUTER_MODE_EXCLUSIVE &&
+ (ia6 = ifa_foraddr6(&saddr6)) != NULL) {
+ /* accept locally generated RA */
+ } else {
+ goto freeit;
+ }
+ }
+
+ if (ia6 != NULL) {
+ IFA_REMREF(&ia6->ia_ifa);
+ ia6 = NULL;
+ }
- if (ip6->ip6_hlim != 255) {
- nd6log((LOG_ERR,
+ if (ip6->ip6_hlim != IPV6_MAXHLIM) {
+ nd6log(error,
"nd6_ra_input: invalid hlim (%d) from %s to %s on %s\n",
ip6->ip6_hlim, ip6_sprintf(&ip6->ip6_src),
- ip6_sprintf(&ip6->ip6_dst), if_name(ifp)));
+ ip6_sprintf(&ip6->ip6_dst), if_name(ifp));
goto bad;
}
if (!IN6_IS_ADDR_LINKLOCAL(&saddr6)) {
- nd6log((LOG_ERR,
+ nd6log(error,
"nd6_ra_input: src %s is not link-local\n",
- ip6_sprintf(&saddr6)));
+ ip6_sprintf(&saddr6));
goto bad;
}
-#ifndef PULLDOWN_TEST
- IP6_EXTHDR_CHECK(m, off, icmp6len, return);
+ IP6_EXTHDR_CHECK(m, off, icmp6len, return );
+ ip6 = mtod(m, struct ip6_hdr *);
nd_ra = (struct nd_router_advert *)((caddr_t)ip6 + off);
-#else
- IP6_EXTHDR_GET(nd_ra, struct nd_router_advert *, m, off, icmp6len);
- if (nd_ra == NULL) {
- icmp6stat.icp6s_tooshort++;
- return;
- }
-#endif
icmp6len -= sizeof(*nd_ra);
nd6_option_init(nd_ra + 1, icmp6len, &ndopts);
if (nd6_options(&ndopts) < 0) {
- nd6log((LOG_INFO,
- "nd6_ra_input: invalid ND option, ignored\n"));
+ nd6log(info,
+ "nd6_ra_input: invalid ND option, ignored\n");
/* nd6_options have incremented stats */
goto freeit;
}
- {
- struct nd_defrouter dr0;
- u_int32_t advreachable = nd_ra->nd_ra_reachable;
+ advreachable = nd_ra->nd_ra_reachable;
- dr0.rtaddr = saddr6;
- dr0.flags = nd_ra->nd_ra_flags_reserved;
- dr0.rtlifetime = ntohs(nd_ra->nd_ra_router_lifetime);
- dr0.expire = timenow.tv_sec + dr0.rtlifetime;
- dr0.ifp = ifp;
- dr0.advint = 0; /* Mobile IPv6 */
- dr0.advint_expire = 0; /* Mobile IPv6 */
- dr0.advints_lost = 0; /* Mobile IPv6 */
+ /* remember if this is a multicasted advertisement */
+ if (IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst)) {
+ mcast = 1;
+ }
+
+ ndi = ND_IFINFO(ifp);
+ VERIFY(NULL != ndi && TRUE == ndi->initialized);
+ lck_mtx_lock(&ndi->lock);
/* unspecified or not? (RFC 2461 6.3.4) */
if (advreachable) {
advreachable = ntohl(advreachable);
ndi->recalctm = nd6_recalc_reachtm_interval; /* reset */
}
}
- if (nd_ra->nd_ra_retransmit)
+ if (nd_ra->nd_ra_retransmit) {
ndi->retrans = ntohl(nd_ra->nd_ra_retransmit);
- if (nd_ra->nd_ra_curhoplimit)
- ndi->chlim = nd_ra->nd_ra_curhoplimit;
- dr = defrtrlist_update(&dr0);
- }
+ }
+ if (nd_ra->nd_ra_curhoplimit) {
+ if (ndi->chlim < nd_ra->nd_ra_curhoplimit) {
+ ndi->chlim = nd_ra->nd_ra_curhoplimit;
+ } else if (ndi->chlim != nd_ra->nd_ra_curhoplimit) {
+ nd6log(error,
+ "RA with a lower CurHopLimit sent from "
+ "%s on %s (current = %d, received = %d). "
+ "Ignored.\n", ip6_sprintf(&ip6->ip6_src),
+ if_name(ifp), ndi->chlim,
+ nd_ra->nd_ra_curhoplimit);
+ }
+ }
+ lck_mtx_unlock(&ndi->lock);
+
+ /* Initialize nd_defrouter invariants for RA processing */
+ bzero(&dr0, sizeof(dr0));
+ dr0.rtaddr = saddr6;
+ dr0.ifp = ifp;
+
+ /*
+ * Route Information Option
+ */
+ if (ndopts.nd_opts_rti && IFNET_IS_ETHERNET(ifp)) {
+ struct nd_opt_hdr *rt = NULL;
+ struct sockaddr_in6 rti_gateway = {0};
+
+ rti_gateway.sin6_family = AF_INET6;
+ rti_gateway.sin6_len = sizeof(rti_gateway);
+ memcpy(&rti_gateway.sin6_addr, &saddr6, sizeof(rti_gateway.sin6_addr));
+
+ for (rt = (struct nd_opt_hdr *)ndopts.nd_opts_rti;
+ rt <= (struct nd_opt_hdr *)ndopts.nd_opts_rti_end;
+ rt = (struct nd_opt_hdr *)((caddr_t)rt +
+ (rt->nd_opt_len << ND_OPT_LEN_TO_BYTE_SCALE))) {
+ struct sockaddr_in6 rti_prefix = {};
+ struct nd_route_info rti = {};
+ struct nd_opt_route_info *rti_opt = NULL;
+ u_int32_t rounded_prefix_bytes = 0;
+
+ if (rt->nd_opt_type != ND_OPT_ROUTE_INFO) {
+ continue;
+ }
+
+ rti_opt = (struct nd_opt_route_info *)rt;
+ if ((rti_opt->nd_opt_rti_len < ND_OPT_LEN_RTI_MIN) ||
+ (rti_opt->nd_opt_rti_len > ND_OPT_LEN_RTI_MAX)) {
+ nd6log(info,
+ "%s: invalid option "
+ "len %d for route information option, "
+ "ignored\n", __func__,
+ rti_opt->nd_opt_rti_len);
+ continue;
+ }
+
+ if (rti_opt->nd_opt_rti_prefixlen > ND_OPT_RTI_PFXLEN_MAX) {
+ nd6log(info,
+ "%s: invalid prefix length %d "
+ "in the route information option, "
+ "ignored\n", __func__, rti_opt->nd_opt_rti_prefixlen);
+ continue;
+ }
+
+ if (rti_opt->nd_opt_rti_prefixlen != 0 &&
+ rti_opt->nd_opt_rti_prefixlen <= 64 &&
+ rti_opt->nd_opt_rti_len == ND_OPT_LEN_RTI_MIN) {
+ nd6log(info,
+ "%s: invalid prefix "
+ "len %d is OOB for route information option, "
+ "with total option length of %d. Ignored.\n",
+ __func__, rti_opt->nd_opt_rti_prefixlen,
+ rti_opt->nd_opt_rti_len);
+ continue;
+ }
+
+ if (rti_opt->nd_opt_rti_prefixlen > 64 &&
+ rti_opt->nd_opt_rti_len != ND_OPT_LEN_RTI_MAX) {
+ nd6log(info,
+ "%s: invalid prefix "
+ "len %d is OOB for route information option, "
+ "with total option length of %d. Ignored.\n",
+ __func__, rti_opt->nd_opt_rti_prefixlen,
+ rti_opt->nd_opt_rti_len);
+ continue;
+ }
+
+ if ((rti_opt->nd_opt_rti_flags & ND_RA_FLAG_RTPREF_MASK) ==
+ ND_RA_FLAG_RTPREF_RSV) {
+ nd6log(info,
+ "%s: using reserved preference mask, "
+ "ignored\n", __func__);
+ continue;
+ }
+
+ rti_prefix.sin6_family = AF_INET6;
+ rti_prefix.sin6_len = sizeof(rti_prefix);
+
+ rounded_prefix_bytes = rti_opt->nd_opt_rti_prefixlen >> 3;
+ if (rti_opt->nd_opt_rti_prefixlen & 0x7) {
+ rounded_prefix_bytes++;
+ }
+ memcpy(&rti_prefix.sin6_addr, rti_opt + 1, rounded_prefix_bytes);
+
+ nd6log(info, "%s: received RA with route opt, "
+ "prefix %s/%u pref %u lifetime %u\n", __func__,
+ ip6_sprintf(&rti_prefix.sin6_addr),
+ rti_opt->nd_opt_rti_prefixlen,
+ rti_opt->nd_opt_rti_flags,
+ ntohl(rti_opt->nd_opt_rti_lifetime));
+
+ dr0.flags = rti_opt->nd_opt_rti_flags;
+ dr0.stateflags = 0;
+
+ /*
+ * https://tools.ietf.org/html/rfc4191#section-3.1
+ * Type C Host requirements:
+ * The Router Preference and Lifetime values in a
+ * ::/0 Route Information Option override the
+ * preference and lifetime values in the Router
+ * Advertisement header.
+ */
+ if (IN6_IS_ADDR_UNSPECIFIED(&rti_prefix.sin6_addr)) {
+ rti_defrtr_processed = TRUE;
+ /*
+ * If the router lifetime is 0, set the state flag
+ * to dummy, so that it is skipped and not used as a
+ * default router.
+ * Set the lifetime to 2 hrs to make sure we get rid
+ * of the router eventually if this was indeed for a router
+ * going away.
+ *
+ * We partly have to do this to ensure advertised prefixes
+ * stay onlink.
+ * A periodic RA would also keep refreshing the cached
+ * neighbor cache entry if it contains source link layer
+ * information.
+ */
+ if (rti_opt->nd_opt_rti_lifetime == 0) {
+ dr0.rtlifetime = TWOHOUR;
+ dr0.stateflags |= NDDRF_INELIGIBLE;
+ } else {
+ dr0.rtlifetime = ntohl(rti_opt->nd_opt_rti_lifetime);
+ }
+ dr0.expire = net_uptime() + dr0.rtlifetime;
+
+ lck_mtx_lock(nd6_mutex);
+ dr = defrtrlist_update(&dr0, NULL);
+ lck_mtx_unlock(nd6_mutex);
+ continue;
+ }
+
+ dr0.rtlifetime = ntohl(rti_opt->nd_opt_rti_lifetime);
+ dr0.expire = net_uptime() + dr0.rtlifetime;
+ bzero(&rti, sizeof(rti));
+ rti.nd_rti_prefixlen = rti_opt->nd_opt_rti_prefixlen;
+ rti.nd_rti_prefix = rti_prefix.sin6_addr;
+ nd6_rtilist_update(&rti, &dr0);
+ }
+ }
+
+ if (!rti_defrtr_processed) {
+ dr0.flags = nd_ra->nd_ra_flags_reserved;
+ dr0.stateflags = 0;
+ /*
+ * If the router lifetime is 0, set the state flag
+ * to dummy, so that it is skipped and not used as a
+ * default router.
+ * Set the lifetime to 2 hrs to make sure we get rid
+ * of the router eventually if this was indeed for a router
+ * going away.
+ *
+ * We partly have to do this to ensure advertised prefixes
+ * stay onlink.
+ * A periodic RA would also keep refreshing the cached
+ * neighbor cache entry if it contains source link layer
+ * information.
+ */
+ if (nd_ra->nd_ra_router_lifetime == 0) {
+ dr0.rtlifetime = TWOHOUR;
+ dr0.stateflags |= NDDRF_INELIGIBLE;
+ } else {
+ dr0.rtlifetime = ntohs(nd_ra->nd_ra_router_lifetime);
+ }
+ dr0.expire = net_uptime() + dr0.rtlifetime;
+ lck_mtx_lock(nd6_mutex);
+ dr = defrtrlist_update(&dr0, NULL);
+ lck_mtx_unlock(nd6_mutex);
+ }
/*
* prefix
struct nd_prefix pr;
for (pt = (struct nd_opt_hdr *)ndopts.nd_opts_pi;
- pt <= (struct nd_opt_hdr *)ndopts.nd_opts_pi_end;
- pt = (struct nd_opt_hdr *)((caddr_t)pt +
- (pt->nd_opt_len << 3))) {
- if (pt->nd_opt_type != ND_OPT_PREFIX_INFORMATION)
+ pt <= (struct nd_opt_hdr *)ndopts.nd_opts_pi_end;
+ pt = (struct nd_opt_hdr *)((caddr_t)pt +
+ (pt->nd_opt_len << ND_OPT_LEN_TO_BYTE_SCALE))) {
+ struct in6_addr pi_mask;
+ bzero(&pi_mask, sizeof(pi_mask));
+
+ if (pt->nd_opt_type != ND_OPT_PREFIX_INFORMATION) {
continue;
+ }
pi = (struct nd_opt_prefix_info *)pt;
if (pi->nd_opt_pi_len != 4) {
- nd6log((LOG_INFO,
+ nd6log(info,
"nd6_ra_input: invalid option "
"len %d for prefix information option, "
- "ignored\n", pi->nd_opt_pi_len));
+ "ignored\n", pi->nd_opt_pi_len);
continue;
}
if (128 < pi->nd_opt_pi_prefix_len) {
- nd6log((LOG_INFO,
+ nd6log(info,
"nd6_ra_input: invalid prefix "
"len %d for prefix information option, "
- "ignored\n", pi->nd_opt_pi_prefix_len));
- continue;
- }
-
- if (IN6_IS_ADDR_MULTICAST(&pi->nd_opt_pi_prefix)
- || IN6_IS_ADDR_LINKLOCAL(&pi->nd_opt_pi_prefix)) {
- nd6log((LOG_INFO,
- "nd6_ra_input: invalid prefix "
- "%s, ignored\n",
- ip6_sprintf(&pi->nd_opt_pi_prefix)));
+ "ignored\n", pi->nd_opt_pi_prefix_len);
continue;
}
- /* aggregatable unicast address, rfc2374 */
- if ((pi->nd_opt_pi_prefix.s6_addr8[0] & 0xe0) == 0x20
- && pi->nd_opt_pi_prefix_len != 64) {
- nd6log((LOG_INFO,
- "nd6_ra_input: invalid prefixlen "
- "%d for rfc2374 prefix %s, ignored\n",
- pi->nd_opt_pi_prefix_len,
- ip6_sprintf(&pi->nd_opt_pi_prefix)));
+ /*
+ * To ignore ::/64 make sure bits beyond prefixlen
+ * are set to zero
+ */
+ in6_prefixlen2mask(&pi_mask, pi->nd_opt_pi_prefix_len);
+ pi->nd_opt_pi_prefix.s6_addr32[0] &= pi_mask.s6_addr32[0];
+ pi->nd_opt_pi_prefix.s6_addr32[1] &= pi_mask.s6_addr32[1];
+ pi->nd_opt_pi_prefix.s6_addr32[2] &= pi_mask.s6_addr32[2];
+ pi->nd_opt_pi_prefix.s6_addr32[3] &= pi_mask.s6_addr32[3];
+
+ if (IN6_IS_ADDR_UNSPECIFIED(&pi->nd_opt_pi_prefix) ||
+ IN6_IS_ADDR_MULTICAST(&pi->nd_opt_pi_prefix) ||
+ IN6_IS_ADDR_LINKLOCAL(&pi->nd_opt_pi_prefix)) {
+ nd6log(info,
+ "%s: invalid prefix %s, ignored\n",
+ __func__,
+ ip6_sprintf(&pi->nd_opt_pi_prefix));
continue;
}
bzero(&pr, sizeof(pr));
+ lck_mtx_init(&pr.ndpr_lock, ifa_mtx_grp, ifa_mtx_attr);
+ NDPR_LOCK(&pr);
pr.ndpr_prefix.sin6_family = AF_INET6;
pr.ndpr_prefix.sin6_len = sizeof(pr.ndpr_prefix);
pr.ndpr_prefix.sin6_addr = pi->nd_opt_pi_prefix;
pr.ndpr_ifp = m->m_pkthdr.rcvif;
pr.ndpr_raf_onlink = (pi->nd_opt_pi_flags_reserved &
- ND_OPT_PI_FLAG_ONLINK) ? 1 : 0;
+ ND_OPT_PI_FLAG_ONLINK) ? 1 : 0;
pr.ndpr_raf_auto = (pi->nd_opt_pi_flags_reserved &
- ND_OPT_PI_FLAG_AUTO) ? 1 : 0;
+ ND_OPT_PI_FLAG_AUTO) ? 1 : 0;
pr.ndpr_plen = pi->nd_opt_pi_prefix_len;
pr.ndpr_vltime = ntohl(pi->nd_opt_pi_valid_time);
pr.ndpr_pltime =
- ntohl(pi->nd_opt_pi_preferred_time);
+ ntohl(pi->nd_opt_pi_preferred_time);
+
+ /*
+ * Exceptions to stateless autoconfiguration processing:
+ * + nd6_accept_6to4 == 0 && address has 6to4 prefix
+ * + ip6_only_allow_rfc4193_prefix != 0 &&
+ * address not RFC 4193
+ */
+ if (ip6_only_allow_rfc4193_prefix &&
+ !IN6_IS_ADDR_UNIQUE_LOCAL(&pi->nd_opt_pi_prefix)) {
+ nd6log(info,
+ "nd6_ra_input: no SLAAC on prefix %s "
+ "[not RFC 4193]\n",
+ ip6_sprintf(&pi->nd_opt_pi_prefix));
+ pr.ndpr_raf_auto = 0;
+ } else if (!nd6_accept_6to4 &&
+ IN6_IS_ADDR_6TO4(&pi->nd_opt_pi_prefix)) {
+ nd6log(info,
+ "%s: no SLAAC on prefix %s "
+ "[6to4]\n", __func__,
+ ip6_sprintf(&pi->nd_opt_pi_prefix));
+ pr.ndpr_raf_auto = 0;
+ }
- if (in6_init_prefix_ltimes(&pr))
+ if (in6_init_prefix_ltimes(&pr)) {
+ NDPR_UNLOCK(&pr);
+ lck_mtx_destroy(&pr.ndpr_lock, ifa_mtx_grp);
continue; /* prefix lifetime init failed */
+ } else {
+ NDPR_UNLOCK(&pr);
+ }
+ (void) prelist_update(&pr, dr, m, mcast);
+ lck_mtx_destroy(&pr.ndpr_lock, ifa_mtx_grp);
+
+ /*
+ * We have to copy the values out after the
+ * prelist_update call since some of these values won't
+ * be properly set until after the router advertisement
+ * updating can vet the values.
+ */
+ prfl = NULL;
+ MALLOC(prfl, struct nd_prefix_list *, sizeof(*prfl),
+ M_TEMP, M_WAITOK | M_ZERO);
+
+ if (prfl == NULL) {
+ log(LOG_DEBUG, "%s: unable to MALLOC RA prefix "
+ "structure\n", __func__);
+ continue;
+ }
- (void)prelist_update(&pr, dr, m);
+ /* this is only for nd6_post_msg(), otherwise unused */
+ bcopy(&pr.ndpr_prefix, &prfl->pr.ndpr_prefix,
+ sizeof(prfl->pr.ndpr_prefix));
+ prfl->pr.ndpr_raf = pr.ndpr_raf;
+ prfl->pr.ndpr_plen = pr.ndpr_plen;
+ prfl->pr.ndpr_vltime = pr.ndpr_vltime;
+ prfl->pr.ndpr_pltime = pr.ndpr_pltime;
+ prfl->pr.ndpr_expire = pr.ndpr_expire;
+ prfl->pr.ndpr_base_calendartime =
+ pr.ndpr_base_calendartime;
+ prfl->pr.ndpr_base_uptime = pr.ndpr_base_uptime;
+ prfl->pr.ndpr_stateflags = pr.ndpr_stateflags;
+ prfl->pr.ndpr_addrcnt = pr.ndpr_addrcnt;
+ prfl->pr.ndpr_ifp = pr.ndpr_ifp;
+
+ prfl->next = nd_prefix_list_head;
+ nd_prefix_list_head = prfl;
+ nd_prefix_list_length++;
}
}
+
/*
* MTU
*/
if (ndopts.nd_opts_mtu && ndopts.nd_opts_mtu->nd_opt_mtu_len == 1) {
- u_int32_t mtu = ntohl(ndopts.nd_opts_mtu->nd_opt_mtu_mtu);
-
+ mtu = ntohl(ndopts.nd_opts_mtu->nd_opt_mtu_mtu);
/* lower bound */
if (mtu < IPV6_MMTU) {
- nd6log((LOG_INFO, "nd6_ra_input: bogus mtu option "
+ nd6log(info, "nd6_ra_input: bogus mtu option "
"mtu=%d sent from %s, ignoring\n",
- mtu, ip6_sprintf(&ip6->ip6_src)));
+ mtu, ip6_sprintf(&ip6->ip6_src));
goto skip;
}
+ lck_mtx_lock(&ndi->lock);
/* upper bound */
if (ndi->maxmtu) {
if (mtu <= ndi->maxmtu) {
int change = (ndi->linkmtu != mtu);
ndi->linkmtu = mtu;
- if (change) /* in6_maxmtu may change */
+ lck_mtx_unlock(&ndi->lock);
+ if (change) { /* in6_maxmtu may change */
in6_setmaxmtu();
+ }
} else {
- nd6log((LOG_INFO, "nd6_ra_input: bogus mtu "
+ nd6log(info, "nd6_ra_input: bogus mtu "
"mtu=%d sent from %s; "
"exceeds maxmtu %d, ignoring\n",
mtu, ip6_sprintf(&ip6->ip6_src),
- ndi->maxmtu));
+ ndi->maxmtu);
+ lck_mtx_unlock(&ndi->lock);
}
} else {
- nd6log((LOG_INFO, "nd6_ra_input: mtu option "
+ lck_mtx_unlock(&ndi->lock);
+ nd6log(info, "nd6_ra_input: mtu option "
"mtu=%d sent from %s; maxmtu unknown, "
"ignoring\n",
- mtu, ip6_sprintf(&ip6->ip6_src)));
+ mtu, ip6_sprintf(&ip6->ip6_src));
}
}
- skip:
-
+skip:
+
/*
* Source link layer address
*/
- {
- char *lladdr = NULL;
- int lladdrlen = 0;
-
if (ndopts.nd_opts_src_lladdr) {
lladdr = (char *)(ndopts.nd_opts_src_lladdr + 1);
lladdrlen = ndopts.nd_opts_src_lladdr->nd_opt_len << 3;
}
if (lladdr && ((ifp->if_addrlen + 2 + 7) & ~7) != lladdrlen) {
- nd6log((LOG_INFO,
+ nd6log(info,
"nd6_ra_input: lladdrlen mismatch for %s "
"(if %d, RA packet %d)\n",
- ip6_sprintf(&saddr6), ifp->if_addrlen, lladdrlen - 2));
+ ip6_sprintf(&saddr6), ifp->if_addrlen, lladdrlen - 2);
goto bad;
}
- nd6_cache_lladdr(ifp, &saddr6, lladdr, lladdrlen, ND_ROUTER_ADVERT, 0);
+ if (dr && dr->stateflags & NDDRF_MAPPED) {
+ saddr6 = dr->rtaddr_mapped;
+ }
+
+ nd6_cache_lladdr(ifp, &saddr6, lladdr, (int)lladdrlen,
+ ND_ROUTER_ADVERT, 0);
+
+ /* Post message */
+ nd6_post_msg(KEV_ND6_RA, nd_prefix_list_head, nd_prefix_list_length,
+ mtu);
/*
* Installing a link-layer address might change the state of the
* router's neighbor cache, which might also affect our on-link
* detection of adveritsed prefixes.
*/
- pfxlist_onlink_check(0);
- }
+ lck_mtx_lock(nd6_mutex);
+ pfxlist_onlink_check();
+ lck_mtx_unlock(nd6_mutex);
- freeit:
+freeit:
m_freem(m);
+ if (dr) {
+ NDDR_REMREF(dr);
+ }
+
+ prfl = NULL;
+ while ((prfl = nd_prefix_list_head) != NULL) {
+ nd_prefix_list_head = prfl->next;
+ FREE(prfl, M_TEMP);
+ }
+
return;
- bad:
+bad:
icmp6stat.icp6s_badra++;
- m_freem(m);
+ goto freeit;
}
/*
/* tell the change to user processes watching the routing socket. */
static void
-nd6_rtmsg(cmd, rt)
- int cmd;
- struct rtentry *rt;
+nd6_rtmsg(u_char cmd, struct rtentry *rt)
{
struct rt_addrinfo info;
+ struct ifnet *ifp = rt->rt_ifp;
- lck_mtx_assert(rt_mtx, LCK_MTX_ASSERT_OWNED);
+ RT_LOCK_ASSERT_HELD(rt);
bzero((caddr_t)&info, sizeof(info));
+ /* It's not necessary to lock ifp for if_lladdr */
info.rti_info[RTAX_DST] = rt_key(rt);
info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
info.rti_info[RTAX_NETMASK] = rt_mask(rt);
- info.rti_info[RTAX_IFP] =
- TAILQ_FIRST(&rt->rt_ifp->if_addrlist)->ifa_addr;
+ /*
+ * ifa_addr pointers for both should always be valid
+ * in this context; no need to hold locks.
+ */
+ info.rti_info[RTAX_IFP] = ifp->if_lladdr->ifa_addr;
info.rti_info[RTAX_IFA] = rt->rt_ifa->ifa_addr;
rt_missmsg(cmd, &info, rt->rt_flags, 0);
}
-void
-defrouter_addreq(
- struct nd_defrouter *new)
+static void
+defrouter_addreq(struct nd_defrouter *new, struct nd_route_info *rti, boolean_t scoped)
{
- struct sockaddr_in6 def, mask, gate;
+ struct sockaddr_in6 key, mask, gate;
struct rtentry *newrt = NULL;
+ unsigned int ifscope;
+ int err;
+ struct nd_ifinfo *ndi = ND_IFINFO(new->ifp);
+ int rtflags = RTF_GATEWAY;
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_NOTOWNED);
+ NDDR_LOCK_ASSERT_NOTHELD(new);
+ /*
+ * We're free to lock and unlock NDDR because our callers
+ * are holding an extra reference for us.
+ */
+
+ NDDR_LOCK(new);
+ if (new->stateflags & NDDRF_INSTALLED) {
+ goto out;
+ }
+ if (new->ifp->if_ipv6_router_mode == IPV6_ROUTER_MODE_EXCLUSIVE) {
+ nd6log2(info, "%s: ignoring router %s, scoped=%d, "
+ "static=%d on advertising interface\n", if_name(new->ifp),
+ ip6_sprintf(&new->rtaddr), scoped,
+ (new->stateflags & NDDRF_STATIC) ? 1 : 0);
+ goto out;
+ }
- Bzero(&def, sizeof(def));
+ nd6log2(info, "%s: adding default router %s, scoped=%d, "
+ "static=%d\n", if_name(new->ifp), ip6_sprintf(&new->rtaddr),
+ scoped, (new->stateflags & NDDRF_STATIC) ? 1 : 0);
+
+ Bzero(&key, sizeof(key));
Bzero(&mask, sizeof(mask));
Bzero(&gate, sizeof(gate));
- def.sin6_len = mask.sin6_len = gate.sin6_len
- = sizeof(struct sockaddr_in6);
- def.sin6_family = mask.sin6_family = gate.sin6_family = AF_INET6;
- gate.sin6_addr = new->rtaddr;
+ key.sin6_len = mask.sin6_len = gate.sin6_len
+ = sizeof(struct sockaddr_in6);
+ key.sin6_family = mask.sin6_family = gate.sin6_family = AF_INET6;
- lck_mtx_lock(rt_mtx);
- (void)rtrequest_locked(RTM_ADD, (struct sockaddr *)&def,
- (struct sockaddr *)&gate, (struct sockaddr *)&mask,
- RTF_GATEWAY, &newrt);
- if (newrt) {
- nd6_rtmsg(RTM_ADD, newrt); /* tell user process */
- rtunref(newrt);
+ if (rti != NULL) {
+ key.sin6_addr = rti->nd_rti_prefix;
+ in6_len2mask(&mask.sin6_addr, rti->nd_rti_prefixlen);
+ if (rti->nd_rti_prefixlen == ND_OPT_RTI_PFXLEN_MAX) {
+ rtflags |= RTF_HOST;
+ } else {
+ rtflags |= RTF_PRCLONING;
+ }
}
- lck_mtx_unlock(rt_mtx);
- return;
-}
-
-/* Add a route to a given interface as default */
-void
-defrouter_addifreq(
- struct ifnet *ifp)
-{
- struct sockaddr_in6 def, mask;
- struct ifaddr *ifa = NULL;
- struct rtentry *newrt = NULL;
- int error;
- u_long flags;
- bzero(&def, sizeof(def));
- bzero(&mask, sizeof(mask));
+ if (new->stateflags & NDDRF_MAPPED) {
+ gate.sin6_addr = new->rtaddr_mapped;
+ } else {
+ gate.sin6_addr = new->rtaddr;
+ }
- def.sin6_len = mask.sin6_len = sizeof(struct sockaddr_in6);
- def.sin6_family = mask.sin6_family = AF_INET6;
+ ifscope = scoped ? new->ifp->if_index : IFSCOPE_NONE;
+ NDDR_UNLOCK(new);
/*
- * Search for an ifaddr beloging to the specified interface.
- * XXX: An IPv6 address are required to be assigned on the interface.
+ * Cellular networks may have buggy deployments
+ * with gateway IPv6 link local address with same
+ * interface identifier as the one that has been
+ * assigned for the cellular context.
+ * If gateway is same as locally configured link local
+ * interface on cellular interface, generated a different one
+ * and store it in the nd_defrouter entry and use it to work
+ * on routing table
*/
- if ((ifa = ifaof_ifpforaddr((struct sockaddr *)&def, ifp)) == NULL) {
- nd6log((LOG_ERR, /* better error? */
- "defrouter_addifreq: failed to find an ifaddr "
- "to install a route to interface %s\n",
- if_name(ifp)));
- return;
+ if (new->ifp->if_type == IFT_CELLULAR &&
+ !(new->stateflags & NDDRF_STATIC) &&
+ !(new->stateflags & NDDRF_MAPPED) &&
+ IN6_IS_ADDR_LINKLOCAL(&gate.sin6_addr) &&
+ ndi && !(ndi->flags & ND6_IFF_PERFORMNUD)) {
+ struct in6_ifaddr *tmp_ia6 = in6ifa_ifpforlinklocal(new->ifp, 0);
+
+ if (tmp_ia6 != NULL &&
+ !(tmp_ia6->ia6_flags & IN6_IFF_NOTMANUAL) &&
+ IN6_ARE_ADDR_EQUAL(&tmp_ia6->ia_addr.sin6_addr,
+ &gate.sin6_addr)) {
+ gate.sin6_addr.s6_addr8[15] += 1;
+ new->rtaddr_mapped = gate.sin6_addr;
+ new->stateflags |= NDDRF_MAPPED;
+
+ nd6log(info, "%s: Default router %s mapped "
+ "to ", if_name(new->ifp), ip6_sprintf(&new->rtaddr));
+ nd6log(info, "%s\n", ip6_sprintf(&new->rtaddr_mapped));
+ }
}
- lck_mtx_lock(rt_mtx);
- flags = ifa->ifa_flags;
- error = rtrequest_locked(RTM_ADD, (struct sockaddr *)&def, ifa->ifa_addr,
- (struct sockaddr *)&mask, flags, &newrt);
- if (error != 0) {
- nd6log((LOG_ERR,
- "defrouter_addifreq: failed to install a route to "
- "interface %s (errno = %d)\n",
- if_name(ifp), error));
+ err = rtrequest_scoped(RTM_ADD, (struct sockaddr *)&key,
+ (struct sockaddr *)&gate, (struct sockaddr *)&mask,
+ rtflags, &newrt, ifscope);
- if (newrt) /* maybe unnecessary, but do it for safety */
- rtunref(newrt);
- } else {
- if (newrt) {
- nd6_rtmsg(RTM_ADD, newrt);
- rtunref(newrt);
+ if (newrt) {
+ RT_LOCK(newrt);
+ nd6_rtmsg(RTM_ADD, newrt); /* tell user process */
+ RT_REMREF_LOCKED(newrt);
+ RT_UNLOCK(newrt);
+ NDDR_LOCK(new);
+ new->stateflags |= NDDRF_INSTALLED;
+ if (ifscope != IFSCOPE_NONE) {
+ new->stateflags |= NDDRF_IFSCOPE;
}
- in6_post_msg(ifp, KEV_INET6_DEFROUTER, (struct in6_ifaddr *)ifa);
+ } else {
+ nd6log(error, "%s: failed to add default router "
+ "%s on %s scoped %d (errno = %d)\n", __func__,
+ ip6_sprintf(&gate.sin6_addr), if_name(new->ifp),
+ (ifscope != IFSCOPE_NONE), err);
+ NDDR_LOCK(new);
}
- lck_mtx_unlock(rt_mtx);
- ifafree(ifa);
+ new->err = err;
+
+out:
+ NDDR_UNLOCK(new);
}
struct nd_defrouter *
defrouter_lookup(
+ struct nd_drhead *nd_router_listp,
struct in6_addr *addr,
struct ifnet *ifp)
{
struct nd_defrouter *dr;
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
- lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
-
- for (dr = TAILQ_FIRST(&nd_defrouter); dr;
- dr = TAILQ_NEXT(dr, dr_entry)) {
- if (dr->ifp == ifp && IN6_ARE_ADDR_EQUAL(addr, &dr->rtaddr))
- return(dr);
+ if (nd_router_listp == NULL) {
+ nd_router_listp = &nd_defrouter_list;
}
- return(NULL); /* search failed */
-}
-
-void
-defrouter_delreq(
- struct nd_defrouter *dr,
- int dofree)
-{
- struct sockaddr_in6 def, mask, gate;
- struct rtentry *oldrt = NULL;
-
- Bzero(&def, sizeof(def));
- Bzero(&mask, sizeof(mask));
- Bzero(&gate, sizeof(gate));
-
- def.sin6_len = mask.sin6_len = gate.sin6_len
- = sizeof(struct sockaddr_in6);
- def.sin6_family = mask.sin6_family = gate.sin6_family = AF_INET6;
- gate.sin6_addr = dr->rtaddr;
-
- lck_mtx_lock(rt_mtx);
- rtrequest_locked(RTM_DELETE, (struct sockaddr *)&def,
- (struct sockaddr *)&gate,
- (struct sockaddr *)&mask,
- RTF_GATEWAY, &oldrt);
- if (oldrt) {
- nd6_rtmsg(RTM_DELETE, oldrt);
- if (oldrt->rt_refcnt <= 0) {
- /*
- * XXX: borrowed from the RTM_DELETE case of
- * rtrequest().
- */
- rtref(oldrt);
- rtfree_locked(oldrt);
+ for (dr = TAILQ_FIRST(nd_router_listp); dr;
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ NDDR_LOCK(dr);
+ if (dr->ifp == ifp && IN6_ARE_ADDR_EQUAL(addr, &dr->rtaddr)) {
+ NDDR_ADDREF(dr);
+ NDDR_UNLOCK(dr);
+ return dr;
}
+ NDDR_UNLOCK(dr);
}
- if (dofree) /* XXX: necessary? */
- FREE(dr, M_IP6NDP);
- lck_mtx_unlock(rt_mtx);
+ return NULL; /* search failed */
}
-void
-defrtrlist_del(
- struct nd_defrouter *dr, int nd6locked)
+/*
+ * Remove the default route for a given router.
+ * This is just a subroutine function for defrouter_select(), and should
+ * not be called from anywhere else.
+ */
+static void
+defrouter_delreq(struct nd_defrouter *dr, struct nd_route_info *rti)
{
- struct nd_defrouter *deldr = NULL;
- struct nd_prefix *pr;
+ struct sockaddr_in6 key, mask, gate;
+ struct rtentry *oldrt = NULL;
+ unsigned int ifscope;
+ int err;
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_NOTOWNED);
+ NDDR_LOCK_ASSERT_NOTHELD(dr);
/*
- * Flush all the routing table entries that use the router
- * as a next hop.
+ * We're free to lock and unlock NDDR because our callers
+ * are holding an extra reference for us.
*/
- if (!ip6_forwarding && (ip6_accept_rtadv || (dr->ifp->if_eflags & IFEF_ACCEPT_RTADVD))) {
- /* above is a good condition? */
- rt6_flush(&dr->rtaddr, dr->ifp);
+ NDDR_LOCK(dr);
+ /* ifp would be NULL for the "drany" case */
+ if (dr->ifp != NULL && !(dr->stateflags & NDDRF_INSTALLED)) {
+ goto out;
}
- if (nd6locked == 0)
- lck_mtx_lock(nd6_mutex);
- if (dr == TAILQ_FIRST(&nd_defrouter))
- deldr = dr; /* The router is primary. */
+ nd6log2(info, "%s: removing default router %s, scoped=%d, "
+ "static=%d\n", dr->ifp != NULL ? if_name(dr->ifp) : "ANY",
+ ip6_sprintf(&dr->rtaddr), (dr->stateflags & NDDRF_IFSCOPE) ? 1 : 0,
+ (dr->stateflags & NDDRF_STATIC) ? 1 : 0);
+
+ Bzero(&key, sizeof(key));
+ Bzero(&mask, sizeof(mask));
+ Bzero(&gate, sizeof(gate));
+
+ key.sin6_len = mask.sin6_len = gate.sin6_len
+ = sizeof(struct sockaddr_in6);
+ key.sin6_family = mask.sin6_family = gate.sin6_family = AF_INET6;
- TAILQ_REMOVE(&nd_defrouter, dr, dr_entry);
+ if (rti != NULL) {
+ key.sin6_addr = rti->nd_rti_prefix;
+ in6_len2mask(&mask.sin6_addr, rti->nd_rti_prefixlen);
+ }
/*
- * Also delete all the pointers to the router in each prefix lists.
+ * The router entry may be mapped to a different address.
+ * If that is the case, use the mapped address as gateway
+ * to do operation on the routing table.
+ * To get more context, read the related comment in
+ * defrouter_addreq
*/
- for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
- struct nd_pfxrouter *pfxrtr;
- if ((pfxrtr = pfxrtr_lookup(pr, dr)) != NULL)
- pfxrtr_del(pfxrtr);
+ if (dr->stateflags & NDDRF_MAPPED) {
+ gate.sin6_addr = dr->rtaddr_mapped;
+ } else {
+ gate.sin6_addr = dr->rtaddr;
}
- pfxlist_onlink_check(1);
- /*
- * If the router is the primary one, choose a new one.
- * Note that defrouter_select() will remove the current gateway
- * from the routing table.
- */
- if (deldr)
- defrouter_select();
+ if (dr->ifp != NULL) {
+ ifscope = (dr->stateflags & NDDRF_IFSCOPE) ?
+ dr->ifp->if_index : IFSCOPE_NONE;
+ } else {
+ ifscope = IFSCOPE_NONE;
+ }
+ NDDR_UNLOCK(dr);
- if (nd6locked == 0)
- lck_mtx_unlock(nd6_mutex);
+ err = rtrequest_scoped(RTM_DELETE,
+ (struct sockaddr *)&key, (struct sockaddr *)&gate,
+ (struct sockaddr *)&mask, RTF_GATEWAY, &oldrt, ifscope);
- FREE(dr, M_IP6NDP);
+ if (oldrt) {
+ RT_LOCK(oldrt);
+ nd6_rtmsg(RTM_DELETE, oldrt);
+ RT_UNLOCK(oldrt);
+ rtfree(oldrt);
+ } else if (err != ESRCH) {
+ nd6log(error, "%s: failed to delete default router "
+ "%s on %s scoped %d (errno = %d)\n", __func__,
+ ip6_sprintf(&gate.sin6_addr), dr->ifp != NULL ?
+ if_name(dr->ifp) : "ANY", (ifscope != IFSCOPE_NONE), err);
+ }
+ NDDR_LOCK(dr);
+ /* ESRCH means it's no longer in the routing table; ignore it */
+ if (oldrt != NULL || err == ESRCH) {
+ dr->stateflags &= ~NDDRF_INSTALLED;
+ if (ifscope != IFSCOPE_NONE) {
+ dr->stateflags &= ~NDDRF_IFSCOPE;
+ }
+ }
+ dr->err = 0;
+out:
+ NDDR_UNLOCK(dr);
}
+
/*
- * Default Router Selection according to Section 6.3.6 of RFC 2461:
- * 1) Routers that are reachable or probably reachable should be
- * preferred.
- * 2) When no routers on the list are known to be reachable or
- * probably reachable, routers SHOULD be selected in a round-robin
- * fashion.
- * 3) If the Default Router List is empty, assume that all
- * destinations are on-link.
+ * remove all default routes from default router list
*/
void
-defrouter_select()
+defrouter_reset(void)
{
- struct nd_defrouter *dr, anydr;
- struct rtentry *rt = NULL;
- struct llinfo_nd6 *ln = NULL;
-
- /*
- * Search for a (probably) reachable router from the list.
- */
- lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
-
- for (dr = TAILQ_FIRST(&nd_defrouter); dr;
- dr = TAILQ_NEXT(dr, dr_entry)) {
- if ((rt = nd6_lookup(&dr->rtaddr, 0, dr->ifp, 0)) &&
- (ln = (struct llinfo_nd6 *)rt->rt_llinfo) &&
- ND6_IS_LLINFO_PROBREACH(ln)) {
- /* Got it, and move it to the head */
- TAILQ_REMOVE(&nd_defrouter, dr, dr_entry);
- TAILQ_INSERT_HEAD(&nd_defrouter, dr, dr_entry);
- break;
+ struct nd_defrouter *dr, drany;
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ dr = TAILQ_FIRST(&nd_defrouter_list);
+ while (dr) {
+ NDDR_LOCK(dr);
+ if (dr->stateflags & NDDRF_INSTALLED) {
+ NDDR_ADDREF(dr);
+ NDDR_UNLOCK(dr);
+ lck_mtx_unlock(nd6_mutex);
+ defrouter_delreq(dr, NULL);
+ lck_mtx_lock(nd6_mutex);
+ NDDR_REMREF(dr);
+ dr = TAILQ_FIRST(&nd_defrouter_list);
+ } else {
+ NDDR_UNLOCK(dr);
+ dr = TAILQ_NEXT(dr, dr_entry);
}
}
- if ((dr = TAILQ_FIRST(&nd_defrouter))) {
- /*
- * De-install the previous default gateway and install
- * a new one.
- * Note that if there is no reachable router in the list,
- * the head entry will be used anyway.
- * XXX: do we have to check the current routing table entry?
+ /* Nuke primary (non-scoped) default router */
+ bzero(&drany, sizeof(drany));
+ lck_mtx_init(&drany.nddr_lock, ifa_mtx_grp, ifa_mtx_attr);
+ lck_mtx_unlock(nd6_mutex);
+ defrouter_delreq(&drany, NULL);
+ lck_mtx_destroy(&drany.nddr_lock, ifa_mtx_grp);
+ lck_mtx_lock(nd6_mutex);
+}
+
+int
+defrtrlist_ioctl(u_long cmd, caddr_t data)
+{
+ struct nd_defrouter dr0;
+ unsigned int ifindex;
+ struct ifnet *dr_ifp;
+ int error = 0, add = 0;
+
+ /* XXX Handle mapped default router entries */
+ switch (cmd) {
+ case SIOCDRADD_IN6_32: /* struct in6_defrouter_32 */
+ case SIOCDRADD_IN6_64: /* struct in6_defrouter_64 */
+ ++add;
+ OS_FALLTHROUGH;
+ case SIOCDRDEL_IN6_32: /* struct in6_defrouter_32 */
+ case SIOCDRDEL_IN6_64: /* struct in6_defrouter_64 */
+ bzero(&dr0, sizeof(dr0));
+ if (cmd == SIOCDRADD_IN6_64 || cmd == SIOCDRDEL_IN6_64) {
+ struct in6_defrouter_64 *r_64 =
+ (struct in6_defrouter_64 *)(void *)data;
+ u_int16_t i;
+
+ bcopy(&r_64->rtaddr.sin6_addr, &dr0.rtaddr,
+ sizeof(dr0.rtaddr));
+ dr0.flags = r_64->flags;
+ bcopy(&r_64->if_index, &i, sizeof(i));
+ ifindex = i;
+ } else {
+ struct in6_defrouter_32 *r_32 =
+ (struct in6_defrouter_32 *)(void *)data;
+ u_int16_t i;
+
+ bcopy(&r_32->rtaddr.sin6_addr, &dr0.rtaddr,
+ sizeof(dr0.rtaddr));
+ dr0.flags = r_32->flags;
+ bcopy(&r_32->if_index, &i, sizeof(i));
+ ifindex = i;
+ }
+ ifnet_head_lock_shared();
+ /* Don't need to check is ifindex is < 0 since it's unsigned */
+ if (if_index < ifindex ||
+ (dr_ifp = ifindex2ifnet[ifindex]) == NULL) {
+ ifnet_head_done();
+ error = EINVAL;
+ break;
+ }
+ dr0.ifp = dr_ifp;
+ ifnet_head_done();
+
+ if (ND_IFINFO(dr_ifp) == NULL ||
+ !ND_IFINFO(dr_ifp)->initialized) {
+ error = ENXIO;
+ break;
+ }
+
+ if (IN6_IS_SCOPE_EMBED(&dr0.rtaddr)) {
+ uint16_t *scope = &dr0.rtaddr.s6_addr16[1];
+
+ if (*scope == 0) {
+ *scope = htons(dr_ifp->if_index);
+ } else if (*scope != htons(dr_ifp->if_index)) {
+ error = EINVAL;
+ break;
+ }
+ }
+
+ if (add) {
+ error = defrtrlist_add_static(&dr0);
+ }
+ if (!add || error != 0) {
+ int err = defrtrlist_del_static(&dr0);
+ if (!add) {
+ error = err;
+ }
+ }
+ break;
+
+ default:
+ error = EOPNOTSUPP; /* check for safety */
+ break;
+ }
+
+ return error;
+}
+
+/*
+ * XXX Please make sure to remove dr from the
+ * global default router tailq list before this
+ * function call.
+ * Also ensure that you release the list reference
+ * only after calling this routine.
+ */
+void
+defrtrlist_del(struct nd_defrouter *dr, struct nd_drhead *nd_router_listp)
+{
+#if (DEVELOPMENT || DEBUG)
+ struct nd_defrouter *dr_itr = NULL;
+#endif
+ struct nd_prefix *pr;
+ struct ifnet *ifp = dr->ifp;
+ struct nd_ifinfo *ndi = NULL;
+ boolean_t resetmtu = FALSE;
+ struct nd_route_info *rti = NULL;
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ if (nd_router_listp == NULL) {
+ nd_router_listp = &nd_defrouter_list;
+ }
+
+ if (nd_router_listp != &nd_defrouter_list) {
+ rti = (struct nd_route_info *)nd_router_listp;
+ }
+
+#if (DEVELOPMENT || DEBUG)
+ /*
+ * Verify that the router is not in the global default
+ * router list.
+ * Can't use defrouter_lookup here because that just works
+ * with address and ifp pointer.
+ * We have to compare the memory here.
+ * Also we can't use ASSERT here as that is not defined
+ * for development builds.
+ */
+ TAILQ_FOREACH(dr_itr, nd_router_listp, dr_entry)
+ VERIFY(dr != dr_itr);
+#endif
+ ++nd6_defrouter_genid;
+ /*
+ * Flush all the routing table entries that use the router
+ * as a next hop.
+ *
+ * XXX Note that for a router advertising itself as default router
+ * and also advertising route information option, the following
+ * code will have the default router entry and router entry of
+ * RTI step over each other.
+ * The following therefore may not be efficient but won't be
+ * causing blocking issues.
+ */
+ NDDR_ADDREF(dr);
+ lck_mtx_unlock(nd6_mutex);
+ if (dr->stateflags & NDDRF_MAPPED) {
+ rt6_flush(&dr->rtaddr_mapped, ifp);
+ } else {
+ rt6_flush(&dr->rtaddr, ifp);
+ }
+ lck_mtx_lock(nd6_mutex);
+ NDDR_REMREF(dr);
+ nd6log2(info, "%s: freeing route to %s with gateway %s\n", if_name(dr->ifp),
+ (rti == NULL)? "::" : ip6_sprintf(&rti->nd_rti_prefix),
+ ip6_sprintf(&dr->rtaddr));
+ /*
+ * Delete it from the routing table.
+ */
+ NDDR_ADDREF(dr);
+ lck_mtx_unlock(nd6_mutex);
+ defrouter_delreq(dr, rti);
+ lck_mtx_lock(nd6_mutex);
+ NDDR_REMREF(dr);
+
+ /*
+ * The following should mostly be limited to when we are working
+ * with a default router entry and not a router entry from
+ * rti router list.
+ */
+ if (rti == NULL) {
+ /*
+ * Also delete all the pointers to the router in each prefix lists.
+ */
+ for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
+ struct nd_pfxrouter *pfxrtr;
+
+ NDPR_LOCK(pr);
+ if ((pfxrtr = pfxrtr_lookup(pr, dr)) != NULL) {
+ pfxrtr_del(pfxrtr, pr);
+ }
+ NDPR_UNLOCK(pr);
+ }
+ pfxlist_onlink_check();
+ }
+ ndi = ND_IFINFO(ifp);
+ VERIFY(NULL != ndi && TRUE == ndi->initialized);
+ lck_mtx_lock(&ndi->lock);
+ VERIFY(ndi->ndefrouters >= 0);
+ if (ndi->ndefrouters > 0 && --ndi->ndefrouters == 0) {
+ nd6_ifreset(ifp);
+ resetmtu = TRUE;
+ }
+ lck_mtx_unlock(&ndi->lock);
+ /*
+ * If the router is the primary one, choose a new one.
+ * We always try to pick another eligible router
+ * on this interface as we do scoped routing
+ */
+ defrouter_select(ifp, nd_router_listp);
+
+ if (resetmtu) {
+ nd6_setmtu(ifp);
+ }
+}
+
+int
+defrtrlist_add_static(struct nd_defrouter *new)
+{
+ struct nd_defrouter *dr;
+ int err = 0;
+
+ new->rtlifetime = -1;
+ new->stateflags |= NDDRF_STATIC;
+
+ /* we only want the preference level */
+ new->flags &= ND_RA_FLAG_RTPREF_MASK;
+
+ lck_mtx_lock(nd6_mutex);
+ dr = defrouter_lookup(NULL, &new->rtaddr, new->ifp);
+ if (dr != NULL && !(dr->stateflags & NDDRF_STATIC)) {
+ err = EINVAL;
+ } else {
+ if (dr != NULL) {
+ NDDR_REMREF(dr);
+ }
+ dr = defrtrlist_update(new, NULL);
+ if (dr != NULL) {
+ err = dr->err;
+ } else {
+ err = ENOMEM;
+ }
+ }
+ if (dr != NULL) {
+ NDDR_REMREF(dr);
+ }
+ lck_mtx_unlock(nd6_mutex);
+
+ return err;
+}
+
+int
+defrtrlist_del_static(struct nd_defrouter *new)
+{
+ struct nd_defrouter *dr;
+
+ lck_mtx_lock(nd6_mutex);
+ dr = defrouter_lookup(NULL, &new->rtaddr, new->ifp);
+ if (dr == NULL || !(dr->stateflags & NDDRF_STATIC)) {
+ if (dr != NULL) {
+ NDDR_REMREF(dr);
+ }
+ dr = NULL;
+ } else {
+ TAILQ_REMOVE(&nd_defrouter_list, dr, dr_entry);
+ defrtrlist_del(dr, NULL);
+ NDDR_REMREF(dr); /* remove list reference */
+ NDDR_REMREF(dr);
+ }
+ lck_mtx_unlock(nd6_mutex);
+
+ return dr != NULL ? 0 : EINVAL;
+}
+
+/*
+ * for default router selection
+ * regards router-preference field as a 2-bit signed integer
+ */
+static int
+rtpref(struct nd_defrouter *dr)
+{
+ switch (dr->flags & ND_RA_FLAG_RTPREF_MASK) {
+ case ND_RA_FLAG_RTPREF_HIGH:
+ return RTPREF_HIGH;
+ case ND_RA_FLAG_RTPREF_MEDIUM:
+ case ND_RA_FLAG_RTPREF_RSV:
+ return RTPREF_MEDIUM;
+ case ND_RA_FLAG_RTPREF_LOW:
+ return RTPREF_LOW;
+ default:
+ /*
+ * This case should never happen. If it did, it would mean a
+ * serious bug of kernel internal. We thus always bark here.
+ * Or, can we even panic?
+ */
+ log(LOG_ERR, "rtpref: impossible RA flag %x\n", dr->flags);
+ return RTPREF_INVALID;
+ }
+ /* NOTREACHED */
+}
+
+/*
+ * Default Router Selection according to Section 6.3.6 of RFC 2461 and RFC 4191:
+ *
+ * 1) Routers that are reachable or probably reachable should be preferred.
+ * If we have more than one (probably) reachable router, prefer ones
+ * with the highest router preference.
+ * 2) When no routers on the list are known to be reachable or
+ * probably reachable, routers SHOULD be selected in a round-robin
+ * fashion, regardless of router preference values.
+ * 3) If the Default Router List is empty, assume that all
+ * destinations are on-link.
+ *
+ * When Scoped Routing is enabled, the selection logic is amended as follows:
+ *
+ * a) When a default interface is specified, the primary/non-scoped default
+ * router will be set to the reachable router on that link (if any) with
+ * the highest router preference.
+ * b) When there are more than one routers on the same link, the one with
+ * the highest router preference will be installed, either as scoped or
+ * non-scoped route entry. If they all share the same preference value,
+ * the one installed will be the static or the first encountered reachable
+ * router, i.e. static one wins over dynamic.
+ * c) When no routers on the list are known to be reachable, or probably
+ * reachable, no round-robin selection will take place when the default
+ * interface is set.
+ *
+ * We assume nd_defrouter is sorted by router preference value.
+ * Since the code below covers both with and without router preference cases,
+ * we do not need to classify the cases by ifdef.
+ */
+void
+defrouter_select(struct ifnet *ifp, struct nd_drhead *nd_router_listp)
+{
+ struct nd_defrouter *dr = NULL;
+ struct nd_defrouter *selected_dr = NULL;
+ struct nd_defrouter *installed_dr = NULL;
+ struct llinfo_nd6 *ln = NULL;
+ struct rtentry *rt = NULL;
+ struct nd_ifinfo *ndi = NULL;
+ unsigned int genid = 0;
+ boolean_t is_installed_reachable = FALSE;
+ struct nd_route_info *rti = NULL;
+ boolean_t scoped = TRUE;
+ boolean_t is_rti_rtrlist = FALSE;
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ if (nd_router_listp == NULL) {
+ nd_router_listp = &nd_defrouter_list;
+ }
+
+ if (nd_router_listp != &nd_defrouter_list) {
+ rti = (struct nd_route_info *)nd_router_listp;
+ /* XXX For now we treat RTI routes as un-scoped */
+ scoped = FALSE;
+ is_rti_rtrlist = TRUE;
+ }
+
+
+ if (ifp == NULL) {
+ ifp = nd6_defifp;
+ if (ifp == NULL) {
+ nd6log2(info,
+ "%s:%d: Return early. NULL interface",
+ __func__, __LINE__);
+ return;
+ }
+ nd6log2(info,
+ "%s:%d: NULL interface passed. Setting to default interface %s.\n",
+ __func__, __LINE__, if_name(ifp));
+ }
+
+ /*
+ * When we are working with RTI router list, the nd6_defifp may be
+ * NULL. That is the scenario when the network may not have WAN
+ * v6 connectivity and the only RAs we may be getting are with lifetime
+ * 0.
+ */
+ if (ifp == lo_ifp && !is_rti_rtrlist) {
+ nd6log2(info,
+ "%s:%d: Return early. "
+ "Default router select called for loopback.\n",
+ __func__, __LINE__);
+ return;
+ }
+
+ if (ifp->if_ipv6_router_mode == IPV6_ROUTER_MODE_EXCLUSIVE) {
+ nd6log2(info,
+ "%s:%d: Return early. "
+ "Default router select called for interface"
+ " %s in IPV6_ROUTER_MODE_EXCLUSIVE\n",
+ __func__, __LINE__, if_name(ifp));
+ return;
+ }
+
+ /*
+ * Let's handle easy case (3) first:
+ * If default router list is empty, there's nothing to be done.
+ */
+ if (!TAILQ_FIRST(nd_router_listp)) {
+ nd6log2(info,
+ "%s:%d: Return early. "
+ "Default router is empty.\n", __func__, __LINE__);
+ return;
+ }
+
+ /*
+ * Take an early exit if number of routers in nd_ifinfo is
+ * 0 for the interface.
+ */
+ ndi = ND_IFINFO(ifp);
+ if (!ndi || !ndi->initialized) {
+ nd6log2(info,
+ "%s:%d: Return early. "
+ "Interface %s's nd_ifinfo not initialized.\n",
+ __func__, __LINE__, if_name(ifp));
+ return;
+ }
+
+ /*
+ * RTI router list routes are installed as unscoped.
+ * Since there can be only one unscoped route, we need to
+ * go through the entire list and consider all interfaces.
+ * Further, for now, RTI option is only processed on Ethernet
+ * type interfaces only.
+ */
+ if (ndi->ndefrouters == 0 && !is_rti_rtrlist) {
+ nd6log2(info,
+ "%s:%d: Return early. "
+ "%s does not have any default routers.\n",
+ __func__, __LINE__, if_name(ifp));
+ return;
+ }
+
+ /*
+ * Due to the number of times we drop nd6_mutex, we need to
+ * serialize this function.
+ */
+ while (nd_defrouter_busy) {
+ nd_defrouter_waiters++;
+ msleep(nd_defrouter_waitchan, nd6_mutex, (PZERO - 1),
+ __func__, NULL);
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ }
+ nd_defrouter_busy = TRUE;
+
+ /*
+ * Search for a (probably) reachable router from the list.
+ * We just pick up the first reachable one (if any), assuming that
+ * the ordering rule of the list described in defrtrlist_update().
+ *
+ * For all intents and purposes of Scoped Routing:
+ * selected_dr = candidate for primary router
+ * installed_dr = currently installed primary router
+ */
+ genid = nd6_defrouter_genid;
+ dr = TAILQ_FIRST(nd_router_listp);
+
+ while (dr != NULL) {
+ struct in6_addr rtaddr;
+ struct ifnet *drifp = NULL;
+ struct nd_defrouter *drrele = NULL;
+
+ NDDR_LOCK(dr);
+ drifp = dr->ifp;
+ if (drifp != ifp && !is_rti_rtrlist) {
+ NDDR_UNLOCK(dr);
+ dr = TAILQ_NEXT(dr, dr_entry);
+ continue;
+ }
+
+ if (dr->stateflags & NDDRF_INELIGIBLE) {
+ NDDR_UNLOCK(dr);
+ dr = TAILQ_NEXT(dr, dr_entry);
+ nd6log(info, "Ignoring dummy entry for default router.");
+ continue;
+ }
+
+ /*
+ * Optimize for the common case.
+ * When the interface has only one default router
+ * there's no point checking for reachability as
+ * there's nothing else to choose from.
+ */
+ if (ndi->ndefrouters == 1 && !is_rti_rtrlist) {
+ nd6log2(info,
+ "%s:%d: Fast forward default router selection "
+ "as interface %s has learned only one default "
+ "router and there's nothing else to choose from.\n",
+ __func__, __LINE__, if_name(ifp));
+ VERIFY(selected_dr == NULL && installed_dr == NULL);
+ selected_dr = dr;
+ if (dr->stateflags & NDDRF_INSTALLED) {
+ installed_dr = dr;
+ }
+ NDDR_ADDREF(selected_dr);
+ NDDR_UNLOCK(dr);
+ goto install_route;
+ }
+
+ if (dr->stateflags & NDDRF_MAPPED) {
+ rtaddr = dr->rtaddr_mapped;
+ } else {
+ rtaddr = dr->rtaddr;
+ }
+
+ NDDR_ADDREF(dr); /* for this for loop */
+ NDDR_UNLOCK(dr);
+
+ /* Callee returns a locked route upon success */
+ if (selected_dr == NULL) {
+ lck_mtx_unlock(nd6_mutex);
+ if ((rt = nd6_lookup(&rtaddr, 0, drifp, 0)) != NULL &&
+ (ln = rt->rt_llinfo) != NULL &&
+ ND6_IS_LLINFO_PROBREACH(ln)) {
+ RT_LOCK_ASSERT_HELD(rt);
+ selected_dr = dr;
+ NDDR_ADDREF(selected_dr);
+ }
+ lck_mtx_lock(nd6_mutex);
+ }
+
+ if (rt) {
+ RT_REMREF_LOCKED(rt);
+ RT_UNLOCK(rt);
+ rt = NULL;
+ }
+
+ /*
+ * Handle case (b)
+ * When there are more than one routers on the same link, the one with
+ * the highest router preference will be installed.
+ * Since the list is in decreasing order of preference:
+ * 1) If selected_dr is not NULL, only use dr if it is static and has
+ * equal preference and selected_dr is not static.
+ * 2) Else if selected_dr is NULL, and dr is static make selected_dr = dr
+ */
+ NDDR_LOCK(dr);
+ if (((selected_dr && (rtpref(dr) >= rtpref(selected_dr)) &&
+ !(selected_dr->stateflags & NDDRF_STATIC)) ||
+ (selected_dr == NULL)) &&
+ (dr->stateflags & NDDRF_STATIC)) {
+ if (selected_dr) {
+ /* Release it later on */
+ VERIFY(drrele == NULL);
+ drrele = selected_dr;
+ }
+ selected_dr = dr;
+ NDDR_ADDREF(selected_dr);
+ }
+
+ /* Record the currently installed router */
+ if (dr->stateflags & NDDRF_INSTALLED) {
+ if (installed_dr == NULL) {
+ installed_dr = dr;
+ NDDR_ADDREF(installed_dr);
+ if (dr->stateflags & NDDRF_MAPPED) {
+ rtaddr = installed_dr->rtaddr_mapped;
+ } else {
+ rtaddr = installed_dr->rtaddr;
+ }
+ NDDR_UNLOCK(dr);
+ lck_mtx_unlock(nd6_mutex);
+ /* Callee returns a locked route upon success */
+ if ((rt = nd6_lookup(&rtaddr, 0, installed_dr->ifp, 0)) != NULL) {
+ RT_LOCK_ASSERT_HELD(rt);
+ if ((ln = rt->rt_llinfo) != NULL &&
+ ND6_IS_LLINFO_PROBREACH(ln)) {
+ is_installed_reachable = TRUE;
+ }
+
+ RT_REMREF_LOCKED(rt);
+ RT_UNLOCK(rt);
+ rt = NULL;
+ }
+ lck_mtx_lock(nd6_mutex);
+ } else {
+ /* this should not happen; warn for diagnosis */
+ nd6log(error, "defrouter_select: more than one "
+ "default router is installed for interface :%s.\n",
+ if_name(installed_dr->ifp));
+ NDDR_UNLOCK(dr);
+ }
+ } else {
+ NDDR_UNLOCK(dr);
+ }
+
+ NDDR_REMREF(dr); /* for this for loop */
+ if (drrele != NULL) {
+ NDDR_REMREF(drrele);
+ }
+
+ /*
+ * Check if the list changed when we gave up
+ * the nd6_mutex lock
*/
- bzero(&anydr, sizeof(anydr));
- defrouter_delreq(&anydr, 0);
- defrouter_addreq(dr);
+ if (genid != nd6_defrouter_genid) {
+ if (selected_dr) {
+ NDDR_REMREF(selected_dr);
+ selected_dr = NULL;
+ }
+
+ if (installed_dr) {
+ NDDR_REMREF(installed_dr);
+ installed_dr = NULL;
+ }
+
+ if (ndi->ndefrouters == 0 && !is_rti_rtrlist) {
+ nd6log2(info,
+ "%s:%d: Interface %s no longer "
+ "has any default routers. Abort.\n",
+ __func__, __LINE__, if_name(ifp));
+ goto out;
+ }
+ nd6log2(info,
+ "%s:%d: Iterate default router list again "
+ "for interface %s, as the list seems to have "
+ "changed during release-reaquire of global "
+ "nd6_mutex lock.\n",
+ __func__, __LINE__, if_name(ifp));
+
+ is_installed_reachable = FALSE;
+ genid = nd6_defrouter_genid;
+ dr = TAILQ_FIRST(nd_router_listp);
+ } else {
+ dr = TAILQ_NEXT(dr, dr_entry);
+ }
}
- else {
+
+ /*
+ * If none of the default routers was found to be reachable,
+ * round-robin the list regardless of preference.
+ * Please note selected_dr equal to NULL implies that even
+ * installed default router is not reachable
+ */
+ if (selected_dr == NULL) {
+ if (installed_dr) {
+ for (dr = TAILQ_NEXT(installed_dr, dr_entry); dr;
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ if (installed_dr->ifp != dr->ifp && !is_rti_rtrlist) {
+ continue;
+ }
+ if (dr->stateflags & NDDRF_INELIGIBLE) {
+ continue;
+ }
+ selected_dr = dr;
+ break;
+ }
+ }
+
/*
- * The Default Router List is empty, so install the default
- * route to an inteface.
- * XXX: The specification does not say this mechanism should
- * be restricted to hosts, but this would be not useful
- * (even harmful) for routers.
+ * If none was installed or the installed one if the last
+ * one on the list, select the first one from the list
*/
- if (!ip6_forwarding) {
+ if ((installed_dr == NULL) || (selected_dr == NULL)) {
+ for (dr = TAILQ_FIRST(nd_router_listp); dr;
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ if (dr->stateflags & NDDRF_INELIGIBLE) {
+ continue;
+ }
+ if (dr->ifp == ifp || is_rti_rtrlist) {
+ selected_dr = dr;
+ break;
+ }
+ }
+ }
+
+ if ((selected_dr == NULL) && (installed_dr == NULL)) {
+ nd6log2(info,
+ "%s:%d: Between release and reaquire of global "
+ "nd6_mutex lock, the list seems to have changed "
+ "and it does not have any default routers for "
+ "interface %s.\n",
+ __func__, __LINE__, if_name(ifp));
+ goto out;
+ }
+
+ if (selected_dr != installed_dr) {
+ NDDR_ADDREF(selected_dr);
+ }
+ } else if (installed_dr != NULL) {
+ if (installed_dr != selected_dr) {
/*
- * De-install the current default route
- * in advance.
+ * This means that selected default router is reachable
+ * while installed one may or may not be.
+ * Static router should always be considered as reachable
+ * for router selection process.
*/
- bzero(&anydr, sizeof(anydr));
- defrouter_delreq(&anydr, 0);
- if (nd6_defifp) {
- /*
- * Install a route to the default interface
- * as default route.
- * XXX: we enable this for host only, because
- * this may override a default route installed
- * a user process (e.g. routing daemon) in a
- * router case.
- */
- defrouter_addifreq(nd6_defifp);
- } else {
- nd6log((LOG_INFO, "defrouter_select: "
- "there's no default router and no default"
- " interface\n"));
+ if ((installed_dr->stateflags & NDDRF_STATIC) &&
+ rtpref(installed_dr) >= rtpref(selected_dr)) {
+ NDDR_REMREF(selected_dr);
+ selected_dr = installed_dr;
+ } else if (is_installed_reachable) {
+ if (rtpref(selected_dr) <= rtpref(installed_dr)) {
+ NDDR_REMREF(selected_dr);
+ selected_dr = installed_dr;
+ }
}
+ } else {
+ NDDR_REMREF(selected_dr);
}
}
- return;
+install_route:
+ /*
+ * If the selected router is different than the installed one,
+ * remove the installed router and install the selected one.
+ * Note that the selected router is never NULL here.
+ * Else check if the route entry scope has to be changed.
+ */
+ lck_mtx_unlock(nd6_mutex);
+ if (installed_dr != selected_dr) {
+ nd6log(info,
+ "%s:%d: Found a better router for interface "
+ "%s. Installing new default route.\n",
+ __func__, __LINE__, if_name(ifp));
+ if (installed_dr != NULL) {
+ defrouter_delreq(installed_dr, rti);
+ }
+ /*
+ * Install scoped route if the interface is not
+ * the default nd6 interface.
+ */
+ defrouter_addreq(selected_dr, rti,
+ scoped && (selected_dr->ifp != nd6_defifp));
+ } else if (((installed_dr->stateflags & NDDRF_IFSCOPE) &&
+ (installed_dr->ifp == nd6_defifp)) ||
+ (scoped && !(installed_dr->stateflags & NDDRF_IFSCOPE) &&
+ (installed_dr->ifp != nd6_defifp))) {
+ nd6log(info,
+ "%s:%d: Need to reinstall default route for interface "
+ "%s as its scope has changed.\n",
+ __func__, __LINE__, if_name(ifp));
+ defrouter_delreq(installed_dr, rti);
+ defrouter_addreq(installed_dr, rti,
+ scoped && (installed_dr->ifp != nd6_defifp));
+ } else {
+ nd6log2(info,
+ "%s:%d: No need to change the default "
+ "route for interface %s.\n",
+ __func__, __LINE__, if_name(ifp));
+ }
+ lck_mtx_lock(nd6_mutex);
+out:
+ if (selected_dr && (selected_dr != installed_dr)) {
+ NDDR_REMREF(selected_dr);
+ }
+ if (installed_dr) {
+ NDDR_REMREF(installed_dr);
+ }
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ VERIFY(nd_defrouter_busy);
+ nd_defrouter_busy = FALSE;
+ if (nd_defrouter_waiters > 0) {
+ nd_defrouter_waiters = 0;
+ wakeup(nd_defrouter_waitchan);
+ }
}
static struct nd_defrouter *
-defrtrlist_update(
- struct nd_defrouter *new)
+defrtrlist_update_common(struct nd_defrouter *new, struct nd_drhead *nd_router_listp, boolean_t scoped)
{
struct nd_defrouter *dr, *n;
+ struct ifnet *ifp = new->ifp;
+ struct nd_ifinfo *ndi = NULL;
+ struct timeval caltime;
- lck_mtx_lock(nd6_mutex);
- if ((dr = defrouter_lookup(&new->rtaddr, new->ifp)) != NULL) {
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ if (nd_router_listp == NULL) {
+ nd_router_listp = &nd_defrouter_list;
+ }
+
+ /*
+ * If we are not operating on default router list,
+ * it implies we are operating on RTI's router list.
+ * XXX For now we manage RTI routes un-scoped.
+ */
+ if (nd_router_listp != &nd_defrouter_list) {
+ scoped = FALSE;
+ }
+
+ if ((dr = defrouter_lookup(nd_router_listp, &new->rtaddr, ifp)) != NULL) {
/* entry exists */
- if (new->rtlifetime == 0) {
- defrtrlist_del(dr, 1);
+ /*
+ * 1. If previous entry was not dummy and new is,
+ * delete it and return NULL.
+ * 2. If previous entry was dummy and the new one
+ * is also dummy, simply return dr.
+ * 3. If previous was dummy but new one is not,
+ * make sure we perform default router selection again.
+ */
+ /* If the router was not added as a dummy and there's
+ * been a change (lifetime advertised was 0, communicated
+ * as NDDRF_INELIGIBLE flag), remove the entry.
+ */
+ if ((new->stateflags & NDDRF_INELIGIBLE) != 0 &&
+ (dr->stateflags & NDDRF_INELIGIBLE) == 0) {
+ TAILQ_REMOVE(nd_router_listp, dr, dr_entry);
+ defrtrlist_del(dr, nd_router_listp);
+ NDDR_REMREF(dr); /* remove list reference */
+ NDDR_REMREF(dr);
dr = NULL;
+ return NULL;
} else {
+ int oldpref = rtpref(dr);
+ struct nd_defrouter *p = NULL;
+ boolean_t dummy_change = FALSE;
+ /*
+ * If new one is not dummy but the old one was,
+ * reset the stateflag.
+ */
+ if ((new->stateflags & NDDRF_INELIGIBLE) == 0 &&
+ (dr->stateflags & NDDRF_INELIGIBLE) != 0) {
+ dummy_change = TRUE;
+ dr->stateflags &= ~NDDRF_INELIGIBLE;
+ }
+
/* override */
dr->flags = new->flags; /* xxx flag check */
dr->rtlifetime = new->rtlifetime;
dr->expire = new->expire;
+
+ /*
+ * If the preference does not change, there's no need
+ * to sort the entries. If Scoped Routing is enabled,
+ * put the primary/non-scoped router at the top of the
+ * list of routers in the same preference band, unless
+ * it's already at that position.
+ */
+ /* same preference and scoped; just return */
+ if (rtpref(new) == oldpref && scoped && dummy_change == FALSE) {
+ return dr;
+ }
+
+ n = TAILQ_FIRST(nd_router_listp);
+ while (n != NULL) {
+ /* preference changed; sort it */
+ if (rtpref(new) != oldpref) {
+ break;
+ }
+
+ /* not at the top of band; sort it */
+ if (n != dr && rtpref(n) == oldpref &&
+ (!p || rtpref(p) > rtpref(n))) {
+ break;
+ }
+
+ p = n;
+ n = TAILQ_NEXT(n, dr_entry);
+ }
+
+ /* nothing has changed, just return */
+ if (n == NULL && (scoped ||
+ !(dr->stateflags & NDDRF_IFSCOPE)) && dummy_change == FALSE) {
+ return dr;
+ }
+
+ /*
+ * preferred router may be changed, so relocate
+ * this router.
+ * XXX: calling TAILQ_REMOVE directly is a bad manner.
+ * However, since defrtrlist_del() has many side
+ * effects, we intentionally do so here.
+ * defrouter_select() below will handle routing
+ * changes later.
+ */
+ TAILQ_REMOVE(nd_router_listp, dr, dr_entry);
+ new->stateflags = dr->stateflags;
+
+ n = dr;
+ goto insert;
}
- lck_mtx_unlock(nd6_mutex);
- return(dr);
}
- /* entry does not exist */
- if (new->rtlifetime == 0) {
- lck_mtx_unlock(nd6_mutex);
- return(NULL);
- }
+ VERIFY(dr == NULL);
+ n = nddr_alloc(Z_WAITOK);
- n = (struct nd_defrouter *)_MALLOC(sizeof(*n), M_IP6NDP, M_NOWAIT);
- if (n == NULL) {
- lck_mtx_unlock(nd6_mutex);
- return(NULL);
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+
+ if (ip6_maxifdefrouters >= 0 &&
+ ndi->ndefrouters >= ip6_maxifdefrouters) {
+ lck_mtx_unlock(&ndi->lock);
+ nddr_free(n);
+ nd6log(error, "%s: ignoring router addition as we have hit the "
+ "max limit of %d for max default routers.\n", __func__,
+ ip6_maxifdefrouters);
+ return NULL;
}
- bzero(n, sizeof(*n));
- *n = *new;
+
+ NDDR_ADDREF(n); /* for the nd_defrouter list */
+ NDDR_ADDREF(n); /* for the caller */
+
+ ++nd6_defrouter_genid;
+ ndi->ndefrouters++;
+ VERIFY(ndi->ndefrouters != 0);
+ lck_mtx_unlock(&ndi->lock);
+
+ nd6log2(info, "%s: allocating defrouter %s\n", if_name(ifp),
+ ip6_sprintf(&new->rtaddr));
+
+ getmicrotime(&caltime);
+ NDDR_LOCK(n);
+ memcpy(&n->rtaddr, &new->rtaddr, sizeof(n->rtaddr));
+ n->flags = new->flags;
+ n->stateflags = new->stateflags;
+ n->rtlifetime = new->rtlifetime;
+ n->expire = new->expire;
+ n->base_calendartime = caltime.tv_sec;
+ n->base_uptime = net_uptime();
+ n->ifp = new->ifp;
+ n->err = new->err;
+ NDDR_UNLOCK(n);
+insert:
+ /* get nd6_service() to be scheduled as soon as it's convenient */
+ ++nd6_sched_timeout_want;
/*
- * Insert the new router at the end of the Default Router List.
- * If there is no other router, install it anyway. Otherwise,
- * just continue to use the current default router.
+ * Insert the new router in the Default Router List;
+ * The Default Router List should be in the descending order
+ * of router-preferece. When Scoped Routing is disabled, routers
+ * with the same preference are sorted in the arriving time order;
+ * otherwise, the first entry in the list of routers having the same
+ * preference is the primary default router, when the interface used
+ * by the entry is the default interface.
*/
- TAILQ_INSERT_TAIL(&nd_defrouter, n, dr_entry);
- if (TAILQ_FIRST(&nd_defrouter) == n)
- defrouter_select();
-
- lck_mtx_unlock(nd6_mutex);
- return(n);
+
+ /* insert at the end of the group */
+ for (dr = TAILQ_FIRST(nd_router_listp); dr;
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ if (rtpref(n) > rtpref(dr) ||
+ (!scoped && rtpref(n) == rtpref(dr))) {
+ break;
+ }
+ }
+ if (dr) {
+ TAILQ_INSERT_BEFORE(dr, n, dr_entry);
+ } else {
+ TAILQ_INSERT_TAIL(nd_router_listp, n, dr_entry);
+ }
+
+ defrouter_select(ifp, nd_router_listp);
+
+ return n;
+}
+
+struct nd_defrouter *
+defrtrlist_update(struct nd_defrouter *new, struct nd_drhead *nd_router_list)
+{
+ struct nd_defrouter *dr;
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ dr = defrtrlist_update_common(new, nd_router_list,
+ (nd6_defifp != NULL && new->ifp != nd6_defifp));
+
+ return dr;
}
static struct nd_pfxrouter *
-pfxrtr_lookup(
- struct nd_prefix *pr,
- struct nd_defrouter *dr)
+pfxrtr_lookup(struct nd_prefix *pr, struct nd_defrouter *dr)
{
struct nd_pfxrouter *search;
-
- lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
- for (search = pr->ndpr_advrtrs.lh_first; search; search = search->pfr_next) {
- if (search->router == dr)
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_HELD(pr);
+
+ for (search = pr->ndpr_advrtrs.lh_first; search;
+ search = search->pfr_next) {
+ if (search->router == dr) {
break;
+ }
}
- return(search);
+ return search;
}
static void
-pfxrtr_add(
- struct nd_prefix *pr,
- struct nd_defrouter *dr)
+pfxrtr_add(struct nd_prefix *pr, struct nd_defrouter *dr)
{
struct nd_pfxrouter *new;
- lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_NOTHELD(pr);
- new = (struct nd_pfxrouter *)_MALLOC(sizeof(*new), M_IP6NDP, M_NOWAIT);
- if (new == NULL)
+ new = zalloc(ndprtr_zone);
+ if (new == NULL) {
return;
+ }
bzero(new, sizeof(*new));
new->router = dr;
+ NDPR_LOCK(pr);
LIST_INSERT_HEAD(&pr->ndpr_advrtrs, new, pfr_entry);
+ pr->ndpr_genid++;
+ NDPR_UNLOCK(pr);
- pfxlist_onlink_check(1);
+ pfxlist_onlink_check();
}
static void
-pfxrtr_del(
- struct nd_pfxrouter *pfr)
+pfxrtr_del(struct nd_pfxrouter *pfr, struct nd_prefix *pr)
{
- lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_HELD(pr);
+ pr->ndpr_genid++;
LIST_REMOVE(pfr, pfr_entry);
- FREE(pfr, M_IP6NDP);
+ zfree(ndprtr_zone, pfr);
}
+/*
+ * The routine has been modified to atomically refresh expiry
+ * time for nd6 prefix as the part of lookup.
+ * There's a corner case where a system going
+ * in sleep gets rid of manual addresses configured in the system
+ * and then schedules the prefix for deletion.
+ * However before the prefix gets deleted, if system comes out
+ * from sleep and configures same address before prefix deletion
+ * , the later prefix deletion will remove the prefix route and
+ * the system will not be able to communicate with other IPv6
+ * neighbor nodes in the same subnet.
+ */
struct nd_prefix *
-nd6_prefix_lookup(
- struct nd_prefix *pr)
+nd6_prefix_lookup(struct nd_prefix *pr, int nd6_prefix_expiry)
{
struct nd_prefix *search;
lck_mtx_lock(nd6_mutex);
for (search = nd_prefix.lh_first; search; search = search->ndpr_next) {
+ NDPR_LOCK(search);
if (pr->ndpr_ifp == search->ndpr_ifp &&
pr->ndpr_plen == search->ndpr_plen &&
in6_are_prefix_equal(&pr->ndpr_prefix.sin6_addr,
- &search->ndpr_prefix.sin6_addr,
- pr->ndpr_plen)
- ) {
+ &search->ndpr_prefix.sin6_addr, pr->ndpr_plen)) {
+ if (nd6_prefix_expiry != ND6_PREFIX_EXPIRY_UNSPEC) {
+ search->ndpr_expire = nd6_prefix_expiry;
+ }
+ NDPR_ADDREF(search);
+ NDPR_UNLOCK(search);
break;
}
+ NDPR_UNLOCK(search);
}
lck_mtx_unlock(nd6_mutex);
- return(search);
+ return search;
}
int
-nd6_prelist_add(
- struct nd_prefix *pr,
- struct nd_defrouter *dr,
- struct nd_prefix **newp)
+nd6_prelist_add(struct nd_prefix *pr, struct nd_defrouter *dr,
+ struct nd_prefix **newp, boolean_t force_scoped)
{
struct nd_prefix *new = NULL;
- int i;
+ struct ifnet *ifp = pr->ndpr_ifp;
+ struct nd_ifinfo *ndi = NULL;
+ int i, error;
+
+ if (ip6_maxifprefixes >= 0) {
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+ if (ndi->nprefixes >= ip6_maxifprefixes) {
+ lck_mtx_unlock(&ndi->lock);
+ return ENOMEM;
+ }
+ lck_mtx_unlock(&ndi->lock);
+ }
- new = (struct nd_prefix *)_MALLOC(sizeof(*new), M_IP6NDP, M_NOWAIT);
- if (new == NULL)
+ new = ndpr_alloc(M_WAITOK);
+ if (new == NULL) {
return ENOMEM;
- bzero(new, sizeof(*new));
- *new = *pr;
- if (newp != NULL)
- *newp = new;
+ }
- /* initilization */
+ NDPR_LOCK(new);
+ NDPR_LOCK(pr);
+ new->ndpr_ifp = pr->ndpr_ifp;
+ new->ndpr_prefix = pr->ndpr_prefix;
+ new->ndpr_plen = pr->ndpr_plen;
+ new->ndpr_vltime = pr->ndpr_vltime;
+ new->ndpr_pltime = pr->ndpr_pltime;
+ new->ndpr_flags = pr->ndpr_flags;
+ if (pr->ndpr_stateflags & NDPRF_STATIC) {
+ new->ndpr_stateflags |= NDPRF_STATIC;
+ }
+ NDPR_UNLOCK(pr);
+ if ((error = in6_init_prefix_ltimes(new)) != 0) {
+ NDPR_UNLOCK(new);
+ ndpr_free(new);
+ return error;
+ }
+ new->ndpr_lastupdate = net_uptime();
+ if (newp != NULL) {
+ *newp = new;
+ NDPR_ADDREF(new); /* for caller */
+ }
+ /* initialization */
LIST_INIT(&new->ndpr_advrtrs);
in6_prefixlen2mask(&new->ndpr_mask, new->ndpr_plen);
/* make prefix in the canonical form */
- for (i = 0; i < 4; i++)
+ for (i = 0; i < 4; i++) {
new->ndpr_prefix.sin6_addr.s6_addr32[i] &=
- new->ndpr_mask.s6_addr32[i];
+ new->ndpr_mask.s6_addr32[i];
+ }
+
+ NDPR_UNLOCK(new);
+
+ /* get nd6_service() to be scheduled as soon as it's convenient */
+ ++nd6_sched_timeout_want;
- /* link ndpr_entry to nd_prefix list */
lck_mtx_lock(nd6_mutex);
+ /* link ndpr_entry to nd_prefix list */
LIST_INSERT_HEAD(&nd_prefix, new, ndpr_entry);
+ new->ndpr_debug |= IFD_ATTACHED;
+ NDPR_ADDREF(new); /* for nd_prefix list */
+
+ lck_mtx_lock(&ndi->lock);
+ ndi->nprefixes++;
+ VERIFY(ndi->nprefixes != 0);
+ lck_mtx_unlock(&ndi->lock);
/* ND_OPT_PI_FLAG_ONLINK processing */
if (new->ndpr_raf_onlink) {
int e;
- if ((e = nd6_prefix_onlink(new, 0, 1)) != 0) {
- nd6log((LOG_ERR, "nd6_prelist_add: failed to make "
- "the prefix %s/%d on-link on %s (errno=%d)\n",
- ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
- pr->ndpr_plen, if_name(pr->ndpr_ifp), e));
+ if ((e = nd6_prefix_onlink_common(new, force_scoped,
+ new->ndpr_ifp->if_index)) != 0) {
+ nd6log(error, "nd6_prelist_add: failed to make "
+ "the prefix %s/%d on-link %s on %s (errno=%d)\n",
+ ip6_sprintf(&new->ndpr_prefix.sin6_addr),
+ new->ndpr_plen, force_scoped ? "scoped" :
+ "non-scoped", if_name(ifp), e);
/* proceed anyway. XXX: is it correct? */
}
}
if (dr) {
pfxrtr_add(new, dr);
}
+
lck_mtx_unlock(nd6_mutex);
return 0;
}
+/*
+ * Caller must have held an extra reference on nd_prefix.
+ */
void
-prelist_remove(
- struct nd_prefix *pr, int nd6locked)
+prelist_remove(struct nd_prefix *pr)
{
struct nd_pfxrouter *pfr, *next;
+ struct ifnet *ifp = pr->ndpr_ifp;
int e;
+ struct nd_ifinfo *ndi = NULL;
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_HELD(pr);
+
+ if (pr->ndpr_stateflags & NDPRF_DEFUNCT) {
+ return;
+ }
+
+ /*
+ * If there are no more addresses, defunct the prefix. This is needed
+ * because we don't want multiple threads calling prelist_remove() for
+ * the same prefix and this might happen because we unlock nd6_mutex
+ * down below.
+ */
+ if (pr->ndpr_addrcnt == 0) {
+ pr->ndpr_stateflags |= NDPRF_DEFUNCT;
+ }
/* make sure to invalidate the prefix until it is really freed. */
pr->ndpr_vltime = 0;
pr->ndpr_pltime = 0;
-#if 0
+
/*
* Though these flags are now meaningless, we'd rather keep the value
- * not to confuse users when executing "ndp -p".
+ * of pr->ndpr_raf_onlink and pr->ndpr_raf_auto not to confuse users
+ * when executing "ndp -p".
*/
- pr->ndpr_raf_onlink = 0;
- pr->ndpr_raf_auto = 0;
-#endif
- if ((pr->ndpr_stateflags & NDPRF_ONLINK) != 0 &&
- (e = nd6_prefix_offlink(pr)) != 0) {
- nd6log((LOG_ERR, "prelist_remove: failed to make %s/%d offlink "
- "on %s, errno=%d\n",
- ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
- pr->ndpr_plen, if_name(pr->ndpr_ifp), e));
- /* what should we do? */
+ if (pr->ndpr_stateflags & NDPRF_ONLINK) {
+ NDPR_ADDREF(pr);
+ NDPR_UNLOCK(pr);
+ lck_mtx_unlock(nd6_mutex);
+ if ((e = nd6_prefix_offlink(pr)) != 0) {
+ nd6log(error, "prelist_remove: failed to make "
+ "%s/%d offlink on %s, errno=%d\n",
+ ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(ifp), e);
+ /* what should we do? */
+ }
+ lck_mtx_lock(nd6_mutex);
+ NDPR_LOCK(pr);
+ if (NDPR_REMREF(pr) == NULL) {
+ return;
+ }
}
- if (pr->ndpr_refcnt > 0)
- return; /* notice here? */
+ if (pr->ndpr_addrcnt > 0) {
+ /*
+ * The state might have changed if we called
+ * nd6_prefix_offlink().
+ */
+ pr->ndpr_stateflags &= ~NDPRF_DEFUNCT;
+ return; /* notice here? */
+ }
- if (nd6locked == 0)
- lck_mtx_lock(nd6_mutex);
/* unlink ndpr_entry from nd_prefix list */
LIST_REMOVE(pr, ndpr_entry);
+ pr->ndpr_debug &= ~IFD_ATTACHED;
/* free list of routers that adversed the prefix */
for (pfr = pr->ndpr_advrtrs.lh_first; pfr; pfr = next) {
next = pfr->pfr_next;
-
- FREE(pfr, M_IP6NDP);
+ pfxrtr_del(pfr, pr);
}
- FREE(pr, M_IP6NDP);
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+ VERIFY(ndi->nprefixes > 0);
+ ndi->nprefixes--;
+ lck_mtx_unlock(&ndi->lock);
+
+ /* This must not be the last reference to the nd_prefix */
+ if (NDPR_REMREF(pr) == NULL) {
+ panic("%s: unexpected (missing) refcnt ndpr=%p", __func__, pr);
+ /* NOTREACHED */
+ }
- pfxlist_onlink_check(1);
- if (nd6locked == 0)
- lck_mtx_unlock(nd6_mutex);
+ /*
+ * Don't call pfxlist_onlink_check() here because we are
+ * holding the NDPR lock and this could cause a deadlock when
+ * there are multiple threads executing pfxlist_onlink_check().
+ */
}
int
prelist_update(
struct nd_prefix *new,
struct nd_defrouter *dr, /* may be NULL */
- struct mbuf *m)
+ struct mbuf *m,
+ int mcast)
{
struct in6_ifaddr *ia6 = NULL, *ia6_match = NULL;
struct ifaddr *ifa;
int newprefix = 0;
int auth;
struct in6_addrlifetime lt6_tmp;
- struct timeval timenow;
+ uint64_t timenow = net_uptime();
+
+ /* no need to lock "new" here, as it is local to the caller */
+ NDPR_LOCK_ASSERT_NOTHELD(new);
auth = 0;
if (m) {
* both IP header and IP datagrams, doesn't it ?
*/
#if defined(M_AUTHIPHDR) && defined(M_AUTHIPDGM)
- auth = (m->m_flags & M_AUTHIPHDR
- && m->m_flags & M_AUTHIPDGM) ? 1 : 0;
+ auth = (m->m_flags & M_AUTHIPHDR) && (m->m_flags & M_AUTHIPDGM);
#endif
}
-
- if ((pr = nd6_prefix_lookup(new)) != NULL) {
+ if ((pr = nd6_prefix_lookup(new, ND6_PREFIX_EXPIRY_UNSPEC)) != NULL) {
/*
* nd6_prefix_lookup() ensures that pr and new have the same
* prefix on a same interface.
* and the autonomous (A) bit should NOT be changed from 1
* to 0.
*/
- if (new->ndpr_raf_onlink == 1)
+ lck_mtx_lock(nd6_mutex);
+ NDPR_LOCK(pr);
+ if (new->ndpr_raf_onlink == 1) {
pr->ndpr_raf_onlink = 1;
- if (new->ndpr_raf_auto == 1)
+ }
+ if (new->ndpr_raf_auto == 1) {
pr->ndpr_raf_auto = 1;
+ }
if (new->ndpr_raf_onlink) {
pr->ndpr_vltime = new->ndpr_vltime;
pr->ndpr_pltime = new->ndpr_pltime;
- pr->ndpr_preferred = new->ndpr_preferred;
- pr->ndpr_expire = new->ndpr_expire;
+ (void) in6_init_prefix_ltimes(pr); /* XXX error case? */
+ pr->ndpr_lastupdate = net_uptime();
}
+ NDPR_ADDREF(pr);
if (new->ndpr_raf_onlink &&
(pr->ndpr_stateflags & NDPRF_ONLINK) == 0) {
int e;
- if ((e = nd6_prefix_onlink(pr, 0, 0)) != 0) {
- nd6log((LOG_ERR,
+ NDPR_UNLOCK(pr);
+ if ((e = nd6_prefix_onlink(pr)) != 0) {
+ nd6log(error,
"prelist_update: failed to make "
"the prefix %s/%d on-link on %s "
"(errno=%d)\n",
ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
- pr->ndpr_plen, if_name(pr->ndpr_ifp), e));
+ pr->ndpr_plen, if_name(pr->ndpr_ifp), e);
/* proceed anyway. XXX: is it correct? */
}
+ NDPR_LOCK(pr);
}
-
- lck_mtx_lock(nd6_mutex);
- if (dr && pfxrtr_lookup(pr, dr) == NULL)
+
+ if (dr && pfxrtr_lookup(pr, dr) == NULL) {
+ NDPR_UNLOCK(pr);
pfxrtr_add(pr, dr);
+ } else {
+ NDPR_UNLOCK(pr);
+ }
+ NDPR_REMREF(pr);
lck_mtx_unlock(nd6_mutex);
} else {
- struct nd_prefix *newpr = NULL;
-
newprefix = 1;
- if (new->ndpr_vltime == 0)
+ if (new->ndpr_vltime == 0) {
goto end;
- if (new->ndpr_raf_onlink == 0 && new->ndpr_raf_auto == 0)
+ }
+ if (new->ndpr_raf_onlink == 0 && new->ndpr_raf_auto == 0) {
goto end;
+ }
bzero(&new->ndpr_addr, sizeof(struct in6_addr));
- error = nd6_prelist_add(new, dr, &newpr);
- if (error != 0 || newpr == NULL) {
- nd6log((LOG_NOTICE, "prelist_update: "
+ error = nd6_prelist_add(new, dr, &pr, FALSE);
+ if (error != 0 || pr == NULL) {
+ nd6log(info, "prelist_update: "
"nd6_prelist_add failed for %s/%d on %s "
- "errno=%d, returnpr=%p\n",
+ "errno=%d, returnpr=0x%llx\n",
ip6_sprintf(&new->ndpr_prefix.sin6_addr),
- new->ndpr_plen, if_name(new->ndpr_ifp),
- error, newpr));
+ new->ndpr_plen, if_name(new->ndpr_ifp),
+ error, (uint64_t)VM_KERNEL_ADDRPERM(pr));
goto end; /* we should just give up in this case. */
}
-
- /*
- * XXX: from the ND point of view, we can ignore a prefix
- * with the on-link bit being zero. However, we need a
- * prefix structure for references from autoconfigured
- * addresses. Thus, we explicitly make suret that the prefix
- * itself expires now.
- */
- if (newpr->ndpr_raf_onlink == 0) {
- newpr->ndpr_vltime = 0;
- newpr->ndpr_pltime = 0;
- in6_init_prefix_ltimes(newpr);
- }
-
- pr = newpr;
}
/*
- * Address autoconfiguration based on Section 5.5.3 of RFC 2462.
+ * Address autoconfiguration based on Section 5.5.3 of RFC 4862.
* Note that pr must be non NULL at this point.
*/
/* 5.5.3 (a). Ignore the prefix without the A bit set. */
- if (!new->ndpr_raf_auto)
- goto afteraddrconf;
+ if (!new->ndpr_raf_auto) {
+ goto end;
+ }
/*
* 5.5.3 (b). the link-local prefix should have been ignored in
* nd6_ra_input.
*/
- /*
- * 5.5.3 (c). Consistency check on lifetimes: pltime <= vltime.
- * This should have been done in nd6_ra_input.
- */
+ /* 5.5.3 (c). Consistency check on lifetimes: pltime <= vltime. */
+ if (new->ndpr_pltime > new->ndpr_vltime) {
+ error = EINVAL; /* XXX: won't be used */
+ goto end;
+ }
- /*
- * 5.5.3 (d). If the prefix advertised does not match the prefix of an
- * address already in the list, and the Valid Lifetime is not 0,
- * form an address. Note that even a manually configured address
- * should reject autoconfiguration of a new address.
+ /*
+ * 5.5.3 (d). If the prefix advertised is not equal to the prefix of
+ * an address configured by stateless autoconfiguration already in the
+ * list of addresses associated with the interface, and the Valid
+ * Lifetime is not 0, form an address. We first check if we have
+ * a matching prefix.
*/
- getmicrotime(&timenow);
-
- ifnet_lock_exclusive(ifp);
- TAILQ_FOREACH(ifa, &ifp->if_addrlist, ifa_list)
- {
+ ifnet_lock_shared(ifp);
+ TAILQ_FOREACH(ifa, &ifp->if_addrlist, ifa_list) {
struct in6_ifaddr *ifa6;
- int ifa_plen;
- u_int32_t storedlifetime;
+ u_int32_t remaininglifetime;
- if (ifa->ifa_addr->sa_family != AF_INET6)
+ IFA_LOCK(ifa);
+ if (ifa->ifa_addr->sa_family != AF_INET6) {
+ IFA_UNLOCK(ifa);
continue;
-
+ }
ifa6 = (struct in6_ifaddr *)ifa;
+ /*
+ * We only consider autoconfigured addresses as per RFC 4862.
+ */
+ if (!(ifa6->ia6_flags & IN6_IFF_AUTOCONF)) {
+ IFA_UNLOCK(ifa);
+ continue;
+ }
/*
* Spec is not clear here, but I believe we should concentrate
* on unicast (i.e. not anycast) addresses.
* XXX: other ia6_flags? detached or duplicated?
*/
- if ((ifa6->ia6_flags & IN6_IFF_ANYCAST) != 0)
+ if ((ifa6->ia6_flags & IN6_IFF_ANYCAST) != 0) {
+ IFA_UNLOCK(ifa);
continue;
-
- ifa_plen = in6_mask2len(&ifa6->ia_prefixmask.sin6_addr, NULL);
- if (ifa_plen != new->ndpr_plen ||
- !in6_are_prefix_equal(&ifa6->ia_addr.sin6_addr,
- &new->ndpr_prefix.sin6_addr,
- ifa_plen))
+ }
+ /*
+ * Ignore the address if it is not associated with a prefix
+ * or is associated with a prefix that is different from this
+ * one. (pr is never NULL here)
+ */
+ if (ifa6->ia6_ndpr != pr) {
+ IFA_UNLOCK(ifa);
continue;
+ }
- if (ia6_match == NULL) /* remember the first one */
+ if (ia6_match == NULL) { /* remember the first one */
ia6_match = ifa6;
-
- if ((ifa6->ia6_flags & IN6_IFF_AUTOCONF) == 0)
- continue;
+ IFA_ADDREF_LOCKED(ifa); /* for ia6_match */
+ }
/*
* An already autoconfigured address matched. Now that we
* proceed to 5.5.3. (e): update the lifetimes according to the
* "two hours" rule and the privacy extension.
*/
-#define TWOHOUR (120*60)
- lt6_tmp = ifa6->ia6_lifetime;
+ /* retrieve time as uptime (last arg is 0) */
+ in6ifa_getlifetime(ifa6, <6_tmp, 0);
- storedlifetime = IFA6_IS_INVALID(ifa6) ? 0 :
- (lt6_tmp.ia6t_expire - timenow.tv_sec);
+ if (lt6_tmp.ia6t_vltime == ND6_INFINITE_LIFETIME) {
+ remaininglifetime = ND6_INFINITE_LIFETIME;
+ } else if (timenow - ifa6->ia6_updatetime > lt6_tmp.ia6t_vltime) {
+ /*
+ * The case of "invalid" address. We should usually
+ * not see this case.
+ */
+ remaininglifetime = 0;
+ } else {
+ remaininglifetime = lt6_tmp.ia6t_vltime -
+ (uint32_t)(timenow - ifa6->ia6_updatetime);
+ }
+ /* when not updating, keep the current stored lifetime. */
+ lt6_tmp.ia6t_vltime = remaininglifetime;
if (TWOHOUR < new->ndpr_vltime ||
- storedlifetime < new->ndpr_vltime) {
+ remaininglifetime < new->ndpr_vltime) {
lt6_tmp.ia6t_vltime = new->ndpr_vltime;
- } else if (storedlifetime <= TWOHOUR
-#if 0
- /*
- * This condition is logically redundant, so we just
- * omit it.
- * See IPng 6712, 6717, and 6721.
- */
- && new->ndpr_vltime <= storedlifetime
-#endif
- ) {
+ } else if (remaininglifetime <= TWOHOUR) {
if (auth) {
lt6_tmp.ia6t_vltime = new->ndpr_vltime;
}
} else {
/*
* new->ndpr_vltime <= TWOHOUR &&
- * TWOHOUR < storedlifetime
+ * TWOHOUR < remaininglifetime
*/
lt6_tmp.ia6t_vltime = TWOHOUR;
}
/* The 2 hour rule is not imposed for preferred lifetime. */
lt6_tmp.ia6t_pltime = new->ndpr_pltime;
- in6_init_address_ltimes(pr, <6_tmp);
-
- /*
- * When adjusting the lifetimes of an existing temporary
- * address, only lower the lifetimes.
- * RFC 3041 3.3. (1).
- * XXX: how should we modify ia6t_[pv]ltime?
- */
+ /* Special handling for lifetimes of temporary addresses. */
if ((ifa6->ia6_flags & IN6_IFF_TEMPORARY) != 0) {
- if (lt6_tmp.ia6t_expire == 0 || /* no expire */
- lt6_tmp.ia6t_expire >
- ifa6->ia6_lifetime.ia6t_expire) {
- lt6_tmp.ia6t_expire =
- ifa6->ia6_lifetime.ia6t_expire;
+ u_int32_t maxvltime, maxpltime;
+
+ /* Constrain lifetimes to system limits. */
+ if (lt6_tmp.ia6t_vltime > ip6_temp_valid_lifetime) {
+ lt6_tmp.ia6t_vltime = ip6_temp_valid_lifetime;
+ }
+ if (lt6_tmp.ia6t_pltime > ip6_temp_preferred_lifetime) {
+ lt6_tmp.ia6t_pltime =
+ ip6_temp_preferred_lifetime -
+ ip6_desync_factor;
+ }
+
+ /*
+ * According to RFC 4941, section 3.3 (1), we only
+ * update the lifetimes when they are in the maximum
+ * intervals.
+ */
+ if (ip6_temp_valid_lifetime >
+ (u_int32_t)((timenow - ifa6->ia6_createtime) +
+ ip6_desync_factor)) {
+ maxvltime = ip6_temp_valid_lifetime -
+ (uint32_t)((timenow - ifa6->ia6_createtime) +
+ ip6_desync_factor);
+ } else {
+ maxvltime = 0;
+ }
+ if (ip6_temp_preferred_lifetime >
+ (u_int32_t)((timenow - ifa6->ia6_createtime) +
+ ip6_desync_factor)) {
+ maxpltime = ip6_temp_preferred_lifetime -
+ (uint32_t)((timenow - ifa6->ia6_createtime) +
+ ip6_desync_factor);
+ } else {
+ maxpltime = 0;
+ }
+
+ if (lt6_tmp.ia6t_vltime == ND6_INFINITE_LIFETIME ||
+ lt6_tmp.ia6t_vltime > maxvltime) {
+ lt6_tmp.ia6t_vltime = maxvltime;
}
- if (lt6_tmp.ia6t_preferred == 0 || /* no expire */
- lt6_tmp.ia6t_preferred >
- ifa6->ia6_lifetime.ia6t_preferred) {
- lt6_tmp.ia6t_preferred =
- ifa6->ia6_lifetime.ia6t_preferred;
+
+ if (lt6_tmp.ia6t_pltime == ND6_INFINITE_LIFETIME ||
+ lt6_tmp.ia6t_pltime > maxpltime) {
+ lt6_tmp.ia6t_pltime = maxpltime;
}
}
- ifa6->ia6_lifetime = lt6_tmp;
+ in6_init_address_ltimes(pr, <6_tmp);
+
+ in6ifa_setlifetime(ifa6, <6_tmp);
+ ifa6->ia6_updatetime = timenow;
+ IFA_UNLOCK(ifa);
}
ifnet_lock_done(ifp);
if (ia6_match == NULL && new->ndpr_vltime) {
/*
+ * 5.5.3 (d) (continued)
* No address matched and the valid lifetime is non-zero.
* Create a new address.
*/
- if ((ia6 = in6_ifadd(new, NULL)) != NULL) {
+ if ((ia6 = in6_pfx_newpersistaddr(new, mcast, &error, FALSE, 0))
+ != NULL) {
/*
* note that we should use pr (not new) for reference.
*/
- pr->ndpr_refcnt++;
+ IFA_LOCK(&ia6->ia_ifa);
+ NDPR_LOCK(pr);
ia6->ia6_ndpr = pr;
-
-#if 0
- /* XXXYYY Don't do this, according to Jinmei. */
- pr->ndpr_addr = new->ndpr_addr;
-#endif
+ NDPR_ADDREF(pr); /* for addr reference */
+ pr->ndpr_addrcnt++;
+ VERIFY(pr->ndpr_addrcnt != 0);
+ NDPR_UNLOCK(pr);
+ IFA_UNLOCK(&ia6->ia_ifa);
/*
- * RFC 3041 3.3 (2).
+ * RFC 4941 3.3 (2).
* When a new public address is created as described
- * in RFC2462, also create a new temporary address.
+ * in RFC 4862, also create a new temporary address.
*
- * RFC 3041 3.5.
+ * RFC 4941 3.5.
* When an interface connects to a new link, a new
* randomized interface identifier should be generated
* immediately together with a new set of temporary
if (ip6_use_tempaddr) {
int e;
if ((e = in6_tmpifadd(ia6, 1)) != 0) {
- nd6log((LOG_NOTICE, "prelist_update: "
+ nd6log(info, "prelist_update: "
"failed to create a temporary "
"address, errno=%d\n",
- e));
+ e);
+ }
+ }
+ IFA_REMREF(&ia6->ia_ifa);
+ ia6 = NULL;
+
+ /*
+ * If the interface is marked for CLAT46 configuration
+ * try and configure the reserved IPv6 address for
+ * stateless translation.
+ */
+ if (IS_INTF_CLAT46(ifp)) {
+ if ((ia6 = in6_pfx_newpersistaddr(new, mcast,
+ &error, TRUE, CLAT46_COLLISION_COUNT_OFFSET))
+ != NULL) {
+ IFA_LOCK(&ia6->ia_ifa);
+ NDPR_LOCK(pr);
+ ia6->ia6_ndpr = pr;
+ NDPR_ADDREF(pr); /* for addr reference */
+ pr->ndpr_addrcnt++;
+ VERIFY(pr->ndpr_addrcnt != 0);
+ pr->ndpr_stateflags |= NDPRF_CLAT46;
+ NDPR_UNLOCK(pr);
+ IFA_UNLOCK(&ia6->ia_ifa);
+ IFA_REMREF(&ia6->ia_ifa);
+ ia6 = NULL;
+ } else if (error != EEXIST) {
+ uuid_t tmp_uuid = {};
+ /*
+ * Only report the error if it is not
+ * EEXIST.
+ */
+ ip6stat.ip6s_clat464_v6addr_conffail++;
+ in6_clat46_event_enqueue_nwk_wq_entry(
+ IN6_CLAT46_EVENT_V6_ADDR_CONFFAIL,
+ 0,
+ tmp_uuid);
+ nd6log0(error, "Could not configure CLAT46 address on interface %s.\n", ifp->if_xname);
}
+ /*
+ * Reset the error as we do not want to
+ * treat failure of CLAT46 address configuration
+ * as complete failure in prelist update path.
+ */
+ error = 0;
}
/*
* of other addresses, so we check and update it.
* XXX: what if address duplication happens?
*/
- pfxlist_onlink_check(0);
- } else {
- /* just set an error. do not bark here. */
- error = EADDRNOTAVAIL; /* XXX: might be unused. */
+ lck_mtx_lock(nd6_mutex);
+ pfxlist_onlink_check();
+ lck_mtx_unlock(nd6_mutex);
}
}
+end:
+ if (pr != NULL) {
+ NDPR_REMREF(pr);
+ }
+ if (ia6_match != NULL) {
+ IFA_REMREF(&ia6_match->ia_ifa);
+ }
+ return error;
+}
- afteraddrconf:
+/*
+ * Neighbor Discover Default Router structure reference counting routines.
+ */
+static struct nd_defrouter *
+nddr_alloc(zalloc_flags_t how)
+{
+ struct nd_defrouter *dr;
- end:
- return error;
+ dr = zalloc_flags(nddr_zone, how | Z_ZERO);
+ if (dr) {
+ lck_mtx_init(&dr->nddr_lock, ifa_mtx_grp, ifa_mtx_attr);
+ lck_mtx_init(&dr->nddr_ref_lock, ifa_mtx_grp, ifa_mtx_attr);
+ dr->nddr_debug |= IFD_ALLOC;
+ if (nddr_debug != 0) {
+ dr->nddr_debug |= IFD_DEBUG;
+ dr->nddr_trace = nddr_trace;
+ }
+ }
+ return dr;
+}
+
+static void
+nddr_free(struct nd_defrouter *dr)
+{
+ if (dr->nddr_debug & IFD_ATTACHED) {
+ panic("%s: attached nddr %p is being freed", __func__, dr);
+ /* NOTREACHED */
+ } else if (!(dr->nddr_debug & IFD_ALLOC)) {
+ panic("%s: nddr %p cannot be freed", __func__, dr);
+ /* NOTREACHED */
+ }
+ dr->nddr_debug &= ~IFD_ALLOC;
+ lck_mtx_destroy(&dr->nddr_lock, ifa_mtx_grp);
+ lck_mtx_destroy(&dr->nddr_ref_lock, ifa_mtx_grp);
+ zfree(nddr_zone, dr);
+}
+
+static void
+nddr_trace(struct nd_defrouter *dr, int refhold)
+{
+ struct nd_defrouter_dbg *dr_dbg = (struct nd_defrouter_dbg *)dr;
+ ctrace_t *tr;
+ uint32_t idx;
+ uint16_t *cnt;
+
+ if (!(dr->nddr_debug & IFD_DEBUG)) {
+ panic("%s: nddr %p has no debug structure", __func__, dr);
+ /* NOTREACHED */
+ }
+ if (refhold) {
+ cnt = &dr_dbg->nddr_refhold_cnt;
+ tr = dr_dbg->nddr_refhold;
+ } else {
+ cnt = &dr_dbg->nddr_refrele_cnt;
+ tr = dr_dbg->nddr_refrele;
+ }
+
+ idx = atomic_add_16_ov(cnt, 1) % NDDR_TRACE_HIST_SIZE;
+ ctrace_record(&tr[idx]);
+}
+
+void
+nddr_addref(struct nd_defrouter *nddr)
+{
+ NDDR_REF_LOCK_SPIN(nddr);
+ if (++nddr->nddr_refcount == 0) {
+ panic("%s: nddr %p wraparound refcnt\n", __func__, nddr);
+ /* NOTREACHED */
+ } else if (nddr->nddr_trace != NULL) {
+ (*nddr->nddr_trace)(nddr, TRUE);
+ }
+ NDDR_REF_UNLOCK(nddr);
+}
+
+struct nd_defrouter *
+nddr_remref(struct nd_defrouter *nddr)
+{
+ NDDR_REF_LOCK_SPIN(nddr);
+ if (nddr->nddr_refcount == 0) {
+ panic("%s: nddr %p negative refcnt\n", __func__, nddr);
+ /* NOTREACHED */
+ } else if (nddr->nddr_trace != NULL) {
+ (*nddr->nddr_trace)(nddr, FALSE);
+ }
+
+ if (--nddr->nddr_refcount == 0) {
+ NDDR_REF_UNLOCK(nddr);
+ nddr_free(nddr);
+ nddr = NULL;
+ } else {
+ NDDR_REF_UNLOCK(nddr);
+ }
+ return nddr;
+}
+
+uint64_t
+nddr_getexpire(struct nd_defrouter *dr)
+{
+ struct timeval caltime;
+ uint64_t expiry;
+
+ if (dr->expire != 0) {
+ /* account for system time change */
+ getmicrotime(&caltime);
+
+ dr->base_calendartime +=
+ NET_CALCULATE_CLOCKSKEW(caltime,
+ dr->base_calendartime, net_uptime(), dr->base_uptime);
+
+ expiry = dr->base_calendartime +
+ dr->expire - dr->base_uptime;
+ } else {
+ expiry = 0;
+ }
+ return expiry;
+}
+
+/*
+ * Neighbor Discover Prefix structure reference counting routines.
+ */
+static struct nd_prefix *
+ndpr_alloc(int how)
+{
+ struct nd_prefix *pr;
+
+ pr = zalloc_flags(ndpr_zone, how | Z_ZERO);
+ if (pr != NULL) {
+ lck_mtx_init(&pr->ndpr_lock, ifa_mtx_grp, ifa_mtx_attr);
+ lck_mtx_init(&pr->ndpr_ref_lock, ifa_mtx_grp, ifa_mtx_attr);
+ RB_INIT(&pr->ndpr_prproxy_sols);
+ pr->ndpr_debug |= IFD_ALLOC;
+ if (ndpr_debug != 0) {
+ pr->ndpr_debug |= IFD_DEBUG;
+ pr->ndpr_trace = ndpr_trace;
+ }
+ }
+ return pr;
+}
+
+static void
+ndpr_free(struct nd_prefix *pr)
+{
+ if (pr->ndpr_debug & IFD_ATTACHED) {
+ panic("%s: attached ndpr %p is being freed", __func__, pr);
+ /* NOTREACHED */
+ } else if (!(pr->ndpr_debug & IFD_ALLOC)) {
+ panic("%s: ndpr %p cannot be freed", __func__, pr);
+ /* NOTREACHED */
+ } else if (pr->ndpr_rt != NULL) {
+ panic("%s: ndpr %p route %p not freed", __func__, pr,
+ pr->ndpr_rt);
+ /* NOTREACHED */
+ } else if (pr->ndpr_prproxy_sols_cnt != 0) {
+ panic("%s: ndpr %p non-zero solicitors count (%d)",
+ __func__, pr, pr->ndpr_prproxy_sols_cnt);
+ /* NOTREACHED */
+ } else if (!RB_EMPTY(&pr->ndpr_prproxy_sols)) {
+ panic("%s: ndpr %p non-empty solicitors tree", __func__, pr);
+ /* NOTREACHED */
+ }
+ pr->ndpr_debug &= ~IFD_ALLOC;
+ lck_mtx_destroy(&pr->ndpr_lock, ifa_mtx_grp);
+ lck_mtx_destroy(&pr->ndpr_ref_lock, ifa_mtx_grp);
+ zfree(ndpr_zone, pr);
+}
+
+static void
+ndpr_trace(struct nd_prefix *pr, int refhold)
+{
+ struct nd_prefix_dbg *pr_dbg = (struct nd_prefix_dbg *)pr;
+ ctrace_t *tr;
+ u_int32_t idx;
+ u_int16_t *cnt;
+
+ if (!(pr->ndpr_debug & IFD_DEBUG)) {
+ panic("%s: ndpr %p has no debug structure", __func__, pr);
+ /* NOTREACHED */
+ }
+ if (refhold) {
+ cnt = &pr_dbg->ndpr_refhold_cnt;
+ tr = pr_dbg->ndpr_refhold;
+ } else {
+ cnt = &pr_dbg->ndpr_refrele_cnt;
+ tr = pr_dbg->ndpr_refrele;
+ }
+
+ idx = atomic_add_16_ov(cnt, 1) % NDPR_TRACE_HIST_SIZE;
+ ctrace_record(&tr[idx]);
+}
+
+void
+ndpr_addref(struct nd_prefix *ndpr)
+{
+ NDPR_REF_LOCK_SPIN(ndpr);
+ if (++ndpr->ndpr_refcount == 0) {
+ panic("%s: ndpr %p wraparound refcnt\n", __func__, ndpr);
+ /* NOTREACHED */
+ } else if (ndpr->ndpr_trace != NULL) {
+ (*ndpr->ndpr_trace)(ndpr, TRUE);
+ }
+ NDPR_REF_UNLOCK(ndpr);
+}
+
+struct nd_prefix *
+ndpr_remref(struct nd_prefix *ndpr)
+{
+ NDPR_REF_LOCK_SPIN(ndpr);
+ if (ndpr->ndpr_refcount == 0) {
+ panic("%s: ndpr %p negative refcnt\n", __func__, ndpr);
+ /* NOTREACHED */
+ } else if (ndpr->ndpr_trace != NULL) {
+ (*ndpr->ndpr_trace)(ndpr, FALSE);
+ }
+
+ if (--ndpr->ndpr_refcount == 0) {
+ if (ndpr->ndpr_addrcnt != 0) {
+ panic("%s: freeing ndpr %p with outstanding address "
+ "reference (%d)", __func__, ndpr,
+ ndpr->ndpr_addrcnt);
+ /* NOTREACHED */
+ }
+ NDPR_REF_UNLOCK(ndpr);
+ ndpr_free(ndpr);
+ ndpr = NULL;
+ } else {
+ NDPR_REF_UNLOCK(ndpr);
+ }
+ return ndpr;
+}
+
+uint64_t
+ndpr_getexpire(struct nd_prefix *pr)
+{
+ struct timeval caltime;
+ uint64_t expiry;
+
+ if (pr->ndpr_expire != 0 && pr->ndpr_vltime != ND6_INFINITE_LIFETIME) {
+ /* account for system time change */
+ getmicrotime(&caltime);
+
+ pr->ndpr_base_calendartime +=
+ NET_CALCULATE_CLOCKSKEW(caltime,
+ pr->ndpr_base_calendartime, net_uptime(),
+ pr->ndpr_base_uptime);
+
+ expiry = pr->ndpr_base_calendartime +
+ pr->ndpr_expire - pr->ndpr_base_uptime;
+ } else {
+ expiry = 0;
+ }
+ return expiry;
}
/*
* A supplement function used in the on-link detection below;
* detect if a given prefix has a (probably) reachable advertising router.
* XXX: lengthy function name...
+ *
+ * Callers *must* increase the reference count of nd_prefix.
*/
static struct nd_pfxrouter *
-find_pfxlist_reachable_router(
- struct nd_prefix *pr)
+find_pfxlist_reachable_router(struct nd_prefix *pr)
{
struct nd_pfxrouter *pfxrtr;
struct rtentry *rt;
struct llinfo_nd6 *ln;
+ struct ifnet *ifp;
+ struct in6_addr rtaddr;
+ unsigned int genid;
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_HELD(pr);
+
+ genid = pr->ndpr_genid;
+ pfxrtr = LIST_FIRST(&pr->ndpr_advrtrs);
+ while (pfxrtr) {
+ ifp = pfxrtr->router->ifp;
+ if (pfxrtr->router->stateflags & NDDRF_MAPPED) {
+ rtaddr = pfxrtr->router->rtaddr_mapped;
+ } else {
+ rtaddr = pfxrtr->router->rtaddr;
+ }
- lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
-
- for (pfxrtr = LIST_FIRST(&pr->ndpr_advrtrs); pfxrtr;
- pfxrtr = LIST_NEXT(pfxrtr, pfr_entry)) {
- if ((rt = nd6_lookup(&pfxrtr->router->rtaddr, 0,
- pfxrtr->router->ifp, 0)) &&
- (ln = (struct llinfo_nd6 *)rt->rt_llinfo) &&
- ND6_IS_LLINFO_PROBREACH(ln))
- break; /* found */
+ NDPR_UNLOCK(pr);
+ lck_mtx_unlock(nd6_mutex);
+ /* Callee returns a locked route upon success */
+ if ((rt = nd6_lookup(&rtaddr, 0, ifp, 0)) != NULL) {
+ RT_LOCK_ASSERT_HELD(rt);
+ if ((ln = rt->rt_llinfo) != NULL &&
+ ND6_IS_LLINFO_PROBREACH(ln)) {
+ RT_REMREF_LOCKED(rt);
+ RT_UNLOCK(rt);
+ lck_mtx_lock(nd6_mutex);
+ NDPR_LOCK(pr);
+ break; /* found */
+ }
+ RT_REMREF_LOCKED(rt);
+ RT_UNLOCK(rt);
+ }
+ lck_mtx_lock(nd6_mutex);
+ NDPR_LOCK(pr);
+ if (pr->ndpr_genid != genid) {
+ pfxrtr = LIST_FIRST(&pr->ndpr_advrtrs);
+ genid = pr->ndpr_genid;
+ } else {
+ pfxrtr = LIST_NEXT(pfxrtr, pfr_entry);
+ }
}
+ NDPR_LOCK_ASSERT_HELD(pr);
- return(pfxrtr);
-
+ return pfxrtr;
}
/*
* is no router around us.
*/
void
-pfxlist_onlink_check(int nd6locked)
+pfxlist_onlink_check(void)
{
- struct nd_prefix *pr;
+ struct nd_prefix *pr, *prclear;
struct in6_ifaddr *ifa;
+ struct nd_defrouter *dr;
+ struct nd_pfxrouter *pfxrtr = NULL;
+ int err, i, found = 0;
+ struct ifaddr **ifap = NULL;
+ struct nd_prefix *ndpr;
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ while (nd_prefix_busy) {
+ nd_prefix_waiters++;
+ msleep(nd_prefix_waitchan, nd6_mutex, (PZERO - 1),
+ __func__, NULL);
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ }
+ nd_prefix_busy = TRUE;
/*
* Check if there is a prefix that has a reachable advertising
* router.
*/
- if (nd6locked == 0)
- lck_mtx_lock(nd6_mutex);
- lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
- for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
- if (pr->ndpr_raf_onlink && find_pfxlist_reachable_router(pr))
+ pr = nd_prefix.lh_first;
+ while (pr) {
+ NDPR_LOCK(pr);
+ if (pr->ndpr_stateflags & NDPRF_PROCESSED_ONLINK) {
+ NDPR_UNLOCK(pr);
+ pr = pr->ndpr_next;
+ continue;
+ }
+ NDPR_ADDREF(pr);
+ if (pr->ndpr_raf_onlink && find_pfxlist_reachable_router(pr) &&
+ (pr->ndpr_debug & IFD_ATTACHED)) {
+ if (NDPR_REMREF(pr) == NULL) {
+ pr = NULL;
+ } else {
+ NDPR_UNLOCK(pr);
+ }
break;
+ }
+ pr->ndpr_stateflags |= NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(pr);
+ NDPR_REMREF(pr);
+ /*
+ * Since find_pfxlist_reachable_router() drops the nd6_mutex, we
+ * have to start over, but the NDPRF_PROCESSED_ONLINK flag will
+ * stop us from checking the same prefix twice.
+ */
+ pr = nd_prefix.lh_first;
}
-
- if (pr) {
+ LIST_FOREACH(prclear, &nd_prefix, ndpr_entry) {
+ NDPR_LOCK(prclear);
+ prclear->ndpr_stateflags &= ~NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(prclear);
+ }
+ /*
+ * If we have no such prefix, check whether we still have a router
+ * that does not advertise any prefixes.
+ */
+ if (pr == NULL) {
+ for (dr = TAILQ_FIRST(&nd_defrouter_list); dr;
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ struct nd_prefix *pr0;
+
+ for (pr0 = nd_prefix.lh_first; pr0;
+ pr0 = pr0->ndpr_next) {
+ NDPR_LOCK(pr0);
+ if ((pfxrtr = pfxrtr_lookup(pr0, dr)) != NULL) {
+ NDPR_UNLOCK(pr0);
+ break;
+ }
+ NDPR_UNLOCK(pr0);
+ }
+ if (pfxrtr != NULL) {
+ break;
+ }
+ }
+ }
+ if (pr != NULL || (TAILQ_FIRST(&nd_defrouter_list) && pfxrtr == NULL)) {
/*
- * There is at least one prefix that has a reachable router.
+ * There is at least one prefix that has a reachable router,
+ * or at least a router which probably does not advertise
+ * any prefixes. The latter would be the case when we move
+ * to a new link where we have a router that does not provide
+ * prefixes and we configure an address by hand.
* Detach prefixes which have no reachable advertising
* router, and attach other prefixes.
*/
- for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
- /* XXX: a link-local prefix should never be detached */
- if (IN6_IS_ADDR_LINKLOCAL(&pr->ndpr_prefix.sin6_addr))
- continue;
-
+ pr = nd_prefix.lh_first;
+ while (pr) {
+ NDPR_LOCK(pr);
/*
- * we aren't interested in prefixes without the L bit
- * set.
+ * We aren't interested prefixes already processed,
+ * nor in prefixes without the L bit
+ * set nor in static prefixes
*/
- if (pr->ndpr_raf_onlink == 0)
+ if (pr->ndpr_raf_onlink == 0 ||
+ pr->ndpr_stateflags & NDPRF_PROCESSED_ONLINK ||
+ pr->ndpr_stateflags & NDPRF_STATIC) {
+ NDPR_UNLOCK(pr);
+ pr = pr->ndpr_next;
continue;
-
+ }
+ NDPR_ADDREF(pr);
if ((pr->ndpr_stateflags & NDPRF_DETACHED) == 0 &&
- find_pfxlist_reachable_router(pr) == NULL)
+ find_pfxlist_reachable_router(pr) == NULL &&
+ (pr->ndpr_debug & IFD_ATTACHED)) {
pr->ndpr_stateflags |= NDPRF_DETACHED;
+ }
if ((pr->ndpr_stateflags & NDPRF_DETACHED) != 0 &&
- find_pfxlist_reachable_router(pr) != 0)
+ find_pfxlist_reachable_router(pr) != NULL &&
+ (pr->ndpr_debug & IFD_ATTACHED)) {
pr->ndpr_stateflags &= ~NDPRF_DETACHED;
+ }
+ pr->ndpr_stateflags |= NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(pr);
+ NDPR_REMREF(pr);
+ /*
+ * Since find_pfxlist_reachable_router() drops the
+ * nd6_mutex, we have to start over, but the
+ * NDPRF_PROCESSED_ONLINK flag will stop us from
+ * checking the same prefix twice.
+ */
+ pr = nd_prefix.lh_first;
}
} else {
/* there is no prefix that has a reachable router */
for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
- if (IN6_IS_ADDR_LINKLOCAL(&pr->ndpr_prefix.sin6_addr))
- continue;
-
- if (pr->ndpr_raf_onlink == 0)
+ NDPR_LOCK(pr);
+ if (pr->ndpr_raf_onlink == 0 ||
+ pr->ndpr_stateflags & NDPRF_STATIC) {
+ NDPR_UNLOCK(pr);
continue;
-
- if ((pr->ndpr_stateflags & NDPRF_DETACHED) != 0)
+ }
+ if ((pr->ndpr_stateflags & NDPRF_DETACHED) != 0) {
pr->ndpr_stateflags &= ~NDPRF_DETACHED;
+ }
+ NDPR_UNLOCK(pr);
}
}
-
+ LIST_FOREACH(prclear, &nd_prefix, ndpr_entry) {
+ NDPR_LOCK(prclear);
+ prclear->ndpr_stateflags &= ~NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(prclear);
+ }
/*
* Remove each interface route associated with a (just) detached
* prefix, and reinstall the interface route for a (just) attached
* interfaces. Such cases will be handled in nd6_prefix_onlink,
* so we don't have to care about them.
*/
- for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
+ pr = nd_prefix.lh_first;
+ while (pr) {
int e;
- if (IN6_IS_ADDR_LINKLOCAL(&pr->ndpr_prefix.sin6_addr))
- continue;
-
- if (pr->ndpr_raf_onlink == 0)
+ NDPR_LOCK(pr);
+ if (pr->ndpr_raf_onlink == 0 ||
+ pr->ndpr_stateflags & NDPRF_STATIC ||
+ pr->ndpr_stateflags & NDPRF_PROCESSED_ONLINK ||
+ pr->ndpr_stateflags & NDPRF_DEFUNCT) {
+ NDPR_UNLOCK(pr);
+ pr = pr->ndpr_next;
continue;
-
+ }
+ pr->ndpr_stateflags |= NDPRF_PROCESSED_ONLINK;
+ NDPR_ADDREF(pr);
if ((pr->ndpr_stateflags & NDPRF_DETACHED) != 0 &&
(pr->ndpr_stateflags & NDPRF_ONLINK) != 0) {
+ NDPR_UNLOCK(pr);
+ lck_mtx_unlock(nd6_mutex);
if ((e = nd6_prefix_offlink(pr)) != 0) {
- nd6log((LOG_ERR,
+ nd6log(error,
"pfxlist_onlink_check: failed to "
"make %s/%d offlink, errno=%d\n",
ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
- pr->ndpr_plen, e));
+ pr->ndpr_plen, e);
}
+ lck_mtx_lock(nd6_mutex);
+ NDPR_REMREF(pr);
+ pr = nd_prefix.lh_first;
+ continue;
}
if ((pr->ndpr_stateflags & NDPRF_DETACHED) == 0 &&
(pr->ndpr_stateflags & NDPRF_ONLINK) == 0 &&
pr->ndpr_raf_onlink) {
- if ((e = nd6_prefix_onlink(pr, 0, 1)) != 0) {
- nd6log((LOG_ERR,
+ NDPR_UNLOCK(pr);
+ if ((e = nd6_prefix_onlink(pr)) != 0) {
+ nd6log(error,
"pfxlist_onlink_check: failed to "
"make %s/%d offlink, errno=%d\n",
ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
- pr->ndpr_plen, e));
+ pr->ndpr_plen, e);
+ }
+ NDPR_REMREF(pr);
+ pr = nd_prefix.lh_first;
+ continue;
+ } else {
+ NDPR_UNLOCK(pr);
+ }
+ NDPR_REMREF(pr);
+ pr = pr->ndpr_next;
+ }
+ LIST_FOREACH(prclear, &nd_prefix, ndpr_entry) {
+ NDPR_LOCK(prclear);
+ prclear->ndpr_stateflags &= ~NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(prclear);
+ }
+ VERIFY(nd_prefix_busy);
+ nd_prefix_busy = FALSE;
+ if (nd_prefix_waiters > 0) {
+ nd_prefix_waiters = 0;
+ wakeup(nd_prefix_waitchan);
+ }
+
+ /*
+ * Changes on the prefix status might affect address status as well.
+ * Make sure that all addresses derived from an attached prefix are
+ * attached, and that all addresses derived from a detached prefix are
+ * detached. Note, however, that a manually configured address should
+ * always be attached.
+ * The precise detection logic is same as the one for prefixes.
+ *
+ * ifnet_get_address_list_family_internal() may fail due to memory
+ * pressure, but we will eventually be called again when we receive
+ * another NA, RA, or when the link status changes.
+ */
+ err = ifnet_get_address_list_family_internal(NULL, &ifap, AF_INET6, 0,
+ M_NOWAIT, 0);
+ if (err != 0 || ifap == NULL) {
+ nd6log(error, "%s: ifnet_get_address_list_family_internal "
+ "failed", __func__);
+ return;
+ }
+ for (i = 0; ifap[i]; i++) {
+ ifa = ifatoia6(ifap[i]);
+ IFA_LOCK(&ifa->ia_ifa);
+ if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0 ||
+ (ifap[i]->ifa_debug & IFD_ATTACHED) == 0) {
+ IFA_UNLOCK(&ifa->ia_ifa);
+ continue;
+ }
+ if ((ndpr = ifa->ia6_ndpr) == NULL) {
+ /*
+ * This can happen when we first configure the address
+ * (i.e. the address exists, but the prefix does not).
+ * XXX: complicated relationships...
+ */
+ IFA_UNLOCK(&ifa->ia_ifa);
+ continue;
+ }
+ IFA_UNLOCK(&ifa->ia_ifa);
+
+ NDPR_LOCK(ndpr);
+ NDPR_ADDREF(ndpr);
+ if (find_pfxlist_reachable_router(ndpr)) {
+ if (NDPR_REMREF(ndpr) == NULL) {
+ found = 0;
+ } else {
+ NDPR_UNLOCK(ndpr);
+ found = 1;
+ }
+ break;
+ }
+ NDPR_UNLOCK(ndpr);
+ NDPR_REMREF(ndpr);
+ }
+ if (found) {
+ for (i = 0; ifap[i]; i++) {
+ ifa = ifatoia6(ifap[i]);
+ IFA_LOCK(&ifa->ia_ifa);
+ if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0 ||
+ (ifap[i]->ifa_debug & IFD_ATTACHED) == 0) {
+ IFA_UNLOCK(&ifa->ia_ifa);
+ continue;
+ }
+ if ((ndpr = ifa->ia6_ndpr) == NULL) {
+ /* XXX: see above. */
+ IFA_UNLOCK(&ifa->ia_ifa);
+ continue;
+ }
+ IFA_UNLOCK(&ifa->ia_ifa);
+ NDPR_LOCK(ndpr);
+ NDPR_ADDREF(ndpr);
+ if (find_pfxlist_reachable_router(ndpr)) {
+ NDPR_UNLOCK(ndpr);
+ IFA_LOCK(&ifa->ia_ifa);
+ if (ifa->ia6_flags & IN6_IFF_DETACHED) {
+ ifa->ia6_flags &= ~IN6_IFF_DETACHED;
+ in6_ifaddr_set_dadprogress((struct in6_ifaddr *)ifa);
+ IFA_UNLOCK(&ifa->ia_ifa);
+ nd6_dad_start((struct ifaddr *)ifa, 0);
+ } else {
+ IFA_UNLOCK(&ifa->ia_ifa);
+ }
+ } else {
+ NDPR_UNLOCK(ndpr);
+ IFA_LOCK(&ifa->ia_ifa);
+ if ((ifa->ia6_flags & IN6_IFF_DETACHED) == 0) {
+ ifa->ia6_flags |= IN6_IFF_DETACHED;
+ in6_event_enqueue_nwk_wq_entry(IN6_ADDR_MARKED_DETACHED,
+ ifa->ia_ifa.ifa_ifp, &ifa->ia_addr.sin6_addr,
+ 0);
+ }
+ IFA_UNLOCK(&ifa->ia_ifa);
+ }
+ NDPR_REMREF(ndpr);
+ }
+ } else {
+ for (i = 0; ifap[i]; i++) {
+ ifa = ifatoia6(ifap[i]);
+ IFA_LOCK(&ifa->ia_ifa);
+ if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0) {
+ IFA_UNLOCK(&ifa->ia_ifa);
+ continue;
+ }
+ if (ifa->ia6_flags & IN6_IFF_DETACHED) {
+ ifa->ia6_flags &= ~IN6_IFF_DETACHED;
+ in6_ifaddr_set_dadprogress((struct in6_ifaddr *)ifa);
+ IFA_UNLOCK(&ifa->ia_ifa);
+ /* Do we need a delay in this case? */
+ nd6_dad_start((struct ifaddr *)ifa, 0);
+ } else {
+ IFA_UNLOCK(&ifa->ia_ifa);
}
}
- }
+ }
+ ifnet_free_address_list(ifap);
+}
+
+static struct nd_prefix *
+nd6_prefix_equal_lookup(struct nd_prefix *pr, boolean_t primary_only)
+{
+ struct nd_prefix *opr;
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ for (opr = nd_prefix.lh_first; opr; opr = opr->ndpr_next) {
+ if (opr == pr) {
+ continue;
+ }
- /*
- * Changes on the prefix status might affect address status as well.
- * Make sure that all addresses derived from an attached prefix are
- * attached, and that all addresses derived from a detached prefix are
- * detached. Note, however, that a manually configured address should
- * always be attached.
- * The precise detection logic is same as the one for prefixes.
- */
- for (ifa = in6_ifaddrs; ifa; ifa = ifa->ia_next) {
- if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0)
+ NDPR_LOCK(opr);
+ if ((opr->ndpr_stateflags & NDPRF_ONLINK) == 0) {
+ NDPR_UNLOCK(opr);
continue;
+ }
+ if (opr->ndpr_plen == pr->ndpr_plen &&
+ in6_are_prefix_equal(&pr->ndpr_prefix.sin6_addr,
+ &opr->ndpr_prefix.sin6_addr, pr->ndpr_plen) &&
+ (!primary_only ||
+ !(opr->ndpr_stateflags & NDPRF_IFSCOPE))) {
+ NDPR_ADDREF(opr);
+ NDPR_UNLOCK(opr);
+ return opr;
+ }
+ NDPR_UNLOCK(opr);
+ }
+ return NULL;
+}
- if (ifa->ia6_ndpr == NULL) {
- /*
- * This can happen when we first configure the address
- * (i.e. the address exists, but the prefix does not).
- * XXX: complicated relationships...
- */
+/*
+ * Synchronize the interface routes of similar prefixes on different
+ * interfaces; the one using the default interface would be (re)installed
+ * as a primary/non-scoped entry, and the rest as scoped entri(es).
+ */
+static void
+nd6_prefix_sync(struct ifnet *ifp)
+{
+ struct nd_prefix *pr, *opr;
+ int err = 0;
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ if (ifp == NULL) {
+ return;
+ }
+
+ for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
+ NDPR_LOCK(pr);
+ if (!(pr->ndpr_stateflags & NDPRF_ONLINK)) {
+ NDPR_UNLOCK(pr);
continue;
}
-
- if (find_pfxlist_reachable_router(ifa->ia6_ndpr))
+ if (pr->ndpr_ifp == ifp &&
+ (pr->ndpr_stateflags & NDPRF_IFSCOPE) &&
+ !IN6_IS_ADDR_LINKLOCAL(&pr->ndpr_prefix.sin6_addr)) {
+ NDPR_UNLOCK(pr);
break;
+ }
+ NDPR_UNLOCK(pr);
}
- if (ifa) {
- for (ifa = in6_ifaddrs; ifa; ifa = ifa->ia_next) {
- if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0)
- continue;
- if (ifa->ia6_ndpr == NULL) /* XXX: see above. */
- continue;
+ if (pr == NULL) {
+ return;
+ }
- if (find_pfxlist_reachable_router(ifa->ia6_ndpr))
- ifa->ia6_flags &= ~IN6_IFF_DETACHED;
- else
- ifa->ia6_flags |= IN6_IFF_DETACHED;
+ /* Remove conflicting entries */
+ opr = nd6_prefix_equal_lookup(pr, TRUE);
+ if (opr != NULL) {
+ lck_mtx_unlock(nd6_mutex);
+ err = nd6_prefix_offlink(opr);
+ lck_mtx_lock(nd6_mutex);
+ if (err != 0) {
+ nd6log(error,
+ "%s: failed to make %s/%d offlink on %s, "
+ "errno=%d\n", __func__,
+ ip6_sprintf(&opr->ndpr_prefix.sin6_addr),
+ opr->ndpr_plen, if_name(opr->ndpr_ifp), err);
}
+ } else {
+ nd6log(error,
+ "%s: scoped %s/%d on %s has no matching unscoped prefix\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp));
+ }
+
+ lck_mtx_unlock(nd6_mutex);
+ err = nd6_prefix_offlink(pr);
+ lck_mtx_lock(nd6_mutex);
+ if (err != 0) {
+ nd6log(error,
+ "%s: failed to make %s/%d offlink on %s, errno=%d\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp), err);
}
- else {
- for (ifa = in6_ifaddrs; ifa; ifa = ifa->ia_next) {
- if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0)
- continue;
- ifa->ia6_flags &= ~IN6_IFF_DETACHED;
+ /* Add the entries back */
+ if (opr != NULL) {
+ err = nd6_prefix_onlink_scoped(opr, opr->ndpr_ifp->if_index);
+ if (err != 0) {
+ nd6log(error,
+ "%s: failed to make %s/%d scoped onlink on %s, "
+ "errno=%d\n", __func__,
+ ip6_sprintf(&opr->ndpr_prefix.sin6_addr),
+ opr->ndpr_plen, if_name(opr->ndpr_ifp), err);
}
}
- if (nd6locked == 0)
- lck_mtx_unlock(nd6_mutex);
+
+ err = nd6_prefix_onlink_scoped(pr, IFSCOPE_NONE);
+ if (err != 0) {
+ nd6log(error,
+ "%s: failed to make %s/%d onlink on %s, errno=%d\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp), err);
+ }
+
+ if (err != 0) {
+ nd6log(error,
+ "%s: error promoting %s/%d to %s from %s\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp),
+ (opr != NULL) ? if_name(opr->ndpr_ifp) : "NONE");
+ } else {
+ nd6log2(info,
+ "%s: %s/%d promoted, previously on %s\n",
+ if_name(pr->ndpr_ifp),
+ ip6_sprintf(&pr->ndpr_prefix.sin6_addr), pr->ndpr_plen,
+ (opr != NULL) ? if_name(opr->ndpr_ifp) : "NONE");
+ }
+
+ if (opr != NULL) {
+ NDPR_REMREF(opr);
+ }
}
-int
-nd6_prefix_onlink(
- struct nd_prefix *pr, int rtlocked, int nd6locked)
+static int
+nd6_prefix_onlink_common(struct nd_prefix *pr, boolean_t force_scoped,
+ unsigned int ifscope)
{
struct ifaddr *ifa;
struct ifnet *ifp = pr->ndpr_ifp;
- struct sockaddr_in6 mask6;
+ struct sockaddr_in6 mask6, prefix;
struct nd_prefix *opr;
- u_long rtflags;
- int error = 0;
+ u_int32_t rtflags;
+ int error = 0, prproxy = 0;
struct rtentry *rt = NULL;
+ u_char prefix_len = 0;
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_OWNED);
/* sanity check */
+ NDPR_LOCK(pr);
if ((pr->ndpr_stateflags & NDPRF_ONLINK) != 0) {
- nd6log((LOG_ERR,
- "nd6_prefix_onlink: %s/%d is already on-link\n",
- ip6_sprintf(&pr->ndpr_prefix.sin6_addr), pr->ndpr_plen);
- return(EEXIST));
+ nd6log(error,
+ "%s: %s/%d on %s scoped=%d is already on-link\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp),
+ (pr->ndpr_stateflags & NDPRF_IFSCOPE) ? 1 : 0);
+ NDPR_UNLOCK(pr);
+ return EEXIST;
}
+ NDPR_UNLOCK(pr);
/*
* Add the interface route associated with the prefix. Before
* installing the route, check if there's the same prefix on another
* interface, and the prefix has already installed the interface route.
- * Although such a configuration is expected to be rare, we explicitly
- * allow it.
*/
- if (nd6locked == 0)
- lck_mtx_lock(nd6_mutex);
- else
- lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
- for (opr = nd_prefix.lh_first; opr; opr = opr->ndpr_next) {
- if (opr == pr)
- continue;
-
- if ((opr->ndpr_stateflags & NDPRF_ONLINK) == 0)
- continue;
+ opr = nd6_prefix_equal_lookup(pr, FALSE);
+ if (opr != NULL) {
+ NDPR_REMREF(opr);
+ }
- if (opr->ndpr_plen == pr->ndpr_plen &&
- in6_are_prefix_equal(&pr->ndpr_prefix.sin6_addr,
- &opr->ndpr_prefix.sin6_addr,
- pr->ndpr_plen)) {
- if (nd6locked == 0)
- lck_mtx_unlock(nd6_mutex);
- return(0);
+ if (!force_scoped) {
+ /*
+ * If a primary/non-scoped interface route already exists,
+ * install the new one as a scoped entry. If the existing
+ * interface route is scoped, install new as non-scoped.
+ */
+ ifscope = (opr != NULL) ? ifp->if_index : IFSCOPE_NONE;
+ opr = nd6_prefix_equal_lookup(pr, TRUE);
+ if (opr != NULL) {
+ NDPR_REMREF(opr);
+ } else if (ifscope != IFSCOPE_NONE) {
+ ifscope = IFSCOPE_NONE;
}
}
- if (nd6locked == 0)
- lck_mtx_unlock(nd6_mutex);
/*
- * We prefer link-local addresses as the associated interface address.
+ * We prefer link-local addresses as the associated interface address.
*/
/* search for a link-local addr */
ifa = (struct ifaddr *)in6ifa_ifpforlinklocal(ifp,
- IN6_IFF_NOTREADY|
- IN6_IFF_ANYCAST);
+ IN6_IFF_NOTREADY | IN6_IFF_ANYCAST);
if (ifa == NULL) {
- /* XXX: freebsd does not have ifa_ifwithaf */
- ifnet_lock_exclusive(ifp);
- TAILQ_FOREACH(ifa, &ifp->if_addrlist, ifa_list)
- {
- if (ifa->ifa_addr->sa_family == AF_INET6)
- break;
- }
+ struct in6_ifaddr *ia6;
+ ifnet_lock_shared(ifp);
+ IFP_TO_IA6(ifp, ia6);
ifnet_lock_done(ifp);
+ if (ia6 != NULL) {
+ ifa = &ia6->ia_ifa;
+ }
/* should we care about ia6_flags? */
}
+ NDPR_LOCK(pr);
if (ifa == NULL) {
/*
* This can still happen, when, for example, we receive an RA
* after removing all IPv6 addresses on the receiving
* interface. This should, of course, be rare though.
*/
- nd6log((LOG_NOTICE,
+ nd6log(info,
"nd6_prefix_onlink: failed to find any ifaddr"
" to add route for a prefix(%s/%d) on %s\n",
ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
- pr->ndpr_plen, if_name(ifp)));
- return(0);
+ pr->ndpr_plen, if_name(ifp));
+ NDPR_UNLOCK(pr);
+ return 0;
}
/*
bzero(&mask6, sizeof(mask6));
mask6.sin6_len = sizeof(mask6);
mask6.sin6_addr = pr->ndpr_mask;
+ prefix = pr->ndpr_prefix;
+ prefix_len = pr->ndpr_plen;
+ if ((rt = pr->ndpr_rt) != NULL) {
+ pr->ndpr_rt = NULL;
+ }
+ NDPR_ADDREF(pr); /* keep reference for this routine */
+ NDPR_UNLOCK(pr);
- if (rtlocked == 0)
- lck_mtx_lock(rt_mtx);
-
+ IFA_LOCK_SPIN(ifa);
rtflags = ifa->ifa_flags | RTF_CLONING | RTF_UP;
+ IFA_UNLOCK(ifa);
if (nd6_need_cache(ifp)) {
/* explicitly set in case ifa_flags does not set the flag. */
rtflags |= RTF_CLONING;
*/
rtflags &= ~RTF_CLONING;
}
- error = rtrequest_locked(RTM_ADD, (struct sockaddr *)&pr->ndpr_prefix,
- ifa->ifa_addr, (struct sockaddr *)&mask6,
- rtflags, &rt);
- if (error == 0) {
- if (rt != NULL) /* this should be non NULL, though */
- nd6_rtmsg(RTM_ADD, rt);
- pr->ndpr_stateflags |= NDPRF_ONLINK;
+
+ lck_mtx_unlock(nd6_mutex);
+
+ /*
+ * check if it conflicts with a indirect prefix route added by RIO
+ * if so, remove the rti entry.
+ */
+ if (ifscope == IFSCOPE_NONE) {
+ struct rtentry *temp_route = NULL;
+ LCK_MTX_ASSERT(rnh_lock, LCK_MTX_ASSERT_NOTOWNED);
+ lck_mtx_lock(rnh_lock);
+ temp_route = rt_lookup(TRUE, (struct sockaddr *)&prefix, (struct sockaddr *)&mask6, rt_tables[AF_INET6], IFSCOPE_NONE);
+ lck_mtx_unlock(rnh_lock);
+
+ if (temp_route != NULL && temp_route->rt_flags & RTF_GATEWAY && temp_route->rt_ifp != NULL) {
+ struct nd_route_info rti = {};
+ bzero(&rti, sizeof(rti));
+ rti.nd_rti_prefixlen = prefix_len;
+ rti.nd_rti_prefix = prefix.sin6_addr;
+ lck_mtx_lock(nd6_mutex);
+ nd6_rti_purge(&rti);
+ lck_mtx_unlock(nd6_mutex);
+ }
+ if (temp_route != NULL) {
+ rtfree(temp_route);
+ }
+ }
+
+ if (rt != NULL) {
+ rtfree(rt);
+ rt = NULL;
}
- else {
- nd6log((LOG_ERR, "nd6_prefix_onlink: failed to add route for a"
- " prefix (%s/%d) on %s, gw=%s, mask=%s, flags=%lx "
- "errno = %d\n",
+
+ error = rtrequest_scoped(RTM_ADD, (struct sockaddr *)&prefix,
+ ifa->ifa_addr, (struct sockaddr *)&mask6, rtflags, &rt,
+ ifscope);
+
+ /*
+ * Serialize the setting of NDPRF_PRPROXY.
+ */
+ lck_mtx_lock(&proxy6_lock);
+
+ if (rt != NULL) {
+ RT_LOCK(rt);
+ nd6_rtmsg(RTM_ADD, rt);
+ RT_UNLOCK(rt);
+ NDPR_LOCK(pr);
+ } else {
+ NDPR_LOCK(pr);
+ nd6log(error, "nd6_prefix_onlink: failed to add route for a"
+ " prefix (%s/%d) on %s, gw=%s, mask=%s, flags=%x,"
+ " scoped=%d, errno = %d\n",
ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
pr->ndpr_plen, if_name(ifp),
- ip6_sprintf(&((struct sockaddr_in6 *)ifa->ifa_addr)->sin6_addr),
- ip6_sprintf(&mask6.sin6_addr), rtflags, error));
+ ip6_sprintf(&((struct sockaddr_in6 *)
+ (void *)ifa->ifa_addr)->sin6_addr),
+ ip6_sprintf(&mask6.sin6_addr), rtflags,
+ (ifscope != IFSCOPE_NONE), error);
+ }
+ NDPR_LOCK_ASSERT_HELD(pr);
+
+ pr->ndpr_stateflags &= ~(NDPRF_IFSCOPE | NDPRF_PRPROXY);
+
+ /*
+ * TODO: If the prefix route exists, we should really find it and
+ * refer the prefix to it; otherwise ndpr_rt is NULL.
+ */
+ if (!(pr->ndpr_stateflags & NDPRF_DEFUNCT) &&
+ (rt != NULL || error == EEXIST)) {
+ struct nd_ifinfo *ndi = NULL;
+
+ VERIFY(pr->ndpr_prproxy_sols_cnt == 0);
+ VERIFY(RB_EMPTY(&pr->ndpr_prproxy_sols));
+
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+
+ pr->ndpr_rt = rt; /* keep reference from rtrequest */
+ pr->ndpr_stateflags |= NDPRF_ONLINK;
+ if (ifscope != IFSCOPE_NONE) {
+ pr->ndpr_stateflags |= NDPRF_IFSCOPE;
+ } else if ((rtflags & RTF_CLONING) &&
+ (ndi->flags & ND6_IFF_PROXY_PREFIXES) &&
+ !IN6_IS_ADDR_LINKLOCAL(&pr->ndpr_prefix.sin6_addr)) {
+ /*
+ * At present, in order for the prefix to be eligible
+ * as a proxying/proxied prefix, we require that the
+ * prefix route entry be marked as a cloning route with
+ * RTF_PROXY; i.e. nd6_need_cache() needs to return
+ * true for the interface type, hence the test for
+ * RTF_CLONING above.
+ */
+ pr->ndpr_stateflags |= NDPRF_PRPROXY;
+ }
+
+ lck_mtx_unlock(&ndi->lock);
+ } else if (rt != NULL && pr->ndpr_stateflags & NDPRF_DEFUNCT) {
+ rtfree(rt);
}
- if (rt != NULL)
- rtunref(rt);
+ prproxy = (pr->ndpr_stateflags & NDPRF_PRPROXY);
+ VERIFY(!prproxy || !(pr->ndpr_stateflags & NDPRF_IFSCOPE));
+ NDPR_UNLOCK(pr);
+
+ IFA_REMREF(ifa);
+
+ /*
+ * If this is an upstream prefix, find the downstream ones (if any)
+ * and re-configure their prefix routes accordingly. Otherwise,
+ * this could be potentially be a downstream prefix, and so find the
+ * upstream prefix, if any.
+ */
+ nd6_prproxy_prelist_update(pr, prproxy ? pr : NULL);
+
+ NDPR_REMREF(pr); /* release reference for this routine */
+ lck_mtx_unlock(&proxy6_lock);
+
+ lck_mtx_lock(nd6_mutex);
+
+ return error;
+}
- if (rtlocked == 0)
- lck_mtx_unlock(rt_mtx);
- return(error);
+int
+nd6_prefix_onlink(struct nd_prefix *pr)
+{
+ return nd6_prefix_onlink_common(pr, FALSE, IFSCOPE_NONE);
}
int
-nd6_prefix_offlink(
- struct nd_prefix *pr)
+nd6_prefix_onlink_scoped(struct nd_prefix *pr, unsigned int ifscope)
{
- int error = 0;
+ return nd6_prefix_onlink_common(pr, TRUE, ifscope);
+}
+
+int
+nd6_prefix_offlink(struct nd_prefix *pr)
+{
+ int plen, error = 0, prproxy;
struct ifnet *ifp = pr->ndpr_ifp;
- struct nd_prefix *opr;
- struct sockaddr_in6 sa6, mask6;
- struct rtentry *rt = NULL;
+ struct sockaddr_in6 sa6, mask6, prefix;
+ struct rtentry *rt = NULL, *ndpr_rt = NULL;
+ unsigned int ifscope;
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_NOTOWNED);
/* sanity check */
+ NDPR_LOCK(pr);
if ((pr->ndpr_stateflags & NDPRF_ONLINK) == 0) {
- nd6log((LOG_ERR,
- "nd6_prefix_offlink: %s/%d is already off-link\n",
- ip6_sprintf(&pr->ndpr_prefix.sin6_addr), pr->ndpr_plen));
- return(EEXIST);
+ nd6log(error,
+ "nd6_prefix_offlink: %s/%d on %s scoped=%d is already "
+ "off-link\n", ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp),
+ (pr->ndpr_stateflags & NDPRF_IFSCOPE) ? 1 : 0);
+ NDPR_UNLOCK(pr);
+ return EEXIST;
}
bzero(&sa6, sizeof(sa6));
sa6.sin6_family = AF_INET6;
sa6.sin6_len = sizeof(sa6);
bcopy(&pr->ndpr_prefix.sin6_addr, &sa6.sin6_addr,
- sizeof(struct in6_addr));
+ sizeof(struct in6_addr));
bzero(&mask6, sizeof(mask6));
mask6.sin6_family = AF_INET6;
mask6.sin6_len = sizeof(sa6);
bcopy(&pr->ndpr_mask, &mask6.sin6_addr, sizeof(struct in6_addr));
- lck_mtx_lock(rt_mtx);
- error = rtrequest_locked(RTM_DELETE, (struct sockaddr *)&sa6, NULL,
- (struct sockaddr *)&mask6, 0, &rt);
- if (error == 0) {
- pr->ndpr_stateflags &= ~NDPRF_ONLINK;
-
- /* report the route deletion to the routing socket. */
- if (rt != NULL)
- nd6_rtmsg(RTM_DELETE, rt);
-
- /*
- * There might be the same prefix on another interface,
- * the prefix which could not be on-link just because we have
- * the interface route (see comments in nd6_prefix_onlink).
- * If there's one, try to make the prefix on-link on the
- * interface.
- */
- lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
- for (opr = nd_prefix.lh_first; opr; opr = opr->ndpr_next) {
- if (opr == pr)
- continue;
-
- if ((opr->ndpr_stateflags & NDPRF_ONLINK) != 0)
- continue;
+ prefix = pr->ndpr_prefix;
+ plen = pr->ndpr_plen;
+ if ((ndpr_rt = pr->ndpr_rt) != NULL) {
+ pr->ndpr_rt = NULL;
+ }
+ NDPR_ADDREF(pr); /* keep reference for this routine */
+ NDPR_UNLOCK(pr);
- /*
- * KAME specific: detached prefixes should not be
- * on-link.
- */
- if ((opr->ndpr_stateflags & NDPRF_DETACHED) != 0)
- continue;
+ ifscope = (pr->ndpr_stateflags & NDPRF_IFSCOPE) ?
+ ifp->if_index : IFSCOPE_NONE;
- if (opr->ndpr_plen == pr->ndpr_plen &&
- in6_are_prefix_equal(&pr->ndpr_prefix.sin6_addr,
- &opr->ndpr_prefix.sin6_addr,
- pr->ndpr_plen)) {
- int e;
+ error = rtrequest_scoped(RTM_DELETE, (struct sockaddr *)&sa6,
+ NULL, (struct sockaddr *)&mask6, 0, &rt, ifscope);
- if ((e = nd6_prefix_onlink(opr, 1, 1)) != 0) {
- nd6log((LOG_ERR,
- "nd6_prefix_offlink: failed to "
- "recover a prefix %s/%d from %s "
- "to %s (errno = %d)\n",
- ip6_sprintf(&opr->ndpr_prefix.sin6_addr),
- opr->ndpr_plen, if_name(ifp),
- if_name(opr->ndpr_ifp), e));
- }
- }
- }
- }
- else {
- /* XXX: can we still set the NDPRF_ONLINK flag? */
- nd6log((LOG_ERR,
+ if (rt != NULL) {
+ /* report the route deletion to the routing socket. */
+ RT_LOCK(rt);
+ nd6_rtmsg(RTM_DELETE, rt);
+ RT_UNLOCK(rt);
+ rtfree(rt);
+ } else {
+ nd6log(error,
"nd6_prefix_offlink: failed to delete route: "
- "%s/%d on %s (errno = %d)\n",
- ip6_sprintf(&sa6.sin6_addr), pr->ndpr_plen, if_name(ifp),
- error));
+ "%s/%d on %s, scoped %d, (errno = %d)\n",
+ ip6_sprintf(&sa6.sin6_addr), plen, if_name(ifp),
+ (ifscope != IFSCOPE_NONE), error);
}
- if (rt != NULL) {
- if (rt->rt_refcnt <= 0) {
- /* XXX: we should free the entry ourselves. */
- rtref(rt);
- rtfree_locked(rt);
- }
+ if (ndpr_rt != NULL) {
+ rtfree(ndpr_rt);
+ }
+
+ lck_mtx_lock(&proxy6_lock);
+
+ NDPR_LOCK(pr);
+ prproxy = (pr->ndpr_stateflags & NDPRF_PRPROXY);
+ VERIFY(!prproxy || !(pr->ndpr_stateflags & NDPRF_IFSCOPE));
+ pr->ndpr_stateflags &= ~(NDPRF_ONLINK | NDPRF_IFSCOPE | NDPRF_PRPROXY);
+ if (pr->ndpr_prproxy_sols_cnt > 0) {
+ VERIFY(prproxy);
+ nd6_prproxy_sols_reap(pr);
+ VERIFY(pr->ndpr_prproxy_sols_cnt == 0);
+ VERIFY(RB_EMPTY(&pr->ndpr_prproxy_sols));
}
- lck_mtx_unlock(rt_mtx);
+ NDPR_UNLOCK(pr);
+
+ /*
+ * If this was an upstream prefix, find the downstream ones and do
+ * some cleanups. If this was a downstream prefix, the prefix route
+ * has been removed from the routing table above, but there may be
+ * other tasks to perform.
+ */
+ nd6_prproxy_prelist_update(pr, prproxy ? pr : NULL);
- return(error);
+ NDPR_REMREF(pr); /* release reference for this routine */
+ lck_mtx_unlock(&proxy6_lock);
+
+ return error;
}
-static struct in6_ifaddr *
-in6_ifadd(
- struct nd_prefix *pr,
- struct in6_addr *ifid) /* Mobile IPv6 addition */
+struct in6_ifaddr *
+in6_pfx_newpersistaddr(struct nd_prefix *pr, int mcast, int *errorp,
+ boolean_t is_clat46, uint8_t collision_count)
{
- struct ifnet *ifp = pr->ndpr_ifp;
- struct ifaddr *ifa;
- struct in6_aliasreq ifra;
- struct in6_ifaddr *ia, *ib;
- int error, plen0;
+ struct in6_ifaddr *ia6 = NULL;
+ struct ifnet *ifp = NULL;
+ struct nd_ifinfo *ndi = NULL;
struct in6_addr mask;
- int prefixlen = pr->ndpr_plen;
+ struct in6_aliasreq ifra;
+ int error, ifaupdate, iidlen, notcga;
- in6_len2mask(&mask, prefixlen);
+ VERIFY(pr != NULL);
+ VERIFY(errorp != NULL);
+
+ NDPR_LOCK(pr);
+ ifp = pr->ndpr_ifp;
+ ia6 = NULL;
+ error = 0;
/*
- * find a link-local address (will be interface ID).
- * Is it really mandatory? Theoretically, a global or a site-local
- * address can be configured without a link-local address, if we
- * have a unique interface identifier...
- *
- * it is not mandatory to have a link-local address, we can generate
- * interface identifier on the fly. we do this because:
- * (1) it should be the easiest way to find interface identifier.
- * (2) RFC2462 5.4 suggesting the use of the same interface identifier
- * for multiple addresses on a single interface, and possible shortcut
- * of DAD. we omitted DAD for this reason in the past.
- * (3) a user can prevent autoconfiguration of global address
- * by removing link-local address by hand (this is partly because we
- * don't have other way to control the use of IPv6 on a interface.
- * this has been our design choice - cf. NRL's "ifconfig auto").
- * (4) it is easier to manage when an interface has addresses
- * with the same interface identifier, than to have multiple addresses
- * with different interface identifiers.
- *
- * Mobile IPv6 addition: allow for caller to specify a wished interface
- * ID. This is to not break connections when moving addresses between
- * interfaces.
+ * Prefix Length check:
+ * If the sum of the prefix length and interface identifier
+ * length does not equal 128 bits, the Prefix Information
+ * option MUST be ignored. The length of the interface
+ * identifier is defined in a separate link-type specific
+ * document.
*/
- ifa = (struct ifaddr *)in6ifa_ifpforlinklocal(ifp, 0);/* 0 is OK? */
- if (ifa)
- ib = (struct in6_ifaddr *)ifa;
- else
- return NULL;
-
-#if 0 /* don't care link local addr state, and always do DAD */
- /* if link-local address is not eligible, do not autoconfigure. */
- if (((struct in6_ifaddr *)ifa)->ia6_flags & IN6_IFF_NOTREADY) {
- printf("in6_ifadd: link-local address not ready\n");
- return NULL;
+ iidlen = in6_if2idlen(ifp);
+ if (iidlen < 0) {
+ error = EADDRNOTAVAIL;
+ /* this should not happen, so we always log it. */
+ log(LOG_ERR, "%s: IID length undefined (%s)\n",
+ __func__, if_name(ifp));
+ goto unlock1;
+ } else if (iidlen != 64) {
+ error = EADDRNOTAVAIL;
+ /*
+ * stateless autoconfiguration not yet well-defined for IID
+ * lengths other than 64 octets. Just give up for now.
+ */
+ nd6log(info, "%s: IID length not 64 octets (%s)\n",
+ __func__, if_name(ifp));
+ goto unlock1;
}
-#endif
- /* prefixlen + ifidlen must be equal to 128 */
- plen0 = in6_mask2len(&ib->ia_prefixmask.sin6_addr, NULL);
- if (prefixlen != plen0) {
- nd6log((LOG_INFO, "in6_ifadd: wrong prefixlen for %s "
- "(prefix=%d ifid=%d)\n",
- if_name(ifp), prefixlen, 128 - plen0));
- return NULL;
+ if (iidlen + pr->ndpr_plen != 128) {
+ error = EADDRNOTAVAIL;
+ nd6log(info,
+ "%s: invalid prefix length %d for %s, ignored\n",
+ __func__, pr->ndpr_plen, if_name(ifp));
+ goto unlock1;
}
- /* make ifaddr */
-
bzero(&ifra, sizeof(ifra));
- /*
- * in6_update_ifa() does not use ifra_name, but we accurately set it
- * for safety.
- */
- strncpy(ifra.ifra_name, if_name(ifp), sizeof(ifra.ifra_name));
+ strlcpy(ifra.ifra_name, if_name(ifp), sizeof(ifra.ifra_name));
ifra.ifra_addr.sin6_family = AF_INET6;
ifra.ifra_addr.sin6_len = sizeof(struct sockaddr_in6);
+
/* prefix */
bcopy(&pr->ndpr_prefix.sin6_addr, &ifra.ifra_addr.sin6_addr,
- sizeof(ifra.ifra_addr.sin6_addr));
+ sizeof(ifra.ifra_addr.sin6_addr));
+ in6_len2mask(&mask, pr->ndpr_plen);
ifra.ifra_addr.sin6_addr.s6_addr32[0] &= mask.s6_addr32[0];
ifra.ifra_addr.sin6_addr.s6_addr32[1] &= mask.s6_addr32[1];
ifra.ifra_addr.sin6_addr.s6_addr32[2] &= mask.s6_addr32[2];
ifra.ifra_addr.sin6_addr.s6_addr32[3] &= mask.s6_addr32[3];
- /* interface ID */
- if (ifid == NULL || IN6_IS_ADDR_UNSPECIFIED(ifid))
- ifid = &ib->ia_addr.sin6_addr;
- ifra.ifra_addr.sin6_addr.s6_addr32[0]
- |= (ifid->s6_addr32[0] & ~mask.s6_addr32[0]);
- ifra.ifra_addr.sin6_addr.s6_addr32[1]
- |= (ifid->s6_addr32[1] & ~mask.s6_addr32[1]);
- ifra.ifra_addr.sin6_addr.s6_addr32[2]
- |= (ifid->s6_addr32[2] & ~mask.s6_addr32[2]);
- ifra.ifra_addr.sin6_addr.s6_addr32[3]
- |= (ifid->s6_addr32[3] & ~mask.s6_addr32[3]);
-
+ ndi = ND_IFINFO(ifp);
+ VERIFY(ndi->initialized);
+ lck_mtx_lock(&ndi->lock);
+
+ notcga = nd6_send_opstate == ND6_SEND_OPMODE_DISABLED ||
+ (ndi->flags & ND6_IFF_INSECURE) != 0;
+
+ lck_mtx_unlock(&ndi->lock);
+ NDPR_UNLOCK(pr);
+
+ if (notcga && !is_clat46) {
+ ia6 = in6ifa_ifpforlinklocal(ifp, 0);
+ if (ia6 == NULL) {
+ error = EADDRNOTAVAIL;
+ nd6log(info, "%s: no link-local address (%s)\n",
+ __func__, if_name(ifp));
+ goto done;
+ }
+
+ IFA_LOCK(&ia6->ia_ifa);
+ ifra.ifra_addr.sin6_addr.s6_addr32[0] |=
+ (ia6->ia_addr.sin6_addr.s6_addr32[0] & ~mask.s6_addr32[0]);
+ ifra.ifra_addr.sin6_addr.s6_addr32[1] |=
+ (ia6->ia_addr.sin6_addr.s6_addr32[1] & ~mask.s6_addr32[1]);
+ ifra.ifra_addr.sin6_addr.s6_addr32[2] |=
+ (ia6->ia_addr.sin6_addr.s6_addr32[2] & ~mask.s6_addr32[2]);
+ ifra.ifra_addr.sin6_addr.s6_addr32[3] |=
+ (ia6->ia_addr.sin6_addr.s6_addr32[3] & ~mask.s6_addr32[3]);
+ IFA_UNLOCK(&ia6->ia_ifa);
+ IFA_REMREF(&ia6->ia_ifa);
+ ia6 = NULL;
+ } else {
+ struct in6_cga_prepare local_cga_prepare;
+ struct in6_cga_prepare *prepare_p;
+
+
+ in6_cga_node_lock();
+
+ if (ndi->cga_initialized) {
+ bcopy(&(ndi->local_cga_modifier),
+ &(local_cga_prepare.cga_modifier),
+ sizeof(local_cga_prepare.cga_modifier));
+ prepare_p = &local_cga_prepare;
+ } else {
+ prepare_p = NULL;
+ }
+ error = in6_cga_generate(prepare_p, collision_count,
+ &ifra.ifra_addr.sin6_addr, ifp);
+ in6_cga_node_unlock();
+ if (error == 0) {
+ ifra.ifra_flags |= IN6_IFF_SECURED;
+ if (is_clat46) {
+ ifra.ifra_flags |= IN6_IFF_CLAT46;
+ }
+ } else {
+ if (!is_clat46) {
+ nd6log(error, "%s: no CGA available (%s)\n",
+ __func__, if_name(ifp));
+ } else {
+ nd6log(error, "%s: no CLAT46 available (%s)\n",
+ __func__, if_name(ifp));
+ }
+ goto done;
+ }
+ }
+
+ VERIFY(ia6 == NULL);
+
/* new prefix mask. */
ifra.ifra_prefixmask.sin6_len = sizeof(struct sockaddr_in6);
ifra.ifra_prefixmask.sin6_family = AF_INET6;
bcopy(&mask, &ifra.ifra_prefixmask.sin6_addr,
- sizeof(ifra.ifra_prefixmask.sin6_addr));
+ sizeof(ifra.ifra_prefixmask.sin6_addr));
- /*
- * lifetime.
- * XXX: in6_init_address_ltimes would override these values later.
- * We should reconsider this logic.
- */
+ /* lifetimes. */
ifra.ifra_lifetime.ia6t_vltime = pr->ndpr_vltime;
ifra.ifra_lifetime.ia6t_pltime = pr->ndpr_pltime;
- /* XXX: scope zone ID? */
-
+ /* address flags */
ifra.ifra_flags |= IN6_IFF_AUTOCONF; /* obey autoconf */
+
/*
- * temporarily set the nopfx flag to avoid conflict.
- * XXX: we should reconsider the entire mechanism about prefix
- * manipulation.
+ * Make sure that we do not have this address already. This should
+ * usually not happen, but we can still see this case, e.g., if we
+ * have manually configured the exact address to be configured.
*/
- ifra.ifra_flags |= IN6_IFF_NOPFX;
+ if ((ia6 = in6ifa_ifpwithaddr(ifp, &ifra.ifra_addr.sin6_addr))
+ != NULL) {
+ error = EEXIST;
+ IFA_REMREF(&ia6->ia_ifa);
+ ia6 = NULL;
+
+ /* this should be rare enough to make an explicit log */
+ log(LOG_INFO, "%s: %s is already configured!\n",
+ __func__, ip6_sprintf(&ifra.ifra_addr.sin6_addr));
+ goto done;
+ }
/*
- * keep the new address, regardless of the result of in6_update_ifa.
- * XXX: this address is now meaningless.
- * We should reconsider its role.
+ * Allocate ifaddr structure, link into chain, etc.
+ * If we are going to create a new address upon receiving a multicasted
+ * RA, we need to impose a random delay before starting DAD.
+ * [RFC 4862, Section 5.4.2]
*/
- pr->ndpr_addr = ifra.ifra_addr.sin6_addr;
-
- /* allocate ifaddr structure, link into chain, etc. */
- if ((error = in6_update_ifa(ifp, &ifra, NULL)) != 0) {
- nd6log((LOG_ERR,
- "in6_ifadd: failed to make ifaddr %s on %s (errno=%d)\n",
- ip6_sprintf(&ifra.ifra_addr.sin6_addr), if_name(ifp),
- error));
- return(NULL); /* ifaddr must not have been allocated. */
+ ifaupdate = IN6_IFAUPDATE_NOWAIT;
+ if (mcast) {
+ ifaupdate |= IN6_IFAUPDATE_DADDELAY;
+ }
+ error = in6_update_ifa(ifp, &ifra, ifaupdate, &ia6);
+ if (error != 0) {
+ nd6log(error,
+ "%s: failed to make ifaddr %s on %s (errno=%d)\n",
+ __func__, ip6_sprintf(&ifra.ifra_addr.sin6_addr),
+ if_name(ifp), error);
+ error = EADDRNOTAVAIL;
+ goto done;
+ } else {
+ /* remember the collision count */
+ ia6->ia6_cga_collision_count = collision_count;
}
- ia = in6ifa_ifpwithaddr(ifp, &ifra.ifra_addr.sin6_addr);
+ VERIFY(ia6 != NULL);
+ in6_post_msg(ifp, KEV_INET6_NEW_RTADV_ADDR, ia6, NULL);
+ goto done;
- in6_post_msg(ifp, KEV_INET6_NEW_RTADV_ADDR, ia);
+unlock1:
+ NDPR_UNLOCK(pr);
- return(ia); /* this must NOT be NULL. */
+done:
+ *errorp = error;
+ return ia6;
}
+#define IA6_NONCONST(i) ((struct in6_ifaddr *)(uintptr_t)(i))
+
int
-in6_tmpifadd(
- const struct in6_ifaddr *ia0, /* corresponding public address */
- int forcegen)
+in6_tmpifadd(const struct in6_ifaddr *ia0, int forcegen)
{
struct ifnet *ifp = ia0->ia_ifa.ifa_ifp;
- struct in6_ifaddr *newia;
+ struct in6_ifaddr *ia, *newia;
struct in6_aliasreq ifra;
- int i, error;
- int trylimit = 3; /* XXX: adhoc value */
+ int i, error, ifaupdate;
+ int trylimit = 3; /* XXX: adhoc value */
u_int32_t randid[2];
- time_t vltime0, pltime0;
- struct timeval timenow;
-
- getmicrotime(&timenow);
+ uint32_t vltime0, pltime0;
+ uint64_t timenow = net_uptime();
+ struct in6_addr addr;
+ struct nd_prefix *ndpr;
bzero(&ifra, sizeof(ifra));
- strncpy(ifra.ifra_name, if_name(ifp), sizeof(ifra.ifra_name));
+ strlcpy(ifra.ifra_name, if_name(ifp), sizeof(ifra.ifra_name));
+ IFA_LOCK(&IA6_NONCONST(ia0)->ia_ifa);
ifra.ifra_addr = ia0->ia_addr;
/* copy prefix mask */
ifra.ifra_prefixmask = ia0->ia_prefixmask;
/* clear the old IFID */
for (i = 0; i < 4; i++) {
ifra.ifra_addr.sin6_addr.s6_addr32[i]
- &= ifra.ifra_prefixmask.sin6_addr.s6_addr32[i];
+ &= ifra.ifra_prefixmask.sin6_addr.s6_addr32[i];
}
+ addr = ia0->ia_addr.sin6_addr;
+ IFA_UNLOCK(&IA6_NONCONST(ia0)->ia_ifa);
+
+again:
+ in6_iid_mktmp(ifp, (u_int8_t *)randid,
+ (const u_int8_t *)&addr.s6_addr[8], forcegen);
- again:
- in6_get_tmpifid(ifp, (u_int8_t *)randid,
- (const u_int8_t *)&ia0->ia_addr.sin6_addr.s6_addr[8],
- forcegen);
- ifra.ifra_addr.sin6_addr.s6_addr32[2]
- |= (randid[0] & ~(ifra.ifra_prefixmask.sin6_addr.s6_addr32[2]));
- ifra.ifra_addr.sin6_addr.s6_addr32[3]
- |= (randid[1] & ~(ifra.ifra_prefixmask.sin6_addr.s6_addr32[3]));
+ ifra.ifra_addr.sin6_addr.s6_addr32[2] |=
+ (randid[0] & ~(ifra.ifra_prefixmask.sin6_addr.s6_addr32[2]));
+ ifra.ifra_addr.sin6_addr.s6_addr32[3] |=
+ (randid[1] & ~(ifra.ifra_prefixmask.sin6_addr.s6_addr32[3]));
/*
- * If by chance the new temporary address is the same as an address
- * already assigned to the interface, generate a new randomized
- * interface identifier and repeat this step.
- * RFC 3041 3.3 (4).
+ * in6_iid_mktmp() quite likely provided a unique interface ID.
+ * However, we may still have a chance to see collision, because
+ * there may be a time lag between generation of the ID and generation
+ * of the address. So, we'll do one more sanity check.
*/
- if (in6ifa_ifpwithaddr(ifp, &ifra.ifra_addr.sin6_addr) != NULL) {
+ if ((ia = in6ifa_ifpwithaddr(ifp, &ifra.ifra_addr.sin6_addr)) != NULL) {
+ IFA_REMREF(&ia->ia_ifa);
if (trylimit-- == 0) {
- nd6log((LOG_NOTICE, "in6_tmpifadd: failed to find "
- "a unique random IFID\n"));
- return(EEXIST);
+ nd6log(info, "in6_tmpifadd: failed to find "
+ "a unique random IFID\n");
+ return EEXIST;
}
forcegen = 1;
goto again;
/*
* The Valid Lifetime is the lower of the Valid Lifetime of the
- * public address or TEMP_VALID_LIFETIME.
+ * public address or TEMP_VALID_LIFETIME.
* The Preferred Lifetime is the lower of the Preferred Lifetime
- * of the public address or TEMP_PREFERRED_LIFETIME -
- * DESYNC_FACTOR.
+ * of the public address or TEMP_PREFERRED_LIFETIME -
+ * DESYNC_FACTOR.
*/
- if (ia0->ia6_lifetime.ia6t_expire != 0) {
- vltime0 = IFA6_IS_INVALID(ia0) ? 0 :
- (ia0->ia6_lifetime.ia6t_expire - timenow.tv_sec);
- if (vltime0 > ip6_temp_valid_lifetime)
+ IFA_LOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ if (ia0->ia6_lifetime.ia6ti_vltime != ND6_INFINITE_LIFETIME) {
+ vltime0 = IFA6_IS_INVALID(ia0, timenow) ? 0 :
+ (ia0->ia6_lifetime.ia6ti_vltime -
+ (uint32_t)(timenow - ia0->ia6_updatetime));
+ if (vltime0 > ip6_temp_valid_lifetime) {
vltime0 = ip6_temp_valid_lifetime;
- } else
+ }
+ } else {
vltime0 = ip6_temp_valid_lifetime;
- if (ia0->ia6_lifetime.ia6t_preferred != 0) {
- pltime0 = IFA6_IS_DEPRECATED(ia0) ? 0 :
- (ia0->ia6_lifetime.ia6t_preferred - timenow.tv_sec);
- if (pltime0 > ip6_temp_preferred_lifetime - ip6_desync_factor){
+ }
+ if (ia0->ia6_lifetime.ia6ti_pltime != ND6_INFINITE_LIFETIME) {
+ pltime0 = IFA6_IS_DEPRECATED(ia0, timenow) ? 0 :
+ (ia0->ia6_lifetime.ia6ti_pltime -
+ (uint32_t)(timenow - ia0->ia6_updatetime));
+ if (pltime0 > ip6_temp_preferred_lifetime - ip6_desync_factor) {
pltime0 = ip6_temp_preferred_lifetime -
- ip6_desync_factor;
+ ip6_desync_factor;
}
- } else
+ } else {
pltime0 = ip6_temp_preferred_lifetime - ip6_desync_factor;
+ }
ifra.ifra_lifetime.ia6t_vltime = vltime0;
ifra.ifra_lifetime.ia6t_pltime = pltime0;
-
+ IFA_UNLOCK(&IA6_NONCONST(ia0)->ia_ifa);
/*
* A temporary address is created only if this calculated Preferred
* Lifetime is greater than REGEN_ADVANCE time units.
*/
- if (ifra.ifra_lifetime.ia6t_pltime <= ip6_temp_regen_advance)
- return(0);
+ if (ifra.ifra_lifetime.ia6t_pltime <= ip6_temp_regen_advance) {
+ return 0;
+ }
/* XXX: scope zone ID? */
- ifra.ifra_flags |= (IN6_IFF_AUTOCONF|IN6_IFF_TEMPORARY);
+ ifra.ifra_flags |= (IN6_IFF_AUTOCONF | IN6_IFF_TEMPORARY);
/* allocate ifaddr structure, link into chain, etc. */
- if ((error = in6_update_ifa(ifp, &ifra, NULL)) != 0)
- return(error);
-
- newia = in6ifa_ifpwithaddr(ifp, &ifra.ifra_addr.sin6_addr);
- if (newia == NULL) { /* XXX: can it happen? */
- nd6log((LOG_ERR,
- "in6_tmpifadd: ifa update succeeded, but we got "
- "no ifaddr\n"));
- return(EINVAL); /* XXX */
+ ifaupdate = IN6_IFAUPDATE_NOWAIT | IN6_IFAUPDATE_DADDELAY;
+ error = in6_update_ifa(ifp, &ifra, ifaupdate, &newia);
+ if (error != 0) {
+ nd6log(error, "in6_tmpifadd: failed to add address.\n");
+ return error;
}
- newia->ia6_ndpr = ia0->ia6_ndpr;
- newia->ia6_ndpr->ndpr_refcnt++;
+ VERIFY(newia != NULL);
+ IFA_LOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ ndpr = ia0->ia6_ndpr;
+ if (ndpr == NULL) {
+ /*
+ * We lost the race with another thread that has purged
+ * ia0 address; in this case, purge the tmp addr as well.
+ */
+ nd6log(error, "in6_tmpifadd: no public address\n");
+ VERIFY(!(ia0->ia6_flags & IN6_IFF_AUTOCONF));
+ IFA_UNLOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ in6_purgeaddr(&newia->ia_ifa);
+ IFA_REMREF(&newia->ia_ifa);
+ return EADDRNOTAVAIL;
+ }
+ NDPR_ADDREF(ndpr); /* for us */
+ IFA_UNLOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ IFA_LOCK(&newia->ia_ifa);
+ if (newia->ia6_ndpr != NULL) {
+ NDPR_LOCK(newia->ia6_ndpr);
+ VERIFY(newia->ia6_ndpr->ndpr_addrcnt != 0);
+ newia->ia6_ndpr->ndpr_addrcnt--;
+ NDPR_UNLOCK(newia->ia6_ndpr);
+ NDPR_REMREF(newia->ia6_ndpr); /* release addr reference */
+ }
+ newia->ia6_ndpr = ndpr;
+ NDPR_LOCK(newia->ia6_ndpr);
+ newia->ia6_ndpr->ndpr_addrcnt++;
+ VERIFY(newia->ia6_ndpr->ndpr_addrcnt != 0);
+ NDPR_ADDREF(newia->ia6_ndpr); /* for addr reference */
+ NDPR_UNLOCK(newia->ia6_ndpr);
+ IFA_UNLOCK(&newia->ia_ifa);
/*
* A newly added address might affect the status of other addresses.
* XXX: when the temporary address is generated with a new public
* and, in fact, we surely need the check when we create a new
* temporary address due to deprecation of an old temporary address.
*/
- pfxlist_onlink_check(0);
+ lck_mtx_lock(nd6_mutex);
+ pfxlist_onlink_check();
+ lck_mtx_unlock(nd6_mutex);
+ IFA_REMREF(&newia->ia_ifa);
+
+ /* remove our reference */
+ NDPR_REMREF(ndpr);
- return(0);
-}
+ return 0;
+}
+#undef IA6_NONCONST
int
in6_init_prefix_ltimes(struct nd_prefix *ndpr)
{
- struct timeval timenow;
+ struct timeval caltime;
+ u_int64_t timenow = net_uptime();
- getmicrotime(&timenow);
- /* check if preferred lifetime > valid lifetime. RFC2462 5.5.3 (c) */
+ NDPR_LOCK_ASSERT_HELD(ndpr);
+
+ getmicrotime(&caltime);
+ ndpr->ndpr_base_calendartime = caltime.tv_sec;
+ ndpr->ndpr_base_uptime = timenow;
+
+ /* check if preferred lifetime > valid lifetime. RFC 4862 5.5.3 (c) */
if (ndpr->ndpr_pltime > ndpr->ndpr_vltime) {
- nd6log((LOG_INFO, "in6_init_prefix_ltimes: preferred lifetime"
+ nd6log(info, "in6_init_prefix_ltimes: preferred lifetime"
"(%d) is greater than valid lifetime(%d)\n",
- (u_int)ndpr->ndpr_pltime, (u_int)ndpr->ndpr_vltime));
- return (EINVAL);
+ (u_int)ndpr->ndpr_pltime, (u_int)ndpr->ndpr_vltime);
+ return EINVAL;
}
- if (ndpr->ndpr_pltime == ND6_INFINITE_LIFETIME)
+ if (ndpr->ndpr_pltime == ND6_INFINITE_LIFETIME) {
ndpr->ndpr_preferred = 0;
- else
- ndpr->ndpr_preferred = timenow.tv_sec + ndpr->ndpr_pltime;
- if (ndpr->ndpr_vltime == ND6_INFINITE_LIFETIME)
+ } else {
+ ndpr->ndpr_preferred = timenow + ndpr->ndpr_pltime;
+ }
+ if (ndpr->ndpr_vltime == ND6_INFINITE_LIFETIME) {
ndpr->ndpr_expire = 0;
- else
- ndpr->ndpr_expire = timenow.tv_sec + ndpr->ndpr_vltime;
+ } else {
+ ndpr->ndpr_expire = timenow + ndpr->ndpr_vltime;
+ }
return 0;
}
static void
in6_init_address_ltimes(struct nd_prefix *new, struct in6_addrlifetime *lt6)
{
- struct timeval timenow;
+#pragma unused(new)
+ uint64_t timenow = net_uptime();
- getmicrotime(&timenow);
/* Valid lifetime must not be updated unless explicitly specified. */
/* init ia6t_expire */
- if (lt6->ia6t_vltime == ND6_INFINITE_LIFETIME)
+ if (lt6->ia6t_vltime == ND6_INFINITE_LIFETIME) {
lt6->ia6t_expire = 0;
- else {
- lt6->ia6t_expire = timenow.tv_sec;
+ } else {
+ lt6->ia6t_expire = timenow;
lt6->ia6t_expire += lt6->ia6t_vltime;
}
/* init ia6t_preferred */
- if (lt6->ia6t_pltime == ND6_INFINITE_LIFETIME)
+ if (lt6->ia6t_pltime == ND6_INFINITE_LIFETIME) {
lt6->ia6t_preferred = 0;
- else {
- lt6->ia6t_preferred = timenow.tv_sec;
+ } else {
+ lt6->ia6t_preferred = timenow;
lt6->ia6t_preferred += lt6->ia6t_pltime;
}
}
* Delete all the routing table entries that use the specified gateway.
* XXX: this function causes search through all entries of routing table, so
* it shouldn't be called when acting as a router.
+ *
+ * This should really be working on entries that have a specific
+ * parent route.
*/
void
rt6_flush(
if (!IN6_IS_ADDR_LINKLOCAL(gateway)) {
return;
}
- lck_mtx_lock(rt_mtx);
+ lck_mtx_lock(rnh_lock);
/* XXX: hack for KAME's link-local address kludge */
gateway->s6_addr16[1] = htons(ifp->if_index);
rnh->rnh_walktree(rnh, rt6_deleteroute, (void *)gateway);
- lck_mtx_unlock(rt_mtx);
+ lck_mtx_unlock(rnh_lock);
}
static int
struct radix_node *rn,
void *arg)
{
-#define SIN6(s) ((struct sockaddr_in6 *)s)
struct rtentry *rt = (struct rtentry *)rn;
struct in6_addr *gate = (struct in6_addr *)arg;
- lck_mtx_assert(rt_mtx, LCK_MTX_ASSERT_OWNED);
-
- if (rt->rt_gateway == NULL || rt->rt_gateway->sa_family != AF_INET6)
- return(0);
+ LCK_MTX_ASSERT(rnh_lock, LCK_MTX_ASSERT_OWNED);
- if (!IN6_ARE_ADDR_EQUAL(gate, &SIN6(rt->rt_gateway)->sin6_addr))
- return(0);
+ RT_LOCK(rt);
+ if (rt->rt_gateway == NULL || rt->rt_gateway->sa_family != AF_INET6) {
+ RT_UNLOCK(rt);
+ return 0;
+ }
+ if (!IN6_ARE_ADDR_EQUAL(gate, &SIN6(rt->rt_gateway)->sin6_addr)) {
+ RT_UNLOCK(rt);
+ return 0;
+ }
/*
* Do not delete a static route.
* XXX: this seems to be a bit ad-hoc. Should we consider the
* 'cloned' bit instead?
*/
- if ((rt->rt_flags & RTF_STATIC) != 0)
- return(0);
-
+ if ((rt->rt_flags & RTF_STATIC) != 0) {
+ RT_UNLOCK(rt);
+ return 0;
+ }
/*
* We delete only host route. This means, in particular, we don't
* delete default route.
*/
- if ((rt->rt_flags & RTF_HOST) == 0)
- return(0);
+ if ((rt->rt_flags & RTF_HOST) == 0) {
+ RT_UNLOCK(rt);
+ return 0;
+ }
- return(rtrequest_locked(RTM_DELETE, rt_key(rt),
- rt->rt_gateway, rt_mask(rt), rt->rt_flags, 0));
-#undef SIN6
+ /*
+ * Safe to drop rt_lock and use rt_key, rt_gateway, since holding
+ * rnh_lock here prevents another thread from calling rt_setgate()
+ * on this route.
+ */
+ RT_UNLOCK(rt);
+ return rtrequest_locked(RTM_DELETE, rt_key(rt), rt->rt_gateway,
+ rt_mask(rt), rt->rt_flags, 0);
}
int
int ifindex)
{
int error = 0;
+ ifnet_t def_ifp = NULL;
+
+ LCK_MTX_ASSERT(nd6_mutex, LCK_MTX_ASSERT_NOTOWNED);
- if (ifindex < 0 || if_index < ifindex)
- return(EINVAL);
+ ifnet_head_lock_shared();
+ if (ifindex < 0 || if_index < ifindex) {
+ ifnet_head_done();
+ return EINVAL;
+ }
+ def_ifp = ifindex2ifnet[ifindex];
+ ifnet_head_done();
lck_mtx_lock(nd6_mutex);
if (nd6_defifindex != ifindex) {
+ struct ifnet *odef_ifp = nd6_defifp;
+
nd6_defifindex = ifindex;
- if (nd6_defifindex > 0)
- nd6_defifp = ifindex2ifnet[nd6_defifindex];
- else
+ if (nd6_defifindex > 0) {
+ nd6_defifp = def_ifp;
+ } else {
nd6_defifp = NULL;
+ }
+
+ if (nd6_defifp != NULL) {
+ nd6log(info, "%s: is now the default "
+ "interface (was %s)\n", if_name(nd6_defifp),
+ odef_ifp != NULL ? if_name(odef_ifp) : "NONE");
+ } else {
+ nd6log(info, "No default interface set\n");
+ }
/*
* If the Default Router List is empty, install a route
* we do this here to avoid re-install the default route
* if the list is NOT empty.
*/
- if (TAILQ_FIRST(&nd_defrouter) == NULL)
- defrouter_select();
+ if (odef_ifp != NULL) {
+ defrouter_select(odef_ifp, NULL);
+ }
+
+ if (nd6_defifp != NULL) {
+ defrouter_select(nd6_defifp, NULL);
+ nd6_prefix_sync(nd6_defifp);
+ }
/*
- * Our current implementation assumes one-to-one maping between
+ * XXX For now we managed RTI routes as un-scoped.
+ * Therefore we ignore the change in nd6_defifindex
+ * for RTI routes for now.
+ */
+ /*
+ * Our current implementation assumes one-to-one mapping between
* interfaces and links, so it would be natural to use the
* default interface as the default link.
*/
scope6_setdefault(nd6_defifp);
}
-
lck_mtx_unlock(nd6_mutex);
- return(error);
+ return error;
}