-/* $FreeBSD: src/sys/netinet6/nd6_rtr.c,v 1.11 2002/04/19 04:46:23 suz Exp $ */
-/* $KAME: nd6_rtr.c,v 1.111 2001/04/27 01:37:15 jinmei Exp $ */
+/*
+ * Copyright (c) 2003-2016 Apple Inc. All rights reserved.
+ *
+ * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
+ *
+ * This file contains Original Code and/or Modifications of Original Code
+ * as defined in and that are subject to the Apple Public Source License
+ * Version 2.0 (the 'License'). You may not use this file except in
+ * compliance with the License. The rights granted to you under the License
+ * may not be used to create, or enable the creation or redistribution of,
+ * unlawful or unlicensed copies of an Apple operating system, or to
+ * circumvent, violate, or enable the circumvention or violation of, any
+ * terms of an Apple operating system software license agreement.
+ *
+ * Please obtain a copy of the License at
+ * http://www.opensource.apple.com/apsl/ and read it before using this file.
+ *
+ * The Original Code and all software distributed under the License are
+ * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
+ * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
+ * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
+ * Please see the License for the specific language governing rights and
+ * limitations under the License.
+ *
+ * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
+ */
/*
* Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
#include <sys/errno.h>
#include <sys/syslog.h>
#include <sys/queue.h>
-#include <kern/lock.h>
+#include <sys/mcache.h>
+#include <sys/protosw.h>
+
+#include <dev/random/randomdev.h>
+
+#include <kern/locks.h>
+#include <kern/zalloc.h>
+#include <machine/machine_routines.h>
#include <net/if.h>
+#include <net/if_var.h>
#include <net/if_types.h>
#include <net/if_dl.h>
#include <net/route.h>
#include <net/net_osdep.h>
-#define SDL(s) ((struct sockaddr_dl *)s)
-
+static void defrouter_addreq(struct nd_defrouter *, boolean_t);
+static void defrouter_delreq(struct nd_defrouter *);
+static struct nd_defrouter *defrtrlist_update_common(struct nd_defrouter *,
+ boolean_t);
static struct nd_defrouter *defrtrlist_update(struct nd_defrouter *);
-static struct in6_ifaddr *in6_ifadd(struct nd_prefix *,
- struct in6_addr *);
+
+static struct in6_ifaddr *in6_pfx_newpersistaddr(struct nd_prefix *, int,
+ int *);
+
static struct nd_pfxrouter *pfxrtr_lookup(struct nd_prefix *,
struct nd_defrouter *);
static void pfxrtr_add(struct nd_prefix *, struct nd_defrouter *);
-static void pfxrtr_del(struct nd_pfxrouter *);
+static void pfxrtr_del(struct nd_pfxrouter *, struct nd_prefix *);
static struct nd_pfxrouter *find_pfxlist_reachable_router(struct nd_prefix *);
-static void defrouter_addifreq(struct ifnet *);
static void nd6_rtmsg(int, struct rtentry *);
-static void in6_init_address_ltimes(struct nd_prefix *ndpr,
- struct in6_addrlifetime *lt6);
+static int nd6_prefix_onlink_common(struct nd_prefix *, boolean_t,
+ unsigned int);
+static struct nd_prefix *nd6_prefix_equal_lookup(struct nd_prefix *, boolean_t);
+static void nd6_prefix_sync(struct ifnet *);
+
+static void in6_init_address_ltimes(struct nd_prefix *,
+ struct in6_addrlifetime *);
static int rt6_deleteroute(struct radix_node *, void *);
+static struct nd_defrouter *nddr_alloc(int);
+static void nddr_free(struct nd_defrouter *);
+static void nddr_trace(struct nd_defrouter *, int);
+
+static struct nd_prefix *ndpr_alloc(int);
+static void ndpr_free(struct nd_prefix *);
+static void ndpr_trace(struct nd_prefix *, int);
+
extern int nd6_recalc_reachtm_interval;
-static struct ifnet *nd6_defifp;
-int nd6_defifindex;
+static struct ifnet *nd6_defifp = NULL;
+int nd6_defifindex = 0;
+static unsigned int nd6_defrouter_genid;
+
+int ip6_use_tempaddr = 1; /* use temp addr by default for testing now */
-int ip6_use_tempaddr = 0;
+int nd6_accept_6to4 = 1;
int ip6_desync_factor;
u_int32_t ip6_temp_preferred_lifetime = DEF_TEMP_PREFERRED_LIFETIME;
u_int32_t ip6_temp_valid_lifetime = DEF_TEMP_VALID_LIFETIME;
/*
* shorter lifetimes for debugging purposes.
-int ip6_temp_preferred_lifetime = 800;
-static int ip6_temp_valid_lifetime = 1800;
-*/
+ * u_int32_t ip6_temp_preferred_lifetime = 800;
+ * static u_int32_t ip6_temp_valid_lifetime = 1800;
+ */
int ip6_temp_regen_advance = TEMPADDR_REGEN_ADVANCE;
-extern lck_mtx_t *rt_mtx;
extern lck_mtx_t *nd6_mutex;
+/* Serialization variables for single thread access to nd_prefix */
+static boolean_t nd_prefix_busy;
+static void *nd_prefix_waitchan = &nd_prefix_busy;
+static int nd_prefix_waiters = 0;
+
+/* Serialization variables for single thread access to nd_defrouter */
+static boolean_t nd_defrouter_busy;
+static void *nd_defrouter_waitchan = &nd_defrouter_busy;
+static int nd_defrouter_waiters = 0;
+
+/* RTPREF_MEDIUM has to be 0! */
+#define RTPREF_HIGH 1
+#define RTPREF_MEDIUM 0
+#define RTPREF_LOW (-1)
+#define RTPREF_RESERVED (-2)
+#define RTPREF_INVALID (-3) /* internal */
+
+#define NDPR_TRACE_HIST_SIZE 32 /* size of trace history */
+
+/* For gdb */
+__private_extern__ unsigned int ndpr_trace_hist_size = NDPR_TRACE_HIST_SIZE;
+
+struct nd_prefix_dbg {
+ struct nd_prefix ndpr_pr; /* nd_prefix */
+ u_int16_t ndpr_refhold_cnt; /* # of ref */
+ u_int16_t ndpr_refrele_cnt; /* # of rele */
+ /*
+ * Circular lists of ndpr_addref and ndpr_remref callers.
+ */
+ ctrace_t ndpr_refhold[NDPR_TRACE_HIST_SIZE];
+ ctrace_t ndpr_refrele[NDPR_TRACE_HIST_SIZE];
+};
+
+static unsigned int ndpr_debug; /* debug flags */
+static unsigned int ndpr_size; /* size of zone element */
+static struct zone *ndpr_zone; /* zone for nd_prefix */
+
+#define NDPR_ZONE_MAX 64 /* maximum elements in zone */
+#define NDPR_ZONE_NAME "nd6_prefix" /* zone name */
+
+#define NDDR_TRACE_HIST_SIZE 32 /* size of trace history */
+
+/* For gdb */
+__private_extern__ unsigned int nddr_trace_hist_size = NDDR_TRACE_HIST_SIZE;
+
+struct nd_defrouter_dbg {
+ struct nd_defrouter nddr_dr; /* nd_defrouter */
+ uint16_t nddr_refhold_cnt; /* # of ref */
+ uint16_t nddr_refrele_cnt; /* # of rele */
+ /*
+ * Circular lists of ndpr_addref and ndpr_remref callers.
+ */
+ ctrace_t nddr_refhold[NDDR_TRACE_HIST_SIZE];
+ ctrace_t nddr_refrele[NDDR_TRACE_HIST_SIZE];
+};
+
+static unsigned int nddr_debug; /* debug flags */
+static unsigned int nddr_size; /* size of zone element */
+static struct zone *nddr_zone; /* zone for nd_defrouter */
+
+#define NDDR_ZONE_MAX 64 /* maximum elements in zone */
+#define NDDR_ZONE_NAME "nd6_defrouter" /* zone name */
+
+static unsigned int ndprtr_size; /* size of zone element */
+static struct zone *ndprtr_zone; /* zone for nd_pfxrouter */
+
+#define NDPRTR_ZONE_MAX 64 /* maximum elements in zone */
+#define NDPRTR_ZONE_NAME "nd6_pfxrouter" /* zone name */
+
+void
+nd6_rtr_init(void)
+{
+ PE_parse_boot_argn("ifa_debug", &ndpr_debug, sizeof (ndpr_debug));
+ PE_parse_boot_argn("ifa_debug", &nddr_debug, sizeof (nddr_debug));
+
+ ndpr_size = (ndpr_debug == 0) ? sizeof (struct nd_prefix) :
+ sizeof (struct nd_prefix_dbg);
+ ndpr_zone = zinit(ndpr_size, NDPR_ZONE_MAX * ndpr_size, 0,
+ NDPR_ZONE_NAME);
+ if (ndpr_zone == NULL) {
+ panic("%s: failed allocating %s", __func__, NDPR_ZONE_NAME);
+ /* NOTREACHED */
+ }
+ zone_change(ndpr_zone, Z_EXPAND, TRUE);
+ zone_change(ndpr_zone, Z_CALLERACCT, FALSE);
+
+ nddr_size = (nddr_debug == 0) ? sizeof (struct nd_defrouter) :
+ sizeof (struct nd_defrouter_dbg);
+ nddr_zone = zinit(nddr_size, NDDR_ZONE_MAX * nddr_size, 0,
+ NDDR_ZONE_NAME);
+ if (nddr_zone == NULL) {
+ panic("%s: failed allocating %s", __func__, NDDR_ZONE_NAME);
+ /* NOTREACHED */
+ }
+ zone_change(nddr_zone, Z_EXPAND, TRUE);
+ zone_change(nddr_zone, Z_CALLERACCT, FALSE);
+
+ ndprtr_size = sizeof (struct nd_pfxrouter);
+ ndprtr_zone = zinit(ndprtr_size, NDPRTR_ZONE_MAX * ndprtr_size, 0,
+ NDPRTR_ZONE_NAME);
+ if (ndprtr_zone == NULL) {
+ panic("%s: failed allocating %s", __func__, NDPRTR_ZONE_NAME);
+ /* NOTREACHED */
+ }
+ zone_change(ndprtr_zone, Z_EXPAND, TRUE);
+ zone_change(ndprtr_zone, Z_CALLERACCT, FALSE);
+}
+
/*
* Receive Router Solicitation Message - just for routers.
* Router solicitation/advertisement is mostly managed by userland program
struct ip6_hdr *ip6 = mtod(m, struct ip6_hdr *);
struct nd_router_solicit *nd_rs;
struct in6_addr saddr6 = ip6->ip6_src;
-#if 0
- struct in6_addr daddr6 = ip6->ip6_dst;
-#endif
char *lladdr = NULL;
int lladdrlen = 0;
-#if 0
- struct sockaddr_dl *sdl = (struct sockaddr_dl *)NULL;
- struct llinfo_nd6 *ln = (struct llinfo_nd6 *)NULL;
- struct rtentry *rt = NULL;
- int is_newentry;
-#endif
union nd_opts ndopts;
+ /* Expect 32-bit aligned data pointer on strict-align platforms */
+ MBUF_STRICT_DATA_ALIGNMENT_CHECK_32(m);
+
/* If I'm not a router, ignore it. */
- if (ip6_accept_rtadv != 0 || (ifp->if_eflags & IFEF_ACCEPT_RTADVD) || ip6_forwarding != 1)
+ if (!ip6_forwarding || !(ifp->if_eflags & IFEF_IPV6_ROUTER))
goto freeit;
/* Sanity checks */
}
/*
- * Don't update the neighbor cache, if src = ::.
- * This indicates that the src has no IP address assigned yet.
+ * Don't update the neighbor cache, if src = :: or a non-neighbor.
+ * The former case indicates that the src has no IP address assigned
+ * yet. See nd6_ns_input() for the latter case.
*/
- if (IN6_IS_ADDR_UNSPECIFIED(&saddr6))
+ if (IN6_IS_ADDR_UNSPECIFIED(&ip6->ip6_src)) {
goto freeit;
+ } else {
+ struct sockaddr_in6 src_sa6;
+
+ bzero(&src_sa6, sizeof (src_sa6));
+ src_sa6.sin6_family = AF_INET6;
+ src_sa6.sin6_len = sizeof (src_sa6);
+ src_sa6.sin6_addr = ip6->ip6_src;
+ if (!nd6_is_addr_neighbor(&src_sa6, ifp, 0)) {
+ nd6log((LOG_INFO, "nd6_rs_input: "
+ "RS packet from non-neighbor\n"));
+ goto freeit;
+ }
+ }
-#ifndef PULLDOWN_TEST
IP6_EXTHDR_CHECK(m, off, icmp6len, return);
nd_rs = (struct nd_router_solicit *)((caddr_t)ip6 + off);
-#else
- IP6_EXTHDR_GET(nd_rs, struct nd_router_solicit *, m, off, icmp6len);
- if (nd_rs == NULL) {
- icmp6stat.icp6s_tooshort++;
- return;
- }
-#endif
-
- icmp6len -= sizeof(*nd_rs);
+ icmp6len -= sizeof (*nd_rs);
nd6_option_init(nd_rs + 1, icmp6len, &ndopts);
if (nd6_options(&ndopts) < 0) {
nd6log((LOG_INFO,
nd6_cache_lladdr(ifp, &saddr6, lladdr, lladdrlen, ND_ROUTER_SOLICIT, 0);
- freeit:
+freeit:
m_freem(m);
return;
- bad:
+bad:
icmp6stat.icp6s_badrs++;
m_freem(m);
}
void
nd6_ra_input(
struct mbuf *m,
- int off,
+ int off,
int icmp6len)
{
struct ifnet *ifp = m->m_pkthdr.rcvif;
- struct nd_ifinfo *ndi = &nd_ifinfo[ifp->if_index];
+ struct nd_ifinfo *ndi = NULL;
struct ip6_hdr *ip6 = mtod(m, struct ip6_hdr *);
struct nd_router_advert *nd_ra;
struct in6_addr saddr6 = ip6->ip6_src;
-#if 0
- struct in6_addr daddr6 = ip6->ip6_dst;
- int flags; /* = nd_ra->nd_ra_flags_reserved; */
- int is_managed = ((flags & ND_RA_FLAG_MANAGED) != 0);
- int is_other = ((flags & ND_RA_FLAG_OTHER) != 0);
-#endif
+ int mcast = 0;
union nd_opts ndopts;
- struct nd_defrouter *dr;
- struct timeval timenow;
+ struct nd_defrouter *dr = NULL;
+ u_int32_t mtu = 0;
+ char *lladdr = NULL;
+ u_int32_t lladdrlen = 0;
+ struct nd_prefix_list *nd_prefix_list_head = NULL;
+ u_int32_t nd_prefix_list_length = 0;
+ struct in6_ifaddr *ia6 = NULL;
+ struct nd_prefix_list *prfl;
+ struct nd_defrouter dr0;
+ u_int32_t advreachable;
- getmicrotime(&timenow);
- if (ip6_accept_rtadv == 0 && ((ifp->if_eflags & IFEF_ACCEPT_RTADVD) == 0))
+ /* Expect 32-bit aligned data pointer on strict-align platforms */
+ MBUF_STRICT_DATA_ALIGNMENT_CHECK_32(m);
+
+ /*
+ * Discard RA unless IFEF_ACCEPT_RTADV is set (as host), or when
+ * IFEF_IPV6_ROUTER is set (as router) but the RA is not locally
+ * generated. For convenience, we allow locally generated (rtadvd)
+ * RAs to be processed on the advertising interface, as a router.
+ *
+ * Note that we don't test against ip6_forwarding as we could be
+ * both a host and a router on different interfaces, hence the
+ * check against the per-interface flags.
+ */
+ if (!(ifp->if_eflags & (IFEF_ACCEPT_RTADV | IFEF_IPV6_ROUTER)) ||
+ ((ifp->if_eflags & IFEF_IPV6_ROUTER) &&
+ (ia6 = ifa_foraddr6(&saddr6)) == NULL))
goto freeit;
+ if (ia6 != NULL) {
+ IFA_REMREF(&ia6->ia_ifa);
+ ia6 = NULL;
+ }
+
if (ip6->ip6_hlim != 255) {
nd6log((LOG_ERR,
"nd6_ra_input: invalid hlim (%d) from %s to %s on %s\n",
goto bad;
}
-#ifndef PULLDOWN_TEST
IP6_EXTHDR_CHECK(m, off, icmp6len, return);
nd_ra = (struct nd_router_advert *)((caddr_t)ip6 + off);
-#else
- IP6_EXTHDR_GET(nd_ra, struct nd_router_advert *, m, off, icmp6len);
- if (nd_ra == NULL) {
- icmp6stat.icp6s_tooshort++;
- return;
- }
-#endif
- icmp6len -= sizeof(*nd_ra);
+ icmp6len -= sizeof (*nd_ra);
nd6_option_init(nd_ra + 1, icmp6len, &ndopts);
if (nd6_options(&ndopts) < 0) {
nd6log((LOG_INFO,
goto freeit;
}
- {
- struct nd_defrouter dr0;
- u_int32_t advreachable = nd_ra->nd_ra_reachable;
+ advreachable = nd_ra->nd_ra_reachable;
+ /* remember if this is a multicasted advertisement */
+ if (IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst))
+ mcast = 1;
+
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+ bzero(&dr0, sizeof (dr0));
dr0.rtaddr = saddr6;
dr0.flags = nd_ra->nd_ra_flags_reserved;
dr0.rtlifetime = ntohs(nd_ra->nd_ra_router_lifetime);
- dr0.expire = timenow.tv_sec + dr0.rtlifetime;
+ dr0.expire = net_uptime() + dr0.rtlifetime;
dr0.ifp = ifp;
- dr0.advint = 0; /* Mobile IPv6 */
- dr0.advint_expire = 0; /* Mobile IPv6 */
- dr0.advints_lost = 0; /* Mobile IPv6 */
/* unspecified or not? (RFC 2461 6.3.4) */
if (advreachable) {
advreachable = ntohl(advreachable);
}
if (nd_ra->nd_ra_retransmit)
ndi->retrans = ntohl(nd_ra->nd_ra_retransmit);
- if (nd_ra->nd_ra_curhoplimit)
- ndi->chlim = nd_ra->nd_ra_curhoplimit;
+ if (nd_ra->nd_ra_curhoplimit) {
+ if (ndi->chlim < nd_ra->nd_ra_curhoplimit) {
+ ndi->chlim = nd_ra->nd_ra_curhoplimit;
+ } else if (ndi->chlim != nd_ra->nd_ra_curhoplimit) {
+ nd6log((LOG_ERR,
+ "RA with a lower CurHopLimit sent from "
+ "%s on %s (current = %d, received = %d). "
+ "Ignored.\n", ip6_sprintf(&ip6->ip6_src),
+ if_name(ifp), ndi->chlim,
+ nd_ra->nd_ra_curhoplimit));
+ }
+ }
+ lck_mtx_unlock(&ndi->lock);
+ lck_mtx_lock(nd6_mutex);
dr = defrtrlist_update(&dr0);
- }
+ lck_mtx_unlock(nd6_mutex);
/*
* prefix
struct nd_prefix pr;
for (pt = (struct nd_opt_hdr *)ndopts.nd_opts_pi;
- pt <= (struct nd_opt_hdr *)ndopts.nd_opts_pi_end;
- pt = (struct nd_opt_hdr *)((caddr_t)pt +
- (pt->nd_opt_len << 3))) {
+ pt <= (struct nd_opt_hdr *)ndopts.nd_opts_pi_end;
+ pt = (struct nd_opt_hdr *)((caddr_t)pt +
+ (pt->nd_opt_len << 3))) {
+ struct in6_addr pi_mask;
+ bzero(&pi_mask, sizeof(pi_mask));
+
if (pt->nd_opt_type != ND_OPT_PREFIX_INFORMATION)
continue;
pi = (struct nd_opt_prefix_info *)pt;
continue;
}
- if (IN6_IS_ADDR_MULTICAST(&pi->nd_opt_pi_prefix)
- || IN6_IS_ADDR_LINKLOCAL(&pi->nd_opt_pi_prefix)) {
- nd6log((LOG_INFO,
- "nd6_ra_input: invalid prefix "
- "%s, ignored\n",
- ip6_sprintf(&pi->nd_opt_pi_prefix)));
- continue;
- }
-
- /* aggregatable unicast address, rfc2374 */
- if ((pi->nd_opt_pi_prefix.s6_addr8[0] & 0xe0) == 0x20
- && pi->nd_opt_pi_prefix_len != 64) {
+ /*
+ * To ignore ::/64 make sure bits beyond prefixlen
+ * are set to zero
+ */
+ in6_prefixlen2mask(&pi_mask, pi->nd_opt_pi_prefix_len);
+ pi->nd_opt_pi_prefix.s6_addr32[0] &= pi_mask.s6_addr32[0];
+ pi->nd_opt_pi_prefix.s6_addr32[1] &= pi_mask.s6_addr32[1];
+ pi->nd_opt_pi_prefix.s6_addr32[2] &= pi_mask.s6_addr32[2];
+ pi->nd_opt_pi_prefix.s6_addr32[3] &= pi_mask.s6_addr32[3];
+
+ if (IN6_IS_ADDR_UNSPECIFIED(&pi->nd_opt_pi_prefix) ||
+ IN6_IS_ADDR_MULTICAST(&pi->nd_opt_pi_prefix) ||
+ IN6_IS_ADDR_LINKLOCAL(&pi->nd_opt_pi_prefix)) {
nd6log((LOG_INFO,
- "nd6_ra_input: invalid prefixlen "
- "%d for rfc2374 prefix %s, ignored\n",
- pi->nd_opt_pi_prefix_len,
+ "%s: invalid prefix %s, ignored\n",
+ __func__,
ip6_sprintf(&pi->nd_opt_pi_prefix)));
continue;
}
- bzero(&pr, sizeof(pr));
+ bzero(&pr, sizeof (pr));
+ lck_mtx_init(&pr.ndpr_lock, ifa_mtx_grp, ifa_mtx_attr);
+ NDPR_LOCK(&pr);
pr.ndpr_prefix.sin6_family = AF_INET6;
- pr.ndpr_prefix.sin6_len = sizeof(pr.ndpr_prefix);
+ pr.ndpr_prefix.sin6_len = sizeof (pr.ndpr_prefix);
pr.ndpr_prefix.sin6_addr = pi->nd_opt_pi_prefix;
pr.ndpr_ifp = m->m_pkthdr.rcvif;
pr.ndpr_raf_onlink = (pi->nd_opt_pi_flags_reserved &
- ND_OPT_PI_FLAG_ONLINK) ? 1 : 0;
+ ND_OPT_PI_FLAG_ONLINK) ? 1 : 0;
pr.ndpr_raf_auto = (pi->nd_opt_pi_flags_reserved &
- ND_OPT_PI_FLAG_AUTO) ? 1 : 0;
+ ND_OPT_PI_FLAG_AUTO) ? 1 : 0;
pr.ndpr_plen = pi->nd_opt_pi_prefix_len;
pr.ndpr_vltime = ntohl(pi->nd_opt_pi_valid_time);
pr.ndpr_pltime =
ntohl(pi->nd_opt_pi_preferred_time);
- if (in6_init_prefix_ltimes(&pr))
+ /*
+ * Exceptions to stateless autoconfiguration processing:
+ * + nd6_accept_6to4 == 0 && address has 6to4 prefix
+ * + ip6_only_allow_rfc4193_prefix != 0 &&
+ * address not RFC 4193
+ */
+ if (ip6_only_allow_rfc4193_prefix &&
+ !IN6_IS_ADDR_UNIQUE_LOCAL(&pi->nd_opt_pi_prefix)) {
+ nd6log((LOG_INFO,
+ "nd6_ra_input: no SLAAC on prefix %s "
+ "[not RFC 4193]\n",
+ ip6_sprintf(&pi->nd_opt_pi_prefix)));
+ pr.ndpr_raf_auto = 0;
+ } else if (!nd6_accept_6to4 &&
+ IN6_IS_ADDR_6TO4(&pi->nd_opt_pi_prefix)) {
+ nd6log((LOG_INFO,
+ "%s: no SLAAC on prefix %s "
+ "[6to4]\n", __func__,
+ ip6_sprintf(&pi->nd_opt_pi_prefix)));
+ pr.ndpr_raf_auto = 0;
+ }
+
+ if (in6_init_prefix_ltimes(&pr)) {
+ NDPR_UNLOCK(&pr);
+ lck_mtx_destroy(&pr.ndpr_lock, ifa_mtx_grp);
continue; /* prefix lifetime init failed */
+ } else {
+ NDPR_UNLOCK(&pr);
+ }
+ (void) prelist_update(&pr, dr, m, mcast);
+ lck_mtx_destroy(&pr.ndpr_lock, ifa_mtx_grp);
+
+ /*
+ * We have to copy the values out after the
+ * prelist_update call since some of these values won't
+ * be properly set until after the router advertisement
+ * updating can vet the values.
+ */
+ prfl = NULL;
+ MALLOC(prfl, struct nd_prefix_list *, sizeof (*prfl),
+ M_TEMP, M_WAITOK | M_ZERO);
+
+ if (prfl == NULL) {
+ log(LOG_DEBUG, "%s: unable to MALLOC RA prefix "
+ "structure\n", __func__);
+ continue;
+ }
- (void)prelist_update(&pr, dr, m);
+ /* this is only for nd6_post_msg(), otherwise unused */
+ bcopy(&pr.ndpr_prefix, &prfl->pr.ndpr_prefix,
+ sizeof (prfl->pr.ndpr_prefix));
+ prfl->pr.ndpr_raf = pr.ndpr_raf;
+ prfl->pr.ndpr_plen = pr.ndpr_plen;
+ prfl->pr.ndpr_vltime = pr.ndpr_vltime;
+ prfl->pr.ndpr_pltime = pr.ndpr_pltime;
+ prfl->pr.ndpr_expire = pr.ndpr_expire;
+ prfl->pr.ndpr_base_calendartime =
+ pr.ndpr_base_calendartime;
+ prfl->pr.ndpr_base_uptime = pr.ndpr_base_uptime;
+ prfl->pr.ndpr_stateflags = pr.ndpr_stateflags;
+ prfl->pr.ndpr_addrcnt = pr.ndpr_addrcnt;
+ prfl->pr.ndpr_ifp = pr.ndpr_ifp;
+
+ prfl->next = nd_prefix_list_head;
+ nd_prefix_list_head = prfl;
+ nd_prefix_list_length++;
}
}
* MTU
*/
if (ndopts.nd_opts_mtu && ndopts.nd_opts_mtu->nd_opt_mtu_len == 1) {
- u_int32_t mtu = ntohl(ndopts.nd_opts_mtu->nd_opt_mtu_mtu);
+ mtu = ntohl(ndopts.nd_opts_mtu->nd_opt_mtu_mtu);
/* lower bound */
if (mtu < IPV6_MMTU) {
goto skip;
}
+ lck_mtx_lock(&ndi->lock);
/* upper bound */
if (ndi->maxmtu) {
if (mtu <= ndi->maxmtu) {
int change = (ndi->linkmtu != mtu);
ndi->linkmtu = mtu;
+ lck_mtx_unlock(&ndi->lock);
if (change) /* in6_maxmtu may change */
in6_setmaxmtu();
} else {
"exceeds maxmtu %d, ignoring\n",
mtu, ip6_sprintf(&ip6->ip6_src),
ndi->maxmtu));
+ lck_mtx_unlock(&ndi->lock);
}
} else {
+ lck_mtx_unlock(&ndi->lock);
nd6log((LOG_INFO, "nd6_ra_input: mtu option "
"mtu=%d sent from %s; maxmtu unknown, "
"ignoring\n",
}
}
- skip:
-
+skip:
+
/*
* Source link layer address
*/
- {
- char *lladdr = NULL;
- int lladdrlen = 0;
-
if (ndopts.nd_opts_src_lladdr) {
lladdr = (char *)(ndopts.nd_opts_src_lladdr + 1);
lladdrlen = ndopts.nd_opts_src_lladdr->nd_opt_len << 3;
goto bad;
}
- nd6_cache_lladdr(ifp, &saddr6, lladdr, lladdrlen, ND_ROUTER_ADVERT, 0);
+ if (dr && dr->stateflags & NDDRF_MAPPED)
+ saddr6 = dr->rtaddr_mapped;
+
+ nd6_cache_lladdr(ifp, &saddr6, lladdr, (int)lladdrlen,
+ ND_ROUTER_ADVERT, 0);
+
+ /* Post message */
+ nd6_post_msg(KEV_ND6_RA, nd_prefix_list_head, nd_prefix_list_length,
+ mtu, lladdr, lladdrlen);
/*
* Installing a link-layer address might change the state of the
* router's neighbor cache, which might also affect our on-link
* detection of adveritsed prefixes.
*/
- pfxlist_onlink_check(0);
- }
+ lck_mtx_lock(nd6_mutex);
+ pfxlist_onlink_check();
+ lck_mtx_unlock(nd6_mutex);
- freeit:
+freeit:
m_freem(m);
+ if (dr)
+ NDDR_REMREF(dr);
+
+ prfl = NULL;
+ while ((prfl = nd_prefix_list_head) != NULL) {
+ nd_prefix_list_head = prfl->next;
+ FREE(prfl, M_TEMP);
+ }
+
return;
- bad:
+bad:
icmp6stat.icp6s_badra++;
- m_freem(m);
+ goto freeit;
}
/*
/* tell the change to user processes watching the routing socket. */
static void
-nd6_rtmsg(cmd, rt)
- int cmd;
- struct rtentry *rt;
+nd6_rtmsg(int cmd, struct rtentry *rt)
{
struct rt_addrinfo info;
+ struct ifnet *ifp = rt->rt_ifp;
- lck_mtx_assert(rt_mtx, LCK_MTX_ASSERT_OWNED);
+ RT_LOCK_ASSERT_HELD(rt);
- bzero((caddr_t)&info, sizeof(info));
+ bzero((caddr_t)&info, sizeof (info));
+ /* It's not necessary to lock ifp for if_lladdr */
info.rti_info[RTAX_DST] = rt_key(rt);
info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
info.rti_info[RTAX_NETMASK] = rt_mask(rt);
- info.rti_info[RTAX_IFP] =
- TAILQ_FIRST(&rt->rt_ifp->if_addrlist)->ifa_addr;
+ /*
+ * ifa_addr pointers for both should always be valid
+ * in this context; no need to hold locks.
+ */
+ info.rti_info[RTAX_IFP] = ifp->if_lladdr->ifa_addr;
info.rti_info[RTAX_IFA] = rt->rt_ifa->ifa_addr;
rt_missmsg(cmd, &info, rt->rt_flags, 0);
}
-void
-defrouter_addreq(
- struct nd_defrouter *new)
+static void
+defrouter_addreq(struct nd_defrouter *new, boolean_t scoped)
{
struct sockaddr_in6 def, mask, gate;
struct rtentry *newrt = NULL;
+ unsigned int ifscope;
+ int err;
+ struct nd_ifinfo *ndi = ND_IFINFO(new->ifp);
- Bzero(&def, sizeof(def));
- Bzero(&mask, sizeof(mask));
- Bzero(&gate, sizeof(gate));
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_NOTOWNED);
+ NDDR_LOCK_ASSERT_NOTHELD(new);
+ /*
+ * We're free to lock and unlock NDDR because our callers
+ * are holding an extra reference for us.
+ */
- def.sin6_len = mask.sin6_len = gate.sin6_len
- = sizeof(struct sockaddr_in6);
- def.sin6_family = mask.sin6_family = gate.sin6_family = AF_INET6;
- gate.sin6_addr = new->rtaddr;
+ NDDR_LOCK(new);
+ if (new->stateflags & NDDRF_INSTALLED)
+ goto out;
- lck_mtx_lock(rt_mtx);
- (void)rtrequest_locked(RTM_ADD, (struct sockaddr *)&def,
- (struct sockaddr *)&gate, (struct sockaddr *)&mask,
- RTF_GATEWAY, &newrt);
- if (newrt) {
- nd6_rtmsg(RTM_ADD, newrt); /* tell user process */
- rtunref(newrt);
+ if (new->ifp->if_eflags & IFEF_IPV6_ROUTER) {
+ nd6log2((LOG_INFO, "%s: ignoring router %s, scoped=%d, "
+ "static=%d on advertising interface\n", if_name(new->ifp),
+ ip6_sprintf(&new->rtaddr), scoped,
+ (new->stateflags & NDDRF_STATIC) ? 1 : 0));
+ goto out;
}
- lck_mtx_unlock(rt_mtx);
- return;
-}
-/* Add a route to a given interface as default */
-void
-defrouter_addifreq(
- struct ifnet *ifp)
-{
- struct sockaddr_in6 def, mask;
- struct ifaddr *ifa = NULL;
- struct rtentry *newrt = NULL;
- int error;
- u_long flags;
+ nd6log2((LOG_INFO, "%s: adding default router %s, scoped=%d, "
+ "static=%d\n", if_name(new->ifp), ip6_sprintf(&new->rtaddr),
+ scoped, (new->stateflags & NDDRF_STATIC) ? 1 : 0));
+
+ Bzero(&def, sizeof (def));
+ Bzero(&mask, sizeof (mask));
+ Bzero(&gate, sizeof (gate));
- bzero(&def, sizeof(def));
- bzero(&mask, sizeof(mask));
+ def.sin6_len = mask.sin6_len = gate.sin6_len
+ = sizeof (struct sockaddr_in6);
+ def.sin6_family = mask.sin6_family = gate.sin6_family = AF_INET6;
+
+ if (new->stateflags & NDDRF_MAPPED)
+ gate.sin6_addr = new->rtaddr_mapped;
+ else
+ gate.sin6_addr = new->rtaddr;
- def.sin6_len = mask.sin6_len = sizeof(struct sockaddr_in6);
- def.sin6_family = mask.sin6_family = AF_INET6;
+ ifscope = scoped ? new->ifp->if_index : IFSCOPE_NONE;
+ NDDR_UNLOCK(new);
/*
- * Search for an ifaddr beloging to the specified interface.
- * XXX: An IPv6 address are required to be assigned on the interface.
+ * Cellular networks may have buggy deployments
+ * with gateway IPv6 link local address with same
+ * interface identifier as the one that has been
+ * assigned for the cellular context.
+ * If gateway is same as locally configured link local
+ * interface on cellular interface, generated a different one
+ * and store it in the nd_defrouter entry and use it to work
+ * on routing table
*/
- if ((ifa = ifaof_ifpforaddr((struct sockaddr *)&def, ifp)) == NULL) {
- nd6log((LOG_ERR, /* better error? */
- "defrouter_addifreq: failed to find an ifaddr "
- "to install a route to interface %s\n",
- if_name(ifp)));
- return;
+ if (new->ifp->if_type == IFT_CELLULAR &&
+ !(new->stateflags & NDDRF_STATIC) &&
+ !(new->stateflags & NDDRF_MAPPED) &&
+ IN6_IS_ADDR_LINKLOCAL(&gate.sin6_addr) &&
+ ndi && !(ndi->flags & ND6_IFF_PERFORMNUD)) {
+ struct in6_ifaddr *tmp_ia6 = in6ifa_ifpforlinklocal(new->ifp, 0);
+
+ if (tmp_ia6 != NULL &&
+ !(tmp_ia6->ia6_flags & IN6_IFF_NOTMANUAL) &&
+ IN6_ARE_ADDR_EQUAL(&tmp_ia6->ia_addr.sin6_addr,
+ &gate.sin6_addr)) {
+ gate.sin6_addr.s6_addr8[15] += 1;
+ new->rtaddr_mapped = gate.sin6_addr;
+ new->stateflags |= NDDRF_MAPPED;
+
+ nd6log((LOG_INFO, "%s: Default router %s mapped "
+ "to ", if_name(new->ifp), ip6_sprintf(&new->rtaddr)));
+ nd6log((LOG_INFO, "%s\n", ip6_sprintf(&new->rtaddr_mapped)));
+ }
}
- lck_mtx_lock(rt_mtx);
- flags = ifa->ifa_flags;
- error = rtrequest_locked(RTM_ADD, (struct sockaddr *)&def, ifa->ifa_addr,
- (struct sockaddr *)&mask, flags, &newrt);
- if (error != 0) {
- nd6log((LOG_ERR,
- "defrouter_addifreq: failed to install a route to "
- "interface %s (errno = %d)\n",
- if_name(ifp), error));
+ err = rtrequest_scoped(RTM_ADD, (struct sockaddr *)&def,
+ (struct sockaddr *)&gate, (struct sockaddr *)&mask,
+ RTF_GATEWAY, &newrt, ifscope);
- if (newrt) /* maybe unnecessary, but do it for safety */
- rtunref(newrt);
+ if (newrt) {
+ RT_LOCK(newrt);
+ nd6_rtmsg(RTM_ADD, newrt); /* tell user process */
+ RT_REMREF_LOCKED(newrt);
+ RT_UNLOCK(newrt);
+ NDDR_LOCK(new);
+ new->stateflags |= NDDRF_INSTALLED;
+ if (ifscope != IFSCOPE_NONE)
+ new->stateflags |= NDDRF_IFSCOPE;
} else {
- if (newrt) {
- nd6_rtmsg(RTM_ADD, newrt);
- rtunref(newrt);
- }
- in6_post_msg(ifp, KEV_INET6_DEFROUTER, (struct in6_ifaddr *)ifa);
+ nd6log((LOG_ERR, "%s: failed to add default router "
+ "%s on %s scoped %d (errno = %d)\n", __func__,
+ ip6_sprintf(&gate.sin6_addr), if_name(new->ifp),
+ (ifscope != IFSCOPE_NONE), err));
+ NDDR_LOCK(new);
}
- lck_mtx_unlock(rt_mtx);
- ifafree(ifa);
+ new->err = err;
+
+out:
+ NDDR_UNLOCK(new);
}
struct nd_defrouter *
{
struct nd_defrouter *dr;
-
lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
for (dr = TAILQ_FIRST(&nd_defrouter); dr;
- dr = TAILQ_NEXT(dr, dr_entry)) {
- if (dr->ifp == ifp && IN6_ARE_ADDR_EQUAL(addr, &dr->rtaddr))
- return(dr);
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ NDDR_LOCK(dr);
+ if (dr->ifp == ifp && IN6_ARE_ADDR_EQUAL(addr, &dr->rtaddr)) {
+ NDDR_ADDREF_LOCKED(dr);
+ NDDR_UNLOCK(dr);
+ return (dr);
+ }
+ NDDR_UNLOCK(dr);
}
- return(NULL); /* search failed */
+ return (NULL); /* search failed */
}
-void
-defrouter_delreq(
- struct nd_defrouter *dr,
- int dofree)
+/*
+ * Remove the default route for a given router.
+ * This is just a subroutine function for defrouter_select(), and should
+ * not be called from anywhere else.
+ */
+static void
+defrouter_delreq(struct nd_defrouter *dr)
{
struct sockaddr_in6 def, mask, gate;
struct rtentry *oldrt = NULL;
+ unsigned int ifscope;
+ int err;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_NOTOWNED);
+ NDDR_LOCK_ASSERT_NOTHELD(dr);
+ /*
+ * We're free to lock and unlock NDDR because our callers
+ * are holding an extra reference for us.
+ */
+ NDDR_LOCK(dr);
+ /* ifp would be NULL for the "drany" case */
+ if (dr->ifp != NULL && !(dr->stateflags & NDDRF_INSTALLED))
+ goto out;
+
+ nd6log2((LOG_INFO, "%s: removing default router %s, scoped=%d, "
+ "static=%d\n", dr->ifp != NULL ? if_name(dr->ifp) : "ANY",
+ ip6_sprintf(&dr->rtaddr), (dr->stateflags & NDDRF_IFSCOPE) ? 1 : 0,
+ (dr->stateflags & NDDRF_STATIC) ? 1 : 0));
- Bzero(&def, sizeof(def));
- Bzero(&mask, sizeof(mask));
- Bzero(&gate, sizeof(gate));
+ Bzero(&def, sizeof (def));
+ Bzero(&mask, sizeof (mask));
+ Bzero(&gate, sizeof (gate));
def.sin6_len = mask.sin6_len = gate.sin6_len
- = sizeof(struct sockaddr_in6);
+ = sizeof (struct sockaddr_in6);
def.sin6_family = mask.sin6_family = gate.sin6_family = AF_INET6;
- gate.sin6_addr = dr->rtaddr;
- lck_mtx_lock(rt_mtx);
- rtrequest_locked(RTM_DELETE, (struct sockaddr *)&def,
- (struct sockaddr *)&gate,
- (struct sockaddr *)&mask,
- RTF_GATEWAY, &oldrt);
+ /*
+ * The router entry may be mapped to a different address.
+ * If that is the case, use the mapped address as gateway
+ * to do operation on the routing table.
+ * To get more context, read the related comment in
+ * defrouter_addreq
+ */
+ if (dr->stateflags & NDDRF_MAPPED)
+ gate.sin6_addr = dr->rtaddr_mapped;
+ else
+ gate.sin6_addr = dr->rtaddr;
+
+ if (dr->ifp != NULL) {
+ ifscope = (dr->stateflags & NDDRF_IFSCOPE) ?
+ dr->ifp->if_index : IFSCOPE_NONE;
+ } else {
+ ifscope = IFSCOPE_NONE;
+ }
+ NDDR_UNLOCK(dr);
+
+ err = rtrequest_scoped(RTM_DELETE,
+ (struct sockaddr *)&def, (struct sockaddr *)&gate,
+ (struct sockaddr *)&mask, RTF_GATEWAY, &oldrt, ifscope);
+
if (oldrt) {
+ RT_LOCK(oldrt);
nd6_rtmsg(RTM_DELETE, oldrt);
- if (oldrt->rt_refcnt <= 0) {
- /*
- * XXX: borrowed from the RTM_DELETE case of
- * rtrequest().
- */
- rtref(oldrt);
- rtfree_locked(oldrt);
+ RT_UNLOCK(oldrt);
+ rtfree(oldrt);
+ } else if (err != ESRCH) {
+ nd6log((LOG_ERR, "%s: failed to delete default router "
+ "%s on %s scoped %d (errno = %d)\n", __func__,
+ ip6_sprintf(&gate.sin6_addr), dr->ifp != NULL ?
+ if_name(dr->ifp) : "ANY", (ifscope != IFSCOPE_NONE), err));
+ }
+ NDDR_LOCK(dr);
+ /* ESRCH means it's no longer in the routing table; ignore it */
+ if (oldrt != NULL || err == ESRCH) {
+ dr->stateflags &= ~NDDRF_INSTALLED;
+ if (ifscope != IFSCOPE_NONE)
+ dr->stateflags &= ~NDDRF_IFSCOPE;
+ }
+ dr->err = 0;
+out:
+ NDDR_UNLOCK(dr);
+}
+
+
+/*
+ * remove all default routes from default router list
+ */
+void
+defrouter_reset(void)
+{
+ struct nd_defrouter *dr, drany;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ dr = TAILQ_FIRST(&nd_defrouter);
+ while (dr) {
+ NDDR_LOCK(dr);
+ if (dr->stateflags & NDDRF_INSTALLED) {
+ NDDR_ADDREF_LOCKED(dr);
+ NDDR_UNLOCK(dr);
+ lck_mtx_unlock(nd6_mutex);
+ defrouter_delreq(dr);
+ lck_mtx_lock(nd6_mutex);
+ NDDR_REMREF(dr);
+ dr = TAILQ_FIRST(&nd_defrouter);
+ } else {
+ NDDR_UNLOCK(dr);
+ dr = TAILQ_NEXT(dr, dr_entry);
+ }
+ }
+
+ /* Nuke primary (non-scoped) default router */
+ bzero(&drany, sizeof (drany));
+ lck_mtx_init(&drany.nddr_lock, ifa_mtx_grp, ifa_mtx_attr);
+ lck_mtx_unlock(nd6_mutex);
+ defrouter_delreq(&drany);
+ lck_mtx_destroy(&drany.nddr_lock, ifa_mtx_grp);
+ lck_mtx_lock(nd6_mutex);
+}
+
+int
+defrtrlist_ioctl(u_long cmd, caddr_t data)
+{
+ struct nd_defrouter dr0;
+ unsigned int ifindex;
+ struct ifnet *dr_ifp;
+ int error = 0, add = 0;
+
+ /* XXX Handle mapped default router entries */
+ switch (cmd) {
+ case SIOCDRADD_IN6_32: /* struct in6_defrouter_32 */
+ case SIOCDRADD_IN6_64: /* struct in6_defrouter_64 */
+ ++add;
+ /* FALLTHRU */
+ case SIOCDRDEL_IN6_32: /* struct in6_defrouter_32 */
+ case SIOCDRDEL_IN6_64: /* struct in6_defrouter_64 */
+ bzero(&dr0, sizeof (dr0));
+ if (cmd == SIOCDRADD_IN6_64 || cmd == SIOCDRDEL_IN6_64) {
+ struct in6_defrouter_64 *r_64 =
+ (struct in6_defrouter_64 *)(void *)data;
+ u_int16_t i;
+
+ bcopy(&r_64->rtaddr.sin6_addr, &dr0.rtaddr,
+ sizeof (dr0.rtaddr));
+ dr0.flags = r_64->flags;
+ bcopy(&r_64->if_index, &i, sizeof (i));
+ ifindex = i;
+ } else {
+ struct in6_defrouter_32 *r_32 =
+ (struct in6_defrouter_32 *)(void *)data;
+ u_int16_t i;
+
+ bcopy(&r_32->rtaddr.sin6_addr, &dr0.rtaddr,
+ sizeof (dr0.rtaddr));
+ dr0.flags = r_32->flags;
+ bcopy(&r_32->if_index, &i, sizeof (i));
+ ifindex = i;
+ }
+ ifnet_head_lock_shared();
+ /* Don't need to check is ifindex is < 0 since it's unsigned */
+ if (if_index < ifindex ||
+ (dr_ifp = ifindex2ifnet[ifindex]) == NULL) {
+ ifnet_head_done();
+ error = EINVAL;
+ break;
+ }
+ dr0.ifp = dr_ifp;
+ ifnet_head_done();
+
+ if (IN6_IS_SCOPE_EMBED(&dr0.rtaddr)) {
+ uint16_t *scope = &dr0.rtaddr.s6_addr16[1];
+
+ if (*scope == 0) {
+ *scope = htons(dr_ifp->if_index);
+ } else if (*scope != htons(dr_ifp->if_index)) {
+ error = EINVAL;
+ break;
+ }
+ }
+
+ if (add)
+ error = defrtrlist_add_static(&dr0);
+ if (!add || error != 0) {
+ int err = defrtrlist_del_static(&dr0);
+ if (!add)
+ error = err;
}
+ break;
+
+ default:
+ error = EOPNOTSUPP; /* check for safety */
+ break;
}
- if (dofree) /* XXX: necessary? */
- FREE(dr, M_IP6NDP);
- lck_mtx_unlock(rt_mtx);
+ return (error);
}
+/*
+ * XXX Please make sure to remove dr from the
+ * global default router tailq list before this
+ * function call.
+ * Also ensure that you release the list reference
+ * only after calling this routine.
+ */
void
-defrtrlist_del(
- struct nd_defrouter *dr, int nd6locked)
+defrtrlist_del(struct nd_defrouter *dr)
{
- struct nd_defrouter *deldr = NULL;
+#if (DEVELOPMENT || DEBUG)
+ struct nd_defrouter *dr_itr = NULL;
+#endif
struct nd_prefix *pr;
+ struct ifnet *ifp = dr->ifp;
+ struct nd_ifinfo *ndi = NULL;
+ boolean_t resetmtu;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+#if (DEVELOPMENT || DEBUG)
+ /*
+ * Verify that the router is not in the global default
+ * router list.
+ * Can't use defrouter_lookup here because that just works
+ * with address and ifp pointer.
+ * We have to compare the memory here.
+ * Also we can't use ASSERT here as that is not defined
+ * for development builds.
+ */
+ TAILQ_FOREACH(dr_itr, &nd_defrouter, dr_entry)
+ VERIFY(dr != dr_itr);
+#endif
+ ++nd6_defrouter_genid;
/*
* Flush all the routing table entries that use the router
* as a next hop.
*/
- if (!ip6_forwarding && (ip6_accept_rtadv || (dr->ifp->if_eflags & IFEF_ACCEPT_RTADVD))) {
- /* above is a good condition? */
- rt6_flush(&dr->rtaddr, dr->ifp);
- }
-
- if (nd6locked == 0)
- lck_mtx_lock(nd6_mutex);
- if (dr == TAILQ_FIRST(&nd_defrouter))
- deldr = dr; /* The router is primary. */
+ /* above is a good condition? */
+ NDDR_ADDREF(dr);
+ lck_mtx_unlock(nd6_mutex);
+ if (dr->stateflags & NDDRF_MAPPED)
+ rt6_flush(&dr->rtaddr_mapped, ifp);
+ else
+ rt6_flush(&dr->rtaddr, ifp);
- TAILQ_REMOVE(&nd_defrouter, dr, dr_entry);
+ lck_mtx_lock(nd6_mutex);
+ NDDR_REMREF(dr);
+ nd6log2((LOG_INFO, "%s: freeing defrouter %s\n", if_name(dr->ifp),
+ ip6_sprintf(&dr->rtaddr)));
+ /*
+ * Delete it from the routing table.
+ */
+ NDDR_ADDREF(dr);
+ lck_mtx_unlock(nd6_mutex);
+ defrouter_delreq(dr);
+ lck_mtx_lock(nd6_mutex);
+ NDDR_REMREF(dr);
/*
* Also delete all the pointers to the router in each prefix lists.
*/
for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
struct nd_pfxrouter *pfxrtr;
+
+ NDPR_LOCK(pr);
if ((pfxrtr = pfxrtr_lookup(pr, dr)) != NULL)
- pfxrtr_del(pfxrtr);
+ pfxrtr_del(pfxrtr, pr);
+ NDPR_UNLOCK(pr);
+ }
+
+ pfxlist_onlink_check();
+
+ resetmtu = FALSE;
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+ VERIFY(ndi->ndefrouters >= 0);
+ if (ndi->ndefrouters > 0 && --ndi->ndefrouters == 0) {
+ nd6_ifreset(ifp);
+ resetmtu = TRUE;
}
- pfxlist_onlink_check(1);
+ lck_mtx_unlock(&ndi->lock);
/*
* If the router is the primary one, choose a new one.
- * Note that defrouter_select() will remove the current gateway
- * from the routing table.
+ * We always try to pick another eligible router
+ * on this interface as we do scoped routing
*/
- if (deldr)
- defrouter_select();
+ defrouter_select(ifp);
- if (nd6locked == 0)
- lck_mtx_unlock(nd6_mutex);
+ if (resetmtu)
+ nd6_setmtu(ifp);
+}
+
+int
+defrtrlist_add_static(struct nd_defrouter *new)
+{
+ struct nd_defrouter *dr;
+ int err = 0;
+
+ new->rtlifetime = -1;
+ new->stateflags |= NDDRF_STATIC;
+
+ /* we only want the preference level */
+ new->flags &= ND_RA_FLAG_RTPREF_MASK;
+
+ lck_mtx_lock(nd6_mutex);
+ dr = defrouter_lookup(&new->rtaddr, new->ifp);
+ if (dr != NULL && !(dr->stateflags & NDDRF_STATIC)) {
+ err = EINVAL;
+ } else {
+ if (dr != NULL)
+ NDDR_REMREF(dr);
+ dr = defrtrlist_update(new);
+ if (dr != NULL)
+ err = dr->err;
+ else
+ err = ENOMEM;
+ }
+ if (dr != NULL)
+ NDDR_REMREF(dr);
+ lck_mtx_unlock(nd6_mutex);
- FREE(dr, M_IP6NDP);
+ return (err);
+}
+
+int
+defrtrlist_del_static(struct nd_defrouter *new)
+{
+ struct nd_defrouter *dr;
+
+ lck_mtx_lock(nd6_mutex);
+ dr = defrouter_lookup(&new->rtaddr, new->ifp);
+ if (dr == NULL || !(dr->stateflags & NDDRF_STATIC)) {
+ if (dr != NULL)
+ NDDR_REMREF(dr);
+ dr = NULL;
+ } else {
+ TAILQ_REMOVE(&nd_defrouter, dr, dr_entry);
+ defrtrlist_del(dr);
+ NDDR_REMREF(dr); /* remove list reference */
+ NDDR_REMREF(dr);
+ }
+ lck_mtx_unlock(nd6_mutex);
+
+ return (dr != NULL ? 0 : EINVAL);
+}
+
+/*
+ * for default router selection
+ * regards router-preference field as a 2-bit signed integer
+ */
+static int
+rtpref(struct nd_defrouter *dr)
+{
+ switch (dr->flags & ND_RA_FLAG_RTPREF_MASK) {
+ case ND_RA_FLAG_RTPREF_HIGH:
+ return (RTPREF_HIGH);
+ case ND_RA_FLAG_RTPREF_MEDIUM:
+ case ND_RA_FLAG_RTPREF_RSV:
+ return (RTPREF_MEDIUM);
+ case ND_RA_FLAG_RTPREF_LOW:
+ return (RTPREF_LOW);
+ default:
+ /*
+ * This case should never happen. If it did, it would mean a
+ * serious bug of kernel internal. We thus always bark here.
+ * Or, can we even panic?
+ */
+ log(LOG_ERR, "rtpref: impossible RA flag %x\n", dr->flags);
+ return (RTPREF_INVALID);
+ }
+ /* NOTREACHED */
}
/*
- * Default Router Selection according to Section 6.3.6 of RFC 2461:
- * 1) Routers that are reachable or probably reachable should be
- * preferred.
+ * Default Router Selection according to Section 6.3.6 of RFC 2461 and RFC 4191:
+ *
+ * 1) Routers that are reachable or probably reachable should be preferred.
+ * If we have more than one (probably) reachable router, prefer ones
+ * with the highest router preference.
* 2) When no routers on the list are known to be reachable or
* probably reachable, routers SHOULD be selected in a round-robin
- * fashion.
+ * fashion, regardless of router preference values.
* 3) If the Default Router List is empty, assume that all
* destinations are on-link.
+ *
+ * When Scoped Routing is enabled, the selection logic is amended as follows:
+ *
+ * a) When a default interface is specified, the primary/non-scoped default
+ * router will be set to the reachable router on that link (if any) with
+ * the highest router preference.
+ * b) When there are more than one routers on the same link, the one with
+ * the highest router preference will be installed, either as scoped or
+ * non-scoped route entry. If they all share the same preference value,
+ * the one installed will be the static or the first encountered reachable
+ * router, i.e. static one wins over dynamic.
+ * c) When no routers on the list are known to be reachable, or probably
+ * reachable, no round-robin selection will take place when the default
+ * interface is set.
+ *
+ * We assume nd_defrouter is sorted by router preference value.
+ * Since the code below covers both with and without router preference cases,
+ * we do not need to classify the cases by ifdef.
*/
void
-defrouter_select()
+defrouter_select(struct ifnet *ifp)
{
- struct nd_defrouter *dr, anydr;
- struct rtentry *rt = NULL;
+ struct nd_defrouter *dr = NULL;
+ struct nd_defrouter *selected_dr = NULL;
+ struct nd_defrouter *installed_dr = NULL;
struct llinfo_nd6 *ln = NULL;
+ struct rtentry *rt = NULL;
+ struct nd_ifinfo *ndi = NULL;
+ unsigned int genid = 0;
+ boolean_t is_installed_reachable = FALSE;
- /*
- * Search for a (probably) reachable router from the list.
- */
lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
- for (dr = TAILQ_FIRST(&nd_defrouter); dr;
- dr = TAILQ_NEXT(dr, dr_entry)) {
- if ((rt = nd6_lookup(&dr->rtaddr, 0, dr->ifp, 0)) &&
- (ln = (struct llinfo_nd6 *)rt->rt_llinfo) &&
- ND6_IS_LLINFO_PROBREACH(ln)) {
- /* Got it, and move it to the head */
- TAILQ_REMOVE(&nd_defrouter, dr, dr_entry);
- TAILQ_INSERT_HEAD(&nd_defrouter, dr, dr_entry);
- break;
- }
+ if (ifp == NULL) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Return early. NULL interface",
+ __func__, __LINE__));
+ return;
+ }
+
+ if (ifp == lo_ifp) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Return early. "
+ "Default router select called for loopback.\n",
+ __func__, __LINE__));
+ return;
+ }
+
+ if (ifp->if_eflags & IFEF_IPV6_ROUTER) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Return early. "
+ "Default router select called for interface"
+ " %s with IFEF_IPV6_ROUTER flag set\n",
+ __func__, __LINE__, if_name(ifp)));
+ return;
+ }
+
+ /*
+ * Let's handle easy case (3) first:
+ * If default router list is empty, there's nothing to be done.
+ */
+ if (!TAILQ_FIRST(&nd_defrouter)) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Return early. "
+ "Default router is empty.\n", __func__, __LINE__));
+ return;
+ }
+
+ /*
+ * Take an early exit if number of routers in nd_ifinfo is
+ * 0 for the interface.
+ */
+ ndi = ND_IFINFO(ifp);
+ if (!ndi || !ndi->initialized) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Return early. "
+ "Interface %s's nd_ifinfo not initialized.\n",
+ __func__, __LINE__, if_name(ifp)));
+ return;
}
- if ((dr = TAILQ_FIRST(&nd_defrouter))) {
+ if (ndi->ndefrouters == 0) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Return early. "
+ "%s does not have any default routers.\n",
+ __func__, __LINE__, if_name(ifp)));
+ return;
+ }
+
+ /*
+ * Due to the number of times we drop nd6_mutex, we need to
+ * serialize this function.
+ */
+ while (nd_defrouter_busy) {
+ nd_defrouter_waiters++;
+ msleep(nd_defrouter_waitchan, nd6_mutex, (PZERO-1),
+ __func__, NULL);
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ }
+ nd_defrouter_busy = TRUE;
+
+ /*
+ * Search for a (probably) reachable router from the list.
+ * We just pick up the first reachable one (if any), assuming that
+ * the ordering rule of the list described in defrtrlist_update().
+ *
+ * For all intents and purposes of Scoped Routing:
+ * selected_dr = candidate for primary router
+ * installed_dr = currently installed primary router
+ */
+ genid = nd6_defrouter_genid;
+ dr = TAILQ_FIRST(&nd_defrouter);
+
+ while (dr != NULL) {
+ struct in6_addr rtaddr;
+ struct ifnet *drifp = NULL;
+ struct nd_defrouter *drrele = NULL;
+
+ NDDR_LOCK(dr);
+ drifp = dr->ifp;
+ if (drifp != ifp) {
+ NDDR_UNLOCK(dr);
+ dr = TAILQ_NEXT(dr, dr_entry);
+ continue;
+ }
+
+ /*
+ * Optimize for the common case.
+ * When the interface has only one default router
+ * there's no point checking for reachability as
+ * there's nothing else to choose from.
+ */
+ if (ndi->ndefrouters == 1) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Fast forward default router selection "
+ "as interface %s has learned only one default "
+ "router and there's nothing else to choose from.\n",
+ __func__, __LINE__, if_name(ifp)));
+ VERIFY(selected_dr == NULL && installed_dr == NULL);
+ selected_dr = dr;
+ if (dr->stateflags & NDDRF_INSTALLED)
+ installed_dr = dr;
+ NDDR_ADDREF_LOCKED(selected_dr);
+ NDDR_UNLOCK(dr);
+ goto install_route;
+ }
+
+ if (dr->stateflags & NDDRF_MAPPED)
+ rtaddr = dr->rtaddr_mapped;
+ else
+ rtaddr = dr->rtaddr;
+
+ NDDR_ADDREF_LOCKED(dr); /* for this for loop */
+ NDDR_UNLOCK(dr);
+
+ /* Callee returns a locked route upon success */
+ if (selected_dr == NULL) {
+ lck_mtx_unlock(nd6_mutex);
+ if ((rt = nd6_lookup(&rtaddr, 0, drifp, 0)) != NULL &&
+ (ln = rt->rt_llinfo) != NULL &&
+ ND6_IS_LLINFO_PROBREACH(ln)) {
+ RT_LOCK_ASSERT_HELD(rt);
+ selected_dr = dr;
+ NDDR_ADDREF(selected_dr);
+ }
+ lck_mtx_lock(nd6_mutex);
+ }
+
+ if (rt) {
+ RT_REMREF_LOCKED(rt);
+ RT_UNLOCK(rt);
+ rt = NULL;
+ }
+
+ /*
+ * Handle case (b)
+ * When there are more than one routers on the same link, the one with
+ * the highest router preference will be installed.
+ * Since the list is in decreasing order of preference:
+ * 1) If selected_dr is not NULL, only use dr if it is static and has
+ * equal preference and selected_dr is not static.
+ * 2) Else if selected_dr is NULL, and dr is static make selected_dr = dr
+ */
+ NDDR_LOCK(dr);
+ if (((selected_dr && (rtpref(dr) >= rtpref(selected_dr)) &&
+ !(selected_dr->stateflags & NDDRF_STATIC)) ||
+ (selected_dr == NULL)) &&
+ (dr->stateflags & NDDRF_STATIC)) {
+ if (selected_dr) {
+ /* Release it later on */
+ VERIFY(drrele == NULL);
+ drrele = selected_dr;
+ }
+ selected_dr = dr;
+ NDDR_ADDREF_LOCKED(selected_dr);
+ }
+
+ /* Record the currently installed router */
+ if (dr->stateflags & NDDRF_INSTALLED) {
+ if (installed_dr == NULL) {
+ installed_dr = dr;
+ NDDR_ADDREF_LOCKED(installed_dr);
+ if (dr->stateflags & NDDRF_MAPPED)
+ rtaddr = installed_dr->rtaddr_mapped;
+ else
+ rtaddr = installed_dr->rtaddr;
+ NDDR_UNLOCK(dr);
+ lck_mtx_unlock(nd6_mutex);
+ /* Callee returns a locked route upon success */
+ if ((rt = nd6_lookup(&rtaddr, 0, ifp, 0)) != NULL) {
+ RT_LOCK_ASSERT_HELD(rt);
+ if ((ln = rt->rt_llinfo) != NULL &&
+ ND6_IS_LLINFO_PROBREACH(ln))
+ is_installed_reachable = TRUE;
+
+ RT_REMREF_LOCKED(rt);
+ RT_UNLOCK(rt);
+ rt = NULL;
+ }
+ lck_mtx_lock(nd6_mutex);
+ } else {
+ /* this should not happen; warn for diagnosis */
+ nd6log((LOG_ERR, "defrouter_select: more than one "
+ "default router is installed for interface :%s.\n",
+ if_name(ifp)));
+ NDDR_UNLOCK(dr);
+ }
+ } else
+ NDDR_UNLOCK(dr);
+
+ NDDR_REMREF(dr); /* for this for loop */
+ if (drrele != NULL)
+ NDDR_REMREF(drrele);
+
/*
- * De-install the previous default gateway and install
- * a new one.
- * Note that if there is no reachable router in the list,
- * the head entry will be used anyway.
- * XXX: do we have to check the current routing table entry?
+ * Check if the list changed when we gave up
+ * the nd6_mutex lock
*/
- bzero(&anydr, sizeof(anydr));
- defrouter_delreq(&anydr, 0);
- defrouter_addreq(dr);
+ if(genid != nd6_defrouter_genid) {
+ if (selected_dr) {
+ NDDR_REMREF(selected_dr);
+ selected_dr = NULL;
+ }
+
+ if (installed_dr) {
+ NDDR_REMREF(installed_dr);
+ installed_dr = NULL;
+ }
+
+ if (ndi->ndefrouters == 0) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Interface %s no longer "
+ "has any default routers. Abort.\n",
+ __func__, __LINE__, if_name(ifp)));
+ goto out;
+ }
+ nd6log2((LOG_INFO,
+ "%s:%d: Iterate default router list again "
+ "for interface %s, as the list seems to have "
+ "changed during release-reaquire of global "
+ "nd6_mutex lock.\n",
+ __func__, __LINE__, if_name(ifp)));
+
+ is_installed_reachable = FALSE;
+ genid = nd6_defrouter_genid;
+ dr = TAILQ_FIRST(&nd_defrouter);
+ } else {
+ dr = TAILQ_NEXT(dr, dr_entry);
+ }
}
- else {
+
+ /*
+ * If none of the default routers was found to be reachable,
+ * round-robin the list regardless of preference.
+ * Please note selected_dr equal to NULL implies that even
+ * installed default router is not reachable
+ */
+ if (selected_dr == NULL) {
+ if (installed_dr) {
+ for (dr = TAILQ_NEXT(installed_dr, dr_entry); dr;
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ if (installed_dr->ifp != dr->ifp)
+ continue;
+ selected_dr = dr;
+ break;
+ }
+ }
+
/*
- * The Default Router List is empty, so install the default
- * route to an inteface.
- * XXX: The specification does not say this mechanism should
- * be restricted to hosts, but this would be not useful
- * (even harmful) for routers.
+ * If none was installed or the installed one if the last
+ * one on the list, select the first one from the list
*/
- if (!ip6_forwarding) {
+ if ((installed_dr == NULL) || (selected_dr == NULL)) {
+ for (dr = TAILQ_FIRST(&nd_defrouter); dr;
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ if (dr->ifp == ifp) {
+ selected_dr = dr;
+ break;
+ }
+ }
+ }
+
+ if ((selected_dr == NULL) && (installed_dr == NULL)) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Between release and reaquire of global "
+ "nd6_mutex lock, the list seems to have changed "
+ "and it does not have any default routers for "
+ "interface %s.\n",
+ __func__, __LINE__, if_name(ifp)));
+ goto out;
+ }
+
+ if (selected_dr != installed_dr)
+ NDDR_ADDREF(selected_dr);
+ } else if (installed_dr != NULL) {
+ if (installed_dr != selected_dr) {
/*
- * De-install the current default route
- * in advance.
+ * This means that selected default router is reachable
+ * while installed one may or may not be.
+ * Static router should always be considered as reachable
+ * for router selection process.
*/
- bzero(&anydr, sizeof(anydr));
- defrouter_delreq(&anydr, 0);
- if (nd6_defifp) {
- /*
- * Install a route to the default interface
- * as default route.
- * XXX: we enable this for host only, because
- * this may override a default route installed
- * a user process (e.g. routing daemon) in a
- * router case.
- */
- defrouter_addifreq(nd6_defifp);
- } else {
- nd6log((LOG_INFO, "defrouter_select: "
- "there's no default router and no default"
- " interface\n"));
+ if ((installed_dr->stateflags & NDDRF_STATIC) &&
+ rtpref(installed_dr) >= rtpref(selected_dr)) {
+ NDDR_REMREF(selected_dr);
+ selected_dr = installed_dr;
+ } else if (is_installed_reachable) {
+ if (rtpref(selected_dr) <= rtpref(installed_dr)) {
+ NDDR_REMREF(selected_dr);
+ selected_dr = installed_dr;
+ }
}
+ } else {
+ NDDR_REMREF(selected_dr);
}
}
- return;
+install_route:
+ /*
+ * If the selected router is different than the installed one,
+ * remove the installed router and install the selected one.
+ * Note that the selected router is never NULL here.
+ * Else check if the route entry scope has to be changed.
+ */
+ lck_mtx_unlock(nd6_mutex);
+ if (installed_dr != selected_dr) {
+ nd6log((LOG_INFO,
+ "%s:%d: Found a better router for interface "
+ "%s. Installing new default route.\n",
+ __func__, __LINE__, if_name(ifp)));
+ if (installed_dr != NULL) {
+ defrouter_delreq(installed_dr);
+ }
+ /*
+ * Install scoped route if the interface is not
+ * the default nd6 interface.
+ */
+ defrouter_addreq(selected_dr,
+ (selected_dr->ifp != nd6_defifp));
+ } else if (((installed_dr->stateflags & NDDRF_IFSCOPE) &&
+ (installed_dr->ifp == nd6_defifp)) ||
+ (!(installed_dr->stateflags & NDDRF_IFSCOPE) &&
+ (installed_dr->ifp != nd6_defifp))) {
+ nd6log((LOG_INFO,
+ "%s:%d: Need to reinstall default route for interface "
+ "%s as its scope has changed.\n",
+ __func__, __LINE__, if_name(ifp)));
+ defrouter_delreq(installed_dr);
+ defrouter_addreq(installed_dr,
+ (installed_dr->ifp != nd6_defifp));
+ } else {
+ nd6log2((LOG_INFO,
+ "%s:%d: No need to change the default "
+ "route for interface %s.\n",
+ __func__, __LINE__, if_name(ifp)));
+ }
+ lck_mtx_lock(nd6_mutex);
+out:
+ if (selected_dr && (selected_dr != installed_dr))
+ NDDR_REMREF(selected_dr);
+ if (installed_dr)
+ NDDR_REMREF(installed_dr);
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ VERIFY(nd_defrouter_busy);
+ nd_defrouter_busy = FALSE;
+ if (nd_defrouter_waiters > 0) {
+ nd_defrouter_waiters = 0;
+ wakeup(nd_defrouter_waitchan);
+ }
}
static struct nd_defrouter *
-defrtrlist_update(
- struct nd_defrouter *new)
+defrtrlist_update_common(struct nd_defrouter *new, boolean_t scoped)
{
struct nd_defrouter *dr, *n;
+ struct ifnet *ifp = new->ifp;
+ struct nd_ifinfo *ndi = NULL;
+ struct timeval caltime;
- lck_mtx_lock(nd6_mutex);
- if ((dr = defrouter_lookup(&new->rtaddr, new->ifp)) != NULL) {
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ if ((dr = defrouter_lookup(&new->rtaddr, ifp)) != NULL) {
/* entry exists */
if (new->rtlifetime == 0) {
- defrtrlist_del(dr, 1);
+ TAILQ_REMOVE(&nd_defrouter, dr, dr_entry);
+ defrtrlist_del(dr);
+ NDDR_REMREF(dr); /* remove list reference */
+ NDDR_REMREF(dr);
dr = NULL;
} else {
+ int oldpref = rtpref(dr);
+ struct nd_defrouter *p = NULL;
/* override */
dr->flags = new->flags; /* xxx flag check */
dr->rtlifetime = new->rtlifetime;
dr->expire = new->expire;
+
+ /*
+ * If the preference does not change, there's no need
+ * to sort the entries. If Scoped Routing is enabled,
+ * put the primary/non-scoped router at the top of the
+ * list of routers in the same preference band, unless
+ * it's already at that position.
+ */
+ /* same preference and scoped; just return */
+ if (rtpref(new) == oldpref && scoped)
+ return (dr);
+
+ n = TAILQ_FIRST(&nd_defrouter);
+ while (n != NULL) {
+ /* preference changed; sort it */
+ if (rtpref(new) != oldpref)
+ break;
+
+ /* not at the top of band; sort it */
+ if (n != dr && rtpref(n) == oldpref &&
+ (!p || rtpref(p) > rtpref(n)))
+ break;
+
+ p = n;
+ n = TAILQ_NEXT(n, dr_entry);
+ }
+
+ /* nothing has changed, just return */
+ if (n == NULL && (scoped ||
+ !(dr->stateflags & NDDRF_IFSCOPE)))
+ return (dr);
+
+ /*
+ * preferred router may be changed, so relocate
+ * this router.
+ * XXX: calling TAILQ_REMOVE directly is a bad manner.
+ * However, since defrtrlist_del() has many side
+ * effects, we intentionally do so here.
+ * defrouter_select() below will handle routing
+ * changes later.
+ */
+ TAILQ_REMOVE(&nd_defrouter, dr, dr_entry);
+ new->stateflags = dr->stateflags;
+
+ n = dr;
+ goto insert;
}
- lck_mtx_unlock(nd6_mutex);
- return(dr);
+ return (dr);
}
+ VERIFY(dr == NULL);
+
/* entry does not exist */
if (new->rtlifetime == 0) {
- lck_mtx_unlock(nd6_mutex);
- return(NULL);
+ return (NULL);
}
- n = (struct nd_defrouter *)_MALLOC(sizeof(*n), M_IP6NDP, M_NOWAIT);
+ n = nddr_alloc(M_WAITOK);
if (n == NULL) {
- lck_mtx_unlock(nd6_mutex);
- return(NULL);
- }
- bzero(n, sizeof(*n));
- *n = *new;
+ return (NULL);
+ }
+
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+ if (ip6_maxifdefrouters >= 0 &&
+ ndi->ndefrouters >= ip6_maxifdefrouters) {
+ lck_mtx_unlock(&ndi->lock);
+ nddr_free(n);
+ return (NULL);
+ }
+
+ NDDR_ADDREF(n); /* for the nd_defrouter list */
+ NDDR_ADDREF(n); /* for the caller */
+
+ ++nd6_defrouter_genid;
+ ndi->ndefrouters++;
+ VERIFY(ndi->ndefrouters != 0);
+ lck_mtx_unlock(&ndi->lock);
+
+ nd6log2((LOG_INFO, "%s: allocating defrouter %s\n", if_name(ifp),
+ ip6_sprintf(&new->rtaddr)));
+
+ getmicrotime(&caltime);
+ NDDR_LOCK(n);
+ memcpy(&n->rtaddr, &new->rtaddr, sizeof (n->rtaddr));
+ n->flags = new->flags;
+ n->stateflags = new->stateflags;
+ n->rtlifetime = new->rtlifetime;
+ n->expire = new->expire;
+ n->base_calendartime = caltime.tv_sec;
+ n->base_uptime = net_uptime();
+ n->ifp = new->ifp;
+ n->err = new->err;
+ NDDR_UNLOCK(n);
+insert:
+ /* get nd6_service() to be scheduled as soon as it's convenient */
+ ++nd6_sched_timeout_want;
/*
- * Insert the new router at the end of the Default Router List.
- * If there is no other router, install it anyway. Otherwise,
- * just continue to use the current default router.
+ * Insert the new router in the Default Router List;
+ * The Default Router List should be in the descending order
+ * of router-preferece. When Scoped Routing is disabled, routers
+ * with the same preference are sorted in the arriving time order;
+ * otherwise, the first entry in the list of routers having the same
+ * preference is the primary default router, when the interface used
+ * by the entry is the default interface.
*/
- TAILQ_INSERT_TAIL(&nd_defrouter, n, dr_entry);
- if (TAILQ_FIRST(&nd_defrouter) == n)
- defrouter_select();
-
- lck_mtx_unlock(nd6_mutex);
- return(n);
+
+ /* insert at the end of the group */
+ for (dr = TAILQ_FIRST(&nd_defrouter); dr;
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ if (rtpref(n) > rtpref(dr) ||
+ (!scoped && rtpref(n) == rtpref(dr)))
+ break;
+ }
+ if (dr)
+ TAILQ_INSERT_BEFORE(dr, n, dr_entry);
+ else
+ TAILQ_INSERT_TAIL(&nd_defrouter, n, dr_entry);
+
+ defrouter_select(ifp);
+
+ return (n);
+}
+
+static struct nd_defrouter *
+defrtrlist_update(struct nd_defrouter *new)
+{
+ struct nd_defrouter *dr;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ dr = defrtrlist_update_common(new,
+ (nd6_defifp != NULL && new->ifp != nd6_defifp));
+
+ return (dr);
}
static struct nd_pfxrouter *
-pfxrtr_lookup(
- struct nd_prefix *pr,
- struct nd_defrouter *dr)
+pfxrtr_lookup(struct nd_prefix *pr, struct nd_defrouter *dr)
{
struct nd_pfxrouter *search;
-
+
lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
- for (search = pr->ndpr_advrtrs.lh_first; search; search = search->pfr_next) {
+ NDPR_LOCK_ASSERT_HELD(pr);
+
+ for (search = pr->ndpr_advrtrs.lh_first; search;
+ search = search->pfr_next) {
if (search->router == dr)
break;
}
- return(search);
+ return (search);
}
static void
-pfxrtr_add(
- struct nd_prefix *pr,
- struct nd_defrouter *dr)
+pfxrtr_add(struct nd_prefix *pr, struct nd_defrouter *dr)
{
struct nd_pfxrouter *new;
lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_NOTHELD(pr);
- new = (struct nd_pfxrouter *)_MALLOC(sizeof(*new), M_IP6NDP, M_NOWAIT);
+ new = zalloc(ndprtr_zone);
if (new == NULL)
return;
- bzero(new, sizeof(*new));
+ bzero(new, sizeof (*new));
new->router = dr;
+ NDPR_LOCK(pr);
LIST_INSERT_HEAD(&pr->ndpr_advrtrs, new, pfr_entry);
+ pr->ndpr_genid++;
+ NDPR_UNLOCK(pr);
- pfxlist_onlink_check(1);
+ pfxlist_onlink_check();
}
static void
-pfxrtr_del(
- struct nd_pfxrouter *pfr)
+pfxrtr_del(struct nd_pfxrouter *pfr, struct nd_prefix *pr)
{
lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_HELD(pr);
+ pr->ndpr_genid++;
LIST_REMOVE(pfr, pfr_entry);
- FREE(pfr, M_IP6NDP);
+ zfree(ndprtr_zone, pfr);
}
+/*
+ * The routine has been modified to atomically refresh expiry
+ * time for nd6 prefix as the part of lookup.
+ * There's a corner case where a system going
+ * in sleep gets rid of manual addresses configured in the system
+ * and then schedules the prefix for deletion.
+ * However before the prefix gets deleted, if system comes out
+ * from sleep and configures same address before prefix deletion
+ * , the later prefix deletion will remove the prefix route and
+ * the system will not be able to communicate with other IPv6
+ * neighbor nodes in the same subnet.
+ */
struct nd_prefix *
-nd6_prefix_lookup(
- struct nd_prefix *pr)
+nd6_prefix_lookup(struct nd_prefix *pr, int nd6_prefix_expiry)
{
struct nd_prefix *search;
lck_mtx_lock(nd6_mutex);
for (search = nd_prefix.lh_first; search; search = search->ndpr_next) {
+ NDPR_LOCK(search);
if (pr->ndpr_ifp == search->ndpr_ifp &&
pr->ndpr_plen == search->ndpr_plen &&
in6_are_prefix_equal(&pr->ndpr_prefix.sin6_addr,
- &search->ndpr_prefix.sin6_addr,
- pr->ndpr_plen)
- ) {
+ &search->ndpr_prefix.sin6_addr, pr->ndpr_plen)) {
+ if (nd6_prefix_expiry != ND6_PREFIX_EXPIRY_UNSPEC) {
+ search->ndpr_expire = nd6_prefix_expiry;
+ }
+ NDPR_ADDREF_LOCKED(search);
+ NDPR_UNLOCK(search);
break;
}
+ NDPR_UNLOCK(search);
}
lck_mtx_unlock(nd6_mutex);
- return(search);
+ return (search);
}
int
-nd6_prelist_add(
- struct nd_prefix *pr,
- struct nd_defrouter *dr,
- struct nd_prefix **newp)
+nd6_prelist_add(struct nd_prefix *pr, struct nd_defrouter *dr,
+ struct nd_prefix **newp, boolean_t force_scoped)
{
struct nd_prefix *new = NULL;
- int i;
+ struct ifnet *ifp = pr->ndpr_ifp;
+ struct nd_ifinfo *ndi = NULL;
+ int i, error;
+
+ if (ip6_maxifprefixes >= 0) {
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+ if (ndi->nprefixes >= ip6_maxifprefixes) {
+ lck_mtx_unlock(&ndi->lock);
+ return (ENOMEM);
+ }
+ lck_mtx_unlock(&ndi->lock);
+ }
- new = (struct nd_prefix *)_MALLOC(sizeof(*new), M_IP6NDP, M_NOWAIT);
+ new = ndpr_alloc(M_WAITOK);
if (new == NULL)
- return ENOMEM;
- bzero(new, sizeof(*new));
- *new = *pr;
- if (newp != NULL)
+ return (ENOMEM);
+
+ NDPR_LOCK(new);
+ NDPR_LOCK(pr);
+ new->ndpr_ifp = pr->ndpr_ifp;
+ new->ndpr_prefix = pr->ndpr_prefix;
+ new->ndpr_plen = pr->ndpr_plen;
+ new->ndpr_vltime = pr->ndpr_vltime;
+ new->ndpr_pltime = pr->ndpr_pltime;
+ new->ndpr_flags = pr->ndpr_flags;
+ if (pr->ndpr_stateflags & NDPRF_STATIC)
+ new->ndpr_stateflags |= NDPRF_STATIC;
+ NDPR_UNLOCK(pr);
+ if ((error = in6_init_prefix_ltimes(new)) != 0) {
+ NDPR_UNLOCK(new);
+ ndpr_free(new);
+ return (error);
+ }
+ new->ndpr_lastupdate = net_uptime();
+ if (newp != NULL) {
*newp = new;
-
- /* initilization */
+ NDPR_ADDREF_LOCKED(new); /* for caller */
+ }
+ /* initialization */
LIST_INIT(&new->ndpr_advrtrs);
in6_prefixlen2mask(&new->ndpr_mask, new->ndpr_plen);
/* make prefix in the canonical form */
new->ndpr_prefix.sin6_addr.s6_addr32[i] &=
new->ndpr_mask.s6_addr32[i];
- /* link ndpr_entry to nd_prefix list */
+ NDPR_UNLOCK(new);
+
+ /* get nd6_service() to be scheduled as soon as it's convenient */
+ ++nd6_sched_timeout_want;
+
lck_mtx_lock(nd6_mutex);
+ /* link ndpr_entry to nd_prefix list */
LIST_INSERT_HEAD(&nd_prefix, new, ndpr_entry);
+ new->ndpr_debug |= IFD_ATTACHED;
+ NDPR_ADDREF(new); /* for nd_prefix list */
+
+ lck_mtx_lock(&ndi->lock);
+ ndi->nprefixes++;
+ VERIFY(ndi->nprefixes != 0);
+ lck_mtx_unlock(&ndi->lock);
/* ND_OPT_PI_FLAG_ONLINK processing */
if (new->ndpr_raf_onlink) {
int e;
- if ((e = nd6_prefix_onlink(new, 0, 1)) != 0) {
+ if ((e = nd6_prefix_onlink_common(new, force_scoped,
+ new->ndpr_ifp->if_index)) != 0) {
nd6log((LOG_ERR, "nd6_prelist_add: failed to make "
- "the prefix %s/%d on-link on %s (errno=%d)\n",
- ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
- pr->ndpr_plen, if_name(pr->ndpr_ifp), e));
+ "the prefix %s/%d on-link %s on %s (errno=%d)\n",
+ ip6_sprintf(&new->ndpr_prefix.sin6_addr),
+ new->ndpr_plen, force_scoped ? "scoped" :
+ "non-scoped", if_name(ifp), e));
/* proceed anyway. XXX: is it correct? */
}
}
if (dr) {
pfxrtr_add(new, dr);
}
+
lck_mtx_unlock(nd6_mutex);
- return 0;
+ return (0);
}
+/*
+ * Caller must have held an extra reference on nd_prefix.
+ */
void
-prelist_remove(
- struct nd_prefix *pr, int nd6locked)
+prelist_remove(struct nd_prefix *pr)
{
struct nd_pfxrouter *pfr, *next;
+ struct ifnet *ifp = pr->ndpr_ifp;
int e;
+ struct nd_ifinfo *ndi = NULL;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_HELD(pr);
+
+ if (pr->ndpr_stateflags & NDPRF_DEFUNCT)
+ return;
+
+ /*
+ * If there are no more addresses, defunct the prefix. This is needed
+ * because we don't want multiple threads calling prelist_remove() for
+ * the same prefix and this might happen because we unlock nd6_mutex
+ * down below.
+ */
+ if (pr->ndpr_addrcnt == 0)
+ pr->ndpr_stateflags |= NDPRF_DEFUNCT;
/* make sure to invalidate the prefix until it is really freed. */
pr->ndpr_vltime = 0;
pr->ndpr_pltime = 0;
-#if 0
+
/*
* Though these flags are now meaningless, we'd rather keep the value
- * not to confuse users when executing "ndp -p".
+ * of pr->ndpr_raf_onlink and pr->ndpr_raf_auto not to confuse users
+ * when executing "ndp -p".
*/
- pr->ndpr_raf_onlink = 0;
- pr->ndpr_raf_auto = 0;
-#endif
- if ((pr->ndpr_stateflags & NDPRF_ONLINK) != 0 &&
- (e = nd6_prefix_offlink(pr)) != 0) {
- nd6log((LOG_ERR, "prelist_remove: failed to make %s/%d offlink "
- "on %s, errno=%d\n",
- ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
- pr->ndpr_plen, if_name(pr->ndpr_ifp), e));
- /* what should we do? */
+ if (pr->ndpr_stateflags & NDPRF_ONLINK) {
+ NDPR_ADDREF_LOCKED(pr);
+ NDPR_UNLOCK(pr);
+ lck_mtx_unlock(nd6_mutex);
+ if ((e = nd6_prefix_offlink(pr)) != 0) {
+ nd6log((LOG_ERR, "prelist_remove: failed to make "
+ "%s/%d offlink on %s, errno=%d\n",
+ ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(ifp), e));
+ /* what should we do? */
+ }
+ lck_mtx_lock(nd6_mutex);
+ NDPR_LOCK(pr);
+ if (NDPR_REMREF_LOCKED(pr) == NULL)
+ return;
}
- if (pr->ndpr_refcnt > 0)
- return; /* notice here? */
+ if (pr->ndpr_addrcnt > 0) {
+ /*
+ * The state might have changed if we called
+ * nd6_prefix_offlink().
+ */
+ pr->ndpr_stateflags &= ~NDPRF_DEFUNCT;
+ return; /* notice here? */
+ }
- if (nd6locked == 0)
- lck_mtx_lock(nd6_mutex);
/* unlink ndpr_entry from nd_prefix list */
LIST_REMOVE(pr, ndpr_entry);
+ pr->ndpr_debug &= ~IFD_ATTACHED;
/* free list of routers that adversed the prefix */
for (pfr = pr->ndpr_advrtrs.lh_first; pfr; pfr = next) {
next = pfr->pfr_next;
-
- FREE(pfr, M_IP6NDP);
+ pfxrtr_del(pfr, pr);
}
- FREE(pr, M_IP6NDP);
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+ VERIFY(ndi->nprefixes > 0);
+ ndi->nprefixes--;
+ lck_mtx_unlock(&ndi->lock);
- pfxlist_onlink_check(1);
- if (nd6locked == 0)
- lck_mtx_unlock(nd6_mutex);
+ /* This must not be the last reference to the nd_prefix */
+ if (NDPR_REMREF_LOCKED(pr) == NULL) {
+ panic("%s: unexpected (missing) refcnt ndpr=%p", __func__, pr);
+ /* NOTREACHED */
+ }
+
+ /*
+ * Don't call pfxlist_onlink_check() here because we are
+ * holding the NDPR lock and this could cause a deadlock when
+ * there are multiple threads executing pfxlist_onlink_check().
+ */
}
int
prelist_update(
struct nd_prefix *new,
struct nd_defrouter *dr, /* may be NULL */
- struct mbuf *m)
+ struct mbuf *m,
+ int mcast)
{
struct in6_ifaddr *ia6 = NULL, *ia6_match = NULL;
struct ifaddr *ifa;
int newprefix = 0;
int auth;
struct in6_addrlifetime lt6_tmp;
- struct timeval timenow;
+ uint64_t timenow = net_uptime();
+
+ /* no need to lock "new" here, as it is local to the caller */
+ NDPR_LOCK_ASSERT_NOTHELD(new);
auth = 0;
if (m) {
* both IP header and IP datagrams, doesn't it ?
*/
#if defined(M_AUTHIPHDR) && defined(M_AUTHIPDGM)
- auth = (m->m_flags & M_AUTHIPHDR
- && m->m_flags & M_AUTHIPDGM) ? 1 : 0;
+ auth = (m->m_flags & M_AUTHIPHDR) && (m->m_flags & M_AUTHIPDGM);
#endif
}
-
- if ((pr = nd6_prefix_lookup(new)) != NULL) {
+ if ((pr = nd6_prefix_lookup(new, ND6_PREFIX_EXPIRY_UNSPEC)) != NULL) {
/*
* nd6_prefix_lookup() ensures that pr and new have the same
* prefix on a same interface.
* and the autonomous (A) bit should NOT be changed from 1
* to 0.
*/
+ lck_mtx_lock(nd6_mutex);
+ NDPR_LOCK(pr);
if (new->ndpr_raf_onlink == 1)
pr->ndpr_raf_onlink = 1;
if (new->ndpr_raf_auto == 1)
if (new->ndpr_raf_onlink) {
pr->ndpr_vltime = new->ndpr_vltime;
pr->ndpr_pltime = new->ndpr_pltime;
- pr->ndpr_preferred = new->ndpr_preferred;
- pr->ndpr_expire = new->ndpr_expire;
+ (void) in6_init_prefix_ltimes(pr); /* XXX error case? */
+ pr->ndpr_lastupdate = net_uptime();
}
+ NDPR_ADDREF_LOCKED(pr);
if (new->ndpr_raf_onlink &&
(pr->ndpr_stateflags & NDPRF_ONLINK) == 0) {
int e;
- if ((e = nd6_prefix_onlink(pr, 0, 0)) != 0) {
+ NDPR_UNLOCK(pr);
+ if ((e = nd6_prefix_onlink(pr)) != 0) {
nd6log((LOG_ERR,
"prelist_update: failed to make "
"the prefix %s/%d on-link on %s "
pr->ndpr_plen, if_name(pr->ndpr_ifp), e));
/* proceed anyway. XXX: is it correct? */
}
+ NDPR_LOCK(pr);
}
-
- lck_mtx_lock(nd6_mutex);
- if (dr && pfxrtr_lookup(pr, dr) == NULL)
+
+ if (dr && pfxrtr_lookup(pr, dr) == NULL) {
+ NDPR_UNLOCK(pr);
pfxrtr_add(pr, dr);
+ } else {
+ NDPR_UNLOCK(pr);
+ }
+ NDPR_REMREF(pr);
lck_mtx_unlock(nd6_mutex);
} else {
- struct nd_prefix *newpr = NULL;
-
newprefix = 1;
if (new->ndpr_vltime == 0)
if (new->ndpr_raf_onlink == 0 && new->ndpr_raf_auto == 0)
goto end;
- bzero(&new->ndpr_addr, sizeof(struct in6_addr));
+ bzero(&new->ndpr_addr, sizeof (struct in6_addr));
- error = nd6_prelist_add(new, dr, &newpr);
- if (error != 0 || newpr == NULL) {
+ error = nd6_prelist_add(new, dr, &pr, FALSE);
+ if (error != 0 || pr == NULL) {
nd6log((LOG_NOTICE, "prelist_update: "
"nd6_prelist_add failed for %s/%d on %s "
- "errno=%d, returnpr=%p\n",
+ "errno=%d, returnpr=0x%llx\n",
ip6_sprintf(&new->ndpr_prefix.sin6_addr),
- new->ndpr_plen, if_name(new->ndpr_ifp),
- error, newpr));
+ new->ndpr_plen, if_name(new->ndpr_ifp),
+ error, (uint64_t)VM_KERNEL_ADDRPERM(pr)));
goto end; /* we should just give up in this case. */
}
-
- /*
- * XXX: from the ND point of view, we can ignore a prefix
- * with the on-link bit being zero. However, we need a
- * prefix structure for references from autoconfigured
- * addresses. Thus, we explicitly make suret that the prefix
- * itself expires now.
- */
- if (newpr->ndpr_raf_onlink == 0) {
- newpr->ndpr_vltime = 0;
- newpr->ndpr_pltime = 0;
- in6_init_prefix_ltimes(newpr);
- }
-
- pr = newpr;
}
/*
- * Address autoconfiguration based on Section 5.5.3 of RFC 2462.
+ * Address autoconfiguration based on Section 5.5.3 of RFC 4862.
* Note that pr must be non NULL at this point.
*/
/* 5.5.3 (a). Ignore the prefix without the A bit set. */
if (!new->ndpr_raf_auto)
- goto afteraddrconf;
+ goto end;
/*
* 5.5.3 (b). the link-local prefix should have been ignored in
* nd6_ra_input.
*/
- /*
- * 5.5.3 (c). Consistency check on lifetimes: pltime <= vltime.
- * This should have been done in nd6_ra_input.
- */
+ /* 5.5.3 (c). Consistency check on lifetimes: pltime <= vltime. */
+ if (new->ndpr_pltime > new->ndpr_vltime) {
+ error = EINVAL; /* XXX: won't be used */
+ goto end;
+ }
- /*
- * 5.5.3 (d). If the prefix advertised does not match the prefix of an
- * address already in the list, and the Valid Lifetime is not 0,
- * form an address. Note that even a manually configured address
- * should reject autoconfiguration of a new address.
+ /*
+ * 5.5.3 (d). If the prefix advertised is not equal to the prefix of
+ * an address configured by stateless autoconfiguration already in the
+ * list of addresses associated with the interface, and the Valid
+ * Lifetime is not 0, form an address. We first check if we have
+ * a matching prefix.
*/
- getmicrotime(&timenow);
-
- ifnet_lock_exclusive(ifp);
- TAILQ_FOREACH(ifa, &ifp->if_addrlist, ifa_list)
- {
+ ifnet_lock_shared(ifp);
+ TAILQ_FOREACH(ifa, &ifp->if_addrlist, ifa_list) {
struct in6_ifaddr *ifa6;
- int ifa_plen;
- u_int32_t storedlifetime;
+ u_int32_t remaininglifetime;
- if (ifa->ifa_addr->sa_family != AF_INET6)
+ IFA_LOCK(ifa);
+ if (ifa->ifa_addr->sa_family != AF_INET6) {
+ IFA_UNLOCK(ifa);
continue;
-
+ }
ifa6 = (struct in6_ifaddr *)ifa;
+ /*
+ * We only consider autoconfigured addresses as per RFC 4862.
+ */
+ if (!(ifa6->ia6_flags & IN6_IFF_AUTOCONF)) {
+ IFA_UNLOCK(ifa);
+ continue;
+ }
/*
* Spec is not clear here, but I believe we should concentrate
* on unicast (i.e. not anycast) addresses.
* XXX: other ia6_flags? detached or duplicated?
*/
- if ((ifa6->ia6_flags & IN6_IFF_ANYCAST) != 0)
+ if ((ifa6->ia6_flags & IN6_IFF_ANYCAST) != 0) {
+ IFA_UNLOCK(ifa);
continue;
-
- ifa_plen = in6_mask2len(&ifa6->ia_prefixmask.sin6_addr, NULL);
- if (ifa_plen != new->ndpr_plen ||
- !in6_are_prefix_equal(&ifa6->ia_addr.sin6_addr,
- &new->ndpr_prefix.sin6_addr,
- ifa_plen))
+ }
+ /*
+ * Ignore the address if it is not associated with a prefix
+ * or is associated with a prefix that is different from this
+ * one. (pr is never NULL here)
+ */
+ if (ifa6->ia6_ndpr != pr) {
+ IFA_UNLOCK(ifa);
continue;
+ }
- if (ia6_match == NULL) /* remember the first one */
+ if (ia6_match == NULL) { /* remember the first one */
ia6_match = ifa6;
-
- if ((ifa6->ia6_flags & IN6_IFF_AUTOCONF) == 0)
- continue;
+ IFA_ADDREF_LOCKED(ifa); /* for ia6_match */
+ }
/*
* An already autoconfigured address matched. Now that we
* proceed to 5.5.3. (e): update the lifetimes according to the
* "two hours" rule and the privacy extension.
*/
-#define TWOHOUR (120*60)
- lt6_tmp = ifa6->ia6_lifetime;
+#define TWOHOUR (120*60)
+
+ /* retrieve time as uptime (last arg is 0) */
+ in6ifa_getlifetime(ifa6, <6_tmp, 0);
- storedlifetime = IFA6_IS_INVALID(ifa6) ? 0 :
- (lt6_tmp.ia6t_expire - timenow.tv_sec);
+ if (lt6_tmp.ia6t_vltime == ND6_INFINITE_LIFETIME)
+ remaininglifetime = ND6_INFINITE_LIFETIME;
+ else if (timenow - ifa6->ia6_updatetime > lt6_tmp.ia6t_vltime) {
+ /*
+ * The case of "invalid" address. We should usually
+ * not see this case.
+ */
+ remaininglifetime = 0;
+ } else {
+ remaininglifetime = lt6_tmp.ia6t_vltime -
+ (timenow - ifa6->ia6_updatetime);
+ }
+ /* when not updating, keep the current stored lifetime. */
+ lt6_tmp.ia6t_vltime = remaininglifetime;
if (TWOHOUR < new->ndpr_vltime ||
- storedlifetime < new->ndpr_vltime) {
+ remaininglifetime < new->ndpr_vltime) {
lt6_tmp.ia6t_vltime = new->ndpr_vltime;
- } else if (storedlifetime <= TWOHOUR
-#if 0
- /*
- * This condition is logically redundant, so we just
- * omit it.
- * See IPng 6712, 6717, and 6721.
- */
- && new->ndpr_vltime <= storedlifetime
-#endif
- ) {
+ } else if (remaininglifetime <= TWOHOUR) {
if (auth) {
lt6_tmp.ia6t_vltime = new->ndpr_vltime;
}
} else {
/*
* new->ndpr_vltime <= TWOHOUR &&
- * TWOHOUR < storedlifetime
+ * TWOHOUR < remaininglifetime
*/
lt6_tmp.ia6t_vltime = TWOHOUR;
}
/* The 2 hour rule is not imposed for preferred lifetime. */
lt6_tmp.ia6t_pltime = new->ndpr_pltime;
- in6_init_address_ltimes(pr, <6_tmp);
-
- /*
- * When adjusting the lifetimes of an existing temporary
- * address, only lower the lifetimes.
- * RFC 3041 3.3. (1).
- * XXX: how should we modify ia6t_[pv]ltime?
- */
+ /* Special handling for lifetimes of temporary addresses. */
if ((ifa6->ia6_flags & IN6_IFF_TEMPORARY) != 0) {
- if (lt6_tmp.ia6t_expire == 0 || /* no expire */
- lt6_tmp.ia6t_expire >
- ifa6->ia6_lifetime.ia6t_expire) {
- lt6_tmp.ia6t_expire =
- ifa6->ia6_lifetime.ia6t_expire;
- }
- if (lt6_tmp.ia6t_preferred == 0 || /* no expire */
- lt6_tmp.ia6t_preferred >
- ifa6->ia6_lifetime.ia6t_preferred) {
- lt6_tmp.ia6t_preferred =
- ifa6->ia6_lifetime.ia6t_preferred;
- }
+ u_int32_t maxvltime, maxpltime;
+
+ /* Constrain lifetimes to system limits. */
+ if (lt6_tmp.ia6t_vltime > ip6_temp_valid_lifetime)
+ lt6_tmp.ia6t_vltime = ip6_temp_valid_lifetime;
+ if (lt6_tmp.ia6t_pltime > ip6_temp_preferred_lifetime)
+ lt6_tmp.ia6t_pltime =
+ ip6_temp_preferred_lifetime -
+ ip6_desync_factor;
+
+ /*
+ * According to RFC 4941, section 3.3 (1), we only
+ * update the lifetimes when they are in the maximum
+ * intervals.
+ */
+ if (ip6_temp_valid_lifetime >
+ (u_int32_t)((timenow - ifa6->ia6_createtime) +
+ ip6_desync_factor)) {
+ maxvltime = ip6_temp_valid_lifetime -
+ (timenow - ifa6->ia6_createtime) -
+ ip6_desync_factor;
+ } else
+ maxvltime = 0;
+ if (ip6_temp_preferred_lifetime >
+ (u_int32_t)((timenow - ifa6->ia6_createtime) +
+ ip6_desync_factor)) {
+ maxpltime = ip6_temp_preferred_lifetime -
+ (timenow - ifa6->ia6_createtime) -
+ ip6_desync_factor;
+ } else
+ maxpltime = 0;
+
+ if (lt6_tmp.ia6t_vltime == ND6_INFINITE_LIFETIME ||
+ lt6_tmp.ia6t_vltime > maxvltime)
+ lt6_tmp.ia6t_vltime = maxvltime;
+
+ if (lt6_tmp.ia6t_pltime == ND6_INFINITE_LIFETIME ||
+ lt6_tmp.ia6t_pltime > maxpltime)
+ lt6_tmp.ia6t_pltime = maxpltime;
}
- ifa6->ia6_lifetime = lt6_tmp;
+ in6_init_address_ltimes(pr, <6_tmp);
+
+ in6ifa_setlifetime(ifa6, <6_tmp);
+ ifa6->ia6_updatetime = timenow;
+ IFA_UNLOCK(ifa);
}
ifnet_lock_done(ifp);
if (ia6_match == NULL && new->ndpr_vltime) {
/*
+ * 5.5.3 (d) (continued)
* No address matched and the valid lifetime is non-zero.
* Create a new address.
*/
- if ((ia6 = in6_ifadd(new, NULL)) != NULL) {
+
+ if ((ia6 = in6_pfx_newpersistaddr(new, mcast, &error))
+ != NULL) {
/*
* note that we should use pr (not new) for reference.
*/
- pr->ndpr_refcnt++;
+ IFA_LOCK(&ia6->ia_ifa);
+ NDPR_LOCK(pr);
ia6->ia6_ndpr = pr;
-
-#if 0
- /* XXXYYY Don't do this, according to Jinmei. */
- pr->ndpr_addr = new->ndpr_addr;
-#endif
+ NDPR_ADDREF_LOCKED(pr); /* for addr reference */
+ pr->ndpr_addrcnt++;
+ VERIFY(pr->ndpr_addrcnt != 0);
+ NDPR_UNLOCK(pr);
+ IFA_UNLOCK(&ia6->ia_ifa);
/*
- * RFC 3041 3.3 (2).
+ * RFC 4941 3.3 (2).
* When a new public address is created as described
- * in RFC2462, also create a new temporary address.
+ * in RFC 4862, also create a new temporary address.
*
- * RFC 3041 3.5.
+ * RFC 4941 3.5.
* When an interface connects to a new link, a new
* randomized interface identifier should be generated
* immediately together with a new set of temporary
e));
}
}
+ IFA_REMREF(&ia6->ia_ifa);
+ ia6 = NULL;
/*
* A newly added address might affect the status
* of other addresses, so we check and update it.
* XXX: what if address duplication happens?
*/
- pfxlist_onlink_check(0);
- } else {
- /* just set an error. do not bark here. */
- error = EADDRNOTAVAIL; /* XXX: might be unused. */
+ lck_mtx_lock(nd6_mutex);
+ pfxlist_onlink_check();
+ lck_mtx_unlock(nd6_mutex);
+ }
+ }
+
+end:
+ if (pr != NULL)
+ NDPR_REMREF(pr);
+ if (ia6_match != NULL)
+ IFA_REMREF(&ia6_match->ia_ifa);
+ return (error);
+}
+
+/*
+ * Neighbor Discover Default Router structure reference counting routines.
+ */
+static struct nd_defrouter *
+nddr_alloc(int how)
+{
+ struct nd_defrouter *dr;
+
+ dr = (how == M_WAITOK) ? zalloc(nddr_zone) : zalloc_noblock(nddr_zone);
+ if (dr != NULL) {
+ bzero(dr, nddr_size);
+ lck_mtx_init(&dr->nddr_lock, ifa_mtx_grp, ifa_mtx_attr);
+ dr->nddr_debug |= IFD_ALLOC;
+ if (nddr_debug != 0) {
+ dr->nddr_debug |= IFD_DEBUG;
+ dr->nddr_trace = nddr_trace;
}
}
+ return (dr);
+}
+
+static void
+nddr_free(struct nd_defrouter *dr)
+{
+ NDDR_LOCK(dr);
+ if (dr->nddr_debug & IFD_ATTACHED) {
+ panic("%s: attached nddr %p is being freed", __func__, dr);
+ /* NOTREACHED */
+ } else if (!(dr->nddr_debug & IFD_ALLOC)) {
+ panic("%s: nddr %p cannot be freed", __func__, dr);
+ /* NOTREACHED */
+ }
+ dr->nddr_debug &= ~IFD_ALLOC;
+ NDDR_UNLOCK(dr);
+
+ lck_mtx_destroy(&dr->nddr_lock, ifa_mtx_grp);
+ zfree(nddr_zone, dr);
+}
+
+static void
+nddr_trace(struct nd_defrouter *dr, int refhold)
+{
+ struct nd_defrouter_dbg *dr_dbg = (struct nd_defrouter_dbg *)dr;
+ ctrace_t *tr;
+ uint32_t idx;
+ uint16_t *cnt;
+
+ if (!(dr->nddr_debug & IFD_DEBUG)) {
+ panic("%s: nddr %p has no debug structure", __func__, dr);
+ /* NOTREACHED */
+ }
+ if (refhold) {
+ cnt = &dr_dbg->nddr_refhold_cnt;
+ tr = dr_dbg->nddr_refhold;
+ } else {
+ cnt = &dr_dbg->nddr_refrele_cnt;
+ tr = dr_dbg->nddr_refrele;
+ }
+
+ idx = atomic_add_16_ov(cnt, 1) % NDDR_TRACE_HIST_SIZE;
+ ctrace_record(&tr[idx]);
+}
+
+void
+nddr_addref(struct nd_defrouter *nddr, int locked)
+{
- afteraddrconf:
+ if (!locked)
+ NDDR_LOCK_SPIN(nddr);
+ else
+ NDDR_LOCK_ASSERT_HELD(nddr);
+
+ if (++nddr->nddr_refcount == 0) {
+ panic("%s: nddr %p wraparound refcnt\n", __func__, nddr);
+ /* NOTREACHED */
+ } else if (nddr->nddr_trace != NULL) {
+ (*nddr->nddr_trace)(nddr, TRUE);
+ }
- end:
- return error;
+ if (!locked)
+ NDDR_UNLOCK(nddr);
+}
+
+struct nd_defrouter *
+nddr_remref(struct nd_defrouter *nddr, int locked)
+{
+
+ if (!locked)
+ NDDR_LOCK_SPIN(nddr);
+ else
+ NDDR_LOCK_ASSERT_HELD(nddr);
+
+ if (nddr->nddr_refcount == 0) {
+ panic("%s: nddr %p negative refcnt\n", __func__, nddr);
+ /* NOTREACHED */
+ } else if (nddr->nddr_trace != NULL) {
+ (*nddr->nddr_trace)(nddr, FALSE);
+ }
+
+ if (--nddr->nddr_refcount == 0) {
+ NDDR_UNLOCK(nddr);
+ nddr_free(nddr);
+ nddr = NULL;
+ }
+
+ if (!locked && nddr != NULL)
+ NDDR_UNLOCK(nddr);
+
+ return (nddr);
+}
+
+uint64_t
+nddr_getexpire(struct nd_defrouter *dr)
+{
+ struct timeval caltime;
+ uint64_t expiry;
+
+ if (dr->expire != 0) {
+ /* account for system time change */
+ getmicrotime(&caltime);
+
+ dr->base_calendartime +=
+ NET_CALCULATE_CLOCKSKEW(caltime,
+ dr->base_calendartime, net_uptime(), dr->base_uptime);
+
+ expiry = dr->base_calendartime +
+ dr->expire - dr->base_uptime;
+ } else {
+ expiry = 0;
+ }
+ return (expiry);
+}
+
+/*
+ * Neighbor Discover Prefix structure reference counting routines.
+ */
+static struct nd_prefix *
+ndpr_alloc(int how)
+{
+ struct nd_prefix *pr;
+
+ pr = (how == M_WAITOK) ? zalloc(ndpr_zone) : zalloc_noblock(ndpr_zone);
+ if (pr != NULL) {
+ bzero(pr, ndpr_size);
+ lck_mtx_init(&pr->ndpr_lock, ifa_mtx_grp, ifa_mtx_attr);
+ RB_INIT(&pr->ndpr_prproxy_sols);
+ pr->ndpr_debug |= IFD_ALLOC;
+ if (ndpr_debug != 0) {
+ pr->ndpr_debug |= IFD_DEBUG;
+ pr->ndpr_trace = ndpr_trace;
+ }
+ }
+ return (pr);
+}
+
+static void
+ndpr_free(struct nd_prefix *pr)
+{
+ NDPR_LOCK(pr);
+ if (pr->ndpr_debug & IFD_ATTACHED) {
+ panic("%s: attached ndpr %p is being freed", __func__, pr);
+ /* NOTREACHED */
+ } else if (!(pr->ndpr_debug & IFD_ALLOC)) {
+ panic("%s: ndpr %p cannot be freed", __func__, pr);
+ /* NOTREACHED */
+ } else if (pr->ndpr_rt != NULL) {
+ panic("%s: ndpr %p route %p not freed", __func__, pr,
+ pr->ndpr_rt);
+ /* NOTREACHED */
+ } else if (pr->ndpr_prproxy_sols_cnt != 0) {
+ panic("%s: ndpr %p non-zero solicitors count (%d)",
+ __func__, pr, pr->ndpr_prproxy_sols_cnt);
+ /* NOTREACHED */
+ } else if (!RB_EMPTY(&pr->ndpr_prproxy_sols)) {
+ panic("%s: ndpr %p non-empty solicitors tree", __func__, pr);
+ /* NOTREACHED */
+ }
+ pr->ndpr_debug &= ~IFD_ALLOC;
+ NDPR_UNLOCK(pr);
+
+ lck_mtx_destroy(&pr->ndpr_lock, ifa_mtx_grp);
+ zfree(ndpr_zone, pr);
+}
+
+static void
+ndpr_trace(struct nd_prefix *pr, int refhold)
+{
+ struct nd_prefix_dbg *pr_dbg = (struct nd_prefix_dbg *)pr;
+ ctrace_t *tr;
+ u_int32_t idx;
+ u_int16_t *cnt;
+
+ if (!(pr->ndpr_debug & IFD_DEBUG)) {
+ panic("%s: ndpr %p has no debug structure", __func__, pr);
+ /* NOTREACHED */
+ }
+ if (refhold) {
+ cnt = &pr_dbg->ndpr_refhold_cnt;
+ tr = pr_dbg->ndpr_refhold;
+ } else {
+ cnt = &pr_dbg->ndpr_refrele_cnt;
+ tr = pr_dbg->ndpr_refrele;
+ }
+
+ idx = atomic_add_16_ov(cnt, 1) % NDPR_TRACE_HIST_SIZE;
+ ctrace_record(&tr[idx]);
+}
+
+void
+ndpr_addref(struct nd_prefix *ndpr, int locked)
+{
+ if (!locked)
+ NDPR_LOCK_SPIN(ndpr);
+ else
+ NDPR_LOCK_ASSERT_HELD(ndpr);
+
+ if (++ndpr->ndpr_refcount == 0) {
+ panic("%s: ndpr %p wraparound refcnt\n", __func__, ndpr);
+ /* NOTREACHED */
+ } else if (ndpr->ndpr_trace != NULL) {
+ (*ndpr->ndpr_trace)(ndpr, TRUE);
+ }
+
+ if (!locked)
+ NDPR_UNLOCK(ndpr);
+}
+
+struct nd_prefix *
+ndpr_remref(struct nd_prefix *ndpr, int locked)
+{
+ if (!locked)
+ NDPR_LOCK_SPIN(ndpr);
+ else
+ NDPR_LOCK_ASSERT_HELD(ndpr);
+
+ if (ndpr->ndpr_refcount == 0) {
+ panic("%s: ndpr %p negative refcnt\n", __func__, ndpr);
+ /* NOTREACHED */
+ } else if (ndpr->ndpr_trace != NULL) {
+ (*ndpr->ndpr_trace)(ndpr, FALSE);
+ }
+
+ if (--ndpr->ndpr_refcount == 0) {
+ if (ndpr->ndpr_addrcnt != 0) {
+ panic("%s: freeing ndpr %p with outstanding address "
+ "reference (%d)", __func__, ndpr,
+ ndpr->ndpr_addrcnt);
+ /* NOTREACHED */
+ }
+ NDPR_UNLOCK(ndpr);
+ ndpr_free(ndpr);
+ ndpr = NULL;
+ }
+
+ if (!locked && ndpr != NULL)
+ NDPR_UNLOCK(ndpr);
+
+ return (ndpr);
+}
+
+uint64_t
+ndpr_getexpire(struct nd_prefix *pr)
+{
+ struct timeval caltime;
+ uint64_t expiry;
+
+ if (pr->ndpr_expire != 0 && pr->ndpr_vltime != ND6_INFINITE_LIFETIME) {
+ /* account for system time change */
+ getmicrotime(&caltime);
+
+ pr->ndpr_base_calendartime +=
+ NET_CALCULATE_CLOCKSKEW(caltime,
+ pr->ndpr_base_calendartime, net_uptime(),
+ pr->ndpr_base_uptime);
+
+ expiry = pr->ndpr_base_calendartime +
+ pr->ndpr_expire - pr->ndpr_base_uptime;
+ } else {
+ expiry = 0;
+ }
+ return (expiry);
}
/*
* A supplement function used in the on-link detection below;
* detect if a given prefix has a (probably) reachable advertising router.
* XXX: lengthy function name...
+ *
+ * Callers *must* increase the reference count of nd_prefix.
*/
static struct nd_pfxrouter *
-find_pfxlist_reachable_router(
- struct nd_prefix *pr)
+find_pfxlist_reachable_router(struct nd_prefix *pr)
{
struct nd_pfxrouter *pfxrtr;
struct rtentry *rt;
struct llinfo_nd6 *ln;
+ struct ifnet *ifp;
+ struct in6_addr rtaddr;
+ unsigned int genid;
lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_HELD(pr);
+
+ genid = pr->ndpr_genid;
+ pfxrtr = LIST_FIRST(&pr->ndpr_advrtrs);
+ while (pfxrtr) {
+ ifp = pfxrtr->router->ifp;
+ if (pfxrtr->router->stateflags & NDDRF_MAPPED)
+ rtaddr = pfxrtr->router->rtaddr_mapped;
+ else
+ rtaddr = pfxrtr->router->rtaddr;
- for (pfxrtr = LIST_FIRST(&pr->ndpr_advrtrs); pfxrtr;
- pfxrtr = LIST_NEXT(pfxrtr, pfr_entry)) {
- if ((rt = nd6_lookup(&pfxrtr->router->rtaddr, 0,
- pfxrtr->router->ifp, 0)) &&
- (ln = (struct llinfo_nd6 *)rt->rt_llinfo) &&
- ND6_IS_LLINFO_PROBREACH(ln))
- break; /* found */
+ NDPR_UNLOCK(pr);
+ lck_mtx_unlock(nd6_mutex);
+ /* Callee returns a locked route upon success */
+ if ((rt = nd6_lookup(&rtaddr, 0, ifp, 0)) != NULL) {
+ RT_LOCK_ASSERT_HELD(rt);
+ if ((ln = rt->rt_llinfo) != NULL &&
+ ND6_IS_LLINFO_PROBREACH(ln)) {
+ RT_REMREF_LOCKED(rt);
+ RT_UNLOCK(rt);
+ lck_mtx_lock(nd6_mutex);
+ NDPR_LOCK(pr);
+ break; /* found */
+ }
+ RT_REMREF_LOCKED(rt);
+ RT_UNLOCK(rt);
+ }
+ lck_mtx_lock(nd6_mutex);
+ NDPR_LOCK(pr);
+ if (pr->ndpr_genid != genid) {
+ pfxrtr = LIST_FIRST(&pr->ndpr_advrtrs);
+ genid = pr->ndpr_genid;
+ } else
+ pfxrtr = LIST_NEXT(pfxrtr, pfr_entry);
}
+ NDPR_LOCK_ASSERT_HELD(pr);
- return(pfxrtr);
+ return (pfxrtr);
}
* is no router around us.
*/
void
-pfxlist_onlink_check(int nd6locked)
+pfxlist_onlink_check(void)
{
- struct nd_prefix *pr;
+ struct nd_prefix *pr, *prclear;
struct in6_ifaddr *ifa;
+ struct nd_defrouter *dr;
+ struct nd_pfxrouter *pfxrtr = NULL;
+ int err, i, found = 0;
+ struct ifaddr **ifap = NULL;
+ struct nd_prefix *ndpr;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ while (nd_prefix_busy) {
+ nd_prefix_waiters++;
+ msleep(nd_prefix_waitchan, nd6_mutex, (PZERO-1),
+ __func__, NULL);
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ }
+ nd_prefix_busy = TRUE;
/*
* Check if there is a prefix that has a reachable advertising
* router.
*/
- if (nd6locked == 0)
- lck_mtx_lock(nd6_mutex);
- lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
- for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
- if (pr->ndpr_raf_onlink && find_pfxlist_reachable_router(pr))
+ pr = nd_prefix.lh_first;
+ while (pr) {
+ NDPR_LOCK(pr);
+ if (pr->ndpr_stateflags & NDPRF_PROCESSED_ONLINK) {
+ NDPR_UNLOCK(pr);
+ pr = pr->ndpr_next;
+ continue;
+ }
+ NDPR_ADDREF_LOCKED(pr);
+ if (pr->ndpr_raf_onlink && find_pfxlist_reachable_router(pr) &&
+ (pr->ndpr_debug & IFD_ATTACHED)) {
+ if (NDPR_REMREF_LOCKED(pr) == NULL)
+ pr = NULL;
+ else
+ NDPR_UNLOCK(pr);
break;
+ }
+ pr->ndpr_stateflags |= NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(pr);
+ NDPR_REMREF(pr);
+ /*
+ * Since find_pfxlist_reachable_router() drops the nd6_mutex, we
+ * have to start over, but the NDPRF_PROCESSED_ONLINK flag will
+ * stop us from checking the same prefix twice.
+ */
+ pr = nd_prefix.lh_first;
}
-
- if (pr) {
+ LIST_FOREACH(prclear, &nd_prefix, ndpr_entry) {
+ NDPR_LOCK(prclear);
+ prclear->ndpr_stateflags &= ~NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(prclear);
+ }
+ /*
+ * If we have no such prefix, check whether we still have a router
+ * that does not advertise any prefixes.
+ */
+ if (pr == NULL) {
+ for (dr = TAILQ_FIRST(&nd_defrouter); dr;
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ struct nd_prefix *pr0;
+
+ for (pr0 = nd_prefix.lh_first; pr0;
+ pr0 = pr0->ndpr_next) {
+ NDPR_LOCK(pr0);
+ if ((pfxrtr = pfxrtr_lookup(pr0, dr)) != NULL) {
+ NDPR_UNLOCK(pr0);
+ break;
+ }
+ NDPR_UNLOCK(pr0);
+ }
+ if (pfxrtr != NULL)
+ break;
+ }
+ }
+ if (pr != NULL || (TAILQ_FIRST(&nd_defrouter) && pfxrtr == NULL)) {
/*
- * There is at least one prefix that has a reachable router.
+ * There is at least one prefix that has a reachable router,
+ * or at least a router which probably does not advertise
+ * any prefixes. The latter would be the case when we move
+ * to a new link where we have a router that does not provide
+ * prefixes and we configure an address by hand.
* Detach prefixes which have no reachable advertising
* router, and attach other prefixes.
*/
- for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
- /* XXX: a link-local prefix should never be detached */
- if (IN6_IS_ADDR_LINKLOCAL(&pr->ndpr_prefix.sin6_addr))
- continue;
-
+ pr = nd_prefix.lh_first;
+ while (pr) {
+ NDPR_LOCK(pr);
/*
- * we aren't interested in prefixes without the L bit
- * set.
+ * We aren't interested prefixes already processed,
+ * nor in prefixes without the L bit
+ * set nor in static prefixes
*/
- if (pr->ndpr_raf_onlink == 0)
+ if (pr->ndpr_raf_onlink == 0 ||
+ pr->ndpr_stateflags & NDPRF_PROCESSED_ONLINK ||
+ pr->ndpr_stateflags & NDPRF_STATIC) {
+ NDPR_UNLOCK(pr);
+ pr = pr->ndpr_next;
continue;
-
+ }
+ NDPR_ADDREF_LOCKED(pr);
if ((pr->ndpr_stateflags & NDPRF_DETACHED) == 0 &&
- find_pfxlist_reachable_router(pr) == NULL)
+ find_pfxlist_reachable_router(pr) == NULL &&
+ (pr->ndpr_debug & IFD_ATTACHED))
pr->ndpr_stateflags |= NDPRF_DETACHED;
if ((pr->ndpr_stateflags & NDPRF_DETACHED) != 0 &&
- find_pfxlist_reachable_router(pr) != 0)
+ find_pfxlist_reachable_router(pr) != NULL &&
+ (pr->ndpr_debug & IFD_ATTACHED))
pr->ndpr_stateflags &= ~NDPRF_DETACHED;
+ pr->ndpr_stateflags |= NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(pr);
+ NDPR_REMREF(pr);
+ /*
+ * Since find_pfxlist_reachable_router() drops the
+ * nd6_mutex, we have to start over, but the
+ * NDPRF_PROCESSED_ONLINK flag will stop us from
+ * checking the same prefix twice.
+ */
+ pr = nd_prefix.lh_first;
}
} else {
/* there is no prefix that has a reachable router */
for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
- if (IN6_IS_ADDR_LINKLOCAL(&pr->ndpr_prefix.sin6_addr))
- continue;
-
- if (pr->ndpr_raf_onlink == 0)
+ NDPR_LOCK(pr);
+ if (pr->ndpr_raf_onlink == 0 ||
+ pr->ndpr_stateflags & NDPRF_STATIC) {
+ NDPR_UNLOCK(pr);
continue;
-
+ }
if ((pr->ndpr_stateflags & NDPRF_DETACHED) != 0)
pr->ndpr_stateflags &= ~NDPRF_DETACHED;
+ NDPR_UNLOCK(pr);
}
}
-
+ LIST_FOREACH(prclear, &nd_prefix, ndpr_entry) {
+ NDPR_LOCK(prclear);
+ prclear->ndpr_stateflags &= ~NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(prclear);
+ }
/*
* Remove each interface route associated with a (just) detached
* prefix, and reinstall the interface route for a (just) attached
* interfaces. Such cases will be handled in nd6_prefix_onlink,
* so we don't have to care about them.
*/
- for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
+ pr = nd_prefix.lh_first;
+ while (pr) {
int e;
- if (IN6_IS_ADDR_LINKLOCAL(&pr->ndpr_prefix.sin6_addr))
+ NDPR_LOCK(pr);
+ if (pr->ndpr_raf_onlink == 0 ||
+ pr->ndpr_stateflags & NDPRF_STATIC ||
+ pr->ndpr_stateflags & NDPRF_PROCESSED_ONLINK ||
+ pr->ndpr_stateflags & NDPRF_DEFUNCT) {
+ NDPR_UNLOCK(pr);
+ pr = pr->ndpr_next;
continue;
-
- if (pr->ndpr_raf_onlink == 0)
- continue;
-
+ }
+ pr->ndpr_stateflags |= NDPRF_PROCESSED_ONLINK;
+ NDPR_ADDREF_LOCKED(pr);
if ((pr->ndpr_stateflags & NDPRF_DETACHED) != 0 &&
(pr->ndpr_stateflags & NDPRF_ONLINK) != 0) {
+ NDPR_UNLOCK(pr);
+ lck_mtx_unlock(nd6_mutex);
if ((e = nd6_prefix_offlink(pr)) != 0) {
nd6log((LOG_ERR,
"pfxlist_onlink_check: failed to "
ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
pr->ndpr_plen, e));
}
+ lck_mtx_lock(nd6_mutex);
+ NDPR_REMREF(pr);
+ pr = nd_prefix.lh_first;
+ continue;
}
if ((pr->ndpr_stateflags & NDPRF_DETACHED) == 0 &&
(pr->ndpr_stateflags & NDPRF_ONLINK) == 0 &&
pr->ndpr_raf_onlink) {
- if ((e = nd6_prefix_onlink(pr, 0, 1)) != 0) {
+ NDPR_UNLOCK(pr);
+ if ((e = nd6_prefix_onlink(pr)) != 0) {
nd6log((LOG_ERR,
"pfxlist_onlink_check: failed to "
"make %s/%d offlink, errno=%d\n",
ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
pr->ndpr_plen, e));
}
+ NDPR_REMREF(pr);
+ pr = nd_prefix.lh_first;
+ continue;
+ } else {
+ NDPR_UNLOCK(pr);
}
+ NDPR_REMREF(pr);
+ pr = pr->ndpr_next;
+ }
+ LIST_FOREACH(prclear, &nd_prefix, ndpr_entry) {
+ NDPR_LOCK(prclear);
+ prclear->ndpr_stateflags &= ~NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(prclear);
+ }
+ VERIFY(nd_prefix_busy);
+ nd_prefix_busy = FALSE;
+ if (nd_prefix_waiters > 0) {
+ nd_prefix_waiters = 0;
+ wakeup(nd_prefix_waitchan);
}
/*
* detached. Note, however, that a manually configured address should
* always be attached.
* The precise detection logic is same as the one for prefixes.
+ *
+ * ifnet_get_address_list_family_internal() may fail due to memory
+ * pressure, but we will eventually be called again when we receive
+ * another NA, RA, or when the link status changes.
*/
- for (ifa = in6_ifaddrs; ifa; ifa = ifa->ia_next) {
- if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0)
+ err = ifnet_get_address_list_family_internal(NULL, &ifap, AF_INET6, 0,
+ M_NOWAIT, 0);
+ if (err != 0 || ifap == NULL) {
+ nd6log((LOG_ERR, "%s: ifnet_get_address_list_family_internal "
+ "failed", __func__));
+ return;
+ }
+ for (i = 0; ifap[i]; i++) {
+ ifa = ifatoia6(ifap[i]);
+ IFA_LOCK(&ifa->ia_ifa);
+ if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0 ||
+ (ifap[i]->ifa_debug & IFD_ATTACHED) == 0) {
+ IFA_UNLOCK(&ifa->ia_ifa);
continue;
-
- if (ifa->ia6_ndpr == NULL) {
+ }
+ if ((ndpr = ifa->ia6_ndpr) == NULL) {
/*
* This can happen when we first configure the address
* (i.e. the address exists, but the prefix does not).
* XXX: complicated relationships...
*/
+ IFA_UNLOCK(&ifa->ia_ifa);
continue;
}
+ IFA_UNLOCK(&ifa->ia_ifa);
- if (find_pfxlist_reachable_router(ifa->ia6_ndpr))
+ NDPR_LOCK(ndpr);
+ NDPR_ADDREF_LOCKED(ndpr);
+ if (find_pfxlist_reachable_router(ndpr)) {
+ if (NDPR_REMREF_LOCKED(ndpr) == NULL) {
+ found = 0;
+ } else {
+ NDPR_UNLOCK(ndpr);
+ found = 1;
+ }
break;
- }
- if (ifa) {
- for (ifa = in6_ifaddrs; ifa; ifa = ifa->ia_next) {
- if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0)
+ }
+ NDPR_UNLOCK(ndpr);
+ NDPR_REMREF(ndpr);
+ }
+ if (found) {
+ for (i = 0; ifap[i]; i++) {
+ ifa = ifatoia6(ifap[i]);
+ IFA_LOCK(&ifa->ia_ifa);
+ if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0 ||
+ (ifap[i]->ifa_debug & IFD_ATTACHED) == 0) {
+ IFA_UNLOCK(&ifa->ia_ifa);
continue;
-
- if (ifa->ia6_ndpr == NULL) /* XXX: see above. */
+ }
+ if ((ndpr = ifa->ia6_ndpr) == NULL) {
+ /* XXX: see above. */
+ IFA_UNLOCK(&ifa->ia_ifa);
continue;
-
- if (find_pfxlist_reachable_router(ifa->ia6_ndpr))
- ifa->ia6_flags &= ~IN6_IFF_DETACHED;
- else
+ }
+ IFA_UNLOCK(&ifa->ia_ifa);
+ NDPR_LOCK(ndpr);
+ NDPR_ADDREF_LOCKED(ndpr);
+ if (find_pfxlist_reachable_router(ndpr)) {
+ NDPR_UNLOCK(ndpr);
+ IFA_LOCK(&ifa->ia_ifa);
+ if (ifa->ia6_flags & IN6_IFF_DETACHED) {
+ ifa->ia6_flags &= ~IN6_IFF_DETACHED;
+ in6_ifaddr_set_dadprogress((struct in6_ifaddr *)ifa);
+ IFA_UNLOCK(&ifa->ia_ifa);
+ nd6_dad_start((struct ifaddr *)ifa, 0);
+ } else {
+ IFA_UNLOCK(&ifa->ia_ifa);
+ }
+ } else {
+ NDPR_UNLOCK(ndpr);
+ IFA_LOCK(&ifa->ia_ifa);
ifa->ia6_flags |= IN6_IFF_DETACHED;
+ IFA_UNLOCK(&ifa->ia_ifa);
+ }
+ NDPR_REMREF(ndpr);
}
- }
- else {
- for (ifa = in6_ifaddrs; ifa; ifa = ifa->ia_next) {
- if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0)
+ } else {
+ for (i = 0; ifap[i]; i++) {
+ ifa = ifatoia6(ifap[i]);
+ IFA_LOCK(&ifa->ia_ifa);
+ if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0) {
+ IFA_UNLOCK(&ifa->ia_ifa);
continue;
+ }
+ if (ifa->ia6_flags & IN6_IFF_DETACHED) {
+ ifa->ia6_flags &= ~IN6_IFF_DETACHED;
+ in6_ifaddr_set_dadprogress((struct in6_ifaddr *)ifa);
+ IFA_UNLOCK(&ifa->ia_ifa);
+ /* Do we need a delay in this case? */
+ nd6_dad_start((struct ifaddr *)ifa, 0);
+ } else {
+ IFA_UNLOCK(&ifa->ia_ifa);
+ }
+ }
+ }
+ ifnet_free_address_list(ifap);
+}
+
+static struct nd_prefix *
+nd6_prefix_equal_lookup(struct nd_prefix *pr, boolean_t primary_only)
+{
+ struct nd_prefix *opr;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ for (opr = nd_prefix.lh_first; opr; opr = opr->ndpr_next) {
+ if (opr == pr)
+ continue;
+
+ NDPR_LOCK(opr);
+ if ((opr->ndpr_stateflags & NDPRF_ONLINK) == 0) {
+ NDPR_UNLOCK(opr);
+ continue;
+ }
+ if (opr->ndpr_plen == pr->ndpr_plen &&
+ in6_are_prefix_equal(&pr->ndpr_prefix.sin6_addr,
+ &opr->ndpr_prefix.sin6_addr, pr->ndpr_plen) &&
+ (!primary_only ||
+ !(opr->ndpr_stateflags & NDPRF_IFSCOPE))) {
+ NDPR_ADDREF_LOCKED(opr);
+ NDPR_UNLOCK(opr);
+ return (opr);
+ }
+ NDPR_UNLOCK(opr);
+ }
+ return (NULL);
+}
+
+/*
+ * Synchronize the interface routes of similar prefixes on different
+ * interfaces; the one using the default interface would be (re)installed
+ * as a primary/non-scoped entry, and the rest as scoped entri(es).
+ */
+static void
+nd6_prefix_sync(struct ifnet *ifp)
+{
+ struct nd_prefix *pr, *opr;
+ int err = 0;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ if (ifp == NULL)
+ return;
- ifa->ia6_flags &= ~IN6_IFF_DETACHED;
+ for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
+ NDPR_LOCK(pr);
+ if (!(pr->ndpr_stateflags & NDPRF_ONLINK)) {
+ NDPR_UNLOCK(pr);
+ continue;
+ }
+ if (pr->ndpr_ifp == ifp &&
+ (pr->ndpr_stateflags & NDPRF_IFSCOPE) &&
+ !IN6_IS_ADDR_LINKLOCAL(&pr->ndpr_prefix.sin6_addr)) {
+ NDPR_UNLOCK(pr);
+ break;
}
+ NDPR_UNLOCK(pr);
}
- if (nd6locked == 0)
+
+ if (pr == NULL)
+ return;
+
+ /* Remove conflicting entries */
+ opr = nd6_prefix_equal_lookup(pr, TRUE);
+ if (opr != NULL) {
lck_mtx_unlock(nd6_mutex);
+ err = nd6_prefix_offlink(opr);
+ lck_mtx_lock(nd6_mutex);
+ if (err != 0) {
+ nd6log((LOG_ERR,
+ "%s: failed to make %s/%d offlink on %s, "
+ "errno=%d\n", __func__,
+ ip6_sprintf(&opr->ndpr_prefix.sin6_addr),
+ opr->ndpr_plen, if_name(opr->ndpr_ifp), err));
+ }
+ } else {
+ nd6log((LOG_ERR,
+ "%s: scoped %s/%d on %s has no matching unscoped prefix\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp)));
+ }
+
+ lck_mtx_unlock(nd6_mutex);
+ err = nd6_prefix_offlink(pr);
+ lck_mtx_lock(nd6_mutex);
+ if (err != 0) {
+ nd6log((LOG_ERR,
+ "%s: failed to make %s/%d offlink on %s, errno=%d\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp), err));
+ }
+
+ /* Add the entries back */
+ if (opr != NULL) {
+ err = nd6_prefix_onlink_scoped(opr, opr->ndpr_ifp->if_index);
+ if (err != 0) {
+ nd6log((LOG_ERR,
+ "%s: failed to make %s/%d scoped onlink on %s, "
+ "errno=%d\n", __func__,
+ ip6_sprintf(&opr->ndpr_prefix.sin6_addr),
+ opr->ndpr_plen, if_name(opr->ndpr_ifp), err));
+ }
+ }
+
+ err = nd6_prefix_onlink_scoped(pr, IFSCOPE_NONE);
+ if (err != 0) {
+ nd6log((LOG_ERR,
+ "%s: failed to make %s/%d onlink on %s, errno=%d\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp), err));
+ }
+
+ if (err != 0) {
+ nd6log((LOG_ERR,
+ "%s: error promoting %s/%d to %s from %s\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp),
+ (opr != NULL) ? if_name(opr->ndpr_ifp) : "NONE"));
+ } else {
+ nd6log2((LOG_INFO,
+ "%s: %s/%d promoted, previously on %s\n",
+ if_name(pr->ndpr_ifp),
+ ip6_sprintf(&pr->ndpr_prefix.sin6_addr), pr->ndpr_plen,
+ (opr != NULL) ? if_name(opr->ndpr_ifp) : "NONE"));
+ }
+
+ if (opr != NULL)
+ NDPR_REMREF(opr);
}
-int
-nd6_prefix_onlink(
- struct nd_prefix *pr, int rtlocked, int nd6locked)
+static int
+nd6_prefix_onlink_common(struct nd_prefix *pr, boolean_t force_scoped,
+ unsigned int ifscope)
{
struct ifaddr *ifa;
struct ifnet *ifp = pr->ndpr_ifp;
- struct sockaddr_in6 mask6;
+ struct sockaddr_in6 mask6, prefix;
struct nd_prefix *opr;
- u_long rtflags;
- int error = 0;
+ u_int32_t rtflags;
+ int error = 0, prproxy = 0;
struct rtentry *rt = NULL;
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
/* sanity check */
+ NDPR_LOCK(pr);
if ((pr->ndpr_stateflags & NDPRF_ONLINK) != 0) {
nd6log((LOG_ERR,
- "nd6_prefix_onlink: %s/%d is already on-link\n",
- ip6_sprintf(&pr->ndpr_prefix.sin6_addr), pr->ndpr_plen);
- return(EEXIST));
+ "%s: %s/%d on %s scoped=%d is already on-link\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp),
+ (pr->ndpr_stateflags & NDPRF_IFSCOPE) ? 1 : 0);
+ NDPR_UNLOCK(pr);
+ return (EEXIST));
}
+ NDPR_UNLOCK(pr);
/*
* Add the interface route associated with the prefix. Before
* installing the route, check if there's the same prefix on another
* interface, and the prefix has already installed the interface route.
- * Although such a configuration is expected to be rare, we explicitly
- * allow it.
*/
- if (nd6locked == 0)
- lck_mtx_lock(nd6_mutex);
- else
- lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
- for (opr = nd_prefix.lh_first; opr; opr = opr->ndpr_next) {
- if (opr == pr)
- continue;
-
- if ((opr->ndpr_stateflags & NDPRF_ONLINK) == 0)
- continue;
+ opr = nd6_prefix_equal_lookup(pr, FALSE);
+ if (opr != NULL)
+ NDPR_REMREF(opr);
- if (opr->ndpr_plen == pr->ndpr_plen &&
- in6_are_prefix_equal(&pr->ndpr_prefix.sin6_addr,
- &opr->ndpr_prefix.sin6_addr,
- pr->ndpr_plen)) {
- if (nd6locked == 0)
- lck_mtx_unlock(nd6_mutex);
- return(0);
- }
+ if (!force_scoped) {
+ /*
+ * If a primary/non-scoped interface route already exists,
+ * install the new one as a scoped entry. If the existing
+ * interface route is scoped, install new as non-scoped.
+ */
+ ifscope = (opr != NULL) ? ifp->if_index : IFSCOPE_NONE;
+ opr = nd6_prefix_equal_lookup(pr, TRUE);
+ if (opr != NULL)
+ NDPR_REMREF(opr);
+ else if (ifscope != IFSCOPE_NONE)
+ ifscope = IFSCOPE_NONE;
}
- if (nd6locked == 0)
- lck_mtx_unlock(nd6_mutex);
/*
- * We prefer link-local addresses as the associated interface address.
+ * We prefer link-local addresses as the associated interface address.
*/
/* search for a link-local addr */
ifa = (struct ifaddr *)in6ifa_ifpforlinklocal(ifp,
- IN6_IFF_NOTREADY|
- IN6_IFF_ANYCAST);
+ IN6_IFF_NOTREADY | IN6_IFF_ANYCAST);
if (ifa == NULL) {
- /* XXX: freebsd does not have ifa_ifwithaf */
- ifnet_lock_exclusive(ifp);
- TAILQ_FOREACH(ifa, &ifp->if_addrlist, ifa_list)
- {
- if (ifa->ifa_addr->sa_family == AF_INET6)
- break;
- }
+ struct in6_ifaddr *ia6;
+ ifnet_lock_shared(ifp);
+ IFP_TO_IA6(ifp, ia6);
ifnet_lock_done(ifp);
+ if (ia6 != NULL)
+ ifa = &ia6->ia_ifa;
/* should we care about ia6_flags? */
}
+ NDPR_LOCK(pr);
if (ifa == NULL) {
/*
* This can still happen, when, for example, we receive an RA
" to add route for a prefix(%s/%d) on %s\n",
ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
pr->ndpr_plen, if_name(ifp)));
- return(0);
+ NDPR_UNLOCK(pr);
+ return (0);
}
/*
* in6_ifinit() sets nd6_rtrequest to ifa_rtrequest for all ifaddrs.
* ifa->ifa_rtrequest = nd6_rtrequest;
*/
- bzero(&mask6, sizeof(mask6));
- mask6.sin6_len = sizeof(mask6);
+ bzero(&mask6, sizeof (mask6));
+ mask6.sin6_len = sizeof (mask6);
mask6.sin6_addr = pr->ndpr_mask;
+ prefix = pr->ndpr_prefix;
+ if ((rt = pr->ndpr_rt) != NULL)
+ pr->ndpr_rt = NULL;
+ NDPR_ADDREF_LOCKED(pr); /* keep reference for this routine */
+ NDPR_UNLOCK(pr);
- if (rtlocked == 0)
- lck_mtx_lock(rt_mtx);
-
+ IFA_LOCK_SPIN(ifa);
rtflags = ifa->ifa_flags | RTF_CLONING | RTF_UP;
+ IFA_UNLOCK(ifa);
if (nd6_need_cache(ifp)) {
/* explicitly set in case ifa_flags does not set the flag. */
rtflags |= RTF_CLONING;
*/
rtflags &= ~RTF_CLONING;
}
- error = rtrequest_locked(RTM_ADD, (struct sockaddr *)&pr->ndpr_prefix,
- ifa->ifa_addr, (struct sockaddr *)&mask6,
- rtflags, &rt);
- if (error == 0) {
- if (rt != NULL) /* this should be non NULL, though */
- nd6_rtmsg(RTM_ADD, rt);
- pr->ndpr_stateflags |= NDPRF_ONLINK;
+
+ lck_mtx_unlock(nd6_mutex);
+
+ if (rt != NULL) {
+ rtfree(rt);
+ rt = NULL;
}
- else {
+
+ error = rtrequest_scoped(RTM_ADD, (struct sockaddr *)&prefix,
+ ifa->ifa_addr, (struct sockaddr *)&mask6, rtflags, &rt,
+ ifscope);
+
+ /*
+ * Serialize the setting of NDPRF_PRPROXY.
+ */
+ lck_mtx_lock(&proxy6_lock);
+
+ if (rt != NULL) {
+ RT_LOCK(rt);
+ nd6_rtmsg(RTM_ADD, rt);
+ RT_UNLOCK(rt);
+ NDPR_LOCK(pr);
+ } else {
+ NDPR_LOCK(pr);
nd6log((LOG_ERR, "nd6_prefix_onlink: failed to add route for a"
- " prefix (%s/%d) on %s, gw=%s, mask=%s, flags=%lx "
- "errno = %d\n",
+ " prefix (%s/%d) on %s, gw=%s, mask=%s, flags=%lx,"
+ " scoped=%d, errno = %d\n",
ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
pr->ndpr_plen, if_name(ifp),
- ip6_sprintf(&((struct sockaddr_in6 *)ifa->ifa_addr)->sin6_addr),
- ip6_sprintf(&mask6.sin6_addr), rtflags, error));
+ ip6_sprintf(&((struct sockaddr_in6 *)
+ (void *)ifa->ifa_addr)->sin6_addr),
+ ip6_sprintf(&mask6.sin6_addr), rtflags,
+ (ifscope != IFSCOPE_NONE), error));
}
+ NDPR_LOCK_ASSERT_HELD(pr);
+
+ pr->ndpr_stateflags &= ~(NDPRF_IFSCOPE | NDPRF_PRPROXY);
+
+ /*
+ * TODO: If the prefix route exists, we should really find it and
+ * refer the prefix to it; otherwise ndpr_rt is NULL.
+ */
+ if (!(pr->ndpr_stateflags & NDPRF_DEFUNCT) &&
+ (rt != NULL || error == EEXIST)) {
+ struct nd_ifinfo *ndi = NULL;
+
+ VERIFY(pr->ndpr_prproxy_sols_cnt == 0);
+ VERIFY(RB_EMPTY(&pr->ndpr_prproxy_sols));
+
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+
+ pr->ndpr_rt = rt; /* keep reference from rtrequest */
+ pr->ndpr_stateflags |= NDPRF_ONLINK;
+ if (ifscope != IFSCOPE_NONE) {
+ pr->ndpr_stateflags |= NDPRF_IFSCOPE;
+ } else if ((rtflags & RTF_CLONING) &&
+ (ndi->flags & ND6_IFF_PROXY_PREFIXES) &&
+ !IN6_IS_ADDR_LINKLOCAL(&pr->ndpr_prefix.sin6_addr)) {
+ /*
+ * At present, in order for the prefix to be eligible
+ * as a proxying/proxied prefix, we require that the
+ * prefix route entry be marked as a cloning route with
+ * RTF_PROXY; i.e. nd6_need_cache() needs to return
+ * true for the interface type, hence the test for
+ * RTF_CLONING above.
+ */
+ pr->ndpr_stateflags |= NDPRF_PRPROXY;
+ }
- if (rt != NULL)
- rtunref(rt);
+ lck_mtx_unlock(&ndi->lock);
+ } else if (rt != NULL && pr->ndpr_stateflags & NDPRF_DEFUNCT)
+ rtfree(rt);
- if (rtlocked == 0)
- lck_mtx_unlock(rt_mtx);
- return(error);
+ prproxy = (pr->ndpr_stateflags & NDPRF_PRPROXY);
+ VERIFY(!prproxy || !(pr->ndpr_stateflags & NDPRF_IFSCOPE));
+ NDPR_UNLOCK(pr);
+
+ IFA_REMREF(ifa);
+
+ /*
+ * If this is an upstream prefix, find the downstream ones (if any)
+ * and re-configure their prefix routes accordingly. Otherwise,
+ * this could be potentially be a downstream prefix, and so find the
+ * upstream prefix, if any.
+ */
+ nd6_prproxy_prelist_update(pr, prproxy ? pr : NULL);
+
+ NDPR_REMREF(pr); /* release reference for this routine */
+ lck_mtx_unlock(&proxy6_lock);
+
+ lck_mtx_lock(nd6_mutex);
+
+ return (error);
}
int
-nd6_prefix_offlink(
- struct nd_prefix *pr)
+nd6_prefix_onlink(struct nd_prefix *pr)
{
- int error = 0;
+ return (nd6_prefix_onlink_common(pr, FALSE, IFSCOPE_NONE));
+}
+
+int
+nd6_prefix_onlink_scoped(struct nd_prefix *pr, unsigned int ifscope)
+{
+ return (nd6_prefix_onlink_common(pr, TRUE, ifscope));
+}
+
+int
+nd6_prefix_offlink(struct nd_prefix *pr)
+{
+ int plen, error = 0, prproxy;
struct ifnet *ifp = pr->ndpr_ifp;
- struct nd_prefix *opr;
- struct sockaddr_in6 sa6, mask6;
- struct rtentry *rt = NULL;
+ struct sockaddr_in6 sa6, mask6, prefix;
+ struct rtentry *rt = NULL, *ndpr_rt = NULL;
+ unsigned int ifscope;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_NOTOWNED);
/* sanity check */
+ NDPR_LOCK(pr);
if ((pr->ndpr_stateflags & NDPRF_ONLINK) == 0) {
nd6log((LOG_ERR,
- "nd6_prefix_offlink: %s/%d is already off-link\n",
- ip6_sprintf(&pr->ndpr_prefix.sin6_addr), pr->ndpr_plen));
- return(EEXIST);
+ "nd6_prefix_offlink: %s/%d on %s scoped=%d is already "
+ "off-link\n", ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp),
+ (pr->ndpr_stateflags & NDPRF_IFSCOPE) ? 1 : 0));
+ NDPR_UNLOCK(pr);
+ return (EEXIST);
}
- bzero(&sa6, sizeof(sa6));
+ bzero(&sa6, sizeof (sa6));
sa6.sin6_family = AF_INET6;
- sa6.sin6_len = sizeof(sa6);
+ sa6.sin6_len = sizeof (sa6);
bcopy(&pr->ndpr_prefix.sin6_addr, &sa6.sin6_addr,
- sizeof(struct in6_addr));
- bzero(&mask6, sizeof(mask6));
+ sizeof (struct in6_addr));
+ bzero(&mask6, sizeof (mask6));
mask6.sin6_family = AF_INET6;
- mask6.sin6_len = sizeof(sa6);
- bcopy(&pr->ndpr_mask, &mask6.sin6_addr, sizeof(struct in6_addr));
- lck_mtx_lock(rt_mtx);
- error = rtrequest_locked(RTM_DELETE, (struct sockaddr *)&sa6, NULL,
- (struct sockaddr *)&mask6, 0, &rt);
- if (error == 0) {
- pr->ndpr_stateflags &= ~NDPRF_ONLINK;
-
- /* report the route deletion to the routing socket. */
- if (rt != NULL)
- nd6_rtmsg(RTM_DELETE, rt);
-
- /*
- * There might be the same prefix on another interface,
- * the prefix which could not be on-link just because we have
- * the interface route (see comments in nd6_prefix_onlink).
- * If there's one, try to make the prefix on-link on the
- * interface.
- */
- lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
- for (opr = nd_prefix.lh_first; opr; opr = opr->ndpr_next) {
- if (opr == pr)
- continue;
+ mask6.sin6_len = sizeof (sa6);
+ bcopy(&pr->ndpr_mask, &mask6.sin6_addr, sizeof (struct in6_addr));
+ prefix = pr->ndpr_prefix;
+ plen = pr->ndpr_plen;
+ if ((ndpr_rt = pr->ndpr_rt) != NULL)
+ pr->ndpr_rt = NULL;
+ NDPR_ADDREF_LOCKED(pr); /* keep reference for this routine */
+ NDPR_UNLOCK(pr);
- if ((opr->ndpr_stateflags & NDPRF_ONLINK) != 0)
- continue;
+ ifscope = (pr->ndpr_stateflags & NDPRF_IFSCOPE) ?
+ ifp->if_index : IFSCOPE_NONE;
- /*
- * KAME specific: detached prefixes should not be
- * on-link.
- */
- if ((opr->ndpr_stateflags & NDPRF_DETACHED) != 0)
- continue;
+ error = rtrequest_scoped(RTM_DELETE, (struct sockaddr *)&sa6,
+ NULL, (struct sockaddr *)&mask6, 0, &rt, ifscope);
- if (opr->ndpr_plen == pr->ndpr_plen &&
- in6_are_prefix_equal(&pr->ndpr_prefix.sin6_addr,
- &opr->ndpr_prefix.sin6_addr,
- pr->ndpr_plen)) {
- int e;
+ if (rt != NULL) {
+ /* report the route deletion to the routing socket. */
+ RT_LOCK(rt);
+ nd6_rtmsg(RTM_DELETE, rt);
+ RT_UNLOCK(rt);
+ rtfree(rt);
- if ((e = nd6_prefix_onlink(opr, 1, 1)) != 0) {
- nd6log((LOG_ERR,
- "nd6_prefix_offlink: failed to "
- "recover a prefix %s/%d from %s "
- "to %s (errno = %d)\n",
- ip6_sprintf(&opr->ndpr_prefix.sin6_addr),
- opr->ndpr_plen, if_name(ifp),
- if_name(opr->ndpr_ifp), e));
- }
- }
- }
- }
- else {
- /* XXX: can we still set the NDPRF_ONLINK flag? */
+ } else {
nd6log((LOG_ERR,
"nd6_prefix_offlink: failed to delete route: "
- "%s/%d on %s (errno = %d)\n",
- ip6_sprintf(&sa6.sin6_addr), pr->ndpr_plen, if_name(ifp),
- error));
+ "%s/%d on %s, scoped %d, (errno = %d)\n",
+ ip6_sprintf(&sa6.sin6_addr), plen, if_name(ifp),
+ (ifscope != IFSCOPE_NONE), error));
}
- if (rt != NULL) {
- if (rt->rt_refcnt <= 0) {
- /* XXX: we should free the entry ourselves. */
- rtref(rt);
- rtfree_locked(rt);
- }
+ if (ndpr_rt != NULL)
+ rtfree(ndpr_rt);
+
+ lck_mtx_lock(&proxy6_lock);
+
+ NDPR_LOCK(pr);
+ prproxy = (pr->ndpr_stateflags & NDPRF_PRPROXY);
+ VERIFY(!prproxy || !(pr->ndpr_stateflags & NDPRF_IFSCOPE));
+ pr->ndpr_stateflags &= ~(NDPRF_ONLINK | NDPRF_IFSCOPE | NDPRF_PRPROXY);
+ if (pr->ndpr_prproxy_sols_cnt > 0) {
+ VERIFY(prproxy);
+ nd6_prproxy_sols_reap(pr);
+ VERIFY(pr->ndpr_prproxy_sols_cnt == 0);
+ VERIFY(RB_EMPTY(&pr->ndpr_prproxy_sols));
}
- lck_mtx_unlock(rt_mtx);
+ NDPR_UNLOCK(pr);
+
+ /*
+ * If this was an upstream prefix, find the downstream ones and do
+ * some cleanups. If this was a downstream prefix, the prefix route
+ * has been removed from the routing table above, but there may be
+ * other tasks to perform.
+ */
+ nd6_prproxy_prelist_update(pr, prproxy ? pr : NULL);
- return(error);
+ NDPR_REMREF(pr); /* release reference for this routine */
+ lck_mtx_unlock(&proxy6_lock);
+
+ return (error);
}
static struct in6_ifaddr *
-in6_ifadd(
- struct nd_prefix *pr,
- struct in6_addr *ifid) /* Mobile IPv6 addition */
+in6_pfx_newpersistaddr(struct nd_prefix *pr, int mcast, int *errorp)
{
- struct ifnet *ifp = pr->ndpr_ifp;
- struct ifaddr *ifa;
- struct in6_aliasreq ifra;
- struct in6_ifaddr *ia, *ib;
- int error, plen0;
+ struct in6_ifaddr *ia6 = NULL;
+ struct ifnet *ifp = NULL;
+ struct nd_ifinfo *ndi = NULL;
struct in6_addr mask;
- int prefixlen = pr->ndpr_plen;
+ struct in6_aliasreq ifra;
+ int error, ifaupdate, iidlen, notcga;
+
+ VERIFY(pr != NULL);
+ VERIFY(errorp != NULL);
- in6_len2mask(&mask, prefixlen);
+ NDPR_LOCK(pr);
+ ifp = pr->ndpr_ifp;
+ ia6 = NULL;
+ error = 0;
/*
- * find a link-local address (will be interface ID).
- * Is it really mandatory? Theoretically, a global or a site-local
- * address can be configured without a link-local address, if we
- * have a unique interface identifier...
- *
- * it is not mandatory to have a link-local address, we can generate
- * interface identifier on the fly. we do this because:
- * (1) it should be the easiest way to find interface identifier.
- * (2) RFC2462 5.4 suggesting the use of the same interface identifier
- * for multiple addresses on a single interface, and possible shortcut
- * of DAD. we omitted DAD for this reason in the past.
- * (3) a user can prevent autoconfiguration of global address
- * by removing link-local address by hand (this is partly because we
- * don't have other way to control the use of IPv6 on a interface.
- * this has been our design choice - cf. NRL's "ifconfig auto").
- * (4) it is easier to manage when an interface has addresses
- * with the same interface identifier, than to have multiple addresses
- * with different interface identifiers.
- *
- * Mobile IPv6 addition: allow for caller to specify a wished interface
- * ID. This is to not break connections when moving addresses between
- * interfaces.
+ * Prefix Length check:
+ * If the sum of the prefix length and interface identifier
+ * length does not equal 128 bits, the Prefix Information
+ * option MUST be ignored. The length of the interface
+ * identifier is defined in a separate link-type specific
+ * document.
*/
- ifa = (struct ifaddr *)in6ifa_ifpforlinklocal(ifp, 0);/* 0 is OK? */
- if (ifa)
- ib = (struct in6_ifaddr *)ifa;
- else
- return NULL;
-
-#if 0 /* don't care link local addr state, and always do DAD */
- /* if link-local address is not eligible, do not autoconfigure. */
- if (((struct in6_ifaddr *)ifa)->ia6_flags & IN6_IFF_NOTREADY) {
- printf("in6_ifadd: link-local address not ready\n");
- return NULL;
+ iidlen = in6_if2idlen(ifp);
+ if (iidlen < 0) {
+ error = EADDRNOTAVAIL;
+ /* this should not happen, so we always log it. */
+ log(LOG_ERR, "%s: IID length undefined (%s)\n",
+ __func__, if_name(ifp));
+ goto unlock1;
+ } else if (iidlen != 64) {
+ error = EADDRNOTAVAIL;
+ /*
+ * stateless autoconfiguration not yet well-defined for IID
+ * lengths other than 64 octets. Just give up for now.
+ */
+ nd6log((LOG_INFO, "%s: IID length not 64 octets (%s)\n",
+ __func__, if_name(ifp)));
+ goto unlock1;
}
-#endif
- /* prefixlen + ifidlen must be equal to 128 */
- plen0 = in6_mask2len(&ib->ia_prefixmask.sin6_addr, NULL);
- if (prefixlen != plen0) {
- nd6log((LOG_INFO, "in6_ifadd: wrong prefixlen for %s "
- "(prefix=%d ifid=%d)\n",
- if_name(ifp), prefixlen, 128 - plen0));
- return NULL;
+ if (iidlen + pr->ndpr_plen != 128) {
+ error = EADDRNOTAVAIL;
+ nd6log((LOG_INFO,
+ "%s: invalid prefix length %d for %s, ignored\n",
+ __func__, pr->ndpr_plen, if_name(ifp)));
+ goto unlock1;
}
- /* make ifaddr */
-
- bzero(&ifra, sizeof(ifra));
- /*
- * in6_update_ifa() does not use ifra_name, but we accurately set it
- * for safety.
- */
- strncpy(ifra.ifra_name, if_name(ifp), sizeof(ifra.ifra_name));
+ bzero(&ifra, sizeof (ifra));
+ strlcpy(ifra.ifra_name, if_name(ifp), sizeof (ifra.ifra_name));
ifra.ifra_addr.sin6_family = AF_INET6;
- ifra.ifra_addr.sin6_len = sizeof(struct sockaddr_in6);
+ ifra.ifra_addr.sin6_len = sizeof (struct sockaddr_in6);
+
/* prefix */
bcopy(&pr->ndpr_prefix.sin6_addr, &ifra.ifra_addr.sin6_addr,
- sizeof(ifra.ifra_addr.sin6_addr));
+ sizeof (ifra.ifra_addr.sin6_addr));
+ in6_len2mask(&mask, pr->ndpr_plen);
ifra.ifra_addr.sin6_addr.s6_addr32[0] &= mask.s6_addr32[0];
ifra.ifra_addr.sin6_addr.s6_addr32[1] &= mask.s6_addr32[1];
ifra.ifra_addr.sin6_addr.s6_addr32[2] &= mask.s6_addr32[2];
ifra.ifra_addr.sin6_addr.s6_addr32[3] &= mask.s6_addr32[3];
- /* interface ID */
- if (ifid == NULL || IN6_IS_ADDR_UNSPECIFIED(ifid))
- ifid = &ib->ia_addr.sin6_addr;
- ifra.ifra_addr.sin6_addr.s6_addr32[0]
- |= (ifid->s6_addr32[0] & ~mask.s6_addr32[0]);
- ifra.ifra_addr.sin6_addr.s6_addr32[1]
- |= (ifid->s6_addr32[1] & ~mask.s6_addr32[1]);
- ifra.ifra_addr.sin6_addr.s6_addr32[2]
- |= (ifid->s6_addr32[2] & ~mask.s6_addr32[2]);
- ifra.ifra_addr.sin6_addr.s6_addr32[3]
- |= (ifid->s6_addr32[3] & ~mask.s6_addr32[3]);
-
+ ndi = ND_IFINFO(ifp);
+ VERIFY(ndi->initialized);
+ lck_mtx_lock(&ndi->lock);
+
+ notcga = nd6_send_opstate == ND6_SEND_OPMODE_DISABLED ||
+ (ndi->flags & ND6_IFF_INSECURE) != 0;
+
+ lck_mtx_unlock(&ndi->lock);
+ NDPR_UNLOCK(pr);
+
+ if (notcga) {
+ ia6 = in6ifa_ifpforlinklocal(ifp, 0);
+ if (ia6 == NULL) {
+ error = EADDRNOTAVAIL;
+ nd6log((LOG_INFO, "%s: no link-local address (%s)\n",
+ __func__, if_name(ifp)));
+ goto done;
+ }
+
+ IFA_LOCK(&ia6->ia_ifa);
+ ifra.ifra_addr.sin6_addr.s6_addr32[0] |=
+ (ia6->ia_addr.sin6_addr.s6_addr32[0] & ~mask.s6_addr32[0]);
+ ifra.ifra_addr.sin6_addr.s6_addr32[1] |=
+ (ia6->ia_addr.sin6_addr.s6_addr32[1] & ~mask.s6_addr32[1]);
+ ifra.ifra_addr.sin6_addr.s6_addr32[2] |=
+ (ia6->ia_addr.sin6_addr.s6_addr32[2] & ~mask.s6_addr32[2]);
+ ifra.ifra_addr.sin6_addr.s6_addr32[3] |=
+ (ia6->ia_addr.sin6_addr.s6_addr32[3] & ~mask.s6_addr32[3]);
+ IFA_UNLOCK(&ia6->ia_ifa);
+ IFA_REMREF(&ia6->ia_ifa);
+ ia6 = NULL;
+ } else {
+ in6_cga_node_lock();
+ struct in6_cga_prepare local_cga_prepare;
+
+ if (ndi->cga_initialized) {
+ bcopy(&(ndi->local_cga_modifier),
+ &(local_cga_prepare.cga_modifier),
+ sizeof(local_cga_prepare.cga_modifier));
+ error = in6_cga_generate(&local_cga_prepare, 0,
+ &ifra.ifra_addr.sin6_addr);
+ } else {
+ error = in6_cga_generate(NULL, 0,
+ &ifra.ifra_addr.sin6_addr);
+ }
+ in6_cga_node_unlock();
+ if (error == 0)
+ ifra.ifra_flags |= IN6_IFF_SECURED;
+ else {
+ nd6log((LOG_ERR, "%s: no CGA available (%s)\n",
+ __func__, if_name(ifp)));
+ goto done;
+ }
+ }
+
+ VERIFY(ia6 == NULL);
+
/* new prefix mask. */
- ifra.ifra_prefixmask.sin6_len = sizeof(struct sockaddr_in6);
+ ifra.ifra_prefixmask.sin6_len = sizeof (struct sockaddr_in6);
ifra.ifra_prefixmask.sin6_family = AF_INET6;
bcopy(&mask, &ifra.ifra_prefixmask.sin6_addr,
- sizeof(ifra.ifra_prefixmask.sin6_addr));
+ sizeof (ifra.ifra_prefixmask.sin6_addr));
- /*
- * lifetime.
- * XXX: in6_init_address_ltimes would override these values later.
- * We should reconsider this logic.
- */
+ /* lifetimes. */
ifra.ifra_lifetime.ia6t_vltime = pr->ndpr_vltime;
ifra.ifra_lifetime.ia6t_pltime = pr->ndpr_pltime;
- /* XXX: scope zone ID? */
-
+ /* address flags */
ifra.ifra_flags |= IN6_IFF_AUTOCONF; /* obey autoconf */
+
/*
- * temporarily set the nopfx flag to avoid conflict.
- * XXX: we should reconsider the entire mechanism about prefix
- * manipulation.
+ * Make sure that we do not have this address already. This should
+ * usually not happen, but we can still see this case, e.g., if we
+ * have manually configured the exact address to be configured.
*/
- ifra.ifra_flags |= IN6_IFF_NOPFX;
+ if ((ia6 = in6ifa_ifpwithaddr(ifp, &ifra.ifra_addr.sin6_addr))
+ != NULL) {
+ error = EADDRNOTAVAIL;
+ IFA_REMREF(&ia6->ia_ifa);
+ ia6 = NULL;
+
+ /* this should be rare enough to make an explicit log */
+ log(LOG_INFO, "%s: %s is already configured!\n",
+ __func__, ip6_sprintf(&ifra.ifra_addr.sin6_addr));
+ goto done;
+ }
/*
- * keep the new address, regardless of the result of in6_update_ifa.
- * XXX: this address is now meaningless.
- * We should reconsider its role.
+ * Allocate ifaddr structure, link into chain, etc.
+ * If we are going to create a new address upon receiving a multicasted
+ * RA, we need to impose a random delay before starting DAD.
+ * [RFC 4862, Section 5.4.2]
*/
- pr->ndpr_addr = ifra.ifra_addr.sin6_addr;
-
- /* allocate ifaddr structure, link into chain, etc. */
- if ((error = in6_update_ifa(ifp, &ifra, NULL)) != 0) {
+ ifaupdate = IN6_IFAUPDATE_NOWAIT;
+ if (mcast)
+ ifaupdate |= IN6_IFAUPDATE_DADDELAY;
+ error = in6_update_ifa(ifp, &ifra, ifaupdate, &ia6);
+ if (error != 0) {
nd6log((LOG_ERR,
- "in6_ifadd: failed to make ifaddr %s on %s (errno=%d)\n",
- ip6_sprintf(&ifra.ifra_addr.sin6_addr), if_name(ifp),
- error));
- return(NULL); /* ifaddr must not have been allocated. */
+ "%s: failed to make ifaddr %s on %s (errno=%d)\n",
+ __func__, ip6_sprintf(&ifra.ifra_addr.sin6_addr),
+ if_name(ifp), error));
+ error = EADDRNOTAVAIL;
+ goto done;
}
- ia = in6ifa_ifpwithaddr(ifp, &ifra.ifra_addr.sin6_addr);
+ VERIFY(ia6 != NULL);
+ in6_post_msg(ifp, KEV_INET6_NEW_RTADV_ADDR, ia6, NULL);
+ goto done;
- in6_post_msg(ifp, KEV_INET6_NEW_RTADV_ADDR, ia);
+unlock1:
+ NDPR_UNLOCK(pr);
- return(ia); /* this must NOT be NULL. */
+done:
+ *errorp = error;
+ return (ia6);
}
+#define IA6_NONCONST(i) ((struct in6_ifaddr *)(uintptr_t)(i))
+
int
-in6_tmpifadd(
- const struct in6_ifaddr *ia0, /* corresponding public address */
- int forcegen)
+in6_tmpifadd(const struct in6_ifaddr *ia0, int forcegen)
{
struct ifnet *ifp = ia0->ia_ifa.ifa_ifp;
- struct in6_ifaddr *newia;
+ struct in6_ifaddr *ia, *newia;
struct in6_aliasreq ifra;
- int i, error;
+ int i, error, ifaupdate;
int trylimit = 3; /* XXX: adhoc value */
u_int32_t randid[2];
time_t vltime0, pltime0;
- struct timeval timenow;
-
- getmicrotime(&timenow);
+ uint64_t timenow = net_uptime();
+ struct in6_addr addr;
+ struct nd_prefix *ndpr;
- bzero(&ifra, sizeof(ifra));
- strncpy(ifra.ifra_name, if_name(ifp), sizeof(ifra.ifra_name));
+ bzero(&ifra, sizeof (ifra));
+ strlcpy(ifra.ifra_name, if_name(ifp), sizeof (ifra.ifra_name));
+ IFA_LOCK(&IA6_NONCONST(ia0)->ia_ifa);
ifra.ifra_addr = ia0->ia_addr;
/* copy prefix mask */
ifra.ifra_prefixmask = ia0->ia_prefixmask;
ifra.ifra_addr.sin6_addr.s6_addr32[i]
&= ifra.ifra_prefixmask.sin6_addr.s6_addr32[i];
}
+ addr = ia0->ia_addr.sin6_addr;
+ IFA_UNLOCK(&IA6_NONCONST(ia0)->ia_ifa);
- again:
- in6_get_tmpifid(ifp, (u_int8_t *)randid,
- (const u_int8_t *)&ia0->ia_addr.sin6_addr.s6_addr[8],
- forcegen);
- ifra.ifra_addr.sin6_addr.s6_addr32[2]
- |= (randid[0] & ~(ifra.ifra_prefixmask.sin6_addr.s6_addr32[2]));
- ifra.ifra_addr.sin6_addr.s6_addr32[3]
- |= (randid[1] & ~(ifra.ifra_prefixmask.sin6_addr.s6_addr32[3]));
+again:
+ in6_iid_mktmp(ifp, (u_int8_t *)randid,
+ (const u_int8_t *)&addr.s6_addr[8], forcegen);
+
+ ifra.ifra_addr.sin6_addr.s6_addr32[2] |=
+ (randid[0] & ~(ifra.ifra_prefixmask.sin6_addr.s6_addr32[2]));
+ ifra.ifra_addr.sin6_addr.s6_addr32[3] |=
+ (randid[1] & ~(ifra.ifra_prefixmask.sin6_addr.s6_addr32[3]));
/*
- * If by chance the new temporary address is the same as an address
- * already assigned to the interface, generate a new randomized
- * interface identifier and repeat this step.
- * RFC 3041 3.3 (4).
+ * in6_iid_mktmp() quite likely provided a unique interface ID.
+ * However, we may still have a chance to see collision, because
+ * there may be a time lag between generation of the ID and generation
+ * of the address. So, we'll do one more sanity check.
*/
- if (in6ifa_ifpwithaddr(ifp, &ifra.ifra_addr.sin6_addr) != NULL) {
+ if ((ia = in6ifa_ifpwithaddr(ifp, &ifra.ifra_addr.sin6_addr)) != NULL) {
+ IFA_REMREF(&ia->ia_ifa);
if (trylimit-- == 0) {
nd6log((LOG_NOTICE, "in6_tmpifadd: failed to find "
"a unique random IFID\n"));
- return(EEXIST);
+ return (EEXIST);
}
forcegen = 1;
goto again;
/*
* The Valid Lifetime is the lower of the Valid Lifetime of the
- * public address or TEMP_VALID_LIFETIME.
+ * public address or TEMP_VALID_LIFETIME.
* The Preferred Lifetime is the lower of the Preferred Lifetime
- * of the public address or TEMP_PREFERRED_LIFETIME -
- * DESYNC_FACTOR.
+ * of the public address or TEMP_PREFERRED_LIFETIME -
+ * DESYNC_FACTOR.
*/
- if (ia0->ia6_lifetime.ia6t_expire != 0) {
- vltime0 = IFA6_IS_INVALID(ia0) ? 0 :
- (ia0->ia6_lifetime.ia6t_expire - timenow.tv_sec);
+ IFA_LOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ if (ia0->ia6_lifetime.ia6ti_vltime != ND6_INFINITE_LIFETIME) {
+ vltime0 = IFA6_IS_INVALID(ia0, timenow) ? 0 :
+ (ia0->ia6_lifetime.ia6ti_vltime -
+ (timenow - ia0->ia6_updatetime));
if (vltime0 > ip6_temp_valid_lifetime)
vltime0 = ip6_temp_valid_lifetime;
- } else
+ } else {
vltime0 = ip6_temp_valid_lifetime;
- if (ia0->ia6_lifetime.ia6t_preferred != 0) {
- pltime0 = IFA6_IS_DEPRECATED(ia0) ? 0 :
- (ia0->ia6_lifetime.ia6t_preferred - timenow.tv_sec);
- if (pltime0 > ip6_temp_preferred_lifetime - ip6_desync_factor){
+ }
+ if (ia0->ia6_lifetime.ia6ti_pltime != ND6_INFINITE_LIFETIME) {
+ pltime0 = IFA6_IS_DEPRECATED(ia0, timenow) ? 0 :
+ (ia0->ia6_lifetime.ia6ti_pltime -
+ (timenow - ia0->ia6_updatetime));
+ if (pltime0 > ip6_temp_preferred_lifetime - ip6_desync_factor)
pltime0 = ip6_temp_preferred_lifetime -
- ip6_desync_factor;
- }
- } else
+ ip6_desync_factor;
+ } else {
pltime0 = ip6_temp_preferred_lifetime - ip6_desync_factor;
+ }
ifra.ifra_lifetime.ia6t_vltime = vltime0;
ifra.ifra_lifetime.ia6t_pltime = pltime0;
-
+ IFA_UNLOCK(&IA6_NONCONST(ia0)->ia_ifa);
/*
* A temporary address is created only if this calculated Preferred
* Lifetime is greater than REGEN_ADVANCE time units.
*/
if (ifra.ifra_lifetime.ia6t_pltime <= ip6_temp_regen_advance)
- return(0);
+ return (0);
/* XXX: scope zone ID? */
ifra.ifra_flags |= (IN6_IFF_AUTOCONF|IN6_IFF_TEMPORARY);
/* allocate ifaddr structure, link into chain, etc. */
- if ((error = in6_update_ifa(ifp, &ifra, NULL)) != 0)
- return(error);
-
- newia = in6ifa_ifpwithaddr(ifp, &ifra.ifra_addr.sin6_addr);
- if (newia == NULL) { /* XXX: can it happen? */
- nd6log((LOG_ERR,
- "in6_tmpifadd: ifa update succeeded, but we got "
- "no ifaddr\n"));
- return(EINVAL); /* XXX */
+ ifaupdate = IN6_IFAUPDATE_NOWAIT | IN6_IFAUPDATE_DADDELAY;
+ error = in6_update_ifa(ifp, &ifra, ifaupdate, &newia);
+ if (error != 0) {
+ nd6log((LOG_ERR, "in6_tmpifadd: failed to add address.\n"));
+ return (error);
}
- newia->ia6_ndpr = ia0->ia6_ndpr;
- newia->ia6_ndpr->ndpr_refcnt++;
+ VERIFY(newia != NULL);
+ IFA_LOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ ndpr = ia0->ia6_ndpr;
+ if (ndpr == NULL) {
+ /*
+ * We lost the race with another thread that has purged
+ * ia0 address; in this case, purge the tmp addr as well.
+ */
+ nd6log((LOG_ERR, "in6_tmpifadd: no public address\n"));
+ VERIFY(!(ia0->ia6_flags & IN6_IFF_AUTOCONF));
+ IFA_UNLOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ in6_purgeaddr(&newia->ia_ifa);
+ IFA_REMREF(&newia->ia_ifa);
+ return (EADDRNOTAVAIL);
+ }
+ NDPR_ADDREF(ndpr); /* for us */
+ IFA_UNLOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ IFA_LOCK(&newia->ia_ifa);
+ if (newia->ia6_ndpr != NULL) {
+ NDPR_LOCK(newia->ia6_ndpr);
+ VERIFY(newia->ia6_ndpr->ndpr_addrcnt != 0);
+ newia->ia6_ndpr->ndpr_addrcnt--;
+ NDPR_UNLOCK(newia->ia6_ndpr);
+ NDPR_REMREF(newia->ia6_ndpr); /* release addr reference */
+ }
+ newia->ia6_ndpr = ndpr;
+ NDPR_LOCK(newia->ia6_ndpr);
+ newia->ia6_ndpr->ndpr_addrcnt++;
+ VERIFY(newia->ia6_ndpr->ndpr_addrcnt != 0);
+ NDPR_ADDREF_LOCKED(newia->ia6_ndpr); /* for addr reference */
+ NDPR_UNLOCK(newia->ia6_ndpr);
+ IFA_UNLOCK(&newia->ia_ifa);
/*
* A newly added address might affect the status of other addresses.
* XXX: when the temporary address is generated with a new public
* and, in fact, we surely need the check when we create a new
* temporary address due to deprecation of an old temporary address.
*/
- pfxlist_onlink_check(0);
+ lck_mtx_lock(nd6_mutex);
+ pfxlist_onlink_check();
+ lck_mtx_unlock(nd6_mutex);
+ IFA_REMREF(&newia->ia_ifa);
- return(0);
-}
+ /* remove our reference */
+ NDPR_REMREF(ndpr);
+
+ return (0);
+}
+#undef IA6_NONCONST
int
in6_init_prefix_ltimes(struct nd_prefix *ndpr)
{
- struct timeval timenow;
+ struct timeval caltime;
+ u_int64_t timenow = net_uptime();
+
+ NDPR_LOCK_ASSERT_HELD(ndpr);
+
+ getmicrotime(&caltime);
+ ndpr->ndpr_base_calendartime = caltime.tv_sec;
+ ndpr->ndpr_base_uptime = timenow;
- getmicrotime(&timenow);
- /* check if preferred lifetime > valid lifetime. RFC2462 5.5.3 (c) */
+ /* check if preferred lifetime > valid lifetime. RFC 4862 5.5.3 (c) */
if (ndpr->ndpr_pltime > ndpr->ndpr_vltime) {
nd6log((LOG_INFO, "in6_init_prefix_ltimes: preferred lifetime"
"(%d) is greater than valid lifetime(%d)\n",
if (ndpr->ndpr_pltime == ND6_INFINITE_LIFETIME)
ndpr->ndpr_preferred = 0;
else
- ndpr->ndpr_preferred = timenow.tv_sec + ndpr->ndpr_pltime;
+ ndpr->ndpr_preferred = timenow + ndpr->ndpr_pltime;
if (ndpr->ndpr_vltime == ND6_INFINITE_LIFETIME)
ndpr->ndpr_expire = 0;
else
- ndpr->ndpr_expire = timenow.tv_sec + ndpr->ndpr_vltime;
+ ndpr->ndpr_expire = timenow + ndpr->ndpr_vltime;
- return 0;
+ return (0);
}
static void
in6_init_address_ltimes(struct nd_prefix *new, struct in6_addrlifetime *lt6)
{
- struct timeval timenow;
+#pragma unused(new)
+ uint64_t timenow = net_uptime();
- getmicrotime(&timenow);
/* Valid lifetime must not be updated unless explicitly specified. */
/* init ia6t_expire */
- if (lt6->ia6t_vltime == ND6_INFINITE_LIFETIME)
+ if (lt6->ia6t_vltime == ND6_INFINITE_LIFETIME) {
lt6->ia6t_expire = 0;
- else {
- lt6->ia6t_expire = timenow.tv_sec;
+ } else {
+ lt6->ia6t_expire = timenow;
lt6->ia6t_expire += lt6->ia6t_vltime;
}
/* init ia6t_preferred */
- if (lt6->ia6t_pltime == ND6_INFINITE_LIFETIME)
+ if (lt6->ia6t_pltime == ND6_INFINITE_LIFETIME) {
lt6->ia6t_preferred = 0;
- else {
- lt6->ia6t_preferred = timenow.tv_sec;
+ } else {
+ lt6->ia6t_preferred = timenow;
lt6->ia6t_preferred += lt6->ia6t_pltime;
}
}
if (!IN6_IS_ADDR_LINKLOCAL(gateway)) {
return;
}
- lck_mtx_lock(rt_mtx);
+ lck_mtx_lock(rnh_lock);
/* XXX: hack for KAME's link-local address kludge */
gateway->s6_addr16[1] = htons(ifp->if_index);
rnh->rnh_walktree(rnh, rt6_deleteroute, (void *)gateway);
- lck_mtx_unlock(rt_mtx);
+ lck_mtx_unlock(rnh_lock);
}
static int
struct radix_node *rn,
void *arg)
{
-#define SIN6(s) ((struct sockaddr_in6 *)s)
struct rtentry *rt = (struct rtentry *)rn;
struct in6_addr *gate = (struct in6_addr *)arg;
- lck_mtx_assert(rt_mtx, LCK_MTX_ASSERT_OWNED);
+ lck_mtx_assert(rnh_lock, LCK_MTX_ASSERT_OWNED);
- if (rt->rt_gateway == NULL || rt->rt_gateway->sa_family != AF_INET6)
- return(0);
-
- if (!IN6_ARE_ADDR_EQUAL(gate, &SIN6(rt->rt_gateway)->sin6_addr))
- return(0);
+ RT_LOCK(rt);
+ if (rt->rt_gateway == NULL || rt->rt_gateway->sa_family != AF_INET6) {
+ RT_UNLOCK(rt);
+ return (0);
+ }
+ if (!IN6_ARE_ADDR_EQUAL(gate, &SIN6(rt->rt_gateway)->sin6_addr)) {
+ RT_UNLOCK(rt);
+ return (0);
+ }
/*
* Do not delete a static route.
* XXX: this seems to be a bit ad-hoc. Should we consider the
* 'cloned' bit instead?
*/
- if ((rt->rt_flags & RTF_STATIC) != 0)
- return(0);
-
+ if ((rt->rt_flags & RTF_STATIC) != 0) {
+ RT_UNLOCK(rt);
+ return (0);
+ }
/*
* We delete only host route. This means, in particular, we don't
* delete default route.
*/
- if ((rt->rt_flags & RTF_HOST) == 0)
- return(0);
+ if ((rt->rt_flags & RTF_HOST) == 0) {
+ RT_UNLOCK(rt);
+ return (0);
+ }
- return(rtrequest_locked(RTM_DELETE, rt_key(rt),
- rt->rt_gateway, rt_mask(rt), rt->rt_flags, 0));
-#undef SIN6
+ /*
+ * Safe to drop rt_lock and use rt_key, rt_gateway, since holding
+ * rnh_lock here prevents another thread from calling rt_setgate()
+ * on this route.
+ */
+ RT_UNLOCK(rt);
+ return (rtrequest_locked(RTM_DELETE, rt_key(rt), rt->rt_gateway,
+ rt_mask(rt), rt->rt_flags, 0));
}
int
int ifindex)
{
int error = 0;
+ ifnet_t def_ifp = NULL;
- if (ifindex < 0 || if_index < ifindex)
- return(EINVAL);
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_NOTOWNED);
+
+ ifnet_head_lock_shared();
+ if (ifindex < 0 || if_index < ifindex) {
+ ifnet_head_done();
+ return (EINVAL);
+ }
+ def_ifp = ifindex2ifnet[ifindex];
+ ifnet_head_done();
lck_mtx_lock(nd6_mutex);
if (nd6_defifindex != ifindex) {
+ struct ifnet *odef_ifp = nd6_defifp;
+
nd6_defifindex = ifindex;
if (nd6_defifindex > 0)
- nd6_defifp = ifindex2ifnet[nd6_defifindex];
+ nd6_defifp = def_ifp;
else
nd6_defifp = NULL;
+ if (nd6_defifp != NULL)
+ nd6log((LOG_INFO, "%s: is now the default "
+ "interface (was %s)\n", if_name(nd6_defifp),
+ odef_ifp != NULL ? if_name(odef_ifp) : "NONE"));
+ else
+ nd6log((LOG_INFO, "No default interface set\n"));
+
/*
* If the Default Router List is empty, install a route
* to the specified interface as default or remove the default
* we do this here to avoid re-install the default route
* if the list is NOT empty.
*/
- if (TAILQ_FIRST(&nd_defrouter) == NULL)
- defrouter_select();
+ if (odef_ifp != NULL) {
+ defrouter_select(odef_ifp);
+ }
+
+ if (nd6_defifp != NULL) {
+ defrouter_select(nd6_defifp);
+ nd6_prefix_sync(nd6_defifp);
+ }
/*
- * Our current implementation assumes one-to-one maping between
+ * Our current implementation assumes one-to-one mapping between
* interfaces and links, so it would be natural to use the
* default interface as the default link.
*/
scope6_setdefault(nd6_defifp);
}
-
lck_mtx_unlock(nd6_mutex);
- return(error);
+ return (error);
}