-/* $KAME: nd6_rtr.c,v 1.30 2000/03/21 11:37:31 itojun Exp $ */
+/*
+ * Copyright (c) 2003-2016 Apple Inc. All rights reserved.
+ *
+ * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
+ *
+ * This file contains Original Code and/or Modifications of Original Code
+ * as defined in and that are subject to the Apple Public Source License
+ * Version 2.0 (the 'License'). You may not use this file except in
+ * compliance with the License. The rights granted to you under the License
+ * may not be used to create, or enable the creation or redistribution of,
+ * unlawful or unlicensed copies of an Apple operating system, or to
+ * circumvent, violate, or enable the circumvention or violation of, any
+ * terms of an Apple operating system software license agreement.
+ *
+ * Please obtain a copy of the License at
+ * http://www.opensource.apple.com/apsl/ and read it before using this file.
+ *
+ * The Original Code and all software distributed under the License are
+ * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
+ * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
+ * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
+ * Please see the License for the specific language governing rights and
+ * limitations under the License.
+ *
+ * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
+ */
/*
* Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
* SUCH DAMAGE.
*/
+
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/malloc.h>
#include <sys/time.h>
#include <sys/kernel.h>
#include <sys/errno.h>
-#if !(defined(__FreeBSD__) && __FreeBSD__ >= 3)
-#include <sys/ioctl.h>
-#endif
#include <sys/syslog.h>
+#include <sys/queue.h>
+#include <sys/mcache.h>
+#include <sys/protosw.h>
+
+#include <dev/random/randomdev.h>
+
+#include <kern/locks.h>
+#include <kern/zalloc.h>
+#include <machine/machine_routines.h>
#include <net/if.h>
+#include <net/if_var.h>
#include <net/if_types.h>
#include <net/if_dl.h>
#include <net/route.h>
#include <netinet/in.h>
#include <netinet6/in6_var.h>
+#include <netinet6/in6_ifattach.h>
#include <netinet/ip6.h>
#include <netinet6/ip6_var.h>
#include <netinet6/nd6.h>
#include <netinet/icmp6.h>
-
-#if MIP6
-#include <netinet6/mip6.h>
-#endif
+#include <netinet6/scope6_var.h>
#include <net/net_osdep.h>
-#define SDL(s) ((struct sockaddr_dl *)s)
+static void defrouter_addreq(struct nd_defrouter *, boolean_t);
+static void defrouter_delreq(struct nd_defrouter *);
+static struct nd_defrouter *defrtrlist_update_common(struct nd_defrouter *,
+ boolean_t);
+static struct nd_defrouter *defrtrlist_update(struct nd_defrouter *);
+
+static struct in6_ifaddr *in6_pfx_newpersistaddr(struct nd_prefix *, int,
+ int *);
+
+static struct nd_pfxrouter *pfxrtr_lookup(struct nd_prefix *,
+ struct nd_defrouter *);
+static void pfxrtr_add(struct nd_prefix *, struct nd_defrouter *);
+static void pfxrtr_del(struct nd_pfxrouter *, struct nd_prefix *);
+static struct nd_pfxrouter *find_pfxlist_reachable_router(struct nd_prefix *);
+static void nd6_rtmsg(int, struct rtentry *);
+
+static int nd6_prefix_onlink_common(struct nd_prefix *, boolean_t,
+ unsigned int);
+static struct nd_prefix *nd6_prefix_equal_lookup(struct nd_prefix *, boolean_t);
+static void nd6_prefix_sync(struct ifnet *);
-static struct nd_defrouter *defrtrlist_update __P((struct nd_defrouter *));
-static int prelist_add __P((struct nd_prefix *, struct nd_defrouter *));
-/* static struct nd_prefix *prefix_lookup __P((struct nd_prefix *)); XXXYYY */
-static struct in6_ifaddr *in6_ifadd __P((struct ifnet *, struct in6_addr *,
- struct in6_addr *, int));
-/*static struct nd_pfxrouter *pfxrtr_lookup __P((struct nd_prefix *,
- struct nd_defrouter *)); XXXYYYY */
-static void pfxrtr_add __P((struct nd_prefix *, struct nd_defrouter *));
-static void pfxrtr_del __P((struct nd_pfxrouter *));
-/*static struct nd_pfxrouter *find_pfxlist_reachable_router __P((struct nd_prefix *)); XXXYYY */
-static void nd6_detach_prefix __P((struct nd_prefix *));
-static void nd6_attach_prefix __P((struct nd_prefix *));
-/* static void defrouter_addifreq __P((struct ifnet *)); XXXYYY */
+static void in6_init_address_ltimes(struct nd_prefix *,
+ struct in6_addrlifetime *);
-static void in6_init_address_ltimes __P((struct nd_prefix *ndpr,
- struct in6_addrlifetime *lt6,
- int update_vltime));
+static int rt6_deleteroute(struct radix_node *, void *);
-static int rt6_deleteroute __P((struct radix_node *, void *));
+static struct nd_defrouter *nddr_alloc(int);
+static void nddr_free(struct nd_defrouter *);
+static void nddr_trace(struct nd_defrouter *, int);
+
+static struct nd_prefix *ndpr_alloc(int);
+static void ndpr_free(struct nd_prefix *);
+static void ndpr_trace(struct nd_prefix *, int);
extern int nd6_recalc_reachtm_interval;
-struct ifnet *nd6_defifp;
-int nd6_defifindex;
+static struct ifnet *nd6_defifp = NULL;
+int nd6_defifindex = 0;
+static unsigned int nd6_defrouter_genid;
+
+int ip6_use_tempaddr = 1; /* use temp addr by default for testing now */
+
+int nd6_accept_6to4 = 1;
+
+int ip6_desync_factor;
+u_int32_t ip6_temp_preferred_lifetime = DEF_TEMP_PREFERRED_LIFETIME;
+u_int32_t ip6_temp_valid_lifetime = DEF_TEMP_VALID_LIFETIME;
+/*
+ * shorter lifetimes for debugging purposes.
+ * u_int32_t ip6_temp_preferred_lifetime = 800;
+ * static u_int32_t ip6_temp_valid_lifetime = 1800;
+ */
+int ip6_temp_regen_advance = TEMPADDR_REGEN_ADVANCE;
+
+extern lck_mtx_t *nd6_mutex;
+
+/* Serialization variables for single thread access to nd_prefix */
+static boolean_t nd_prefix_busy;
+static void *nd_prefix_waitchan = &nd_prefix_busy;
+static int nd_prefix_waiters = 0;
+
+/* Serialization variables for single thread access to nd_defrouter */
+static boolean_t nd_defrouter_busy;
+static void *nd_defrouter_waitchan = &nd_defrouter_busy;
+static int nd_defrouter_waiters = 0;
+
+/* RTPREF_MEDIUM has to be 0! */
+#define RTPREF_HIGH 1
+#define RTPREF_MEDIUM 0
+#define RTPREF_LOW (-1)
+#define RTPREF_RESERVED (-2)
+#define RTPREF_INVALID (-3) /* internal */
+
+#define NDPR_TRACE_HIST_SIZE 32 /* size of trace history */
+
+/* For gdb */
+__private_extern__ unsigned int ndpr_trace_hist_size = NDPR_TRACE_HIST_SIZE;
+
+struct nd_prefix_dbg {
+ struct nd_prefix ndpr_pr; /* nd_prefix */
+ u_int16_t ndpr_refhold_cnt; /* # of ref */
+ u_int16_t ndpr_refrele_cnt; /* # of rele */
+ /*
+ * Circular lists of ndpr_addref and ndpr_remref callers.
+ */
+ ctrace_t ndpr_refhold[NDPR_TRACE_HIST_SIZE];
+ ctrace_t ndpr_refrele[NDPR_TRACE_HIST_SIZE];
+};
+
+static unsigned int ndpr_debug; /* debug flags */
+static unsigned int ndpr_size; /* size of zone element */
+static struct zone *ndpr_zone; /* zone for nd_prefix */
+#define NDPR_ZONE_MAX 64 /* maximum elements in zone */
+#define NDPR_ZONE_NAME "nd6_prefix" /* zone name */
-#if MIP6
-void (*mip6_select_defrtr_hook)(void) = NULL;
-struct nd_prefix * (*mip6_get_home_prefix_hook)(void) = NULL;
-void (*mip6_prelist_update_hook)(struct nd_prefix *pr,
- struct nd_defrouter *dr) = NULL;
-void (*mip6_probe_pfxrtrs_hook)(void) = NULL;
-void (*mip6_store_advint_hook)(struct nd_opt_advint *ai,
- struct nd_defrouter *dr) = NULL;
-int (*mip6_get_md_state_hook)(void) = 0;
-void (*mip6_minus_a_case_hook)(struct nd_prefix *) = NULL;
-#endif /* MIP6 */
+#define NDDR_TRACE_HIST_SIZE 32 /* size of trace history */
+
+/* For gdb */
+__private_extern__ unsigned int nddr_trace_hist_size = NDDR_TRACE_HIST_SIZE;
+
+struct nd_defrouter_dbg {
+ struct nd_defrouter nddr_dr; /* nd_defrouter */
+ uint16_t nddr_refhold_cnt; /* # of ref */
+ uint16_t nddr_refrele_cnt; /* # of rele */
+ /*
+ * Circular lists of ndpr_addref and ndpr_remref callers.
+ */
+ ctrace_t nddr_refhold[NDDR_TRACE_HIST_SIZE];
+ ctrace_t nddr_refrele[NDDR_TRACE_HIST_SIZE];
+};
+
+static unsigned int nddr_debug; /* debug flags */
+static unsigned int nddr_size; /* size of zone element */
+static struct zone *nddr_zone; /* zone for nd_defrouter */
+
+#define NDDR_ZONE_MAX 64 /* maximum elements in zone */
+#define NDDR_ZONE_NAME "nd6_defrouter" /* zone name */
+
+static unsigned int ndprtr_size; /* size of zone element */
+static struct zone *ndprtr_zone; /* zone for nd_pfxrouter */
+
+#define NDPRTR_ZONE_MAX 64 /* maximum elements in zone */
+#define NDPRTR_ZONE_NAME "nd6_pfxrouter" /* zone name */
+
+void
+nd6_rtr_init(void)
+{
+ PE_parse_boot_argn("ifa_debug", &ndpr_debug, sizeof (ndpr_debug));
+ PE_parse_boot_argn("ifa_debug", &nddr_debug, sizeof (nddr_debug));
+
+ ndpr_size = (ndpr_debug == 0) ? sizeof (struct nd_prefix) :
+ sizeof (struct nd_prefix_dbg);
+ ndpr_zone = zinit(ndpr_size, NDPR_ZONE_MAX * ndpr_size, 0,
+ NDPR_ZONE_NAME);
+ if (ndpr_zone == NULL) {
+ panic("%s: failed allocating %s", __func__, NDPR_ZONE_NAME);
+ /* NOTREACHED */
+ }
+ zone_change(ndpr_zone, Z_EXPAND, TRUE);
+ zone_change(ndpr_zone, Z_CALLERACCT, FALSE);
+
+ nddr_size = (nddr_debug == 0) ? sizeof (struct nd_defrouter) :
+ sizeof (struct nd_defrouter_dbg);
+ nddr_zone = zinit(nddr_size, NDDR_ZONE_MAX * nddr_size, 0,
+ NDDR_ZONE_NAME);
+ if (nddr_zone == NULL) {
+ panic("%s: failed allocating %s", __func__, NDDR_ZONE_NAME);
+ /* NOTREACHED */
+ }
+ zone_change(nddr_zone, Z_EXPAND, TRUE);
+ zone_change(nddr_zone, Z_CALLERACCT, FALSE);
+
+ ndprtr_size = sizeof (struct nd_pfxrouter);
+ ndprtr_zone = zinit(ndprtr_size, NDPRTR_ZONE_MAX * ndprtr_size, 0,
+ NDPRTR_ZONE_NAME);
+ if (ndprtr_zone == NULL) {
+ panic("%s: failed allocating %s", __func__, NDPRTR_ZONE_NAME);
+ /* NOTREACHED */
+ }
+ zone_change(ndprtr_zone, Z_EXPAND, TRUE);
+ zone_change(ndprtr_zone, Z_CALLERACCT, FALSE);
+}
/*
* Receive Router Solicitation Message - just for routers.
* Based on RFC 2461
*/
void
-nd6_rs_input(m, off, icmp6len)
- struct mbuf *m;
- int off, icmp6len;
+nd6_rs_input(
+ struct mbuf *m,
+ int off,
+ int icmp6len)
{
struct ifnet *ifp = m->m_pkthdr.rcvif;
struct ip6_hdr *ip6 = mtod(m, struct ip6_hdr *);
struct nd_router_solicit *nd_rs;
struct in6_addr saddr6 = ip6->ip6_src;
-#if 0
- struct in6_addr daddr6 = ip6->ip6_dst;
-#endif
char *lladdr = NULL;
int lladdrlen = 0;
-#if 0
- struct sockaddr_dl *sdl = (struct sockaddr_dl *)NULL;
- struct llinfo_nd6 *ln = (struct llinfo_nd6 *)NULL;
- struct rtentry *rt = NULL;
- int is_newentry;
-#endif
union nd_opts ndopts;
+ /* Expect 32-bit aligned data pointer on strict-align platforms */
+ MBUF_STRICT_DATA_ALIGNMENT_CHECK_32(m);
+
/* If I'm not a router, ignore it. */
- if (ip6_accept_rtadv != 0 || ip6_forwarding != 1)
+ if (!ip6_forwarding || !(ifp->if_eflags & IFEF_IPV6_ROUTER))
goto freeit;
/* Sanity checks */
if (ip6->ip6_hlim != 255) {
- log(LOG_ERR,
- "nd6_rs_input: invalid hlim %d\n", ip6->ip6_hlim);
- goto freeit;
+ nd6log((LOG_ERR,
+ "nd6_rs_input: invalid hlim (%d) from %s to %s on %s\n",
+ ip6->ip6_hlim, ip6_sprintf(&ip6->ip6_src),
+ ip6_sprintf(&ip6->ip6_dst), if_name(ifp)));
+ goto bad;
}
/*
- * Don't update the neighbor cache, if src = ::.
- * This indicates that the src has no IP address assigned yet.
+ * Don't update the neighbor cache, if src = :: or a non-neighbor.
+ * The former case indicates that the src has no IP address assigned
+ * yet. See nd6_ns_input() for the latter case.
*/
- if (IN6_IS_ADDR_UNSPECIFIED(&saddr6))
+ if (IN6_IS_ADDR_UNSPECIFIED(&ip6->ip6_src)) {
goto freeit;
-
-#ifndef PULLDOWN_TEST
- IP6_EXTHDR_CHECK(m, off, icmp6len,);
- nd_rs = (struct nd_router_solicit *)((caddr_t)ip6 + off);
-#else
- IP6_EXTHDR_GET(nd_rs, struct nd_router_solicit *, m, off, icmp6len);
- if (nd_rs == NULL) {
- icmp6stat.icp6s_tooshort++;
- return;
+ } else {
+ struct sockaddr_in6 src_sa6;
+
+ bzero(&src_sa6, sizeof (src_sa6));
+ src_sa6.sin6_family = AF_INET6;
+ src_sa6.sin6_len = sizeof (src_sa6);
+ src_sa6.sin6_addr = ip6->ip6_src;
+ if (!nd6_is_addr_neighbor(&src_sa6, ifp, 0)) {
+ nd6log((LOG_INFO, "nd6_rs_input: "
+ "RS packet from non-neighbor\n"));
+ goto freeit;
+ }
}
-#endif
- icmp6len -= sizeof(*nd_rs);
+ IP6_EXTHDR_CHECK(m, off, icmp6len, return);
+ nd_rs = (struct nd_router_solicit *)((caddr_t)ip6 + off);
+ icmp6len -= sizeof (*nd_rs);
nd6_option_init(nd_rs + 1, icmp6len, &ndopts);
if (nd6_options(&ndopts) < 0) {
- log(LOG_INFO, "nd6_rs_input: invalid ND option, ignored\n");
+ nd6log((LOG_INFO,
+ "nd6_rs_input: invalid ND option, ignored\n"));
+ /* nd6_options have incremented stats */
goto freeit;
}
}
if (lladdr && ((ifp->if_addrlen + 2 + 7) & ~7) != lladdrlen) {
- log(LOG_INFO,
+ nd6log((LOG_INFO,
"nd6_rs_input: lladdrlen mismatch for %s "
"(if %d, RS packet %d)\n",
- ip6_sprintf(&saddr6), ifp->if_addrlen, lladdrlen - 2);
+ ip6_sprintf(&saddr6), ifp->if_addrlen, lladdrlen - 2));
+ goto bad;
}
nd6_cache_lladdr(ifp, &saddr6, lladdr, lladdrlen, ND_ROUTER_SOLICIT, 0);
- freeit:
+freeit:
+ m_freem(m);
+ return;
+
+bad:
+ icmp6stat.icp6s_badrs++;
m_freem(m);
}
* TODO: ND_RA_FLAG_{OTHER,MANAGED} processing
*/
void
-nd6_ra_input(m, off, icmp6len)
- struct mbuf *m;
- int off, icmp6len;
+nd6_ra_input(
+ struct mbuf *m,
+ int off,
+ int icmp6len)
{
struct ifnet *ifp = m->m_pkthdr.rcvif;
- struct nd_ifinfo *ndi = &nd_ifinfo[ifp->if_index];
+ struct nd_ifinfo *ndi = NULL;
struct ip6_hdr *ip6 = mtod(m, struct ip6_hdr *);
struct nd_router_advert *nd_ra;
struct in6_addr saddr6 = ip6->ip6_src;
-#if 0
- struct in6_addr daddr6 = ip6->ip6_dst;
- int flags; /* = nd_ra->nd_ra_flags_reserved; */
- int is_managed = ((flags & ND_RA_FLAG_MANAGED) != 0);
- int is_other = ((flags & ND_RA_FLAG_OTHER) != 0);
-#endif
+ int mcast = 0;
union nd_opts ndopts;
- struct nd_defrouter *dr;
+ struct nd_defrouter *dr = NULL;
+ u_int32_t mtu = 0;
+ char *lladdr = NULL;
+ u_int32_t lladdrlen = 0;
+ struct nd_prefix_list *nd_prefix_list_head = NULL;
+ u_int32_t nd_prefix_list_length = 0;
+ struct in6_ifaddr *ia6 = NULL;
+ struct nd_prefix_list *prfl;
+ struct nd_defrouter dr0;
+ u_int32_t advreachable;
- if (ip6_accept_rtadv == 0)
+
+ /* Expect 32-bit aligned data pointer on strict-align platforms */
+ MBUF_STRICT_DATA_ALIGNMENT_CHECK_32(m);
+
+ /*
+ * Discard RA unless IFEF_ACCEPT_RTADV is set (as host), or when
+ * IFEF_IPV6_ROUTER is set (as router) but the RA is not locally
+ * generated. For convenience, we allow locally generated (rtadvd)
+ * RAs to be processed on the advertising interface, as a router.
+ *
+ * Note that we don't test against ip6_forwarding as we could be
+ * both a host and a router on different interfaces, hence the
+ * check against the per-interface flags.
+ */
+ if (!(ifp->if_eflags & (IFEF_ACCEPT_RTADV | IFEF_IPV6_ROUTER)) ||
+ ((ifp->if_eflags & IFEF_IPV6_ROUTER) &&
+ (ia6 = ifa_foraddr6(&saddr6)) == NULL))
goto freeit;
+ if (ia6 != NULL) {
+ IFA_REMREF(&ia6->ia_ifa);
+ ia6 = NULL;
+ }
+
if (ip6->ip6_hlim != 255) {
- log(LOG_ERR,
- "nd6_ra_input: invalid hlim %d\n", ip6->ip6_hlim);
- goto freeit;
+ nd6log((LOG_ERR,
+ "nd6_ra_input: invalid hlim (%d) from %s to %s on %s\n",
+ ip6->ip6_hlim, ip6_sprintf(&ip6->ip6_src),
+ ip6_sprintf(&ip6->ip6_dst), if_name(ifp)));
+ goto bad;
}
if (!IN6_IS_ADDR_LINKLOCAL(&saddr6)) {
- log(LOG_ERR,
+ nd6log((LOG_ERR,
"nd6_ra_input: src %s is not link-local\n",
- ip6_sprintf(&saddr6));
- goto freeit;
+ ip6_sprintf(&saddr6)));
+ goto bad;
}
-#ifndef PULLDOWN_TEST
- IP6_EXTHDR_CHECK(m, off, icmp6len,);
+ IP6_EXTHDR_CHECK(m, off, icmp6len, return);
nd_ra = (struct nd_router_advert *)((caddr_t)ip6 + off);
-#else
- IP6_EXTHDR_GET(nd_ra, struct nd_router_advert *, m, off, icmp6len);
- if (nd_ra == NULL) {
- icmp6stat.icp6s_tooshort++;
- return;
- }
-#endif
- icmp6len -= sizeof(*nd_ra);
+ icmp6len -= sizeof (*nd_ra);
nd6_option_init(nd_ra + 1, icmp6len, &ndopts);
if (nd6_options(&ndopts) < 0) {
- log(LOG_INFO, "nd6_ra_input: invalid ND option, ignored\n");
+ nd6log((LOG_INFO,
+ "nd6_ra_input: invalid ND option, ignored\n"));
+ /* nd6_options have incremented stats */
goto freeit;
}
- {
- struct nd_defrouter dr0;
- u_int32_t advreachable = nd_ra->nd_ra_reachable;
-#if !(defined(__FreeBSD__) && __FreeBSD__ >= 3) && !defined (__APPLE__)
- long time_second = time.tv_sec;
-#endif
+ advreachable = nd_ra->nd_ra_reachable;
+ /* remember if this is a multicasted advertisement */
+ if (IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst))
+ mcast = 1;
+
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+ bzero(&dr0, sizeof (dr0));
dr0.rtaddr = saddr6;
dr0.flags = nd_ra->nd_ra_flags_reserved;
dr0.rtlifetime = ntohs(nd_ra->nd_ra_router_lifetime);
- dr0.expire = time_second + dr0.rtlifetime;
+ dr0.expire = net_uptime() + dr0.rtlifetime;
dr0.ifp = ifp;
- dr0.advint = 0; /* Mobile IPv6 */
- dr0.advint_expire = 0; /* Mobile IPv6 */
- dr0.advints_lost = 0; /* Mobile IPv6 */
/* unspecified or not? (RFC 2461 6.3.4) */
if (advreachable) {
- NTOHL(advreachable);
+ advreachable = ntohl(advreachable);
if (advreachable <= MAX_REACHABLE_TIME &&
ndi->basereachable != advreachable) {
ndi->basereachable = advreachable;
}
if (nd_ra->nd_ra_retransmit)
ndi->retrans = ntohl(nd_ra->nd_ra_retransmit);
- if (nd_ra->nd_ra_curhoplimit)
- ndi->chlim = nd_ra->nd_ra_curhoplimit;
+ if (nd_ra->nd_ra_curhoplimit) {
+ if (ndi->chlim < nd_ra->nd_ra_curhoplimit) {
+ ndi->chlim = nd_ra->nd_ra_curhoplimit;
+ } else if (ndi->chlim != nd_ra->nd_ra_curhoplimit) {
+ nd6log((LOG_ERR,
+ "RA with a lower CurHopLimit sent from "
+ "%s on %s (current = %d, received = %d). "
+ "Ignored.\n", ip6_sprintf(&ip6->ip6_src),
+ if_name(ifp), ndi->chlim,
+ nd_ra->nd_ra_curhoplimit));
+ }
+ }
+ lck_mtx_unlock(&ndi->lock);
+ lck_mtx_lock(nd6_mutex);
dr = defrtrlist_update(&dr0);
- }
+ lck_mtx_unlock(nd6_mutex);
/*
* prefix
*/
if (ndopts.nd_opts_pi) {
struct nd_opt_hdr *pt;
- struct nd_opt_prefix_info *pi;
+ struct nd_opt_prefix_info *pi = NULL;
struct nd_prefix pr;
for (pt = (struct nd_opt_hdr *)ndopts.nd_opts_pi;
- pt <= (struct nd_opt_hdr *)ndopts.nd_opts_pi_end;
- pt = (struct nd_opt_hdr *)((caddr_t)pt +
- (pt->nd_opt_len << 3))) {
+ pt <= (struct nd_opt_hdr *)ndopts.nd_opts_pi_end;
+ pt = (struct nd_opt_hdr *)((caddr_t)pt +
+ (pt->nd_opt_len << 3))) {
+ struct in6_addr pi_mask;
+ bzero(&pi_mask, sizeof(pi_mask));
+
if (pt->nd_opt_type != ND_OPT_PREFIX_INFORMATION)
continue;
pi = (struct nd_opt_prefix_info *)pt;
if (pi->nd_opt_pi_len != 4) {
- log(LOG_INFO, "nd6_ra_input: invalid option "
- "len %d for prefix information option, "
- "ignored\n", pi->nd_opt_pi_len);
+ nd6log((LOG_INFO,
+ "nd6_ra_input: invalid option "
+ "len %d for prefix information option, "
+ "ignored\n", pi->nd_opt_pi_len));
continue;
}
if (128 < pi->nd_opt_pi_prefix_len) {
- log(LOG_INFO, "nd6_ra_input: invalid prefix "
- "len %d for prefix information option, "
- "ignored\n", pi->nd_opt_pi_prefix_len);
- continue;
- }
-
- if (IN6_IS_ADDR_MULTICAST(&pi->nd_opt_pi_prefix)
- || IN6_IS_ADDR_LINKLOCAL(&pi->nd_opt_pi_prefix)) {
- log(LOG_INFO, "nd6_ra_input: invalid prefix "
- "%s, ignored\n",
- ip6_sprintf(&pi->nd_opt_pi_prefix));
+ nd6log((LOG_INFO,
+ "nd6_ra_input: invalid prefix "
+ "len %d for prefix information option, "
+ "ignored\n", pi->nd_opt_pi_prefix_len));
continue;
}
- /* aggregatable unicast address, rfc2374 */
- if ((pi->nd_opt_pi_prefix.s6_addr8[0] & 0xe0) == 0x20
- && pi->nd_opt_pi_prefix_len != 64) {
- log(LOG_INFO, "nd6_ra_input: invalid prefixlen "
- "%d for rfc2374 prefix %s, ignored\n",
- pi->nd_opt_pi_prefix_len,
- ip6_sprintf(&pi->nd_opt_pi_prefix));
+ /*
+ * To ignore ::/64 make sure bits beyond prefixlen
+ * are set to zero
+ */
+ in6_prefixlen2mask(&pi_mask, pi->nd_opt_pi_prefix_len);
+ pi->nd_opt_pi_prefix.s6_addr32[0] &= pi_mask.s6_addr32[0];
+ pi->nd_opt_pi_prefix.s6_addr32[1] &= pi_mask.s6_addr32[1];
+ pi->nd_opt_pi_prefix.s6_addr32[2] &= pi_mask.s6_addr32[2];
+ pi->nd_opt_pi_prefix.s6_addr32[3] &= pi_mask.s6_addr32[3];
+
+ if (IN6_IS_ADDR_UNSPECIFIED(&pi->nd_opt_pi_prefix) ||
+ IN6_IS_ADDR_MULTICAST(&pi->nd_opt_pi_prefix) ||
+ IN6_IS_ADDR_LINKLOCAL(&pi->nd_opt_pi_prefix)) {
+ nd6log((LOG_INFO,
+ "%s: invalid prefix %s, ignored\n",
+ __func__,
+ ip6_sprintf(&pi->nd_opt_pi_prefix)));
continue;
}
- bzero(&pr, sizeof(pr));
+ bzero(&pr, sizeof (pr));
+ lck_mtx_init(&pr.ndpr_lock, ifa_mtx_grp, ifa_mtx_attr);
+ NDPR_LOCK(&pr);
pr.ndpr_prefix.sin6_family = AF_INET6;
- pr.ndpr_prefix.sin6_len = sizeof(pr.ndpr_prefix);
+ pr.ndpr_prefix.sin6_len = sizeof (pr.ndpr_prefix);
pr.ndpr_prefix.sin6_addr = pi->nd_opt_pi_prefix;
- pr.ndpr_ifp = (struct ifnet *)m->m_pkthdr.rcvif;
+ pr.ndpr_ifp = m->m_pkthdr.rcvif;
pr.ndpr_raf_onlink = (pi->nd_opt_pi_flags_reserved &
- ND_OPT_PI_FLAG_ONLINK) ? 1 : 0;
+ ND_OPT_PI_FLAG_ONLINK) ? 1 : 0;
pr.ndpr_raf_auto = (pi->nd_opt_pi_flags_reserved &
- ND_OPT_PI_FLAG_AUTO) ? 1 : 0;
+ ND_OPT_PI_FLAG_AUTO) ? 1 : 0;
pr.ndpr_plen = pi->nd_opt_pi_prefix_len;
pr.ndpr_vltime = ntohl(pi->nd_opt_pi_valid_time);
pr.ndpr_pltime =
ntohl(pi->nd_opt_pi_preferred_time);
- if (in6_init_prefix_ltimes(&pr))
+ /*
+ * Exceptions to stateless autoconfiguration processing:
+ * + nd6_accept_6to4 == 0 && address has 6to4 prefix
+ * + ip6_only_allow_rfc4193_prefix != 0 &&
+ * address not RFC 4193
+ */
+ if (ip6_only_allow_rfc4193_prefix &&
+ !IN6_IS_ADDR_UNIQUE_LOCAL(&pi->nd_opt_pi_prefix)) {
+ nd6log((LOG_INFO,
+ "nd6_ra_input: no SLAAC on prefix %s "
+ "[not RFC 4193]\n",
+ ip6_sprintf(&pi->nd_opt_pi_prefix)));
+ pr.ndpr_raf_auto = 0;
+ } else if (!nd6_accept_6to4 &&
+ IN6_IS_ADDR_6TO4(&pi->nd_opt_pi_prefix)) {
+ nd6log((LOG_INFO,
+ "%s: no SLAAC on prefix %s "
+ "[6to4]\n", __func__,
+ ip6_sprintf(&pi->nd_opt_pi_prefix)));
+ pr.ndpr_raf_auto = 0;
+ }
+
+ if (in6_init_prefix_ltimes(&pr)) {
+ NDPR_UNLOCK(&pr);
+ lck_mtx_destroy(&pr.ndpr_lock, ifa_mtx_grp);
continue; /* prefix lifetime init failed */
+ } else {
+ NDPR_UNLOCK(&pr);
+ }
+ (void) prelist_update(&pr, dr, m, mcast);
+ lck_mtx_destroy(&pr.ndpr_lock, ifa_mtx_grp);
+
+ /*
+ * We have to copy the values out after the
+ * prelist_update call since some of these values won't
+ * be properly set until after the router advertisement
+ * updating can vet the values.
+ */
+ prfl = NULL;
+ MALLOC(prfl, struct nd_prefix_list *, sizeof (*prfl),
+ M_TEMP, M_WAITOK | M_ZERO);
- (void)prelist_update(&pr, dr, m);
+ if (prfl == NULL) {
+ log(LOG_DEBUG, "%s: unable to MALLOC RA prefix "
+ "structure\n", __func__);
+ continue;
+ }
+
+ /* this is only for nd6_post_msg(), otherwise unused */
+ bcopy(&pr.ndpr_prefix, &prfl->pr.ndpr_prefix,
+ sizeof (prfl->pr.ndpr_prefix));
+ prfl->pr.ndpr_raf = pr.ndpr_raf;
+ prfl->pr.ndpr_plen = pr.ndpr_plen;
+ prfl->pr.ndpr_vltime = pr.ndpr_vltime;
+ prfl->pr.ndpr_pltime = pr.ndpr_pltime;
+ prfl->pr.ndpr_expire = pr.ndpr_expire;
+ prfl->pr.ndpr_base_calendartime =
+ pr.ndpr_base_calendartime;
+ prfl->pr.ndpr_base_uptime = pr.ndpr_base_uptime;
+ prfl->pr.ndpr_stateflags = pr.ndpr_stateflags;
+ prfl->pr.ndpr_addrcnt = pr.ndpr_addrcnt;
+ prfl->pr.ndpr_ifp = pr.ndpr_ifp;
+
+ prfl->next = nd_prefix_list_head;
+ nd_prefix_list_head = prfl;
+ nd_prefix_list_length++;
}
}
* MTU
*/
if (ndopts.nd_opts_mtu && ndopts.nd_opts_mtu->nd_opt_mtu_len == 1) {
- u_int32_t mtu = ntohl(ndopts.nd_opts_mtu->nd_opt_mtu_mtu);
+ mtu = ntohl(ndopts.nd_opts_mtu->nd_opt_mtu_mtu);
/* lower bound */
if (mtu < IPV6_MMTU) {
- log(LOG_INFO, "nd6_ra_input: bogus mtu option "
+ nd6log((LOG_INFO, "nd6_ra_input: bogus mtu option "
"mtu=%d sent from %s, ignoring\n",
- mtu, ip6_sprintf(&ip6->ip6_src));
+ mtu, ip6_sprintf(&ip6->ip6_src)));
goto skip;
}
+ lck_mtx_lock(&ndi->lock);
/* upper bound */
if (ndi->maxmtu) {
if (mtu <= ndi->maxmtu) {
int change = (ndi->linkmtu != mtu);
ndi->linkmtu = mtu;
+ lck_mtx_unlock(&ndi->lock);
if (change) /* in6_maxmtu may change */
in6_setmaxmtu();
} else {
- log(LOG_INFO, "nd6_ra_input: bogus mtu "
+ nd6log((LOG_INFO, "nd6_ra_input: bogus mtu "
"mtu=%d sent from %s; "
"exceeds maxmtu %d, ignoring\n",
mtu, ip6_sprintf(&ip6->ip6_src),
- ndi->maxmtu);
+ ndi->maxmtu));
+ lck_mtx_unlock(&ndi->lock);
}
} else {
- log(LOG_INFO, "nd6_ra_input: mtu option "
+ lck_mtx_unlock(&ndi->lock);
+ nd6log((LOG_INFO, "nd6_ra_input: mtu option "
"mtu=%d sent from %s; maxmtu unknown, "
"ignoring\n",
- mtu, ip6_sprintf(&ip6->ip6_src));
+ mtu, ip6_sprintf(&ip6->ip6_src)));
}
}
- skip:
-
+skip:
+
/*
- * Src linkaddress
+ * Source link layer address
*/
- {
- char *lladdr = NULL;
- int lladdrlen = 0;
-
if (ndopts.nd_opts_src_lladdr) {
lladdr = (char *)(ndopts.nd_opts_src_lladdr + 1);
lladdrlen = ndopts.nd_opts_src_lladdr->nd_opt_len << 3;
}
if (lladdr && ((ifp->if_addrlen + 2 + 7) & ~7) != lladdrlen) {
- log(LOG_INFO,
+ nd6log((LOG_INFO,
"nd6_ra_input: lladdrlen mismatch for %s "
"(if %d, RA packet %d)\n",
- ip6_sprintf(&saddr6), ifp->if_addrlen, lladdrlen - 2);
+ ip6_sprintf(&saddr6), ifp->if_addrlen, lladdrlen - 2));
+ goto bad;
}
- nd6_cache_lladdr(ifp, &saddr6, lladdr, lladdrlen, ND_ROUTER_ADVERT, 0);
+ if (dr && dr->stateflags & NDDRF_MAPPED)
+ saddr6 = dr->rtaddr_mapped;
+
+ nd6_cache_lladdr(ifp, &saddr6, lladdr, (int)lladdrlen,
+ ND_ROUTER_ADVERT, 0);
+
+ /* Post message */
+ nd6_post_msg(KEV_ND6_RA, nd_prefix_list_head, nd_prefix_list_length,
+ mtu, lladdr, lladdrlen);
/*
* Installing a link-layer address might change the state of the
* router's neighbor cache, which might also affect our on-link
* detection of adveritsed prefixes.
*/
+ lck_mtx_lock(nd6_mutex);
pfxlist_onlink_check();
- }
-
-#if MIP6
- if (mip6_store_advint_hook) {
- if (ndopts.nd_opts_adv)
- (*mip6_store_advint_hook)(ndopts.nd_opts_adv, dr);
- }
-#endif
+ lck_mtx_unlock(nd6_mutex);
freeit:
m_freem(m);
+ if (dr)
+ NDDR_REMREF(dr);
+
+ prfl = NULL;
+ while ((prfl = nd_prefix_list_head) != NULL) {
+ nd_prefix_list_head = prfl->next;
+ FREE(prfl, M_TEMP);
+ }
+
+ return;
+
+bad:
+ icmp6stat.icp6s_badra++;
+ goto freeit;
}
/*
* default router list proccessing sub routines
*/
-void
-defrouter_addreq(new)
- struct nd_defrouter *new;
+
+/* tell the change to user processes watching the routing socket. */
+static void
+nd6_rtmsg(int cmd, struct rtentry *rt)
{
- struct sockaddr_in6 def, mask, gate;
- int s;
+ struct rt_addrinfo info;
+ struct ifnet *ifp = rt->rt_ifp;
- Bzero(&def, sizeof(def));
- Bzero(&mask, sizeof(mask));
- Bzero(&gate, sizeof(gate));
+ RT_LOCK_ASSERT_HELD(rt);
- def.sin6_len = mask.sin6_len = gate.sin6_len
- = sizeof(struct sockaddr_in6);
- def.sin6_family = mask.sin6_family = gate.sin6_family = AF_INET6;
- gate.sin6_addr = new->rtaddr;
+ bzero((caddr_t)&info, sizeof (info));
+ /* It's not necessary to lock ifp for if_lladdr */
+ info.rti_info[RTAX_DST] = rt_key(rt);
+ info.rti_info[RTAX_GATEWAY] = rt->rt_gateway;
+ info.rti_info[RTAX_NETMASK] = rt_mask(rt);
+ /*
+ * ifa_addr pointers for both should always be valid
+ * in this context; no need to hold locks.
+ */
+ info.rti_info[RTAX_IFP] = ifp->if_lladdr->ifa_addr;
+ info.rti_info[RTAX_IFA] = rt->rt_ifa->ifa_addr;
-#ifdef __NetBSD__
- s = splsoftnet();
-#else
- s = splnet();
-#endif
- (void)rtrequest(RTM_ADD, (struct sockaddr *)&def,
- (struct sockaddr *)&gate, (struct sockaddr *)&mask,
- RTF_GATEWAY, NULL);
- splx(s);
- return;
+ rt_missmsg(cmd, &info, rt->rt_flags, 0);
}
-/* Add a route to a given interface as default */
-void
-defrouter_addifreq(ifp)
- struct ifnet *ifp;
+static void
+defrouter_addreq(struct nd_defrouter *new, boolean_t scoped)
{
- struct sockaddr_in6 def, mask;
- struct ifaddr *ifa;
- int error, flags;
+ struct sockaddr_in6 def, mask, gate;
+ struct rtentry *newrt = NULL;
+ unsigned int ifscope;
+ int err;
+ struct nd_ifinfo *ndi = ND_IFINFO(new->ifp);
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_NOTOWNED);
+ NDDR_LOCK_ASSERT_NOTHELD(new);
+ /*
+ * We're free to lock and unlock NDDR because our callers
+ * are holding an extra reference for us.
+ */
+
+ NDDR_LOCK(new);
+ if (new->stateflags & NDDRF_INSTALLED)
+ goto out;
+
+ if (new->ifp->if_eflags & IFEF_IPV6_ROUTER) {
+ nd6log2((LOG_INFO, "%s: ignoring router %s, scoped=%d, "
+ "static=%d on advertising interface\n", if_name(new->ifp),
+ ip6_sprintf(&new->rtaddr), scoped,
+ (new->stateflags & NDDRF_STATIC) ? 1 : 0));
+ goto out;
+ }
+
+ nd6log2((LOG_INFO, "%s: adding default router %s, scoped=%d, "
+ "static=%d\n", if_name(new->ifp), ip6_sprintf(&new->rtaddr),
+ scoped, (new->stateflags & NDDRF_STATIC) ? 1 : 0));
+
+ Bzero(&def, sizeof (def));
+ Bzero(&mask, sizeof (mask));
+ Bzero(&gate, sizeof (gate));
+
+ def.sin6_len = mask.sin6_len = gate.sin6_len
+ = sizeof (struct sockaddr_in6);
+ def.sin6_family = mask.sin6_family = gate.sin6_family = AF_INET6;
- bzero(&def, sizeof(def));
- bzero(&mask, sizeof(mask));
+ if (new->stateflags & NDDRF_MAPPED)
+ gate.sin6_addr = new->rtaddr_mapped;
+ else
+ gate.sin6_addr = new->rtaddr;
- def.sin6_len = mask.sin6_len = sizeof(struct sockaddr_in6);
- def.sin6_family = mask.sin6_family = AF_INET6;
+ ifscope = scoped ? new->ifp->if_index : IFSCOPE_NONE;
+ NDDR_UNLOCK(new);
/*
- * Search for an ifaddr beloging to the specified interface.
- * XXX: An IPv6 address are required to be assigned on the interface.
+ * Cellular networks may have buggy deployments
+ * with gateway IPv6 link local address with same
+ * interface identifier as the one that has been
+ * assigned for the cellular context.
+ * If gateway is same as locally configured link local
+ * interface on cellular interface, generated a different one
+ * and store it in the nd_defrouter entry and use it to work
+ * on routing table
*/
- if ((ifa = ifaof_ifpforaddr((struct sockaddr *)&def, ifp)) == NULL) {
- log(LOG_ERR, /* better error? */
- "defrouter_addifreq: failed to find an ifaddr "
- "to install a route to interface %s\n",
- if_name(ifp));
- return;
+ if (new->ifp->if_type == IFT_CELLULAR &&
+ !(new->stateflags & NDDRF_STATIC) &&
+ !(new->stateflags & NDDRF_MAPPED) &&
+ IN6_IS_ADDR_LINKLOCAL(&gate.sin6_addr) &&
+ ndi && !(ndi->flags & ND6_IFF_PERFORMNUD)) {
+ struct in6_ifaddr *tmp_ia6 = in6ifa_ifpforlinklocal(new->ifp, 0);
+
+ if (tmp_ia6 != NULL &&
+ !(tmp_ia6->ia6_flags & IN6_IFF_NOTMANUAL) &&
+ IN6_ARE_ADDR_EQUAL(&tmp_ia6->ia_addr.sin6_addr,
+ &gate.sin6_addr)) {
+ gate.sin6_addr.s6_addr8[15] += 1;
+ new->rtaddr_mapped = gate.sin6_addr;
+ new->stateflags |= NDDRF_MAPPED;
+
+ nd6log((LOG_INFO, "%s: Default router %s mapped "
+ "to ", if_name(new->ifp), ip6_sprintf(&new->rtaddr)));
+ nd6log((LOG_INFO, "%s\n", ip6_sprintf(&new->rtaddr_mapped)));
+ }
}
- flags = ifa->ifa_flags;
- if ((ifp->if_flags & IFF_POINTOPOINT) != 0)
- flags &= ~RTF_CLONING;
- if ((error = rtrequest(RTM_ADD, (struct sockaddr *)&def,
- ifa->ifa_addr, (struct sockaddr *)&mask,
- flags, NULL)) != 0) {
- log(LOG_ERR,
- "defrouter_addifreq: failed to install a route to "
- "interface %s (errno = %d)\n",
- if_name(ifp), error);
+ err = rtrequest_scoped(RTM_ADD, (struct sockaddr *)&def,
+ (struct sockaddr *)&gate, (struct sockaddr *)&mask,
+ RTF_GATEWAY, &newrt, ifscope);
+
+ if (newrt) {
+ RT_LOCK(newrt);
+ nd6_rtmsg(RTM_ADD, newrt); /* tell user process */
+ RT_REMREF_LOCKED(newrt);
+ RT_UNLOCK(newrt);
+ NDDR_LOCK(new);
+ new->stateflags |= NDDRF_INSTALLED;
+ if (ifscope != IFSCOPE_NONE)
+ new->stateflags |= NDDRF_IFSCOPE;
+ } else {
+ nd6log((LOG_ERR, "%s: failed to add default router "
+ "%s on %s scoped %d (errno = %d)\n", __func__,
+ ip6_sprintf(&gate.sin6_addr), if_name(new->ifp),
+ (ifscope != IFSCOPE_NONE), err));
+ NDDR_LOCK(new);
}
+ new->err = err;
+
+out:
+ NDDR_UNLOCK(new);
}
struct nd_defrouter *
-defrouter_lookup(addr, ifp)
- struct in6_addr *addr;
- struct ifnet *ifp;
+defrouter_lookup(
+ struct in6_addr *addr,
+ struct ifnet *ifp)
{
struct nd_defrouter *dr;
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
for (dr = TAILQ_FIRST(&nd_defrouter); dr;
- dr = TAILQ_NEXT(dr, dr_entry)) {
- if (dr->ifp == ifp && IN6_ARE_ADDR_EQUAL(addr, &dr->rtaddr))
- return(dr);
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ NDDR_LOCK(dr);
+ if (dr->ifp == ifp && IN6_ARE_ADDR_EQUAL(addr, &dr->rtaddr)) {
+ NDDR_ADDREF_LOCKED(dr);
+ NDDR_UNLOCK(dr);
+ return (dr);
+ }
+ NDDR_UNLOCK(dr);
}
- return(NULL); /* search failed */
+ return (NULL); /* search failed */
}
-void
-defrouter_delreq(dr, dofree)
- struct nd_defrouter *dr;
- int dofree;
+/*
+ * Remove the default route for a given router.
+ * This is just a subroutine function for defrouter_select(), and should
+ * not be called from anywhere else.
+ */
+static void
+defrouter_delreq(struct nd_defrouter *dr)
{
struct sockaddr_in6 def, mask, gate;
+ struct rtentry *oldrt = NULL;
+ unsigned int ifscope;
+ int err;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_NOTOWNED);
+ NDDR_LOCK_ASSERT_NOTHELD(dr);
+ /*
+ * We're free to lock and unlock NDDR because our callers
+ * are holding an extra reference for us.
+ */
+ NDDR_LOCK(dr);
+ /* ifp would be NULL for the "drany" case */
+ if (dr->ifp != NULL && !(dr->stateflags & NDDRF_INSTALLED))
+ goto out;
- Bzero(&def, sizeof(def));
- Bzero(&mask, sizeof(mask));
- Bzero(&gate, sizeof(gate));
+ nd6log2((LOG_INFO, "%s: removing default router %s, scoped=%d, "
+ "static=%d\n", dr->ifp != NULL ? if_name(dr->ifp) : "ANY",
+ ip6_sprintf(&dr->rtaddr), (dr->stateflags & NDDRF_IFSCOPE) ? 1 : 0,
+ (dr->stateflags & NDDRF_STATIC) ? 1 : 0));
+
+ Bzero(&def, sizeof (def));
+ Bzero(&mask, sizeof (mask));
+ Bzero(&gate, sizeof (gate));
def.sin6_len = mask.sin6_len = gate.sin6_len
- = sizeof(struct sockaddr_in6);
+ = sizeof (struct sockaddr_in6);
def.sin6_family = mask.sin6_family = gate.sin6_family = AF_INET6;
- gate.sin6_addr = dr->rtaddr;
- rtrequest(RTM_DELETE, (struct sockaddr *)&def,
- (struct sockaddr *)&gate,
- (struct sockaddr *)&mask,
- RTF_GATEWAY, (struct rtentry **)0);
+ /*
+ * The router entry may be mapped to a different address.
+ * If that is the case, use the mapped address as gateway
+ * to do operation on the routing table.
+ * To get more context, read the related comment in
+ * defrouter_addreq
+ */
+ if (dr->stateflags & NDDRF_MAPPED)
+ gate.sin6_addr = dr->rtaddr_mapped;
+ else
+ gate.sin6_addr = dr->rtaddr;
- if (dofree) /* XXX: necessary? */
- _FREE(dr, M_IP6NDP);
+ if (dr->ifp != NULL) {
+ ifscope = (dr->stateflags & NDDRF_IFSCOPE) ?
+ dr->ifp->if_index : IFSCOPE_NONE;
+ } else {
+ ifscope = IFSCOPE_NONE;
+ }
+ NDDR_UNLOCK(dr);
+
+ err = rtrequest_scoped(RTM_DELETE,
+ (struct sockaddr *)&def, (struct sockaddr *)&gate,
+ (struct sockaddr *)&mask, RTF_GATEWAY, &oldrt, ifscope);
+
+ if (oldrt) {
+ RT_LOCK(oldrt);
+ nd6_rtmsg(RTM_DELETE, oldrt);
+ RT_UNLOCK(oldrt);
+ rtfree(oldrt);
+ } else if (err != ESRCH) {
+ nd6log((LOG_ERR, "%s: failed to delete default router "
+ "%s on %s scoped %d (errno = %d)\n", __func__,
+ ip6_sprintf(&gate.sin6_addr), dr->ifp != NULL ?
+ if_name(dr->ifp) : "ANY", (ifscope != IFSCOPE_NONE), err));
+ }
+ NDDR_LOCK(dr);
+ /* ESRCH means it's no longer in the routing table; ignore it */
+ if (oldrt != NULL || err == ESRCH) {
+ dr->stateflags &= ~NDDRF_INSTALLED;
+ if (ifscope != IFSCOPE_NONE)
+ dr->stateflags &= ~NDDRF_IFSCOPE;
+ }
+ dr->err = 0;
+out:
+ NDDR_UNLOCK(dr);
}
+
+/*
+ * remove all default routes from default router list
+ */
void
-defrtrlist_del(dr)
- struct nd_defrouter *dr;
+defrouter_reset(void)
+{
+ struct nd_defrouter *dr, drany;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ dr = TAILQ_FIRST(&nd_defrouter);
+ while (dr) {
+ NDDR_LOCK(dr);
+ if (dr->stateflags & NDDRF_INSTALLED) {
+ NDDR_ADDREF_LOCKED(dr);
+ NDDR_UNLOCK(dr);
+ lck_mtx_unlock(nd6_mutex);
+ defrouter_delreq(dr);
+ lck_mtx_lock(nd6_mutex);
+ NDDR_REMREF(dr);
+ dr = TAILQ_FIRST(&nd_defrouter);
+ } else {
+ NDDR_UNLOCK(dr);
+ dr = TAILQ_NEXT(dr, dr_entry);
+ }
+ }
+
+ /* Nuke primary (non-scoped) default router */
+ bzero(&drany, sizeof (drany));
+ lck_mtx_init(&drany.nddr_lock, ifa_mtx_grp, ifa_mtx_attr);
+ lck_mtx_unlock(nd6_mutex);
+ defrouter_delreq(&drany);
+ lck_mtx_destroy(&drany.nddr_lock, ifa_mtx_grp);
+ lck_mtx_lock(nd6_mutex);
+}
+
+int
+defrtrlist_ioctl(u_long cmd, caddr_t data)
+{
+ struct nd_defrouter dr0;
+ unsigned int ifindex;
+ struct ifnet *dr_ifp;
+ int error = 0, add = 0;
+
+ /* XXX Handle mapped default router entries */
+ switch (cmd) {
+ case SIOCDRADD_IN6_32: /* struct in6_defrouter_32 */
+ case SIOCDRADD_IN6_64: /* struct in6_defrouter_64 */
+ ++add;
+ /* FALLTHRU */
+ case SIOCDRDEL_IN6_32: /* struct in6_defrouter_32 */
+ case SIOCDRDEL_IN6_64: /* struct in6_defrouter_64 */
+ bzero(&dr0, sizeof (dr0));
+ if (cmd == SIOCDRADD_IN6_64 || cmd == SIOCDRDEL_IN6_64) {
+ struct in6_defrouter_64 *r_64 =
+ (struct in6_defrouter_64 *)(void *)data;
+ u_int16_t i;
+
+ bcopy(&r_64->rtaddr.sin6_addr, &dr0.rtaddr,
+ sizeof (dr0.rtaddr));
+ dr0.flags = r_64->flags;
+ bcopy(&r_64->if_index, &i, sizeof (i));
+ ifindex = i;
+ } else {
+ struct in6_defrouter_32 *r_32 =
+ (struct in6_defrouter_32 *)(void *)data;
+ u_int16_t i;
+
+ bcopy(&r_32->rtaddr.sin6_addr, &dr0.rtaddr,
+ sizeof (dr0.rtaddr));
+ dr0.flags = r_32->flags;
+ bcopy(&r_32->if_index, &i, sizeof (i));
+ ifindex = i;
+ }
+ ifnet_head_lock_shared();
+ /* Don't need to check is ifindex is < 0 since it's unsigned */
+ if (if_index < ifindex ||
+ (dr_ifp = ifindex2ifnet[ifindex]) == NULL) {
+ ifnet_head_done();
+ error = EINVAL;
+ break;
+ }
+ dr0.ifp = dr_ifp;
+ ifnet_head_done();
+
+ if (IN6_IS_SCOPE_EMBED(&dr0.rtaddr)) {
+ uint16_t *scope = &dr0.rtaddr.s6_addr16[1];
+
+ if (*scope == 0) {
+ *scope = htons(dr_ifp->if_index);
+ } else if (*scope != htons(dr_ifp->if_index)) {
+ error = EINVAL;
+ break;
+ }
+ }
+
+ if (add)
+ error = defrtrlist_add_static(&dr0);
+ if (!add || error != 0) {
+ int err = defrtrlist_del_static(&dr0);
+ if (!add)
+ error = err;
+ }
+ break;
+
+ default:
+ error = EOPNOTSUPP; /* check for safety */
+ break;
+ }
+
+ return (error);
+}
+
+/*
+ * XXX Please make sure to remove dr from the
+ * global default router tailq list before this
+ * function call.
+ * Also ensure that you release the list reference
+ * only after calling this routine.
+ */
+void
+defrtrlist_del(struct nd_defrouter *dr)
{
- struct nd_defrouter *deldr = NULL;
+#if (DEVELOPMENT || DEBUG)
+ struct nd_defrouter *dr_itr = NULL;
+#endif
struct nd_prefix *pr;
+ struct ifnet *ifp = dr->ifp;
+ struct nd_ifinfo *ndi = NULL;
+ boolean_t resetmtu;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+#if (DEVELOPMENT || DEBUG)
+ /*
+ * Verify that the router is not in the global default
+ * router list.
+ * Can't use defrouter_lookup here because that just works
+ * with address and ifp pointer.
+ * We have to compare the memory here.
+ * Also we can't use ASSERT here as that is not defined
+ * for development builds.
+ */
+ TAILQ_FOREACH(dr_itr, &nd_defrouter, dr_entry)
+ VERIFY(dr != dr_itr);
+#endif
+ ++nd6_defrouter_genid;
/*
* Flush all the routing table entries that use the router
* as a next hop.
*/
- if (!ip6_forwarding && ip6_accept_rtadv) {
- /* above is a good condition? */
- rt6_flush(&dr->rtaddr, dr->ifp);
- }
-
- if (dr == TAILQ_FIRST(&nd_defrouter))
- deldr = dr; /* The router is primary. */
+ /* above is a good condition? */
+ NDDR_ADDREF(dr);
+ lck_mtx_unlock(nd6_mutex);
+ if (dr->stateflags & NDDRF_MAPPED)
+ rt6_flush(&dr->rtaddr_mapped, ifp);
+ else
+ rt6_flush(&dr->rtaddr, ifp);
- TAILQ_REMOVE(&nd_defrouter, dr, dr_entry);
+ lck_mtx_lock(nd6_mutex);
+ NDDR_REMREF(dr);
+ nd6log2((LOG_INFO, "%s: freeing defrouter %s\n", if_name(dr->ifp),
+ ip6_sprintf(&dr->rtaddr)));
+ /*
+ * Delete it from the routing table.
+ */
+ NDDR_ADDREF(dr);
+ lck_mtx_unlock(nd6_mutex);
+ defrouter_delreq(dr);
+ lck_mtx_lock(nd6_mutex);
+ NDDR_REMREF(dr);
/*
* Also delete all the pointers to the router in each prefix lists.
*/
for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
struct nd_pfxrouter *pfxrtr;
+
+ NDPR_LOCK(pr);
if ((pfxrtr = pfxrtr_lookup(pr, dr)) != NULL)
- pfxrtr_del(pfxrtr);
+ pfxrtr_del(pfxrtr, pr);
+ NDPR_UNLOCK(pr);
}
+
pfxlist_onlink_check();
+ resetmtu = FALSE;
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+ VERIFY(ndi->ndefrouters >= 0);
+ if (ndi->ndefrouters > 0 && --ndi->ndefrouters == 0) {
+ nd6_ifreset(ifp);
+ resetmtu = TRUE;
+ }
+ lck_mtx_unlock(&ndi->lock);
+
/*
* If the router is the primary one, choose a new one.
- * Note that defrouter_select() will remove the current gateway
- * from the routing table.
+ * We always try to pick another eligible router
+ * on this interface as we do scoped routing
*/
- if (deldr)
- defrouter_select();
+ defrouter_select(ifp);
+
+ if (resetmtu)
+ nd6_setmtu(ifp);
+}
+
+int
+defrtrlist_add_static(struct nd_defrouter *new)
+{
+ struct nd_defrouter *dr;
+ int err = 0;
+
+ new->rtlifetime = -1;
+ new->stateflags |= NDDRF_STATIC;
+
+ /* we only want the preference level */
+ new->flags &= ND_RA_FLAG_RTPREF_MASK;
+
+ lck_mtx_lock(nd6_mutex);
+ dr = defrouter_lookup(&new->rtaddr, new->ifp);
+ if (dr != NULL && !(dr->stateflags & NDDRF_STATIC)) {
+ err = EINVAL;
+ } else {
+ if (dr != NULL)
+ NDDR_REMREF(dr);
+ dr = defrtrlist_update(new);
+ if (dr != NULL)
+ err = dr->err;
+ else
+ err = ENOMEM;
+ }
+ if (dr != NULL)
+ NDDR_REMREF(dr);
+ lck_mtx_unlock(nd6_mutex);
- _FREE(dr, M_IP6NDP);
+ return (err);
+}
+
+int
+defrtrlist_del_static(struct nd_defrouter *new)
+{
+ struct nd_defrouter *dr;
+
+ lck_mtx_lock(nd6_mutex);
+ dr = defrouter_lookup(&new->rtaddr, new->ifp);
+ if (dr == NULL || !(dr->stateflags & NDDRF_STATIC)) {
+ if (dr != NULL)
+ NDDR_REMREF(dr);
+ dr = NULL;
+ } else {
+ TAILQ_REMOVE(&nd_defrouter, dr, dr_entry);
+ defrtrlist_del(dr);
+ NDDR_REMREF(dr); /* remove list reference */
+ NDDR_REMREF(dr);
+ }
+ lck_mtx_unlock(nd6_mutex);
+
+ return (dr != NULL ? 0 : EINVAL);
+}
+
+/*
+ * for default router selection
+ * regards router-preference field as a 2-bit signed integer
+ */
+static int
+rtpref(struct nd_defrouter *dr)
+{
+ switch (dr->flags & ND_RA_FLAG_RTPREF_MASK) {
+ case ND_RA_FLAG_RTPREF_HIGH:
+ return (RTPREF_HIGH);
+ case ND_RA_FLAG_RTPREF_MEDIUM:
+ case ND_RA_FLAG_RTPREF_RSV:
+ return (RTPREF_MEDIUM);
+ case ND_RA_FLAG_RTPREF_LOW:
+ return (RTPREF_LOW);
+ default:
+ /*
+ * This case should never happen. If it did, it would mean a
+ * serious bug of kernel internal. We thus always bark here.
+ * Or, can we even panic?
+ */
+ log(LOG_ERR, "rtpref: impossible RA flag %x\n", dr->flags);
+ return (RTPREF_INVALID);
+ }
+ /* NOTREACHED */
}
/*
- * Default Router Selection according to Section 6.3.6 of RFC 2461:
- * 1) Routers that are reachable or probably reachable should be
- * preferred.
+ * Default Router Selection according to Section 6.3.6 of RFC 2461 and RFC 4191:
+ *
+ * 1) Routers that are reachable or probably reachable should be preferred.
+ * If we have more than one (probably) reachable router, prefer ones
+ * with the highest router preference.
* 2) When no routers on the list are known to be reachable or
* probably reachable, routers SHOULD be selected in a round-robin
- * fashion.
+ * fashion, regardless of router preference values.
* 3) If the Default Router List is empty, assume that all
* destinations are on-link.
+ *
+ * When Scoped Routing is enabled, the selection logic is amended as follows:
+ *
+ * a) When a default interface is specified, the primary/non-scoped default
+ * router will be set to the reachable router on that link (if any) with
+ * the highest router preference.
+ * b) When there are more than one routers on the same link, the one with
+ * the highest router preference will be installed, either as scoped or
+ * non-scoped route entry. If they all share the same preference value,
+ * the one installed will be the static or the first encountered reachable
+ * router, i.e. static one wins over dynamic.
+ * c) When no routers on the list are known to be reachable, or probably
+ * reachable, no round-robin selection will take place when the default
+ * interface is set.
+ *
+ * We assume nd_defrouter is sorted by router preference value.
+ * Since the code below covers both with and without router preference cases,
+ * we do not need to classify the cases by ifdef.
*/
void
-defrouter_select()
+defrouter_select(struct ifnet *ifp)
{
-#ifdef __NetBSD__
- int s = splsoftnet();
-#else
- int s = splnet();
-#endif
- struct nd_defrouter *dr, anydr;
- struct rtentry *rt = NULL;
+ struct nd_defrouter *dr = NULL;
+ struct nd_defrouter *selected_dr = NULL;
+ struct nd_defrouter *installed_dr = NULL;
struct llinfo_nd6 *ln = NULL;
+ struct rtentry *rt = NULL;
+ struct nd_ifinfo *ndi = NULL;
+ unsigned int genid = 0;
+ boolean_t is_installed_reachable = FALSE;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ if (ifp == NULL) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Return early. NULL interface",
+ __func__, __LINE__));
+ return;
+ }
+
+ if (ifp == lo_ifp) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Return early. "
+ "Default router select called for loopback.\n",
+ __func__, __LINE__));
+ return;
+ }
-#if MIP6
- /* Mobile IPv6 alternative routine */
- if (mip6_select_defrtr_hook) {
- (*mip6_select_defrtr_hook)(); /* XXXYYY Temporary? */
- splx(s);
+ if (ifp->if_eflags & IFEF_IPV6_ROUTER) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Return early. "
+ "Default router select called for interface"
+ " %s with IFEF_IPV6_ROUTER flag set\n",
+ __func__, __LINE__, if_name(ifp)));
return;
}
- /* End of Mobile IPv6 */
-#endif /* MIP6 */
+
+ /*
+ * Let's handle easy case (3) first:
+ * If default router list is empty, there's nothing to be done.
+ */
+ if (!TAILQ_FIRST(&nd_defrouter)) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Return early. "
+ "Default router is empty.\n", __func__, __LINE__));
+ return;
+ }
+
+ /*
+ * Take an early exit if number of routers in nd_ifinfo is
+ * 0 for the interface.
+ */
+ ndi = ND_IFINFO(ifp);
+ if (!ndi || !ndi->initialized) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Return early. "
+ "Interface %s's nd_ifinfo not initialized.\n",
+ __func__, __LINE__, if_name(ifp)));
+ return;
+ }
+
+ if (ndi->ndefrouters == 0) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Return early. "
+ "%s does not have any default routers.\n",
+ __func__, __LINE__, if_name(ifp)));
+ return;
+ }
+
+ /*
+ * Due to the number of times we drop nd6_mutex, we need to
+ * serialize this function.
+ */
+ while (nd_defrouter_busy) {
+ nd_defrouter_waiters++;
+ msleep(nd_defrouter_waitchan, nd6_mutex, (PZERO-1),
+ __func__, NULL);
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ }
+ nd_defrouter_busy = TRUE;
/*
* Search for a (probably) reachable router from the list.
+ * We just pick up the first reachable one (if any), assuming that
+ * the ordering rule of the list described in defrtrlist_update().
+ *
+ * For all intents and purposes of Scoped Routing:
+ * selected_dr = candidate for primary router
+ * installed_dr = currently installed primary router
*/
- for (dr = TAILQ_FIRST(&nd_defrouter); dr;
- dr = TAILQ_NEXT(dr, dr_entry)) {
- if ((rt = nd6_lookup(&dr->rtaddr, 0, dr->ifp)) &&
- (ln = (struct llinfo_nd6 *)rt->rt_llinfo) &&
- ND6_IS_LLINFO_PROBREACH(ln)) {
- /* Got it, and move it to the head */
- TAILQ_REMOVE(&nd_defrouter, dr, dr_entry);
- TAILQ_INSERT_HEAD(&nd_defrouter, dr, dr_entry);
- break;
+ genid = nd6_defrouter_genid;
+ dr = TAILQ_FIRST(&nd_defrouter);
+
+ while (dr != NULL) {
+ struct in6_addr rtaddr;
+ struct ifnet *drifp = NULL;
+ struct nd_defrouter *drrele = NULL;
+
+ NDDR_LOCK(dr);
+ drifp = dr->ifp;
+ if (drifp != ifp) {
+ NDDR_UNLOCK(dr);
+ dr = TAILQ_NEXT(dr, dr_entry);
+ continue;
+ }
+
+ /*
+ * Optimize for the common case.
+ * When the interface has only one default router
+ * there's no point checking for reachability as
+ * there's nothing else to choose from.
+ */
+ if (ndi->ndefrouters == 1) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Fast forward default router selection "
+ "as interface %s has learned only one default "
+ "router and there's nothing else to choose from.\n",
+ __func__, __LINE__, if_name(ifp)));
+ VERIFY(selected_dr == NULL && installed_dr == NULL);
+ selected_dr = dr;
+ if (dr->stateflags & NDDRF_INSTALLED)
+ installed_dr = dr;
+ NDDR_ADDREF_LOCKED(selected_dr);
+ NDDR_UNLOCK(dr);
+ goto install_route;
+ }
+
+ if (dr->stateflags & NDDRF_MAPPED)
+ rtaddr = dr->rtaddr_mapped;
+ else
+ rtaddr = dr->rtaddr;
+
+ NDDR_ADDREF_LOCKED(dr); /* for this for loop */
+ NDDR_UNLOCK(dr);
+
+ /* Callee returns a locked route upon success */
+ if (selected_dr == NULL) {
+ lck_mtx_unlock(nd6_mutex);
+ if ((rt = nd6_lookup(&rtaddr, 0, drifp, 0)) != NULL &&
+ (ln = rt->rt_llinfo) != NULL &&
+ ND6_IS_LLINFO_PROBREACH(ln)) {
+ RT_LOCK_ASSERT_HELD(rt);
+ selected_dr = dr;
+ NDDR_ADDREF(selected_dr);
+ }
+ lck_mtx_lock(nd6_mutex);
+ }
+
+ if (rt) {
+ RT_REMREF_LOCKED(rt);
+ RT_UNLOCK(rt);
+ rt = NULL;
}
- }
- if ((dr = TAILQ_FIRST(&nd_defrouter))) {
/*
- * De-install the previous default gateway and install
- * a new one.
- * Note that if there is no reachable router in the list,
- * the head entry will be used anyway.
- * XXX: do we have to check the current routing table entry?
+ * Handle case (b)
+ * When there are more than one routers on the same link, the one with
+ * the highest router preference will be installed.
+ * Since the list is in decreasing order of preference:
+ * 1) If selected_dr is not NULL, only use dr if it is static and has
+ * equal preference and selected_dr is not static.
+ * 2) Else if selected_dr is NULL, and dr is static make selected_dr = dr
*/
- bzero(&anydr, sizeof(anydr));
- defrouter_delreq(&anydr, 0);
- defrouter_addreq(dr);
+ NDDR_LOCK(dr);
+ if (((selected_dr && (rtpref(dr) >= rtpref(selected_dr)) &&
+ !(selected_dr->stateflags & NDDRF_STATIC)) ||
+ (selected_dr == NULL)) &&
+ (dr->stateflags & NDDRF_STATIC)) {
+ if (selected_dr) {
+ /* Release it later on */
+ VERIFY(drrele == NULL);
+ drrele = selected_dr;
+ }
+ selected_dr = dr;
+ NDDR_ADDREF_LOCKED(selected_dr);
+ }
+
+ /* Record the currently installed router */
+ if (dr->stateflags & NDDRF_INSTALLED) {
+ if (installed_dr == NULL) {
+ installed_dr = dr;
+ NDDR_ADDREF_LOCKED(installed_dr);
+ if (dr->stateflags & NDDRF_MAPPED)
+ rtaddr = installed_dr->rtaddr_mapped;
+ else
+ rtaddr = installed_dr->rtaddr;
+ NDDR_UNLOCK(dr);
+ lck_mtx_unlock(nd6_mutex);
+ /* Callee returns a locked route upon success */
+ if ((rt = nd6_lookup(&rtaddr, 0, ifp, 0)) != NULL) {
+ RT_LOCK_ASSERT_HELD(rt);
+ if ((ln = rt->rt_llinfo) != NULL &&
+ ND6_IS_LLINFO_PROBREACH(ln))
+ is_installed_reachable = TRUE;
+
+ RT_REMREF_LOCKED(rt);
+ RT_UNLOCK(rt);
+ rt = NULL;
+ }
+ lck_mtx_lock(nd6_mutex);
+ } else {
+ /* this should not happen; warn for diagnosis */
+ nd6log((LOG_ERR, "defrouter_select: more than one "
+ "default router is installed for interface :%s.\n",
+ if_name(ifp)));
+ NDDR_UNLOCK(dr);
+ }
+ } else
+ NDDR_UNLOCK(dr);
+
+ NDDR_REMREF(dr); /* for this for loop */
+ if (drrele != NULL)
+ NDDR_REMREF(drrele);
+
+ /*
+ * Check if the list changed when we gave up
+ * the nd6_mutex lock
+ */
+ if(genid != nd6_defrouter_genid) {
+ if (selected_dr) {
+ NDDR_REMREF(selected_dr);
+ selected_dr = NULL;
+ }
+
+ if (installed_dr) {
+ NDDR_REMREF(installed_dr);
+ installed_dr = NULL;
+ }
+
+ if (ndi->ndefrouters == 0) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Interface %s no longer "
+ "has any default routers. Abort.\n",
+ __func__, __LINE__, if_name(ifp)));
+ goto out;
+ }
+ nd6log2((LOG_INFO,
+ "%s:%d: Iterate default router list again "
+ "for interface %s, as the list seems to have "
+ "changed during release-reaquire of global "
+ "nd6_mutex lock.\n",
+ __func__, __LINE__, if_name(ifp)));
+
+ is_installed_reachable = FALSE;
+ genid = nd6_defrouter_genid;
+ dr = TAILQ_FIRST(&nd_defrouter);
+ } else {
+ dr = TAILQ_NEXT(dr, dr_entry);
+ }
}
- else {
+
+ /*
+ * If none of the default routers was found to be reachable,
+ * round-robin the list regardless of preference.
+ * Please note selected_dr equal to NULL implies that even
+ * installed default router is not reachable
+ */
+ if (selected_dr == NULL) {
+ if (installed_dr) {
+ for (dr = TAILQ_NEXT(installed_dr, dr_entry); dr;
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ if (installed_dr->ifp != dr->ifp)
+ continue;
+ selected_dr = dr;
+ break;
+ }
+ }
+
/*
- * The Default Router List is empty, so install the default
- * route to an inteface.
- * XXX: The specification does not say this mechanism should
- * be restricted to hosts, but this would be not useful
- * (even harmful) for routers.
+ * If none was installed or the installed one if the last
+ * one on the list, select the first one from the list
*/
- if (!ip6_forwarding) {
+ if ((installed_dr == NULL) || (selected_dr == NULL)) {
+ for (dr = TAILQ_FIRST(&nd_defrouter); dr;
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ if (dr->ifp == ifp) {
+ selected_dr = dr;
+ break;
+ }
+ }
+ }
+
+ if ((selected_dr == NULL) && (installed_dr == NULL)) {
+ nd6log2((LOG_INFO,
+ "%s:%d: Between release and reaquire of global "
+ "nd6_mutex lock, the list seems to have changed "
+ "and it does not have any default routers for "
+ "interface %s.\n",
+ __func__, __LINE__, if_name(ifp)));
+ goto out;
+ }
+
+ if (selected_dr != installed_dr)
+ NDDR_ADDREF(selected_dr);
+ } else if (installed_dr != NULL) {
+ if (installed_dr != selected_dr) {
/*
- * De-install the current default route
- * in advance.
+ * This means that selected default router is reachable
+ * while installed one may or may not be.
+ * Static router should always be considered as reachable
+ * for router selection process.
*/
- bzero(&anydr, sizeof(anydr));
- defrouter_delreq(&anydr, 0);
- if (nd6_defifp) {
- /*
- * Install a route to the default interface
- * as default route.
- */
- defrouter_addifreq(nd6_defifp);
+ if ((installed_dr->stateflags & NDDRF_STATIC) &&
+ rtpref(installed_dr) >= rtpref(selected_dr)) {
+ NDDR_REMREF(selected_dr);
+ selected_dr = installed_dr;
+ } else if (is_installed_reachable) {
+ if (rtpref(selected_dr) <= rtpref(installed_dr)) {
+ NDDR_REMREF(selected_dr);
+ selected_dr = installed_dr;
+ }
}
-#if ND6_DEBUG
- else /* noisy log? */
- log(LOG_INFO, "defrouter_select: "
- "there's no default router and no default"
- " interface\n");
-#endif
+ } else {
+ NDDR_REMREF(selected_dr);
}
}
- splx(s);
- return;
+install_route:
+ /*
+ * If the selected router is different than the installed one,
+ * remove the installed router and install the selected one.
+ * Note that the selected router is never NULL here.
+ * Else check if the route entry scope has to be changed.
+ */
+ lck_mtx_unlock(nd6_mutex);
+ if (installed_dr != selected_dr) {
+ nd6log((LOG_INFO,
+ "%s:%d: Found a better router for interface "
+ "%s. Installing new default route.\n",
+ __func__, __LINE__, if_name(ifp)));
+ if (installed_dr != NULL) {
+ defrouter_delreq(installed_dr);
+ }
+ /*
+ * Install scoped route if the interface is not
+ * the default nd6 interface.
+ */
+ defrouter_addreq(selected_dr,
+ (selected_dr->ifp != nd6_defifp));
+ } else if (((installed_dr->stateflags & NDDRF_IFSCOPE) &&
+ (installed_dr->ifp == nd6_defifp)) ||
+ (!(installed_dr->stateflags & NDDRF_IFSCOPE) &&
+ (installed_dr->ifp != nd6_defifp))) {
+ nd6log((LOG_INFO,
+ "%s:%d: Need to reinstall default route for interface "
+ "%s as its scope has changed.\n",
+ __func__, __LINE__, if_name(ifp)));
+ defrouter_delreq(installed_dr);
+ defrouter_addreq(installed_dr,
+ (installed_dr->ifp != nd6_defifp));
+ } else {
+ nd6log2((LOG_INFO,
+ "%s:%d: No need to change the default "
+ "route for interface %s.\n",
+ __func__, __LINE__, if_name(ifp)));
+ }
+ lck_mtx_lock(nd6_mutex);
+out:
+ if (selected_dr && (selected_dr != installed_dr))
+ NDDR_REMREF(selected_dr);
+ if (installed_dr)
+ NDDR_REMREF(installed_dr);
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ VERIFY(nd_defrouter_busy);
+ nd_defrouter_busy = FALSE;
+ if (nd_defrouter_waiters > 0) {
+ nd_defrouter_waiters = 0;
+ wakeup(nd_defrouter_waitchan);
+ }
}
static struct nd_defrouter *
-defrtrlist_update(new)
- struct nd_defrouter *new;
+defrtrlist_update_common(struct nd_defrouter *new, boolean_t scoped)
{
struct nd_defrouter *dr, *n;
-#ifdef __NetBSD__
- int s = splsoftnet();
-#else
- int s = splnet();
-#endif
+ struct ifnet *ifp = new->ifp;
+ struct nd_ifinfo *ndi = NULL;
+ struct timeval caltime;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
- if ((dr = defrouter_lookup(&new->rtaddr, new->ifp)) != NULL) {
+ if ((dr = defrouter_lookup(&new->rtaddr, ifp)) != NULL) {
/* entry exists */
if (new->rtlifetime == 0) {
+ TAILQ_REMOVE(&nd_defrouter, dr, dr_entry);
defrtrlist_del(dr);
+ NDDR_REMREF(dr); /* remove list reference */
+ NDDR_REMREF(dr);
dr = NULL;
} else {
+ int oldpref = rtpref(dr);
+ struct nd_defrouter *p = NULL;
/* override */
dr->flags = new->flags; /* xxx flag check */
dr->rtlifetime = new->rtlifetime;
dr->expire = new->expire;
+
+ /*
+ * If the preference does not change, there's no need
+ * to sort the entries. If Scoped Routing is enabled,
+ * put the primary/non-scoped router at the top of the
+ * list of routers in the same preference band, unless
+ * it's already at that position.
+ */
+ /* same preference and scoped; just return */
+ if (rtpref(new) == oldpref && scoped)
+ return (dr);
+
+ n = TAILQ_FIRST(&nd_defrouter);
+ while (n != NULL) {
+ /* preference changed; sort it */
+ if (rtpref(new) != oldpref)
+ break;
+
+ /* not at the top of band; sort it */
+ if (n != dr && rtpref(n) == oldpref &&
+ (!p || rtpref(p) > rtpref(n)))
+ break;
+
+ p = n;
+ n = TAILQ_NEXT(n, dr_entry);
+ }
+
+ /* nothing has changed, just return */
+ if (n == NULL && (scoped ||
+ !(dr->stateflags & NDDRF_IFSCOPE)))
+ return (dr);
+
+ /*
+ * preferred router may be changed, so relocate
+ * this router.
+ * XXX: calling TAILQ_REMOVE directly is a bad manner.
+ * However, since defrtrlist_del() has many side
+ * effects, we intentionally do so here.
+ * defrouter_select() below will handle routing
+ * changes later.
+ */
+ TAILQ_REMOVE(&nd_defrouter, dr, dr_entry);
+ new->stateflags = dr->stateflags;
+
+ n = dr;
+ goto insert;
}
- splx(s);
- return(dr);
+ return (dr);
}
+ VERIFY(dr == NULL);
+
/* entry does not exist */
if (new->rtlifetime == 0) {
- splx(s);
- return(NULL);
+ return (NULL);
}
- n = (struct nd_defrouter *)_MALLOC(sizeof(*n), M_IP6NDP, M_NOWAIT);
+ n = nddr_alloc(M_WAITOK);
if (n == NULL) {
- splx(s);
- return(NULL);
+ return (NULL);
}
- bzero(n, sizeof(*n));
- *n = *new;
+
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+ if (ip6_maxifdefrouters >= 0 &&
+ ndi->ndefrouters >= ip6_maxifdefrouters) {
+ lck_mtx_unlock(&ndi->lock);
+ nddr_free(n);
+ return (NULL);
+ }
+
+ NDDR_ADDREF(n); /* for the nd_defrouter list */
+ NDDR_ADDREF(n); /* for the caller */
+
+ ++nd6_defrouter_genid;
+ ndi->ndefrouters++;
+ VERIFY(ndi->ndefrouters != 0);
+ lck_mtx_unlock(&ndi->lock);
+
+ nd6log2((LOG_INFO, "%s: allocating defrouter %s\n", if_name(ifp),
+ ip6_sprintf(&new->rtaddr)));
+
+ getmicrotime(&caltime);
+ NDDR_LOCK(n);
+ memcpy(&n->rtaddr, &new->rtaddr, sizeof (n->rtaddr));
+ n->flags = new->flags;
+ n->stateflags = new->stateflags;
+ n->rtlifetime = new->rtlifetime;
+ n->expire = new->expire;
+ n->base_calendartime = caltime.tv_sec;
+ n->base_uptime = net_uptime();
+ n->ifp = new->ifp;
+ n->err = new->err;
+ NDDR_UNLOCK(n);
+insert:
+ /* get nd6_service() to be scheduled as soon as it's convenient */
+ ++nd6_sched_timeout_want;
/*
- * Insert the new router at the end of the Default Router List.
- * If there is no other router, install it anyway. Otherwise,
- * just continue to use the current default router.
+ * Insert the new router in the Default Router List;
+ * The Default Router List should be in the descending order
+ * of router-preferece. When Scoped Routing is disabled, routers
+ * with the same preference are sorted in the arriving time order;
+ * otherwise, the first entry in the list of routers having the same
+ * preference is the primary default router, when the interface used
+ * by the entry is the default interface.
*/
- TAILQ_INSERT_TAIL(&nd_defrouter, n, dr_entry);
- if (TAILQ_FIRST(&nd_defrouter) == n)
- defrouter_select();
- splx(s);
-
- return(n);
+
+ /* insert at the end of the group */
+ for (dr = TAILQ_FIRST(&nd_defrouter); dr;
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ if (rtpref(n) > rtpref(dr) ||
+ (!scoped && rtpref(n) == rtpref(dr)))
+ break;
+ }
+ if (dr)
+ TAILQ_INSERT_BEFORE(dr, n, dr_entry);
+ else
+ TAILQ_INSERT_TAIL(&nd_defrouter, n, dr_entry);
+
+ defrouter_select(ifp);
+
+ return (n);
}
-struct nd_pfxrouter *
-pfxrtr_lookup(pr, dr)
- struct nd_prefix *pr;
+static struct nd_defrouter *
+defrtrlist_update(struct nd_defrouter *new)
+{
struct nd_defrouter *dr;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ dr = defrtrlist_update_common(new,
+ (nd6_defifp != NULL && new->ifp != nd6_defifp));
+
+ return (dr);
+}
+
+static struct nd_pfxrouter *
+pfxrtr_lookup(struct nd_prefix *pr, struct nd_defrouter *dr)
{
struct nd_pfxrouter *search;
-
- for (search = pr->ndpr_advrtrs.lh_first; search; search = search->pfr_next) {
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_HELD(pr);
+
+ for (search = pr->ndpr_advrtrs.lh_first; search;
+ search = search->pfr_next) {
if (search->router == dr)
break;
}
- return(search);
+ return (search);
}
static void
-pfxrtr_add(pr, dr)
- struct nd_prefix *pr;
- struct nd_defrouter *dr;
+pfxrtr_add(struct nd_prefix *pr, struct nd_defrouter *dr)
{
struct nd_pfxrouter *new;
- new = (struct nd_pfxrouter *)_MALLOC(sizeof(*new), M_IP6NDP, M_NOWAIT);
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_NOTHELD(pr);
+
+ new = zalloc(ndprtr_zone);
if (new == NULL)
return;
- bzero(new, sizeof(*new));
+ bzero(new, sizeof (*new));
new->router = dr;
+ NDPR_LOCK(pr);
LIST_INSERT_HEAD(&pr->ndpr_advrtrs, new, pfr_entry);
+ pr->ndpr_genid++;
+ NDPR_UNLOCK(pr);
pfxlist_onlink_check();
}
static void
-pfxrtr_del(pfr)
- struct nd_pfxrouter *pfr;
+pfxrtr_del(struct nd_pfxrouter *pfr, struct nd_prefix *pr)
{
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_HELD(pr);
+ pr->ndpr_genid++;
LIST_REMOVE(pfr, pfr_entry);
- _FREE(pfr, M_IP6NDP);
+ zfree(ndprtr_zone, pfr);
}
+/*
+ * The routine has been modified to atomically refresh expiry
+ * time for nd6 prefix as the part of lookup.
+ * There's a corner case where a system going
+ * in sleep gets rid of manual addresses configured in the system
+ * and then schedules the prefix for deletion.
+ * However before the prefix gets deleted, if system comes out
+ * from sleep and configures same address before prefix deletion
+ * , the later prefix deletion will remove the prefix route and
+ * the system will not be able to communicate with other IPv6
+ * neighbor nodes in the same subnet.
+ */
struct nd_prefix *
-prefix_lookup(pr)
- struct nd_prefix *pr;
+nd6_prefix_lookup(struct nd_prefix *pr, int nd6_prefix_expiry)
{
struct nd_prefix *search;
+ lck_mtx_lock(nd6_mutex);
for (search = nd_prefix.lh_first; search; search = search->ndpr_next) {
+ NDPR_LOCK(search);
if (pr->ndpr_ifp == search->ndpr_ifp &&
pr->ndpr_plen == search->ndpr_plen &&
in6_are_prefix_equal(&pr->ndpr_prefix.sin6_addr,
- &search->ndpr_prefix.sin6_addr,
- pr->ndpr_plen)
- ) {
+ &search->ndpr_prefix.sin6_addr, pr->ndpr_plen)) {
+ if (nd6_prefix_expiry != ND6_PREFIX_EXPIRY_UNSPEC) {
+ search->ndpr_expire = nd6_prefix_expiry;
+ }
+ NDPR_ADDREF_LOCKED(search);
+ NDPR_UNLOCK(search);
break;
}
+ NDPR_UNLOCK(search);
}
+ lck_mtx_unlock(nd6_mutex);
- return(search);
+ return (search);
}
-static int
-prelist_add(pr, dr)
- struct nd_prefix *pr;
- struct nd_defrouter *dr;
+int
+nd6_prelist_add(struct nd_prefix *pr, struct nd_defrouter *dr,
+ struct nd_prefix **newp, boolean_t force_scoped)
{
- struct nd_prefix *new;
- int i, s;
+ struct nd_prefix *new = NULL;
+ struct ifnet *ifp = pr->ndpr_ifp;
+ struct nd_ifinfo *ndi = NULL;
+ int i, error;
+
+ if (ip6_maxifprefixes >= 0) {
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+ if (ndi->nprefixes >= ip6_maxifprefixes) {
+ lck_mtx_unlock(&ndi->lock);
+ return (ENOMEM);
+ }
+ lck_mtx_unlock(&ndi->lock);
+ }
- new = (struct nd_prefix *)_MALLOC(sizeof(*new), M_IP6NDP, M_NOWAIT);
+ new = ndpr_alloc(M_WAITOK);
if (new == NULL)
- return ENOMEM;
- bzero(new, sizeof(*new));
- *new = *pr;
-
- /* initilization */
- new->ndpr_statef_onlink = pr->ndpr_statef_onlink;
+ return (ENOMEM);
+
+ NDPR_LOCK(new);
+ NDPR_LOCK(pr);
+ new->ndpr_ifp = pr->ndpr_ifp;
+ new->ndpr_prefix = pr->ndpr_prefix;
+ new->ndpr_plen = pr->ndpr_plen;
+ new->ndpr_vltime = pr->ndpr_vltime;
+ new->ndpr_pltime = pr->ndpr_pltime;
+ new->ndpr_flags = pr->ndpr_flags;
+ if (pr->ndpr_stateflags & NDPRF_STATIC)
+ new->ndpr_stateflags |= NDPRF_STATIC;
+ NDPR_UNLOCK(pr);
+ if ((error = in6_init_prefix_ltimes(new)) != 0) {
+ NDPR_UNLOCK(new);
+ ndpr_free(new);
+ return (error);
+ }
+ new->ndpr_lastupdate = net_uptime();
+ if (newp != NULL) {
+ *newp = new;
+ NDPR_ADDREF_LOCKED(new); /* for caller */
+ }
+ /* initialization */
LIST_INIT(&new->ndpr_advrtrs);
in6_prefixlen2mask(&new->ndpr_mask, new->ndpr_plen);
/* make prefix in the canonical form */
new->ndpr_prefix.sin6_addr.s6_addr32[i] &=
new->ndpr_mask.s6_addr32[i];
- /* xxx ND_OPT_PI_FLAG_ONLINK processing */
+ NDPR_UNLOCK(new);
-#ifdef __NetBSD__
- s = splsoftnet();
-#else
- s = splnet();
-#endif
+ /* get nd6_service() to be scheduled as soon as it's convenient */
+ ++nd6_sched_timeout_want;
+
+ lck_mtx_lock(nd6_mutex);
/* link ndpr_entry to nd_prefix list */
LIST_INSERT_HEAD(&nd_prefix, new, ndpr_entry);
- splx(s);
+ new->ndpr_debug |= IFD_ATTACHED;
+ NDPR_ADDREF(new); /* for nd_prefix list */
+
+ lck_mtx_lock(&ndi->lock);
+ ndi->nprefixes++;
+ VERIFY(ndi->nprefixes != 0);
+ lck_mtx_unlock(&ndi->lock);
+
+ /* ND_OPT_PI_FLAG_ONLINK processing */
+ if (new->ndpr_raf_onlink) {
+ int e;
+
+ if ((e = nd6_prefix_onlink_common(new, force_scoped,
+ new->ndpr_ifp->if_index)) != 0) {
+ nd6log((LOG_ERR, "nd6_prelist_add: failed to make "
+ "the prefix %s/%d on-link %s on %s (errno=%d)\n",
+ ip6_sprintf(&new->ndpr_prefix.sin6_addr),
+ new->ndpr_plen, force_scoped ? "scoped" :
+ "non-scoped", if_name(ifp), e));
+ /* proceed anyway. XXX: is it correct? */
+ }
+ }
if (dr) {
pfxrtr_add(new, dr);
-#if MIP6
- if (mip6_get_md_state_hook) {
- /*
- * If we are in UNDEFINED state and a router appears,
- * select that router and change state.
- * This case takes care of transitions from UNDEFINED
- * to FOREIGN when the prefix is not known from before.
- */
- if ((*mip6_get_md_state_hook)() == MIP6_MD_UNDEFINED) {
- if (mip6_select_defrtr_hook)
- (*mip6_select_defrtr_hook)();
- }
- }
-#endif /* MIP6 */
}
- return 0;
+ lck_mtx_unlock(nd6_mutex);
+
+ return (0);
}
+/*
+ * Caller must have held an extra reference on nd_prefix.
+ */
void
-prelist_remove(pr)
- struct nd_prefix *pr;
+prelist_remove(struct nd_prefix *pr)
{
struct nd_pfxrouter *pfr, *next;
- int s;
+ struct ifnet *ifp = pr->ndpr_ifp;
+ int e;
+ struct nd_ifinfo *ndi = NULL;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_HELD(pr);
+
+ if (pr->ndpr_stateflags & NDPRF_DEFUNCT)
+ return;
+
+ /*
+ * If there are no more addresses, defunct the prefix. This is needed
+ * because we don't want multiple threads calling prelist_remove() for
+ * the same prefix and this might happen because we unlock nd6_mutex
+ * down below.
+ */
+ if (pr->ndpr_addrcnt == 0)
+ pr->ndpr_stateflags |= NDPRF_DEFUNCT;
+
+ /* make sure to invalidate the prefix until it is really freed. */
+ pr->ndpr_vltime = 0;
+ pr->ndpr_pltime = 0;
+
+ /*
+ * Though these flags are now meaningless, we'd rather keep the value
+ * of pr->ndpr_raf_onlink and pr->ndpr_raf_auto not to confuse users
+ * when executing "ndp -p".
+ */
+ if (pr->ndpr_stateflags & NDPRF_ONLINK) {
+ NDPR_ADDREF_LOCKED(pr);
+ NDPR_UNLOCK(pr);
+ lck_mtx_unlock(nd6_mutex);
+ if ((e = nd6_prefix_offlink(pr)) != 0) {
+ nd6log((LOG_ERR, "prelist_remove: failed to make "
+ "%s/%d offlink on %s, errno=%d\n",
+ ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(ifp), e));
+ /* what should we do? */
+ }
+ lck_mtx_lock(nd6_mutex);
+ NDPR_LOCK(pr);
+ if (NDPR_REMREF_LOCKED(pr) == NULL)
+ return;
+ }
+
+ if (pr->ndpr_addrcnt > 0) {
+ /*
+ * The state might have changed if we called
+ * nd6_prefix_offlink().
+ */
+ pr->ndpr_stateflags &= ~NDPRF_DEFUNCT;
+ return; /* notice here? */
+ }
-#ifdef __NetBSD__
- s = splsoftnet();
-#else
- s = splnet();
-#endif
/* unlink ndpr_entry from nd_prefix list */
LIST_REMOVE(pr, ndpr_entry);
- splx(s);
+ pr->ndpr_debug &= ~IFD_ATTACHED;
/* free list of routers that adversed the prefix */
for (pfr = pr->ndpr_advrtrs.lh_first; pfr; pfr = next) {
next = pfr->pfr_next;
+ pfxrtr_del(pfr, pr);
+ }
- _FREE(pfr, M_IP6NDP);
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+ VERIFY(ndi->nprefixes > 0);
+ ndi->nprefixes--;
+ lck_mtx_unlock(&ndi->lock);
+
+ /* This must not be the last reference to the nd_prefix */
+ if (NDPR_REMREF_LOCKED(pr) == NULL) {
+ panic("%s: unexpected (missing) refcnt ndpr=%p", __func__, pr);
+ /* NOTREACHED */
}
- _FREE(pr, M_IP6NDP);
- pfxlist_onlink_check();
+ /*
+ * Don't call pfxlist_onlink_check() here because we are
+ * holding the NDPR lock and this could cause a deadlock when
+ * there are multiple threads executing pfxlist_onlink_check().
+ */
}
-/*
- * NOTE: We set address lifetime to keep
- * address lifetime <= prefix lifetime
- * invariant. This is to simplify on-link determination code.
- * If onlink determination is udated, this routine may have to be updated too.
- */
int
-prelist_update(new, dr, m)
- struct nd_prefix *new;
- struct nd_defrouter *dr; /* may be NULL */
- struct mbuf *m;
+prelist_update(
+ struct nd_prefix *new,
+ struct nd_defrouter *dr, /* may be NULL */
+ struct mbuf *m,
+ int mcast)
{
- struct in6_ifaddr *ia6 = NULL;
+ struct in6_ifaddr *ia6 = NULL, *ia6_match = NULL;
+ struct ifaddr *ifa;
+ struct ifnet *ifp = new->ndpr_ifp;
struct nd_prefix *pr;
-#ifdef __NetBSD__
- int s = splsoftnet();
-#else
- int s = splnet();
-#endif
int error = 0;
+ int newprefix = 0;
int auth;
- struct in6_addrlifetime *lt6;
- u_char onlink; /* Mobile IPv6 */
+ struct in6_addrlifetime lt6_tmp;
+ uint64_t timenow = net_uptime();
+
+ /* no need to lock "new" here, as it is local to the caller */
+ NDPR_LOCK_ASSERT_NOTHELD(new);
auth = 0;
if (m) {
* both IP header and IP datagrams, doesn't it ?
*/
#if defined(M_AUTHIPHDR) && defined(M_AUTHIPDGM)
- auth = (m->m_flags & M_AUTHIPHDR
- && m->m_flags & M_AUTHIPDGM) ? 1 : 0;
+ auth = (m->m_flags & M_AUTHIPHDR) && (m->m_flags & M_AUTHIPDGM);
#endif
}
- if ((pr = prefix_lookup(new)) != NULL) {
- if (pr->ndpr_ifp != new->ndpr_ifp) {
- error = EADDRNOTAVAIL;
- goto end;
+ if ((pr = nd6_prefix_lookup(new, ND6_PREFIX_EXPIRY_UNSPEC)) != NULL) {
+ /*
+ * nd6_prefix_lookup() ensures that pr and new have the same
+ * prefix on a same interface.
+ */
+
+ /*
+ * Update prefix information. Note that the on-link (L) bit
+ * and the autonomous (A) bit should NOT be changed from 1
+ * to 0.
+ */
+ lck_mtx_lock(nd6_mutex);
+ NDPR_LOCK(pr);
+ if (new->ndpr_raf_onlink == 1)
+ pr->ndpr_raf_onlink = 1;
+ if (new->ndpr_raf_auto == 1)
+ pr->ndpr_raf_auto = 1;
+ if (new->ndpr_raf_onlink) {
+ pr->ndpr_vltime = new->ndpr_vltime;
+ pr->ndpr_pltime = new->ndpr_pltime;
+ (void) in6_init_prefix_ltimes(pr); /* XXX error case? */
+ pr->ndpr_lastupdate = net_uptime();
}
-#if MIP6
- if (mip6_get_home_prefix_hook) {
- /*
- * The home prefix should be kept away from updates.
- * XXXYYY Tunneled RA? New Home Prefix? Unless
- * configured, the code below will be executed.
- */
- if (pr == (*mip6_get_home_prefix_hook)())
- goto noautoconf1;
+ NDPR_ADDREF_LOCKED(pr);
+ if (new->ndpr_raf_onlink &&
+ (pr->ndpr_stateflags & NDPRF_ONLINK) == 0) {
+ int e;
+
+ NDPR_UNLOCK(pr);
+ if ((e = nd6_prefix_onlink(pr)) != 0) {
+ nd6log((LOG_ERR,
+ "prelist_update: failed to make "
+ "the prefix %s/%d on-link on %s "
+ "(errno=%d)\n",
+ ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp), e));
+ /* proceed anyway. XXX: is it correct? */
+ }
+ NDPR_LOCK(pr);
}
-#endif /* MIP6 */
- /* update prefix information */
- pr->ndpr_flags = new->ndpr_flags;
- pr->ndpr_vltime = new->ndpr_vltime;
- pr->ndpr_pltime = new->ndpr_pltime;
- pr->ndpr_preferred = new->ndpr_preferred;
- pr->ndpr_expire = new->ndpr_expire;
+ if (dr && pfxrtr_lookup(pr, dr) == NULL) {
+ NDPR_UNLOCK(pr);
+ pfxrtr_add(pr, dr);
+ } else {
+ NDPR_UNLOCK(pr);
+ }
+ NDPR_REMREF(pr);
+ lck_mtx_unlock(nd6_mutex);
+ } else {
+ newprefix = 1;
- /*
- * RFC 2462 5.5.3 (d) or (e)
- * We got a prefix which we have seen in the past.
- */
- if (!new->ndpr_raf_auto)
- goto noautoconf1;
+ if (new->ndpr_vltime == 0)
+ goto end;
+ if (new->ndpr_raf_onlink == 0 && new->ndpr_raf_auto == 0)
+ goto end;
- if (IN6_IS_ADDR_UNSPECIFIED(&pr->ndpr_addr))
- ia6 = NULL;
- else
- ia6 = in6ifa_ifpwithaddr(pr->ndpr_ifp, &pr->ndpr_addr);
+ bzero(&new->ndpr_addr, sizeof (struct in6_addr));
+
+ error = nd6_prelist_add(new, dr, &pr, FALSE);
+ if (error != 0 || pr == NULL) {
+ nd6log((LOG_NOTICE, "prelist_update: "
+ "nd6_prelist_add failed for %s/%d on %s "
+ "errno=%d, returnpr=0x%llx\n",
+ ip6_sprintf(&new->ndpr_prefix.sin6_addr),
+ new->ndpr_plen, if_name(new->ndpr_ifp),
+ error, (uint64_t)VM_KERNEL_ADDRPERM(pr)));
+ goto end; /* we should just give up in this case. */
+ }
+ }
- if (ia6 == NULL) {
- /*
- * Special case:
- * (1) We have seen the prefix advertised before, but
- * we have never performed autoconfig for this prefix.
- * This is because Autonomous bit was 0 previously, or
- * autoconfig failed due to some other reasons.
- * (2) We have seen the prefix advertised before and
- * we have performed autoconfig in the past, but
- * we seem to have no interface address right now.
- * This is because the interface address have expired.
- *
- * This prefix is fresh, with respect to autoconfig
- * process.
- *
- * Add an address based on RFC 2462 5.5.3 (d).
- */
- ia6 = in6_ifadd(pr->ndpr_ifp,
- &pr->ndpr_prefix.sin6_addr, &pr->ndpr_addr,
- new->ndpr_plen);
- if (!ia6) {
- error = EADDRNOTAVAIL;
- log(LOG_ERR, "prelist_update: failed to add a "
- "new address\n");
- goto noautoconf1;
- }
+ /*
+ * Address autoconfiguration based on Section 5.5.3 of RFC 4862.
+ * Note that pr must be non NULL at this point.
+ */
- lt6 = &ia6->ia6_lifetime;
+ /* 5.5.3 (a). Ignore the prefix without the A bit set. */
+ if (!new->ndpr_raf_auto)
+ goto end;
- /* address lifetime <= prefix lifetime */
- lt6->ia6t_vltime = new->ndpr_vltime;
- lt6->ia6t_pltime = new->ndpr_pltime;
- in6_init_address_ltimes(new, lt6, 1);
- } else {
-#define TWOHOUR (120*60)
- /*
- * We have seen the prefix before, and we have added
- * interface address in the past. We still have
- * the interface address assigned.
- *
- * update address lifetime based on RFC 2462
- * 5.5.3 (e).
- */
- int update = 0;
-
- lt6 = &ia6->ia6_lifetime;
-
-#if 0 /* RFC 2462 5.5.3 (e) */
- lt6->ia6t_pltime = new->ndpr_pltime;
- if (TWOHOUR < new->ndpr_vltime
- || lt6pr->nd < new->ndpr_vltime) {
- lt6->ia6t_vltime = new->ndpr_vltime;
- update++;
- } else if (auth
- && lt6->ia6t_vltime <= TWOHOUR0
- && new->ndpr_vltime <= lt6->ia6t_vltime) {
- lt6->ia6t_vltime = new->ndpr_vltime;
- update++;
- } else {
- lt6->ia6t_vltime = TWOHOUR;
- update++;
- }
+ /*
+ * 5.5.3 (b). the link-local prefix should have been ignored in
+ * nd6_ra_input.
+ */
- /* 2 hour rule is not imposed for pref lifetime */
- new->ndpr_apltime = new->ndpr_pltime;
- lt6->ia6t_pltime = new->ndpr_pltime;
-#else /* update from Jim Bound, (ipng 6712) */
- if (TWOHOUR < new->ndpr_vltime
- || lt6->ia6t_vltime < new->ndpr_vltime) {
- lt6->ia6t_vltime = new->ndpr_vltime;
- update++;
- } else if (auth) {
- lt6->ia6t_vltime = new->ndpr_vltime;
- update++;
- }
+ /* 5.5.3 (c). Consistency check on lifetimes: pltime <= vltime. */
+ if (new->ndpr_pltime > new->ndpr_vltime) {
+ error = EINVAL; /* XXX: won't be used */
+ goto end;
+ }
- /* jim bound rule is not imposed for pref lifetime */
- lt6->ia6t_pltime = new->ndpr_pltime;
-#endif
- in6_init_address_ltimes(new, lt6, update);
+ /*
+ * 5.5.3 (d). If the prefix advertised is not equal to the prefix of
+ * an address configured by stateless autoconfiguration already in the
+ * list of addresses associated with the interface, and the Valid
+ * Lifetime is not 0, form an address. We first check if we have
+ * a matching prefix.
+ */
+ ifnet_lock_shared(ifp);
+ TAILQ_FOREACH(ifa, &ifp->if_addrlist, ifa_list) {
+ struct in6_ifaddr *ifa6;
+ u_int32_t remaininglifetime;
+
+ IFA_LOCK(ifa);
+ if (ifa->ifa_addr->sa_family != AF_INET6) {
+ IFA_UNLOCK(ifa);
+ continue;
}
+ ifa6 = (struct in6_ifaddr *)ifa;
- noautoconf1:
-
-#if 0
- /* address lifetime expire processing, RFC 2462 5.5.4. */
- if (pr->ndpr_preferred && pr->ndpr_preferred < time_second) {
- struct in6_ifaddr *ia6;
+ /*
+ * We only consider autoconfigured addresses as per RFC 4862.
+ */
+ if (!(ifa6->ia6_flags & IN6_IFF_AUTOCONF)) {
+ IFA_UNLOCK(ifa);
+ continue;
+ }
+ /*
+ * Spec is not clear here, but I believe we should concentrate
+ * on unicast (i.e. not anycast) addresses.
+ * XXX: other ia6_flags? detached or duplicated?
+ */
+ if ((ifa6->ia6_flags & IN6_IFF_ANYCAST) != 0) {
+ IFA_UNLOCK(ifa);
+ continue;
+ }
+ /*
+ * Ignore the address if it is not associated with a prefix
+ * or is associated with a prefix that is different from this
+ * one. (pr is never NULL here)
+ */
+ if (ifa6->ia6_ndpr != pr) {
+ IFA_UNLOCK(ifa);
+ continue;
+ }
- ia6 = in6ifa_ifpwithaddr(pr->ndpr_ifp, &pr->ndpr_addr);
- if (ia6)
- ia6->ia6_flags &= ~IN6_IFF_DEPRECATED;
+ if (ia6_match == NULL) { /* remember the first one */
+ ia6_match = ifa6;
+ IFA_ADDREF_LOCKED(ifa); /* for ia6_match */
}
-#endif
- onlink = pr->ndpr_statef_onlink; /* Mobile IPv6 */
+ /*
+ * An already autoconfigured address matched. Now that we
+ * are sure there is at least one matched address, we can
+ * proceed to 5.5.3. (e): update the lifetimes according to the
+ * "two hours" rule and the privacy extension.
+ */
+#define TWOHOUR (120*60)
- if (dr && pfxrtr_lookup(pr, dr) == NULL)
- pfxrtr_add(pr, dr);
+ /* retrieve time as uptime (last arg is 0) */
+ in6ifa_getlifetime(ifa6, <6_tmp, 0);
-#if MIP6
- if (mip6_prelist_update_hook) {
+ if (lt6_tmp.ia6t_vltime == ND6_INFINITE_LIFETIME)
+ remaininglifetime = ND6_INFINITE_LIFETIME;
+ else if (timenow - ifa6->ia6_updatetime > lt6_tmp.ia6t_vltime) {
/*
- * Check for home prefix. It can't be a fresh prefix
- * (since it's static), so check here.
+ * The case of "invalid" address. We should usually
+ * not see this case.
*/
- (*mip6_prelist_update_hook)(pr, dr);
+ remaininglifetime = 0;
+ } else {
+ remaininglifetime = lt6_tmp.ia6t_vltime -
+ (timenow - ifa6->ia6_updatetime);
}
-
- if (mip6_probe_pfxrtrs_hook) {
+ /* when not updating, keep the current stored lifetime. */
+ lt6_tmp.ia6t_vltime = remaininglifetime;
+
+ if (TWOHOUR < new->ndpr_vltime ||
+ remaininglifetime < new->ndpr_vltime) {
+ lt6_tmp.ia6t_vltime = new->ndpr_vltime;
+ } else if (remaininglifetime <= TWOHOUR) {
+ if (auth) {
+ lt6_tmp.ia6t_vltime = new->ndpr_vltime;
+ }
+ } else {
/*
- * If this prefix previously was detached, maybe we
- * have moved.
+ * new->ndpr_vltime <= TWOHOUR &&
+ * TWOHOUR < remaininglifetime
*/
- if (!onlink)
- (*mip6_probe_pfxrtrs_hook)();
+ lt6_tmp.ia6t_vltime = TWOHOUR;
}
-#endif /* MIP6 */
-
- } else {
- int error_tmp;
- if (new->ndpr_vltime == 0) goto end;
+ /* The 2 hour rule is not imposed for preferred lifetime. */
+ lt6_tmp.ia6t_pltime = new->ndpr_pltime;
- bzero(&new->ndpr_addr, sizeof(struct in6_addr));
+ /* Special handling for lifetimes of temporary addresses. */
+ if ((ifa6->ia6_flags & IN6_IFF_TEMPORARY) != 0) {
+ u_int32_t maxvltime, maxpltime;
- /*
- * RFC 2462 5.5.3 (d)
- * We got a fresh prefix. Perform some sanity checks
- * and add an interface address by appending interface ID
- * to the advertised prefix.
- */
- if (!new->ndpr_raf_auto)
- goto noautoconf2;
+ /* Constrain lifetimes to system limits. */
+ if (lt6_tmp.ia6t_vltime > ip6_temp_valid_lifetime)
+ lt6_tmp.ia6t_vltime = ip6_temp_valid_lifetime;
+ if (lt6_tmp.ia6t_pltime > ip6_temp_preferred_lifetime)
+ lt6_tmp.ia6t_pltime =
+ ip6_temp_preferred_lifetime -
+ ip6_desync_factor;
- ia6 = in6_ifadd(new->ndpr_ifp, &new->ndpr_prefix.sin6_addr,
- &new->ndpr_addr, new->ndpr_plen);
- if (!ia6) {
- error = EADDRNOTAVAIL;
- log(LOG_ERR, "prelist_update: "
- "failed to add a new address\n");
- goto noautoconf2;
+ /*
+ * According to RFC 4941, section 3.3 (1), we only
+ * update the lifetimes when they are in the maximum
+ * intervals.
+ */
+ if (ip6_temp_valid_lifetime >
+ (u_int32_t)((timenow - ifa6->ia6_createtime) +
+ ip6_desync_factor)) {
+ maxvltime = ip6_temp_valid_lifetime -
+ (timenow - ifa6->ia6_createtime) -
+ ip6_desync_factor;
+ } else
+ maxvltime = 0;
+ if (ip6_temp_preferred_lifetime >
+ (u_int32_t)((timenow - ifa6->ia6_createtime) +
+ ip6_desync_factor)) {
+ maxpltime = ip6_temp_preferred_lifetime -
+ (timenow - ifa6->ia6_createtime) -
+ ip6_desync_factor;
+ } else
+ maxpltime = 0;
+
+ if (lt6_tmp.ia6t_vltime == ND6_INFINITE_LIFETIME ||
+ lt6_tmp.ia6t_vltime > maxvltime)
+ lt6_tmp.ia6t_vltime = maxvltime;
+
+ if (lt6_tmp.ia6t_pltime == ND6_INFINITE_LIFETIME ||
+ lt6_tmp.ia6t_pltime > maxpltime)
+ lt6_tmp.ia6t_pltime = maxpltime;
}
- /* set onlink bit if an interface route is configured */
- new->ndpr_statef_onlink = (ia6->ia_flags & IFA_ROUTE) ? 1 : 0;
- lt6 = &ia6->ia6_lifetime;
+ in6_init_address_ltimes(pr, <6_tmp);
- /* address lifetime <= prefix lifetime */
- lt6->ia6t_vltime = new->ndpr_vltime;
- lt6->ia6t_pltime = new->ndpr_pltime;
- in6_init_address_ltimes(new, lt6, 1);
+ in6ifa_setlifetime(ifa6, <6_tmp);
+ ifa6->ia6_updatetime = timenow;
+ IFA_UNLOCK(ifa);
+ }
+ ifnet_lock_done(ifp);
+ if (ia6_match == NULL && new->ndpr_vltime) {
+ /*
+ * 5.5.3 (d) (continued)
+ * No address matched and the valid lifetime is non-zero.
+ * Create a new address.
+ */
- noautoconf2:
- error_tmp = prelist_add(new, dr);
- error = error_tmp ? error_tmp : error;
+ if ((ia6 = in6_pfx_newpersistaddr(new, mcast, &error))
+ != NULL) {
+ /*
+ * note that we should use pr (not new) for reference.
+ */
+ IFA_LOCK(&ia6->ia_ifa);
+ NDPR_LOCK(pr);
+ ia6->ia6_ndpr = pr;
+ NDPR_ADDREF_LOCKED(pr); /* for addr reference */
+ pr->ndpr_addrcnt++;
+ VERIFY(pr->ndpr_addrcnt != 0);
+ NDPR_UNLOCK(pr);
+ IFA_UNLOCK(&ia6->ia_ifa);
-#if MIP6
- if (mip6_probe_pfxrtrs_hook) {
- /* This is a new prefix, maybe we have moved. */
- (*mip6_probe_pfxrtrs_hook)();
- }
+ /*
+ * RFC 4941 3.3 (2).
+ * When a new public address is created as described
+ * in RFC 4862, also create a new temporary address.
+ *
+ * RFC 4941 3.5.
+ * When an interface connects to a new link, a new
+ * randomized interface identifier should be generated
+ * immediately together with a new set of temporary
+ * addresses. Thus, we specifiy 1 as the 2nd arg of
+ * in6_tmpifadd().
+ */
+ if (ip6_use_tempaddr) {
+ int e;
+ if ((e = in6_tmpifadd(ia6, 1)) != 0) {
+ nd6log((LOG_NOTICE, "prelist_update: "
+ "failed to create a temporary "
+ "address, errno=%d\n",
+ e));
+ }
+ }
+ IFA_REMREF(&ia6->ia_ifa);
+ ia6 = NULL;
- if (mip6_minus_a_case_hook) {
/*
- * If we are still looking for an autoconfigured home
- * address when we are in "minus a" case, here's a new
- * prefix and hopefully we can use the address derived
- *from that.
+ * A newly added address might affect the status
+ * of other addresses, so we check and update it.
+ * XXX: what if address duplication happens?
*/
- if (ia6)
- (*mip6_minus_a_case_hook)(new);
+ lck_mtx_lock(nd6_mutex);
+ pfxlist_onlink_check();
+ lck_mtx_unlock(nd6_mutex);
}
-#endif /* MIP6 */
-
}
- end:
- splx(s);
- return error;
+end:
+ if (pr != NULL)
+ NDPR_REMREF(pr);
+ if (ia6_match != NULL)
+ IFA_REMREF(&ia6_match->ia_ifa);
+ return (error);
}
/*
- * A supplement function used in the on-link detection below;
- * detect if a given prefix has a (probably) reachable advertising router.
- * XXX: lengthy function name...
+ * Neighbor Discover Default Router structure reference counting routines.
*/
-struct nd_pfxrouter *
-find_pfxlist_reachable_router(pr)
- struct nd_prefix *pr;
+static struct nd_defrouter *
+nddr_alloc(int how)
{
- struct nd_pfxrouter *pfxrtr;
- struct rtentry *rt;
- struct llinfo_nd6 *ln;
+ struct nd_defrouter *dr;
- for (pfxrtr = LIST_FIRST(&pr->ndpr_advrtrs); pfxrtr;
- pfxrtr = LIST_NEXT(pfxrtr, pfr_entry)) {
- if ((rt = nd6_lookup(&pfxrtr->router->rtaddr, 0,
- pfxrtr->router->ifp)) &&
- (ln = (struct llinfo_nd6 *)rt->rt_llinfo) &&
- ND6_IS_LLINFO_PROBREACH(ln))
- break; /* found */
+ dr = (how == M_WAITOK) ? zalloc(nddr_zone) : zalloc_noblock(nddr_zone);
+ if (dr != NULL) {
+ bzero(dr, nddr_size);
+ lck_mtx_init(&dr->nddr_lock, ifa_mtx_grp, ifa_mtx_attr);
+ dr->nddr_debug |= IFD_ALLOC;
+ if (nddr_debug != 0) {
+ dr->nddr_debug |= IFD_DEBUG;
+ dr->nddr_trace = nddr_trace;
+ }
}
+ return (dr);
+}
+
+static void
+nddr_free(struct nd_defrouter *dr)
+{
+ NDDR_LOCK(dr);
+ if (dr->nddr_debug & IFD_ATTACHED) {
+ panic("%s: attached nddr %p is being freed", __func__, dr);
+ /* NOTREACHED */
+ } else if (!(dr->nddr_debug & IFD_ALLOC)) {
+ panic("%s: nddr %p cannot be freed", __func__, dr);
+ /* NOTREACHED */
+ }
+ dr->nddr_debug &= ~IFD_ALLOC;
+ NDDR_UNLOCK(dr);
+
+ lck_mtx_destroy(&dr->nddr_lock, ifa_mtx_grp);
+ zfree(nddr_zone, dr);
+}
+
+static void
+nddr_trace(struct nd_defrouter *dr, int refhold)
+{
+ struct nd_defrouter_dbg *dr_dbg = (struct nd_defrouter_dbg *)dr;
+ ctrace_t *tr;
+ uint32_t idx;
+ uint16_t *cnt;
+
+ if (!(dr->nddr_debug & IFD_DEBUG)) {
+ panic("%s: nddr %p has no debug structure", __func__, dr);
+ /* NOTREACHED */
+ }
+ if (refhold) {
+ cnt = &dr_dbg->nddr_refhold_cnt;
+ tr = dr_dbg->nddr_refhold;
+ } else {
+ cnt = &dr_dbg->nddr_refrele_cnt;
+ tr = dr_dbg->nddr_refrele;
+ }
+
+ idx = atomic_add_16_ov(cnt, 1) % NDDR_TRACE_HIST_SIZE;
+ ctrace_record(&tr[idx]);
+}
+
+void
+nddr_addref(struct nd_defrouter *nddr, int locked)
+{
+
+ if (!locked)
+ NDDR_LOCK_SPIN(nddr);
+ else
+ NDDR_LOCK_ASSERT_HELD(nddr);
+
+ if (++nddr->nddr_refcount == 0) {
+ panic("%s: nddr %p wraparound refcnt\n", __func__, nddr);
+ /* NOTREACHED */
+ } else if (nddr->nddr_trace != NULL) {
+ (*nddr->nddr_trace)(nddr, TRUE);
+ }
+
+ if (!locked)
+ NDDR_UNLOCK(nddr);
+}
+
+struct nd_defrouter *
+nddr_remref(struct nd_defrouter *nddr, int locked)
+{
+
+ if (!locked)
+ NDDR_LOCK_SPIN(nddr);
+ else
+ NDDR_LOCK_ASSERT_HELD(nddr);
+
+ if (nddr->nddr_refcount == 0) {
+ panic("%s: nddr %p negative refcnt\n", __func__, nddr);
+ /* NOTREACHED */
+ } else if (nddr->nddr_trace != NULL) {
+ (*nddr->nddr_trace)(nddr, FALSE);
+ }
+
+ if (--nddr->nddr_refcount == 0) {
+ NDDR_UNLOCK(nddr);
+ nddr_free(nddr);
+ nddr = NULL;
+ }
+
+ if (!locked && nddr != NULL)
+ NDDR_UNLOCK(nddr);
+
+ return (nddr);
+}
+
+uint64_t
+nddr_getexpire(struct nd_defrouter *dr)
+{
+ struct timeval caltime;
+ uint64_t expiry;
+
+ if (dr->expire != 0) {
+ /* account for system time change */
+ getmicrotime(&caltime);
+
+ dr->base_calendartime +=
+ NET_CALCULATE_CLOCKSKEW(caltime,
+ dr->base_calendartime, net_uptime(), dr->base_uptime);
+
+ expiry = dr->base_calendartime +
+ dr->expire - dr->base_uptime;
+ } else {
+ expiry = 0;
+ }
+ return (expiry);
+}
+
+/*
+ * Neighbor Discover Prefix structure reference counting routines.
+ */
+static struct nd_prefix *
+ndpr_alloc(int how)
+{
+ struct nd_prefix *pr;
+
+ pr = (how == M_WAITOK) ? zalloc(ndpr_zone) : zalloc_noblock(ndpr_zone);
+ if (pr != NULL) {
+ bzero(pr, ndpr_size);
+ lck_mtx_init(&pr->ndpr_lock, ifa_mtx_grp, ifa_mtx_attr);
+ RB_INIT(&pr->ndpr_prproxy_sols);
+ pr->ndpr_debug |= IFD_ALLOC;
+ if (ndpr_debug != 0) {
+ pr->ndpr_debug |= IFD_DEBUG;
+ pr->ndpr_trace = ndpr_trace;
+ }
+ }
+ return (pr);
+}
+
+static void
+ndpr_free(struct nd_prefix *pr)
+{
+ NDPR_LOCK(pr);
+ if (pr->ndpr_debug & IFD_ATTACHED) {
+ panic("%s: attached ndpr %p is being freed", __func__, pr);
+ /* NOTREACHED */
+ } else if (!(pr->ndpr_debug & IFD_ALLOC)) {
+ panic("%s: ndpr %p cannot be freed", __func__, pr);
+ /* NOTREACHED */
+ } else if (pr->ndpr_rt != NULL) {
+ panic("%s: ndpr %p route %p not freed", __func__, pr,
+ pr->ndpr_rt);
+ /* NOTREACHED */
+ } else if (pr->ndpr_prproxy_sols_cnt != 0) {
+ panic("%s: ndpr %p non-zero solicitors count (%d)",
+ __func__, pr, pr->ndpr_prproxy_sols_cnt);
+ /* NOTREACHED */
+ } else if (!RB_EMPTY(&pr->ndpr_prproxy_sols)) {
+ panic("%s: ndpr %p non-empty solicitors tree", __func__, pr);
+ /* NOTREACHED */
+ }
+ pr->ndpr_debug &= ~IFD_ALLOC;
+ NDPR_UNLOCK(pr);
+
+ lck_mtx_destroy(&pr->ndpr_lock, ifa_mtx_grp);
+ zfree(ndpr_zone, pr);
+}
+
+static void
+ndpr_trace(struct nd_prefix *pr, int refhold)
+{
+ struct nd_prefix_dbg *pr_dbg = (struct nd_prefix_dbg *)pr;
+ ctrace_t *tr;
+ u_int32_t idx;
+ u_int16_t *cnt;
+
+ if (!(pr->ndpr_debug & IFD_DEBUG)) {
+ panic("%s: ndpr %p has no debug structure", __func__, pr);
+ /* NOTREACHED */
+ }
+ if (refhold) {
+ cnt = &pr_dbg->ndpr_refhold_cnt;
+ tr = pr_dbg->ndpr_refhold;
+ } else {
+ cnt = &pr_dbg->ndpr_refrele_cnt;
+ tr = pr_dbg->ndpr_refrele;
+ }
+
+ idx = atomic_add_16_ov(cnt, 1) % NDPR_TRACE_HIST_SIZE;
+ ctrace_record(&tr[idx]);
+}
+
+void
+ndpr_addref(struct nd_prefix *ndpr, int locked)
+{
+ if (!locked)
+ NDPR_LOCK_SPIN(ndpr);
+ else
+ NDPR_LOCK_ASSERT_HELD(ndpr);
+
+ if (++ndpr->ndpr_refcount == 0) {
+ panic("%s: ndpr %p wraparound refcnt\n", __func__, ndpr);
+ /* NOTREACHED */
+ } else if (ndpr->ndpr_trace != NULL) {
+ (*ndpr->ndpr_trace)(ndpr, TRUE);
+ }
+
+ if (!locked)
+ NDPR_UNLOCK(ndpr);
+}
+
+struct nd_prefix *
+ndpr_remref(struct nd_prefix *ndpr, int locked)
+{
+ if (!locked)
+ NDPR_LOCK_SPIN(ndpr);
+ else
+ NDPR_LOCK_ASSERT_HELD(ndpr);
+
+ if (ndpr->ndpr_refcount == 0) {
+ panic("%s: ndpr %p negative refcnt\n", __func__, ndpr);
+ /* NOTREACHED */
+ } else if (ndpr->ndpr_trace != NULL) {
+ (*ndpr->ndpr_trace)(ndpr, FALSE);
+ }
+
+ if (--ndpr->ndpr_refcount == 0) {
+ if (ndpr->ndpr_addrcnt != 0) {
+ panic("%s: freeing ndpr %p with outstanding address "
+ "reference (%d)", __func__, ndpr,
+ ndpr->ndpr_addrcnt);
+ /* NOTREACHED */
+ }
+ NDPR_UNLOCK(ndpr);
+ ndpr_free(ndpr);
+ ndpr = NULL;
+ }
+
+ if (!locked && ndpr != NULL)
+ NDPR_UNLOCK(ndpr);
+
+ return (ndpr);
+}
+
+uint64_t
+ndpr_getexpire(struct nd_prefix *pr)
+{
+ struct timeval caltime;
+ uint64_t expiry;
+
+ if (pr->ndpr_expire != 0 && pr->ndpr_vltime != ND6_INFINITE_LIFETIME) {
+ /* account for system time change */
+ getmicrotime(&caltime);
+
+ pr->ndpr_base_calendartime +=
+ NET_CALCULATE_CLOCKSKEW(caltime,
+ pr->ndpr_base_calendartime, net_uptime(),
+ pr->ndpr_base_uptime);
+
+ expiry = pr->ndpr_base_calendartime +
+ pr->ndpr_expire - pr->ndpr_base_uptime;
+ } else {
+ expiry = 0;
+ }
+ return (expiry);
+}
+
+/*
+ * A supplement function used in the on-link detection below;
+ * detect if a given prefix has a (probably) reachable advertising router.
+ * XXX: lengthy function name...
+ *
+ * Callers *must* increase the reference count of nd_prefix.
+ */
+static struct nd_pfxrouter *
+find_pfxlist_reachable_router(struct nd_prefix *pr)
+{
+ struct nd_pfxrouter *pfxrtr;
+ struct rtentry *rt;
+ struct llinfo_nd6 *ln;
+ struct ifnet *ifp;
+ struct in6_addr rtaddr;
+ unsigned int genid;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ NDPR_LOCK_ASSERT_HELD(pr);
+
+ genid = pr->ndpr_genid;
+ pfxrtr = LIST_FIRST(&pr->ndpr_advrtrs);
+ while (pfxrtr) {
+ ifp = pfxrtr->router->ifp;
+ if (pfxrtr->router->stateflags & NDDRF_MAPPED)
+ rtaddr = pfxrtr->router->rtaddr_mapped;
+ else
+ rtaddr = pfxrtr->router->rtaddr;
+
+ NDPR_UNLOCK(pr);
+ lck_mtx_unlock(nd6_mutex);
+ /* Callee returns a locked route upon success */
+ if ((rt = nd6_lookup(&rtaddr, 0, ifp, 0)) != NULL) {
+ RT_LOCK_ASSERT_HELD(rt);
+ if ((ln = rt->rt_llinfo) != NULL &&
+ ND6_IS_LLINFO_PROBREACH(ln)) {
+ RT_REMREF_LOCKED(rt);
+ RT_UNLOCK(rt);
+ lck_mtx_lock(nd6_mutex);
+ NDPR_LOCK(pr);
+ break; /* found */
+ }
+ RT_REMREF_LOCKED(rt);
+ RT_UNLOCK(rt);
+ }
+ lck_mtx_lock(nd6_mutex);
+ NDPR_LOCK(pr);
+ if (pr->ndpr_genid != genid) {
+ pfxrtr = LIST_FIRST(&pr->ndpr_advrtrs);
+ genid = pr->ndpr_genid;
+ } else
+ pfxrtr = LIST_NEXT(pfxrtr, pfr_entry);
+ }
+ NDPR_LOCK_ASSERT_HELD(pr);
- return(pfxrtr);
+ return (pfxrtr);
}
/*
* Check if each prefix in the prefix list has at least one available router
- * that advertised the prefix (A router is "available" if its neighbor cache
- * entry has reachable or probably reachable).
+ * that advertised the prefix (a router is "available" if its neighbor cache
+ * entry is reachable or probably reachable).
* If the check fails, the prefix may be off-link, because, for example,
* we have moved from the network but the lifetime of the prefix has not
- * been expired yet. So we should not use the prefix if there is another
- * prefix that has an available router.
- * But if there is no prefix that has an available router, we still regards
- * all the prefixes as on-link. This is because we can't tell if all the
+ * expired yet. So we should not use the prefix if there is another prefix
+ * that has an available router.
+ * But, if there is no prefix that has an available router, we still regards
+ * all the prefixes as on-link. This is because we can't tell if all the
* routers are simply dead or if we really moved from the network and there
* is no router around us.
*/
void
-pfxlist_onlink_check()
+pfxlist_onlink_check(void)
{
- struct nd_prefix *pr;
+ struct nd_prefix *pr, *prclear;
+ struct in6_ifaddr *ifa;
+ struct nd_defrouter *dr;
+ struct nd_pfxrouter *pfxrtr = NULL;
+ int err, i, found = 0;
+ struct ifaddr **ifap = NULL;
+ struct nd_prefix *ndpr;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ while (nd_prefix_busy) {
+ nd_prefix_waiters++;
+ msleep(nd_prefix_waitchan, nd6_mutex, (PZERO-1),
+ __func__, NULL);
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+ }
+ nd_prefix_busy = TRUE;
/*
* Check if there is a prefix that has a reachable advertising
* router.
*/
- for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
- if (find_pfxlist_reachable_router(pr))
+ pr = nd_prefix.lh_first;
+ while (pr) {
+ NDPR_LOCK(pr);
+ if (pr->ndpr_stateflags & NDPRF_PROCESSED_ONLINK) {
+ NDPR_UNLOCK(pr);
+ pr = pr->ndpr_next;
+ continue;
+ }
+ NDPR_ADDREF_LOCKED(pr);
+ if (pr->ndpr_raf_onlink && find_pfxlist_reachable_router(pr) &&
+ (pr->ndpr_debug & IFD_ATTACHED)) {
+ if (NDPR_REMREF_LOCKED(pr) == NULL)
+ pr = NULL;
+ else
+ NDPR_UNLOCK(pr);
break;
+ }
+ pr->ndpr_stateflags |= NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(pr);
+ NDPR_REMREF(pr);
+ /*
+ * Since find_pfxlist_reachable_router() drops the nd6_mutex, we
+ * have to start over, but the NDPRF_PROCESSED_ONLINK flag will
+ * stop us from checking the same prefix twice.
+ */
+ pr = nd_prefix.lh_first;
}
-
- if (pr) {
+ LIST_FOREACH(prclear, &nd_prefix, ndpr_entry) {
+ NDPR_LOCK(prclear);
+ prclear->ndpr_stateflags &= ~NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(prclear);
+ }
+ /*
+ * If we have no such prefix, check whether we still have a router
+ * that does not advertise any prefixes.
+ */
+ if (pr == NULL) {
+ for (dr = TAILQ_FIRST(&nd_defrouter); dr;
+ dr = TAILQ_NEXT(dr, dr_entry)) {
+ struct nd_prefix *pr0;
+
+ for (pr0 = nd_prefix.lh_first; pr0;
+ pr0 = pr0->ndpr_next) {
+ NDPR_LOCK(pr0);
+ if ((pfxrtr = pfxrtr_lookup(pr0, dr)) != NULL) {
+ NDPR_UNLOCK(pr0);
+ break;
+ }
+ NDPR_UNLOCK(pr0);
+ }
+ if (pfxrtr != NULL)
+ break;
+ }
+ }
+ if (pr != NULL || (TAILQ_FIRST(&nd_defrouter) && pfxrtr == NULL)) {
/*
- * There is at least one prefix that has a reachable router.
- * First, detach prefixes which has no reachable advertising
- * router and then attach other prefixes.
- * The order is important since an attached prefix and a
- * detached prefix may have a same interface route.
+ * There is at least one prefix that has a reachable router,
+ * or at least a router which probably does not advertise
+ * any prefixes. The latter would be the case when we move
+ * to a new link where we have a router that does not provide
+ * prefixes and we configure an address by hand.
+ * Detach prefixes which have no reachable advertising
+ * router, and attach other prefixes.
*/
- for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
- if (find_pfxlist_reachable_router(pr) == NULL &&
- pr->ndpr_statef_onlink) {
- pr->ndpr_statef_onlink = 0;
- nd6_detach_prefix(pr);
+ pr = nd_prefix.lh_first;
+ while (pr) {
+ NDPR_LOCK(pr);
+ /*
+ * We aren't interested prefixes already processed,
+ * nor in prefixes without the L bit
+ * set nor in static prefixes
+ */
+ if (pr->ndpr_raf_onlink == 0 ||
+ pr->ndpr_stateflags & NDPRF_PROCESSED_ONLINK ||
+ pr->ndpr_stateflags & NDPRF_STATIC) {
+ NDPR_UNLOCK(pr);
+ pr = pr->ndpr_next;
+ continue;
}
+ NDPR_ADDREF_LOCKED(pr);
+ if ((pr->ndpr_stateflags & NDPRF_DETACHED) == 0 &&
+ find_pfxlist_reachable_router(pr) == NULL &&
+ (pr->ndpr_debug & IFD_ATTACHED))
+ pr->ndpr_stateflags |= NDPRF_DETACHED;
+ if ((pr->ndpr_stateflags & NDPRF_DETACHED) != 0 &&
+ find_pfxlist_reachable_router(pr) != NULL &&
+ (pr->ndpr_debug & IFD_ATTACHED))
+ pr->ndpr_stateflags &= ~NDPRF_DETACHED;
+ pr->ndpr_stateflags |= NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(pr);
+ NDPR_REMREF(pr);
+ /*
+ * Since find_pfxlist_reachable_router() drops the
+ * nd6_mutex, we have to start over, but the
+ * NDPRF_PROCESSED_ONLINK flag will stop us from
+ * checking the same prefix twice.
+ */
+ pr = nd_prefix.lh_first;
}
+ } else {
+ /* there is no prefix that has a reachable router */
for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
- if (find_pfxlist_reachable_router(pr) &&
- pr->ndpr_statef_onlink == 0)
- nd6_attach_prefix(pr);
+ NDPR_LOCK(pr);
+ if (pr->ndpr_raf_onlink == 0 ||
+ pr->ndpr_stateflags & NDPRF_STATIC) {
+ NDPR_UNLOCK(pr);
+ continue;
+ }
+ if ((pr->ndpr_stateflags & NDPRF_DETACHED) != 0)
+ pr->ndpr_stateflags &= ~NDPRF_DETACHED;
+ NDPR_UNLOCK(pr);
}
}
- else {
- /* there is no prefix that has a reachable router */
- for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next)
- if (pr->ndpr_statef_onlink == 0)
- nd6_attach_prefix(pr);
+ LIST_FOREACH(prclear, &nd_prefix, ndpr_entry) {
+ NDPR_LOCK(prclear);
+ prclear->ndpr_stateflags &= ~NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(prclear);
}
-}
-
-static void
-nd6_detach_prefix(pr)
- struct nd_prefix *pr;
-{
- struct in6_ifaddr *ia6;
- struct sockaddr_in6 sa6, mask6;
-
/*
- * Delete the interface route associated with the prefix.
+ * Remove each interface route associated with a (just) detached
+ * prefix, and reinstall the interface route for a (just) attached
+ * prefix. Note that all attempt of reinstallation does not
+ * necessarily success, when a same prefix is shared among multiple
+ * interfaces. Such cases will be handled in nd6_prefix_onlink,
+ * so we don't have to care about them.
*/
- bzero(&sa6, sizeof(sa6));
- sa6.sin6_family = AF_INET6;
- sa6.sin6_len = sizeof(sa6);
- bcopy(&pr->ndpr_prefix.sin6_addr, &sa6.sin6_addr,
- sizeof(struct in6_addr));
- bzero(&mask6, sizeof(mask6));
- mask6.sin6_family = AF_INET6;
- mask6.sin6_len = sizeof(sa6);
- bcopy(&pr->ndpr_mask, &mask6.sin6_addr, sizeof(struct in6_addr));
- {
+ pr = nd_prefix.lh_first;
+ while (pr) {
int e;
- e = rtrequest(RTM_DELETE, (struct sockaddr *)&sa6, NULL,
- (struct sockaddr *)&mask6, 0, NULL);
- if (e) {
- log(LOG_ERR,
- "nd6_detach_prefix: failed to delete route: "
- "%s/%d (errno = %d)\n",
- ip6_sprintf(&sa6.sin6_addr),
- pr->ndpr_plen,
- e);
+ NDPR_LOCK(pr);
+ if (pr->ndpr_raf_onlink == 0 ||
+ pr->ndpr_stateflags & NDPRF_STATIC ||
+ pr->ndpr_stateflags & NDPRF_PROCESSED_ONLINK ||
+ pr->ndpr_stateflags & NDPRF_DEFUNCT) {
+ NDPR_UNLOCK(pr);
+ pr = pr->ndpr_next;
+ continue;
+ }
+ pr->ndpr_stateflags |= NDPRF_PROCESSED_ONLINK;
+ NDPR_ADDREF_LOCKED(pr);
+ if ((pr->ndpr_stateflags & NDPRF_DETACHED) != 0 &&
+ (pr->ndpr_stateflags & NDPRF_ONLINK) != 0) {
+ NDPR_UNLOCK(pr);
+ lck_mtx_unlock(nd6_mutex);
+ if ((e = nd6_prefix_offlink(pr)) != 0) {
+ nd6log((LOG_ERR,
+ "pfxlist_onlink_check: failed to "
+ "make %s/%d offlink, errno=%d\n",
+ ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, e));
+ }
+ lck_mtx_lock(nd6_mutex);
+ NDPR_REMREF(pr);
+ pr = nd_prefix.lh_first;
+ continue;
+ }
+ if ((pr->ndpr_stateflags & NDPRF_DETACHED) == 0 &&
+ (pr->ndpr_stateflags & NDPRF_ONLINK) == 0 &&
+ pr->ndpr_raf_onlink) {
+ NDPR_UNLOCK(pr);
+ if ((e = nd6_prefix_onlink(pr)) != 0) {
+ nd6log((LOG_ERR,
+ "pfxlist_onlink_check: failed to "
+ "make %s/%d offlink, errno=%d\n",
+ ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, e));
+ }
+ NDPR_REMREF(pr);
+ pr = nd_prefix.lh_first;
+ continue;
+ } else {
+ NDPR_UNLOCK(pr);
}
+ NDPR_REMREF(pr);
+ pr = pr->ndpr_next;
+ }
+ LIST_FOREACH(prclear, &nd_prefix, ndpr_entry) {
+ NDPR_LOCK(prclear);
+ prclear->ndpr_stateflags &= ~NDPRF_PROCESSED_ONLINK;
+ NDPR_UNLOCK(prclear);
+ }
+ VERIFY(nd_prefix_busy);
+ nd_prefix_busy = FALSE;
+ if (nd_prefix_waiters > 0) {
+ nd_prefix_waiters = 0;
+ wakeup(nd_prefix_waitchan);
}
/*
- * Mark the address derived from the prefix detached so that
- * it won't be used as a source address for a new connection.
+ * Changes on the prefix status might affect address status as well.
+ * Make sure that all addresses derived from an attached prefix are
+ * attached, and that all addresses derived from a detached prefix are
+ * detached. Note, however, that a manually configured address should
+ * always be attached.
+ * The precise detection logic is same as the one for prefixes.
+ *
+ * ifnet_get_address_list_family_internal() may fail due to memory
+ * pressure, but we will eventually be called again when we receive
+ * another NA, RA, or when the link status changes.
*/
- if (IN6_IS_ADDR_UNSPECIFIED(&pr->ndpr_addr))
- ia6 = NULL;
- else
- ia6 = in6ifa_ifpwithaddr(pr->ndpr_ifp, &pr->ndpr_addr);
- if (ia6)
-#if MIP6
- if (mip6_get_home_prefix_hook)
- if (pr != (*mip6_get_home_prefix_hook)())
- ia6->ia6_flags |= IN6_IFF_DETACHED;
-#else
- ia6->ia6_flags |= IN6_IFF_DETACHED;
-#endif
+ err = ifnet_get_address_list_family_internal(NULL, &ifap, AF_INET6, 0,
+ M_NOWAIT, 0);
+ if (err != 0 || ifap == NULL) {
+ nd6log((LOG_ERR, "%s: ifnet_get_address_list_family_internal "
+ "failed", __func__));
+ return;
+ }
+ for (i = 0; ifap[i]; i++) {
+ ifa = ifatoia6(ifap[i]);
+ IFA_LOCK(&ifa->ia_ifa);
+ if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0 ||
+ (ifap[i]->ifa_debug & IFD_ATTACHED) == 0) {
+ IFA_UNLOCK(&ifa->ia_ifa);
+ continue;
+ }
+ if ((ndpr = ifa->ia6_ndpr) == NULL) {
+ /*
+ * This can happen when we first configure the address
+ * (i.e. the address exists, but the prefix does not).
+ * XXX: complicated relationships...
+ */
+ IFA_UNLOCK(&ifa->ia_ifa);
+ continue;
+ }
+ IFA_UNLOCK(&ifa->ia_ifa);
+
+ NDPR_LOCK(ndpr);
+ NDPR_ADDREF_LOCKED(ndpr);
+ if (find_pfxlist_reachable_router(ndpr)) {
+ if (NDPR_REMREF_LOCKED(ndpr) == NULL) {
+ found = 0;
+ } else {
+ NDPR_UNLOCK(ndpr);
+ found = 1;
+ }
+ break;
+ }
+ NDPR_UNLOCK(ndpr);
+ NDPR_REMREF(ndpr);
+ }
+ if (found) {
+ for (i = 0; ifap[i]; i++) {
+ ifa = ifatoia6(ifap[i]);
+ IFA_LOCK(&ifa->ia_ifa);
+ if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0 ||
+ (ifap[i]->ifa_debug & IFD_ATTACHED) == 0) {
+ IFA_UNLOCK(&ifa->ia_ifa);
+ continue;
+ }
+ if ((ndpr = ifa->ia6_ndpr) == NULL) {
+ /* XXX: see above. */
+ IFA_UNLOCK(&ifa->ia_ifa);
+ continue;
+ }
+ IFA_UNLOCK(&ifa->ia_ifa);
+ NDPR_LOCK(ndpr);
+ NDPR_ADDREF_LOCKED(ndpr);
+ if (find_pfxlist_reachable_router(ndpr)) {
+ NDPR_UNLOCK(ndpr);
+ IFA_LOCK(&ifa->ia_ifa);
+ if (ifa->ia6_flags & IN6_IFF_DETACHED) {
+ ifa->ia6_flags &= ~IN6_IFF_DETACHED;
+ in6_ifaddr_set_dadprogress((struct in6_ifaddr *)ifa);
+ IFA_UNLOCK(&ifa->ia_ifa);
+ nd6_dad_start((struct ifaddr *)ifa, 0);
+ } else {
+ IFA_UNLOCK(&ifa->ia_ifa);
+ }
+ } else {
+ NDPR_UNLOCK(ndpr);
+ IFA_LOCK(&ifa->ia_ifa);
+ ifa->ia6_flags |= IN6_IFF_DETACHED;
+ IFA_UNLOCK(&ifa->ia_ifa);
+ }
+ NDPR_REMREF(ndpr);
+ }
+ } else {
+ for (i = 0; ifap[i]; i++) {
+ ifa = ifatoia6(ifap[i]);
+ IFA_LOCK(&ifa->ia_ifa);
+ if ((ifa->ia6_flags & IN6_IFF_AUTOCONF) == 0) {
+ IFA_UNLOCK(&ifa->ia_ifa);
+ continue;
+ }
+ if (ifa->ia6_flags & IN6_IFF_DETACHED) {
+ ifa->ia6_flags &= ~IN6_IFF_DETACHED;
+ in6_ifaddr_set_dadprogress((struct in6_ifaddr *)ifa);
+ IFA_UNLOCK(&ifa->ia_ifa);
+ /* Do we need a delay in this case? */
+ nd6_dad_start((struct ifaddr *)ifa, 0);
+ } else {
+ IFA_UNLOCK(&ifa->ia_ifa);
+ }
+ }
+ }
+ ifnet_free_address_list(ifap);
}
+static struct nd_prefix *
+nd6_prefix_equal_lookup(struct nd_prefix *pr, boolean_t primary_only)
+{
+ struct nd_prefix *opr;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ for (opr = nd_prefix.lh_first; opr; opr = opr->ndpr_next) {
+ if (opr == pr)
+ continue;
+
+ NDPR_LOCK(opr);
+ if ((opr->ndpr_stateflags & NDPRF_ONLINK) == 0) {
+ NDPR_UNLOCK(opr);
+ continue;
+ }
+ if (opr->ndpr_plen == pr->ndpr_plen &&
+ in6_are_prefix_equal(&pr->ndpr_prefix.sin6_addr,
+ &opr->ndpr_prefix.sin6_addr, pr->ndpr_plen) &&
+ (!primary_only ||
+ !(opr->ndpr_stateflags & NDPRF_IFSCOPE))) {
+ NDPR_ADDREF_LOCKED(opr);
+ NDPR_UNLOCK(opr);
+ return (opr);
+ }
+ NDPR_UNLOCK(opr);
+ }
+ return (NULL);
+}
+
+/*
+ * Synchronize the interface routes of similar prefixes on different
+ * interfaces; the one using the default interface would be (re)installed
+ * as a primary/non-scoped entry, and the rest as scoped entri(es).
+ */
static void
-nd6_attach_prefix(pr)
- struct nd_prefix *pr;
+nd6_prefix_sync(struct ifnet *ifp)
+{
+ struct nd_prefix *pr, *opr;
+ int err = 0;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ if (ifp == NULL)
+ return;
+
+ for (pr = nd_prefix.lh_first; pr; pr = pr->ndpr_next) {
+ NDPR_LOCK(pr);
+ if (!(pr->ndpr_stateflags & NDPRF_ONLINK)) {
+ NDPR_UNLOCK(pr);
+ continue;
+ }
+ if (pr->ndpr_ifp == ifp &&
+ (pr->ndpr_stateflags & NDPRF_IFSCOPE) &&
+ !IN6_IS_ADDR_LINKLOCAL(&pr->ndpr_prefix.sin6_addr)) {
+ NDPR_UNLOCK(pr);
+ break;
+ }
+ NDPR_UNLOCK(pr);
+ }
+
+ if (pr == NULL)
+ return;
+
+ /* Remove conflicting entries */
+ opr = nd6_prefix_equal_lookup(pr, TRUE);
+ if (opr != NULL) {
+ lck_mtx_unlock(nd6_mutex);
+ err = nd6_prefix_offlink(opr);
+ lck_mtx_lock(nd6_mutex);
+ if (err != 0) {
+ nd6log((LOG_ERR,
+ "%s: failed to make %s/%d offlink on %s, "
+ "errno=%d\n", __func__,
+ ip6_sprintf(&opr->ndpr_prefix.sin6_addr),
+ opr->ndpr_plen, if_name(opr->ndpr_ifp), err));
+ }
+ } else {
+ nd6log((LOG_ERR,
+ "%s: scoped %s/%d on %s has no matching unscoped prefix\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp)));
+ }
+
+ lck_mtx_unlock(nd6_mutex);
+ err = nd6_prefix_offlink(pr);
+ lck_mtx_lock(nd6_mutex);
+ if (err != 0) {
+ nd6log((LOG_ERR,
+ "%s: failed to make %s/%d offlink on %s, errno=%d\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp), err));
+ }
+
+ /* Add the entries back */
+ if (opr != NULL) {
+ err = nd6_prefix_onlink_scoped(opr, opr->ndpr_ifp->if_index);
+ if (err != 0) {
+ nd6log((LOG_ERR,
+ "%s: failed to make %s/%d scoped onlink on %s, "
+ "errno=%d\n", __func__,
+ ip6_sprintf(&opr->ndpr_prefix.sin6_addr),
+ opr->ndpr_plen, if_name(opr->ndpr_ifp), err));
+ }
+ }
+
+ err = nd6_prefix_onlink_scoped(pr, IFSCOPE_NONE);
+ if (err != 0) {
+ nd6log((LOG_ERR,
+ "%s: failed to make %s/%d onlink on %s, errno=%d\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp), err));
+ }
+
+ if (err != 0) {
+ nd6log((LOG_ERR,
+ "%s: error promoting %s/%d to %s from %s\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp),
+ (opr != NULL) ? if_name(opr->ndpr_ifp) : "NONE"));
+ } else {
+ nd6log2((LOG_INFO,
+ "%s: %s/%d promoted, previously on %s\n",
+ if_name(pr->ndpr_ifp),
+ ip6_sprintf(&pr->ndpr_prefix.sin6_addr), pr->ndpr_plen,
+ (opr != NULL) ? if_name(opr->ndpr_ifp) : "NONE"));
+ }
+
+ if (opr != NULL)
+ NDPR_REMREF(opr);
+}
+
+static int
+nd6_prefix_onlink_common(struct nd_prefix *pr, boolean_t force_scoped,
+ unsigned int ifscope)
{
struct ifaddr *ifa;
- struct in6_ifaddr *ia6;
+ struct ifnet *ifp = pr->ndpr_ifp;
+ struct sockaddr_in6 mask6, prefix;
+ struct nd_prefix *opr;
+ u_int32_t rtflags;
+ int error = 0, prproxy = 0;
+ struct rtentry *rt = NULL;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_OWNED);
+
+ /* sanity check */
+ NDPR_LOCK(pr);
+ if ((pr->ndpr_stateflags & NDPRF_ONLINK) != 0) {
+ nd6log((LOG_ERR,
+ "%s: %s/%d on %s scoped=%d is already on-link\n",
+ __func__, ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp),
+ (pr->ndpr_stateflags & NDPRF_IFSCOPE) ? 1 : 0);
+ NDPR_UNLOCK(pr);
+ return (EEXIST));
+ }
+ NDPR_UNLOCK(pr);
/*
- * Add the interface route associated with the prefix(if necessary)
- * Should we consider if the L bit is set in pr->ndpr_flags?
+ * Add the interface route associated with the prefix. Before
+ * installing the route, check if there's the same prefix on another
+ * interface, and the prefix has already installed the interface route.
*/
- ifa = ifaof_ifpforaddr((struct sockaddr *)&pr->ndpr_prefix,
- pr->ndpr_ifp);
+ opr = nd6_prefix_equal_lookup(pr, FALSE);
+ if (opr != NULL)
+ NDPR_REMREF(opr);
+
+ if (!force_scoped) {
+ /*
+ * If a primary/non-scoped interface route already exists,
+ * install the new one as a scoped entry. If the existing
+ * interface route is scoped, install new as non-scoped.
+ */
+ ifscope = (opr != NULL) ? ifp->if_index : IFSCOPE_NONE;
+ opr = nd6_prefix_equal_lookup(pr, TRUE);
+ if (opr != NULL)
+ NDPR_REMREF(opr);
+ else if (ifscope != IFSCOPE_NONE)
+ ifscope = IFSCOPE_NONE;
+ }
+
+ /*
+ * We prefer link-local addresses as the associated interface address.
+ */
+ /* search for a link-local addr */
+ ifa = (struct ifaddr *)in6ifa_ifpforlinklocal(ifp,
+ IN6_IFF_NOTREADY | IN6_IFF_ANYCAST);
if (ifa == NULL) {
- log(LOG_ERR,
- "nd6_attach_prefix: failed to find any ifaddr"
- " to add route for a prefix(%s/%d)\n",
- ip6_sprintf(&pr->ndpr_addr), pr->ndpr_plen);
+ struct in6_ifaddr *ia6;
+ ifnet_lock_shared(ifp);
+ IFP_TO_IA6(ifp, ia6);
+ ifnet_lock_done(ifp);
+ if (ia6 != NULL)
+ ifa = &ia6->ia_ifa;
+ /* should we care about ia6_flags? */
}
- else {
- int e;
- struct sockaddr_in6 mask6;
-
- bzero(&mask6, sizeof(mask6));
- mask6.sin6_family = AF_INET6;
- mask6.sin6_len = sizeof(mask6);
- mask6.sin6_addr = pr->ndpr_mask;
- e = rtrequest(RTM_ADD, (struct sockaddr *)&pr->ndpr_prefix,
- ifa->ifa_addr, (struct sockaddr *)&mask6,
- ifa->ifa_flags, NULL);
- if (e == 0)
- pr->ndpr_statef_onlink = 1;
- else {
- log(LOG_ERR,
- "nd6_attach_prefix: failed to add route for"
- " a prefix(%s/%d), errno = %d\n",
- ip6_sprintf(&pr->ndpr_addr), pr->ndpr_plen, e);
- }
+ NDPR_LOCK(pr);
+ if (ifa == NULL) {
+ /*
+ * This can still happen, when, for example, we receive an RA
+ * containing a prefix with the L bit set and the A bit clear,
+ * after removing all IPv6 addresses on the receiving
+ * interface. This should, of course, be rare though.
+ */
+ nd6log((LOG_NOTICE,
+ "nd6_prefix_onlink: failed to find any ifaddr"
+ " to add route for a prefix(%s/%d) on %s\n",
+ ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(ifp)));
+ NDPR_UNLOCK(pr);
+ return (0);
}
/*
- * Now the address derived from the prefix can be used as a source
- * for a new connection, so clear the detached flag.
+ * in6_ifinit() sets nd6_rtrequest to ifa_rtrequest for all ifaddrs.
+ * ifa->ifa_rtrequest = nd6_rtrequest;
*/
- if (IN6_IS_ADDR_UNSPECIFIED(&pr->ndpr_addr))
- ia6 = NULL;
- else
- ia6 = in6ifa_ifpwithaddr(pr->ndpr_ifp, &pr->ndpr_addr);
- if (ia6) {
- ia6->ia6_flags &= ~IN6_IFF_DETACHED;
- if (pr->ndpr_statef_onlink)
- ia6->ia_flags |= IFA_ROUTE;
+ bzero(&mask6, sizeof (mask6));
+ mask6.sin6_len = sizeof (mask6);
+ mask6.sin6_addr = pr->ndpr_mask;
+ prefix = pr->ndpr_prefix;
+ if ((rt = pr->ndpr_rt) != NULL)
+ pr->ndpr_rt = NULL;
+ NDPR_ADDREF_LOCKED(pr); /* keep reference for this routine */
+ NDPR_UNLOCK(pr);
+
+ IFA_LOCK_SPIN(ifa);
+ rtflags = ifa->ifa_flags | RTF_CLONING | RTF_UP;
+ IFA_UNLOCK(ifa);
+ if (nd6_need_cache(ifp)) {
+ /* explicitly set in case ifa_flags does not set the flag. */
+ rtflags |= RTF_CLONING;
+ } else {
+ /*
+ * explicitly clear the cloning bit in case ifa_flags sets it.
+ */
+ rtflags &= ~RTF_CLONING;
}
-}
-static struct in6_ifaddr *
-in6_ifadd(ifp, in6, addr, prefixlen)
- struct ifnet *ifp;
- struct in6_addr *in6;
- struct in6_addr *addr;
- int prefixlen; /* prefix len of the new prefix in "in6" */
-{
- struct ifaddr *ifa;
- struct in6_ifaddr *ia, *ib, *oia;
- int s, error;
- struct in6_addr mask;
+ lck_mtx_unlock(nd6_mutex);
- in6_len2mask(&mask, prefixlen);
+ if (rt != NULL) {
+ rtfree(rt);
+ rt = NULL;
+ }
- /* find link-local address (will be interface ID) */
- ifa = (struct ifaddr *)in6ifa_ifpforlinklocal(ifp, 0);/* 0 is OK? */
- if (ifa)
- ib = (struct in6_ifaddr *)ifa;
- else
- return NULL;
+ error = rtrequest_scoped(RTM_ADD, (struct sockaddr *)&prefix,
+ ifa->ifa_addr, (struct sockaddr *)&mask6, rtflags, &rt,
+ ifscope);
-#if 0 /* don't care link local addr state, and always do DAD */
- /* if link-local address is not eligible, do not autoconfigure. */
- if (((struct in6_ifaddr *)ifa)->ia6_flags & IN6_IFF_NOTREADY) {
- printf("in6_ifadd: link-local address not ready\n");
- return NULL;
- }
-#endif
+ /*
+ * Serialize the setting of NDPRF_PRPROXY.
+ */
+ lck_mtx_lock(&proxy6_lock);
- /* prefixlen + ifidlen must be equal to 128 */
- if (prefixlen != in6_mask2len(&ib->ia_prefixmask.sin6_addr)) {
- log(LOG_ERR, "in6_ifadd: wrong prefixlen for %s"
- "(prefix=%d ifid=%d)\n", if_name(ifp),
- prefixlen,
- 128 - in6_mask2len(&ib->ia_prefixmask.sin6_addr));
- return NULL;
+ if (rt != NULL) {
+ RT_LOCK(rt);
+ nd6_rtmsg(RTM_ADD, rt);
+ RT_UNLOCK(rt);
+ NDPR_LOCK(pr);
+ } else {
+ NDPR_LOCK(pr);
+ nd6log((LOG_ERR, "nd6_prefix_onlink: failed to add route for a"
+ " prefix (%s/%d) on %s, gw=%s, mask=%s, flags=%lx,"
+ " scoped=%d, errno = %d\n",
+ ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(ifp),
+ ip6_sprintf(&((struct sockaddr_in6 *)
+ (void *)ifa->ifa_addr)->sin6_addr),
+ ip6_sprintf(&mask6.sin6_addr), rtflags,
+ (ifscope != IFSCOPE_NONE), error));
}
+ NDPR_LOCK_ASSERT_HELD(pr);
+
+ pr->ndpr_stateflags &= ~(NDPRF_IFSCOPE | NDPRF_PRPROXY);
+
+ /*
+ * TODO: If the prefix route exists, we should really find it and
+ * refer the prefix to it; otherwise ndpr_rt is NULL.
+ */
+ if (!(pr->ndpr_stateflags & NDPRF_DEFUNCT) &&
+ (rt != NULL || error == EEXIST)) {
+ struct nd_ifinfo *ndi = NULL;
+
+ VERIFY(pr->ndpr_prproxy_sols_cnt == 0);
+ VERIFY(RB_EMPTY(&pr->ndpr_prproxy_sols));
+
+ ndi = ND_IFINFO(ifp);
+ VERIFY((NULL != ndi) && (TRUE == ndi->initialized));
+ lck_mtx_lock(&ndi->lock);
+
+ pr->ndpr_rt = rt; /* keep reference from rtrequest */
+ pr->ndpr_stateflags |= NDPRF_ONLINK;
+ if (ifscope != IFSCOPE_NONE) {
+ pr->ndpr_stateflags |= NDPRF_IFSCOPE;
+ } else if ((rtflags & RTF_CLONING) &&
+ (ndi->flags & ND6_IFF_PROXY_PREFIXES) &&
+ !IN6_IS_ADDR_LINKLOCAL(&pr->ndpr_prefix.sin6_addr)) {
+ /*
+ * At present, in order for the prefix to be eligible
+ * as a proxying/proxied prefix, we require that the
+ * prefix route entry be marked as a cloning route with
+ * RTF_PROXY; i.e. nd6_need_cache() needs to return
+ * true for the interface type, hence the test for
+ * RTF_CLONING above.
+ */
+ pr->ndpr_stateflags |= NDPRF_PRPROXY;
+ }
+
+ lck_mtx_unlock(&ndi->lock);
+ } else if (rt != NULL && pr->ndpr_stateflags & NDPRF_DEFUNCT)
+ rtfree(rt);
+
+ prproxy = (pr->ndpr_stateflags & NDPRF_PRPROXY);
+ VERIFY(!prproxy || !(pr->ndpr_stateflags & NDPRF_IFSCOPE));
+ NDPR_UNLOCK(pr);
+
+ IFA_REMREF(ifa);
+
+ /*
+ * If this is an upstream prefix, find the downstream ones (if any)
+ * and re-configure their prefix routes accordingly. Otherwise,
+ * this could be potentially be a downstream prefix, and so find the
+ * upstream prefix, if any.
+ */
+ nd6_prproxy_prelist_update(pr, prproxy ? pr : NULL);
- /* make ifaddr */
- ia = (struct in6_ifaddr *)_MALLOC(sizeof(*ia), M_IFADDR, M_NOWAIT);
- if (ia == NULL) {
- printf("ENOBUFS in in6_ifadd %d\n", __LINE__);
- return NULL;
+ NDPR_REMREF(pr); /* release reference for this routine */
+ lck_mtx_unlock(&proxy6_lock);
+
+ lck_mtx_lock(nd6_mutex);
+
+ return (error);
+}
+
+int
+nd6_prefix_onlink(struct nd_prefix *pr)
+{
+ return (nd6_prefix_onlink_common(pr, FALSE, IFSCOPE_NONE));
+}
+
+int
+nd6_prefix_onlink_scoped(struct nd_prefix *pr, unsigned int ifscope)
+{
+ return (nd6_prefix_onlink_common(pr, TRUE, ifscope));
+}
+
+int
+nd6_prefix_offlink(struct nd_prefix *pr)
+{
+ int plen, error = 0, prproxy;
+ struct ifnet *ifp = pr->ndpr_ifp;
+ struct sockaddr_in6 sa6, mask6, prefix;
+ struct rtentry *rt = NULL, *ndpr_rt = NULL;
+ unsigned int ifscope;
+
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_NOTOWNED);
+
+ /* sanity check */
+ NDPR_LOCK(pr);
+ if ((pr->ndpr_stateflags & NDPRF_ONLINK) == 0) {
+ nd6log((LOG_ERR,
+ "nd6_prefix_offlink: %s/%d on %s scoped=%d is already "
+ "off-link\n", ip6_sprintf(&pr->ndpr_prefix.sin6_addr),
+ pr->ndpr_plen, if_name(pr->ndpr_ifp),
+ (pr->ndpr_stateflags & NDPRF_IFSCOPE) ? 1 : 0));
+ NDPR_UNLOCK(pr);
+ return (EEXIST);
}
- bzero((caddr_t)ia, sizeof(*ia));
- ia->ia_ifa.ifa_addr = (struct sockaddr *)&ia->ia_addr;
- if (ifp->if_flags & IFF_POINTOPOINT)
- ia->ia_ifa.ifa_dstaddr = (struct sockaddr *)&ia->ia_dstaddr;
- else
- ia->ia_ifa.ifa_dstaddr = NULL;
- ia->ia_ifa.ifa_netmask = (struct sockaddr *)&ia->ia_prefixmask;
- ia->ia_ifp = ifp;
+ bzero(&sa6, sizeof (sa6));
+ sa6.sin6_family = AF_INET6;
+ sa6.sin6_len = sizeof (sa6);
+ bcopy(&pr->ndpr_prefix.sin6_addr, &sa6.sin6_addr,
+ sizeof (struct in6_addr));
+ bzero(&mask6, sizeof (mask6));
+ mask6.sin6_family = AF_INET6;
+ mask6.sin6_len = sizeof (sa6);
+ bcopy(&pr->ndpr_mask, &mask6.sin6_addr, sizeof (struct in6_addr));
+ prefix = pr->ndpr_prefix;
+ plen = pr->ndpr_plen;
+ if ((ndpr_rt = pr->ndpr_rt) != NULL)
+ pr->ndpr_rt = NULL;
+ NDPR_ADDREF_LOCKED(pr); /* keep reference for this routine */
+ NDPR_UNLOCK(pr);
+
+ ifscope = (pr->ndpr_stateflags & NDPRF_IFSCOPE) ?
+ ifp->if_index : IFSCOPE_NONE;
+
+ error = rtrequest_scoped(RTM_DELETE, (struct sockaddr *)&sa6,
+ NULL, (struct sockaddr *)&mask6, 0, &rt, ifscope);
+
+ if (rt != NULL) {
+ /* report the route deletion to the routing socket. */
+ RT_LOCK(rt);
+ nd6_rtmsg(RTM_DELETE, rt);
+ RT_UNLOCK(rt);
+ rtfree(rt);
- /* link to in6_ifaddr */
- if ((oia = in6_ifaddr) != NULL) {
- for( ; oia->ia_next; oia = oia->ia_next)
- continue;
- oia->ia_next = ia;
- } else
- in6_ifaddr = ia;
- ia->ia_ifa.ifa_refcnt++;
-
- /* link to if_addrlist */
-#if defined(__bsdi__) || (defined(__FreeBSD__) && __FreeBSD__ < 3)
- if ((ifa = ifp->if_addrlist) != NULL) {
- for ( ; ifa->ifa_next; ifa = ifa->ifa_next)
- continue;
- ifa->ifa_next = (struct ifaddr *)ia;
+ } else {
+ nd6log((LOG_ERR,
+ "nd6_prefix_offlink: failed to delete route: "
+ "%s/%d on %s, scoped %d, (errno = %d)\n",
+ ip6_sprintf(&sa6.sin6_addr), plen, if_name(ifp),
+ (ifscope != IFSCOPE_NONE), error));
}
-#else
- if (ifp->if_addrlist.tqh_first != NULL) {
- TAILQ_INSERT_TAIL(&ifp->if_addrlist, (struct ifaddr *)ia,
- ifa_list);
- ia->ia_ifa.ifa_refcnt++;
+
+ if (ndpr_rt != NULL)
+ rtfree(ndpr_rt);
+
+ lck_mtx_lock(&proxy6_lock);
+
+ NDPR_LOCK(pr);
+ prproxy = (pr->ndpr_stateflags & NDPRF_PRPROXY);
+ VERIFY(!prproxy || !(pr->ndpr_stateflags & NDPRF_IFSCOPE));
+ pr->ndpr_stateflags &= ~(NDPRF_ONLINK | NDPRF_IFSCOPE | NDPRF_PRPROXY);
+ if (pr->ndpr_prproxy_sols_cnt > 0) {
+ VERIFY(prproxy);
+ nd6_prproxy_sols_reap(pr);
+ VERIFY(pr->ndpr_prproxy_sols_cnt == 0);
+ VERIFY(RB_EMPTY(&pr->ndpr_prproxy_sols));
}
-#endif
-#if 0
- else {
+ NDPR_UNLOCK(pr);
+
+ /*
+ * If this was an upstream prefix, find the downstream ones and do
+ * some cleanups. If this was a downstream prefix, the prefix route
+ * has been removed from the routing table above, but there may be
+ * other tasks to perform.
+ */
+ nd6_prproxy_prelist_update(pr, prproxy ? pr : NULL);
+
+ NDPR_REMREF(pr); /* release reference for this routine */
+ lck_mtx_unlock(&proxy6_lock);
+
+ return (error);
+}
+
+static struct in6_ifaddr *
+in6_pfx_newpersistaddr(struct nd_prefix *pr, int mcast, int *errorp)
+{
+ struct in6_ifaddr *ia6 = NULL;
+ struct ifnet *ifp = NULL;
+ struct nd_ifinfo *ndi = NULL;
+ struct in6_addr mask;
+ struct in6_aliasreq ifra;
+ int error, ifaupdate, iidlen, notcga;
+
+ VERIFY(pr != NULL);
+ VERIFY(errorp != NULL);
+
+ NDPR_LOCK(pr);
+ ifp = pr->ndpr_ifp;
+ ia6 = NULL;
+ error = 0;
+
+ /*
+ * Prefix Length check:
+ * If the sum of the prefix length and interface identifier
+ * length does not equal 128 bits, the Prefix Information
+ * option MUST be ignored. The length of the interface
+ * identifier is defined in a separate link-type specific
+ * document.
+ */
+ iidlen = in6_if2idlen(ifp);
+ if (iidlen < 0) {
+ error = EADDRNOTAVAIL;
+ /* this should not happen, so we always log it. */
+ log(LOG_ERR, "%s: IID length undefined (%s)\n",
+ __func__, if_name(ifp));
+ goto unlock1;
+ } else if (iidlen != 64) {
+ error = EADDRNOTAVAIL;
/*
- * this should not be the case because there is at least one
- * link-local address(see the beginning of the function).
+ * stateless autoconfiguration not yet well-defined for IID
+ * lengths other than 64 octets. Just give up for now.
*/
- TAILQ_INIT(&ifp->if_addrlist);
+ nd6log((LOG_INFO, "%s: IID length not 64 octets (%s)\n",
+ __func__, if_name(ifp)));
+ goto unlock1;
}
-#endif
- /* new address */
- ia->ia_addr.sin6_len = sizeof(struct sockaddr_in6);
- ia->ia_addr.sin6_family = AF_INET6;
- /* prefix */
- bcopy(in6, &ia->ia_addr.sin6_addr, sizeof(ia->ia_addr.sin6_addr));
- ia->ia_addr.sin6_addr.s6_addr32[0] &= mask.s6_addr32[0];
- ia->ia_addr.sin6_addr.s6_addr32[1] &= mask.s6_addr32[1];
- ia->ia_addr.sin6_addr.s6_addr32[2] &= mask.s6_addr32[2];
- ia->ia_addr.sin6_addr.s6_addr32[3] &= mask.s6_addr32[3];
- /* interface ID */
- ia->ia_addr.sin6_addr.s6_addr32[0]
- |= (ib->ia_addr.sin6_addr.s6_addr32[0] & ~mask.s6_addr32[0]);
- ia->ia_addr.sin6_addr.s6_addr32[1]
- |= (ib->ia_addr.sin6_addr.s6_addr32[1] & ~mask.s6_addr32[1]);
- ia->ia_addr.sin6_addr.s6_addr32[2]
- |= (ib->ia_addr.sin6_addr.s6_addr32[2] & ~mask.s6_addr32[2]);
- ia->ia_addr.sin6_addr.s6_addr32[3]
- |= (ib->ia_addr.sin6_addr.s6_addr32[3] & ~mask.s6_addr32[3]);
-
- /* new prefix */
- ia->ia_prefixmask.sin6_len = sizeof(struct sockaddr_in6);
- ia->ia_prefixmask.sin6_family = AF_INET6;
- bcopy(&mask, &ia->ia_prefixmask.sin6_addr,
- sizeof(ia->ia_prefixmask.sin6_addr));
-
- /* same routine */
- ia->ia_ifa.ifa_rtrequest =
- (ifp->if_type == IFT_PPP) ? nd6_p2p_rtrequest : nd6_rtrequest;
- ia->ia_ifa.ifa_flags |= RTF_CLONING;
- ia->ia_ifa.ifa_metric = ifp->if_metric;
-
- /* add interface route */
- if ((error = rtinit(&(ia->ia_ifa), (int)RTM_ADD, RTF_UP|RTF_CLONING))) {
- log(LOG_NOTICE, "in6_ifadd: failed to add an interface route "
- "for %s/%d on %s, errno = %d\n",
- ip6_sprintf(&ia->ia_addr.sin6_addr), prefixlen,
- if_name(ifp), error);
+ if (iidlen + pr->ndpr_plen != 128) {
+ error = EADDRNOTAVAIL;
+ nd6log((LOG_INFO,
+ "%s: invalid prefix length %d for %s, ignored\n",
+ __func__, pr->ndpr_plen, if_name(ifp)));
+ goto unlock1;
}
- else
- ia->ia_flags |= IFA_ROUTE;
-
- *addr = ia->ia_addr.sin6_addr;
- if (ifp->if_flags & IFF_MULTICAST) {
- int error; /* not used */
- struct in6_addr sol6;
+ bzero(&ifra, sizeof (ifra));
+ strlcpy(ifra.ifra_name, if_name(ifp), sizeof (ifra.ifra_name));
+ ifra.ifra_addr.sin6_family = AF_INET6;
+ ifra.ifra_addr.sin6_len = sizeof (struct sockaddr_in6);
-#if !(defined(__FreeBSD__) && __FreeBSD__ >= 3) && !defined (__APPLE__)
- /* Restore saved multicast addresses(if any). */
- in6_restoremkludge(ia, ifp);
-#endif
+ /* prefix */
+ bcopy(&pr->ndpr_prefix.sin6_addr, &ifra.ifra_addr.sin6_addr,
+ sizeof (ifra.ifra_addr.sin6_addr));
+ in6_len2mask(&mask, pr->ndpr_plen);
+ ifra.ifra_addr.sin6_addr.s6_addr32[0] &= mask.s6_addr32[0];
+ ifra.ifra_addr.sin6_addr.s6_addr32[1] &= mask.s6_addr32[1];
+ ifra.ifra_addr.sin6_addr.s6_addr32[2] &= mask.s6_addr32[2];
+ ifra.ifra_addr.sin6_addr.s6_addr32[3] &= mask.s6_addr32[3];
+
+ ndi = ND_IFINFO(ifp);
+ VERIFY(ndi->initialized);
+ lck_mtx_lock(&ndi->lock);
+
+ notcga = nd6_send_opstate == ND6_SEND_OPMODE_DISABLED ||
+ (ndi->flags & ND6_IFF_INSECURE) != 0;
+
+ lck_mtx_unlock(&ndi->lock);
+ NDPR_UNLOCK(pr);
+
+ if (notcga) {
+ ia6 = in6ifa_ifpforlinklocal(ifp, 0);
+ if (ia6 == NULL) {
+ error = EADDRNOTAVAIL;
+ nd6log((LOG_INFO, "%s: no link-local address (%s)\n",
+ __func__, if_name(ifp)));
+ goto done;
+ }
- /* join solicited node multicast address */
- bzero(&sol6, sizeof(sol6));
- sol6.s6_addr16[0] = htons(0xff02);
- sol6.s6_addr16[1] = htons(ifp->if_index);
- sol6.s6_addr32[1] = 0;
- sol6.s6_addr32[2] = htonl(1);
- sol6.s6_addr32[3] = ia->ia_addr.sin6_addr.s6_addr32[3];
- sol6.s6_addr8[12] = 0xff;
- (void)in6_addmulti(&sol6, ifp, &error);
+ IFA_LOCK(&ia6->ia_ifa);
+ ifra.ifra_addr.sin6_addr.s6_addr32[0] |=
+ (ia6->ia_addr.sin6_addr.s6_addr32[0] & ~mask.s6_addr32[0]);
+ ifra.ifra_addr.sin6_addr.s6_addr32[1] |=
+ (ia6->ia_addr.sin6_addr.s6_addr32[1] & ~mask.s6_addr32[1]);
+ ifra.ifra_addr.sin6_addr.s6_addr32[2] |=
+ (ia6->ia_addr.sin6_addr.s6_addr32[2] & ~mask.s6_addr32[2]);
+ ifra.ifra_addr.sin6_addr.s6_addr32[3] |=
+ (ia6->ia_addr.sin6_addr.s6_addr32[3] & ~mask.s6_addr32[3]);
+ IFA_UNLOCK(&ia6->ia_ifa);
+ IFA_REMREF(&ia6->ia_ifa);
+ ia6 = NULL;
+ } else {
+ in6_cga_node_lock();
+ struct in6_cga_prepare local_cga_prepare;
+
+ if (ndi->cga_initialized) {
+ bcopy(&(ndi->local_cga_modifier),
+ &(local_cga_prepare.cga_modifier),
+ sizeof(local_cga_prepare.cga_modifier));
+ error = in6_cga_generate(&local_cga_prepare, 0,
+ &ifra.ifra_addr.sin6_addr);
+ } else {
+ error = in6_cga_generate(NULL, 0,
+ &ifra.ifra_addr.sin6_addr);
+ }
+ in6_cga_node_unlock();
+ if (error == 0)
+ ifra.ifra_flags |= IN6_IFF_SECURED;
+ else {
+ nd6log((LOG_ERR, "%s: no CGA available (%s)\n",
+ __func__, if_name(ifp)));
+ goto done;
+ }
}
- ia->ia6_flags |= IN6_IFF_TENTATIVE;
+ VERIFY(ia6 == NULL);
+
+ /* new prefix mask. */
+ ifra.ifra_prefixmask.sin6_len = sizeof (struct sockaddr_in6);
+ ifra.ifra_prefixmask.sin6_family = AF_INET6;
+ bcopy(&mask, &ifra.ifra_prefixmask.sin6_addr,
+ sizeof (ifra.ifra_prefixmask.sin6_addr));
+
+ /* lifetimes. */
+ ifra.ifra_lifetime.ia6t_vltime = pr->ndpr_vltime;
+ ifra.ifra_lifetime.ia6t_pltime = pr->ndpr_pltime;
+
+ /* address flags */
+ ifra.ifra_flags |= IN6_IFF_AUTOCONF; /* obey autoconf */
/*
- * To make the interface up. Only AF_INET6 in ia is used...
+ * Make sure that we do not have this address already. This should
+ * usually not happen, but we can still see this case, e.g., if we
+ * have manually configured the exact address to be configured.
*/
- s = splimp();
- error = dlil_ioctl(PF_INET6, ifp, SIOCSIFADDR, (caddr_t)ia);
- if (error == EOPNOTSUPP)
- error = 0;
- if (error) {
+ if ((ia6 = in6ifa_ifpwithaddr(ifp, &ifra.ifra_addr.sin6_addr))
+ != NULL) {
+ error = EADDRNOTAVAIL;
+ IFA_REMREF(&ia6->ia_ifa);
+ ia6 = NULL;
+
+ /* this should be rare enough to make an explicit log */
+ log(LOG_INFO, "%s: %s is already configured!\n",
+ __func__, ip6_sprintf(&ifra.ifra_addr.sin6_addr));
+ goto done;
+ }
- splx(s);
- return NULL;
+ /*
+ * Allocate ifaddr structure, link into chain, etc.
+ * If we are going to create a new address upon receiving a multicasted
+ * RA, we need to impose a random delay before starting DAD.
+ * [RFC 4862, Section 5.4.2]
+ */
+ ifaupdate = IN6_IFAUPDATE_NOWAIT;
+ if (mcast)
+ ifaupdate |= IN6_IFAUPDATE_DADDELAY;
+ error = in6_update_ifa(ifp, &ifra, ifaupdate, &ia6);
+ if (error != 0) {
+ nd6log((LOG_ERR,
+ "%s: failed to make ifaddr %s on %s (errno=%d)\n",
+ __func__, ip6_sprintf(&ifra.ifra_addr.sin6_addr),
+ if_name(ifp), error));
+ error = EADDRNOTAVAIL;
+ goto done;
}
- splx(s);
- /* Perform DAD, if needed. */
- nd6_dad_start((struct ifaddr *)ia, NULL);
+ VERIFY(ia6 != NULL);
+ in6_post_msg(ifp, KEV_INET6_NEW_RTADV_ADDR, ia6, NULL);
+ goto done;
- return ia;
+unlock1:
+ NDPR_UNLOCK(pr);
+
+done:
+ *errorp = error;
+ return (ia6);
}
+#define IA6_NONCONST(i) ((struct in6_ifaddr *)(uintptr_t)(i))
+
int
-in6_ifdel(ifp, in6)
- struct ifnet *ifp;
- struct in6_addr *in6;
+in6_tmpifadd(const struct in6_ifaddr *ia0, int forcegen)
{
-#if defined(__bsdi__) || (defined(__FreeBSD__) && __FreeBSD__ < 3)
- struct ifaddr *ifa;
-#endif
- struct in6_ifaddr *ia = (struct in6_ifaddr *)NULL;
- struct in6_ifaddr *oia = (struct in6_ifaddr *)NULL;
+ struct ifnet *ifp = ia0->ia_ifa.ifa_ifp;
+ struct in6_ifaddr *ia, *newia;
+ struct in6_aliasreq ifra;
+ int i, error, ifaupdate;
+ int trylimit = 3; /* XXX: adhoc value */
+ u_int32_t randid[2];
+ time_t vltime0, pltime0;
+ uint64_t timenow = net_uptime();
+ struct in6_addr addr;
+ struct nd_prefix *ndpr;
+
+ bzero(&ifra, sizeof (ifra));
+ strlcpy(ifra.ifra_name, if_name(ifp), sizeof (ifra.ifra_name));
+ IFA_LOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ ifra.ifra_addr = ia0->ia_addr;
+ /* copy prefix mask */
+ ifra.ifra_prefixmask = ia0->ia_prefixmask;
+ /* clear the old IFID */
+ for (i = 0; i < 4; i++) {
+ ifra.ifra_addr.sin6_addr.s6_addr32[i]
+ &= ifra.ifra_prefixmask.sin6_addr.s6_addr32[i];
+ }
+ addr = ia0->ia_addr.sin6_addr;
+ IFA_UNLOCK(&IA6_NONCONST(ia0)->ia_ifa);
+
+again:
+ in6_iid_mktmp(ifp, (u_int8_t *)randid,
+ (const u_int8_t *)&addr.s6_addr[8], forcegen);
+
+ ifra.ifra_addr.sin6_addr.s6_addr32[2] |=
+ (randid[0] & ~(ifra.ifra_prefixmask.sin6_addr.s6_addr32[2]));
+ ifra.ifra_addr.sin6_addr.s6_addr32[3] |=
+ (randid[1] & ~(ifra.ifra_prefixmask.sin6_addr.s6_addr32[3]));
+
+ /*
+ * in6_iid_mktmp() quite likely provided a unique interface ID.
+ * However, we may still have a chance to see collision, because
+ * there may be a time lag between generation of the ID and generation
+ * of the address. So, we'll do one more sanity check.
+ */
+ if ((ia = in6ifa_ifpwithaddr(ifp, &ifra.ifra_addr.sin6_addr)) != NULL) {
+ IFA_REMREF(&ia->ia_ifa);
+ if (trylimit-- == 0) {
+ nd6log((LOG_NOTICE, "in6_tmpifadd: failed to find "
+ "a unique random IFID\n"));
+ return (EEXIST);
+ }
+ forcegen = 1;
+ goto again;
+ }
- if (!ifp)
- return -1;
+ /*
+ * The Valid Lifetime is the lower of the Valid Lifetime of the
+ * public address or TEMP_VALID_LIFETIME.
+ * The Preferred Lifetime is the lower of the Preferred Lifetime
+ * of the public address or TEMP_PREFERRED_LIFETIME -
+ * DESYNC_FACTOR.
+ */
+ IFA_LOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ if (ia0->ia6_lifetime.ia6ti_vltime != ND6_INFINITE_LIFETIME) {
+ vltime0 = IFA6_IS_INVALID(ia0, timenow) ? 0 :
+ (ia0->ia6_lifetime.ia6ti_vltime -
+ (timenow - ia0->ia6_updatetime));
+ if (vltime0 > ip6_temp_valid_lifetime)
+ vltime0 = ip6_temp_valid_lifetime;
+ } else {
+ vltime0 = ip6_temp_valid_lifetime;
+ }
+ if (ia0->ia6_lifetime.ia6ti_pltime != ND6_INFINITE_LIFETIME) {
+ pltime0 = IFA6_IS_DEPRECATED(ia0, timenow) ? 0 :
+ (ia0->ia6_lifetime.ia6ti_pltime -
+ (timenow - ia0->ia6_updatetime));
+ if (pltime0 > ip6_temp_preferred_lifetime - ip6_desync_factor)
+ pltime0 = ip6_temp_preferred_lifetime -
+ ip6_desync_factor;
+ } else {
+ pltime0 = ip6_temp_preferred_lifetime - ip6_desync_factor;
+ }
+ ifra.ifra_lifetime.ia6t_vltime = vltime0;
+ ifra.ifra_lifetime.ia6t_pltime = pltime0;
+ IFA_UNLOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ /*
+ * A temporary address is created only if this calculated Preferred
+ * Lifetime is greater than REGEN_ADVANCE time units.
+ */
+ if (ifra.ifra_lifetime.ia6t_pltime <= ip6_temp_regen_advance)
+ return (0);
+
+ /* XXX: scope zone ID? */
- ia = in6ifa_ifpwithaddr(ifp, in6);
- if (!ia)
- return -1;
+ ifra.ifra_flags |= (IN6_IFF_AUTOCONF|IN6_IFF_TEMPORARY);
- if (ifp->if_flags & IFF_MULTICAST) {
+ /* allocate ifaddr structure, link into chain, etc. */
+ ifaupdate = IN6_IFAUPDATE_NOWAIT | IN6_IFAUPDATE_DADDELAY;
+ error = in6_update_ifa(ifp, &ifra, ifaupdate, &newia);
+ if (error != 0) {
+ nd6log((LOG_ERR, "in6_tmpifadd: failed to add address.\n"));
+ return (error);
+ }
+ VERIFY(newia != NULL);
+
+ IFA_LOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ ndpr = ia0->ia6_ndpr;
+ if (ndpr == NULL) {
/*
- * delete solicited multicast addr for deleting host id
+ * We lost the race with another thread that has purged
+ * ia0 address; in this case, purge the tmp addr as well.
*/
- struct in6_multi *in6m;
- struct in6_addr llsol;
- bzero(&llsol, sizeof(struct in6_addr));
- llsol.s6_addr16[0] = htons(0xff02);
- llsol.s6_addr16[1] = htons(ifp->if_index);
- llsol.s6_addr32[1] = 0;
- llsol.s6_addr32[2] = htonl(1);
- llsol.s6_addr32[3] =
- ia->ia_addr.sin6_addr.s6_addr32[3];
- llsol.s6_addr8[12] = 0xff;
-
- IN6_LOOKUP_MULTI(llsol, ifp, in6m);
- if (in6m)
- in6_delmulti(in6m);
- }
-
- if (ia->ia_flags & IFA_ROUTE) {
- rtinit(&(ia->ia_ifa), (int)RTM_DELETE, 0);
- ia->ia_flags &= ~IFA_ROUTE;
- }
-
-#if defined(__bsdi__) || (defined(__FreeBSD__) && __FreeBSD__ < 3)
- if ((ifa = ifp->if_addrlist) == (struct ifaddr *)ia) {
- ifp->if_addrlist = ifa->ifa_next;
- } else {
- while (ifa->ifa_next &&
- (ifa->ifa_next != (struct ifaddr *)ia))
- ifa = ifa->ifa_next;
- if (ifa->ifa_next)
- ifa->ifa_next = ((struct ifaddr *)ia)->ifa_next;
- else
- return -1;
+ nd6log((LOG_ERR, "in6_tmpifadd: no public address\n"));
+ VERIFY(!(ia0->ia6_flags & IN6_IFF_AUTOCONF));
+ IFA_UNLOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ in6_purgeaddr(&newia->ia_ifa);
+ IFA_REMREF(&newia->ia_ifa);
+ return (EADDRNOTAVAIL);
}
-#else
- TAILQ_REMOVE(&ifp->if_addrlist, (struct ifaddr *)ia, ifa_list);
-#endif
- IFAFREE(&ia->ia_ifa);
-
- /* lladdr is never deleted */
- oia = ia;
- if (oia == (ia = in6_ifaddr))
- in6_ifaddr = ia->ia_next;
- else {
- while (ia->ia_next && (ia->ia_next != oia))
- ia = ia->ia_next;
- if (ia->ia_next)
- ia->ia_next = oia->ia_next;
- else
- return -1;
+ NDPR_ADDREF(ndpr); /* for us */
+ IFA_UNLOCK(&IA6_NONCONST(ia0)->ia_ifa);
+ IFA_LOCK(&newia->ia_ifa);
+ if (newia->ia6_ndpr != NULL) {
+ NDPR_LOCK(newia->ia6_ndpr);
+ VERIFY(newia->ia6_ndpr->ndpr_addrcnt != 0);
+ newia->ia6_ndpr->ndpr_addrcnt--;
+ NDPR_UNLOCK(newia->ia6_ndpr);
+ NDPR_REMREF(newia->ia6_ndpr); /* release addr reference */
}
+ newia->ia6_ndpr = ndpr;
+ NDPR_LOCK(newia->ia6_ndpr);
+ newia->ia6_ndpr->ndpr_addrcnt++;
+ VERIFY(newia->ia6_ndpr->ndpr_addrcnt != 0);
+ NDPR_ADDREF_LOCKED(newia->ia6_ndpr); /* for addr reference */
+ NDPR_UNLOCK(newia->ia6_ndpr);
+ IFA_UNLOCK(&newia->ia_ifa);
+ /*
+ * A newly added address might affect the status of other addresses.
+ * XXX: when the temporary address is generated with a new public
+ * address, the onlink check is redundant. However, it would be safe
+ * to do the check explicitly everywhere a new address is generated,
+ * and, in fact, we surely need the check when we create a new
+ * temporary address due to deprecation of an old temporary address.
+ */
+ lck_mtx_lock(nd6_mutex);
+ pfxlist_onlink_check();
+ lck_mtx_unlock(nd6_mutex);
+ IFA_REMREF(&newia->ia_ifa);
-#if !(defined(__FreeBSD__) && __FreeBSD__ >= 3) && !defined (__APPLE__)
- in6_savemkludge(oia);
-#endif
- IFAFREE((&oia->ia_ifa));
-/* xxx
- rtrequest(RTM_DELETE,
- (struct sockaddr *)&ia->ia_addr,
- (struct sockaddr *)0
- (struct sockaddr *)&ia->ia_prefixmask,
- RTF_UP|RTF_CLONING,
- (struct rtentry **)0);
-*/
- return 0;
+ /* remove our reference */
+ NDPR_REMREF(ndpr);
+
+ return (0);
}
+#undef IA6_NONCONST
int
in6_init_prefix_ltimes(struct nd_prefix *ndpr)
{
-#if !(defined(__FreeBSD__) && __FreeBSD__ >= 3) && !defined (__APPLE__)
- long time_second = time.tv_sec;
-#endif
+ struct timeval caltime;
+ u_int64_t timenow = net_uptime();
+
+ NDPR_LOCK_ASSERT_HELD(ndpr);
- /* check if preferred lifetime > valid lifetime */
+ getmicrotime(&caltime);
+ ndpr->ndpr_base_calendartime = caltime.tv_sec;
+ ndpr->ndpr_base_uptime = timenow;
+
+ /* check if preferred lifetime > valid lifetime. RFC 4862 5.5.3 (c) */
if (ndpr->ndpr_pltime > ndpr->ndpr_vltime) {
- log(LOG_INFO, "in6_init_prefix_ltimes: preferred lifetime"
+ nd6log((LOG_INFO, "in6_init_prefix_ltimes: preferred lifetime"
"(%d) is greater than valid lifetime(%d)\n",
- (u_int)ndpr->ndpr_pltime, (u_int)ndpr->ndpr_vltime);
+ (u_int)ndpr->ndpr_pltime, (u_int)ndpr->ndpr_vltime));
return (EINVAL);
}
if (ndpr->ndpr_pltime == ND6_INFINITE_LIFETIME)
ndpr->ndpr_preferred = 0;
else
- ndpr->ndpr_preferred = time_second + ndpr->ndpr_pltime;
+ ndpr->ndpr_preferred = timenow + ndpr->ndpr_pltime;
if (ndpr->ndpr_vltime == ND6_INFINITE_LIFETIME)
ndpr->ndpr_expire = 0;
else
- ndpr->ndpr_expire = time_second + ndpr->ndpr_vltime;
+ ndpr->ndpr_expire = timenow + ndpr->ndpr_vltime;
- return 0;
+ return (0);
}
static void
-in6_init_address_ltimes(struct nd_prefix *new,
- struct in6_addrlifetime *lt6,
- int update_vltime)
+in6_init_address_ltimes(struct nd_prefix *new, struct in6_addrlifetime *lt6)
{
-#if !(defined(__FreeBSD__) && __FreeBSD__ >= 3) && !defined (__APPLE__)
- long time_second = time.tv_sec;
-#endif
+#pragma unused(new)
+ uint64_t timenow = net_uptime();
/* Valid lifetime must not be updated unless explicitly specified. */
- if (update_vltime) {
- /* init ia6t_expire */
- if (lt6->ia6t_vltime == ND6_INFINITE_LIFETIME)
- lt6->ia6t_expire = 0;
- else {
- lt6->ia6t_expire = time_second;
- lt6->ia6t_expire += lt6->ia6t_vltime;
- }
- /* Ensure addr lifetime <= prefix lifetime. */
- if (new->ndpr_expire && lt6->ia6t_expire &&
- new->ndpr_expire < lt6->ia6t_expire)
- lt6->ia6t_expire = new->ndpr_expire;
+ /* init ia6t_expire */
+ if (lt6->ia6t_vltime == ND6_INFINITE_LIFETIME) {
+ lt6->ia6t_expire = 0;
+ } else {
+ lt6->ia6t_expire = timenow;
+ lt6->ia6t_expire += lt6->ia6t_vltime;
}
/* init ia6t_preferred */
- if (lt6->ia6t_pltime == ND6_INFINITE_LIFETIME)
+ if (lt6->ia6t_pltime == ND6_INFINITE_LIFETIME) {
lt6->ia6t_preferred = 0;
- else {
- lt6->ia6t_preferred = time_second;
+ } else {
+ lt6->ia6t_preferred = timenow;
lt6->ia6t_preferred += lt6->ia6t_pltime;
}
- /* Ensure addr lifetime <= prefix lifetime. */
- if (new->ndpr_preferred && lt6->ia6t_preferred
- && new->ndpr_preferred < lt6->ia6t_preferred)
- lt6->ia6t_preferred = new->ndpr_preferred;
}
/*
* it shouldn't be called when acting as a router.
*/
void
-rt6_flush(gateway, ifp)
- struct in6_addr *gateway;
- struct ifnet *ifp;
+rt6_flush(
+ struct in6_addr *gateway,
+ struct ifnet *ifp)
{
struct radix_node_head *rnh = rt_tables[AF_INET6];
-#ifdef __NetBSD__
- int s = splsoftnet();
-#else
- int s = splnet();
-#endif
/* We'll care only link-local addresses */
if (!IN6_IS_ADDR_LINKLOCAL(gateway)) {
- splx(s);
return;
}
+ lck_mtx_lock(rnh_lock);
/* XXX: hack for KAME's link-local address kludge */
gateway->s6_addr16[1] = htons(ifp->if_index);
rnh->rnh_walktree(rnh, rt6_deleteroute, (void *)gateway);
- splx(s);
+ lck_mtx_unlock(rnh_lock);
}
static int
-rt6_deleteroute(rn, arg)
- struct radix_node *rn;
- void *arg;
+rt6_deleteroute(
+ struct radix_node *rn,
+ void *arg)
{
-#define SIN6(s) ((struct sockaddr_in6 *)s)
struct rtentry *rt = (struct rtentry *)rn;
struct in6_addr *gate = (struct in6_addr *)arg;
- if (rt->rt_gateway == NULL || rt->rt_gateway->sa_family != AF_INET6)
- return(0);
+ lck_mtx_assert(rnh_lock, LCK_MTX_ASSERT_OWNED);
- if (!IN6_ARE_ADDR_EQUAL(gate, &SIN6(rt->rt_gateway)->sin6_addr))
- return(0);
+ RT_LOCK(rt);
+ if (rt->rt_gateway == NULL || rt->rt_gateway->sa_family != AF_INET6) {
+ RT_UNLOCK(rt);
+ return (0);
+ }
+ if (!IN6_ARE_ADDR_EQUAL(gate, &SIN6(rt->rt_gateway)->sin6_addr)) {
+ RT_UNLOCK(rt);
+ return (0);
+ }
+ /*
+ * Do not delete a static route.
+ * XXX: this seems to be a bit ad-hoc. Should we consider the
+ * 'cloned' bit instead?
+ */
+ if ((rt->rt_flags & RTF_STATIC) != 0) {
+ RT_UNLOCK(rt);
+ return (0);
+ }
/*
* We delete only host route. This means, in particular, we don't
* delete default route.
*/
- if ((rt->rt_flags & RTF_HOST) == 0)
- return(0);
+ if ((rt->rt_flags & RTF_HOST) == 0) {
+ RT_UNLOCK(rt);
+ return (0);
+ }
- return(rtrequest(RTM_DELETE, rt_key(rt),
- rt->rt_gateway, rt_mask(rt), rt->rt_flags, 0));
-#undef SIN6
+ /*
+ * Safe to drop rt_lock and use rt_key, rt_gateway, since holding
+ * rnh_lock here prevents another thread from calling rt_setgate()
+ * on this route.
+ */
+ RT_UNLOCK(rt);
+ return (rtrequest_locked(RTM_DELETE, rt_key(rt), rt->rt_gateway,
+ rt_mask(rt), rt->rt_flags, 0));
}
int
-nd6_setdefaultiface(ifindex)
- int ifindex;
+nd6_setdefaultiface(
+ int ifindex)
{
int error = 0;
+ ifnet_t def_ifp = NULL;
- if (ifindex < 0 || if_index < ifindex)
- return(EINVAL);
+ lck_mtx_assert(nd6_mutex, LCK_MTX_ASSERT_NOTOWNED);
+ ifnet_head_lock_shared();
+ if (ifindex < 0 || if_index < ifindex) {
+ ifnet_head_done();
+ return (EINVAL);
+ }
+ def_ifp = ifindex2ifnet[ifindex];
+ ifnet_head_done();
+
+ lck_mtx_lock(nd6_mutex);
if (nd6_defifindex != ifindex) {
+ struct ifnet *odef_ifp = nd6_defifp;
+
nd6_defifindex = ifindex;
if (nd6_defifindex > 0)
- nd6_defifp = ifindex2ifnet[nd6_defifindex];
+ nd6_defifp = def_ifp;
else
nd6_defifp = NULL;
+ if (nd6_defifp != NULL)
+ nd6log((LOG_INFO, "%s: is now the default "
+ "interface (was %s)\n", if_name(nd6_defifp),
+ odef_ifp != NULL ? if_name(odef_ifp) : "NONE"));
+ else
+ nd6log((LOG_INFO, "No default interface set\n"));
+
/*
* If the Default Router List is empty, install a route
* to the specified interface as default or remove the default
* we do this here to avoid re-install the default route
* if the list is NOT empty.
*/
- if (TAILQ_FIRST(&nd_defrouter) == NULL)
- defrouter_select();
- }
+ if (odef_ifp != NULL) {
+ defrouter_select(odef_ifp);
+ }
+
+ if (nd6_defifp != NULL) {
+ defrouter_select(nd6_defifp);
+ nd6_prefix_sync(nd6_defifp);
+ }
- return(error);
+ /*
+ * Our current implementation assumes one-to-one mapping between
+ * interfaces and links, so it would be natural to use the
+ * default interface as the default link.
+ */
+ scope6_setdefault(nd6_defifp);
+ }
+ lck_mtx_unlock(nd6_mutex);
+ return (error);
}