]> git.saurik.com Git - apple/xnu.git/blobdiff - bsd/netinet6/esp_input.c
xnu-1228.0.2.tar.gz
[apple/xnu.git] / bsd / netinet6 / esp_input.c
index 7bd490e8f9573a055b9078d2f254e5f18e05aa97..1286b439f7f685764e519f8212ffa4a62cf38d12 100644 (file)
@@ -1,4 +1,5 @@
-/*     $KAME: esp_input.c,v 1.22 2000/03/21 05:14:49 itojun Exp $      */
+/*     $FreeBSD: src/sys/netinet6/esp_input.c,v 1.1.2.3 2001/07/03 11:01:50 ume Exp $  */
+/*     $KAME: esp_input.c,v 1.55 2001/03/23 08:08:47 itojun Exp $      */
 
 /*
  * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
  * RFC1827/2406 Encapsulated Security Payload.
  */
 
-#define _IP_VHL
-#if (defined(__FreeBSD__) && __FreeBSD__ >= 3) || defined(__NetBSD__)
-#include "opt_inet.h"
-#endif
-
 #include <sys/param.h>
 #include <sys/systm.h>
 #include <sys/malloc.h>
@@ -52,8 +48,8 @@
 
 #include <net/if.h>
 #include <net/route.h>
-#include <net/netisr.h>
 #include <kern/cpu_number.h>
+#include <kern/locks.h>
 
 #include <netinet/in.h>
 #include <netinet/in_systm.h>
 #include <netinet/ip_var.h>
 #include <netinet/in_var.h>
 #include <netinet/ip_ecn.h>
+#include <netinet/in_pcb.h>
+#include <netinet/udp.h>
+#if INET6
+#include <netinet6/ip6_ecn.h>
+#endif
 
 #if INET6
 #include <netinet/ip6.h>
+#include <netinet6/in6_pcb.h>
 #include <netinet6/ip6_var.h>
 #include <netinet/icmp6.h>
+#include <netinet6/ip6protosw.h>
 #endif
 
 #include <netinet6/ipsec.h>
+#if INET6
+#include <netinet6/ipsec6.h>
+#endif
 #include <netinet6/ah.h>
+#if INET6
+#include <netinet6/ah6.h>
+#endif
 #include <netinet6/esp.h>
+#if INET6
+#include <netinet6/esp6.h>
+#endif
 #include <netkey/key.h>
 #include <netkey/keydb.h>
 #include <netkey/key_debug.h>
 
+#include <net/kpi_protocol.h>
+#include <netinet/kpi_ipfilter_var.h>
 
 #include <net/net_osdep.h>
 
+#include <sys/kdebug.h>
+#define DBG_LAYER_BEG          NETDBG_CODE(DBG_NETIPSEC, 1)
+#define DBG_LAYER_END          NETDBG_CODE(DBG_NETIPSEC, 3)
+#define DBG_FNC_ESPIN          NETDBG_CODE(DBG_NETIPSEC, (6 << 8))
+#define DBG_FNC_DECRYPT                NETDBG_CODE(DBG_NETIPSEC, (7 << 8))
 #define IPLEN_FLIPPED
 
+extern lck_mtx_t  *sadb_mutex;
+
 #if INET
 extern struct protosw inetsw[];
-#if defined(__bsdi__) || defined(__NetBSD__)
-extern u_char ip_protox[];
-#endif
 
 #define ESPMAXLEN \
        (sizeof(struct esp) < sizeof(struct newesp) \
@@ -96,23 +114,25 @@ esp4_input(m, off)
        int off;
 {
        struct ip *ip;
+       struct ip6_hdr *ip6;
        struct esp *esp;
        struct esptail esptail;
        u_int32_t spi;
        struct secasvar *sav = NULL;
        size_t taillen;
        u_int16_t nxt;
-       struct esp_algorithm *algo;
+       const struct esp_algorithm *algo;
        int ivlen;
        size_t hlen;
        size_t esplen;
-       int s;
+       sa_family_t     ifamily;
 
+       KERNEL_DEBUG(DBG_FNC_ESPIN | DBG_FUNC_START, 0,0,0,0,0);
        /* sanity check for alignment. */
        if (off % 4 != 0 || m->m_pkthdr.len % 4 != 0) {
                ipseclog((LOG_ERR, "IPv4 ESP input: packet alignment problem "
                        "(off=%d, pktlen=%d)\n", off, m->m_pkthdr.len));
-               ipsecstat.in_inval++;
+               IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
                goto bad;
        }
 
@@ -121,7 +141,7 @@ esp4_input(m, off)
                if (!m) {
                        ipseclog((LOG_DEBUG,
                            "IPv4 ESP input: can't pullup in esp4_input\n"));
-                       ipsecstat.in_inval++;
+                       IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
                        goto bad;
                }
        }
@@ -143,7 +163,7 @@ esp4_input(m, off)
                ipseclog((LOG_WARNING,
                    "IPv4 ESP input: no key association found for spi %u\n",
                    (u_int32_t)ntohl(spi)));
-               ipsecstat.in_nosa++;
+               IPSEC_STAT_INCREMENT(ipsecstat.in_nosa);
                goto bad;
        }
        KEYDEBUG(KEYDEBUG_IPSEC_STAMP,
@@ -153,25 +173,24 @@ esp4_input(m, off)
                ipseclog((LOG_DEBUG,
                    "IPv4 ESP input: non-mature/dying SA found for spi %u\n",
                    (u_int32_t)ntohl(spi)));
-               ipsecstat.in_badspi++;
+               IPSEC_STAT_INCREMENT(ipsecstat.in_badspi);
                goto bad;
        }
-       if (sav->alg_enc == SADB_EALG_NONE) {
+       algo = esp_algorithm_lookup(sav->alg_enc);
+       if (!algo) {
                ipseclog((LOG_DEBUG, "IPv4 ESP input: "
-                   "unspecified encryption algorithm for spi %u\n",
+                   "unsupported encryption algorithm for spi %u\n",
                    (u_int32_t)ntohl(spi)));
-               ipsecstat.in_badspi++;
+               IPSEC_STAT_INCREMENT(ipsecstat.in_badspi);
                goto bad;
        }
 
-       algo = &esp_algorithms[sav->alg_enc];   /*XXX*/
-
        /* check if we have proper ivlen information */
        ivlen = sav->ivlen;
        if (ivlen < 0) {
                ipseclog((LOG_ERR, "inproper ivlen in IPv4 ESP input: %s %s\n",
                    ipsec4_logpacketstr(ip, spi), ipsec_logsastr(sav)));
-               ipsecstat.in_inval++;
+               IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
                goto bad;
        }
 
@@ -179,7 +198,8 @@ esp4_input(m, off)
         && (sav->alg_auth && sav->key_auth)))
                goto noreplaycheck;
 
-       if (sav->alg_auth == SADB_AALG_NULL)
+       if (sav->alg_auth == SADB_X_AALG_NULL ||
+           sav->alg_auth == SADB_AALG_NONE)
                goto noreplaycheck;
 
        /*
@@ -188,7 +208,7 @@ esp4_input(m, off)
        if (ipsec_chkreplay(ntohl(((struct newesp *)esp)->esp_seq), sav))
                ; /*okey*/
        else {
-               ipsecstat.in_espreplay++;
+               IPSEC_STAT_INCREMENT(ipsecstat.in_espreplay);
                ipseclog((LOG_WARNING,
                    "replay packet in IPv4 ESP input: %s %s\n",
                    ipsec4_logpacketstr(ip, spi), ipsec_logsastr(sav)));
@@ -199,16 +219,22 @@ esp4_input(m, off)
     {
        u_char sum0[AH_MAXSUMSIZE];
        u_char sum[AH_MAXSUMSIZE];
-       struct ah_algorithm *sumalgo;
+       const struct ah_algorithm *sumalgo;
        size_t siz;
 
-       sumalgo = &ah_algorithms[sav->alg_auth];
+       sumalgo = ah_algorithm_lookup(sav->alg_auth);
+       if (!sumalgo)
+               goto noreplaycheck;
        siz = (((*sumalgo->sumsiz)(sav) + 3) & ~(4 - 1));
+       if (m->m_pkthdr.len < off + ESPMAXLEN + siz) {
+               IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
+               goto bad;
+       }
        if (AH_MAXSUMSIZE < siz) {
                ipseclog((LOG_DEBUG,
                    "internal error: AH_MAXSUMSIZE must be larger than %lu\n",
                    (u_long)siz));
-               ipsecstat.in_inval++;
+               IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
                goto bad;
        }
 
@@ -217,14 +243,14 @@ esp4_input(m, off)
        if (esp_auth(m, off, m->m_pkthdr.len - off - siz, sav, sum)) {
                ipseclog((LOG_WARNING, "auth fail in IPv4 ESP input: %s %s\n",
                    ipsec4_logpacketstr(ip, spi), ipsec_logsastr(sav)));
-               ipsecstat.in_espauthfail++;
+               IPSEC_STAT_INCREMENT(ipsecstat.in_espauthfail);
                goto bad;
        }
 
        if (bcmp(sum0, sum, siz) != 0) {
                ipseclog((LOG_WARNING, "auth fail in IPv4 ESP input: %s %s\n",
                    ipsec4_logpacketstr(ip, spi), ipsec_logsastr(sav)));
-               ipsecstat.in_espauthfail++;
+               IPSEC_STAT_INCREMENT(ipsecstat.in_espauthfail);
                goto bad;
        }
 
@@ -237,7 +263,7 @@ esp4_input(m, off)
        ip->ip_len = htons(ntohs(ip->ip_len) - siz);
 #endif
        m->m_flags |= M_AUTHIPDGM;
-       ipsecstat.in_espauthsucc++;
+       IPSEC_STAT_INCREMENT(ipsecstat.in_espauthsucc);
     }
 
        /*
@@ -245,7 +271,7 @@ esp4_input(m, off)
         */
        if ((sav->flags & SADB_X_EXT_OLD) == 0 && sav->replay) {
                if (ipsec_updatereplay(ntohl(((struct newesp *)esp)->esp_seq), sav)) {
-                       ipsecstat.in_espreplay++;
+                       IPSEC_STAT_INCREMENT(ipsecstat.in_espreplay);
                        goto bad;
                }
        }
@@ -267,7 +293,7 @@ noreplaycheck:
        if (m->m_pkthdr.len < off + esplen + ivlen + sizeof(esptail)) {
                ipseclog((LOG_WARNING,
                    "IPv4 ESP input: packet too short\n"));
-               ipsecstat.in_inval++;
+               IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
                goto bad;
        }
 
@@ -276,27 +302,38 @@ noreplaycheck:
                if (!m) {
                        ipseclog((LOG_DEBUG,
                            "IPv4 ESP input: can't pullup in esp4_input\n"));
-                       ipsecstat.in_inval++;
+                       IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
                        goto bad;
                }
        }
 
-    {
+       /*
+        * pre-compute and cache intermediate key
+        */
+       if (esp_schedule(algo, sav) != 0) {
+               IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
+               goto bad;
+       }
+
        /*
         * decrypt the packet.
         */
        if (!algo->decrypt)
                panic("internal error: no decrypt function");
+       KERNEL_DEBUG(DBG_FNC_DECRYPT | DBG_FUNC_START, 0,0,0,0,0);
        if ((*algo->decrypt)(m, off, sav, algo, ivlen)) {
-               ipseclog((LOG_ERR, "decrypt fail in IPv4 ESP input: %s %s\n",
-                   ipsec4_logpacketstr(ip, spi), ipsec_logsastr(sav)));
-               ipsecstat.in_inval++;
+               /* m is already freed */
+               m = NULL;
+               ipseclog((LOG_ERR, "decrypt fail in IPv4 ESP input: %s\n",
+                   ipsec_logsastr(sav)));
+               IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
+               KERNEL_DEBUG(DBG_FNC_DECRYPT | DBG_FUNC_END, 1,0,0,0,0);
                goto bad;
        }
-       ipsecstat.in_esphist[sav->alg_enc]++;
+       KERNEL_DEBUG(DBG_FNC_DECRYPT | DBG_FUNC_END, 2,0,0,0,0);
+       IPSEC_STAT_INCREMENT(ipsecstat.in_esphist[sav->alg_enc]);
 
        m->m_flags |= M_DECRYPTED;
-    }
 
        /*
         * find the trailer of the ESP.
@@ -311,7 +348,7 @@ noreplaycheck:
                ipseclog((LOG_WARNING,
                    "bad pad length in IPv4 ESP input: %s %s\n",
                    ipsec4_logpacketstr(ip, spi), ipsec_logsastr(sav)));
-               ipsecstat.in_inval++;
+               IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
                goto bad;
        }
 
@@ -325,7 +362,7 @@ noreplaycheck:
 #endif
 
        /* was it transmitted over the IPsec tunnel SA? */
-       if (ipsec4_tunnel_validate(ip, nxt, sav)) {
+       if (ipsec4_tunnel_validate(m, off + esplen + ivlen, nxt, sav, &ifamily)) {
                /*
                 * strip off all the headers that precedes ESP header.
                 *      IP4 xx ESP IP4' payload -> IP4' payload
@@ -337,45 +374,76 @@ noreplaycheck:
 
                tos = ip->ip_tos;
                m_adj(m, off + esplen + ivlen);
-               if (m->m_len < sizeof(*ip)) {
-                       m = m_pullup(m, sizeof(*ip));
-                       if (!m) {
-                               ipsecstat.in_inval++;
-                               goto bad;
+               if (ifamily == AF_INET) {
+                       if (m->m_len < sizeof(*ip)) {
+                               m = m_pullup(m, sizeof(*ip));
+                               if (!m) {
+                                       IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
+                                       goto bad;
+                               }
                        }
-               }
-               ip = mtod(m, struct ip *);
-               /* ECN consideration. */
-               ip_ecn_egress(ip4_ipsec_ecn, &tos, &ip->ip_tos);
-               if (!key_checktunnelsanity(sav, AF_INET,
+                       ip = mtod(m, struct ip *);
+                       /* ECN consideration. */
+                       ip_ecn_egress(ip4_ipsec_ecn, &tos, &ip->ip_tos);
+                       if (!key_checktunnelsanity(sav, AF_INET,
                            (caddr_t)&ip->ip_src, (caddr_t)&ip->ip_dst)) {
-                       ipseclog((LOG_ERR, "ipsec tunnel address mismatch "
-                           "in IPv4 ESP input: %s %s\n",
+                               ipseclog((LOG_ERR, "ipsec tunnel address mismatch "
+                           "in ESP input: %s %s\n",
                            ipsec4_logpacketstr(ip, spi), ipsec_logsastr(sav)));
-                       ipsecstat.in_inval++;
-                       goto bad;
-               }
+                               IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
+                               goto bad;
+                       }
+#if INET6
+               } else if (ifamily == AF_INET6) {
+#ifndef PULLDOWN_TEST
+                       /*
+                        * m_pullup is prohibited in KAME IPv6 input processing
+                        * but there's no other way!
+                        */
+#else
+                       /* okay to pullup in m_pulldown style */
+#endif
+                       if (m->m_len < sizeof(*ip6)) {
+                               m = m_pullup(m, sizeof(*ip6));
+                               if (!m) {
+                                       IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
+                                       goto bad;
+                               }
+                       }
+
+                       ip6 = mtod(m, struct ip6_hdr *);
+
+                       /* ECN consideration. */
+                       /* XXX To be fixed later if needed */
+                       //  ip_ecn_egress(ip4_ipsec_ecn, &tos, &ip->ip_tos);
 
-#if 0 /* XXX should call ipfw rather than ipsec_in_reject, shouldn't it ? */
-               /* drop it if it does not match the default policy */
-               if (ipsec4_in_reject(m, NULL)) {
-                       ipsecstat.in_polvio++;
+                       if (!key_checktunnelsanity(sav, AF_INET6,
+                           (caddr_t)&ip6->ip6_src, (caddr_t)&ip6->ip6_dst)) {
+                               ipseclog((LOG_ERR, "ipsec tunnel address mismatch "
+                           "in ESP input: %s %s\n",
+                           ipsec6_logpacketstr(ip6, spi), ipsec_logsastr(sav)));
+                               IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
+                               goto bad;
+                       }               
+#endif /* INET6 */
+               } else {
+                       ipseclog((LOG_ERR, "ipsec tunnel unsupported address family "
+                                 "in ESP input\n"));
                        goto bad;
                }
-#endif
 
                key_sa_recordxfer(sav, m);
-
-               s = splimp();
-               if (IF_QFULL(&ipintrq)) {
-                       ipsecstat.in_inval++;
+               if (ipsec_addhist(m, IPPROTO_ESP, spi) != 0 ||
+                   ipsec_addhist(m, IPPROTO_IPV4, 0) != 0) {
+                       IPSEC_STAT_INCREMENT(ipsecstat.in_nomem);
                        goto bad;
                }
-               IF_ENQUEUE(&ipintrq, m);
-               m = NULL;
-               schednetisr(NETISR_IP); /*can be skipped but to make sure*/
-               splx(s);
+               
+               /* Clear the csum flags, they can't be valid for the inner headers */
+               m->m_pkthdr.csum_flags = 0;
+               proto_input(ifamily == AF_INET ? PF_INET : PF_INET6, m);
                nxt = IPPROTO_DONE;
+               KERNEL_DEBUG(DBG_FNC_ESPIN | DBG_FUNC_END, 2,0,0,0,0);
        } else {
                /*
                 * strip off ESP header and IV.
@@ -401,10 +469,65 @@ noreplaycheck:
                ip->ip_p = nxt;
 
                key_sa_recordxfer(sav, m);
+               if (ipsec_addhist(m, IPPROTO_ESP, spi) != 0) {
+                       IPSEC_STAT_INCREMENT(ipsecstat.in_nomem);
+                       goto bad;
+               }
+               
+               /*
+                * Set the csum valid flag: if we authenticated the
+                * packet, the payload shouldn't be corrupt unless
+                * it was corrupted before being signed on the other
+                * side.
+                */
+               if (nxt == IPPROTO_TCP || nxt == IPPROTO_UDP) {
+                       m->m_pkthdr.csum_flags = CSUM_DATA_VALID | CSUM_PSEUDO_HDR;
+                       m->m_pkthdr.csum_data = 0xFFFF;
+               }
 
-               if (nxt != IPPROTO_DONE)
-                       (*ip_protox[nxt]->pr_input)(m, off);
-               else
+               if (nxt != IPPROTO_DONE) {
+                       if ((ip_protox[nxt]->pr_flags & PR_LASTHDR) != 0 &&
+                           ipsec4_in_reject(m, NULL)) {
+                               IPSEC_STAT_INCREMENT(ipsecstat.in_polvio);
+                               goto bad;
+                       }
+                       KERNEL_DEBUG(DBG_FNC_ESPIN | DBG_FUNC_END, 3,0,0,0,0);
+                       
+                       /* translate encapsulated UDP port ? */
+                       if ((sav->flags & SADB_X_EXT_NATT_MULTIPLEUSERS) != 0)  {
+                               struct udphdr   *udp;
+                               
+                               if (nxt != IPPROTO_UDP) {       /* not UDP packet - drop it */
+                                       IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
+                                       goto bad;
+                               }
+                                       
+                               if (m->m_len < off + sizeof(struct udphdr)) {
+                                       m = m_pullup(m, off + sizeof(struct udphdr));
+                                       if (!m) {
+                                               ipseclog((LOG_DEBUG,
+                                                       "IPv4 ESP input: can't pullup UDP header in esp4_input\n"));
+                                               IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
+                                               goto bad;
+                                       }
+                                       ip = mtod(m, struct ip *);
+                               }
+                               udp = (struct udphdr *)(((u_int8_t *)ip) + off);
+                       
+                               lck_mtx_lock(sadb_mutex);
+                               if (sav->natt_encapsulated_src_port == 0) {     
+                                       sav->natt_encapsulated_src_port = udp->uh_sport;
+                               } else if (sav->natt_encapsulated_src_port != udp->uh_sport) {  /* something wrong */
+                                       IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
+                                       lck_mtx_unlock(sadb_mutex);
+                                       goto bad;
+                               }
+                               lck_mtx_unlock(sadb_mutex);
+                               udp->uh_sport = htons(sav->remote_ike_port);
+                               udp->uh_sum = 0;
+                       }
+                       ip_proto_dispatch_in(m, off, nxt, 0);
+               } else
                        m_freem(m);
                m = NULL;
        }
@@ -412,28 +535,29 @@ noreplaycheck:
        if (sav) {
                KEYDEBUG(KEYDEBUG_IPSEC_STAMP,
                        printf("DP esp4_input call free SA:%p\n", sav));
-               key_freesav(sav);
+               key_freesav(sav, KEY_SADB_UNLOCKED);
        }
-       ipsecstat.in_success++;
+       IPSEC_STAT_INCREMENT(ipsecstat.in_success);
        return;
 
 bad:
        if (sav) {
                KEYDEBUG(KEYDEBUG_IPSEC_STAMP,
                        printf("DP esp4_input call free SA:%p\n", sav));
-               key_freesav(sav);
+               key_freesav(sav, KEY_SADB_UNLOCKED);
        }
        if (m)
                m_freem(m);
+       KERNEL_DEBUG(DBG_FNC_ESPIN | DBG_FUNC_END, 4,0,0,0,0);
        return;
 }
 #endif /* INET */
 
 #if INET6
 int
-esp6_input(mp, offp, proto)
+esp6_input(mp, offp)
        struct mbuf **mp;
-       int *offp, proto;
+       int *offp;
 {
        struct mbuf *m = *mp;
        int off = *offp;
@@ -444,26 +568,25 @@ esp6_input(mp, offp, proto)
        struct secasvar *sav = NULL;
        size_t taillen;
        u_int16_t nxt;
-       struct esp_algorithm *algo;
+       const struct esp_algorithm *algo;
        int ivlen;
        size_t esplen;
-       int s;
 
        /* sanity check for alignment. */
        if (off % 4 != 0 || m->m_pkthdr.len % 4 != 0) {
                ipseclog((LOG_ERR, "IPv6 ESP input: packet alignment problem "
                        "(off=%d, pktlen=%d)\n", off, m->m_pkthdr.len));
-               ipsec6stat.in_inval++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_inval);
                goto bad;
        }
 
 #ifndef PULLDOWN_TEST
-       IP6_EXTHDR_CHECK(m, off, ESPMAXLEN, IPPROTO_DONE);
+       IP6_EXTHDR_CHECK(m, off, ESPMAXLEN, {return IPPROTO_DONE;});
        esp = (struct esp *)(mtod(m, caddr_t) + off);
 #else
        IP6_EXTHDR_GET(esp, struct esp *, m, off, ESPMAXLEN);
        if (esp == NULL) {
-               ipsec6stat.in_inval++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_inval);
                return IPPROTO_DONE;
        }
 #endif
@@ -472,7 +595,7 @@ esp6_input(mp, offp, proto)
        if (ntohs(ip6->ip6_plen) == 0) {
                ipseclog((LOG_ERR, "IPv6 ESP input: "
                    "ESP with IPv6 jumbogram is not supported.\n"));
-               ipsec6stat.in_inval++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_inval);
                goto bad;
        }
 
@@ -485,7 +608,7 @@ esp6_input(mp, offp, proto)
                ipseclog((LOG_WARNING,
                    "IPv6 ESP input: no key association found for spi %u\n",
                    (u_int32_t)ntohl(spi)));
-               ipsec6stat.in_nosa++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_nosa);
                goto bad;
        }
        KEYDEBUG(KEYDEBUG_IPSEC_STAMP,
@@ -495,25 +618,24 @@ esp6_input(mp, offp, proto)
                ipseclog((LOG_DEBUG,
                    "IPv6 ESP input: non-mature/dying SA found for spi %u\n",
                    (u_int32_t)ntohl(spi)));
-               ipsec6stat.in_badspi++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_badspi);
                goto bad;
        }
-       if (sav->alg_enc == SADB_EALG_NONE) {
+       algo = esp_algorithm_lookup(sav->alg_enc);
+       if (!algo) {
                ipseclog((LOG_DEBUG, "IPv6 ESP input: "
-                   "unspecified encryption algorithm for spi %u\n",
+                   "unsupported encryption algorithm for spi %u\n",
                    (u_int32_t)ntohl(spi)));
-               ipsec6stat.in_badspi++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_badspi);
                goto bad;
        }
 
-       algo = &esp_algorithms[sav->alg_enc];   /*XXX*/
-
        /* check if we have proper ivlen information */
        ivlen = sav->ivlen;
        if (ivlen < 0) {
                ipseclog((LOG_ERR, "inproper ivlen in IPv6 ESP input: %s %s\n",
                    ipsec6_logpacketstr(ip6, spi), ipsec_logsastr(sav)));
-               ipsec6stat.in_badspi++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_badspi);
                goto bad;
        }
 
@@ -521,7 +643,8 @@ esp6_input(mp, offp, proto)
         && (sav->alg_auth && sav->key_auth)))
                goto noreplaycheck;
 
-       if (sav->alg_auth == SADB_AALG_NULL)
+       if (sav->alg_auth == SADB_X_AALG_NULL ||
+           sav->alg_auth == SADB_AALG_NONE)
                goto noreplaycheck;
 
        /*
@@ -530,7 +653,7 @@ esp6_input(mp, offp, proto)
        if (ipsec_chkreplay(ntohl(((struct newesp *)esp)->esp_seq), sav))
                ; /*okey*/
        else {
-               ipsec6stat.in_espreplay++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_espreplay);
                ipseclog((LOG_WARNING,
                    "replay packet in IPv6 ESP input: %s %s\n",
                    ipsec6_logpacketstr(ip6, spi), ipsec_logsastr(sav)));
@@ -541,16 +664,22 @@ esp6_input(mp, offp, proto)
     {
        u_char sum0[AH_MAXSUMSIZE];
        u_char sum[AH_MAXSUMSIZE];
-       struct ah_algorithm *sumalgo;
+       const struct ah_algorithm *sumalgo;
        size_t siz;
 
-       sumalgo = &ah_algorithms[sav->alg_auth];
+       sumalgo = ah_algorithm_lookup(sav->alg_auth);
+       if (!sumalgo)
+               goto noreplaycheck;
        siz = (((*sumalgo->sumsiz)(sav) + 3) & ~(4 - 1));
+       if (m->m_pkthdr.len < off + ESPMAXLEN + siz) {
+               IPSEC_STAT_INCREMENT(ipsecstat.in_inval);
+               goto bad;
+       }
        if (AH_MAXSUMSIZE < siz) {
                ipseclog((LOG_DEBUG,
                    "internal error: AH_MAXSUMSIZE must be larger than %lu\n",
                    (u_long)siz));
-               ipsec6stat.in_inval++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_inval);
                goto bad;
        }
 
@@ -559,14 +688,14 @@ esp6_input(mp, offp, proto)
        if (esp_auth(m, off, m->m_pkthdr.len - off - siz, sav, sum)) {
                ipseclog((LOG_WARNING, "auth fail in IPv6 ESP input: %s %s\n",
                    ipsec6_logpacketstr(ip6, spi), ipsec_logsastr(sav)));
-               ipsec6stat.in_espauthfail++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_espauthfail);
                goto bad;
        }
 
        if (bcmp(sum0, sum, siz) != 0) {
                ipseclog((LOG_WARNING, "auth fail in IPv6 ESP input: %s %s\n",
                    ipsec6_logpacketstr(ip6, spi), ipsec_logsastr(sav)));
-               ipsec6stat.in_espauthfail++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_espauthfail);
                goto bad;
        }
 
@@ -576,7 +705,7 @@ esp6_input(mp, offp, proto)
        ip6->ip6_plen = htons(ntohs(ip6->ip6_plen) - siz);
 
        m->m_flags |= M_AUTHIPDGM;
-       ipsec6stat.in_espauthsucc++;
+       IPSEC_STAT_INCREMENT(ipsec6stat.in_espauthsucc);
     }
 
        /*
@@ -584,7 +713,7 @@ esp6_input(mp, offp, proto)
         */
        if ((sav->flags & SADB_X_EXT_OLD) == 0 && sav->replay) {
                if (ipsec_updatereplay(ntohl(((struct newesp *)esp)->esp_seq), sav)) {
-                       ipsec6stat.in_espreplay++;
+                       IPSEC_STAT_INCREMENT(ipsec6stat.in_espreplay);
                        goto bad;
                }
        }
@@ -606,34 +735,44 @@ noreplaycheck:
        if (m->m_pkthdr.len < off + esplen + ivlen + sizeof(esptail)) {
                ipseclog((LOG_WARNING,
                    "IPv6 ESP input: packet too short\n"));
-               ipsec6stat.in_inval++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_inval);
                goto bad;
        }
 
 #ifndef PULLDOWN_TEST
-       IP6_EXTHDR_CHECK(m, off, esplen + ivlen, IPPROTO_DONE); /*XXX*/
+       IP6_EXTHDR_CHECK(m, off, esplen + ivlen, return IPPROTO_DONE);  /*XXX*/
 #else
        IP6_EXTHDR_GET(esp, struct esp *, m, off, esplen + ivlen);
        if (esp == NULL) {
-               ipsec6stat.in_inval++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_inval);
                m = NULL;
                goto bad;
        }
 #endif
        ip6 = mtod(m, struct ip6_hdr *);        /*set it again just in case*/
 
+       /*
+        * pre-compute and cache intermediate key
+        */
+       if (esp_schedule(algo, sav) != 0) {
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_inval);
+               goto bad;
+       }
+
        /*
         * decrypt the packet.
         */
        if (!algo->decrypt)
                panic("internal error: no decrypt function");
        if ((*algo->decrypt)(m, off, sav, algo, ivlen)) {
-               ipseclog((LOG_ERR, "decrypt fail in IPv6 ESP input: %s %s\n",
-                   ipsec6_logpacketstr(ip6, spi), ipsec_logsastr(sav)));
-               ipsec6stat.in_inval++;
+               /* m is already freed */
+               m = NULL;
+               ipseclog((LOG_ERR, "decrypt fail in IPv6 ESP input: %s\n",
+                   ipsec_logsastr(sav)));
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_inval);
                goto bad;
        }
-       ipsec6stat.in_esphist[sav->alg_enc]++;
+       IPSEC_STAT_INCREMENT(ipsec6stat.in_esphist[sav->alg_enc]);
 
        m->m_flags |= M_DECRYPTED;
 
@@ -650,7 +789,7 @@ noreplaycheck:
                ipseclog((LOG_WARNING,
                    "bad pad length in IPv6 ESP input: %s %s\n",
                    ipsec6_logpacketstr(ip6, spi), ipsec_logsastr(sav)));
-               ipsec6stat.in_inval++;
+               IPSEC_STAT_INCREMENT(ipsec6stat.in_inval);
                goto bad;
        }
 
@@ -660,7 +799,7 @@ noreplaycheck:
        ip6->ip6_plen = htons(ntohs(ip6->ip6_plen) - taillen);
 
        /* was it transmitted over the IPsec tunnel SA? */
-       if (ipsec6_tunnel_validate(ip6, nxt, sav)) {
+       if (ipsec6_tunnel_validate(m, off + esplen + ivlen, nxt, sav)) {
                /*
                 * strip off all the headers that precedes ESP header.
                 *      IP6 xx ESP IP6' payload -> IP6' payload
@@ -682,7 +821,7 @@ noreplaycheck:
 #endif
                        m = m_pullup(m, sizeof(*ip6));
                        if (!m) {
-                               ipsec6stat.in_inval++;
+                               IPSEC_STAT_INCREMENT(ipsec6stat.in_inval);
                                goto bad;
                        }
                }
@@ -695,29 +834,17 @@ noreplaycheck:
                            "in IPv6 ESP input: %s %s\n",
                            ipsec6_logpacketstr(ip6, spi),
                            ipsec_logsastr(sav)));
-                       ipsec6stat.in_inval++;
-                       goto bad;
-               }
-
-#if 0 /* XXX should call ipfw rather than ipsec_in_reject, shouldn't it ? */
-               /* drop it if it does not match the default policy */
-               if (ipsec6_in_reject(m, NULL)) {
-                       ipsec6stat.in_polvio++;
+                       IPSEC_STAT_INCREMENT(ipsec6stat.in_inval);
                        goto bad;
                }
-#endif
 
                key_sa_recordxfer(sav, m);
-
-               s = splimp();
-               if (IF_QFULL(&ip6intrq)) {
-                       ipsec6stat.in_inval++;
+               if (ipsec_addhist(m, IPPROTO_ESP, spi) != 0 || 
+                   ipsec_addhist(m, IPPROTO_IPV6, 0) != 0) {
+                       IPSEC_STAT_INCREMENT(ipsec6stat.in_nomem);
                        goto bad;
                }
-               IF_ENQUEUE(&ip6intrq, m);
-               m = NULL;
-               schednetisr(NETISR_IPV6); /*can be skipped but to make sure*/
-               splx(s);
+               proto_input(PF_INET6, m);
                nxt = IPPROTO_DONE;
        } else {
                /*
@@ -755,15 +882,65 @@ noreplaycheck:
                                goto bad;
                        }
                        m_adj(n, stripsiz);
-                       m_cat(m, n);
                        /* m_cat does not update m_pkthdr.len */
                        m->m_pkthdr.len += n->m_pkthdr.len;
+                       m_cat(m, n);
+               }
+
+#ifndef PULLDOWN_TEST
+               /*
+                * KAME requires that the packet to be contiguous on the
+                * mbuf.  We need to make that sure.
+                * this kind of code should be avoided.
+                * XXX other conditions to avoid running this part?
+                */
+               if (m->m_len != m->m_pkthdr.len) {
+                       struct mbuf *n = NULL;
+                       int maxlen;
+
+                       MGETHDR(n, M_DONTWAIT, MT_HEADER);      /* MAC-OK */
+                       maxlen = MHLEN;
+                       if (n)
+                               M_COPY_PKTHDR(n, m);
+                       if (n && m->m_pkthdr.len > maxlen) {
+                               MCLGET(n, M_DONTWAIT);
+                               maxlen = MCLBYTES;
+                               if ((n->m_flags & M_EXT) == 0) {
+                                       m_free(n);
+                                       n = NULL;
+                               }
+                       }
+                       if (!n) {
+                               printf("esp6_input: mbuf allocation failed\n");
+                               goto bad;
+                       }
+
+                       if (m->m_pkthdr.len <= maxlen) {
+                               m_copydata(m, 0, m->m_pkthdr.len, mtod(n, caddr_t));
+                               n->m_len = m->m_pkthdr.len;
+                               n->m_pkthdr.len = m->m_pkthdr.len;
+                               n->m_next = NULL;
+                               m_freem(m);
+                       } else {
+                               m_copydata(m, 0, maxlen, mtod(n, caddr_t));
+                               n->m_len = maxlen;
+                               n->m_pkthdr.len = m->m_pkthdr.len;
+                               n->m_next = m;
+                               m_adj(m, maxlen);
+                               m->m_flags &= ~M_PKTHDR;
+                       }
+                       m = n;
                }
+#endif
 
                ip6 = mtod(m, struct ip6_hdr *);
                ip6->ip6_plen = htons(ntohs(ip6->ip6_plen) - stripsiz);
 
                key_sa_recordxfer(sav, m);
+               if (ipsec_addhist(m, IPPROTO_ESP, spi) != 0) {
+                       IPSEC_STAT_INCREMENT(ipsec6stat.in_nomem);
+                       goto bad;
+               }
        }
 
        *offp = off;
@@ -772,19 +949,125 @@ noreplaycheck:
        if (sav) {
                KEYDEBUG(KEYDEBUG_IPSEC_STAMP,
                        printf("DP esp6_input call free SA:%p\n", sav));
-               key_freesav(sav);
+               key_freesav(sav, KEY_SADB_UNLOCKED);
        }
-       ipsec6stat.in_success++;
+       IPSEC_STAT_INCREMENT(ipsec6stat.in_success);
        return nxt;
 
 bad:
        if (sav) {
                KEYDEBUG(KEYDEBUG_IPSEC_STAMP,
                        printf("DP esp6_input call free SA:%p\n", sav));
-               key_freesav(sav);
+               key_freesav(sav, KEY_SADB_UNLOCKED);
        }
        if (m)
                m_freem(m);
        return IPPROTO_DONE;
 }
+
+/*
+ * esp6_ctlinput: control-input handler for ESP carried over IPv6.
+ *
+ * cmd - PRC_* command code; values >= PRC_NCMDS are ignored.
+ * sa  - address the notification refers to; the call is ignored unless
+ *       it is an AF_INET6 address whose sa_len is sizeof(sockaddr_in6).
+ * d   - NULL, or a struct ip6ctlparam supplying the mbuf, the IPv6
+ *       header and the offset at which the ESP header is read.
+ *
+ * When an IPv6 header is supplied, the notification is first relayed
+ * through pfctlinput2() with only the source address filled in.  For
+ * PRC_MSGSIZE the SPI is then read from the ESP header and looked up with
+ * key_allocsa(); icmp6_mtudisc_update() is told whether an SA in the
+ * MATURE or DYING state was found.
+ */
+void
+esp6_ctlinput(cmd, sa, d)
+       int cmd;
+       struct sockaddr *sa;
+       void *d;
+{
+       const struct newesp *espp;
+       struct newesp esp;
+       struct ip6ctlparam *ip6cp = NULL, ip6cp1;
+       struct secasvar *sav;
+       struct ip6_hdr *ip6;
+       struct mbuf *m;
+       int off;
+       struct sockaddr_in6 *sa6_src, *sa6_dst;
+
+       if (sa->sa_family != AF_INET6 ||
+           sa->sa_len != sizeof(struct sockaddr_in6))
+               return;
+       if ((unsigned)cmd >= PRC_NCMDS)
+               return;
+
+       /* if the parameter is from icmp6, decode it. */
+       if (d != NULL) {
+               ip6cp = (struct ip6ctlparam *)d;
+               m = ip6cp->ip6c_m;
+               ip6 = ip6cp->ip6c_ip6;
+               off = ip6cp->ip6c_off;
+       } else {
+               /* off is left unset here; it is only read when ip6 != NULL */
+               m = NULL;
+               ip6 = NULL;
+       }
+
+       if (ip6) {
+               /*
+                * Notify the error to all possible sockets via pfctlinput2.
+                * Since the upper layer information (such as protocol type,
+                * source and destination ports) is embedded in the encrypted
+                * data and might have been cut, we can't directly call
+                * an upper layer ctlinput function. However, the pcbnotify
+                * function will consider source and destination addresses
+                * as well as the flow info value, and may be able to find
+                * some PCB that should be notified.
+                * Although pfctlinput2 will call esp6_ctlinput(), there is
+                * no possibility of an infinite loop of function calls,
+                * because we don't pass the inner IPv6 header.
+                */
+               bzero(&ip6cp1, sizeof(ip6cp1));
+               ip6cp1.ip6c_src = ip6cp->ip6c_src;
+               pfctlinput2(cmd, sa, (void *)&ip6cp1);
+
+               /*
+                * Then go to special cases that need ESP header information.
+                * XXX: We assume that when ip6 is non NULL,
+                * M and OFF are valid.
+                */
+
+               /* check if we can safely examine src and dst ports */
+               if (m->m_pkthdr.len < off + sizeof(esp))
+                       return;
+
+               if (m->m_len < off + sizeof(esp)) {
+                       /*
+                        * this should be rare case,
+                        * so we compromise on this copy...
+                        */
+                       m_copydata(m, off, sizeof(esp), (caddr_t)&esp);
+                       espp = &esp;
+               } else
+                       espp = (struct newesp*)(mtod(m, caddr_t) + off);
+
+               if (cmd == PRC_MSGSIZE) {
+                       int valid = 0;
+
+                       /*
+                        * Check to see if we have a valid SA corresponding to
+                        * the address in the ICMP message payload.
+                        */
+                       sa6_src = ip6cp->ip6c_src;
+                       sa6_dst = (struct sockaddr_in6 *)sa;
+                       sav = key_allocsa(AF_INET6,
+                                         (caddr_t)&sa6_src->sin6_addr,
+                                         (caddr_t)&sa6_dst->sin6_addr,
+                                         IPPROTO_ESP, espp->esp_spi);
+                       if (sav) {
+                               if (sav->state == SADB_SASTATE_MATURE ||
+                                   sav->state == SADB_SASTATE_DYING)
+                                       valid++;
+                               /*
+                                * No SADB lock is taken anywhere in this
+                                * function, so drop the reference with
+                                * KEY_SADB_UNLOCKED, as esp6_input() does.
+                                */
+                               key_freesav(sav, KEY_SADB_UNLOCKED);
+                       }
+
+                       /* XXX Further validation? */
+
+                       /*
+                        * Depending on the value of "valid" and routing table
+                        * size (mtudisc_{hi,lo}wat), we will:
+                        * - recalculate the new MTU and create the
+                        *   corresponding routing entry, or
+                        * - ignore the MTU change notification.
+                        */
+                       icmp6_mtudisc_update((struct ip6ctlparam *)d, valid);
+               }
+       } else {
+               /* we normally notify any pcb here */
+       }
+}
 #endif /* INET6 */