2 * Copyright (c) 2012-2017 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
28 #include <sys/param.h>
29 #include <sys/systm.h>
30 #include <netinet/in_systm.h>
31 #include <sys/socket.h>
32 #include <sys/socketvar.h>
33 #include <sys/syslog.h>
34 #include <net/route.h>
35 #include <netinet/in.h>
38 #include <netinet/ip.h>
39 #include <netinet/ip_var.h>
40 #include <netinet/in_var.h>
41 #include <netinet/tcp.h>
42 #include <netinet/tcp_cache.h>
43 #include <netinet/tcp_seq.h>
44 #include <netinet/tcpip.h>
45 #include <netinet/tcp_fsm.h>
46 #include <netinet/mptcp_var.h>
47 #include <netinet/mptcp.h>
48 #include <netinet/mptcp_opt.h>
49 #include <netinet/mptcp_seq.h>
51 #include <libkern/crypto/sha1.h>
52 #include <netinet/mptcp_timer.h>
/*
 * Forward declarations of file-local (static) helpers. All three are
 * called by functions further down in this file.
 */
56 static int mptcp_validate_join_hmac(struct tcpcb
*, u_char
*, int);
57 static int mptcp_snd_mpprio(struct tcpcb
*tp
, u_char
*cp
, int optlen
);
58 static void mptcp_send_remaddr_opt(struct tcpcb
*, struct mptcp_remaddr_opt
*);
61 * MPTCP Options Output Processing
/*
 * Writes an MP_CAPABLE option (kind TCPOPT_MULTIPATH, subtype MPO_CAPABLE)
 * followed by the local key into the TCP option buffer.
 *
 *   so     - socket; its tcpcb and mptcb are obtained with
 *            sototcpcb()/tptomptp().
 *   opt    - option buffer; the option is copied to opt + optlen.
 *   optlen - number of option bytes already in opt; advanced by the size of
 *            the common MP_CAPABLE header and then by sizeof (mptcp_key_t).
 *
 * When t_rxtshift exceeds mptcp_mpcap_retries, the loss heuristic is
 * notified once (guarded by the two HEURISTIC flags). When
 * tcp_heuristic_do_mptcp() says no, MPTCPF_FALLBACK_HEURISTIC is set.
 *
 * NOTE(review): this listing is missing lines (return type, braces, return
 * statements, the mmco_len assignment target). Presumably the function
 * returns the updated optlen -- confirm against the full file.
 */
65 mptcp_setup_first_subflow_syn_opts(struct socket
*so
, u_char
*opt
, unsigned optlen
)
67 struct mptcp_mpcapable_opt_common mptcp_opt
;
68 struct tcpcb
*tp
= sototcpcb(so
);
69 struct mptcb
*mp_tp
= tptomptp(tp
);
71 mpte_lock_assert_held(mp_tp
->mpt_mpte
);
74 * Avoid retransmitting the MP_CAPABLE option.
76 if (tp
->t_rxtshift
> mptcp_mpcap_retries
) {
77 if (!(mp_tp
->mpt_flags
& (MPTCPF_FALLBACK_HEURISTIC
| MPTCPF_HEURISTIC_TRAC
))) {
78 mp_tp
->mpt_flags
|= MPTCPF_HEURISTIC_TRAC
;
79 tcp_heuristic_mptcp_loss(tp
);
84 if (!tcp_heuristic_do_mptcp(tp
)) {
85 mp_tp
->mpt_flags
|= MPTCPF_FALLBACK_HEURISTIC
;
89 bzero(&mptcp_opt
, sizeof (struct mptcp_mpcapable_opt_common
));
91 mptcp_opt
.mmco_kind
= TCPOPT_MULTIPATH
;
93 sizeof (struct mptcp_mpcapable_opt_common
) +
95 mptcp_opt
.mmco_subtype
= MPO_CAPABLE
;
96 mptcp_opt
.mmco_version
= mp_tp
->mpt_version
;
97 mptcp_opt
.mmco_flags
|= MPCAP_PROPOSAL_SBIT
;
98 if (mp_tp
->mpt_flags
& MPTCPF_CHECKSUM
)
99 mptcp_opt
.mmco_flags
|= MPCAP_CHECKSUM_CBIT
;
/* Common header first, then the local key directly behind it. */
100 memcpy(opt
+ optlen
, &mptcp_opt
, sizeof (struct mptcp_mpcapable_opt_common
));
101 optlen
+= sizeof (struct mptcp_mpcapable_opt_common
);
102 memcpy(opt
+ optlen
, &mp_tp
->mpt_localkey
, sizeof (mptcp_key_t
));
103 optlen
+= sizeof (mptcp_key_t
);
/*
 * Writes an MP_JOIN request option (struct mptcp_mpjoin_opt_req) into the
 * TCP option buffer at opt + optlen and advances optlen by mmjo_len.
 *
 * The option carries the local address id (t_local_aid), the peer token
 * (mpt_remotetoken) and a random value obtained from mptcp_get_rands().
 * The backup bit (MPTCP_BACKUP) is set when the subflow is already flagged
 * TMPF_BACKUP_PATH, or when the bound interface is cellular and the service
 * type is not MPTCP_SVCTYPE_AGGREGATE; in that second case TMPF_BACKUP_PATH
 * is also set on the tcpcb.
 *
 * NOTE(review): the lines that assign `tp` (initialised to NULL here) and
 * declare `mpts` are not visible in this listing, nor are the return
 * statements. Presumably the updated optlen is returned -- confirm.
 */
109 mptcp_setup_join_subflow_syn_opts(struct socket
*so
, u_char
*opt
, unsigned optlen
)
111 struct mptcp_mpjoin_opt_req mpjoin_req
;
112 struct inpcb
*inp
= sotoinpcb(so
);
113 struct tcpcb
*tp
= NULL
;
125 VERIFY(tptomptp(tp
));
126 mpte_lock_assert_held(tptomptp(tp
)->mpt_mpte
);
128 bzero(&mpjoin_req
, sizeof (mpjoin_req
));
129 mpjoin_req
.mmjo_kind
= TCPOPT_MULTIPATH
;
130 mpjoin_req
.mmjo_len
= sizeof (mpjoin_req
);
/* The subtype lives in the upper four bits; the backup bit is OR-ed in below. */
131 mpjoin_req
.mmjo_subtype_bkp
= MPO_JOIN
<< 4;
133 if (tp
->t_mpflags
& TMPF_BACKUP_PATH
) {
134 mpjoin_req
.mmjo_subtype_bkp
|= MPTCP_BACKUP
;
135 } else if (inp
->inp_boundifp
&& IFNET_IS_CELLULAR(inp
->inp_boundifp
) &&
136 mpts
->mpts_mpte
->mpte_svctype
!= MPTCP_SVCTYPE_AGGREGATE
) {
137 mpjoin_req
.mmjo_subtype_bkp
|= MPTCP_BACKUP
;
138 tp
->t_mpflags
|= TMPF_BACKUP_PATH
;
140 mpts
->mpts_flags
|= MPTSF_PREFERRED
;
143 mpjoin_req
.mmjo_addr_id
= tp
->t_local_aid
;
144 mpjoin_req
.mmjo_peer_token
= tptomptp(tp
)->mpt_remotetoken
;
/* A zero peer token is only logged here; the option is still built. */
145 if (mpjoin_req
.mmjo_peer_token
== 0) {
146 mptcplog((LOG_DEBUG
, "%s: peer token 0", __func__
),
147 MPTCP_SOCKET_DBG
, MPTCP_LOGLVL_ERR
);
149 mptcp_get_rands(tp
->t_local_aid
, tptomptp(tp
),
150 &mpjoin_req
.mmjo_rand
, NULL
);
151 memcpy(opt
+ optlen
, &mpjoin_req
, mpjoin_req
.mmjo_len
);
152 optlen
+= mpjoin_req
.mmjo_len
;
/*
 * Writes the MP_JOIN option for the third ACK of a join handshake
 * (struct mptcp_mpjoin_opt_rsp2) at opt + optlen. The option's mmjo_mac
 * field is filled in by mptcp_get_hmac() for this subflow's local address
 * id.
 *
 * If fewer than sizeof (struct mptcp_mpjoin_opt_rsp2) bytes remain below
 * MAX_TCPOPTLEN, a message is printed instead.
 *
 * NOTE(review): the declaration of new_optlen and the return statements
 * are not visible in this listing. Presumably new_optlen (optlen plus the
 * option length) is returned, and the unchanged optlen on the no-space
 * path -- confirm against the full file.
 */
158 mptcp_setup_join_ack_opts(struct tcpcb
*tp
, u_char
*opt
, unsigned optlen
)
161 struct mptcp_mpjoin_opt_rsp2 join_rsp2
;
163 if ((MAX_TCPOPTLEN
- optlen
) < sizeof (struct mptcp_mpjoin_opt_rsp2
)) {
164 printf("%s: no space left %d \n", __func__
, optlen
);
168 bzero(&join_rsp2
, sizeof (struct mptcp_mpjoin_opt_rsp2
));
169 join_rsp2
.mmjo_kind
= TCPOPT_MULTIPATH
;
170 join_rsp2
.mmjo_len
= sizeof (struct mptcp_mpjoin_opt_rsp2
);
171 join_rsp2
.mmjo_subtype
= MPO_JOIN
;
172 mptcp_get_hmac(tp
->t_local_aid
, tptomptp(tp
),
173 (u_char
*)&join_rsp2
.mmjo_mac
);
174 memcpy(opt
+ optlen
, &join_rsp2
, join_rsp2
.mmjo_len
);
175 new_optlen
= optlen
+ join_rsp2
.mmjo_len
;
/*
 * Chooses which MPTCP option goes on an outgoing SYN: sockets without
 * SOF_MP_SEC_SUBFLOW get the first-subflow (MP_CAPABLE) builder, and the
 * second call below is the join-subflow (MP_JOIN) builder. The result of
 * whichever builder runs is stored in new_optlen.
 *
 * NOTE(review): the `else`, the declaration of new_optlen and the return
 * statement are not visible in this listing.
 */
180 mptcp_setup_syn_opts(struct socket
*so
, u_char
*opt
, unsigned optlen
)
184 if (!(so
->so_flags
& SOF_MP_SEC_SUBFLOW
))
185 new_optlen
= mptcp_setup_first_subflow_syn_opts(so
, opt
, optlen
);
187 new_optlen
= mptcp_setup_join_subflow_syn_opts(so
, opt
, optlen
);
/*
 * Writes an MP_FAIL option (struct mptcp_mpfail_opt) at opt + optlen. Its
 * data sequence number is the connection's mpt_rcvnxt, converted with
 * mptcp_hton64().
 *
 * TMPF_SND_MPFAIL is cleared on every path visible here: early in the
 * function, when the option space is too small, and after the option has
 * been copied.
 *
 * NOTE(review): the declaration of `dsn`, the conditions guarding the
 * early exits and the return statements are not visible in this listing.
 * The caller assigns the return value to its optlen, so presumably the
 * updated option length is returned -- confirm.
 */
193 mptcp_send_mpfail(struct tcpcb
*tp
, u_char
*opt
, unsigned int optlen
)
195 #pragma unused(tp, opt, optlen)
197 struct mptcb
*mp_tp
= NULL
;
198 struct mptcp_mpfail_opt fail_opt
;
200 int len
= sizeof (struct mptcp_mpfail_opt
);
202 mp_tp
= tptomptp(tp
);
204 tp
->t_mpflags
&= ~TMPF_SND_MPFAIL
;
208 mpte_lock_assert_held(mp_tp
->mpt_mpte
);
210 /* if option space low give up */
211 if ((MAX_TCPOPTLEN
- optlen
) < sizeof (struct mptcp_mpfail_opt
)) {
212 tp
->t_mpflags
&= ~TMPF_SND_MPFAIL
;
216 dsn
= mp_tp
->mpt_rcvnxt
;
218 bzero(&fail_opt
, sizeof (fail_opt
));
219 fail_opt
.mfail_kind
= TCPOPT_MULTIPATH
;
220 fail_opt
.mfail_len
= len
;
221 fail_opt
.mfail_subtype
= MPO_FAIL
;
222 fail_opt
.mfail_dsn
= mptcp_hton64(dsn
);
223 memcpy(opt
+ optlen
, &fail_opt
, len
);
225 tp
->t_mpflags
&= ~TMPF_SND_MPFAIL
;
226 mptcplog((LOG_DEBUG
, "%s: %d \n", __func__
,
227 tp
->t_local_aid
), (MPTCP_SOCKET_DBG
| MPTCP_SENDER_DBG
),
/*
 * Writes a DSS option with the mapping flag (MDSS_M) and a data length of
 * zero -- the "infinite mapping" -- at opt + optlen.
 *
 * The DSN and subflow sequence number come from one of two places:
 *   - with MPTCPF_RECVD_MPFAIL set, the values saved at checksum failure
 *     (mpt_dsn_at_csum_fail / mpt_ssn_at_csum_fail);
 *   - otherwise the low 32 bits of mpt_snduna, with the subflow sequence
 *     number either 1 (TFO SYN data acked and nothing else acked yet) or
 *     snd_una - mpts_iss.
 * Both are converted to network byte order before being copied. A checksum
 * value `csum` of csum_len bytes is copied into the buffer as well; the
 * existing comment says it is zero for an infinite mapping.
 *
 * On the path that reaches the end, TMPF_INFIN_SENT is set and
 * tcpstat.tcps_estab_fallback is incremented.
 *
 * NOTE(review): the declarations of csum/csum_len, several `else`
 * branches, the early-exit bodies and the return statements are not
 * visible in this listing.
 */
233 mptcp_send_infinite_mapping(struct tcpcb
*tp
, u_char
*opt
, unsigned int optlen
)
235 struct mptcp_dsn_opt infin_opt
;
236 struct mptcb
*mp_tp
= NULL
;
237 size_t len
= sizeof (struct mptcp_dsn_opt
);
238 struct socket
*so
= tp
->t_inpcb
->inp_socket
;
244 mp_tp
= tptomptp(tp
);
248 mpte_lock_assert_held(mp_tp
->mpt_mpte
);
250 if (mp_tp
->mpt_flags
& MPTCPF_CHECKSUM
)
254 if ((MAX_TCPOPTLEN
- optlen
) < (len
+ csum_len
))
257 bzero(&infin_opt
, sizeof (infin_opt
));
258 infin_opt
.mdss_copt
.mdss_kind
= TCPOPT_MULTIPATH
;
259 infin_opt
.mdss_copt
.mdss_len
= len
+ csum_len
;
260 infin_opt
.mdss_copt
.mdss_subtype
= MPO_DSS
;
261 infin_opt
.mdss_copt
.mdss_flags
|= MDSS_M
;
262 if (mp_tp
->mpt_flags
& MPTCPF_RECVD_MPFAIL
) {
263 infin_opt
.mdss_dsn
= (u_int32_t
)
264 MPTCP_DATASEQ_LOW32(mp_tp
->mpt_dsn_at_csum_fail
);
265 infin_opt
.mdss_subflow_seqn
= mp_tp
->mpt_ssn_at_csum_fail
;
268 * If MPTCP fallback happens, but TFO succeeds, the data on the
269 * SYN does not belong to the MPTCP data sequence space.
271 if ((tp
->t_tfo_stats
& TFO_S_SYN_DATA_ACKED
) &&
272 ((mp_tp
->mpt_local_idsn
+ 1) == mp_tp
->mpt_snduna
)) {
273 infin_opt
.mdss_subflow_seqn
= 1;
275 mptcplog((LOG_DEBUG
, "%s: idsn %llu snduna %llu \n",
276 __func__
, mp_tp
->mpt_local_idsn
,
278 (MPTCP_SOCKET_DBG
| MPTCP_SENDER_DBG
),
281 infin_opt
.mdss_subflow_seqn
= tp
->snd_una
- tp
->t_mpsub
->mpts_iss
;
283 infin_opt
.mdss_dsn
= (u_int32_t
)
284 MPTCP_DATASEQ_LOW32(mp_tp
->mpt_snduna
);
287 if ((infin_opt
.mdss_dsn
== 0) || (infin_opt
.mdss_subflow_seqn
== 0)) {
290 infin_opt
.mdss_dsn
= htonl(infin_opt
.mdss_dsn
);
291 infin_opt
.mdss_subflow_seqn
= htonl(infin_opt
.mdss_subflow_seqn
);
292 infin_opt
.mdss_data_len
= 0;
294 memcpy(opt
+ optlen
, &infin_opt
, len
);
297 /* The checksum field is set to 0 for infinite mapping */
299 memcpy(opt
+ optlen
, &csum
, csum_len
);
303 mptcplog((LOG_DEBUG
, "%s: dsn = %x, seq = %x len = %x\n", __func__
,
304 ntohl(infin_opt
.mdss_dsn
),
305 ntohl(infin_opt
.mdss_subflow_seqn
),
306 ntohs(infin_opt
.mdss_data_len
)),
307 (MPTCP_SOCKET_DBG
| MPTCP_SENDER_DBG
),
310 tp
->t_mpflags
|= TMPF_INFIN_SENT
;
311 tcpstat
.tcps_estab_fallback
++;
/*
 * Tests whether a mapping of `datalen` bytes starting at `dsn` ends exactly
 * at the connection's mpt_sndmax. Before the comparison, `dsn` is OR-ed
 * with mpt_sndmax masked by MPTCP_DATASEQ_LOW32_MASK.
 *
 * NOTE(review): the mask name suggests the low 32 bits of mpt_sndmax are
 * merged into dsn; confirm this is the intended half when widening a
 * 32-bit DSN. The return statements are not visible in this listing;
 * DO_FIN stores the result in `sndfin`, so presumably non-zero means
 * "ok to send the DATA_FIN" -- confirm.
 */
317 mptcp_ok_to_fin(struct tcpcb
*tp
, u_int64_t dsn
, u_int32_t datalen
)
319 struct mptcb
*mp_tp
= tptomptp(tp
);
321 mpte_lock_assert_held(mp_tp
->mpt_mpte
);
323 dsn
= (mp_tp
->mpt_sndmax
& MPTCP_DATASEQ_LOW32_MASK
) | dsn
;
324 if ((dsn
+ datalen
) == mp_tp
->mpt_sndmax
)
/*
 * Builds the MPTCP options for an outgoing non-SYN segment into `opt`,
 * starting at offset `optlen`.
 *
 *   tp             - subflow tcpcb; its t_mpflags select what is sent.
 *   off            - offset passed to the mptcp_output_getm_dsnmap*()
 *                    helpers when a data sequence mapping is needed.
 *   opt / optlen   - option buffer and the bytes already used in it.
 *   flags          - TCP header flags; TH_SYN is handled separately.
 *   len            - payload length (used in logging and by the macros).
 *   p_mptcp_acknow - in/out: when TRUE on entry and no MPTCP signal flag
 *                    was acted on, the signal flags are cleared and it is
 *                    set to FALSE.
 *
 * Order of processing as visible below:
 *   1. Stop early if MPTCP is disabled, there is no mptcb, or the
 *      connection is closed.
 *   2. In fallback mode (TMPF_TCP_FALLBACK): MP_FAIL or infinite mapping.
 *   3. TMPF_SND_KEYS: MP_CAPABLE carrying the local and remote keys.
 *   4. TMPF_SND_JACK: MP_JOIN ACK, and the retransmit timer is armed.
 *   5. TMPF_SND_REM_ADDR / TMPF_SND_MPPRIO: remove-address and priority
 *      options.
 *   6. The DSS variants (DSN and/or Data ACK, 32- or 64-bit) and DATA_FIN.
 *   7. Bookkeeping for *p_mptcp_acknow.
 *
 * NOTE(review): this listing is missing many lines (braces, goto/return
 * statements, parts of the conditions, declarations such as dss_csum,
 * sndfin, sseq, sum). The comments here describe only what is visible.
 */
331 mptcp_setup_opts(struct tcpcb
*tp
, int32_t off
, u_char
*opt
,
332 unsigned int optlen
, int flags
, int len
,
333 boolean_t
*p_mptcp_acknow
)
335 struct inpcb
*inp
= (struct inpcb
*)tp
->t_inpcb
;
336 struct socket
*so
= inp
->inp_socket
;
337 struct mptcb
*mp_tp
= tptomptp(tp
);
338 boolean_t do_csum
= FALSE
;
339 boolean_t send_64bit_dsn
= FALSE
;
340 boolean_t send_64bit_ack
= FALSE
;
/* Snapshot of the signal flags, compared against the final value at the end. */
341 u_int32_t old_mpt_flags
= tp
->t_mpflags
& TMPF_MPTCP_SIGNALS
;
343 if (mptcp_enable
== 0 || mp_tp
== NULL
|| tp
->t_state
== TCPS_CLOSED
) {
348 mpte_lock_assert_held(mp_tp
->mpt_mpte
);
350 if (mp_tp
->mpt_flags
& MPTCPF_CHECKSUM
) {
354 /* tcp_output handles the SYN path separately */
355 if (flags
& TH_SYN
) {
359 if ((MAX_TCPOPTLEN
- optlen
) <
360 sizeof (struct mptcp_mpcapable_opt_common
)) {
361 mptcplog((LOG_ERR
, "%s: no space left %d flags %x tp->t_mpflags %x len %d\n",
362 __func__
, optlen
, flags
, tp
->t_mpflags
, len
),
363 MPTCP_SOCKET_DBG
, MPTCP_LOGLVL_ERR
);
/* Fallback mode: MP_FAIL if requested, otherwise the infinite mapping unless already sent. */
367 if (tp
->t_mpflags
& TMPF_TCP_FALLBACK
) {
368 if (tp
->t_mpflags
& TMPF_SND_MPFAIL
)
369 optlen
= mptcp_send_mpfail(tp
, opt
, optlen
);
370 else if (!(tp
->t_mpflags
& TMPF_INFIN_SENT
))
371 optlen
= mptcp_send_infinite_mapping(tp
, opt
, optlen
);
/* MP_CAPABLE carrying both keys (struct mptcp_mpcapable_opt_rsp1). */
375 if (tp
->t_mpflags
& TMPF_SND_KEYS
) {
376 struct mptcp_mpcapable_opt_rsp1 mptcp_opt
;
377 if ((MAX_TCPOPTLEN
- optlen
) <
378 sizeof (struct mptcp_mpcapable_opt_rsp1
))
380 bzero(&mptcp_opt
, sizeof (struct mptcp_mpcapable_opt_rsp1
));
381 mptcp_opt
.mmc_common
.mmco_kind
= TCPOPT_MULTIPATH
;
382 mptcp_opt
.mmc_common
.mmco_len
=
383 sizeof (struct mptcp_mpcapable_opt_rsp1
);
384 mptcp_opt
.mmc_common
.mmco_subtype
= MPO_CAPABLE
;
385 mptcp_opt
.mmc_common
.mmco_version
= mp_tp
->mpt_version
;
386 /* HMAC-SHA1 is the proposal */
387 mptcp_opt
.mmc_common
.mmco_flags
|= MPCAP_PROPOSAL_SBIT
;
388 if (mp_tp
->mpt_flags
& MPTCPF_CHECKSUM
)
389 mptcp_opt
.mmc_common
.mmco_flags
|= MPCAP_CHECKSUM_CBIT
;
390 mptcp_opt
.mmc_localkey
= mp_tp
->mpt_localkey
;
391 mptcp_opt
.mmc_remotekey
= mp_tp
->mpt_remotekey
;
392 memcpy(opt
+ optlen
, &mptcp_opt
, mptcp_opt
.mmc_common
.mmco_len
);
393 optlen
+= mptcp_opt
.mmc_common
.mmco_len
;
394 tp
->t_mpflags
&= ~TMPF_SND_KEYS
;
397 tp
->t_mpuna
= tp
->snd_una
;
399 /* it's a retransmission of the MP_CAPABLE ACK */
404 if (tp
->t_mpflags
& TMPF_SND_JACK
) {
405 /* Do the ACK part */
406 optlen
= mptcp_setup_join_ack_opts(tp
, opt
, optlen
);
408 tp
->t_mpuna
= tp
->snd_una
;
410 /* Start a timer to retransmit the ACK */
411 tp
->t_timer
[TCPT_JACK_RXMT
] =
412 OFFSET_FROM_START(tp
, tcp_jack_rxmt
);
414 tp
->t_mpflags
&= ~TMPF_SND_JACK
;
418 if (!(tp
->t_mpflags
& TMPF_MPTCP_TRUE
))
421 * From here on, all options are sent only if MPTCP_TRUE
422 * or when data is sent early on as in Fast Join
/* The remove-address flag is cleared below whether or not the option fit. */
425 if ((tp
->t_mpflags
& TMPF_MPTCP_TRUE
) &&
426 (tp
->t_mpflags
& TMPF_SND_REM_ADDR
)) {
427 int rem_opt_len
= sizeof (struct mptcp_remaddr_opt
);
428 if ((optlen
+ rem_opt_len
) <= MAX_TCPOPTLEN
) {
429 mptcp_send_remaddr_opt(tp
,
430 (struct mptcp_remaddr_opt
*)(opt
+ optlen
));
431 optlen
+= rem_opt_len
;
433 tp
->t_mpflags
&= ~TMPF_SND_REM_ADDR
;
437 if (tp
->t_mpflags
& TMPF_SND_MPPRIO
) {
438 optlen
= mptcp_snd_mpprio(tp
, opt
, optlen
);
441 if (mp_tp
->mpt_flags
& MPTCPF_SND_64BITDSN
) {
442 send_64bit_dsn
= TRUE
;
444 if (mp_tp
->mpt_flags
& MPTCPF_SND_64BITACK
)
445 send_64bit_ack
= TRUE
;
/*
 * Helper macros shared by the DSS branches below. They rely on the locals
 * `dssoptlen`, `optlen`, `len`, `tp` (and, for DO_FIN, `sndfin` and
 * `dss_csum`) being in scope at the point of use.
 */
447 #define CHECK_OPTLEN { \
448 if ((MAX_TCPOPTLEN - optlen) < dssoptlen) { \
449 mptcplog((LOG_ERR, "%s: dssoptlen %d optlen %d \n", __func__, \
450 dssoptlen, optlen), \
451 MPTCP_SOCKET_DBG, MPTCP_LOGLVL_ERR); \
456 #define DO_FIN(dsn_opt) { \
458 sndfin = mptcp_ok_to_fin(tp, dsn_opt.mdss_dsn, len); \
460 dsn_opt.mdss_copt.mdss_flags |= MDSS_F; \
461 dsn_opt.mdss_data_len += 1; \
463 dss_csum = in_addword(dss_csum, 1); \
467 #define CHECK_DATALEN { \
468 /* MPTCP socket does not support IP options */ \
469 if ((len + optlen + dssoptlen) > tp->t_maxopd) { \
470 mptcplog((LOG_ERR, "%s: nosp %d len %d opt %d %d %d\n", \
471 __func__, len, dssoptlen, optlen, \
472 tp->t_maxseg, tp->t_maxopd), \
473 MPTCP_SOCKET_DBG, MPTCP_LOGLVL_ERR); \
474 /* remove option length from payload len */ \
475 len = tp->t_maxopd - optlen - dssoptlen; \
/* 64-bit DSN with a 32-bit Data ACK (struct mptcp_dss64_ack32_opt). */
479 if ((tp
->t_mpflags
& TMPF_SEND_DSN
) &&
482 * If there was the need to send 64-bit Data ACK along
483 * with 64-bit DSN, then 26 or 28 bytes would be used.
484 * With timestamps and NOOP padding that will cause
485 * overflow. Hence, in the rare event that both 64-bit
486 * DSN and 64-bit ACK have to be sent, delay the send of
487 * 64-bit ACK until our 64-bit DSN is acked with a 64-bit ack.
488 * XXX If this delay causes issue, remove the 2-byte padding.
490 struct mptcp_dss64_ack32_opt dsn_ack_opt
;
491 unsigned int dssoptlen
= sizeof (dsn_ack_opt
);
500 bzero(&dsn_ack_opt
, sizeof (dsn_ack_opt
));
501 dsn_ack_opt
.mdss_copt
.mdss_kind
= TCPOPT_MULTIPATH
;
502 dsn_ack_opt
.mdss_copt
.mdss_subtype
= MPO_DSS
;
503 dsn_ack_opt
.mdss_copt
.mdss_len
= dssoptlen
;
504 dsn_ack_opt
.mdss_copt
.mdss_flags
|=
505 MDSS_M
| MDSS_m
| MDSS_A
;
509 mptcp_output_getm_dsnmap64(so
, off
,
510 &dsn_ack_opt
.mdss_dsn
,
511 &dsn_ack_opt
.mdss_subflow_seqn
,
512 &dsn_ack_opt
.mdss_data_len
,
515 if ((dsn_ack_opt
.mdss_data_len
== 0) ||
516 (dsn_ack_opt
.mdss_dsn
== 0)) {
520 if (tp
->t_mpflags
& TMPF_SEND_DFIN
) {
524 dsn_ack_opt
.mdss_ack
=
525 htonl(MPTCP_DATAACK_LOW32(mp_tp
->mpt_rcvnxt
));
527 dsn_ack_opt
.mdss_dsn
= mptcp_hton64(dsn_ack_opt
.mdss_dsn
);
528 dsn_ack_opt
.mdss_subflow_seqn
= htonl(
529 dsn_ack_opt
.mdss_subflow_seqn
);
530 dsn_ack_opt
.mdss_data_len
= htons(
531 dsn_ack_opt
.mdss_data_len
);
533 memcpy(opt
+ optlen
, &dsn_ack_opt
, sizeof (dsn_ack_opt
));
/* The 16-bit checksum is stored directly behind the option body. */
535 *((uint16_t *)(void *)(opt
+ optlen
+ sizeof (dsn_ack_opt
))) = dss_csum
;
538 mptcplog((LOG_DEBUG
,"%s: long DSS = %llx ACK = %llx \n", __func__
,
539 mptcp_ntoh64(dsn_ack_opt
.mdss_dsn
),
540 mptcp_ntoh64(dsn_ack_opt
.mdss_ack
)),
541 MPTCP_SOCKET_DBG
, MPTCP_LOGLVL_LOG
);
543 tp
->t_mpflags
&= ~TMPF_MPTCP_ACKNOW
;
/* 32-bit DSN only, no Data ACK (struct mptcp_dsn_opt, MDSS_M). */
547 if ((tp
->t_mpflags
& TMPF_SEND_DSN
) &&
549 !(tp
->t_mpflags
& TMPF_MPTCP_ACKNOW
)) {
550 struct mptcp_dsn_opt dsn_opt
;
551 unsigned int dssoptlen
= sizeof (struct mptcp_dsn_opt
);
560 bzero(&dsn_opt
, sizeof (dsn_opt
));
561 dsn_opt
.mdss_copt
.mdss_kind
= TCPOPT_MULTIPATH
;
562 dsn_opt
.mdss_copt
.mdss_subtype
= MPO_DSS
;
563 dsn_opt
.mdss_copt
.mdss_len
= dssoptlen
;
564 dsn_opt
.mdss_copt
.mdss_flags
|= MDSS_M
;
568 mptcp_output_getm_dsnmap32(so
, off
, &dsn_opt
.mdss_dsn
,
569 &dsn_opt
.mdss_subflow_seqn
,
570 &dsn_opt
.mdss_data_len
,
573 if ((dsn_opt
.mdss_data_len
== 0) ||
574 (dsn_opt
.mdss_dsn
== 0)) {
578 if (tp
->t_mpflags
& TMPF_SEND_DFIN
) {
582 dsn_opt
.mdss_dsn
= htonl(dsn_opt
.mdss_dsn
);
583 dsn_opt
.mdss_subflow_seqn
= htonl(dsn_opt
.mdss_subflow_seqn
);
584 dsn_opt
.mdss_data_len
= htons(dsn_opt
.mdss_data_len
);
585 memcpy(opt
+ optlen
, &dsn_opt
, sizeof (dsn_opt
));
587 *((uint16_t *)(void *)(opt
+ optlen
+ sizeof (dsn_opt
))) = dss_csum
;
590 tp
->t_mpflags
&= ~TMPF_MPTCP_ACKNOW
;
594 /* 32-bit Data ACK option */
595 if ((tp
->t_mpflags
& TMPF_MPTCP_ACKNOW
) &&
597 !(tp
->t_mpflags
& TMPF_SEND_DSN
) &&
598 !(tp
->t_mpflags
& TMPF_SEND_DFIN
)) {
600 struct mptcp_data_ack_opt dack_opt
;
601 unsigned int dssoptlen
= 0;
603 dssoptlen
= sizeof (dack_opt
);
607 bzero(&dack_opt
, dssoptlen
);
608 dack_opt
.mdss_copt
.mdss_kind
= TCPOPT_MULTIPATH
;
609 dack_opt
.mdss_copt
.mdss_len
= dssoptlen
;
610 dack_opt
.mdss_copt
.mdss_subtype
= MPO_DSS
;
611 dack_opt
.mdss_copt
.mdss_flags
|= MDSS_A
;
613 htonl(MPTCP_DATAACK_LOW32(mp_tp
->mpt_rcvnxt
));
614 memcpy(opt
+ optlen
, &dack_opt
, dssoptlen
);
616 VERIFY(optlen
<= MAX_TCPOPTLEN
);
617 tp
->t_mpflags
&= ~TMPF_MPTCP_ACKNOW
;
621 /* 64-bit Data ACK option */
622 if ((tp
->t_mpflags
& TMPF_MPTCP_ACKNOW
) &&
624 !(tp
->t_mpflags
& TMPF_SEND_DSN
) &&
625 !(tp
->t_mpflags
& TMPF_SEND_DFIN
)) {
626 struct mptcp_data_ack64_opt dack_opt
;
627 unsigned int dssoptlen
= 0;
629 dssoptlen
= sizeof (dack_opt
);
633 bzero(&dack_opt
, dssoptlen
);
634 dack_opt
.mdss_copt
.mdss_kind
= TCPOPT_MULTIPATH
;
635 dack_opt
.mdss_copt
.mdss_len
= dssoptlen
;
636 dack_opt
.mdss_copt
.mdss_subtype
= MPO_DSS
;
637 dack_opt
.mdss_copt
.mdss_flags
|= (MDSS_A
| MDSS_a
);
638 dack_opt
.mdss_ack
= mptcp_hton64(mp_tp
->mpt_rcvnxt
);
640 * The other end should retransmit 64-bit DSN until it
641 * receives a 64-bit ACK.
643 mp_tp
->mpt_flags
&= ~MPTCPF_SND_64BITACK
;
644 memcpy(opt
+ optlen
, &dack_opt
, dssoptlen
);
646 VERIFY(optlen
<= MAX_TCPOPTLEN
);
647 tp
->t_mpflags
&= ~TMPF_MPTCP_ACKNOW
;
651 /* 32-bit DSS+Data ACK option */
652 if ((tp
->t_mpflags
& TMPF_SEND_DSN
) &&
655 (tp
->t_mpflags
& TMPF_MPTCP_ACKNOW
)) {
656 struct mptcp_dss_ack_opt dss_ack_opt
;
657 unsigned int dssoptlen
= sizeof (dss_ack_opt
);
665 bzero(&dss_ack_opt
, sizeof (dss_ack_opt
));
666 dss_ack_opt
.mdss_copt
.mdss_kind
= TCPOPT_MULTIPATH
;
667 dss_ack_opt
.mdss_copt
.mdss_len
= dssoptlen
;
668 dss_ack_opt
.mdss_copt
.mdss_subtype
= MPO_DSS
;
669 dss_ack_opt
.mdss_copt
.mdss_flags
|= MDSS_A
| MDSS_M
;
670 dss_ack_opt
.mdss_ack
=
671 htonl(MPTCP_DATAACK_LOW32(mp_tp
->mpt_rcvnxt
));
675 mptcp_output_getm_dsnmap32(so
, off
, &dss_ack_opt
.mdss_dsn
,
676 &dss_ack_opt
.mdss_subflow_seqn
,
677 &dss_ack_opt
.mdss_data_len
,
680 if ((dss_ack_opt
.mdss_data_len
== 0) ||
681 (dss_ack_opt
.mdss_dsn
== 0)) {
685 if (tp
->t_mpflags
& TMPF_SEND_DFIN
) {
689 dss_ack_opt
.mdss_dsn
= htonl(dss_ack_opt
.mdss_dsn
);
690 dss_ack_opt
.mdss_subflow_seqn
=
691 htonl(dss_ack_opt
.mdss_subflow_seqn
);
692 dss_ack_opt
.mdss_data_len
= htons(dss_ack_opt
.mdss_data_len
);
693 memcpy(opt
+ optlen
, &dss_ack_opt
, sizeof (dss_ack_opt
));
695 *((uint16_t *)(void *)(opt
+ optlen
+ sizeof (dss_ack_opt
))) = dss_csum
;
699 if (optlen
> MAX_TCPOPTLEN
)
700 panic("optlen too large");
701 tp
->t_mpflags
&= ~TMPF_MPTCP_ACKNOW
;
705 /* 32-bit DSS + 64-bit DACK option */
706 if ((tp
->t_mpflags
& TMPF_SEND_DSN
) &&
709 (tp
->t_mpflags
& TMPF_MPTCP_ACKNOW
)) {
710 struct mptcp_dss32_ack64_opt dss_ack_opt
;
711 unsigned int dssoptlen
= sizeof (dss_ack_opt
);
719 bzero(&dss_ack_opt
, sizeof (dss_ack_opt
));
720 dss_ack_opt
.mdss_copt
.mdss_kind
= TCPOPT_MULTIPATH
;
721 dss_ack_opt
.mdss_copt
.mdss_len
= dssoptlen
;
722 dss_ack_opt
.mdss_copt
.mdss_subtype
= MPO_DSS
;
723 dss_ack_opt
.mdss_copt
.mdss_flags
|= MDSS_M
| MDSS_A
| MDSS_a
;
724 dss_ack_opt
.mdss_ack
=
725 mptcp_hton64(mp_tp
->mpt_rcvnxt
);
729 mptcp_output_getm_dsnmap32(so
, off
, &dss_ack_opt
.mdss_dsn
,
730 &dss_ack_opt
.mdss_subflow_seqn
,
731 &dss_ack_opt
.mdss_data_len
,
734 if ((dss_ack_opt
.mdss_data_len
== 0) ||
735 (dss_ack_opt
.mdss_dsn
== 0)) {
739 if (tp
->t_mpflags
& TMPF_SEND_DFIN
) {
743 dss_ack_opt
.mdss_dsn
= htonl(dss_ack_opt
.mdss_dsn
);
744 dss_ack_opt
.mdss_subflow_seqn
=
745 htonl(dss_ack_opt
.mdss_subflow_seqn
);
746 dss_ack_opt
.mdss_data_len
= htons(dss_ack_opt
.mdss_data_len
);
747 memcpy(opt
+ optlen
, &dss_ack_opt
, sizeof (dss_ack_opt
));
749 *((uint16_t *)(void *)(opt
+ optlen
+ sizeof (dss_ack_opt
))) = dss_csum
;
753 if (optlen
> MAX_TCPOPTLEN
)
754 panic("optlen too large");
755 tp
->t_mpflags
&= ~TMPF_MPTCP_ACKNOW
;
/*
 * DATA_FIN: a DSS option with MDSS_A | MDSS_M | MDSS_F that maps the single
 * sequence number mpt_sndmax - 1 with a data length of 1 and a subflow
 * sequence number of 0.
 */
759 if (tp
->t_mpflags
& TMPF_SEND_DFIN
) {
760 unsigned int dssoptlen
= sizeof(struct mptcp_dss_ack_opt
);
761 struct mptcp_dss_ack_opt dss_ack_opt
;
765 uint64_t dss_val
= mptcp_hton64(mp_tp
->mpt_sndmax
- 1);
766 uint16_t dlen
= htons(1);
773 sum
= in_pseudo64(dss_val
, sseq
, dlen
);
775 dss_csum
= ~sum
& 0xffff;
780 bzero(&dss_ack_opt
, sizeof (dss_ack_opt
));
783 * Data FIN occupies one sequence space.
784 * Don't send it if it has been Acked.
786 if ((mp_tp
->mpt_sndnxt
+ 1 != mp_tp
->mpt_sndmax
) ||
787 (mp_tp
->mpt_snduna
== mp_tp
->mpt_sndmax
))
790 dss_ack_opt
.mdss_copt
.mdss_kind
= TCPOPT_MULTIPATH
;
791 dss_ack_opt
.mdss_copt
.mdss_len
= dssoptlen
;
792 dss_ack_opt
.mdss_copt
.mdss_subtype
= MPO_DSS
;
793 dss_ack_opt
.mdss_copt
.mdss_flags
|= MDSS_A
| MDSS_M
| MDSS_F
;
794 dss_ack_opt
.mdss_ack
=
795 htonl(MPTCP_DATAACK_LOW32(mp_tp
->mpt_rcvnxt
));
796 dss_ack_opt
.mdss_dsn
=
797 htonl(MPTCP_DATASEQ_LOW32(mp_tp
->mpt_sndmax
- 1));
798 dss_ack_opt
.mdss_subflow_seqn
= 0;
799 dss_ack_opt
.mdss_data_len
= 1;
800 dss_ack_opt
.mdss_data_len
= htons(dss_ack_opt
.mdss_data_len
);
801 memcpy(opt
+ optlen
, &dss_ack_opt
, sizeof (dss_ack_opt
));
803 *((uint16_t *)(void *)(opt
+ optlen
+ sizeof (dss_ack_opt
))) = dss_csum
;
/* Caller asked for an MPTCP-triggered ACK: check whether any signal flag changed. */
809 if (TRUE
== *p_mptcp_acknow
) {
810 VERIFY(old_mpt_flags
!= 0);
811 u_int32_t new_mpt_flags
= tp
->t_mpflags
& TMPF_MPTCP_SIGNALS
;
814 * If none of the above mpflags were acted on by
815 * this routine, reset these flags and set p_mptcp_acknow
818 * XXX The reset value of p_mptcp_acknow can be used
819 * to communicate tcp_output to NOT send a pure ack without any
820 * MPTCP options as it will be treated as a dup ack.
821 * Since the instances of mptcp_setup_opts not acting on
822 * these options are mostly corner cases and sending a dup
823 * ack here would only have an impact if the system
824 * has sent consecutive dup acks before this false one,
825 * we haven't modified the logic in tcp_output to avoid
828 if (old_mpt_flags
== new_mpt_flags
) {
829 tp
->t_mpflags
&= ~TMPF_MPTCP_SIGNALS
;
830 *p_mptcp_acknow
= FALSE
;
831 mptcplog((LOG_DEBUG
, "%s: no action \n", __func__
),
832 MPTCP_SENDER_DBG
, MPTCP_LOGLVL_LOG
);
834 mptcplog((LOG_DEBUG
, "%s: acknow set, old flags %x new flags %x \n",
835 __func__
, old_mpt_flags
, new_mpt_flags
),
836 MPTCP_SENDER_DBG
, MPTCP_LOGLVL_LOG
);
844 * MPTCP Options Input Processing
/*
 * Checks whether an incoming MPTCP option of the given subtype is
 * acceptable for this connection.
 *
 * For the subtypes listed in the switch (JOIN, DSS, FASTCLOSE, FAIL,
 * REMOVE_ADDR, ADD_ADDR, PRIO), the connection state is compared against
 * MPTCPS_ESTABLISHED. Two situations are logged: a missing MPTCP control
 * block ("NULL mpsocket") and a second message that reports the subtype.
 *
 * NOTE(review): the NULL test, the other case labels (including any
 * default) and all return statements are not visible in this listing, so
 * the return value convention cannot be stated from here.
 */
848 mptcp_sanitize_option(struct tcpcb
*tp
, int mptcp_subtype
)
850 struct mptcb
*mp_tp
= tptomptp(tp
);
854 mptcplog((LOG_ERR
, "%s: NULL mpsocket \n", __func__
),
855 MPTCP_SOCKET_DBG
, MPTCP_LOGLVL_ERR
);
859 switch (mptcp_subtype
) {
862 case MPO_JOIN
: /* fall through */
863 case MPO_DSS
: /* fall through */
864 case MPO_FASTCLOSE
: /* fall through */
865 case MPO_FAIL
: /* fall through */
866 case MPO_REMOVE_ADDR
: /* fall through */
867 case MPO_ADD_ADDR
: /* fall through */
868 case MPO_PRIO
: /* fall through */
869 if (mp_tp
->mpt_state
< MPTCPS_ESTABLISHED
)
874 mptcplog((LOG_ERR
, "%s: type = %d \n", __func__
,
876 MPTCP_SOCKET_DBG
, MPTCP_LOGLVL_ERR
);
/*
 * Validates the flags byte of a received MP_CAPABLE option. `cp` is
 * treated as pointing at a struct mptcp_mpcapable_opt_common.
 *
 * Two checks are visible: MPCAP_PROPOSAL_SBIT must be set, and the flags
 * are tested against the mask of the B through G bits.
 *
 * NOTE(review): the return statements are not visible in this listing.
 * The caller treats any result other than 1 as invalid, so presumably 1
 * means valid and 0 invalid -- confirm.
 */
883 mptcp_valid_mpcapable_common_opt(u_char
*cp
)
885 struct mptcp_mpcapable_opt_common
*rsp
=
886 (struct mptcp_mpcapable_opt_common
*)cp
;
888 /* mmco_kind, mmco_len and mmco_subtype are validated before */
890 if (!(rsp
->mmco_flags
& MPCAP_PROPOSAL_SBIT
))
893 if (rsp
->mmco_flags
& (MPCAP_BBIT
| MPCAP_CBIT
| MPCAP_DBIT
|
894 MPCAP_EBIT
| MPCAP_FBIT
| MPCAP_GBIT
))
/*
 * Processes an MP_CAPABLE option received on a SYN/ACK.
 *
 * Steps visible below:
 *   - ignore segments that do not have both SYN and ACK set;
 *   - validate the flags with mptcp_valid_mpcapable_common_opt(), counting
 *     failures in tcpstat.tcps_invalid_mpcap;
 *   - stop if the MPTCP connection is already at or beyond ESTABLISHED
 *     (a retransmitted SYN/ACK);
 *   - require optlen == sizeof (struct mptcp_mpcapable_opt_rsp);
 *   - enable checksumming on the mptcb if the peer's flags ask for it;
 *   - store the peer's key as mpt_remotekey, record the peer's version and
 *     lower mpt_version to it if the peer's is smaller;
 *   - call mptcp_init_remote_parms(), and on success report success to the
 *     heuristic and set TMPF_SND_KEYS | TMPF_MPTCP_TRUE.
 *
 * NOTE(review): the rest of the parameter list (optlen is used but its
 * declaration is not visible), the bodies of the early exits and any
 * fallback handling are missing from this listing.
 */
902 mptcp_do_mpcapable_opt(struct tcpcb
*tp
, u_char
*cp
, struct tcphdr
*th
,
905 struct mptcp_mpcapable_opt_rsp
*rsp
= NULL
;
906 struct mptcb
*mp_tp
= tptomptp(tp
);
908 mpte_lock_assert_held(mp_tp
->mpt_mpte
);
910 /* Only valid on SYN/ACK */
911 if ((th
->th_flags
& (TH_SYN
| TH_ACK
)) != (TH_SYN
| TH_ACK
))
914 /* Validate the kind, len, flags */
915 if (mptcp_valid_mpcapable_common_opt(cp
) != 1) {
916 tcpstat
.tcps_invalid_mpcap
++;
920 /* handle SYN/ACK retransmission by acknowledging with ACK */
921 if (mp_tp
->mpt_state
>= MPTCPS_ESTABLISHED
)
924 /* A SYN/ACK contains peer's key and flags */
925 if (optlen
!= sizeof (struct mptcp_mpcapable_opt_rsp
)) {
927 mptcplog((LOG_ERR
, "%s: SYN_ACK optlen = %d, sizeof mp opt = %lu \n",
929 sizeof (struct mptcp_mpcapable_opt_rsp
)),
930 MPTCP_SOCKET_DBG
, MPTCP_LOGLVL_ERR
);
931 tcpstat
.tcps_invalid_mpcap
++;
936 * If checksum flag is set, enable MPTCP checksum, even if
937 * it was not negotiated on the first SYN.
939 if (((struct mptcp_mpcapable_opt_common
*)cp
)->mmco_flags
&
941 mp_tp
->mpt_flags
|= MPTCPF_CHECKSUM
;
943 rsp
= (struct mptcp_mpcapable_opt_rsp
*)cp
;
/* The peer's "local" key is our remote key. */
944 mp_tp
->mpt_remotekey
= rsp
->mmc_localkey
;
945 /* For now just downgrade to the peer's version */
946 mp_tp
->mpt_peer_version
= rsp
->mmc_common
.mmco_version
;
947 if (rsp
->mmc_common
.mmco_version
< mp_tp
->mpt_version
) {
948 mp_tp
->mpt_version
= rsp
->mmc_common
.mmco_version
;
949 tcpstat
.tcps_mp_verdowngrade
++;
951 if (mptcp_init_remote_parms(mp_tp
) != 0) {
952 tcpstat
.tcps_invalid_mpcap
++;
955 tcp_heuristic_mptcp_success(tp
);
956 tp
->t_mpflags
|= (TMPF_SND_KEYS
| TMPF_MPTCP_TRUE
);
/*
 * Processes an MP_JOIN option received on a SYN/ACK.
 *
 * Steps visible below:
 *   - ignore segments that do not have both SYN and ACK set;
 *   - require optlen == sizeof (struct mptcp_mpjoin_opt_rsp), otherwise
 *     clear TMPF_PREESTABLISHED and take the error path;
 *   - record the peer's address id and random number with
 *     mptcp_set_raddr_rand();
 *   - validate the truncated HMAC with mptcp_validate_join_hmac(), and on
 *     the failure shown below log it, clear TMPF_PREESTABLISHED and take
 *     the error path;
 *   - otherwise set TMPF_SENT_JOIN | TMPF_SND_JACK so the join ACK gets
 *     sent.
 *
 * MPTCP_JOPT_ERROR_PATH marks the subflow TMPF_RESET, increments
 * tcpstat.tcps_invalid_joins and, if the socket exists, raises a MUSTRST
 * socket event.
 *
 * NOTE(review): the declaration of `error`, the `if (error)` test and the
 * return statements are not visible in this listing.
 */
961 mptcp_do_mpjoin_opt(struct tcpcb
*tp
, u_char
*cp
, struct tcphdr
*th
, int optlen
)
963 #define MPTCP_JOPT_ERROR_PATH(tp) { \
964 tp->t_mpflags |= TMPF_RESET; \
965 tcpstat.tcps_invalid_joins++; \
966 if (tp->t_inpcb->inp_socket != NULL) { \
967 soevent(tp->t_inpcb->inp_socket, \
968 SO_FILT_HINT_LOCKED | SO_FILT_HINT_MUSTRST); \
972 struct mptcp_mpjoin_opt_rsp
*join_rsp
=
973 (struct mptcp_mpjoin_opt_rsp
*)cp
;
975 /* Only valid on SYN/ACK */
976 if ((th
->th_flags
& (TH_SYN
| TH_ACK
)) != (TH_SYN
| TH_ACK
))
979 if (optlen
!= sizeof (struct mptcp_mpjoin_opt_rsp
)) {
980 mptcplog((LOG_ERR
, "%s: SYN_ACK: unexpected optlen = %d mp "
981 "option = %lu\n", __func__
, optlen
,
982 sizeof (struct mptcp_mpjoin_opt_rsp
)),
983 MPTCP_SOCKET_DBG
, MPTCP_LOGLVL_ERR
);
984 tp
->t_mpflags
&= ~TMPF_PREESTABLISHED
;
985 /* send RST and close */
986 MPTCP_JOPT_ERROR_PATH(tp
);
990 mptcp_set_raddr_rand(tp
->t_local_aid
, tptomptp(tp
),
991 join_rsp
->mmjo_addr_id
, join_rsp
->mmjo_rand
);
992 error
= mptcp_validate_join_hmac(tp
,
993 (u_char
*)&join_rsp
->mmjo_mac
, SHA1_TRUNCATED
);
995 mptcplog((LOG_ERR
, "%s: SYN_ACK error = %d \n", __func__
, error
),
996 MPTCP_SOCKET_DBG
, MPTCP_LOGLVL_ERR
);
997 tp
->t_mpflags
&= ~TMPF_PREESTABLISHED
;
998 /* send RST and close */
999 MPTCP_JOPT_ERROR_PATH(tp
);
1002 tp
->t_mpflags
|= (TMPF_SENT_JOIN
| TMPF_SND_JACK
);
/*
 * Verifies the HMAC received in an MP_JOIN SYN/ACK.
 *
 *   tp      - subflow tcpcb; supplies the local address id and the mptcb.
 *   hmac    - HMAC bytes taken from the received option.
 *   mac_len - number of leading bytes of the digest to compare.
 *
 * The local and remote random numbers are fetched with mptcp_get_rands(),
 * and a zero value for either one is checked for. A digest is then
 * computed by mptcp_hmac_sha1() from (remote key, local key, remote rand,
 * local rand) and its first mac_len bytes are compared to `hmac` with
 * bcmp().
 *
 * Returns 0 when the digests match.
 *
 * NOTE(review): the non-zero return values for the failure paths are not
 * visible in this listing. On mismatch the function prints both keys and
 * both random numbers via printf -- consider whether logging key material
 * is acceptable.
 */
1006 mptcp_validate_join_hmac(struct tcpcb
*tp
, u_char
* hmac
, int mac_len
)
1008 u_char digest
[SHA1_RESULTLEN
] = {0};
1009 struct mptcb
*mp_tp
= tptomptp(tp
);
1010 u_int32_t rem_rand
, loc_rand
;
1012 mpte_lock_assert_held(mp_tp
->mpt_mpte
);
1014 rem_rand
= loc_rand
= 0;
1016 mptcp_get_rands(tp
->t_local_aid
, mp_tp
, &loc_rand
, &rem_rand
);
1017 if ((rem_rand
== 0) || (loc_rand
== 0))
1020 mptcp_hmac_sha1(mp_tp
->mpt_remotekey
, mp_tp
->mpt_localkey
, rem_rand
, loc_rand
,
1023 if (bcmp(digest
, hmac
, mac_len
) == 0)
1024 return (0); /* matches */
1026 printf("%s: remote key %llx local key %llx remote rand %x "
1027 "local rand %x \n", __func__
, mp_tp
->mpt_remotekey
, mp_tp
->mpt_localkey
,
1028 rem_rand
, loc_rand
);
1034 * Update the mptcb send state variables, but the actual sbdrop occurs
/*
 * Applies a received (already 64-bit extended) Data ACK to the MPTCP send
 * state.
 *
 *   mp_tp     - MPTCP control block being updated.
 *   tp        - subflow tcpcb on which the Data ACK arrived.
 *   full_dack - 64-bit Data ACK value.
 *
 * acked = full_dack - mpt_snduna. When that exceeds the bytes held in the
 * MPTCP socket's send buffer (sb_cc), the whole buffer is dropped, with an
 * error logged if the excess is more than one byte or the state is before
 * FIN_WAIT_1. The other sbdrop() call below drops exactly `acked` bytes.
 * mpt_snduna is then advanced by `acked`.
 *
 * In fallback mode, the first Data ACK that leaves mpt_sndnxt ahead of
 * mpt_snduna rewinds mpt_sndnxt to mpt_dsn_at_csum_fail and marks the
 * post-fallback sync on both the mptcb and the subflow socket.
 *
 * Finally the reinject queue is cleaned, and a Data ACK equal to
 * mpt_sndmax in FIN_WAIT_1 or later advances the close state machine and
 * clears TMPF_SEND_DFIN.
 *
 * NOTE(review): the `else` joining the two sbdrop() calls and other
 * braces are not visible in this listing.
 */
1038 mptcp_data_ack_rcvd(struct mptcb
*mp_tp
, struct tcpcb
*tp
, u_int64_t full_dack
)
1040 u_int64_t acked
= full_dack
- mp_tp
->mpt_snduna
;
1043 struct socket
*mp_so
= mptetoso(mp_tp
->mpt_mpte
);
1045 if (acked
> mp_so
->so_snd
.sb_cc
) {
1046 if (acked
> mp_so
->so_snd
.sb_cc
+ 1 ||
1047 mp_tp
->mpt_state
< MPTCPS_FIN_WAIT_1
)
1048 mptcplog((LOG_ERR
, "%s: acked %u, sb_cc %u full %u suna %u state %u\n",
1049 __func__
, (uint32_t)acked
, mp_so
->so_snd
.sb_cc
,
1050 (uint32_t)full_dack
, (uint32_t)mp_tp
->mpt_snduna
,
1052 MPTCP_RECEIVER_DBG
, MPTCP_LOGLVL_ERR
);
1054 sbdrop(&mp_so
->so_snd
, (int)mp_so
->so_snd
.sb_cc
);
1056 sbdrop(&mp_so
->so_snd
, acked
);
1059 mp_tp
->mpt_snduna
+= acked
;
1060 /* In degraded mode, we may get some Data ACKs */
1061 if ((tp
->t_mpflags
& TMPF_TCP_FALLBACK
) &&
1062 !(mp_tp
->mpt_flags
& MPTCPF_POST_FALLBACK_SYNC
) &&
1063 MPTCP_SEQ_GT(mp_tp
->mpt_sndnxt
, mp_tp
->mpt_snduna
)) {
1064 /* bring back sndnxt to retransmit MPTCP data */
1065 mp_tp
->mpt_sndnxt
= mp_tp
->mpt_dsn_at_csum_fail
;
1066 mp_tp
->mpt_flags
|= MPTCPF_POST_FALLBACK_SYNC
;
1067 tp
->t_inpcb
->inp_socket
->so_flags1
|=
1068 SOF1_POST_FALLBACK_SYNC
;
1071 mptcp_clean_reinjectq(mp_tp
->mpt_mpte
);
1075 if (full_dack
== mp_tp
->mpt_sndmax
&&
1076 mp_tp
->mpt_state
>= MPTCPS_FIN_WAIT_1
) {
1077 mptcp_close_fsm(mp_tp
, MPCE_RECV_DATA_ACK
);
1078 tp
->t_mpflags
&= ~TMPF_SEND_DFIN
;
/*
 * Copies the subflow's TCP send window into the MPTCP control block for a
 * connection that has fallen back to TCP (MPTCPF_FALLBACK_TO_TCP is tested
 * first). mpt_sndwnd is set to tp->snd_wnd, mpt_sndwl1 to mpt_rcvnxt and
 * mpt_sndwl2 to mpt_snduna, and sowwakeup() is then called on the
 * subflow's socket.
 *
 * NOTE(review): the statement under the flag test (presumably an early
 * return when the flag is not set) is not visible in this listing.
 */
1083 mptcp_update_window_fallback(struct tcpcb
*tp
)
1085 struct mptcb
*mp_tp
= tptomptp(tp
);
1087 mpte_lock_assert_held(mp_tp
->mpt_mpte
);
1089 if (!(mp_tp
->mpt_flags
& MPTCPF_FALLBACK_TO_TCP
))
1092 mptcplog((LOG_DEBUG
, "%s: update window to %u\n", __func__
, tp
->snd_wnd
),
1093 MPTCP_SOCKET_DBG
, MPTCP_LOGLVL_VERBOSE
);
1095 mp_tp
->mpt_sndwnd
= tp
->snd_wnd
;
1096 mp_tp
->mpt_sndwl1
= mp_tp
->mpt_rcvnxt
;
1097 mp_tp
->mpt_sndwl2
= mp_tp
->mpt_snduna
;
1099 sowwakeup(tp
->t_inpcb
->inp_socket
);
/*
 * Updates the MPTCP-level send window from a received segment.
 *
 * The window is taken (mpt_sndwnd = tiwin, mpt_sndwl1 = seq,
 * mpt_sndwl2 = ack) when one of these holds:
 *   - the recorded mpt_sndwl1 is older than `seq`;
 *   - it equals `seq` and the recorded mpt_sndwl2 is older than `ack`;
 *   - both are equal and `tiwin` is larger than the current window.
 *
 * NOTE(review): the remainder of the parameter list (tiwin is used but
 * its declaration is not visible) and the lines after the log call are
 * missing from this listing.
 */
1103 mptcp_update_window(struct mptcb
*mp_tp
, u_int64_t ack
, u_int64_t seq
,
1106 /* Don't look at the window if there is no ACK flag */
1107 if ((SEQ_LT(mp_tp
->mpt_sndwl1
, seq
) ||
1108 (mp_tp
->mpt_sndwl1
== seq
&& (SEQ_LT(mp_tp
->mpt_sndwl2
, ack
) ||
1109 (mp_tp
->mpt_sndwl2
== ack
&& tiwin
> mp_tp
->mpt_sndwnd
))))) {
1110 mp_tp
->mpt_sndwnd
= tiwin
;
1111 mp_tp
->mpt_sndwl1
= seq
;
1112 mp_tp
->mpt_sndwl2
= ack
;
1114 mptcplog((LOG_DEBUG
, "%s: Updating window to %u\n", __func__
,
1115 mp_tp
->mpt_sndwnd
), MPTCP_RECEIVER_DBG
, MPTCP_LOGLVL_VERBOSE
);
/*
 * Handles the Data ACK part of a received DSS option.
 *
 *   full_dack - 64-bit Data ACK.
 *   full_dsn  - 64-bit data sequence number, passed on to the window
 *               update.
 *   tp        - subflow tcpcb.
 *   tiwin     - advertised window, passed on to the window update.
 *
 * TMPF_RCVD_DACK is always set. A Data ACK inside [mpt_snduna, mpt_sndmax]
 * is applied with mptcp_data_ack_rcvd(); a pending 64-bit-ACK indication
 * then clears MPTCPF_RCVD_64BITACK and MPTCPF_SND_64BITDSN. An
 * out-of-range Data ACK is logged as unexpected. The MPTCP send window is
 * updated through mptcp_update_window().
 *
 * NOTE(review): the assignment to close_notify, the conditions around
 * mptcp_notify_mpready() / mptcp_notify_close() and the `else` before the
 * error log are not visible in this listing.
 */
1120 mptcp_do_dss_opt_ack_meat(u_int64_t full_dack
, u_int64_t full_dsn
,
1121 struct tcpcb
*tp
, u_int32_t tiwin
)
1123 struct mptcb
*mp_tp
= tptomptp(tp
);
1124 int close_notify
= 0;
1126 tp
->t_mpflags
|= TMPF_RCVD_DACK
;
1128 if (MPTCP_SEQ_LEQ(full_dack
, mp_tp
->mpt_sndmax
) &&
1129 MPTCP_SEQ_GEQ(full_dack
, mp_tp
->mpt_snduna
)) {
1130 mptcp_data_ack_rcvd(mp_tp
, tp
, full_dack
);
1131 if (mp_tp
->mpt_state
> MPTCPS_FIN_WAIT_2
)
1133 if (mp_tp
->mpt_flags
& MPTCPF_RCVD_64BITACK
) {
1134 mp_tp
->mpt_flags
&= ~MPTCPF_RCVD_64BITACK
;
1135 mp_tp
->mpt_flags
&= ~MPTCPF_SND_64BITDSN
;
1137 mptcp_notify_mpready(tp
->t_inpcb
->inp_socket
);
1139 mptcp_notify_close(tp
->t_inpcb
->inp_socket
);
1141 mptcplog((LOG_ERR
,"%s: unexpected dack %u snduna %u sndmax %u\n", __func__
,
1142 (u_int32_t
)full_dack
, (u_int32_t
)mp_tp
->mpt_snduna
,
1143 (u_int32_t
)mp_tp
->mpt_sndmax
),
1144 (MPTCP_SOCKET_DBG
|MPTCP_RECEIVER_DBG
),
1148 mptcp_update_window(mp_tp
, full_dack
, full_dsn
, tiwin
);
/*
 * mptcp_do_dss_opt_meat: decode one received DSS option and act on it.
 *
 * cp - start of the option; it is reinterpreted as the option layout
 *      that matches the flag combination found in mdss_flags
 * tp - subflow TCP control block
 * th - TCP header of the segment; th_win shifted by tp->snd_scale is
 *      the window (tiwin) passed along with every Data ACK
 *
 * mdss_flags is masked in place down to MDSS_A, MDSS_a, MDSS_M and
 * MDSS_m and then switched on. Every case first validates the option
 * length with MPTCP_DSS_OPT_SZ_CHK. Cases that carry a Data ACK call
 * mptcp_do_dss_opt_ack_meat(); cases that carry a mapping call
 * mptcp_update_dss_rcv_state() or mptcp_update_rcv_state_meat().
 * 32-bit values are widened to 64 bits with MPTCP_EXTEND_DSN, 64-bit
 * values are converted with mptcp_ntoh64().
 *
 * NOTE(review): the embedded line numbers in this listing skip, so
 * several source lines (for example the declarations of csum_len,
 * csum and full_dsn, some case labels, and the braces) are not
 * visible here. Confirm details against the complete file.
 */
1152 mptcp_do_dss_opt_meat(u_char
*cp
, struct tcpcb
*tp
, struct tcphdr
*th
)
1154 struct mptcp_dss_copt
*dss_rsp
= (struct mptcp_dss_copt
*)cp
;
1155 u_int64_t full_dack
= 0;
1156 u_int32_t tiwin
= th
->th_win
<< tp
->snd_scale
;
1157 struct mptcb
*mp_tp
= tptomptp(tp
);
/*
 * Length check used by every case below: logs the length and the DSS
 * flags when len differs from expected_len. The rest of the macro is
 * not visible in this listing.
 */
1160 #define MPTCP_DSS_OPT_SZ_CHK(len, expected_len) { \
1161 if (len != expected_len) { \
1162 mptcplog((LOG_ERR, "%s: bad len = %d dss: %x \n", __func__, \
1163 len, dss_rsp->mdss_flags), \
1164 (MPTCP_SOCKET_DBG|MPTCP_RECEIVER_DBG), \
1165 MPTCP_LOGLVL_LOG); \
1170 if (mp_tp
->mpt_flags
& MPTCPF_CHECKSUM
)
/* Keep only the A, a, M and m bits; this modifies the option in place. */
1173 dss_rsp
->mdss_flags
&= (MDSS_A
|MDSS_a
|MDSS_M
|MDSS_m
);
1174 switch (dss_rsp
->mdss_flags
) {
1177 /* 32-bit DSS, No Data ACK */
1178 struct mptcp_dsn_opt
*dss_rsp1
;
1179 dss_rsp1
= (struct mptcp_dsn_opt
*)cp
;
1181 MPTCP_DSS_OPT_SZ_CHK(dss_rsp1
->mdss_copt
.mdss_len
,
1182 sizeof (struct mptcp_dsn_opt
) + csum_len
);
1184 mptcp_update_dss_rcv_state(dss_rsp1
, tp
, 0);
/* Variant that passes the 16-bit value stored in the last csum_len bytes of the option. */
1186 mptcp_update_dss_rcv_state(dss_rsp1
, tp
,
1187 *(uint16_t *)(void *)(cp
+
1188 (dss_rsp1
->mdss_copt
.mdss_len
- csum_len
)));
1193 /* 32-bit Data ACK, no DSS */
1194 struct mptcp_data_ack_opt
*dack_opt
;
1195 dack_opt
= (struct mptcp_data_ack_opt
*)cp
;
1197 MPTCP_DSS_OPT_SZ_CHK(dack_opt
->mdss_copt
.mdss_len
,
1198 sizeof (struct mptcp_data_ack_opt
));
1200 u_int32_t dack
= dack_opt
->mdss_ack
;
1202 MPTCP_EXTEND_DSN(mp_tp
->mpt_snduna
, dack
, full_dack
);
/* No mapping in this option: the current mpt_sndwl1 is passed in the full_dsn position. */
1203 mptcp_do_dss_opt_ack_meat(full_dack
, mp_tp
->mpt_sndwl1
, tp
, tiwin
);
1206 case (MDSS_M
| MDSS_A
):
1208 /* 32-bit Data ACK + 32-bit DSS */
1209 struct mptcp_dss_ack_opt
*dss_ack_rsp
;
1210 dss_ack_rsp
= (struct mptcp_dss_ack_opt
*)cp
;
1214 MPTCP_DSS_OPT_SZ_CHK(dss_ack_rsp
->mdss_copt
.mdss_len
,
1215 sizeof (struct mptcp_dss_ack_opt
) + csum_len
);
1217 u_int32_t dack
= dss_ack_rsp
->mdss_ack
;
1219 MPTCP_EXTEND_DSN(mp_tp
->mpt_snduna
, dack
, full_dack
);
1221 NTOHL(dss_ack_rsp
->mdss_dsn
);
1222 NTOHL(dss_ack_rsp
->mdss_subflow_seqn
);
1223 NTOHS(dss_ack_rsp
->mdss_data_len
);
1224 MPTCP_EXTEND_DSN(mp_tp
->mpt_rcvnxt
, dss_ack_rsp
->mdss_dsn
, full_dsn
);
1226 mptcp_do_dss_opt_ack_meat(full_dack
, full_dsn
, tp
, tiwin
);
1229 csum
= *(uint16_t *)(void *)(cp
+ (dss_ack_rsp
->mdss_copt
.mdss_len
- csum_len
));
1231 mptcp_update_rcv_state_meat(mp_tp
, tp
,
1233 dss_ack_rsp
->mdss_subflow_seqn
,
1234 dss_ack_rsp
->mdss_data_len
,
1238 case (MDSS_M
| MDSS_m
):
1240 /* 64-bit DSS , No Data ACK */
1241 struct mptcp_dsn64_opt
*dsn64
;
1242 dsn64
= (struct mptcp_dsn64_opt
*)cp
;
1246 MPTCP_DSS_OPT_SZ_CHK(dsn64
->mdss_copt
.mdss_len
,
1247 sizeof (struct mptcp_dsn64_opt
) + csum_len
);
1249 mp_tp
->mpt_flags
|= MPTCPF_SND_64BITACK
;
1251 full_dsn
= mptcp_ntoh64(dsn64
->mdss_dsn
);
1252 NTOHL(dsn64
->mdss_subflow_seqn
);
1253 NTOHS(dsn64
->mdss_data_len
);
1256 csum
= *(uint16_t *)(void *)(cp
+ dsn64
->mdss_copt
.mdss_len
- csum_len
);
1258 mptcp_update_rcv_state_meat(mp_tp
, tp
, full_dsn
,
1259 dsn64
->mdss_subflow_seqn
,
1260 dsn64
->mdss_data_len
,
1264 case (MDSS_A
| MDSS_a
):
1266 /* 64-bit Data ACK, no DSS */
1267 struct mptcp_data_ack64_opt
*dack64
;
1268 dack64
= (struct mptcp_data_ack64_opt
*)cp
;
1270 MPTCP_DSS_OPT_SZ_CHK(dack64
->mdss_copt
.mdss_len
,
1271 sizeof (struct mptcp_data_ack64_opt
));
1273 mp_tp
->mpt_flags
|= MPTCPF_RCVD_64BITACK
;
1275 full_dack
= mptcp_ntoh64(dack64
->mdss_ack
);
/* No mapping in this option: the current mpt_sndwl1 is passed in the full_dsn position. */
1276 mptcp_do_dss_opt_ack_meat(full_dack
, mp_tp
->mpt_sndwl1
, tp
, tiwin
);
1279 case (MDSS_M
| MDSS_m
| MDSS_A
):
1281 /* 64-bit DSS + 32-bit Data ACK */
1282 struct mptcp_dss64_ack32_opt
*dss_ack_rsp
;
1283 dss_ack_rsp
= (struct mptcp_dss64_ack32_opt
*)cp
;
1287 MPTCP_DSS_OPT_SZ_CHK(dss_ack_rsp
->mdss_copt
.mdss_len
,
1288 sizeof (struct mptcp_dss64_ack32_opt
) + csum_len
);
1290 u_int32_t dack
= dss_ack_rsp
->mdss_ack
;
1292 mp_tp
->mpt_flags
|= MPTCPF_SND_64BITACK
;
1293 MPTCP_EXTEND_DSN(mp_tp
->mpt_snduna
, dack
, full_dack
);
1295 full_dsn
= mptcp_ntoh64(dss_ack_rsp
->mdss_dsn
);
1296 NTOHL(dss_ack_rsp
->mdss_subflow_seqn
);
1297 NTOHS(dss_ack_rsp
->mdss_data_len
);
1299 mptcp_do_dss_opt_ack_meat(full_dack
, full_dsn
, tp
, tiwin
);
1302 csum
= *(uint16_t *)(void *)(cp
+ dss_ack_rsp
->mdss_copt
.mdss_len
- csum_len
);
1304 mptcp_update_rcv_state_meat(mp_tp
, tp
, full_dsn
,
1305 dss_ack_rsp
->mdss_subflow_seqn
,
1306 dss_ack_rsp
->mdss_data_len
,
1311 case (MDSS_M
| MDSS_A
| MDSS_a
):
1313 /* 32-bit DSS + 64-bit Data ACK */
1314 struct mptcp_dss32_ack64_opt
*dss32_ack64_opt
;
1315 dss32_ack64_opt
= (struct mptcp_dss32_ack64_opt
*)cp
;
1318 MPTCP_DSS_OPT_SZ_CHK(
1319 dss32_ack64_opt
->mdss_copt
.mdss_len
,
1320 sizeof (struct mptcp_dss32_ack64_opt
) + csum_len
);
1322 full_dack
= mptcp_ntoh64(dss32_ack64_opt
->mdss_ack
);
1323 NTOHL(dss32_ack64_opt
->mdss_dsn
);
1324 mp_tp
->mpt_flags
|= MPTCPF_RCVD_64BITACK
;
1325 MPTCP_EXTEND_DSN(mp_tp
->mpt_rcvnxt
,
1326 dss32_ack64_opt
->mdss_dsn
, full_dsn
);
1327 NTOHL(dss32_ack64_opt
->mdss_subflow_seqn
);
1328 NTOHS(dss32_ack64_opt
->mdss_data_len
);
1330 mptcp_do_dss_opt_ack_meat(full_dack
, full_dsn
, tp
, tiwin
);
1332 mptcp_update_rcv_state_meat(mp_tp
, tp
, full_dsn
,
1333 dss32_ack64_opt
->mdss_subflow_seqn
,
1334 dss32_ack64_opt
->mdss_data_len
, 0);
1336 mptcp_update_rcv_state_meat(mp_tp
, tp
, full_dsn
,
1337 dss32_ack64_opt
->mdss_subflow_seqn
,
1338 dss32_ack64_opt
->mdss_data_len
,
1339 *(uint16_t *)(void *)(cp
+
1340 dss32_ack64_opt
->mdss_copt
.mdss_len
-
1344 case (MDSS_M
| MDSS_m
| MDSS_A
| MDSS_a
):
1346 /* 64-bit DSS + 64-bit Data ACK */
1347 struct mptcp_dss64_ack64_opt
*dss64_ack64
;
1348 dss64_ack64
= (struct mptcp_dss64_ack64_opt
*)cp
;
1351 MPTCP_DSS_OPT_SZ_CHK(dss64_ack64
->mdss_copt
.mdss_len
,
1352 sizeof (struct mptcp_dss64_ack64_opt
) + csum_len
);
1354 mp_tp
->mpt_flags
|= MPTCPF_RCVD_64BITACK
;
1355 mp_tp
->mpt_flags
|= MPTCPF_SND_64BITACK
;
1356 full_dsn
= mptcp_ntoh64(dss64_ack64
->mdss_dsn
);
/*
 * The Data ACK must come from the ACK field. This line used to read
 * mdss_dsn, which made full_dack a copy of full_dsn and so fed the
 * peer DSN into the ACK range check of mptcp_do_dss_opt_ack_meat().
 * All other ACK-carrying cases above read mdss_ack.
 */
1357 full_dack
= mptcp_ntoh64(dss64_ack64
->mdss_ack
);
1358 mptcp_do_dss_opt_ack_meat(full_dack
, full_dsn
, tp
, tiwin
);
1359 NTOHL(dss64_ack64
->mdss_subflow_seqn
);
1360 NTOHS(dss64_ack64
->mdss_data_len
);
1362 mptcp_update_rcv_state_meat(mp_tp
, tp
, full_dsn
,
1363 dss64_ack64
->mdss_subflow_seqn
,
1364 dss64_ack64
->mdss_data_len
, 0);
1366 mptcp_update_rcv_state_meat(mp_tp
, tp
, full_dsn
,
1367 dss64_ack64
->mdss_subflow_seqn
,
1368 dss64_ack64
->mdss_data_len
,
1369 *(uint16_t *)(void *)(cp
+
1370 dss64_ack64
->mdss_copt
.mdss_len
-
/* Log for a flag combination not handled above; presumably the default case (label not visible). */
1375 mptcplog((LOG_DEBUG
,"%s: File bug, DSS flags = %x\n",
1376 __func__
, dss_rsp
->mdss_flags
),
1377 (MPTCP_SOCKET_DBG
|MPTCP_RECEIVER_DBG
),
/*
 * mptcp_do_dss_opt: entry point for a received DSS option.
 *
 * tp     - subflow TCP control block
 * cp     - start of the option
 * th     - TCP header of the segment, forwarded to
 *          mptcp_do_dss_opt_meat()
 * optlen - unused (see the pragma below)
 *
 * The option is looked at only when the subflow has TMPF_MPTCP_TRUE or
 * TMPF_TCP_FALLBACK set. For subtype MPO_DSS, the MDSS_F flag sets
 * t_rcv_map.mpt_dfin and the option is handed to
 * mptcp_do_dss_opt_meat().
 *
 * NOTE(review): some lines of this function are not visible in this
 * listing (the embedded line numbers skip), including whatever is
 * done with mp_tp after it is looked up and the closing braces, so
 * the exact nesting of the hand-off call should be confirmed against
 * the complete file.
 */
1384 mptcp_do_dss_opt(struct tcpcb
*tp
, u_char
*cp
, struct tcphdr
*th
, int optlen
)
1386 #pragma unused(optlen)
1387 struct mptcb
*mp_tp
= tptomptp(tp
);
1392 /* We may get Data ACKs just during fallback, so don't ignore those */
1393 if ((tp
->t_mpflags
& TMPF_MPTCP_TRUE
) ||
1394 (tp
->t_mpflags
& TMPF_TCP_FALLBACK
)) {
1395 struct mptcp_dss_copt
*dss_rsp
= (struct mptcp_dss_copt
*)cp
;
1397 if (dss_rsp
->mdss_subtype
== MPO_DSS
) {
/* MDSS_F set in the option: record it in the receive map. */
1398 if (dss_rsp
->mdss_flags
& MDSS_F
)
1399 tp
->t_rcv_map
.mpt_dfin
= 1;
1401 mptcp_do_dss_opt_meat(cp
, tp
, th
);
/*
 * mptcp_do_fastclose_opt: handle a received fastclose option.
 *
 * tp - subflow TCP control block
 * cp - start of the option, read as struct mptcp_fastclose_opt
 * th - TCP header of the segment
 *
 * Checks performed, in order: th_flags against TH_ACK, mfast_len
 * against the size of the option structure, mfast_key against
 * mpt_localkey, and th_seq against rcv_nxt. The last three bump
 * tcpstat.tcps_invalid_opt on mismatch. After the checks the subflow
 * is flagged TMPF_RESET and TMPF_FASTCLOSERCV and, when the socket
 * pointer is non-NULL, a SO_FILT_HINT_MUSTRST event is posted.
 *
 * NOTE(review): the statements that follow each failed check (most
 * likely early returns) and the delimiters of the block comment about
 * attacks are not visible in this listing; confirm against the
 * complete file.
 */
1407 mptcp_do_fastclose_opt(struct tcpcb
*tp
, u_char
*cp
, struct tcphdr
*th
)
1409 struct mptcb
*mp_tp
= NULL
;
1410 struct mptcp_fastclose_opt
*fc_opt
= (struct mptcp_fastclose_opt
*)cp
;
/* Exact comparison: th_flags must equal TH_ACK with no other bit set. */
1412 if (th
->th_flags
!= TH_ACK
)
1415 if (fc_opt
->mfast_len
!= sizeof (struct mptcp_fastclose_opt
)) {
1416 tcpstat
.tcps_invalid_opt
++;
1420 mp_tp
= tptomptp(tp
);
/* The key carried in the option has to match the local key. */
1424 if (fc_opt
->mfast_key
!= mp_tp
->mpt_localkey
) {
1425 tcpstat
.tcps_invalid_opt
++;
1430 * fastclose could make us more vulnerable to attacks, hence
1431 * accept only those that are at the next expected sequence number.
1433 if (th
->th_seq
!= tp
->rcv_nxt
) {
1434 tcpstat
.tcps_invalid_opt
++;
1438 /* Reset this flow */
1439 tp
->t_mpflags
|= (TMPF_RESET
| TMPF_FASTCLOSERCV
);
1441 if (tp
->t_inpcb
->inp_socket
!= NULL
) {
1442 soevent(tp
->t_inpcb
->inp_socket
,
1443 SO_FILT_HINT_LOCKED
| SO_FILT_HINT_MUSTRST
);
/*
 * mptcp_do_mpfail_opt: handle a received MP_FAIL option.
 *
 * tp - subflow TCP control block
 * cp - start of the option, read as struct mptcp_mpfail_opt
 * th - TCP header of the segment
 *
 * Checks performed, in order: th_seq against rcv_nxt (bumps
 * tcpstat.tcps_invalid_opt on mismatch), th_flags against TH_ACK and
 * TH_RST, and mfail_len against the size of the option structure.
 * Then MPTCPF_RECVD_MPFAIL is set, the DSN from the option is stored
 * in mpt_dsn_at_csum_fail, mptcp_get_map_for_dsn() is asked for the
 * matching subflow sequence number, which is stored in
 * mpt_ssn_at_csum_fail, and mptcp_notify_mpfail() is called.
 *
 * NOTE(review): the statements that follow each failed check, the
 * declaration of error and any test of it are not visible in this
 * listing; confirm against the complete file.
 */
1449 mptcp_do_mpfail_opt(struct tcpcb
*tp
, u_char
*cp
, struct tcphdr
*th
)
1451 struct mptcb
*mp_tp
= NULL
;
1452 struct mptcp_mpfail_opt
*fail_opt
= (struct mptcp_mpfail_opt
*)cp
;
1453 u_int32_t mdss_subflow_seqn
= 0;
1457 * mpfail could make us more vulnerable to attacks. Hence accept
1458 * only those that are the next expected sequence number.
1460 if (th
->th_seq
!= tp
->rcv_nxt
) {
1461 tcpstat
.tcps_invalid_opt
++;
1465 /* A packet without RST, must at least have the ACK bit set */
1466 if ((th
->th_flags
!= TH_ACK
) && (th
->th_flags
!= TH_RST
))
1469 if (fail_opt
->mfail_len
!= sizeof (struct mptcp_mpfail_opt
))
1472 mp_tp
= tptomptp(tp
);
1474 mp_tp
->mpt_flags
|= MPTCPF_RECVD_MPFAIL
;
/*
 * NOTE(review): a received value is converted with mptcp_hton64 here,
 * while the DSS parsing code in this file uses mptcp_ntoh64 for
 * received 64-bit fields. Presumably both perform the same byte
 * swap; confirm and consider mptcp_ntoh64 for consistency.
 */
1475 mp_tp
->mpt_dsn_at_csum_fail
= mptcp_hton64(fail_opt
->mfail_dsn
);
1476 error
= mptcp_get_map_for_dsn(tp
->t_inpcb
->inp_socket
,
1477 mp_tp
->mpt_dsn_at_csum_fail
, &mdss_subflow_seqn
);
1479 mp_tp
->mpt_ssn_at_csum_fail
= mdss_subflow_seqn
;
1482 mptcp_notify_mpfail(tp
->t_inpcb
->inp_socket
);
/*
 * tcp_do_mptcp_options: dispatch one received MPTCP option to its
 * handler.
 *
 * tp     - subflow TCP control block
 * cp     - start of the option; the subtype is the upper four bits of
 *          cp[2]
 * th     - TCP header of the segment, forwarded to the handlers
 * to     - TCP option summary; TOF_MPTCP is set in to_flags
 * optlen - option length, forwarded to the MP_CAPABLE, MP_JOIN and
 *          DSS handlers
 *
 * Asserts that the lock of mp_tp->mpt_mpte is held, runs
 * mptcp_sanitize_option() on the subtype, and then switches on the
 * subtype.
 *
 * NOTE(review): the case labels of the handler calls, the length test
 * announced by the comment about 4 bytes, and the action taken when
 * mptcp_sanitize_option() returns 0 are not visible in this listing;
 * confirm against the complete file.
 */
1486 tcp_do_mptcp_options(struct tcpcb
*tp
, u_char
*cp
, struct tcphdr
*th
,
1487 struct tcpopt
*to
, int optlen
)
1490 struct mptcb
*mp_tp
= tptomptp(tp
);
1495 mpte_lock_assert_held(mp_tp
->mpt_mpte
);
1497 /* All MPTCP options have at least 4 bytes */
/* Subtype: upper nibble of the third option byte. */
1501 mptcp_subtype
= (cp
[2] >> 4);
1503 if (mptcp_sanitize_option(tp
, mptcp_subtype
) == 0)
1506 switch (mptcp_subtype
) {
1508 mptcp_do_mpcapable_opt(tp
, cp
, th
, optlen
);
1511 mptcp_do_mpjoin_opt(tp
, cp
, th
, optlen
);
1514 mptcp_do_dss_opt(tp
, cp
, th
, optlen
);
1517 mptcp_do_fastclose_opt(tp
, cp
, th
);
1520 mptcp_do_mpfail_opt(tp
, cp
, th
);
/* No handler call is visible for these two subtypes. */
1522 case MPO_ADD_ADDR
: /* fall through */
1523 case MPO_REMOVE_ADDR
: /* fall through */
1525 to
->to_flags
|= TOF_MPTCP
;
1533 /* REMOVE_ADDR option is sent when a source address goes away */
/*
 * mptcp_send_remaddr_opt: fill in a REMOVE_ADDR option.
 *
 * tp  - subflow TCP control block; t_rem_aid supplies the address id
 *       and TMPF_SND_REM_ADDR is cleared in t_mpflags
 * opt - caller-provided option structure; it is zeroed and then
 *       populated with kind TCPOPT_MULTIPATH, its own size as length,
 *       subtype MPO_REMOVE_ADDR and the address id
 *
 * The local and remove address ids are logged before the option is
 * built.
 */
1535 mptcp_send_remaddr_opt(struct tcpcb
*tp
, struct mptcp_remaddr_opt
*opt
)
1537 mptcplog((LOG_DEBUG
,"%s: local id %d remove id %d \n",
1538 __func__
, tp
->t_local_aid
, tp
->t_rem_aid
),
1539 (MPTCP_SOCKET_DBG
|MPTCP_SENDER_DBG
), MPTCP_LOGLVL_LOG
);
/* Start from an all-zero option so fields not set below stay zero. */
1541 bzero(opt
, sizeof (*opt
));
1542 opt
->mr_kind
= TCPOPT_MULTIPATH
;
1543 opt
->mr_len
= sizeof (*opt
);
1544 opt
->mr_subtype
= MPO_REMOVE_ADDR
;
1545 opt
->mr_addr_id
= tp
->t_rem_aid
;
/* The pending-send flag is cleared once the option has been filled in. */
1546 tp
->t_mpflags
&= ~TMPF_SND_REM_ADDR
;
1549 /* We send MP_PRIO option based on the values set by the SIOCSCONNORDER ioctl */
/*
 * mptcp_snd_mpprio: append an MP_PRIO option to the option buffer.
 *
 * tp     - subflow TCP control block; t_local_aid supplies the address
 *          id and TMPF_BACKUP_PATH selects the backup flag
 * cp     - option buffer; the option is copied to cp + optlen
 * optlen - number of option bytes already used in cp
 *
 * When the subflow is not in TCPS_ESTABLISHED, TMPF_SND_MPPRIO is
 * cleared. The option is built only if it fits in the space left
 * below MAX_TCPOPTLEN. After the copy, optlen is advanced by the
 * option size and TMPF_SND_MPPRIO is cleared.
 *
 * NOTE(review): the statements that follow the two early checks, the
 * argument line of the final log call, and the end of the function
 * (presumably returning the updated optlen) are not visible in this
 * listing; confirm against the complete file.
 */
1551 mptcp_snd_mpprio(struct tcpcb
*tp
, u_char
*cp
, int optlen
)
1553 struct mptcp_mpprio_addr_opt mpprio
;
1555 if (tp
->t_state
!= TCPS_ESTABLISHED
) {
1556 tp
->t_mpflags
&= ~TMPF_SND_MPPRIO
;
/* Not enough room left in the option space for this option. */
1560 if ((MAX_TCPOPTLEN
- optlen
) <
1561 (int)sizeof (mpprio
))
1564 bzero(&mpprio
, sizeof (mpprio
));
1565 mpprio
.mpprio_kind
= TCPOPT_MULTIPATH
;
1566 mpprio
.mpprio_len
= sizeof (mpprio
);
1567 mpprio
.mpprio_subtype
= MPO_PRIO
;
1568 if (tp
->t_mpflags
& TMPF_BACKUP_PATH
)
1569 mpprio
.mpprio_flags
|= MPTCP_MPPRIO_BKP
;
1570 mpprio
.mpprio_addrid
= tp
->t_local_aid
;
/* Append the finished option behind the bytes already in cp. */
1571 memcpy(cp
+ optlen
, &mpprio
, sizeof (mpprio
));
1572 optlen
+= sizeof (mpprio
);
1573 tp
->t_mpflags
&= ~TMPF_SND_MPPRIO
;
1574 mptcplog((LOG_DEBUG
, "%s: aid = %d \n", __func__
,
1576 (MPTCP_SOCKET_DBG
|MPTCP_SENDER_DBG
), MPTCP_LOGLVL_LOG
);