]> git.saurik.com Git - apple/xnu.git/blob - bsd/netinet/mptcp_usrreq.c
xnu-6153.141.1.tar.gz
[apple/xnu.git] / bsd / netinet / mptcp_usrreq.c
1 /*
2 * Copyright (c) 2012-2017 Apple Inc. All rights reserved.
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5 *
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
14 *
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
25 *
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28
29 #include <sys/param.h>
30 #include <sys/systm.h>
31 #include <sys/kernel.h>
32 #include <sys/socket.h>
33 #include <sys/socketvar.h>
34 #include <sys/protosw.h>
35 #include <sys/mcache.h>
36 #include <sys/syslog.h>
37 #include <sys/proc.h>
38 #include <sys/proc_internal.h>
39 #include <sys/resourcevar.h>
40 #include <sys/kauth.h>
41 #include <sys/priv.h>
42
43 #include <net/if.h>
44 #include <netinet/in.h>
45 #include <netinet/in_var.h>
46 #include <netinet/tcp.h>
47 #include <netinet/tcp_fsm.h>
48 #include <netinet/tcp_seq.h>
49 #include <netinet/tcp_var.h>
50 #include <netinet/tcp_timer.h>
51 #include <netinet/mptcp_var.h>
52 #include <netinet/mptcp_timer.h>
53
54 #include <mach/sdt.h>
55
56 static int mptcp_usr_attach(struct socket *, int, struct proc *);
57 static int mptcp_usr_detach(struct socket *);
58 static int mptcp_attach(struct socket *, struct proc *);
59 static int mptcp_usr_connectx(struct socket *, struct sockaddr *,
60 struct sockaddr *, struct proc *, uint32_t, sae_associd_t,
61 sae_connid_t *, uint32_t, void *, uint32_t, struct uio *, user_ssize_t *);
62 static int mptcp_getassocids(struct mptses *, uint32_t *, user_addr_t);
63 static int mptcp_getconnids(struct mptses *, sae_associd_t, uint32_t *,
64 user_addr_t);
65 static int mptcp_getconninfo(struct mptses *, sae_connid_t *, uint32_t *,
66 uint32_t *, int32_t *, user_addr_t, socklen_t *, user_addr_t, socklen_t *,
67 uint32_t *, user_addr_t, uint32_t *);
68 static int mptcp_usr_control(struct socket *, u_long, caddr_t, struct ifnet *,
69 struct proc *);
70 static int mptcp_disconnect(struct mptses *);
71 static int mptcp_usr_disconnect(struct socket *);
72 static int mptcp_usr_disconnectx(struct socket *, sae_associd_t, sae_connid_t);
73 static struct mptses *mptcp_usrclosed(struct mptses *);
74 static int mptcp_usr_rcvd(struct socket *, int);
75 static int mptcp_usr_send(struct socket *, int, struct mbuf *,
76 struct sockaddr *, struct mbuf *, struct proc *);
77 static int mptcp_usr_shutdown(struct socket *);
78 static int mptcp_usr_sosend(struct socket *, struct sockaddr *, struct uio *,
79 struct mbuf *, struct mbuf *, int);
80 static int mptcp_usr_socheckopt(struct socket *, struct sockopt *);
81 static int mptcp_usr_preconnect(struct socket *so);
82
83 struct pr_usrreqs mptcp_usrreqs = {
84 .pru_attach = mptcp_usr_attach,
85 .pru_connectx = mptcp_usr_connectx,
86 .pru_control = mptcp_usr_control,
87 .pru_detach = mptcp_usr_detach,
88 .pru_disconnect = mptcp_usr_disconnect,
89 .pru_disconnectx = mptcp_usr_disconnectx,
90 .pru_peeraddr = mp_getpeeraddr,
91 .pru_rcvd = mptcp_usr_rcvd,
92 .pru_send = mptcp_usr_send,
93 .pru_shutdown = mptcp_usr_shutdown,
94 .pru_sockaddr = mp_getsockaddr,
95 .pru_sosend = mptcp_usr_sosend,
96 .pru_soreceive = soreceive,
97 .pru_socheckopt = mptcp_usr_socheckopt,
98 .pru_preconnect = mptcp_usr_preconnect,
99 };
100
101
102 #if (DEVELOPMENT || DEBUG)
103 static int mptcp_disable_entitlements = 0;
104 SYSCTL_INT(_net_inet_mptcp, OID_AUTO, disable_entitlements, CTLFLAG_RW | CTLFLAG_LOCKED,
105 &mptcp_disable_entitlements, 0, "Disable Multipath TCP Entitlement Checking");
106 #endif
107
108 int mptcp_developer_mode = 0;
109 SYSCTL_INT(_net_inet_mptcp, OID_AUTO, allow_aggregate, CTLFLAG_RW | CTLFLAG_LOCKED,
110 &mptcp_developer_mode, 0, "Allow the Multipath aggregation mode");
111
112 static unsigned long mptcp_expected_progress_headstart = 5000;
113 SYSCTL_ULONG(_net_inet_mptcp, OID_AUTO, expected_progress_headstart, CTLFLAG_RW | CTLFLAG_LOCKED,
114 &mptcp_expected_progress_headstart, "Headstart to give MPTCP before meeting the progress deadline");
115
116
117 /*
118 * Attaches an MPTCP control block to a socket.
119 */
120 static int
121 mptcp_usr_attach(struct socket *mp_so, int proto, struct proc *p)
122 {
123 #pragma unused(proto)
124 int error;
125
126 VERIFY(mpsotomppcb(mp_so) == NULL);
127
128 error = mptcp_attach(mp_so, p);
129 if (error != 0) {
130 goto out;
131 }
132 /*
133 * XXX: adi@apple.com
134 *
135 * Might want to use a different SO_LINGER timeout than TCP's?
136 */
137 if ((mp_so->so_options & SO_LINGER) && mp_so->so_linger == 0) {
138 mp_so->so_linger = TCP_LINGERTIME * hz;
139 }
140 out:
141 return error;
142 }
143
144 /*
145 * Detaches an MPTCP control block from a socket.
146 */
147 static int
148 mptcp_usr_detach(struct socket *mp_so)
149 {
150 struct mptses *mpte = mpsotompte(mp_so);
151 struct mppcb *mpp = mpsotomppcb(mp_so);
152
153 if (mpp == NULL || mpp->mpp_state == MPPCB_STATE_DEAD) {
154 os_log_error(mptcp_log_handle, "%s - %lx: state: %d\n",
155 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte),
156 mpp ? mpp->mpp_state : -1);
157 return EINVAL;
158 }
159
160 /*
161 * We are done with this MPTCP socket (it has been closed);
162 * trigger all subflows to be disconnected, if not already,
163 * by initiating the PCB detach sequence (SOF_PCBCLEARING
164 * will be set.)
165 */
166 mp_pcbdetach(mp_so);
167
168 mptcp_disconnect(mpte);
169
170 return 0;
171 }
172
173 /*
174 * Attach MPTCP protocol to socket, allocating MP control block,
175 * MPTCP session, control block, buffer space, etc.
176 */
177 static int
178 mptcp_attach(struct socket *mp_so, struct proc *p)
179 {
180 #pragma unused(p)
181 struct mptses *mpte = NULL;
182 struct mptcb *mp_tp = NULL;
183 struct mppcb *mpp = NULL;
184 int error = 0;
185
186 if (mp_so->so_snd.sb_hiwat == 0 || mp_so->so_rcv.sb_hiwat == 0) {
187 error = soreserve(mp_so, tcp_sendspace, tcp_recvspace);
188 if (error != 0) {
189 goto out;
190 }
191 }
192
193 if (mp_so->so_snd.sb_preconn_hiwat == 0) {
194 soreserve_preconnect(mp_so, 2048);
195 }
196
197 if ((mp_so->so_rcv.sb_flags & SB_USRSIZE) == 0) {
198 mp_so->so_rcv.sb_flags |= SB_AUTOSIZE;
199 }
200 if ((mp_so->so_snd.sb_flags & SB_USRSIZE) == 0) {
201 mp_so->so_snd.sb_flags |= SB_AUTOSIZE;
202 }
203
204 /*
205 * MPTCP send-socket buffers cannot be compressed, due to the
206 * fact that each mbuf chained via m_next is a M_PKTHDR
207 * which carries some MPTCP metadata.
208 */
209 mp_so->so_snd.sb_flags |= SB_NOCOMPRESS;
210
211 if ((error = mp_pcballoc(mp_so, &mtcbinfo)) != 0) {
212 goto out;
213 }
214
215 mpp = mpsotomppcb(mp_so);
216 mpte = (struct mptses *)mpp->mpp_pcbe;
217 mp_tp = mpte->mpte_mptcb;
218
219 VERIFY(mp_tp != NULL);
220 out:
221 return error;
222 }
223
224 static int
225 mptcp_entitlement_check(struct socket *mp_so, uint8_t svctype)
226 {
227 struct mptses *mpte = mpsotompte(mp_so);
228
229 /* First, check for mptcp_extended without delegation */
230 if (soopt_cred_check(mp_so, PRIV_NET_RESTRICTED_MULTIPATH_EXTENDED, TRUE, FALSE) == 0) {
231 /*
232 * This means the app has the extended entitlement. Thus,
233 * it's a first party app and can run without restrictions.
234 */
235 mpte->mpte_flags |= MPTE_FIRSTPARTY;
236 return 0;
237 }
238
239 /* Now with delegation */
240 if (mp_so->so_flags & SOF_DELEGATED &&
241 soopt_cred_check(mp_so, PRIV_NET_RESTRICTED_MULTIPATH_EXTENDED, TRUE, TRUE) == 0) {
242 /*
243 * This means the app has the extended entitlement. Thus,
244 * it's a first party app and can run without restrictions.
245 */
246 mpte->mpte_flags |= MPTE_FIRSTPARTY;
247 return 0;
248 }
249
250 /* Now, take a look at exceptions configured through sysctl */
251 #if (DEVELOPMENT || DEBUG)
252 if (mptcp_disable_entitlements) {
253 return 0;
254 }
255 #endif
256
257 if (svctype == MPTCP_SVCTYPE_AGGREGATE) {
258 if (mptcp_developer_mode) {
259 return 0;
260 }
261
262 goto deny;
263 }
264
265 /* Second, check for regular users that are within the data-limits */
266 if (soopt_cred_check(mp_so, PRIV_NET_PRIVILEGED_MULTIPATH, TRUE, FALSE) == 0) {
267 return 0;
268 }
269
270 if (mp_so->so_flags & SOF_DELEGATED &&
271 soopt_cred_check(mp_so, PRIV_NET_PRIVILEGED_MULTIPATH, TRUE, TRUE) == 0) {
272 return 0;
273 }
274
275 deny:
276 os_log_error(mptcp_log_handle, "%s - %lx: MPTCP prohibited on svc %u\n",
277 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte), svctype);
278
279 return -1;
280 }
281
282 /*
283 * Common subroutine to open a MPTCP connection to one of the remote hosts
284 * specified by dst_sl. This includes allocating and establishing a
285 * subflow TCP connection, either initially to establish MPTCP connection,
286 * or to join an existing one. Returns a connection handle upon success.
287 */
288 static int
289 mptcp_connectx(struct mptses *mpte, struct sockaddr *src,
290 struct sockaddr *dst, uint32_t ifscope, sae_connid_t *pcid)
291 {
292 int error = 0;
293
294 VERIFY(dst != NULL);
295 VERIFY(pcid != NULL);
296
297 error = mptcp_subflow_add(mpte, src, dst, ifscope, pcid);
298
299 return error;
300 }
301
302 /*
303 * User-protocol pru_connectx callback.
304 */
305 static int
306 mptcp_usr_connectx(struct socket *mp_so, struct sockaddr *src,
307 struct sockaddr *dst, struct proc *p, uint32_t ifscope,
308 sae_associd_t aid, sae_connid_t *pcid, uint32_t flags, void *arg,
309 uint32_t arglen, struct uio *auio, user_ssize_t *bytes_written)
310 {
311 #pragma unused(p, aid, flags, arg, arglen)
312 struct mppcb *mpp = mpsotomppcb(mp_so);
313 struct mptses *mpte = NULL;
314 struct mptcb *mp_tp = NULL;
315 user_ssize_t datalen;
316 int error = 0;
317
318 if (mpp == NULL || mpp->mpp_state == MPPCB_STATE_DEAD) {
319 os_log_error(mptcp_log_handle, "%s - %lx: state %d\n",
320 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte),
321 mpp ? mpp->mpp_state : -1);
322 error = EINVAL;
323 goto out;
324 }
325 mpte = mptompte(mpp);
326 mp_tp = mpte->mpte_mptcb;
327
328 if (mp_tp->mpt_flags & MPTCPF_FALLBACK_TO_TCP) {
329 os_log_error(mptcp_log_handle, "%s - %lx: fell back to TCP\n",
330 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte));
331 error = EINVAL;
332 goto out;
333 }
334
335 if (dst->sa_family != AF_INET && dst->sa_family != AF_INET6) {
336 error = EAFNOSUPPORT;
337 goto out;
338 }
339
340 if (dst->sa_family == AF_INET &&
341 dst->sa_len != sizeof(mpte->__mpte_dst_v4)) {
342 os_log_error(mptcp_log_handle, "%s - %lx: IPv4 dst len %u\n",
343 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte), dst->sa_len);
344 error = EINVAL;
345 goto out;
346 }
347
348 if (dst->sa_family == AF_INET6 &&
349 dst->sa_len != sizeof(mpte->__mpte_dst_v6)) {
350 os_log_error(mptcp_log_handle, "%s - %lx: IPv6 dst len %u\n",
351 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte), dst->sa_len);
352 error = EINVAL;
353 goto out;
354 }
355
356 if (!(mpte->mpte_flags & MPTE_SVCTYPE_CHECKED)) {
357 if (mptcp_entitlement_check(mp_so, mpte->mpte_svctype) < 0) {
358 error = EPERM;
359 goto out;
360 }
361
362 mpte->mpte_flags |= MPTE_SVCTYPE_CHECKED;
363 }
364
365 if ((mp_so->so_state & (SS_ISCONNECTED | SS_ISCONNECTING)) == 0) {
366 memcpy(&mpte->mpte_u_dst, dst, dst->sa_len);
367 }
368
369 if (src) {
370 if (src->sa_family != AF_INET && src->sa_family != AF_INET6) {
371 error = EAFNOSUPPORT;
372 goto out;
373 }
374
375 if (src->sa_family == AF_INET &&
376 src->sa_len != sizeof(mpte->__mpte_src_v4)) {
377 os_log_error(mptcp_log_handle, "%s - %lx: IPv4 src len %u\n",
378 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte), src->sa_len);
379 error = EINVAL;
380 goto out;
381 }
382
383 if (src->sa_family == AF_INET6 &&
384 src->sa_len != sizeof(mpte->__mpte_src_v6)) {
385 os_log_error(mptcp_log_handle, "%s - %lx: IPv6 src len %u\n",
386 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte), src->sa_len);
387 error = EINVAL;
388 goto out;
389 }
390
391 if ((mp_so->so_state & (SS_ISCONNECTED | SS_ISCONNECTING)) == 0) {
392 memcpy(&mpte->mpte_u_src, src, src->sa_len);
393 }
394 }
395
396 error = mptcp_connectx(mpte, src, dst, ifscope, pcid);
397
398 /* If there is data, copy it */
399 if (auio != NULL) {
400 datalen = uio_resid(auio);
401 socket_unlock(mp_so, 0);
402 error = mp_so->so_proto->pr_usrreqs->pru_sosend(mp_so, NULL,
403 (uio_t) auio, NULL, NULL, 0);
404
405 if (error == 0 || error == EWOULDBLOCK) {
406 *bytes_written = datalen - uio_resid(auio);
407 }
408
409 if (error == EWOULDBLOCK) {
410 error = EINPROGRESS;
411 }
412
413 socket_lock(mp_so, 0);
414 }
415
416 out:
417 return error;
418 }
419
420 /*
421 * Handle SIOCGASSOCIDS ioctl for PF_MULTIPATH domain.
422 */
423 static int
424 mptcp_getassocids(struct mptses *mpte, uint32_t *cnt, user_addr_t aidp)
425 {
426 /* MPTCP has at most 1 association */
427 *cnt = (mpte->mpte_associd != SAE_ASSOCID_ANY) ? 1 : 0;
428
429 /* just asking how many there are? */
430 if (aidp == USER_ADDR_NULL) {
431 return 0;
432 }
433
434 return copyout(&mpte->mpte_associd, aidp,
435 sizeof(mpte->mpte_associd));
436 }
437
438 /*
439 * Handle SIOCGCONNIDS ioctl for PF_MULTIPATH domain.
440 */
441 static int
442 mptcp_getconnids(struct mptses *mpte, sae_associd_t aid, uint32_t *cnt,
443 user_addr_t cidp)
444 {
445 struct mptsub *mpts;
446 int error = 0;
447
448 if (aid != SAE_ASSOCID_ANY && aid != SAE_ASSOCID_ALL &&
449 aid != mpte->mpte_associd) {
450 return EINVAL;
451 }
452
453 *cnt = mpte->mpte_numflows;
454
455 /* just asking how many there are? */
456 if (cidp == USER_ADDR_NULL) {
457 return 0;
458 }
459
460 TAILQ_FOREACH(mpts, &mpte->mpte_subflows, mpts_entry) {
461 if ((error = copyout(&mpts->mpts_connid, cidp,
462 sizeof(mpts->mpts_connid))) != 0) {
463 break;
464 }
465
466 cidp += sizeof(mpts->mpts_connid);
467 }
468
469 return error;
470 }
471
472 /*
473 * Handle SIOCGCONNINFO ioctl for PF_MULTIPATH domain.
474 */
475 static int
476 mptcp_getconninfo(struct mptses *mpte, sae_connid_t *cid, uint32_t *flags,
477 uint32_t *ifindex, int32_t *soerror, user_addr_t src, socklen_t *src_len,
478 user_addr_t dst, socklen_t *dst_len, uint32_t *aux_type,
479 user_addr_t aux_data, uint32_t *aux_len)
480 {
481 *flags = 0;
482 *aux_type = 0;
483 *ifindex = 0;
484 *soerror = 0;
485
486 /* MPTCP-level global stats */
487 if (*cid == SAE_CONNID_ALL) {
488 struct socket *mp_so = mptetoso(mpte);
489 struct mptcb *mp_tp = mpte->mpte_mptcb;
490 struct conninfo_multipathtcp mptcp_ci;
491 int error = 0;
492
493 if (*aux_len != 0 && *aux_len != sizeof(mptcp_ci)) {
494 return EINVAL;
495 }
496
497 if (mp_so->so_state & SS_ISCONNECTING) {
498 *flags |= CIF_CONNECTING;
499 }
500 if (mp_so->so_state & SS_ISCONNECTED) {
501 *flags |= CIF_CONNECTED;
502 }
503 if (mp_so->so_state & SS_ISDISCONNECTING) {
504 *flags |= CIF_DISCONNECTING;
505 }
506 if (mp_so->so_state & SS_ISDISCONNECTED) {
507 *flags |= CIF_DISCONNECTED;
508 }
509 if (!(mp_tp->mpt_flags & MPTCPF_FALLBACK_TO_TCP)) {
510 *flags |= CIF_MP_CAPABLE;
511 }
512 if (mp_tp->mpt_flags & MPTCPF_FALLBACK_TO_TCP) {
513 *flags |= CIF_MP_DEGRADED;
514 }
515
516 *src_len = 0;
517 *dst_len = 0;
518
519 *aux_type = CIAUX_MPTCP;
520 *aux_len = sizeof(mptcp_ci);
521
522 if (aux_data != USER_ADDR_NULL) {
523 const struct mptsub *mpts;
524 int initial_info_set = 0;
525 unsigned long i = 0;
526
527 bzero(&mptcp_ci, sizeof(mptcp_ci));
528 mptcp_ci.mptcpci_subflow_count = mpte->mpte_numflows;
529 mptcp_ci.mptcpci_switch_count = mpte->mpte_subflow_switches;
530
531 VERIFY(sizeof(mptcp_ci.mptcpci_itfstats) == sizeof(mpte->mpte_itfstats));
532 memcpy(mptcp_ci.mptcpci_itfstats, mpte->mpte_itfstats, sizeof(mptcp_ci.mptcpci_itfstats));
533
534 TAILQ_FOREACH(mpts, &mpte->mpte_subflows, mpts_entry) {
535 if (i >= sizeof(mptcp_ci.mptcpci_subflow_connids) / sizeof(sae_connid_t)) {
536 break;
537 }
538 mptcp_ci.mptcpci_subflow_connids[i] = mpts->mpts_connid;
539
540 if (mpts->mpts_flags & MPTSF_INITIAL_SUB) {
541 const struct inpcb *inp;
542
543 inp = sotoinpcb(mpts->mpts_socket);
544
545 mptcp_ci.mptcpci_init_rxbytes = inp->inp_stat->rxbytes;
546 mptcp_ci.mptcpci_init_txbytes = inp->inp_stat->txbytes;
547 initial_info_set = 1;
548 }
549
550 mptcpstats_update(mptcp_ci.mptcpci_itfstats, mpts);
551
552 i++;
553 }
554
555 if (initial_info_set == 0) {
556 mptcp_ci.mptcpci_init_rxbytes = mpte->mpte_init_rxbytes;
557 mptcp_ci.mptcpci_init_txbytes = mpte->mpte_init_txbytes;
558 }
559
560 if (mpte->mpte_flags & MPTE_FIRSTPARTY) {
561 mptcp_ci.mptcpci_flags |= MPTCPCI_FIRSTPARTY;
562 }
563
564 error = copyout(&mptcp_ci, aux_data, sizeof(mptcp_ci));
565 if (error != 0) {
566 os_log_error(mptcp_log_handle, "%s - %lx: copyout failed: %d\n",
567 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte), error);
568 return error;
569 }
570 }
571
572 return 0;
573 }
574
575 /* Any stats of any subflow */
576 if (*cid == SAE_CONNID_ANY) {
577 const struct mptsub *mpts;
578 struct socket *so;
579 const struct inpcb *inp;
580 int error = 0;
581
582 mpts = TAILQ_FIRST(&mpte->mpte_subflows);
583 if (mpts == NULL) {
584 return ENXIO;
585 }
586
587 so = mpts->mpts_socket;
588 inp = sotoinpcb(so);
589
590 if (inp->inp_vflag & INP_IPV4) {
591 error = in_getconninfo(so, SAE_CONNID_ANY, flags, ifindex,
592 soerror, src, src_len, dst, dst_len,
593 aux_type, aux_data, aux_len);
594 } else {
595 error = in6_getconninfo(so, SAE_CONNID_ANY, flags, ifindex,
596 soerror, src, src_len, dst, dst_len,
597 aux_type, aux_data, aux_len);
598 }
599
600 if (error != 0) {
601 os_log_error(mptcp_log_handle, "%s - %lx:error from in_getconninfo %d\n",
602 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte), error);
603 return error;
604 }
605
606 if (mpts->mpts_flags & MPTSF_MP_CAPABLE) {
607 *flags |= CIF_MP_CAPABLE;
608 }
609 if (mpts->mpts_flags & MPTSF_MP_DEGRADED) {
610 *flags |= CIF_MP_DEGRADED;
611 }
612 if (mpts->mpts_flags & MPTSF_MP_READY) {
613 *flags |= CIF_MP_READY;
614 }
615 if (mpts->mpts_flags & MPTSF_ACTIVE) {
616 *flags |= CIF_MP_ACTIVE;
617 }
618
619 return 0;
620 } else {
621 /* Per-interface stats */
622 const struct mptsub *mpts, *orig_mpts;
623 struct conninfo_tcp tcp_ci;
624 const struct inpcb *inp;
625 struct socket *so;
626 int error = 0;
627 int index;
628
629 bzero(&tcp_ci, sizeof(tcp_ci));
630
631 /* First, get a subflow to fill in the "regular" info. */
632 TAILQ_FOREACH(mpts, &mpte->mpte_subflows, mpts_entry) {
633 const struct ifnet *ifp = sotoinpcb(mpts->mpts_socket)->inp_last_outifp;
634
635 if (ifp && ifp->if_index == *cid) {
636 break;
637 }
638 }
639
640 if (mpts == NULL) {
641 /* No subflow there - well, let's just get the basic itf-info */
642 goto interface_info;
643 }
644
645 so = mpts->mpts_socket;
646 inp = sotoinpcb(so);
647
648 /* Give it USER_ADDR_NULL, because we are doing this on our own */
649 if (inp->inp_vflag & INP_IPV4) {
650 error = in_getconninfo(so, SAE_CONNID_ANY, flags, ifindex,
651 soerror, src, src_len, dst, dst_len,
652 aux_type, USER_ADDR_NULL, aux_len);
653 } else {
654 error = in6_getconninfo(so, SAE_CONNID_ANY, flags, ifindex,
655 soerror, src, src_len, dst, dst_len,
656 aux_type, USER_ADDR_NULL, aux_len);
657 }
658
659 if (error != 0) {
660 os_log_error(mptcp_log_handle, "%s - %lx:error from in_getconninfo %d\n",
661 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte), error);
662 return error;
663 }
664
665 /* ToDo: Nobody is reading these flags on subflows. Why bother ? */
666 if (mpts->mpts_flags & MPTSF_MP_CAPABLE) {
667 *flags |= CIF_MP_CAPABLE;
668 }
669 if (mpts->mpts_flags & MPTSF_MP_DEGRADED) {
670 *flags |= CIF_MP_DEGRADED;
671 }
672 if (mpts->mpts_flags & MPTSF_MP_READY) {
673 *flags |= CIF_MP_READY;
674 }
675 if (mpts->mpts_flags & MPTSF_ACTIVE) {
676 *flags |= CIF_MP_ACTIVE;
677 }
678
679 /*
680 * Now, we gather the metrics (aka., tcp_info) and roll them in
681 * across all subflows of this interface to build an aggregated
682 * view.
683 *
684 * We take the TCP_INFO from the first subflow as the "master",
685 * feeding into those fields that we do not roll.
686 */
687 if (aux_data != USER_ADDR_NULL) {
688 tcp_getconninfo(so, &tcp_ci);
689
690 orig_mpts = mpts;
691 TAILQ_FOREACH(mpts, &mpte->mpte_subflows, mpts_entry) {
692 const struct inpcb *mptsinp = sotoinpcb(mpts->mpts_socket);
693 const struct ifnet *ifp;
694
695 ifp = mptsinp->inp_last_outifp;
696
697 if (ifp == NULL || ifp->if_index != *cid || mpts == orig_mpts) {
698 continue;
699 }
700
701 /* Roll the itf-stats into the tcp_info */
702 tcp_ci.tcpci_tcp_info.tcpi_txbytes +=
703 mptsinp->inp_stat->txbytes;
704 tcp_ci.tcpci_tcp_info.tcpi_rxbytes +=
705 mptsinp->inp_stat->rxbytes;
706
707 tcp_ci.tcpci_tcp_info.tcpi_wifi_txbytes +=
708 mptsinp->inp_wstat->txbytes;
709 tcp_ci.tcpci_tcp_info.tcpi_wifi_rxbytes +=
710 mptsinp->inp_wstat->rxbytes;
711
712 tcp_ci.tcpci_tcp_info.tcpi_wired_txbytes +=
713 mptsinp->inp_Wstat->txbytes;
714 tcp_ci.tcpci_tcp_info.tcpi_wired_rxbytes +=
715 mptsinp->inp_Wstat->rxbytes;
716
717 tcp_ci.tcpci_tcp_info.tcpi_cell_txbytes +=
718 mptsinp->inp_cstat->txbytes;
719 tcp_ci.tcpci_tcp_info.tcpi_cell_rxbytes +=
720 mptsinp->inp_cstat->rxbytes;
721 }
722 }
723
724 interface_info:
725 *aux_type = CIAUX_TCP;
726 if (*aux_len == 0) {
727 *aux_len = sizeof(tcp_ci);
728 } else if (aux_data != USER_ADDR_NULL) {
729 boolean_t create;
730
731 /*
732 * Finally, old subflows might have been closed - we
733 * want this data as well, so grab it from the interface
734 * stats.
735 */
736 create = orig_mpts != NULL;
737
738 /*
739 * When we found a subflow, we are willing to create a stats-index
740 * because we have some data to return. If there isn't a subflow,
741 * nor anything in the stats, return EINVAL. Because the
742 * ifindex belongs to something that doesn't exist.
743 */
744 index = mptcpstats_get_index_by_ifindex(mpte->mpte_itfstats, *cid, false);
745 if (index == -1) {
746 os_log_error(mptcp_log_handle,
747 "%s - %lx: Asking for too many ifindex: %u subcount %u, mpts? %s\n",
748 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte),
749 *cid, mpte->mpte_numflows,
750 orig_mpts ? "yes" : "no");
751
752 if (orig_mpts == NULL) {
753 return EINVAL;
754 }
755 } else {
756 struct mptcp_itf_stats *stats;
757
758 stats = &mpte->mpte_itfstats[index];
759
760 /* Roll the itf-stats into the tcp_info */
761 tcp_ci.tcpci_tcp_info.tcpi_last_outif = *cid;
762 tcp_ci.tcpci_tcp_info.tcpi_txbytes +=
763 stats->mpis_txbytes;
764 tcp_ci.tcpci_tcp_info.tcpi_rxbytes +=
765 stats->mpis_rxbytes;
766
767 tcp_ci.tcpci_tcp_info.tcpi_wifi_txbytes +=
768 stats->mpis_wifi_txbytes;
769 tcp_ci.tcpci_tcp_info.tcpi_wifi_rxbytes +=
770 stats->mpis_wifi_rxbytes;
771
772 tcp_ci.tcpci_tcp_info.tcpi_wired_txbytes +=
773 stats->mpis_wired_txbytes;
774 tcp_ci.tcpci_tcp_info.tcpi_wired_rxbytes +=
775 stats->mpis_wired_rxbytes;
776
777 tcp_ci.tcpci_tcp_info.tcpi_cell_txbytes +=
778 stats->mpis_cell_txbytes;
779 tcp_ci.tcpci_tcp_info.tcpi_cell_rxbytes +=
780 stats->mpis_cell_rxbytes;
781 }
782
783 *aux_len = min(*aux_len, sizeof(tcp_ci));
784 error = copyout(&tcp_ci, aux_data, *aux_len);
785 if (error != 0) {
786 return error;
787 }
788 }
789 }
790
791 return 0;
792 }
793
794 /*
795 * User-protocol pru_control callback.
796 */
797 static int
798 mptcp_usr_control(struct socket *mp_so, u_long cmd, caddr_t data,
799 struct ifnet *ifp, struct proc *p)
800 {
801 #pragma unused(ifp, p)
802 struct mppcb *mpp = mpsotomppcb(mp_so);
803 struct mptses *mpte;
804 int error = 0;
805
806 if (mpp == NULL || mpp->mpp_state == MPPCB_STATE_DEAD) {
807 error = EINVAL;
808 goto out;
809 }
810 mpte = mptompte(mpp);
811
812 switch (cmd) {
813 case SIOCGASSOCIDS32: { /* struct so_aidreq32 */
814 struct so_aidreq32 aidr;
815 bcopy(data, &aidr, sizeof(aidr));
816 error = mptcp_getassocids(mpte, &aidr.sar_cnt,
817 aidr.sar_aidp);
818 if (error == 0) {
819 bcopy(&aidr, data, sizeof(aidr));
820 }
821 break;
822 }
823
824 case SIOCGASSOCIDS64: { /* struct so_aidreq64 */
825 struct so_aidreq64 aidr;
826 bcopy(data, &aidr, sizeof(aidr));
827 error = mptcp_getassocids(mpte, &aidr.sar_cnt,
828 aidr.sar_aidp);
829 if (error == 0) {
830 bcopy(&aidr, data, sizeof(aidr));
831 }
832 break;
833 }
834
835 case SIOCGCONNIDS32: { /* struct so_cidreq32 */
836 struct so_cidreq32 cidr;
837 bcopy(data, &cidr, sizeof(cidr));
838 error = mptcp_getconnids(mpte, cidr.scr_aid, &cidr.scr_cnt,
839 cidr.scr_cidp);
840 if (error == 0) {
841 bcopy(&cidr, data, sizeof(cidr));
842 }
843 break;
844 }
845
846 case SIOCGCONNIDS64: { /* struct so_cidreq64 */
847 struct so_cidreq64 cidr;
848 bcopy(data, &cidr, sizeof(cidr));
849 error = mptcp_getconnids(mpte, cidr.scr_aid, &cidr.scr_cnt,
850 cidr.scr_cidp);
851 if (error == 0) {
852 bcopy(&cidr, data, sizeof(cidr));
853 }
854 break;
855 }
856
857 case SIOCGCONNINFO32: { /* struct so_cinforeq32 */
858 struct so_cinforeq32 cifr;
859 bcopy(data, &cifr, sizeof(cifr));
860 error = mptcp_getconninfo(mpte, &cifr.scir_cid,
861 &cifr.scir_flags, &cifr.scir_ifindex, &cifr.scir_error,
862 cifr.scir_src, &cifr.scir_src_len, cifr.scir_dst,
863 &cifr.scir_dst_len, &cifr.scir_aux_type, cifr.scir_aux_data,
864 &cifr.scir_aux_len);
865 if (error == 0) {
866 bcopy(&cifr, data, sizeof(cifr));
867 }
868 break;
869 }
870
871 case SIOCGCONNINFO64: { /* struct so_cinforeq64 */
872 struct so_cinforeq64 cifr;
873 bcopy(data, &cifr, sizeof(cifr));
874 error = mptcp_getconninfo(mpte, &cifr.scir_cid,
875 &cifr.scir_flags, &cifr.scir_ifindex, &cifr.scir_error,
876 cifr.scir_src, &cifr.scir_src_len, cifr.scir_dst,
877 &cifr.scir_dst_len, &cifr.scir_aux_type, cifr.scir_aux_data,
878 &cifr.scir_aux_len);
879 if (error == 0) {
880 bcopy(&cifr, data, sizeof(cifr));
881 }
882 break;
883 }
884
885 default:
886 error = EOPNOTSUPP;
887 break;
888 }
889 out:
890 return error;
891 }
892
893 static int
894 mptcp_disconnect(struct mptses *mpte)
895 {
896 struct socket *mp_so;
897 struct mptcb *mp_tp;
898 int error = 0;
899
900 mp_so = mptetoso(mpte);
901 mp_tp = mpte->mpte_mptcb;
902
903 DTRACE_MPTCP3(disconnectx, struct mptses *, mpte,
904 struct socket *, mp_so, struct mptcb *, mp_tp);
905
906 /* if we're not detached, go thru socket state checks */
907 if (!(mp_so->so_flags & SOF_PCBCLEARING)) {
908 if (!(mp_so->so_state & (SS_ISCONNECTED |
909 SS_ISCONNECTING))) {
910 error = ENOTCONN;
911 goto out;
912 }
913 if (mp_so->so_state & SS_ISDISCONNECTING) {
914 error = EALREADY;
915 goto out;
916 }
917 }
918
919 mptcp_cancel_all_timers(mp_tp);
920 if (mp_tp->mpt_state < MPTCPS_ESTABLISHED) {
921 mptcp_close(mpte, mp_tp);
922 } else if ((mp_so->so_options & SO_LINGER) &&
923 mp_so->so_linger == 0) {
924 mptcp_drop(mpte, mp_tp, 0);
925 } else {
926 soisdisconnecting(mp_so);
927 sbflush(&mp_so->so_rcv);
928 if (mptcp_usrclosed(mpte) != NULL) {
929 mptcp_output(mpte);
930 }
931 }
932
933 if (error == 0) {
934 mptcp_subflow_workloop(mpte);
935 }
936
937 out:
938 return error;
939 }
940
/*
 * pru_disconnect callback: look up the session behind the socket and hand
 * it to mptcp_disconnect(), returning that function's result.
 */
static int
mptcp_usr_disconnect(struct socket *mp_so)
{
	struct mptses *mpte = mpsotompte(mp_so);

	return mptcp_disconnect(mpte);
}
949
950 /*
951 * User-protocol pru_disconnectx callback.
952 */
953 static int
954 mptcp_usr_disconnectx(struct socket *mp_so, sae_associd_t aid, sae_connid_t cid)
955 {
956 if (aid != SAE_ASSOCID_ANY && aid != SAE_ASSOCID_ALL) {
957 return EINVAL;
958 }
959
960 if (cid != SAE_CONNID_ANY && cid != SAE_CONNID_ALL) {
961 return EINVAL;
962 }
963
964 return mptcp_usr_disconnect(mp_so);
965 }
966
967 void
968 mptcp_finish_usrclosed(struct mptses *mpte)
969 {
970 struct mptcb *mp_tp = mpte->mpte_mptcb;
971 struct socket *mp_so = mptetoso(mpte);
972
973 if (mp_tp->mpt_state == MPTCPS_CLOSED) {
974 mpte = mptcp_close(mpte, mp_tp);
975 } else if (mp_tp->mpt_state >= MPTCPS_FIN_WAIT_2) {
976 soisdisconnected(mp_so);
977 } else {
978 struct mptsub *mpts;
979
980 TAILQ_FOREACH(mpts, &mpte->mpte_subflows, mpts_entry) {
981 if ((mp_so->so_state & (SS_CANTRCVMORE | SS_CANTSENDMORE)) ==
982 (SS_CANTRCVMORE | SS_CANTSENDMORE)) {
983 mptcp_subflow_disconnect(mpte, mpts);
984 } else {
985 mptcp_subflow_shutdown(mpte, mpts);
986 }
987 }
988 }
989 }
990
991 /*
992 * User issued close, and wish to trail thru shutdown states.
993 */
994 static struct mptses *
995 mptcp_usrclosed(struct mptses *mpte)
996 {
997 struct mptcb *mp_tp = mpte->mpte_mptcb;
998
999 mptcp_close_fsm(mp_tp, MPCE_CLOSE);
1000
1001 /* Not everything has been acknowledged - don't close the subflows! */
1002 if (mp_tp->mpt_sndnxt + 1 != mp_tp->mpt_sndmax) {
1003 return mpte;
1004 }
1005
1006 mptcp_finish_usrclosed(mpte);
1007
1008 return mpte;
1009 }
1010
1011 /*
1012 * After a receive, possible send some update to peer.
1013 */
1014 static int
1015 mptcp_usr_rcvd(struct socket *mp_so, int flags)
1016 {
1017 #pragma unused(flags)
1018 struct mppcb *mpp = mpsotomppcb(mp_so);
1019 struct mptses *mpte;
1020 struct mptsub *mpts;
1021 int error = 0;
1022
1023 if (mpp == NULL || mpp->mpp_state == MPPCB_STATE_DEAD) {
1024 error = EINVAL;
1025 goto out;
1026 }
1027
1028 mpte = mptompte(mpp);
1029
1030 TAILQ_FOREACH(mpts, &mpte->mpte_subflows, mpts_entry) {
1031 struct socket *so = mpts->mpts_socket;
1032
1033 if (so->so_proto->pr_flags & PR_WANTRCVD && so->so_pcb != NULL) {
1034 (*so->so_proto->pr_usrreqs->pru_rcvd)(so, 0);
1035 }
1036 }
1037
1038 error = mptcp_output(mpte);
1039 out:
1040 return error;
1041 }
1042
1043 /*
1044 * Do a send by putting data in the output queue.
1045 */
1046 static int
1047 mptcp_usr_send(struct socket *mp_so, int prus_flags, struct mbuf *m,
1048 struct sockaddr *nam, struct mbuf *control, struct proc *p)
1049 {
1050 #pragma unused(nam, p)
1051 struct mppcb *mpp = mpsotomppcb(mp_so);
1052 struct mptses *mpte;
1053 int error = 0;
1054
1055 if (prus_flags & (PRUS_OOB | PRUS_EOF)) {
1056 error = EOPNOTSUPP;
1057 goto out;
1058 }
1059
1060 if (nam != NULL) {
1061 error = EOPNOTSUPP;
1062 goto out;
1063 }
1064
1065 if (control != NULL && control->m_len != 0) {
1066 error = EOPNOTSUPP;
1067 goto out;
1068 }
1069
1070 if (mpp == NULL || mpp->mpp_state == MPPCB_STATE_DEAD) {
1071 error = ECONNRESET;
1072 goto out;
1073 }
1074 mpte = mptompte(mpp);
1075 VERIFY(mpte != NULL);
1076
1077 if (!(mp_so->so_state & SS_ISCONNECTED) &&
1078 !(mp_so->so_flags1 & SOF1_PRECONNECT_DATA)) {
1079 error = ENOTCONN;
1080 goto out;
1081 }
1082
1083 mptcp_insert_dsn(mpp, m);
1084 VERIFY(mp_so->so_snd.sb_flags & SB_NOCOMPRESS);
1085 sbappendstream(&mp_so->so_snd, m);
1086 m = NULL;
1087
1088 error = mptcp_output(mpte);
1089 if (error != 0) {
1090 goto out;
1091 }
1092
1093 if (mp_so->so_state & SS_ISCONNECTING) {
1094 if (mp_so->so_state & SS_NBIO) {
1095 error = EWOULDBLOCK;
1096 } else {
1097 error = sbwait(&mp_so->so_snd);
1098 }
1099 }
1100
1101 out:
1102 if (error) {
1103 if (m != NULL) {
1104 m_freem(m);
1105 }
1106 if (control != NULL) {
1107 m_freem(control);
1108 }
1109 }
1110 return error;
1111 }
1112
1113 /*
1114 * Mark the MPTCP connection as being incapable of further output.
1115 */
1116 static int
1117 mptcp_usr_shutdown(struct socket *mp_so)
1118 {
1119 struct mppcb *mpp = mpsotomppcb(mp_so);
1120 struct mptses *mpte;
1121 int error = 0;
1122
1123 if (mpp == NULL || mpp->mpp_state == MPPCB_STATE_DEAD) {
1124 error = EINVAL;
1125 goto out;
1126 }
1127 mpte = mptompte(mpp);
1128 VERIFY(mpte != NULL);
1129
1130 socantsendmore(mp_so);
1131
1132 mpte = mptcp_usrclosed(mpte);
1133 if (mpte != NULL) {
1134 error = mptcp_output(mpte);
1135 }
1136 out:
1137 return error;
1138 }
1139
1140 /*
1141 * Copy the contents of uio into a properly sized mbuf chain.
1142 */
1143 static int
1144 mptcp_uiotombuf(struct uio *uio, int how, int space, uint32_t align,
1145 struct mbuf **top)
1146 {
1147 struct mbuf *m, *mb, *nm = NULL, *mtail = NULL;
1148 user_ssize_t resid, tot, len, progress; /* must be user_ssize_t */
1149 int error;
1150
1151 VERIFY(top != NULL && *top == NULL);
1152
1153 /*
1154 * space can be zero or an arbitrary large value bound by
1155 * the total data supplied by the uio.
1156 */
1157 resid = uio_resid(uio);
1158 if (space > 0) {
1159 tot = imin(resid, space);
1160 } else {
1161 tot = resid;
1162 }
1163
1164 /*
1165 * The smallest unit is a single mbuf with pkthdr.
1166 * We can't align past it.
1167 */
1168 if (align >= MHLEN) {
1169 return EINVAL;
1170 }
1171
1172 /*
1173 * Give us the full allocation or nothing.
1174 * If space is zero return the smallest empty mbuf.
1175 */
1176 if ((len = tot + align) == 0) {
1177 len = 1;
1178 }
1179
1180 /* Loop and append maximum sized mbufs to the chain tail. */
1181 while (len > 0) {
1182 uint32_t m_needed = 1;
1183
1184 if (njcl > 0 && len > MBIGCLBYTES) {
1185 mb = m_getpackets_internal(&m_needed, 1,
1186 how, 1, M16KCLBYTES);
1187 } else if (len > MCLBYTES) {
1188 mb = m_getpackets_internal(&m_needed, 1,
1189 how, 1, MBIGCLBYTES);
1190 } else if (len >= (signed)MINCLSIZE) {
1191 mb = m_getpackets_internal(&m_needed, 1,
1192 how, 1, MCLBYTES);
1193 } else {
1194 mb = m_gethdr(how, MT_DATA);
1195 }
1196
1197 /* Fail the whole operation if one mbuf can't be allocated. */
1198 if (mb == NULL) {
1199 if (nm != NULL) {
1200 m_freem(nm);
1201 }
1202 return ENOBUFS;
1203 }
1204
1205 /* Book keeping. */
1206 VERIFY(mb->m_flags & M_PKTHDR);
1207 len -= ((mb->m_flags & M_EXT) ? mb->m_ext.ext_size : MHLEN);
1208 if (mtail != NULL) {
1209 mtail->m_next = mb;
1210 } else {
1211 nm = mb;
1212 }
1213 mtail = mb;
1214 }
1215
1216 m = nm;
1217 m->m_data += align;
1218
1219 progress = 0;
1220 /* Fill all mbufs with uio data and update header information. */
1221 for (mb = m; mb != NULL; mb = mb->m_next) {
1222 len = imin(M_TRAILINGSPACE(mb), tot - progress);
1223
1224 error = uiomove(mtod(mb, char *), len, uio);
1225 if (error != 0) {
1226 m_freem(m);
1227 return error;
1228 }
1229
1230 /* each mbuf is M_PKTHDR chained via m_next */
1231 mb->m_len = len;
1232 mb->m_pkthdr.len = len;
1233
1234 progress += len;
1235 }
1236 VERIFY(progress == tot);
1237 *top = m;
1238 return 0;
1239 }
1240
1241 /*
1242 * MPTCP socket protocol-user socket send routine, derived from sosend().
1243 */
1244 static int
1245 mptcp_usr_sosend(struct socket *mp_so, struct sockaddr *addr, struct uio *uio,
1246 struct mbuf *top, struct mbuf *control, int flags)
1247 {
1248 #pragma unused(addr)
1249 int32_t space;
1250 user_ssize_t resid;
1251 int error, sendflags;
1252 struct proc *p = current_proc();
1253 int sblocked = 0;
1254
1255 /* UIO is required for now, due to per-mbuf M_PKTHDR constrains */
1256 if (uio == NULL || top != NULL) {
1257 error = EINVAL;
1258 goto out;
1259 }
1260 resid = uio_resid(uio);
1261
1262 socket_lock(mp_so, 1);
1263 so_update_last_owner_locked(mp_so, p);
1264 so_update_policy(mp_so);
1265
1266 VERIFY(mp_so->so_type == SOCK_STREAM);
1267 VERIFY(!(mp_so->so_flags & SOF_MP_SUBFLOW));
1268
1269 if ((flags & (MSG_OOB | MSG_DONTROUTE)) ||
1270 (mp_so->so_flags & SOF_ENABLE_MSGS)) {
1271 error = EOPNOTSUPP;
1272 socket_unlock(mp_so, 1);
1273 goto out;
1274 }
1275
1276 /*
1277 * In theory resid should be unsigned. However, space must be
1278 * signed, as it might be less than 0 if we over-committed, and we
1279 * must use a signed comparison of space and resid. On the other
1280 * hand, a negative resid causes us to loop sending 0-length
1281 * segments to the protocol.
1282 */
1283 if (resid < 0 || (flags & MSG_EOR) || control != NULL) {
1284 error = EINVAL;
1285 socket_unlock(mp_so, 1);
1286 goto out;
1287 }
1288
1289 OSIncrementAtomicLong(&p->p_stats->p_ru.ru_msgsnd);
1290
1291 do {
1292 error = sosendcheck(mp_so, NULL, resid, 0, 0, flags,
1293 &sblocked, NULL);
1294 if (error != 0) {
1295 goto release;
1296 }
1297
1298 space = sbspace(&mp_so->so_snd);
1299 do {
1300 socket_unlock(mp_so, 0);
1301 /*
1302 * Copy the data from userland into an mbuf chain.
1303 */
1304 error = mptcp_uiotombuf(uio, M_WAITOK, space, 0, &top);
1305 if (error != 0) {
1306 socket_lock(mp_so, 0);
1307 goto release;
1308 }
1309 VERIFY(top != NULL);
1310 space -= resid - uio_resid(uio);
1311 resid = uio_resid(uio);
1312 socket_lock(mp_so, 0);
1313
1314 /*
1315 * Compute flags here, for pru_send and NKEs.
1316 */
1317 sendflags = (resid > 0 && space > 0) ?
1318 PRUS_MORETOCOME : 0;
1319
1320 /*
1321 * Socket filter processing
1322 */
1323 VERIFY(control == NULL);
1324 error = sflt_data_out(mp_so, NULL, &top, &control, 0);
1325 if (error != 0) {
1326 if (error == EJUSTRETURN) {
1327 error = 0;
1328 top = NULL;
1329 /* always free control if any */
1330 }
1331 goto release;
1332 }
1333 if (control != NULL) {
1334 m_freem(control);
1335 control = NULL;
1336 }
1337
1338 /*
1339 * Pass data to protocol.
1340 */
1341 error = (*mp_so->so_proto->pr_usrreqs->pru_send)
1342 (mp_so, sendflags, top, NULL, NULL, p);
1343
1344 top = NULL;
1345 if (error != 0) {
1346 goto release;
1347 }
1348 } while (resid != 0 && space > 0);
1349 } while (resid != 0);
1350
1351 release:
1352 if (sblocked) {
1353 sbunlock(&mp_so->so_snd, FALSE); /* will unlock socket */
1354 } else {
1355 socket_unlock(mp_so, 1);
1356 }
1357 out:
1358 if (top != NULL) {
1359 m_freem(top);
1360 }
1361 if (control != NULL) {
1362 m_freem(control);
1363 }
1364
1365 soclearfastopen(mp_so);
1366
1367 return error;
1368 }
1369
1370 /*
1371 * Called to filter SOPT_{SET,GET} for SOL_SOCKET level socket options.
1372 * This routine simply indicates to the caller whether or not to proceed
1373 * further with the given socket option. This is invoked by sosetoptlock()
1374 * and sogetoptlock().
1375 */
1376 static int
1377 mptcp_usr_socheckopt(struct socket *mp_so, struct sockopt *sopt)
1378 {
1379 #pragma unused(mp_so)
1380 int error = 0;
1381
1382 VERIFY(sopt->sopt_level == SOL_SOCKET);
1383
1384 /*
1385 * We could check for sopt_dir (set/get) here, but we'll just
1386 * let the caller deal with it as appropriate; therefore the
1387 * following is a superset of the socket options which we
1388 * allow for set/get.
1389 *
1390 * XXX: adi@apple.com
1391 *
1392 * Need to consider the following cases:
1393 *
1394 * a. Certain socket options don't have a clear definition
1395 * on the expected behavior post connect(2). At the time
1396 * those options are issued on the MP socket, there may
1397 * be existing subflow sockets that are already connected.
1398 */
1399 switch (sopt->sopt_name) {
1400 case SO_LINGER: /* MP */
1401 case SO_LINGER_SEC: /* MP */
1402 case SO_TYPE: /* MP */
1403 case SO_NREAD: /* MP */
1404 case SO_NWRITE: /* MP */
1405 case SO_ERROR: /* MP */
1406 case SO_SNDBUF: /* MP */
1407 case SO_RCVBUF: /* MP */
1408 case SO_SNDLOWAT: /* MP */
1409 case SO_RCVLOWAT: /* MP */
1410 case SO_SNDTIMEO: /* MP */
1411 case SO_RCVTIMEO: /* MP */
1412 case SO_NKE: /* MP */
1413 case SO_NOSIGPIPE: /* MP */
1414 case SO_NOADDRERR: /* MP */
1415 case SO_LABEL: /* MP */
1416 case SO_PEERLABEL: /* MP */
1417 case SO_DEFUNCTIT: /* MP */
1418 case SO_DEFUNCTOK: /* MP */
1419 case SO_ISDEFUNCT: /* MP */
1420 case SO_TRAFFIC_CLASS_DBG: /* MP */
1421 case SO_DELEGATED: /* MP */
1422 case SO_DELEGATED_UUID: /* MP */
1423 #if NECP
1424 case SO_NECP_ATTRIBUTES:
1425 case SO_NECP_CLIENTUUID:
1426 #endif /* NECP */
1427 case SO_MPKL_SEND_INFO:
1428 /*
1429 * Tell the caller that these options are to be processed.
1430 */
1431 break;
1432
1433 case SO_DEBUG: /* MP + subflow */
1434 case SO_KEEPALIVE: /* MP + subflow */
1435 case SO_USELOOPBACK: /* MP + subflow */
1436 case SO_RANDOMPORT: /* MP + subflow */
1437 case SO_TRAFFIC_CLASS: /* MP + subflow */
1438 case SO_RECV_TRAFFIC_CLASS: /* MP + subflow */
1439 case SO_PRIVILEGED_TRAFFIC_CLASS: /* MP + subflow */
1440 case SO_RECV_ANYIF: /* MP + subflow */
1441 case SO_RESTRICTIONS: /* MP + subflow */
1442 case SO_FLUSH: /* MP + subflow */
1443 case SO_NOWAKEFROMSLEEP:
1444 case SO_NOAPNFALLBK:
1445 case SO_MARK_CELLFALLBACK:
1446 /*
1447 * Tell the caller that these options are to be processed;
1448 * these will also be recorded later by mptcp_setopt().
1449 *
1450 * NOTE: Only support integer option value for now.
1451 */
1452 if (sopt->sopt_valsize != sizeof(int)) {
1453 error = EINVAL;
1454 }
1455 break;
1456
1457 default:
1458 /*
1459 * Tell the caller to stop immediately and return an error.
1460 */
1461 error = ENOPROTOOPT;
1462 break;
1463 }
1464
1465 return error;
1466 }
1467
1468 /*
1469 * Issue SOPT_SET for all MPTCP subflows (for integer option values.)
1470 */
1471 static int
1472 mptcp_setopt_apply(struct mptses *mpte, struct mptopt *mpo)
1473 {
1474 struct socket *mp_so;
1475 struct mptsub *mpts;
1476 struct mptopt smpo;
1477 int error = 0;
1478
1479 /* just bail now if this isn't applicable to subflow sockets */
1480 if (!(mpo->mpo_flags & MPOF_SUBFLOW_OK)) {
1481 error = ENOPROTOOPT;
1482 goto out;
1483 }
1484
1485 /*
1486 * Skip those that are handled internally; these options
1487 * should not have been recorded and marked with the
1488 * MPOF_SUBFLOW_OK by mptcp_setopt(), but just in case.
1489 */
1490 if (mpo->mpo_level == SOL_SOCKET &&
1491 (mpo->mpo_name == SO_NOSIGPIPE || mpo->mpo_name == SO_NOADDRERR)) {
1492 error = ENOPROTOOPT;
1493 goto out;
1494 }
1495
1496 mp_so = mptetoso(mpte);
1497
1498 /*
1499 * Don't bother going further if there's no subflow; mark the option
1500 * with MPOF_INTERIM so that we know whether or not to remove this
1501 * option upon encountering an error while issuing it during subflow
1502 * socket creation.
1503 */
1504 if (mpte->mpte_numflows == 0) {
1505 VERIFY(TAILQ_EMPTY(&mpte->mpte_subflows));
1506 mpo->mpo_flags |= MPOF_INTERIM;
1507 /* return success */
1508 goto out;
1509 }
1510
1511 bzero(&smpo, sizeof(smpo));
1512 smpo.mpo_flags |= MPOF_SUBFLOW_OK;
1513 smpo.mpo_level = mpo->mpo_level;
1514 smpo.mpo_name = mpo->mpo_name;
1515
1516 /* grab exisiting values in case we need to rollback */
1517 TAILQ_FOREACH(mpts, &mpte->mpte_subflows, mpts_entry) {
1518 struct socket *so;
1519
1520 mpts->mpts_flags &= ~(MPTSF_SOPT_OLDVAL | MPTSF_SOPT_INPROG);
1521 mpts->mpts_oldintval = 0;
1522 smpo.mpo_intval = 0;
1523 VERIFY(mpts->mpts_socket != NULL);
1524 so = mpts->mpts_socket;
1525 if (mptcp_subflow_sogetopt(mpte, so, &smpo) == 0) {
1526 mpts->mpts_flags |= MPTSF_SOPT_OLDVAL;
1527 mpts->mpts_oldintval = smpo.mpo_intval;
1528 }
1529 }
1530
1531 /* apply socket option */
1532 TAILQ_FOREACH(mpts, &mpte->mpte_subflows, mpts_entry) {
1533 struct socket *so;
1534
1535 mpts->mpts_flags |= MPTSF_SOPT_INPROG;
1536 VERIFY(mpts->mpts_socket != NULL);
1537 so = mpts->mpts_socket;
1538 error = mptcp_subflow_sosetopt(mpte, mpts, mpo);
1539 if (error != 0) {
1540 break;
1541 }
1542 }
1543
1544 /* cleanup, and rollback if needed */
1545 TAILQ_FOREACH(mpts, &mpte->mpte_subflows, mpts_entry) {
1546 struct socket *so;
1547
1548 if (!(mpts->mpts_flags & MPTSF_SOPT_INPROG)) {
1549 /* clear in case it's set */
1550 mpts->mpts_flags &= ~MPTSF_SOPT_OLDVAL;
1551 mpts->mpts_oldintval = 0;
1552 continue;
1553 }
1554 if (!(mpts->mpts_flags & MPTSF_SOPT_OLDVAL)) {
1555 mpts->mpts_flags &= ~MPTSF_SOPT_INPROG;
1556 VERIFY(mpts->mpts_oldintval == 0);
1557 continue;
1558 }
1559 /* error during sosetopt, so roll it back */
1560 if (error != 0) {
1561 VERIFY(mpts->mpts_socket != NULL);
1562 so = mpts->mpts_socket;
1563 smpo.mpo_intval = mpts->mpts_oldintval;
1564 mptcp_subflow_sosetopt(mpte, mpts, &smpo);
1565 }
1566 mpts->mpts_oldintval = 0;
1567 mpts->mpts_flags &= ~(MPTSF_SOPT_OLDVAL | MPTSF_SOPT_INPROG);
1568 }
1569
1570 out:
1571 return error;
1572 }
1573
1574 /*
1575 * Handle SOPT_SET for socket options issued on MP socket.
1576 */
1577 static int
1578 mptcp_setopt(struct mptses *mpte, struct sockopt *sopt)
1579 {
1580 int error = 0, optval = 0, level, optname, rec = 1;
1581 struct mptopt smpo, *mpo = NULL;
1582 struct socket *mp_so;
1583
1584 level = sopt->sopt_level;
1585 optname = sopt->sopt_name;
1586
1587 mp_so = mptetoso(mpte);
1588
1589 /*
1590 * Record socket options which are applicable to subflow sockets so
1591 * that we can replay them for new ones; see mptcp_usr_socheckopt()
1592 * for the list of eligible socket-level options.
1593 */
1594 if (level == SOL_SOCKET) {
1595 switch (optname) {
1596 case SO_DEBUG:
1597 case SO_KEEPALIVE:
1598 case SO_USELOOPBACK:
1599 case SO_RANDOMPORT:
1600 case SO_TRAFFIC_CLASS:
1601 case SO_RECV_TRAFFIC_CLASS:
1602 case SO_PRIVILEGED_TRAFFIC_CLASS:
1603 case SO_RECV_ANYIF:
1604 case SO_RESTRICTIONS:
1605 case SO_NOWAKEFROMSLEEP:
1606 case SO_NOAPNFALLBK:
1607 case SO_MARK_CELLFALLBACK:
1608 /* record it */
1609 break;
1610 case SO_FLUSH:
1611 /* don't record it */
1612 rec = 0;
1613 break;
1614
1615 /* Next ones, record at MPTCP-level */
1616 case SO_DELEGATED:
1617 error = sooptcopyin(sopt, &mpte->mpte_epid,
1618 sizeof(int), sizeof(int));
1619 if (error != 0) {
1620 goto err_out;
1621 }
1622
1623 goto out;
1624 case SO_DELEGATED_UUID:
1625 error = sooptcopyin(sopt, &mpte->mpte_euuid,
1626 sizeof(uuid_t), sizeof(uuid_t));
1627 if (error != 0) {
1628 goto err_out;
1629 }
1630
1631 goto out;
1632 #if NECP
1633 case SO_NECP_CLIENTUUID:
1634 if (!uuid_is_null(mpsotomppcb(mp_so)->necp_client_uuid)) {
1635 error = EINVAL;
1636 goto err_out;
1637 }
1638
1639 error = sooptcopyin(sopt, &mpsotomppcb(mp_so)->necp_client_uuid,
1640 sizeof(uuid_t), sizeof(uuid_t));
1641 if (error != 0) {
1642 goto err_out;
1643 }
1644
1645 mpsotomppcb(mp_so)->necp_cb = mptcp_session_necp_cb;
1646 error = necp_client_register_multipath_cb(mp_so->last_pid,
1647 mpsotomppcb(mp_so)->necp_client_uuid,
1648 mpsotomppcb(mp_so));
1649 if (error) {
1650 goto err_out;
1651 }
1652
1653 if (uuid_is_null(mpsotomppcb(mp_so)->necp_client_uuid)) {
1654 error = EINVAL;
1655 goto err_out;
1656 }
1657
1658 goto out;
1659 case SO_NECP_ATTRIBUTES:
1660 #endif /* NECP */
1661 default:
1662 /* nothing to do; just return */
1663 goto out;
1664 }
1665 } else {
1666 switch (optname) {
1667 case TCP_NODELAY:
1668 case TCP_RXT_FINDROP:
1669 case TCP_KEEPALIVE:
1670 case TCP_KEEPINTVL:
1671 case TCP_KEEPCNT:
1672 case TCP_CONNECTIONTIMEOUT:
1673 case TCP_RXT_CONNDROPTIME:
1674 case PERSIST_TIMEOUT:
1675 case TCP_ADAPTIVE_READ_TIMEOUT:
1676 case TCP_ADAPTIVE_WRITE_TIMEOUT:
1677 /* eligible; record it */
1678 break;
1679 case TCP_NOTSENT_LOWAT:
1680 /* record at MPTCP level */
1681 error = sooptcopyin(sopt, &optval, sizeof(optval),
1682 sizeof(optval));
1683 if (error) {
1684 goto err_out;
1685 }
1686 if (optval < 0) {
1687 error = EINVAL;
1688 goto err_out;
1689 } else {
1690 if (optval == 0) {
1691 mp_so->so_flags &= ~SOF_NOTSENT_LOWAT;
1692 error = mptcp_set_notsent_lowat(mpte, 0);
1693 } else {
1694 mp_so->so_flags |= SOF_NOTSENT_LOWAT;
1695 error = mptcp_set_notsent_lowat(mpte,
1696 optval);
1697 }
1698
1699 if (error) {
1700 goto err_out;
1701 }
1702 }
1703 goto out;
1704 case MPTCP_SERVICE_TYPE:
1705 /* record at MPTCP level */
1706 error = sooptcopyin(sopt, &optval, sizeof(optval),
1707 sizeof(optval));
1708 if (error) {
1709 goto err_out;
1710 }
1711 if (optval < 0 || optval >= MPTCP_SVCTYPE_MAX) {
1712 error = EINVAL;
1713 goto err_out;
1714 }
1715
1716 if (mptcp_entitlement_check(mp_so, optval) < 0) {
1717 error = EACCES;
1718 goto err_out;
1719 }
1720
1721 mpte->mpte_svctype = optval;
1722 mpte->mpte_flags |= MPTE_SVCTYPE_CHECKED;
1723
1724 goto out;
1725 case MPTCP_ALTERNATE_PORT:
1726 /* record at MPTCP level */
1727 error = sooptcopyin(sopt, &optval, sizeof(optval),
1728 sizeof(optval));
1729 if (error) {
1730 goto err_out;
1731 }
1732
1733 if (optval < 0 || optval > UINT16_MAX) {
1734 error = EINVAL;
1735 goto err_out;
1736 }
1737
1738 mpte->mpte_alternate_port = optval;
1739
1740 goto out;
1741 case MPTCP_FORCE_ENABLE:
1742 /* record at MPTCP level */
1743 error = sooptcopyin(sopt, &optval, sizeof(optval),
1744 sizeof(optval));
1745 if (error) {
1746 goto err_out;
1747 }
1748
1749 if (optval < 0 || optval > 1) {
1750 error = EINVAL;
1751 goto err_out;
1752 }
1753
1754 if (optval) {
1755 mpte->mpte_flags |= MPTE_FORCE_ENABLE;
1756 } else {
1757 mpte->mpte_flags &= ~MPTE_FORCE_ENABLE;
1758 }
1759
1760 goto out;
1761 case MPTCP_EXPECTED_PROGRESS_TARGET:
1762 {
1763 struct mptcb *mp_tp = mpte->mpte_mptcb;
1764 uint64_t mach_time_target;
1765 uint64_t nanoseconds;
1766
1767 if (mpte->mpte_svctype != MPTCP_SVCTYPE_TARGET_BASED) {
1768 os_log(mptcp_log_handle, "%s - %lx: Can't set urgent activity when svctype is %u\n",
1769 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte), mpte->mpte_svctype);
1770 error = EINVAL;
1771 goto err_out;
1772 }
1773
1774 error = sooptcopyin(sopt, &mach_time_target, sizeof(mach_time_target), sizeof(mach_time_target));
1775 if (error) {
1776 goto err_out;
1777 }
1778
1779 if (!mptcp_ok_to_create_subflows(mp_tp)) {
1780 os_log(mptcp_log_handle, "%s - %lx: Not ok to create subflows, state %u flags %#x\n",
1781 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte), mp_tp->mpt_state, mp_tp->mpt_flags);
1782 error = EINVAL;
1783 goto err_out;
1784 }
1785
1786 if (mach_time_target) {
1787 uint64_t time_now = 0;
1788 uint64_t time_now_nanoseconds;
1789
1790 absolutetime_to_nanoseconds(mach_time_target, &nanoseconds);
1791 nanoseconds = nanoseconds - (mptcp_expected_progress_headstart * NSEC_PER_MSEC);
1792
1793 time_now = mach_continuous_time();
1794 absolutetime_to_nanoseconds(time_now, &time_now_nanoseconds);
1795
1796 nanoseconds_to_absolutetime(nanoseconds, &mach_time_target);
1797 /* If the timer is already running and it would
1798 * fire in less than mptcp_expected_progress_headstart
1799 * seconds, then it's not worth canceling it.
1800 */
1801 if (mpte->mpte_time_target &&
1802 mpte->mpte_time_target < time_now &&
1803 time_now_nanoseconds > nanoseconds - (mptcp_expected_progress_headstart * NSEC_PER_MSEC)) {
1804 os_log(mptcp_log_handle, "%s - %lx: Not rescheduling timer %llu now %llu target %llu\n",
1805 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte),
1806 mpte->mpte_time_target,
1807 time_now,
1808 mach_time_target);
1809 goto out;
1810 }
1811 }
1812
1813 mpte->mpte_time_target = mach_time_target;
1814 mptcp_set_urgency_timer(mpte);
1815
1816 goto out;
1817 }
1818 default:
1819 /* not eligible */
1820 error = ENOPROTOOPT;
1821 goto err_out;
1822 }
1823 }
1824
1825 if ((error = sooptcopyin(sopt, &optval, sizeof(optval),
1826 sizeof(optval))) != 0) {
1827 goto err_out;
1828 }
1829
1830 if (rec) {
1831 /* search for an existing one; if not found, allocate */
1832 if ((mpo = mptcp_sopt_find(mpte, sopt)) == NULL) {
1833 mpo = mptcp_sopt_alloc(M_WAITOK);
1834 }
1835
1836 if (mpo == NULL) {
1837 error = ENOBUFS;
1838 goto err_out;
1839 } else {
1840 /* initialize or update, as needed */
1841 mpo->mpo_intval = optval;
1842 if (!(mpo->mpo_flags & MPOF_ATTACHED)) {
1843 mpo->mpo_level = level;
1844 mpo->mpo_name = optname;
1845 mptcp_sopt_insert(mpte, mpo);
1846 }
1847 /* this can be issued on the subflow socket */
1848 mpo->mpo_flags |= MPOF_SUBFLOW_OK;
1849 }
1850 } else {
1851 bzero(&smpo, sizeof(smpo));
1852 mpo = &smpo;
1853 mpo->mpo_flags |= MPOF_SUBFLOW_OK;
1854 mpo->mpo_level = level;
1855 mpo->mpo_name = optname;
1856 mpo->mpo_intval = optval;
1857 }
1858
1859 /* issue this socket option on existing subflows */
1860 error = mptcp_setopt_apply(mpte, mpo);
1861 if (error != 0 && (mpo->mpo_flags & MPOF_ATTACHED)) {
1862 VERIFY(mpo != &smpo);
1863 mptcp_sopt_remove(mpte, mpo);
1864 mptcp_sopt_free(mpo);
1865 }
1866 if (mpo == &smpo) {
1867 mpo->mpo_flags &= ~MPOF_INTERIM;
1868 }
1869
1870 if (error) {
1871 goto err_out;
1872 }
1873
1874 out:
1875
1876 return 0;
1877
1878 err_out:
1879 os_log_error(mptcp_log_handle, "%s - %lx: sopt %s (%d, %d) val %d can't be issued error %d\n",
1880 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte),
1881 mptcp_sopt2str(level, optname), level, optname, optval, error);
1882 return error;
1883 }
1884
1885 static void
1886 mptcp_fill_info_bytestats(struct tcp_info *ti, struct mptses *mpte)
1887 {
1888 struct mptsub *mpts;
1889 int i;
1890
1891 TAILQ_FOREACH(mpts, &mpte->mpte_subflows, mpts_entry) {
1892 const struct inpcb *inp = sotoinpcb(mpts->mpts_socket);
1893
1894 if (inp == NULL) {
1895 continue;
1896 }
1897
1898 ti->tcpi_txbytes += inp->inp_stat->txbytes;
1899 ti->tcpi_rxbytes += inp->inp_stat->rxbytes;
1900 ti->tcpi_cell_txbytes += inp->inp_cstat->txbytes;
1901 ti->tcpi_cell_rxbytes += inp->inp_cstat->rxbytes;
1902 ti->tcpi_wifi_txbytes += inp->inp_wstat->txbytes;
1903 ti->tcpi_wifi_rxbytes += inp->inp_wstat->rxbytes;
1904 ti->tcpi_wired_txbytes += inp->inp_Wstat->txbytes;
1905 ti->tcpi_wired_rxbytes += inp->inp_Wstat->rxbytes;
1906 }
1907
1908 for (i = 0; i < MPTCP_ITFSTATS_SIZE; i++) {
1909 struct mptcp_itf_stats *stats = &mpte->mpte_itfstats[i];
1910
1911 ti->tcpi_txbytes += stats->mpis_txbytes;
1912 ti->tcpi_rxbytes += stats->mpis_rxbytes;
1913
1914 ti->tcpi_wifi_txbytes += stats->mpis_wifi_txbytes;
1915 ti->tcpi_wifi_rxbytes += stats->mpis_wifi_rxbytes;
1916
1917 ti->tcpi_wired_txbytes += stats->mpis_wired_txbytes;
1918 ti->tcpi_wired_rxbytes += stats->mpis_wired_rxbytes;
1919
1920 ti->tcpi_cell_txbytes += stats->mpis_cell_txbytes;
1921 ti->tcpi_cell_rxbytes += stats->mpis_cell_rxbytes;
1922 }
1923 }
1924
1925 static void
1926 mptcp_fill_info(struct mptses *mpte, struct tcp_info *ti)
1927 {
1928 struct mptsub *actsub = mpte->mpte_active_sub;
1929 struct mptcb *mp_tp = mpte->mpte_mptcb;
1930 struct tcpcb *acttp = NULL;
1931
1932 if (actsub) {
1933 acttp = sototcpcb(actsub->mpts_socket);
1934 }
1935
1936 bzero(ti, sizeof(*ti));
1937
1938 ti->tcpi_state = mp_tp->mpt_state;
1939 /* tcpi_options */
1940 /* tcpi_snd_wscale */
1941 /* tcpi_rcv_wscale */
1942 /* tcpi_flags */
1943 if (acttp) {
1944 ti->tcpi_rto = acttp->t_timer[TCPT_REXMT] ? acttp->t_rxtcur : 0;
1945 }
1946
1947 /* tcpi_snd_mss */
1948 /* tcpi_rcv_mss */
1949 if (acttp) {
1950 ti->tcpi_rttcur = acttp->t_rttcur;
1951 ti->tcpi_srtt = acttp->t_srtt >> TCP_RTT_SHIFT;
1952 ti->tcpi_rttvar = acttp->t_rttvar >> TCP_RTTVAR_SHIFT;
1953 ti->tcpi_rttbest = acttp->t_rttbest >> TCP_RTT_SHIFT;
1954 }
1955 /* tcpi_snd_ssthresh */
1956 /* tcpi_snd_cwnd */
1957 /* tcpi_rcv_space */
1958 ti->tcpi_snd_wnd = mp_tp->mpt_sndwnd;
1959 ti->tcpi_snd_nxt = mp_tp->mpt_sndnxt;
1960 ti->tcpi_rcv_nxt = mp_tp->mpt_rcvnxt;
1961 if (acttp) {
1962 ti->tcpi_last_outif = (acttp->t_inpcb->inp_last_outifp == NULL) ? 0 :
1963 acttp->t_inpcb->inp_last_outifp->if_index;
1964 }
1965
1966 mptcp_fill_info_bytestats(ti, mpte);
1967 /* tcpi_txpackets */
1968
1969 /* tcpi_txretransmitbytes */
1970 /* tcpi_txunacked */
1971 /* tcpi_rxpackets */
1972
1973 /* tcpi_rxduplicatebytes */
1974 /* tcpi_rxoutoforderbytes */
1975 /* tcpi_snd_bw */
1976 /* tcpi_synrexmits */
1977 /* tcpi_unused1 */
1978 /* tcpi_unused2 */
1979 /* tcpi_cell_rxpackets */
1980
1981 /* tcpi_cell_txpackets */
1982
1983 /* tcpi_wifi_rxpackets */
1984
1985 /* tcpi_wifi_txpackets */
1986
1987 /* tcpi_wired_rxpackets */
1988 /* tcpi_wired_txpackets */
1989 /* tcpi_connstatus */
1990 /* TFO-stuff */
1991 /* ECN stuff */
1992 /* tcpi_ecn_recv_ce */
1993 /* tcpi_ecn_recv_cwr */
1994 if (acttp) {
1995 ti->tcpi_rcvoopack = acttp->t_rcvoopack;
1996 }
1997 /* tcpi_pawsdrop */
1998 /* tcpi_sack_recovery_episode */
1999 /* tcpi_reordered_pkts */
2000 /* tcpi_dsack_sent */
2001 /* tcpi_dsack_recvd */
2002 /* tcpi_flowhash */
2003 if (acttp) {
2004 ti->tcpi_txretransmitpackets = acttp->t_stat.rxmitpkts;
2005 }
2006 }
2007
2008 /*
2009 * Handle SOPT_GET for socket options issued on MP socket.
2010 */
2011 static int
2012 mptcp_getopt(struct mptses *mpte, struct sockopt *sopt)
2013 {
2014 int error = 0, optval = 0;
2015
2016 /*
2017 * We only handle SOPT_GET for TCP level socket options; we should
2018 * not get here for socket level options since they are already
2019 * handled at the socket layer.
2020 */
2021 if (sopt->sopt_level != IPPROTO_TCP) {
2022 error = ENOPROTOOPT;
2023 goto out;
2024 }
2025
2026 switch (sopt->sopt_name) {
2027 case PERSIST_TIMEOUT:
2028 /* Only case for which we have a non-zero default */
2029 optval = tcp_max_persist_timeout;
2030 case TCP_NODELAY:
2031 case TCP_RXT_FINDROP:
2032 case TCP_KEEPALIVE:
2033 case TCP_KEEPINTVL:
2034 case TCP_KEEPCNT:
2035 case TCP_CONNECTIONTIMEOUT:
2036 case TCP_RXT_CONNDROPTIME:
2037 case TCP_ADAPTIVE_READ_TIMEOUT:
2038 case TCP_ADAPTIVE_WRITE_TIMEOUT:
2039 {
2040 struct mptopt *mpo = mptcp_sopt_find(mpte, sopt);
2041
2042 if (mpo != NULL) {
2043 optval = mpo->mpo_intval;
2044 }
2045 break;
2046 }
2047
2048 /* The next ones are stored at the MPTCP-level */
2049 case TCP_NOTSENT_LOWAT:
2050 if (mptetoso(mpte)->so_flags & SOF_NOTSENT_LOWAT) {
2051 optval = mptcp_get_notsent_lowat(mpte);
2052 } else {
2053 optval = 0;
2054 }
2055 break;
2056 case TCP_INFO:
2057 {
2058 struct tcp_info ti;
2059
2060 mptcp_fill_info(mpte, &ti);
2061 error = sooptcopyout(sopt, &ti, sizeof(struct tcp_info));
2062
2063 goto out;
2064 }
2065 case MPTCP_SERVICE_TYPE:
2066 optval = mpte->mpte_svctype;
2067 break;
2068 case MPTCP_ALTERNATE_PORT:
2069 optval = mpte->mpte_alternate_port;
2070 break;
2071 case MPTCP_FORCE_ENABLE:
2072 optval = !!(mpte->mpte_flags & MPTE_FORCE_ENABLE);
2073 break;
2074 case MPTCP_EXPECTED_PROGRESS_TARGET:
2075 error = sooptcopyout(sopt, &mpte->mpte_time_target, sizeof(mpte->mpte_time_target));
2076
2077 goto out;
2078 default:
2079 /* not eligible */
2080 error = ENOPROTOOPT;
2081 break;
2082 }
2083
2084 if (error == 0) {
2085 error = sooptcopyout(sopt, &optval, sizeof(int));
2086 }
2087
2088 out:
2089 return error;
2090 }
2091
2092 /*
2093 * MPTCP SOPT_{SET,GET} socket option handler, for options issued on the MP
2094 * socket, at SOL_SOCKET and IPPROTO_TCP levels. The former is restricted
2095 * to those that are allowed by mptcp_usr_socheckopt().
2096 */
2097 int
2098 mptcp_ctloutput(struct socket *mp_so, struct sockopt *sopt)
2099 {
2100 struct mppcb *mpp = mpsotomppcb(mp_so);
2101 struct mptses *mpte;
2102 int error = 0;
2103
2104 if (mpp == NULL || mpp->mpp_state == MPPCB_STATE_DEAD) {
2105 error = EINVAL;
2106 goto out;
2107 }
2108 mpte = mptompte(mpp);
2109 socket_lock_assert_owned(mp_so);
2110
2111 /* we only handle socket and TCP-level socket options for MPTCP */
2112 if (sopt->sopt_level != SOL_SOCKET && sopt->sopt_level != IPPROTO_TCP) {
2113 error = EINVAL;
2114 goto out;
2115 }
2116
2117 switch (sopt->sopt_dir) {
2118 case SOPT_SET:
2119 error = mptcp_setopt(mpte, sopt);
2120 break;
2121
2122 case SOPT_GET:
2123 error = mptcp_getopt(mpte, sopt);
2124 break;
2125 }
2126 out:
2127 return error;
2128 }
2129
2130 const char *
2131 mptcp_sopt2str(int level, int optname)
2132 {
2133 switch (level) {
2134 case SOL_SOCKET:
2135 switch (optname) {
2136 case SO_LINGER:
2137 return "SO_LINGER";
2138 case SO_LINGER_SEC:
2139 return "SO_LINGER_SEC";
2140 case SO_DEBUG:
2141 return "SO_DEBUG";
2142 case SO_KEEPALIVE:
2143 return "SO_KEEPALIVE";
2144 case SO_USELOOPBACK:
2145 return "SO_USELOOPBACK";
2146 case SO_TYPE:
2147 return "SO_TYPE";
2148 case SO_NREAD:
2149 return "SO_NREAD";
2150 case SO_NWRITE:
2151 return "SO_NWRITE";
2152 case SO_ERROR:
2153 return "SO_ERROR";
2154 case SO_SNDBUF:
2155 return "SO_SNDBUF";
2156 case SO_RCVBUF:
2157 return "SO_RCVBUF";
2158 case SO_SNDLOWAT:
2159 return "SO_SNDLOWAT";
2160 case SO_RCVLOWAT:
2161 return "SO_RCVLOWAT";
2162 case SO_SNDTIMEO:
2163 return "SO_SNDTIMEO";
2164 case SO_RCVTIMEO:
2165 return "SO_RCVTIMEO";
2166 case SO_NKE:
2167 return "SO_NKE";
2168 case SO_NOSIGPIPE:
2169 return "SO_NOSIGPIPE";
2170 case SO_NOADDRERR:
2171 return "SO_NOADDRERR";
2172 case SO_RESTRICTIONS:
2173 return "SO_RESTRICTIONS";
2174 case SO_LABEL:
2175 return "SO_LABEL";
2176 case SO_PEERLABEL:
2177 return "SO_PEERLABEL";
2178 case SO_RANDOMPORT:
2179 return "SO_RANDOMPORT";
2180 case SO_TRAFFIC_CLASS:
2181 return "SO_TRAFFIC_CLASS";
2182 case SO_RECV_TRAFFIC_CLASS:
2183 return "SO_RECV_TRAFFIC_CLASS";
2184 case SO_TRAFFIC_CLASS_DBG:
2185 return "SO_TRAFFIC_CLASS_DBG";
2186 case SO_PRIVILEGED_TRAFFIC_CLASS:
2187 return "SO_PRIVILEGED_TRAFFIC_CLASS";
2188 case SO_DEFUNCTIT:
2189 return "SO_DEFUNCTIT";
2190 case SO_DEFUNCTOK:
2191 return "SO_DEFUNCTOK";
2192 case SO_ISDEFUNCT:
2193 return "SO_ISDEFUNCT";
2194 case SO_OPPORTUNISTIC:
2195 return "SO_OPPORTUNISTIC";
2196 case SO_FLUSH:
2197 return "SO_FLUSH";
2198 case SO_RECV_ANYIF:
2199 return "SO_RECV_ANYIF";
2200 case SO_NOWAKEFROMSLEEP:
2201 return "SO_NOWAKEFROMSLEEP";
2202 case SO_NOAPNFALLBK:
2203 return "SO_NOAPNFALLBK";
2204 case SO_MARK_CELLFALLBACK:
2205 return "SO_CELLFALLBACK";
2206 case SO_DELEGATED:
2207 return "SO_DELEGATED";
2208 case SO_DELEGATED_UUID:
2209 return "SO_DELEGATED_UUID";
2210 #if NECP
2211 case SO_NECP_ATTRIBUTES:
2212 return "SO_NECP_ATTRIBUTES";
2213 case SO_NECP_CLIENTUUID:
2214 return "SO_NECP_CLIENTUUID";
2215 #endif /* NECP */
2216 }
2217
2218 break;
2219 case IPPROTO_TCP:
2220 switch (optname) {
2221 case TCP_NODELAY:
2222 return "TCP_NODELAY";
2223 case TCP_KEEPALIVE:
2224 return "TCP_KEEPALIVE";
2225 case TCP_KEEPINTVL:
2226 return "TCP_KEEPINTVL";
2227 case TCP_KEEPCNT:
2228 return "TCP_KEEPCNT";
2229 case TCP_CONNECTIONTIMEOUT:
2230 return "TCP_CONNECTIONTIMEOUT";
2231 case TCP_RXT_CONNDROPTIME:
2232 return "TCP_RXT_CONNDROPTIME";
2233 case PERSIST_TIMEOUT:
2234 return "PERSIST_TIMEOUT";
2235 case TCP_NOTSENT_LOWAT:
2236 return "NOTSENT_LOWAT";
2237 case TCP_ADAPTIVE_READ_TIMEOUT:
2238 return "ADAPTIVE_READ_TIMEOUT";
2239 case TCP_ADAPTIVE_WRITE_TIMEOUT:
2240 return "ADAPTIVE_WRITE_TIMEOUT";
2241 case MPTCP_SERVICE_TYPE:
2242 return "MPTCP_SERVICE_TYPE";
2243 case MPTCP_ALTERNATE_PORT:
2244 return "MPTCP_ALTERNATE_PORT";
2245 case MPTCP_FORCE_ENABLE:
2246 return "MPTCP_FORCE_ENABLE";
2247 case MPTCP_EXPECTED_PROGRESS_TARGET:
2248 return "MPTCP_EXPECTED_PROGRESS_TARGET";
2249 }
2250
2251 break;
2252 }
2253
2254 return "unknown";
2255 }
2256
2257 static int
2258 mptcp_usr_preconnect(struct socket *mp_so)
2259 {
2260 struct mptsub *mpts = NULL;
2261 struct mppcb *mpp = mpsotomppcb(mp_so);
2262 struct mptses *mpte;
2263 struct socket *so;
2264 struct tcpcb *tp = NULL;
2265 int error;
2266
2267 mpte = mptompte(mpp);
2268
2269 mpts = mptcp_get_subflow(mpte, NULL);
2270 if (mpts == NULL) {
2271 os_log_error(mptcp_log_handle, "%s - %lx: invalid preconnect ",
2272 __func__, (unsigned long)VM_KERNEL_ADDRPERM(mpte));
2273 return EINVAL;
2274 }
2275 mpts->mpts_flags &= ~MPTSF_TFO_REQD;
2276 so = mpts->mpts_socket;
2277 tp = intotcpcb(sotoinpcb(so));
2278 tp->t_mpflags &= ~TMPF_TFO_REQUEST;
2279 error = tcp_output(sototcpcb(so));
2280
2281 soclearfastopen(mp_so);
2282
2283 return error;
2284 }