]> git.saurik.com Git - apple/xnu.git/blob - bsd/netinet/in_pcblist.c
09cc79674f3e563365027934f9dd8b55f35b7207
[apple/xnu.git] / bsd / netinet / in_pcblist.c
1 /*
2 * Copyright (c) 2010-2013 Apple Inc. All rights reserved.
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5 *
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
14 *
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
25 *
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28 /*
29 * Copyright (c) 1982, 1986, 1990, 1993
30 * The Regents of the University of California. All rights reserved.
31 *
32 * Redistribution and use in source and binary forms, with or without
33 * modification, are permitted provided that the following conditions
34 * are met:
35 * 1. Redistributions of source code must retain the above copyright
36 * notice, this list of conditions and the following disclaimer.
37 * 2. Redistributions in binary form must reproduce the above copyright
38 * notice, this list of conditions and the following disclaimer in the
39 * documentation and/or other materials provided with the distribution.
40 * 3. All advertising materials mentioning features or use of this software
41 * must display the following acknowledgement:
42 * This product includes software developed by the University of
43 * California, Berkeley and its contributors.
44 * 4. Neither the name of the University nor the names of its contributors
45 * may be used to endorse or promote products derived from this software
46 * without specific prior written permission.
47 *
48 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
49 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
50 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
51 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
52 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
53 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
54 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
55 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
56 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
57 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
58 * SUCH DAMAGE.
59 */
60
61 #include <sys/types.h>
62 #include <sys/malloc.h>
63 #include <sys/socket.h>
64 #include <sys/socketvar.h>
65 #include <sys/protosw.h>
66 #include <sys/domain.h>
67 #include <sys/kernel.h>
68 #include <sys/sysctl.h>
69 #include <sys/dtrace.h>
70 #include <sys/kauth.h>
71
72 #include <net/route.h>
73 #include <net/if_var.h>
74
75 #include <netinet/in.h>
76 #include <netinet/in_pcb.h>
77 #include <netinet/in_var.h>
78 #include <netinet/ip_var.h>
79
80 #include <netinet/udp.h>
81 #include <netinet/udp_var.h>
82
83 #include <netinet/tcp.h>
84 #include <netinet/tcp_fsm.h>
85 #include <netinet/tcp_seq.h>
86 #include <netinet/tcp_timer.h>
87 #include <netinet/tcp_var.h>
88 #include <netinet6/in6_var.h>
89
/*
 * ROUNDUP64(x): x passed through P2ROUNDUP with sizeof (u_int64_t) as the
 * boundary (presumably rounding up to the next 8-byte multiple).
 */
#if !defined(ROUNDUP64)
#define	ROUNDUP64(x) P2ROUNDUP((x), sizeof (u_int64_t))
#endif

/*
 * ADVANCE64(p, n): pointer p moved forward by ROUNDUP64(n) bytes.
 */
#if !defined(ADVANCE64)
#define	ADVANCE64(p, n) (void*)((char *)(p) + ROUNDUP64(n))
#endif

/*
 * Converters that fill the "_n" export records from kernel structures.
 * tcpcb_to_xtcpcb_n is declared static here although its definition
 * below is spelled __private_extern__.
 */
static void sotoxsocket_n(struct socket *so, struct xsocket_n *xso);
static void sbtoxsockbuf_n(struct sockbuf *sb, struct xsockbuf_n *xsb);
static void sbtoxsockstat_n(struct socket *so, struct xsockstat_n *xst);
static void inpcb_to_xinpcb_n(struct inpcb *inp, struct xinpcb_n *xinp);
static void tcpcb_to_xtcpcb_n(struct tcpcb *tp, struct xtcpcb_n *xt);
103
104 static void
105 sotoxsocket_n(struct socket *so, struct xsocket_n *xso)
106 {
107 xso->xso_len = sizeof (struct xsocket_n);
108 xso->xso_kind = XSO_SOCKET;
109
110 if (so != NULL) {
111 xso->xso_so = (u_int64_t)(uintptr_t)so;
112 xso->so_type = so->so_type;
113 xso->so_options = so->so_options;
114 xso->so_linger = so->so_linger;
115 xso->so_state = so->so_state;
116 xso->so_pcb = (u_int64_t)(uintptr_t)so->so_pcb;
117 if (so->so_proto) {
118 xso->xso_protocol = SOCK_PROTO(so);
119 xso->xso_family = SOCK_DOM(so);
120 } else {
121 xso->xso_protocol = xso->xso_family = 0;
122 }
123 xso->so_qlen = so->so_qlen;
124 xso->so_incqlen = so->so_incqlen;
125 xso->so_qlimit = so->so_qlimit;
126 xso->so_timeo = so->so_timeo;
127 xso->so_error = so->so_error;
128 xso->so_pgid = so->so_pgid;
129 xso->so_oobmark = so->so_oobmark;
130 xso->so_uid = kauth_cred_getuid(so->so_cred);
131 }
132 }
133
134 static void
135 sbtoxsockbuf_n(struct sockbuf *sb, struct xsockbuf_n *xsb)
136 {
137 xsb->xsb_len = sizeof (struct xsockbuf_n);
138 xsb->xsb_kind = (sb->sb_flags & SB_RECV) ? XSO_RCVBUF : XSO_SNDBUF;
139
140 if (sb != NULL) {
141 xsb->sb_cc = sb->sb_cc;
142 xsb->sb_hiwat = sb->sb_hiwat;
143 xsb->sb_mbcnt = sb->sb_mbcnt;
144 xsb->sb_mbmax = sb->sb_mbmax;
145 xsb->sb_lowat = sb->sb_lowat;
146 xsb->sb_flags = sb->sb_flags;
147 xsb->sb_timeo = (short)(sb->sb_timeo.tv_sec * hz) +
148 sb->sb_timeo.tv_usec / tick;
149 if (xsb->sb_timeo == 0 && sb->sb_timeo.tv_usec != 0)
150 xsb->sb_timeo = 1;
151 }
152 }
153
154 static void
155 sbtoxsockstat_n(struct socket *so, struct xsockstat_n *xst)
156 {
157 int i;
158
159 xst->xst_len = sizeof (struct xsockstat_n);
160 xst->xst_kind = XSO_STATS;
161
162 for (i = 0; i < SO_TC_STATS_MAX; i++) {
163 xst->xst_tc_stats[i].rxpackets = so->so_tc_stats[i].rxpackets;
164 xst->xst_tc_stats[i].rxbytes = so->so_tc_stats[i].rxbytes;
165 xst->xst_tc_stats[i].txpackets = so->so_tc_stats[i].txpackets;
166 xst->xst_tc_stats[i].txbytes = so->so_tc_stats[i].txbytes;
167 }
168 }
169
170 static void
171 inpcb_to_xinpcb_n(struct inpcb *inp, struct xinpcb_n *xinp)
172 {
173 xinp->xi_len = sizeof (struct xinpcb_n);
174 xinp->xi_kind = XSO_INPCB;
175 xinp->xi_inpp = (u_int64_t)(uintptr_t)inp;
176 xinp->inp_fport = inp->inp_fport;
177 xinp->inp_lport = inp->inp_lport;
178 xinp->inp_ppcb = (u_int64_t)(uintptr_t)inp->inp_ppcb;
179 xinp->inp_gencnt = inp->inp_gencnt;
180 xinp->inp_flags = inp->inp_flags;
181 xinp->inp_flow = inp->inp_flow;
182 xinp->inp_vflag = inp->inp_vflag;
183 xinp->inp_ip_ttl = inp->inp_ip_ttl;
184 xinp->inp_ip_p = inp->inp_ip_p;
185 xinp->inp_dependfaddr.inp6_foreign = inp->inp_dependfaddr.inp6_foreign;
186 xinp->inp_dependladdr.inp6_local = inp->inp_dependladdr.inp6_local;
187 xinp->inp_depend4.inp4_ip_tos = inp->inp_depend4.inp4_ip_tos;
188 xinp->inp_depend6.inp6_hlim = 0;
189 xinp->inp_depend6.inp6_cksum = inp->inp_depend6.inp6_cksum;
190 xinp->inp_depend6.inp6_ifindex = 0;
191 xinp->inp_depend6.inp6_hops = inp->inp_depend6.inp6_hops;
192 xinp->inp_flowhash = inp->inp_flowhash;
193 }
194
195 __private_extern__ void
196 tcpcb_to_xtcpcb_n(struct tcpcb *tp, struct xtcpcb_n *xt)
197 {
198 int i;
199
200 xt->xt_len = sizeof (struct xtcpcb_n);
201 xt->xt_kind = XSO_TCPCB;
202
203 xt->t_segq = (u_int32_t)(uintptr_t)tp->t_segq.lh_first;
204 xt->t_dupacks = tp->t_dupacks;
205 for (i = 0; i < TCPT_NTIMERS_EXT; i++)
206 xt->t_timer[i] = tp->t_timer[i];
207 xt->t_state = tp->t_state;
208 xt->t_flags = tp->t_flags;
209 xt->t_force = tp->t_force;
210 xt->snd_una = tp->snd_una;
211 xt->snd_max = tp->snd_max;
212 xt->snd_nxt = tp->snd_nxt;
213 xt->snd_up = tp->snd_up;
214 xt->snd_wl1 = tp->snd_wl1;
215 xt->snd_wl2 = tp->snd_wl2;
216 xt->iss = tp->iss;
217 xt->irs = tp->irs;
218 xt->rcv_nxt = tp->rcv_nxt;
219 xt->rcv_adv = tp->rcv_adv;
220 xt->rcv_wnd = tp->rcv_wnd;
221 xt->rcv_up = tp->rcv_up;
222 xt->snd_wnd = tp->snd_wnd;
223 xt->snd_cwnd = tp->snd_cwnd;
224 xt->snd_ssthresh = tp->snd_ssthresh;
225 xt->t_maxopd = tp->t_maxopd;
226 xt->t_rcvtime = tp->t_rcvtime;
227 xt->t_starttime = tp->t_starttime;
228 xt->t_rtttime = tp->t_rtttime;
229 xt->t_rtseq = tp->t_rtseq;
230 xt->t_rxtcur = tp->t_rxtcur;
231 xt->t_maxseg = tp->t_maxseg;
232 xt->t_srtt = tp->t_srtt;
233 xt->t_rttvar = tp->t_rttvar;
234 xt->t_rxtshift = tp->t_rxtshift;
235 xt->t_rttmin = tp->t_rttmin;
236 xt->t_rttupdated = tp->t_rttupdated;
237 xt->max_sndwnd = tp->max_sndwnd;
238 xt->t_softerror = tp->t_softerror;
239 xt->t_oobflags = tp->t_oobflags;
240 xt->t_iobc = tp->t_iobc;
241 xt->snd_scale = tp->snd_scale;
242 xt->rcv_scale = tp->rcv_scale;
243 xt->request_r_scale = tp->request_r_scale;
244 xt->requested_s_scale = tp->requested_s_scale;
245 xt->ts_recent = tp->ts_recent;
246 xt->ts_recent_age = tp->ts_recent_age;
247 xt->last_ack_sent = tp->last_ack_sent;
248 xt->cc_send = tp->cc_send;
249 xt->cc_recv = tp->cc_recv;
250 xt->snd_recover = tp->snd_recover;
251 xt->snd_cwnd_prev = tp->snd_cwnd_prev;
252 xt->snd_ssthresh_prev = tp->snd_ssthresh_prev;
253 }
254
255 __private_extern__ int
256 get_pcblist_n(short proto, struct sysctl_req *req, struct inpcbinfo *pcbinfo)
257 {
258 int error = 0;
259 int i, n;
260 struct inpcb *inp, **inp_list = NULL;
261 inp_gen_t gencnt;
262 struct xinpgen xig;
263 void *buf = NULL;
264 size_t item_size = ROUNDUP64(sizeof (struct xinpcb_n)) +
265 ROUNDUP64(sizeof (struct xsocket_n)) +
266 2 * ROUNDUP64(sizeof (struct xsockbuf_n)) +
267 ROUNDUP64(sizeof (struct xsockstat_n));
268
269 if (proto == IPPROTO_TCP)
270 item_size += ROUNDUP64(sizeof (struct xtcpcb_n));
271
272 /*
273 * The process of preparing the PCB list is too time-consuming and
274 * resource-intensive to repeat twice on every request.
275 */
276 lck_rw_lock_exclusive(pcbinfo->ipi_lock);
277 if (req->oldptr == USER_ADDR_NULL) {
278 n = pcbinfo->ipi_count;
279 req->oldidx = 2 * (sizeof (xig)) + (n + n/8) * item_size;
280 goto done;
281 }
282
283 if (req->newptr != USER_ADDR_NULL) {
284 error = EPERM;
285 goto done;
286 }
287
288 /*
289 * OK, now we're committed to doing something.
290 */
291 gencnt = pcbinfo->ipi_gencnt;
292 n = pcbinfo->ipi_count;
293
294 bzero(&xig, sizeof (xig));
295 xig.xig_len = sizeof (xig);
296 xig.xig_count = n;
297 xig.xig_gen = gencnt;
298 xig.xig_sogen = so_gencnt;
299 error = SYSCTL_OUT(req, &xig, sizeof (xig));
300 if (error) {
301 goto done;
302 }
303 /*
304 * We are done if there is no pcb
305 */
306 if (n == 0) {
307 goto done;
308 }
309
310 buf = _MALLOC(item_size, M_TEMP, M_WAITOK);
311 if (buf == NULL) {
312 error = ENOMEM;
313 goto done;
314 }
315
316 inp_list = _MALLOC(n * sizeof (*inp_list), M_TEMP, M_WAITOK);
317 if (inp_list == NULL) {
318 error = ENOMEM;
319 goto done;
320 }
321
322 for (inp = pcbinfo->ipi_listhead->lh_first, i = 0; inp && i < n;
323 inp = inp->inp_list.le_next) {
324 if (inp->inp_gencnt <= gencnt &&
325 inp->inp_state != INPCB_STATE_DEAD)
326 inp_list[i++] = inp;
327 }
328 n = i;
329
330 error = 0;
331 for (i = 0; i < n; i++) {
332 inp = inp_list[i];
333 if (inp->inp_gencnt <= gencnt &&
334 inp->inp_state != INPCB_STATE_DEAD) {
335 struct xinpcb_n *xi = (struct xinpcb_n *)buf;
336 struct xsocket_n *xso = (struct xsocket_n *)
337 ADVANCE64(xi, sizeof (*xi));
338 struct xsockbuf_n *xsbrcv = (struct xsockbuf_n *)
339 ADVANCE64(xso, sizeof (*xso));
340 struct xsockbuf_n *xsbsnd = (struct xsockbuf_n *)
341 ADVANCE64(xsbrcv, sizeof (*xsbrcv));
342 struct xsockstat_n *xsostats = (struct xsockstat_n *)
343 ADVANCE64(xsbsnd, sizeof (*xsbsnd));
344
345 bzero(buf, item_size);
346
347 inpcb_to_xinpcb_n(inp, xi);
348 sotoxsocket_n(inp->inp_socket, xso);
349 sbtoxsockbuf_n(inp->inp_socket ?
350 &inp->inp_socket->so_rcv : NULL, xsbrcv);
351 sbtoxsockbuf_n(inp->inp_socket ?
352 &inp->inp_socket->so_snd : NULL, xsbsnd);
353 sbtoxsockstat_n(inp->inp_socket, xsostats);
354 if (proto == IPPROTO_TCP) {
355 struct xtcpcb_n *xt = (struct xtcpcb_n *)
356 ADVANCE64(xsostats, sizeof (*xsostats));
357
358 /*
359 * inp->inp_ppcb, can only be NULL on
360 * an initialization race window.
361 * No need to lock.
362 */
363 if (inp->inp_ppcb == NULL)
364 continue;
365
366 tcpcb_to_xtcpcb_n((struct tcpcb *)
367 inp->inp_ppcb, xt);
368 }
369 error = SYSCTL_OUT(req, buf, item_size);
370 }
371 }
372 if (!error) {
373 /*
374 * Give the user an updated idea of our state.
375 * If the generation differs from what we told
376 * her before, she knows that something happened
377 * while we were processing this request, and it
378 * might be necessary to retry.
379 */
380 bzero(&xig, sizeof (xig));
381 xig.xig_len = sizeof (xig);
382 xig.xig_gen = pcbinfo->ipi_gencnt;
383 xig.xig_sogen = so_gencnt;
384 xig.xig_count = pcbinfo->ipi_count;
385 error = SYSCTL_OUT(req, &xig, sizeof (xig));
386 }
387 done:
388 lck_rw_done(pcbinfo->ipi_lock);
389 if (inp_list != NULL)
390 FREE(inp_list, M_TEMP);
391 if (buf != NULL)
392 FREE(buf, M_TEMP);
393 return (error);
394 }
395
396 __private_extern__ void
397 inpcb_get_ports_used(uint32_t ifindex, int protocol, uint32_t wildcardok,
398 bitstr_t *bitfield, struct inpcbinfo *pcbinfo)
399 {
400 struct inpcb *inp;
401 struct socket *so;
402 inp_gen_t gencnt;
403 uint32_t iswildcard;
404
405 lck_rw_lock_shared(pcbinfo->ipi_lock);
406 gencnt = pcbinfo->ipi_gencnt;
407 for (inp = LIST_FIRST(pcbinfo->ipi_listhead); inp;
408 inp = LIST_NEXT(inp, inp_list)) {
409 uint16_t port;
410
411 if (inp->inp_gencnt > gencnt ||
412 inp->inp_state == INPCB_STATE_DEAD)
413 continue;
414
415 if ((so = inp->inp_socket) == NULL ||
416 (so->so_state & SS_DEFUNCT))
417 continue;
418
419 if (!(protocol == PF_UNSPEC ||
420 (protocol == PF_INET && (inp->inp_vflag & INP_IPV4)) ||
421 (protocol == PF_INET6 && (inp->inp_vflag & INP_IPV6))))
422 continue;
423
424 iswildcard = (((inp->inp_vflag & INP_IPV4) &&
425 inp->inp_laddr.s_addr == INADDR_ANY) ||
426 ((inp->inp_vflag & INP_IPV6) &&
427 IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)));
428
429 if (!wildcardok && iswildcard)
430 continue;
431
432 if (!iswildcard &&
433 !(ifindex == 0 || inp->inp_last_outifp == NULL ||
434 ifindex == inp->inp_last_outifp->if_index))
435 continue;
436
437 port = ntohs(inp->inp_lport);
438 bit_set(bitfield, port);
439 }
440 lck_rw_done(pcbinfo->ipi_lock);
441 }
442
443 __private_extern__ uint32_t
444 inpcb_count_opportunistic(unsigned int ifindex, struct inpcbinfo *pcbinfo,
445 u_int32_t flags)
446 {
447 uint32_t opportunistic = 0;
448 struct inpcb *inp;
449 inp_gen_t gencnt;
450
451 lck_rw_lock_shared(pcbinfo->ipi_lock);
452 gencnt = pcbinfo->ipi_gencnt;
453 for (inp = LIST_FIRST(pcbinfo->ipi_listhead);
454 inp != NULL; inp = LIST_NEXT(inp, inp_list)) {
455 if (inp->inp_gencnt <= gencnt &&
456 inp->inp_state != INPCB_STATE_DEAD &&
457 inp->inp_socket != NULL &&
458 so_get_opportunistic(inp->inp_socket) &&
459 inp->inp_last_outifp != NULL &&
460 ifindex == inp->inp_last_outifp->if_index) {
461 opportunistic++;
462 struct socket *so = inp->inp_socket;
463 if ((flags & INPCB_OPPORTUNISTIC_SETCMD) &&
464 (so->so_state & SS_ISCONNECTED)) {
465 socket_lock(so, 1);
466 if (flags & INPCB_OPPORTUNISTIC_THROTTLEON) {
467 so->so_flags |= SOF_SUSPENDED;
468 soevent(so,
469 (SO_FILT_HINT_LOCKED |
470 SO_FILT_HINT_SUSPEND));
471 } else {
472 so->so_flags &= ~(SOF_SUSPENDED);
473 soevent(so,
474 (SO_FILT_HINT_LOCKED |
475 SO_FILT_HINT_RESUME));
476 }
477 SOTHROTTLELOG(("throttle[%d]: so 0x%llx "
478 "[%d,%d] %s\n", so->last_pid,
479 (uint64_t)VM_KERNEL_ADDRPERM(so),
480 SOCK_DOM(so), SOCK_TYPE(so),
481 (so->so_flags & SOF_SUSPENDED) ?
482 "SUSPENDED" : "RESUMED"));
483 socket_unlock(so, 1);
484 }
485 }
486 }
487
488 lck_rw_done(pcbinfo->ipi_lock);
489
490 return (opportunistic);
491 }
492
493 __private_extern__ uint32_t
494 inpcb_find_anypcb_byaddr(struct ifaddr *ifa, struct inpcbinfo *pcbinfo)
495 {
496 struct inpcb *inp;
497 inp_gen_t gencnt = pcbinfo->ipi_gencnt;
498 struct socket *so = NULL;
499 int af;
500
501 if ((ifa->ifa_addr->sa_family != AF_INET) &&
502 (ifa->ifa_addr->sa_family != AF_INET6)) {
503 return (0);
504 }
505
506 lck_rw_lock_shared(pcbinfo->ipi_lock);
507 for (inp = LIST_FIRST(pcbinfo->ipi_listhead);
508 inp != NULL; inp = LIST_NEXT(inp, inp_list)) {
509
510 if (inp->inp_gencnt <= gencnt &&
511 inp->inp_state != INPCB_STATE_DEAD &&
512 inp->inp_socket != NULL) {
513 so = inp->inp_socket;
514 af = SOCK_DOM(so);
515 if (af != ifa->ifa_addr->sa_family)
516 continue;
517 if (inp->inp_last_outifp != ifa->ifa_ifp)
518 continue;
519
520 if (af == AF_INET) {
521 if (inp->inp_laddr.s_addr ==
522 (satosin(ifa->ifa_addr))->sin_addr.s_addr) {
523 lck_rw_done(pcbinfo->ipi_lock);
524 return (1);
525 }
526 }
527 if (af == AF_INET6) {
528 if (IN6_ARE_ADDR_EQUAL(IFA_IN6(ifa),
529 &inp->in6p_laddr)) {
530 lck_rw_done(pcbinfo->ipi_lock);
531 return (1);
532 }
533 }
534 }
535 }
536 lck_rw_done(pcbinfo->ipi_lock);
537 return (0);
538 }