]>
Commit | Line | Data |
---|---|---|
1c79356b | 1 | /* |
8a3053a0 | 2 | * Copyright (c) 2000-2014 Apple Computer, Inc. All rights reserved. |
5d5c5d0d | 3 | * |
2d21ac55 | 4 | * @APPLE_OSREFERENCE_LICENSE_HEADER_START@ |
1c79356b | 5 | * |
2d21ac55 A |
6 | * This file contains Original Code and/or Modifications of Original Code |
7 | * as defined in and that are subject to the Apple Public Source License | |
8 | * Version 2.0 (the 'License'). You may not use this file except in | |
9 | * compliance with the License. The rights granted to you under the License | |
10 | * may not be used to create, or enable the creation or redistribution of, | |
11 | * unlawful or unlicensed copies of an Apple operating system, or to | |
12 | * circumvent, violate, or enable the circumvention or violation of, any | |
13 | * terms of an Apple operating system software license agreement. | |
8f6c56a5 | 14 | * |
2d21ac55 A |
15 | * Please obtain a copy of the License at |
16 | * http://www.opensource.apple.com/apsl/ and read it before using this file. | |
17 | * | |
18 | * The Original Code and all software distributed under the License are | |
19 | * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER | |
8f6c56a5 A |
20 | * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES, |
21 | * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY, | |
2d21ac55 A |
22 | * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT. |
23 | * Please see the License for the specific language governing rights and | |
24 | * limitations under the License. | |
8f6c56a5 | 25 | * |
2d21ac55 | 26 | * @APPLE_OSREFERENCE_LICENSE_HEADER_END@ |
1c79356b A |
27 | */ |
28 | /* | |
29 | * Copyright (c) 1982, 1986, 1993 | |
30 | * The Regents of the University of California. All rights reserved. | |
31 | * | |
32 | * Redistribution and use in source and binary forms, with or without | |
33 | * modification, are permitted provided that the following conditions | |
34 | * are met: | |
35 | * 1. Redistributions of source code must retain the above copyright | |
36 | * notice, this list of conditions and the following disclaimer. | |
37 | * 2. Redistributions in binary form must reproduce the above copyright | |
38 | * notice, this list of conditions and the following disclaimer in the | |
39 | * documentation and/or other materials provided with the distribution. | |
40 | * 3. All advertising materials mentioning features or use of this software | |
41 | * must display the following acknowledgement: | |
42 | * This product includes software developed by the University of | |
43 | * California, Berkeley and its contributors. | |
44 | * 4. Neither the name of the University nor the names of its contributors | |
45 | * may be used to endorse or promote products derived from this software | |
46 | * without specific prior written permission. | |
47 | * | |
48 | * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND | |
49 | * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | |
50 | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | |
51 | * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE | |
52 | * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL | |
53 | * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS | |
54 | * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) | |
55 | * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT | |
56 | * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY | |
57 | * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF | |
58 | * SUCH DAMAGE. | |
59 | * | |
60 | * @(#)tcp_timer.h 8.1 (Berkeley) 6/10/93 | |
9bccf70c | 61 | * $FreeBSD: src/sys/netinet/tcp_timer.h,v 1.18 1999/12/29 04:41:03 peter Exp $ |
1c79356b A |
62 | */ |
63 | ||
64 | #ifndef _NETINET_TCP_TIMER_H_ | |
65 | #define _NETINET_TCP_TIMER_H_ | |
9bccf70c | 66 | #include <sys/appleapiopts.h> |
1c79356b | 67 | |
6d2010ae A |
68 | #ifdef KERNEL |
69 | #include <kern/thread_call.h> | |
70 | #endif /* KERNEL */ | |
71 | ||
1c79356b | 72 | /* |
6d2010ae | 73 | * Definitions of the TCP timers. |
1c79356b | 74 | */ |
39236c6e | 75 | #define TCPT_NTIMERS (TCPT_MAX + 1) |
6d2010ae A |
76 | |
77 | /* Keep the external definition the same for binary compatibility */ | |
78 | #define TCPT_NTIMERS_EXT 4 | |
1c79356b A |
79 | |
80 | #define TCPT_REXMT 0 /* retransmit */ | |
81 | #define TCPT_PERSIST 1 /* retransmit persistence */ | |
82 | #define TCPT_KEEP 2 /* keep alive */ | |
83 | #define TCPT_2MSL 3 /* 2*msl quiet time timer */ | |
6d2010ae | 84 | #define TCPT_DELACK 4 /* delayed ack timer */ |
39236c6e A |
85 | #if MPTCP |
86 | #define TCPT_JACK_RXMT 5 /* retransmit timer for join ack */ | |
87 | #define TCPT_MAX 5 | |
88 | #else /* MPTCP */ | |
6d2010ae | 89 | #define TCPT_MAX 4 |
39236c6e | 90 | #endif /* !MPTCP */ |
6d2010ae | 91 | #define TCPT_NONE (TCPT_MAX + 1) |
1c79356b A |
92 | |
93 | /* | |
94 | * The TCPT_REXMT timer is used to force retransmissions. | |
95 | * The TCP has the TCPT_REXMT timer set whenever segments | |
96 | * have been sent for which ACKs are expected but not yet | |
97 | * received. If an ACK is received which advances tp->snd_una, | |
98 | * then the retransmit timer is cleared (if there are no more | |
99 | * outstanding segments) or reset to the base value (if there | |
100 | * are more ACKs expected). Whenever the retransmit timer goes off, | |
101 | * we retransmit one unacknowledged segment, and do a backoff | |
102 | * on the retransmit timer. | |
103 | * | |
104 | * The TCPT_PERSIST timer is used to keep window size information | |
105 | * flowing even if the window goes shut. If all previous transmissions | |
106 | * have been acknowledged (so that there are no retransmissions in progress), | |
107 | * and the window is too small to bother sending anything, then we start | |
108 | * the TCPT_PERSIST timer. When it expires, if the window is nonzero, | |
109 | * we go to transmit state. Otherwise, at intervals send a single byte | |
110 | * into the peer's window to force him to update our window information. | |
111 | * We do this at most as often as TCPTV_PERSMIN time intervals, | |
112 | * but no more frequently than the current estimate of round-trip | |
113 | * packet time. The TCPT_PERSIST timer is cleared whenever we receive | |
114 | * a window update from the peer. | |
115 | * | |
116 | * The TCPT_KEEP timer is used to keep connections alive. If a | |
117 | * connection is idle (no segments received) for TCPTV_KEEP_INIT amount of time, | |
118 | * but not yet established, then we drop the connection. Once the connection | |
119 | * is established, if the connection is idle for TCPTV_KEEP_IDLE time | |
120 | * (and keepalives have been enabled on the socket), we begin to probe | |
121 | * the connection. We force the peer to send us a segment by sending: | |
122 | * <SEQ=SND.UNA-1><ACK=RCV.NXT><CTL=ACK> | |
123 | * This segment is (deliberately) outside the window, and should elicit | |
124 | * an ack segment in response from the peer. If, despite the TCPT_KEEP | |
125 | * initiated segments we cannot elicit a response from a peer in TCP_CONN_MAXIDLE(tp) | |
126 | * amount of time probing, then we drop the connection. | |
127 | */ | |
128 | ||
91447636 A |
129 | #ifdef PRIVATE |
130 | ||
1c79356b A |
131 | /* |
132 | * Time constants. | |
133 | */ | |
2d21ac55 | 134 | #define TCPTV_MSL ( 15*TCP_RETRANSHZ) /* max seg lifetime (hah!) */ |
1c79356b | 135 | #define TCPTV_SRTTBASE 0 /* base roundtrip time; |
6d2010ae | 136 | if 0, no idea yet */ |
2d21ac55 A |
137 | #define TCPTV_RTOBASE ( 1*TCP_RETRANSHZ) /* assumed RTO if no info */ |
138 | #define TCPTV_SRTTDFLT ( 1*TCP_RETRANSHZ) /* assumed RTT if no info */ | |
1c79356b | 139 | |
2d21ac55 A |
140 | #define TCPTV_PERSMIN ( 5*TCP_RETRANSHZ) /* retransmit persistence */ |
141 | #define TCPTV_PERSMAX ( 60*TCP_RETRANSHZ) /* maximum persist interval */ | |
1c79356b | 142 | |
2d21ac55 A |
143 | #define TCPTV_KEEP_INIT ( 75*TCP_RETRANSHZ) /* initial connect keep alive */ |
144 | #define TCPTV_KEEP_IDLE (120*60*TCP_RETRANSHZ) /* dflt time before probing */ | |
145 | #define TCPTV_KEEPINTVL ( 75*TCP_RETRANSHZ) /* default probe interval */ | |
1c79356b A |
146 | #define TCPTV_KEEPCNT 8 /* max probes before drop */ |
147 | ||
6d2010ae A |
148 | #define TCPTV_REXMTMAX ( 64*TCP_RETRANSHZ ) /* max allowable REXMT value */ |
149 | #define TCPTV_REXMTMIN ( TCP_RETRANSHZ/33 ) /* min REXMT for non-local connections */ | |
150 | #define TCPTV_UNACKWIN ( TCP_RETRANSHZ/10 ) /* Window for counting rcv bytes to see if | |
151 | ack-stretching can start (default 100 ms) */ | |
152 | #define TCPTV_MAXRCVIDLE (TCP_RETRANSHZ/5 ) /* Receiver idle time, avoid ack-stretching after that*/ | |
316670eb | 153 | #define TCPTV_RCVBUFIDLE (TCP_RETRANSHZ/2) /* Receiver idle time, for rcv socket buffer resizing */ |
6d2010ae A |
154 | |
155 | /* No ack stretching during slow-start, until we see some packets. | |
156 | * By the time the receiver gets 512 packets, the sender's cwnd | |
316670eb A |
157 | * should open by a few hundred packets considering the |
158 | * slow-start progression. | |
6d2010ae A |
159 | */ |
160 | #define TCP_RCV_SS_PKTCOUNT 512 | |
1c79356b A |
161 | |
162 | #define TCPTV_TWTRUNC 8 /* RTO factor to truncate TW */ | |
163 | ||
164 | #define TCP_LINGERTIME 120 /* linger at most 2 minutes */ | |
165 | ||
166 | #define TCP_MAXRXTSHIFT 12 /* maximum retransmits */ | |
167 | ||
168 | #ifdef TCPTIMERS | |
/*
 * Printable timer names, listed in the same order as the TCPT_* timer
 * numbers (TCPT_REXMT = 0 ... TCPT_DELACK = 4).  When MPTCP is enabled
 * TCPT_JACK_RXMT (5) is a valid timer number as well, so it gets a name
 * too; otherwise indexing this table with it would read past the end.
 */
static char *tcptimers[] = {
	"REXMT", "PERSIST", "KEEP", "2MSL", "DELACK",
#if MPTCP
	"JACK_RXMT",
#endif /* MPTCP */
};
1c79356b A |
171 | #endif |
172 | ||
91447636 | 173 | #ifdef KERNEL |
6d2010ae A |
174 | |
/*
 * Persist, keep and 2MSL are treated as slow timers which can be coalesced
 * at a coarser granularity (500 ms).  Rexmt and delayed ack are treated as
 * fast timers which fire on the order of 100 ms.
 *
 * The check relies on the timer numbering: TCPT_PERSIST (1), TCPT_KEEP (2)
 * and TCPT_2MSL (3) have non-zero low two bits, while TCPT_REXMT (0) and
 * TCPT_DELACK (4) do not.  It is cheap and works for the current timers;
 * adding another slow timer may require changing it.
 *
 * NOTE(review): with MPTCP enabled TCPT_JACK_RXMT is 5, which this check
 * also reports as slow -- confirm that this is intended.
 *
 * The argument is parenthesized so that an expression argument is masked
 * as a whole rather than being split by operator precedence.
 */
#define IS_TIMER_SLOW(ind)	(((ind) & 0x3) != 0)
184 | ||
185 | struct tcptimerlist; | |
186 | ||
187 | struct tcptimerentry { | |
188 | LIST_ENTRY(tcptimerentry) le; /* links for timer list */ | |
189 | uint32_t timer_start; /* tcp clock when the timer was started */ | |
190 | uint16_t index; /* index of lowest timer that needs to run first */ | |
191 | uint32_t runtime; /* deadline at which the first timer has to fire */ | |
192 | }; | |
193 | ||
194 | LIST_HEAD(timerlisthead, tcptimerentry); | |
195 | ||
196 | struct tcptimerlist { | |
197 | struct timerlisthead lhead; /* head of the list of timer entries */ | |
198 | lck_mtx_t *mtx; /* lock to protect the list */ | |
199 | lck_attr_t *mtx_attr; /* mutex attributes */ | |
200 | lck_grp_t *mtx_grp; /* mutex group definition */ | |
201 | lck_grp_attr_t *mtx_grp_attr; /* mutex group attributes */ | |
202 | uint32_t fast_quantum; /* minimum time quantum to coalesce fast timers */ | |
203 | uint32_t slow_quantum; /* minimum time quantum to coalesce slow timers */ | |
204 | thread_call_t call; /* call entry */ | |
205 | uint32_t runtime; /* time at which this list is going to run */ | |
206 | uint32_t entries; /* Number of entries on the list */ | |
207 | uint32_t maxentries; /* Max number of entries at any time */ | |
208 | ||
209 | /* Set desired mode when timer list running */ | |
210 | boolean_t running; /* Set when timer list is being processed */ | |
8a3053a0 | 211 | boolean_t scheduled; /* Set when timer is scheduled */ |
6d2010ae A |
212 | #define TCP_TIMERLIST_FASTMODE 0x1 |
213 | #define TCP_TIMERLIST_SLOWMODE 0x2 | |
214 | uint32_t mode; /* Current mode, fast or slow */ | |
215 | uint32_t pref_mode; /* Preferred mode set by a connection, fast or slow */ | |
216 | uint32_t pref_offset; /* Preferred offset set by a connection */ | |
217 | uint32_t idlegen; /* Number of times the list has been idle in fast mode */ | |
218 | struct tcptimerentry *next_te; /* Store the next timer entry pointer to process */ | |
219 | ||
220 | }; | |
221 | ||
222 | #define TCP_FASTMODE_IDLEGEN_MAX 20 /* Approximately 2 seconds */ | |
223 | ||
1c79356b | 224 | /* |
6d2010ae A |
225 | * Minimum retransmit timeout is set to 30ms. We add a slop of |
226 | * 200 ms to the retransmit value to account for processing | |
227 | * variance and delayed ack. This extra 200ms will help to avoid | |
228 | * spurious retransmits by taking into consideration the receivers | |
229 | * that wait for delayed ack timer instead of generating an ack | |
230 | * for every two packets. | |
231 | * | |
232 | * On a local link, the minimum retransmit timeout is 100ms and | |
233 | * variance is set to 0. This will make the sender a little bit more | |
234 | * aggressive on local link. When the connection is not established yet, | |
235 | * there is no need to add an extra 200ms to retransmit timeout because | |
236 | * the initial value is high (1s) and delayed ack is not a problem in | |
237 | * that case. | |
1c79356b | 238 | */ |
6d2010ae A |
239 | #define TCPTV_REXMTSLOP ( TCP_RETRANSHZ/5 ) /* rexmt slop allowed (200 ms) */ |
240 | ||
/*
 * Decides when the retransmit slop should be added: evaluates to true
 * when the connection's t_state compares greater than or equal to
 * TCPS_ESTABLISHED.  The argument is parenthesized so that any pointer
 * expression (e.g. "p + 1" or "&conn") can be passed safely.
 */
#define TCP_ADD_REXMTSLOP(tp)	((tp)->t_state >= TCPS_ESTABLISHED)
6d2010ae A |
243 | |
244 | #define TCPT_RANGESET(tv, value, tvmin, tvmax, addslop) do { \ | |
245 | (tv) = ((addslop) ? tcp_rexmt_slop : 0) + (value); \ | |
b0d623f7 | 246 | if ((uint32_t)(tv) < (uint32_t)(tvmin)) \ |
1c79356b | 247 | (tv) = (tvmin); \ |
b0d623f7 | 248 | else if ((uint32_t)(tv) > (uint32_t)(tvmax)) \ |
1c79356b | 249 | (tv) = (tvmax); \ |
9bccf70c | 250 | } while(0) |
1c79356b | 251 | |
39236c6e A |
252 | #define TCP_CONN_KEEPIDLE(tp) \ |
253 | ((tp)->t_keepidle && \ | |
254 | ((tp)->t_inpcb->inp_socket->so_options & SO_KEEPALIVE) ? \ | |
255 | (tp)->t_keepidle : tcp_keepidle) | |
256 | #define TCP_CONN_KEEPINIT(tp) \ | |
257 | (((tp)->t_keepinit > 0) ? (tp)->t_keepinit : tcp_keepinit) | |
258 | #define TCP_CONN_KEEPCNT(tp) \ | |
259 | (((tp)->t_keepcnt > 0) ? (tp)->t_keepcnt : tcp_keepcnt) | |
260 | #define TCP_CONN_KEEPINTVL(tp) \ | |
261 | (((tp)->t_keepintvl > 0) ? (tp)->t_keepintvl : tcp_keepintvl) | |
262 | #define TCP_CONN_MAXIDLE(tp) \ | |
263 | (TCP_CONN_KEEPCNT(tp) * TCP_CONN_KEEPINTVL(tp)) | |
55e303ae | 264 | |
316670eb A |
/*
 * Idle timeout for a connection: the current retransmit timeout
 * (t_rxtcur), plus tcp_rexmt_slop whenever TCP_ADD_REXMTSLOP() is false
 * for the connection.  Connections whose retransmit timeout did not get
 * the slop would otherwise reach idle state quickly.
 *
 * The argument is parenthesized at every use, including where it is
 * handed to TCP_ADD_REXMTSLOP(), so that any pointer expression can be
 * passed safely.
 */
#define TCP_IDLETIMEOUT(tp) \
	(((TCP_ADD_REXMTSLOP((tp))) ? 0 : tcp_rexmt_slop) + (tp)->t_rxtcur)
271 | ||
39236c6e A |
272 | TAILQ_HEAD(tcptailq, tcpcb); |
273 | ||
1c79356b A |
274 | extern int tcp_keepinit; /* time to establish connection */ |
275 | extern int tcp_keepidle; /* time before keepalive probes begin */ | |
9bccf70c | 276 | extern int tcp_keepintvl; /* time between keepalive probes */ |
39236c6e | 277 | extern int tcp_keepcnt; /* number of keepalives */ |
6d2010ae | 278 | extern int tcp_delack; /* delayed ack timer */ |
9bccf70c A |
279 | extern int tcp_maxpersistidle; |
280 | extern int tcp_msl; | |
1c79356b A |
281 | extern int tcp_ttl; /* time to live for TCP segs */ |
282 | extern int tcp_backoff[]; | |
6d2010ae A |
283 | extern int tcp_rexmt_slop; |
284 | extern u_int32_t tcp_max_persist_timeout; /* Maximum persistence for Zero Window Probes */ | |
1c79356b | 285 | |
6d2010ae | 286 | #define OFFSET_FROM_START(tp, off) ((tcp_now + (off)) - (tp)->tentry.timer_start) |
9bccf70c A |
287 | |
288 | #endif /* KERNEL */ | |
91447636 | 289 | #endif /* PRIVATE */ |
9bccf70c | 290 | #endif /* !_NETINET_TCP_TIMER_H_ */ |
91447636 | 291 |