]> git.saurik.com Git - apple/xnu.git/blame - bsd/netinet/tcp_timer.h
xnu-1699.24.23.tar.gz
[apple/xnu.git] / bsd / netinet / tcp_timer.h
CommitLineData
1c79356b 1/*
6d2010ae 2 * Copyright (c) 2000-2010 Apple Computer, Inc. All rights reserved.
5d5c5d0d 3 *
2d21ac55 4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
1c79356b 5 *
2d21ac55
A
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
8f6c56a5 14 *
2d21ac55
A
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
8f6c56a5
A
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
2d21ac55
A
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
8f6c56a5 25 *
2d21ac55 26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
1c79356b
A
27 */
28/*
29 * Copyright (c) 1982, 1986, 1993
30 * The Regents of the University of California. All rights reserved.
31 *
32 * Redistribution and use in source and binary forms, with or without
33 * modification, are permitted provided that the following conditions
34 * are met:
35 * 1. Redistributions of source code must retain the above copyright
36 * notice, this list of conditions and the following disclaimer.
37 * 2. Redistributions in binary form must reproduce the above copyright
38 * notice, this list of conditions and the following disclaimer in the
39 * documentation and/or other materials provided with the distribution.
40 * 3. All advertising materials mentioning features or use of this software
41 * must display the following acknowledgement:
42 * This product includes software developed by the University of
43 * California, Berkeley and its contributors.
44 * 4. Neither the name of the University nor the names of its contributors
45 * may be used to endorse or promote products derived from this software
46 * without specific prior written permission.
47 *
48 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
49 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
50 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
51 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
52 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
53 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
54 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
55 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
56 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
57 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
58 * SUCH DAMAGE.
59 *
60 * @(#)tcp_timer.h 8.1 (Berkeley) 6/10/93
9bccf70c 61 * $FreeBSD: src/sys/netinet/tcp_timer.h,v 1.18 1999/12/29 04:41:03 peter Exp $
1c79356b
A
62 */
63
64#ifndef _NETINET_TCP_TIMER_H_
65#define _NETINET_TCP_TIMER_H_
9bccf70c 66#include <sys/appleapiopts.h>
1c79356b 67
6d2010ae
A
68#ifdef KERNEL
69#include <kern/thread_call.h>
70#endif /* KERNEL */
71
1c79356b 72/*
6d2010ae 73 * Definitions of the TCP timers.
1c79356b 74 */
6d2010ae
A
75#define TCPT_NTIMERS 5 /* number of timer indices defined below (0 through 4) */
76
77/* Keep the external definition the same for binary compatibility */
78#define TCPT_NTIMERS_EXT 4 /* one fewer than TCPT_NTIMERS */
1c79356b
A
79
80#define TCPT_REXMT 0 /* retransmit */
81#define TCPT_PERSIST 1 /* retransmit persistence */
82#define TCPT_KEEP 2 /* keep alive */
83#define TCPT_2MSL 3 /* 2*msl quiet time timer */
6d2010ae
A
84#define TCPT_DELACK 4 /* delayed ack timer */
85#define TCPT_MAX 4 /* highest timer index (same value as TCPT_DELACK) */
86#define TCPT_NONE (TCPT_MAX + 1) /* first value past the valid timer indices */
1c79356b
A
87
88/*
89 * The TCPT_REXMT timer is used to force retransmissions.
90 * The TCP has the TCPT_REXMT timer set whenever segments
91 * have been sent for which ACKs are expected but not yet
92 * received. If an ACK is received which advances tp->snd_una,
93 * then the retransmit timer is cleared (if there are no more
94 * outstanding segments) or reset to the base value (if there
95 * are more ACKs expected). Whenever the retransmit timer goes off,
96 * we retransmit one unacknowledged segment, and do a backoff
97 * on the retransmit timer.
98 *
99 * The TCPT_PERSIST timer is used to keep window size information
100 * flowing even if the window goes shut. If all previous transmissions
101 * have been acknowledged (so that there are no retransmissions in progress),
102 * and the window is too small to bother sending anything, then we start
103 * the TCPT_PERSIST timer. When it expires, if the window is nonzero,
104 * we go to transmit state. Otherwise, at intervals send a single byte
105 * into the peer's window to force him to update our window information.
106 * We do this at most as often as TCPTV_PERSMIN time intervals,
107 * but no more frequently than the current estimate of round-trip
108 * packet time. The TCPT_PERSIST timer is cleared whenever we receive
109 * a window update from the peer.
110 *
111 * The TCPT_KEEP timer is used to keep connections alive. If a
112 * connection is idle (no segments received) for TCPTV_KEEP_INIT amount of time,
113 * but not yet established, then we drop the connection. Once the connection
114 * is established, if the connection is idle for TCPTV_KEEP_IDLE time
115 * (and keepalives have been enabled on the socket), we begin to probe
116 * the connection. We force the peer to send us a segment by sending:
117 * <SEQ=SND.UNA-1><ACK=RCV.NXT><CTL=ACK>
118 * This segment is (deliberately) outside the window, and should elicit
119 * an ack segment in response from the peer. If, despite the TCPT_KEEP
120 * initiated segments we cannot elicit a response from a peer in tcp_maxidle
121 * amount of time probing, then we drop the connection.
122 */
123
91447636
A
124#ifdef PRIVATE
125
1c79356b
A
126/*
127 * Time constants.
128 */
2d21ac55 129#define TCPTV_MSL ( 15*TCP_RETRANSHZ) /* max seg lifetime (hah!) */
1c79356b 130#define TCPTV_SRTTBASE 0 /* base roundtrip time;
6d2010ae 131 if 0, no idea yet */
2d21ac55
A
132#define TCPTV_RTOBASE ( 1*TCP_RETRANSHZ) /* assumed RTO if no info */
133#define TCPTV_SRTTDFLT ( 1*TCP_RETRANSHZ) /* assumed RTT if no info */
1c79356b 134
2d21ac55
A
135#define TCPTV_PERSMIN ( 5*TCP_RETRANSHZ) /* retransmit persistence */
136#define TCPTV_PERSMAX ( 60*TCP_RETRANSHZ) /* maximum persist interval */
1c79356b 137
2d21ac55
A
138#define TCPTV_KEEP_INIT ( 75*TCP_RETRANSHZ) /* initial connect keep alive */
139#define TCPTV_KEEP_IDLE (120*60*TCP_RETRANSHZ) /* dflt time before probing */
140#define TCPTV_KEEPINTVL ( 75*TCP_RETRANSHZ) /* default probe interval */
1c79356b
A
141#define TCPTV_KEEPCNT 8 /* max probes before drop */
142
6d2010ae
A
143#define TCPTV_REXMTMAX ( 64*TCP_RETRANSHZ ) /* max allowable REXMT value */
144#define TCPTV_REXMTMIN ( TCP_RETRANSHZ/33 ) /* min REXMT for non-local connections */
145#define TCPTV_UNACKWIN ( TCP_RETRANSHZ/10 ) /* Window for counting rcv bytes to see if
146 ack-stretching can start (default 100 ms) */
147#define TCPTV_MAXRCVIDLE (TCP_RETRANSHZ/5 ) /* Receiver idle time, avoid ack-stretching after that*/
148
149/* No ack stretching during slow-start, until we see some packets.
150 * By the time the receiver gets 512 packets, the sender's cwnd
151 * should open by a few hundred packets considering the progression
152 * during slow-start.
153 */
154#define TCP_RCV_SS_PKTCOUNT 512
1c79356b
A
155
156#define TCPTV_TWTRUNC 8 /* RTO factor to truncate TW */
157
158#define TCP_LINGERTIME 120 /* linger at most 2 minutes */
159
160#define TCP_MAXRXTSHIFT 12 /* maximum retransmits */
161
162#ifdef TCPTIMERS
163static char *tcptimers[] = /* printable timer names, in TCPT_* index order */
6d2010ae 164 { "REXMT", "PERSIST", "KEEP", "2MSL" , "DELACK"};
1c79356b
A
165#endif
166
91447636 167#ifdef KERNEL
6d2010ae
A
168
169/* We consider persist, keep and 2msl as slow timers which can be coalesced
170 * at a higher granularity (500 ms). Rexmt and delayed ack are considered fast
171 * timers which fire in the order of 100ms.
172 *
173 * The following conditional checks whether a timer index is one of the slow
174 * timers: TCPT_PERSIST (1), TCPT_KEEP (2) and TCPT_2MSL (3) have a non-zero value
175 * in their low two bits, while TCPT_REXMT (0) and TCPT_DELACK (4) do not. This is
176 * fast and works well for now; adding more slow timers may require changing it. */
177#define IS_TIMER_SLOW(ind) (((ind) & 0x3) != 0)
178
179struct tcptimerlist;
180
181struct tcptimerentry { /* one entry on a timer list, linked through le */
182 LIST_ENTRY(tcptimerentry) le; /* links for timer list */
183 uint32_t timer_start; /* tcp clock when the timer was started */
184 uint16_t index; /* index of lowest timer that needs to run first (presumably a TCPT_* value) */
185 uint32_t runtime; /* deadline at which the first timer has to fire */
186};
187
188LIST_HEAD(timerlisthead, tcptimerentry); /* list head type used for tcptimerlist.lhead */
189
190struct tcptimerlist { /* a list of tcptimerentry items plus its lock and scheduling state */
191 struct timerlisthead lhead; /* head of the list of timer entries */
192 lck_mtx_t *mtx; /* lock to protect the list */
193 lck_attr_t *mtx_attr; /* mutex attributes */
194 lck_grp_t *mtx_grp; /* mutex group definition */
195 lck_grp_attr_t *mtx_grp_attr; /* mutex group attributes */
196 uint32_t fast_quantum; /* minimum time quantum to coalesce fast timers */
197 uint32_t slow_quantum; /* minimum time quantum to coalesce slow timers */
198 thread_call_t call; /* thread call entry */
199 uint32_t runtime; /* time at which this list is going to run */
200 uint32_t entries; /* Number of entries on the list */
201 uint32_t maxentries; /* Max number of entries at any time */
202
203 /* Run state of the list, followed by its current and preferred mode */
204 boolean_t running; /* Set when timer list is being processed */
205#define TCP_TIMERLIST_FASTMODE 0x1 /* presumably a value for mode / pref_mode */
206#define TCP_TIMERLIST_SLOWMODE 0x2 /* presumably a value for mode / pref_mode */
207 uint32_t mode; /* Current mode, fast or slow */
208 uint32_t pref_mode; /* Preferred mode set by a connection, fast or slow */
209 uint32_t pref_offset; /* Preferred offset set by a connection */
210 uint32_t idlegen; /* Number of times the list has been idle in fast mode */
211 struct tcptimerentry *next_te; /* Store the next timer entry pointer to process */
212
213};
214
215#define TCP_FASTMODE_IDLEGEN_MAX 20 /* Approximately 2 seconds */
216
1c79356b 217/*
6d2010ae
A
218 * Minimum retransmit timeout is set to 30ms. We add a slop of
219 * 200 ms to the retransmit value to account for processing
220 * variance and delayed ack. This extra 200ms will help to avoid
221 * spurious retransmits by taking into consideration the receivers
222 * that wait for delayed ack timer instead of generating an ack
223 * for every two packets.
224 *
225 * On a local link, the minimum retransmit timeout is 100ms and
226 * variance is set to 0. This will make the sender a little bit more
227 * aggressive on local link. When the connection is not established yet,
228 * there is no need to add an extra 200ms to retransmit timeout because
229 * the initial value is high (1s) and delayed ack is not a problem in
230 * that case.
1c79356b 231 */
6d2010ae
A
232#define TCPTV_REXMTSLOP ( TCP_RETRANSHZ/5 ) /* rexmt slop allowed (200 ms) */
233
234/* macro to decide when retransmit slop (described above) should be added. NOTE(review): this is true for TF_LOCAL connections, which the text above describes as using zero variance -- confirm intent */
235#define TCP_ADD_REXMTSLOP(tp) (((tp)->t_flags & TF_LOCAL) != 0 || (tp)->t_state >= TCPS_ESTABLISHED)
236
237#define TCPT_RANGESET(tv, value, tvmin, tvmax, addslop) do { /* tv = value (+ slop), clamped to [tvmin, tvmax] */ \
238 (tv) = ((addslop) ? tcp_rexmt_slop : 0) + (value); /* add tcp_rexmt_slop only when addslop is non-zero */ \
b0d623f7 239 if ((uint32_t)(tv) < (uint32_t)(tvmin)) /* bounds are compared as unsigned 32-bit values */ \
1c79356b 240 (tv) = (tvmin); \
b0d623f7 241 else if ((uint32_t)(tv) > (uint32_t)(tvmax)) \
1c79356b 242 (tv) = (tvmax); \
9bccf70c 243} while(0)
1c79356b 244
55e303ae
A
245#define TCP_KEEPIDLE(tp) /* tp's own t_keepidle if it is non-zero and SO_KEEPALIVE is set on its socket, else the global tcp_keepidle */ \
246 ((tp)->t_keepidle && ((tp)->t_inpcb->inp_socket->so_options & SO_KEEPALIVE) ? \
247 (tp)->t_keepidle : tcp_keepidle)
248
1c79356b
A
249extern int tcp_keepinit; /* time to establish connection */
250extern int tcp_keepidle; /* time before keepalive probes begin */
9bccf70c 251extern int tcp_keepintvl; /* time between keepalive probes */
1c79356b 252extern int tcp_maxidle; /* time to drop after starting probes */
6d2010ae 253extern int tcp_delack; /* delayed ack timer */
9bccf70c
A
254extern int tcp_maxpersistidle; /* NOTE(review): presumably the max idle time in persist state -- confirm */
255extern int tcp_msl; /* NOTE(review): presumably the max segment lifetime (cf. TCPTV_MSL) -- confirm */
1c79356b
A
256extern int tcp_ttl; /* time to live for TCP segs */
257extern int tcp_backoff[]; /* NOTE(review): presumably the retransmit backoff table -- confirm */
6d2010ae
A
258extern int tcp_rexmt_slop; /* slop that TCPT_RANGESET adds when its addslop argument is non-zero */
259extern u_int32_t tcp_max_persist_timeout; /* Maximum persistence for Zero Window Probes */
1c79356b 260
6d2010ae 261#define OFFSET_FROM_START(tp, off) ((tcp_now + (off)) - (tp)->tentry.timer_start) /* (tcp_now + off) expressed relative to tp's tentry.timer_start */
9bccf70c
A
262
263#endif /* KERNEL */
91447636 264#endif /* PRIVATE */
9bccf70c 265#endif /* !_NETINET_TCP_TIMER_H_ */
91447636 266