tcp_timer.c revision 1.72 1 1.72 christos /* $NetBSD: tcp_timer.c,v 1.72 2005/07/19 17:00:02 christos Exp $ */
2 1.44 itojun
3 1.44 itojun /*
4 1.44 itojun * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
5 1.44 itojun * All rights reserved.
6 1.59 itojun *
7 1.44 itojun * Redistribution and use in source and binary forms, with or without
8 1.44 itojun * modification, are permitted provided that the following conditions
9 1.44 itojun * are met:
10 1.44 itojun * 1. Redistributions of source code must retain the above copyright
11 1.44 itojun * notice, this list of conditions and the following disclaimer.
12 1.44 itojun * 2. Redistributions in binary form must reproduce the above copyright
13 1.44 itojun * notice, this list of conditions and the following disclaimer in the
14 1.44 itojun * documentation and/or other materials provided with the distribution.
15 1.44 itojun * 3. Neither the name of the project nor the names of its contributors
16 1.44 itojun * may be used to endorse or promote products derived from this software
17 1.44 itojun * without specific prior written permission.
18 1.59 itojun *
19 1.44 itojun * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
20 1.44 itojun * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 1.44 itojun * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 1.44 itojun * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
23 1.44 itojun * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 1.44 itojun * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 1.44 itojun * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 1.44 itojun * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 1.44 itojun * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 1.44 itojun * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 1.44 itojun * SUCH DAMAGE.
30 1.44 itojun */
31 1.30 thorpej
32 1.30 thorpej /*-
33 1.71 mycroft * Copyright (c) 1997, 1998, 2001, 2005 The NetBSD Foundation, Inc.
34 1.30 thorpej * All rights reserved.
35 1.30 thorpej *
36 1.30 thorpej * This code is derived from software contributed to The NetBSD Foundation
37 1.30 thorpej * by Jason R. Thorpe and Kevin M. Lahey of the Numerical Aerospace Simulation
38 1.30 thorpej * Facility, NASA Ames Research Center.
39 1.71 mycroft * This code is derived from software contributed to The NetBSD Foundation
40 1.71 mycroft * by Charles M. Hannum.
41 1.30 thorpej *
42 1.30 thorpej * Redistribution and use in source and binary forms, with or without
43 1.30 thorpej * modification, are permitted provided that the following conditions
44 1.30 thorpej * are met:
45 1.30 thorpej * 1. Redistributions of source code must retain the above copyright
46 1.30 thorpej * notice, this list of conditions and the following disclaimer.
47 1.30 thorpej * 2. Redistributions in binary form must reproduce the above copyright
48 1.30 thorpej * notice, this list of conditions and the following disclaimer in the
49 1.30 thorpej * documentation and/or other materials provided with the distribution.
50 1.30 thorpej * 3. All advertising materials mentioning features or use of this software
51 1.30 thorpej * must display the following acknowledgement:
52 1.30 thorpej * This product includes software developed by the NetBSD
53 1.30 thorpej * Foundation, Inc. and its contributors.
54 1.30 thorpej * 4. Neither the name of The NetBSD Foundation nor the names of its
55 1.30 thorpej * contributors may be used to endorse or promote products derived
56 1.30 thorpej * from this software without specific prior written permission.
57 1.30 thorpej *
58 1.30 thorpej * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
59 1.30 thorpej * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
60 1.30 thorpej * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
61 1.30 thorpej * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
62 1.30 thorpej * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
63 1.30 thorpej * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
64 1.30 thorpej * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
65 1.30 thorpej * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
66 1.30 thorpej * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
67 1.30 thorpej * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
68 1.30 thorpej * POSSIBILITY OF SUCH DAMAGE.
69 1.30 thorpej */
70 1.8 cgd
71 1.1 cgd /*
72 1.28 thorpej * Copyright (c) 1982, 1986, 1988, 1990, 1993, 1995
73 1.7 mycroft * The Regents of the University of California. All rights reserved.
74 1.1 cgd *
75 1.1 cgd * Redistribution and use in source and binary forms, with or without
76 1.1 cgd * modification, are permitted provided that the following conditions
77 1.1 cgd * are met:
78 1.1 cgd * 1. Redistributions of source code must retain the above copyright
79 1.1 cgd * notice, this list of conditions and the following disclaimer.
80 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
81 1.1 cgd * notice, this list of conditions and the following disclaimer in the
82 1.1 cgd * documentation and/or other materials provided with the distribution.
83 1.64 agc * 3. Neither the name of the University nor the names of its contributors
84 1.1 cgd * may be used to endorse or promote products derived from this software
85 1.1 cgd * without specific prior written permission.
86 1.1 cgd *
87 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
88 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
89 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
90 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
91 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
92 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
93 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
94 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
95 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
96 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
97 1.1 cgd * SUCH DAMAGE.
98 1.1 cgd *
99 1.28 thorpej * @(#)tcp_timer.c 8.2 (Berkeley) 5/24/95
100 1.1 cgd */
101 1.57 lukem
102 1.57 lukem #include <sys/cdefs.h>
103 1.72 christos __KERNEL_RCSID(0, "$NetBSD: tcp_timer.c,v 1.72 2005/07/19 17:00:02 christos Exp $");
104 1.29 scottr
105 1.44 itojun #include "opt_inet.h"
106 1.51 thorpej #include "opt_tcp_debug.h"
107 1.44 itojun
108 1.4 mycroft #include <sys/param.h>
109 1.4 mycroft #include <sys/systm.h>
110 1.4 mycroft #include <sys/malloc.h>
111 1.4 mycroft #include <sys/mbuf.h>
112 1.4 mycroft #include <sys/socket.h>
113 1.4 mycroft #include <sys/socketvar.h>
114 1.4 mycroft #include <sys/protosw.h>
115 1.4 mycroft #include <sys/errno.h>
116 1.49 thorpej #include <sys/kernel.h>
117 1.1 cgd
118 1.4 mycroft #include <net/if.h>
119 1.4 mycroft #include <net/route.h>
120 1.1 cgd
121 1.4 mycroft #include <netinet/in.h>
122 1.4 mycroft #include <netinet/in_systm.h>
123 1.4 mycroft #include <netinet/ip.h>
124 1.4 mycroft #include <netinet/in_pcb.h>
125 1.4 mycroft #include <netinet/ip_var.h>
126 1.72 christos #include <netinet/ip_icmp.h>
127 1.44 itojun
128 1.44 itojun #ifdef INET6
129 1.44 itojun #ifndef INET
130 1.44 itojun #include <netinet/in.h>
131 1.44 itojun #endif
132 1.44 itojun #include <netinet/ip6.h>
133 1.44 itojun #include <netinet6/in6_pcb.h>
134 1.44 itojun #endif
135 1.44 itojun
136 1.4 mycroft #include <netinet/tcp.h>
137 1.4 mycroft #include <netinet/tcp_fsm.h>
138 1.4 mycroft #include <netinet/tcp_seq.h>
139 1.4 mycroft #include <netinet/tcp_timer.h>
140 1.4 mycroft #include <netinet/tcp_var.h>
141 1.4 mycroft #include <netinet/tcpip.h>
142 1.51 thorpej #ifdef TCP_DEBUG
143 1.51 thorpej #include <netinet/tcp_debug.h>
144 1.51 thorpej #endif
145 1.1 cgd
/*
 * Tunable TCP timer parameters.
 *
 * A value of zero means "not patched": tcp_timer_init() replaces a zero
 * in any of the first four with its compiled-in default.
 */
int	tcp_keepidle = 0;
int	tcp_keepintvl = 0;

/* max idle probes */
int	tcp_keepcnt = 0;

/* max idle time in persist */
int	tcp_maxpersistidle = 0;

/* recomputed by tcp_slowtimo() as tcp_keepcnt * tcp_keepintvl */
int	tcp_maxidle;
155 1.26 thorpej
/*
 * Delay, in ticks, before a delayed ACK is sent.  Left at zero here so
 * that tcp_timer_init() can install the default (TCP_DELACK_TICKS)
 * unless the value has been patched to something else.
 */
int	tcp_delack_ticks = 0;
161 1.27 thorpej
162 1.51 thorpej void tcp_timer_rexmt(void *);
163 1.51 thorpej void tcp_timer_persist(void *);
164 1.51 thorpej void tcp_timer_keep(void *);
165 1.51 thorpej void tcp_timer_2msl(void *);
166 1.51 thorpej
167 1.56 matt const tcp_timer_func_t tcp_timer_funcs[TCPT_NTIMERS] = {
168 1.51 thorpej tcp_timer_rexmt,
169 1.51 thorpej tcp_timer_persist,
170 1.51 thorpej tcp_timer_keep,
171 1.51 thorpej tcp_timer_2msl,
172 1.51 thorpej };
173 1.52 thorpej
174 1.52 thorpej /*
175 1.52 thorpej * Timer state initialization, called from tcp_init().
176 1.52 thorpej */
177 1.52 thorpej void
178 1.52 thorpej tcp_timer_init(void)
179 1.52 thorpej {
180 1.52 thorpej
181 1.52 thorpej if (tcp_keepidle == 0)
182 1.52 thorpej tcp_keepidle = TCPTV_KEEP_IDLE;
183 1.52 thorpej
184 1.52 thorpej if (tcp_keepintvl == 0)
185 1.52 thorpej tcp_keepintvl = TCPTV_KEEPINTVL;
186 1.52 thorpej
187 1.52 thorpej if (tcp_keepcnt == 0)
188 1.52 thorpej tcp_keepcnt = TCPTV_KEEPCNT;
189 1.52 thorpej
190 1.52 thorpej if (tcp_maxpersistidle == 0)
191 1.52 thorpej tcp_maxpersistidle = TCPTV_KEEP_IDLE;
192 1.52 thorpej
193 1.52 thorpej if (tcp_delack_ticks == 0)
194 1.52 thorpej tcp_delack_ticks = TCP_DELACK_TICKS;
195 1.52 thorpej }
196 1.51 thorpej
197 1.1 cgd /*
198 1.63 he * Return how many timers are currently being invoked.
199 1.63 he */
200 1.63 he int
201 1.63 he tcp_timers_invoking(struct tcpcb *tp)
202 1.63 he {
203 1.63 he int i;
204 1.63 he int count = 0;
205 1.63 he
206 1.63 he for (i = 0; i < TCPT_NTIMERS; i++)
207 1.63 he if (callout_invoking(&tp->t_timer[i]))
208 1.63 he count++;
209 1.63 he if (callout_invoking(&tp->t_delack_ch))
210 1.63 he count++;
211 1.63 he
212 1.63 he return count;
213 1.63 he }
214 1.63 he
215 1.63 he /*
216 1.49 thorpej * Callout to process delayed ACKs for a TCPCB.
217 1.1 cgd */
218 1.6 mycroft void
219 1.49 thorpej tcp_delack(void *arg)
220 1.1 cgd {
221 1.49 thorpej struct tcpcb *tp = arg;
222 1.11 mycroft int s;
223 1.1 cgd
224 1.49 thorpej /*
225 1.49 thorpej * If tcp_output() wasn't able to transmit the ACK
226 1.49 thorpej * for whatever reason, it will restart the delayed
227 1.49 thorpej * ACK callout.
228 1.49 thorpej */
229 1.49 thorpej
230 1.13 mycroft s = splsoftnet();
231 1.63 he callout_ack(&tp->t_delack_ch);
232 1.63 he if (tcp_isdead(tp)) {
233 1.63 he splx(s);
234 1.63 he return;
235 1.63 he }
236 1.63 he
237 1.49 thorpej tp->t_flags |= TF_ACKNOW;
238 1.49 thorpej (void) tcp_output(tp);
239 1.1 cgd splx(s);
240 1.1 cgd }
241 1.1 cgd
242 1.1 cgd /*
243 1.1 cgd * Tcp protocol timeout routine called every 500 ms.
244 1.1 cgd * Updates the timers in all active tcb's and
245 1.1 cgd * causes finite state machine actions if timers expire.
246 1.1 cgd */
247 1.6 mycroft void
248 1.69 perry tcp_slowtimo(void)
249 1.1 cgd {
250 1.11 mycroft int s;
251 1.1 cgd
252 1.13 mycroft s = splsoftnet();
253 1.26 thorpej tcp_maxidle = tcp_keepcnt * tcp_keepintvl;
254 1.21 explorer tcp_iss_seq += TCP_ISSINCR; /* increment iss */
255 1.7 mycroft tcp_now++; /* for timestamps */
256 1.1 cgd splx(s);
257 1.1 cgd }
258 1.1 cgd
259 1.1 cgd /*
260 1.1 cgd * Cancel all timers for TCP tp.
261 1.1 cgd */
262 1.6 mycroft void
263 1.69 perry tcp_canceltimers(struct tcpcb *tp)
264 1.1 cgd {
265 1.46 augustss int i;
266 1.1 cgd
267 1.1 cgd for (i = 0; i < TCPT_NTIMERS; i++)
268 1.36 thorpej TCP_TIMER_DISARM(tp, i);
269 1.1 cgd }
270 1.1 cgd
271 1.56 matt const int tcp_backoff[TCP_MAXRXTSHIFT + 1] =
272 1.1 cgd { 1, 2, 4, 8, 16, 32, 64, 64, 64, 64, 64, 64, 64 };
273 1.1 cgd
274 1.56 matt const int tcp_totbackoff = 511; /* sum of tcp_backoff[] */
275 1.26 thorpej
276 1.1 cgd /*
277 1.1 cgd * TCP timer processing.
278 1.1 cgd */
279 1.51 thorpej
280 1.51 thorpej void
281 1.51 thorpej tcp_timer_rexmt(void *arg)
282 1.1 cgd {
283 1.51 thorpej struct tcpcb *tp = arg;
284 1.51 thorpej uint32_t rto;
285 1.51 thorpej int s;
286 1.51 thorpej #ifdef TCP_DEBUG
287 1.65 itojun struct socket *so = NULL;
288 1.51 thorpej short ostate;
289 1.47 itojun #endif
290 1.47 itojun
291 1.51 thorpej s = splsoftnet();
292 1.66 itojun callout_ack(&tp->t_timer[TCPT_REXMT]);
293 1.63 he if (tcp_isdead(tp)) {
294 1.63 he splx(s);
295 1.63 he return;
296 1.63 he }
297 1.1 cgd
298 1.72 christos if ((tp->t_flags & TF_PMTUD_PEND) && tp->t_inpcb &&
299 1.72 christos SEQ_GEQ(tp->t_pmtud_th_seq, tp->snd_una) &&
300 1.72 christos SEQ_LT(tp->t_pmtud_th_seq, (int)(tp->snd_una + tp->t_ourmss))) {
301 1.72 christos extern struct sockaddr_in icmpsrc;
302 1.72 christos struct icmp icmp;
303 1.72 christos
304 1.72 christos tp->t_flags &= ~TF_PMTUD_PEND;
305 1.72 christos
306 1.72 christos /* XXX create fake icmp message with relevant entries */
307 1.72 christos icmp.icmp_nextmtu = tp->t_pmtud_nextmtu;
308 1.72 christos icmp.icmp_ip.ip_len = tp->t_pmtud_ip_len;
309 1.72 christos icmp.icmp_ip.ip_hl = tp->t_pmtud_ip_hl;
310 1.72 christos icmpsrc.sin_addr = tp->t_inpcb->inp_faddr;
311 1.72 christos icmp_mtudisc(&icmp, icmpsrc.sin_addr);
312 1.72 christos
313 1.72 christos /*
314 1.72 christos * Notify all connections to the same peer about
315 1.72 christos * new mss and trigger retransmit.
316 1.72 christos */
317 1.72 christos in_pcbnotifyall(&tcbtable, icmpsrc.sin_addr, EMSGSIZE,
318 1.72 christos tcp_mtudisc);
319 1.72 christos splx(s);
320 1.72 christos return;
321 1.72 christos }
322 1.51 thorpej #ifdef TCP_DEBUG
323 1.51 thorpej #ifdef INET
324 1.51 thorpej if (tp->t_inpcb)
325 1.51 thorpej so = tp->t_inpcb->inp_socket;
326 1.51 thorpej #endif
327 1.51 thorpej #ifdef INET6
328 1.51 thorpej if (tp->t_in6pcb)
329 1.51 thorpej so = tp->t_in6pcb->in6p_socket;
330 1.51 thorpej #endif
331 1.51 thorpej ostate = tp->t_state;
332 1.51 thorpej #endif /* TCP_DEBUG */
333 1.1 cgd
334 1.1 cgd /*
335 1.70 jonathan * Clear the SACK scoreboard, reset FACK estimate.
336 1.70 jonathan */
337 1.70 jonathan tcp_free_sackholes(tp);
338 1.70 jonathan tp->snd_fack = tp->snd_una;
339 1.70 jonathan
340 1.70 jonathan /*
341 1.1 cgd * Retransmission timer went off. Message has not
342 1.1 cgd * been acked within retransmit interval. Back off
343 1.1 cgd * to a longer retransmit interval and retransmit one segment.
344 1.1 cgd */
345 1.51 thorpej
346 1.51 thorpej if (++tp->t_rxtshift > TCP_MAXRXTSHIFT) {
347 1.51 thorpej tp->t_rxtshift = TCP_MAXRXTSHIFT;
348 1.51 thorpej tcpstat.tcps_timeoutdrop++;
349 1.51 thorpej tp = tcp_drop(tp, tp->t_softerror ?
350 1.51 thorpej tp->t_softerror : ETIMEDOUT);
351 1.51 thorpej goto out;
352 1.51 thorpej }
353 1.51 thorpej tcpstat.tcps_rexmttimeo++;
354 1.51 thorpej rto = TCP_REXMTVAL(tp);
355 1.51 thorpej if (rto < tp->t_rttmin)
356 1.51 thorpej rto = tp->t_rttmin;
357 1.51 thorpej TCPT_RANGESET(tp->t_rxtcur, rto * tcp_backoff[tp->t_rxtshift],
358 1.51 thorpej tp->t_rttmin, TCPTV_REXMTMAX);
359 1.51 thorpej TCP_TIMER_ARM(tp, TCPT_REXMT, tp->t_rxtcur);
360 1.58 itojun
361 1.59 itojun /*
362 1.51 thorpej * If we are losing and we are trying path MTU discovery,
363 1.51 thorpej * try turning it off. This will avoid black holes in
364 1.51 thorpej * the network which suppress or fail to send "packet
365 1.51 thorpej * too big" ICMP messages. We should ideally do
366 1.51 thorpej * lots more sophisticated searching to find the right
367 1.51 thorpej * value here...
368 1.51 thorpej */
369 1.58 itojun if (tp->t_mtudisc && tp->t_rxtshift > TCP_MAXRXTSHIFT / 6) {
370 1.58 itojun tcpstat.tcps_pmtublackhole++;
371 1.44 itojun
372 1.47 itojun #ifdef INET
373 1.58 itojun /* try turning PMTUD off */
374 1.51 thorpej if (tp->t_inpcb)
375 1.58 itojun tp->t_mtudisc = 0;
376 1.47 itojun #endif
377 1.44 itojun #ifdef INET6
378 1.58 itojun /* try using IPv6 minimum MTU */
379 1.51 thorpej if (tp->t_in6pcb)
380 1.58 itojun tp->t_mtudisc = 0;
381 1.44 itojun #endif
382 1.33 kml
383 1.58 itojun /* XXX: more sophisticated Black hole recovery code? */
384 1.51 thorpej }
385 1.58 itojun
386 1.51 thorpej /*
387 1.51 thorpej * If losing, let the lower level know and try for
388 1.51 thorpej * a better route. Also, if we backed off this far,
389 1.51 thorpej * our srtt estimate is probably bogus. Clobber it
390 1.51 thorpej * so we'll take the next rtt measurement as our srtt;
391 1.51 thorpej * move the current srtt into rttvar to keep the current
392 1.51 thorpej * retransmit times until then.
393 1.51 thorpej */
394 1.51 thorpej if (tp->t_rxtshift > TCP_MAXRXTSHIFT / 4) {
395 1.51 thorpej #ifdef INET
396 1.51 thorpej if (tp->t_inpcb)
397 1.51 thorpej in_losing(tp->t_inpcb);
398 1.51 thorpej #endif
399 1.51 thorpej #ifdef INET6
400 1.51 thorpej if (tp->t_in6pcb)
401 1.51 thorpej in6_losing(tp->t_in6pcb);
402 1.51 thorpej #endif
403 1.51 thorpej tp->t_rttvar += (tp->t_srtt >> TCP_RTT_SHIFT);
404 1.51 thorpej tp->t_srtt = 0;
405 1.51 thorpej }
406 1.51 thorpej tp->snd_nxt = tp->snd_una;
407 1.67 mycroft tp->snd_high = tp->snd_max;
408 1.51 thorpej /*
409 1.51 thorpej * If timing a segment in this window, stop the timer.
410 1.51 thorpej */
411 1.51 thorpej tp->t_rtttime = 0;
412 1.51 thorpej /*
413 1.51 thorpej * Remember if we are retransmitting a SYN, because if
414 1.51 thorpej * we do, set the initial congestion window must be set
415 1.51 thorpej * to 1 segment.
416 1.51 thorpej */
417 1.51 thorpej if (tp->t_state == TCPS_SYN_SENT)
418 1.51 thorpej tp->t_flags |= TF_SYN_REXMT;
419 1.51 thorpej /*
420 1.51 thorpej * Close the congestion window down to one segment
421 1.51 thorpej * (we'll open it by one segment for each ack we get).
422 1.51 thorpej * Since we probably have a window's worth of unacked
423 1.51 thorpej * data accumulated, this "slow start" keeps us from
424 1.51 thorpej * dumping all that data as back-to-back packets (which
425 1.51 thorpej * might overwhelm an intermediate gateway).
426 1.51 thorpej *
427 1.51 thorpej * There are two phases to the opening: Initially we
428 1.51 thorpej * open by one mss on each ack. This makes the window
429 1.51 thorpej * size increase exponentially with time. If the
430 1.51 thorpej * window is larger than the path can handle, this
431 1.51 thorpej * exponential growth results in dropped packet(s)
432 1.59 itojun * almost immediately. To get more time between
433 1.51 thorpej * drops but still "push" the network to take advantage
434 1.51 thorpej * of improving conditions, we switch from exponential
435 1.51 thorpej * to linear window opening at some threshhold size.
436 1.51 thorpej * For a threshhold, we use half the current window
437 1.51 thorpej * size, truncated to a multiple of the mss.
438 1.51 thorpej *
439 1.51 thorpej * (the minimum cwnd that will give us exponential
440 1.51 thorpej * growth is 2 mss. We don't allow the threshhold
441 1.51 thorpej * to go below this.)
442 1.51 thorpej */
443 1.51 thorpej {
444 1.51 thorpej u_int win = min(tp->snd_wnd, tp->snd_cwnd) / 2 / tp->t_segsz;
445 1.51 thorpej if (win < 2)
446 1.51 thorpej win = 2;
447 1.51 thorpej /* Loss Window MUST be one segment. */
448 1.51 thorpej tp->snd_cwnd = tp->t_segsz;
449 1.51 thorpej tp->snd_ssthresh = win * tp->t_segsz;
450 1.68 mycroft tp->t_partialacks = -1;
451 1.51 thorpej tp->t_dupacks = 0;
452 1.51 thorpej }
453 1.51 thorpej (void) tcp_output(tp);
454 1.51 thorpej
455 1.51 thorpej out:
456 1.51 thorpej #ifdef TCP_DEBUG
457 1.51 thorpej if (tp && so->so_options & SO_DEBUG)
458 1.51 thorpej tcp_trace(TA_USER, ostate, tp, NULL,
459 1.51 thorpej PRU_SLOWTIMO | (TCPT_REXMT << 8));
460 1.51 thorpej #endif
461 1.51 thorpej splx(s);
462 1.51 thorpej }
463 1.51 thorpej
464 1.51 thorpej void
465 1.51 thorpej tcp_timer_persist(void *arg)
466 1.51 thorpej {
467 1.51 thorpej struct tcpcb *tp = arg;
468 1.51 thorpej uint32_t rto;
469 1.51 thorpej int s;
470 1.51 thorpej #ifdef TCP_DEBUG
471 1.65 itojun struct socket *so = NULL;
472 1.51 thorpej short ostate;
473 1.35 kml #endif
474 1.51 thorpej
475 1.51 thorpej s = splsoftnet();
476 1.63 he callout_ack(&tp->t_timer[TCPT_PERSIST]);
477 1.63 he if (tcp_isdead(tp)) {
478 1.63 he splx(s);
479 1.63 he return;
480 1.63 he }
481 1.51 thorpej
482 1.60 simonb #ifdef TCP_DEBUG
483 1.47 itojun #ifdef INET
484 1.51 thorpej if (tp->t_inpcb)
485 1.51 thorpej so = tp->t_inpcb->inp_socket;
486 1.47 itojun #endif
487 1.44 itojun #ifdef INET6
488 1.51 thorpej if (tp->t_in6pcb)
489 1.51 thorpej so = tp->t_in6pcb->in6p_socket;
490 1.51 thorpej #endif
491 1.51 thorpej
492 1.51 thorpej ostate = tp->t_state;
493 1.60 simonb #endif /* TCP_DEBUG */
494 1.1 cgd
495 1.1 cgd /*
496 1.1 cgd * Persistance timer into zero window.
497 1.1 cgd * Force a byte to be output, if possible.
498 1.1 cgd */
499 1.51 thorpej
500 1.51 thorpej /*
501 1.51 thorpej * Hack: if the peer is dead/unreachable, we do not
502 1.51 thorpej * time out if the window is closed. After a full
503 1.51 thorpej * backoff, drop the connection if the idle time
504 1.51 thorpej * (no responses to probes) reaches the maximum
505 1.51 thorpej * backoff that we would use if retransmitting.
506 1.51 thorpej */
507 1.51 thorpej rto = TCP_REXMTVAL(tp);
508 1.51 thorpej if (rto < tp->t_rttmin)
509 1.51 thorpej rto = tp->t_rttmin;
510 1.51 thorpej if (tp->t_rxtshift == TCP_MAXRXTSHIFT &&
511 1.51 thorpej ((tcp_now - tp->t_rcvtime) >= tcp_maxpersistidle ||
512 1.51 thorpej (tcp_now - tp->t_rcvtime) >= rto * tcp_totbackoff)) {
513 1.51 thorpej tcpstat.tcps_persistdrops++;
514 1.51 thorpej tp = tcp_drop(tp, ETIMEDOUT);
515 1.51 thorpej goto out;
516 1.51 thorpej }
517 1.51 thorpej tcpstat.tcps_persisttimeo++;
518 1.51 thorpej tcp_setpersist(tp);
519 1.51 thorpej tp->t_force = 1;
520 1.51 thorpej (void) tcp_output(tp);
521 1.51 thorpej tp->t_force = 0;
522 1.51 thorpej
523 1.51 thorpej out:
524 1.51 thorpej #ifdef TCP_DEBUG
525 1.51 thorpej if (tp && so->so_options & SO_DEBUG)
526 1.51 thorpej tcp_trace(TA_USER, ostate, tp, NULL,
527 1.51 thorpej PRU_SLOWTIMO | (TCPT_PERSIST << 8));
528 1.51 thorpej #endif
529 1.51 thorpej splx(s);
530 1.51 thorpej }
531 1.51 thorpej
532 1.51 thorpej void
533 1.51 thorpej tcp_timer_keep(void *arg)
534 1.51 thorpej {
535 1.51 thorpej struct tcpcb *tp = arg;
536 1.61 scw struct socket *so = NULL; /* Quell compiler warning */
537 1.51 thorpej int s;
538 1.51 thorpej #ifdef TCP_DEBUG
539 1.51 thorpej short ostate;
540 1.51 thorpej #endif
541 1.51 thorpej
542 1.51 thorpej s = splsoftnet();
543 1.63 he callout_ack(&tp->t_timer[TCPT_KEEP]);
544 1.63 he if (tcp_isdead(tp)) {
545 1.63 he splx(s);
546 1.63 he return;
547 1.63 he }
548 1.51 thorpej
549 1.51 thorpej #ifdef TCP_DEBUG
550 1.51 thorpej ostate = tp->t_state;
551 1.51 thorpej #endif /* TCP_DEBUG */
552 1.1 cgd
553 1.1 cgd /*
554 1.1 cgd * Keep-alive timer went off; send something
555 1.1 cgd * or drop connection if idle for too long.
556 1.1 cgd */
557 1.44 itojun
558 1.51 thorpej tcpstat.tcps_keeptimeo++;
559 1.51 thorpej if (TCPS_HAVEESTABLISHED(tp->t_state) == 0)
560 1.51 thorpej goto dropit;
561 1.47 itojun #ifdef INET
562 1.51 thorpej if (tp->t_inpcb)
563 1.51 thorpej so = tp->t_inpcb->inp_socket;
564 1.47 itojun #endif
565 1.44 itojun #ifdef INET6
566 1.51 thorpej if (tp->t_in6pcb)
567 1.51 thorpej so = tp->t_in6pcb->in6p_socket;
568 1.44 itojun #endif
569 1.51 thorpej if (so->so_options & SO_KEEPALIVE &&
570 1.51 thorpej tp->t_state <= TCPS_CLOSE_WAIT) {
571 1.51 thorpej if ((tcp_maxidle > 0) &&
572 1.51 thorpej ((tcp_now - tp->t_rcvtime) >=
573 1.51 thorpej tcp_keepidle + tcp_maxidle))
574 1.51 thorpej goto dropit;
575 1.51 thorpej /*
576 1.51 thorpej * Send a packet designed to force a response
577 1.51 thorpej * if the peer is up and reachable:
578 1.51 thorpej * either an ACK if the connection is still alive,
579 1.51 thorpej * or an RST if the peer has closed the connection
580 1.51 thorpej * due to timeout or reboot.
581 1.51 thorpej * Using sequence number tp->snd_una-1
582 1.51 thorpej * causes the transmitted zero-length segment
583 1.51 thorpej * to lie outside the receive window;
584 1.51 thorpej * by the protocol spec, this requires the
585 1.51 thorpej * correspondent TCP to respond.
586 1.51 thorpej */
587 1.51 thorpej tcpstat.tcps_keepprobe++;
588 1.51 thorpej if (tcp_compat_42) {
589 1.1 cgd /*
590 1.51 thorpej * The keepalive packet must have nonzero
591 1.51 thorpej * length to get a 4.2 host to respond.
592 1.1 cgd */
593 1.51 thorpej (void)tcp_respond(tp, tp->t_template,
594 1.51 thorpej (struct mbuf *)NULL, NULL, tp->rcv_nxt - 1,
595 1.51 thorpej tp->snd_una - 1, 0);
596 1.51 thorpej } else {
597 1.51 thorpej (void)tcp_respond(tp, tp->t_template,
598 1.51 thorpej (struct mbuf *)NULL, NULL, tp->rcv_nxt,
599 1.51 thorpej tp->snd_una - 1, 0);
600 1.51 thorpej }
601 1.51 thorpej TCP_TIMER_ARM(tp, TCPT_KEEP, tcp_keepintvl);
602 1.51 thorpej } else
603 1.51 thorpej TCP_TIMER_ARM(tp, TCPT_KEEP, tcp_keepidle);
604 1.51 thorpej
605 1.51 thorpej #ifdef TCP_DEBUG
606 1.51 thorpej if (tp && so->so_options & SO_DEBUG)
607 1.51 thorpej tcp_trace(TA_USER, ostate, tp, NULL,
608 1.51 thorpej PRU_SLOWTIMO | (TCPT_KEEP << 8));
609 1.51 thorpej #endif
610 1.51 thorpej splx(s);
611 1.51 thorpej return;
612 1.51 thorpej
613 1.51 thorpej dropit:
614 1.51 thorpej tcpstat.tcps_keepdrops++;
615 1.51 thorpej (void) tcp_drop(tp, ETIMEDOUT);
616 1.51 thorpej splx(s);
617 1.51 thorpej }
618 1.51 thorpej
619 1.51 thorpej void
620 1.51 thorpej tcp_timer_2msl(void *arg)
621 1.51 thorpej {
622 1.51 thorpej struct tcpcb *tp = arg;
623 1.51 thorpej int s;
624 1.51 thorpej #ifdef TCP_DEBUG
625 1.65 itojun struct socket *so = NULL;
626 1.51 thorpej short ostate;
627 1.51 thorpej #endif
628 1.51 thorpej
629 1.51 thorpej s = splsoftnet();
630 1.63 he callout_ack(&tp->t_timer[TCPT_2MSL]);
631 1.63 he if (tcp_isdead(tp)) {
632 1.63 he splx(s);
633 1.63 he return;
634 1.63 he }
635 1.51 thorpej
636 1.70 jonathan /*
637 1.70 jonathan * 2 MSL timeout went off, clear the SACK scoreboard, reset
638 1.70 jonathan * the FACK estimate.
639 1.70 jonathan */
640 1.70 jonathan tcp_free_sackholes(tp);
641 1.70 jonathan tp->snd_fack = tp->snd_una;
642 1.70 jonathan
643 1.60 simonb #ifdef TCP_DEBUG
644 1.51 thorpej #ifdef INET
645 1.51 thorpej if (tp->t_inpcb)
646 1.51 thorpej so = tp->t_inpcb->inp_socket;
647 1.51 thorpej #endif
648 1.51 thorpej #ifdef INET6
649 1.51 thorpej if (tp->t_in6pcb)
650 1.51 thorpej so = tp->t_in6pcb->in6p_socket;
651 1.51 thorpej #endif
652 1.51 thorpej
653 1.51 thorpej ostate = tp->t_state;
654 1.60 simonb #endif /* TCP_DEBUG */
655 1.51 thorpej
656 1.51 thorpej /*
657 1.51 thorpej * 2 MSL timeout in shutdown went off. If we're closed but
658 1.51 thorpej * still waiting for peer to close and connection has been idle
659 1.51 thorpej * too long, or if 2MSL time is up from TIME_WAIT, delete connection
660 1.51 thorpej * control block. Otherwise, check again in a bit.
661 1.51 thorpej */
662 1.51 thorpej if (tp->t_state != TCPS_TIME_WAIT &&
663 1.51 thorpej ((tcp_maxidle == 0) || ((tcp_now - tp->t_rcvtime) <= tcp_maxidle)))
664 1.51 thorpej TCP_TIMER_ARM(tp, TCPT_2MSL, tcp_keepintvl);
665 1.51 thorpej else
666 1.51 thorpej tp = tcp_close(tp);
667 1.51 thorpej
668 1.51 thorpej #ifdef TCP_DEBUG
669 1.51 thorpej if (tp && so->so_options & SO_DEBUG)
670 1.51 thorpej tcp_trace(TA_USER, ostate, tp, NULL,
671 1.51 thorpej PRU_SLOWTIMO | (TCPT_2MSL << 8));
672 1.51 thorpej #endif
673 1.51 thorpej splx(s);
674 1.1 cgd }
675