2 * Copyright (c) 2003, 2004 Jeffrey M. Hsu. All rights reserved.
3 * Copyright (c) 2003, 2004 The DragonFly Project. All rights reserved.
5 * This code is derived from software contributed to The DragonFly Project
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 * 3. Neither the name of The DragonFly Project nor the names of its
17 * contributors may be used to endorse or promote products derived
18 * from this software without specific, prior written permission.
20 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
21 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
22 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
23 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
24 * COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
25 * INCIDENTAL, SPECIAL, EXEMPLARY OR CONSEQUENTIAL DAMAGES (INCLUDING,
26 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
27 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
28 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
29 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
30 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
35 * Copyright (c) 1982, 1986, 1988, 1990, 1993, 1995
36 * The Regents of the University of California. All rights reserved.
38 * Redistribution and use in source and binary forms, with or without
39 * modification, are permitted provided that the following conditions
41 * 1. Redistributions of source code must retain the above copyright
42 * notice, this list of conditions and the following disclaimer.
43 * 2. Redistributions in binary form must reproduce the above copyright
44 * notice, this list of conditions and the following disclaimer in the
45 * documentation and/or other materials provided with the distribution.
46 * 3. All advertising materials mentioning features or use of this software
47 * must display the following acknowledgement:
48 * This product includes software developed by the University of
49 * California, Berkeley and its contributors.
50 * 4. Neither the name of the University nor the names of its contributors
51 * may be used to endorse or promote products derived from this software
52 * without specific prior written permission.
54 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
55 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
56 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
57 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
58 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
59 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
60 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
61 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
62 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
63 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
66 * @(#)tcp_timer.c 8.2 (Berkeley) 5/24/95
67 * $FreeBSD: src/sys/netinet/tcp_timer.c,v 1.34.2.14 2003/02/03 02:33:41 hsu Exp $
68 * $DragonFly: src/sys/netinet/tcp_timer.c,v 1.17 2008/03/30 20:39:01 dillon Exp $
71 #include "opt_compat.h"
72 #include "opt_inet6.h"
73 #include "opt_tcpdebug.h"
75 #include <sys/param.h>
76 #include <sys/systm.h>
77 #include <sys/kernel.h>
79 #include <sys/sysctl.h>
80 #include <sys/socket.h>
81 #include <sys/socketvar.h>
82 #include <sys/protosw.h>
83 #include <sys/thread.h>
84 #include <sys/globaldata.h>
85 #include <sys/thread2.h>
86 #include <sys/msgport2.h>
88 #include <machine/cpu.h> /* before tcp_seq.h, for tcp_random18() */
90 #include <net/route.h>
91 #include <net/netmsg2.h>
93 #include <netinet/in.h>
94 #include <netinet/in_systm.h>
95 #include <netinet/in_pcb.h>
97 #include <netinet6/in6_pcb.h>
99 #include <netinet/ip_var.h>
100 #include <netinet/tcp.h>
101 #include <netinet/tcp_fsm.h>
102 #include <netinet/tcp_seq.h>
103 #include <netinet/tcp_timer.h>
104 #include <netinet/tcp_timer2.h>
105 #include <netinet/tcp_var.h>
106 #include <netinet/tcpip.h>
108 #include <netinet/tcp_debug.h>
111 #define TCP_TIMER_REXMT 0x01
112 #define TCP_TIMER_PERSIST 0x02
113 #define TCP_TIMER_KEEP 0x04
114 #define TCP_TIMER_2MSL 0x08
115 #define TCP_TIMER_DELACK 0x10
117 static struct tcpcb
*tcp_timer_rexmt_handler(struct tcpcb
*);
118 static struct tcpcb
*tcp_timer_persist_handler(struct tcpcb
*);
119 static struct tcpcb
*tcp_timer_keep_handler(struct tcpcb
*);
120 static struct tcpcb
*tcp_timer_2msl_handler(struct tcpcb
*);
121 static struct tcpcb
*tcp_timer_delack_handler(struct tcpcb
*);
123 static const struct tcp_timer
{
125 struct tcpcb
*(*tt_handler
)(struct tcpcb
*);
126 } tcp_timer_handlers
[] = {
127 { TCP_TIMER_DELACK
, tcp_timer_delack_handler
},
128 { TCP_TIMER_REXMT
, tcp_timer_rexmt_handler
},
129 { TCP_TIMER_PERSIST
, tcp_timer_persist_handler
},
130 { TCP_TIMER_KEEP
, tcp_timer_keep_handler
},
131 { TCP_TIMER_2MSL
, tcp_timer_2msl_handler
},
136 sysctl_msec_to_ticks(SYSCTL_HANDLER_ARGS
)
140 tt
= *(int *)oidp
->oid_arg1
;
141 s
= (int)((int64_t)tt
* 1000 / hz
);
143 error
= sysctl_handle_int(oidp
, &s
, 0, req
);
144 if (error
|| !req
->newptr
)
147 tt
= (int)((int64_t)s
* hz
/ 1000);
151 *(int *)oidp
->oid_arg1
= tt
;
156 SYSCTL_PROC(_net_inet_tcp
, TCPCTL_KEEPINIT
, keepinit
, CTLTYPE_INT
|CTLFLAG_RW
,
157 &tcp_keepinit
, 0, sysctl_msec_to_ticks
, "I", "Time to establish TCP connection");
160 SYSCTL_PROC(_net_inet_tcp
, TCPCTL_KEEPIDLE
, keepidle
, CTLTYPE_INT
|CTLFLAG_RW
,
161 &tcp_keepidle
, 0, sysctl_msec_to_ticks
, "I", "Time before TCP keepalive probes begin");
164 SYSCTL_PROC(_net_inet_tcp
, TCPCTL_KEEPINTVL
, keepintvl
, CTLTYPE_INT
|CTLFLAG_RW
,
165 &tcp_keepintvl
, 0, sysctl_msec_to_ticks
, "I", "Time between TCP keepalive probes");
168 SYSCTL_PROC(_net_inet_tcp
, TCPCTL_DELACKTIME
, delacktime
,
169 CTLTYPE_INT
|CTLFLAG_RW
, &tcp_delacktime
, 0, sysctl_msec_to_ticks
, "I",
170 "Time before a delayed ACK is sent");
173 SYSCTL_PROC(_net_inet_tcp
, OID_AUTO
, msl
, CTLTYPE_INT
|CTLFLAG_RW
,
174 &tcp_msl
, 0, sysctl_msec_to_ticks
, "I", "Maximum segment lifetime");
177 SYSCTL_PROC(_net_inet_tcp
, OID_AUTO
, rexmit_min
, CTLTYPE_INT
|CTLFLAG_RW
,
178 &tcp_rexmit_min
, 0, sysctl_msec_to_ticks
, "I", "Minimum Retransmission Timeout");
181 SYSCTL_PROC(_net_inet_tcp
, OID_AUTO
, rexmit_slop
, CTLTYPE_INT
|CTLFLAG_RW
,
182 &tcp_rexmit_slop
, 0, sysctl_msec_to_ticks
, "I",
183 "Retransmission Timer Slop");
185 static int always_keepalive
= 1;
186 SYSCTL_INT(_net_inet_tcp
, OID_AUTO
, always_keepalive
, CTLFLAG_RW
,
187 &always_keepalive
, 0, "Assume SO_KEEPALIVE on all TCP connections");
189 /* max idle probes */
190 int tcp_keepcnt
= TCPTV_KEEPCNT
;
191 SYSCTL_INT(_net_inet_tcp
, OID_AUTO
, keepcnt
, CTLFLAG_RW
,
192 &tcp_keepcnt
, 0, "Maximum number of keepalive probes to be sent");
194 /* max idle time in persist */
195 int tcp_maxpersistidle
;
198 * Cancel all timers for TCP tp.
201 tcp_canceltimers(struct tcpcb
*tp
)
203 tcp_callout_stop(tp
, tp
->tt_2msl
);
204 tcp_callout_stop(tp
, tp
->tt_persist
);
205 tcp_callout_stop(tp
, tp
->tt_keep
);
206 tcp_callout_stop(tp
, tp
->tt_rexmt
);
210 * Caller should be in critical section
213 tcp_send_timermsg(struct tcpcb
*tp
, uint32_t task
)
215 struct netmsg_tcp_timer
*tmsg
= tp
->tt_msg
;
217 KKASSERT(tmsg
!= NULL
&& tmsg
->tt_cpuid
== mycpuid
&&
218 tmsg
->tt_tcb
!= NULL
);
220 tmsg
->tt_tasks
|= task
;
221 if (tmsg
->tt_msg
.lmsg
.ms_flags
& MSGF_DONE
)
222 lwkt_sendmsg(tmsg
->tt_msgport
, &tmsg
->tt_msg
.lmsg
);
225 int tcp_syn_backoff
[TCP_MAXRXTSHIFT
+ 1] =
226 { 1, 1, 1, 1, 1, 2, 4, 8, 16, 32, 64, 64, 64 };
228 int tcp_syn_backoff_low
[TCP_MAXRXTSHIFT
+ 1] =
229 { 1, 2, 4, 4, 4, 8, 16, 16, 32, 64, 64, 64, 64 };
231 int tcp_backoff
[TCP_MAXRXTSHIFT
+ 1] =
232 { 1, 2, 4, 8, 16, 32, 64, 64, 64, 64, 64, 64, 64 };
234 static int tcp_totbackoff
= 511; /* sum of tcp_backoff[] */
236 /* Caller should be in critical section */
237 static struct tcpcb
*
238 tcp_timer_delack_handler(struct tcpcb
*tp
)
240 tp
->t_flags
|= TF_ACKNOW
;
241 tcpstat
.tcps_delack
++;
247 * TCP timer processing.
250 tcp_timer_delack(void *xtp
)
252 struct tcpcb
*tp
= xtp
;
253 struct callout
*co
= &tp
->tt_delack
->tc_callout
;
256 if (callout_pending(co
) || !callout_active(co
)) {
260 callout_deactivate(co
);
261 tcp_send_timermsg(tp
, TCP_TIMER_DELACK
);
265 /* Caller should be in critical section */
266 static struct tcpcb
*
267 tcp_timer_2msl_handler(struct tcpcb
*tp
)
274 ostate
= tp
->t_state
;
277 * 2 MSL timeout in shutdown went off. If we're closed but
278 * still waiting for peer to close and connection has been idle
279 * too long, or if 2MSL time is up from TIME_WAIT, delete connection
280 * control block. Otherwise, check again in a bit.
282 if (tp
->t_state
!= TCPS_TIME_WAIT
&&
283 (ticks
- tp
->t_rcvtime
) <= tp
->t_maxidle
) {
284 tcp_callout_reset(tp
, tp
->tt_2msl
, tp
->t_keepintvl
,
291 if (tp
&& (tp
->t_inpcb
->inp_socket
->so_options
& SO_DEBUG
))
292 tcp_trace(TA_USER
, ostate
, tp
, NULL
, NULL
, PRU_SLOWTIMO
);
298 tcp_timer_2msl(void *xtp
)
300 struct tcpcb
*tp
= xtp
;
301 struct callout
*co
= &tp
->tt_2msl
->tc_callout
;
304 if (callout_pending(co
) || !callout_active(co
)) {
308 callout_deactivate(co
);
309 tcp_send_timermsg(tp
, TCP_TIMER_2MSL
);
313 /* Caller should be in critical section */
314 static struct tcpcb
*
315 tcp_timer_keep_handler(struct tcpcb
*tp
)
317 struct tcptemp
*t_template
;
321 int keepidle
= tcp_getkeepidle(tp
);
324 ostate
= tp
->t_state
;
327 * Keep-alive timer went off; send something
328 * or drop connection if idle for too long.
330 tcpstat
.tcps_keeptimeo
++;
331 if (tp
->t_state
< TCPS_ESTABLISHED
)
333 if ((always_keepalive
|| (tp
->t_flags
& TF_KEEPALIVE
) ||
334 (tp
->t_inpcb
->inp_socket
->so_options
& SO_KEEPALIVE
)) &&
335 tp
->t_state
<= TCPS_CLOSING
) {
336 if ((ticks
- tp
->t_rcvtime
) >= keepidle
+ tp
->t_maxidle
)
339 * Send a packet designed to force a response
340 * if the peer is up and reachable:
341 * either an ACK if the connection is still alive,
342 * or an RST if the peer has closed the connection
343 * due to timeout or reboot.
344 * Using sequence number tp->snd_una-1
345 * causes the transmitted zero-length segment
346 * to lie outside the receive window;
347 * by the protocol spec, this requires the
348 * correspondent TCP to respond.
350 tcpstat
.tcps_keepprobe
++;
351 t_template
= tcp_maketemplate(tp
);
353 tcp_respond(tp
, t_template
->tt_ipgen
,
354 &t_template
->tt_t
, NULL
,
355 tp
->rcv_nxt
, tp
->snd_una
- 1, 0);
356 tcp_freetemplate(t_template
);
358 tcp_callout_reset(tp
, tp
->tt_keep
, tp
->t_keepintvl
,
361 tcp_callout_reset(tp
, tp
->tt_keep
, keepidle
,
366 if (tp
->t_inpcb
->inp_socket
->so_options
& SO_DEBUG
)
367 tcp_trace(TA_USER
, ostate
, tp
, NULL
, NULL
, PRU_SLOWTIMO
);
372 tcpstat
.tcps_keepdrops
++;
373 tp
= tcp_drop(tp
, ETIMEDOUT
);
376 if (tp
&& (tp
->t_inpcb
->inp_socket
->so_options
& SO_DEBUG
))
377 tcp_trace(TA_USER
, ostate
, tp
, NULL
, NULL
, PRU_SLOWTIMO
);
383 tcp_timer_keep(void *xtp
)
385 struct tcpcb
*tp
= xtp
;
386 struct callout
*co
= &tp
->tt_keep
->tc_callout
;
389 if (callout_pending(co
) || !callout_active(co
)) {
393 callout_deactivate(co
);
394 tcp_send_timermsg(tp
, TCP_TIMER_KEEP
);
398 /* Caller should be in critical section */
399 static struct tcpcb
*
400 tcp_timer_persist_handler(struct tcpcb
*tp
)
407 ostate
= tp
->t_state
;
410 * Persistance timer into zero window.
411 * Force a byte to be output, if possible.
413 tcpstat
.tcps_persisttimeo
++;
415 * Hack: if the peer is dead/unreachable, we do not
416 * time out if the window is closed. After a full
417 * backoff, drop the connection if the idle time
418 * (no responses to probes) reaches the maximum
419 * backoff that we would use if retransmitting.
421 if (tp
->t_rxtshift
== TCP_MAXRXTSHIFT
&&
422 ((ticks
- tp
->t_rcvtime
) >= tcp_maxpersistidle
||
423 (ticks
- tp
->t_rcvtime
) >= TCP_REXMTVAL(tp
) * tcp_totbackoff
)) {
424 tcpstat
.tcps_persistdrop
++;
425 tp
= tcp_drop(tp
, ETIMEDOUT
);
429 tp
->t_flags
|= TF_FORCE
;
431 tp
->t_flags
&= ~TF_FORCE
;
435 if (tp
&& tp
->t_inpcb
->inp_socket
->so_options
& SO_DEBUG
)
436 tcp_trace(TA_USER
, ostate
, tp
, NULL
, NULL
, PRU_SLOWTIMO
);
442 tcp_timer_persist(void *xtp
)
444 struct tcpcb
*tp
= xtp
;
445 struct callout
*co
= &tp
->tt_persist
->tc_callout
;
448 if (callout_pending(co
) || !callout_active(co
)){
452 callout_deactivate(co
);
453 tcp_send_timermsg(tp
, TCP_TIMER_PERSIST
);
458 tcp_save_congestion_state(struct tcpcb
*tp
)
460 tp
->snd_cwnd_prev
= tp
->snd_cwnd
;
461 tp
->snd_wacked_prev
= tp
->snd_wacked
;
462 tp
->snd_ssthresh_prev
= tp
->snd_ssthresh
;
463 tp
->snd_recover_prev
= tp
->snd_recover
;
464 if (IN_FASTRECOVERY(tp
))
465 tp
->t_flags
|= TF_WASFRECOVERY
;
467 tp
->t_flags
&= ~TF_WASFRECOVERY
;
468 if (tp
->t_flags
& TF_RCVD_TSTMP
) {
469 tp
->t_rexmtTS
= ticks
;
470 tp
->t_flags
|= TF_FIRSTACCACK
;
473 tcp_sack_save_scoreboard(&tp
->scb
);
478 tcp_revert_congestion_state(struct tcpcb
*tp
)
480 tp
->snd_cwnd
= tp
->snd_cwnd_prev
;
481 tp
->snd_wacked
= tp
->snd_wacked_prev
;
482 tp
->snd_ssthresh
= tp
->snd_ssthresh_prev
;
483 tp
->snd_recover
= tp
->snd_recover_prev
;
484 if (tp
->t_flags
& TF_WASFRECOVERY
)
485 ENTER_FASTRECOVERY(tp
);
486 if (tp
->t_flags
& TF_FASTREXMT
) {
487 ++tcpstat
.tcps_sndfastrexmitbad
;
488 if (tp
->t_flags
& TF_EARLYREXMT
)
489 ++tcpstat
.tcps_sndearlyrexmitbad
;
491 ++tcpstat
.tcps_sndrtobad
;
494 tp
->snd_nxt
= tp
->snd_max
;
496 tcp_sack_revert_scoreboard(&tp
->scb
, tp
->snd_una
);
500 /* Caller should be in critical section */
501 static struct tcpcb
*
502 tcp_timer_rexmt_handler(struct tcpcb
*tp
)
510 ostate
= tp
->t_state
;
513 * Retransmission timer went off. Message has not
514 * been acked within retransmit interval. Back off
515 * to a longer retransmit interval and retransmit one segment.
517 if (++tp
->t_rxtshift
> TCP_MAXRXTSHIFT
) {
518 tp
->t_rxtshift
= TCP_MAXRXTSHIFT
;
519 tcpstat
.tcps_timeoutdrop
++;
520 tp
= tcp_drop(tp
, tp
->t_softerror
?
521 tp
->t_softerror
: ETIMEDOUT
);
524 if (tp
->t_rxtshift
== 1) {
526 * first retransmit; record ssthresh and cwnd so they can
527 * be recovered if this turns out to be a "bad" retransmit.
528 * A retransmit is considered "bad" if an ACK for this
529 * segment is received within RTT/2 interval; the assumption
530 * here is that the ACK was already in flight. See
531 * "On Estimating End-to-End Network Path Properties" by
532 * Allman and Paxson for more details.
534 tp
->t_badrxtwin
= ticks
+ (tp
->t_srtt
>> (TCP_RTT_SHIFT
+ 1));
535 tcp_save_congestion_state(tp
);
536 tp
->t_flags
&= ~(TF_FASTREXMT
| TF_EARLYREXMT
);
538 if (tp
->t_state
== TCPS_SYN_SENT
||
539 tp
->t_state
== TCPS_SYN_RECEIVED
) {
541 * Record that SYN or SYN|ACK was lost.
542 * Needed by RFC3390 and RFC6298.
544 tp
->t_flags
|= TF_SYN_WASLOST
;
547 /* Throw away SACK blocks on a RTO, as specified by RFC2018. */
548 tcp_sack_cleanup(&tp
->scb
);
549 tcpstat
.tcps_rexmttimeo
++;
550 if (tp
->t_state
== TCPS_SYN_SENT
) {
551 if (tcp_low_rtobase
) {
552 rexmt
= TCP_REXMTVAL(tp
) *
553 tcp_syn_backoff_low
[tp
->t_rxtshift
];
555 rexmt
= TCP_REXMTVAL(tp
) *
556 tcp_syn_backoff
[tp
->t_rxtshift
];
559 rexmt
= TCP_REXMTVAL(tp
) * tcp_backoff
[tp
->t_rxtshift
];
561 TCPT_RANGESET(tp
->t_rxtcur
, rexmt
,
562 tp
->t_rttmin
, TCPTV_REXMTMAX
);
564 * If losing, let the lower level know and try for
565 * a better route. Also, if we backed off this far,
566 * our srtt estimate is probably bogus. Clobber it
567 * so we'll take the next rtt measurement as our srtt;
568 * move the current srtt into rttvar to keep the current
569 * retransmit times until then.
571 if (tp
->t_rxtshift
> TCP_MAXRXTSHIFT
/ 4) {
573 if ((tp
->t_inpcb
->inp_vflag
& INP_IPV6
) != 0)
574 in6_losing(tp
->t_inpcb
);
577 in_losing(tp
->t_inpcb
);
578 tp
->t_rttvar
+= (tp
->t_srtt
>> TCP_RTT_SHIFT
);
581 tp
->snd_nxt
= tp
->snd_una
;
582 tp
->rexmt_high
= tp
->snd_una
;
583 tp
->snd_recover
= tp
->snd_max
;
585 * Force a segment to be sent.
587 tp
->t_flags
|= TF_ACKNOW
;
589 * If timing a segment in this window, stop the timer.
593 * Close the congestion window down to one segment
594 * (we'll open it by one segment for each ack we get).
595 * Since we probably have a window's worth of unacked
596 * data accumulated, this "slow start" keeps us from
597 * dumping all that data as back-to-back packets (which
598 * might overwhelm an intermediate gateway).
600 * There are two phases to the opening: Initially we
601 * open by one mss on each ack. This makes the window
602 * size increase exponentially with time. If the
603 * window is larger than the path can handle, this
604 * exponential growth results in dropped packet(s)
605 * almost immediately. To get more time between
606 * drops but still "push" the network to take advantage
607 * of improving conditions, we switch from exponential
608 * to linear window opening at some threshhold size.
609 * For a threshhold, we use half the current window
610 * size, truncated to a multiple of the mss.
612 * (the minimum cwnd that will give us exponential
613 * growth is 2 mss. We don't allow the threshhold
617 u_int win
= min(tp
->snd_wnd
, tp
->snd_cwnd
) / 2 / tp
->t_maxseg
;
621 tp
->snd_cwnd
= tp
->t_maxseg
;
623 tp
->snd_ssthresh
= win
* tp
->t_maxseg
;
626 EXIT_FASTRECOVERY(tp
);
631 if (tp
&& (tp
->t_inpcb
->inp_socket
->so_options
& SO_DEBUG
))
632 tcp_trace(TA_USER
, ostate
, tp
, NULL
, NULL
, PRU_SLOWTIMO
);
638 tcp_timer_rexmt(void *xtp
)
640 struct tcpcb
*tp
= xtp
;
641 struct callout
*co
= &tp
->tt_rexmt
->tc_callout
;
644 if (callout_pending(co
) || !callout_active(co
)) {
648 callout_deactivate(co
);
649 tcp_send_timermsg(tp
, TCP_TIMER_REXMT
);
654 tcp_timer_handler(netmsg_t msg
)
656 struct netmsg_tcp_timer
*tmsg
= (struct netmsg_tcp_timer
*)msg
;
657 const struct tcp_timer
*tt
;
662 KKASSERT(tmsg
->tt_cpuid
== mycpuid
&& tmsg
->tt_tcb
!= NULL
);
665 /* Save pending tasks and reset the tasks in message */
666 tmsg
->tt_running_tasks
= tmsg
->tt_tasks
;
667 tmsg
->tt_prev_tasks
= tmsg
->tt_tasks
;
671 lwkt_replymsg(&tmsg
->tt_msg
.lmsg
, 0);
673 if (tmsg
->tt_running_tasks
== 0) {
675 * All of the timers are cancelled when the message
676 * is pending; bail out.
682 for (tt
= tcp_timer_handlers
; tt
->tt_handler
!= NULL
; ++tt
) {
683 if ((tmsg
->tt_running_tasks
& tt
->tt_task
) == 0)
686 tmsg
->tt_running_tasks
&= ~tt
->tt_task
;
687 tp
= tt
->tt_handler(tp
);
691 if (tmsg
->tt_running_tasks
== 0) /* nothing left to do */
699 tcp_create_timermsg(struct tcpcb
*tp
, struct lwkt_port
*msgport
)
701 struct netmsg_tcp_timer
*tmsg
= tp
->tt_msg
;
703 netmsg_init(&tmsg
->tt_msg
, NULL
, &netisr_adone_rport
,
704 MSGF_DROPABLE
| MSGF_PRIORITY
, tcp_timer_handler
);
705 tmsg
->tt_cpuid
= mycpuid
;
706 tmsg
->tt_msgport
= msgport
;
712 tcp_destroy_timermsg(struct tcpcb
*tp
)
714 struct netmsg_tcp_timer
*tmsg
= tp
->tt_msg
;
716 if (tmsg
== NULL
|| /* listen socket */
717 tmsg
->tt_tcb
== NULL
) /* only tcp_attach() is called */
720 KKASSERT(tmsg
->tt_cpuid
== mycpuid
);
722 if ((tmsg
->tt_msg
.lmsg
.ms_flags
& MSGF_DONE
) == 0) {
724 * This message is still pending to be processed;
727 lwkt_dropmsg(&tmsg
->tt_msg
.lmsg
);
733 tcp_callout_init(struct tcp_callout
*tc
, uint32_t task
)
735 callout_init_mp(&tc
->tc_callout
);
740 tcp_inittimers(struct tcpcb
*tp
)
742 tcp_callout_init(tp
->tt_rexmt
, TCP_TIMER_REXMT
);
743 tcp_callout_init(tp
->tt_persist
, TCP_TIMER_PERSIST
);
744 tcp_callout_init(tp
->tt_keep
, TCP_TIMER_KEEP
);
745 tcp_callout_init(tp
->tt_2msl
, TCP_TIMER_2MSL
);
746 tcp_callout_init(tp
->tt_delack
, TCP_TIMER_DELACK
);