patchable tcp_delack; fix rxtshift calculation
[unix-history] / usr / src / sys / netinet / tcp_output.c
CommitLineData
89413846 1/* tcp_output.c 4.25 81/12/20 */
76ee76df
BJ
2
3#include "../h/param.h"
4#include "../h/systm.h"
5#include "../h/mbuf.h"
405c9168 6#include "../h/protosw.h"
76ee76df 7#include "../h/socket.h"
d52566dd 8#include "../h/socketvar.h"
0974b45c
BJ
9#include "../net/in.h"
10#include "../net/in_pcb.h"
11#include "../net/in_systm.h"
d52566dd 12#include "../net/ip.h"
eb44bfb2 13#include "../net/ip_var.h"
d52566dd 14#include "../net/tcp.h"
0974b45c 15#define TCPOUTFLAGS
d52566dd 16#include "../net/tcp_fsm.h"
0974b45c
BJ
17#include "../net/tcp_seq.h"
18#include "../net/tcp_timer.h"
19#include "../net/tcp_var.h"
20#include "../net/tcpip.h"
f1dd32da 21#include "../net/tcp_debug.h"
f1b2fa5b 22#include "../errno.h"
76ee76df 23
4aed14e3 24char *tcpstates[]; /* XXX */
ea727f86 25/*
4aed14e3 26 * Tcp output routine: figure out what should be sent and send it.
ea727f86 27 */
a6503abf 28tcp_output(tp)
53a5409e 29 register struct tcpcb *tp;
ea727f86 30{
53a5409e 31 register struct socket *so = tp->t_inpcb->inp_socket;
a6503abf
BJ
32 register int len;
33 struct mbuf *m0;
34 int off, flags;
35 register struct mbuf *m;
36 register struct tcpiphdr *ti;
37 int win;
76ee76df 38
a6503abf 39COUNT(TCP_OUTPUT);
76ee76df 40
a6503abf 41 /*
0974b45c
BJ
42 * Determine length of data that can be transmitted,
43 * and flags that will be used.
44 * If there is some data or critical controls (SYN, RST)
45 * to send, then transmit; otherwise, investigate further.
a6503abf
BJ
46 */
47 off = tp->snd_nxt - tp->snd_una;
405c9168 48 len = MIN(so->so_snd.sb_cc, tp->snd_wnd+tp->t_force) - off;
0974b45c
BJ
49 if (len > tp->t_maxseg)
50 len = tp->t_maxseg;
4aed14e3
BJ
51 if (len < 0)
52 len = 0; /* FIN can cause -1 */
0974b45c 53 flags = tcp_outflags[tp->t_state];
405c9168
BJ
54 if (len < so->so_snd.sb_cc)
55 flags &= ~TH_FIN;
0974b45c 56 if (len || (flags & (TH_SYN|TH_RST)))
a6503abf
BJ
57 goto send;
58
59 /*
0974b45c 60 * See if we owe peer an ACK or have a unacked FIN to send.
a6503abf 61 */
0974b45c 62 if (tp->t_flags & TF_ACKNOW)
a6503abf 63 goto send;
0974b45c
BJ
64 if ((so->so_state & SS_CANTSENDMORE) &&
65 TCPS_OURFINNOTACKED(tp->t_state))
a6503abf 66 goto send;
76ee76df 67
a6503abf
BJ
68 /*
69 * Calculate available window in i, and also amount
70 * of window known to peer (as advertised window less
71 * next expected input.) If this is 35% or more of the
72 * maximum possible window, then want to send a segment to peer.
73 */
0974b45c
BJ
74 win = sbspace(&so->so_rcv);
75 if (win > 0 &&
76 ((100*(win-(tp->rcv_adv-tp->rcv_nxt))/so->so_rcv.sb_hiwat) >= 35))
a6503abf
BJ
77 goto send;
78
79 /*
80 * No reason to send a segment, just return.
81 */
f1b2fa5b 82 return (0);
a6503abf
BJ
83
84send:
85 /*
86 * Grab a header mbuf, attaching a copy of data to
87 * be transmitted, and initialize the header from
88 * the template for sends on this connection.
89 */
76ee76df
BJ
90 MGET(m, 0);
91 if (m == 0)
92 return (0);
4aed14e3 93 m->m_off = MMAXOFF - sizeof (struct tcpiphdr);
53a5409e 94 m->m_len = sizeof (struct tcpiphdr);
a6503abf
BJ
95 if (len) {
96 m->m_next = m_copy(so->so_snd.sb_mb, off, len);
97 if (m->m_next == 0)
98 len = 0;
99 }
100 ti = mtod(m, struct tcpiphdr *);
101 if (tp->t_template == 0)
102 panic("tcp_output");
f1b2fa5b 103 bcopy((caddr_t)tp->t_template, (caddr_t)ti, sizeof (struct tcpiphdr));
a6503abf
BJ
104
105 /*
106 * Fill in fields, remembering maximum advertised
107 * window for use in delaying messages about window sizes.
108 */
4aed14e3
BJ
109 ti->ti_seq = tp->snd_nxt;
110 ti->ti_ack = tp->rcv_nxt;
111#if vax
112 ti->ti_seq = htonl(ti->ti_seq);
113 ti->ti_ack = htonl(ti->ti_ack);
114#endif
0974b45c 115 if (tp->t_tcpopt) {
f1b2fa5b 116 m0 = m->m_next;
0974b45c
BJ
117 m->m_next = m_get(0);
118 if (m->m_next == 0) {
119 (void) m_free(m);
f1b2fa5b 120 m_freem(m);
0974b45c
BJ
121 return (0);
122 }
123 m->m_next->m_next = m0;
124 m->m_off = MMINOFF;
125 m->m_len = tp->t_tcpopt->m_len;
126 bcopy(mtod(tp->t_tcpopt, caddr_t), mtod(m, caddr_t),
f1b2fa5b 127 (unsigned)tp->t_tcpopt->m_len);
0974b45c
BJ
128 ti->ti_off = (sizeof (struct tcphdr)+tp->t_tcpopt->m_len) >> 2;
129 }
130 ti->ti_flags = flags;
a6503abf
BJ
131 win = sbspace(&so->so_rcv);
132 if (win > 0)
f1b2fa5b 133 ti->ti_win = htons((u_short)win);
0974b45c
BJ
134 if (SEQ_GT(tp->snd_up, tp->snd_nxt)) {
135 ti->ti_urp = htons((u_short)(tp->snd_up - tp->snd_nxt));
a6503abf
BJ
136 ti->ti_flags |= TH_URG;
137 } else
138 /*
139 * If no urgent pointer to send, then we pull
140 * the urgent pointer to the left edge of the send window
141 * so that it doesn't drift into the send window on sequence
142 * number wraparound.
143 */
0974b45c
BJ
144 tp->snd_up = tp->snd_una; /* drag it along */
145 /* PUSH */
a6503abf
BJ
146
147 /*
148 * Put TCP length in extended header, and then
149 * checksum extended header and data.
150 */
151 if (len)
152 ti->ti_len = htons((u_short)(len + sizeof (struct tcphdr)));
0974b45c
BJ
153 ti->ti_sum = in_cksum(m, sizeof (struct tcpiphdr) + len);
154
155 /*
156 * Advance snd_nxt over sequence space of this segment
157 */
158 if (flags & (TH_SYN|TH_FIN))
4aed14e3 159 tp->snd_nxt++;
0974b45c
BJ
160 tp->snd_nxt += len;
161
162 /*
405c9168 163 * If this transmission closes the window,
4aed14e3
BJ
164 * start persistance timer at 2 round trip times
165 * but at least TCPTV_PERSMIN ticks.
0974b45c 166 */
89413846
BJ
167 if (TCPS_HAVERCVDSYN(tp->t_state) &&
168 SEQ_GT(tp->snd_nxt, tp->snd_una+tp->snd_wnd) &&
4aed14e3
BJ
169 tp->t_timer[TCPT_PERSIST] == 0)
170 TCPT_RANGESET(tp->t_timer[TCPT_PERSIST],
171 2 * tp->t_srtt, TCPTV_PERSMIN, TCPTV_MAX);
405c9168
BJ
172
173 /*
174 * Time this transmission if not a retransmission and
175 * not currently timing anything.
176 */
177 if (SEQ_GT(tp->snd_nxt, tp->snd_max) && tp->t_rtt == 0) {
178 tp->t_rtt = 1;
179 tp->t_rtseq = tp->snd_nxt - len;
180 }
181
182 /*
183 * Set retransmit timer if not currently set.
4aed14e3 184 * Initial value for retransmit timer to tcp_beta*tp->t_srtt.
405c9168
BJ
185 * Initialize shift counter which is used for exponential
186 * backoff of retransmit time.
187 */
4aed14e3
BJ
188 if (tp->t_timer[TCPT_REXMT] == 0 && tp->snd_nxt != tp->snd_una) {
189 TCPT_RANGESET(tp->t_timer[TCPT_REXMT],
190 tcp_beta * tp->t_srtt, TCPTV_MIN, TCPTV_MAX);
405c9168 191 tp->t_rxtshift = 0;
0974b45c 192 }
a6503abf 193
f1dd32da
BJ
194 /*
195 * Trace.
196 */
197 if (tp->t_inpcb->inp_socket->so_options & SO_DEBUG)
198 tcp_trace(TA_OUTPUT, tp->t_state, tp, ti, 0);
199
a6503abf
BJ
200 /*
201 * Fill in IP length and desired time to live and
202 * send to IP level.
203 */
204 ((struct ip *)ti)->ip_len = len + sizeof (struct tcpiphdr);
205 ((struct ip *)ti)->ip_ttl = TCP_TTL;
be43ac7f 206 if (ip_output(m, tp->t_ipopt) == 0)
0974b45c 207 return (0);
a6503abf
BJ
208
209 /*
210 * Data sent (as far as we can tell).
211 * If this advertises a larger window than any other segment,
4aed14e3 212 * then remember the size of the advertised window.
0974b45c 213 * Drop send for purpose of ACK requirements.
a6503abf 214 */
be43ac7f 215 if (win > 0 && SEQ_GT(tp->rcv_nxt+win, tp->rcv_adv))
a6503abf 216 tp->rcv_adv = tp->rcv_nxt + win;
0974b45c 217 tp->t_flags &= ~(TF_ACKNOW|TF_DELACK);
4aed14e3
BJ
218 if (SEQ_GT(tp->snd_nxt, tp->snd_max))
219 tp->snd_max = tp->snd_nxt;
0974b45c 220 return (1);
76ee76df 221}