Commit | Line | Data |
---|---|---|
f4d55810 | 1 | /* tcp_usrreq.c 1.74 83/02/10 */ |
72f24d7d | 2 | |
4eb5d593 | 3 | #include "../h/param.h" |
72f24d7d | 4 | #include "../h/systm.h" |
dad64fdf BJ |
5 | #include "../h/mbuf.h" |
6 | #include "../h/socket.h" | |
eee3ab16 BJ |
7 | #include "../h/socketvar.h" |
8 | #include "../h/protosw.h" | |
f4d55810 | 9 | #include "../h/errno.h" |
6e7edb25 BJ |
10 | |
11 | #include "../net/if.h" | |
c124e997 | 12 | #include "../net/route.h" |
f4d55810 | 13 | |
6e7edb25 | 14 | #include "../netinet/in.h" |
839fe741 BJ |
15 | #include "../netinet/in_pcb.h" |
16 | #include "../netinet/in_systm.h" | |
839fe741 BJ |
17 | #include "../netinet/ip.h" |
18 | #include "../netinet/ip_var.h" | |
19 | #include "../netinet/tcp.h" | |
20 | #include "../netinet/tcp_fsm.h" | |
21 | #include "../netinet/tcp_seq.h" | |
22 | #include "../netinet/tcp_timer.h" | |
23 | #include "../netinet/tcp_var.h" | |
24 | #include "../netinet/tcpip.h" | |
25 | #include "../netinet/tcp_debug.h" | |
eee3ab16 | 26 | |
290e0b0a BJ |
27 | /* |
28 | * TCP protocol interface to socket abstraction. | |
29 | */ | |
30 | extern char *tcpstates[]; | |
4ad99bae | 31 | struct tcpcb *tcp_newtcpcb(); |
290e0b0a | 32 | |
9c5022e3 | 33 | /* |
290e0b0a | 34 | * Process a TCP user request for TCP tb. If this is a send request |
9c5022e3 BJ |
35 | * then m is the mbuf chain of send data. If this is a timer expiration |
36 | * (called from the software clock routine), then timertype tells which timer. | |
37 | */ | |
a8d3bf7f | 38 | /*ARGSUSED*/ |
bc031e39 | 39 | tcp_usrreq(so, req, m, nam) |
eee3ab16 BJ |
40 | struct socket *so; |
41 | int req; | |
8075bb0e | 42 | struct mbuf *m, *nam; |
4eb5d593 | 43 | { |
53a5409e | 44 | register struct inpcb *inp = sotoinpcb(so); |
cdad2eb1 | 45 | register struct tcpcb *tp; |
72f24d7d | 46 | int s = splnet(); |
eee3ab16 | 47 | int error = 0; |
17b82ed4 | 48 | int ostate; |
72f24d7d | 49 | |
53a5409e | 50 | /* |
290e0b0a BJ |
51 | * When a TCP is attached to a socket, then there will be |
52 | * a (struct inpcb) pointed at by the socket, and this | |
53 | * structure will point at a subsidary (struct tcpcb). | |
53a5409e | 54 | */ |
0974b45c | 55 | if (inp == 0 && req != PRU_ATTACH) { |
a6503abf | 56 | splx(s); |
290e0b0a | 57 | return (EINVAL); /* XXX */ |
a6503abf BJ |
58 | } |
59 | if (inp) { | |
cdad2eb1 | 60 | tp = intotcpcb(inp); |
8075bb0e | 61 | /* WHAT IF TP IS 0? */ |
9c5022e3 | 62 | #ifdef KPROF |
a6503abf | 63 | tcp_acounts[tp->t_state][req]++; |
9c5022e3 | 64 | #endif |
17b82ed4 | 65 | ostate = tp->t_state; |
ebf42a75 BJ |
66 | } else |
67 | ostate = 0; | |
eee3ab16 | 68 | switch (req) { |
4eb5d593 | 69 | |
290e0b0a BJ |
70 | /* |
71 | * TCP attaches to socket via PRU_ATTACH, reserving space, | |
8075bb0e | 72 | * and an internet control block. |
290e0b0a | 73 | */ |
eee3ab16 | 74 | case PRU_ATTACH: |
4ad99bae | 75 | if (inp) { |
eee3ab16 | 76 | error = EISCONN; |
cdad2eb1 | 77 | break; |
53a5409e | 78 | } |
a1edc12b | 79 | error = tcp_attach(so); |
a6503abf | 80 | if (error) |
4ad99bae | 81 | break; |
0e3936fa | 82 | if ((so->so_options & SO_LINGER) && so->so_linger == 0) |
8e65fd66 | 83 | so->so_linger = TCP_LINGERTIME; |
290e0b0a | 84 | tp = sototcpcb(so); |
72f24d7d | 85 | break; |
4eb5d593 | 86 | |
290e0b0a BJ |
87 | /* |
88 | * PRU_DETACH detaches the TCP protocol from the socket. | |
89 | * If the protocol state is non-embryonic, then can't | |
90 | * do this directly: have to initiate a PRU_DISCONNECT, | |
91 | * which may finish later; embryonic TCB's can just | |
92 | * be discarded here. | |
93 | */ | |
eee3ab16 | 94 | case PRU_DETACH: |
290e0b0a | 95 | if (tp->t_state > TCPS_LISTEN) |
0e3936fa SL |
96 | tp = tcp_disconnect(tp); |
97 | else | |
98 | tp = tcp_close(tp); | |
eee3ab16 BJ |
99 | break; |
100 | ||
8075bb0e BJ |
101 | /* |
102 | * Give the socket an address. | |
103 | */ | |
104 | case PRU_BIND: | |
105 | error = in_pcbbind(inp, nam); | |
106 | if (error) | |
107 | break; | |
108 | break; | |
109 | ||
110 | /* | |
111 | * Prepare to accept connections. | |
112 | */ | |
113 | case PRU_LISTEN: | |
114 | if (inp->inp_lport == 0) | |
115 | error = in_pcbbind(inp, (struct mbuf *)0); | |
116 | if (error == 0) | |
117 | tp->t_state = TCPS_LISTEN; | |
118 | break; | |
119 | ||
290e0b0a BJ |
120 | /* |
121 | * Initiate connection to peer. | |
122 | * Create a template for use in transmissions on this connection. | |
123 | * Enter SYN_SENT state, and mark socket as connecting. | |
124 | * Start keep-alive timer, and seed output sequence space. | |
125 | * Send initial segment on connection. | |
126 | */ | |
eee3ab16 | 127 | case PRU_CONNECT: |
8075bb0e BJ |
128 | if (inp->inp_lport == 0) { |
129 | error = in_pcbbind(inp, (struct mbuf *)0); | |
130 | if (error) | |
131 | break; | |
132 | } | |
133 | error = in_pcbconnect(inp, nam); | |
4ad99bae | 134 | if (error) |
53a5409e | 135 | break; |
b454c3ea | 136 | tp->t_template = tcp_template(tp); |
290e0b0a BJ |
137 | if (tp->t_template == 0) { |
138 | in_pcbdisconnect(inp); | |
139 | error = ENOBUFS; | |
140 | break; | |
141 | } | |
53a5409e | 142 | soisconnecting(so); |
a6503abf | 143 | tp->t_state = TCPS_SYN_SENT; |
4aed14e3 BJ |
144 | tp->t_timer[TCPT_KEEP] = TCPTV_KEEP; |
145 | tp->iss = tcp_iss; tcp_iss += TCP_ISSINCR/2; | |
146 | tcp_sendseqinit(tp); | |
8a2f82db | 147 | error = tcp_output(tp); |
72f24d7d | 148 | break; |
4eb5d593 | 149 | |
290e0b0a BJ |
150 | /* |
151 | * Initiate disconnect from peer. | |
152 | * If connection never passed embryonic stage, just drop; | |
153 | * else if don't need to let data drain, then can just drop anyways, | |
154 | * else have to begin TCP shutdown process: mark socket disconnecting, | |
155 | * drain unread data, state switch to reflect user close, and | |
156 | * send segment (e.g. FIN) to peer. Socket will be really disconnected | |
157 | * when peer sends FIN and acks ours. | |
158 | * | |
159 | * SHOULD IMPLEMENT LATER PRU_CONNECT VIA REALLOC TCPCB. | |
160 | */ | |
161 | case PRU_DISCONNECT: | |
0e3936fa | 162 | tp = tcp_disconnect(tp); |
4aed14e3 BJ |
163 | break; |
164 | ||
290e0b0a BJ |
165 | /* |
166 | * Accept a connection. Essentially all the work is | |
167 | * done at higher levels; just return the address | |
168 | * of the peer, storing through addr. | |
169 | */ | |
1acff8ec | 170 | case PRU_ACCEPT: { |
8075bb0e | 171 | struct sockaddr_in *sin = mtod(nam, struct sockaddr_in *); |
1acff8ec | 172 | |
8075bb0e BJ |
173 | nam->m_len = sizeof (struct sockaddr_in); |
174 | sin->sin_family = AF_INET; | |
175 | sin->sin_port = inp->inp_fport; | |
176 | sin->sin_addr = inp->inp_faddr; | |
eee3ab16 | 177 | break; |
8075bb0e | 178 | } |
eee3ab16 | 179 | |
290e0b0a BJ |
180 | /* |
181 | * Mark the connection as being incapable of further output. | |
182 | */ | |
eee3ab16 | 183 | case PRU_SHUTDOWN: |
0974b45c | 184 | socantsendmore(so); |
0e3936fa SL |
185 | tp = tcp_usrclosed(tp); |
186 | if (tp) | |
187 | error = tcp_output(tp); | |
72f24d7d BJ |
188 | break; |
189 | ||
290e0b0a BJ |
190 | /* |
191 | * After a receive, possibly send window update to peer. | |
192 | */ | |
eee3ab16 | 193 | case PRU_RCVD: |
f1b2fa5b | 194 | (void) tcp_output(tp); |
72f24d7d BJ |
195 | break; |
196 | ||
290e0b0a BJ |
197 | /* |
198 | * Do a send by putting data in output queue and updating urgent | |
199 | * marker if URG set. Possibly send more data. | |
200 | */ | |
eee3ab16 | 201 | case PRU_SEND: |
a6503abf | 202 | sbappend(&so->so_snd, m); |
8a2f82db | 203 | #ifdef notdef |
0974b45c | 204 | if (tp->t_flags & TF_PUSH) |
a6503abf | 205 | tp->snd_end = tp->snd_una + so->so_snd.sb_cc; |
8a2f82db SL |
206 | #endif |
207 | error = tcp_output(tp); | |
72f24d7d BJ |
208 | break; |
209 | ||
290e0b0a BJ |
210 | /* |
211 | * Abort the TCP. | |
212 | */ | |
eee3ab16 | 213 | case PRU_ABORT: |
0e3936fa | 214 | tp = tcp_drop(tp, ECONNABORTED); |
72f24d7d BJ |
215 | break; |
216 | ||
290e0b0a | 217 | /* SOME AS YET UNIMPLEMENTED HOOKS */ |
eee3ab16 | 218 | case PRU_CONTROL: |
53a5409e | 219 | error = EOPNOTSUPP; |
eee3ab16 BJ |
220 | break; |
221 | ||
f1b2fa5b BJ |
222 | case PRU_SENSE: |
223 | error = EOPNOTSUPP; | |
224 | break; | |
0244dbc7 | 225 | /* END UNIMPLEMENTED HOOKS */ |
f1b2fa5b BJ |
226 | |
227 | case PRU_RCVOOB: | |
8b5a83bb BJ |
228 | if (so->so_oobmark == 0 && |
229 | (so->so_state & SS_RCVATMARK) == 0) { | |
0244dbc7 BJ |
230 | error = EINVAL; |
231 | break; | |
232 | } | |
b2db9217 | 233 | if ((tp->t_oobflags & TCPOOB_HAVEDATA) == 0) { |
8b5a83bb | 234 | error = EWOULDBLOCK; |
b2db9217 | 235 | break; |
8b5a83bb | 236 | } |
283ea225 | 237 | m->m_len = 1; |
b2db9217 | 238 | *mtod(m, caddr_t) = tp->t_iobc; |
f1b2fa5b BJ |
239 | break; |
240 | ||
241 | case PRU_SENDOOB: | |
8b5a83bb BJ |
242 | if (sbspace(&so->so_snd) < -512) { |
243 | error = ENOBUFS; | |
244 | break; | |
245 | } | |
0244dbc7 BJ |
246 | tp->snd_up = tp->snd_una + so->so_snd.sb_cc + 1; |
247 | sbappend(&so->so_snd, m); | |
b2db9217 | 248 | tp->t_force = 1; |
8a2f82db | 249 | error = tcp_output(tp); |
b2db9217 | 250 | tp->t_force = 0; |
f1b2fa5b BJ |
251 | break; |
252 | ||
126472ab | 253 | case PRU_SOCKADDR: |
8075bb0e | 254 | in_setsockaddr(inp, nam); |
126472ab SL |
255 | break; |
256 | ||
290e0b0a BJ |
257 | /* |
258 | * TCP slow timer went off; going through this | |
259 | * routine for tracing's sake. | |
260 | */ | |
eee3ab16 | 261 | case PRU_SLOWTIMO: |
0e3936fa | 262 | tp = tcp_timers(tp, (int)nam); |
8075bb0e | 263 | req |= (int)nam << 8; /* for debug's sake */ |
eee3ab16 BJ |
264 | break; |
265 | ||
9c5022e3 BJ |
266 | default: |
267 | panic("tcp_usrreq"); | |
72f24d7d | 268 | } |
17b82ed4 BJ |
269 | if (tp && (so->so_options & SO_DEBUG)) |
270 | tcp_trace(TA_USER, ostate, tp, (struct tcpiphdr *)0, req); | |
72f24d7d | 271 | splx(s); |
53a5409e | 272 | return (error); |
4eb5d593 | 273 | } |
4aed14e3 | 274 | |
306f91c9 | 275 | int tcp_sendspace = 1024*2; |
1bc20e72 | 276 | int tcp_recvspace = 1024*2; |
290e0b0a BJ |
277 | /* |
278 | * Attach TCP protocol to socket, allocating | |
279 | * internet protocol control block, tcp control block, | |
280 | * bufer space, and entering LISTEN state if to accept connections. | |
281 | */ | |
8075bb0e | 282 | tcp_attach(so) |
290e0b0a | 283 | struct socket *so; |
290e0b0a BJ |
284 | { |
285 | register struct tcpcb *tp; | |
286 | struct inpcb *inp; | |
287 | int error; | |
288 | ||
59965020 | 289 | error = soreserve(so, tcp_sendspace, tcp_recvspace); |
ebf42a75 BJ |
290 | if (error) |
291 | goto bad; | |
292 | error = in_pcballoc(so, &tcb); | |
290e0b0a | 293 | if (error) |
8075bb0e BJ |
294 | goto bad; |
295 | inp = sotoinpcb(so); | |
290e0b0a | 296 | tp = tcp_newtcpcb(inp); |
ebf42a75 BJ |
297 | if (tp == 0) { |
298 | error = ENOBUFS; | |
299 | goto bad2; | |
300 | } | |
8075bb0e | 301 | tp->t_state = TCPS_CLOSED; |
290e0b0a | 302 | return (0); |
ebf42a75 BJ |
303 | bad2: |
304 | in_pcbdetach(inp); | |
305 | bad: | |
306 | return (error); | |
290e0b0a BJ |
307 | } |
308 | ||
309 | /* | |
310 | * Initiate (or continue) disconnect. | |
311 | * If embryonic state, just send reset (once). | |
312 | * If not in ``let data drain'' option, just drop. | |
313 | * Otherwise (hard), mark socket disconnecting and drop | |
314 | * current input data; switch states based on user close, and | |
315 | * send segment to peer (with FIN). | |
316 | */ | |
0e3936fa | 317 | struct tcpcb * |
290e0b0a | 318 | tcp_disconnect(tp) |
0e3936fa | 319 | register struct tcpcb *tp; |
290e0b0a BJ |
320 | { |
321 | struct socket *so = tp->t_inpcb->inp_socket; | |
322 | ||
323 | if (tp->t_state < TCPS_ESTABLISHED) | |
0e3936fa | 324 | tp = tcp_close(tp); |
8e65fd66 | 325 | else if (so->so_linger == 0) |
0e3936fa | 326 | tp = tcp_drop(tp, 0); |
290e0b0a BJ |
327 | else { |
328 | soisdisconnecting(so); | |
329 | sbflush(&so->so_rcv); | |
0e3936fa SL |
330 | tp = tcp_usrclosed(tp); |
331 | if (tp) | |
332 | (void) tcp_output(tp); | |
290e0b0a | 333 | } |
0e3936fa | 334 | return (tp); |
290e0b0a BJ |
335 | } |
336 | ||
337 | /* | |
338 | * User issued close, and wish to trail through shutdown states: | |
339 | * if never received SYN, just forget it. If got a SYN from peer, | |
340 | * but haven't sent FIN, then go to FIN_WAIT_1 state to send peer a FIN. | |
341 | * If already got a FIN from peer, then almost done; go to LAST_ACK | |
342 | * state. In all other cases, have already sent FIN to peer (e.g. | |
343 | * after PRU_SHUTDOWN), and just have to play tedious game waiting | |
344 | * for peer to send FIN or not respond to keep-alives, etc. | |
085a0b90 | 345 | * We can let the user exit from the close as soon as the FIN is acked. |
290e0b0a | 346 | */ |
0e3936fa | 347 | struct tcpcb * |
4aed14e3 | 348 | tcp_usrclosed(tp) |
0e3936fa | 349 | register struct tcpcb *tp; |
4aed14e3 BJ |
350 | { |
351 | ||
4aed14e3 BJ |
352 | switch (tp->t_state) { |
353 | ||
354 | case TCPS_LISTEN: | |
355 | case TCPS_SYN_SENT: | |
356 | tp->t_state = TCPS_CLOSED; | |
0e3936fa | 357 | tp = tcp_close(tp); |
4aed14e3 BJ |
358 | break; |
359 | ||
360 | case TCPS_SYN_RECEIVED: | |
361 | case TCPS_ESTABLISHED: | |
362 | tp->t_state = TCPS_FIN_WAIT_1; | |
363 | break; | |
364 | ||
365 | case TCPS_CLOSE_WAIT: | |
366 | tp->t_state = TCPS_LAST_ACK; | |
367 | break; | |
368 | } | |
0e3936fa | 369 | if (tp && tp->t_state >= TCPS_FIN_WAIT_2) |
085a0b90 | 370 | soisdisconnected(tp->t_inpcb->inp_socket); |
0e3936fa | 371 | return (tp); |
4aed14e3 | 372 | } |