bwrite shouldn't clear B_AGE or brelse won't put it at the head
[unix-history] / usr / src / sys / kern / uipc_socket.c
index 55a0ac2..8733ca1 100644 (file)
@@ -1,4 +1,4 @@
-/*     uipc_socket.c   4.14    81/11/22        */
+/*     uipc_socket.c   4.66    82/12/14        */
 
 #include "../h/param.h"
 #include "../h/systm.h"
 
 #include "../h/param.h"
 #include "../h/systm.h"
 #include "../h/socket.h"
 #include "../h/socketvar.h"
 #include "../h/stat.h"
 #include "../h/socket.h"
 #include "../h/socketvar.h"
 #include "../h/stat.h"
-#include "../net/inet.h"
-#include "../net/inet_systm.h"
+#include "../h/ioctl.h"
+#include "../h/uio.h"
+#include "../net/route.h"
 
 /*
 
 /*
- * Socket support routines.
- *
- * DEAL WITH INTERRUPT NOTIFICATION.
+ * Socket operation routines.
+ * These routines are called by the routines in
+ * sys_socket.c or from a system process, and
+ * implement the semantics of socket operations by
+ * switching out to the protocol specific routines.
  */
 
  */
 
-/*
- * Create a socket.
- */
-socreate(aso, type, asp, asa, options)
+/*ARGSUSED*/
+socreate(dom, aso, type, proto, opt)
        struct socket **aso;
        struct socket **aso;
-       int type;
-       struct sockproto *asp;
-       struct sockaddr *asa;
-       int options;
+       int type, proto;
+       struct socketopt *opt;
 {
        register struct protosw *prp;
        register struct socket *so;
        struct mbuf *m;
 {
        register struct protosw *prp;
        register struct socket *so;
        struct mbuf *m;
-       int pf, proto, error;
-COUNT(SOCREATE);
-
-       /*
-        * Use process standard protocol/protocol family if none
-        * specified by address argument.
-        */
-       if (asp == 0) {
-               pf = PF_INET;           /* should be u.u_protof */
-               proto = 0;
-       } else {
-               pf = asp->sp_family;
-               proto = asp->sp_protocol;
-       }
+       int error;
 
 
-       /*
-        * If protocol specified, look for it, otherwise
-        * for a protocol of the correct type in the right family.
-        */
        if (proto)
        if (proto)
-               prp = pffindproto(pf, proto);
+               prp = pffindproto(dom, proto);
        else
        else
-               prp = pffindtype(pf, type);
+               prp = pffindtype(dom, type);
        if (prp == 0)
                return (EPROTONOSUPPORT);
        if (prp == 0)
                return (EPROTONOSUPPORT);
-
-       /*
-        * Get a socket structure.
-        */
-       m = m_getclr(M_WAIT);
+       if (prp->pr_type != type)
+               return (EPROTOTYPE);
+       m = m_getclr(M_WAIT, MT_SOCKET);
        if (m == 0)
                return (ENOBUFS);
        so = mtod(m, struct socket *);
        if (m == 0)
                return (ENOBUFS);
        so = mtod(m, struct socket *);
-       so->so_options = options;
-
-       /*
-        * Attach protocol to socket, initializing
-        * and reserving resources.
-        */
+       so->so_options = 0;
+       so->so_state = 0;
+       so->so_type = type;
+       if (u.u_uid == 0)
+               so->so_state = SS_PRIV;
        so->so_proto = prp;
        so->so_proto = prp;
-       error = (*prp->pr_usrreq)(so, PRU_ATTACH, 0, asa);
+       error = (*prp->pr_usrreq)(so, PRU_ATTACH,
+           (struct mbuf *)0, (struct mbuf *)0, (struct socketopt *)0);
        if (error) {
        if (error) {
-               (void) m_free(dtom(so));
+               so->so_state |= SS_NOFDREF;
+               sofree(so);
                return (error);
        }
        *aso = so;
        return (0);
 }
 
                return (error);
        }
        *aso = so;
        return (0);
 }
 
+/*
+ * Issue a PRU_BIND request to the socket's protocol, passing
+ * nam and opt through unchanged.  The call is made with the
+ * priority raised by splnet(); the previous priority is restored
+ * before the protocol's result is returned.
+ */
+sobind(so, nam, opt)
+       struct socket *so;
+       struct mbuf *nam;
+       struct socketopt *opt;
+{
+       int error, s;
+
+       s = splnet();
+       error = (*so->so_proto->pr_usrreq)(so, PRU_BIND,
+           (struct mbuf *)0, nam, opt);
+       splx(s);
+       return (error);
+}
+
+/*
+ * Prepare a socket to accept connections.
+ * Sends PRU_LISTEN to the protocol.  On success, a socket whose
+ * so_q is still 0 gets so_q and so_q0 pointed back at itself
+ * and is marked SO_ACCEPTCONN; the backlog, clamped to the range
+ * 0..5, is recorded in so_qlimit and SO_NEWFDONCONN is set.
+ * Returns 0, or the error reported by the protocol.
+ */
+solisten(so, backlog)
+       struct socket *so;
+       int backlog;
+{
+       int s = splnet();
+       int error;
+
+       error = (*so->so_proto->pr_usrreq)(so, PRU_LISTEN,
+           (struct mbuf *)0, (struct mbuf *)0, (struct socketopt *)0);
+       if (error) {
+               splx(s);
+               return (error);
+       }
+       if (so->so_q == 0) {
+               so->so_q = so;
+               so->so_q0 = so;
+               so->so_options |= SO_ACCEPTCONN;
+       }
+       if (backlog < 0)
+               backlog = 0;
+       so->so_qlimit = backlog < 5 ? backlog : 5;
+       so->so_options |= SO_NEWFDONCONN;
+       /* restore the priority raised above on the success path too */
+       splx(s);
+       return (0);
+}
+
 sofree(so)
        struct socket *so;
 {
 
 sofree(so)
        struct socket *so;
 {
 
-COUNT(SOFREE);
-       if (so->so_pcb || (so->so_state & SS_USERGONE) == 0)
+       if (so->so_head) {
+               if (!soqremque(so, 0) && !soqremque(so, 1))
+                       panic("sofree dq");
+               so->so_head = 0;
+       }
+       if (so->so_pcb || (so->so_state & SS_NOFDREF) == 0)
                return;
        sbrelease(&so->so_snd);
        sbrelease(&so->so_rcv);
                return;
        sbrelease(&so->so_snd);
        sbrelease(&so->so_rcv);
@@ -101,126 +126,111 @@ COUNT(SOFREE);
  * Initiate disconnect if connected.
  * Free socket when disconnect complete.
  */
  * Initiate disconnect if connected.
  * Free socket when disconnect complete.
  */
-soclose(so)
+/*
+ * If exiting is nonzero the close is forced: SO_KEEPALIVE is set,
+ * errors from the disconnect and detach requests do not abort the
+ * close, and EINPROGRESS is never returned.  Otherwise the first
+ * error encountered is returned; 0 is returned on success.
+ * Every return path restores the priority saved from splnet().
+ */
+soclose(so, exiting)
        register struct socket *so;
        register struct socket *so;
+       int exiting;
 {
        int s = splnet();               /* conservative */
 {
        int s = splnet();               /* conservative */
+       int error;
 
 
-COUNT(SOCLOSE);
+       if (so->so_options & SO_ACCEPTCONN) {
+               while (so->so_q0 != so)
+                       (void) soclose(so->so_q0, 1);
+               while (so->so_q != so)
+                       (void) soclose(so->so_q, 1);
+       }
        if (so->so_pcb == 0)
                goto discard;
        if (so->so_pcb == 0)
                goto discard;
+       if (exiting)
+               so->so_options |= SO_KEEPALIVE;
        if (so->so_state & SS_ISCONNECTED) {
                if ((so->so_state & SS_ISDISCONNECTING) == 0) {
        if (so->so_state & SS_ISCONNECTED) {
                if ((so->so_state & SS_ISDISCONNECTING) == 0) {
-                       u.u_error = sodisconnect(so, (struct sockaddr *)0);
-                       if (u.u_error) {
+                       error = sodisconnect(so, (struct mbuf *)0);
+                       if (error) {
+                               if (exiting)
+                                       goto drop;
                                splx(s);
                                splx(s);
-                               return;
+                               return (error);
                        }
                }
                        }
                }
-               if ((so->so_state & SS_ISDISCONNECTING) &&
-                   (so->so_options & SO_NBIO)) {
-                       u.u_error = EINPROGRESS;
+               if ((so->so_options & SO_DONTLINGER) == 0) {
+                       if ((so->so_state & SS_ISDISCONNECTING) &&
+                           (so->so_state & SS_NBIO) &&
+                           exiting == 0) {
+                               /* do not leave with priority still raised */
+                               splx(s);
+                               return (EINPROGRESS);
+                       }
+                       /* should use tsleep here, for at most linger */
+                       while (so->so_state & SS_ISCONNECTED)
+                               sleep((caddr_t)&so->so_timeo, PZERO+1);
+               }
+       }
+drop:
+       if (so->so_pcb) {
+               error = (*so->so_proto->pr_usrreq)(so, PRU_DETACH,
+                   (struct mbuf *)0, (struct mbuf *)0, (struct socketopt *)0);
+               if (exiting == 0 && error) {
                        splx(s);
                        splx(s);
-                       return;
+                       return (error);
                }
                }
-               while (so->so_state & SS_ISCONNECTED)
-                       sleep((caddr_t)&so->so_timeo, PZERO+1);
        }
        }
-       u.u_error = (*so->so_proto->pr_usrreq)(so, PRU_DETACH, 0, 0);
 discard:
 discard:
-       so->so_state |= SS_USERGONE;
+       so->so_state |= SS_NOFDREF;
        sofree(so);
        splx(s);
        sofree(so);
        splx(s);
-}
-
-sosplice(pso, so)
-       struct socket *pso, *so;
-{
-
-COUNT(SOSPLICE);
-       if (pso->so_proto->pr_family != PF_LOCAL) {
-               struct socket *tso;
-               tso = pso; pso = so; so = tso;
-       }
-       if (pso->so_proto->pr_family != PF_LOCAL)
-               return (EOPNOTSUPP);
-       /* check types and buffer space */
-       /* merge buffers */
        return (0);
 }
 
 /*ARGSUSED*/
        return (0);
 }
 
 /*ARGSUSED*/
-sostat(so, sb)
+sostat(so, ub)
        struct socket *so;
        struct socket *so;
-       struct stat *sb;
+       struct stat *ub;
 {
 {
+       struct stat sb;
 
 
-COUNT(SOSTAT);
-       return (EOPNOTSUPP);
+       bzero((caddr_t)&sb, sizeof (sb));               /* XXX */
+       (void) copyout((caddr_t)&sb, (caddr_t)ub, sizeof (sb));/* XXX */
+       return (0);                                     /* XXX */
 }
 
 }
 
-/*
- * Accept connection on a socket.
- */
-soaccept(so, asa)
+soaccept(so, nam, opt)
        struct socket *so;
        struct socket *so;
-       struct sockaddr *asa;
+       struct mbuf *nam;
+       struct socketopt *opt;
 {
        int s = splnet();
        int error;
 
 {
        int s = splnet();
        int error;
 
-COUNT(SOACCEPT);
-       if (so->so_state & (SS_ISCONNECTED|SS_ISCONNECTING)) {
-               error = EISCONN;
-               goto bad;
-       }
-       if ((so->so_options & SO_ACCEPTCONN) == 0) {
-               error = EINVAL;                 /* XXX */
-               goto bad;
-       }
-       error = (*so->so_proto->pr_usrreq)(so, PRU_ACCEPT, 0, (caddr_t)asa);
-bad:
+       error = (*so->so_proto->pr_usrreq)(so, PRU_ACCEPT,
+           (struct mbuf *)0, nam, opt);
        splx(s);
        return (error);
 }
 
        splx(s);
        return (error);
 }
 
-/*
- * Connect socket to a specified address.
- * If already connected or connecting, then avoid
- * the protocol entry, to keep its job simpler.
- */
-soconnect(so, asa)
+soconnect(so, nam, opt)
        struct socket *so;
        struct socket *so;
-       struct sockaddr *asa;
+       struct mbuf *nam;
+       struct socketopt *opt;
 {
        int s = splnet();
        int error;
 
 {
        int s = splnet();
        int error;
 
-COUNT(SOCONNECT);
        if (so->so_state & (SS_ISCONNECTED|SS_ISCONNECTING)) {
                error = EISCONN;
                goto bad;
        }
        if (so->so_state & (SS_ISCONNECTED|SS_ISCONNECTING)) {
                error = EISCONN;
                goto bad;
        }
-       error = (*so->so_proto->pr_usrreq)(so, PRU_CONNECT, 0, (caddr_t)asa);
+       error = (*so->so_proto->pr_usrreq)(so, PRU_CONNECT,
+           (struct mbuf *)0, nam, opt);
 bad:
        splx(s);
        return (error);
 }
 
 bad:
        splx(s);
        return (error);
 }
 
-/*
- * Disconnect from a socket.
- * Address parameter is from system call for later multicast
- * protocols.  Check to make sure that connected and no disconnect
- * in progress (for protocol's sake), and then invoke protocol.
- */
-sodisconnect(so, asa)
+sodisconnect(so, nam)
        struct socket *so;
        struct socket *so;
-       struct sockaddr *asa;
+       struct mbuf *nam;
 {
        int s = splnet();
        int error;
 
 {
        int s = splnet();
        int error;
 
-COUNT(SODISCONNECT);
        if ((so->so_state & SS_ISCONNECTED) == 0) {
                error = ENOTCONN;
                goto bad;
        if ((so->so_state & SS_ISCONNECTED) == 0) {
                error = ENOTCONN;
                goto bad;
@@ -229,7 +239,8 @@ COUNT(SODISCONNECT);
                error = EALREADY;
                goto bad;
        }
                error = EALREADY;
                goto bad;
        }
-       error = (*so->so_proto->pr_usrreq)(so, PRU_DISCONNECT, 0, asa);
+       error = (*so->so_proto->pr_usrreq)(so, PRU_DISCONNECT,
+           (struct mbuf *)0, nam, (struct socketopt *)0);
 bad:
        splx(s);
        return (error);
 bad:
        splx(s);
        return (error);
@@ -243,106 +254,158 @@ bad:
  * If must go all at once and not enough room now, then
  * inform user that this would block and do nothing.
  */
  * If must go all at once and not enough room now, then
  * inform user that this would block and do nothing.
  */
-sosend(so, asa)
+sosend(so, nam, uio, flags)
        register struct socket *so;
        register struct socket *so;
-       struct sockaddr *asa;
+       struct mbuf *nam;
+       struct uio *uio;
+       int flags;
 {
        struct mbuf *top = 0;
        register struct mbuf *m, **mp = &top;
 {
        struct mbuf *top = 0;
        register struct mbuf *m, **mp = &top;
-       register u_int len;
+       register int len;
        int error = 0, space, s;
 
        int error = 0, space, s;
 
-COUNT(SOSEND);
-       if (so->so_state & SS_CANTSENDMORE)
-               return (EPIPE);
-       if (sosendallatonce(so) && u.u_count > so->so_snd.sb_hiwat)
+       if (sosendallatonce(so) && uio->uio_resid > so->so_snd.sb_hiwat)
                return (EMSGSIZE);
                return (EMSGSIZE);
-       if ((so->so_snd.sb_flags & SB_LOCK) && (so->so_options & SO_NBIO))
-               return (EWOULDBLOCK);
+restart:
        sblock(&so->so_snd);
 #define        snderr(errno)   { error = errno; splx(s); goto release; }
 
        sblock(&so->so_snd);
 #define        snderr(errno)   { error = errno; splx(s); goto release; }
 
-       s = splnet();
+       u.u_ru.ru_msgsnd++;
 again:
 again:
+       s = splnet();
+       if (so->so_state & SS_CANTSENDMORE) {
+               psignal(u.u_procp, SIGPIPE);
+               snderr(EPIPE);
+       }
+       if (so->so_error) {
+               error = so->so_error;
+               so->so_error = 0;                               /* ??? */
+               splx(s);
+               goto release;
+       }
        if ((so->so_state & SS_ISCONNECTED) == 0) {
                if (so->so_proto->pr_flags & PR_CONNREQUIRED)
                        snderr(ENOTCONN);
        if ((so->so_state & SS_ISCONNECTED) == 0) {
                if (so->so_proto->pr_flags & PR_CONNREQUIRED)
                        snderr(ENOTCONN);
-               if (asa == 0)
+               if (nam == 0)
                        snderr(EDESTADDRREQ);
        }
                        snderr(EDESTADDRREQ);
        }
-       if (so->so_error)
-               snderr(so->so_error);
        if (top) {
        if (top) {
-               error = (*so->so_proto->pr_usrreq)(so, PRU_SEND, top, asa);
+               error = (*so->so_proto->pr_usrreq)(so,
+                   (flags & SOF_OOB) ? PRU_SENDOOB : PRU_SEND,
+                   top, (caddr_t)nam, (struct socketopt *)0);
+               top = 0;
                if (error) {
                        splx(s);
                        goto release;
                }
                if (error) {
                        splx(s);
                        goto release;
                }
-               top = 0;
                mp = &top;
        }
                mp = &top;
        }
-       if (u.u_count == 0) {
+       if (uio->uio_resid == 0) {
                splx(s);
                goto release;
        }
                splx(s);
                goto release;
        }
-       space = sbspace(&so->so_snd);
-       if (space == 0 || sosendallatonce(so) && space < u.u_count) {
-               if (so->so_options & SO_NBIO)
-                       snderr(EWOULDBLOCK);
-               sbunlock(&so->so_snd);
-               sbwait(&so->so_snd);
-               splx(s);
-               goto again;
+       if (flags & SOF_OOB)
+               space = 1024;
+       else {
+               space = sbspace(&so->so_snd);
+               if (space <= 0 ||
+                   sosendallatonce(so) && space < uio->uio_resid) {
+                       if (so->so_state & SS_NBIO)
+                               snderr(EWOULDBLOCK);
+                       sbunlock(&so->so_snd);
+                       sbwait(&so->so_snd);
+                       splx(s);
+                       goto restart;
+               }
        }
        splx(s);
        }
        splx(s);
-       while (u.u_count && space > 0) {
-               MGET(m, 1);
+       while (uio->uio_resid > 0 && space > 0) {
+               register struct iovec *iov = uio->uio_iov;
+
+               if (iov->iov_len == 0) {
+                       uio->uio_iov++;
+                       uio->uio_iovcnt--;
+                       if (uio->uio_iovcnt < 0)
+                               panic("sosend");
+                       continue;
+               }
+               MGET(m, M_WAIT, MT_DATA);
                if (m == NULL) {
                if (m == NULL) {
-                       error = ENOBUFS;
-                       m_freem(top);
+                       error = ENOBUFS;                        /* SIGPIPE? */
                        goto release;
                }
                        goto release;
                }
-               if (u.u_count >= PGSIZE && space >= NMBPG) {
+               if (iov->iov_len >= CLBYTES && space >= CLBYTES) {
                        register struct mbuf *p;
                        register struct mbuf *p;
-                       MPGET(p, 1);
+                       MCLGET(p, 1);
                        if (p == 0)
                                goto nopages;
                        m->m_off = (int)p - (int)m;
                        if (p == 0)
                                goto nopages;
                        m->m_off = (int)p - (int)m;
-                       len = PGSIZE;
+                       len = CLBYTES;
                } else {
 nopages:
                } else {
 nopages:
-                       m->m_off = MMINOFF;
-                       len = MIN(MLEN, u.u_count);
+                       len = MIN(MLEN, iov->iov_len);
                }
                }
-               iomove(mtod(m, caddr_t), len, B_WRITE);
+               (void) uiomove(mtod(m, caddr_t), len, UIO_WRITE, uio);
                m->m_len = len;
                *mp = m;
                mp = &m->m_next;
                m->m_len = len;
                *mp = m;
                mp = &m->m_next;
-               space = sbspace(&so->so_snd);
+               if (flags & SOF_OOB)
+                       space -= len;
+               else
+                       space = sbspace(&so->so_snd);
        }
        }
-       s = splnet();
        goto again;
 
 release:
        sbunlock(&so->so_snd);
        goto again;
 
 release:
        sbunlock(&so->so_snd);
+       if (top)
+               m_freem(top);
        return (error);
 }
 
        return (error);
 }
 
-soreceive(so, asa)
+soreceive(so, aname, uio, flags)
        register struct socket *so;
        register struct socket *so;
-       struct sockaddr *asa;
+       struct mbuf **aname;
+       struct uio *uio;
+       int flags;
 {
        register struct mbuf *m, *n;
 {
        register struct mbuf *m, *n;
-       u_int len;
-       int eor, s, error = 0;
+       int len;
+       int eor, s, error = 0, moff, tomark;
+
+       if (flags & SOF_OOB) {
+               m = m_get(M_WAIT, MT_DATA);
+               error = (*so->so_proto->pr_usrreq)(so, PRU_RCVOOB,
+                   m, (struct mbuf *)0, (struct socketopt *)0);
+               if (error)
+                       return (error);
+               len = uio->uio_resid;
+               do {
+                       if (len > m->m_len)
+                               len = m->m_len;
+                       error =
+                           uiomove(mtod(m, caddr_t), (int)len, UIO_READ, uio);
+                       m = m_free(m);
+               } while (uio->uio_resid && error == 0 && m);
+               if (m)
+                       m_freem(m);
+               return (error);
+       }
 
 
-COUNT(SORECEIVE);
 restart:
        sblock(&so->so_rcv);
        s = splnet();
 restart:
        sblock(&so->so_rcv);
        s = splnet();
+SBCHECK(&so->so_rcv, "soreceive restart");
 
 #define        rcverr(errno)   { error = errno; splx(s); goto release; }
        if (so->so_rcv.sb_cc == 0) {
 
 #define        rcverr(errno)   { error = errno; splx(s); goto release; }
        if (so->so_rcv.sb_cc == 0) {
+               if (so->so_error) {
+                       error = so->so_error;
+                       so->so_error = 0;
+                       splx(s);
+                       goto release;
+               }
                if (so->so_state & SS_CANTRCVMORE) {
                        splx(s);
                        goto release;
                if (so->so_state & SS_CANTRCVMORE) {
                        splx(s);
                        goto release;
@@ -350,47 +413,93 @@ restart:
                if ((so->so_state & SS_ISCONNECTED) == 0 &&
                    (so->so_proto->pr_flags & PR_CONNREQUIRED))
                        rcverr(ENOTCONN);
                if ((so->so_state & SS_ISCONNECTED) == 0 &&
                    (so->so_proto->pr_flags & PR_CONNREQUIRED))
                        rcverr(ENOTCONN);
-               if (so->so_options & SO_NBIO)
-                       rcverr (EWOULDBLOCK);
+               if (so->so_state & SS_NBIO)
+                       rcverr(EWOULDBLOCK);
                sbunlock(&so->so_rcv);
                sbwait(&so->so_rcv);
                splx(s);
                goto restart;
        }
                sbunlock(&so->so_rcv);
                sbwait(&so->so_rcv);
                splx(s);
                goto restart;
        }
+       u.u_ru.ru_msgrcv++;
        m = so->so_rcv.sb_mb;
        if (m == 0)
                panic("receive");
        m = so->so_rcv.sb_mb;
        if (m == 0)
                panic("receive");
+SBCHECK(&so->so_snd, "soreceive havecc");
        if (so->so_proto->pr_flags & PR_ADDR) {
        if (so->so_proto->pr_flags & PR_ADDR) {
-               if (m->m_len != sizeof (struct sockaddr))
-                       panic("soreceive addr");
-               if (asa)
-                       bcopy(mtod(m, caddr_t), (caddr_t)asa, sizeof (*asa));
-               so->so_rcv.sb_cc -= m->m_len;
-               so->so_rcv.sb_mbcnt -= MSIZE;
-               m = m_free(m);
+               if ((flags & SOF_PREVIEW) == 0) {
+                       so->so_rcv.sb_cc -= m->m_len;
+                       so->so_rcv.sb_mbcnt -= MSIZE;
+               }
+               if (aname) {
+                       if (flags & SOF_PREVIEW)
+                               *aname = m_copy(m, 0, m->m_len);
+                       else
+                               *aname = m;
+                       m = m->m_next;
+                       (*aname)->m_next = 0;
+               } else
+                       if (flags & SOF_PREVIEW)
+                               m = m->m_next;
+                       else
+                               m = m_free(m);
                if (m == 0)
                        panic("receive 2");
                if (m == 0)
                        panic("receive 2");
-               so->so_rcv.sb_mb = m;
+               if ((flags & SOF_PREVIEW) == 0)
+                       so->so_rcv.sb_mb = m;
+SBCHECK(&so->so_snd, "soreceive afteraddr");
        }
        eor = 0;
        }
        eor = 0;
+       moff = 0;
+       tomark = so->so_oobmark;
        do {
        do {
-               len = MIN(m->m_len, u.u_count);
-               if (len == m->m_len) {
-                       eor = (int)m->m_act;
-                       sbfree(&so->so_rcv, m);
-               }
+               if (uio->uio_resid <= 0)
+                       break;
+               len = uio->uio_resid;
+               so->so_state &= ~SS_RCVATMARK;
+               if (tomark && len > tomark)
+                       len = tomark;
+               if (moff+len > m->m_len - moff)
+                       len = m->m_len - moff;
                splx(s);
                splx(s);
-               iomove(mtod(m, caddr_t), len, B_READ);
+               error =
+                   uiomove(mtod(m, caddr_t) + moff, (int)len, UIO_READ, uio);
                s = splnet();
                if (len == m->m_len) {
                s = splnet();
                if (len == m->m_len) {
-                       MFREE(m, n);
-                       so->so_rcv.sb_mb = n;
+                       eor = (int)m->m_act;
+                       if (flags & SOF_PREVIEW)
+                               m = m->m_next;
+                       else {
+                               sbfree(&so->so_rcv, m);
+                               MFREE(m, n);
+                               m = n;
+                               so->so_rcv.sb_mb = m;
+                       }
+                       moff = 0;
                } else {
                } else {
-                       m->m_off += len;
-                       m->m_len -= len;
-                       so->so_rcv.sb_cc -= len;
+                       if (flags & SOF_PREVIEW)
+                               moff += len;
+                       else {
+                               m->m_off += len;
+                               m->m_len -= len;
+                               so->so_rcv.sb_cc -= len;
+                       }
+               }
+               if ((flags & SOF_PREVIEW) == 0 && so->so_oobmark) {
+                       so->so_oobmark -= len;
+                       if (so->so_oobmark == 0) {
+                               so->so_state |= SS_RCVATMARK;
+                               break;
+                       }
                }
                }
-       } while ((m = so->so_rcv.sb_mb) && u.u_count && !eor);
+               if (tomark) {
+                       tomark -= len;
+                       if (tomark == 0)
+                               break;
+               }
+SBCHECK(&so->so_snd, "soreceive rcvloop");
+       } while (m && error == 0 && !eor);
+       if (flags & SOF_PREVIEW)
+               goto release;
        if ((so->so_proto->pr_flags & PR_ATOMIC) && eor == 0)
                do {
                        if (m == 0)
        if ((so->so_proto->pr_flags & PR_ATOMIC) && eor == 0)
                do {
                        if (m == 0)
@@ -400,39 +509,118 @@ restart:
                        so->so_rcv.sb_mb = m->m_next;
                        MFREE(m, n);
                        m = n;
                        so->so_rcv.sb_mb = m->m_next;
                        MFREE(m, n);
                        m = n;
+SBCHECK(&so->so_snd, "soreceive atomicloop");
                } while (eor == 0);
        if ((so->so_proto->pr_flags & PR_WANTRCVD) && so->so_pcb)
                } while (eor == 0);
        if ((so->so_proto->pr_flags & PR_WANTRCVD) && so->so_pcb)
-               (*so->so_proto->pr_usrreq)(so, PRU_RCVD, 0, 0);
+               (*so->so_proto->pr_usrreq)(so, PRU_RCVD,
+                   (struct mbuf *)0, (struct mbuf *)0, (struct socketopt *)0);
 release:
        sbunlock(&so->so_rcv);
        splx(s);
        return (error);
 }
 
 release:
        sbunlock(&so->so_rcv);
        splx(s);
        return (error);
 }
 
+/*
+ * Send SIGURG on behalf of a socket.  Nothing is done when
+ * so_pgrp is 0.  A positive so_pgrp is handed to gsignal();
+ * a negative one is negated and looked up with pfind(), and
+ * the process found (if any) is signalled with psignal().
+ */
+sohasoutofband(so)
+       struct socket *so;
+{
+       struct proc *target;
+
+       if (so->so_pgrp > 0) {
+               gsignal(so->so_pgrp, SIGURG);
+               return;
+       }
+       if (so->so_pgrp < 0) {
+               target = pfind(-so->so_pgrp);
+               if (target != 0)
+                       psignal(target, SIGURG);
+       }
+}
+
 /*ARGSUSED*/
 /*ARGSUSED*/
-soioctl(so, cmd, cmdp)
+/*
+ * Socket ioctl: dispatch on cmd, reading or writing the int
+ * (or, for the routing requests, the struct rtentry) that data
+ * points to.  Returns 0 on success, ENOTTY for an unrecognized
+ * cmd, or the error from the protocol, suser() or rtrequest().
+ */
+soioctl(so, cmd, data)
        register struct socket *so;
        int cmd;
        register struct socket *so;
        int cmd;
-       register caddr_t cmdp;
+       register char *data;
 {
 
 {
 
-COUNT(SOIOCTL);
-       switch (cmdp) {
+       switch (cmd) {
 
 
-       }
-       switch (so->so_type) {
+       case FIONBIO:
+               if (*(int *)data)
+                       so->so_state |= SS_NBIO;
+               else
+                       so->so_state &= ~SS_NBIO;
+               break;
+
+       case FIOASYNC:
+               if (*(int *)data)
+                       so->so_state |= SS_ASYNC;
+               else
+                       so->so_state &= ~SS_ASYNC;
+               break;
 
 
-       case SOCK_STREAM:
+       case SIOCSKEEP:
+               /*
+                * Nonzero turns keep-alives on, so that a following
+                * SIOCGKEEP reports the value that was just set.
+                */
+               if (*(int *)data)
+                       so->so_options |= SO_KEEPALIVE;
+               else
+                       so->so_options &= ~SO_KEEPALIVE;
                break;
 
                break;
 
-       case SOCK_DGRAM:
+       case SIOCGKEEP:
+               *(int *)data = (so->so_options & SO_KEEPALIVE) != 0;
                break;
 
                break;
 
-       case SOCK_RDM:
+       case SIOCSLINGER:
+               so->so_linger = *(int *)data;
+               if (so->so_linger)
+                       so->so_options &= ~SO_DONTLINGER;
+               else
+                       so->so_options |= SO_DONTLINGER;
                break;
 
                break;
 
-       case SOCK_RAW:
+       case SIOCGLINGER:
+               *(int *)data = so->so_linger;
                break;
 
                break;
 
+       case SIOCSPGRP:
+               so->so_pgrp = *(int *)data;
+               break;
+
+       case SIOCGPGRP:
+               *(int *)data = so->so_pgrp;
+               break;
+
+       case SIOCDONE: {
+               int flags = *(int *)data;
+
+               /*
+                * NOTE(review): the increment presumably maps a 0/1/2
+                * argument onto the FREAD/FWRITE bits -- confirm
+                * against the flag definitions.
+                */
+               flags++;
+               if (flags & FREAD) {
+                       int s = splimp();
+                       socantrcvmore(so);
+                       sbflush(&so->so_rcv);
+                       splx(s);
+               }
+               if (flags & FWRITE)
+                       return ((*so->so_proto->pr_usrreq)(so, PRU_SHUTDOWN,
+                           (struct mbuf *)0, (struct mbuf *)0,
+                           (struct socketopt *)0));
+               break;
        }
        }
+
+       case SIOCATMARK:
+               *(int *)data = (so->so_state&SS_RCVATMARK) != 0;
+               break;
+
+       /* routing table update calls */
+       case SIOCADDRT:
+       case SIOCDELRT:
+               if (!suser())
+                       return (u.u_error);             /* XXX */
+               return (rtrequest(cmd, (struct rtentry *)data));
+
+       /* type/protocol specific ioctls */
+       default:
+               return (ENOTTY);
+       }
+       return (0);
 }
 }