don't free ioctl cmds
[unix-history] / usr / src / sys / kern / uipc_usrreq.c
index 21082e5..acca526 100644 (file)
@@ -1,34 +1,56 @@
-/*     uipc_usrreq.c   1.4     82/11/23        */
-
-#include "../h/param.h"
-#include "../h/dir.h"
-#include "../h/user.h"
-#include "../h/mbuf.h"
-#include "../h/protosw.h"
-#include "../h/socket.h"
-#include "../h/socketvar.h"
-#include "../h/unpcb.h"
-#include "../h/un.h"
-#include "../h/inode.h"
-#include "../h/nami.h"
+/*
+ * Copyright (c) 1982 Regents of the University of California.
+ * All rights reserved.  The Berkeley software License Agreement
+ * specifies the terms and conditions for redistribution.
+ *
+ *     @(#)uipc_usrreq.c       6.17 (Berkeley) %G%
+ */
+
+#include "param.h"
+#include "dir.h"
+#include "user.h"
+#include "mbuf.h"
+#include "domain.h"
+#include "protosw.h"
+#include "socket.h"
+#include "socketvar.h"
+#include "unpcb.h"
+#include "un.h"
+#include "inode.h"
+#include "file.h"
+#include "stat.h"
 
 /*
  * Unix communications domain.
 
 /*
  * Unix communications domain.
+ *
+ * TODO:
+ *     SEQPACKET, RDM
+ *     rethink name space problems
+ *     need a proper out-of-band
  */
  */
+struct sockaddr sun_noname = { AF_UNIX };
+ino_t  unp_ino;                                /* fake inode numbers */
 
 /*ARGSUSED*/
 
 /*ARGSUSED*/
-uipc_usrreq(so, req, m, nam, opt)
+uipc_usrreq(so, req, m, nam, rights)
        struct socket *so;
        int req;
        struct socket *so;
        int req;
-       struct mbuf *m, *nam;
-       struct socketopt *opt;
+       struct mbuf *m, *nam, *rights;
 {
        struct unpcb *unp = sotounpcb(so);
        register struct socket *so2;
        int error = 0;
 
 {
        struct unpcb *unp = sotounpcb(so);
        register struct socket *so2;
        int error = 0;
 
-       if (unp == 0 && req != PRU_ATTACH)
-               return (EINVAL);                        /* XXX */
+       if (req == PRU_CONTROL)
+               return (EOPNOTSUPP);
+       if (req != PRU_SEND && rights && rights->m_len) {
+               error = EOPNOTSUPP;
+               goto release;
+       }
+       if (unp == 0 && req != PRU_ATTACH) {
+               error = EINVAL;
+               goto release;
+       }
        switch (req) {
 
        case PRU_ATTACH:
        switch (req) {
 
        case PRU_ATTACH:
@@ -56,6 +78,11 @@ uipc_usrreq(so, req, m, nam, opt)
                error = unp_connect(so, nam);
                break;
 
                error = unp_connect(so, nam);
                break;
 
+       case PRU_CONNECT2:
+               error = unp_connect2(so, (struct mbuf *)0,
+                   (struct socket *)nam);
+               break;
+
        case PRU_DISCONNECT:
                unp_disconnect(unp);
                break;
        case PRU_DISCONNECT:
                unp_disconnect(unp);
                break;
@@ -76,8 +103,9 @@ uipc_usrreq(so, req, m, nam, opt)
 
                case SOCK_DGRAM:
                        panic("uipc 1");
 
                case SOCK_DGRAM:
                        panic("uipc 1");
+                       /*NOTREACHED*/
 
 
-               case SOCK_STREAM: {
+               case SOCK_STREAM:
 #define        rcv (&so->so_rcv)
 #define snd (&so2->so_snd)
                        if (unp->unp_conn == 0)
 #define        rcv (&so->so_rcv)
 #define snd (&so2->so_snd)
                        if (unp->unp_conn == 0)
@@ -91,10 +119,9 @@ uipc_usrreq(so, req, m, nam, opt)
                        rcv->sb_mbmax = rcv->sb_mbcnt;
                        snd->sb_hiwat += rcv->sb_hiwat - rcv->sb_cc;
                        rcv->sb_hiwat = rcv->sb_cc;
                        rcv->sb_mbmax = rcv->sb_mbcnt;
                        snd->sb_hiwat += rcv->sb_hiwat - rcv->sb_cc;
                        rcv->sb_hiwat = rcv->sb_cc;
-                       sbwakeup(snd);
+                       sowwakeup(so2);
 #undef snd
 #undef rcv
 #undef snd
 #undef rcv
-                       }
                        break;
 
                default:
                        break;
 
                default:
@@ -122,9 +149,23 @@ uipc_usrreq(so, req, m, nam, opt)
                        }
                        so2 = unp->unp_conn->unp_socket;
                        /* BEGIN XXX */
                        }
                        so2 = unp->unp_conn->unp_socket;
                        /* BEGIN XXX */
-                       if (sbspace(&so2->so_rcv) > 0)
-                               (void) sbappendaddr(&so2->so_rcv,
-                                       mtod(nam, struct sockaddr *), m);
+                       if (rights) {
+                               error = unp_internalize(rights);
+                               if (error)
+                                       break;
+                       }
+                       if (sbspace(&so2->so_rcv) > 0) {
+                               /*
+                                * There's no record of source socket's
+                                * name, so send null name for the moment.
+                                */
+                               if (sbappendaddr(&so2->so_rcv,
+                                   &sun_noname, m, rights)) {
+                                       sorwakeup(so2);
+                                       m = 0;
+                               } else
+                                       error = ENOBUFS;
+                       }
                        /* END XXX */
                        if (nam)
                                unp_disconnect(unp);
                        /* END XXX */
                        if (nam)
                                unp_disconnect(unp);
@@ -133,6 +174,14 @@ uipc_usrreq(so, req, m, nam, opt)
                case SOCK_STREAM:
 #define        rcv (&so2->so_rcv)
 #define        snd (&so->so_snd)
                case SOCK_STREAM:
 #define        rcv (&so2->so_rcv)
 #define        snd (&so->so_snd)
+                       if (rights && rights->m_len) {
+                               error = EOPNOTSUPP;
+                               break;
+                       }
+                       if (so->so_state & SS_CANTSENDMORE) {
+                               error = EPIPE;
+                               break;
+                       }
                        if (unp->unp_conn == 0)
                                panic("uipc 3");
                        so2 = unp->unp_conn->unp_socket;
                        if (unp->unp_conn == 0)
                                panic("uipc 3");
                        so2 = unp->unp_conn->unp_socket;
@@ -146,7 +195,8 @@ uipc_usrreq(so, req, m, nam, opt)
                        rcv->sb_mbmax = rcv->sb_mbcnt;
                        snd->sb_hiwat -= rcv->sb_cc - rcv->sb_hiwat;
                        rcv->sb_hiwat = rcv->sb_cc;
                        rcv->sb_mbmax = rcv->sb_mbcnt;
                        snd->sb_hiwat -= rcv->sb_cc - rcv->sb_hiwat;
                        rcv->sb_hiwat = rcv->sb_cc;
-                       sbwakeup(rcv);
+                       sorwakeup(so2);
+                       m = 0;
 #undef snd
 #undef rcv
                        break;
 #undef snd
 #undef rcv
                        break;
@@ -160,36 +210,53 @@ uipc_usrreq(so, req, m, nam, opt)
                unp_drop(unp, ECONNABORTED);
                break;
 
                unp_drop(unp, ECONNABORTED);
                break;
 
-/* SOME AS YET UNIMPLEMENTED HOOKS */
-       case PRU_CONTROL:
-               error = EOPNOTSUPP;
-               break;
-
        case PRU_SENSE:
        case PRU_SENSE:
-               error = EOPNOTSUPP;
-               break;
-/* END UNIMPLEMENTED HOOKS */
+               ((struct stat *) m)->st_blksize = so->so_snd.sb_hiwat;
+               if (so->so_type == SOCK_STREAM && unp->unp_conn != 0) {
+                       so2 = unp->unp_conn->unp_socket;
+                       ((struct stat *) m)->st_blksize += so2->so_rcv.sb_cc;
+               }
+               ((struct stat *) m)->st_dev = NODEV;
+               ((struct stat *) m)->st_ino = unp_ino++;
+               return (0);
 
        case PRU_RCVOOB:
 
        case PRU_RCVOOB:
-               break;
+               return (EOPNOTSUPP);
 
        case PRU_SENDOOB:
 
        case PRU_SENDOOB:
+               error = EOPNOTSUPP;
                break;
 
        case PRU_SOCKADDR:
                break;
 
                break;
 
        case PRU_SOCKADDR:
                break;
 
+       case PRU_PEERADDR:
+               break;
+
        case PRU_SLOWTIMO:
                break;
 
        default:
                panic("piusrreq");
        }
        case PRU_SLOWTIMO:
                break;
 
        default:
                panic("piusrreq");
        }
-       return (0);
+release:
+       if (m)
+               m_freem(m);
+       return (error);
 }
 
 }
 
-int    unp_sendspace = 1024*2;
-int    unp_recvspace = 1024*2;
+/*
+ * We assign all buffering for stream sockets to the source,
+ * as that is where the flow control is implemented.
+ * Datagram sockets really use the sendspace as the maximum datagram size,
+ * and don't really want to reserve the sendspace.  Their recvspace should
+ * be large enough for at least one max-size datagram plus address.
+ */
+#define        PIPSIZ  4096
+int    unpst_sendspace = PIPSIZ;
+int    unpst_recvspace = 0;
+int    unpdg_sendspace = 2*1024;       /* really max datagram size */
+int    unpdg_recvspace = 4*1024;
 
 unp_attach(so)
        struct socket *so;
 
 unp_attach(so)
        struct socket *so;
@@ -198,20 +265,25 @@ unp_attach(so)
        register struct unpcb *unp;
        int error;
        
        register struct unpcb *unp;
        int error;
        
-       error = soreserve(so, unp_sendspace, unp_recvspace);
-       if (error)
-               goto bad;
-       m = m_getclr(M_DONTWAIT);
-       if (m == 0) {
-               error = ENOBUFS;
-               goto bad;
+       switch (so->so_type) {
+
+       case SOCK_STREAM:
+               error = soreserve(so, unpst_sendspace, unpst_recvspace);
+               break;
+
+       case SOCK_DGRAM:
+               error = soreserve(so, unpdg_sendspace, unpdg_recvspace);
+               break;
        }
        }
+       if (error)
+               return (error);
+       m = m_getclr(M_DONTWAIT, MT_PCB);
+       if (m == NULL)
+               return (ENOBUFS);
        unp = mtod(m, struct unpcb *);
        so->so_pcb = (caddr_t)unp;
        unp->unp_socket = so;
        return (0);
        unp = mtod(m, struct unpcb *);
        so->so_pcb = (caddr_t)unp;
        unp->unp_socket = so;
        return (0);
-bad:
-       return (error);
 }
 
 unp_detach(unp)
 }
 
 unp_detach(unp)
@@ -219,6 +291,7 @@ unp_detach(unp)
 {
        
        if (unp->unp_inode) {
 {
        
        if (unp->unp_inode) {
+               unp->unp_inode->i_socket = 0;
                irele(unp->unp_inode);
                unp->unp_inode = 0;
        }
                irele(unp->unp_inode);
                unp->unp_inode = 0;
        }
@@ -238,17 +311,26 @@ unp_bind(unp, nam)
 {
        struct sockaddr_un *soun = mtod(nam, struct sockaddr_un *);
        register struct inode *ip;
 {
        struct sockaddr_un *soun = mtod(nam, struct sockaddr_un *);
        register struct inode *ip;
-       extern schar();
+       register struct nameidata *ndp = &u.u_nd;
        int error;
 
        int error;
 
-       u.u_dirp = soun->sun_path;
-       soun->sun_path[sizeof(soun->sun_path)-1] = 0;
-       ip = namei(schar, CREATE, 1);
+       ndp->ni_dirp = soun->sun_path;
+       if (unp->unp_inode != NULL || nam->m_len == MLEN)
+               return (EINVAL);
+       *(mtod(nam, caddr_t) + nam->m_len) = 0;
+/* SHOULD BE ABLE TO ADOPT EXISTING AND wakeup() ALA FIFO's */
+       ndp->ni_nameiop = CREATE | FOLLOW;
+       ndp->ni_segflg = UIO_SYSSPACE;
+       ip = namei(ndp);
        if (ip) {
                iput(ip);
        if (ip) {
                iput(ip);
-               return (EEXIST);
+               return (EADDRINUSE);
        }
        }
-       ip = maknode(IFSOCK | 0777);
+       if (error = u.u_error) {
+               u.u_error = 0;                  /* XXX */
+               return (error);
+       }
+       ip = maknode(IFSOCK | 0777, ndp);
        if (ip == NULL) {
                error = u.u_error;              /* XXX */
                u.u_error = 0;                  /* XXX */
        if (ip == NULL) {
                error = u.u_error;              /* XXX */
                u.u_error = 0;                  /* XXX */
@@ -265,19 +347,27 @@ unp_connect(so, nam)
        struct mbuf *nam;
 {
        register struct sockaddr_un *soun = mtod(nam, struct sockaddr_un *);
        struct mbuf *nam;
 {
        register struct sockaddr_un *soun = mtod(nam, struct sockaddr_un *);
-       struct unpcb *unp = sotounpcb(so);
        register struct inode *ip;
        int error;
        register struct inode *ip;
        int error;
-       struct socket *so2;
-       struct unpcb *unp2;
-
-       u.u_dirp = soun->sun_path;
-       soun->sun_path[sizeof(soun->sun_path)-1] = 0;
-       ip = namei(schar, LOOKUP, 1);
+       register struct socket *so2;
+       register struct nameidata *ndp = &u.u_nd;
+
+       ndp->ni_dirp = soun->sun_path;
+       if (nam->m_len + (nam->m_off - MMINOFF) == MLEN)
+               return (EMSGSIZE);
+       *(mtod(nam, caddr_t) + nam->m_len) = 0;
+       ndp->ni_nameiop = LOOKUP | FOLLOW;
+       ndp->ni_segflg = UIO_SYSSPACE;
+       ip = namei(ndp);
        if (ip == 0) {
                error = u.u_error;
                u.u_error = 0;
        if (ip == 0) {
                error = u.u_error;
                u.u_error = 0;
-               return (ENOENT);
+               return (error);         /* XXX */
+       }
+       if (access(ip, IWRITE)) {
+               error = u.u_error;
+               u.u_error = 0;          /* XXX */
+               goto bad;
        }
        if ((ip->i_mode&IFMT) != IFSOCK) {
                error = ENOTSOCK;
        }
        if ((ip->i_mode&IFMT) != IFSOCK) {
                error = ENOTSOCK;
@@ -288,41 +378,54 @@ unp_connect(so, nam)
                error = ECONNREFUSED;
                goto bad;
        }
                error = ECONNREFUSED;
                goto bad;
        }
-       if (so2->so_type != so->so_type) {
+       if (so->so_type != so2->so_type) {
                error = EPROTOTYPE;
                goto bad;
        }
                error = EPROTOTYPE;
                goto bad;
        }
+       if (so->so_proto->pr_flags & PR_CONNREQUIRED &&
+           ((so2->so_options&SO_ACCEPTCONN) == 0 ||
+            (so2 = sonewconn(so2)) == 0)) {
+               error = ECONNREFUSED;
+               goto bad;
+       }
+       error = unp_connect2(so, nam, so2);
+bad:
+       iput(ip);
+       return (error);
+}
+
+unp_connect2(so, sonam, so2)           /* point so's pcb at so2's pcb; returns 0 or EPROTOTYPE */
+       register struct socket *so;
+       struct mbuf *sonam;             /* may be null; for streams a copy goes in unp2->unp_remaddr */
+       register struct socket *so2;
+{
+       register struct unpcb *unp = sotounpcb(so);
+       register struct unpcb *unp2;
+
+       if (so2->so_type != so->so_type)        /* both ends must have the same socket type */
+               return (EPROTOTYPE);
+       unp2 = sotounpcb(so2);
+       unp->unp_conn = unp2;                   /* set for both socket types, before the switch */
        switch (so->so_type) {
 
        case SOCK_DGRAM:
        switch (so->so_type) {
 
        case SOCK_DGRAM:
-               unp->unp_conn = sotounpcb(so2);
-               unp2 = sotounpcb(so2);
                unp->unp_nextref = unp2->unp_refs;
                unp2->unp_refs = unp;
                unp->unp_nextref = unp2->unp_refs;
                unp2->unp_refs = unp;
+               soisconnected(so);              /* datagram: only so is marked connected */
                break;
 
        case SOCK_STREAM:
                break;
 
        case SOCK_STREAM:
-               if ((so2->so_options&SO_ACCEPTCONN) == 0 ||
-                   (so2 = sonewconn(so2)) == 0) {
-                       error = ECONNREFUSED;
-                       goto bad;
-               }
-               unp2 = sotounpcb(so2);
-               unp->unp_conn = unp2;
                unp2->unp_conn = unp;
                unp2->unp_conn = unp;
-               unp2->unp_remaddr = m_copy(nam, 0, (int)M_COPYALL);
+               if (sonam)                      /* the PRU_CONNECT2 caller passes a null name */
+                       unp2->unp_remaddr = m_copy(sonam, 0, (int)M_COPYALL);
+               soisconnected(so2);             /* stream: both ends are marked connected */
+               soisconnected(so);
                break;
 
        default:
                break;
 
        default:
-               panic("uipc connip");
+               panic("unp_connect2");          /* any type other than DGRAM or STREAM */
        }
        }
-       soisconnected(so2);
-       soisconnected(so);
-       iput(ip);
        return (0);
        return (0);
-bad:
-       iput(ip);
-       return (error);
 }
 
 unp_disconnect(unp)
 }
 
 unp_disconnect(unp)
@@ -333,7 +436,6 @@ unp_disconnect(unp)
        if (unp2 == 0)
                return;
        unp->unp_conn = 0;
        if (unp2 == 0)
                return;
        unp->unp_conn = 0;
-       soisdisconnected(unp->unp_socket);
        switch (unp->unp_socket->so_type) {
 
        case SOCK_DGRAM:
        switch (unp->unp_socket->so_type) {
 
        case SOCK_DGRAM:
@@ -351,21 +453,25 @@ unp_disconnect(unp)
                        unp2->unp_nextref = unp->unp_nextref;
                }
                unp->unp_nextref = 0;
                        unp2->unp_nextref = unp->unp_nextref;
                }
                unp->unp_nextref = 0;
+               unp->unp_socket->so_state &= ~SS_ISCONNECTED;
                break;
 
        case SOCK_STREAM:
                break;
 
        case SOCK_STREAM:
+               soisdisconnected(unp->unp_socket);
                unp2->unp_conn = 0;
                soisdisconnected(unp2->unp_socket);
                break;
        }
 }
 
                unp2->unp_conn = 0;
                soisdisconnected(unp2->unp_socket);
                break;
        }
 }
 
+#ifdef notdef                          /* unp_abort() is compiled only when notdef is defined */
 unp_abort(unp)
        struct unpcb *unp;
 {
 
        unp_detach(unp);
 }
 unp_abort(unp)
        struct unpcb *unp;
 {
 
        unp_detach(unp);
 }
+#endif                                 /* notdef */
 
 /*ARGSUSED*/
 unp_usrclosed(unp)
 
 /*ARGSUSED*/
 unp_usrclosed(unp)
@@ -378,12 +484,176 @@ unp_drop(unp, errno)
        struct unpcb *unp;
        int errno;
 {
        struct unpcb *unp;
        int errno;
 {
+       struct socket *so = unp->unp_socket;
 
 
-       unp->unp_socket->so_error = errno;
+       so->so_error = errno;
        unp_disconnect(unp);
        unp_disconnect(unp);
+       if (so->so_head) {
+               so->so_pcb = (caddr_t) 0;
+               m_freem(unp->unp_remaddr);
+               (void) m_free(dtom(unp));
+               sofree(so);
+       }
 }
 
 }
 
+#ifdef notdef                          /* the empty unp_drain() is compiled only when notdef is defined */
 unp_drain()
 {
 
 }
 unp_drain()
 {
 
 }
+#endif                                 /* notdef */
+
+unp_externalize(rights)                /* replace each struct file * in rights with a new descriptor; 0 or EMSGSIZE */
+       struct mbuf *rights;            /* data area is read as an array of struct file * */
+{
+       int newfds = rights->m_len / sizeof (int);      /* slot count; divides by sizeof (int) although slots are read as pointers */
+       register int i;
+       register struct file **rp = mtod(rights, struct file **);
+       register struct file *fp;
+       int f;
+
+       if (newfds > ufavail()) {                       /* ufavail() not shown; presumably free descriptor slots -- TODO confirm */
+               for (i = 0; i < newfds; i++) {          /* cannot take them all: give every file back */
+                       fp = *rp;
+                       unp_discard(fp);
+                       *rp++ = 0;                      /* zero the slot after discarding */
+               }
+               return (EMSGSIZE);
+       }
+       for (i = 0; i < newfds; i++) {
+               f = ufalloc(0);
+               if (f < 0)                              /* treated as impossible after the ufavail() check */
+                       panic("unp_externalize");
+               fp = *rp;
+               u.u_ofile[f] = fp;                      /* install the file in the current process's table */
+               fp->f_msgcount--;                       /* reverses the f_msgcount++ in unp_internalize(); f_count is left alone */
+               *(int *)rp++ = f;                       /* descriptor index overwrites the pointer slot */
+       }
+       return (0);
+}
+
+unp_internalize(rights)                /* replace each descriptor in rights with its struct file *; 0 or EBADF */
+       struct mbuf *rights;            /* data area holds m_len / sizeof (int) descriptors on entry */
+{
+       register struct file **rp;
+       int oldfds = rights->m_len / sizeof (int);      /* number of descriptors supplied */
+       register int i;
+       register struct file *fp;
+
+       rp = mtod(rights, struct file **);
+       for (i = 0; i < oldfds; i++)                    /* pass 1: check every descriptor before changing anything */
+               if (getf(*(int *)rp++) == 0)
+                       return (EBADF);                 /* rights and all counts are still untouched here */
+       rp = mtod(rights, struct file **);              /* rewind for pass 2 */
+       for (i = 0; i < oldfds; i++) {
+               fp = getf(*(int *)rp);
+               *rp++ = fp;                             /* file pointer overwrites the descriptor slot */
+               fp->f_count++;                          /* one more reference to the file */
+               fp->f_msgcount++;                       /* ...and one more of them sits in a message */
+       }
+       return (0);
+}
+
+int    unp_defer, unp_gcing;           /* unp_defer: files flagged FDEFER and not yet rescanned; unp_gcing: set while unp_gc() runs */
+int    unp_mark();                     /* declared here because unp_gc() passes it to unp_scan() before its definition */
+extern struct domain unixdomain;       /* compared against so_proto->pr_domain in unp_gc() */
+
+unp_gc()                               /* soshutdown() files whose every reference is in a message and that never get marked */
+{
+       register struct file *fp;
+       register struct socket *so;
+
+       if (unp_gcing)                          /* a pass is already in progress */
+               return;
+       unp_gcing = 1;
+restart:
+       unp_defer = 0;
+       for (fp = file; fp < fileNFILE; fp++)   /* start with every file table entry unmarked */
+               fp->f_flag &= ~(FMARK|FDEFER);
+       do {
+               for (fp = file; fp < fileNFILE; fp++) {
+                       if (fp->f_count == 0)   /* entry has no references */
+                               continue;
+                       if (fp->f_flag & FDEFER) {      /* flagged by unp_mark(): handle it now */
+                               fp->f_flag &= ~FDEFER;
+                               unp_defer--;
+                       } else {
+                               if (fp->f_flag & FMARK) /* already marked and scanned */
+                                       continue;
+                               if (fp->f_count == fp->f_msgcount)      /* all references are in messages: do not mark from here */
+                                       continue;
+                               fp->f_flag |= FMARK;    /* has a reference outside any message */
+                       }
+                       if (fp->f_type != DTYPE_SOCKET) /* only sockets are scanned for queued rights */
+                               continue;
+                       so = (struct socket *)fp->f_data;
+                       if (so->so_proto->pr_domain != &unixdomain ||
+                           (so->so_proto->pr_flags&PR_RIGHTS) == 0)    /* not a unix-domain protocol with PR_RIGHTS */
+                               continue;
+                       if (so->so_rcv.sb_flags & SB_LOCK) {    /* receive buffer locked: wait, then redo the whole pass */
+                               sbwait(&so->so_rcv);
+                               goto restart;
+                       }
+                       unp_scan(so->so_rcv.sb_mb, unp_mark);   /* mark every file found in rights queued on this socket */
+               }
+       } while (unp_defer);                    /* repeat while unp_mark() has flagged files not yet handled */
+       for (fp = file; fp < fileNFILE; fp++) {
+               if (fp->f_count == 0)
+                       continue;
+               if (fp->f_count == fp->f_msgcount && (fp->f_flag&FMARK)==0) {  /* only in messages and never marked */
+                       if (fp->f_type != DTYPE_SOCKET)
+                               panic("unp_gc");
+                       (void) soshutdown((struct socket *)fp->f_data, 0);
+               }
+       }
+       unp_gcing = 0;
+}
+
+unp_dispose(m)                         /* apply unp_discard() to every file unp_scan() finds in chain m */
+       struct mbuf *m;
+{
+       int unp_discard();              /* defined later in the file */
+
+       if (m)                          /* a null chain is a no-op */
+               unp_scan(m, unp_discard);
+}
+
+unp_scan(m0, op)                       /* call op on each struct file * in the MT_RIGHTS mbufs of m0 */
+       register struct mbuf *m0;       /* head of a list of chains linked through m_act */
+       int (*op)();                    /* called with one struct file * argument; its result is ignored */
+{
+       register struct mbuf *m;
+       register struct file **rp;
+       register int i;
+       int qfds;
+
+       while (m0) {                                    /* outer walk: one chain per m_act link */
+               for (m = m0; m; m = m->m_next)          /* inner walk: mbufs within this chain */
+                       if (m->m_type == MT_RIGHTS && m->m_len) {
+                               qfds = m->m_len / sizeof (struct file *);       /* number of file pointers held */
+                               rp = mtod(m, struct file **);
+                               for (i = 0; i < qfds; i++)
+                                       (*op)(*rp++);
+                               break;          /* XXX, but saves time */
+                       }
+               m0 = m0->m_act;
+       }
+}
+
+unp_mark(fp)                           /* unp_scan() callback used by unp_gc(): flag fp FMARK|FDEFER once */
+       struct file *fp;
+{
+
+       if (fp->f_flag & FMARK)         /* already marked: do not count it again */
+               return;
+       unp_defer++;                    /* unp_gc() keeps looping while this is nonzero */
+       fp->f_flag |= (FMARK|FDEFER);
+}
+
+unp_discard(fp)                        /* give up one in-message reference to fp */
+       struct file *fp;
+{
+
+       fp->f_msgcount--;               /* reverses the f_msgcount++ in unp_internalize() */
+       closef(fp);                     /* closef() not shown; presumably drops the matching f_count -- TODO confirm */
+}