-/* ufs_vnops.c 6.5 84/02/10 */
-
-#include "../h/param.h"
-#include "../h/systm.h"
-#include "../h/dir.h"
-#include "../h/user.h"
-#include "../h/kernel.h"
-#include "../h/file.h"
-#include "../h/stat.h"
-#include "../h/inode.h"
-#include "../h/fs.h"
-#include "../h/buf.h"
-#include "../h/proc.h"
-#include "../h/quota.h"
-#include "../h/uio.h"
-#include "../h/socket.h"
-#include "../h/socketvar.h"
-#include "../h/nami.h"
-#include "../h/mount.h"
-
-extern struct fileops inodeops;
-struct file *getinode();
+/*
+ * Copyright (c) 1982, 1986, 1989 Regents of the University of California.
+ * All rights reserved.
+ *
+ * %sccs.include.redist.c%
+ *
+ * @(#)ufs_vnops.c 7.50 (Berkeley) %G%
+ */
+
+#include "param.h"
+#include "systm.h"
+#include "user.h"
+#include "kernel.h"
+#include "file.h"
+#include "stat.h"
+#include "buf.h"
+#include "proc.h"
+#include "socket.h"
+#include "socketvar.h"
+#include "conf.h"
+#include "mount.h"
+#include "vnode.h"
+#include "specdev.h"
+#include "fcntl.h"
+#include "malloc.h"
+#include "../ufs/lockf.h"
+#include "../ufs/quota.h"
+#include "../ufs/inode.h"
+#include "../ufs/fs.h"
/*
- * Change current working directory (``.'').
+ * Global vfs data structures for ufs
*/
-chdir()
-{
- chdirec(&u.u_cdir);
-}
+int ufs_lookup(),
+ ufs_create(),
+ ufs_mknod(),
+ ufs_open(),
+ ufs_close(),
+ ufs_access(),
+ ufs_getattr(),
+ ufs_setattr(),
+ ufs_read(),
+ ufs_write(),
+ ufs_ioctl(),
+ ufs_select(),
+ ufs_mmap(),
+ ufs_fsync(),
+ ufs_seek(),
+ ufs_remove(),
+ ufs_link(),
+ ufs_rename(),
+ ufs_mkdir(),
+ ufs_rmdir(),
+ ufs_symlink(),
+ ufs_readdir(),
+ ufs_readlink(),
+ ufs_abortop(),
+ ufs_inactive(),
+ ufs_reclaim(),
+ ufs_lock(),
+ ufs_unlock(),
+ ufs_bmap(),
+ ufs_strategy(),
+ ufs_print(),
+ ufs_islocked(),
+ ufs_advlock();
+
+struct vnodeops ufs_vnodeops = { /* operations vector in which every slot is filled by a ufs_* routine */
+ ufs_lookup, /* lookup */
+ ufs_create, /* create */
+ ufs_mknod, /* mknod */
+ ufs_open, /* open */
+ ufs_close, /* close */
+ ufs_access, /* access */
+ ufs_getattr, /* getattr */
+ ufs_setattr, /* setattr */
+ ufs_read, /* read */
+ ufs_write, /* write */
+ ufs_ioctl, /* ioctl */
+ ufs_select, /* select */
+ ufs_mmap, /* mmap */
+ ufs_fsync, /* fsync */
+ ufs_seek, /* seek */
+ ufs_remove, /* remove */
+ ufs_link, /* link */
+ ufs_rename, /* rename */
+ ufs_mkdir, /* mkdir */
+ ufs_rmdir, /* rmdir */
+ ufs_symlink, /* symlink */
+ ufs_readdir, /* readdir */
+ ufs_readlink, /* readlink */
+ ufs_abortop, /* abortop */
+ ufs_inactive, /* inactive */
+ ufs_reclaim, /* reclaim */
+ ufs_lock, /* lock */
+ ufs_unlock, /* unlock */
+ ufs_bmap, /* bmap */
+ ufs_strategy, /* strategy */
+ ufs_print, /* print */
+ ufs_islocked, /* islocked */
+ ufs_advlock, /* advlock */
+};
+
+int spec_lookup(),
+ spec_open(),
+ ufsspec_read(),
+ ufsspec_write(),
+ spec_strategy(),
+ spec_bmap(),
+ spec_ioctl(),
+ spec_select(),
+ ufsspec_close(),
+ spec_advlock(),
+ spec_badop(),
+ spec_nullop();
+
+struct vnodeops spec_inodeops = { /* mixes spec_* and ufsspec_* routines with the ufs_* inode-level ones; unsupported slots are spec_badop */
+ spec_lookup, /* lookup */
+ spec_badop, /* create */
+ spec_badop, /* mknod */
+ spec_open, /* open */
+ ufsspec_close, /* close */
+ ufs_access, /* access */
+ ufs_getattr, /* getattr */
+ ufs_setattr, /* setattr */
+ ufsspec_read, /* read */
+ ufsspec_write, /* write */
+ spec_ioctl, /* ioctl */
+ spec_select, /* select */
+ spec_badop, /* mmap */
+ spec_nullop, /* fsync */
+ spec_badop, /* seek */
+ spec_badop, /* remove */
+ spec_badop, /* link */
+ spec_badop, /* rename */
+ spec_badop, /* mkdir */
+ spec_badop, /* rmdir */
+ spec_badop, /* symlink */
+ spec_badop, /* readdir */
+ spec_badop, /* readlink */
+ spec_badop, /* abortop */
+ ufs_inactive, /* inactive */
+ ufs_reclaim, /* reclaim */
+ ufs_lock, /* lock */
+ ufs_unlock, /* unlock */
+ spec_bmap, /* bmap */
+ spec_strategy, /* strategy */
+ ufs_print, /* print */
+ ufs_islocked, /* islocked */
+ spec_advlock, /* advlock */
+};
+
+#ifdef FIFO
+int fifo_lookup(),
+ fifo_open(),
+ ufsfifo_read(),
+ ufsfifo_write(),
+ fifo_bmap(),
+ fifo_ioctl(),
+ fifo_select(),
+ ufsfifo_close(),
+ fifo_print(),
+ fifo_advlock(),
+ fifo_badop(),
+ fifo_nullop();
+
+struct vnodeops fifo_inodeops = { /* only built with FIFO defined; mixes fifo_* and ufsfifo_* routines with the ufs_* inode-level ones */
+ fifo_lookup, /* lookup */
+ fifo_badop, /* create */
+ fifo_badop, /* mknod */
+ fifo_open, /* open */
+ ufsfifo_close, /* close */
+ ufs_access, /* access */
+ ufs_getattr, /* getattr */
+ ufs_setattr, /* setattr */
+ ufsfifo_read, /* read */
+ ufsfifo_write, /* write */
+ fifo_ioctl, /* ioctl */
+ fifo_select, /* select */
+ fifo_badop, /* mmap */
+ fifo_nullop, /* fsync */
+ fifo_badop, /* seek */
+ fifo_badop, /* remove */
+ fifo_badop, /* link */
+ fifo_badop, /* rename */
+ fifo_badop, /* mkdir */
+ fifo_badop, /* rmdir */
+ fifo_badop, /* symlink */
+ fifo_badop, /* readdir */
+ fifo_badop, /* readlink */
+ fifo_badop, /* abortop */
+ ufs_inactive, /* inactive */
+ ufs_reclaim, /* reclaim */
+ ufs_lock, /* lock */
+ ufs_unlock, /* unlock */
+ fifo_bmap, /* bmap */
+ fifo_badop, /* strategy */
+ ufs_print, /* print */
+ ufs_islocked, /* islocked */
+ fifo_advlock, /* advlock */
+};
+#endif /* FIFO */
+
+enum vtype iftovt_tab[16] = { /* NOTE(review): presumably indexed by the file-type bits of an inode mode to yield a vnode type -- confirm against its users */
+ VNON, VFIFO, VCHR, VNON, VDIR, VNON, VBLK, VNON,
+ VREG, VNON, VLNK, VNON, VSOCK, VNON, VNON, VBAD,
+};
+int vttoif_tab[9] = { /* NOTE(review): presumably the reverse map, indexed by enum vtype to yield IF* type bits -- confirm against its users */
+ 0, IFREG, IFDIR, IFBLK, IFCHR, IFLNK, IFSOCK, IFIFO, IFMT,
+};
/*
- * Change notion of root (``/'') directory.
+ * Create a regular file
+ *
+ * Calls maknode() with a mode built by MAKEIMODE() from vap->va_type
+ * and vap->va_mode. On success the vnode of the new inode is stored
+ * in ndp->ni_vp and 0 is returned; otherwise maknode()'s error is
+ * returned and ndp->ni_vp is left untouched by this routine.
*/
-chroot()
+ufs_create(ndp, vap)
+ struct nameidata *ndp;
+ struct vattr *vap;
{
+ struct inode *ip;
+ int error;
- if (suser())
- chdirec(&u.u_rdir);
+ if (error = maknode(MAKEIMODE(vap->va_type, vap->va_mode), ndp, &ip))
+ return (error);
+ ndp->ni_vp = ITOV(ip);
+ return (0);
}
/*
- * Common routine for chroot and chdir.
+ * Mknod vnode call
+ *
+ * Creates the inode with maknode(), marks it IACC|IUPD|ICHG and, when
+ * vap->va_rdev is not VNOVAL, records that device number in i_rdev.
+ * The fresh vnode is then released with vput(), its type reset to
+ * VNON and it is passed to vgone(); nothing is handed back through
+ * ndp. Returns 0, or the error from maknode(). cred is unused.
*/
-chdirec(ipp)
- register struct inode **ipp;
+/* ARGSUSED */
+ufs_mknod(ndp, vap, cred)
+ struct nameidata *ndp;
+ struct ucred *cred;
+ struct vattr *vap;
{
- register struct inode *ip;
- struct a {
- char *fname;
- };
+ register struct vnode *vp;
+ struct inode *ip;
+ int error;
- ip = namei(uchar, LOOKUP, 1);
- if (ip == NULL)
- return;
- if ((ip->i_mode&IFMT) != IFDIR) {
- u.u_error = ENOTDIR;
- goto bad;
+ if (error = maknode(MAKEIMODE(vap->va_type, vap->va_mode), ndp, &ip))
+ return (error);
+ ip->i_flag |= IACC|IUPD|ICHG;
+ if (vap->va_rdev != VNOVAL) {
+ /*
+ * Want to be able to use this to make badblock
+ * inodes, so don't truncate the dev number.
+ */
+ ip->i_rdev = vap->va_rdev;
}
- if (access(ip, IEXEC))
- goto bad;
- iunlock(ip);
- if (*ipp)
- irele(*ipp);
- *ipp = ip;
- return;
-
-bad:
- iput(ip);
+ /*
+ * Remove inode so that it will be reloaded by iget and
+ * checked to see if it is an alias of an existing entry
+ * in the inode cache.
+ */
+ vp = ITOV(ip);
+ vput(vp);
+ vp->v_type = VNON;
+ vgone(vp);
+ return (0);
}
/*
- * Open system call.
+ * Open called.
+ *
+ * Nothing to do.
+ * Always returns 0; vp, mode and cred are unused.
*/
-open()
+/* ARGSUSED */
+ufs_open(vp, mode, cred)
+ struct vnode *vp;
+ int mode;
+ struct ucred *cred;
{
- struct a {
- char *fname;
- int mode;
- int crtmode;
- } *uap = (struct a *) u.u_ap;
- copen(uap->mode-FOPEN, uap->crtmode);
+ return (0);
}
/*
- * Creat system call.
+ * Close called
+ *
+ * Update the times on the inode.
+ *
+ * ITIMES() is applied with the current time only when the vnode has
+ * more than one reference (v_usecount > 1) and the inode is not
+ * marked ILOCKED; otherwise nothing is done here. Always returns 0;
+ * fflag and cred are unused.
*/
-creat()
+/* ARGSUSED */
+ufs_close(vp, fflag, cred)
+ struct vnode *vp;
+ int fflag;
+ struct ucred *cred;
{
- struct a {
- char *fname;
- int fmode;
- } *uap = (struct a *)u.u_ap;
+ register struct inode *ip = VTOI(vp);
- copen(FWRITE|FCREAT|FTRUNC, uap->fmode);
+ if (vp->v_usecount > 1 && !(ip->i_flag & ILOCKED))
+ ITIMES(ip, &time, &time);
+ return (0);
}
/*
- * Common code for open and creat.
- * Check permissions, allocate an open file structure,
- * and call the device open routine if any.
+ * Check mode permission on inode pointer. Mode is READ, WRITE or EXEC.
+ * The mode is shifted to select the owner/group/other fields. The
+ * super user is granted all permissions.
+ *
+ * Returns 0 when access is granted and EACCES when none of the
+ * requested bits is set in ip->i_mode for the class that was
+ * selected (owner, group or other).
+ * With QUOTA defined, a VWRITE request on a VREG, VDIR or VLNK vnode
+ * first calls getinoquota() and returns its error, if any; this
+ * happens before the super-user shortcut. With DIAGNOSTIC defined,
+ * calling this on a vnode that is not locked panics.
*/
-copen(mode, arg)
+ufs_access(vp, mode, cred)
+ struct vnode *vp;
register int mode;
- int arg;
+ struct ucred *cred;
{
- register struct inode *ip;
- register struct file *fp;
- int i;
-
-#ifdef notdef
- if ((mode&(FREAD|FWRITE)) == 0) {
- u.u_error = EINVAL;
- return;
+ register struct inode *ip = VTOI(vp);
+ register gid_t *gp;
+ int i, error;
+
+#ifdef DIAGNOSTIC
+ if (!VOP_ISLOCKED(vp)) {
+ vprint("ufs_access: not locked", vp);
+ panic("ufs_access: not locked");
}
#endif
- if (mode&FCREAT) {
- ip = namei(uchar, CREATE, 1);
- if (ip == NULL) {
- if (u.u_error)
- return;
- ip = maknode(arg&07777&(~ISVTX));
- if (ip == NULL)
- return;
- mode &= ~FTRUNC;
- } else {
- if (mode&FEXCL) {
- u.u_error = EEXIST;
- iput(ip);
- return;
- }
- mode &= ~FCREAT;
- }
- } else {
- ip = namei(uchar, LOOKUP, 1);
- if (ip == NULL)
- return;
- }
- if ((ip->i_mode & IFMT) == IFSOCK) {
- u.u_error = EOPNOTSUPP;
- goto bad;
- }
- if ((mode&FCREAT) == 0) {
- if (mode&FREAD)
- if (access(ip, IREAD))
- goto bad;
- if (mode&(FWRITE|FTRUNC)) {
- if (access(ip, IWRITE))
- goto bad;
- if ((ip->i_mode&IFMT) == IFDIR) {
- u.u_error = EISDIR;
- goto bad;
- }
+#ifdef QUOTA
+ if (mode & VWRITE) {
+ switch (vp->v_type) {
+ case VREG: case VDIR: case VLNK:
+ if (error = getinoquota(ip))
+ return (error);
}
}
- fp = falloc();
- if (fp == NULL)
- goto bad;
- if (mode&FTRUNC)
- itrunc(ip, (u_long)0);
- iunlock(ip);
- fp->f_flag = mode&FMASK;
- fp->f_type = DTYPE_INODE;
- fp->f_ops = &inodeops;
- fp->f_data = (caddr_t)ip;
- i = u.u_r.r_val1;
- if (setjmp(&u.u_qsave)) {
- if (u.u_error == 0)
- u.u_error = EINTR;
- u.u_ofile[i] = NULL;
- closef(fp);
- return;
+#endif /* QUOTA */
+ /*
+ * If you're the super-user, you always get access.
+ */
+ if (cred->cr_uid == 0)
+ return (0);
+ /*
+ * Access check is based on only one of owner, group, public.
+ * If not owner, then check group. If not a member of the
+ * group, then check public access.
+ */
+ if (cred->cr_uid != ip->i_uid) {
+ mode >>= 3;
+ gp = cred->cr_groups;
+ for (i = 0; i < cred->cr_ngroups; i++, gp++)
+ if (ip->i_gid == *gp)
+ goto found;
+ mode >>= 3;
+found:
+ ;
}
- u.u_error = openi(ip, mode);
- if (u.u_error == 0)
- return;
- u.u_ofile[i] = NULL;
- fp->f_count--;
- irele(ip);
- return;
-bad:
- iput(ip);
+ if ((ip->i_mode & mode) != 0)
+ return (0);
+ return (EACCES);
}
-/*
- * Mknod system call
- */
-mknod()
+/* ARGSUSED */
+ufs_getattr(vp, vap, cred) /* copy the attributes of the inode behind vp into *vap; always returns 0 */
+ struct vnode *vp;
+ register struct vattr *vap;
+ struct ucred *cred; /* unused */
{
- register struct inode *ip;
- register struct a {
- char *fname;
- int fmode;
- int dev;
- } *uap;
-
- uap = (struct a *)u.u_ap;
- if (!suser())
- return;
- ip = namei(uchar, CREATE, 0);
- if (ip != NULL) {
- u.u_error = EEXIST;
- goto out;
- }
- if (u.u_error)
- return;
- ip = maknode(uap->fmode);
- if (ip == NULL)
- return;
- switch (ip->i_mode & IFMT) {
-
- case IFMT: /* used by badsect to flag bad sectors */
- case IFCHR:
- case IFBLK:
- if (uap->dev) {
- /*
- * Want to be able to use this to make badblock
- * inodes, so don't truncate the dev number.
- */
- ip->i_rdev = uap->dev;
- ip->i_flag |= IACC|IUPD|ICHG;
- }
- }
+ register struct inode *ip = VTOI(vp);
-out:
- iput(ip);
+ ITIMES(ip, &time, &time); /* NOTE(review): presumably brings the in-core times up to date before they are copied out -- confirm against ITIMES */
+ /*
+ * Copy from inode table
+ */
+ vap->va_fsid = ip->i_dev;
+ vap->va_fileid = ip->i_number;
+ vap->va_mode = ip->i_mode & ~IFMT; /* type bits are dropped here; the type is reported through va_type below */
+ vap->va_nlink = ip->i_nlink;
+ vap->va_uid = ip->i_uid;
+ vap->va_gid = ip->i_gid;
+ vap->va_rdev = (dev_t)ip->i_rdev;
+#ifdef tahoe
+ vap->va_size = ip->i_size;
+ vap->va_size_rsv = 0;
+#else
+ vap->va_qsize = ip->i_din.di_qsize;
+#endif
+ vap->va_atime.tv_sec = ip->i_atime; /* only seconds are taken from the inode; tv_usec is zeroed */
+ vap->va_atime.tv_usec = 0;
+ vap->va_mtime.tv_sec = ip->i_mtime;
+ vap->va_mtime.tv_usec = 0;
+ vap->va_ctime.tv_sec = ip->i_ctime;
+ vap->va_ctime.tv_usec = 0;
+ vap->va_flags = ip->i_flags;
+ vap->va_gen = ip->i_gen;
+ /* this doesn't belong here */
+ if (vp->v_type == VBLK)
+ vap->va_blocksize = BLKDEV_IOSIZE;
+ else if (vp->v_type == VCHR)
+ vap->va_blocksize = MAXBSIZE;
+ else
+ vap->va_blocksize = ip->i_fs->fs_bsize;
+ vap->va_bytes = dbtob(ip->i_blocks);
+ vap->va_bytes_rsv = 0;
+ vap->va_type = vp->v_type;
+ return (0);
}
/*
- * link system call
+ * Set attribute vnode op. called from several syscalls
+ *
+ * Returns EINVAL if the caller tries to set va_type, va_nlink,
+ * va_fsid, va_fileid, va_blocksize, va_rdev, va_bytes or va_gen.
+ * Otherwise each remaining field that is not VNOVAL is applied in
+ * turn: uid/gid through chown1(), size through itrunc() (EISDIR for
+ * a directory), atime/mtime through iupdat(), mode through chmod1(),
+ * and flags directly on the inode. The time and flags updates
+ * require the caller to own the file or to pass suser(). Unless
+ * cred->cr_uid is 0, only the low 16 bits of the flags are replaced.
+ * NOTE(review): a chmod1() failure is not returned immediately; the
+ * flags step still runs, and the error is only reported by the final
+ * return unless the suser() call in the flags step overwrites it.
*/
-link()
+ufs_setattr(vp, vap, cred)
+ register struct vnode *vp;
+ register struct vattr *vap;
+ register struct ucred *cred;
{
- register struct inode *ip, *xp;
- register struct a {
- char *target;
- char *linkname;
- } *uap;
-
- uap = (struct a *)u.u_ap;
- ip = namei(uchar, LOOKUP, 1); /* well, this routine is doomed anyhow */
- if (ip == NULL)
- return;
- if ((ip->i_mode&IFMT) == IFDIR && !suser()) {
- iput(ip);
- return;
+ register struct inode *ip = VTOI(vp);
+ int error = 0;
+
+ /*
+ * Check for unsettable attributes.
+ */
+ if ((vap->va_type != VNON) || (vap->va_nlink != VNOVAL) ||
+ (vap->va_fsid != VNOVAL) || (vap->va_fileid != VNOVAL) ||
+ (vap->va_blocksize != VNOVAL) || (vap->va_rdev != VNOVAL) ||
+ ((int)vap->va_bytes != VNOVAL) || (vap->va_gen != VNOVAL)) {
+ return (EINVAL);
}
- ip->i_nlink++;
- ip->i_flag |= ICHG;
- iupdat(ip, &time, &time, 1);
- iunlock(ip);
- u.u_dirp = (caddr_t)uap->linkname;
- xp = namei(uchar, CREATE, 0);
- if (xp != NULL) {
- u.u_error = EEXIST;
- iput(xp);
- goto out;
+ /*
+ * Go through the fields and update iff not VNOVAL.
+ */
+ if (vap->va_uid != (u_short)VNOVAL || vap->va_gid != (u_short)VNOVAL)
+ if (error = chown1(vp, vap->va_uid, vap->va_gid, cred))
+ return (error);
+ if (vap->va_size != VNOVAL) {
+ if (vp->v_type == VDIR)
+ return (EISDIR);
+ if (error = itrunc(ip, vap->va_size, 0)) /* XXX IO_SYNC? */
+ return (error);
}
- if (u.u_error)
- goto out;
- if (u.u_pdir->i_dev != ip->i_dev) {
- iput(u.u_pdir);
- u.u_error = EXDEV;
- goto out;
+ if (vap->va_atime.tv_sec != VNOVAL || vap->va_mtime.tv_sec != VNOVAL) {
+ if (cred->cr_uid != ip->i_uid &&
+ (error = suser(cred, &u.u_acflag)))
+ return (error);
+ if (vap->va_atime.tv_sec != VNOVAL)
+ ip->i_flag |= IACC;
+ if (vap->va_mtime.tv_sec != VNOVAL)
+ ip->i_flag |= IUPD;
+ ip->i_flag |= ICHG;
+ if (error = iupdat(ip, &vap->va_atime, &vap->va_mtime, 1))
+ return (error);
}
- u.u_error = direnter(ip);
-out:
- if (u.u_error) {
- ip->i_nlink--;
+ if (vap->va_mode != (u_short)VNOVAL)
+ error = chmod1(vp, (int)vap->va_mode, cred);
+ if (vap->va_flags != VNOVAL) {
+ if (cred->cr_uid != ip->i_uid &&
+ (error = suser(cred, &u.u_acflag)))
+ return (error);
+ if (cred->cr_uid == 0) {
+ ip->i_flags = vap->va_flags;
+ } else {
+ ip->i_flags &= 0xffff0000;
+ ip->i_flags |= (vap->va_flags & 0xffff);
+ }
ip->i_flag |= ICHG;
}
- irele(ip);
+ return (error);
}
/*
- * symlink -- make a symbolic link
+ * Change the mode on a file.
+ * Inode must be locked before calling.
+ *
+ * The caller must own the file or pass suser(). A caller whose
+ * cr_uid is non-zero gets EFTYPE for asking for ISVTX on anything
+ * but a directory, and EPERM for asking for ISGID without being a
+ * member of the file's group. On success the low 12 mode bits
+ * (07777) are replaced by those of `mode', ICHG is set, and
+ * vnode_pager_uncache() is called when the vnode has VTEXT set and
+ * the new mode lacks ISVTX. Returns 0 or an errno value.
*/
-symlink()
+chmod1(vp, mode, cred)
+ register struct vnode *vp;
+ register int mode;
+ struct ucred *cred;
{
- register struct a {
- char *target;
- char *linkname;
- } *uap;
- register struct inode *ip;
- register char *tp;
- register c, nc;
-
- uap = (struct a *)u.u_ap;
- tp = uap->target;
- nc = 0;
- while (c = fubyte(tp)) {
- if (c < 0) {
- u.u_error = EFAULT;
- return;
- }
- tp++;
- nc++;
- }
- u.u_dirp = uap->linkname;
- ip = namei(uchar, CREATE, 0);
- if (ip) {
- iput(ip);
- u.u_error = EEXIST;
- return;
+ register struct inode *ip = VTOI(vp);
+ int error;
+
+ if (cred->cr_uid != ip->i_uid &&
+ (error = suser(cred, &u.u_acflag)))
+ return (error);
+ if (cred->cr_uid) {
+ if (vp->v_type != VDIR && (mode & ISVTX))
+ return (EFTYPE);
+ if (!groupmember(ip->i_gid, cred) && (mode & ISGID))
+ return (EPERM);
}
- if (u.u_error)
- return;
- ip = maknode(IFLNK | 0777);
- if (ip == NULL)
- return;
- u.u_error = rdwri(UIO_WRITE, ip, uap->target, nc, 0, 0, (int *)0);
- /* handle u.u_error != 0 */
- iput(ip);
+ ip->i_mode &= ~07777;
+ ip->i_mode |= mode & 07777;
+ ip->i_flag |= ICHG;
+ if ((vp->v_flag & VTEXT) && (ip->i_mode & ISVTX) == 0)
+ (void) vnode_pager_uncache(vp);
+ return (0);
}
/*
- * Unlink system call.
- * Hard to avoid races here, especially
- * in unlinking directories.
+ * Perform chown operation on inode ip;
+ * inode must be locked prior to call.
+ *
+ * A uid or gid equal to (u_short)VNOVAL means "keep the current
+ * value". suser() is required when the caller does not own the
+ * file, when the uid actually changes, or when the caller is not a
+ * member of the target group.
+ * With QUOTA defined, chkdq()/chkiq() are first called with negative
+ * deltas while the inode still carries the old ids, the ids are then
+ * switched, and the same amounts are charged again under the new
+ * ids. If that charge fails the old ids are put back, the usage is
+ * re-charged with FORCE, and the error is returned. Before each of
+ * these steps the dquot reference for an id that is not changing is
+ * released and set to NODQUOT.
+ * When an id really changes and cred->cr_uid is non-zero, the
+ * matching ISUID or ISGID bit is cleared. ICHG is set if either id
+ * changed. Returns 0 or an errno value.
*/
-unlink()
+chown1(vp, uid, gid, cred)
+ register struct vnode *vp;
+ uid_t uid;
+ gid_t gid;
+ struct ucred *cred;
{
- struct a {
- char *fname;
- };
- register struct inode *ip, *dp;
+ register struct inode *ip = VTOI(vp);
+ uid_t ouid;
+ gid_t ogid;
+ int error = 0;
+#ifdef QUOTA
+ register int i;
+ long change;
+#endif
- ip = namei(uchar, DELETE | LOCKPARENT, 0);
- if (ip == NULL)
- return;
- dp = u.u_pdir;
- if ((ip->i_mode&IFMT) == IFDIR && !suser())
- goto out;
+ if (uid == (u_short)VNOVAL)
+ uid = ip->i_uid;
+ if (gid == (u_short)VNOVAL)
+ gid = ip->i_gid;
/*
- * Don't unlink a mounted file.
+ * If we don't own the file, are trying to change the owner
+ * of the file, or are not a member of the target group,
+ * the caller must be superuser or the call fails.
*/
- if (ip->i_dev != dp->i_dev) {
- u.u_error = EBUSY;
- goto out;
+ if ((cred->cr_uid != ip->i_uid || uid != ip->i_uid ||
+ !groupmember((gid_t)gid, cred)) &&
+ (error = suser(cred, &u.u_acflag)))
+ return (error);
+ ouid = ip->i_uid;
+ ogid = ip->i_gid;
+#ifdef QUOTA
+ if (error = getinoquota(ip))
+ return (error);
+ if (ouid == uid) {
+ dqrele(vp, ip->i_dquot[USRQUOTA]);
+ ip->i_dquot[USRQUOTA] = NODQUOT;
}
- if (ip->i_flag&ITEXT)
- xrele(ip); /* try once to free text */
- if (dirremove()) {
- ip->i_nlink--;
- ip->i_flag |= ICHG;
+ if (ogid == gid) {
+ dqrele(vp, ip->i_dquot[GRPQUOTA]);
+ ip->i_dquot[GRPQUOTA] = NODQUOT;
}
-out:
- if (dp == ip)
- irele(ip);
- else
- iput(ip);
- iput(dp);
-}
-
-/*
- * Seek system call
- */
-lseek()
-{
- register struct file *fp;
- register struct a {
- int fd;
- off_t off;
- int sbase;
- } *uap;
-
- uap = (struct a *)u.u_ap;
- fp = getinode(uap->fd);
- if (fp == NULL)
- return;
- switch (uap->sbase) {
-
- case L_INCR:
- fp->f_offset += uap->off;
- break;
-
- case L_XTND:
- fp->f_offset = uap->off + ((struct inode *)fp->f_data)->i_size;
- break;
-
- case L_SET:
- fp->f_offset = uap->off;
- break;
-
- default:
- u.u_error = EINVAL;
- return;
+ change = ip->i_blocks;
+ (void) chkdq(ip, -change, cred, CHOWN);
+ (void) chkiq(ip, -1, cred, CHOWN);
+ for (i = 0; i < MAXQUOTAS; i++) {
+ dqrele(vp, ip->i_dquot[i]);
+ ip->i_dquot[i] = NODQUOT;
}
- u.u_r.r_off = fp->f_offset;
-}
-
-/*
- * Access system call
- */
-saccess()
-{
- register svuid, svgid;
- register struct inode *ip;
- register struct a {
- char *fname;
- int fmode;
- } *uap;
-
- uap = (struct a *)u.u_ap;
- svuid = u.u_uid;
- svgid = u.u_gid;
- u.u_uid = u.u_ruid;
- u.u_gid = u.u_rgid;
- ip = namei(uchar, LOOKUP, 1);
- if (ip != NULL) {
- if ((uap->fmode&R_OK) && access(ip, IREAD))
- goto done;
- if ((uap->fmode&W_OK) && access(ip, IWRITE))
- goto done;
- if ((uap->fmode&X_OK) && access(ip, IEXEC))
- goto done;
-done:
- iput(ip);
+#endif
+ ip->i_uid = uid;
+ ip->i_gid = gid;
+#ifdef QUOTA
+ if ((error = getinoquota(ip)) == 0) {
+ if (ouid == uid) {
+ dqrele(vp, ip->i_dquot[USRQUOTA]);
+ ip->i_dquot[USRQUOTA] = NODQUOT;
+ }
+ if (ogid == gid) {
+ dqrele(vp, ip->i_dquot[GRPQUOTA]);
+ ip->i_dquot[GRPQUOTA] = NODQUOT;
+ }
+ if ((error = chkdq(ip, change, cred, CHOWN)) == 0) {
+ if ((error = chkiq(ip, 1, cred, CHOWN)) == 0)
+ goto good;
+ else
+ (void) chkdq(ip, -change, cred, CHOWN|FORCE);
+ }
+ for (i = 0; i < MAXQUOTAS; i++) {
+ dqrele(vp, ip->i_dquot[i]);
+ ip->i_dquot[i] = NODQUOT;
+ }
+ }
+ ip->i_uid = ouid;
+ ip->i_gid = ogid;
+ if (getinoquota(ip) == 0) {
+ if (ouid == uid) {
+ dqrele(vp, ip->i_dquot[USRQUOTA]);
+ ip->i_dquot[USRQUOTA] = NODQUOT;
+ }
+ if (ogid == gid) {
+ dqrele(vp, ip->i_dquot[GRPQUOTA]);
+ ip->i_dquot[GRPQUOTA] = NODQUOT;
+ }
+ (void) chkdq(ip, change, cred, FORCE|CHOWN);
+ (void) chkiq(ip, 1, cred, FORCE|CHOWN);
+ (void) getinoquota(ip);
}
- u.u_uid = svuid;
- u.u_gid = svgid;
+ return (error);
+good:
+ if (getinoquota(ip))
+ panic("chown: lost quota");
+#endif /* QUOTA */
+ if (ouid != uid || ogid != gid)
+ ip->i_flag |= ICHG;
+ if (ouid != uid && cred->cr_uid != 0)
+ ip->i_mode &= ~ISUID;
+ if (ogid != gid && cred->cr_uid != 0)
+ ip->i_mode &= ~ISGID;
+ return (0);
}
/*
- * Stat system call. This version follows links.
+ * Vnode op for reading.
+ *
+ * Panics unless uio->uio_rw is UIO_READ and the inode is a
+ * directory, regular file or symbolic link. Returns 0 at once for
+ * a zero-length request and EINVAL for a negative offset. Otherwise
+ * marks the inode IACC and copies data out one file system block at
+ * a time with uiomove(), stopping at i_size. breada() is used when
+ * the block follows the last one read (vp->v_lastr) and the next
+ * block starts before i_size; bread() is used otherwise. A buffer
+ * is marked B_AGE once it has been consumed to the end of the block
+ * or the offset has reached i_size. ioflag and cred are unused.
*/
-stat()
+/* ARGSUSED */
+ufs_read(vp, uio, ioflag, cred)
+ struct vnode *vp;
+ register struct uio *uio;
+ int ioflag;
+ struct ucred *cred;
{
-
- stat1(1);
+ register struct inode *ip = VTOI(vp);
+ register struct fs *fs;
+ struct buf *bp;
+ daddr_t lbn, bn, rablock;
+ int size, diff, error = 0;
+ long n, on, type;
+
+ if (uio->uio_rw != UIO_READ)
+ panic("ufs_read mode");
+ type = ip->i_mode & IFMT;
+ if (type != IFDIR && type != IFREG && type != IFLNK)
+ panic("ufs_read type");
+ if (uio->uio_resid == 0)
+ return (0);
+ if (uio->uio_offset < 0)
+ return (EINVAL);
+ ip->i_flag |= IACC;
+ fs = ip->i_fs;
+ do {
+ lbn = lblkno(fs, uio->uio_offset);
+ on = blkoff(fs, uio->uio_offset);
+ n = MIN((unsigned)(fs->fs_bsize - on), uio->uio_resid);
+ diff = ip->i_size - uio->uio_offset;
+ if (diff <= 0)
+ return (0);
+ if (diff < n)
+ n = diff;
+ size = blksize(fs, ip, lbn);
+ rablock = lbn + 1;
+ if (vp->v_lastr + 1 == lbn &&
+ lblktosize(fs, rablock) < ip->i_size)
+ error = breada(ITOV(ip), lbn, size, rablock,
+ blksize(fs, ip, rablock), NOCRED, &bp);
+ else
+ error = bread(ITOV(ip), lbn, size, NOCRED, &bp);
+ vp->v_lastr = lbn;
+ n = MIN(n, size - bp->b_resid);
+ if (error) {
+ brelse(bp);
+ return (error);
+ }
+ error = uiomove(bp->b_un.b_addr + on, (int)n, uio);
+ if (n + on == fs->fs_bsize || uio->uio_offset == ip->i_size)
+ bp->b_flags |= B_AGE;
+ brelse(bp);
+ } while (error == 0 && uio->uio_resid > 0 && n != 0);
+ return (error);
}
/*
- * Lstat system call. This version does not follow links.
+ * Vnode op for writing.
+ *
+ * Panics unless uio->uio_rw is UIO_WRITE and the vnode is VREG, VLNK
+ * or VDIR (a directory write must carry IO_SYNC). IO_APPEND on a
+ * regular file moves the offset to i_size first. Returns EINVAL
+ * for a negative offset and 0 for a zero-length request. A
+ * regular-file write that would end beyond the RLIMIT_FSIZE soft
+ * limit posts SIGXFSZ to the process and returns EFBIG.
+ * Each pass of the loop obtains the block with balloc(), grows
+ * i_size if the write extends the file, copies the data in with
+ * uiomove() and then issues bwrite() (IO_SYNC), bawrite() (block
+ * filled to its end) or bdwrite(). IUPD|ICHG are set, and ISUID and
+ * ISGID are cleared when cred->cr_uid is non-zero.
+ * With IO_UNIT, an error truncates the file back to its original
+ * size and restores uio_offset and uio_resid. With IO_SYNC and no
+ * error, the inode is written out with iupdat().
*/
-lstat()
+ufs_write(vp, uio, ioflag, cred)
+ register struct vnode *vp;
+ struct uio *uio;
+ int ioflag;
+ struct ucred *cred;
{
+ register struct inode *ip = VTOI(vp);
+ register struct fs *fs;
+ struct buf *bp;
+ daddr_t lbn, bn;
+ u_long osize;
+ int n, on, flags;
+ int size, resid, error = 0;
+
+ if (uio->uio_rw != UIO_WRITE)
+ panic("ufs_write mode");
+ switch (vp->v_type) {
+ case VREG:
+ if (ioflag & IO_APPEND)
+ uio->uio_offset = ip->i_size;
+ /* fall through */
+ case VLNK:
+ break;
- stat1(0);
-}
-
-stat1(follow)
- int follow;
-{
- register struct inode *ip;
- register struct a {
- char *fname;
- struct stat *ub;
- } *uap;
- struct stat sb;
-
- uap = (struct a *)u.u_ap;
- ip = namei(uchar, LOOKUP, follow);
- if (ip == NULL)
- return;
- (void) ino_stat(ip, &sb);
- iput(ip);
- u.u_error = copyout((caddr_t)&sb, (caddr_t)uap->ub, sizeof (sb));
-}
+ case VDIR:
+ if ((ioflag & IO_SYNC) == 0)
+ panic("ufs_write nonsync dir write");
+ break;
-/*
- * Return target name of a symbolic link
- */
-readlink()
-{
- register struct inode *ip;
- register struct a {
- char *name;
- char *buf;
- int count;
- } *uap = (struct a *)u.u_ap;
- int resid;
-
- ip = namei(uchar, LOOKUP, 0);
- if (ip == NULL)
- return;
- if ((ip->i_mode&IFMT) != IFLNK) {
- u.u_error = ENXIO;
- goto out;
+ default:
+ panic("ufs_write type");
}
- u.u_error = rdwri(UIO_READ, ip, uap->buf, uap->count, 0, 0, &resid);
-out:
- iput(ip);
- u.u_r.r_val1 = uap->count - resid;
+ if (uio->uio_offset < 0)
+ return (EINVAL);
+ if (uio->uio_resid == 0)
+ return (0);
+ /*
+ * Maybe this should be above the vnode op call, but so long as
+ * file servers have no limits, i don't think it matters
+ */
+ if (vp->v_type == VREG &&
+ uio->uio_offset + uio->uio_resid >
+ u.u_rlimit[RLIMIT_FSIZE].rlim_cur) {
+ psignal(u.u_procp, SIGXFSZ);
+ return (EFBIG);
+ }
+ resid = uio->uio_resid;
+ osize = ip->i_size;
+ fs = ip->i_fs;
+ flags = 0;
+ if (ioflag & IO_SYNC)
+ flags = B_SYNC;
+ do {
+ lbn = lblkno(fs, uio->uio_offset);
+ on = blkoff(fs, uio->uio_offset);
+ n = MIN((unsigned)(fs->fs_bsize - on), uio->uio_resid);
+ if (n < fs->fs_bsize)
+ flags |= B_CLRBUF;
+ else
+ flags &= ~B_CLRBUF;
+ if (error = balloc(ip, lbn, (int)(on + n), &bp, flags))
+ break;
+ bn = bp->b_blkno;
+ if (uio->uio_offset + n > ip->i_size) {
+ ip->i_size = uio->uio_offset + n;
+ vnode_pager_setsize(vp, ip->i_size);
+ }
+ size = blksize(fs, ip, lbn);
+ (void) vnode_pager_uncache(vp);
+ n = MIN(n, size - bp->b_resid);
+ error = uiomove(bp->b_un.b_addr + on, n, uio);
+ if (ioflag & IO_SYNC)
+ (void) bwrite(bp);
+ else if (n + on == fs->fs_bsize) {
+ bp->b_flags |= B_AGE;
+ bawrite(bp);
+ } else
+ bdwrite(bp);
+ ip->i_flag |= IUPD|ICHG;
+ if (cred->cr_uid != 0)
+ ip->i_mode &= ~(ISUID|ISGID);
+ } while (error == 0 && uio->uio_resid > 0 && n != 0);
+ if (error && (ioflag & IO_UNIT)) {
+ (void) itrunc(ip, osize, ioflag & IO_SYNC);
+ uio->uio_offset -= resid - uio->uio_resid;
+ uio->uio_resid = resid;
+ }
+ if (!error && (ioflag & IO_SYNC))
+ error = iupdat(ip, &time, &time, 1);
+ return (error);
}
-/*
- * Change mode of a file given path name.
- */
-chmod()
+/* ARGSUSED */
+ufs_ioctl(vp, com, data, fflag, cred) /* no request is handled here: always returns ENOTTY, all arguments unused */
+ struct vnode *vp;
+ int com;
+ caddr_t data;
+ int fflag;
+ struct ucred *cred;
{
- struct inode *ip;
- struct a {
- char *fname;
- int fmode;
- } *uap;
- uap = (struct a *)u.u_ap;
- if ((ip = owner(1)) == NULL)
- return;
- chmod1(ip, uap->fmode);
- iput(ip);
+ return (ENOTTY);
}
-/*
- * Change mode of a file given a file descriptor.
- */
-fchmod()
+/* ARGSUSED */
+ufs_select(vp, which, fflags, cred) /* always returns 1, whatever is asked for; all arguments unused */
+ struct vnode *vp;
+ int which, fflags;
+ struct ucred *cred;
{
- struct a {
- int fd;
- int fmode;
- } *uap;
- register struct inode *ip;
- register struct file *fp;
- uap = (struct a *)u.u_ap;
- fp = getinode(uap->fd);
- if (fp == NULL)
- return;
- ip = (struct inode *)fp->f_data;
- if (u.u_uid != ip->i_uid && !suser())
- return;
- ilock(ip);
- chmod1(ip, uap->fmode);
- iunlock(ip);
+ return (1); /* XXX */
}
/*
- * Change the mode on a file.
- * Inode must be locked before calling.
+ * Mmap a file
+ *
+ * NB Currently unsupported.
+ * Always returns EINVAL; vp, fflags and cred are unused.
*/
-chmod1(ip, mode)
- register struct inode *ip;
- register int mode;
+/* ARGSUSED */
+ufs_mmap(vp, fflags, cred)
+ struct vnode *vp;
+ int fflags;
+ struct ucred *cred;
{
- ip->i_mode &= ~07777;
- if (u.u_uid) {
- mode &= ~ISVTX;
- if (!groupmember(ip->i_gid))
- mode &= ~ISGID;
- }
- ip->i_mode |= mode&07777;
- ip->i_flag |= ICHG;
- if (ip->i_flag&ITEXT && (ip->i_mode&ISVTX)==0)
- xrele(ip);
+ return (EINVAL);
}
/*
- * Set ownership given a path name.
- */
-chown()
-{
- struct inode *ip;
- struct a {
- char *fname;
- int uid;
- int gid;
- } *uap;
-
- uap = (struct a *)u.u_ap;
- if (!suser() || (ip = owner(0)) == NULL)
- return;
- u.u_error = chown1(ip, uap->uid, uap->gid);
- iput(ip);
-}
-
-/*
- * Set ownership given a file descriptor.
+ * Synch an open file.
+ *
+ * Sets ICHG on the inode when fflags has FWRITE, flushes the vnode's
+ * buffers with vflushbuf() (B_SYNC when waitfor is MNT_WAIT, 0
+ * otherwise), then returns the result of iupdat(), which is passed
+ * (waitfor == MNT_WAIT) as its last argument. cred is unused.
*/
-fchown()
+/* ARGSUSED */
+ufs_fsync(vp, fflags, cred, waitfor)
+ struct vnode *vp;
+ int fflags;
+ struct ucred *cred;
+ int waitfor;
{
- struct a {
- int fd;
- int uid;
- int gid;
- } *uap;
- register struct inode *ip;
- register struct file *fp;
+ struct inode *ip = VTOI(vp);
- uap = (struct a *)u.u_ap;
- fp = getinode(uap->fd);
- if (fp == NULL)
- return;
- ip = (struct inode *)fp->f_data;
- if (!suser())
- return;
- ilock(ip);
- u.u_error = chown1(ip, uap->uid, uap->gid);
- iunlock(ip);
+ if (fflags&FWRITE)
+ ip->i_flag |= ICHG;
+ vflushbuf(vp, waitfor == MNT_WAIT ? B_SYNC : 0);
+ return (iupdat(ip, &time, &time, waitfor == MNT_WAIT));
}
/*
- * Perform chown operation on inode ip;
- * inode must be locked prior to call.
+ * Seek on a file
+ *
+ * Nothing to do, so just return.
+ * Always returns 0; vp, oldoff, newoff and cred are unused.
*/
-chown1(ip, uid, gid)
- register struct inode *ip;
- int uid, gid;
+/* ARGSUSED */
+ufs_seek(vp, oldoff, newoff, cred)
+ struct vnode *vp;
+ off_t oldoff, newoff;
+ struct ucred *cred;
{
-#ifdef QUOTA
- register long change;
-#endif
- if (uid == -1)
- uid = ip->i_uid;
- if (gid == -1)
- gid = ip->i_gid;
-#ifdef QUOTA
- if (ip->i_uid == uid) /* this just speeds things a little */
- change = 0;
- else
- change = ip->i_blocks;
- (void) chkdq(ip, -change, 1);
- (void) chkiq(ip->i_dev, ip, ip->i_uid, 1);
- dqrele(ip->i_dquot);
-#endif
- ip->i_uid = uid;
- ip->i_gid = gid;
- ip->i_flag |= ICHG;
- if (u.u_ruid != 0)
- ip->i_mode &= ~(ISUID|ISGID);
-#ifdef QUOTA
- ip->i_dquot = inoquota(ip);
- (void) chkdq(ip, change, 1);
- (void) chkiq(ip->i_dev, (struct inode *)NULL, uid, 1);
- return (u.u_error); /* should == 0 ALWAYS !! */
-#else
return (0);
-#endif
-}
-
-utimes()
-{
- register struct a {
- char *fname;
- struct timeval *tptr;
- } *uap = (struct a *)u.u_ap;
- register struct inode *ip;
- struct timeval tv[2];
-
- if ((ip = owner(1)) == NULL)
- return;
- u.u_error = copyin((caddr_t)uap->tptr, (caddr_t)tv, sizeof (tv));
- if (u.u_error == 0) {
- ip->i_flag |= IACC|IUPD|ICHG;
- iupdat(ip, &tv[0], &tv[1], 0);
- }
- iput(ip);
}
/*
- * Flush any pending I/O.
- */
-sync()
-{
-
- update();
-}
-
-/*
- * Truncate a file given its path name.
+ * ufs remove
+ * Hard to avoid races here, especially
+ * in unlinking directories.
+ *
+ * Removes the directory entry described by ndp with dirremove() and,
+ * on success, decrements the link count of the target inode and
+ * marks it ICHG. Both ndp->ni_vp and ndp->ni_dvp are released
+ * before returning: vrele() is used for the target when it is the
+ * same inode as the directory, iput() otherwise, and the directory
+ * is always released with iput(). Returns dirremove()'s result.
*/
-truncate()
+ufs_remove(ndp)
+ struct nameidata *ndp;
{
- struct a {
- char *fname;
- u_long length;
- } *uap = (struct a *)u.u_ap;
- struct inode *ip;
+ register struct inode *ip, *dp;
+ int error;
- ip = namei(uchar, LOOKUP, 1);
- if (ip == NULL)
- return;
- if (access(ip, IWRITE))
- goto bad;
- if ((ip->i_mode&IFMT) == IFDIR) {
- u.u_error = EISDIR;
- goto bad;
+ ip = VTOI(ndp->ni_vp);
+ dp = VTOI(ndp->ni_dvp);
+ error = dirremove(ndp);
+ if (!error) {
+ ip->i_nlink--;
+ ip->i_flag |= ICHG;
}
- itrunc(ip, uap->length);
-bad:
- iput(ip);
+ if (dp == ip)
+ vrele(ITOV(ip));
+ else
+ iput(ip);
+ iput(dp);
+ return (error);
}
/*
- * Truncate a file given a file descriptor.
+ * link vnode call
+ *
+ * Adds the directory entry described by ndp for the inode behind vp.
+ * The inode is locked for the duration unless it is also the target
+ * directory (ndp->ni_dvp == vp). The link count is bumped and the
+ * inode written with iupdat() before direnter() is called; if either
+ * of those steps fails the bump is undone while the lock is still
+ * held. Returns 0, EMLINK when the link count is already at
+ * LINK_MAX - 1, or the error from iupdat() or direnter().
*/
-ftruncate()
+ufs_link(vp, ndp)
+ register struct vnode *vp;
+ register struct nameidata *ndp;
{
- struct a {
- int fd;
- u_long length;
- } *uap = (struct a *)u.u_ap;
- struct inode *ip;
- struct file *fp;
+ register struct inode *ip = VTOI(vp);
+ int error;
- fp = getinode(uap->fd);
- if (fp == NULL)
- return;
- if ((fp->f_flag&FWRITE) == 0) {
- u.u_error = EINVAL;
- return;
+ if (ndp->ni_dvp != vp)
+ ILOCK(ip);
+ if (ip->i_nlink == LINK_MAX - 1) {
+ /* Nothing has been changed yet, so there is nothing to undo. */
+ error = EMLINK;
+ goto out;
}
- ip = (struct inode *)fp->f_data;
- ilock(ip);
- itrunc(ip, uap->length);
- iunlock(ip);
-}
-
-/*
- * Synch an open file.
- */
-fsync()
-{
- struct a {
- int fd;
- } *uap = (struct a *)u.u_ap;
- struct inode *ip;
- struct file *fp;
-
- fp = getinode(uap->fd);
- if (fp == NULL)
- return;
- ip = (struct inode *)fp->f_data;
- ilock(ip);
- syncip(ip);
- iunlock(ip);
+ ip->i_nlink++;
+ ip->i_flag |= ICHG;
+ error = iupdat(ip, &time, &time, 1);
+ if (!error)
+ error = direnter(ip, ndp);
+ if (error) {
+ /*
+ * Undo the bump made above. This must stay ahead of
+ * the `out' label: the EMLINK path jumps there without
+ * having incremented i_nlink, so it must not be
+ * decremented on that path.
+ */
+ ip->i_nlink--;
+ ip->i_flag |= ICHG;
+ }
+out:
+ if (ndp->ni_dvp != vp)
+ IUNLOCK(ip);
+ return (error);
}
/*
* Basic algorithm is:
*
* 1) Bump link count on source while we're linking it to the
- * target. This also insure the inode won't be deleted out
- * from underneath us while we work.
+ * target. This also ensures the inode won't be deleted out
+ * from underneath us while we work (it may be truncated by
+ * a concurrent `trunc' or `open' for creation).
* 2) Link source to destination. If destination already exists,
* delete it first.
- * 3) Unlink source reference to inode if still around.
- * 4) If a directory was moved and the parent of the destination
+ * 3) Unlink source reference to inode if still around. If a
+ * directory was moved and the parent of the destination
* is different from the source, patch the ".." entry in the
* directory.
- *
- * Source and destination must either both be directories, or both
- * not be directories. If target is a directory, it must be empty.
*/
-rename()
+ufs_rename(fndp, tndp)
+ register struct nameidata *fndp, *tndp;
{
- struct a {
- char *from;
- char *to;
- } *uap;
register struct inode *ip, *xp, *dp;
- int oldparent, parentdifferent, doingdirectory;
+ struct dirtemplate dirbuf;
+ int doingdirectory = 0, oldparent = 0, newparent = 0;
int error = 0;
- uap = (struct a *)u.u_ap;
- ip = namei(uchar, DELETE | LOCKPARENT, 0);
- if (ip == NULL)
- return;
- dp = u.u_pdir;
- oldparent = 0, doingdirectory = 0;
+ dp = VTOI(fndp->ni_dvp);
+ ip = VTOI(fndp->ni_vp);
+ ILOCK(ip);
if ((ip->i_mode&IFMT) == IFDIR) {
- register struct direct *d;
+ register struct direct *d = &fndp->ni_dent;
- d = &u.u_dent;
/*
* Avoid ".", "..", and aliases of "." for obvious reasons.
*/
- if ((d->d_namlen == 1 && d->d_name[0] == '.') ||
- (d->d_namlen == 2 && bcmp(d->d_name, "..", 2) == 0) ||
- (dp == ip)) {
- iput(dp);
- if (dp == ip)
- irele(ip);
- else
- iput(ip);
- u.u_error = EINVAL;
- return;
+ if ((d->d_namlen == 1 && d->d_name[0] == '.') || dp == ip ||
+ fndp->ni_isdotdot || (ip->i_flag & IRENAME)) {
+ VOP_ABORTOP(tndp);
+ vput(tndp->ni_dvp);
+ if (tndp->ni_vp)
+ vput(tndp->ni_vp);
+ VOP_ABORTOP(fndp);
+ vrele(fndp->ni_dvp);
+ vput(fndp->ni_vp);
+ return (EINVAL);
}
+ ip->i_flag |= IRENAME;
oldparent = dp->i_number;
doingdirectory++;
}
- iput(dp);
+ vrele(fndp->ni_dvp);
/*
* 1) Bump link count while we're moving stuff
*/
ip->i_nlink++;
ip->i_flag |= ICHG;
- iupdat(ip, &time, &time, 1);
- iunlock(ip);
+ error = iupdat(ip, &time, &time, 1);
+ IUNLOCK(ip);
/*
* When the target exists, both the directory
- * and target inodes are returned locked.
+ * and target vnodes are returned locked.
*/
- u.u_dirp = (caddr_t)uap->to;
- xp = namei(uchar, CREATE | LOCKPARENT | NOCACHE, 0);
- if (u.u_error) {
- error = u.u_error;
- goto out;
- }
- dp = u.u_pdir;
+ dp = VTOI(tndp->ni_dvp);
+ xp = NULL;
+ if (tndp->ni_vp)
+ xp = VTOI(tndp->ni_vp);
/*
* If ".." must be changed (ie the directory gets a new
* parent) then the source directory must not be in the
* to namei, as the parent directory is unlocked by the
* call to checkpath().
*/
- parentdifferent = oldparent != dp->i_number;
- if (doingdirectory && parentdifferent) {
- if (access(ip, IWRITE))
+ if (oldparent != dp->i_number)
+ newparent = dp->i_number;
+ if (doingdirectory && newparent) {
+ VOP_LOCK(fndp->ni_vp);
+ error = ufs_access(fndp->ni_vp, VWRITE, tndp->ni_cred);
+ VOP_UNLOCK(fndp->ni_vp);
+ if (error)
goto bad;
+ tndp->ni_nameiop = RENAME | LOCKPARENT | LOCKLEAF | NOCACHE;
do {
- dp = u.u_pdir;
+ dp = VTOI(tndp->ni_dvp);
if (xp != NULL)
iput(xp);
- u.u_error = checkpath(ip, dp);
- if (u.u_error)
+ if (error = checkpath(ip, dp, tndp->ni_cred))
goto out;
- u.u_dirp = (caddr_t)uap->to;
- xp = namei(uchar, CREATE | LOCKPARENT | NOCACHE, 0);
- if (u.u_error) {
- error = u.u_error;
+ if (error = namei(tndp))
goto out;
- }
- } while (dp != u.u_pdir);
+ xp = NULL;
+ if (tndp->ni_vp)
+ xp = VTOI(tndp->ni_vp);
+ } while (dp != VTOI(tndp->ni_dvp));
}
/*
* 2) If target doesn't exist, link the target
* expunge the original entry's existence.
*/
if (xp == NULL) {
- if (dp->i_dev != ip->i_dev) {
- error = EXDEV;
- goto bad;
- }
+ if (dp->i_dev != ip->i_dev)
+ panic("rename: EXDEV");
/*
- * Account for ".." in directory.
- * When source and destination have the
- * same parent we don't fool with the
- * link count -- this isn't required
- * because we do a similar check below.
+ * Account for ".." in new directory.
+ * When source and destination have the same
+ * parent we don't fool with the link count.
*/
- if (doingdirectory && parentdifferent) {
+ if (doingdirectory && newparent) {
dp->i_nlink++;
dp->i_flag |= ICHG;
- iupdat(dp, &time, &time, 1);
+ error = iupdat(dp, &time, &time, 1);
}
- error = direnter(ip);
- if (error)
+ if (error = direnter(ip, tndp))
goto out;
} else {
- if (xp->i_dev != dp->i_dev || xp->i_dev != ip->i_dev) {
- error = EXDEV;
- goto bad;
- }
+ if (xp->i_dev != dp->i_dev || xp->i_dev != ip->i_dev)
+ panic("rename: EXDEV");
/*
* Short circuit rename(foo, foo).
*/
if (xp->i_number == ip->i_number)
+ panic("rename: same file");
+ /*
+ * If the parent directory is "sticky", then the user must
+ * own the parent directory, or the destination of the rename,
+ * otherwise the destination may not be changed (except by
+ * root). This implements append-only directories.
+ */
+ if ((dp->i_mode & ISVTX) && tndp->ni_cred->cr_uid != 0 &&
+ tndp->ni_cred->cr_uid != dp->i_uid &&
+ xp->i_uid != tndp->ni_cred->cr_uid) {
+ error = EPERM;
goto bad;
+ }
/*
* Target must be empty if a directory
* and have no links to it.
* not directories).
*/
if ((xp->i_mode&IFMT) == IFDIR) {
- if (!dirempty(xp) || xp->i_nlink > 2) {
+ if (!dirempty(xp, dp->i_number, tndp->ni_cred) ||
+ xp->i_nlink > 2) {
error = ENOTEMPTY;
goto bad;
}
error = ENOTDIR;
goto bad;
}
+ cache_purge(ITOV(dp));
} else if (doingdirectory) {
error = EISDIR;
goto bad;
}
- dirrewrite(dp, ip);
- if (u.u_error) {
- error = u.u_error;
- goto bad1;
+ if (error = dirrewrite(dp, ip, tndp))
+ goto bad;
+ /*
+ * If the target directory is in the same
+ * directory as the source directory,
+ * decrement the link count on the parent
+ * of the target directory.
+ */
+ if (doingdirectory && !newparent) {
+ dp->i_nlink--;
+ dp->i_flag |= ICHG;
}
+ vput(ITOV(dp));
/*
* Adjust the link count of the target to
* reflect the dirrewrite above. If this is
* no links to it, so we can squash the inode and
* any space associated with it. We disallowed
* renaming over top of a directory with links to
- * it above, as we've no way to determine if
- * we've got a link or the directory itself, and
- * if we get a link, then ".." will be screwed up.
+ * it above, as the remaining link would point to
+ * a directory without "." or ".." entries.
*/
xp->i_nlink--;
if (doingdirectory) {
if (--xp->i_nlink != 0)
panic("rename: linked directory");
- itrunc(xp, (u_long)0);
+ error = itrunc(xp, (u_long)0, IO_SYNC);
}
xp->i_flag |= ICHG;
iput(xp);
/*
* 3) Unlink the source.
*/
- u.u_dirp = uap->from;
- dp = namei(uchar, DELETE, 0);
+ fndp->ni_nameiop = DELETE | LOCKPARENT | LOCKLEAF;
+ (void)namei(fndp);
+ if (fndp->ni_vp != NULL) {
+ xp = VTOI(fndp->ni_vp);
+ dp = VTOI(fndp->ni_dvp);
+ } else {
+ if (fndp->ni_dvp != NULL)
+ vput(fndp->ni_dvp);
+ xp = NULL;
+ dp = NULL;
+ }
/*
- * Insure directory entry still exists and
- * has not changed since the start of all
- * this. If either has occured, forget about
- * about deleting the original entry and just
- * adjust the link count in the inode.
+ * Ensure that the directory entry still exists and has not
+ * changed while the new name has been entered. If the source is
+ * a file then the entry may have been unlinked or renamed. In
+ * either case there is no further work to be done. If the source
+ * is a directory then it cannot have been rmdir'ed; its link
+ * count of three would cause a rmdir to fail with ENOTEMPTY.
+ * The IRENAME flag ensures that it cannot be moved by another
+ * rename.
*/
- if (dp == NULL || u.u_dent.d_ino != ip->i_number) {
- ip->i_nlink--;
- ip->i_flag |= ICHG;
+ if (xp != ip) {
+ if (doingdirectory)
+ panic("rename: lost dir entry");
} else {
/*
- * If source is a directory, must adjust
- * link count of parent directory also.
- * If target didn't exist and source and
- * target have the same parent, then we
- * needn't touch the link count, it all
- * balances out in the end. Otherwise, we
- * must do so to reflect deletion of ".."
- * done above.
+ * If the source is a directory with a
+ * new parent, the link count of the old
+ * parent directory must be decremented
+ * and ".." set to point to the new parent.
*/
- if (doingdirectory && (xp != NULL || parentdifferent)) {
+ if (doingdirectory && newparent) {
dp->i_nlink--;
dp->i_flag |= ICHG;
+ error = vn_rdwr(UIO_READ, ITOV(xp), (caddr_t)&dirbuf,
+ sizeof (struct dirtemplate), (off_t)0,
+ UIO_SYSSPACE, IO_NODELOCKED,
+ tndp->ni_cred, (int *)0);
+ if (error == 0) {
+ if (dirbuf.dotdot_namlen != 2 ||
+ dirbuf.dotdot_name[0] != '.' ||
+ dirbuf.dotdot_name[1] != '.') {
+ dirbad(xp, 12, "rename: mangled dir");
+ } else {
+ dirbuf.dotdot_ino = newparent;
+ (void) vn_rdwr(UIO_WRITE, ITOV(xp),
+ (caddr_t)&dirbuf,
+ sizeof (struct dirtemplate),
+ (off_t)0, UIO_SYSSPACE,
+ IO_NODELOCKED|IO_SYNC,
+ tndp->ni_cred, (int *)0);
+ cache_purge(ITOV(dp));
+ }
+ }
}
- if (dirremove()) {
- ip->i_nlink--;
- ip->i_flag |= ICHG;
+ error = dirremove(fndp);
+ if (!error) {
+ xp->i_nlink--;
+ xp->i_flag |= ICHG;
}
- if (error == 0) /* conservative */
- error = u.u_error;
+ xp->i_flag &= ~IRENAME;
}
- irele(ip);
if (dp)
- iput(dp);
-
- /*
- * 4) Renaming a directory with the parent
- * different requires ".." to be rewritten.
- * The window is still there for ".." to
- * be inconsistent, but this is unavoidable,
- * and a lot shorter than when it was done
- * in a user process.
- */
- if (doingdirectory && parentdifferent && error == 0) {
- struct dirtemplate dirbuf;
-
- u.u_dirp = uap->to;
- ip = namei(uchar, LOOKUP | LOCKPARENT, 0);
- if (ip == NULL) {
- printf("rename: .. went away\n");
- return;
- }
- dp = u.u_pdir;
- if ((ip->i_mode&IFMT) != IFDIR) {
- printf("rename: .. not a directory\n");
- goto stuck;
- }
- error = rdwri(UIO_READ, ip, (caddr_t)&dirbuf,
- sizeof (struct dirtemplate), (off_t)0, 1, (int *)0);
- if (error == 0) {
- dirbuf.dotdot_ino = dp->i_number;
- (void) rdwri(UIO_WRITE, ip, (caddr_t)&dirbuf,
- sizeof (struct dirtemplate), (off_t)0, 1, (int *)0);
- }
-stuck:
- irele(dp);
- iput(ip);
- }
- goto done;
-
-bad:
- iput(dp);
-bad1:
+ vput(ITOV(dp));
if (xp)
- iput(xp);
-out:
- ip->i_nlink--;
- ip->i_flag |= ICHG;
- irele(ip);
-done:
- if (error)
- u.u_error = error;
-}
-
-/*
- * Make a new file.
- */
-struct inode *
-maknode(mode)
- int mode;
-{
- register struct inode *ip;
- ino_t ipref;
+ vput(ITOV(xp));
+ vrele(ITOV(ip));
+ return (error);
- if ((mode & IFMT) == IFDIR)
- ipref = dirpref(u.u_pdir->i_fs);
- else
- ipref = u.u_pdir->i_number;
- ip = ialloc(u.u_pdir, ipref, mode);
- if (ip == NULL) {
- iput(u.u_pdir);
- return (NULL);
- }
-#ifdef QUOTA
- if (ip->i_dquot != NODQUOT)
- panic("maknode: dquot");
-#endif
- ip->i_flag |= IACC|IUPD|ICHG;
- if ((mode & IFMT) == 0)
- mode |= IFREG;
- ip->i_mode = mode & ~u.u_cmask;
- ip->i_nlink = 1;
- ip->i_uid = u.u_uid;
- ip->i_gid = u.u_pdir->i_gid;
- if (ip->i_mode & ISGID && !groupmember(ip->i_gid))
- ip->i_mode &= ~ISGID;
-#ifdef QUOTA
- ip->i_dquot = inoquota(ip);
-#endif
-
- /*
- * Make sure inode goes to disk before directory entry.
- */
- iupdat(ip, &time, &time, 1);
- u.u_error = direnter(ip);
- if (u.u_error) {
- /*
- * Write error occurred trying to update directory
- * so must deallocate the inode.
- */
- ip->i_nlink = 0;
- ip->i_flag |= ICHG;
- iput(ip);
- return (NULL);
- }
- return (ip);
+bad:
+ if (xp)
+ vput(ITOV(xp));
+ vput(ITOV(dp));
+out:
+ ip->i_nlink--;
+ ip->i_flag |= ICHG;
+ vrele(ITOV(ip));
+ return (error);
}
/*
/*
* Mkdir system call
*/
-mkdir()
+ufs_mkdir(ndp, vap)
+ struct nameidata *ndp;
+ struct vattr *vap;
{
- struct a {
- char *name;
- int dmode;
- } *uap;
register struct inode *ip, *dp;
+ struct inode *tip;
+ struct vnode *dvp;
struct dirtemplate dirtemplate;
+ int error;
+ int dmode;
- uap = (struct a *)u.u_ap;
- ip = namei(uchar, CREATE, 0);
- if (u.u_error)
- return;
- if (ip != NULL) {
- iput(ip);
- u.u_error = EEXIST;
- return;
- }
- dp = u.u_pdir;
- uap->dmode &= 0777;
- uap->dmode |= IFDIR;
+ dvp = ndp->ni_dvp;
+ dp = VTOI(dvp);
+ dmode = vap->va_mode&0777;
+ dmode |= IFDIR;
/*
* Must simulate part of maknode here
* in order to acquire the inode, but
* directory. The entry is made later
* after writing "." and ".." entries out.
*/
- ip = ialloc(dp, dirpref(dp->i_fs), uap->dmode);
- if (ip == NULL) {
+ if (error = ialloc(dp, dirpref(dp->i_fs), dmode, ndp->ni_cred, &tip)) {
iput(dp);
- return;
+ return (error);
}
+ ip = tip;
+ ip->i_uid = ndp->ni_cred->cr_uid;
+ ip->i_gid = dp->i_gid;
#ifdef QUOTA
- if (ip->i_dquot != NODQUOT)
- panic("mkdir: dquot");
+ if ((error = getinoquota(ip)) ||
+ (error = chkiq(ip, 1, ndp->ni_cred, 0))) {
+ ifree(ip, ip->i_number, dmode);
+ iput(ip);
+ iput(dp);
+ return (error);
+ }
#endif
ip->i_flag |= IACC|IUPD|ICHG;
- ip->i_mode = uap->dmode & ~u.u_cmask;
+ ip->i_mode = dmode;
+ ITOV(ip)->v_type = VDIR; /* Rest init'd in iget() */
ip->i_nlink = 2;
- ip->i_uid = u.u_uid;
- ip->i_gid = dp->i_gid;
-#ifdef QUOTA
- ip->i_dquot = inoquota(ip);
-#endif
- iupdat(ip, &time, &time, 1);
+ error = iupdat(ip, &time, &time, 1);
/*
* Bump link count in parent directory
*/
dp->i_nlink++;
dp->i_flag |= ICHG;
- iupdat(dp, &time, &time, 1);
+ error = iupdat(dp, &time, &time, 1);
/*
* Initialize directory with "."
dirtemplate = mastertemplate;
dirtemplate.dot_ino = ip->i_number;
dirtemplate.dotdot_ino = dp->i_number;
- u.u_error = rdwri(UIO_WRITE, ip, (caddr_t)&dirtemplate,
- sizeof (dirtemplate), (off_t)0, 1, (int *)0);
- if (u.u_error) {
+ error = vn_rdwr(UIO_WRITE, ITOV(ip), (caddr_t)&dirtemplate,
+ sizeof (dirtemplate), (off_t)0, UIO_SYSSPACE,
+ IO_NODELOCKED|IO_SYNC, ndp->ni_cred, (int *)0);
+ if (error) {
dp->i_nlink--;
dp->i_flag |= ICHG;
goto bad;
}
+ if (DIRBLKSIZ > dp->i_fs->fs_fsize) {
+ panic("mkdir: blksize"); /* XXX - should grow w/balloc() */
+ } else {
+ ip->i_size = DIRBLKSIZ;
+ ip->i_flag |= ICHG;
+ }
/*
* Directory all set up, now
* install the entry for it in
* the parent directory.
*/
- u.u_error = direnter(ip);
+ error = direnter(ip, ndp);
dp = NULL;
- if (u.u_error) {
- u.u_dirp = uap->name;
- dp = namei(uchar, LOOKUP | NOCACHE, 0);
- if (dp) {
+ if (error) {
+ ndp->ni_nameiop = LOOKUP | NOCACHE;
+ error = namei(ndp);
+ if (!error) {
+ dp = VTOI(ndp->ni_vp);
dp->i_nlink--;
dp->i_flag |= ICHG;
}
bad:
/*
* No need to do an explicit itrunc here,
- * irele will do this for us because we set
+ * vrele will do this for us because we set
* the link count to 0.
*/
- if (u.u_error) {
+ if (error) {
ip->i_nlink = 0;
ip->i_flag |= ICHG;
- }
+ iput(ip);
+ } else
+ ndp->ni_vp = ITOV(ip);
if (dp)
iput(dp);
- iput(ip);
+ return (error);
}
/*
* Rmdir system call.
*/
-rmdir()
+ufs_rmdir(ndp)
+ register struct nameidata *ndp;
{
- struct a {
- char *name;
- };
register struct inode *ip, *dp;
+ int error = 0;
- ip = namei(uchar, DELETE | LOCKPARENT, 0);
- if (ip == NULL)
- return;
- dp = u.u_pdir;
+ ip = VTOI(ndp->ni_vp);
+ dp = VTOI(ndp->ni_dvp);
/*
* No rmdir "." please.
*/
if (dp == ip) {
- irele(dp);
+ vrele(ITOV(dp));
iput(ip);
- u.u_error = EINVAL;
- return;
- }
- if ((ip->i_mode&IFMT) != IFDIR) {
- u.u_error = ENOTDIR;
- goto out;
- }
- /*
- * Don't remove a mounted on directory.
- */
- if (ip->i_dev != dp->i_dev) {
- u.u_error = EBUSY;
- goto out;
+ return (EINVAL);
}
/*
* Verify the directory is empty (and valid).
* the current directory and thus be
* non-empty.)
*/
- if (ip->i_nlink != 2 || !dirempty(ip)) {
- u.u_error = ENOTEMPTY;
+ if (ip->i_nlink != 2 || !dirempty(ip, dp->i_number, ndp->ni_cred)) {
+ error = ENOTEMPTY;
goto out;
}
/*
* inode. If we crash in between, the directory
* will be reattached to lost+found,
*/
- if (dirremove() == 0)
+ if (error = dirremove(ndp))
goto out;
dp->i_nlink--;
dp->i_flag |= ICHG;
+ cache_purge(ITOV(dp));
iput(dp);
- dp = NULL;
+ ndp->ni_dvp = NULL;
/*
* Truncate inode. The only stuff left
* in the directory is "." and "..". The
* worry about them later.
*/
ip->i_nlink -= 2;
- itrunc(ip, (u_long)0);
+ error = itrunc(ip, (u_long)0, IO_SYNC);
+ cache_purge(ITOV(ip));
out:
- if (dp)
+ if (ndp->ni_dvp)
iput(dp);
iput(ip);
+ return (error);
+}
+
+/*
+ * Create a symbolic link.
+ *
+ * A new IFLNK inode is made through maknode() and the text of `target'
+ * is then written into it with vn_rdwr().  The inode is released with
+ * iput() once the write has been attempted; the status of that write
+ * (or of maknode(), if it failed) is what gets returned.
+ */
+ufs_symlink(ndp, vap, target)
+	struct nameidata *ndp;
+	struct vattr *vap;
+	char *target;
+{
+	struct inode *lip;
+	int rv;
+
+	if (rv = maknode(IFLNK | vap->va_mode, ndp, &lip))
+		return (rv);
+	rv = vn_rdwr(UIO_WRITE, ITOV(lip), target, strlen(target),
+	    (off_t)0, UIO_SYSSPACE, IO_NODELOCKED, ndp->ni_cred,
+	    (int *)0);
+	iput(lip);
+	return (rv);
+}
+
+/*
+ * Vnode op for reading directories.
+ *
+ * The request is trimmed down to a whole number of DIRBLKSIZ blocks
+ * and must begin on a DIRBLKSIZ boundary; otherwise EINVAL is returned.
+ * The transfer itself is handed to ufs_read().  The bytes trimmed from
+ * the request are put back into uio_resid afterwards, and *eofflagp is
+ * set to 1 when the resulting offset is at or beyond the inode size,
+ * 0 otherwise.
+ */
+ufs_readdir(vp, uio, cred, eofflagp)
+	struct vnode *vp;
+	register struct uio *uio;
+	struct ucred *cred;
+	int *eofflagp;
+{
+	int want, trimmed, rv;
+
+	want = uio->uio_resid;
+	want &= ~(DIRBLKSIZ - 1);
+	trimmed = uio->uio_resid - want;
+	if ((uio->uio_offset & (DIRBLKSIZ - 1)) || want < DIRBLKSIZ)
+		return (EINVAL);
+	/* Only the first iovec is adjusted to the trimmed length. */
+	uio->uio_resid = want;
+	uio->uio_iov->iov_len = want;
+	rv = ufs_read(vp, uio, 0, cred);
+	uio->uio_resid += trimmed;
+	*eofflagp = ((VTOI(vp)->i_size - uio->uio_offset) <= 0) ? 1 : 0;
+	return (rv);
+}
+
+/*
+ * Return the target name of a symbolic link.
+ * This is a plain read of the link through ufs_read() with no
+ * I/O flags set.
+ */
+ufs_readlink(vp, uiop, cred)
+	struct vnode *vp;
+	struct uio *uiop;
+	struct ucred *cred;
+{
+	int rv;
+
+	rv = ufs_read(vp, uiop, 0, cred);
+	return (rv);
+}
+
+/*
+ * Abort a pending operation.  Called after namei() when the
+ * CREATE/DELETE it prepared is not actually carried out.  There is
+ * nothing for ufs to undo at the moment, so this always returns 0.
+ */
+/* ARGSUSED */
+ufs_abortop(ndp)
+	struct nameidata *ndp;
+{
+	int rv = 0;
+
+	return (rv);
+}
+
+/*
+ * Lock the inode that sits behind a vnode.  Always returns 0.
+ */
+ufs_lock(vp)
+	struct vnode *vp;
+{
+	register struct inode *node;
+
+	node = VTOI(vp);
+	ILOCK(node);
+	return (0);
+}
+
+/*
+ * Unlock the inode that sits behind a vnode.
+ * Panics if the inode is not marked ILOCKED; otherwise returns 0.
+ */
+ufs_unlock(vp)
+	struct vnode *vp;
+{
+	register struct inode *node;
+
+	node = VTOI(vp);
+	if ((node->i_flag & ILOCKED) == 0)
+		panic("ufs_unlock NOT LOCKED");
+	IUNLOCK(node);
+	return (0);
+}
+
+/*
+ * Report whether the inode behind a vnode is locked:
+ * 1 if ILOCKED is set in its flags, 0 if not.
+ */
+ufs_islocked(vp)
+	struct vnode *vp;
+{
+
+	return ((VTOI(vp)->i_flag & ILOCKED) ? 1 : 0);
}
-struct file *
-getinode(fdes)
- int fdes;
+/*
+ * Vnode interface to bmap().
+ *
+ * If vpp is given it receives the device vnode of the inode (i_devvp).
+ * If bnp is given the logical block bn is translated with bmap() and
+ * its status returned; with no bnp there is nothing to translate and
+ * 0 is returned.
+ */
+ufs_bmap(vp, bn, vpp, bnp)
+	struct vnode *vp;
+	daddr_t bn;
+	struct vnode **vpp;
+	daddr_t *bnp;
{
- register struct file *fp;
+	struct inode *node = VTOI(vp);
- fp = getf(fdes);
- if (fp == 0)
+	if (vpp)
+		*vpp = node->i_devvp;
+	if (!bnp)
return (0);
- if (fp->f_type != DTYPE_INODE) {
- u.u_error = EINVAL;
+	return (bmap(node, bn, bnp));
+}
+
+/*
+ * Calculate the logical to physical mapping if not done already,
+ * then call the device strategy routine.
+ *
+ * A buffer whose b_blkno still equals b_lblkno is translated with
+ * bmap().  If the translation fails, the error is recorded in the
+ * buffer and the buffer is completed with biodone() before the error
+ * is returned, so that a waiter on the buffer is not left hanging.
+ * A buffer whose block number is -1 is completed without any device
+ * I/O (it is cleared first if it was mapped just now).  Otherwise the
+ * buffer is passed to the strategy routine of the inode's device
+ * vnode and 0 is returned.
+ *
+ * In a DIAGNOSTIC kernel, setting checkoverlap non-zero makes every
+ * request scan the buffer pool for another valid buffer on the same
+ * device vnode whose block range overlaps this one; finding one is
+ * a panic.
+ */
+int checkoverlap = 0;
+
+ufs_strategy(bp)
+	register struct buf *bp;
+{
+	register struct inode *ip = VTOI(bp->b_vp);
+	struct vnode *vp;
+	int error;
+
+	if (bp->b_vp->v_type == VBLK || bp->b_vp->v_type == VCHR)
+		panic("ufs_strategy: spec");
+	if (bp->b_blkno == bp->b_lblkno) {
+		if (error = bmap(ip, bp->b_lblkno, &bp->b_blkno)) {
+			/*
+			 * Finish the buffer with the error recorded;
+			 * returning without biodone() would leave it
+			 * incomplete for whoever is waiting on it.
+			 */
+			bp->b_error = error;
+			bp->b_flags |= B_ERROR;
+			biodone(bp);
+			return (error);
+		}
+		if ((long)bp->b_blkno == -1)
+			clrbuf(bp);
+	}
+	if ((long)bp->b_blkno == -1) {
+		biodone(bp);
return (0);
}
- return (fp);
+#ifdef DIAGNOSTIC
+	if (checkoverlap) {
+		register struct buf *ep;
+		struct buf *ebp;
+		daddr_t start, last;
+
+		ebp = &buf[nbuf];
+		start = bp->b_blkno;
+		last = start + btodb(bp->b_bcount) - 1;
+		for (ep = buf; ep < ebp; ep++) {
+			if (ep == bp || (ep->b_flags & B_INVAL) ||
+			    ep->b_vp == NULLVP)
+				continue;
+			/* only the device vnode is wanted, so no bnp */
+			if (VOP_BMAP(ep->b_vp, (daddr_t)0, &vp, (daddr_t *)0))
+				continue;
+			if (vp != ip->i_devvp)
+				continue;
+			/* look for overlap */
+			if (ep->b_bcount == 0 || ep->b_blkno > last ||
+			    ep->b_blkno + btodb(ep->b_bcount) <= start)
+				continue;
+			vprint("Disk overlap", vp);
+			printf("\tstart %d, end %d overlap start %d, end %d\n",
+				start, last, ep->b_blkno,
+				ep->b_blkno + btodb(ep->b_bcount) - 1);
+			panic("Disk buffer overlap");
+		}
+	}
+#endif /* DIAGNOSTIC */
+	vp = ip->i_devvp;
+	bp->b_dev = vp->v_rdev;
+	(*(vp->v_op->vn_strategy))(bp);
+	return (0);
+}
+
+/*
+ * Print out the contents of an inode.
+ *
+ * Prints the inode number and the major/minor numbers of its device,
+ * any fifo information when the vnode is a VFIFO (FIFO kernels only),
+ * and whether the inode is locked.  If i_spare0 is non-zero it is
+ * printed as the owner pid, followed by i_spare1 as the waiting pid
+ * when that is non-zero too.
+ *
+ * Always returns 0.  The routine is declared and installed as an
+ * int-valued vnode operation, so it must not return without a value.
+ */
+ufs_print(vp)
+	struct vnode *vp;
+{
+	register struct inode *ip = VTOI(vp);
+
+	printf("tag VT_UFS, ino %d, on dev %d, %d", ip->i_number,
+		major(ip->i_dev), minor(ip->i_dev));
+#ifdef FIFO
+	if (vp->v_type == VFIFO)
+		fifo_printinfo(vp);
+#endif /* FIFO */
+	printf("%s\n", (ip->i_flag & ILOCKED) ? " (LOCKED)" : "");
+	if (ip->i_spare0 == 0)
+		return (0);
+	printf("\towner pid %d", ip->i_spare0);
+	if (ip->i_spare1)
+		printf(" waiting pid %d", ip->i_spare1);
+	printf("\n");
+	return (0);
+}
+
+/*
+ * Read wrapper for special devices: flag the inode as accessed,
+ * then let spec_read() do the transfer and return its status.
+ */
+ufsspec_read(vp, uio, ioflag, cred)
+	struct vnode *vp;
+	struct uio *uio;
+	int ioflag;
+	struct ucred *cred;
+{
+	register struct inode *node = VTOI(vp);
+
+	/* Note the access on the inode. */
+	node->i_flag |= IACC;
+	return (spec_read(vp, uio, ioflag, cred));
+}
+
+/*
+ * Write wrapper for special devices: flag the inode as updated and
+ * changed, then let spec_write() do the transfer and return its status.
+ */
+ufsspec_write(vp, uio, ioflag, cred)
+	struct vnode *vp;
+	struct uio *uio;
+	int ioflag;
+	struct ucred *cred;
+{
+	register struct inode *node = VTOI(vp);
+
+	/* Note the update and the change on the inode. */
+	node->i_flag |= IUPD|ICHG;
+	return (spec_write(vp, uio, ioflag, cred));
+}
+
+/*
+ * Close wrapper for special devices.
+ *
+ * When the vnode has more than one user and its inode is not locked,
+ * the inode times are brought up to date with ITIMES(); the device
+ * close is then done by spec_close() in every case.
+ */
+ufsspec_close(vp, fflag, cred)
+	struct vnode *vp;
+	int fflag;
+	struct ucred *cred;
+{
+	register struct inode *node = VTOI(vp);
+
+	if (vp->v_usecount > 1 && (node->i_flag & ILOCKED) == 0) {
+		ITIMES(node, &time, &time);
+	}
+	return (spec_close(vp, fflag, cred));
+}
+
+#ifdef FIFO
+/*
+ * Read wrapper for fifo's: flag the inode as accessed, then let
+ * fifo_read() do the transfer and return its status.
+ */
+ufsfifo_read(vp, uio, ioflag, cred)
+	struct vnode *vp;
+	struct uio *uio;
+	int ioflag;
+	struct ucred *cred;
+{
+	register struct inode *node = VTOI(vp);
+
+	/* Note the access on the inode. */
+	node->i_flag |= IACC;
+	return (fifo_read(vp, uio, ioflag, cred));
+}
+
+/*
+ * Write wrapper for fifo's: flag the inode as updated and changed,
+ * then let fifo_write() do the transfer and return its status.
+ */
+ufsfifo_write(vp, uio, ioflag, cred)
+	struct vnode *vp;
+	struct uio *uio;
+	int ioflag;
+	struct ucred *cred;
+{
+	register struct inode *node = VTOI(vp);
+
+	/* Note the update and the change on the inode. */
+	node->i_flag |= IUPD|ICHG;
+	return (fifo_write(vp, uio, ioflag, cred));
+}
+
+/*
+ * Close wrapper for fifo's.
+ *
+ * When the vnode has more than one user and its inode is not locked,
+ * the inode times are brought up to date with ITIMES(); the close
+ * itself is then done by fifo_close() in every case.
+ */
+ufsfifo_close(vp, fflag, cred)
+	struct vnode *vp;
+	int fflag;
+	struct ucred *cred;
+{
+	register struct inode *node = VTOI(vp);
+
+	if (vp->v_usecount > 1 && (node->i_flag & ILOCKED) == 0) {
+		ITIMES(node, &time, &time);
+	}
+	return (fifo_close(vp, fflag, cred));
+}
+#endif /* FIFO */
+
+/*
+ * Make a new file.
+ *
+ * An inode of type `mode' (IFREG when no type bits are given) is
+ * allocated relative to the directory ndp->ni_dvp, given the caller's
+ * uid and the directory's gid, written to disk and then entered in
+ * the directory.  On success the new inode is handed back through
+ * *ipp and 0 is returned.  On failure *ipp is left zero, the inode
+ * (if one was obtained) is given up, and the error is returned.
+ */
+maknode(mode, ndp, ipp)
+	int mode;
+	register struct nameidata *ndp;
+	struct inode **ipp;
+{
+	register struct inode *nip;
+	register struct inode *parent = VTOI(ndp->ni_dvp);
+	struct inode *alloced;
+	ino_t hint;
+	int rv;
+
+	*ipp = 0;
+	if ((mode & IFMT) == 0)
+		mode |= IFREG;
+	/*
+	 * dirpref() chooses the allocation hint for a directory;
+	 * anything else uses the parent's inode number.
+	 */
+	if ((mode & IFMT) != IFDIR)
+		hint = parent->i_number;
+	else
+		hint = dirpref(parent->i_fs);
+	rv = ialloc(parent, hint, mode, ndp->ni_cred, &alloced);
+	if (rv) {
+		iput(parent);
+		return (rv);
+	}
+	nip = alloced;
+	nip->i_uid = ndp->ni_cred->cr_uid;
+	nip->i_gid = parent->i_gid;
+#ifdef QUOTA
+	rv = getinoquota(nip);
+	if (rv == 0)
+		rv = chkiq(nip, 1, ndp->ni_cred, 0);
+	if (rv) {
+		ifree(nip, nip->i_number, mode);
+		iput(nip);
+		iput(parent);
+		return (rv);
+	}
+#endif
+	nip->i_flag |= IACC|IUPD|ICHG;
+	nip->i_mode = mode;
+	ITOV(nip)->v_type = IFTOVT(mode);	/* Rest init'd in iget() */
+	nip->i_nlink = 1;
+	/*
+	 * Drop the set-gid bit when the caller is neither a member of
+	 * the file's group nor passes the suser() check.
+	 */
+	if ((nip->i_mode & ISGID) && !groupmember(nip->i_gid, ndp->ni_cred) &&
+	    suser(ndp->ni_cred, NULL))
+		nip->i_mode &= ~ISGID;
+
+	/*
+	 * The inode has to reach the disk before the directory entry.
+	 */
+	rv = iupdat(nip, &time, &time, 1);
+	if (rv == 0) {
+		rv = direnter(nip, ndp);
+		if (rv == 0) {
+			*ipp = nip;
+			return (0);
+		}
+		/*
+		 * Skip the iput() of the parent below; presumably
+		 * direnter() has already released the directory.
+		 */
+		parent = NULL;
+	}
+
+	/*
+	 * A write error occurred while updating the inode or the
+	 * directory, so the inode has to be deallocated again.
+	 */
+	if (parent)
+		iput(parent);
+	nip->i_nlink = 0;
+	nip->i_flag |= ICHG;
+	iput(nip);
+	return (rv);
+}
+
+/*
+ * Advisory record locking support.
+ *
+ * The flock description in `fl' is converted into a start/end pair,
+ * a struct lockf is built from it, and the request is passed on to
+ * ufs_setlock(), ufs_advunlock() or ufs_advgetlock() according to `op'.
+ * The routine called takes over the lockf structure.
+ *
+ * Returns 0 or an error number; EINVAL is given for an unknown
+ * l_whence, a negative start, or an unknown op.
+ */
+ufs_advlock(vp, id, op, fl, flags)
+	struct vnode *vp;
+	caddr_t id;
+	int op;
+	register struct flock *fl;
+	int flags;
+{
+	register struct inode *ip = VTOI(vp);
+	register struct lockf *req;
+	off_t first, last;
+
+	/*
+	 * With no locks on the inode at all, anything other than a
+	 * set request can be answered at once as "unlocked".
+	 */
+	if (ip->i_lockf == (struct lockf *)0 && op != F_SETLK) {
+		fl->l_type = F_UNLCK;
+		return (0);
+	}
+	/*
+	 * Work out where the range starts.  For SEEK_CUR the caller
+	 * is responsible for having added any necessary offset.
+	 */
+	if (fl->l_whence == SEEK_SET || fl->l_whence == SEEK_CUR)
+		first = fl->l_start;
+	else if (fl->l_whence == SEEK_END)
+		first = ip->i_size + fl->l_start;
+	else
+		return (EINVAL);
+	if (first < 0)
+		return (EINVAL);
+	/* A zero length is recorded as an end of -1. */
+	if (fl->l_len != 0)
+		last = first + fl->l_len;
+	else
+		last = -1;
+	/*
+	 * Build the lockf structure describing the request.
+	 */
+	MALLOC(req, struct lockf *, sizeof *req, M_LOCKF, M_WAITOK);
+	req->lf_id = id;
+	req->lf_inode = ip;
+	req->lf_type = fl->l_type;
+	req->lf_flags = flags;
+	req->lf_start = first;
+	req->lf_end = last;
+	req->lf_next = (struct lockf *)0;
+	req->lf_block = (struct lockf *)0;
+	/*
+	 * Hand it to the routine for the requested operation.
+	 */
+	if (op == F_SETLK)
+		return (ufs_setlock(req));
+	if (op == F_UNLCK)
+		return (ufs_advunlock(req));
+	if (op == F_GETLK)
+		return (ufs_advgetlock(req, fl));
+	free(req, M_LOCKF);
+	return (EINVAL);
+}
+
+/*
+ * This variable controls the maximum number of processes that will
+ * be checked in doing deadlock detection.
+ */
+int maxlockdepth = MAXDEPTH;
+
+/*
+ * Set a byte-range lock.
+ *
+ * `lock' is the request built by ufs_advlock(); this routine owns it.
+ * While lf_getblock() reports a conflicting lock the caller either
+ * fails with EAGAIN (F_WAIT not set) or is queued behind the blocker
+ * and put to sleep.  When nothing blocks any more the lock is added
+ * with lf_addlock() and 0 is returned.
+ *
+ * Errors: EAGAIN as above, EDEADLK when the deadlock check finds that
+ * waiting would close a cycle back to the requester, or whatever
+ * tsleep() returns when the sleep is broken off.  The request
+ * structure is freed on every error return.
+ */
+ufs_setlock(lock)
+	register struct lockf *lock;
+{
+	register struct lockf *block;
+	static char lockstr[] = "lockf";
+	int priority, error;
+
+#ifdef LOCKF_DEBUG
+	if (lockf_debug & 4)
+		lf_print("ufs_setlock", lock);
+#endif /* LOCKF_DEBUG */
+
+	/*
+	 * Set the priority
+	 */
+	priority = PLOCK;
+	if ((lock->lf_type & F_WRLCK) == 0)
+		priority += 4;
+	priority |= PCATCH;
+	/*
+	 * Scan lock list for this file looking for locks that would block us.
+	 */
+	while (block = lf_getblock(lock)) {
+		/*
+		 * Free the structure and return if nonblocking.
+		 */
+		if ((lock->lf_flags & F_WAIT) == 0) {
+			free(lock, M_LOCKF);
+			return (EAGAIN);
+		}
+		/*
+		 * We are blocked. Since flock style locks cover
+		 * the whole file, there is no chance for deadlock.
+		 * For byte-range locks we must check for deadlock.
+		 *
+		 * Deadlock detection is done by looking through the
+		 * wait channels to see if there are any cycles that
+		 * involve us. MAXDEPTH is set just to make sure we
+		 * do not go off into neverland.
+		 */
+		if ((lock->lf_flags & F_POSIX) &&
+		    (block->lf_flags & F_POSIX)) {
+			register struct proc *wproc;
+			register struct lockf *waitblock;
+			int i = 0;
+
+			/* The block is waiting on something */
+			wproc = (struct proc *)block->lf_id;
+			while (wproc->p_wchan &&
+			       (wproc->p_wmesg == lockstr) &&
+			       (i++ < maxlockdepth)) {
+				waitblock = (struct lockf *)wproc->p_wchan;
+				/* Get the owner of the blocking lock */
+				waitblock = waitblock->lf_next;
+				if ((waitblock->lf_flags & F_POSIX) == 0)
+					break;
+				wproc = (struct proc *)waitblock->lf_id;
+				if (wproc == (struct proc *)lock->lf_id) {
+					free(lock, M_LOCKF);
+					return (EDEADLK);
+				}
+			}
+		}
+		/*
+		 * Add our lock to the blocked
+		 * list and sleep until we're free.
+		 */
+#ifdef LOCKF_DEBUG
+		if (lockf_debug & 4)
+			lf_print("ufs_advlock: blocking on", block);
+#endif /* LOCKF_DEBUG */
+		/*
+		 * Remember who blocked us (for deadlock detection)
+		 */
+		lock->lf_next = block;
+		lf_addblock(block, lock);
+		if (error = tsleep((caddr_t)lock, priority, lockstr, 0)) {
+			/*
+			 * The sleep was broken off.  If we are still
+			 * queued behind the blocker, take ourselves off
+			 * its list of waiters before the structure is
+			 * freed, so that the list is not left pointing
+			 * at freed memory.
+			 * NOTE(review): this assumes lf_addblock()
+			 * chains waiters from the blocker through
+			 * lf_block and that a regular wakeup clears
+			 * lf_next -- confirm against the lockf code.
+			 */
+			for (block = lock->lf_next;
+			    block != (struct lockf *)0;
+			    block = block->lf_block) {
+				if (block->lf_block != lock)
+					continue;
+				block->lf_block = lock->lf_block;
+				break;
+			}
+			free(lock, M_LOCKF);
+			return (error);
+		}
+	}
+	/*
+	 * No blocks!!  Add the lock.  Note that addlock will
+	 * downgrade or upgrade any overlapping locks this
+	 * process already owns.
+	 */
+#ifdef LOCKF_DEBUG
+	if (lockf_debug & 4)
+		lf_print("ufs_advlock: got the lock", lock);
+#endif /* LOCKF_DEBUG */
+	lf_addlock(lock);
+	return (0);
}
/*
- * mode mask for creation of files
+ * Remove a byte-range lock on an inode.
+ *
+ * `lock' is the request built by ufs_advlock() describing the range
+ * to release; this routine owns it and frees it on every path,
+ * including the early return taken when the inode carries no locks.
+ * Always returns 0.
*/
-umask()
+ufs_advunlock(lock)
+	struct lockf *lock;
{
- register struct a {
- int mask;
- } *uap;
+	struct lockf *blocklist;
+
+	if (lock->lf_inode->i_lockf == (struct lockf *)0) {
+		/* Nothing to remove, but the request is still ours. */
+		FREE(lock, M_LOCKF);
+		return (0);
+	}
+#ifdef LOCKF_DEBUG
+	if (lockf_debug & 4)
+		lf_print("ufs_advunlock", lock);
+#endif /* LOCKF_DEBUG */
+	/*
+	 * Generally, find the lock (or an overlap to that lock)
+	 * and remove it (or shrink it), then wakeup anyone we can.
+	 */
+	blocklist = lf_remove(lock);
+	FREE(lock, M_LOCKF);
+	lf_wakelock(blocklist);
+	return (0);
+}
- uap = (struct a *)u.u_ap;
- u.u_r.r_val1 = u.u_cmask;
- u.u_cmask = uap->mask & 07777;
+/*
+ * Return the blocking pid
+ *
+ * `lock' is the request built by ufs_advlock(); it is only used for
+ * the lookup and is freed before returning.  If lf_getblock() finds
+ * a lock that would block the request, `fl' is filled in with that
+ * lock's type, its range (relative to SEEK_SET, with a length of 0
+ * for an end of -1) and the pid of its owner, or -1 when the blocker
+ * is not an F_POSIX lock.  If nothing would block, l_type is set to
+ * F_UNLCK, the same answer ufs_advlock() gives when the inode has no
+ * locks at all.  Always returns 0.
+ */
+ufs_advgetlock(lock, fl)
+	register struct lockf *lock;
+	register struct flock *fl;
+{
+	register struct lockf *block;
+
+#ifdef LOCKF_DEBUG
+	if (lockf_debug & 4)
+		lf_print("ufs_advgetlock", lock);
+#endif /* LOCKF_DEBUG */
+
+	if (block = lf_getblock(lock)) {
+		fl->l_type = block->lf_type;
+		fl->l_whence = SEEK_SET;
+		fl->l_start = block->lf_start;
+		if (block->lf_end == -1)
+			fl->l_len = 0;
+		else
+			fl->l_len = block->lf_end - block->lf_start;
+		if (block->lf_flags & F_POSIX)
+			fl->l_pid = ((struct proc *)(block->lf_id))->p_pid;
+		else
+			fl->l_pid = -1;
+	} else {
+		/* Nothing in the way: report the range as unlocked. */
+		fl->l_type = F_UNLCK;
+	}
+	FREE(lock, M_LOCKF);
+	return (0);
}