have to zero mount structures when they are allocated
[unix-history] / usr / src / sys / ufs / ffs / ffs_vfsops.c
/*
* Copyright (c) 1989, 1991 The Regents of the University of California.
* All rights reserved.
*
* %sccs.include.redist.c%
*
* @(#)ffs_vfsops.c 7.63 (Berkeley) %G%
*/
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/namei.h>
#include <sys/proc.h>
#include <sys/kernel.h>
#include <sys/vnode.h>
#include <sys/specdev.h>
#include <sys/mount.h>
#include <sys/buf.h>
#include <sys/file.h>
#include <sys/disklabel.h>
#include <sys/ioctl.h>
#include <sys/errno.h>
#include <sys/malloc.h>
#include "ioctl.h"
#include "disklabel.h"
#include "stat.h"
#include <ufs/ufs/quota.h>
#include <ufs/ufs/ufsmount.h>
#include <ufs/ufs/inode.h>
#include <ufs/ufs/ufs_extern.h>
#include <ufs/ffs/fs.h>
#include <ufs/ffs/ffs_extern.h>
/* Forward declaration; ffs_sbupdate() is defined later in this file. */
int ffs_sbupdate __P((struct ufsmount *, int));
/*
 * Filesystem operations vector.  The initializer is positional, so the
 * entries must stay in the order in which struct vfsops declares its
 * members (the structure is declared outside this file -- presumably in
 * <sys/mount.h>; confirm before reordering).
 */
struct vfsops ufs_vfsops = {
ffs_mount,	/* mount system call */
ufs_start,
ffs_unmount,	/* unmount system call */
ffs_root,
ufs_quotactl,
ffs_statfs,	/* get file system statistics */
ffs_sync,	/* write back modified inodes and superblock */
ffs_fhtovp,	/* file handle to vnode */
ffs_vptofh,	/* vnode pointer to file handle */
ffs_init,
};
/*
* Called by vfs_mountroot when ufs is going to be mounted as root.
*
* Name is updated by mount(8) after booting.
*/
#define ROOTNAME "root_device"
ffs_mountroot()
{
extern struct vnode *rootvp;
register struct fs *fs;
register struct mount *mp;
struct proc *p = curproc; /* XXX */
struct ufsmount *ump;
u_int size;
int error;
mp = malloc((u_long)sizeof(struct mount),
M_MOUNT, M_WAITOK);
mp->mnt_op = &ufs_vfsops;
mp->mnt_flag = MNT_RDONLY;
mp->mnt_mounth = NULLVP;
if (error = ffs_mountfs(rootvp, mp, p)) {
free(mp, M_MOUNT);
return (error);
}
if (error = vfs_lock(mp)) {
(void)ffs_unmount(mp, 0, p);
free(mp, M_MOUNT);
return (error);
}
rootfs = mp;
mp->mnt_next = mp;
mp->mnt_prev = mp;
mp->mnt_vnodecovered = NULLVP;
ump = VFSTOUFS(mp);
fs = ump->um_fs;
bzero(fs->fs_fsmnt, sizeof(fs->fs_fsmnt));
fs->fs_fsmnt[0] = '/';
bcopy((caddr_t)fs->fs_fsmnt, (caddr_t)mp->mnt_stat.f_mntonname,
MNAMELEN);
(void) copystr(ROOTNAME, mp->mnt_stat.f_mntfromname, MNAMELEN - 1,
&size);
bzero(mp->mnt_stat.f_mntfromname + size, MNAMELEN - size);
(void)ffs_statfs(mp, &mp->mnt_stat, p);
vfs_unlock(mp);
inittodr(fs->fs_time);
return (0);
}
/*
* VFS Operations.
*
* mount system call
*/
int
ffs_mount(mp, path, data, ndp, p)
register struct mount *mp;
char *path;
caddr_t data;
struct nameidata *ndp;
struct proc *p;
{
struct vnode *devvp;
struct ufs_args args;
struct ufsmount *ump;
register struct fs *fs;
u_int size;
int error;
if (error = copyin(data, (caddr_t)&args, sizeof (struct ufs_args)))
return (error);
/*
* If updating, check whether changing from read-only to
* read/write; if there is no device name, that's all we do.
*/
if (mp->mnt_flag & MNT_UPDATE) {
ump = VFSTOUFS(mp);
fs = ump->um_fs;
if (fs->fs_ronly && (mp->mnt_flag & MNT_RDONLY) == 0)
fs->fs_ronly = 0;
if (args.fspec == 0) {
/*
* Process export requests.
*/
if (args.exflags & MNT_EXPORTED) {
if (error = hang_addrlist(mp, &args))
return (error);
mp->mnt_flag |= MNT_EXPORTED;
}
if (args.exflags & MNT_DELEXPORT) {
free_addrlist(ump);
mp->mnt_flag &=
~(MNT_EXPORTED | MNT_DEFEXPORTED);
}
return (0);
}
}
/*
* Not an update, or updating the name: look up the name
* and verify that it refers to a sensible block device.
*/
NDINIT(ndp, LOOKUP, FOLLOW, UIO_USERSPACE, args.fspec, p);
if (error = namei(ndp))
return (error);
devvp = ndp->ni_vp;
if (devvp->v_type != VBLK) {
vrele(devvp);
return (ENOTBLK);
}
if (major(devvp->v_rdev) >= nblkdev) {
vrele(devvp);
return (ENXIO);
}
if ((mp->mnt_flag & MNT_UPDATE) == 0)
error = ffs_mountfs(devvp, mp, p);
else {
if (devvp != ump->um_devvp)
error = EINVAL; /* needs translation */
else
vrele(devvp);
}
if (error) {
vrele(devvp);
return (error);
}
ump = VFSTOUFS(mp);
fs = ump->um_fs;
(void) copyinstr(path, fs->fs_fsmnt, sizeof(fs->fs_fsmnt) - 1, &size);
bzero(fs->fs_fsmnt + size, sizeof(fs->fs_fsmnt) - size);
bcopy((caddr_t)fs->fs_fsmnt, (caddr_t)mp->mnt_stat.f_mntonname,
MNAMELEN);
(void) copyinstr(args.fspec, mp->mnt_stat.f_mntfromname, MNAMELEN - 1,
&size);
bzero(mp->mnt_stat.f_mntfromname + size, MNAMELEN - size);
(void)ffs_statfs(mp, &mp->mnt_stat, p);
return (0);
}
/*
* Common code for mount and mountroot
*/
int
ffs_mountfs(devvp, mp, p)
register struct vnode *devvp;
struct mount *mp;
struct proc *p;
{
register struct ufsmount *ump = (struct ufsmount *)0;
struct buf *bp = NULL;
register struct fs *fs;
dev_t dev = devvp->v_rdev;
struct partinfo dpart;
int havepart = 0, blks;
caddr_t base, space;
int havepart = 0, blks;
int error, i, size;
int needclose = 0;
int ronly = (mp->mnt_flag & MNT_RDONLY) != 0;
extern struct vnode *rootvp;
if (error = VOP_OPEN(devvp, ronly ? FREAD : FREAD|FWRITE, NOCRED, p))
return (error);
needclose = 1;
if (VOP_IOCTL(devvp, DIOCGPART, (caddr_t)&dpart, FREAD, NOCRED, p) != 0)
size = DEV_BSIZE;
else {
havepart = 1;
size = dpart.disklab->d_secsize;
}
if (error = bread(devvp, SBLOCK, SBSIZE, NOCRED, &bp))
goto out;
fs = bp->b_un.b_fs;
error = EINVAL; /* XXX needs translation */
goto out;
}
ump = malloc(sizeof *ump, M_UFSMNT, M_WAITOK);
bzero((caddr_t)ump, sizeof *ump);
ump->um_fs = malloc((u_long)fs->fs_sbsize, M_UFSMNT,
M_WAITOK);
bcopy((caddr_t)bp->b_un.b_addr, (caddr_t)ump->um_fs,
(u_int)fs->fs_sbsize);
if (fs->fs_sbsize < SBSIZE)
bp->b_flags |= B_INVAL;
brelse(bp);
bp = NULL;
fs = ump->um_fs;
fs->fs_ronly = ronly;
if (ronly == 0)
fs->fs_fmod = 1;
if (havepart) {
dpart.part->p_fstype = FS_BSDFFS;
dpart.part->p_fsize = fs->fs_fsize;
dpart.part->p_frag = fs->fs_frag;
dpart.part->p_cpg = fs->fs_cpg;
}
#ifdef SECSIZE
/*
* If we have a disk label, force per-partition
* filesystem information to be correct
* and set correct current fsbtodb shift.
*/
#endif SECSIZE
if (havepart) {
dpart.part->p_fstype = FS_BSDFFS;
dpart.part->p_fsize = fs->fs_fsize;
dpart.part->p_frag = fs->fs_frag;
#ifdef SECSIZE
#ifdef tahoe
/*
* Save the original fsbtodb shift to restore on updates.
* (Console doesn't understand fsbtodb changes.)
*/
fs->fs_sparecon[0] = fs->fs_fsbtodb;
#endif
i = fs->fs_fsize / size;
for (fs->fs_fsbtodb = 0; i > 1; i >>= 1)
fs->fs_fsbtodb++;
#endif SECSIZE
fs->fs_dbsize = size;
}
blks = howmany(fs->fs_cssize, fs->fs_fsize);
base = space = malloc((u_long)fs->fs_cssize, M_UFSMNT,
M_WAITOK);
for (i = 0; i < blks; i += fs->fs_frag) {
size = fs->fs_bsize;
if (i + fs->fs_frag > blks)
size = (blks - i) * fs->fs_fsize;
#ifdef SECSIZE
tp = bread(dev, fsbtodb(fs, fs->fs_csaddr + i), size,
fs->fs_dbsize);
#else SECSIZE
error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size,
NOCRED, &bp);
if (error) {
free(base, M_UFSMNT);
goto out;
}
bcopy((caddr_t)bp->b_un.b_addr, space, (u_int)size);
fs->fs_csp[fragstoblks(fs, i)] = (struct csum *)space;
space += size;
brelse(bp);
bp = NULL;
}
mp->mnt_data = (qaddr_t)ump;
mp->mnt_stat.f_fsid.val[0] = (long)dev;
mp->mnt_stat.f_fsid.val[1] = MOUNT_UFS;
mp->mnt_flag |= MNT_LOCAL;
ump->um_mountp = mp;
ump->um_dev = dev;
ump->um_devvp = devvp;
for (i = 0; i < MAXQUOTAS; i++)
ump->um_quotas[i] = NULLVP;
devvp->v_specflags |= SI_MOUNTEDON;
/* Sanity checks for old file systems. XXX */
fs->fs_npsect = MAX(fs->fs_npsect, fs->fs_nsect); /* XXX */
fs->fs_interleave = MAX(fs->fs_interleave, 1); /* XXX */
if (fs->fs_postblformat == FS_42POSTBLFMT) /* XXX */
fs->fs_nrpos = 8; /* XXX */
return (0);
out:
if (bp)
brelse(bp);
if (needclose)
(void)VOP_CLOSE(devvp, ronly ? FREAD : FREAD|FWRITE, NOCRED, p);
if (ump) {
free(ump->um_fs, M_UFSMNT);
free(ump, M_UFSMNT);
mp->mnt_data = (qaddr_t)0;
}
return (error);
}
/*
* unmount system call
*/
int
ffs_unmount(mp, mntflags, p)
struct mount *mp;
int mntflags;
struct proc *p;
{
extern int doforce;
register struct ufsmount *ump;
register struct fs *fs;
int i, error, ronly, flags = 0;
if (mntflags & MNT_FORCE) {
if (!doforce || mp == rootfs)
return (EINVAL);
flags |= FORCECLOSE;
}
mntflushbuf(mp, 0);
if (mntinvalbuf(mp))
return (EBUSY);
ump = VFSTOUFS(mp);
return (error);
#ifdef QUOTA
if (mp->mnt_flag & MNT_QUOTA) {
if (error = vflush(mp, NULLVP, SKIPSYSTEM|flags))
return (error);
for (i = 0; i < MAXQUOTAS; i++) {
if (ump->um_quotas[i] == NULLVP)
continue;
quotaoff(p, mp, i);
}
/*
* Here we fall through to vflush again to ensure
* that we have gotten rid of all the system vnodes.
*/
}
#endif
if (error = vflush(mp, NULLVP, flags))
return (error);
fs = ump->um_fs;
ronly = !fs->fs_ronly;
* Get file system statistics.
*/
int
ffs_statfs(mp, sbp, p)
struct mount *mp;
register struct statfs *sbp;
struct proc *p;
{
register struct ufsmount *ump;
register struct fs *fs;
ump = VFSTOUFS(mp);
fs = ump->um_fs;
if (fs->fs_magic != FS_MAGIC)
panic("ffs_statfs");
sbp->f_type = MOUNT_UFS;
sbp->f_bsize = fs->fs_fsize;
sbp->f_iosize = fs->fs_bsize;
sbp->f_blocks = fs->fs_dsize;
sbp->f_bfree = fs->fs_cstotal.cs_nbfree * fs->fs_frag +
fs->fs_cstotal.cs_nffree;
sbp->f_bavail = (fs->fs_dsize * (100 - fs->fs_minfree) / 100) -
(fs->fs_dsize - sbp->f_bfree);
sbp->f_files = fs->fs_ncg * fs->fs_ipg - ROOTINO;
sbp->f_ffree = fs->fs_cstotal.cs_nifree;
if (sbp != &mp->mnt_stat) {
bcopy((caddr_t)mp->mnt_stat.f_mntonname,
(caddr_t)&sbp->f_mntonname[0], MNAMELEN);
bcopy((caddr_t)mp->mnt_stat.f_mntfromname,
(caddr_t)&sbp->f_mntfromname[0], MNAMELEN);
}
return (0);
}
/*
 * Go through the disk queues to initiate sandbagged IO;
 * go through the inodes to write those that have been modified;
 * initiate the writing of the super block if it has been modified.
 *
 * mp is the mount point to sync.  waitfor is handed on to
 * ffs_sbupdate() and, when it equals MNT_WAIT, makes the final flush
 * of the device vnode use B_SYNC.
 *
 * Returns 0, or the most recently recorded error from ffs_sbupdate()
 * or ffs_update(); a later error overwrites an earlier one.
 *
 * Note: we are always called with the filesystem marked `MPBUSY'.
 */
int
ffs_sync(mp, waitfor)
struct mount *mp;
int waitfor;
{
extern int syncprt;
register struct vnode *vp;
register struct inode *ip;
register struct ufsmount *ump = VFSTOUFS(mp);
register struct fs *fs;
int error, allerror = 0;
/* Optional buffer statistics report, controlled by syncprt. */
if (syncprt)
ufs_bufstats();
fs = ump->um_fs;
/*
 * Write back modified superblock.
 * A superblock marked modified on a read-only
 * filesystem is treated as fatal.
 */
if (fs->fs_fmod != 0) {
if (fs->fs_ronly != 0) { /* XXX */
printf("fs = %s\n", fs->fs_fsmnt);
panic("update: rofs mod");
}
/* Clear the modified flag and stamp the time before writing. */
fs->fs_fmod = 0;
fs->fs_time = time.tv_sec;
allerror = ffs_sbupdate(ump, waitfor);
}
/*
 * Write back each (modified) inode.
 */
loop:
for (vp = mp->mnt_mounth; vp; vp = vp->v_mountf) {
/*
 * If the vnode that we are about to sync is no longer
 * associated with this mount point, start over.
 */
if (vp->v_mount != mp)
goto loop;
/* Locked vnodes are skipped rather than waited for. */
if (VOP_ISLOCKED(vp))
continue;
ip = VTOI(vp);
/* Nothing to do: no pending inode flags and no dirty buffers. */
if ((ip->i_flag & (IMOD|IACC|IUPD|ICHG)) == 0 &&
vp->v_dirtyblkhd == NULL)
continue;
/* If the vnode cannot be obtained, rescan the list from its head. */
if (vget(vp))
goto loop;
if (vp->v_dirtyblkhd)
vflushbuf(vp, 0);
/* ffs_update() is called only when an inode flag is pending. */
if ((ip->i_flag & (IMOD|IACC|IUPD|ICHG)) &&
(error = ffs_update(vp, &time, &time, 0)))
allerror = error;
vput(vp);
}
/*
 * Force stale file system control information to be flushed.
 */
vflushbuf(ump->um_devvp, waitfor == MNT_WAIT ? B_SYNC : 0);
#ifdef QUOTA
qsync(mp);
#endif
return (allerror);
}
/*
* File handle to vnode
*
* Have to be really careful about stale file handles:
* - check that the inode number is valid
* - call ffs_vget() to get the locked inode
* - check for an unallocated inode (i_mode == 0)
* - check that the generation number matches unless setgen true
*/
int
ffs_fhtovp(mp, fhp, setgen, vpp)
register struct mount *mp;
struct fid *fhp;
int setgen;
struct vnode **vpp;
{
register struct inode *ip;
register struct ufid *ufhp;
struct fs *fs;
struct vnode *nvp;
int error;
ufhp = (struct ufid *)fhp;
fs = VFSTOUFS(mp)->um_fs;
if (ufhp->ufid_ino < ROOTINO ||
ufhp->ufid_ino >= fs->fs_ncg * fs->fs_ipg)
return (EINVAL);
if (error = ffs_vget(mp, ufhp->ufid_ino, &nvp)) {
*vpp = NULLVP;
return (error);
}
ip = VTOI(nvp);
if (ip->i_mode == 0) {
ufs_iput(ip);
*vpp = NULLVP;
return (EINVAL);
}
if (ip->i_gen != ufhp->ufid_gen) {
if (setgen)
ufhp->ufid_gen = ip->i_gen;
else {
ufs_iput(ip);
*vpp = NULLVP;
return (EINVAL);
}
}
*vpp = nvp;
return (0);
}
/*
 * Vnode pointer to File handle
 *
 * Stores the length of a struct ufid, the inode number and the inode
 * generation number of vp into the handle at fhp.  Always returns 0.
 */
/* ARGSUSED */
ffs_vptofh(vp, fhp)
	struct vnode *vp;
	struct fid *fhp;
{
	register struct inode *ip = VTOI(vp);
	register struct ufid *ufhp = (struct ufid *)fhp;

	ufhp->ufid_gen = ip->i_gen;
	ufhp->ufid_ino = ip->i_number;
	ufhp->ufid_len = sizeof(struct ufid);
	return (0);
}
/*
* Write a superblock and associated information back to disk.
*/
int
ffs_sbupdate(mp, waitfor)
struct ufsmount *mp;
int waitfor;
{
register struct fs *fs = mp->um_fs;
register struct buf *bp;
int blks;
caddr_t space;
int i, size, error = 0;
#ifdef SECSIZE
bp = getblk(mp->m_dev, (daddr_t)fsbtodb(fs, SBOFF / fs->fs_fsize),
(int)fs->fs_sbsize, fs->fs_dbsize);
#else SECSIZE
bp = getblk(mp->um_devvp, SBLOCK, (int)fs->fs_sbsize);
#endif SECSIZE
bcopy((caddr_t)fs, bp->b_un.b_addr, (u_int)fs->fs_sbsize);
/* Restore compatibility to old file systems. XXX */
if (fs->fs_postblformat == FS_42POSTBLFMT) /* XXX */
bp->b_un.b_fs->fs_nrpos = -1; /* XXX */
#ifdef SECSIZE
#ifdef tahoe
/* restore standard fsbtodb shift */
bp->b_un.b_fs->fs_fsbtodb = fs->fs_sparecon[0];
bp->b_un.b_fs->fs_sparecon[0] = 0;
#endif
#endif SECSIZE
if (waitfor == MNT_WAIT)
error = bwrite(bp);
else
bawrite(bp);
blks = howmany(fs->fs_cssize, fs->fs_fsize);
space = (caddr_t)fs->fs_csp[0];
for (i = 0; i < blks; i += fs->fs_frag) {
size = fs->fs_bsize;
if (i + fs->fs_frag > blks)
size = (blks - i) * fs->fs_fsize;
#ifdef SECSIZE
bp = getblk(mp->m_dev, fsbtodb(fs, fs->fs_csaddr + i), size,
fs->fs_dbsize);
#else SECSIZE
bp = getblk(mp->um_devvp, fsbtodb(fs, fs->fs_csaddr + i), size);
#endif SECSIZE
bcopy(space, bp->b_un.b_addr, (u_int)size);
space += size;
if (waitfor == MNT_WAIT)
error = bwrite(bp);
else
bawrite(bp);
}
return (error);
}