NetBSD/sys/filecorefs/filecore_vfsops.c

725 lines
17 KiB
C

/* $NetBSD: filecore_vfsops.c,v 1.22 2002/09/21 20:28:50 mycroft Exp $ */
/*-
* Copyright (c) 1998 Andrew McMurry
* Copyright (c) 1994 The Regents of the University of California.
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 3. All advertising materials mentioning features or use of this software
* must display the following acknowledgement:
* This product includes software developed by the University of
* California, Berkeley and its contributors.
* 4. Neither the name of the University nor the names of its contributors
* may be used to endorse or promote products derived from this software
* without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*
* filecore_vfsops.c 1.1 1998/6/26
*/
#include <sys/cdefs.h>
__KERNEL_RCSID(0, "$NetBSD: filecore_vfsops.c,v 1.22 2002/09/21 20:28:50 mycroft Exp $");
#if defined(_KERNEL_OPT)
#include "opt_compat_netbsd.h"
#endif
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/namei.h>
#include <sys/proc.h>
#include <sys/vnode.h>
#include <miscfs/specfs/specdev.h>
#include <sys/mount.h>
#include <sys/buf.h>
#include <sys/file.h>
#include <sys/device.h>
#include <sys/errno.h>
#include <sys/malloc.h>
#include <sys/pool.h>
#include <sys/conf.h>
#include <filecorefs/filecore.h>
#include <filecorefs/filecore_extern.h>
#include <filecorefs/filecore_node.h>
#include <filecorefs/filecore_mount.h>
extern const struct vnodeopv_desc filecore_vnodeop_opv_desc;
const struct vnodeopv_desc * const filecore_vnodeopv_descs[] = {
&filecore_vnodeop_opv_desc,
NULL,
};
struct vfsops filecore_vfsops = {
MOUNT_FILECORE,
filecore_mount,
filecore_start,
filecore_unmount,
filecore_root,
filecore_quotactl,
filecore_statfs,
filecore_sync,
filecore_vget,
filecore_fhtovp,
filecore_vptofh,
filecore_init,
filecore_reinit,
filecore_done,
filecore_sysctl,
NULL, /* filecore_mountroot */
filecore_checkexp,
filecore_vnodeopv_descs,
};
struct genfs_ops filecore_genfsops = {
genfs_size,
};
/*
* Called by vfs_mountroot when iso is going to be mounted as root.
*
* Name is updated by mount(8) after booting.
*/
static int filecore_mountfs __P((struct vnode *devvp, struct mount *mp,
struct proc *p, struct filecore_args *argp));
#if 0
int
filecore_mountroot()
{
struct mount *mp;
extern struct vnode *rootvp;
struct proc *p = curproc; /* XXX */
int error;
struct filecore_args args;
if (root_device->dv_class != DV_DISK)
return (ENODEV);
/*
* Get vnodes for swapdev and rootdev.
*/
if (bdevvp(rootdev, &rootvp))
panic("filecore_mountroot: can't setup rootvp");
if ((error = vfs_rootmountalloc(MOUNT_FILECORE, "root_device", &mp)) != 0)
return (error);
args.flags = FILECOREMNT_ROOT;
if ((error = filecore_mountfs(rootvp, mp, p, &args)) != 0) {
mp->mnt_op->vfs_refcount--;
vfs_unbusy(mp);
free(mp, M_MOUNT);
return (error);
}
simple_lock(&mountlist_slock);
CIRCLEQ_INSERT_TAIL(&mountlist, mp, mnt_list);
simple_unlock(&mountlist_slock);
(void)filecore_statfs(mp, &mp->mnt_stat, p);
vfs_unbusy(mp);
return (0);
}
#endif
/*
* VFS Operations.
*
* mount system call
*/
int
filecore_mount(mp, path, data, ndp, p)
struct mount *mp;
const char *path;
void *data;
struct nameidata *ndp;
struct proc *p;
{
struct vnode *devvp;
struct filecore_args args;
size_t size;
int error;
struct filecore_mnt *fcmp = NULL;
if (mp->mnt_flag & MNT_GETARGS) {
fcmp = VFSTOFILECORE(mp);
if (fcmp == NULL)
return EIO;
args.flags = fcmp->fc_mntflags;
args.uid = fcmp->fc_uid;
args.gid = fcmp->fc_gid;
args.fspec = NULL;
vfs_showexport(mp, &args.export, &fcmp->fc_export);
return copyout(&args, data, sizeof(args));
}
error = copyin(data, (caddr_t)&args, sizeof (struct filecore_args));
if (error)
return (error);
if ((mp->mnt_flag & MNT_RDONLY) == 0)
return (EROFS);
/*
* If updating, check whether changing from read-only to
* read/write; if there is no device name, that's all we do.
*/
if (mp->mnt_flag & MNT_UPDATE) {
fcmp = VFSTOFILECORE(mp);
if (args.fspec == 0)
return (vfs_export(mp, &fcmp->fc_export, &args.export));
}
/*
* Not an update, or updating the name: look up the name
* and verify that it refers to a sensible block device.
*/
NDINIT(ndp, LOOKUP, FOLLOW, UIO_USERSPACE, args.fspec, p);
if ((error = namei(ndp)) != 0)
return (error);
devvp = ndp->ni_vp;
if (devvp->v_type != VBLK) {
vrele(devvp);
return ENOTBLK;
}
if (bdevsw_lookup(devvp->v_rdev) == NULL) {
vrele(devvp);
return ENXIO;
}
/*
* If mount by non-root, then verify that user has necessary
* permissions on the device.
*/
if (p->p_ucred->cr_uid != 0) {
vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY);
error = VOP_ACCESS(devvp, VREAD, p->p_ucred, p);
VOP_UNLOCK(devvp, 0);
if (error) {
vrele(devvp);
return (error);
}
}
if ((mp->mnt_flag & MNT_UPDATE) == 0)
error = filecore_mountfs(devvp, mp, p, &args);
else {
if (devvp != fcmp->fc_devvp)
error = EINVAL; /* needs translation */
else
vrele(devvp);
}
if (error) {
vrele(devvp);
return error;
}
fcmp = VFSTOFILECORE(mp);
(void) copyinstr(path, mp->mnt_stat.f_mntonname, MNAMELEN - 1, &size);
memset(mp->mnt_stat.f_mntonname + size, 0, MNAMELEN - size);
(void) copyinstr(args.fspec, mp->mnt_stat.f_mntfromname, MNAMELEN - 1,
&size);
memset(mp->mnt_stat.f_mntfromname + size, 0, MNAMELEN - size);
return 0;
}
/*
* Common code for mount and mountroot
*/
static int
filecore_mountfs(devvp, mp, p, argp)
struct vnode *devvp;
struct mount *mp;
struct proc *p;
struct filecore_args *argp;
{
struct filecore_mnt *fcmp = (struct filecore_mnt *)0;
struct buf *bp = NULL;
dev_t dev = devvp->v_rdev;
int error = EINVAL;
int ronly = (mp->mnt_flag & MNT_RDONLY) != 0;
extern struct vnode *rootvp;
struct filecore_disc_record *fcdr;
unsigned map;
unsigned log2secsize;
if (!ronly)
return EROFS;
/*
* Disallow multiple mounts of the same device.
* Disallow mounting of a device that is currently in use
* (except for root, which might share swap device for miniroot).
* Flush out any old buffers remaining from a previous use.
*/
if ((error = vfs_mountedon(devvp)) != 0)
return error;
if (vcount(devvp) > 1 && devvp != rootvp)
return EBUSY;
if ((error = vinvalbuf(devvp, V_SAVE, p->p_ucred, p, 0, 0)) != 0)
return (error);
error = VOP_OPEN(devvp, ronly ? FREAD : FREAD|FWRITE, FSCRED, p);
if (error)
return error;
/* Read the filecore boot block to check FS validity and to find the map */
error = bread(devvp, FILECORE_BOOTBLOCK_BLKN,
FILECORE_BOOTBLOCK_SIZE, NOCRED, &bp);
#ifdef FILECORE_DEBUG_BR
printf("bread(%p, %x, %d, CRED, %p)=%d\n", devvp,
FILECORE_BOOTBLOCK_BLKN, FILECORE_BOOTBLOCK_SIZE,
bp, error);
#endif
if (error != 0)
goto out;
if (filecore_bbchecksum(bp->b_data) != 0) {
error = EINVAL;
goto out;
}
fcdr = (struct filecore_disc_record *)(bp->b_data+FILECORE_BB_DISCREC);
map = ((((8 << fcdr->log2secsize) - fcdr->zone_spare)
* (fcdr->nzones / 2) - 8 * FILECORE_DISCREC_SIZE)
<< fcdr->log2bpmb) >> fcdr->log2secsize;
log2secsize = fcdr->log2secsize;
bp->b_flags |= B_AGE;
#ifdef FILECORE_DEBUG_BR
printf("brelse(%p) vf1\n", bp);
#endif
brelse(bp);
bp = NULL;
/* Read the bootblock in the map */
error = bread(devvp, map, 1 << log2secsize, NOCRED, &bp);
#ifdef FILECORE_DEBUG_BR
printf("bread(%p, %x, %d, CRED, %p)=%d\n", devvp,
map, 1 << log2secsize, bp, error);
#endif
if (error != 0)
goto out;
fcdr = (struct filecore_disc_record *)(bp->b_data + 4);
fcmp = malloc(sizeof *fcmp, M_FILECOREMNT, M_WAITOK);
memset((caddr_t)fcmp, 0, sizeof *fcmp);
if (fcdr->log2bpmb > fcdr->log2secsize)
fcmp->log2bsize = fcdr->log2bpmb;
else fcmp->log2bsize = fcdr->log2secsize;
fcmp->blksize = 1 << fcmp->log2bsize;
memcpy((caddr_t)&fcmp->drec, (caddr_t)fcdr, sizeof(*fcdr));
fcmp->map = map;
fcmp->idspz = ((8 << fcdr->log2secsize) - fcdr->zone_spare)
/ (fcdr->idlen + 1);
fcmp->mask = (1 << fcdr->idlen) - 1;
if (fcdr->big_flag & 1) {
fcmp->nblks = ((((u_int64_t)fcdr->disc_size_2) << 32)
+ fcdr->disc_size) / fcmp->blksize;
} else {
fcmp->nblks=fcdr->disc_size / fcmp->blksize;
}
bp->b_flags |= B_AGE;
#ifdef FILECORE_DEBUG_BR
printf("brelse(%p) vf2\n", bp);
#endif
brelse(bp);
bp = NULL;
mp->mnt_data = fcmp;
mp->mnt_stat.f_fsid.val[0] = (long)dev;
mp->mnt_stat.f_fsid.val[1] = makefstype(MOUNT_FILECORE);
mp->mnt_maxsymlinklen = 0;
mp->mnt_flag |= MNT_LOCAL;
mp->mnt_dev_bshift = fcdr->log2secsize;
mp->mnt_fs_bshift = fcmp->log2bsize;
fcmp->fc_mountp = mp;
fcmp->fc_dev = dev;
fcmp->fc_devvp = devvp;
fcmp->fc_mntflags = argp->flags;
if (argp->flags & FILECOREMNT_USEUID) {
fcmp->fc_uid = p->p_cred->p_ruid;
fcmp->fc_gid = p->p_cred->p_rgid;
} else {
fcmp->fc_uid = argp->uid;
fcmp->fc_gid = argp->gid;
}
return 0;
out:
if (bp) {
#ifdef FILECORE_DEBUG_BR
printf("brelse(%p) vf3\n", bp);
#endif
brelse(bp);
}
vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY);
(void)VOP_CLOSE(devvp, ronly ? FREAD : FREAD|FWRITE, NOCRED, p);
VOP_UNLOCK(devvp, 0);
if (fcmp) {
free((caddr_t)fcmp, M_FILECOREMNT);
mp->mnt_data = NULL;
}
return error;
}
/*
* Make a filesystem operational.
* Nothing to do at the moment.
*/
/* ARGSUSED */
int
filecore_start(mp, flags, p)
struct mount *mp;
int flags;
struct proc *p;
{
return 0;
}
/*
* unmount system call
*/
int
filecore_unmount(mp, mntflags, p)
struct mount *mp;
int mntflags;
struct proc *p;
{
struct filecore_mnt *fcmp;
int error, flags = 0;
if (mntflags & MNT_FORCE)
flags |= FORCECLOSE;
#if 0
mntflushbuf(mp, 0);
if (mntinvalbuf(mp))
return EBUSY;
#endif
if ((error = vflush(mp, NULLVP, flags)) != 0)
return (error);
fcmp = VFSTOFILECORE(mp);
if (fcmp->fc_devvp->v_type != VBAD)
fcmp->fc_devvp->v_specmountpoint = NULL;
vn_lock(fcmp->fc_devvp, LK_EXCLUSIVE | LK_RETRY);
error = VOP_CLOSE(fcmp->fc_devvp, FREAD, NOCRED, p);
vput(fcmp->fc_devvp);
free((caddr_t)fcmp, M_FILECOREMNT);
mp->mnt_data = NULL;
mp->mnt_flag &= ~MNT_LOCAL;
return (error);
}
/*
* Return root of a filesystem
*/
int
filecore_root(mp, vpp)
struct mount *mp;
struct vnode **vpp;
{
struct vnode *nvp;
int error;
if ((error = VFS_VGET(mp, FILECORE_ROOTINO, &nvp)) != 0)
return (error);
*vpp = nvp;
return (0);
}
/*
* Do operations associated with quotas, not supported
*/
/* ARGSUSED */
int
filecore_quotactl(mp, cmd, uid, arg, p)
struct mount *mp;
int cmd;
uid_t uid;
caddr_t arg;
struct proc *p;
{
return (EOPNOTSUPP);
}
/*
* Get file system statistics.
*/
int
filecore_statfs(mp, sbp, p)
struct mount *mp;
struct statfs *sbp;
struct proc *p;
{
struct filecore_mnt *fcmp = VFSTOFILECORE(mp);
#ifdef COMPAT_09
sbp->f_type = 255;
#else
sbp->f_type = 0;
#endif
sbp->f_bsize = fcmp->blksize;
sbp->f_iosize = sbp->f_bsize; /* XXX */
sbp->f_blocks = fcmp->nblks;
sbp->f_bfree = 0; /* total free blocks */
sbp->f_bavail = 0; /* blocks free for non superuser */
sbp->f_files = 0; /* total files */
sbp->f_ffree = 0; /* free file nodes */
if (sbp != &mp->mnt_stat) {
memcpy(sbp->f_mntonname, mp->mnt_stat.f_mntonname, MNAMELEN);
memcpy(sbp->f_mntfromname, mp->mnt_stat.f_mntfromname, MNAMELEN);
}
strncpy(sbp->f_fstypename, mp->mnt_op->vfs_name, MFSNAMELEN);
return 0;
}
/* ARGSUSED */
int
filecore_sync(mp, waitfor, cred, p)
struct mount *mp;
int waitfor;
struct ucred *cred;
struct proc *p;
{
return (0);
}
/*
* File handle to vnode
*
* Have to be really careful about stale file handles:
* - check that the inode number is in range
* - call iget() to get the locked inode
* - check for an unallocated inode (i_mode == 0)
* - check that the generation number matches
*/
struct ifid {
ushort ifid_len;
ushort ifid_pad;
u_int32_t ifid_ino;
};
/* ARGSUSED */
int
filecore_fhtovp(mp, fhp, vpp)
struct mount *mp;
struct fid *fhp;
struct vnode **vpp;
{
struct ifid *ifhp = (struct ifid *)fhp;
struct vnode *nvp;
struct filecore_node *ip;
int error;
if ((error = VFS_VGET(mp, ifhp->ifid_ino, &nvp)) != 0) {
*vpp = NULLVP;
return (error);
}
ip = VTOI(nvp);
if (filecore_staleinode(ip)) {
vput(nvp);
*vpp = NULLVP;
return (ESTALE);
}
*vpp = nvp;
return (0);
}
/* ARGSUSED */
int
filecore_checkexp(mp, nam, exflagsp, credanonp)
struct mount *mp;
struct mbuf *nam;
int *exflagsp;
struct ucred **credanonp;
{
struct filecore_mnt *fcmp = VFSTOFILECORE(mp);
struct netcred *np;
/*
* Get the export permission structure for this <mp, client> tuple.
*/
np = vfs_export_lookup(mp, &fcmp->fc_export, nam);
if (np == NULL)
return (EACCES);
*exflagsp = np->netc_exflags;
*credanonp = &np->netc_anon;
return (0);
}
/* This looks complicated. Look at other vgets as well as the iso9660 one.
*
* The filecore inode number is made up of 1 byte directory entry index and
* 3 bytes of the internal disc address of the directory. On a read-only
* filesystem this is unique. For a read-write version we may not be able to
* do vget, see msdosfs.
*/
int
filecore_vget(mp, ino, vpp)
struct mount *mp;
ino_t ino;
struct vnode **vpp;
{
struct filecore_mnt *fcmp;
struct filecore_node *ip;
struct buf *bp;
struct vnode *vp;
dev_t dev;
int error;
fcmp = VFSTOFILECORE(mp);
dev = fcmp->fc_dev;
if ((*vpp = filecore_ihashget(dev, ino)) != NULLVP)
return (0);
/* Allocate a new vnode/filecore_node. */
if ((error = getnewvnode(VT_FILECORE, mp, filecore_vnodeop_p, &vp))
!= 0) {
*vpp = NULLVP;
return (error);
}
ip = pool_get(&filecore_node_pool, PR_WAITOK);
memset(ip, 0, sizeof(struct filecore_node));
vp->v_data = ip;
ip->i_vnode = vp;
ip->i_dev = dev;
ip->i_number = ino;
ip->i_block = -1;
ip->i_parent = -2;
/*
* Put it onto its hash chain and lock it so that other requests for
* this inode will block if they arrive while we are sleeping waiting
* for old data structures to be purged or for the contents of the
* disk portion of this inode to be read.
*/
filecore_ihashins(ip);
if (ino == FILECORE_ROOTINO) {
/* Here we need to construct a root directory inode */
memcpy((caddr_t)ip->i_dirent.name, (caddr_t)"root", 4);
ip->i_dirent.load = 0;
ip->i_dirent.exec = 0;
ip->i_dirent.len = FILECORE_DIR_SIZE;
ip->i_dirent.addr = fcmp->drec.root;
ip->i_dirent.attr = FILECORE_ATTR_DIR | FILECORE_ATTR_READ;
} else {
/* Read in Data from Directory Entry */
if ((error = filecore_bread(fcmp, ino & FILECORE_INO_MASK,
FILECORE_DIR_SIZE, NOCRED, &bp)) != 0) {
vput(vp);
#ifdef FILECORE_DEBUG_BR
printf("brelse(%p) vf4\n", bp);
#endif
brelse(bp);
*vpp = NULL;
return (error);
}
memcpy((caddr_t)&ip->i_dirent,
(caddr_t)fcdirentry(bp->b_data, ino >> FILECORE_INO_INDEX),
sizeof(struct filecore_direntry));
#ifdef FILECORE_DEBUG_BR
printf("brelse(%p) vf5\n", bp);
#endif
brelse(bp);
}
ip->i_mnt = fcmp;
ip->i_devvp = fcmp->fc_devvp;
ip->i_diroff = 0;
VREF(ip->i_devvp);
/*
* Setup type
*/
vp->v_type = VREG;
if (ip->i_dirent.attr & FILECORE_ATTR_DIR)
vp->v_type = VDIR;
/*
* Initialize the associated vnode
*/
switch (vp->v_type) {
case VFIFO:
case VCHR:
case VBLK:
/*
* Devices not supported.
*/
vput(vp);
return (EOPNOTSUPP);
case VLNK:
case VNON:
case VSOCK:
case VDIR:
case VBAD:
case VREG:
break;
}
if (ino == FILECORE_ROOTINO)
vp->v_flag |= VROOT;
/*
* XXX need generation number?
*/
genfs_node_init(vp, &filecore_genfsops);
vp->v_size = ip->i_size;
*vpp = vp;
return (0);
}
/*
* Vnode pointer to File handle
*/
/* ARGSUSED */
int
filecore_vptofh(vp, fhp)
struct vnode *vp;
struct fid *fhp;
{
struct filecore_node *ip = VTOI(vp);
struct ifid *ifhp;
ifhp = (struct ifid *)fhp;
ifhp->ifid_len = sizeof(struct ifid);
ifhp->ifid_ino = ip->i_number;
return 0;
}
int
filecore_sysctl(name, namelen, oldp, oldlenp, newp, newlen, p)
int *name;
u_int namelen;
void *oldp;
size_t *oldlenp;
void *newp;
size_t newlen;
struct proc *p;
{
return (EOPNOTSUPP);
}