2008-01-02 14:48:20 +03:00
|
|
|
/* $NetBSD: vfs_subr2.c,v 1.9 2008/01/02 11:48:56 ad Exp $ */
|
2007-07-29 18:44:08 +04:00
|
|
|
|
|
|
|
/*-
|
2007-10-11 00:42:20 +04:00
|
|
|
* Copyright (c) 1997, 1998, 2004, 2005, 2007 The NetBSD Foundation, Inc.
|
2007-07-29 18:44:08 +04:00
|
|
|
* All rights reserved.
|
|
|
|
*
|
|
|
|
* This code is derived from software contributed to The NetBSD Foundation
|
|
|
|
* by Jason R. Thorpe of the Numerical Aerospace Simulation Facility,
|
2007-10-11 00:42:20 +04:00
|
|
|
* NASA Ames Research Center, by Charles M. Hannum, and by Andrew Doran.
|
2007-07-29 18:44:08 +04:00
|
|
|
*
|
|
|
|
* Redistribution and use in source and binary forms, with or without
|
|
|
|
* modification, are permitted provided that the following conditions
|
|
|
|
* are met:
|
|
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer.
|
|
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
|
|
* documentation and/or other materials provided with the distribution.
|
|
|
|
* 3. All advertising materials mentioning features or use of this software
|
|
|
|
* must display the following acknowledgement:
|
|
|
|
* This product includes software developed by the NetBSD
|
|
|
|
* Foundation, Inc. and its contributors.
|
|
|
|
* 4. Neither the name of The NetBSD Foundation nor the names of its
|
|
|
|
* contributors may be used to endorse or promote products derived
|
|
|
|
* from this software without specific prior written permission.
|
|
|
|
*
|
|
|
|
* THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
|
|
|
|
* ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
|
|
|
|
* TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
|
|
|
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
|
|
|
|
* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
|
|
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
|
|
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
|
|
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
|
|
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
|
|
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
|
|
* POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
*/
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Copyright (c) 1989, 1993
|
|
|
|
* The Regents of the University of California. All rights reserved.
|
|
|
|
* (c) UNIX System Laboratories, Inc.
|
|
|
|
* All or some portions of this file are derived from material licensed
|
|
|
|
* to the University of California by American Telephone and Telegraph
|
|
|
|
* Co. or Unix System Laboratories, Inc. and are reproduced herein with
|
|
|
|
* the permission of UNIX System Laboratories, Inc.
|
|
|
|
*
|
|
|
|
* Redistribution and use in source and binary forms, with or without
|
|
|
|
* modification, are permitted provided that the following conditions
|
|
|
|
* are met:
|
|
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer.
|
|
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
|
|
* documentation and/or other materials provided with the distribution.
|
|
|
|
* 3. Neither the name of the University nor the names of its contributors
|
|
|
|
* may be used to endorse or promote products derived from this software
|
|
|
|
* without specific prior written permission.
|
|
|
|
*
|
|
|
|
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
|
|
|
|
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
|
|
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
|
|
|
|
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
|
|
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
|
|
|
|
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
|
|
|
|
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
|
|
|
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
|
|
|
|
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
|
|
|
|
* SUCH DAMAGE.
|
|
|
|
*
|
|
|
|
* @(#)vfs_subr.c 8.13 (Berkeley) 4/18/94
|
|
|
|
*/
|
|
|
|
|
|
|
|
/*
|
|
|
|
* External virtual filesystem routines.
|
|
|
|
*
|
|
|
|
* This file contains vfs subroutines which do not heavily depend on
|
|
|
|
* the kernel environment and are therefore suitable to be compiled
|
|
|
|
* outside of the kernel.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <sys/cdefs.h>
|
2008-01-02 14:48:20 +03:00
|
|
|
__KERNEL_RCSID(0, "$NetBSD: vfs_subr2.c,v 1.9 2008/01/02 11:48:56 ad Exp $");
|
2007-07-29 18:44:08 +04:00
|
|
|
|
|
|
|
#include "opt_ddb.h"
|
|
|
|
|
|
|
|
#include <sys/param.h>
|
|
|
|
#include <sys/filedesc.h>
|
|
|
|
#include <sys/kauth.h>
|
|
|
|
#include <sys/malloc.h>
|
|
|
|
#include <sys/mount.h>
|
|
|
|
#include <sys/stat.h>
|
|
|
|
#include <sys/systm.h>
|
|
|
|
#include <sys/vnode.h>
|
2007-10-11 00:42:20 +04:00
|
|
|
#include <sys/proc.h>
|
2008-01-02 14:48:20 +03:00
|
|
|
#include <sys/kthread.h>
|
2007-07-29 18:44:08 +04:00
|
|
|
|
2007-08-10 00:55:30 +04:00
|
|
|
#include <miscfs/syncfs/syncfs.h>
|
2007-07-29 18:44:08 +04:00
|
|
|
#include <miscfs/specfs/specdev.h>
|
|
|
|
|
|
|
|
#include <uvm/uvm_ddb.h>
|
|
|
|
|
|
|
|
const enum vtype iftovt_tab[16] = {
|
|
|
|
VNON, VFIFO, VCHR, VNON, VDIR, VNON, VBLK, VNON,
|
|
|
|
VREG, VNON, VLNK, VNON, VSOCK, VNON, VNON, VBAD,
|
|
|
|
};
|
|
|
|
const int vttoif_tab[9] = {
|
|
|
|
0, S_IFREG, S_IFDIR, S_IFBLK, S_IFCHR, S_IFLNK,
|
|
|
|
S_IFSOCK, S_IFIFO, S_IFMT,
|
|
|
|
};
|
|
|
|
|
2007-08-14 17:51:31 +04:00
|
|
|
/*
 * Insq/Remq for the vnode usage lists.
 *
 * bufinsvn(bp, dp) inserts buffer bp at the head of buffer list dp.
 * bufremvn(bp) unlinks bp from the list it is on and then stores NOLIST
 * in its forward link, which is how the rest of this file recognises a
 * buffer that is on no list.
 *
 * bufremvn() is wrapped in do { } while (0) so that it expands to exactly
 * one statement and can be used safely in an unbraced if/else.
 */
#define	bufinsvn(bp, dp)	LIST_INSERT_HEAD(dp, bp, b_vnbufs)
#define	bufremvn(bp) do {						\
	LIST_REMOVE(bp, b_vnbufs);					\
	(bp)->b_vnbufs.le_next = NOLIST;				\
} while (/*CONSTCOND*/ 0)
|
|
|
|
|
2007-07-29 18:44:08 +04:00
|
|
|
int doforce = 1; /* 1 => permit forcible unmounting */
|
|
|
|
int prtactive = 0; /* 1 => print out reclaim of active vnodes */
|
|
|
|
|
2007-10-11 00:42:20 +04:00
|
|
|
kmutex_t mountlist_lock;
|
|
|
|
kmutex_t mntid_lock;
|
2008-01-02 14:48:20 +03:00
|
|
|
kmutex_t mntvnode_lock;
|
|
|
|
kmutex_t vnode_free_list_lock;
|
|
|
|
kmutex_t spechash_lock;
|
2007-10-11 00:42:20 +04:00
|
|
|
kmutex_t vfs_list_lock;
|
2007-07-29 18:44:08 +04:00
|
|
|
|
|
|
|
struct mntlist mountlist = /* mounted filesystem list */
|
|
|
|
CIRCLEQ_HEAD_INITIALIZER(mountlist);
|
|
|
|
|
2007-08-10 00:55:30 +04:00
|
|
|
static specificdata_domain_t mount_specificdata_domain;
|
|
|
|
|
2007-07-29 18:44:08 +04:00
|
|
|
/*
|
|
|
|
* These define the root filesystem and device.
|
|
|
|
*/
|
|
|
|
struct vnode *rootvnode;
|
|
|
|
struct device *root_device; /* root device */
|
|
|
|
|
|
|
|
#ifdef DEBUG
|
|
|
|
void printlockedvnodes(void);
|
|
|
|
#endif
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
u_int numvnodes;
|
2007-07-29 18:44:08 +04:00
|
|
|
|
2007-08-10 00:55:30 +04:00
|
|
|
/*
|
|
|
|
* Initialize the vnode management data structures.
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
vntblinit(void)
|
|
|
|
{
|
|
|
|
|
2007-10-11 00:42:20 +04:00
|
|
|
mutex_init(&mountlist_lock, MUTEX_DEFAULT, IPL_NONE);
|
|
|
|
mutex_init(&mntid_lock, MUTEX_DEFAULT, IPL_NONE);
|
2008-01-02 14:48:20 +03:00
|
|
|
mutex_init(&mntvnode_lock, MUTEX_DEFAULT, IPL_NONE);
|
|
|
|
mutex_init(&vnode_free_list_lock, MUTEX_DEFAULT, IPL_NONE);
|
|
|
|
mutex_init(&spechash_lock, MUTEX_DEFAULT, IPL_NONE);
|
2007-10-11 00:42:20 +04:00
|
|
|
mutex_init(&vfs_list_lock, MUTEX_DEFAULT, IPL_NONE);
|
|
|
|
|
2007-08-10 00:55:30 +04:00
|
|
|
mount_specificdata_domain = specificdata_domain_create();
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
/* Initialize the filesystem syncer. */
|
2007-08-10 00:55:30 +04:00
|
|
|
vn_initialize_syncerd();
|
2008-01-02 14:48:20 +03:00
|
|
|
vn_init1();
|
2007-08-10 00:55:30 +04:00
|
|
|
}
|
|
|
|
|
2007-07-29 18:44:08 +04:00
|
|
|
/*
|
|
|
|
* Lookup a mount point by filesystem identifier.
|
|
|
|
*/
|
|
|
|
struct mount *
|
|
|
|
vfs_getvfs(fsid_t *fsid)
|
|
|
|
{
|
|
|
|
struct mount *mp;
|
|
|
|
|
2007-10-11 00:42:20 +04:00
|
|
|
mutex_enter(&mountlist_lock);
|
2007-07-29 18:44:08 +04:00
|
|
|
CIRCLEQ_FOREACH(mp, &mountlist, mnt_list) {
|
|
|
|
if (mp->mnt_stat.f_fsidx.__fsid_val[0] == fsid->__fsid_val[0] &&
|
|
|
|
mp->mnt_stat.f_fsidx.__fsid_val[1] == fsid->__fsid_val[1]) {
|
2007-10-11 00:42:20 +04:00
|
|
|
mutex_exit(&mountlist_lock);
|
2007-07-29 18:44:08 +04:00
|
|
|
return (mp);
|
|
|
|
}
|
|
|
|
}
|
2007-10-11 00:42:20 +04:00
|
|
|
mutex_exit(&mountlist_lock);
|
2007-07-29 18:44:08 +04:00
|
|
|
return ((struct mount *)0);
|
|
|
|
}
|
|
|
|
|
2007-10-11 00:42:20 +04:00
|
|
|
/*
|
|
|
|
* Free a mount structure.
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
vfs_destroy(struct mount *mp)
|
|
|
|
{
|
|
|
|
|
|
|
|
specificdata_fini(mount_specificdata_domain, &mp->mnt_specdataref);
|
2008-01-02 14:48:20 +03:00
|
|
|
mutex_destroy(&mp->mnt_mutex);
|
|
|
|
lockdestroy(&mp->mnt_lock);
|
2007-10-11 00:42:20 +04:00
|
|
|
free(mp, M_MOUNT);
|
|
|
|
}
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
/*
|
|
|
|
* Wait for a vnode (typically with VI_XLOCK set) to be cleaned or
|
|
|
|
* recycled.
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
vwait(vnode_t *vp, int flags)
|
|
|
|
{
|
|
|
|
|
|
|
|
KASSERT(mutex_owned(&vp->v_interlock));
|
|
|
|
KASSERT(vp->v_usecount != 0);
|
|
|
|
|
|
|
|
while ((vp->v_iflag & flags) != 0)
|
|
|
|
cv_wait(&vp->v_cv, &vp->v_interlock);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Insert a marker vnode into a mount's vnode list, after the
|
|
|
|
* specified vnode. mntvnode_lock must be held.
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
vmark(vnode_t *mvp, vnode_t *vp)
|
|
|
|
{
|
|
|
|
struct mount *mp;
|
|
|
|
|
|
|
|
mp = mvp->v_mount;
|
|
|
|
|
|
|
|
KASSERT(mutex_owned(&mntvnode_lock));
|
|
|
|
KASSERT((mvp->v_iflag & VI_MARKER) != 0);
|
|
|
|
KASSERT(vp->v_mount == mp);
|
|
|
|
|
|
|
|
TAILQ_INSERT_AFTER(&mp->mnt_vnodelist, vp, mvp, v_mntvnodes);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Remove a marker vnode from a mount's vnode list, and return
|
|
|
|
* a pointer to the next vnode in the list. mntvnode_lock must
|
|
|
|
* be held.
|
|
|
|
*/
|
|
|
|
vnode_t *
|
|
|
|
vunmark(vnode_t *mvp)
|
|
|
|
{
|
|
|
|
vnode_t *vp;
|
|
|
|
struct mount *mp;
|
|
|
|
|
|
|
|
mp = mvp->v_mount;
|
|
|
|
|
|
|
|
KASSERT(mutex_owned(&mntvnode_lock));
|
|
|
|
KASSERT((mvp->v_iflag & VI_MARKER) != 0);
|
|
|
|
|
|
|
|
vp = TAILQ_NEXT(mvp, v_mntvnodes);
|
|
|
|
TAILQ_REMOVE(&mp->mnt_vnodelist, mvp, v_mntvnodes);
|
|
|
|
|
|
|
|
KASSERT(vp == NULL || vp->v_mount == mp);
|
|
|
|
|
|
|
|
return vp;
|
|
|
|
}
|
|
|
|
|
2007-08-14 17:51:31 +04:00
|
|
|
/*
|
|
|
|
* Update outstanding I/O count and do wakeup if requested.
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
vwakeup(struct buf *bp)
|
|
|
|
{
|
|
|
|
struct vnode *vp;
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
if ((vp = bp->b_vp) == NULL)
|
|
|
|
return;
|
|
|
|
|
|
|
|
KASSERT(bp->b_objlock == &vp->v_interlock);
|
|
|
|
KASSERT(mutex_owned(bp->b_objlock));
|
|
|
|
|
|
|
|
if (--vp->v_numoutput < 0)
|
|
|
|
panic("vwakeup: neg numoutput, vp %p", vp);
|
|
|
|
if (vp->v_numoutput == 0)
|
|
|
|
cv_broadcast(&vp->v_cv);
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Flush out and invalidate all buffers associated with a vnode.
|
|
|
|
* Called with the underlying vnode locked, which should prevent new dirty
|
|
|
|
* buffers from being queued.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
vinvalbuf(struct vnode *vp, int flags, kauth_cred_t cred, struct lwp *l,
|
2008-01-02 14:48:20 +03:00
|
|
|
bool catch, int slptimeo)
|
2007-08-14 17:51:31 +04:00
|
|
|
{
|
|
|
|
struct buf *bp, *nbp;
|
2008-01-02 14:48:20 +03:00
|
|
|
int error;
|
2007-08-14 17:51:31 +04:00
|
|
|
int flushflags = PGO_ALLPAGES | PGO_FREE | PGO_SYNCIO |
|
2008-01-02 14:48:20 +03:00
|
|
|
(flags & V_SAVE ? PGO_CLEANIT | PGO_RECLAIM : 0);
|
2007-08-14 17:51:31 +04:00
|
|
|
|
|
|
|
/* XXXUBC this doesn't look at flags or slp* */
|
2008-01-02 14:48:20 +03:00
|
|
|
mutex_enter(&vp->v_interlock);
|
2007-08-14 17:51:31 +04:00
|
|
|
error = VOP_PUTPAGES(vp, 0, 0, flushflags);
|
|
|
|
if (error) {
|
|
|
|
return error;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (flags & V_SAVE) {
|
2007-11-26 22:01:26 +03:00
|
|
|
error = VOP_FSYNC(vp, cred, FSYNC_WAIT|FSYNC_RECLAIM, 0, 0);
|
2007-08-14 17:51:31 +04:00
|
|
|
if (error)
|
|
|
|
return (error);
|
2008-01-02 14:48:20 +03:00
|
|
|
KASSERT(vp->v_numoutput == 0 && LIST_EMPTY(&vp->v_dirtyblkhd));
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
mutex_enter(&bufcache_lock);
|
2007-08-14 17:51:31 +04:00
|
|
|
restart:
|
2008-01-02 14:48:20 +03:00
|
|
|
for (bp = LIST_FIRST(&vp->v_dirtyblkhd); bp; bp = nbp) {
|
2007-08-14 17:51:31 +04:00
|
|
|
nbp = LIST_NEXT(bp, b_vnbufs);
|
2008-01-02 14:48:20 +03:00
|
|
|
error = bbusy(bp, catch, slptimeo);
|
|
|
|
if (error != 0) {
|
|
|
|
if (error == EPASSTHROUGH)
|
|
|
|
goto restart;
|
|
|
|
mutex_exit(&bufcache_lock);
|
|
|
|
return (error);
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
2008-01-02 14:48:20 +03:00
|
|
|
brelsel(bp, BC_INVAL | BC_VFLUSH);
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
for (bp = LIST_FIRST(&vp->v_cleanblkhd); bp; bp = nbp) {
|
2007-08-14 17:51:31 +04:00
|
|
|
nbp = LIST_NEXT(bp, b_vnbufs);
|
2008-01-02 14:48:20 +03:00
|
|
|
error = bbusy(bp, catch, slptimeo);
|
|
|
|
if (error != 0) {
|
|
|
|
if (error == EPASSTHROUGH)
|
|
|
|
goto restart;
|
|
|
|
mutex_exit(&bufcache_lock);
|
|
|
|
return (error);
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
|
|
|
/*
|
|
|
|
* XXX Since there are no node locks for NFS, I believe
|
|
|
|
* there is a slight chance that a delayed write will
|
|
|
|
* occur while sleeping just above, so check for it.
|
|
|
|
*/
|
2008-01-02 14:48:20 +03:00
|
|
|
if ((bp->b_oflags & BO_DELWRI) && (flags & V_SAVE)) {
|
2007-08-14 17:51:31 +04:00
|
|
|
#ifdef DEBUG
|
|
|
|
printf("buffer still DELWRI\n");
|
|
|
|
#endif
|
2008-01-02 14:48:20 +03:00
|
|
|
bp->b_cflags |= BC_BUSY | BC_VFLUSH;
|
|
|
|
mutex_exit(&bufcache_lock);
|
2007-08-14 17:51:31 +04:00
|
|
|
VOP_BWRITE(bp);
|
2008-01-02 14:48:20 +03:00
|
|
|
mutex_enter(&bufcache_lock);
|
2007-08-14 17:51:31 +04:00
|
|
|
goto restart;
|
|
|
|
}
|
2008-01-02 14:48:20 +03:00
|
|
|
brelsel(bp, BC_INVAL | BC_VFLUSH);
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
#ifdef DIAGNOSTIC
|
|
|
|
if (!LIST_EMPTY(&vp->v_cleanblkhd) || !LIST_EMPTY(&vp->v_dirtyblkhd))
|
|
|
|
panic("vinvalbuf: flush failed, vp %p", vp);
|
|
|
|
#endif
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
mutex_exit(&bufcache_lock);
|
2007-08-14 17:51:31 +04:00
|
|
|
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Destroy any in core blocks past the truncation length.
|
|
|
|
* Called with the underlying vnode locked, which should prevent new dirty
|
|
|
|
* buffers from being queued.
|
|
|
|
*/
|
|
|
|
int
|
2008-01-02 14:48:20 +03:00
|
|
|
vtruncbuf(struct vnode *vp, daddr_t lbn, bool catch, int slptimeo)
|
2007-08-14 17:51:31 +04:00
|
|
|
{
|
|
|
|
struct buf *bp, *nbp;
|
2008-01-02 14:48:20 +03:00
|
|
|
int error;
|
2007-08-14 17:51:31 +04:00
|
|
|
voff_t off;
|
|
|
|
|
|
|
|
off = round_page((voff_t)lbn << vp->v_mount->mnt_fs_bshift);
|
2008-01-02 14:48:20 +03:00
|
|
|
mutex_enter(&vp->v_interlock);
|
2007-08-14 17:51:31 +04:00
|
|
|
error = VOP_PUTPAGES(vp, off, 0, PGO_FREE | PGO_SYNCIO);
|
|
|
|
if (error) {
|
|
|
|
return error;
|
|
|
|
}
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
mutex_enter(&bufcache_lock);
|
2007-08-14 17:51:31 +04:00
|
|
|
restart:
|
2008-01-02 14:48:20 +03:00
|
|
|
for (bp = LIST_FIRST(&vp->v_dirtyblkhd); bp; bp = nbp) {
|
2007-08-14 17:51:31 +04:00
|
|
|
nbp = LIST_NEXT(bp, b_vnbufs);
|
|
|
|
if (bp->b_lblkno < lbn)
|
|
|
|
continue;
|
2008-01-02 14:48:20 +03:00
|
|
|
error = bbusy(bp, catch, slptimeo);
|
|
|
|
if (error != 0) {
|
|
|
|
if (error == EPASSTHROUGH)
|
|
|
|
goto restart;
|
|
|
|
mutex_exit(&bufcache_lock);
|
|
|
|
return (error);
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
2008-01-02 14:48:20 +03:00
|
|
|
brelsel(bp, BC_INVAL | BC_VFLUSH);
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
for (bp = LIST_FIRST(&vp->v_cleanblkhd); bp; bp = nbp) {
|
2007-08-14 17:51:31 +04:00
|
|
|
nbp = LIST_NEXT(bp, b_vnbufs);
|
|
|
|
if (bp->b_lblkno < lbn)
|
|
|
|
continue;
|
2008-01-02 14:48:20 +03:00
|
|
|
error = bbusy(bp, catch, slptimeo);
|
|
|
|
if (error != 0) {
|
|
|
|
if (error == EPASSTHROUGH)
|
|
|
|
goto restart;
|
|
|
|
mutex_exit(&bufcache_lock);
|
|
|
|
return (error);
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
2008-01-02 14:48:20 +03:00
|
|
|
brelsel(bp, BC_INVAL | BC_VFLUSH);
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
2008-01-02 14:48:20 +03:00
|
|
|
mutex_exit(&bufcache_lock);
|
2007-08-14 17:51:31 +04:00
|
|
|
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
/*
|
|
|
|
* Flush all dirty buffers from a vnode.
|
|
|
|
* Called with the underlying vnode locked, which should prevent new dirty
|
|
|
|
* buffers from being queued.
|
|
|
|
*/
|
2007-08-14 17:51:31 +04:00
|
|
|
void
|
|
|
|
vflushbuf(struct vnode *vp, int sync)
|
|
|
|
{
|
|
|
|
struct buf *bp, *nbp;
|
|
|
|
int flags = PGO_CLEANIT | PGO_ALLPAGES | (sync ? PGO_SYNCIO : 0);
|
2008-01-02 14:48:20 +03:00
|
|
|
bool dirty;
|
2007-08-14 17:51:31 +04:00
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
mutex_enter(&vp->v_interlock);
|
2007-08-14 17:51:31 +04:00
|
|
|
(void) VOP_PUTPAGES(vp, 0, 0, flags);
|
|
|
|
|
|
|
|
loop:
|
2008-01-02 14:48:20 +03:00
|
|
|
mutex_enter(&bufcache_lock);
|
2007-08-14 17:51:31 +04:00
|
|
|
for (bp = LIST_FIRST(&vp->v_dirtyblkhd); bp; bp = nbp) {
|
|
|
|
nbp = LIST_NEXT(bp, b_vnbufs);
|
2008-01-02 14:48:20 +03:00
|
|
|
if ((bp->b_cflags & BC_BUSY))
|
2007-08-14 17:51:31 +04:00
|
|
|
continue;
|
2008-01-02 14:48:20 +03:00
|
|
|
if ((bp->b_oflags & BO_DELWRI) == 0)
|
2007-08-14 17:51:31 +04:00
|
|
|
panic("vflushbuf: not dirty, bp %p", bp);
|
2008-01-02 14:48:20 +03:00
|
|
|
bp->b_cflags |= BC_BUSY | BC_VFLUSH;
|
|
|
|
mutex_exit(&bufcache_lock);
|
2007-08-14 17:51:31 +04:00
|
|
|
/*
|
|
|
|
* Wait for I/O associated with indirect blocks to complete,
|
|
|
|
* since there is no way to quickly wait for them below.
|
|
|
|
*/
|
|
|
|
if (bp->b_vp == vp || sync == 0)
|
|
|
|
(void) bawrite(bp);
|
|
|
|
else
|
|
|
|
(void) bwrite(bp);
|
|
|
|
goto loop;
|
|
|
|
}
|
2008-01-02 14:48:20 +03:00
|
|
|
mutex_exit(&bufcache_lock);
|
|
|
|
|
|
|
|
if (sync == 0)
|
2007-08-14 17:51:31 +04:00
|
|
|
return;
|
2008-01-02 14:48:20 +03:00
|
|
|
|
|
|
|
mutex_enter(&vp->v_interlock);
|
|
|
|
while (vp->v_numoutput != 0)
|
|
|
|
cv_wait(&vp->v_cv, &vp->v_interlock);
|
|
|
|
dirty = !LIST_EMPTY(&vp->v_dirtyblkhd);
|
|
|
|
mutex_exit(&vp->v_interlock);
|
|
|
|
|
|
|
|
if (dirty) {
|
2007-08-14 17:51:31 +04:00
|
|
|
vprint("vflushbuf: dirty", vp);
|
|
|
|
goto loop;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2008-01-02 14:48:20 +03:00
|
|
|
* Associate a buffer with a vnode. There must already be a hold on
|
|
|
|
* the vnode.
|
2007-08-14 17:51:31 +04:00
|
|
|
*/
|
|
|
|
void
|
|
|
|
bgetvp(struct vnode *vp, struct buf *bp)
|
|
|
|
{
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
KASSERT(bp->b_vp == NULL);
|
|
|
|
KASSERT(bp->b_objlock == &buffer_lock);
|
|
|
|
KASSERT(mutex_owned(&vp->v_interlock));
|
|
|
|
KASSERT(mutex_owned(&bufcache_lock));
|
|
|
|
KASSERT((bp->b_cflags & BC_BUSY) != 0);
|
|
|
|
|
|
|
|
vholdl(vp);
|
2007-08-14 17:51:31 +04:00
|
|
|
bp->b_vp = vp;
|
|
|
|
if (vp->v_type == VBLK || vp->v_type == VCHR)
|
|
|
|
bp->b_dev = vp->v_rdev;
|
|
|
|
else
|
|
|
|
bp->b_dev = NODEV;
|
2008-01-02 14:48:20 +03:00
|
|
|
|
2007-08-14 17:51:31 +04:00
|
|
|
/*
|
|
|
|
* Insert onto list for new vnode.
|
|
|
|
*/
|
|
|
|
bufinsvn(bp, &vp->v_cleanblkhd);
|
2008-01-02 14:48:20 +03:00
|
|
|
bp->b_objlock = &vp->v_interlock;
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Disassociate a buffer from a vnode.
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
brelvp(struct buf *bp)
|
|
|
|
{
|
2008-01-02 14:48:20 +03:00
|
|
|
struct vnode *vp = bp->b_vp;
|
2007-08-14 17:51:31 +04:00
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
KASSERT(vp != NULL);
|
|
|
|
KASSERT(bp->b_objlock == &vp->v_interlock);
|
|
|
|
KASSERT(mutex_owned(&vp->v_interlock));
|
|
|
|
KASSERT(mutex_owned(&bufcache_lock));
|
|
|
|
KASSERT((bp->b_cflags & BC_BUSY) != 0);
|
2007-08-14 17:51:31 +04:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Delete from old vnode list, if on one.
|
|
|
|
*/
|
|
|
|
if (LIST_NEXT(bp, b_vnbufs) != NOLIST)
|
|
|
|
bufremvn(bp);
|
|
|
|
|
2007-10-11 00:42:20 +04:00
|
|
|
if (TAILQ_EMPTY(&vp->v_uobj.memq) && (vp->v_iflag & VI_ONWORKLST) &&
|
2007-08-14 17:51:31 +04:00
|
|
|
LIST_FIRST(&vp->v_dirtyblkhd) == NULL) {
|
2007-10-11 00:42:20 +04:00
|
|
|
vp->v_iflag &= ~VI_WRMAPDIRTY;
|
2007-08-14 17:51:31 +04:00
|
|
|
vn_syncer_remove_from_worklist(vp);
|
|
|
|
}
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
bp->b_objlock = &buffer_lock;
|
2007-08-14 17:51:31 +04:00
|
|
|
bp->b_vp = NULL;
|
2008-01-02 14:48:20 +03:00
|
|
|
holdrelel(vp);
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
2008-01-02 14:48:20 +03:00
|
|
|
* Reassign a buffer from one vnode list to another.
|
|
|
|
* The list reassignment must be within the same vnode.
|
2007-08-14 17:51:31 +04:00
|
|
|
* Used to assign file specific control information
|
2008-01-02 14:48:20 +03:00
|
|
|
* (indirect blocks) to the list to which they belong.
|
2007-08-14 17:51:31 +04:00
|
|
|
*/
|
|
|
|
void
|
2008-01-02 14:48:20 +03:00
|
|
|
reassignbuf(struct buf *bp, struct vnode *vp)
|
2007-08-14 17:51:31 +04:00
|
|
|
{
|
|
|
|
struct buflists *listheadp;
|
|
|
|
int delayx;
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
KASSERT(bp->b_objlock == &vp->v_interlock);
|
|
|
|
KASSERT(mutex_owned(&vp->v_interlock));
|
|
|
|
KASSERT((bp->b_cflags & BC_BUSY) != 0);
|
|
|
|
|
2007-08-14 17:51:31 +04:00
|
|
|
/*
|
|
|
|
* Delete from old vnode list, if on one.
|
|
|
|
*/
|
|
|
|
if (LIST_NEXT(bp, b_vnbufs) != NOLIST)
|
|
|
|
bufremvn(bp);
|
2008-01-02 14:48:20 +03:00
|
|
|
|
2007-08-14 17:51:31 +04:00
|
|
|
/*
|
|
|
|
* If dirty, put on list of dirty buffers;
|
|
|
|
* otherwise insert onto list of clean buffers.
|
|
|
|
*/
|
2008-01-02 14:48:20 +03:00
|
|
|
if ((bp->b_oflags & BO_DELWRI) == 0) {
|
|
|
|
listheadp = &vp->v_cleanblkhd;
|
|
|
|
if (TAILQ_EMPTY(&vp->v_uobj.memq) &&
|
|
|
|
(vp->v_iflag & VI_ONWORKLST) &&
|
|
|
|
LIST_FIRST(&vp->v_dirtyblkhd) == NULL) {
|
|
|
|
vp->v_iflag &= ~VI_WRMAPDIRTY;
|
|
|
|
vn_syncer_remove_from_worklist(vp);
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
|
|
|
} else {
|
2008-01-02 14:48:20 +03:00
|
|
|
listheadp = &vp->v_dirtyblkhd;
|
|
|
|
if ((vp->v_iflag & VI_ONWORKLST) == 0) {
|
|
|
|
switch (vp->v_type) {
|
2007-08-14 17:51:31 +04:00
|
|
|
case VDIR:
|
|
|
|
delayx = dirdelay;
|
|
|
|
break;
|
|
|
|
case VBLK:
|
2008-01-02 14:48:20 +03:00
|
|
|
if (vp->v_specmountpoint != NULL) {
|
2007-08-14 17:51:31 +04:00
|
|
|
delayx = metadelay;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
/* fall through */
|
|
|
|
default:
|
|
|
|
delayx = filedelay;
|
|
|
|
break;
|
|
|
|
}
|
2008-01-02 14:48:20 +03:00
|
|
|
if (!vp->v_mount ||
|
|
|
|
(vp->v_mount->mnt_flag & MNT_ASYNC) == 0)
|
|
|
|
vn_syncer_add_to_worklist(vp, delayx);
|
2007-08-14 17:51:31 +04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
bufinsvn(bp, listheadp);
|
|
|
|
}
|
|
|
|
|
2007-07-29 18:44:08 +04:00
|
|
|
/*
|
|
|
|
* Get a new unique fsid
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
vfs_getnewfsid(struct mount *mp)
|
|
|
|
{
|
|
|
|
static u_short xxxfs_mntid;
|
|
|
|
fsid_t tfsid;
|
|
|
|
int mtype;
|
|
|
|
|
2007-10-11 00:42:20 +04:00
|
|
|
mutex_enter(&mntid_lock);
|
2007-07-29 18:44:08 +04:00
|
|
|
mtype = makefstype(mp->mnt_op->vfs_name);
|
|
|
|
mp->mnt_stat.f_fsidx.__fsid_val[0] = makedev(mtype, 0);
|
|
|
|
mp->mnt_stat.f_fsidx.__fsid_val[1] = mtype;
|
|
|
|
mp->mnt_stat.f_fsid = mp->mnt_stat.f_fsidx.__fsid_val[0];
|
|
|
|
if (xxxfs_mntid == 0)
|
|
|
|
++xxxfs_mntid;
|
|
|
|
tfsid.__fsid_val[0] = makedev(mtype & 0xff, xxxfs_mntid);
|
|
|
|
tfsid.__fsid_val[1] = mtype;
|
|
|
|
if (!CIRCLEQ_EMPTY(&mountlist)) {
|
|
|
|
while (vfs_getvfs(&tfsid)) {
|
|
|
|
tfsid.__fsid_val[0]++;
|
|
|
|
xxxfs_mntid++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
mp->mnt_stat.f_fsidx.__fsid_val[0] = tfsid.__fsid_val[0];
|
|
|
|
mp->mnt_stat.f_fsid = mp->mnt_stat.f_fsidx.__fsid_val[0];
|
2007-10-11 00:42:20 +04:00
|
|
|
mutex_exit(&mntid_lock);
|
2007-07-29 18:44:08 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Make a 'unique' number from a mount type name.
 *
 * Folds the NUL-terminated string "type" into a number: for each
 * character the accumulator is shifted left by two bits and XORed with
 * the character.  An empty name yields 0.
 *
 * The accumulation is done in unsigned arithmetic so that names long
 * enough to shift bits off the top of a long do not cause signed
 * overflow (undefined behaviour); the resulting bit pattern is the one
 * a wrapping signed computation would produce.
 */
long
makefstype(const char *type)
{
	unsigned long rv = 0;

	for (; *type != '\0'; type++) {
		rv <<= 2;
		/* Convert through long first to keep plain-char extension. */
		rv ^= (unsigned long)(long)*type;
	}
	return (long)rv;
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Set vnode attributes to VNOVAL
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
vattr_null(struct vattr *vap)
|
|
|
|
{
|
|
|
|
|
|
|
|
vap->va_type = VNON;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Assign individually so that it is safe even if size and
|
|
|
|
* sign of each member are varied.
|
|
|
|
*/
|
|
|
|
vap->va_mode = VNOVAL;
|
|
|
|
vap->va_nlink = VNOVAL;
|
|
|
|
vap->va_uid = VNOVAL;
|
|
|
|
vap->va_gid = VNOVAL;
|
|
|
|
vap->va_fsid = VNOVAL;
|
|
|
|
vap->va_fileid = VNOVAL;
|
|
|
|
vap->va_size = VNOVAL;
|
|
|
|
vap->va_blocksize = VNOVAL;
|
|
|
|
vap->va_atime.tv_sec =
|
|
|
|
vap->va_mtime.tv_sec =
|
|
|
|
vap->va_ctime.tv_sec =
|
|
|
|
vap->va_birthtime.tv_sec = VNOVAL;
|
|
|
|
vap->va_atime.tv_nsec =
|
|
|
|
vap->va_mtime.tv_nsec =
|
|
|
|
vap->va_ctime.tv_nsec =
|
|
|
|
vap->va_birthtime.tv_nsec = VNOVAL;
|
|
|
|
vap->va_gen = VNOVAL;
|
|
|
|
vap->va_flags = VNOVAL;
|
|
|
|
vap->va_rdev = VNOVAL;
|
|
|
|
vap->va_bytes = VNOVAL;
|
|
|
|
vap->va_vaflags = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * ARRAY_SIZE(arr): number of elements in the array "arr" (a real array,
 * not a pointer).
 *
 * ARRAY_PRINT(idx, arr): the string at arr[idx], or "UNKNOWN" when idx
 * is outside the array.  Index 0 is a valid entry.  The index is
 * compared as unsigned so that negative values are rejected as well.
 */
#define	ARRAY_SIZE(arr)		(sizeof(arr) / sizeof((arr)[0]))
#define	ARRAY_PRINT(idx, arr) \
    ((unsigned int)(idx) < ARRAY_SIZE(arr) ? (arr)[(idx)] : "UNKNOWN")
|
|
|
|
|
|
|
|
const char * const vnode_tags[] = { VNODE_TAGS };
|
|
|
|
const char * const vnode_types[] = { VNODE_TYPES };
|
|
|
|
const char vnode_flagbits[] = VNODE_FLAGBITS;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Print out a description of a vnode.
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
vprint(const char *label, struct vnode *vp)
|
|
|
|
{
|
|
|
|
char bf[96];
|
2007-10-11 00:42:20 +04:00
|
|
|
int flag;
|
|
|
|
|
|
|
|
flag = vp->v_iflag | vp->v_vflag | vp->v_uflag;
|
|
|
|
bitmask_snprintf(flag, vnode_flagbits, bf, sizeof(bf));
|
2007-07-29 18:44:08 +04:00
|
|
|
|
|
|
|
if (label != NULL)
|
|
|
|
printf("%s: ", label);
|
2007-10-11 00:42:20 +04:00
|
|
|
printf("vnode @ %p, flags (%s)\n\ttag %s(%d), type %s(%d), "
|
|
|
|
"usecount %d, writecount %ld, holdcount %ld\n"
|
2008-01-02 14:48:20 +03:00
|
|
|
"\tfreelisthd %p, mount %p, data %p\n", vp, bf,
|
2007-10-11 00:42:20 +04:00
|
|
|
ARRAY_PRINT(vp->v_tag, vnode_tags), vp->v_tag,
|
2007-07-29 18:44:08 +04:00
|
|
|
ARRAY_PRINT(vp->v_type, vnode_types), vp->v_type,
|
2007-10-11 00:42:20 +04:00
|
|
|
vp->v_usecount, vp->v_writecount, vp->v_holdcnt,
|
2008-01-02 14:48:20 +03:00
|
|
|
vp->v_freelisthd, vp->v_mount, vp->v_data);
|
2007-10-11 00:42:20 +04:00
|
|
|
if (vp->v_data != NULL) {
|
|
|
|
printf("\t");
|
2007-07-29 18:44:08 +04:00
|
|
|
VOP_PRINT(vp);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
#ifdef DEBUG
/*
 * List all of the locked vnodes in the system.
 * Called when debugging the kernel.
 *
 * Walks mountlist; mounts that cannot be busied without waiting are
 * skipped.  For each busied mount, every vnode on its vnode list for
 * which VOP_ISLOCKED() is true is printed with vprint().
 */
void
printlockedvnodes(void)
{
	struct mount *mp, *nmp;
	struct vnode *vp;

	printf("Locked vnodes\n");

	mutex_enter(&mountlist_lock);
	mp = CIRCLEQ_FIRST(&mountlist);
	while (mp != (void *)&mountlist) {
		if (vfs_busy(mp, LK_NOWAIT, &mountlist_lock) == 0) {
			/*
			 * NOTE(review): mountlist_lock is re-taken below,
			 * so vfs_busy() presumably drops it on success --
			 * confirm.
			 */
			TAILQ_FOREACH(vp, &mp->mnt_vnodelist, v_mntvnodes) {
				if (VOP_ISLOCKED(vp))
					vprint(NULL, vp);
			}
			mutex_enter(&mountlist_lock);
			nmp = CIRCLEQ_NEXT(mp, mnt_list);
			vfs_unbusy(mp);
		} else {
			/* Could not busy this mount; skip it. */
			nmp = CIRCLEQ_NEXT(mp, mnt_list);
		}
		mp = nmp;
	}
	mutex_exit(&mountlist_lock);
}
#endif
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Do the usual access checking.
|
|
|
|
* file_mode, uid and gid are from the vnode in question,
|
|
|
|
* while acc_mode and cred are from the VOP_ACCESS parameter list
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
vaccess(enum vtype type, mode_t file_mode, uid_t uid, gid_t gid,
|
|
|
|
mode_t acc_mode, kauth_cred_t cred)
|
|
|
|
{
|
|
|
|
mode_t mask;
|
|
|
|
int error, ismember;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Super-user always gets read/write access, but execute access depends
|
|
|
|
* on at least one execute bit being set.
|
|
|
|
*/
|
|
|
|
if (kauth_authorize_generic(cred, KAUTH_GENERIC_ISSUSER, NULL) == 0) {
|
|
|
|
if ((acc_mode & VEXEC) && type != VDIR &&
|
|
|
|
(file_mode & (S_IXUSR|S_IXGRP|S_IXOTH)) == 0)
|
|
|
|
return (EACCES);
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
|
|
|
mask = 0;
|
|
|
|
|
|
|
|
/* Otherwise, check the owner. */
|
|
|
|
if (kauth_cred_geteuid(cred) == uid) {
|
|
|
|
if (acc_mode & VEXEC)
|
|
|
|
mask |= S_IXUSR;
|
|
|
|
if (acc_mode & VREAD)
|
|
|
|
mask |= S_IRUSR;
|
|
|
|
if (acc_mode & VWRITE)
|
|
|
|
mask |= S_IWUSR;
|
|
|
|
return ((file_mode & mask) == mask ? 0 : EACCES);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Otherwise, check the groups. */
|
|
|
|
error = kauth_cred_ismember_gid(cred, gid, &ismember);
|
|
|
|
if (error)
|
|
|
|
return (error);
|
|
|
|
if (kauth_cred_getegid(cred) == gid || ismember) {
|
|
|
|
if (acc_mode & VEXEC)
|
|
|
|
mask |= S_IXGRP;
|
|
|
|
if (acc_mode & VREAD)
|
|
|
|
mask |= S_IRGRP;
|
|
|
|
if (acc_mode & VWRITE)
|
|
|
|
mask |= S_IWGRP;
|
|
|
|
return ((file_mode & mask) == mask ? 0 : EACCES);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Otherwise, check everyone else. */
|
|
|
|
if (acc_mode & VEXEC)
|
|
|
|
mask |= S_IXOTH;
|
|
|
|
if (acc_mode & VREAD)
|
|
|
|
mask |= S_IROTH;
|
|
|
|
if (acc_mode & VWRITE)
|
|
|
|
mask |= S_IWOTH;
|
|
|
|
return ((file_mode & mask) == mask ? 0 : EACCES);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Given a file system name, look up the vfsops for that
|
|
|
|
* file system, or return NULL if file system isn't present
|
|
|
|
* in the kernel.
|
|
|
|
*/
|
|
|
|
struct vfsops *
|
|
|
|
vfs_getopsbyname(const char *name)
|
|
|
|
{
|
|
|
|
struct vfsops *v;
|
|
|
|
|
2007-10-11 00:42:20 +04:00
|
|
|
mutex_enter(&vfs_list_lock);
|
2007-07-29 18:44:08 +04:00
|
|
|
LIST_FOREACH(v, &vfs_list, vfs_list) {
|
|
|
|
if (strcmp(v->vfs_name, name) == 0)
|
|
|
|
break;
|
|
|
|
}
|
2007-10-11 00:42:20 +04:00
|
|
|
if (v != NULL)
|
|
|
|
v->vfs_refcount++;
|
|
|
|
mutex_exit(&vfs_list_lock);
|
2007-07-29 18:44:08 +04:00
|
|
|
|
|
|
|
return (v);
|
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
copy_statvfs_info(struct statvfs *sbp, const struct mount *mp)
|
|
|
|
{
|
|
|
|
const struct statvfs *mbp;
|
|
|
|
|
|
|
|
if (sbp == (mbp = &mp->mnt_stat))
|
|
|
|
return;
|
|
|
|
|
|
|
|
(void)memcpy(&sbp->f_fsidx, &mbp->f_fsidx, sizeof(sbp->f_fsidx));
|
|
|
|
sbp->f_fsid = mbp->f_fsid;
|
|
|
|
sbp->f_owner = mbp->f_owner;
|
|
|
|
sbp->f_flag = mbp->f_flag;
|
|
|
|
sbp->f_syncwrites = mbp->f_syncwrites;
|
|
|
|
sbp->f_asyncwrites = mbp->f_asyncwrites;
|
|
|
|
sbp->f_syncreads = mbp->f_syncreads;
|
|
|
|
sbp->f_asyncreads = mbp->f_asyncreads;
|
|
|
|
(void)memcpy(sbp->f_spare, mbp->f_spare, sizeof(mbp->f_spare));
|
|
|
|
(void)memcpy(sbp->f_fstypename, mbp->f_fstypename,
|
|
|
|
sizeof(sbp->f_fstypename));
|
|
|
|
(void)memcpy(sbp->f_mntonname, mbp->f_mntonname,
|
|
|
|
sizeof(sbp->f_mntonname));
|
|
|
|
(void)memcpy(sbp->f_mntfromname, mp->mnt_stat.f_mntfromname,
|
|
|
|
sizeof(sbp->f_mntfromname));
|
|
|
|
sbp->f_namemax = mbp->f_namemax;
|
|
|
|
}
|
|
|
|
|
|
|
|
int
|
|
|
|
set_statvfs_info(const char *onp, int ukon, const char *fromp, int ukfrom,
|
|
|
|
const char *vfsname, struct mount *mp, struct lwp *l)
|
|
|
|
{
|
|
|
|
int error;
|
|
|
|
size_t size;
|
|
|
|
struct statvfs *sfs = &mp->mnt_stat;
|
|
|
|
int (*fun)(const void *, void *, size_t, size_t *);
|
|
|
|
|
|
|
|
(void)strlcpy(mp->mnt_stat.f_fstypename, vfsname,
|
|
|
|
sizeof(mp->mnt_stat.f_fstypename));
|
|
|
|
|
|
|
|
if (onp) {
|
|
|
|
struct cwdinfo *cwdi = l->l_proc->p_cwdi;
|
|
|
|
fun = (ukon == UIO_SYSSPACE) ? copystr : copyinstr;
|
|
|
|
if (cwdi->cwdi_rdir != NULL) {
|
|
|
|
size_t len;
|
|
|
|
char *bp;
|
|
|
|
char *path = malloc(MAXPATHLEN, M_TEMP, M_WAITOK);
|
|
|
|
|
|
|
|
if (!path) /* XXX can't happen with M_WAITOK */
|
|
|
|
return ENOMEM;
|
|
|
|
|
|
|
|
bp = path + MAXPATHLEN;
|
|
|
|
*--bp = '\0';
|
2007-10-08 19:12:05 +04:00
|
|
|
rw_enter(&cwdi->cwdi_lock, RW_READER);
|
2007-07-29 18:44:08 +04:00
|
|
|
error = getcwd_common(cwdi->cwdi_rdir, rootvnode, &bp,
|
|
|
|
path, MAXPATHLEN / 2, 0, l);
|
2007-10-08 19:12:05 +04:00
|
|
|
rw_exit(&cwdi->cwdi_lock);
|
2007-07-29 18:44:08 +04:00
|
|
|
if (error) {
|
|
|
|
free(path, M_TEMP);
|
|
|
|
return error;
|
|
|
|
}
|
|
|
|
|
|
|
|
len = strlen(bp);
|
|
|
|
if (len > sizeof(sfs->f_mntonname) - 1)
|
|
|
|
len = sizeof(sfs->f_mntonname) - 1;
|
|
|
|
(void)strncpy(sfs->f_mntonname, bp, len);
|
|
|
|
free(path, M_TEMP);
|
|
|
|
|
|
|
|
if (len < sizeof(sfs->f_mntonname) - 1) {
|
|
|
|
error = (*fun)(onp, &sfs->f_mntonname[len],
|
|
|
|
sizeof(sfs->f_mntonname) - len - 1, &size);
|
|
|
|
if (error)
|
|
|
|
return error;
|
|
|
|
size += len;
|
|
|
|
} else {
|
|
|
|
size = len;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
error = (*fun)(onp, &sfs->f_mntonname,
|
|
|
|
sizeof(sfs->f_mntonname) - 1, &size);
|
|
|
|
if (error)
|
|
|
|
return error;
|
|
|
|
}
|
|
|
|
(void)memset(sfs->f_mntonname + size, 0,
|
|
|
|
sizeof(sfs->f_mntonname) - size);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (fromp) {
|
|
|
|
fun = (ukfrom == UIO_SYSSPACE) ? copystr : copyinstr;
|
|
|
|
error = (*fun)(fromp, sfs->f_mntfromname,
|
|
|
|
sizeof(sfs->f_mntfromname) - 1, &size);
|
|
|
|
if (error)
|
|
|
|
return error;
|
|
|
|
(void)memset(sfs->f_mntfromname + size, 0,
|
|
|
|
sizeof(sfs->f_mntfromname) - size);
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Store a timestamp, as obtained from nanotime(), in *ts.
 */
void
vfs_timestamp(struct timespec *ts)
{
	nanotime(ts);
}
|
|
|
|
|
2007-07-30 12:45:26 +04:00
|
|
|
/* Recorded root fs time, if known; written by setrootfstime(). */
time_t rootfstime;

/*
 * Record t as the root file system time.
 */
void
setrootfstime(time_t t)
{
	rootfstime = t;
}
|
|
|
|
|
2007-08-10 00:55:30 +04:00
|
|
|
/*
|
|
|
|
* mount_specific_key_create --
|
|
|
|
* Create a key for subsystem mount-specific data.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
mount_specific_key_create(specificdata_key_t *keyp, specificdata_dtor_t dtor)
|
|
|
|
{
|
|
|
|
|
|
|
|
return (specificdata_key_create(mount_specificdata_domain, keyp, dtor));
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* mount_specific_key_delete --
|
|
|
|
* Delete a key for subsystem mount-specific data.
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
mount_specific_key_delete(specificdata_key_t key)
|
|
|
|
{
|
|
|
|
|
|
|
|
specificdata_key_delete(mount_specificdata_domain, key);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* mount_initspecific --
|
|
|
|
* Initialize a mount's specificdata container.
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
mount_initspecific(struct mount *mp)
|
|
|
|
{
|
|
|
|
int error;
|
|
|
|
|
|
|
|
error = specificdata_init(mount_specificdata_domain,
|
|
|
|
&mp->mnt_specdataref);
|
|
|
|
KASSERT(error == 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* mount_finispecific --
|
|
|
|
* Finalize a mount's specificdata container.
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
mount_finispecific(struct mount *mp)
|
|
|
|
{
|
|
|
|
|
|
|
|
specificdata_fini(mount_specificdata_domain, &mp->mnt_specdataref);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* mount_getspecific --
|
|
|
|
* Return mount-specific data corresponding to the specified key.
|
|
|
|
*/
|
|
|
|
void *
|
|
|
|
mount_getspecific(struct mount *mp, specificdata_key_t key)
|
|
|
|
{
|
|
|
|
|
|
|
|
return (specificdata_getspecific(mount_specificdata_domain,
|
|
|
|
&mp->mnt_specdataref, key));
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* mount_setspecific --
|
|
|
|
* Set mount-specific data corresponding to the specified key.
|
|
|
|
*/
|
|
|
|
void
|
|
|
|
mount_setspecific(struct mount *mp, specificdata_key_t key, void *data)
|
|
|
|
{
|
|
|
|
|
|
|
|
specificdata_setspecific(mount_specificdata_domain,
|
|
|
|
&mp->mnt_specdataref, key, data);
|
|
|
|
}
|
|
|
|
|
2007-07-29 18:44:08 +04:00
|
|
|
#ifdef DDB
|
|
|
|
static const char buf_flagbits[] = BUF_FLAGBITS;
|
|
|
|
|
|
|
|
void
|
|
|
|
vfs_buf_print(struct buf *bp, int full, void (*pr)(const char *, ...))
|
|
|
|
{
|
|
|
|
char bf[1024];
|
|
|
|
|
|
|
|
(*pr)(" vp %p lblkno 0x%"PRIx64" blkno 0x%"PRIx64" rawblkno 0x%"
|
|
|
|
PRIx64 " dev 0x%x\n",
|
|
|
|
bp->b_vp, bp->b_lblkno, bp->b_blkno, bp->b_rawblkno, bp->b_dev);
|
|
|
|
|
2008-01-02 14:48:20 +03:00
|
|
|
bitmask_snprintf(bp->b_flags | bp->b_oflags | bp->b_cflags,
|
|
|
|
buf_flagbits, bf, sizeof(bf));
|
2007-07-29 18:44:08 +04:00
|
|
|
(*pr)(" error %d flags 0x%s\n", bp->b_error, bf);
|
|
|
|
|
|
|
|
(*pr)(" bufsize 0x%lx bcount 0x%lx resid 0x%lx\n",
|
|
|
|
bp->b_bufsize, bp->b_bcount, bp->b_resid);
|
|
|
|
(*pr)(" data %p saveaddr %p dep %p\n",
|
|
|
|
bp->b_data, bp->b_saveaddr, LIST_FIRST(&bp->b_dep));
|
2008-01-02 14:48:20 +03:00
|
|
|
(*pr)(" iodone %p objlock %p\n", bp->b_iodone, bp->b_objlock);
|
2007-07-29 18:44:08 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void
|
|
|
|
vfs_vnode_print(struct vnode *vp, int full, void (*pr)(const char *, ...))
|
|
|
|
{
|
|
|
|
char bf[256];
|
|
|
|
|
|
|
|
uvm_object_printit(&vp->v_uobj, full, pr);
|
2007-10-11 00:42:20 +04:00
|
|
|
bitmask_snprintf(vp->v_iflag | vp->v_vflag | vp->v_uflag,
|
|
|
|
vnode_flagbits, bf, sizeof(bf));
|
2007-07-29 18:44:08 +04:00
|
|
|
(*pr)("\nVNODE flags %s\n", bf);
|
|
|
|
(*pr)("mp %p numoutput %d size 0x%llx writesize 0x%llx\n",
|
|
|
|
vp->v_mount, vp->v_numoutput, vp->v_size, vp->v_writesize);
|
|
|
|
|
2007-10-11 00:42:20 +04:00
|
|
|
(*pr)("data %p writecount %ld holdcnt %ld\n",
|
|
|
|
vp->v_data, vp->v_writecount, vp->v_holdcnt);
|
2007-07-29 18:44:08 +04:00
|
|
|
|
|
|
|
(*pr)("tag %s(%d) type %s(%d) mount %p typedata %p\n",
|
|
|
|
ARRAY_PRINT(vp->v_tag, vnode_tags), vp->v_tag,
|
|
|
|
ARRAY_PRINT(vp->v_type, vnode_types), vp->v_type,
|
|
|
|
vp->v_mount, vp->v_mountedhere);
|
|
|
|
|
|
|
|
if (full) {
|
|
|
|
struct buf *bp;
|
|
|
|
|
|
|
|
(*pr)("clean bufs:\n");
|
|
|
|
LIST_FOREACH(bp, &vp->v_cleanblkhd, b_vnbufs) {
|
|
|
|
(*pr)(" bp %p\n", bp);
|
|
|
|
vfs_buf_print(bp, full, pr);
|
|
|
|
}
|
|
|
|
|
|
|
|
(*pr)("dirty bufs:\n");
|
|
|
|
LIST_FOREACH(bp, &vp->v_dirtyblkhd, b_vnbufs) {
|
|
|
|
(*pr)(" bp %p\n", bp);
|
|
|
|
vfs_buf_print(bp, full, pr);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
vfs_mount_print(struct mount *mp, int full, void (*pr)(const char *, ...))
|
|
|
|
{
|
|
|
|
char sbuf[256];
|
|
|
|
|
|
|
|
(*pr)("vnodecovered = %p syncer = %p data = %p\n",
|
|
|
|
mp->mnt_vnodecovered,mp->mnt_syncer,mp->mnt_data);
|
|
|
|
|
|
|
|
(*pr)("fs_bshift %d dev_bshift = %d\n",
|
|
|
|
mp->mnt_fs_bshift,mp->mnt_dev_bshift);
|
|
|
|
|
|
|
|
bitmask_snprintf(mp->mnt_flag, __MNT_FLAG_BITS, sbuf, sizeof(sbuf));
|
|
|
|
(*pr)("flag = %s\n", sbuf);
|
|
|
|
|
|
|
|
bitmask_snprintf(mp->mnt_iflag, __IMNT_FLAG_BITS, sbuf, sizeof(sbuf));
|
|
|
|
(*pr)("iflag = %s\n", sbuf);
|
|
|
|
|
|
|
|
/* XXX use lockmgr_printinfo */
|
|
|
|
if (mp->mnt_lock.lk_sharecount)
|
|
|
|
(*pr)(" lock type %s: SHARED (count %d)", mp->mnt_lock.lk_wmesg,
|
|
|
|
mp->mnt_lock.lk_sharecount);
|
|
|
|
else if (mp->mnt_lock.lk_flags & LK_HAVE_EXCL) {
|
|
|
|
(*pr)(" lock type %s: EXCL (count %d) by ",
|
|
|
|
mp->mnt_lock.lk_wmesg, mp->mnt_lock.lk_exclusivecount);
|
|
|
|
(*pr)("pid %d.%d", mp->mnt_lock.lk_lockholder,
|
|
|
|
mp->mnt_lock.lk_locklwp);
|
|
|
|
} else
|
|
|
|
(*pr)(" not locked");
|
|
|
|
if (mp->mnt_lock.lk_waitcount > 0)
|
|
|
|
(*pr)(" with %d pending", mp->mnt_lock.lk_waitcount);
|
|
|
|
|
|
|
|
(*pr)("\n");
|
|
|
|
|
|
|
|
if (mp->mnt_unmounter) {
|
|
|
|
(*pr)("unmounter pid = %d ",mp->mnt_unmounter->l_proc);
|
|
|
|
}
|
|
|
|
|
|
|
|
(*pr)("statvfs cache:\n");
|
|
|
|
(*pr)("\tbsize = %lu\n",mp->mnt_stat.f_bsize);
|
|
|
|
(*pr)("\tfrsize = %lu\n",mp->mnt_stat.f_frsize);
|
|
|
|
(*pr)("\tiosize = %lu\n",mp->mnt_stat.f_iosize);
|
|
|
|
|
|
|
|
(*pr)("\tblocks = %"PRIu64"\n",mp->mnt_stat.f_blocks);
|
|
|
|
(*pr)("\tbfree = %"PRIu64"\n",mp->mnt_stat.f_bfree);
|
|
|
|
(*pr)("\tbavail = %"PRIu64"\n",mp->mnt_stat.f_bavail);
|
|
|
|
(*pr)("\tbresvd = %"PRIu64"\n",mp->mnt_stat.f_bresvd);
|
|
|
|
|
|
|
|
(*pr)("\tfiles = %"PRIu64"\n",mp->mnt_stat.f_files);
|
|
|
|
(*pr)("\tffree = %"PRIu64"\n",mp->mnt_stat.f_ffree);
|
|
|
|
(*pr)("\tfavail = %"PRIu64"\n",mp->mnt_stat.f_favail);
|
|
|
|
(*pr)("\tfresvd = %"PRIu64"\n",mp->mnt_stat.f_fresvd);
|
|
|
|
|
|
|
|
(*pr)("\tf_fsidx = { 0x%"PRIx32", 0x%"PRIx32" }\n",
|
|
|
|
mp->mnt_stat.f_fsidx.__fsid_val[0],
|
|
|
|
mp->mnt_stat.f_fsidx.__fsid_val[1]);
|
|
|
|
|
|
|
|
(*pr)("\towner = %"PRIu32"\n",mp->mnt_stat.f_owner);
|
|
|
|
(*pr)("\tnamemax = %lu\n",mp->mnt_stat.f_namemax);
|
|
|
|
|
|
|
|
bitmask_snprintf(mp->mnt_stat.f_flag, __MNT_FLAG_BITS, sbuf,
|
|
|
|
sizeof(sbuf));
|
|
|
|
(*pr)("\tflag = %s\n",sbuf);
|
|
|
|
(*pr)("\tsyncwrites = %" PRIu64 "\n",mp->mnt_stat.f_syncwrites);
|
|
|
|
(*pr)("\tasyncwrites = %" PRIu64 "\n",mp->mnt_stat.f_asyncwrites);
|
|
|
|
(*pr)("\tsyncreads = %" PRIu64 "\n",mp->mnt_stat.f_syncreads);
|
|
|
|
(*pr)("\tasyncreads = %" PRIu64 "\n",mp->mnt_stat.f_asyncreads);
|
|
|
|
(*pr)("\tfstypename = %s\n",mp->mnt_stat.f_fstypename);
|
|
|
|
(*pr)("\tmntonname = %s\n",mp->mnt_stat.f_mntonname);
|
|
|
|
(*pr)("\tmntfromname = %s\n",mp->mnt_stat.f_mntfromname);
|
|
|
|
|
|
|
|
{
|
|
|
|
int cnt = 0;
|
|
|
|
struct vnode *vp;
|
|
|
|
(*pr)("locked vnodes =");
|
|
|
|
/* XXX would take mountlist lock, except ddb may not have context */
|
|
|
|
TAILQ_FOREACH(vp, &mp->mnt_vnodelist, v_mntvnodes) {
|
|
|
|
if (VOP_ISLOCKED(vp)) {
|
|
|
|
if ((++cnt % 6) == 0) {
|
|
|
|
(*pr)(" %p,\n\t", vp);
|
|
|
|
} else {
|
|
|
|
(*pr)(" %p,", vp);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
(*pr)("\n");
|
|
|
|
}
|
|
|
|
|
|
|
|
if (full) {
|
|
|
|
int cnt = 0;
|
|
|
|
struct vnode *vp;
|
|
|
|
(*pr)("all vnodes =");
|
|
|
|
/* XXX would take mountlist lock, except ddb may not have context */
|
|
|
|
TAILQ_FOREACH(vp, &mp->mnt_vnodelist, v_mntvnodes) {
|
|
|
|
if (!TAILQ_NEXT(vp, v_mntvnodes)) {
|
|
|
|
(*pr)(" %p", vp);
|
|
|
|
} else if ((++cnt % 6) == 0) {
|
|
|
|
(*pr)(" %p,\n\t", vp);
|
|
|
|
} else {
|
|
|
|
(*pr)(" %p,", vp);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
(*pr)("\n", vp);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
#endif /* DDB */
|