Generalize use of Vnode::covered_by/covers

* Introduce Vnode flags for covered and covering. Can be used as a quick
  check when one doesn't already hold sVnodeLock.
* Rename resolve_mount_point_to_volume_root() to
  resolve_vnode_to_covering_vnode().
* Adjust all code that deals with transitions between mount points and
  volume root vnodes to generally support covered/covering vnodes.
This commit is contained in:
Ingo Weinhold 2011-06-21 03:51:50 +02:00
parent 02be66ca10
commit 47ea54c55b
4 changed files with 219 additions and 125 deletions

View File

@ -143,7 +143,7 @@ status_t vfs_create_special_node(const char *path, fs_vnode *subVnode,
struct vnode **_createdVnode); struct vnode **_createdVnode);
/* service call for the node monitor */ /* service call for the node monitor */
status_t resolve_mount_point_to_volume_root(dev_t mountID, ino_t nodeID, status_t resolve_vnode_to_covering_vnode(dev_t mountID, ino_t nodeID,
dev_t *resolvedMountID, ino_t *resolvedNodeID); dev_t *resolvedMountID, ino_t *resolvedNodeID);
/* calls the syscall dispatcher should use for user file I/O */ /* calls the syscall dispatcher should use for user file I/O */

View File

@ -52,6 +52,14 @@ public:
inline bool IsHot() const; inline bool IsHot() const;
inline void SetHot(bool hot); inline void SetHot(bool hot);
// setter requires sVnodeLock write-locked, getter is lockless
inline bool IsCovered() const;
inline void SetCovered(bool covered);
// setter requires sVnodeLock write-locked, getter is lockless
inline bool IsCovering() const;
inline void SetCovering(bool covering);
inline uint32 Type() const; inline uint32 Type() const;
inline void SetType(uint32 type); inline void SetType(uint32 type);
@ -68,6 +76,8 @@ private:
static const uint32 kFlagsUnpublished = 0x00000010; static const uint32 kFlagsUnpublished = 0x00000010;
static const uint32 kFlagsUnused = 0x00000020; static const uint32 kFlagsUnused = 0x00000020;
static const uint32 kFlagsHot = 0x00000040; static const uint32 kFlagsHot = 0x00000040;
static const uint32 kFlagsCovered = 0x00000080;
static const uint32 kFlagsCovering = 0x00000100;
static const uint32 kFlagsType = 0xfffff000; static const uint32 kFlagsType = 0xfffff000;
static const uint32 kBucketCount = 32; static const uint32 kBucketCount = 32;
@ -185,6 +195,40 @@ vnode::SetHot(bool hot)
} }
bool
vnode::IsCovered() const
{
return (fFlags & kFlagsCovered) != 0;
}
void
vnode::SetCovered(bool covered)
{
if (covered)
atomic_or(&fFlags, kFlagsCovered);
else
atomic_and(&fFlags, ~kFlagsCovered);
}
bool
vnode::IsCovering() const
{
return (fFlags & kFlagsCovering) != 0;
}
void
vnode::SetCovering(bool covering)
{
if (covering)
atomic_or(&fFlags, kFlagsCovering);
else
atomic_and(&fFlags, ~kFlagsCovering);
}
uint32 uint32
vnode::Type() const vnode::Type() const
{ {

View File

@ -687,7 +687,7 @@ NodeMonitorService::NotifyEntryMoved(dev_t device, ino_t fromDirectory,
// If node is a mount point, we need to resolve it to the mounted // If node is a mount point, we need to resolve it to the mounted
// volume's root node. // volume's root node.
dev_t nodeDevice = device; dev_t nodeDevice = device;
resolve_mount_point_to_volume_root(device, node, &nodeDevice, &node); resolve_vnode_to_covering_vnode(device, node, &nodeDevice, &node);
RecursiveLocker locker(fRecursiveLock); RecursiveLocker locker(fRecursiveLock);

View File

@ -219,7 +219,6 @@ static mutex sMountMutex = MUTEX_INITIALIZER("vfs_mount_lock");
- sMountsTable will not be modified, - sMountsTable will not be modified,
- the fields immutable after initialization of the fs_mount structures in - the fields immutable after initialization of the fs_mount structures in
sMountsTable will not be modified, sMountsTable will not be modified,
- vnode::covered_by of any vnode in sVnodeTable will not be modified.
The thread trying to lock the lock must not hold sVnodeLock or The thread trying to lock the lock must not hold sVnodeLock or
sMountMutex. sMountMutex.
@ -234,7 +233,8 @@ static recursive_lock sMountOpLock;
The mutable fields advisory_locking, mandatory_locked_by, and ref_count, as The mutable fields advisory_locking, mandatory_locked_by, and ref_count, as
well as the busy, removed, unused flags, and the vnode's type can also be well as the busy, removed, unused flags, and the vnode's type can also be
write accessed when holding a read lock to sVnodeLock *and* having the vnode write accessed when holding a read lock to sVnodeLock *and* having the vnode
locked. Write access to covered_by requires to write lock sVnodeLock. locked. Write access to covered_by and covers requires to write lock
sVnodeLock.
The thread trying to acquire the lock must not hold sMountMutex. The thread trying to acquire the lock must not hold sMountMutex.
You must not hold this lock when calling create_sem(), as this might call You must not hold this lock when calling create_sem(), as this might call
@ -1320,6 +1320,104 @@ free_unused_vnodes(int32 level)
} }
/*! Gets the vnode the given vnode is covering.
The caller must have \c sVnodeLock read-locked at least.
The function returns a reference to the retrieved vnode (if any), the caller
is responsible to free.
\param vnode The vnode whose covered node shall be returned.
\return The covered vnode, or \c NULL if the given vnode doesn't cover any
vnode.
*/
static inline Vnode*
get_covered_vnode_locked(Vnode* vnode)
{
if (Vnode* coveredNode = vnode->covers) {
while (coveredNode->covers != NULL)
coveredNode = coveredNode->covers;
inc_vnode_ref_count(coveredNode);
return coveredNode;
}
return NULL;
}
/*! Gets the vnode the given vnode is covering.
The caller must not hold \c sVnodeLock. Note that this implies a race
condition, since the situation can change at any time.
The function returns a reference to the retrieved vnode (if any), the caller
is responsible to free.
\param vnode The vnode whose covered node shall be returned.
\return The covered vnode, or \c NULL if the given vnode doesn't cover any
vnode.
*/
static inline Vnode*
get_covered_vnode(Vnode* vnode)
{
if (!vnode->IsCovering())
return NULL;
ReadLocker vnodeReadLocker(sVnodeLock);
return get_covered_vnode_locked(vnode);
}
/*! Gets the vnode the given vnode is covered by.
The caller must have \c sVnodeLock read-locked at least.
The function returns a reference to the retrieved vnode (if any), the caller
is responsible to free.
\param vnode The vnode whose covering node shall be returned.
\return The covering vnode, or \c NULL if the given vnode isn't covered by
any vnode.
*/
static Vnode*
get_covering_vnode_locked(Vnode* vnode)
{
if (Vnode* coveringNode = vnode->covered_by) {
while (coveringNode->covered_by != NULL)
coveringNode = coveringNode->covered_by;
inc_vnode_ref_count(coveringNode);
return coveringNode;
}
return NULL;
}
/*! Gets the vnode the given vnode is covered by.
The caller must not hold \c sVnodeLock. Note that this implies a race
condition, since the situation can change at any time.
The function returns a reference to the retrieved vnode (if any), the caller
is responsible to free.
\param vnode The vnode whose covering node shall be returned.
\return The covering vnode, or \c NULL if the given vnode isn't covered by
any vnode.
*/
static inline Vnode*
get_covering_vnode(Vnode* vnode)
{
if (!vnode->IsCovered())
return NULL;
ReadLocker vnodeReadLocker(sVnodeLock);
return get_covering_vnode_locked(vnode);
}
static void static void
free_unused_vnodes() free_unused_vnodes()
{ {
@ -1725,30 +1823,36 @@ replace_vnode_if_disconnected(struct fs_mount* mount,
struct vnode* vnodeToDisconnect, struct vnode*& vnode, struct vnode* vnodeToDisconnect, struct vnode*& vnode,
struct vnode* fallBack, bool lockRootLock) struct vnode* fallBack, bool lockRootLock)
{ {
struct vnode* givenVnode = vnode;
bool vnodeReplaced = false;
ReadLocker vnodeReadLocker(sVnodeLock);
if (lockRootLock) if (lockRootLock)
mutex_lock(&sIOContextRootLock); mutex_lock(&sIOContextRootLock);
struct vnode* obsoleteVnode = NULL; while (vnode != NULL && vnode->mount == mount
if (vnode != NULL && vnode->mount == mount
&& (vnodeToDisconnect == NULL || vnodeToDisconnect == vnode)) { && (vnodeToDisconnect == NULL || vnodeToDisconnect == vnode)) {
obsoleteVnode = vnode; if (vnode->covers != NULL) {
if (vnode == mount->root_vnode) {
// redirect the vnode to the covered vnode // redirect the vnode to the covered vnode
vnode = mount->root_vnode->covers; vnode = vnode->covers;
} else } else
vnode = fallBack; vnode = fallBack;
if (vnode != NULL) vnodeReplaced = true;
inc_vnode_ref_count(vnode);
} }
// If we've replaced the node, grab a reference for the new one.
if (vnodeReplaced && vnode != NULL)
inc_vnode_ref_count(vnode);
if (lockRootLock) if (lockRootLock)
mutex_unlock(&sIOContextRootLock); mutex_unlock(&sIOContextRootLock);
if (obsoleteVnode != NULL) vnodeReadLocker.Unlock();
put_vnode(obsoleteVnode);
if (vnodeReplaced)
put_vnode(givenVnode);
} }
@ -1834,44 +1938,11 @@ get_root_vnode(bool kernel)
} }
/*! \brief Resolves a mount point vnode to the volume root vnode it is covered /*! \brief Resolves a vnode to the vnode it is covered by, if any.
by.
Given an arbitrary vnode, the function checks, whether the node is covered
by the root of a volume. If it is the function obtains a reference to the
volume root node and returns it.
\param vnode The vnode in question.
\return The volume root vnode the vnode cover is covered by, if it is
indeed a mount point, or \c NULL otherwise.
*/
static struct vnode*
resolve_mount_point_to_volume_root(struct vnode* vnode)
{
if (!vnode)
return NULL;
struct vnode* volumeRoot = NULL;
rw_lock_read_lock(&sVnodeLock);
if (vnode->covered_by) {
volumeRoot = vnode->covered_by;
inc_vnode_ref_count(volumeRoot);
}
rw_lock_read_unlock(&sVnodeLock);
return volumeRoot;
}
/*! \brief Resolves a mount point vnode to the volume root vnode it is covered
by.
Given an arbitrary vnode (identified by mount and node ID), the function Given an arbitrary vnode (identified by mount and node ID), the function
checks, whether the node is covered by the root of a volume. If it is the checks, whether the vnode is covered by another vnode. If it is, the
function returns the mount and node ID of the volume root node. Otherwise function returns the mount and node ID of the covering vnode. Otherwise
it simply returns the supplied mount and node ID. it simply returns the supplied mount and node ID.
In case of error (e.g. the supplied node could not be found) the variables In case of error (e.g. the supplied node could not be found) the variables
@ -1887,7 +1958,7 @@ resolve_mount_point_to_volume_root(struct vnode* vnode)
- another error code, if something went wrong. - another error code, if something went wrong.
*/ */
status_t status_t
resolve_mount_point_to_volume_root(dev_t mountID, ino_t nodeID, resolve_vnode_to_covering_vnode(dev_t mountID, ino_t nodeID,
dev_t* resolvedMountID, ino_t* resolvedNodeID) dev_t* resolvedMountID, ino_t* resolvedNodeID)
{ {
// get the node // get the node
@ -1897,10 +1968,9 @@ resolve_mount_point_to_volume_root(dev_t mountID, ino_t nodeID,
return error; return error;
// resolve the node // resolve the node
struct vnode* resolvedNode = resolve_mount_point_to_volume_root(node); if (Vnode* coveringNode = get_covering_vnode(node)) {
if (resolvedNode) {
put_vnode(node); put_vnode(node);
node = resolvedNode; node = coveringNode;
} }
// set the return values // set the return values
@ -1913,34 +1983,6 @@ resolve_mount_point_to_volume_root(dev_t mountID, ino_t nodeID,
} }
/*! \brief Resolves a volume root vnode to the underlying mount point vnode.
Given an arbitrary vnode, the function checks, whether the node is the
root of a volume. If it is (and if it is not "/"), the function obtains
a reference to the underlying mount point node and returns it.
\param vnode The vnode in question (caller must have a reference).
\return The mount point vnode the vnode covers, if it is indeed a volume
root and not "/", or \c NULL otherwise.
*/
static struct vnode*
resolve_volume_root_to_mount_point(struct vnode* vnode)
{
if (!vnode)
return NULL;
struct vnode* mountPoint = NULL;
struct fs_mount* mount = vnode->mount;
if (vnode == mount->root_vnode && mount->root_vnode->covers != NULL) {
mountPoint = mount->root_vnode->covers;
inc_vnode_ref_count(mountPoint);
}
return mountPoint;
}
/*! \brief Gets the directory path and leaf name for a given path. /*! \brief Gets the directory path and leaf name for a given path.
The supplied \a path is transformed to refer to the directory part of The supplied \a path is transformed to refer to the directory part of
@ -2109,7 +2151,7 @@ vnode_path_to_vnode(struct vnode* vnode, char* path, bool traverseLeafLink,
while (*nextPath == '/'); while (*nextPath == '/');
} }
// See if the '..' is at the root of a mount and move to the covered // See if the '..' is at a covering vnode move to the covered
// vnode so we pass the '..' path to the underlying filesystem. // vnode so we pass the '..' path to the underlying filesystem.
// Also prevent breaking the root of the IO context. // Also prevent breaking the root of the IO context.
if (strcmp("..", path) == 0) { if (strcmp("..", path) == 0) {
@ -2117,10 +2159,10 @@ vnode_path_to_vnode(struct vnode* vnode, char* path, bool traverseLeafLink,
// Attempted prison break! Keep it contained. // Attempted prison break! Keep it contained.
path = nextPath; path = nextPath;
continue; continue;
} else if (vnode->mount->root_vnode == vnode }
&& vnode->mount->root_vnode->covers != NULL) {
nextVnode = vnode->mount->root_vnode->covers; if (Vnode* coveredVnode = get_covered_vnode(vnode)) {
inc_vnode_ref_count(nextVnode); nextVnode = coveredVnode;
put_vnode(vnode); put_vnode(vnode);
vnode = nextVnode; vnode = nextVnode;
} }
@ -2235,11 +2277,10 @@ vnode_path_to_vnode(struct vnode* vnode, char* path, bool traverseLeafLink,
path = nextPath; path = nextPath;
vnode = nextVnode; vnode = nextVnode;
// see if we hit a mount point // see if we hit a covered node
struct vnode* mountPoint = resolve_mount_point_to_volume_root(vnode); if (Vnode* coveringNode = get_covering_vnode(vnode)) {
if (mountPoint) {
put_vnode(vnode); put_vnode(vnode);
vnode = mountPoint; vnode = coveringNode;
} }
} }
@ -2422,13 +2463,11 @@ get_vnode_name(struct vnode* vnode, struct vnode* parent, struct dirent* buffer,
if (bufferSize < sizeof(struct dirent)) if (bufferSize < sizeof(struct dirent))
return B_BAD_VALUE; return B_BAD_VALUE;
// See if vnode is the root of a mount and move to the covered // See if the vnode is convering another vnode and move to the covered
// vnode so we get the underlying file system // vnode so we get the underlying file system
VNodePutter vnodePutter; VNodePutter vnodePutter;
if (vnode->mount->root_vnode == vnode if (Vnode* coveredVnode = get_covered_vnode(vnode)) {
&& vnode->mount->root_vnode->covers != NULL) { vnode = coveredVnode;
vnode = vnode->mount->root_vnode->covers;
inc_vnode_ref_count(vnode);
vnodePutter.SetTo(vnode); vnodePutter.SetTo(vnode);
} }
@ -2532,11 +2571,10 @@ dir_vnode_to_path(struct vnode* vnode, char* buffer, size_t bufferSize,
if (vnode != ioContext->root) { if (vnode != ioContext->root) {
// we don't hit the IO context root // we don't hit the IO context root
// resolve a volume root to its mount point // resolve a vnode to its covered vnode
struct vnode* mountPoint = resolve_volume_root_to_mount_point(vnode); if (Vnode* coveredVnode = get_covered_vnode(vnode)) {
if (mountPoint) {
put_vnode(vnode); put_vnode(vnode);
vnode = mountPoint; vnode = coveredVnode;
} }
} }
@ -2567,12 +2605,10 @@ dir_vnode_to_path(struct vnode* vnode, char* buffer, size_t bufferSize,
if (vnode != ioContext->root) { if (vnode != ioContext->root) {
// we don't hit the IO context root // we don't hit the IO context root
// resolve a volume root to its mount point // resolve a vnode to its covered vnode
struct vnode* mountPoint if (Vnode* coveredVnode = get_covered_vnode(parentVnode)) {
= resolve_volume_root_to_mount_point(parentVnode);
if (mountPoint) {
put_vnode(parentVnode); put_vnode(parentVnode);
parentVnode = mountPoint; parentVnode = coveredVnode;
parentID = parentVnode->id; parentID = parentVnode->id;
} }
} }
@ -3016,10 +3052,8 @@ debug_resolve_vnode_path(struct vnode* vnode, char* buffer, size_t bufferSize,
buffer[--bufferSize] = '\0'; buffer[--bufferSize] = '\0';
while (true) { while (true) {
while (vnode->mount->root_vnode == vnode while (vnode->covers != NULL)
&& vnode->mount->root_vnode->covers != NULL) { vnode = vnode->covers;
vnode = vnode->mount->root_vnode->covers;
}
if (vnode == sRoot) { if (vnode == sRoot) {
_truncated = bufferSize == 0; _truncated = bufferSize == 0;
@ -3068,6 +3102,7 @@ _dump_vnode(struct vnode* vnode, bool printPath)
kprintf(" private_node: %p\n", vnode->private_node); kprintf(" private_node: %p\n", vnode->private_node);
kprintf(" mount: %p\n", vnode->mount); kprintf(" mount: %p\n", vnode->mount);
kprintf(" covered_by: %p\n", vnode->covered_by); kprintf(" covered_by: %p\n", vnode->covered_by);
kprintf(" covers: %p\n", vnode->covers);
kprintf(" cache: %p\n", vnode->cache); kprintf(" cache: %p\n", vnode->cache);
kprintf(" type: %#" B_PRIx32 "\n", vnode->Type()); kprintf(" type: %#" B_PRIx32 "\n", vnode->Type());
kprintf(" flags: %s%s%s\n", vnode->IsRemoved() ? "r" : "-", kprintf(" flags: %s%s%s\n", vnode->IsRemoved() ? "r" : "-",
@ -3099,6 +3134,7 @@ _dump_vnode(struct vnode* vnode, bool printPath)
set_debug_variable("_node", (addr_t)vnode->private_node); set_debug_variable("_node", (addr_t)vnode->private_node);
set_debug_variable("_mount", (addr_t)vnode->mount); set_debug_variable("_mount", (addr_t)vnode->mount);
set_debug_variable("_covered_by", (addr_t)vnode->covered_by); set_debug_variable("_covered_by", (addr_t)vnode->covered_by);
set_debug_variable("_covers", (addr_t)vnode->covers);
set_debug_variable("_adv_lock", (addr_t)vnode->advisory_locking); set_debug_variable("_adv_lock", (addr_t)vnode->advisory_locking);
} }
@ -5670,11 +5706,9 @@ fix_dirent(struct vnode* parent, struct dirent* entry,
entry->d_pdev = parent->device; entry->d_pdev = parent->device;
entry->d_pino = parent->id; entry->d_pino = parent->id;
// If this is the ".." entry and the directory is the root of a FS, // If this is the ".." entry and the directory covering another vnode,
// we need to replace d_dev and d_ino with the actual values. // we need to replace d_dev and d_ino with the actual values.
if (strcmp(entry->d_name, "..") == 0 if (strcmp(entry->d_name, "..") == 0 && parent->IsCovering()) {
&& parent->mount->root_vnode == parent
&& parent->mount->root_vnode->covers != NULL) {
inc_vnode_ref_count(parent); inc_vnode_ref_count(parent);
// vnode_path_to_vnode() puts the node // vnode_path_to_vnode() puts the node
@ -5694,15 +5728,17 @@ fix_dirent(struct vnode* parent, struct dirent* entry,
} }
} }
} else { } else {
// resolve mount points // resolve covered vnodes
ReadLocker _(&sVnodeLock); ReadLocker _(&sVnodeLock);
struct vnode* vnode = lookup_vnode(entry->d_dev, entry->d_ino); struct vnode* vnode = lookup_vnode(entry->d_dev, entry->d_ino);
if (vnode != NULL) { if (vnode != NULL && vnode->covered_by != NULL) {
if (vnode->covered_by != NULL) { do {
entry->d_dev = vnode->covered_by->device; vnode = vnode->covered_by;
entry->d_ino = vnode->covered_by->id; } while (vnode->covered_by != NULL);
}
entry->d_dev = vnode->device;
entry->d_ino = vnode->id;
} }
} }
@ -7194,8 +7230,8 @@ fs_mount(char* path, const char* device, const char* fsName, uint32 flags,
goto err3; goto err3;
} }
if (coveredNode->mount->root_vnode == coveredNode) { if (coveredNode->IsCovered()) {
// this is already a mount point // this is already a covered vnode
status = B_BUSY; status = B_BUSY;
goto err3; goto err3;
} }
@ -7231,12 +7267,21 @@ fs_mount(char* path, const char* device, const char* fsName, uint32 flags,
goto err4; goto err4;
} }
// No race here, since fs_mount() is the only function changing // set up the links between the root vnode and the vnode it covers
// root_vnode->covers (and holds sMountOpLock at that time).
rw_lock_write_lock(&sVnodeLock); rw_lock_write_lock(&sVnodeLock);
if (coveredNode != NULL) { if (coveredNode != NULL) {
if (coveredNode->IsCovered()) {
// the vnode is covered now
status = B_BUSY;
rw_lock_write_unlock(&sVnodeLock);
goto err4;
}
mount->root_vnode->covers = coveredNode; mount->root_vnode->covers = coveredNode;
mount->root_vnode->SetCovering(true);
coveredNode->covered_by = mount->root_vnode; coveredNode->covered_by = mount->root_vnode;
coveredNode->SetCovered(true);
} }
rw_lock_write_unlock(&sVnodeLock); rw_lock_write_unlock(&sVnodeLock);
@ -7415,7 +7460,12 @@ fs_unmount(char* path, dev_t mountID, uint32 flags, bool kernel)
vnode_to_be_freed(mount->root_vnode); vnode_to_be_freed(mount->root_vnode);
Vnode* coveredNode = mount->root_vnode->covers; Vnode* coveredNode = mount->root_vnode->covers;
coveredNode->covered_by = NULL; coveredNode->covered_by = mount->root_vnode->covered_by;
coveredNode->SetCovered(coveredNode->covered_by != NULL);
mount->root_vnode->covered_by = NULL;
mount->root_vnode->SetCovered(false);
mount->root_vnode->SetCovering(false);
vnodesWriteLocker.Unlock(); vnodesWriteLocker.Unlock();