NetBSD/sys/nfs/nfs_nqlease.c

1289 lines
32 KiB
C

/* $NetBSD: nfs_nqlease.c,v 1.74 2006/11/09 09:53:57 yamt Exp $ */
/*
* Copyright (c) 1992, 1993
* The Regents of the University of California. All rights reserved.
*
* This code is derived from software contributed to Berkeley by
* Rick Macklem at The University of Guelph.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 3. Neither the name of the University nor the names of its contributors
* may be used to endorse or promote products derived from this software
* without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*
* @(#)nfs_nqlease.c 8.9 (Berkeley) 5/20/95
*/
/*
* References:
* Cary G. Gray and David R. Cheriton, "Leases: An Efficient Fault-Tolerant
* Mechanism for Distributed File Cache Consistency",
* In Proc. of the Twelfth ACM Symposium on Operating Systems
* Principals, pg. 202-210, Litchfield Park, AZ, Dec. 1989.
* Michael N. Nelson, Brent B. Welch and John K. Ousterhout, "Caching
* in the Sprite Network File System", ACM TOCS 6(1),
* pages 134-154, February 1988.
* V. Srinivasan and Jeffrey C. Mogul, "Spritely NFS: Implementation and
* Performance of Cache-Consistency Protocols", Digital
* Equipment Corporation WRL Research Report 89/5, May 1989.
*/
#include <sys/cdefs.h>
__KERNEL_RCSID(0, "$NetBSD: nfs_nqlease.c,v 1.74 2006/11/09 09:53:57 yamt Exp $");
#include "fs_nfs.h"
#include "opt_nfs.h"
#include "opt_nfsserver.h"
#include "opt_inet.h"
#include <sys/param.h>
#include <sys/vnode.h>
#include <sys/mount.h>
#include <sys/kernel.h>
#include <sys/namei.h>
#include <sys/proc.h>
#include <sys/systm.h>
#include <sys/mbuf.h>
#include <sys/socket.h>
#include <sys/socketvar.h>
#include <sys/file.h>
#include <sys/buf.h>
#include <sys/stat.h>
#include <sys/protosw.h>
#include <sys/signalvar.h>
#include <sys/kauth.h>
#include <miscfs/syncfs/syncfs.h>
#include <netinet/in.h>
#include <nfs/rpcv2.h>
#include <nfs/nfsproto.h>
#include <nfs/nfs.h>
#include <nfs/nfsm_subs.h>
#include <nfs/xdr_subs.h>
#include <nfs/nqnfs.h>
#include <nfs/nfsnode.h>
#include <nfs/nfsmount.h>
#include <nfs/nfs_var.h>
time_t nqnfsstarttime = (time_t)0;
int nqsrv_clockskew = NQ_CLOCKSKEW;
int nqsrv_writeslack = NQ_WRITESLACK;
int nqsrv_maxlease = NQ_MAXLEASE;
int nqsrv_maxnumlease = NQ_MAXNUMLEASE;
struct nqleasehead nqtimerhead;
struct nqfhhashhead *nqfhhashtbl;
u_long nqfhhash;
MALLOC_DEFINE(M_NQLEASE, "NQNFS Lease", "Nqnfs lease");
MALLOC_DEFINE(M_NQMHOST, "NQNFS Host", "Nqnfs host address table");
/*
* Signifies which rpcs can have piggybacked lease requests
*/
const int nqnfs_piggy[NFS_NPROCS] = {
0,
0,
ND_WRITE,
ND_READ,
0,
ND_READ,
ND_READ,
ND_WRITE,
0,
0,
0,
0,
0,
0,
0,
0,
ND_READ,
ND_READ,
0,
0,
0,
0,
0,
0,
0,
0,
};
extern const nfstype nfsv2_type[9];
extern const nfstype nfsv3_type[9];
extern struct nfssvc_sock *nfs_udpsock;
#ifdef ISO
extern struct nfssvc_sock *nfs_cltpsock
#endif
#ifdef INET6
extern struct nfssvc_sock *nfs_udp6sock;
#endif
extern int nfsd_waiting;
extern struct nfsstats nfsstats;
#if defined(NFSSERVER)
/*
* Get or check for a lease for "vp", based on ND_CHECK flag.
* The rules are as follows:
* - if a current non-caching lease, reply non-caching
* - if a current lease for same host only, extend lease
* - if a read cachable lease and a read lease request
* add host to list any reply cachable
* - else { set non-cachable for read-write sharing }
* send eviction notice messages to all other hosts that have lease
* wait for lease termination { either by receiving vacated messages
* from all the other hosts or expiry
* via. timeout }
* modify lease to non-cachable
* - else if no current lease, issue new one
* - reply
* - return boolean TRUE iff nam should be m_freem()'d
* NB: Since nqnfs_serverd() is called from a timer, any potential tsleep()
* in here must be framed by nqsrv_locklease() and nqsrv_unlocklease().
* nqsrv_locklease() is coded such that at least one of LC_LOCKED and
* LC_WANTED is set whenever a process is tsleeping in it. The exception
* is when a new lease is being allocated, since it is not in the timer
* queue yet. (Ditto for the splsoftnet() and splx(s) calls)
*/
int
nqsrv_getlease(vp, duration, flags, slp, lwp, nam, cachablep, frev, cred)
struct vnode *vp;
u_int32_t *duration;
int flags;
struct nfssvc_sock *slp;
struct lwp *lwp;
struct mbuf *nam;
int *cachablep;
u_quad_t *frev;
kauth_cred_t cred;
{
struct nqlease *lp;
struct nqfhhashhead *lpp = NULL;
struct nqhost *lph = NULL;
struct nqlease *tlp;
struct nqm **lphp;
struct vattr vattr;
nfsrvfh_t nsfh;
int i, ok, error, s;
if (vp->v_type != VREG && vp->v_type != VDIR && vp->v_type != VLNK)
return (0);
nfs_init();
if (*duration > nqsrv_maxlease)
*duration = nqsrv_maxlease;
error = VOP_GETATTR(vp, &vattr, cred, lwp);
if (error)
return (error);
*frev = vattr.va_filerev;
s = splsoftnet();
tlp = vp->v_lease;
if ((flags & ND_CHECK) == 0)
nfsstats.srvnqnfs_getleases++;
if (tlp == 0) {
/*
* Find the lease by searching the hash list.
*/
error = nfsrv_composefh(vp, &nsfh, TRUE);
if (error) {
splx(s);
return (error);
}
lpp = NQFHHASH(NFSRVFH_FHANDLE(&nsfh)->fh_fid.fid_data);
LIST_FOREACH (lp, lpp, lc_hash) {
if (!nfsrv_comparefh(&lp->lc_fh, &nsfh)) {
/* Found it */
lp->lc_vp = vp;
vp->v_lease = lp;
tlp = lp;
break;
}
}
} else
lp = tlp;
if (lp != 0) {
if ((lp->lc_flag & LC_NONCACHABLE) ||
(lp->lc_morehosts == (struct nqm *)0 &&
nqsrv_cmpnam(slp, nam, &lp->lc_host)))
goto doreply;
if ((flags & ND_READ) && (lp->lc_flag & LC_WRITE) == 0) {
if (flags & ND_CHECK)
goto doreply;
if (nqsrv_cmpnam(slp, nam, &lp->lc_host))
goto doreply;
i = 0;
if (lp->lc_morehosts) {
lph = lp->lc_morehosts->lpm_hosts;
lphp = &lp->lc_morehosts->lpm_next;
ok = 1;
} else {
lphp = &lp->lc_morehosts;
ok = 0;
}
while (ok && (lph->lph_flag & LC_VALID)) {
if (nqsrv_cmpnam(slp, nam, lph))
goto doreply;
if (++i == LC_MOREHOSTSIZ) {
i = 0;
if (*lphp) {
lph = (*lphp)->lpm_hosts;
lphp = &((*lphp)->lpm_next);
} else
ok = 0;
} else
lph++;
}
nqsrv_locklease(lp);
if (!ok) {
*lphp = (struct nqm *)
malloc(sizeof (struct nqm),
M_NQMHOST, M_WAITOK);
memset((caddr_t)*lphp, 0, sizeof (struct nqm));
lph = (*lphp)->lpm_hosts;
}
nqsrv_addhost(lph, slp, nam);
nqsrv_unlocklease(lp);
} else {
lp->lc_flag |= LC_NONCACHABLE;
nqsrv_locklease(lp);
nqsrv_send_eviction(vp, lp, slp, nam, cred, lwp);
nqsrv_waitfor_expiry(lp);
nqsrv_unlocklease(lp);
}
doreply:
/*
* Update the lease and return
*/
if ((flags & ND_CHECK) == 0)
nqsrv_instimeq(lp, *duration);
if (lp->lc_flag & LC_NONCACHABLE)
*cachablep = 0;
else {
*cachablep = 1;
if (flags & ND_WRITE)
lp->lc_flag |= LC_WRITTEN;
}
splx(s);
return (0);
}
splx(s);
if (flags & ND_CHECK) {
return (0);
}
/*
* Allocate new lease
* The value of nqsrv_maxnumlease should be set generously, so that
* the following "printf" happens infrequently.
*/
if (nfsstats.srvnqnfs_leases > nqsrv_maxnumlease) {
printf("Nqnfs server, too many leases\n");
do {
(void) tsleep((caddr_t)&lbolt, PSOCK,
"nqsrvnuml", 0);
} while (nfsstats.srvnqnfs_leases > nqsrv_maxnumlease);
}
MALLOC(lp, struct nqlease *, sizeof (struct nqlease), M_NQLEASE, M_WAITOK);
memset((caddr_t)lp, 0, sizeof (struct nqlease));
if (flags & ND_WRITE)
lp->lc_flag |= (LC_WRITE | LC_WRITTEN);
nqsrv_addhost(&lp->lc_host, slp, nam);
lp->lc_vp = vp;
nfsrv_copyfh(&lp->lc_fh, &nsfh);
if(!lpp)
panic("nfs_nqlease.c: Phoney lpp");
LIST_INSERT_HEAD(lpp, lp, lc_hash);
vp->v_lease = lp;
s = splsoftnet();
nqsrv_instimeq(lp, *duration);
splx(s);
*cachablep = 1;
if (++nfsstats.srvnqnfs_leases > nfsstats.srvnqnfs_maxleases)
nfsstats.srvnqnfs_maxleases = nfsstats.srvnqnfs_leases;
return (0);
}
/*
* Add a host to an nqhost structure for a lease.
*/
void
nqsrv_addhost(lph, slp, nam)
struct nqhost *lph;
struct nfssvc_sock *slp;
struct mbuf *nam;
{
struct sockaddr_in *saddr;
if (slp == NQLOCALSLP)
lph->lph_flag |= (LC_VALID | LC_LOCAL);
else if (slp == nfs_udpsock) {
saddr = mtod(nam, struct sockaddr_in *);
lph->lph_flag |= (LC_VALID | LC_UDP);
lph->lph_inetaddr = saddr->sin_addr.s_addr;
lph->lph_port = saddr->sin_port;
#ifdef INET6
} else if (slp == nfs_udp6sock) {
lph->lph_nam = m_copym(nam, 0, M_COPYALL, M_WAIT);
lph->lph_flag |= (LC_VALID | LC_UDP6);
#endif
#ifdef ISO
} else if (slp == nfs_cltpsock) {
lph->lph_nam = m_copym(nam, 0, M_COPYALL, M_WAIT);
lph->lph_flag |= (LC_VALID | LC_CLTP);
#endif
} else {
lph->lph_flag |= (LC_VALID | LC_SREF);
lph->lph_slp = slp;
slp->ns_sref++;
}
}
/*
* Update the lease expiry time and position it in the timer queue correctly.
*/
void
nqsrv_instimeq(lp, duration)
struct nqlease *lp;
u_int32_t duration;
{
struct nqlease *tlp;
time_t newexpiry;
newexpiry = time_second + duration + nqsrv_clockskew;
if (lp->lc_expiry == newexpiry)
return;
if (CIRCLEQ_NEXT(lp, lc_timer) != 0)
CIRCLEQ_REMOVE(&nqtimerhead, lp, lc_timer);
lp->lc_expiry = newexpiry;
/*
* Find where in the queue it should be.
*/
tlp = CIRCLEQ_LAST(&nqtimerhead);
while (tlp != (void *)&nqtimerhead && tlp->lc_expiry > newexpiry)
tlp = CIRCLEQ_PREV(tlp, lc_timer);
#ifdef HASNVRAM
if (tlp == CIRCLEQ_LAST(&nqtimerhead))
NQSTORENOVRAM(newexpiry);
#endif /* HASNVRAM */
if (tlp == (void *)&nqtimerhead) {
CIRCLEQ_INSERT_HEAD(&nqtimerhead, lp, lc_timer);
} else {
CIRCLEQ_INSERT_AFTER(&nqtimerhead, tlp, lp, lc_timer);
}
}
/*
* Compare the requesting host address with the lph entry in the lease.
* Return true iff it is the same.
* This is somewhat messy due to the union in the nqhost structure.
* The local host is indicated by the special value of NQLOCALSLP for slp.
*/
int
nqsrv_cmpnam(slp, nam, lph)
struct nfssvc_sock *slp;
struct mbuf *nam;
struct nqhost *lph;
{
struct sockaddr_in *saddr;
struct mbuf *addr;
union nethostaddr lhaddr;
int ret;
if (slp == NQLOCALSLP) {
if (lph->lph_flag & LC_LOCAL)
return (1);
else
return (0);
}
if (slp == nfs_udpsock
#ifdef ISO
|| slp == nfs_cltpsock
#endif
#ifdef INET6
|| slp == nfs_udp6sock
#endif
)
addr = nam;
else
addr = slp->ns_nam;
if (lph->lph_flag & LC_UDP)
ret = netaddr_match(AF_INET, &lph->lph_haddr, addr);
else if (lph->lph_flag & LC_CLTP)
ret = netaddr_match(AF_ISO, &lph->lph_claddr, addr);
else {
if ((lph->lph_slp->ns_flag & SLP_VALID) == 0)
return (0);
saddr = mtod(lph->lph_slp->ns_nam, struct sockaddr_in *);
if (saddr->sin_family == AF_INET)
lhaddr.had_inetaddr = saddr->sin_addr.s_addr;
else
lhaddr.had_nam = lph->lph_slp->ns_nam;
ret = netaddr_match(saddr->sin_family, &lhaddr, addr);
}
return (ret);
}
/*
* Send out eviction notice messages to all other hosts for the lease.
*/
void
nqsrv_send_eviction(vp, lp, slp, nam, cred, l)
struct vnode *vp;
struct nqlease *lp;
struct nfssvc_sock *slp;
struct mbuf *nam;
kauth_cred_t cred;
struct lwp *l;
{
struct nqhost *lph = &lp->lc_host;
struct mbuf *m;
int siz;
struct nqm *lphnext = lp->lc_morehosts;
struct mbuf *mreq, *mb, *nam2, *mheadend;
struct socket *so;
struct sockaddr_in *saddr;
nfsrvfh_t nsfh;
caddr_t bpos, cp;
u_int32_t xid, *tl;
int len = 1, ok = 1, i = 0;
int sotype, *solockp;
while (ok && (lph->lph_flag & LC_VALID)) {
if (nqsrv_cmpnam(slp, nam, lph))
lph->lph_flag |= LC_VACATED;
else if ((lph->lph_flag & (LC_LOCAL | LC_VACATED)) == 0) {
int error;
if (lph->lph_flag & LC_UDP) {
nam2 = m_get(M_WAIT, MT_SONAME);
MCLAIM(nam2, &nfs_mowner);
saddr = mtod(nam2, struct sockaddr_in *);
nam2->m_len = saddr->sin_len =
sizeof (struct sockaddr_in);
saddr->sin_family = AF_INET;
saddr->sin_addr.s_addr = lph->lph_inetaddr;
saddr->sin_port = lph->lph_port;
so = nfs_udpsock->ns_so;
#ifdef ISO
} else if (lph->lph_flag & LC_CLTP) {
nam2 = lph->lph_nam;
so = nfs_cltpsock->ns_so;
#endif
#ifdef INET6
} else if (lph->lph_flag & LC_UDP6) {
nam2 = lph->lph_nam;
so = nfs_udp6sock->ns_so;
#endif
} else if (lph->lph_slp->ns_flag & SLP_VALID) {
nam2 = (struct mbuf *)0;
so = lph->lph_slp->ns_so;
} else
goto nextone;
if (!so)
goto nextone;
sotype = so->so_type;
if (so->so_proto->pr_flags & PR_CONNREQUIRED)
solockp = &lph->lph_slp->ns_solock;
else
solockp = (int *)0;
nfsm_reqhead((struct nfsnode *)0, NQNFSPROC_EVICTED,
NFSX_V3FH + NFSX_UNSIGNED);
error = nfsrv_composefh(vp, &nsfh, 1);
KASSERT(error == 0); /* XXX */
nfsm_srvfhtom(&nsfh, 1);
m = mreq;
siz = 0;
while (m) {
siz += m->m_len;
m = m->m_next;
}
if (siz <= 0 || siz > NFS_MAXPACKET) {
printf("mbuf siz=%d\n",siz);
panic("Bad nfs svc reply");
}
m = nfsm_rpchead(cred, (NFSMNT_NFSV3 | NFSMNT_NQNFS),
NQNFSPROC_EVICTED,
RPCAUTH_UNIX, 5 * NFSX_UNSIGNED, (char *)0,
0, (char *)0, mreq, siz, &mheadend, &xid);
/*
* For stream protocols, prepend a Sun RPC
* Record Mark.
*/
if (sotype == SOCK_STREAM) {
M_PREPEND(m, NFSX_UNSIGNED, M_WAIT);
*mtod(m, u_int32_t *) = htonl(0x80000000 |
(m->m_pkthdr.len - NFSX_UNSIGNED));
}
if (((lph->lph_flag & (LC_UDP | LC_CLTP | LC_UDP6))
== 0 &&
(lph->lph_slp->ns_flag & SLP_VALID) == 0) ||
(solockp && (*solockp & NFSMNT_SNDLOCK)))
m_freem(m);
else {
if (solockp)
*solockp |= NFSMNT_SNDLOCK;
(void) nfs_send(so, nam2, m,
(struct nfsreq *)0, l);
if (solockp)
nfs_sndunlock(solockp);
}
if (lph->lph_flag & LC_UDP)
(void) m_free(nam2);
}
nextone:
if (++i == len) {
if (lphnext) {
i = 0;
len = LC_MOREHOSTSIZ;
lph = lphnext->lpm_hosts;
lphnext = lphnext->lpm_next;
} else
ok = 0;
} else
lph++;
}
}
/*
* Wait for the lease to expire.
* This will occur when all clients have sent "vacated" messages to
* this server OR when it expires do to timeout.
*/
void
nqsrv_waitfor_expiry(lp)
struct nqlease *lp;
{
struct nqhost *lph;
int i;
struct nqm *lphnext;
int len, ok;
tryagain:
if (time_second > lp->lc_expiry)
return;
lph = &lp->lc_host;
lphnext = lp->lc_morehosts;
len = 1;
i = 0;
ok = 1;
while (ok && (lph->lph_flag & LC_VALID)) {
if ((lph->lph_flag & (LC_LOCAL | LC_VACATED)) == 0) {
lp->lc_flag |= LC_EXPIREDWANTED;
(void) tsleep((caddr_t)&lp->lc_flag, PSOCK,
"nqexp", 0);
goto tryagain;
}
if (++i == len) {
if (lphnext) {
i = 0;
len = LC_MOREHOSTSIZ;
lph = lphnext->lpm_hosts;
lphnext = lphnext->lpm_next;
} else
ok = 0;
} else
lph++;
}
}
/*
* Nqnfs server timer that maintains the server lease queue.
* Scan the lease queue for expired entries:
* - when one is found, wakeup anyone waiting for it
* else dequeue and free
*/
void
nqnfs_serverd()
{
struct nqlease *lp;
struct nqhost *lph;
struct nqlease *nextlp;
struct nqm *lphnext, *olphnext;
int i, len, ok;
for (lp = CIRCLEQ_FIRST(&nqtimerhead); lp != (void *)&nqtimerhead;
lp = nextlp) {
if (lp->lc_expiry >= time_second)
break;
nextlp = CIRCLEQ_NEXT(lp, lc_timer);
if (lp->lc_flag & LC_EXPIREDWANTED) {
lp->lc_flag &= ~LC_EXPIREDWANTED;
wakeup((caddr_t)&lp->lc_flag);
} else if ((lp->lc_flag & (LC_LOCKED | LC_WANTED)) == 0) {
/*
* Make a best effort at keeping a write caching lease long
* enough by not deleting it until it has been explicitly
* vacated or there have been no writes in the previous
* write_slack seconds since expiry and the nfsds are not
* all busy. The assumption is that if the nfsds are not
* all busy now (no queue of nfs requests), then the client
* would have been able to do at least one write to the
* file during the last write_slack seconds if it was still
* trying to push writes to the server.
*/
if ((lp->lc_flag & (LC_WRITE | LC_VACATED)) == LC_WRITE &&
((lp->lc_flag & LC_WRITTEN) || nfsd_waiting == 0)) {
lp->lc_flag &= ~LC_WRITTEN;
nqsrv_instimeq(lp, nqsrv_writeslack);
} else {
CIRCLEQ_REMOVE(&nqtimerhead, lp, lc_timer);
LIST_REMOVE(lp, lc_hash);
/*
* This soft reference may no longer be valid, but
* no harm done. The worst case is if the vnode was
* recycled and has another valid lease reference,
* which is dereferenced prematurely.
*/
lp->lc_vp->v_lease = (struct nqlease *)0;
lph = &lp->lc_host;
lphnext = lp->lc_morehosts;
olphnext = (struct nqm *)0;
len = 1;
i = 0;
ok = 1;
while (ok && (lph->lph_flag & LC_VALID)) {
if (lph->lph_flag & (LC_CLTP | LC_UDP6))
(void) m_free(lph->lph_nam);
if (lph->lph_flag & LC_SREF)
nfsrv_slpderef(lph->lph_slp);
if (++i == len) {
if (olphnext) {
free((caddr_t)olphnext, M_NQMHOST);
olphnext = (struct nqm *)0;
}
if (lphnext) {
olphnext = lphnext;
i = 0;
len = LC_MOREHOSTSIZ;
lph = lphnext->lpm_hosts;
lphnext = lphnext->lpm_next;
} else
ok = 0;
} else
lph++;
}
FREE((caddr_t)lp, M_NQLEASE);
if (olphnext)
free((caddr_t)olphnext, M_NQMHOST);
nfsstats.srvnqnfs_leases--;
}
}
}
}
/*
* Called from nfssvc_nfsd() for a getlease rpc request.
* Do the from/to xdr translation and call nqsrv_getlease() to
* do the real work.
*/
int
nqnfsrv_getlease(nfsd, slp, lwp, mrq)
struct nfsrv_descript *nfsd;
struct nfssvc_sock *slp;
struct lwp *lwp;
struct mbuf **mrq;
{
struct mbuf *mrep = nfsd->nd_mrep, *md = nfsd->nd_md;
struct mbuf *nam = nfsd->nd_nam;
caddr_t dpos = nfsd->nd_dpos;
kauth_cred_t cred = nfsd->nd_cr;
struct nfs_fattr *fp;
struct vattr va;
struct vnode *vp;
nfsrvfh_t nsfh;
u_int32_t *tl;
int32_t t1;
u_quad_t frev;
caddr_t bpos;
int error = 0;
char *cp2;
struct mbuf *mb, *mreq;
int flags, rdonly, cache = 0;
nfsm_srvmtofh(&nsfh);
nfsm_dissect(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
flags = fxdr_unsigned(int, *tl++);
nfsd->nd_duration = fxdr_unsigned(int, *tl);
error = nfsrv_fhtovp(&nsfh, 1, &vp, cred, slp, nam, &rdonly,
(nfsd->nd_flag & ND_KERBAUTH), FALSE);
if (error) {
nfsm_reply(0);
return 0;
}
if (rdonly && flags == ND_WRITE) {
vput(vp);
error = EROFS;
nfsm_reply(0);
return 0;
}
(void) nqsrv_getlease(vp, &nfsd->nd_duration, flags, slp, lwp,
nam, &cache, &frev, cred);
error = VOP_GETATTR(vp, &va, cred, lwp);
vput(vp);
nfsm_reply(NFSX_V3FATTR + 4 * NFSX_UNSIGNED);
nfsm_build(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
*tl++ = txdr_unsigned(cache);
*tl++ = txdr_unsigned(nfsd->nd_duration);
txdr_hyper(frev, tl);
nfsm_build(fp, struct nfs_fattr *, NFSX_V3FATTR);
nfsm_srvfillattr(&va, fp);
nfsm_srvdone;
}
/*
* Called from nfssvc_nfsd() when a "vacated" message is received from a
* client. Find the entry and expire it.
*/
int
nqnfsrv_vacated(struct nfsrv_descript *nfsd, struct nfssvc_sock *slp,
struct lwp *lwp, struct mbuf **mrq)
{
struct mbuf *mrep = nfsd->nd_mrep, *md = nfsd->nd_md;
struct mbuf *nam = nfsd->nd_nam;
caddr_t dpos = nfsd->nd_dpos;
struct nqlease *lp;
struct nqhost *lph;
struct nqlease *tlp = (struct nqlease *)0;
nfsrvfh_t nsfh;
fhandle_t *fhp;
u_int32_t *tl;
int32_t t1;
struct nqm *lphnext;
struct mbuf *mreq, *mb;
int error = 0, i, len, ok, gotit = 0, cache = 0;
char *cp2, *bpos;
u_quad_t frev;
nfsm_srvmtofh(&nsfh);
m_freem(mrep);
fhp = &nsfh.nsfh_u.u_fh;
/*
* Find the lease by searching the hash list.
*/
LIST_FOREACH(lp, NQFHHASH(fhp->fh_fid.fid_data), lc_hash) {
if (!nfsrv_comparefh(&lp->lc_fh, &nsfh)) {
/* Found it */
tlp = lp;
break;
}
}
if (tlp != 0) {
lp = tlp;
len = 1;
i = 0;
lph = &lp->lc_host;
lphnext = lp->lc_morehosts;
ok = 1;
while (ok && (lph->lph_flag & LC_VALID)) {
if (nqsrv_cmpnam(slp, nam, lph)) {
lph->lph_flag |= LC_VACATED;
gotit++;
break;
}
if (++i == len) {
if (lphnext) {
len = LC_MOREHOSTSIZ;
i = 0;
lph = lphnext->lpm_hosts;
lphnext = lphnext->lpm_next;
} else
ok = 0;
} else
lph++;
}
if ((lp->lc_flag & LC_EXPIREDWANTED) && gotit) {
lp->lc_flag &= ~LC_EXPIREDWANTED;
wakeup((caddr_t)&lp->lc_flag);
}
nfsmout:
return (EPERM);
}
return (EPERM);
}
#endif /* NFSSERVER */
#if defined(NFS) && !defined(NFS_V2_ONLY)
/*
* Client get lease rpc function.
*/
int
nqnfs_getlease(vp, rwflag, cred, l)
struct vnode *vp;
int rwflag;
kauth_cred_t cred;
struct lwp *l;
{
u_int32_t *tl;
caddr_t cp;
int32_t t1, t2;
struct nfsnode *np;
struct nfsmount *nmp = VFSTONFS(vp->v_mount);
caddr_t bpos, dpos, cp2;
time_t reqtime;
int error = 0;
struct mbuf *mreq, *mrep, *md, *mb;
int cachable;
u_quad_t frev;
nfsstats.rpccnt[NQNFSPROC_GETLEASE]++;
np = VTONFS(vp);
mb = mreq = nfsm_reqh(np, NQNFSPROC_GETLEASE, NFSX_V3FH+2*NFSX_UNSIGNED,
&bpos);
nfsm_fhtom(np, 1);
nfsm_build(tl, u_int32_t *, 2 * NFSX_UNSIGNED);
*tl++ = txdr_unsigned(rwflag);
*tl = txdr_unsigned(nmp->nm_leaseterm);
reqtime = time_second;
nfsm_request(np, NQNFSPROC_GETLEASE, l, cred);
nfsm_dissect(tl, u_int32_t *, 4 * NFSX_UNSIGNED);
cachable = fxdr_unsigned(int, *tl++);
reqtime += fxdr_unsigned(int, *tl++);
if (reqtime > time_second) {
frev = fxdr_hyper(tl);
nqnfs_clientlease(nmp, np, rwflag, cachable, reqtime, frev);
nfsm_loadattr(vp, (struct vattr *)0, 0);
} else
error = NQNFS_EXPIRED;
nfsm_reqdone;
return (error);
}
/*
* Client vacated message function.
*/
int
nqnfs_vacated(vp, cred, l)
struct vnode *vp;
kauth_cred_t cred;
struct lwp *l;
{
caddr_t cp;
struct mbuf *m;
int i;
u_int32_t *tl;
int32_t t2;
caddr_t bpos;
u_int32_t xid;
int error = 0;
struct mbuf *mreq, *mb, *mheadend;
struct nfsmount *nmp;
struct nfsreq myrep;
struct nfsnode *np = VTONFS(vp);
nmp = VFSTONFS(vp->v_mount);
nfsstats.rpccnt[NQNFSPROC_VACATED]++;
nfsm_reqhead(np, NQNFSPROC_VACATED, NFSX_FH(1));
nfsm_fhtom(np, 1);
m = mreq;
i = 0;
while (m) {
i += m->m_len;
m = m->m_next;
}
m = nfsm_rpchead(cred, nmp->nm_flag, NQNFSPROC_VACATED,
RPCAUTH_UNIX, 5 * NFSX_UNSIGNED, (char *)0,
0, (char *)0, mreq, i, &mheadend, &xid);
if (nmp->nm_sotype == SOCK_STREAM) {
M_PREPEND(m, NFSX_UNSIGNED, M_WAIT);
*mtod(m, u_int32_t *) = htonl(0x80000000 | (m->m_pkthdr.len -
NFSX_UNSIGNED));
}
myrep.r_flags = 0;
myrep.r_nmp = nmp;
if (nmp->nm_soflags & PR_CONNREQUIRED)
(void) nfs_sndlock(&nmp->nm_iflag, (struct nfsreq *)0);
(void) nfs_send(nmp->nm_so, nmp->nm_nam, m, &myrep, l);
if (nmp->nm_soflags & PR_CONNREQUIRED)
nfs_sndunlock(&nmp->nm_iflag);
nfsmout:
return (error);
}
/*
* Called for client side callbacks
*/
static int
nqnfs_callback1(struct nfsmount *nmp, struct mbuf *mrep, struct mbuf *md,
caddr_t dpos, struct lwp *l, struct nfsrv_descript *nfsd)
{
struct vnode *vp;
u_int32_t *tl;
int32_t t1;
nfsrvfh_t nsfh;
fhandle_t *fhp;
struct nfsnode *np;
struct nfsd tnfsd;
struct nfssvc_sock *slp;
struct mbuf **mrq = (struct mbuf **)0, *mb, *mreq;
int error = 0, cache = 0;
char *cp2, *bpos;
u_quad_t frev;
#ifndef nolint
slp = NULL;
#endif
nfsd->nd_mrep = mrep;
nfsd->nd_md = md;
nfsd->nd_dpos = dpos;
error = nfs_getreq(nfsd, &tnfsd, FALSE);
if (error)
return (error);
md = nfsd->nd_md;
dpos = nfsd->nd_dpos;
if (nfsd->nd_procnum != NQNFSPROC_EVICTED) {
m_freem(mrep);
return (EPERM);
}
nfsm_srvmtofh(&nsfh);
m_freem(mrep);
fhp = &nsfh.nsfh_u.u_fh;
error = nfs_nget(nmp->nm_mountp, (nfsfh_t *)fhp, NFSX_V3FH, &np);
if (error)
return (error);
vp = NFSTOV(np);
if (CIRCLEQ_NEXT(np, n_timer) != 0) {
np->n_expiry = 0;
np->n_flag |= NQNFSEVICTED;
if (CIRCLEQ_FIRST(&nmp->nm_timerhead) != np) {
CIRCLEQ_REMOVE(&nmp->nm_timerhead, np, n_timer);
CIRCLEQ_INSERT_HEAD(&nmp->nm_timerhead, np, n_timer);
}
}
vput(vp);
kauth_cred_free(nfsd->nd_cr);
nfsm_srvdone;
}
int
nqnfs_callback(struct nfsmount *nmp, struct mbuf *mrep, struct mbuf *md,
caddr_t dpos, struct lwp *l)
{
struct nfsrv_descript *nd;
int error;
nd = nfsdreq_alloc();
error = nqnfs_callback1(nmp, mrep, md, dpos, l, nd);
nfsdreq_free(nd);
return error;
}
#endif /* NFS && !NFS_V2_ONLY */
#ifdef NFS /* Needed in V2_ONLY case for Kerberos stuff */
/*
* Nqnfs client helper daemon. Runs once a second to expire leases.
* It also get authorization strings for "kerb" mounts.
* It must start at the beginning of the list again after any potential
* "sleep" since nfs_reclaim() called from vclean() can pull a node off
* the list asynchronously.
*/
int
nqnfs_clientd(struct nfsmount *nmp, kauth_cred_t cred, struct nfsd_cargs *ncd,
int flag, caddr_t argp, struct lwp *l)
{
#ifndef NFS_V2_ONLY
struct nfsnode *np;
struct vnode *vp;
struct nfsreq myrep;
#endif
int error = 0, sleepreturn;
struct nfsuid *nuidp, *nnuidp;
/*
* First initialize some variables
*/
/*
* If an authorization string is being passed in, get it.
*/
if ((flag & NFSSVC_GOTAUTH) &&
(nmp->nm_iflag & (NFSMNT_WAITAUTH | NFSMNT_DISMNT)) == 0) {
if (nmp->nm_iflag & NFSMNT_HASAUTH)
panic("cld kerb");
if ((flag & NFSSVC_AUTHINFAIL) == 0) {
if (ncd->ncd_authlen <= nmp->nm_authlen &&
ncd->ncd_verflen <= nmp->nm_verflen &&
!copyin(ncd->ncd_authstr,nmp->nm_authstr,ncd->ncd_authlen)&&
!copyin(ncd->ncd_verfstr,nmp->nm_verfstr,ncd->ncd_verflen)){
nmp->nm_authtype = ncd->ncd_authtype;
nmp->nm_authlen = ncd->ncd_authlen;
nmp->nm_verflen = ncd->ncd_verflen;
#ifdef NFSKERB
nmp->nm_key = ncd->ncd_key;
#endif
} else
nmp->nm_iflag |= NFSMNT_AUTHERR;
} else
nmp->nm_iflag |= NFSMNT_AUTHERR;
nmp->nm_iflag |= NFSMNT_HASAUTH;
wakeup((caddr_t)&nmp->nm_authlen);
} else
nmp->nm_iflag |= NFSMNT_WAITAUTH;
/*
* Loop every second updating queue until there is a termination sig.
*/
sleepreturn = 0;
while ((nmp->nm_iflag & NFSMNT_DISMNT) == 0) {
if (sleepreturn == EINTR || sleepreturn == ERESTART) {
/*
* XXX Freeze syncer. Must do this before locking
* the mount point. See dounmount() for details.
*/
lockmgr(&syncer_lock, LK_EXCLUSIVE, NULL);
if (vfs_busy(nmp->nm_mountp, LK_NOWAIT, 0) != 0)
lockmgr(&syncer_lock, LK_EXCLUSIVE, NULL);
else if (dounmount(nmp->nm_mountp, 0, l) != 0)
CLRSIG(l);
sleepreturn = 0;
continue;
}
#ifndef NFS_V2_ONLY
if (nmp->nm_flag & NFSMNT_NQNFS) {
/*
* If there are no outstanding requests (and therefore no
* processes in nfs_reply) and there is data in the receive
* queue, poke for callbacks.
*/
if (TAILQ_EMPTY(&nfs_reqq) && nmp->nm_so &&
nmp->nm_so->so_rcv.sb_cc > 0) {
myrep.r_flags = R_GETONEREP;
myrep.r_nmp = nmp;
myrep.r_mrep = (struct mbuf *)0;
myrep.r_lwp = (struct lwp *)0;
(void) nfs_reply(&myrep, l);
}
/*
* Loop through the leases, updating as required.
*/
np = CIRCLEQ_FIRST(&nmp->nm_timerhead);
while (np != (void *)&nmp->nm_timerhead &&
(nmp->nm_iflag & NFSMNT_DISMINPROG) == 0) {
vp = NFSTOV(np);
if (np->n_expiry < time_second) {
if (vget(vp, LK_EXCLUSIVE) == 0) {
nmp->nm_inprog = vp;
CIRCLEQ_REMOVE(&nmp->nm_timerhead, np, n_timer);
/* mark this off the list */
CIRCLEQ_NEXT(np, n_timer) = 0; /* XXX */
if (np->n_flag & (NMODIFIED | NQNFSEVICTED)) {
if (np->n_flag & NQNFSEVICTED) {
if (vp->v_type == VDIR)
nfs_invaldircache(vp,0);
cache_purge(vp);
(void) nfs_vinvalbuf(vp,
V_SAVE, cred, l, 0);
np->n_flag &= ~NQNFSEVICTED;
(void) nqnfs_vacated(vp, cred, l);
} else if (vp->v_type == VREG) {
(void) VOP_FSYNC(vp, cred,
FSYNC_WAIT, 0, 0, l);
np->n_flag &= ~NMODIFIED;
}
}
vput(vp);
nmp->nm_inprog = NULLVP;
}
} else if ((np->n_expiry - NQ_RENEWAL) < time_second) {
if ((np->n_flag & (NQNFSWRITE | NQNFSNONCACHE))
== NQNFSWRITE &&
!LIST_EMPTY(&vp->v_dirtyblkhd) &&
vget(vp, LK_EXCLUSIVE) == 0) {
nmp->nm_inprog = vp;
if (nqnfs_getlease(vp, ND_WRITE, cred, l)==0)
np->n_brev = np->n_lrev;
vput(vp);
nmp->nm_inprog = NULLVP;
}
} else
break;
if (np == CIRCLEQ_FIRST(&nmp->nm_timerhead))
break;
np = CIRCLEQ_FIRST(&nmp->nm_timerhead);
}
}
#endif /* !NFS_V2_ONLY */
/*
* Get an authorization string, if required.
*/
if ((nmp->nm_iflag & (NFSMNT_WAITAUTH | NFSMNT_DISMNT | NFSMNT_HASAUTH)) == 0) {
ncd->ncd_authuid = nmp->nm_authuid;
if (copyout((caddr_t)ncd, argp, sizeof (struct nfsd_cargs)))
nmp->nm_iflag |= NFSMNT_WAITAUTH;
else
return (ENEEDAUTH);
}
/*
* Wait a bit (no pun) and do it again.
*/
if ((nmp->nm_iflag & NFSMNT_DISMNT) == 0 &&
(nmp->nm_iflag & (NFSMNT_WAITAUTH | NFSMNT_HASAUTH))) {
sleepreturn = tsleep((caddr_t)&nmp->nm_authstr,
PSOCK | PCATCH, "nqnfstimr", hz / 3);
}
}
/*
* Finally, we can free up the mount structure.
*/
for (nuidp = TAILQ_FIRST(&nmp->nm_uidlruhead); nuidp != 0;
nuidp = nnuidp) {
nnuidp = TAILQ_NEXT(nuidp, nu_lru);
LIST_REMOVE(nuidp, nu_hash);
TAILQ_REMOVE(&nmp->nm_uidlruhead, nuidp, nu_lru);
free((caddr_t)nuidp, M_NFSUID);
}
free((caddr_t)nmp, M_NFSMNT);
return (error);
}
#endif /* NFS */
#if defined(NFS) && !defined(NFS_V2_ONLY)
/*
* Update a client lease.
*/
void
nqnfs_clientlease(nmp, np, rwflag, cachable, expiry, frev)
struct nfsmount *nmp;
struct nfsnode *np;
int rwflag, cachable;
time_t expiry;
u_quad_t frev;
{
struct nfsnode *tp;
if (CIRCLEQ_NEXT(np, n_timer) != 0) {
CIRCLEQ_REMOVE(&nmp->nm_timerhead, np, n_timer);
if (rwflag == ND_WRITE)
np->n_flag |= NQNFSWRITE;
} else if (rwflag == ND_READ)
np->n_flag &= ~NQNFSWRITE;
else
np->n_flag |= NQNFSWRITE;
if (cachable)
np->n_flag &= ~NQNFSNONCACHE;
else
np->n_flag |= NQNFSNONCACHE;
np->n_expiry = expiry;
np->n_lrev = frev;
tp = nmp->nm_timerhead.cqh_last;
while (tp != (void *)&nmp->nm_timerhead && tp->n_expiry > np->n_expiry)
tp = tp->n_timer.cqe_prev;
if (tp == (void *)&nmp->nm_timerhead) {
CIRCLEQ_INSERT_HEAD(&nmp->nm_timerhead, np, n_timer);
} else {
CIRCLEQ_INSERT_AFTER(&nmp->nm_timerhead, tp, np, n_timer);
}
}
#endif /* NFS && !NFS_V2_ONLY */
#if defined(NFSSERVER) || (defined(NFS) && !defined(NFS_V2_ONLY))
/*
* Adjust all timer queue expiry times when the time of day clock is changed.
* Called from the settimeofday() syscall.
*/
void
nqnfs_lease_updatetime(deltat)
int deltat;
{
struct nqlease *lp;
struct nfsnode *np;
struct mount *mp;
struct nfsmount *nmp;
int s;
struct mount *nxtmp;
if (nqnfsstarttime != 0)
nqnfsstarttime += deltat;
s = splsoftnet();
CIRCLEQ_FOREACH(lp, &nqtimerhead, lc_timer) {
lp->lc_expiry += deltat;
}
splx(s);
/*
* Search the mount list for all nqnfs mounts and do their timer
* queues.
*/
simple_lock(&mountlist_slock);
for (mp = CIRCLEQ_FIRST(&mountlist); mp != (void *)&mountlist;
mp = nxtmp) {
if (vfs_busy(mp, LK_NOWAIT, &mountlist_slock)) {
nxtmp = CIRCLEQ_NEXT(mp, mnt_list);
continue;
}
if (!strncmp(&mp->mnt_stat.f_fstypename[0], MOUNT_NFS,
MFSNAMELEN)) {
nmp = VFSTONFS(mp);
if (nmp->nm_flag & NFSMNT_NQNFS) {
CIRCLEQ_FOREACH(np, &nmp->nm_timerhead,
n_timer) {
np->n_expiry += deltat;
}
}
}
simple_lock(&mountlist_slock);
nxtmp = CIRCLEQ_NEXT(mp, mnt_list);
vfs_unbusy(mp);
}
simple_unlock(&mountlist_slock);
}
/*
* Lock a server lease.
*/
void
nqsrv_locklease(lp)
struct nqlease *lp;
{
while (lp->lc_flag & LC_LOCKED) {
lp->lc_flag |= LC_WANTED;
(void) tsleep((caddr_t)lp, PSOCK, "nqlc", 0);
}
lp->lc_flag |= LC_LOCKED;
lp->lc_flag &= ~LC_WANTED;
}
/*
* Unlock a server lease.
*/
void
nqsrv_unlocklease(lp)
struct nqlease *lp;
{
lp->lc_flag &= ~LC_LOCKED;
if (lp->lc_flag & LC_WANTED)
wakeup((caddr_t)lp);
}
#endif /* NFSSERVER || NFS && !NFS_V2_ONLY */