1 files changed, 3200 insertions, 0 deletions
diff --git a/sys/nfs4client/nfs4_vnops.c b/sys/nfs4client/nfs4_vnops.c
new file mode 100644
index 0000000..48e4549
--- /dev/null
+++ b/sys/nfs4client/nfs4_vnops.c
@@ -0,0 +1,3200 @@
+/* $FreeBSD$ */
+/* $Id: nfs_vnops.c,v 1.45 2003/11/05 14:59:02 rees Exp $ */
+
+/*
+ * copyright (c) 2003
+ * the regents of the university of michigan
+ * all rights reserved
+ * 
+ * permission is granted to use, copy, create derivative works and redistribute
+ * this software and such derivative works for any purpose, so long as the name
+ * of the university of michigan is not used in any advertising or publicity
+ * pertaining to the use or distribution of this software without specific,
+ * written prior authorization.  if the above copyright notice or any other
+ * identification of the university of michigan is included in any copy of any
+ * portion of this software, then the disclaimer below must also be included.
+ * 
+ * this software is provided as is, without representation from the university
+ * of michigan as to its fitness for any purpose, and without warranty by the
+ * university of michigan of any kind, either express or implied, including
+ * without limitation the implied warranties of merchantability and fitness for
+ * a particular purpose. the regents of the university of michigan shall not be
+ * liable for any damages, including special, indirect, incidental, or
+ * consequential damages, with respect to any claim arising out of or in
+ * connection with the use of the software, even if it has been or is hereafter
+ * advised of the possibility of such damages.
+ */
+
+/*
+ * Copyright (c) 1989, 1993
+ *	The Regents of the University of California.  All rights reserved.
+ *
+ * This code is derived from software contributed to Berkeley by
+ * Rick Macklem at The University of Guelph.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ *    notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ *    notice, this list of conditions and the following disclaimer in the
+ *    documentation and/or other materials provided with the distribution.
+ * 3. All advertising materials mentioning features or use of this software
+ *    must display the following acknowledgement:
+ *	This product includes software developed by the University of
+ *	California, Berkeley and its contributors.
+ * 4. Neither the name of the University nor the names of its contributors
+ *    may be used to endorse or promote products derived from this software
+ *    without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
+ * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
+ * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+ * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+ * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+ * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+ * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ *
+ *	@(#)nfs_vnops.c	8.16 (Berkeley) 5/27/95
+ */
+
+#include <sys/cdefs.h>
+__FBSDID("$FreeBSD$");
+
+/*
+ * vnode op calls for Sun NFS version 2 and 3
+ */
+
+#include "opt_inet.h"
+
+#include <sys/param.h>
+#include <sys/kernel.h>
+#include <sys/systm.h>
+#include <sys/resourcevar.h>
+#include <sys/proc.h>
+#include <sys/mount.h>
+#include <sys/bio.h>
+#include <sys/buf.h>
+#include <sys/malloc.h>
+#include <sys/mbuf.h>
+#include <sys/namei.h>
+#include <sys/socket.h>
+#include <sys/vnode.h>
+#include <sys/dirent.h>
+#include <sys/fcntl.h>
+#include <sys/lockf.h>
+#include <sys/stat.h>
+#include <sys/sysctl.h>
+
+#include <vm/vm.h>
+#include <vm/vm_extern.h>
+
+#include <fs/fifofs/fifo.h>
+
+#include <rpc/rpcclnt.h>
+
+#include <nfs/rpcv2.h>
+#include <nfs/nfsproto.h>
+#include <nfsclient/nfs.h>
+#include <nfs4client/nfs4.h>
+#include <nfsclient/nfsnode.h>
+#include <nfsclient/nfsmount.h>
+#include <nfsclient/nfs_lock.h>
+#include <nfs/xdr_subs.h>
+#include <nfsclient/nfsm_subs.h>
+
+#include <net/if.h>
+#include <netinet/in.h>
+#include <netinet/in_var.h>
+
+/* NFSv4 */
+#include <nfs4client/nfs4m_subs.h>
+#include <nfs4client/nfs4_vn.h>
+
+/* Defs */
+#define	TRUE	1
+#define	FALSE	0
+
+/*
+ * Ifdef for FreeBSD-current merged buffer cache. It is unfortunate that these
+ * calls are not in getblk() and brelse() so that they would not be necessary
+ * here.
+ */
+#ifndef B_VMIO
+#define vfs_busy_pages(bp, f)
+#endif
+
+static int	nfsspec_read(struct vop_read_args *);
+static int	nfsspec_write(struct vop_write_args *);
+static int	nfsfifo_read(struct vop_read_args *);
+static int	nfsfifo_write(struct vop_write_args *);
+static int	nfsspec_close(struct vop_close_args *);
+static int	nfsfifo_close(struct vop_close_args *);
+static int	nfs4_flush(struct vnode *, struct ucred *, int, struct thread *,
+		    int);
+static int	nfs4_setattrrpc(struct vnode *, struct vattr *, struct ucred *,
+		    struct thread *);
+static int      nfs4_closerpc(struct vnode *, struct ucred *, struct thread *, int);
+
+static	int	nfs4_lookup(struct vop_lookup_args *);
+static	int	nfs4_create(struct vop_create_args *);
+static	int	nfs4_mknod(struct vop_mknod_args *);
+static	int	nfs4_open(struct vop_open_args *);
+static	int	nfs4_close(struct vop_close_args *);
+static	int	nfs4_access(struct vop_access_args *);
+static	int	nfs4_getattr(struct vop_getattr_args *);
+static	int	nfs4_setattr(struct vop_setattr_args *);
+static	int	nfs4_read(struct vop_read_args *);
+static	int	nfs4_fsync(struct vop_fsync_args *);
+static	int	nfs4_remove(struct vop_remove_args *);
+static	int	nfs4_link(struct vop_link_args *);
+static	int	nfs4_rename(struct vop_rename_args *);
+static	int	nfs4_mkdir(struct vop_mkdir_args *);
+static	int	nfs4_rmdir(struct vop_rmdir_args *);
+static	int	nfs4_symlink(struct vop_symlink_args *);
+static	int	nfs4_readdir(struct vop_readdir_args *);
+static	int	nfs4_strategy(struct vop_strategy_args *);
+static	int	nfs4_lookitup(struct vnode *, const char *, int,
+		    struct ucred *, struct thread *, struct nfsnode **);
+static	int	nfs4_sillyrename(struct vnode *, struct vnode *,
+		    struct componentname *);
+static int	nfsspec_access(struct vop_access_args *);
+static int	nfs4_readlink(struct vop_readlink_args *);
+static int	nfs4_print(struct vop_print_args *);
+static int	nfs4_advlock(struct vop_advlock_args *);
+
+/*
+ * Global vfs data structures for nfs
+ */
+vop_t **nfs4_vnodeop_p;
+static struct vnodeopv_entry_desc nfs4_vnodeop_entries[] = {
+	{ &vop_default_desc,		(vop_t *) vop_defaultop },
+	{ &vop_access_desc,		(vop_t *) nfs4_access },
+	{ &vop_advlock_desc,		(vop_t *) nfs4_advlock },
+	{ &vop_close_desc,		(vop_t *) nfs4_close },
+	{ &vop_create_desc,		(vop_t *) nfs4_create },
+	{ &vop_fsync_desc,		(vop_t *) nfs4_fsync },
+	{ &vop_getattr_desc,		(vop_t *) nfs4_getattr },
+	{ &vop_getpages_desc,		(vop_t *) nfs_getpages },
+	{ &vop_putpages_desc,		(vop_t *) nfs_putpages },
+	{ &vop_inactive_desc,		(vop_t *) nfs_inactive },
+	{ &vop_lease_desc,		(vop_t *) vop_null },
+	{ &vop_link_desc,		(vop_t *) nfs4_link },
+	{ &vop_lookup_desc,		(vop_t *) nfs4_lookup },
+	{ &vop_mkdir_desc,		(vop_t *) nfs4_mkdir },
+	{ &vop_mknod_desc,		(vop_t *) nfs4_mknod },
+	{ &vop_open_desc,		(vop_t *) nfs4_open },
+	{ &vop_print_desc,		(vop_t *) nfs4_print },
+	{ &vop_read_desc,		(vop_t *) nfs4_read },
+	{ &vop_readdir_desc,		(vop_t *) nfs4_readdir },
+	{ &vop_readlink_desc,		(vop_t *) nfs4_readlink },
+	{ &vop_reclaim_desc,		(vop_t *) nfs_reclaim },
+	{ &vop_remove_desc,		(vop_t *) nfs4_remove },
+	{ &vop_rename_desc,		(vop_t *) nfs4_rename },
+	{ &vop_rmdir_desc,		(vop_t *) nfs4_rmdir },
+	{ &vop_setattr_desc,		(vop_t *) nfs4_setattr },
+	{ &vop_strategy_desc,		(vop_t *) nfs4_strategy },
+	{ &vop_symlink_desc,		(vop_t *) nfs4_symlink },
+	{ &vop_write_desc,		(vop_t *) nfs_write },
+	{ NULL, NULL }
+};
+static struct vnodeopv_desc nfs4_vnodeop_opv_desc =
+	{ &nfs4_vnodeop_p, nfs4_vnodeop_entries };
+VNODEOP_SET(nfs4_vnodeop_opv_desc);
+
+/*
+ * Special device vnode ops
+ */
+vop_t **spec_nfs4nodeop_p;
+static struct vnodeopv_entry_desc nfs4_specop_entries[] = {
+	{ &vop_default_desc,		(vop_t *) spec_vnoperate },
+	{ &vop_access_desc,		(vop_t *) nfsspec_access },
+	{ &vop_close_desc,		(vop_t *) nfsspec_close },
+	{ &vop_fsync_desc,		(vop_t *) nfs4_fsync },
+	{ &vop_getattr_desc,		(vop_t *) nfs4_getattr },
+	{ &vop_inactive_desc,		(vop_t *) nfs_inactive },
+	{ &vop_print_desc,		(vop_t *) nfs4_print },
+	{ &vop_read_desc,		(vop_t *) nfsspec_read },
+	{ &vop_reclaim_desc,		(vop_t *) nfs_reclaim },
+	{ &vop_setattr_desc,		(vop_t *) nfs4_setattr },
+	{ &vop_write_desc,		(vop_t *) nfsspec_write },
+	{ NULL, NULL }
+};
+static struct vnodeopv_desc spec_nfs4nodeop_opv_desc =
+	{ &spec_nfs4nodeop_p, nfs4_specop_entries };
+VNODEOP_SET(spec_nfs4nodeop_opv_desc);
+
+vop_t **fifo_nfs4nodeop_p;
+static struct vnodeopv_entry_desc nfs4_fifoop_entries[] = {
+	{ &vop_default_desc,		(vop_t *) fifo_vnoperate },
+	{ &vop_access_desc,		(vop_t *) nfsspec_access },
+	{ &vop_close_desc,		(vop_t *) nfsfifo_close },
+	{ &vop_fsync_desc,		(vop_t *) nfs4_fsync },
+	{ &vop_getattr_desc,		(vop_t *) nfs4_getattr },
+	{ &vop_inactive_desc,		(vop_t *) nfs_inactive },
+	{ &vop_print_desc,		(vop_t *) nfs4_print },
+	{ &vop_read_desc,		(vop_t *) nfsfifo_read },
+	{ &vop_reclaim_desc,		(vop_t *) nfs_reclaim },
+	{ &vop_setattr_desc,		(vop_t *) nfs4_setattr },
+	{ &vop_write_desc,		(vop_t *) nfsfifo_write },
+	{ NULL, NULL }
+};
+static struct vnodeopv_desc fifo_nfs4nodeop_opv_desc =
+	{ &fifo_nfs4nodeop_p, nfs4_fifoop_entries };
+VNODEOP_SET(fifo_nfs4nodeop_opv_desc);
+
+static int	nfs4_removerpc(struct vnode *dvp, const char *name, int namelen,
+			      struct ucred *cred, struct thread *td);
+static int	nfs4_renamerpc(struct vnode *fdvp, const char *fnameptr,
+			      int fnamelen, struct vnode *tdvp,
+			      const char *tnameptr, int tnamelen,
+			      struct ucred *cred, struct thread *td);
+static int	nfs4_renameit(struct vnode *sdvp, struct componentname *scnp,
+			     struct sillyrename *sp);
+static int      nfs4_openrpc(struct vnode *, struct vnode **,
+                            struct componentname *, int, struct vattr *);
+static int	nfs4_open_confirm(struct vnode *vp, struct nfs4_compound *cpp,
+				 struct nfs4_oparg_open *openap,
+				 struct nfs4_oparg_getfh *gfh,
+				 struct ucred *cred, struct thread *td);
+static int      nfs4_createrpc(struct vnode *, struct vnode **,
+                              struct componentname *, nfstype,
+                              struct vattr *, char *);
+
+/*
+ * Global variables
+ */
+struct nfs4_lowner nfs4_masterlowner;
+
+#define	DIRHDSIZ	(sizeof (struct dirent) - (MAXNAMLEN + 1))
+
+SYSCTL_DECL(_vfs_nfs4);
+
+static int	nfsaccess_cache_timeout = NFS_MAXATTRTIMO;
+SYSCTL_INT(_vfs_nfs4, OID_AUTO, access_cache_timeout, CTLFLAG_RW,
+	   &nfsaccess_cache_timeout, 0, "NFS ACCESS cache timeout");
+
+static int	nfsv3_commit_on_close = 0;
+SYSCTL_INT(_vfs_nfs4, OID_AUTO, nfsv3_commit_on_close, CTLFLAG_RW,
+	   &nfsv3_commit_on_close, 0, "write+commit on close, else only write");
+#if 0
+SYSCTL_INT(_vfs_nfs4, OID_AUTO, access_cache_hits, CTLFLAG_RD,
+	   &nfsstats.accesscache_hits, 0, "NFS ACCESS cache hit count");
+
+SYSCTL_INT(_vfs_nfs4, OID_AUTO, access_cache_misses, CTLFLAG_RD,
+	   &nfsstats.accesscache_misses, 0, "NFS ACCESS cache miss count");
+#endif
+
+#define	NFSV3ACCESS_ALL (NFSV3ACCESS_READ | NFSV3ACCESS_MODIFY		\
+			 | NFSV3ACCESS_EXTEND | NFSV3ACCESS_EXECUTE	\
+			 | NFSV3ACCESS_DELETE | NFSV3ACCESS_LOOKUP)
+static int
+nfs3_access_otw(struct vnode *vp, int wmode, struct thread *td,
+    struct ucred *cred)
+{
+	const int v3 = 1;
+	u_int32_t *tl;
+	int error = 0, attrflag;
+
+	return (0);
+
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	caddr_t bpos, dpos;
+	u_int32_t rmode;
+	struct nfsnode *np = VTONFS(vp);
+
+	nfsstats.rpccnt[NFSPROC_ACCESS]++;
+	mreq = nfsm_reqhead(vp, NFSPROC_ACCESS, NFSX_FH(v3) + NFSX_UNSIGNED);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+	nfsm_fhtom(vp, v3);
+	tl = nfsm_build(u_int32_t *, NFSX_UNSIGNED);
+	*tl = txdr_unsigned(wmode);
+	nfsm_request(vp, NFSPROC_ACCESS, td, cred);
+	nfsm_postop_attr(vp, attrflag);
+	if (!error) {
+		tl = nfsm_dissect(u_int32_t *, NFSX_UNSIGNED);
+		rmode = fxdr_unsigned(u_int32_t, *tl);
+		np->n_mode = rmode;
+		np->n_modeuid = cred->cr_uid;
+		np->n_modestamp = time_second;
+	}
+	m_freem(mrep);
+nfsmout:
+	return error;
+}
+
+/*
+ * nfs access vnode op.
+ * For nfs version 2, just return ok. File accesses may fail later.
+ * For nfs version 3, use the access rpc to check accessibility. If file modes
+ * are changed on the server, accesses might still fail later.
+ */
+static int
+nfs4_access(struct vop_access_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+	int error = 0;
+	u_int32_t mode, wmode;
+	int v3 = NFS_ISV3(vp);	/* v3 \in v4 */
+	struct nfsnode *np = VTONFS(vp);
+	caddr_t bpos, dpos;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	struct nfs4_compound cp;
+	struct nfs4_oparg_access acc;
+	struct thread *td = ap->a_td;
+	struct ucred *cred = ap->a_cred;
+
+	/*
+	 * Disallow write attempts on filesystems mounted read-only;
+	 * unless the file is a socket, fifo, or a block or character
+	 * device resident on the filesystem.
+	 */
+	if ((ap->a_mode & VWRITE) && (vp->v_mount->mnt_flag & MNT_RDONLY)) {
+		switch (vp->v_type) {
+		case VREG:
+		case VDIR:
+		case VLNK:
+			return (EROFS);
+		default:
+			break;
+		}
+	}
+	/*
+	 * For nfs v3, check to see if we have done this recently, and if
+	 * so return our cached result instead of making an ACCESS call.
+	 * If not, do an access rpc, otherwise you are stuck emulating
+	 * ufs_access() locally using the vattr. This may not be correct,
+	 * since the server may apply other access criteria such as
+	 * client uid-->server uid mapping that we do not know about.
+	 */
+	/* XXX Disable this for now; needs fixing of _access_otw() */
+	if (0 && v3) {
+		if (ap->a_mode & VREAD)
+			mode = NFSV3ACCESS_READ;
+		else
+			mode = 0;
+		if (vp->v_type != VDIR) {
+			if (ap->a_mode & VWRITE)
+				mode |= (NFSV3ACCESS_MODIFY | NFSV3ACCESS_EXTEND);
+			if (ap->a_mode & VEXEC)
+				mode |= NFSV3ACCESS_EXECUTE;
+		} else {
+			if (ap->a_mode & VWRITE)
+				mode |= (NFSV3ACCESS_MODIFY | NFSV3ACCESS_EXTEND |
+				    NFSV3ACCESS_DELETE);
+			if (ap->a_mode & VEXEC)
+				mode |= NFSV3ACCESS_LOOKUP;
+		}
+		/* XXX safety belt, only make blanket request if caching */
+		if (nfsaccess_cache_timeout > 0) {
+			wmode = NFSV3ACCESS_READ | NFSV3ACCESS_MODIFY |
+			    NFSV3ACCESS_EXTEND | NFSV3ACCESS_EXECUTE |
+			    NFSV3ACCESS_DELETE | NFSV3ACCESS_LOOKUP;
+		} else {
+			wmode = mode;
+		}
+
+		/*
+		 * Does our cached result allow us to give a definite yes to
+		 * this request?
+		 */
+		if ((time_second < (np->n_modestamp + nfsaccess_cache_timeout)) &&
+		    (ap->a_cred->cr_uid == np->n_modeuid) &&
+		    ((np->n_mode & mode) == mode)) {
+			nfsstats.accesscache_hits++;
+		} else {
+			/*
+			 * Either a no, or a don't know.  Go to the wire.
+			 */
+			nfsstats.accesscache_misses++;
+		        error = nfs3_access_otw(vp, wmode, ap->a_td,ap->a_cred);
+			if (!error) {
+				if ((np->n_mode & mode) != mode) {
+					error = EACCES;
+				}
+			}
+		}
+		return (error);
+	}
+
+	/* XXX use generic access code here? */
+	mode = ap->a_mode & VREAD ? NFSV4ACCESS_READ : 0;
+	if (vp->v_type == VDIR) {
+		if (ap->a_mode & VWRITE)
+			mode |= NFSV4ACCESS_MODIFY | NFSV4ACCESS_EXTEND | NFSV4ACCESS_DELETE;
+		if (ap->a_mode & VEXEC)
+			mode |= NFSV4ACCESS_LOOKUP;
+	} else {
+		if (ap->a_mode & VWRITE)
+			mode |= NFSV4ACCESS_MODIFY | NFSV4ACCESS_EXTEND;
+		if (ap->a_mode & VEXEC)
+			mode |= NFSV4ACCESS_EXECUTE;
+	}
+
+	nfs_v4initcompound(&cp);
+	acc.mode = mode;
+
+	mreq = nfsm_reqhead(vp, NFSV4PROC_COMPOUND, 0);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	nfsm_v4build_compound(&cp, "nfs4_access()");
+	nfsm_v4build_putfh(&cp, vp);
+	nfsm_v4build_access(&cp, &acc);
+	nfsm_v4build_finalize(&cp);
+
+	nfsm_request(vp, NFSV4PROC_COMPOUND, td, cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_access(&cp, &acc);
+
+	if ((acc.rmode & mode) != mode)
+		error = EACCES;
+
+ nfsmout:
+	error = nfs_v4postop(&cp, error);
+
+	if (mrep != NULL)
+		m_freem(mrep);
+
+	return (error);
+}
+
+static int
+nfs4_openrpc(struct vnode *dvp, struct vnode **vpp, struct componentname *cnp,
+    int flags, struct vattr *vap)
+{
+	struct vnode *vp = *vpp;
+	struct nfs4_oparg_getattr getattr;
+	struct nfs4_oparg_getfh getfh;
+	struct nfs4_oparg_open opena;
+	struct nfs4_compound cp;
+	caddr_t bpos, dpos;
+	int error = 0;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	struct ucred *cred = cnp->cn_cred;
+	struct thread *td = cnp->cn_thread;
+	struct nfs4_fctx xfc, *fcp;
+	struct nfsnode *np;
+
+	if (vp == NULL) {
+		/* Create a new file */
+		np = NULL;
+		fcp = &xfc;
+		bzero(fcp, sizeof(*fcp));
+	} else {
+		np = VTONFS(vp);
+		fcp = flags & FWRITE ? &np->n_wfc : &np->n_rfc;
+	}
+
+	/*
+	 * Since we are currently only one lockowner; we only open the
+	 * file one each for reading and writing.
+	 */
+	if (fcp->refcnt++ != 0) {
+		*vpp = vp;
+		/*printf("not opening %s\n", np->n_name != NULL ? np->n_name : "");*/
+		return (0);
+	}
+
+	fcp->lop = &nfs4_masterlowner;
+	fcp->pid = cnp->cn_thread->td_proc->p_pid;
+	fcp->np = np;
+
+	nfs_v4initcompound(&cp);
+	cp.nmp = VFSTONFS(dvp->v_mount);
+
+	opena.ctype = NCLNULL;
+	opena.flags = flags;
+	opena.vap = vap;
+	opena.fcp = fcp;		/* For lockowner */
+	opena.cnp = cnp;
+
+	getattr.bm = &nfsv4_getattrbm;
+
+	mreq = nfsm_reqhead(vp, NFSV4PROC_COMPOUND, 0);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	nfsm_v4build_compound(&cp, "nfs4_openrpc()");
+	nfsm_v4build_putfh(&cp, dvp);
+	nfsm_v4build_open(&cp, &opena);
+	nfsm_v4build_getattr(&cp, &getattr);
+	nfsm_v4build_getfh(&cp, &getfh);
+	nfsm_v4build_finalize(&cp);
+
+	nfsm_request(vp != NULL ? vp : dvp, NFSV4PROC_COMPOUND, td, cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_open(&cp, &opena);
+	nfsm_v4dissect_getattr(&cp, &getattr);
+	nfsm_v4dissect_getfh(&cp, &getfh);
+
+	error = nfs_v4postop(&cp, error);
+
+	if (opena.rflags & NFSV4OPENRES_CONFIRM) {
+		error = nfs4_open_confirm(vp ? vp : dvp, &cp, &opena, &getfh, cred, td);
+		if (error != 0)
+			goto nfsmout;
+	}
+
+	if (vp == NULL) {
+		/* New file */
+		error = nfs_nget(dvp->v_mount, &getfh.fh_val,
+		    getfh.fh_len, &np);
+		if (error != 0)
+			goto nfsmout;
+
+		vp = NFSTOV(np);
+		np->n_dvp = dvp;
+		np->n_namelen = cnp->cn_namelen; /* XXX memory leaks on these; track! */
+		if (np->n_name != NULL)
+			FREE(np->n_name, M_NFSREQ);
+		MALLOC(np->n_name, u_char *, np->n_namelen + 1, M_NFSREQ, M_WAITOK);
+		bcopy(cnp->cn_nameptr, np->n_name, np->n_namelen);
+		np->n_name[np->n_namelen] = '\0';
+		if (flags & FWRITE)
+			np->n_wfc = *fcp;
+		else
+			np->n_rfc = *fcp;
+
+		/*printf("opened new file %s\n", np->n_name);*/
+
+		nfs4_vnop_loadattrcache(vp, &getattr.fa, NULL);
+		*vpp = vp;
+	} else {
+		/*printf("openend \"old\" %s\n", np->n_name != NULL ? np->n_name : "");*/
+
+		if (flags & O_TRUNC && np->n_size != 0) {
+			struct vattr va;
+
+			VATTR_NULL(&va);
+			va.va_size = 0;
+			error = nfs4_setattrrpc(vp, &va,
+			    cnp->cn_cred, cnp->cn_thread);
+		}
+		np->n_attrstamp = 0;
+	}
+
+ nfsmout:
+	if (mrep != NULL)
+		m_freem(mrep);
+
+	return (error);
+}
+
+static int
+nfs4_open_confirm(struct vnode *vp, struct nfs4_compound *cpp,
+    struct nfs4_oparg_open *openap, struct nfs4_oparg_getfh *gfh,
+    struct ucred *cred, struct thread *td)
+{
+	caddr_t bpos, dpos;
+	int error = 0;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+
+	nfs_v4initcompound(cpp);
+	cpp->nmp = VFSTONFS(vp->v_mount);
+
+	mreq = nfsm_reqhead(vp, NFSV4PROC_COMPOUND, 0);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	nfsm_v4build_compound(cpp, "nfs4_open_confirm()");
+	nfsm_v4build_putfh_nv(cpp, gfh);
+	nfsm_v4build_open_confirm(cpp, openap);
+	nfsm_v4build_finalize(cpp);
+
+	nfsm_request(vp, NFSV4PROC_COMPOUND, td, cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(cpp);
+	nfsm_v4dissect_putfh(cpp);
+	nfsm_v4dissect_open_confirm(cpp, openap);
+
+ nfsmout:
+	error = nfs_v4postop(cpp, error);
+
+	if (mrep != NULL)
+		m_freem(mrep);
+
+	return (error);
+}
+
+
+/*
+ * nfs open vnode op
+ * Check to see if the type is ok
+ * and that deletion is not in progress.
+ * For paged in text files, you will need to flush the page cache
+ * if consistency is lost.
+ */
+/* ARGSUSED */
+static int
+nfs4_open(struct vop_open_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+	struct nfsnode *np = VTONFS(vp);
+	enum vtype vtype = vp->v_type;
+	int mode = ap->a_mode;
+	struct componentname cn;
+
+	if (vtype != VREG) {
+		if (vtype != VDIR && vtype != VLNK) {
+#ifdef DIAGNOSTIC
+			printf("open eacces vtyp=%d\n", vp->v_type);
+#endif
+			return (EACCES);
+		} else
+			return (0);
+	}
+
+	if (np->n_flag & NCREATED) {
+		np->n_flag &= ~NCREATED;
+		return (0);
+	}
+
+	cn.cn_nameptr = np->n_name;
+	cn.cn_namelen = np->n_namelen;
+	cn.cn_cred = ap->a_cred;
+	cn.cn_thread = ap->a_td;
+
+	return (nfs4_openrpc(np->n_dvp, &vp, &cn, mode, NULL));
+}
+
+static int
+nfs4_closerpc(struct vnode *vp, struct ucred *cred, struct thread *td, int flags)
+{
+	caddr_t bpos, dpos;
+	int error = 0;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	struct nfs4_fctx *fcp;
+	struct nfs4_compound cp;
+	struct nfsnode *np = VTONFS(vp);
+
+	fcp = flags & FWRITE ? &np->n_wfc : &np->n_rfc;
+
+	nfs_v4initcompound(&cp);
+
+	if (--fcp->refcnt != 0)
+		return (0);
+
+	/*printf("closing %s\n", np->n_name != NULL ? np->n_name : "");*/
+
+	cp.fcp = fcp;
+
+	mreq = nfsm_reqhead(vp, NFSV4PROC_COMPOUND, 0);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	nfsm_v4build_compound(&cp, "nfs4_closerpc()");
+	nfsm_v4build_putfh(&cp, vp);
+	nfsm_v4build_close(&cp, fcp);
+	nfsm_v4build_finalize(&cp);
+
+	nfsm_request(vp, NFSV4PROC_COMPOUND, td, cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_close(&cp, fcp);
+
+ nfsmout:
+	error = nfs_v4postop(&cp, error);
+
+	if (mrep != NULL)
+		m_freem(mrep);
+
+	return (error);
+}
+
+/*
+ * nfs close vnode op
+ * What an NFS client should do upon close after writing is a debatable issue.
+ * Most NFS clients push delayed writes to the server upon close, basically for
+ * two reasons:
+ * 1 - So that any write errors may be reported back to the client process
+ *     doing the close system call. By far the two most likely errors are
+ *     NFSERR_NOSPC and NFSERR_DQUOT to indicate space allocation failure.
+ * 2 - To put a worst case upper bound on cache inconsistency between
+ *     multiple clients for the file.
+ * There is also a consistency problem for Version 2 of the protocol w.r.t.
+ * not being able to tell if other clients are writing a file concurrently,
+ * since there is no way of knowing if the changed modify time in the reply
+ * is only due to the write for this client.
+ * (NFS Version 3 provides weak cache consistency data in the reply that
+ *  should be sufficient to detect and handle this case.)
+ *
+ * The current code does the following:
+ * for NFS Version 2 - play it safe and flush/invalidate all dirty buffers
+ * for NFS Version 3 - flush dirty buffers to the server but don't invalidate
+ *                     or commit them (this satisfies 1 and 2 except for the
+ *                     case where the server crashes after this close but
+ *                     before the commit RPC, which is felt to be "good
+ *                     enough". Changing the last argument to nfs_flush() to
+ *                     a 1 would force a commit operation, if it is felt a
+ *                     commit is necessary now.
+ */
+/* ARGSUSED */
+static int
+nfs4_close(struct vop_close_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+	struct nfsnode *np = VTONFS(vp);
+	int error = 0;
+
+	if (vp->v_type != VREG)
+		return (0);
+
+	if (np->n_flag & NMODIFIED) {
+		if (NFS_ISV3(vp)) {
+			/*
+			 * Under NFSv3 we have dirty buffers to
+			 * dispose of.  We must flush them to the NFS
+			 * server.  We have the option of waiting all
+			 * the way through the commit rpc or just
+			 * waiting for the initial write.  The default
+			 * is to only wait through the initial write
+			 * so the data is in the server's cache, which
+			 * is roughly similar to the state a standard
+			 * disk subsystem leaves the file in on
+			 * close().
+			 *
+			 * We cannot clear the NMODIFIED bit in
+			 * np->n_flag due to potential races with
+			 * other processes, and certainly cannot clear
+			 * it if we don't commit.
+			 */
+			int cm = nfsv3_commit_on_close ? 1 : 0;
+			error = nfs4_flush(vp, ap->a_cred, MNT_WAIT, ap->a_td, cm);
+			/* np->n_flag &= ~NMODIFIED; */
+		} else {
+			vn_lock(vp, LK_EXCLUSIVE | LK_RETRY, ap->a_td);
+			error = nfs_vinvalbuf(vp, V_SAVE, ap->a_cred, ap->a_td, 1);
+			VOP_UNLOCK(vp, 0, ap->a_td);
+		}
+		np->n_attrstamp = 0;
+	}
+
+	error = nfs4_closerpc(vp, ap->a_cred, ap->a_td, ap->a_fflag);
+
+	if (!error && np->n_flag & NWRITEERR) {
+		np->n_flag &= ~NWRITEERR;
+		error = np->n_error;
+	}
+	return (error);
+}
+
+/*
+ * nfs getattr call from vfs.
+ */
+static int
+nfs4_getattr(struct vop_getattr_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+	struct nfsnode *np = VTONFS(vp);
+	caddr_t bpos, dpos;
+	int error = 0;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	struct nfs4_oparg_getattr ga;
+	struct nfs4_compound cp;
+
+	/*
+	 * Update local times for special files.
+	 */
+	if (np->n_flag & (NACC | NUPD))
+		np->n_flag |= NCHG;
+	/*
+	 * First look in the cache.
+	 */
+	if (nfs_getattrcache(vp, ap->a_vap) == 0)
+		return (0);
+
+	nfsstats.rpccnt[NFSPROC_GETATTR]++;
+
+	mreq = nfsm_reqhead(vp, NFSV4PROC_COMPOUND, NFSX_FH(1));
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	ga.bm = &nfsv4_getattrbm;
+	nfs_v4initcompound(&cp);
+
+	nfsm_v4build_compound(&cp, "nfs4_getattr()");
+	nfsm_v4build_putfh(&cp, vp);
+	nfsm_v4build_getattr(&cp, &ga);
+	nfsm_v4build_finalize(&cp);
+
+	nfsm_request(vp, NFSV4PROC_COMPOUND, ap->a_td, ap->a_cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_getattr(&cp, &ga);
+
+	nfs4_vnop_loadattrcache(vp, &ga.fa, ap->a_vap);
+
+nfsmout:
+	error = nfs_v4postop(&cp, error);
+
+	if (mrep != NULL)
+		m_freem(mrep);
+	return (error);
+}
+
+/*
+ * nfs setattr call.
+ */
+static int
+nfs4_setattr(struct vop_setattr_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+	struct nfsnode *np = VTONFS(vp);
+	struct vattr *vap = ap->a_vap;
+	int error = 0;
+	u_quad_t tsize;
+
+#ifndef nolint
+	tsize = (u_quad_t)0;
+#endif
+
+	/*
+	 * Setting of flags is not supported.
+	 */
+	if (vap->va_flags != VNOVAL)
+		return (EOPNOTSUPP);
+
+	/*
+	 * Disallow write attempts if the filesystem is mounted read-only.
+	 */
+  	if ((vap->va_flags != VNOVAL || vap->va_uid != (uid_t)VNOVAL ||
+	    vap->va_gid != (gid_t)VNOVAL || vap->va_atime.tv_sec != VNOVAL ||
+	    vap->va_mtime.tv_sec != VNOVAL || vap->va_mode != (mode_t)VNOVAL) &&
+	    (vp->v_mount->mnt_flag & MNT_RDONLY))
+		return (EROFS);
+	if (vap->va_size != VNOVAL) {
+ 		switch (vp->v_type) {
+ 		case VDIR:
+ 			return (EISDIR);
+ 		case VCHR:
+ 		case VBLK:
+ 		case VSOCK:
+ 		case VFIFO:
+			if (vap->va_mtime.tv_sec == VNOVAL &&
+			    vap->va_atime.tv_sec == VNOVAL &&
+			    vap->va_mode == (mode_t)VNOVAL &&
+			    vap->va_uid == (uid_t)VNOVAL &&
+			    vap->va_gid == (gid_t)VNOVAL)
+				return (0);
+ 			vap->va_size = VNOVAL;
+ 			break;
+ 		default:
+			/*
+			 * Disallow write attempts if the filesystem is
+			 * mounted read-only.
+			 */
+			if (vp->v_mount->mnt_flag & MNT_RDONLY)
+				return (EROFS);
+
+			/*
+			 *  We run vnode_pager_setsize() early (why?),
+			 * we must set np->n_size now to avoid vinvalbuf
+			 * V_SAVE races that might setsize a lower
+			 * value.
+			 */
+
+			tsize = np->n_size;
+			error = nfs_meta_setsize(vp, ap->a_cred, 
+						ap->a_td, vap->va_size);
+
+ 			if (np->n_flag & NMODIFIED) {
+ 			    if (vap->va_size == 0)
+ 				error = nfs_vinvalbuf(vp, 0,
+ 					ap->a_cred, ap->a_td, 1);
+ 			    else
+ 				error = nfs_vinvalbuf(vp, V_SAVE,
+ 					ap->a_cred, ap->a_td, 1);
+ 			    if (error) {
+				vnode_pager_setsize(vp, np->n_size);
+ 				return (error);
+			    }
+ 			}
+			/*
+			 * np->n_size has already been set to vap->va_size
+			 * in nfs_meta_setsize(). We must set it again since
+			 * nfs_loadattrcache() could be called through
+			 * nfs_meta_setsize() and could modify np->n_size.
+			 */
+ 			np->n_vattr.va_size = np->n_size = vap->va_size;
+  		};
+  	} else if ((vap->va_mtime.tv_sec != VNOVAL ||
+		vap->va_atime.tv_sec != VNOVAL) && (np->n_flag & NMODIFIED) &&
+		vp->v_type == VREG &&
+  		(error = nfs_vinvalbuf(vp, V_SAVE, ap->a_cred,
+		 ap->a_td, 1)) == EINTR)
+		return (error);
+	error = nfs4_setattrrpc(vp, vap, ap->a_cred, ap->a_td);
+	if (error && vap->va_size != VNOVAL) {
+		np->n_size = np->n_vattr.va_size = tsize;
+		vnode_pager_setsize(vp, np->n_size);
+	}
+	return (error);
+}
+
+/*
+ * Do an nfs setattr rpc.
+ */
+static int
+nfs4_setattrrpc(struct vnode *vp, struct vattr *vap, struct ucred *cred,
+    struct thread *td)
+{
+	caddr_t bpos, dpos;
+	int error = 0;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	struct nfs4_compound cp;
+	struct nfs4_oparg_getattr ga;
+	struct nfsnode *np = VTONFS(vp);
+	struct nfs4_fctx *fcp = &np->n_wfc;
+
+	nfsstats.rpccnt[NFSPROC_SETATTR]++;
+	mreq = nfsm_reqhead(vp, NFSV4PROC_COMPOUND, 0);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	ga.bm = &nfsv4_getattrbm;
+	nfs_v4initcompound(&cp);
+
+	nfsm_v4build_compound(&cp, "nfs4_setattrrpc");
+	nfsm_v4build_putfh(&cp, vp);
+	nfsm_v4build_setattr(&cp, vap, fcp);
+	nfsm_v4build_getattr(&cp, &ga);
+	nfsm_v4build_finalize(&cp);
+
+	nfsm_request(vp, NFSV4PROC_COMPOUND, td, cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_setattr(&cp);
+	nfsm_v4dissect_getattr(&cp, &ga);
+
+	nfs4_vnop_loadattrcache(vp, &ga.fa, NULL);
+
+	/* XXX -- need to implement this in nfs4_setattr*/
+	if (np->n_flag & NTRUNCATE) {
+		error = nfs4_closerpc(vp, cred, td, FWRITE);
+		np->n_flag &= ~NTRUNCATE;
+	}
+
+nfsmout:
+	error = nfs_v4postop(&cp, error);
+
+	if (mrep != NULL)
+		m_freem(mrep);
+	
+	return (error);
+}
+
+/*
+ * nfs lookup call, one step at a time...
+ * First look in cache
+ * If not found, unlock the directory nfsnode and do the rpc
+ */
+static int
+nfs4_lookup(struct vop_lookup_args *ap)
+{
+	struct componentname *cnp = ap->a_cnp;
+	struct vnode *dvp = ap->a_dvp;
+	struct vnode **vpp = ap->a_vpp;
+	int isdot, flags = cnp->cn_flags;
+	struct vnode *newvp;
+	struct nfsmount *nmp;
+	caddr_t bpos, dpos;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	long len;
+	nfsfh_t *fhp;
+	struct nfsnode *np;
+	int lockparent, wantparent, error = 0, fhsize;
+	struct thread *td = cnp->cn_thread;
+	struct nfs4_compound cp;
+	struct nfs4_oparg_getattr ga, dga;
+	struct nfs4_oparg_lookup l;
+	struct nfs4_oparg_getfh gfh;
+
+	*vpp = NULLVP;
+	cnp->cn_flags &= ~PDIRUNLOCK;
+	if ((flags & ISLASTCN) && (dvp->v_mount->mnt_flag & MNT_RDONLY) &&
+	    (cnp->cn_nameiop == DELETE || cnp->cn_nameiop == RENAME))
+		return (EROFS);
+	if (dvp->v_type != VDIR)
+		return (ENOTDIR);
+	lockparent = flags & LOCKPARENT;
+	wantparent = flags & (LOCKPARENT|WANTPARENT);
+	nmp = VFSTONFS(dvp->v_mount);
+	np = VTONFS(dvp);
+
+	isdot = cnp->cn_namelen == 1 && cnp->cn_nameptr[0] == '.';
+
+	if ((error = cache_lookup(dvp, vpp, cnp)) && error != ENOENT) {
+		struct vattr vattr;
+		int vpid;
+
+		if ((error = VOP_ACCESS(dvp, VEXEC, cnp->cn_cred, td)) != 0) {
+			*vpp = NULLVP;
+			return (error);
+		}
+
+		vhold(*vpp);
+		newvp = *vpp;
+		vpid = newvp->v_id;
+		/*
+		 * See the comment starting `Step through' in ufs/ufs_lookup.c
+		 * for an explanation of the locking protocol
+		 */
+		if (dvp == newvp) {
+			VREF(newvp);
+			error = 0;
+		} else if (flags & ISDOTDOT) {
+			VOP_UNLOCK(dvp, 0, td);
+			cnp->cn_flags |= PDIRUNLOCK;
+			error = vget(newvp, LK_EXCLUSIVE, td);
+			if (!error && lockparent && (flags & ISLASTCN)) {
+				error = vn_lock(dvp, LK_EXCLUSIVE, td);
+				if (error == 0)
+					cnp->cn_flags &= ~PDIRUNLOCK;
+			}
+		} else {
+			error = vget(newvp, LK_EXCLUSIVE, td);
+			if (!lockparent || error || !(flags & ISLASTCN)) {
+				VOP_UNLOCK(dvp, 0, td);
+				cnp->cn_flags |= PDIRUNLOCK;
+			}
+		}
+		if (!error) {
+			if (vpid == newvp->v_id) {
+			   if (!VOP_GETATTR(newvp, &vattr, cnp->cn_cred, td)
+			    && vattr.va_ctime.tv_sec == VTONFS(newvp)->n_ctime) {
+				nfsstats.lookupcache_hits++;
+				if (cnp->cn_nameiop != LOOKUP &&
+				    (flags & ISLASTCN))
+					cnp->cn_flags |= SAVENAME;
+				vdrop(newvp);
+				return (0);
+			   }
+			   cache_purge(newvp);
+			}
+			vput(newvp);
+			if (lockparent && dvp != newvp && (flags & ISLASTCN))
+				VOP_UNLOCK(dvp, 0, td);
+		}
+		vdrop(newvp);
+		error = vn_lock(dvp, LK_EXCLUSIVE, td);
+		*vpp = NULLVP;
+		if (error) {
+			cnp->cn_flags |= PDIRUNLOCK;
+			return (error);
+		}
+		cnp->cn_flags &= ~PDIRUNLOCK;
+	}
+
+	error = 0;
+	newvp = NULLVP;
+	nfsstats.lookupcache_misses++;
+	nfsstats.rpccnt[NFSPROC_LOOKUP]++;
+
+	len = cnp->cn_namelen;
+	mreq = nfsm_reqhead(NULL, NFSV4PROC_COMPOUND, 0);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	ga.bm = &nfsv4_getattrbm;
+	dga.bm = &nfsv4_getattrbm;
+	nfs_v4initcompound(&cp);
+
+	nfsm_v4build_compound(&cp, "nfs4_lookup()");
+	nfsm_v4build_putfh(&cp, dvp);
+	nfsm_v4build_getattr(&cp, &dga);
+	if (flags & ISDOTDOT)
+		nfsm_v4build_lookupp(&cp);
+	else if (!isdot) {
+		l.name = cnp->cn_nameptr;
+		l.namelen = len;
+		nfsm_v4build_lookup(&cp, &l);
+	}
+	nfsm_v4build_getattr(&cp, &ga);
+	nfsm_v4build_getfh(&cp, &gfh);
+	nfsm_v4build_finalize(&cp);
+
+	nfsm_request(dvp, NFSV4PROC_COMPOUND, cnp->cn_thread, cnp->cn_cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_getattr(&cp, &dga);
+	if (flags & ISDOTDOT)
+		nfsm_v4dissect_lookupp(&cp);
+	else if (!isdot)
+		nfsm_v4dissect_lookup(&cp);
+	nfsm_v4dissect_getattr(&cp, &ga);
+	nfsm_v4dissect_getfh(&cp, &gfh);
+
+	nfs4_vnop_loadattrcache(dvp, &dga.fa, NULL);
+	fhp = &gfh.fh_val;
+	fhsize = gfh.fh_len;
+
+	/*
+	 * Handle RENAME case...
+	 */
+	if (cnp->cn_nameiop == RENAME && wantparent && (flags & ISLASTCN)) {
+		if (NFS_CMPFH(np, fhp, fhsize))
+			return (EISDIR);
+
+		error = nfs_nget(dvp->v_mount, fhp, fhsize, &np);
+		if (error)
+			return (error);
+
+		newvp = NFSTOV(np);
+
+		nfs4_vnop_loadattrcache(newvp, &ga.fa, NULL);
+
+		*vpp = newvp;
+		cnp->cn_flags |= SAVENAME;
+		if (!lockparent) {
+			VOP_UNLOCK(dvp, 0, td);
+			cnp->cn_flags |= PDIRUNLOCK;
+		}
+		return (0);
+	}
+
+	if (flags & ISDOTDOT) {
+		VOP_UNLOCK(dvp, 0, td);
+
+		error = nfs_nget(dvp->v_mount, fhp, fhsize, &np);
+		if (error) {
+			vn_lock(dvp, LK_EXCLUSIVE | LK_RETRY, td);
+			return (error);
+		}
+		newvp = NFSTOV(np);
+
+		nfs4_vnop_loadattrcache(newvp, &ga.fa, NULL);
+
+		if (lockparent && (flags & ISLASTCN)) {
+			error = vn_lock(dvp, LK_EXCLUSIVE, td);
+			if (error) {
+				cnp->cn_flags |= PDIRUNLOCK;
+		    		vput(newvp);
+				return (error);
+			}
+		} else
+			cnp->cn_flags |= PDIRUNLOCK;
+	} else if (NFS_CMPFH(np, fhp, fhsize)) {
+		VREF(dvp);
+		newvp = dvp;
+	} else {
+		error = nfs_nget(dvp->v_mount, fhp, fhsize, &np);
+		if (error)
+			return (error);
+
+		if (!lockparent || !(flags & ISLASTCN)) {
+			cnp->cn_flags |= PDIRUNLOCK;
+			VOP_UNLOCK(dvp, 0, td);
+		}
+		newvp = NFSTOV(np);
+
+		/* Fill in np used by open. */
+		np->n_dvp = dvp;
+		np->n_namelen = cnp->cn_namelen;
+		if (np->n_name != NULL)
+			FREE(np->n_name, M_NFSREQ);
+		MALLOC(np->n_name, u_char *, np->n_namelen + 1, M_NFSREQ, M_WAITOK);
+		bcopy(cnp->cn_nameptr, np->n_name, np->n_namelen);
+		np->n_name[np->n_namelen] = '\0';
+
+		nfs4_vnop_loadattrcache(newvp, &ga.fa, NULL);
+	}
+
+	if (cnp->cn_nameiop != LOOKUP && (flags & ISLASTCN))
+		cnp->cn_flags |= SAVENAME;
+	if ((cnp->cn_flags & MAKEENTRY) &&
+	    (cnp->cn_nameiop != DELETE || !(flags & ISLASTCN))) {
+		np->n_ctime = np->n_vattr.va_ctime.tv_sec;
+		cache_enter(dvp, newvp, cnp);
+	}
+	*vpp = newvp;
+	m_freem(mrep);
+nfsmout:
+	error = nfs_v4postop(&cp, error);
+
+	if (error) {
+		if (newvp != NULLVP) {
+			vrele(newvp);
+			*vpp = NULLVP;
+		}
+		if ((cnp->cn_nameiop == CREATE || cnp->cn_nameiop == RENAME) &&
+		    (flags & ISLASTCN) && error == ENOENT) {
+			if (!lockparent) {
+				VOP_UNLOCK(dvp, 0, td);
+				cnp->cn_flags |= PDIRUNLOCK;
+			}
+			if (dvp->v_mount->mnt_flag & MNT_RDONLY)
+				error = EROFS;
+			else
+				error = EJUSTRETURN;
+		}
+		if (cnp->cn_nameiop != LOOKUP && (flags & ISLASTCN))
+			cnp->cn_flags |= SAVENAME;
+	}
+
+	return (error);
+}
+
+/*
+ * nfs read call.
+ * Just call nfs_bioread() to do the work.
+ */
+static int
+nfs4_read(struct vop_read_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+
+	switch (vp->v_type) {
+	case VREG:
+		return (nfs_bioread(vp, ap->a_uio, ap->a_ioflag, ap->a_cred));
+	case VDIR:
+		return (EISDIR);
+	default:
+		return (EOPNOTSUPP);
+	}
+}
+
+/*
+ * nfs readlink call
+ */
+static int
+nfs4_readlink(struct vop_readlink_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+
+	if (vp->v_type != VLNK)
+		return (EINVAL);
+	return (nfs_bioread(vp, ap->a_uio, 0, ap->a_cred));
+}
+
+/*
+ * Do a readlink rpc.
+ * Called by nfs_doio() from below the buffer cache.
+ */
+int
+nfs4_readlinkrpc(struct vnode *vp, struct uio *uiop, struct ucred *cred)
+{
+	caddr_t bpos, dpos;
+	int error = 0;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	struct nfs4_compound cp;
+
+	nfsstats.rpccnt[NFSPROC_READLINK]++;
+
+	mreq = nfsm_reqhead(vp, NFSV4PROC_COMPOUND, 0);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	nfs_v4initcompound(&cp);
+
+	nfsm_v4build_compound(&cp, "nfs4_readlinkrpc()");
+	nfsm_v4build_putfh(&cp, vp);
+	nfsm_v4build_readlink(&cp);
+	nfsm_v4build_finalize(&cp);
+
+	nfsm_request(vp, NFSV4PROC_COMPOUND, uiop->uio_td, cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_readlink(&cp, uiop);
+
+nfsmout:
+	error = nfs_v4postop(&cp, error);
+
+	if (m_freem != NULL)
+		m_freem(mrep);
+	return (error);
+}
+
+/*
+ * nfs read rpc call
+ * Ditto above
+ */
+int
+nfs4_readrpc(struct vnode *vp, struct uio *uiop, struct ucred *cred)
+{
+	caddr_t bpos, dpos;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	struct nfsmount *nmp;
+	int error = 0, len, tsiz;
+	struct nfs4_compound cp;
+	struct nfs4_oparg_read read;
+	struct nfsnode *np = VTONFS(vp);
+
+	nmp = VFSTONFS(vp->v_mount);
+	tsiz = uiop->uio_resid;
+	if (uiop->uio_offset + tsiz > nmp->nm_maxfilesize)
+		return (EFBIG);
+
+	if (tsiz == 0)
+		return (0);
+
+	read.uiop = uiop;
+	read.fcp = np->n_rfc.refcnt > 0 ? &np->n_rfc : &np->n_wfc;
+
+	while (tsiz > 0) {
+		nfsstats.rpccnt[NFSPROC_READ]++;
+		len = (tsiz > nmp->nm_rsize) ? nmp->nm_rsize : tsiz;
+
+		read.off = uiop->uio_offset;
+		read.maxcnt = len;
+		nfs_v4initcompound(&cp);
+
+		mreq = nfsm_reqhead(vp, NFSV4PROC_COMPOUND, 0);
+		mb = mreq;
+		bpos = mtod(mb, caddr_t);
+
+		nfsm_v4build_compound(&cp, "nfs4_readrpc()");
+		nfsm_v4build_putfh(&cp, vp);
+		nfsm_v4build_read(&cp, &read);
+		nfsm_v4build_finalize(&cp);
+
+		nfsm_request(vp, NFSV4PROC_COMPOUND, uiop->uio_td, cred);
+		if (error != 0) {
+			error = nfs_v4postop(&cp, error);
+			goto nfsmout;
+		}
+
+		nfsm_v4dissect_compound(&cp);
+		nfsm_v4dissect_putfh(&cp);
+		nfsm_v4dissect_read(&cp, &read);
+
+		if (read.eof || read.retlen == 0)
+			tsiz = 0;
+		else
+			tsiz -= read.retlen;
+
+		error = nfs_v4postop(&cp, error);
+
+		m_freem(mrep);
+		mrep = NULL;
+	}
+nfsmout:
+	if (mrep != NULL)
+		m_freem(mrep);
+	
+	return (error);
+}
+
+/*
+ * nfs write call
+ */
+int
+nfs4_writerpc(struct vnode *vp, struct uio *uiop, struct ucred *cred,
+    int *iomode, int *must_commit)
+{
+	int32_t backup;
+	caddr_t bpos, dpos;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	struct nfsmount *nmp = VFSTONFS(vp->v_mount);
+	int error = 0, len, tsiz, wccflag = 1, rlen;
+	struct nfs4_compound cp;
+	struct nfs4_oparg_write write;
+	nfsv4stablehow commit, committed = NSHFILESYNC;
+	caddr_t verf;
+	struct nfsnode *np = VTONFS(vp);
+
+#ifndef DIAGNOSTIC
+	if (uiop->uio_iovcnt != 1)
+		panic("nfs: writerpc iovcnt > 1");
+#endif
+	*must_commit = 0;
+	tsiz = uiop->uio_resid;
+	if (uiop->uio_offset + tsiz > nmp->nm_maxfilesize)
+		return (EFBIG);
+
+	if (tsiz == 0)
+		return (0);
+
+	write.stable = (nfsv4stablehow)*iomode;
+	write.uiop = uiop;
+	write.fcp = &np->n_wfc;
+
+	while (tsiz > 0) {
+		nfsstats.rpccnt[NFSPROC_WRITE]++;
+		len = (tsiz > nmp->nm_wsize) ? nmp->nm_wsize : tsiz;
+
+		write.off = uiop->uio_offset;
+		write.cnt = len;
+		nfs_v4initcompound(&cp);
+
+		mreq = nfsm_reqhead(vp, NFSV4PROC_COMPOUND, 0);
+		mb = mreq;
+		bpos = mtod(mb, caddr_t);
+
+		nfsm_v4build_compound(&cp, "nfs4_writerpc()");
+		nfsm_v4build_putfh(&cp, vp);
+		nfsm_v4build_write(&cp, &write);
+		nfsm_v4build_finalize(&cp);
+
+		nfsm_request(vp, NFSV4PROC_COMPOUND, uiop->uio_td, cred);
+		if (error != 0) {
+			error = nfs_v4postop(&cp, error);
+			goto nfsmout;
+		}
+
+		nfsm_v4dissect_compound(&cp);
+		nfsm_v4dissect_putfh(&cp);
+		nfsm_v4dissect_write(&cp, &write);
+
+		rlen = write.retlen;
+		if (rlen == 0) {
+			error = NFSERR_IO;
+			break;
+		} else if (rlen < len) {
+			backup = len - rlen;
+			(char *)uiop->uio_iov->iov_base -= backup;
+			uiop->uio_iov->iov_len += backup;
+                        uiop->uio_offset -= backup;
+                        uiop->uio_resid += backup;
+                        len = rlen;
+		}
+
+		commit = write.committed;
+
+		if (committed == NSHFILESYNC ||
+		    (committed = NSHDATASYNC && commit == NSHUNSTABLE))
+			committed = commit;
+
+		verf = (caddr_t)write.wverf;
+
+                if ((nmp->nm_flag & NFSSTA_HASWRITEVERF) == 0) {
+                        bcopy(verf, nmp->nm_verf, NFSX_V4VERF);
+                        nmp->nm_flag |= NFSMNT_HASWRITEVERF;
+                } else if (bcmp(verf, nmp->nm_verf, NFSX_V4VERF)) {
+                        *must_commit = 1;
+                        bcopy(verf, nmp->nm_verf, NFSX_V4VERF);
+                }
+
+		/* XXX wccflag */
+		if (wccflag)
+			VTONFS(vp)->n_mtime = VTONFS(vp)->n_vattr.va_mtime.tv_sec;
+
+		error = nfs_v4postop(&cp, error);
+
+		m_freem(mrep);
+		mrep = NULL;
+		if (error)
+			break;
+		tsiz -= len;
+	}
+nfsmout:
+	if (mrep != NULL)
+		m_freem(mrep);
+	*iomode = committed;
+	if (error)
+		uiop->uio_resid = tsiz;
+	return (error);
+}
+
+/* ARGSUSED */
+static int
+nfs4_mknod(struct vop_mknod_args *ap)
+{
+	struct vattr *vap = ap->a_vap;
+	struct vnode *newvp = NULL;
+	int error;
+
+	error = nfs4_createrpc(ap->a_dvp, &newvp,
+	    ap->a_cnp, (nfstype)vap->va_type, vap, NULL);
+
+	/* XXX - is this actually referenced here? */
+	if (error == 0) {
+		*ap->a_vpp = newvp;
+		vrele(newvp);
+	}
+
+	return (error);
+}
+
+static int
+nfs4_createrpc(struct vnode *dvp, struct vnode **vpp, struct componentname *cnp,
+    nfstype ftype, struct vattr *vap, char *linktarget)
+{
+	struct nfsnode *dnp = VTONFS(dvp);
+	struct nfsnode *np = NULL;
+	struct vnode *newvp = NULL;
+	struct nfs4_compound cp;
+	struct nfs4_oparg_create c;
+	struct nfs4_oparg_getattr ga;
+	struct nfs4_oparg_getfh gfh;
+	caddr_t bpos, dpos;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	int error = 0;
+
+	nfsstats.rpccnt[NFSPROC_CREATE]++;
+
+	mreq = nfsm_reqhead(dvp, NFSV4PROC_COMPOUND, 0);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	bzero(&c, sizeof(c));
+	bzero(&ga, sizeof(ga));
+
+	c.type = ftype;
+	c.vap = vap;
+	c.linktext = linktarget;
+	c.name = cnp->cn_nameptr;
+	c.namelen = cnp->cn_namelen;
+
+	ga.bm = &nfsv4_getattrbm;
+	nfs_v4initcompound(&cp);
+
+	nfsm_v4build_compound(&cp, "nfs4_createrpc()");
+	nfsm_v4build_putfh(&cp, dvp);
+	nfsm_v4build_create(&cp, &c);
+	nfsm_v4build_getattr(&cp, &ga);
+	nfsm_v4build_getfh(&cp, &gfh);	
+	nfsm_v4build_finalize(&cp); 
+
+	nfsm_request(dvp, NFSV4PROC_COMPOUND, cnp->cn_thread, cnp->cn_cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_create(&cp, &c);
+	nfsm_v4dissect_getattr(&cp, &ga);
+	nfsm_v4dissect_getfh(&cp, &gfh);	
+	
+	error = nfs_nget(dvp->v_mount, &gfh.fh_val, gfh.fh_len, &np);
+	if (error != 0)
+		goto nfsmout;
+
+	newvp = NFSTOV(np);
+	nfs4_vnop_loadattrcache(newvp, &ga.fa, NULL);
+
+	if (cnp->cn_flags & MAKEENTRY)
+		cache_enter(dvp, newvp, cnp);
+
+	dnp->n_flag |= NMODIFIED;
+	dnp->n_attrstamp = 0;
+
+ nfsmout:
+	error = nfs_v4postop(&cp, error);
+
+	if (mrep != NULL)
+		m_freem(mrep);
+
+	/* XXX */
+	/*FREE(cnp->cn_pnbuf, M_NAMEI);*/
+	if (error != 0 && newvp != NULL)
+		vrele(newvp);
+	else if (error == 0)
+		*vpp = newvp;
+
+	return (error);
+}
+
+static int
+nfs4_renamerpc(struct vnode *fdvp, const char *fnameptr, int fnamelen,
+    struct vnode *tdvp, const char *tnameptr, int tnamelen,
+    struct ucred *cred, struct thread *td)
+{
+
+	struct nfsnode *fnp = VTONFS(fdvp), *tnp = VTONFS(tdvp);
+	caddr_t bpos, dpos;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	struct nfs4_compound cp;
+	struct nfs4_oparg_rename r;
+	int error = 0;
+
+	nfsstats.rpccnt[NFSPROC_RENAME]++;
+
+	r.fname = fnameptr;
+	r.fnamelen = fnamelen;
+	r.tname = tnameptr;
+	r.tnamelen = tnamelen;
+	nfs_v4initcompound(&cp);
+
+	mreq = nfsm_reqhead(fdvp, NFSV4PROC_COMPOUND, 0);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	nfsm_v4build_compound(&cp, "nfs4_renamerpc()");
+	nfsm_v4build_putfh(&cp, fdvp);
+	nfsm_v4build_savefh(&cp);
+	nfsm_v4build_putfh(&cp, tdvp);
+	nfsm_v4build_rename(&cp, &r);
+	nfsm_v4build_finalize(&cp);
+
+	nfsm_request(fdvp, NFSV4PROC_COMPOUND, td, cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_savefh(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_rename(&cp);
+
+	/* XXX should this always be performed?  */
+	fnp->n_flag |= NMODIFIED;
+	tnp->n_flag |= NMODIFIED;
+	fnp->n_attrstamp = tnp->n_attrstamp = 0;
+
+ nfsmout:
+	error = nfs_v4postop(&cp, error);
+
+	if (mrep != NULL)
+		m_freem(mrep);
+
+	return (error);
+}
+
+/*
+ * nfs file create call
+ */
+static int
+nfs4_create(struct vop_create_args *ap)
+{
+	struct vnode *dvp = ap->a_dvp;
+	struct vattr *vap = ap->a_vap;
+	struct nfsnode *dnp = VTONFS(dvp);
+	struct componentname *cnp = ap->a_cnp;
+	struct vnode *newvp = NULL;
+	int error = 0, fmode = (O_CREAT | FREAD | FWRITE);
+	struct vattr vattr;
+
+	if ((error = VOP_GETATTR(dvp, &vattr, cnp->cn_cred, cnp->cn_thread)) != 0)
+		return (error);
+
+	if (vap->va_vaflags & VA_EXCLUSIVE)
+		fmode |= O_EXCL;
+
+	error = nfs4_openrpc(dvp, &newvp, cnp, fmode, vap);
+	if (error != 0)
+		goto out;
+
+	VTONFS(newvp)->n_flag |= NCREATED;
+
+	if (cnp->cn_flags & MAKEENTRY)
+		cache_enter(dvp, newvp, cnp);
+
+	*ap->a_vpp = newvp;
+
+	dnp->n_flag |= NMODIFIED;
+	dnp->n_attrstamp = 0;	/* XXX; wccflag */
+
+ out:
+	return (error);
+}
+
+/*
+ * nfs file remove call
+ * To try and make nfs semantics closer to ufs semantics, a file that has
+ * other processes using the vnode is renamed instead of removed and then
+ * removed later on the last close.
+ * - If v_usecount > 1
+ *	  If a rename is not already in the works
+ *	     call nfs4_sillyrename() to set it up
+ *     else
+ *	  do the remove rpc
+ */
+static int
+nfs4_remove(struct vop_remove_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+	struct vnode *dvp = ap->a_dvp;
+	struct componentname *cnp = ap->a_cnp;
+	struct nfsnode *np = VTONFS(vp);
+	int error = 0;
+	struct vattr vattr;
+
+#ifndef DIAGNOSTIC
+	if ((cnp->cn_flags & HASBUF) == 0)
+		panic("nfs4_remove: no name");
+	if (vrefcnt(vp) < 1)
+		panic("nfs4_remove: bad v_usecount");
+#endif
+	if (vp->v_type == VDIR)
+		error = EPERM;
+	else if (vrefcnt(vp) == 1 || (np->n_sillyrename &&
+	    VOP_GETATTR(vp, &vattr, cnp->cn_cred, cnp->cn_thread) == 0 &&
+	    vattr.va_nlink > 1)) {
+		/*
+		 * Purge the name cache so that the chance of a lookup for
+		 * the name succeeding while the remove is in progress is
+		 * minimized. Without node locking it can still happen, such
+		 * that an I/O op returns ESTALE, but since you get this if
+		 * another host removes the file..
+		 */
+		cache_purge(vp);
+		/*
+		 * throw away biocache buffers, mainly to avoid
+		 * unnecessary delayed writes later.
+		 */
+		error = nfs_vinvalbuf(vp, 0, cnp->cn_cred, cnp->cn_thread, 1);
+		/* Do the rpc */
+		if (error != EINTR)
+			error = nfs4_removerpc(dvp, cnp->cn_nameptr,
+				cnp->cn_namelen, cnp->cn_cred, cnp->cn_thread);
+		/*
+		 * Kludge City: If the first reply to the remove rpc is lost..
+		 *   the reply to the retransmitted request will be ENOENT
+		 *   since the file was in fact removed
+		 *   Therefore, we cheat and return success.
+		 */
+		if (error == ENOENT)
+			error = 0;
+	} else if (!np->n_sillyrename)
+		error = nfs4_sillyrename(dvp, vp, cnp);
+	np->n_attrstamp = 0;
+	return (error);
+}
+
+/*
+ * nfs file remove rpc called from nfs_inactive
+ */
+int
+nfs4_removeit(struct sillyrename *sp)
+{
+	/*
+	 * Make sure that the directory vnode is still valid.
+	 * XXX we should lock sp->s_dvp here.
+	 */
+	if (sp->s_dvp->v_type == VBAD)
+		return (0);
+	return (nfs4_removerpc(sp->s_dvp, sp->s_name, sp->s_namlen, sp->s_cred,
+		NULL));
+}
+
+/*
+ * Nfs remove rpc, called from nfs4_remove() and nfs4_removeit().
+ */
+static int
+nfs4_removerpc(struct vnode *dvp, const char *name, int namelen,
+    struct ucred *cred, struct thread *td)
+{
+	caddr_t bpos, dpos;
+	int error = 0;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	struct nfs4_compound cp;
+
+	nfsstats.rpccnt[NFSPROC_REMOVE]++;
+
+	mreq = nfsm_reqhead(dvp, NFSV4PROC_COMPOUND, 0);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	nfs_v4initcompound(&cp);
+
+	nfsm_v4build_compound(&cp, "nfs4_removerpc()");
+	nfsm_v4build_putfh(&cp, dvp);
+	nfsm_v4build_remove(&cp, name, namelen);
+	nfsm_v4build_finalize(&cp);
+
+	nfsm_request(dvp, NFSV4PROC_COMPOUND, td, cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_remove(&cp);
+
+ nfsmout:
+	error = nfs_v4postop(&cp, error);
+
+	if (mrep != NULL)
+		m_freem(mrep);
+
+	VTONFS(dvp)->n_flag |= NMODIFIED;
+	VTONFS(dvp)->n_attrstamp = 0; /* XXX wccflag */
+
+	return (error);
+}
+
+/*
+ * nfs file rename call
+ */
+static int
+nfs4_rename(struct vop_rename_args *ap)
+{
+	struct vnode *fvp = ap->a_fvp;
+	struct vnode *tvp = ap->a_tvp;
+	struct vnode *fdvp = ap->a_fdvp;
+	struct vnode *tdvp = ap->a_tdvp;
+	struct componentname *tcnp = ap->a_tcnp;
+	struct componentname *fcnp = ap->a_fcnp;
+	int error;
+
+ #ifndef DIAGNOSTIC
+	if ((tcnp->cn_flags & HASBUF) == 0 ||
+	    (fcnp->cn_flags & HASBUF) == 0)
+		panic("nfs4_rename: no name");
+#endif
+	/* Check for cross-device rename */
+	if ((fvp->v_mount != tdvp->v_mount) ||
+	    (tvp && (fvp->v_mount != tvp->v_mount))) {
+		error = EXDEV;
+		goto out;
+	}
+
+	if (fvp == tvp) {
+		printf("nfs4_rename: fvp == tvp (can't happen)\n");
+		error = 0;
+		goto out;
+	}
+	if ((error = vn_lock(fvp, LK_EXCLUSIVE, fcnp->cn_thread)) != 0)
+		goto out;
+
+	/*
+	 * We have to flush B_DELWRI data prior to renaming
+	 * the file.  If we don't, the delayed-write buffers
+	 * can be flushed out later after the file has gone stale
+	 * under NFSV3.  NFSV2 does not have this problem because
+	 * ( as far as I can tell ) it flushes dirty buffers more
+	 * often.
+	 */
+	VOP_FSYNC(fvp, fcnp->cn_cred, MNT_WAIT, fcnp->cn_thread);
+	VOP_UNLOCK(fvp, 0, fcnp->cn_thread);
+	if (tvp)
+	    VOP_FSYNC(tvp, tcnp->cn_cred, MNT_WAIT, tcnp->cn_thread);
+
+	/*
+	 * If the tvp exists and is in use, sillyrename it before doing the
+	 * rename of the new file over it.
+	 * XXX Can't sillyrename a directory.
+	 */
+	if (tvp && vrefcnt(tvp) > 1 && !VTONFS(tvp)->n_sillyrename &&
+		tvp->v_type != VDIR && !nfs4_sillyrename(tdvp, tvp, tcnp)) {
+		vput(tvp);
+		tvp = NULL;
+	}
+
+	error = nfs4_renamerpc(fdvp, fcnp->cn_nameptr, fcnp->cn_namelen,
+		tdvp, tcnp->cn_nameptr, tcnp->cn_namelen, tcnp->cn_cred,
+		tcnp->cn_thread);
+
+	if (fvp->v_type == VDIR) {
+		if (tvp != NULL && tvp->v_type == VDIR)
+			cache_purge(tdvp);
+		cache_purge(fdvp);
+	}
+
+out:
+	if (tdvp == tvp)
+		vrele(tdvp);
+	else
+		vput(tdvp);
+	if (tvp)
+		vput(tvp);
+	vrele(fdvp);
+	vrele(fvp);
+	/*
+	 * Kludge: Map ENOENT => 0 assuming that it is a reply to a retry.
+	 */
+	if (error == ENOENT)
+		error = 0;
+	return (error);
+}
+
+/*
+ * nfs file rename rpc called from nfs4_remove() above
+ */
+static int
+nfs4_renameit(struct vnode *sdvp, struct componentname *scnp,
+    struct sillyrename *sp)
+{
+	return (nfs4_renamerpc(sdvp, scnp->cn_nameptr, scnp->cn_namelen, sdvp,
+	    sp->s_name, sp->s_namlen, scnp->cn_cred, scnp->cn_thread));
+}
+
+/*
+ * nfs hard link create call
+ */
+static int
+nfs4_link(struct vop_link_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+	struct vnode *tdvp = ap->a_tdvp;
+	struct componentname *cnp = ap->a_cnp;
+	caddr_t bpos, dpos;
+	int error = 0;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	struct nfs4_compound cp;
+	struct nfs4_oparg_link l;
+
+	if (vp->v_mount != tdvp->v_mount) {
+		return (EXDEV);
+	}
+
+	/*
+	 * Push all writes to the server, so that the attribute cache
+	 * doesn't get "out of sync" with the server.
+	 * XXX There should be a better way!
+	 */
+	VOP_FSYNC(vp, cnp->cn_cred, MNT_WAIT, cnp->cn_thread);
+
+	nfsstats.rpccnt[NFSPROC_LINK]++;
+
+	l.name = cnp->cn_nameptr;
+	l.namelen = cnp->cn_namelen;
+	nfs_v4initcompound(&cp);
+
+	mreq = nfsm_reqhead(vp, NFSV4PROC_COMPOUND, 0);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	nfsm_v4build_compound(&cp, "nfs4_link()");
+	nfsm_v4build_putfh(&cp, vp);
+	nfsm_v4build_savefh(&cp);
+	nfsm_v4build_putfh(&cp, tdvp);
+	nfsm_v4build_link(&cp, &l);
+	nfsm_v4build_finalize(&cp);
+
+	nfsm_request(vp, NFSV4PROC_COMPOUND, cnp->cn_thread, cnp->cn_cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_savefh(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_link(&cp);
+
+	VTONFS(tdvp)->n_flag |= NMODIFIED;
+	VTONFS(vp)->n_attrstamp = 0;
+	VTONFS(tdvp)->n_attrstamp = 0;
+
+nfsmout:
+	error = nfs_v4postop(&cp, error);
+
+	if (mrep != NULL)
+		m_freem(mrep);
+
+	return (error);
+}
+
+/*
+ * nfs symbolic link create call
+ */
+static int
+nfs4_symlink(struct vop_symlink_args *ap)
+{
+	struct vnode *dvp = ap->a_dvp;
+	int error = 0;
+	struct vnode *newvp = NULL;
+
+	nfsstats.rpccnt[NFSPROC_SYMLINK]++;
+
+	error = nfs4_createrpc(ap->a_dvp, &newvp, ap->a_cnp, NFLNK,
+	    ap->a_vap, ap->a_target);
+
+	if (error != 0 && newvp != NULL)
+		vput(newvp);
+	else if (error == 0)
+		 *ap->a_vpp = newvp;
+
+	VTONFS(dvp)->n_flag |= NMODIFIED;
+	VTONFS(dvp)->n_attrstamp = 0; /* XXX wccflags */
+
+	return (error);
+}
+
+/*
+ * nfs make dir call
+ */
+static int
+nfs4_mkdir(struct vop_mkdir_args *ap)
+{
+	return (nfs4_createrpc(ap->a_dvp, ap->a_vpp, ap->a_cnp, NFDIR,
+		    ap->a_vap, NULL));
+}
+
+/*
+ * nfs remove directory call
+ */
+static int
+nfs4_rmdir(struct vop_rmdir_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+	struct vnode *dvp = ap->a_dvp;
+	struct nfsnode *dnp = VTONFS(dvp);
+	struct componentname *cnp = ap->a_cnp;
+	int error = 0;
+
+	if (dvp == vp)
+		return (EINVAL);
+
+	error = (nfs4_removerpc(dvp, cnp->cn_nameptr, cnp->cn_namelen, cnp->cn_cred,
+			       NULL));
+	if (error)
+		return (error);
+
+	dnp->n_flag |= NMODIFIED;
+	dnp->n_attrstamp = 0;
+	cache_purge(dvp);
+	cache_purge(vp);
+
+	return (error);
+}
+
+/*
+ * nfs readdir call
+ */
+static int
+nfs4_readdir(struct vop_readdir_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+	struct nfsnode *np = VTONFS(vp);
+	struct uio *uio = ap->a_uio;
+	int tresid, error;
+	struct vattr vattr;
+
+	if (vp->v_type != VDIR)
+		return (EPERM);
+	/*
+	 * First, check for hit on the EOF offset cache
+	 */
+	if (np->n_direofoffset > 0 && uio->uio_offset >= np->n_direofoffset &&
+	    (np->n_flag & NMODIFIED) == 0) {
+		if (VOP_GETATTR(vp, &vattr, ap->a_cred, uio->uio_td) == 0 &&
+			np->n_mtime == vattr.va_mtime.tv_sec) {
+			nfsstats.direofcache_hits++;
+			return (0);
+		}
+	}
+
+	/*
+	 * Call nfs_bioread() to do the real work.
+	 */
+	tresid = uio->uio_resid;
+	error = nfs_bioread(vp, uio, 0, ap->a_cred);
+
+	if (!error && uio->uio_resid == tresid)
+		nfsstats.direofcache_misses++;
+	return (error);
+}
+
+static u_char fty_to_dty[] = {
+	DT_UNKNOWN,		/* NFNON */
+	DT_REG,			/* NFREG */
+	DT_DIR,			/* NFDIR */
+	DT_BLK,			/* NFBLK */
+	DT_CHR,			/* NFCHR */
+	DT_LNK,			/* NFLNK */
+	DT_SOCK,		/* NFSOCK */
+	DT_FIFO,		/* NFFIFO */
+        DT_UNKNOWN,		/* NFATTRDIT */
+        DT_UNKNOWN,		/* NFNAMEDATTR */
+        DT_UNKNOWN,		/* NFBAD */
+};
+
+/*
+ * Readdir rpc call.
+ * Called from below the buffer cache by nfs_doio().
+ */
+int
+nfs4_readdirrpc(struct vnode *vp, struct uio *uiop, struct ucred *cred)
+{
+	int len, left;
+	struct dirent *dp = NULL;
+	u_int32_t *tl;
+	caddr_t p;
+	uint64_t *cookiep;
+	caddr_t bpos, dpos;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	uint64_t cookie;
+	struct nfsmount *nmp = VFSTONFS(vp->v_mount);
+	struct nfsnode *dnp = VTONFS(vp);
+	int error = 0, tlen, more_dirs = 1, blksiz = 0, bigenough = 1;
+	struct nfs4_compound cp;
+	struct nfs4_oparg_readdir readdir;
+	struct nfsv4_fattr fattr;
+	u_int fty;
+
+#ifndef DIAGNOSTIC
+	if (uiop->uio_iovcnt != 1 || (uiop->uio_offset & (DIRBLKSIZ - 1)) ||
+		(uiop->uio_resid & (DIRBLKSIZ - 1)))
+		panic("nfs readdirrpc bad uio");
+#endif
+
+	/*
+	 * If there is no cookie, assume directory was stale.
+	 */
+	cookiep = nfs4_getcookie(dnp, uiop->uio_offset, 0);
+	if (cookiep)
+		cookie = *cookiep;
+	else
+		return (NFSERR_BAD_COOKIE);
+
+	/* Generate fake entries for "." and ".." */
+	while (cookie < 2 && bigenough) {
+		cookie++;
+		len = 4 + DIRHDSIZ;
+
+		if (len > uiop->uio_resid) {
+			bigenough = 0;
+			break;
+		}
+		dp = (struct dirent *)uiop->uio_iov->iov_base;
+
+		dp->d_namlen = cookie;
+		dp->d_reclen = len;
+		dp->d_type = DT_DIR;
+		if (cookie == 1)
+			dp->d_fileno = dnp->n_vattr.va_fileid; /* XXX has problems with pynfs virtualhandles */
+		else
+			dp->d_fileno = dnp->n_dvp != NULL ?
+			    VTONFS(dnp->n_dvp)->n_vattr.va_fileid : cookie;
+
+		p = dp->d_name;
+		*p++ = '.';
+		if (cookie == 2)
+			*p++ = '.';
+		*p = '\0';
+
+		blksiz += len;
+		if (blksiz == DIRBLKSIZ)
+			blksiz = 0;
+		uiop->uio_offset += len;
+		uiop->uio_resid -= len;
+		(char *)uiop->uio_iov->iov_base += len;
+		uiop->uio_iov->iov_len -= len;
+	}
+
+	if (cookie == 2)
+		cookie = 0;
+
+	/* This is sort of ugly, to prevent v4postop() from acting weird */
+	bzero(&cp, sizeof(cp));
+
+	/*
+	 * Loop around doing readdir rpc's of size nm_readdirsize
+	 * truncated to a multiple of DIRBLKSIZ.
+	 * The stopping criteria is EOF or buffer full.
+	 */
+	/*
+	 * XXX this is sort of ugly for nfsv4; we don't maintain the
+	 * strict abstraction, but do the decoding inline.  that's ok.
+	 */
+	while (more_dirs && bigenough) {
+		nfsstats.rpccnt[NFSPROC_READDIR]++;
+
+		mreq = nfsm_reqhead(vp, NFSV4PROC_COMPOUND, 0);
+		mb = mreq;
+		bpos = mtod(mb, caddr_t);
+
+		readdir.cnt = nmp->nm_readdirsize;
+		readdir.cookie = cookie;
+		readdir.bm = &nfsv4_readdirbm;
+		if (cookie == 0)
+			bzero(&readdir.verf, sizeof(readdir.verf));
+		else
+			bcopy(&dnp->n_cookieverf, &readdir.verf,
+			    sizeof(readdir.verf));
+
+		nfs_v4initcompound(&cp);
+
+		nfsm_v4build_compound(&cp, "nfs4_readdirrpc()");
+		nfsm_v4build_putfh(&cp, vp);
+		nfsm_v4build_readdir(&cp, &readdir);
+		nfsm_v4build_finalize(&cp);
+
+		nfsm_request(vp, NFSV4PROC_COMPOUND, uiop->uio_td, cred);
+		if (error != 0)
+			goto nfsmout;
+
+		nfsm_v4dissect_compound(&cp);
+		nfsm_v4dissect_putfh(&cp);
+
+		/*
+		 * XXX - Readdir gets handled inline like in
+		 * NFSv{2,3}.  This is a nasty inconsistency and
+		 * should be fixed.
+		 */
+
+		tl = nfsm_dissect(uint32_t *, 5 * NFSX_UNSIGNED);
+		if (fxdr_unsigned(uint32_t, *tl++) != NFSV4OP_READDIR) {
+			error = EBADRPC;
+			goto nfsmout;
+		}
+		if (fxdr_unsigned(uint32_t, *tl++) != 0) {
+			error = EBADRPC;
+			goto nfsmout;
+		}
+
+		bcopy(tl, &dnp->n_cookieverf, NFSX_V4VERF);
+		tl += 2;
+		more_dirs = fxdr_unsigned(int, *tl++);
+
+		/* loop thru the dir entries, doctoring them to 4bsd form */
+		while (more_dirs && bigenough) {
+			tl = nfsm_dissect(uint32_t *, 3 * NFSX_UNSIGNED);
+			cookie = fxdr_hyper(tl);
+			tl += 2;
+			/* XXX cookie sanity check */
+			len = fxdr_unsigned(int, *tl++);
+			if (len <= 0 || len > NFS_MAXNAMLEN) {
+				error = EBADRPC;
+				goto nfsmout;
+			}
+			tlen = nfsm_rndup(len);
+			if (tlen == len)
+				tlen += 4;	/* To ensure null termination */
+			left = DIRBLKSIZ - blksiz;
+			if ((tlen + DIRHDSIZ) > left) {
+				dp->d_reclen += left;
+				uiop->uio_iov->iov_base =
+				    (char *)uiop->uio_iov->iov_base + left;
+				uiop->uio_iov->iov_len -= left;
+				uiop->uio_offset += left;
+				uiop->uio_resid -= left;
+				blksiz = 0;
+			}
+			if ((tlen + DIRHDSIZ) > uiop->uio_resid)
+				bigenough = 0;
+			if (bigenough) {
+				dp = (struct dirent *)uiop->uio_iov->iov_base;
+
+				dp->d_namlen = len;
+				dp->d_reclen = tlen + DIRHDSIZ;
+
+				blksiz += dp->d_reclen;
+				if (blksiz == DIRBLKSIZ)
+					blksiz = 0;
+				uiop->uio_offset += DIRHDSIZ;
+				uiop->uio_resid -= DIRHDSIZ;
+				uiop->uio_iov->iov_base =
+				    (char *)uiop->uio_iov->iov_base + DIRHDSIZ;
+				uiop->uio_iov->iov_len -= DIRHDSIZ;
+
+				/* Copy name */
+				nfsm_mtouio(uiop, len);
+				p = uiop->uio_iov->iov_base;
+				tlen -= len;
+				*p = '\0';	/* null terminate */
+				/* printf("nfs4_readdirrpc: name: \"%s\" cookie %d\n",
+				   p - len, (int) cookie);*/
+				uiop->uio_iov->iov_base =
+				    (char *)uiop->uio_iov->iov_base + tlen;
+				uiop->uio_iov->iov_len -= tlen;
+				uiop->uio_offset += tlen;
+				uiop->uio_resid -= tlen;
+
+				/* Copy attributes */
+				nfsm_v4dissect_attrs(&fattr);
+
+				dp->d_fileno = nfs_v4fileid4_to_fileid(
+					fattr.fa4_valid & FA4V_FILEID &&
+					    fattr.fa4_fileid ?
+					    fattr.fa4_fileid : cookie);
+
+				fty = (u_int)fattr.fa4_type;
+				dp->d_type = fattr.fa4_valid & FA4V_TYPE &&
+				    (fty < sizeof(fty_to_dty)) ?
+				    fty_to_dty[fty] : DT_UNKNOWN;
+			} else
+				nfsm_adv(nfsm_rndup(len));
+
+			tl = nfsm_dissect(uint32_t *, NFSX_UNSIGNED);
+			more_dirs = fxdr_unsigned(int, *tl++);
+		}
+		/*
+		 * If at end of rpc data, get the eof boolean
+		 */
+		if (!more_dirs) {
+			tl = nfsm_dissect(u_int32_t *, NFSX_UNSIGNED);
+			more_dirs = (fxdr_unsigned(int, *tl) == 0);
+		}
+
+		error = nfs_v4postop(&cp, error);
+
+		m_freem(mrep);
+		mrep = NULL;
+	}
+	/*
+	 * Fill last record, iff any, out to a multiple of DIRBLKSIZ
+	 * by increasing d_reclen for the last record.
+	 */
+	if (blksiz > 0) {
+		left = DIRBLKSIZ - blksiz;
+		dp->d_reclen += left;
+		uiop->uio_iov->iov_base =
+		    (char *)uiop->uio_iov->iov_base + left;
+		uiop->uio_iov->iov_len -= left;
+		uiop->uio_offset += left;
+		uiop->uio_resid -= left;
+	}
+
+	/*
+	 * We are now either at the end of the directory or have filled the
+	 * block.
+	 */
+	if (bigenough)
+		dnp->n_direofoffset = uiop->uio_offset;
+	else {
+		if (uiop->uio_resid > 0)
+			printf("EEK! readdirrpc resid > 0\n");
+		cookiep = nfs4_getcookie(dnp, uiop->uio_offset, 1);
+		*cookiep = cookie;
+	}
+nfsmout:
+	if (mrep != NULL)
+		m_freem(mrep);
+	return (error);
+}
+
+/*
+ * Silly rename. To make the NFS filesystem that is stateless look a little
+ * more like the "ufs" a remove of an active vnode is translated to a rename
+ * to a funny looking filename that is removed by nfs_inactive on the
+ * nfsnode. There is the potential for another process on a different client
+ * to create the same funny name between the nfs_lookitup() fails and the
+ * nfs_rename() completes, but...
+ */
+static int
+nfs4_sillyrename(struct vnode *dvp, struct vnode *vp, struct componentname *cnp)
+{
+	struct sillyrename *sp;
+	struct nfsnode *np;
+	int error;
+	short pid;
+
+	cache_purge(dvp);
+	np = VTONFS(vp);
+#ifndef DIAGNOSTIC
+	if (vp->v_type == VDIR)
+		panic("nfs: sillyrename dir");
+#endif
+	MALLOC(sp, struct sillyrename *, sizeof (struct sillyrename),
+		M_NFSREQ, M_WAITOK);
+	sp->s_cred = crhold(cnp->cn_cred);
+	sp->s_dvp = dvp;
+	sp->s_removeit = nfs4_removeit;
+	VREF(dvp);
+
+	/* Fudge together a funny name */
+	pid = cnp->cn_thread->td_proc->p_pid;
+	sp->s_namlen = sprintf(sp->s_name, ".nfsA%04x4.4", pid);
+
+	/* Try lookitups until we get one that isn't there */
+	while (nfs4_lookitup(dvp, sp->s_name, sp->s_namlen, sp->s_cred,
+		cnp->cn_thread, NULL) == 0) {
+		sp->s_name[4]++;
+		if (sp->s_name[4] > 'z') {
+			error = EINVAL;
+			goto bad;
+		}
+	}
+	error = nfs4_renameit(dvp, cnp, sp);
+	if (error)
+		goto bad;
+	error = nfs4_lookitup(dvp, sp->s_name, sp->s_namlen, sp->s_cred,
+		cnp->cn_thread, &np);
+	np->n_sillyrename = sp;
+	return (0);
+bad:
+	vrele(sp->s_dvp);
+	crfree(sp->s_cred);
+	free((caddr_t)sp, M_NFSREQ);
+	return (error);
+}
+
+/*
+ * Look up a file name and optionally either update the file handle or
+ * allocate an nfsnode, depending on the value of npp.
+ * npp == NULL	--> just do the lookup
+ * *npp == NULL --> allocate a new nfsnode and make sure attributes are
+ *			handled too
+ * *npp != NULL --> update the file handle in the vnode
+ */
+static int
+nfs4_lookitup(struct vnode *dvp, const char *name, int len, struct ucred *cred,
+    struct thread *td, struct nfsnode **npp)
+{
+	struct vnode *newvp = NULL;
+	struct nfsnode *np, *dnp = VTONFS(dvp);
+	caddr_t bpos, dpos;
+	int error = 0, fhlen;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	nfsfh_t *nfhp;
+	struct nfs4_compound cp;
+	struct nfs4_oparg_lookup l;
+	struct nfs4_oparg_getfh gfh;
+	struct nfs4_oparg_getattr ga;
+
+	nfsstats.rpccnt[NFSPROC_RENAME]++;
+
+	mreq = nfsm_reqhead(dvp, NFSV4PROC_COMPOUND, 0);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	l.name = name;
+	l.namelen = len;
+
+	nfs_v4initcompound(&cp);
+
+	ga.bm = &nfsv4_getattrbm;
+
+	nfsm_v4build_compound(&cp, "nfs4_renamerpc()");
+	nfsm_v4build_putfh(&cp, dvp);
+	nfsm_v4build_lookup(&cp, &l);
+	nfsm_v4build_getfh(&cp, &gfh);
+	nfsm_v4build_getattr(&cp, &ga);
+
+	nfsm_request(dvp, NFSV4PROC_COMPOUND, td, cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_lookup(&cp);
+	nfsm_v4dissect_getfh(&cp, &gfh);
+	nfsm_v4dissect_getattr(&cp, &ga);
+
+	if (npp != NULL && error == 0) {
+		nfhp = &gfh.fh_val;
+		fhlen = gfh.fh_len;
+
+		if (*npp != NULL) {
+			np = *npp;
+			if (np->n_fhsize > NFS_SMALLFH && fhlen <= NFS_SMALLFH) {
+				free((caddr_t)np->n_fhp, M_NFSBIGFH);
+				np->n_fhp = &np->n_fh;
+			} else if (np->n_fhsize <= NFS_SMALLFH && fhlen>NFS_SMALLFH)
+				np->n_fhp =(nfsfh_t *)malloc(fhlen, M_NFSBIGFH, M_WAITOK);
+			bcopy((caddr_t)nfhp, (caddr_t)np->n_fhp, fhlen);
+			np->n_fhsize = fhlen;
+			newvp = NFSTOV(np);
+		} else if (NFS_CMPFH(dnp, nfhp, fhlen)) {
+			VREF(dvp);
+			newvp = dvp;
+		} else {
+			error = nfs_nget(dvp->v_mount, nfhp, fhlen, &np);
+			if (error) {
+				m_freem(mrep);
+				return (error);
+			}
+			newvp = NFSTOV(np);
+		}
+
+		if (newvp != dvp) {
+			np->n_dvp = dvp;
+			np->n_namelen = len;
+			if (np->n_name != NULL)
+				FREE(np->n_name, M_NFSREQ);
+			MALLOC(np->n_name, u_char *,
+			    np->n_namelen + 1, M_NFSREQ, M_WAITOK);
+			memcpy(np->n_name, name, len);
+			np->n_name[len] = '\0';
+		}
+		nfs4_vnop_loadattrcache(newvp, &ga.fa, NULL);
+	}
+
+nfsmout:
+	error = nfs_v4postop(&cp, error);
+
+	if (mrep != NULL)
+		m_freem(mrep);
+	if (npp && *npp == NULL) {
+		if (error) {
+			if (newvp) {
+				if (newvp == dvp)
+					vrele(newvp);
+				else
+					vput(newvp);
+			}
+		} else
+			*npp = np;
+	}
+
+
+	return (error);
+}
+
+/*
+ * Nfs Version 3 commit rpc
+ */
+int
+nfs4_commit(struct vnode *vp, u_quad_t offset, int cnt, struct ucred *cred,
+    struct thread *td)
+{
+	struct nfsmount *nmp = VFSTONFS(vp->v_mount);
+	caddr_t bpos, dpos;
+	int error = 0;
+	struct mbuf *mreq, *mrep = NULL, *md, *mb;
+	struct nfs4_compound cp;
+	struct nfs4_oparg_commit commit;
+
+	if ((nmp->nm_state & NFSSTA_HASWRITEVERF) == 0)
+		return (0);
+	nfsstats.rpccnt[NFSPROC_COMMIT]++;
+
+	mreq = nfsm_reqhead(vp, NFSV4PROC_COMPOUND, 0);
+	mb = mreq;
+	bpos = mtod(mb, caddr_t);
+
+	commit.start = offset;
+	commit.len = cnt;
+
+	nfs_v4initcompound(&cp);
+
+	nfsm_v4build_compound(&cp, "nfs4_commit()");
+	nfsm_v4build_putfh(&cp, vp);
+	nfsm_v4build_commit(&cp, &commit);
+	nfsm_v4build_finalize(&cp);
+
+	nfsm_request(vp, NFSV4PROC_COMPOUND, td, cred);
+	if (error != 0)
+		goto nfsmout;
+
+	nfsm_v4dissect_compound(&cp);
+	nfsm_v4dissect_putfh(&cp);
+	nfsm_v4dissect_commit(&cp, &commit);
+	
+	/* XXX */
+	/* nfsm_wcc_data(vp, wccflag);*/
+	if (bcmp(nmp->nm_verf, commit.verf, NFSX_V4VERF)) {
+		bcopy(commit.verf, nmp->nm_verf, NFSX_V4VERF);
+		error = NFSERR_STALEWRITEVERF;
+	}
+
+nfsmout:
+	error = nfs_v4postop(&cp, error);
+
+	if (mrep == NULL)
+		m_freem(mrep);
+	return (error);
+}
+
+/*
+ * Strategy routine.
+ * For async requests when nfsiod(s) are running, queue the request by
+ * calling nfs_asyncio(), otherwise just all nfs_doio() to do the
+ * request.
+ */
+static int
+nfs4_strategy(struct vop_strategy_args *ap)
+{
+	struct buf *bp = ap->a_bp;
+	struct ucred *cr;
+	struct thread *td;
+	int error = 0;
+
+	KASSERT(ap->a_vp == ap->a_bp->b_vp, ("%s(%p != %p)",
+	    __func__, ap->a_vp, ap->a_bp->b_vp));
+	KASSERT(!(bp->b_flags & B_DONE), ("nfs4_strategy: buffer %p unexpectedly marked B_DONE", bp));
+	KASSERT(BUF_REFCNT(bp) > 0, ("nfs4_strategy: buffer %p not locked", bp));
+
+	if (bp->b_flags & B_ASYNC)
+		td = NULL;
+	else
+		td = curthread;	/* XXX */
+
+	if (bp->b_iocmd == BIO_READ)
+		cr = bp->b_rcred;
+	else
+		cr = bp->b_wcred;
+
+	/*
+	 * If the op is asynchronous and an i/o daemon is waiting
+	 * queue the request, wake it up and wait for completion
+	 * otherwise just do it ourselves.
+	 */
+	if ((bp->b_flags & B_ASYNC) == 0 ||
+		nfs_asyncio(bp, NOCRED, td))
+		error = nfs_doio(bp, cr, td);
+	return (error);
+}
+
+/*
+ * fsync vnode op. Just call nfs4_flush() with commit == 1.
+ */
+/* ARGSUSED */
+static int
+nfs4_fsync(struct vop_fsync_args *ap)
+{
+	return (nfs4_flush(ap->a_vp, ap->a_cred, ap->a_waitfor, ap->a_td, 1));
+}
+
+/*
+ * Flush all the blocks associated with a vnode.
+ * 	Walk through the buffer pool and push any dirty pages
+ *	associated with the vnode.
+ */
+static int
+nfs4_flush(struct vnode *vp, struct ucred *cred, int waitfor, struct thread *td,
+    int commit)
+{
+	struct nfsnode *np = VTONFS(vp);
+	struct buf *bp;
+	int i;
+	struct buf *nbp;
+	struct nfsmount *nmp = VFSTONFS(vp->v_mount);
+	int s, error = 0, slptimeo = 0, slpflag = 0, retv, bvecpos;
+	int passone = 1;
+	u_quad_t off, endoff, toff;
+	struct ucred* wcred = NULL;
+	struct buf **bvec = NULL;
+#ifndef NFS_COMMITBVECSIZ
+#define NFS_COMMITBVECSIZ	20
+#endif
+	struct buf *bvec_on_stack[NFS_COMMITBVECSIZ];
+	int bvecsize = 0, bveccount;
+
+	if (nmp->nm_flag & NFSMNT_INT)
+		slpflag = PCATCH;
+	if (!commit)
+		passone = 0;
+	/*
+	 * A b_flags == (B_DELWRI | B_NEEDCOMMIT) block has been written to the
+	 * server, but nas not been committed to stable storage on the server
+	 * yet. On the first pass, the byte range is worked out and the commit
+	 * rpc is done. On the second pass, nfs_writebp() is called to do the
+	 * job.
+	 */
+again:
+	off = (u_quad_t)-1;
+	endoff = 0;
+	bvecpos = 0;
+	if (NFS_ISV3(vp) && commit) {
+		s = splbio();
+		if (bvec != NULL && bvec != bvec_on_stack)
+			free(bvec, M_TEMP);
+		/*
+		 * Count up how many buffers waiting for a commit.
+		 */
+		bveccount = 0;
+		VI_LOCK(vp);
+		for (bp = TAILQ_FIRST(&vp->v_dirtyblkhd); bp; bp = nbp) {
+			nbp = TAILQ_NEXT(bp, b_vnbufs);
+			if (BUF_REFCNT(bp) == 0 &&
+			    (bp->b_flags & (B_DELWRI | B_NEEDCOMMIT))
+				== (B_DELWRI | B_NEEDCOMMIT))
+				bveccount++;
+		}
+		/*
+		 * Allocate space to remember the list of bufs to commit.  It is
+		 * important to use M_NOWAIT here to avoid a race with nfs4_write.
+		 * If we can't get memory (for whatever reason), we will end up
+		 * committing the buffers one-by-one in the loop below.
+		 */
+		if (bveccount > NFS_COMMITBVECSIZ) {
+			/*
+			 * Release the vnode interlock to avoid a lock
+			 * order reversal.
+			 */
+			VI_UNLOCK(vp);
+			bvec = (struct buf **)
+				malloc(bveccount * sizeof(struct buf *),
+				       M_TEMP, M_NOWAIT);
+			VI_LOCK(vp);
+			if (bvec == NULL) {
+				bvec = bvec_on_stack;
+				bvecsize = NFS_COMMITBVECSIZ;
+			} else
+				bvecsize = bveccount;
+		} else {
+			bvec = bvec_on_stack;
+			bvecsize = NFS_COMMITBVECSIZ;
+		}
+		for (bp = TAILQ_FIRST(&vp->v_dirtyblkhd); bp; bp = nbp) {
+			if (bvecpos >= bvecsize)
+				break;
+			if (BUF_LOCK(bp, LK_EXCLUSIVE | LK_NOWAIT, NULL)) {
+				nbp = TAILQ_NEXT(bp, b_vnbufs);
+				continue;
+			}
+			if ((bp->b_flags & (B_DELWRI | B_NEEDCOMMIT)) !=
+			    (B_DELWRI | B_NEEDCOMMIT)) {
+				BUF_UNLOCK(bp);
+				nbp = TAILQ_NEXT(bp, b_vnbufs);
+				continue;
+			}
+			VI_UNLOCK(vp);
+			bremfree(bp);
+			/*
+			 * Work out if all buffers are using the same cred
+			 * so we can deal with them all with one commit.
+			 *
+			 * NOTE: we are not clearing B_DONE here, so we have
+			 * to do it later on in this routine if we intend to
+			 * initiate I/O on the bp.
+			 *
+			 * Note: to avoid loopback deadlocks, we do not
+			 * assign b_runningbufspace.
+			 */
+			if (wcred == NULL)
+				wcred = bp->b_wcred;
+			else if (wcred != bp->b_wcred)
+				wcred = NOCRED;
+			bp->b_flags |= B_WRITEINPROG;
+			vfs_busy_pages(bp, 1);
+
+			VI_LOCK(vp);
+			/*
+			 * bp is protected by being locked, but nbp is not
+			 * and vfs_busy_pages() may sleep.  We have to
+			 * recalculate nbp.
+			 */
+			nbp = TAILQ_NEXT(bp, b_vnbufs);
+
+			/*
+			 * A list of these buffers is kept so that the
+			 * second loop knows which buffers have actually
+			 * been committed. This is necessary, since there
+			 * may be a race between the commit rpc and new
+			 * uncommitted writes on the file.
+			 */
+			bvec[bvecpos++] = bp;
+			toff = ((u_quad_t)bp->b_blkno) * DEV_BSIZE +
+				bp->b_dirtyoff;
+			if (toff < off)
+				off = toff;
+			toff += (u_quad_t)(bp->b_dirtyend - bp->b_dirtyoff);
+			if (toff > endoff)
+				endoff = toff;
+		}
+		splx(s);
+		VI_UNLOCK(vp);
+	}
+	if (bvecpos > 0) {
+		/*
+		 * Commit data on the server, as required.
+		 * If all bufs are using the same wcred, then use that with
+		 * one call for all of them, otherwise commit each one
+		 * separately.
+		 */
+		if (wcred != NOCRED)
+			retv = nfs4_commit(vp, off, (int)(endoff - off),
+					  wcred, td);
+		else {
+			retv = 0;
+			for (i = 0; i < bvecpos; i++) {
+				off_t off, size;
+				bp = bvec[i];
+				off = ((u_quad_t)bp->b_blkno) * DEV_BSIZE +
+					bp->b_dirtyoff;
+				size = (u_quad_t)(bp->b_dirtyend
+						  - bp->b_dirtyoff);
+				retv = nfs4_commit(vp, off, (int)size,
+						  bp->b_wcred, td);
+				if (retv) break;
+			}
+		}
+
+		if (retv == NFSERR_STALEWRITEVERF)
+			nfs_clearcommit(vp->v_mount);
+
+		/*
+		 * Now, either mark the blocks I/O done or mark the
+		 * blocks dirty, depending on whether the commit
+		 * succeeded.
+		 */
+		for (i = 0; i < bvecpos; i++) {
+			bp = bvec[i];
+			bp->b_flags &= ~(B_NEEDCOMMIT | B_WRITEINPROG | B_CLUSTEROK);
+			if (retv) {
+				/*
+				 * Error, leave B_DELWRI intact
+				 */
+				vfs_unbusy_pages(bp);
+				brelse(bp);
+			} else {
+				/*
+				 * Success, remove B_DELWRI ( bundirty() ).
+				 *
+				 * b_dirtyoff/b_dirtyend seem to be NFS
+				 * specific.  We should probably move that
+				 * into bundirty(). XXX
+				 */
+				s = splbio();
+				VI_LOCK(vp);
+				vp->v_numoutput++;
+				VI_UNLOCK(vp);
+				bp->b_flags |= B_ASYNC;
+				bundirty(bp);
+				bp->b_flags &= ~B_DONE;
+				bp->b_ioflags &= ~BIO_ERROR;
+				bp->b_dirtyoff = bp->b_dirtyend = 0;
+				splx(s);
+				bufdone(bp);
+			}
+		}
+	}
+
+	/*
+	 * Start/do any write(s) that are required.
+	 */
+loop:
+	s = splbio();
+	VI_LOCK(vp);
+	for (bp = TAILQ_FIRST(&vp->v_dirtyblkhd); bp; bp = nbp) {
+		nbp = TAILQ_NEXT(bp, b_vnbufs);
+		if (BUF_LOCK(bp, LK_EXCLUSIVE | LK_NOWAIT, NULL)) {
+			if (waitfor != MNT_WAIT || passone)
+				continue;
+
+			error = BUF_TIMELOCK(bp,
+			    LK_EXCLUSIVE | LK_SLEEPFAIL | LK_INTERLOCK,
+			    VI_MTX(vp), "nfsfsync", slpflag, slptimeo);
+			splx(s);
+			if (error == 0)
+				panic("nfs4_fsync: inconsistent lock");
+			if (error == ENOLCK)
+				goto loop;
+			if (nfs4_sigintr(nmp, NULL, td)) {
+				error = EINTR;
+				goto done;
+			}
+			if (slpflag == PCATCH) {
+				slpflag = 0;
+				slptimeo = 2 * hz;
+			}
+			goto loop;
+		}
+		if ((bp->b_flags & B_DELWRI) == 0)
+			panic("nfs4_fsync: not dirty");
+		if ((passone || !commit) && (bp->b_flags & B_NEEDCOMMIT)) {
+			BUF_UNLOCK(bp);
+			continue;
+		}
+		VI_UNLOCK(vp);
+		bremfree(bp);
+		if (passone || !commit)
+		    bp->b_flags |= B_ASYNC;
+		else
+		    bp->b_flags |= B_ASYNC | B_WRITEINPROG;
+		splx(s);
+		BUF_WRITE(bp);
+		goto loop;
+	}
+	splx(s);
+	if (passone) {
+		passone = 0;
+		VI_UNLOCK(vp);
+		goto again;
+	}
+	if (waitfor == MNT_WAIT) {
+		while (vp->v_numoutput) {
+			vp->v_iflag |= VI_BWAIT;
+			error = msleep((caddr_t)&vp->v_numoutput, VI_MTX(vp),
+				slpflag | (PRIBIO + 1), "nfsfsync", slptimeo);
+			if (error) {
+			    VI_UNLOCK(vp);
+			    if (nfs4_sigintr(nmp, NULL, td)) {
+				error = EINTR;
+				goto done;
+			    }
+			    if (slpflag == PCATCH) {
+				slpflag = 0;
+				slptimeo = 2 * hz;
+			    }
+			    VI_LOCK(vp);
+			}
+		}
+		if (!TAILQ_EMPTY(&vp->v_dirtyblkhd) && commit) {
+			VI_UNLOCK(vp);
+			goto loop;
+		}
+	}
+	VI_UNLOCK(vp);
+	if (np->n_flag & NWRITEERR) {
+		error = np->n_error;
+		np->n_flag &= ~NWRITEERR;
+	}
+done:
+	if (bvec != NULL && bvec != bvec_on_stack)
+		free(bvec, M_TEMP);
+	return (error);
+}
+
+/*
+ * NFS advisory byte-level locks.
+ */
+static int
+nfs4_advlock(struct vop_advlock_args *ap)
+{
+	return (EPERM);
+
+	if ((VFSTONFS(ap->a_vp->v_mount)->nm_flag & NFSMNT_NOLOCKD) != 0) {
+		struct nfsnode *np = VTONFS(ap->a_vp);
+
+		return (lf_advlock(ap, &(np->n_lockf), np->n_size));
+	}
+	return (nfs_dolock(ap));
+}
+
+/*
+ * Print out the contents of an nfsnode.
+ */
+static int
+nfs4_print(struct vop_print_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+	struct nfsnode *np = VTONFS(vp);
+
+	printf("\tfileid %ld fsid 0x%x",
+	   np->n_vattr.va_fileid, np->n_vattr.va_fsid);
+	if (vp->v_type == VFIFO)
+		fifo_printinfo(vp);
+	printf("\n");
+	return (0);
+}
+
+/*
+ * This is the "real" nfs::bwrite(struct buf*).
+ * B_WRITEINPROG isn't set unless the force flag is one and it
+ * handles the B_NEEDCOMMIT flag.
+ * We set B_CACHE if this is a VMIO buffer.
+ */
+int
+nfs4_writebp(struct buf *bp, int force, struct thread *td)
+{
+	int s;
+	int oldflags = bp->b_flags;
+#if 0
+	int retv = 1;
+	off_t off;
+#endif
+
+	if (BUF_REFCNT(bp) == 0)
+		panic("bwrite: buffer is not locked???");
+
+	if (bp->b_flags & B_INVAL) {
+		brelse(bp);
+		return(0);
+	}
+
+	bp->b_flags |= B_CACHE;
+
+	/*
+	 * Undirty the bp.  We will redirty it later if the I/O fails.
+	 */
+
+	s = splbio();
+	bundirty(bp);
+	bp->b_flags &= ~B_DONE;
+	bp->b_ioflags &= ~BIO_ERROR;
+	bp->b_iocmd = BIO_WRITE;
+
+	VI_LOCK(bp->b_vp);
+	bp->b_vp->v_numoutput++;
+	VI_UNLOCK(bp->b_vp);
+	curthread->td_proc->p_stats->p_ru.ru_oublock++;
+	splx(s);
+
+	/*
+	 * Note: to avoid loopback deadlocks, we do not
+	 * assign b_runningbufspace.
+	 */
+	vfs_busy_pages(bp, 1);
+
+	if (force)
+		bp->b_flags |= B_WRITEINPROG;
+	BUF_KERNPROC(bp);
+	bp->b_iooffset = dbtob(bp->b_blkno);
+	VOP_STRATEGY(bp->b_vp, bp);
+
+	if( (oldflags & B_ASYNC) == 0) {
+		int rtval = bufwait(bp);
+
+		if (oldflags & B_DELWRI) {
+			s = splbio();
+			reassignbuf(bp, bp->b_vp);
+			splx(s);
+		}
+
+		brelse(bp);
+		return (rtval);
+	}
+
+	return (0);
+}
+
+/*
+ * nfs special file access vnode op.
+ * Essentially just get vattr and then imitate iaccess() since the device is
+ * local to the client.
+ */
+static int
+nfsspec_access(struct vop_access_args *ap)
+{
+	struct vattr *vap;
+	struct ucred *cred = ap->a_cred;
+	struct vnode *vp = ap->a_vp;
+	mode_t mode = ap->a_mode;
+	struct vattr vattr;
+	int error;
+
+	/*
+	 * Disallow write attempts on filesystems mounted read-only;
+	 * unless the file is a socket, fifo, or a block or character
+	 * device resident on the filesystem.
+	 */
+	if ((mode & VWRITE) && (vp->v_mount->mnt_flag & MNT_RDONLY)) {
+		switch (vp->v_type) {
+		case VREG:
+		case VDIR:
+		case VLNK:
+			return (EROFS);
+		default:
+			break;
+		}
+	}
+	vap = &vattr;
+	error = VOP_GETATTR(vp, vap, cred, ap->a_td);
+	if (error)
+		return (error);
+	return (vaccess(vp->v_type, vap->va_mode, vap->va_uid, vap->va_gid,
+	    mode, cred, NULL));
+}
+
+/*
+ * Read wrapper for special devices.
+ */
+static int
+nfsspec_read(struct vop_read_args *ap)
+{
+	struct nfsnode *np = VTONFS(ap->a_vp);
+
+	/*
+	 * Set access flag.
+	 */
+	np->n_flag |= NACC;
+	getnanotime(&np->n_atim);
+	return (VOCALL(spec_vnodeop_p, VOFFSET(vop_read), ap));
+}
+
+/*
+ * Write wrapper for special devices.
+ */
+static int
+nfsspec_write(struct vop_write_args *ap)
+{
+	struct nfsnode *np = VTONFS(ap->a_vp);
+
+	/*
+	 * Set update flag.
+	 */
+	np->n_flag |= NUPD;
+	getnanotime(&np->n_mtim);
+	return (VOCALL(spec_vnodeop_p, VOFFSET(vop_write), ap));
+}
+
+/*
+ * Close wrapper for special devices.
+ *
+ * Update the times on the nfsnode then do device close.
+ */
+static int
+nfsspec_close(struct vop_close_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+	struct nfsnode *np = VTONFS(vp);
+	struct vattr vattr;
+
+	if (np->n_flag & (NACC | NUPD)) {
+		np->n_flag |= NCHG;
+		if (vrefcnt(vp) == 1 &&
+		    (vp->v_mount->mnt_flag & MNT_RDONLY) == 0) {
+			VATTR_NULL(&vattr);
+			if (np->n_flag & NACC)
+				vattr.va_atime = np->n_atim;
+			if (np->n_flag & NUPD)
+				vattr.va_mtime = np->n_mtim;
+			(void)VOP_SETATTR(vp, &vattr, ap->a_cred, ap->a_td);
+		}
+	}
+	return (VOCALL(spec_vnodeop_p, VOFFSET(vop_close), ap));
+}
+
+/*
+ * Read wrapper for fifos.
+ */
+static int
+nfsfifo_read(struct vop_read_args *ap)
+{
+	struct nfsnode *np = VTONFS(ap->a_vp);
+
+	/*
+	 * Set access flag.
+	 */
+	np->n_flag |= NACC;
+	getnanotime(&np->n_atim);
+	return (VOCALL(fifo_vnodeop_p, VOFFSET(vop_read), ap));
+}
+
+/*
+ * Write wrapper for fifos.
+ */
+static int
+nfsfifo_write(struct vop_write_args *ap)
+{
+	struct nfsnode *np = VTONFS(ap->a_vp);
+
+	/*
+	 * Set update flag.
+	 */
+	np->n_flag |= NUPD;
+	getnanotime(&np->n_mtim);
+	return (VOCALL(fifo_vnodeop_p, VOFFSET(vop_write), ap));
+}
+
+/*
+ * Close wrapper for fifos.
+ *
+ * Update the times on the nfsnode then do fifo close.
+ */
+static int
+nfsfifo_close(struct vop_close_args *ap)
+{
+	struct vnode *vp = ap->a_vp;
+	struct nfsnode *np = VTONFS(vp);
+	struct vattr vattr;
+	struct timespec ts;
+
+	if (np->n_flag & (NACC | NUPD)) {
+		getnanotime(&ts);
+		if (np->n_flag & NACC)
+			np->n_atim = ts;
+		if (np->n_flag & NUPD)
+			np->n_mtim = ts;
+		np->n_flag |= NCHG;
+		if (vrefcnt(vp) == 1 &&
+		    (vp->v_mount->mnt_flag & MNT_RDONLY) == 0) {
+			VATTR_NULL(&vattr);
+			if (np->n_flag & NACC)
+				vattr.va_atime = np->n_atim;
+			if (np->n_flag & NUPD)
+				vattr.va_mtime = np->n_mtim;
+			vn_lock(vp, LK_EXCLUSIVE | LK_RETRY, ap->a_td);
+			(void)VOP_SETATTR(vp, &vattr, ap->a_cred, ap->a_td);
+			VOP_UNLOCK(vp, 0, ap->a_td);
+		}
+	}
+	return (VOCALL(fifo_vnodeop_p, VOFFSET(vop_close), ap));
+}
+