Index: projects/fuse2/sys/fs/fuse/fuse_internal.c
===================================================================
--- projects/fuse2/sys/fs/fuse/fuse_internal.c	(revision 348581)
+++ projects/fuse2/sys/fs/fuse/fuse_internal.c	(revision 348582)
@@ -1,1121 +1,1100 @@
 /*-
  * SPDX-License-Identifier: BSD-3-Clause
  *
  * Copyright (c) 2007-2009 Google Inc. and Amit Singh
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions are
  * met:
  *
  * * Redistributions of source code must retain the above copyright
  *   notice, this list of conditions and the following disclaimer.
  * * Redistributions in binary form must reproduce the above
  *   copyright notice, this list of conditions and the following disclaimer
  *   in the documentation and/or other materials provided with the
  *   distribution.
  * * Neither the name of Google Inc. nor the names of its
  *   contributors may be used to endorse or promote products derived from
  *   this software without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  *
  * Copyright (C) 2005 Csaba Henk.
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include <sys/param.h>
 #include <sys/module.h>
 #include <sys/systm.h>
 #include <sys/errno.h>
 #include <sys/kernel.h>
 #include <sys/conf.h>
 #include <sys/uio.h>
 #include <sys/malloc.h>
 #include <sys/queue.h>
 #include <sys/lock.h>
 #include <sys/mutex.h>
 #include <sys/sdt.h>
 #include <sys/sx.h>
 #include <sys/proc.h>
 #include <sys/mount.h>
 #include <sys/vnode.h>
 #include <sys/namei.h>
 #include <sys/stat.h>
 #include <sys/unistd.h>
 #include <sys/filedesc.h>
 #include <sys/file.h>
 #include <sys/fcntl.h>
 #include <sys/dirent.h>
 #include <sys/bio.h>
 #include <sys/buf.h>
 #include <sys/sysctl.h>
 #include <sys/priv.h>
 
 #include "fuse.h"
 #include "fuse_file.h"
 #include "fuse_internal.h"
 #include "fuse_io.h"
 #include "fuse_ipc.h"
 #include "fuse_node.h"
 #include "fuse_file.h"
 
 SDT_PROVIDER_DECLARE(fusefs);
 /* 
  * Fuse trace probe:
  * arg0: verbosity.  Higher numbers give more verbose messages
  * arg1: Textual message
  */
 SDT_PROBE_DEFINE2(fusefs, , internal, trace, "int", "char*");
 
 #ifdef ZERO_PAD_INCOMPLETE_BUFS
 static int isbzero(void *buf, size_t len);
 
 #endif
 
 /*
  * Look up the vnode for inode number 'ino' in the VFS hash of 'mp'.
  *
  * On return *vpp is the vnode obtained from vfs_hash_get() with 'flags' if
  * one exists and its entry cache timeout has not expired yet; otherwise *vpp
  * is NULL.  A vnode whose entry cache has timed out is purged from the name
  * cache and released.  Returns the error from vfs_hash_get(), or 0.
  */
 int
 fuse_internal_get_cached_vnode(struct mount* mp, ino_t ino, int flags,
 	struct vnode **vpp)
 {
 	struct bintime uptime;
 	uint64_t nodeid = ino;
 	int err;
 
 	*vpp = NULL;
 
 	err = vfs_hash_get(mp, fuse_vnode_hash(nodeid), flags, curthread, vpp,
 	    fuse_vnode_cmp, &nodeid);
 	if (err != 0)
 		return (err);
 	if (*vpp == NULL)
 		return (0);
 
 	/*
 	 * Check the entry cache timeout.  We have to do this within fusefs
 	 * instead of by using cache_enter_time/cache_lookup because those
 	 * routines are only intended to work with pathnames, not inodes
 	 */
 	getbinuptime(&uptime);
 	if (bintime_cmp(&(VTOFUD(*vpp)->entry_cache_timeout), &uptime, >)) {
 		atomic_add_acq_long(&fuse_lookup_cache_hits, 1);
 		return (0);
 	}
 
 	/* Entry cache timeout: drop the stale vnode and report "not cached" */
 	atomic_add_acq_long(&fuse_lookup_cache_misses, 1);
 	cache_purge(*vpp);
 	vput(*vpp);
 	*vpp = NULL;
 	return (0);
 }
 
 /*
  * Check whether 'cred' may access 'vp' in the way described by 'mode'.
  *
  * Local checks (read-only mount, daemon ownership, default_permissions) are
  * applied first; only if none of them decides the outcome is a synchronous
  * FUSE_ACCESS request sent to the daemon.  A daemon that answers ENOSYS is
  * marked as not implementing FUSE_ACCESS and the access is allowed.
  *
  * Returns 0 if access is allowed, otherwise an errno value.
  */
 int
 fuse_internal_access(struct vnode *vp,
     accmode_t mode,
     struct thread *td,
     struct ucred *cred)
 {
 	int err = 0;
 	uint32_t mask = F_OK;
 	int dataflags;
 	struct mount *mp;
 	struct fuse_dispatcher fdi;
 	struct fuse_access_in *fai;
 	struct fuse_data *data;
 
 	mp = vnode_mount(vp);
 
 	data = fuse_get_mpdata(mp);
 	dataflags = data->dataflags;
 
 	if (mode == 0)
 		return 0;
 
 	/* Modifying a file, directory or symlink on a read-only mount */
 	if (mode & VMODIFY_PERMS && vfs_isrdonly(mp)) {
 		switch (vp->v_type) {
 		case VDIR:
 			/* FALLTHROUGH */
 		case VLNK:
 			/* FALLTHROUGH */
 		case VREG:
 			return EROFS;
 		default:
 			break;
 		}
 	}
 
 	/* Unless explicitly permitted, deny everyone except the fs owner. */
 	if (!(dataflags & FSESS_DAEMON_CAN_SPY)) {
 		if (fuse_match_cred(data->daemoncred, cred))
 			return EPERM;
 	}
 
 	if (dataflags & FSESS_DEFAULT_PERMISSIONS) {
 		struct vattr va;
 
 		/*
 		 * If the attributes can't be obtained then 'va' is not filled
 		 * in; report the failure instead of evaluating permissions
 		 * against uninitialized stack contents.
 		 */
 		err = fuse_internal_getattr(vp, &va, cred, td);
 		if (err != 0)
 			return err;
 		return vaccess(vp->v_type, va.va_mode, va.va_uid,
 		    va.va_gid, mode, cred, NULL);
 	}
 
 	if (!fsess_isimpl(mp, FUSE_ACCESS))
 		return 0;
 
 	/* Translate the VFS access mode into an access(2)-style mask */
 	if ((mode & (VWRITE | VAPPEND | VADMIN)) != 0)
 		mask |= W_OK;
 	if ((mode & VREAD) != 0)
 		mask |= R_OK;
 	if ((mode & VEXEC) != 0)
 		mask |= X_OK;
 
 	fdisp_init(&fdi, sizeof(*fai));
 	fdisp_make_vp(&fdi, FUSE_ACCESS, vp, td, cred);
 
 	fai = fdi.indata;
 	fai->mask = mask;
 
 	err = fdisp_wait_answ(&fdi);
 	fdisp_destroy(&fdi);
 
 	if (err == ENOSYS) {
 		/* Don't ask this daemon again; treat as "allowed" */
 		fsess_set_notimpl(mp, FUSE_ACCESS);
 		err = 0;
 	}
 	return err;
 }
 
 /*
  * Cache FUSE attributes from attr, in attribute cache associated with vnode
  * 'vp'.  Optionally, if argument 'vap' is not NULL, store a copy of the
  * converted attributes there as well.
  *
  * If the nominal attribute cache TTL is zero, do not cache on the 'vp' (but do
  * return the result to the caller).
  */
 void
 fuse_internal_cache_attrs(struct vnode *vp, struct ucred *cred,
 	struct fuse_attr *attr, uint64_t attr_valid, uint32_t attr_valid_nsec,
 	struct vattr *vap)
 {
 	struct mount *mp;
 	struct fuse_vnode_data *fvdat;
 	struct fuse_data *data;
 	struct vattr *vp_cache_at;
 
 	mp = vnode_mount(vp);
 	fvdat = VTOFUD(vp);
 	data = fuse_get_mpdata(mp);
 	/* A NULL cred means "use the credentials of the calling thread" */
 	if (!cred)
 		cred = curthread->td_ucred;
 
 	ASSERT_VOP_ELOCKED(vp, "fuse_internal_cache_attrs");
 
 	/* Record how long the attributes stay valid */
 	fuse_validity_2_bintime(attr_valid, attr_valid_nsec,
 		&fvdat->attr_cache_timeout);
 
 	/* Fix our buffers if the filesize changed without us knowing */
 	if (vnode_isreg(vp) && attr->size != fvdat->cached_attrs.va_size) {
 		(void)fuse_vnode_setsize(vp, cred, attr->size);
 		fvdat->cached_attrs.va_size = attr->size;
 	}
 
 	/*
 	 * Pick the destination of the conversion: the vnode's own cache when
 	 * the validity period is nonzero, else the caller's buffer if there
 	 * is one, else there is nothing to fill in.
 	 */
 	if (attr_valid > 0 || attr_valid_nsec > 0)
 		vp_cache_at = &(fvdat->cached_attrs);
 	else if (vap != NULL)
 		vp_cache_at = vap;
 	else
 		return;
 
 	vattr_null(vp_cache_at);
 	vp_cache_at->va_fsid = mp->mnt_stat.f_fsid.val[0];
 	vp_cache_at->va_fileid = attr->ino;
 	/* The file type bits are kept separately, in va_type below */
 	vp_cache_at->va_mode = attr->mode & ~S_IFMT;
 	vp_cache_at->va_nlink     = attr->nlink;
 	vp_cache_at->va_uid       = attr->uid;
 	vp_cache_at->va_gid       = attr->gid;
 	vp_cache_at->va_rdev      = attr->rdev;
 	vp_cache_at->va_size      = attr->size;
 	/* XXX on i386, seconds are truncated to 32 bits */
 	vp_cache_at->va_atime.tv_sec  = attr->atime;
 	vp_cache_at->va_atime.tv_nsec = attr->atimensec;
 	vp_cache_at->va_mtime.tv_sec  = attr->mtime;
 	vp_cache_at->va_mtime.tv_nsec = attr->mtimensec;
 	vp_cache_at->va_ctime.tv_sec  = attr->ctime;
 	vp_cache_at->va_ctime.tv_nsec = attr->ctimensec;
 	/* blksize is only consulted for protocol 7.9 or later */
 	if (fuse_libabi_geq(data, 7, 9) && attr->blksize > 0)
 		vp_cache_at->va_blocksize = attr->blksize;
 	else
 		vp_cache_at->va_blocksize = PAGE_SIZE;
 	vp_cache_at->va_type = IFTOVT(attr->mode);
 	vp_cache_at->va_bytes = attr->blocks * S_BLKSIZE;
 	vp_cache_at->va_flags = 0;
 
 	/* If we filled the vnode's cache, also hand a copy to the caller */
 	if (vap != vp_cache_at && vap != NULL)
 		memcpy(vap, vp_cache_at, sizeof(*vap));
 }
 
 
 /* fsync */
 
 int
 fuse_internal_fsync_callback(struct fuse_ticket *tick, struct uio *uio)
 {
 	if (tick->tk_aw_ohead.error == ENOSYS) {
 		fsess_set_notimpl(tick->tk_data->mp, fticket_opcode(tick));
 	}
 	return 0;
 }
 
 /*
  * Send FUSE_FSYNC (FUSE_FSYNCDIR for a directory) for every open file handle
  * of 'vp'.
  *
  * With waitfor == MNT_WAIT each request is sent synchronously; otherwise the
  * requests are queued and fuse_internal_fsync_callback handles the replies.
  * If 'datasync' is true, fsync_flags is set to 1 in each request.
  *
  * Returns 0 if the daemon does not implement the operation, else the result
  * of the last synchronous request (0 when nothing was sent synchronously).
  */
 int
 fuse_internal_fsync(struct vnode *vp,
     struct thread *td,
     int waitfor,
     bool datasync)
 {
 	struct fuse_fsync_in *ffsi = NULL;
 	struct fuse_dispatcher fdi;
 	struct fuse_filehandle *fufh;
 	struct fuse_vnode_data *fvdat = VTOFUD(vp);
 	struct mount *mp = vnode_mount(vp);
 	int op = FUSE_FSYNC;
 	int err = 0;
 
 	if (vnode_isdir(vp))
 		op = FUSE_FSYNCDIR;
 
 	/* Nothing to do if the daemon told us it lacks this operation */
 	if (!fsess_isimpl(mp, op))
 		return 0;
 
 	fdisp_init(&fdi, sizeof(*ffsi));
 	/*
 	 * fsync every open file handle for this file, because we can't be sure
 	 * which file handle the caller is really referring to.
 	 */
 	LIST_FOREACH(fufh, &fvdat->handles, next) {
 		/* Build the request the first time, reuse it afterwards */
 		if (ffsi == NULL)
 			fdisp_make_vp(&fdi, op, vp, td, NULL);
 		else
 			fdisp_refresh_vp(&fdi, op, vp, td, NULL);
 		ffsi = fdi.indata;
 		ffsi->fh = fufh->fh_id;
 		ffsi->fsync_flags = 0;
 
 		if (datasync)
 			ffsi->fsync_flags = 1;
 
 		if (waitfor == MNT_WAIT) {
 			err = fdisp_wait_answ(&fdi);
 		} else {
 			fuse_insert_callback(fdi.tick,
 				fuse_internal_fsync_callback);
 			fuse_insert_message(fdi.tick, false);
 		}
 		if (err == ENOSYS) {
 			/* ENOSYS means "success, and don't call again" */
 			fsess_set_notimpl(mp, op);
 			err = 0;
 			break;
 		}
 	}
 	fdisp_destroy(&fdi);
 
 	return err;
 }
 
 /* Asynchronous invalidation */
-SDT_PROBE_DEFINE1(fusefs, , internal, invalidate_without_export,
-	"struct mount*");
 SDT_PROBE_DEFINE2(fusefs, , internal, invalidate_cache_hit,
 	"struct vnode*", "struct vnode*");
 int
 fuse_internal_invalidate_entry(struct mount *mp, struct uio *uio)
 {
 	struct fuse_notify_inval_entry_out fnieo;
-	struct fuse_data *data = fuse_get_mpdata(mp);
 	struct componentname cn;
 	struct vnode *dvp, *vp;
 	char name[PATH_MAX];
 	int err;
 
-	if (!(data->dataflags & FSESS_EXPORT_SUPPORT)) {
-		/* 
-		 * Linux allows file systems without export support to use
-		 * asynchronous notification because its inode cache is indexed
-		 * purely by the inode number.  But FreeBSD's vnode is cache
-		 * requires access to the entire vnode structure.
-		 */
-		SDT_PROBE1(fusefs, , internal, invalidate_without_export, mp);
-		return (EINVAL);
-	}
-
 	if ((err = uiomove(&fnieo, sizeof(fnieo), uio)) != 0)
 		return (err);
 
 	if ((err = uiomove(name, fnieo.namelen, uio)) != 0)
 		return (err);
 	name[fnieo.namelen] = '\0';
 	/* fusefs does not cache "." or ".." entries */
 	if (strncmp(name, ".", sizeof(".")) == 0 ||
 	    strncmp(name, "..", sizeof("..")) == 0)
 		return (0);
 
 	if (fnieo.parent == FUSE_ROOT_ID)
 		err = VFS_ROOT(mp, LK_SHARED, &dvp);
 	else
 		err = fuse_internal_get_cached_vnode( mp, fnieo.parent,
 			LK_SHARED, &dvp);
+	/* 
+	 * If dvp is not in the cache, then it must've been reclaimed.  And
+	 * since fuse_vnop_reclaim does a cache_purge, name's entry must've
+	 * been invalidated already.  So we can safely return if dvp == NULL
+	 */
 	if (err != 0 || dvp == NULL)
 		return (err);
 	/*
 	 * XXX we can't check dvp's generation because the FUSE invalidate
 	 * entry message doesn't include it.  Worse case is that we invalidate
 	 * an entry that didn't need to be invalidated.
 	 */
 
 	cn.cn_nameiop = LOOKUP;
 	cn.cn_flags = 0;	/* !MAKEENTRY means free cached entry */
 	cn.cn_thread = curthread;
 	cn.cn_cred = curthread->td_ucred;
 	cn.cn_lkflags = LK_SHARED;
 	cn.cn_pnbuf = NULL;
 	cn.cn_nameptr = name;
 	cn.cn_namelen = fnieo.namelen;
 	err = cache_lookup(dvp, &vp, &cn, NULL, NULL);
 	MPASS(err == 0);
 	fuse_vnode_clear_attr_cache(dvp);
 	vput(dvp);
 	return (0);
 }
 
 /*
  * Handle an asynchronous "invalidate inode" notification from the daemon.
  *
  * Reads a struct fuse_notify_inval_inode_out from 'uio'.  If the vnode for
  * that inode is currently cached, its attribute cache is cleared and, when
  * the message's 'off' is not negative, its buffers are invalidated as well.
  * Returns 0 on success or when the vnode is not cached, else the error from
  * uiomove() or from looking up the vnode.
  */
 int
 fuse_internal_invalidate_inode(struct mount *mp, struct uio *uio)
 {
 	struct fuse_notify_inval_inode_out fniio;
-	struct fuse_data *data = fuse_get_mpdata(mp);
 	struct vnode *vp;
 	int err;
-
-	if (!(data->dataflags & FSESS_EXPORT_SUPPORT)) {
-		/* 
-		 * Linux allows file systems without export support to use
-		 * asynchronous notification because its inode cache is indexed
-		 * purely by the inode number.  But FreeBSD's vnode is cache
-		 * requires access to the entire vnode structure.
-		 */
-		SDT_PROBE1(fusefs, , internal, invalidate_without_export, mp);
-		return (EINVAL);
-	}
 
 	if ((err = uiomove(&fniio, sizeof(fniio), uio)) != 0)
 		return (err);
 
 	/*
 	 * NOTE(review): the root vnode is locked exclusively but any other
 	 * vnode only shared, although both are modified below -- confirm that
 	 * LK_SHARED is sufficient for the non-root case.
 	 */
 	if (fniio.ino == FUSE_ROOT_ID)
 		err = VFS_ROOT(mp, LK_EXCLUSIVE, &vp);
 	else
 		err = fuse_internal_get_cached_vnode(mp, fniio.ino, LK_SHARED,
 			&vp);
 	if (err != 0 || vp == NULL)
 		return (err);
 	/*
 	 * XXX we can't check vp's generation because the FUSE invalidate
 	 * inode message doesn't include it.  Worst case is that we invalidate
 	 * an inode that didn't need to be invalidated.
 	 */
 
 	/* 
 	 * Flush and invalidate buffers if off >= 0.  Technically we only need
 	 * to flush and invalidate the range of offsets [off, off + len), but
 	 * for simplicity's sake we do everything.
 	 */
 	if (fniio.off >= 0)
 		fuse_io_invalbuf(vp, curthread);
 	fuse_vnode_clear_attr_cache(vp);
 	vput(vp);
 	return (0);
 }
 
 /*
  * Create a file system node with FUSE_MKNOD.
  *
  * Daemons speaking protocol 7.12 or later receive the full fuse_mknod_in,
  * including the caller's umask; older daemons get only the first
  * FUSE_COMPAT_MKNOD_IN_SIZE bytes.  Returns the result of
  * fuse_internal_newentry().
  */
 int
 fuse_internal_mknod(struct vnode *dvp, struct vnode **vpp,
 	struct componentname *cnp, struct vattr *vap)
 {
 	struct fuse_data *data;
 	struct fuse_mknod_in fmni;
 	size_t insize;
 
 	data = fuse_get_mpdata(dvp->v_mount);
 
 	/*
 	 * The first 'insize' bytes of fmni are copied verbatim into the
 	 * request for the daemon, so clear the whole structure first: no
 	 * field or padding that is not explicitly set below may carry stale
 	 * kernel stack contents.
 	 */
 	bzero(&fmni, sizeof(fmni));
 	fmni.mode = MAKEIMODE(vap->va_type, vap->va_mode);
 	fmni.rdev = vap->va_rdev;
 	if (fuse_libabi_geq(data, 7, 12)) {
 		insize = sizeof(fmni);
 		fmni.umask = curthread->td_proc->p_fd->fd_cmask;
 	} else {
 		insize = FUSE_COMPAT_MKNOD_IN_SIZE;
 	}
 	return (fuse_internal_newentry(dvp, vpp, cnp, FUSE_MKNOD, &fmni,
 	    insize, vap->va_type));
 }
 
 /* readdir */
 
 /*
  * Read directory entries of 'vp' through file handle 'fufh' into 'uio'.
  *
  * FUSE_READDIR requests are issued repeatedly, starting at the uio's current
  * offset, until the uio is full, an error occurs, or
  * fuse_internal_readdir_processdata() reports that it is finished (-1).
  * Entries located before 'startoff' are skipped rather than copied out.
  * 'cookediov', 'ncookies' and 'cookies' are passed through to
  * fuse_internal_readdir_processdata().
  *
  * Returns 0 on success (including "finished"), else an errno value.
  */
 int
 fuse_internal_readdir(struct vnode *vp,
     struct uio *uio,
     off_t startoff,
     struct fuse_filehandle *fufh,
     struct fuse_iov *cookediov,
     int *ncookies,
     u_long *cookies)
 {
 	int err = 0;
 	struct fuse_dispatcher fdi;
 	struct fuse_read_in *fri = NULL;
 	int fnd_start;
 
 	if (uio_resid(uio) == 0)
 		return 0;
 	fdisp_init(&fdi, 0);
 
 	/*
 	 * Note that we DO NOT have a UIO_SYSSPACE here (so no need for p2p
 	 * I/O).
 	 */
 
 	/*
 	 * fnd_start is set non-zero once the offset in the directory gets
 	 * to the startoff.  This is done because directories must be read
 	 * from the beginning (offset == 0) when fuse_vnop_readdir() needs
 	 * to do an open of the directory.
 	 * If it is not set non-zero here, it will be set non-zero in
 	 * fuse_internal_readdir_processdata() when uio_offset == startoff.
 	 */
 	fnd_start = 0;
 	if (uio->uio_offset == startoff)
 		fnd_start = 1;
 	while (uio_resid(uio) > 0) {
 		/*
 		 * iosize is set again on every pass because it is also read
 		 * back below as the size of the answer.
 		 */
 		fdi.iosize = sizeof(*fri);
 		/* Build the request the first time, reuse it afterwards */
 		if (fri == NULL)
 			fdisp_make_vp(&fdi, FUSE_READDIR, vp, NULL, NULL);
 		else
 			fdisp_refresh_vp(&fdi, FUSE_READDIR, vp, NULL, NULL);
 
 		fri = fdi.indata;
 		fri->fh = fufh->fh_id;
 		fri->offset = uio_offset(uio);
 		/* Never ask for more than the mount's max_read */
 		fri->size = MIN(uio->uio_resid,
 		    fuse_get_mpdata(vp->v_mount)->max_read);
 
 		if ((err = fdisp_wait_answ(&fdi)))
 			break;
 		if ((err = fuse_internal_readdir_processdata(uio, startoff,
 		    &fnd_start, fri->size, fdi.answ, fdi.iosize, cookediov,
 		    ncookies, &cookies)))
 			break;
 	}
 
 	fdisp_destroy(&fdi);
 	/* -1 only means "finished"; it is not an error for the caller */
 	return ((err == -1) ? 0 : err);
 }
 
 /*
  * Return -1 to indicate that this readdir is finished, 0 if it copied
  * all the directory data read in and it may be possible to read more
  * and greater than 0 for a failure.
  */
 int
 fuse_internal_readdir_processdata(struct uio *uio,
     off_t startoff,
     int *fnd_start,
     size_t reqsize,
     void *buf,
     size_t bufsize,
     struct fuse_iov *cookediov,
     int *ncookies,
     u_long **cookiesp)
 {
 	int err = 0;
 	int bytesavail;
 	size_t freclen;
 
 	struct dirent *de;
 	struct fuse_dirent *fudge;
 	u_long *cookies;
 
 	/* Work on a local cursor; it is written back before returning */
 	cookies = *cookiesp;
 	/* Not even one entry header in the answer: nothing more to read */
 	if (bufsize < FUSE_NAME_OFFSET)
 		return -1;
 	/* Walk the fuse_dirent records in buf, one per iteration */
 	for (;;) {
 		if (bufsize < FUSE_NAME_OFFSET) {
 			err = -1;
 			break;
 		}
 		fudge = (struct fuse_dirent *)buf;
 		/* Size of this record within buf, as given by FUSE_DIRENT_SIZE */
 		freclen = FUSE_DIRENT_SIZE(fudge);
 
 		if (bufsize < freclen) {
 			/*
 			 * This indicates a partial directory entry at the
 			 * end of the directory data.
 			 */
 			err = -1;
 			break;
 		}
 #ifdef ZERO_PAD_INCOMPLETE_BUFS
 		if (isbzero(buf, FUSE_NAME_OFFSET)) {
 			err = -1;
 			break;
 		}
 #endif
 
 		/* Reject entries with an empty or overlong name */
 		if (!fudge->namelen || fudge->namelen > MAXNAMLEN) {
 			err = EINVAL;
 			break;
 		}
 		/* Length of the struct dirent record emitted for this entry */
 		bytesavail = GENERIC_DIRSIZ((struct pseudo_dirent *)
 					    &fudge->namelen);
 
 		if (bytesavail > uio_resid(uio)) {
 			/* Out of space for the dir so we are done. */
 			err = -1;
 			break;
 		}
 		/*
 		 * Don't start to copy the directory entries out until
 		 * the requested offset in the directory is found.
 		 */
 		if (*fnd_start != 0) {
 			/* Build the dirent in the scratch iov, zeroed first */
 			fiov_adjust(cookediov, bytesavail);
 			bzero(cookediov->base, bytesavail);
 
 			de = (struct dirent *)cookediov->base;
 			de->d_fileno = fudge->ino;
 			de->d_reclen = bytesavail;
 			de->d_type = fudge->type;
 			de->d_namlen = fudge->namelen;
 			/*
 			 * The destination is presumably the d_name member,
 			 * assuming it is the last MAXNAMLEN + 1 bytes of
 			 * struct dirent -- TODO confirm.
 			 */
 			memcpy((char *)cookediov->base + sizeof(struct dirent) -
 			       MAXNAMLEN - 1,
 			       (char *)buf + FUSE_NAME_OFFSET, fudge->namelen);
 			dirent_terminate(de);
 
 			err = uiomove(cookediov->base, cookediov->len, uio);
 			if (err)
 				break;
 			if (cookies != NULL) {
 				/* No cookie slot left: stop after this entry */
 				if (*ncookies == 0) {
 					err = -1;
 					break;
 				}
 				*cookies = fudge->off;
 				cookies++;
 				(*ncookies)--;
 			}
 		} else if (startoff == fudge->off)
 			*fnd_start = 1;
 		/* Step to the next record and record how far we have got */
 		buf = (char *)buf + freclen;
 		bufsize -= freclen;
 		uio_setoffset(uio, fudge->off);
 	}
 	*cookiesp = cookies;
 
 	return err;
 }
 
 /* remove */
 
 int
 fuse_internal_remove(struct vnode *dvp,
     struct vnode *vp,
     struct componentname *cnp,
     enum fuse_opcode op)
 {
 	struct fuse_dispatcher fdi;
 	int err = 0;
 
 	fdisp_init(&fdi, cnp->cn_namelen + 1);
 	fdisp_make_vp(&fdi, op, dvp, cnp->cn_thread, cnp->cn_cred);
 
 	memcpy(fdi.indata, cnp->cn_nameptr, cnp->cn_namelen);
 	((char *)fdi.indata)[cnp->cn_namelen] = '\0';
 
 	err = fdisp_wait_answ(&fdi);
 	fdisp_destroy(&fdi);
 	return err;
 }
 
 /* rename */
 
 int
 fuse_internal_rename(struct vnode *fdvp,
     struct componentname *fcnp,
     struct vnode *tdvp,
     struct componentname *tcnp)
 {
 	struct fuse_dispatcher fdi;
 	struct fuse_rename_in *fri;
 	int err = 0;
 
 	fdisp_init(&fdi, sizeof(*fri) + fcnp->cn_namelen + tcnp->cn_namelen + 2);
 	fdisp_make_vp(&fdi, FUSE_RENAME, fdvp, tcnp->cn_thread, tcnp->cn_cred);
 
 	fri = fdi.indata;
 	fri->newdir = VTOI(tdvp);
 	memcpy((char *)fdi.indata + sizeof(*fri), fcnp->cn_nameptr,
 	    fcnp->cn_namelen);
 	((char *)fdi.indata)[sizeof(*fri) + fcnp->cn_namelen] = '\0';
 	memcpy((char *)fdi.indata + sizeof(*fri) + fcnp->cn_namelen + 1,
 	    tcnp->cn_nameptr, tcnp->cn_namelen);
 	((char *)fdi.indata)[sizeof(*fri) + fcnp->cn_namelen +
 	    tcnp->cn_namelen + 1] = '\0';
 
 	err = fdisp_wait_answ(&fdi);
 	fdisp_destroy(&fdi);
 	return err;
 }
 
 /* strategy */
 
 /* entity creation */
 
 /*
  * Build, in 'fdip', a request of type 'op' addressed to node 'dnid'.  The
  * payload is the 'bufsize' bytes at 'buf' followed by the NUL-terminated
  * name from 'cnp'.  The request is only prepared here, not sent.
  */
 void
 fuse_internal_newentry_makerequest(struct mount *mp,
     uint64_t dnid,
     struct componentname *cnp,
     enum fuse_opcode op,
     void *buf,
     size_t bufsize,
     struct fuse_dispatcher *fdip)
 {
 	char *payload;
 
 	fdip->iosize = bufsize + cnp->cn_namelen + 1;
 	fdisp_make(fdip, op, mp, dnid, cnp->cn_thread, cnp->cn_cred);
 
 	payload = fdip->indata;
 	memcpy(payload, buf, bufsize);
 	memcpy(payload + bufsize, cnp->cn_nameptr, cnp->cn_namelen);
 	payload[bufsize + cnp->cn_namelen] = '\0';
 }
 
 int
 fuse_internal_newentry_core(struct vnode *dvp,
     struct vnode **vpp,
     struct componentname *cnp,
     enum vtype vtyp,
     struct fuse_dispatcher *fdip)
 {
 	int err = 0;
 	struct fuse_entry_out *feo;
 	struct mount *mp = vnode_mount(dvp);
 
 	if ((err = fdisp_wait_answ(fdip))) {
 		return err;
 	}
 	feo = fdip->answ;
 
 	if ((err = fuse_internal_checkentry(feo, vtyp))) {
 		return err;
 	}
 	err = fuse_vnode_get(mp, feo, feo->nodeid, dvp, vpp, cnp, vtyp);
 	if (err) {
 		fuse_internal_forget_send(mp, cnp->cn_thread, cnp->cn_cred,
 		    feo->nodeid, 1);
 		return err;
 	}
 
 	/* 
 	 * Purge the parent's attribute cache because the daemon should've
 	 * updated its mtime and ctime
 	 */
 	fuse_vnode_clear_attr_cache(dvp);
 
 	fuse_internal_cache_attrs(*vpp, NULL, &feo->attr, feo->attr_valid,
 		feo->attr_valid_nsec, NULL);
 
 	return err;
 }
 
 /*
  * Create a new entry named by 'cnp' in directory 'dvp': build the request
  * 'op' with payload 'buf'/'bufsize', send it, and return the resulting vnode
  * in *vpp.  Returns 0 or an errno value.
  */
 int
 fuse_internal_newentry(struct vnode *dvp,
     struct vnode **vpp,
     struct componentname *cnp,
     enum fuse_opcode op,
     void *buf,
     size_t bufsize,
     enum vtype vtype)
 {
 	struct fuse_dispatcher fdi;
 	int error;
 
 	/* The real payload size is set by the makerequest step */
 	fdisp_init(&fdi, 0);
 	fuse_internal_newentry_makerequest(vnode_mount(dvp), VTOI(dvp), cnp,
 	    op, buf, bufsize, &fdi);
 	error = fuse_internal_newentry_core(dvp, vpp, cnp, vtype, &fdi);
 	fdisp_destroy(&fdi);
 
 	return (error);
 }
 
 /* entity destruction */
 
 int
 fuse_internal_forget_callback(struct fuse_ticket *ftick, struct uio *uio)
 {
 	fuse_internal_forget_send(ftick->tk_data->mp, curthread, NULL,
 	    ((struct fuse_in_header *)ftick->tk_ms_fiov.base)->nodeid, 1);
 
 	return 0;
 }
 
 /*
  * Queue a FUSE_FORGET for 'nodeid' carrying lookup count 'nlookup'.  The
  * message is only inserted into the queue; no answer is waited for.
  * Note that 'nlookup' is not checked for being nonzero.
  */
 void
 fuse_internal_forget_send(struct mount *mp,
     struct thread *td,
     struct ucred *cred,
     uint64_t nodeid,
     uint64_t nlookup)
 {
 	struct fuse_dispatcher fdi;
 
 	fdisp_init(&fdi, sizeof(struct fuse_forget_in));
 	fdisp_make(&fdi, FUSE_FORGET, mp, nodeid, td, cred);
 
 	((struct fuse_forget_in *)fdi.indata)->nlookup = nlookup;
 
 	fuse_insert_message(fdi.tick, false);
 	fdisp_destroy(&fdi);
 }
 
 /* Fetch the vnode's attributes from the daemon*/
 int
 fuse_internal_do_getattr(struct vnode *vp, struct vattr *vap,
 	struct ucred *cred, struct thread *td)
 {
 	struct fuse_dispatcher fdi;
 	struct fuse_vnode_data *fvdat = VTOFUD(vp);
 	struct fuse_getattr_in *fgai;
 	struct fuse_attr_out *fao;
 	off_t old_filesize = fvdat->cached_attrs.va_size;
 	enum vtype vtyp;
 	int err;
 
 	fdisp_init(&fdi, 0);
 	fdisp_make_vp(&fdi, FUSE_GETATTR, vp, td, cred);
 	fgai = fdi.indata;
 	/* 
 	 * We could look up a file handle and set it in fgai->fh, but that
 	 * involves extra runtime work and I'm unaware of any file systems that
 	 * care.
 	 */
 	fgai->getattr_flags = 0;
 	if ((err = fdisp_simple_putget_vp(&fdi, FUSE_GETATTR, vp, td, cred))) {
 		if (err == ENOENT)
 			fuse_internal_vnode_disappear(vp);
 		goto out;
 	}
 
 	fao = (struct fuse_attr_out *)fdi.answ;
 	vtyp = IFTOVT(fao->attr.mode);
 	if (fvdat->flag & FN_SIZECHANGE)
 		fao->attr.size = old_filesize;
 	fuse_internal_cache_attrs(vp, NULL, &fao->attr, fao->attr_valid,
 		fao->attr_valid_nsec, vap);
 	if (vtyp != vnode_vtype(vp)) {
 		fuse_internal_vnode_disappear(vp);
 		err = ENOENT;
 	}
 
 out:
 	fdisp_destroy(&fdi);
 	return err;
 }
 
 /*
  * Read a vnode's attributes into 'vap': from the attribute cache if VTOVA()
  * yields cached attributes, else by asking the fuse daemon.
  */
 int
 fuse_internal_getattr(struct vnode *vp, struct vattr *vap, struct ucred *cred,
 	struct thread *td)
 {
 	struct vattr *cached = VTOVA(vp);
 
 	if (cached == NULL)
 		return (fuse_internal_do_getattr(vp, vap, cred, td));
 
 	*vap = *cached;	/* struct copy */
 	return (0);
 }
 
 /*
  * Mark 'vp' as revoked: set FN_REVOKED, reset both its attribute and entry
  * cache timeouts, and purge it from the name cache.  The vnode must be
  * exclusively locked.
  */
 void
 fuse_internal_vnode_disappear(struct vnode *vp)
 {
 	struct fuse_vnode_data *fvdat;
 
 	ASSERT_VOP_ELOCKED(vp, "fuse_internal_vnode_disappear");
 
 	fvdat = VTOFUD(vp);
 	fvdat->flag |= FN_REVOKED;
 	bintime_clear(&fvdat->attr_cache_timeout);
 	bintime_clear(&fvdat->entry_cache_timeout);
 	cache_purge(vp);
 }
 
 /* fuse start/stop */
 
 int
 fuse_internal_init_callback(struct fuse_ticket *tick, struct uio *uio)
 {
 	int err = 0;
 	struct fuse_data *data = tick->tk_data;
 	struct fuse_init_out *fiio;
 
 	if ((err = tick->tk_aw_ohead.error)) {
 		goto out;
 	}
 	if ((err = fticket_pull(tick, uio))) {
 		goto out;
 	}
 	fiio = fticket_resp(tick)->base;
 
 	/* XXX: Do we want to check anything further besides this? */
 	if (fiio->major < 7) {
 		SDT_PROBE2(fusefs, , internal, trace, 1,
 			"userpace version too low");
 		err = EPROTONOSUPPORT;
 		goto out;
 	}
 	data->fuse_libabi_major = fiio->major;
 	data->fuse_libabi_minor = fiio->minor;
 
 	if (fuse_libabi_geq(data, 7, 5)) {
 		if (fticket_resp(tick)->len == sizeof(struct fuse_init_out)) {
 			data->max_write = fiio->max_write;
 			if (fiio->flags & FUSE_ASYNC_READ)
 				data->dataflags |= FSESS_ASYNC_READ;
 			if (fiio->flags & FUSE_POSIX_LOCKS)
 				data->dataflags |= FSESS_POSIX_LOCKS;
 			if (fiio->flags & FUSE_EXPORT_SUPPORT)
 				data->dataflags |= FSESS_EXPORT_SUPPORT;
 			/* 
 			 * Don't bother to check FUSE_BIG_WRITES, because it's
 			 * redundant with max_write
 			 */
 		} else {
 			err = EINVAL;
 		}
 	} else {
 		/* Old fix values */
 		data->max_write = 4096;
 	}
 
 out:
 	if (err) {
 		fdata_set_dead(data);
 	}
 	FUSE_LOCK();
 	data->dataflags |= FSESS_INITED;
 	wakeup(&data->ticketer);
 	FUSE_UNLOCK();
 
 	return 0;
 }
 
 /*
  * Queue the FUSE_INIT request that opens the session with the daemon.  The
  * answer is handled asynchronously by fuse_internal_init_callback.
  */
 void
 fuse_internal_send_init(struct fuse_data *data, struct thread *td)
 {
 	struct fuse_dispatcher fdi;
 	struct fuse_init_in *req;
 
 	fdisp_init(&fdi, sizeof(*req));
 	fdisp_make(&fdi, FUSE_INIT, data->mp, 0, td, NULL);
 
 	req = fdi.indata;
 	req->major = FUSE_KERNEL_VERSION;
 	req->minor = FUSE_KERNEL_MINOR_VERSION;
 	/* 
 	 * fusefs currently doesn't do any readahead other than fetching whole
 	 * buffer cache block sized regions at once.  So the max readahead is
 	 * the size of a buffer cache block.
 	 */
 	req->max_readahead = maxbcachebuf;
 	/*
 	 * Unsupported features:
 	 * FUSE_FILE_OPS: No known FUSE server or client supports it
 	 * FUSE_ATOMIC_O_TRUNC: our VFS cannot support it
 	 * FUSE_DONT_MASK: unlike Linux, FreeBSD always applies the umask, even
 	 *	when default ACLs are in use.
 	 */
 	req->flags = FUSE_ASYNC_READ | FUSE_POSIX_LOCKS | FUSE_EXPORT_SUPPORT
 		| FUSE_BIG_WRITES;
 
 	fuse_insert_callback(fdi.tick, fuse_internal_init_callback);
 	fuse_insert_message(fdi.tick, false);
 	fdisp_destroy(&fdi);
 }
 
 /* 
  * Send a FUSE_SETATTR operation with no permissions checks.  If cred is NULL,
  * send the request with root credentials
  */
 int fuse_internal_setattr(struct vnode *vp, struct vattr *vap,
 	struct thread *td, struct ucred *cred)
 {
 	struct fuse_dispatcher fdi;
 	struct fuse_setattr_in *fsai;
 	struct mount *mp;
 	pid_t pid = td->td_proc->p_pid;
 	struct fuse_data *data;
 	int dataflags;
 	int err = 0;
 	enum vtype vtyp;
 	int sizechanged = -1;
 	uint64_t newsize = 0;
 
 	mp = vnode_mount(vp);
 	data = fuse_get_mpdata(mp);
 	dataflags = data->dataflags;
 
 	fdisp_init(&fdi, sizeof(*fsai));
 	fdisp_make_vp(&fdi, FUSE_SETATTR, vp, td, cred);
 	if (!cred) {
 		fdi.finh->uid = 0;
 		fdi.finh->gid = 0;
 	}
 	fsai = fdi.indata;
 	fsai->valid = 0;
 
 	if (vap->va_uid != (uid_t)VNOVAL) {
 		fsai->uid = vap->va_uid;
 		fsai->valid |= FATTR_UID;
 	}
 	if (vap->va_gid != (gid_t)VNOVAL) {
 		fsai->gid = vap->va_gid;
 		fsai->valid |= FATTR_GID;
 	}
 	if (vap->va_size != VNOVAL) {
 		struct fuse_filehandle *fufh = NULL;
 
 		/*Truncate to a new value. */
 		fsai->size = vap->va_size;
 		sizechanged = 1;
 		newsize = vap->va_size;
 		fsai->valid |= FATTR_SIZE;
 
 		fuse_filehandle_getrw(vp, FWRITE, &fufh, cred, pid);
 		if (fufh) {
 			fsai->fh = fufh->fh_id;
 			fsai->valid |= FATTR_FH;
 		}
 		VTOFUD(vp)->flag &= ~FN_SIZECHANGE;
 	}
 	if (vap->va_atime.tv_sec != VNOVAL) {
 		fsai->atime = vap->va_atime.tv_sec;
 		fsai->atimensec = vap->va_atime.tv_nsec;
 		fsai->valid |= FATTR_ATIME;
 		if (vap->va_vaflags & VA_UTIMES_NULL)
 			fsai->valid |= FATTR_ATIME_NOW;
 	}
 	if (vap->va_mtime.tv_sec != VNOVAL) {
 		fsai->mtime = vap->va_mtime.tv_sec;
 		fsai->mtimensec = vap->va_mtime.tv_nsec;
 		fsai->valid |= FATTR_MTIME;
 		if (vap->va_vaflags & VA_UTIMES_NULL)
 			fsai->valid |= FATTR_MTIME_NOW;
 	}
 	if (vap->va_mode != (mode_t)VNOVAL) {
 		fsai->mode = vap->va_mode & ALLPERMS;
 		fsai->valid |= FATTR_MODE;
 	}
 	if (!fsai->valid) {
 		goto out;
 	}
 
 	if ((err = fdisp_wait_answ(&fdi)))
 		goto out;
 	vtyp = IFTOVT(((struct fuse_attr_out *)fdi.answ)->attr.mode);
 
 	if (vnode_vtype(vp) != vtyp) {
 		if (vnode_vtype(vp) == VNON && vtyp != VNON) {
 			SDT_PROBE2(fusefs, , internal, trace, 1, "FUSE: Dang! "
 				"vnode_vtype is VNON and vtype isn't.");
 		} else {
 			/*
 	                 * STALE vnode, ditch
 	                 *
 			 * The vnode has changed its type "behind our back".
 			 * There's nothing really we can do, so let us just
 			 * force an internal revocation and tell the caller to
 			 * try again, if interested.
 	                 */
 			fuse_internal_vnode_disappear(vp);
 			err = EAGAIN;
 		}
 	}
 	if (err == 0) {
 		struct fuse_attr_out *fao = (struct fuse_attr_out*)fdi.answ;
 		fuse_internal_cache_attrs(vp, cred, &fao->attr, fao->attr_valid,
 			fao->attr_valid_nsec, NULL);
 	}
 
 out:
 	fdisp_destroy(&fdi);
 	return err;
 }
 
 #ifdef ZERO_PAD_INCOMPLETE_BUFS
 /*
  * Return 1 if the first 'len' bytes at 'buf' are all zero (which includes
  * len == 0), else 0.
  */
 static int
 isbzero(void *buf, size_t len)
 {
 	const char *bytes = buf;
 	size_t i;	/* same type as 'len', so the comparison can't wrap */
 
 	for (i = 0; i < len; i++) {
 		if (bytes[i])
 			return (0);
 	}
 
 	return (1);
 }
 
 #endif
Index: projects/fuse2/sys/fs/fuse/fuse_vfsops.c
===================================================================
--- projects/fuse2/sys/fs/fuse/fuse_vfsops.c	(revision 348581)
+++ projects/fuse2/sys/fs/fuse/fuse_vfsops.c	(revision 348582)
@@ -1,679 +1,691 @@
 /*-
  * SPDX-License-Identifier: BSD-3-Clause
  *
  * Copyright (c) 2007-2009 Google Inc. and Amit Singh
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions are
  * met:
  *
  * * Redistributions of source code must retain the above copyright
  *   notice, this list of conditions and the following disclaimer.
  * * Redistributions in binary form must reproduce the above
  *   copyright notice, this list of conditions and the following disclaimer
  *   in the documentation and/or other materials provided with the
  *   distribution.
  * * Neither the name of Google Inc. nor the names of its
  *   contributors may be used to endorse or promote products derived from
  *   this software without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  *
  * Copyright (C) 2005 Csaba Henk.
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 #include <sys/cdefs.h>
 __FBSDID("$FreeBSD$");
 
 #include <sys/param.h>
 #include <sys/buf.h>
 #include <sys/module.h>
 #include <sys/systm.h>
 #include <sys/errno.h>
 #include <sys/kernel.h>
 #include <sys/capsicum.h>
 #include <sys/conf.h>
 #include <sys/filedesc.h>
 #include <sys/uio.h>
 #include <sys/malloc.h>
 #include <sys/queue.h>
 #include <sys/lock.h>
 #include <sys/sx.h>
 #include <sys/mutex.h>
 #include <sys/proc.h>
 #include <sys/vnode.h>
 #include <sys/namei.h>
 #include <sys/mount.h>
 #include <sys/sysctl.h>
 #include <sys/fcntl.h>
 
 #include "fuse.h"
 #include "fuse_node.h"
 #include "fuse_ipc.h"
 #include "fuse_internal.h"
 
 #include <sys/priv.h>
 #include <security/mac/mac_framework.h>
 
 SDT_PROVIDER_DECLARE(fusefs);
 /* 
  * Fuse trace probe:
  * arg0: verbosity.  Higher numbers give more verbose messages
  * arg1: Textual message
  */
 SDT_PROBE_DEFINE2(fusefs, , vfsops, trace, "int", "char*");
 
 /* This will do for privilege types for now */
 #ifndef PRIV_VFS_FUSE_ALLOWOTHER
 #define PRIV_VFS_FUSE_ALLOWOTHER PRIV_VFS_MOUNT_NONUSER
 #endif
 #ifndef PRIV_VFS_FUSE_MOUNT_NONUSER
 #define PRIV_VFS_FUSE_MOUNT_NONUSER PRIV_VFS_MOUNT_NONUSER
 #endif
 #ifndef PRIV_VFS_FUSE_SYNC_UNMOUNT
 #define PRIV_VFS_FUSE_SYNC_UNMOUNT PRIV_VFS_MOUNT_NONUSER
 #endif
 
 static vfs_fhtovp_t fuse_vfsop_fhtovp;
 static vfs_mount_t fuse_vfsop_mount;
 static vfs_unmount_t fuse_vfsop_unmount;
 static vfs_root_t fuse_vfsop_root;
 static vfs_statfs_t fuse_vfsop_statfs;
 static vfs_vget_t fuse_vfsop_vget;
 
 struct vfsops fuse_vfsops = {
 	.vfs_fhtovp = fuse_vfsop_fhtovp,
 	.vfs_mount = fuse_vfsop_mount,
 	.vfs_unmount = fuse_vfsop_unmount,
 	.vfs_root = fuse_vfsop_root,
 	.vfs_statfs = fuse_vfsop_statfs,
 	.vfs_vget = fuse_vfsop_vget,
 };
 
 static int fuse_enforce_dev_perms = 0;
 
 SYSCTL_INT(_vfs_fusefs, OID_AUTO, enforce_dev_perms, CTLFLAG_RW,
     &fuse_enforce_dev_perms, 0,
     "enforce fuse device permissions for secondary mounts");
 
 MALLOC_DEFINE(M_FUSEVFS, "fuse_filesystem", "buffer for fuse vfs layer");
 
 static int
 fuse_getdevice(const char *fspec, struct thread *td, struct cdev **fdevp)
 {
 	struct nameidata nd, *ndp = &nd;
 	struct vnode *devvp;
 	struct cdev *fdev;
 	int err;
 
 	/*
 	 * Not an update, or updating the name: look up the name
 	 * and verify that it refers to a sensible disk device.
 	 */
 
 	NDINIT(ndp, LOOKUP, FOLLOW, UIO_SYSSPACE, fspec, td);
 	if ((err = namei(ndp)) != 0)
 		return err;
 	NDFREE(ndp, NDF_ONLY_PNBUF);
 	devvp = ndp->ni_vp;
 
 	if (devvp->v_type != VCHR) {
 		vrele(devvp);
 		return ENXIO;
 	}
 	fdev = devvp->v_rdev;
 	dev_ref(fdev);
 
 	if (fuse_enforce_dev_perms) {
 		/*
 	         * Check if mounter can open the fuse device.
 	         *
 	         * This has significance only if we are doing a secondary mount
 	         * which doesn't involve actually opening fuse devices, but we
 	         * still want to enforce the permissions of the device (in
 	         * order to keep control over the circle of fuse users).
 	         *
 	         * (In case of primary mounts, we are either the superuser so
 	         * we can do anything anyway, or we can mount only if the
 	         * device is already opened by us, ie. we are permitted to open
 	         * the device.)
 	         */
 #if 0
 #ifdef MAC
 		err = mac_check_vnode_open(td->td_ucred, devvp, VREAD | VWRITE);
 		if (!err)
 #endif
 #endif /* 0 */
 			err = VOP_ACCESS(devvp, VREAD | VWRITE, td->td_ucred, td);
 		if (err) {
 			vrele(devvp);
 			dev_rel(fdev);
 			return err;
 		}
 	}
 	/*
 	 * according to coda code, no extra lock is needed --
 	 * although in sys/vnode.h this field is marked "v"
 	 */
 	vrele(devvp);
 
 	if (!fdev->si_devsw ||
 	    strcmp("fuse", fdev->si_devsw->d_name)) {
 		dev_rel(fdev);
 		return ENXIO;
 	}
 	*fdevp = fdev;
 
 	return 0;
 }
 
 #define FUSE_FLAGOPT(fnam, fval) do {				\
 	vfs_flagopt(opts, #fnam, &mntopts, fval);		\
 	vfs_flagopt(opts, "__" #fnam, &__mntopts, fval);	\
 } while (0)
 
 SDT_PROBE_DEFINE1(fusefs, , vfsops, mntopts, "uint64_t");
 SDT_PROBE_DEFINE4(fusefs, , vfsops, mount_err, "char*", "struct fuse_data*",
 	"struct mount*", "int");
 
 static int
 fuse_vfs_remount(struct mount *mp, struct thread *td, uint64_t mntopts,
 	uint32_t max_read, int daemon_timeout)
 {
 	int err = 0;
 	struct fuse_data *data = fuse_get_mpdata(mp);
 	/* Don't allow these options to be changed */
 	const static unsigned long long cant_update_opts = 
 		MNT_USER;	/* Mount owner must be the user running the daemon */
 
 	FUSE_LOCK();
 
 	if ((mp->mnt_flag ^ data->mnt_flag) & cant_update_opts) {
 		err = EOPNOTSUPP;
 		SDT_PROBE4(fusefs, , vfsops, mount_err,
 			"Can't change these mount options during remount",
 			data, mp, err);
 		goto out;
 	}
 	if (((data->dataflags ^ mntopts) & FSESS_MNTOPTS_MASK) ||
 	     (data->max_read != max_read) ||
 	     (data->daemon_timeout != daemon_timeout)) {
 		// TODO: allow changing options where it makes sense
 		err = EOPNOTSUPP;
 		SDT_PROBE4(fusefs, , vfsops, mount_err,
 			"Can't change fuse mount options during remount",
 			data, mp, err);
 		goto out;
 	}
 
 	if (fdata_get_dead(data)) {
 		err = ENOTCONN;
 		SDT_PROBE4(fusefs, , vfsops, mount_err,
 			"device is dead during mount", data, mp, err);
 		goto out;
 	}
 
 	/* Sanity + permission checks */
 	if (!data->daemoncred)
 		panic("fuse daemon found, but identity unknown");
 	if (mntopts & FSESS_DAEMON_CAN_SPY)
 		err = priv_check(td, PRIV_VFS_FUSE_ALLOWOTHER);
 	if (err == 0 && td->td_ucred->cr_uid != data->daemoncred->cr_uid)
 		/* are we allowed to do the first mount? */
 		err = priv_check(td, PRIV_VFS_FUSE_MOUNT_NONUSER);
 
 out:
 	FUSE_UNLOCK();
 	return err;
 }
 
 static int
 fuse_vfsop_fhtovp(struct mount *mp, struct fid *fhp, int flags,
 	struct vnode **vpp)
 {
 	struct fuse_fid *ffhp = (struct fuse_fid *)fhp;
 	struct fuse_vnode_data *fvdat;
 	struct vnode *nvp;
 	int error;
 
 	if (!(fuse_get_mpdata(mp)->dataflags & FSESS_EXPORT_SUPPORT))
 		return EOPNOTSUPP;
 
 	error = VFS_VGET(mp, ffhp->nid, LK_EXCLUSIVE, &nvp);
 	if (error) {
 		*vpp = NULLVP;
 		return (error);
 	}
 	fvdat = VTOFUD(nvp);
 	if (fvdat->generation != ffhp->gen ) {
 		vput(nvp);
 		*vpp = NULLVP;
 		return (ESTALE);
 	}
 	*vpp = nvp;
 	vnode_create_vobject(*vpp, 0, curthread);
 	return (0);
 }
 
 static int
 fuse_vfsop_mount(struct mount *mp)
 {
 	int err;
 
 	uint64_t mntopts, __mntopts;
 	uint32_t max_read;
 	int daemon_timeout;
 	int fd;
 
 	size_t len;
 
 	struct cdev *fdev;
 	struct fuse_data *data = NULL;
 	struct thread *td;
 	struct file *fp, *fptmp;
 	char *fspec, *subtype;
 	struct vfsoptlist *opts;
 
 	subtype = NULL;
 	max_read = ~0;
 	err = 0;
 	mntopts = 0;
 	__mntopts = 0;
 	td = curthread;
 
 	MNT_ILOCK(mp);
 	mp->mnt_flag |= MNT_SYNCHRONOUS;
 	MNT_IUNLOCK(mp);
 	/* Get the new options passed to mount */
 	opts = mp->mnt_optnew;
 
 	if (!opts)
 		return EINVAL;
 
 	/* `fspath' contains the mount point (eg. /mnt/fuse/sshfs); REQUIRED */
 	if (!vfs_getopts(opts, "fspath", &err))
 		return err;
 
 	/*
 	 * With the help of underscored options the mount program
 	 * can inform us from the flags it sets by default
 	 */
 	FUSE_FLAGOPT(allow_other, FSESS_DAEMON_CAN_SPY);
 	FUSE_FLAGOPT(push_symlinks_in, FSESS_PUSH_SYMLINKS_IN);
 	FUSE_FLAGOPT(default_permissions, FSESS_DEFAULT_PERMISSIONS);
 	FUSE_FLAGOPT(no_attrcache, FSESS_NO_ATTRCACHE);
 	FUSE_FLAGOPT(no_readahed, FSESS_NO_READAHEAD);
 	FUSE_FLAGOPT(no_datacache, FSESS_NO_DATACACHE);
 	FUSE_FLAGOPT(no_namecache, FSESS_NO_NAMECACHE);
 	FUSE_FLAGOPT(no_mmap, FSESS_NO_MMAP);
 
 	(void)vfs_scanopt(opts, "max_read=", "%u", &max_read);
 	if (vfs_scanopt(opts, "timeout=", "%u", &daemon_timeout) == 1) {
 		if (daemon_timeout < FUSE_MIN_DAEMON_TIMEOUT)
 			daemon_timeout = FUSE_MIN_DAEMON_TIMEOUT;
 		else if (daemon_timeout > FUSE_MAX_DAEMON_TIMEOUT)
 			daemon_timeout = FUSE_MAX_DAEMON_TIMEOUT;
 	} else {
 		daemon_timeout = FUSE_DEFAULT_DAEMON_TIMEOUT;
 	}
 	subtype = vfs_getopts(opts, "subtype=", &err);
 
 	SDT_PROBE1(fusefs, , vfsops, mntopts, mntopts);
 
 	if (mp->mnt_flag & MNT_UPDATE) {
 		return fuse_vfs_remount(mp, td, mntopts, max_read,
 			daemon_timeout);
 	}
 
 	/* `from' contains the device name (eg. /dev/fuse0); REQUIRED */
 	fspec = vfs_getopts(opts, "from", &err);
 	if (!fspec)
 		return err;
 
 	/* `fd' contains the filedescriptor for this session; REQUIRED */
 	if (vfs_scanopt(opts, "fd", "%d", &fd) != 1)
 		return EINVAL;
 
 	err = fuse_getdevice(fspec, td, &fdev);
 	if (err != 0)
 		return err;
 
 	err = fget(td, fd, &cap_read_rights, &fp);
 	if (err != 0) {
 		SDT_PROBE2(fusefs, , vfsops, trace, 1,
 			"invalid or not opened device");
 		goto out;
 	}
 	fptmp = td->td_fpop;
 	td->td_fpop = fp;
 	err = devfs_get_cdevpriv((void **)&data);
 	td->td_fpop = fptmp;
 	fdrop(fp, td);
 	FUSE_LOCK();
 
 	if (err != 0 || data == NULL) {
 		err = ENXIO;
 		SDT_PROBE4(fusefs, , vfsops, mount_err,
 			"invalid or not opened device", data, mp, err);
 		FUSE_UNLOCK();
 		goto out;
 	}
 	if (fdata_get_dead(data)) {
 		err = ENOTCONN;
 		SDT_PROBE4(fusefs, , vfsops, mount_err,
 			"device is dead during mount", data, mp, err);
 		FUSE_UNLOCK();
 		goto out;
 	}
 	/* Sanity + permission checks */
 	if (!data->daemoncred)
 		panic("fuse daemon found, but identity unknown");
 	if (mntopts & FSESS_DAEMON_CAN_SPY)
 		err = priv_check(td, PRIV_VFS_FUSE_ALLOWOTHER);
 	if (err == 0 && td->td_ucred->cr_uid != data->daemoncred->cr_uid)
 		/* are we allowed to do the first mount? */
 		err = priv_check(td, PRIV_VFS_FUSE_MOUNT_NONUSER);
 	if (err) {
 		FUSE_UNLOCK();
 		goto out;
 	}
 	data->ref++;
 	data->mp = mp;
 	data->dataflags |= mntopts;
 	data->max_read = max_read;
 	data->daemon_timeout = daemon_timeout;
 	data->mnt_flag = mp->mnt_flag & MNT_UPDATEMASK;
 	FUSE_UNLOCK();
 
 	vfs_getnewfsid(mp);
 	MNT_ILOCK(mp);
 	mp->mnt_data = data;
 	/* 
 	 * FUSE file systems can be either local or remote, but the kernel
 	 * can't tell the difference.
 	 */
 	mp->mnt_flag &= ~MNT_LOCAL;
 	mp->mnt_kern_flag |= MNTK_USES_BCACHE;
 	MNT_IUNLOCK(mp);
 	/* We need this here as this slot is used by getnewvnode() */
 	mp->mnt_stat.f_iosize = maxbcachebuf;
 	if (subtype) {
 		strlcat(mp->mnt_stat.f_fstypename, ".", MFSNAMELEN);
 		strlcat(mp->mnt_stat.f_fstypename, subtype, MFSNAMELEN);
 	}
 	copystr(fspec, mp->mnt_stat.f_mntfromname, MNAMELEN - 1, &len);
 	bzero(mp->mnt_stat.f_mntfromname + len, MNAMELEN - len);
 
 	/* Now handshaking with daemon */
 	fuse_internal_send_init(data, td);
 
 out:
 	if (err) {
 		FUSE_LOCK();
 		if (data != NULL && data->mp == mp) {
 			/*
 			 * Destroy device only if we acquired reference to
 			 * it
 			 */
 			SDT_PROBE4(fusefs, , vfsops, mount_err,
 				"mount failed, destroy device", data, mp, err);
 			data->mp = NULL;
 			mp->mnt_data = NULL;
 			fdata_trydestroy(data);
 		}
 		FUSE_UNLOCK();
 		dev_rel(fdev);
 	}
 	return err;
 }
 
 static int
 fuse_vfsop_unmount(struct mount *mp, int mntflags)
 {
 	int err = 0;
 	int flags = 0;
 
 	struct cdev *fdev;
 	struct fuse_data *data;
 	struct fuse_dispatcher fdi;
 	struct thread *td = curthread;
 
 	if (mntflags & MNT_FORCE) {
 		flags |= FORCECLOSE;
 	}
 	data = fuse_get_mpdata(mp);
 	if (!data) {
 		panic("no private data for mount point?");
 	}
 	/* There is 1 extra root vnode reference (mp->mnt_data). */
 	FUSE_LOCK();
 	if (data->vroot != NULL) {
 		struct vnode *vroot = data->vroot;
 
 		data->vroot = NULL;
 		FUSE_UNLOCK();
 		vrele(vroot);
 	} else
 		FUSE_UNLOCK();
 	err = vflush(mp, 0, flags, td);
 	if (err) {
 		return err;
 	}
 	if (fdata_get_dead(data)) {
 		goto alreadydead;
 	}
 	fdisp_init(&fdi, 0);
 	fdisp_make(&fdi, FUSE_DESTROY, mp, 0, td, NULL);
 
 	err = fdisp_wait_answ(&fdi);
 	fdisp_destroy(&fdi);
 
 	fdata_set_dead(data);
 
 alreadydead:
 	FUSE_LOCK();
 	data->mp = NULL;
 	fdev = data->fdev;
 	fdata_trydestroy(data);
 	FUSE_UNLOCK();
 
 	MNT_ILOCK(mp);
 	mp->mnt_data = NULL;
 	MNT_IUNLOCK(mp);
 
 	dev_rel(fdev);
 
 	return 0;
 }
 
+SDT_PROBE_DEFINE1(fusefs, , vfsops, invalidate_without_export,
+	"struct mount*");
 static int
 fuse_vfsop_vget(struct mount *mp, ino_t ino, int flags, struct vnode **vpp)
 {
+	struct fuse_data *data = fuse_get_mpdata(mp);
 	uint64_t nodeid = ino;
 	struct thread *td = curthread;
 	struct fuse_dispatcher fdi;
 	struct fuse_entry_out *feo;
 	struct fuse_vnode_data *fvdat;
 	const char dot[] = ".";
 	off_t filesize;
 	enum vtype vtyp;
 	int error;
+
+	if (!(data->dataflags & FSESS_EXPORT_SUPPORT)) {
+		/*
+		 * fuse_vfsop_fhtovp checks this flag too, so we can only get
+		 * here indirectly, e.g. by exporting a nullfs mount of fusefs.
+		 */
+		SDT_PROBE1(fusefs, , vfsops, invalidate_without_export, mp);
+		return (EOPNOTSUPP);
+	}
 
 	error = fuse_internal_get_cached_vnode(mp, ino, flags, vpp);
 	if (error || *vpp != NULL)
 		return error;
 
 	/* Do a LOOKUP, using nodeid as the parent and "." as filename */
 	fdisp_init(&fdi, sizeof(dot));
 	fdisp_make(&fdi, FUSE_LOOKUP, mp, nodeid, td, td->td_ucred);
 	memcpy(fdi.indata, dot, sizeof(dot));
 	error = fdisp_wait_answ(&fdi);
 
 	if (error)
 		return error;
 
 	feo = (struct fuse_entry_out *)fdi.answ;
 	if (feo->nodeid == 0) {
 		/* zero nodeid means ENOENT and cache it */
 		error = ENOENT;
 		goto out;
 	}
 
 	vtyp = IFTOVT(feo->attr.mode);
 	error = fuse_vnode_get(mp, feo, nodeid, NULL, vpp, NULL, vtyp);
 	if (error)
 		goto out;
 	filesize = feo->attr.size;
 
 	/*
 	 * In the case where we are looking up a FUSE node represented by an
 	 * existing cached vnode, and the true size reported by FUSE_LOOKUP
 	 * doesn't match the vnode's cached size, then any cached writes beyond
 	 * the file's current size are lost.
 	 *
 	 * We can get here:
 	 * * following attribute cache expiration, or
 	 * * due a bug in the daemon, or
 	 */
 	fvdat = VTOFUD(*vpp);
 	if (vnode_isreg(*vpp) &&
 	    filesize != fvdat->cached_attrs.va_size &&
 	    fvdat->flag & FN_SIZECHANGE) {
 		printf("%s: WB cache incoherent on %s!\n", __func__,
 		    vnode_mount(*vpp)->mnt_stat.f_mntonname);
 
 		fvdat->flag &= ~FN_SIZECHANGE;
 	}
 
 	fuse_internal_cache_attrs(*vpp, td->td_ucred, &feo->attr,
 		feo->attr_valid, feo->attr_valid_nsec, NULL);
 	fuse_validity_2_bintime(feo->entry_valid, feo->entry_valid_nsec,
 		&fvdat->entry_cache_timeout);
 out:
 	fdisp_destroy(&fdi);
 	return error;
 }
 
 static int
 fuse_vfsop_root(struct mount *mp, int lkflags, struct vnode **vpp)
 {
 	struct fuse_data *data = fuse_get_mpdata(mp);
 	int err = 0;
 
 	if (data->vroot != NULL) {
 		err = vget(data->vroot, lkflags, curthread);
 		if (err == 0)
 			*vpp = data->vroot;
 	} else {
 		err = fuse_vnode_get(mp, NULL, FUSE_ROOT_ID, NULL, vpp, NULL,
 		    VDIR);
 		if (err == 0) {
 			FUSE_LOCK();
 			MPASS(data->vroot == NULL || data->vroot == *vpp);
 			if (data->vroot == NULL) {
 				SDT_PROBE2(fusefs, , vfsops, trace, 1,
 					"new root vnode");
 				data->vroot = *vpp;
 				FUSE_UNLOCK();
 				vref(*vpp);
 			} else if (data->vroot != *vpp) {
 				SDT_PROBE2(fusefs, , vfsops, trace, 1,
 					"root vnode race");
 				FUSE_UNLOCK();
 				VOP_UNLOCK(*vpp, 0);
 				vrele(*vpp);
 				vrecycle(*vpp);
 				*vpp = data->vroot;
 			} else
 				FUSE_UNLOCK();
 		}
 	}
 	return err;
 }
 
 static int
 fuse_vfsop_statfs(struct mount *mp, struct statfs *sbp)
 {
 	struct fuse_dispatcher fdi;
 	int err = 0;
 
 	struct fuse_statfs_out *fsfo;
 	struct fuse_data *data;
 
 	data = fuse_get_mpdata(mp);
 
 	if (!(data->dataflags & FSESS_INITED))
 		goto fake;
 
 	fdisp_init(&fdi, 0);
 	fdisp_make(&fdi, FUSE_STATFS, mp, FUSE_ROOT_ID, NULL, NULL);
 	err = fdisp_wait_answ(&fdi);
 	if (err) {
 		fdisp_destroy(&fdi);
 		if (err == ENOTCONN) {
 			/*
 	                 * We want to seem a legitimate fs even if the daemon
 	                 * is stiff dead... (so that, eg., we can still do path
 	                 * based unmounting after the daemon dies).
 	                 */
 			goto fake;
 		}
 		return err;
 	}
 	fsfo = fdi.answ;
 
 	sbp->f_blocks = fsfo->st.blocks;
 	sbp->f_bfree = fsfo->st.bfree;
 	sbp->f_bavail = fsfo->st.bavail;
 	sbp->f_files = fsfo->st.files;
 	sbp->f_ffree = fsfo->st.ffree;	/* cast from uint64_t to int64_t */
 	sbp->f_namemax = fsfo->st.namelen;
 	sbp->f_bsize = fsfo->st.frsize;	/* cast from uint32_t to uint64_t */
 
 	fdisp_destroy(&fdi);
 	return 0;
 
 fake:
 	sbp->f_blocks = 0;
 	sbp->f_bfree = 0;
 	sbp->f_bavail = 0;
 	sbp->f_files = 0;
 	sbp->f_ffree = 0;
 	sbp->f_namemax = 0;
 	sbp->f_bsize = S_BLKSIZE;
 
 	return 0;
 }
Index: projects/fuse2/tests/sys/fs/fusefs/notify.cc
===================================================================
--- projects/fuse2/tests/sys/fs/fusefs/notify.cc	(revision 348581)
+++ projects/fuse2/tests/sys/fs/fusefs/notify.cc	(revision 348582)
@@ -1,464 +1,459 @@
 /*-
  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
  *
  * Copyright (c) 2019 The FreeBSD Foundation
  *
  * This software was developed by BFF Storage Systems, LLC under sponsorship
  * from the FreeBSD Foundation.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */
 
 extern "C" {
 #include <sys/types.h>
 #include <sys/sysctl.h>
 
 #include <fcntl.h>
 #include <pthread.h>
 }
 
 #include "mockfs.hh"
 #include "utils.hh"
 
 using namespace testing;
 
 /*
  * FUSE asynchonous notification
  *
  * FUSE servers can send unprompted notification messages for things like cache
  * invalidation.  This file tests our client's handling of those messages.
  */
 
 class Notify: public FuseTest {
 public:
-virtual void SetUp() {
-	m_init_flags = FUSE_EXPORT_SUPPORT;
-	FuseTest::SetUp();
-}
-
 void expect_lookup(uint64_t parent, const char *relpath, uint64_t ino,
 	off_t size, Sequence &seq)
 {
 	EXPECT_LOOKUP(parent, relpath)
 	.InSequence(seq)
 	.WillOnce(Invoke(
 		ReturnImmediate([=](auto in __unused, auto& out) {
 		SET_OUT_HEADER_LEN(out, entry);
 		out.body.entry.attr.mode = S_IFREG | 0644;
 		out.body.entry.nodeid = ino;
 		out.body.entry.attr.ino = ino;
 		out.body.entry.attr.nlink = 1;
 		out.body.entry.attr.size = size;
 		out.body.entry.attr_valid = UINT64_MAX;
 		out.body.entry.entry_valid = UINT64_MAX;
 	})));
 }
 };
 
 class NotifyWriteback: public Notify {
 public:
 virtual void SetUp() {
 	const char *node = "vfs.fusefs.data_cache_mode";
 	int val = 0;
 	size_t size = sizeof(val);
 
 	Notify::SetUp();
 	if (IsSkipped())
 		return;
 
 	ASSERT_EQ(0, sysctlbyname(node, &val, &size, NULL, 0))
 		<< strerror(errno);
 	if (val != 2)
 		GTEST_SKIP() << "vfs.fusefs.data_cache_mode must be set to 2 "
 			"(writeback) for this test";
 }
 
 void expect_write(uint64_t ino, uint64_t offset, uint64_t size,
 	const void *contents)
 {
 	FuseTest::expect_write(ino, offset, size, size, 0, 0, contents);
 }
 
 };
 
 struct inval_entry_args {
 	MockFS		*mock;
 	ino_t		parent;
 	const char	*name;
 	size_t		namelen;
 };
 
 static void* inval_entry(void* arg) {
 	const struct inval_entry_args *iea = (struct inval_entry_args*)arg;
 	ssize_t r;
 
 	r = iea->mock->notify_inval_entry(iea->parent, iea->name, iea->namelen);
 	if (r >= 0)
 		return 0;
 	else
 		return (void*)(intptr_t)errno;
 }
 
 struct inval_inode_args {
 	MockFS		*mock;
 	ino_t		ino;
 	off_t		off;
 	ssize_t		len;
 };
 
 static void* inval_inode(void* arg) {
 	const struct inval_inode_args *iia = (struct inval_inode_args*)arg;
 	ssize_t r;
 
 	r = iia->mock->notify_inval_inode(iia->ino, iia->off, iia->len);
 	if (r >= 0)
 		return 0;
 	else
 		return (void*)(intptr_t)errno;
 }
 
 /* Invalidate a nonexistent entry */
 TEST_F(Notify, inval_entry_nonexistent)
 {
 	const static char *name = "foo";
 	struct inval_entry_args iea;
 	void *thr0_value;
 	pthread_t th0;
 
 	iea.mock = m_mock;
 	iea.parent = FUSE_ROOT_ID;
 	iea.name = name;
 	iea.namelen = strlen(name);
 	ASSERT_EQ(0, pthread_create(&th0, NULL, inval_entry, &iea))
 		<< strerror(errno);
 	pthread_join(th0, &thr0_value);
 	/* It's not an error for an entry to not be cached */
 	EXPECT_EQ(0, (intptr_t)thr0_value);
 }
 
 /* Invalidate a cached entry */
 TEST_F(Notify, inval_entry)
 {
 	const static char FULLPATH[] = "mountpoint/foo";
 	const static char RELPATH[] = "foo";
 	struct inval_entry_args iea;
 	struct stat sb;
 	void *thr0_value;
 	uint64_t ino0 = 42;
 	uint64_t ino1 = 43;
 	Sequence seq;
 	pthread_t th0;
 
 	expect_lookup(FUSE_ROOT_ID, RELPATH, ino0, 0, seq);
 	expect_lookup(FUSE_ROOT_ID, RELPATH, ino1, 0, seq);
 
 	/* Fill the entry cache */
 	ASSERT_EQ(0, stat(FULLPATH, &sb)) << strerror(errno);
 	EXPECT_EQ(ino0, sb.st_ino);
 
 	/* Now invalidate the entry */
 	iea.mock = m_mock;
 	iea.parent = FUSE_ROOT_ID;
 	iea.name = RELPATH;
 	iea.namelen = strlen(RELPATH);
 	ASSERT_EQ(0, pthread_create(&th0, NULL, inval_entry, &iea))
 		<< strerror(errno);
 	pthread_join(th0, &thr0_value);
 	EXPECT_EQ(0, (intptr_t)thr0_value);
 
 	/* The second lookup should return the alternate ino */
 	ASSERT_EQ(0, stat(FULLPATH, &sb)) << strerror(errno);
 	EXPECT_EQ(ino1, sb.st_ino);
 }
 
 /*
  * Invalidate a cached entry beneath the root, which uses a slightly different
  * code path.
  */
 TEST_F(Notify, inval_entry_below_root)
 {
 	const static char FULLPATH[] = "mountpoint/some_dir/foo";
 	const static char DNAME[] = "some_dir";
 	const static char FNAME[] = "foo";
 	struct inval_entry_args iea;
 	struct stat sb;
 	void *thr0_value;
 	uint64_t dir_ino = 41;
 	uint64_t ino0 = 42;
 	uint64_t ino1 = 43;
 	Sequence seq;
 	pthread_t th0;
 
 	EXPECT_LOOKUP(FUSE_ROOT_ID, DNAME)
 	.WillOnce(Invoke(
 		ReturnImmediate([=](auto in __unused, auto& out) {
 		SET_OUT_HEADER_LEN(out, entry);
 		out.body.entry.attr.mode = S_IFDIR | 0755;
 		out.body.entry.nodeid = dir_ino;
 		out.body.entry.attr.nlink = 2;
 		out.body.entry.attr_valid = UINT64_MAX;
 		out.body.entry.entry_valid = UINT64_MAX;
 	})));
 	expect_lookup(dir_ino, FNAME, ino0, 0, seq);
 	expect_lookup(dir_ino, FNAME, ino1, 0, seq);
 
 	/* Fill the entry cache */
 	ASSERT_EQ(0, stat(FULLPATH, &sb)) << strerror(errno);
 	EXPECT_EQ(ino0, sb.st_ino);
 
 	/* Now invalidate the entry */
 	iea.mock = m_mock;
 	iea.parent = dir_ino;
 	iea.name = FNAME;
 	iea.namelen = strlen(FNAME);
 	ASSERT_EQ(0, pthread_create(&th0, NULL, inval_entry, &iea))
 		<< strerror(errno);
 	pthread_join(th0, &thr0_value);
 	EXPECT_EQ(0, (intptr_t)thr0_value);
 
 	/* The second lookup should return the alternate ino */
 	ASSERT_EQ(0, stat(FULLPATH, &sb)) << strerror(errno);
 	EXPECT_EQ(ino1, sb.st_ino);
 }
 
 /* Invalidating an entry invalidates the parent directory's attributes */
 TEST_F(Notify, inval_entry_invalidates_parent_attrs)
 {
 	const static char FULLPATH[] = "mountpoint/foo";
 	const static char RELPATH[] = "foo";
 	struct inval_entry_args iea;
 	struct stat sb;
 	void *thr0_value;
 	uint64_t ino = 42;
 	Sequence seq;
 	pthread_t th0;
 
 	expect_lookup(FUSE_ROOT_ID, RELPATH, ino, 0, seq);
 	EXPECT_CALL(*m_mock, process(
 		ResultOf([=](auto in) {
 			return (in.header.opcode == FUSE_GETATTR &&
 				in.header.nodeid == FUSE_ROOT_ID);
 		}, Eq(true)),
 		_)
 	).Times(2)
 	.WillRepeatedly(Invoke(ReturnImmediate([=](auto i __unused, auto& out) {
 		SET_OUT_HEADER_LEN(out, attr);
 		out.body.attr.attr.mode = S_IFDIR | 0755;
 		out.body.attr.attr_valid = UINT64_MAX;
 	})));
 
 	/* Fill the attr and entry cache */
 	ASSERT_EQ(0, stat("mountpoint", &sb)) << strerror(errno);
 	ASSERT_EQ(0, stat(FULLPATH, &sb)) << strerror(errno);
 
 	/* Now invalidate the entry */
 	iea.mock = m_mock;
 	iea.parent = FUSE_ROOT_ID;
 	iea.name = RELPATH;
 	iea.namelen = strlen(RELPATH);
 	ASSERT_EQ(0, pthread_create(&th0, NULL, inval_entry, &iea))
 		<< strerror(errno);
 	pthread_join(th0, &thr0_value);
 	EXPECT_EQ(0, (intptr_t)thr0_value);
 
 	/* /'s attribute cache should be cleared */
 	ASSERT_EQ(0, stat("mountpoint", &sb)) << strerror(errno);
 }
 
 
 TEST_F(Notify, inval_inode_nonexistent)
 {
 	struct inval_inode_args iia;
 	ino_t ino = 42;
 	void *thr0_value;
 	pthread_t th0;
 
 	iia.mock = m_mock;
 	iia.ino = ino;
 	iia.off = 0;
 	iia.len = 0;
 	ASSERT_EQ(0, pthread_create(&th0, NULL, inval_inode, &iia))
 		<< strerror(errno);
 	pthread_join(th0, &thr0_value);
 	/* It's not an error for an inode to not be cached */
 	EXPECT_EQ(0, (intptr_t)thr0_value);
 }
 
 TEST_F(Notify, inval_inode_with_clean_cache)
 {
 	const static char FULLPATH[] = "mountpoint/foo";
 	const static char RELPATH[] = "foo";
 	const char CONTENTS0[] = "abcdefgh";
 	const char CONTENTS1[] = "ijklmnopqrstuvwxyz";
 	struct inval_inode_args iia;
 	struct stat sb;
 	ino_t ino = 42;
 	void *thr0_value;
 	Sequence seq;
 	uid_t uid = 12345;
 	pthread_t th0;
 	ssize_t size0 = sizeof(CONTENTS0);
 	ssize_t size1 = sizeof(CONTENTS1);
 	char buf[80];
 	int fd;
 
 	expect_lookup(FUSE_ROOT_ID, RELPATH, ino, size0, seq);
 	expect_open(ino, 0, 1);
 	EXPECT_CALL(*m_mock, process(
 		ResultOf([=](auto in) {
 			return (in.header.opcode == FUSE_GETATTR &&
 				in.header.nodeid == ino);
 		}, Eq(true)),
 		_)
 	).WillOnce(Invoke(ReturnImmediate([=](auto i __unused, auto& out) {
 		SET_OUT_HEADER_LEN(out, attr);
 		out.body.attr.attr.mode = S_IFREG | 0644;
 		out.body.attr.attr_valid = UINT64_MAX;
 		out.body.attr.attr.size = size1;
 		out.body.attr.attr.uid = uid;
 	})));
 	expect_read(ino, 0, size0, size0, CONTENTS0);
 	expect_read(ino, 0, size1, size1, CONTENTS1);
 
 	/* Fill the data cache */
 	fd = open(FULLPATH, O_RDWR);
 	ASSERT_LE(0, fd) << strerror(errno);
 	ASSERT_EQ(size0, read(fd, buf, size0)) << strerror(errno);
 	EXPECT_EQ(0, memcmp(buf, CONTENTS0, size0));
 
 	/* Evict the data cache */
 	iia.mock = m_mock;
 	iia.ino = ino;
 	iia.off = 0;
 	iia.len = 0;
 	ASSERT_EQ(0, pthread_create(&th0, NULL, inval_inode, &iia))
 		<< strerror(errno);
 	pthread_join(th0, &thr0_value);
 	EXPECT_EQ(0, (intptr_t)thr0_value);
 
 	/* cache attributes were been purged; this will trigger a new GETATTR */
 	ASSERT_EQ(0, stat(FULLPATH, &sb)) << strerror(errno);
 	EXPECT_EQ(uid, sb.st_uid);
 	EXPECT_EQ(size1, sb.st_size);
 
 	/* This read should not be serviced by cache */
 	ASSERT_EQ(0, lseek(fd, 0, SEEK_SET)) << strerror(errno);
 	ASSERT_EQ(size1, read(fd, buf, size1)) << strerror(errno);
 	EXPECT_EQ(0, memcmp(buf, CONTENTS1, size1));
 
 	/* Deliberately leak fd.  close(2) will be tested in release.cc */
 }
 
 /* https://bugs.freebsd.org/bugzilla/show_bug.cgi?id=238312 */
 TEST_F(NotifyWriteback, DISABLED_inval_inode_with_dirty_cache)
 {
 	const static char FULLPATH[] = "mountpoint/foo";
 	const static char RELPATH[] = "foo";
 	const char CONTENTS[] = "abcdefgh";
 	struct inval_inode_args iia;
 	ino_t ino = 42;
 	void *thr0_value;
 	Sequence seq;
 	pthread_t th0;
 	ssize_t bufsize = sizeof(CONTENTS);
 	int fd;
 
 	expect_lookup(FUSE_ROOT_ID, RELPATH, ino, 0, seq);
 	expect_open(ino, 0, 1);
 
 	/* Fill the data cache */
 	fd = open(FULLPATH, O_RDWR);
 	ASSERT_EQ(bufsize, write(fd, CONTENTS, bufsize)) << strerror(errno);
 
 	/* Evict the data cache */
 	expect_write(ino, 0, bufsize, CONTENTS);
 	iia.mock = m_mock;
 	iia.ino = ino;
 	iia.off = 0;
 	iia.len = 0;
 	ASSERT_EQ(0, pthread_create(&th0, NULL, inval_inode, &iia))
 		<< strerror(errno);
 	pthread_join(th0, &thr0_value);
 	EXPECT_EQ(0, (intptr_t)thr0_value);
 
 	/* Deliberately leak fd.  close(2) will be tested in release.cc */
 }
 
 /* https://bugs.freebsd.org/bugzilla/show_bug.cgi?id=238312 */
 TEST_F(NotifyWriteback, DISABLED_inval_inode_attrs_only)
 {
 	const static char FULLPATH[] = "mountpoint/foo";
 	const static char RELPATH[] = "foo";
 	const char CONTENTS[] = "abcdefgh";
 	struct inval_inode_args iia;
 	struct stat sb;
 	uid_t uid = 12345;
 	ino_t ino = 42;
 	void *thr0_value;
 	Sequence seq;
 	pthread_t th0;
 	ssize_t bufsize = sizeof(CONTENTS);
 	int fd;
 
 	expect_lookup(FUSE_ROOT_ID, RELPATH, ino, 0, seq);
 	expect_open(ino, 0, 1);
 	EXPECT_CALL(*m_mock, process(
 		ResultOf([=](auto in) {
 			return (in.header.opcode == FUSE_WRITE);
 		}, Eq(true)),
 		_)
 	).Times(0);
 	EXPECT_CALL(*m_mock, process(
 		ResultOf([=](auto in) {
 			return (in.header.opcode == FUSE_GETATTR &&
 				in.header.nodeid == FUSE_ROOT_ID);
 		}, Eq(true)),
 		_)
 	).WillOnce(Invoke(ReturnImmediate([=](auto i __unused, auto& out) {
 		SET_OUT_HEADER_LEN(out, attr);
 		out.body.attr.attr.mode = S_IFREG | 0644;
 		out.body.attr.attr_valid = UINT64_MAX;
 		out.body.attr.attr.size = bufsize;
 		out.body.attr.attr.uid = uid;
 	})));
 
 	/* Fill the data cache */
 	fd = open(FULLPATH, O_RDWR);
 	ASSERT_EQ(bufsize, write(fd, CONTENTS, bufsize)) << strerror(errno);
 
 	/* Evict the attributes, but not data cache */
 	iia.mock = m_mock;
 	iia.ino = ino;
 	iia.off = -1;
 	iia.len = 0;
 	ASSERT_EQ(0, pthread_create(&th0, NULL, inval_inode, &iia))
 		<< strerror(errno);
 	pthread_join(th0, &thr0_value);
 	EXPECT_EQ(0, (intptr_t)thr0_value);
 
 	/* cache attributes were been purged; this will trigger a new GETATTR */
 	ASSERT_EQ(0, stat(FULLPATH, &sb)) << strerror(errno);
 	EXPECT_EQ(uid, sb.st_uid);
 	EXPECT_EQ(bufsize, sb.st_size);
 
 	/* Deliberately leak fd.  close(2) will be tested in release.cc */
 }