miscfs/nullfs/null_vnops.c

54753Sjohnh/*
54753Sjohnh * Copyright (c) 1992 The Regents of the University of California
54753Sjohnh * All rights reserved.
54753Sjohnh *
54766Sjohnh * This code is derived from the null layer of
*54893Sheideman * John Heidemann from the UCLA Ficus project and
*54893Sheideman * Jan-Simon Pendry's loopback file system.
54753Sjohnh *
54753Sjohnh * %sccs.include.redist.c%
54753Sjohnh *
*54893Sheideman *	@(#)null_vnops.c	1.4 (Berkeley) 07/10/92
54766Sjohnh *
54766Sjohnh * Ancestors:
54753Sjohnh *	@(#)lofs_vnops.c	1.2 (Berkeley) 6/18/92
54766Sjohnh *	$Id: lofs_vnops.c,v 1.11 1992/05/30 10:05:43 jsp Exp jsp $
54766Sjohnh *	...and...
54766Sjohnh *	@(#)null_vnodeops.c 1.20 92/07/07 UCLA Ficus project
54753Sjohnh */
54753Sjohnh
54753Sjohnh/*
54766Sjohnh * Null Layer
54766Sjohnh *
54766Sjohnh * The null layer duplicates a portion of the file system
54766Sjohnh * name space under a new name.  In this respect, it is
54766Sjohnh * similar to the loopback file system.  It differs from
54766Sjohnh * the loopback fs in two respects:  it is implemented using
*54893Sheideman * a bypass operation, and its "null-node"s stack above
54766Sjohnh * all lower-layer vnodes, not just over directory vnodes.
54766Sjohnh *
54766Sjohnh * The null layer is the minimum file system layer,
54766Sjohnh * simply bypassing all possible operations to the lower layer
54766Sjohnh * for processing there.  All but vop_getattr, _inactive, _reclaim,
54766Sjohnh * and _print are bypassed.
54766Sjohnh *
54766Sjohnh * Vop_getattr is not bypassed so that we can change the fsid being
54766Sjohnh * returned.  Vop_{inactive,reclaim} are not bypassed so that
54766Sjohnh * they can handle freeing null-layer specific data.
54766Sjohnh * Vop_print is not bypassed for debugging.
54766Sjohnh *
*54893Sheideman *
*54893Sheideman * INVOKING OPERATIONS ON LOWER LAYERS
*54893Sheideman *
54766Sjohnh * NEEDSWORK: Describe methods to invoke operations on the lower layer
54766Sjohnh * (bypass vs. VOP).
*54893Sheideman *
*54893Sheideman *
*54893Sheideman * CREATING NEW FILESYSTEM LAYERS
*54893Sheideman *
*54893Sheideman * One of the easiest ways to construct new file system layers is to make
*54893Sheideman * a copy of the null layer, rename all files and variables, and
*54893Sheideman * then begin modifying the copy.  Sed can be used to easily rename
*54893Sheideman * all variables.
*54893Sheideman *
54753Sjohnh */
54753Sjohnh
54753Sjohnh#include <sys/param.h>
54753Sjohnh#include <sys/systm.h>
54753Sjohnh#include <sys/proc.h>
54753Sjohnh#include <sys/time.h>
54753Sjohnh#include <sys/types.h>
54753Sjohnh#include <sys/vnode.h>
54753Sjohnh#include <sys/mount.h>
54753Sjohnh#include <sys/namei.h>
54753Sjohnh#include <sys/malloc.h>
54753Sjohnh#include <sys/buf.h>
*54893Sheideman#include <nullfs/null.h>
54753Sjohnh
54753Sjohnh
/*
 * Debugging switch: when nonzero, null_bypass printf's the name of
 * every operation it handles.
 */
int null_bug_bypass = 0;
54753Sjohnh
54753Sjohnh/*
54766Sjohnh * This is the 10-Apr-92 bypass routine.
54766Sjohnh *    This version has been optimized for speed, throwing away some
54766Sjohnh * safety checks.  It should still always work, but it's not as
54766Sjohnh * robust to programmer errors.
54766Sjohnh *    Define SAFETY to include some error checking code.
54766Sjohnh *
54766Sjohnh * In general, we map all vnodes going down and unmap them on the way back.
54766Sjohnh * As an exception to this, vnodes can be marked "unmapped" by setting
54766Sjohnh * the Nth bit in operation's vdesc_flags.
54766Sjohnh *
54766Sjohnh * Also, some BSD vnode operations have the side effect of vrele'ing
54766Sjohnh * their arguments.  With stacking, the reference counts are held
54766Sjohnh * by the upper node, not the lower one, so we must handle these
54766Sjohnh * side-effects here.  This is not of concern in Sun-derived systems
54766Sjohnh * since there are no such side-effects.
54766Sjohnh *
54766Sjohnh * This makes the following assumptions:
54766Sjohnh * - only one returned vpp
54766Sjohnh * - no INOUT vpp's (Sun's vop_open has one of these)
54766Sjohnh * - the vnode operation vector of the first vnode should be used
54766Sjohnh *   to determine what implementation of the op should be invoked
54766Sjohnh * - all mapped vnodes are of our vnode-type (NEEDSWORK:
54766Sjohnh *   problems on rmdir'ing mount points and renaming?)
54766Sjohnh */
54766Sjohnhint
54766Sjohnhnull_bypass(ap)
*54893Sheideman	struct vop_generic_args *ap;
54753Sjohnh{
*54893Sheideman	extern int (**null_vnodeop_p)();  /* not extern, really "forward" */
*54893Sheideman	register struct vnode **this_vp_p;
54753Sjohnh	int error;
54766Sjohnh	struct vnode *old_vps[VDESC_MAX_VPS];
54766Sjohnh	struct vnode **vps_p[VDESC_MAX_VPS];
54766Sjohnh	struct vnode ***vppp;
54766Sjohnh	struct vnodeop_desc *descp = ap->a_desc;
*54893Sheideman	int reles, i;
54753Sjohnh
54766Sjohnh	if (null_bug_bypass)
54766Sjohnh		printf ("null_bypass: %s\n", descp->vdesc_name);
54753Sjohnh
54766Sjohnh#ifdef SAFETY
54753Sjohnh	/*
54766Sjohnh	 * We require at least one vp.
54753Sjohnh	 */
54766Sjohnh	if (descp->vdesc_vp_offsets==NULL ||
54766Sjohnh	    descp->vdesc_vp_offsets[0]==VDESC_NO_OFFSET)
54766Sjohnh		panic ("null_bypass: no vp's in map.\n");
54753Sjohnh#endif
54753Sjohnh
54753Sjohnh	/*
54766Sjohnh	 * Map the vnodes going in.
54766Sjohnh	 * Later, we'll invoke the operation based on
54766Sjohnh	 * the first mapped vnode's operation vector.
54753Sjohnh	 */
*54893Sheideman	reles = descp->vdesc_flags;
*54893Sheideman	for (i=0; i<VDESC_MAX_VPS; reles>>=1, i++) {
54766Sjohnh		if (descp->vdesc_vp_offsets[i]==VDESC_NO_OFFSET)
54766Sjohnh			break;   /* bail out at end of list */
54766Sjohnh		vps_p[i] = this_vp_p =
54766Sjohnh			VOPARG_OFFSETTO(struct vnode**,descp->vdesc_vp_offsets[i],ap);
*54893Sheideman		/*
*54893Sheideman		 * We're not guaranteed that any but the first vnode
*54893Sheideman		 * are of our type.  Check for and don't map any
*54893Sheideman		 * that aren't.
*54893Sheideman		 */
*54893Sheideman		if ((*this_vp_p)->v_op != null_vnodeop_p) {
*54893Sheideman			old_vps[i] = NULL;
*54893Sheideman		} else {
*54893Sheideman			old_vps[i] = *this_vp_p;
*54893Sheideman			*(vps_p[i]) = NULLVPTOLOWERVP(*this_vp_p);
*54893Sheideman			if (reles & 1)
*54893Sheideman				VREF(*this_vp_p);
*54893Sheideman		};
54766Sjohnh
54766Sjohnh	};
54753Sjohnh
54753Sjohnh	/*
54766Sjohnh	 * Call the operation on the lower layer
54766Sjohnh	 * with the modified argument structure.
54753Sjohnh	 */
54766Sjohnh	error = VCALL(*(vps_p[0]), descp->vdesc_offset, ap);
54753Sjohnh
54753Sjohnh	/*
54766Sjohnh	 * Maintain the illusion of call-by-value
54766Sjohnh	 * by restoring vnodes in the argument structure
54766Sjohnh	 * to their original value.
54753Sjohnh	 */
*54893Sheideman	reles = descp->vdesc_flags;
*54893Sheideman	for (i=0; i<VDESC_MAX_VPS; reles>>=1, i++) {
54766Sjohnh		if (descp->vdesc_vp_offsets[i]==VDESC_NO_OFFSET)
54766Sjohnh			break;   /* bail out at end of list */
*54893Sheideman		if (old_vps[i]) {
*54893Sheideman			*(vps_p[i]) = old_vps[i];
*54893Sheideman			if (reles & 1)
*54893Sheideman				vrele(*(vps_p[i]));
*54893Sheideman		};
54766Sjohnh	};
54766Sjohnh
54753Sjohnh	/*
54766Sjohnh	 * Map the possible out-going vpp.
54753Sjohnh	 */
54766Sjohnh	if (descp->vdesc_vpp_offset != VDESC_NO_OFFSET &&
54766Sjohnh	    !(descp->vdesc_flags & VDESC_NOMAP_VPP) &&
54766Sjohnh	    !error) {
54766Sjohnh		vppp=VOPARG_OFFSETTO(struct vnode***,
54766Sjohnh				 descp->vdesc_vpp_offset,ap);
*54893Sheideman		error = null_node_create(old_vps[0]->v_mount, **vppp, *vppp);
54766Sjohnh	};
54753Sjohnh
54766Sjohnh	return (error);
54753Sjohnh}
54753Sjohnh
54753Sjohnh
54753Sjohnh/*
54766Sjohnh *  We handle getattr to change the fsid.
54753Sjohnh */
54766Sjohnhint
54766Sjohnhnull_getattr(ap)
*54893Sheideman	struct vop_getattr_args *ap;
54753Sjohnh{
54753Sjohnh	int error;
54766Sjohnh	if (error=null_bypass(ap))
54766Sjohnh		return error;
54766Sjohnh	/* Requires that arguments be restored. */
54766Sjohnh	ap->a_vap->va_fsid = ap->a_vp->v_mount->mnt_stat.f_fsid.val[0];
54766Sjohnh	return 0;
54766Sjohnh}
54753Sjohnh
54753Sjohnh
int
null_inactive(ap)
	struct vop_inactive_args *ap;
{
#ifdef NULLFS_DIAGNOSTIC
	printf("null_inactive(ap->a_vp = %x->%x)\n",
	    ap->a_vp, NULLVPTOLOWERVP(ap->a_vp));
#endif
	/*
	 * Intentionally a no-op, and intentionally not bypassed.
	 * The lower vnode is only vrele'd in reclaim, so until
	 * then our null_node stays in the cache and can be reused.
	 *
	 * NEEDSWORK: Someday, consider inactive'ing
	 * the lowervp and then trying to reactivate it
	 * like they do in the name lookup cache code.
	 * That's too much work for now.
	 */
	return (0);
}
54753Sjohnh
54754Sjohnhnull_reclaim (ap)
54753Sjohnh	struct vop_reclaim_args *ap;
54753Sjohnh{
54753Sjohnh	struct vnode *targetvp;
54754Sjohnh#ifdef NULLFS_DIAGNOSTIC
*54893Sheideman	printf("null_reclaim(ap->a_vp = %x->%x)\n", ap->a_vp, NULLVPTOLOWERVP(ap->a_vp));
54753Sjohnh#endif
*54893Sheideman	remque(VTONULL(ap->a_vp));	     /* NEEDSWORK: What? */
*54893Sheideman	vrele (NULLVPTOLOWERVP(ap->a_vp));   /* release lower layer */
54753Sjohnh	FREE(ap->a_vp->v_data, M_TEMP);
54753Sjohnh	ap->a_vp->v_data = 0;
54753Sjohnh	return (0);
54753Sjohnh}
54753Sjohnh
54754Sjohnhnull_bmap (ap)
54753Sjohnh	struct vop_bmap_args *ap;
54753Sjohnh{
54754Sjohnh#ifdef NULLFS_DIAGNOSTIC
*54893Sheideman	printf("null_bmap(ap->a_vp = %x->%x)\n", ap->a_vp, NULLVPTOLOWERVP(ap->a_vp));
54753Sjohnh#endif
54753Sjohnh
*54893Sheideman	return VOP_BMAP(NULLVPTOLOWERVP(ap->a_vp), ap->a_bn, ap->a_vpp, ap->a_bnp);
54753Sjohnh}
54753Sjohnh
54754Sjohnhnull_strategy (ap)
54753Sjohnh	struct vop_strategy_args *ap;
54753Sjohnh{
54753Sjohnh	int error;
54766Sjohnh	struct vnode *savedvp;
54753Sjohnh
54754Sjohnh#ifdef NULLFS_DIAGNOSTIC
*54893Sheideman	printf("null_strategy(vp = %x->%x)\n", ap->a_bp->b_vp, NULLVPTOLOWERVP(ap->a_bp->b_vp));
54753Sjohnh#endif
54753Sjohnh
54766Sjohnh	savedvp = ap->a_bp->b_vp;
54753Sjohnh
54753Sjohnh	error = VOP_STRATEGY(ap->a_bp);
54753Sjohnh
54766Sjohnh	ap->a_bp->b_vp = savedvp;
54753Sjohnh
54766Sjohnh	return error;
54753Sjohnh}
54753Sjohnh
54766Sjohnh
54766Sjohnhint
54754Sjohnhnull_print (ap)
54753Sjohnh	struct vop_print_args *ap;
54753Sjohnh{
54766Sjohnh	register struct vnode *vp = ap->a_vp;
*54893Sheideman	printf ("tag VT_NULLFS, vp=%x, lowervp=%x\n", vp, NULLVPTOLOWERVP(vp));
54766Sjohnh	return 0;
54753Sjohnh}
54753Sjohnh
54753Sjohnh
54753Sjohnh/*
54766Sjohnh * Global vfs data structures
54753Sjohnh */
54753Sjohnh/*
54766Sjohnh * NEEDSWORK: strategy,bmap are hand coded currently.  They should
54766Sjohnh * go away with a merged buffer/block cache.
54766Sjohnh *
54753Sjohnh */
54766Sjohnhint (**null_vnodeop_p)();
*54893Sheidemanstruct vnodeopv_entry_desc null_vnodeop_entries[] = {
54766Sjohnh	{ &vop_default_desc, null_bypass },
54753Sjohnh
54766Sjohnh	{ &vop_getattr_desc, null_getattr },
54766Sjohnh	{ &vop_inactive_desc, null_inactive },
54766Sjohnh	{ &vop_reclaim_desc, null_reclaim },
54766Sjohnh	{ &vop_print_desc, null_print },
54753Sjohnh
54766Sjohnh	{ &vop_bmap_desc, null_bmap },
54766Sjohnh	{ &vop_strategy_desc, null_strategy },
54753Sjohnh
54753Sjohnh	{ (struct vnodeop_desc*)NULL, (int(*)())NULL }
54753Sjohnh};
*54893Sheidemanstruct vnodeopv_desc null_vnodeop_opv_desc =
*54893Sheideman	{ &null_vnodeop_p, null_vnodeop_entries };