137488Smckusick /* 263180Sbostic * Copyright (c) 1989, 1993 363180Sbostic * The Regents of the University of California. All rights reserved. 4*65771Sbostic * (c) UNIX System Laboratories, Inc. 5*65771Sbostic * All or some portions of this file are derived from material licensed 6*65771Sbostic * to the University of California by American Telephone and Telegraph 7*65771Sbostic * Co. or Unix System Laboratories, Inc. and are reproduced herein with 8*65771Sbostic * the permission of UNIX System Laboratories, Inc. 937488Smckusick * 1044458Sbostic * %sccs.include.redist.c% 1137488Smckusick * 12*65771Sbostic * @(#)vfs_subr.c 8.9 (Berkeley) 01/21/94 1337488Smckusick */ 1437488Smckusick 1537488Smckusick /* 1637488Smckusick * External virtual filesystem routines 1737488Smckusick */ 1837488Smckusick 1951460Sbostic #include <sys/param.h> 2053829Spendry #include <sys/systm.h> 2151460Sbostic #include <sys/proc.h> 2251460Sbostic #include <sys/mount.h> 2351460Sbostic #include <sys/time.h> 2451460Sbostic #include <sys/vnode.h> 2552415Smckusick #include <sys/stat.h> 2651460Sbostic #include <sys/namei.h> 2751460Sbostic #include <sys/ucred.h> 2851460Sbostic #include <sys/buf.h> 2951460Sbostic #include <sys/errno.h> 3051460Sbostic #include <sys/malloc.h> 3165679Shibler #include <sys/domain.h> 3265679Shibler #include <sys/mbuf.h> 3337488Smckusick 3460930Smckusick #include <vm/vm.h> 3560930Smckusick #include <sys/sysctl.h> 3660930Smckusick 3755050Spendry #include <miscfs/specfs/specdev.h> 3855050Spendry 3952415Smckusick enum vtype iftovt_tab[16] = { 4052415Smckusick VNON, VFIFO, VCHR, VNON, VDIR, VNON, VBLK, VNON, 4152415Smckusick VREG, VNON, VLNK, VNON, VSOCK, VNON, VNON, VBAD, 4252415Smckusick }; 4352415Smckusick int vttoif_tab[9] = { 4452415Smckusick 0, S_IFREG, S_IFDIR, S_IFBLK, S_IFCHR, S_IFLNK, 4552415Smckusick S_IFSOCK, S_IFIFO, S_IFMT, 4652415Smckusick }; 4752415Smckusick 4837488Smckusick /* 4956608Smckusick * Insq/Remq for the vnode usage lists. 5056608Smckusick */ 5165260Smckusick #define bufinsvn(bp, dp) LIST_INSERT_HEAD(dp, bp, b_vnbufs) 5265260Smckusick #define bufremvn(bp) { \ 5365260Smckusick LIST_REMOVE(bp, b_vnbufs); \ 5465260Smckusick (bp)->b_vnbufs.le_next = NOLIST; \ 5565260Smckusick } 5656608Smckusick 5765260Smckusick TAILQ_HEAD(freelst, vnode) vnode_free_list; /* vnode free list */ 5865260Smckusick struct mntlist mountlist; /* mounted filesystem list */ 5965260Smckusick 6056608Smckusick /* 6165260Smckusick * Initialize the vnode management data structures. 6237488Smckusick */ 6365260Smckusick vntblinit() 6437488Smckusick { 6537488Smckusick 6665260Smckusick TAILQ_INIT(&vnode_free_list); 6765260Smckusick TAILQ_INIT(&mountlist); 6837488Smckusick } 6937488Smckusick 7037488Smckusick /* 7137488Smckusick * Lock a filesystem. 7237488Smckusick * Used to prevent access to it while mounting and unmounting. 7337488Smckusick */ 7437488Smckusick vfs_lock(mp) 7537488Smckusick register struct mount *mp; 7637488Smckusick { 7737488Smckusick 7841400Smckusick while(mp->mnt_flag & MNT_MLOCK) { 7941400Smckusick mp->mnt_flag |= MNT_MWAIT; 8039045Smckusick sleep((caddr_t)mp, PVFS); 8139045Smckusick } 8241400Smckusick mp->mnt_flag |= MNT_MLOCK; 8337488Smckusick return (0); 8437488Smckusick } 8537488Smckusick 8637488Smckusick /* 8737488Smckusick * Unlock a locked filesystem. 8837488Smckusick * Panic if filesystem is not locked. 8937488Smckusick */ 9037488Smckusick void 9137488Smckusick vfs_unlock(mp) 9237488Smckusick register struct mount *mp; 9337488Smckusick { 9437488Smckusick 9541400Smckusick if ((mp->mnt_flag & MNT_MLOCK) == 0) 9641300Smckusick panic("vfs_unlock: not locked"); 9741400Smckusick mp->mnt_flag &= ~MNT_MLOCK; 9841400Smckusick if (mp->mnt_flag & MNT_MWAIT) { 9941400Smckusick mp->mnt_flag &= ~MNT_MWAIT; 10037488Smckusick wakeup((caddr_t)mp); 10137488Smckusick } 10237488Smckusick } 10337488Smckusick 10437488Smckusick /* 10541300Smckusick * Mark a mount point as busy. 10641300Smckusick * Used to synchronize access and to delay unmounting. 10741300Smckusick */ 10841300Smckusick vfs_busy(mp) 10941300Smckusick register struct mount *mp; 11041300Smckusick { 11141300Smckusick 11241400Smckusick while(mp->mnt_flag & MNT_MPBUSY) { 11341400Smckusick mp->mnt_flag |= MNT_MPWANT; 11441400Smckusick sleep((caddr_t)&mp->mnt_flag, PVFS); 11541300Smckusick } 11641419Smckusick if (mp->mnt_flag & MNT_UNMOUNT) 11741419Smckusick return (1); 11841400Smckusick mp->mnt_flag |= MNT_MPBUSY; 11941300Smckusick return (0); 12041300Smckusick } 12141300Smckusick 12241300Smckusick /* 12341300Smckusick * Free a busy filesystem. 12441300Smckusick * Panic if filesystem is not busy. 12541300Smckusick */ 12641300Smckusick vfs_unbusy(mp) 12741300Smckusick register struct mount *mp; 12841300Smckusick { 12941300Smckusick 13041400Smckusick if ((mp->mnt_flag & MNT_MPBUSY) == 0) 13141300Smckusick panic("vfs_unbusy: not busy"); 13241400Smckusick mp->mnt_flag &= ~MNT_MPBUSY; 13341400Smckusick if (mp->mnt_flag & MNT_MPWANT) { 13441400Smckusick mp->mnt_flag &= ~MNT_MPWANT; 13541400Smckusick wakeup((caddr_t)&mp->mnt_flag); 13641300Smckusick } 13741300Smckusick } 13841300Smckusick 13941300Smckusick /* 14037488Smckusick * Lookup a mount point by filesystem identifier. 14137488Smckusick */ 14237488Smckusick struct mount * 14337488Smckusick getvfs(fsid) 14437488Smckusick fsid_t *fsid; 14537488Smckusick { 14637488Smckusick register struct mount *mp; 14737488Smckusick 14865260Smckusick for (mp = mountlist.tqh_first; mp != NULL; mp = mp->mnt_list.tqe_next) { 14941400Smckusick if (mp->mnt_stat.f_fsid.val[0] == fsid->val[0] && 15065260Smckusick mp->mnt_stat.f_fsid.val[1] == fsid->val[1]) 15138288Smckusick return (mp); 15265260Smckusick } 15338288Smckusick return ((struct mount *)0); 15437488Smckusick } 15537488Smckusick 15637488Smckusick /* 15753829Spendry * Get a new unique fsid 15853829Spendry */ 15953829Spendry void 16053829Spendry getnewfsid(mp, mtype) 16153829Spendry struct mount *mp; 16253829Spendry int mtype; 16353829Spendry { 16453829Spendry static u_short xxxfs_mntid; 16553829Spendry 16653829Spendry fsid_t tfsid; 16753829Spendry 16865507Spendry mp->mnt_stat.f_fsid.val[0] = makedev(nblkdev + mtype, 0); 16953829Spendry mp->mnt_stat.f_fsid.val[1] = mtype; 17053829Spendry if (xxxfs_mntid == 0) 17153829Spendry ++xxxfs_mntid; 17265507Spendry tfsid.val[0] = makedev(nblkdev + mtype, xxxfs_mntid); 17353829Spendry tfsid.val[1] = mtype; 17465260Smckusick if (mountlist.tqh_first != NULL) { 17553936Spendry while (getvfs(&tfsid)) { 17653936Spendry tfsid.val[0]++; 17753936Spendry xxxfs_mntid++; 17853936Spendry } 17953829Spendry } 18053829Spendry mp->mnt_stat.f_fsid.val[0] = tfsid.val[0]; 18153829Spendry } 18253829Spendry 18353829Spendry /* 18437488Smckusick * Set vnode attributes to VNOVAL 18537488Smckusick */ 18637488Smckusick void vattr_null(vap) 18737488Smckusick register struct vattr *vap; 18837488Smckusick { 18937488Smckusick 19037488Smckusick vap->va_type = VNON; 19152005Smckusick vap->va_size = vap->va_bytes = VNOVAL; 19237488Smckusick vap->va_mode = vap->va_nlink = vap->va_uid = vap->va_gid = 19352005Smckusick vap->va_fsid = vap->va_fileid = 19452005Smckusick vap->va_blocksize = vap->va_rdev = 19554347Smckusick vap->va_atime.ts_sec = vap->va_atime.ts_nsec = 19654347Smckusick vap->va_mtime.ts_sec = vap->va_mtime.ts_nsec = 19754347Smckusick vap->va_ctime.ts_sec = vap->va_ctime.ts_nsec = 19838258Smckusick vap->va_flags = vap->va_gen = VNOVAL; 19958548Sbostic vap->va_vaflags = 0; 20037488Smckusick } 20138265Smckusick 20238265Smckusick /* 20339397Smckusick * Routines having to do with the management of the vnode table. 20439397Smckusick */ 20553547Sheideman extern int (**dead_vnodeop_p)(); 20639635Smckusick extern void vclean(); 20740883Smckusick long numvnodes; 20853493Sheideman extern struct vattr va_null; 20939397Smckusick 21039397Smckusick /* 21139397Smckusick * Return the next vnode from the free list. 21239397Smckusick */ 21339397Smckusick getnewvnode(tag, mp, vops, vpp) 21439397Smckusick enum vtagtype tag; 21539397Smckusick struct mount *mp; 21653495Sheideman int (**vops)(); 21739397Smckusick struct vnode **vpp; 21839397Smckusick { 21965511Smckusick register struct vnode *vp; 22057042Smargo int s; 22139397Smckusick 22265260Smckusick if ((vnode_free_list.tqh_first == NULL && 22365260Smckusick numvnodes < 2 * desiredvnodes) || 22454347Smckusick numvnodes < desiredvnodes) { 22545118Smckusick vp = (struct vnode *)malloc((u_long)sizeof *vp, 22645118Smckusick M_VNODE, M_WAITOK); 22740883Smckusick bzero((char *)vp, sizeof *vp); 22840883Smckusick numvnodes++; 22940883Smckusick } else { 23065260Smckusick if ((vp = vnode_free_list.tqh_first) == NULL) { 23140883Smckusick tablefull("vnode"); 23240883Smckusick *vpp = 0; 23340883Smckusick return (ENFILE); 23440883Smckusick } 23540883Smckusick if (vp->v_usecount) 23640883Smckusick panic("free vnode isn't"); 23765260Smckusick TAILQ_REMOVE(&vnode_free_list, vp, v_freelist); 23865505Smckusick /* see comment on why 0xdeadb is set at end of vgone (below) */ 23965505Smckusick vp->v_freelist.tqe_prev = (struct vnode **)0xdeadb; 24052190Smckusick vp->v_lease = NULL; 24140883Smckusick if (vp->v_type != VBAD) 24240883Smckusick vgone(vp); 24357042Smargo #ifdef DIAGNOSTIC 24452006Smckusick if (vp->v_data) 24552006Smckusick panic("cleaned vnode isn't"); 24657042Smargo s = splbio(); 24757042Smargo if (vp->v_numoutput) 24857042Smargo panic("Clean vnode has pending I/O's"); 24957042Smargo splx(s); 25057042Smargo #endif 25140883Smckusick vp->v_flag = 0; 25240883Smckusick vp->v_lastr = 0; 25365745Shibler vp->v_ralen = 0; 25465745Shibler vp->v_maxra = 0; 25557042Smargo vp->v_lastw = 0; 25657042Smargo vp->v_lasta = 0; 25757042Smargo vp->v_cstart = 0; 25857042Smargo vp->v_clen = 0; 25940883Smckusick vp->v_socket = 0; 26039397Smckusick } 26139512Smckusick vp->v_type = VNON; 26239397Smckusick cache_purge(vp); 26339397Smckusick vp->v_tag = tag; 26439433Smckusick vp->v_op = vops; 26539397Smckusick insmntque(vp, mp); 26639397Smckusick *vpp = vp; 26765505Smckusick vp->v_usecount = 1; 26865260Smckusick vp->v_data = 0; 26939397Smckusick return (0); 27039397Smckusick } 27165679Shibler 27239397Smckusick /* 27339397Smckusick * Move a vnode from one mount queue to another. 27439397Smckusick */ 27539397Smckusick insmntque(vp, mp) 27639397Smckusick register struct vnode *vp; 27739397Smckusick register struct mount *mp; 27839397Smckusick { 27939397Smckusick 28039397Smckusick /* 28139397Smckusick * Delete from old mount point vnode list, if on one. 28239397Smckusick */ 28365679Shibler if (vp->v_mount != NULL) 28465260Smckusick LIST_REMOVE(vp, v_mntvnodes); 28539397Smckusick /* 28639397Smckusick * Insert into list of vnodes for the new mount point, if available. 28739397Smckusick */ 28865260Smckusick if ((vp->v_mount = mp) == NULL) 28939397Smckusick return; 29065260Smckusick LIST_INSERT_HEAD(&mp->mnt_vnodelist, vp, v_mntvnodes); 29139397Smckusick } 29239397Smckusick 29339397Smckusick /* 29449232Smckusick * Update outstanding I/O count and do wakeup if requested. 29549232Smckusick */ 29649232Smckusick vwakeup(bp) 29749232Smckusick register struct buf *bp; 29849232Smckusick { 29949232Smckusick register struct vnode *vp; 30049232Smckusick 30157810Smckusick bp->b_flags &= ~B_WRITEINPROG; 30249232Smckusick if (vp = bp->b_vp) { 30349232Smckusick vp->v_numoutput--; 30457042Smargo if (vp->v_numoutput < 0) 30557042Smargo panic("vwakeup: neg numoutput"); 30649232Smckusick if ((vp->v_flag & VBWAIT) && vp->v_numoutput <= 0) { 30749232Smckusick if (vp->v_numoutput < 0) 30849232Smckusick panic("vwakeup: neg numoutput"); 30949232Smckusick vp->v_flag &= ~VBWAIT; 31049232Smckusick wakeup((caddr_t)&vp->v_numoutput); 31149232Smckusick } 31249232Smckusick } 31349232Smckusick } 31449232Smckusick 31549232Smckusick /* 31649232Smckusick * Flush out and invalidate all buffers associated with a vnode. 31749232Smckusick * Called with the underlying object locked. 31849232Smckusick */ 31954442Smckusick int 32057792Smckusick vinvalbuf(vp, flags, cred, p, slpflag, slptimeo) 32149232Smckusick register struct vnode *vp; 32256459Smargo int flags; 32354442Smckusick struct ucred *cred; 32454442Smckusick struct proc *p; 32557792Smckusick int slpflag, slptimeo; 32649232Smckusick { 32749232Smckusick register struct buf *bp; 32849232Smckusick struct buf *nbp, *blist; 32954442Smckusick int s, error; 33049232Smckusick 33156459Smargo if (flags & V_SAVE) { 33254442Smckusick if (error = VOP_FSYNC(vp, cred, MNT_WAIT, p)) 33354442Smckusick return (error); 33465260Smckusick if (vp->v_dirtyblkhd.lh_first != NULL) 33554442Smckusick panic("vinvalbuf: dirty bufs"); 33654442Smckusick } 33749232Smckusick for (;;) { 33865260Smckusick if ((blist = vp->v_cleanblkhd.lh_first) && flags & V_SAVEMETA) 33956459Smargo while (blist && blist->b_lblkno < 0) 34065260Smckusick blist = blist->b_vnbufs.le_next; 34165260Smckusick if (!blist && (blist = vp->v_dirtyblkhd.lh_first) && 34256608Smckusick (flags & V_SAVEMETA)) 34356459Smargo while (blist && blist->b_lblkno < 0) 34465260Smckusick blist = blist->b_vnbufs.le_next; 34556459Smargo if (!blist) 34649232Smckusick break; 34756459Smargo 34849232Smckusick for (bp = blist; bp; bp = nbp) { 34965260Smckusick nbp = bp->b_vnbufs.le_next; 35056459Smargo if (flags & V_SAVEMETA && bp->b_lblkno < 0) 35156459Smargo continue; 35249232Smckusick s = splbio(); 35349232Smckusick if (bp->b_flags & B_BUSY) { 35449232Smckusick bp->b_flags |= B_WANTED; 35557792Smckusick error = tsleep((caddr_t)bp, 35657792Smckusick slpflag | (PRIBIO + 1), "vinvalbuf", 35757792Smckusick slptimeo); 35849232Smckusick splx(s); 35957792Smckusick if (error) 36057792Smckusick return (error); 36149232Smckusick break; 36249232Smckusick } 36349232Smckusick bremfree(bp); 36449232Smckusick bp->b_flags |= B_BUSY; 36549232Smckusick splx(s); 36657792Smckusick /* 36757792Smckusick * XXX Since there are no node locks for NFS, I believe 36857792Smckusick * there is a slight chance that a delayed write will 36957792Smckusick * occur while sleeping just above, so check for it. 37057792Smckusick */ 37157792Smckusick if ((bp->b_flags & B_DELWRI) && (flags & V_SAVE)) { 37257792Smckusick (void) VOP_BWRITE(bp); 37357792Smckusick break; 37457792Smckusick } 37556459Smargo bp->b_flags |= B_INVAL; 37649232Smckusick brelse(bp); 37749232Smckusick } 37849232Smckusick } 37956608Smckusick if (!(flags & V_SAVEMETA) && 38065260Smckusick (vp->v_dirtyblkhd.lh_first || vp->v_cleanblkhd.lh_first)) 38149232Smckusick panic("vinvalbuf: flush failed"); 38254442Smckusick return (0); 38349232Smckusick } 38449232Smckusick 38549232Smckusick /* 38649232Smckusick * Associate a buffer with a vnode. 38749232Smckusick */ 38849232Smckusick bgetvp(vp, bp) 38949232Smckusick register struct vnode *vp; 39049232Smckusick register struct buf *bp; 39149232Smckusick { 39249232Smckusick 39349232Smckusick if (bp->b_vp) 39449232Smckusick panic("bgetvp: not free"); 39549232Smckusick VHOLD(vp); 39649232Smckusick bp->b_vp = vp; 39749232Smckusick if (vp->v_type == VBLK || vp->v_type == VCHR) 39849232Smckusick bp->b_dev = vp->v_rdev; 39949232Smckusick else 40049232Smckusick bp->b_dev = NODEV; 40149232Smckusick /* 40249232Smckusick * Insert onto list for new vnode. 40349232Smckusick */ 40456608Smckusick bufinsvn(bp, &vp->v_cleanblkhd); 40549232Smckusick } 40649232Smckusick 40749232Smckusick /* 40849232Smckusick * Disassociate a buffer from a vnode. 40949232Smckusick */ 41049232Smckusick brelvp(bp) 41149232Smckusick register struct buf *bp; 41249232Smckusick { 41349232Smckusick struct vnode *vp; 41449232Smckusick 41549232Smckusick if (bp->b_vp == (struct vnode *) 0) 41649232Smckusick panic("brelvp: NULL"); 41749232Smckusick /* 41849232Smckusick * Delete from old vnode list, if on one. 41949232Smckusick */ 42065260Smckusick if (bp->b_vnbufs.le_next != NOLIST) 42156608Smckusick bufremvn(bp); 42249232Smckusick vp = bp->b_vp; 42349232Smckusick bp->b_vp = (struct vnode *) 0; 42449232Smckusick HOLDRELE(vp); 42549232Smckusick } 42649232Smckusick 42749232Smckusick /* 42849232Smckusick * Reassign a buffer from one vnode to another. 42949232Smckusick * Used to assign file specific control information 43049232Smckusick * (indirect blocks) to the vnode to which they belong. 43149232Smckusick */ 43249232Smckusick reassignbuf(bp, newvp) 43349232Smckusick register struct buf *bp; 43449232Smckusick register struct vnode *newvp; 43549232Smckusick { 43665260Smckusick register struct buflists *listheadp; 43749232Smckusick 43852655Smckusick if (newvp == NULL) { 43952655Smckusick printf("reassignbuf: NULL"); 44052655Smckusick return; 44152655Smckusick } 44249232Smckusick /* 44349232Smckusick * Delete from old vnode list, if on one. 44449232Smckusick */ 44565260Smckusick if (bp->b_vnbufs.le_next != NOLIST) 44656608Smckusick bufremvn(bp); 44749232Smckusick /* 44849232Smckusick * If dirty, put on list of dirty buffers; 44949232Smckusick * otherwise insert onto list of clean buffers. 45049232Smckusick */ 45149232Smckusick if (bp->b_flags & B_DELWRI) 45249232Smckusick listheadp = &newvp->v_dirtyblkhd; 45349232Smckusick else 45449232Smckusick listheadp = &newvp->v_cleanblkhd; 45556608Smckusick bufinsvn(bp, listheadp); 45649232Smckusick } 45749232Smckusick 45849232Smckusick /* 45939433Smckusick * Create a vnode for a block device. 46039433Smckusick * Used for root filesystem, argdev, and swap areas. 46139433Smckusick * Also used for memory file system special devices. 46239397Smckusick */ 46339433Smckusick bdevvp(dev, vpp) 46439433Smckusick dev_t dev; 46539433Smckusick struct vnode **vpp; 46639433Smckusick { 46739433Smckusick register struct vnode *vp; 46839433Smckusick struct vnode *nvp; 46939433Smckusick int error; 47039433Smckusick 47146989Smckusick if (dev == NODEV) 47246989Smckusick return (0); 47353547Sheideman error = getnewvnode(VT_NON, (struct mount *)0, spec_vnodeop_p, &nvp); 47439433Smckusick if (error) { 47539433Smckusick *vpp = 0; 47639433Smckusick return (error); 47739433Smckusick } 47839433Smckusick vp = nvp; 47939433Smckusick vp->v_type = VBLK; 48039615Smckusick if (nvp = checkalias(vp, dev, (struct mount *)0)) { 48139433Smckusick vput(vp); 48239433Smckusick vp = nvp; 48339433Smckusick } 48439433Smckusick *vpp = vp; 48539433Smckusick return (0); 48639433Smckusick } 48739433Smckusick 48839433Smckusick /* 48939433Smckusick * Check to see if the new vnode represents a special device 49039433Smckusick * for which we already have a vnode (either because of 49139433Smckusick * bdevvp() or because of a different vnode representing 49239433Smckusick * the same block device). If such an alias exists, deallocate 49339509Smckusick * the existing contents and return the aliased vnode. The 49439433Smckusick * caller is responsible for filling it with its new contents. 49539433Smckusick */ 49639433Smckusick struct vnode * 49739615Smckusick checkalias(nvp, nvp_rdev, mp) 49839433Smckusick register struct vnode *nvp; 49939615Smckusick dev_t nvp_rdev; 50039433Smckusick struct mount *mp; 50139433Smckusick { 50239433Smckusick register struct vnode *vp; 50339615Smckusick struct vnode **vpp; 50439433Smckusick 50539433Smckusick if (nvp->v_type != VBLK && nvp->v_type != VCHR) 50641400Smckusick return (NULLVP); 50739615Smckusick 50839615Smckusick vpp = &speclisth[SPECHASH(nvp_rdev)]; 50939433Smckusick loop: 51039615Smckusick for (vp = *vpp; vp; vp = vp->v_specnext) { 51139615Smckusick if (nvp_rdev != vp->v_rdev || nvp->v_type != vp->v_type) 51239433Smckusick continue; 51339615Smckusick /* 51439615Smckusick * Alias, but not in use, so flush it out. 51539615Smckusick */ 51639809Smckusick if (vp->v_usecount == 0) { 51739615Smckusick vgone(vp); 51839615Smckusick goto loop; 51939615Smckusick } 52065260Smckusick if (vget(vp, 1)) 52139633Smckusick goto loop; 52239433Smckusick break; 52339433Smckusick } 52439615Smckusick if (vp == NULL || vp->v_tag != VT_NON) { 52539615Smckusick MALLOC(nvp->v_specinfo, struct specinfo *, 52639615Smckusick sizeof(struct specinfo), M_VNODE, M_WAITOK); 52739615Smckusick nvp->v_rdev = nvp_rdev; 52839809Smckusick nvp->v_hashchain = vpp; 52939615Smckusick nvp->v_specnext = *vpp; 53042152Smckusick nvp->v_specflags = 0; 53139615Smckusick *vpp = nvp; 53240640Smckusick if (vp != NULL) { 53340640Smckusick nvp->v_flag |= VALIASED; 53440640Smckusick vp->v_flag |= VALIASED; 53540640Smckusick vput(vp); 53640640Smckusick } 53741400Smckusick return (NULLVP); 53839433Smckusick } 53939484Smckusick VOP_UNLOCK(vp); 54039484Smckusick vclean(vp, 0); 54139433Smckusick vp->v_op = nvp->v_op; 54239433Smckusick vp->v_tag = nvp->v_tag; 54339433Smckusick nvp->v_type = VNON; 54439433Smckusick insmntque(vp, mp); 54539433Smckusick return (vp); 54639433Smckusick } 54739433Smckusick 54839433Smckusick /* 54939433Smckusick * Grab a particular vnode from the free list, increment its 55039433Smckusick * reference count and lock it. The vnode lock bit is set the 55139433Smckusick * vnode is being eliminated in vgone. The process is awakened 55239433Smckusick * when the transition is completed, and an error returned to 55339433Smckusick * indicate that the vnode is no longer usable (possibly having 55439433Smckusick * been changed to a new file system type). 55539433Smckusick */ 55665260Smckusick vget(vp, lockflag) 55739397Smckusick register struct vnode *vp; 55865260Smckusick int lockflag; 55939397Smckusick { 56039397Smckusick 56139433Smckusick if (vp->v_flag & VXLOCK) { 56239433Smckusick vp->v_flag |= VXWANT; 56339433Smckusick sleep((caddr_t)vp, PINOD); 56439433Smckusick return (1); 56539433Smckusick } 56665679Shibler if (vp->v_usecount == 0) 56765260Smckusick TAILQ_REMOVE(&vnode_free_list, vp, v_freelist); 56859450Smckusick vp->v_usecount++; 56965260Smckusick if (lockflag) 57065260Smckusick VOP_LOCK(vp); 57139433Smckusick return (0); 57239397Smckusick } 57339397Smckusick 57439397Smckusick /* 57539397Smckusick * Vnode reference, just increment the count 57639397Smckusick */ 57739397Smckusick void vref(vp) 57839397Smckusick struct vnode *vp; 57939397Smckusick { 58039397Smckusick 58159450Smckusick if (vp->v_usecount <= 0) 58259450Smckusick panic("vref used where vget required"); 58339809Smckusick vp->v_usecount++; 58439397Smckusick } 58539397Smckusick 58639397Smckusick /* 58739397Smckusick * vput(), just unlock and vrele() 58839397Smckusick */ 58939397Smckusick void vput(vp) 59039397Smckusick register struct vnode *vp; 59139397Smckusick { 59252416Storek 59339397Smckusick VOP_UNLOCK(vp); 59439397Smckusick vrele(vp); 59539397Smckusick } 59639397Smckusick 59739397Smckusick /* 59839397Smckusick * Vnode release. 59939397Smckusick * If count drops to zero, call inactive routine and return to freelist. 60039397Smckusick */ 60139397Smckusick void vrele(vp) 60239397Smckusick register struct vnode *vp; 60339397Smckusick { 60439397Smckusick 60550109Smckusick #ifdef DIAGNOSTIC 60639397Smckusick if (vp == NULL) 60739433Smckusick panic("vrele: null vp"); 60850109Smckusick #endif 60939809Smckusick vp->v_usecount--; 61039809Smckusick if (vp->v_usecount > 0) 61139397Smckusick return; 61250109Smckusick #ifdef DIAGNOSTIC 61350109Smckusick if (vp->v_usecount != 0 || vp->v_writecount != 0) { 61450109Smckusick vprint("vrele: bad ref count", vp); 61550109Smckusick panic("vrele: ref cnt"); 61650109Smckusick } 61750109Smckusick #endif 61855468Smckusick /* 61955468Smckusick * insert at tail of LRU list 62055468Smckusick */ 62165260Smckusick TAILQ_INSERT_TAIL(&vnode_free_list, vp, v_freelist); 62254442Smckusick VOP_INACTIVE(vp); 62339397Smckusick } 62439433Smckusick 62539433Smckusick /* 62639809Smckusick * Page or buffer structure gets a reference. 62739809Smckusick */ 62853312Smckusick void vhold(vp) 62939809Smckusick register struct vnode *vp; 63039809Smckusick { 63139809Smckusick 63239809Smckusick vp->v_holdcnt++; 63339809Smckusick } 63439809Smckusick 63539809Smckusick /* 63639809Smckusick * Page or buffer structure frees a reference. 63739809Smckusick */ 63853312Smckusick void holdrele(vp) 63939809Smckusick register struct vnode *vp; 64039809Smckusick { 64139809Smckusick 64239809Smckusick if (vp->v_holdcnt <= 0) 64339809Smckusick panic("holdrele: holdcnt"); 64439809Smckusick vp->v_holdcnt--; 64539809Smckusick } 64639809Smckusick 64739809Smckusick /* 64839509Smckusick * Remove any vnodes in the vnode table belonging to mount point mp. 64939509Smckusick * 65039509Smckusick * If MNT_NOFORCE is specified, there should not be any active ones, 65139509Smckusick * return error if any are found (nb: this is a user error, not a 65239509Smckusick * system error). If MNT_FORCE is specified, detach any active vnodes 65339509Smckusick * that are found. 65439509Smckusick */ 65565679Shibler #ifdef DIAGNOSTIC 65660930Smckusick int busyprt = 0; /* print out busy vnodes */ 65760930Smckusick struct ctldebug debug1 = { "busyprt", &busyprt }; 65865679Shibler #endif 65939509Smckusick 66039509Smckusick vflush(mp, skipvp, flags) 66139509Smckusick struct mount *mp; 66239509Smckusick struct vnode *skipvp; 66339509Smckusick int flags; 66439509Smckusick { 66539509Smckusick register struct vnode *vp, *nvp; 66639509Smckusick int busy = 0; 66739509Smckusick 66841400Smckusick if ((mp->mnt_flag & MNT_MPBUSY) == 0) 66941300Smckusick panic("vflush: not busy"); 67041421Smckusick loop: 67165260Smckusick for (vp = mp->mnt_vnodelist.lh_first; vp; vp = nvp) { 67241421Smckusick if (vp->v_mount != mp) 67341421Smckusick goto loop; 67465260Smckusick nvp = vp->v_mntvnodes.le_next; 67539509Smckusick /* 67639509Smckusick * Skip over a selected vnode. 67739509Smckusick */ 67839509Smckusick if (vp == skipvp) 67939509Smckusick continue; 68039509Smckusick /* 68141300Smckusick * Skip over a vnodes marked VSYSTEM. 68241300Smckusick */ 68341300Smckusick if ((flags & SKIPSYSTEM) && (vp->v_flag & VSYSTEM)) 68441300Smckusick continue; 68541300Smckusick /* 68657040Smckusick * If WRITECLOSE is set, only flush out regular file 68757040Smckusick * vnodes open for writing. 68857040Smckusick */ 68957040Smckusick if ((flags & WRITECLOSE) && 69057040Smckusick (vp->v_writecount == 0 || vp->v_type != VREG)) 69157040Smckusick continue; 69257040Smckusick /* 69339809Smckusick * With v_usecount == 0, all we need to do is clear 69439509Smckusick * out the vnode data structures and we are done. 69539509Smckusick */ 69639809Smckusick if (vp->v_usecount == 0) { 69739509Smckusick vgone(vp); 69839509Smckusick continue; 69939509Smckusick } 70039509Smckusick /* 70157040Smckusick * If FORCECLOSE is set, forcibly close the vnode. 70239509Smckusick * For block or character devices, revert to an 70339509Smckusick * anonymous device. For all other files, just kill them. 70439509Smckusick */ 70541300Smckusick if (flags & FORCECLOSE) { 70639509Smckusick if (vp->v_type != VBLK && vp->v_type != VCHR) { 70739509Smckusick vgone(vp); 70839509Smckusick } else { 70939509Smckusick vclean(vp, 0); 71053547Sheideman vp->v_op = spec_vnodeop_p; 71139509Smckusick insmntque(vp, (struct mount *)0); 71239509Smckusick } 71339509Smckusick continue; 71439509Smckusick } 71565679Shibler #ifdef DIAGNOSTIC 71639509Smckusick if (busyprt) 71739667Smckusick vprint("vflush: busy vnode", vp); 71865679Shibler #endif 71939509Smckusick busy++; 72039509Smckusick } 72139509Smckusick if (busy) 72239509Smckusick return (EBUSY); 72339509Smckusick return (0); 72439509Smckusick } 72539509Smckusick 72639509Smckusick /* 72739433Smckusick * Disassociate the underlying file system from a vnode. 72839433Smckusick */ 72954347Smckusick void 73054347Smckusick vclean(vp, flags) 73139433Smckusick register struct vnode *vp; 73245118Smckusick int flags; 73339433Smckusick { 73439484Smckusick int active; 73539433Smckusick 73639484Smckusick /* 73739484Smckusick * Check to see if the vnode is in use. 73839667Smckusick * If so we have to reference it before we clean it out 73939667Smckusick * so that its count cannot fall to zero and generate a 74039667Smckusick * race against ourselves to recycle it. 74139484Smckusick */ 74239809Smckusick if (active = vp->v_usecount) 74339484Smckusick VREF(vp); 74439484Smckusick /* 74556805Smckusick * Even if the count is zero, the VOP_INACTIVE routine may still 74656805Smckusick * have the object locked while it cleans it out. The VOP_LOCK 74756805Smckusick * ensures that the VOP_INACTIVE routine is done with its work. 74856805Smckusick * For active vnodes, it ensures that no other activity can 74956805Smckusick * occur while the underlying object is being cleaned out. 75056805Smckusick */ 75156805Smckusick VOP_LOCK(vp); 75256805Smckusick /* 75339484Smckusick * Prevent the vnode from being recycled or 75439484Smckusick * brought into use while we clean it out. 75539484Smckusick */ 75639667Smckusick if (vp->v_flag & VXLOCK) 75739667Smckusick panic("vclean: deadlock"); 75839433Smckusick vp->v_flag |= VXLOCK; 75939433Smckusick /* 76056805Smckusick * Clean out any buffers associated with the vnode. 76139667Smckusick */ 76241300Smckusick if (flags & DOCLOSE) 76357792Smckusick vinvalbuf(vp, V_SAVE, NOCRED, NULL, 0, 0); 76439667Smckusick /* 76556805Smckusick * Any other processes trying to obtain this lock must first 76656805Smckusick * wait for VXLOCK to clear, then call the new lock operation. 76739433Smckusick */ 76856805Smckusick VOP_UNLOCK(vp); 76939433Smckusick /* 77056805Smckusick * If purging an active vnode, it must be closed and 77156805Smckusick * deactivated before being reclaimed. 77239433Smckusick */ 77339484Smckusick if (active) { 77456805Smckusick if (flags & DOCLOSE) 77556805Smckusick VOP_CLOSE(vp, IO_NDELAY, NOCRED, NULL); 77656805Smckusick VOP_INACTIVE(vp); 77739433Smckusick } 77839433Smckusick /* 77939433Smckusick * Reclaim the vnode. 78039433Smckusick */ 78156805Smckusick if (VOP_RECLAIM(vp)) 78239433Smckusick panic("vclean: cannot reclaim"); 78339484Smckusick if (active) 78439484Smckusick vrele(vp); 78553580Sheideman 78639433Smckusick /* 78756805Smckusick * Done with purge, notify sleepers of the grim news. 78839433Smckusick */ 78956805Smckusick vp->v_op = dead_vnodeop_p; 79056805Smckusick vp->v_tag = VT_NON; 79139433Smckusick vp->v_flag &= ~VXLOCK; 79239433Smckusick if (vp->v_flag & VXWANT) { 79339433Smckusick vp->v_flag &= ~VXWANT; 79439433Smckusick wakeup((caddr_t)vp); 79539433Smckusick } 79639433Smckusick } 79739433Smckusick 79839433Smckusick /* 79939633Smckusick * Eliminate all activity associated with the requested vnode 80039633Smckusick * and with all vnodes aliased to the requested vnode. 80139633Smckusick */ 80239633Smckusick void vgoneall(vp) 80339633Smckusick register struct vnode *vp; 80439633Smckusick { 80539809Smckusick register struct vnode *vq; 80639633Smckusick 80740665Smckusick if (vp->v_flag & VALIASED) { 80840665Smckusick /* 80940665Smckusick * If a vgone (or vclean) is already in progress, 81040665Smckusick * wait until it is done and return. 81140665Smckusick */ 81240665Smckusick if (vp->v_flag & VXLOCK) { 81340665Smckusick vp->v_flag |= VXWANT; 81440665Smckusick sleep((caddr_t)vp, PINOD); 81540665Smckusick return; 81639633Smckusick } 81740665Smckusick /* 81840665Smckusick * Ensure that vp will not be vgone'd while we 81940665Smckusick * are eliminating its aliases. 82040665Smckusick */ 82140665Smckusick vp->v_flag |= VXLOCK; 82240665Smckusick while (vp->v_flag & VALIASED) { 82340665Smckusick for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 82440665Smckusick if (vq->v_rdev != vp->v_rdev || 82540665Smckusick vq->v_type != vp->v_type || vp == vq) 82640665Smckusick continue; 82740665Smckusick vgone(vq); 82840665Smckusick break; 82940665Smckusick } 83040665Smckusick } 83140665Smckusick /* 83240665Smckusick * Remove the lock so that vgone below will 83340665Smckusick * really eliminate the vnode after which time 83440665Smckusick * vgone will awaken any sleepers. 83540665Smckusick */ 83640665Smckusick vp->v_flag &= ~VXLOCK; 83739633Smckusick } 83839633Smckusick vgone(vp); 83939633Smckusick } 84039633Smckusick 84139633Smckusick /* 84239433Smckusick * Eliminate all activity associated with a vnode 84339433Smckusick * in preparation for reuse. 84439433Smckusick */ 84539433Smckusick void vgone(vp) 84639433Smckusick register struct vnode *vp; 84739433Smckusick { 84839809Smckusick register struct vnode *vq; 84939615Smckusick struct vnode *vx; 85039433Smckusick 85139433Smckusick /* 85240548Smckusick * If a vgone (or vclean) is already in progress, 85340548Smckusick * wait until it is done and return. 85440548Smckusick */ 85540548Smckusick if (vp->v_flag & VXLOCK) { 85640548Smckusick vp->v_flag |= VXWANT; 85740548Smckusick sleep((caddr_t)vp, PINOD); 85840548Smckusick return; 85940548Smckusick } 86040548Smckusick /* 86139433Smckusick * Clean out the filesystem specific data. 86239433Smckusick */ 86341300Smckusick vclean(vp, DOCLOSE); 86439433Smckusick /* 86539433Smckusick * Delete from old mount point vnode list, if on one. 86639433Smckusick */ 86765260Smckusick if (vp->v_mount != NULL) { 86865260Smckusick LIST_REMOVE(vp, v_mntvnodes); 86952311Smckusick vp->v_mount = NULL; 87039433Smckusick } 87139433Smckusick /* 87239433Smckusick * If special device, remove it from special device alias list. 87339433Smckusick */ 87439433Smckusick if (vp->v_type == VBLK || vp->v_type == VCHR) { 87539809Smckusick if (*vp->v_hashchain == vp) { 87639809Smckusick *vp->v_hashchain = vp->v_specnext; 87739433Smckusick } else { 87839809Smckusick for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 87939615Smckusick if (vq->v_specnext != vp) 88039433Smckusick continue; 88139615Smckusick vq->v_specnext = vp->v_specnext; 88239433Smckusick break; 88339433Smckusick } 88439615Smckusick if (vq == NULL) 88539433Smckusick panic("missing bdev"); 88639433Smckusick } 88739615Smckusick if (vp->v_flag & VALIASED) { 88852416Storek vx = NULL; 88939809Smckusick for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 89040108Smckusick if (vq->v_rdev != vp->v_rdev || 89140108Smckusick vq->v_type != vp->v_type) 89239615Smckusick continue; 89352416Storek if (vx) 89452416Storek break; 89539615Smckusick vx = vq; 89639615Smckusick } 89752416Storek if (vx == NULL) 89839615Smckusick panic("missing alias"); 89952416Storek if (vq == NULL) 90039615Smckusick vx->v_flag &= ~VALIASED; 90139615Smckusick vp->v_flag &= ~VALIASED; 90239615Smckusick } 90339615Smckusick FREE(vp->v_specinfo, M_VNODE); 90439615Smckusick vp->v_specinfo = NULL; 90539433Smckusick } 90639433Smckusick /* 90756932Smckusick * If it is on the freelist and not already at the head, 90865505Smckusick * move it to the head of the list. The test of the back 90965505Smckusick * pointer and the reference count of zero is because 91065505Smckusick * it will be removed from the free list by getnewvnode, 91165505Smckusick * but will not have its reference count incremented until 91265505Smckusick * after calling vgone. If the reference count were 91365505Smckusick * incremented first, vgone would (incorrectly) try to 91465505Smckusick * close the previous instance of the underlying object. 91565505Smckusick * So, the back pointer is explicitly set to `0xdeadb' in 91665505Smckusick * getnewvnode after removing it from the freelist to ensure 91765505Smckusick * that we do not try to move it here. 91839433Smckusick */ 91965505Smckusick if (vp->v_usecount == 0 && 92065505Smckusick vp->v_freelist.tqe_prev != (struct vnode **)0xdeadb && 92165505Smckusick vnode_free_list.tqh_first != vp) { 92265260Smckusick TAILQ_REMOVE(&vnode_free_list, vp, v_freelist); 92365260Smckusick TAILQ_INSERT_HEAD(&vnode_free_list, vp, v_freelist); 92439433Smckusick } 92539484Smckusick vp->v_type = VBAD; 92639433Smckusick } 92739633Smckusick 92839633Smckusick /* 92939821Smckusick * Lookup a vnode by device number. 93039821Smckusick */ 93139821Smckusick vfinddev(dev, type, vpp) 93239821Smckusick dev_t dev; 93339821Smckusick enum vtype type; 93439821Smckusick struct vnode **vpp; 93539821Smckusick { 93639821Smckusick register struct vnode *vp; 93739821Smckusick 93839821Smckusick for (vp = speclisth[SPECHASH(dev)]; vp; vp = vp->v_specnext) { 93939821Smckusick if (dev != vp->v_rdev || type != vp->v_type) 94039821Smckusick continue; 94139821Smckusick *vpp = vp; 94259484Smckusick return (1); 94339821Smckusick } 94459484Smckusick return (0); 94539821Smckusick } 94639821Smckusick 94739821Smckusick /* 94839633Smckusick * Calculate the total number of references to a special device. 94939633Smckusick */ 95039633Smckusick vcount(vp) 95139633Smckusick register struct vnode *vp; 95239633Smckusick { 95339809Smckusick register struct vnode *vq; 95439633Smckusick int count; 95539633Smckusick 95639633Smckusick if ((vp->v_flag & VALIASED) == 0) 95739809Smckusick return (vp->v_usecount); 95839633Smckusick loop: 95939809Smckusick for (count = 0, vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 96040108Smckusick if (vq->v_rdev != vp->v_rdev || vq->v_type != vp->v_type) 96139633Smckusick continue; 96239633Smckusick /* 96339633Smckusick * Alias, but not in use, so flush it out. 96439633Smckusick */ 96539809Smckusick if (vq->v_usecount == 0) { 96639633Smckusick vgone(vq); 96739633Smckusick goto loop; 96839633Smckusick } 96939809Smckusick count += vq->v_usecount; 97039633Smckusick } 97139633Smckusick return (count); 97239633Smckusick } 97339667Smckusick 97439667Smckusick /* 97539667Smckusick * Print out a description of a vnode. 97639667Smckusick */ 97739667Smckusick static char *typename[] = 97840286Smckusick { "VNON", "VREG", "VDIR", "VBLK", "VCHR", "VLNK", "VSOCK", "VFIFO", "VBAD" }; 97939667Smckusick 98039667Smckusick vprint(label, vp) 98139667Smckusick char *label; 98239667Smckusick register struct vnode *vp; 98339667Smckusick { 98439913Smckusick char buf[64]; 98539667Smckusick 98639667Smckusick if (label != NULL) 98739667Smckusick printf("%s: ", label); 98850109Smckusick printf("type %s, usecount %d, writecount %d, refcount %d,", 98950109Smckusick typename[vp->v_type], vp->v_usecount, vp->v_writecount, 99050109Smckusick vp->v_holdcnt); 99139913Smckusick buf[0] = '\0'; 99239913Smckusick if (vp->v_flag & VROOT) 99339913Smckusick strcat(buf, "|VROOT"); 99439913Smckusick if (vp->v_flag & VTEXT) 99539913Smckusick strcat(buf, "|VTEXT"); 99641300Smckusick if (vp->v_flag & VSYSTEM) 99741300Smckusick strcat(buf, "|VSYSTEM"); 99841300Smckusick if (vp->v_flag & VXLOCK) 99941300Smckusick strcat(buf, "|VXLOCK"); 100041300Smckusick if (vp->v_flag & VXWANT) 100141300Smckusick strcat(buf, "|VXWANT"); 100241300Smckusick if (vp->v_flag & VBWAIT) 100341300Smckusick strcat(buf, "|VBWAIT"); 100439913Smckusick if (vp->v_flag & VALIASED) 100539913Smckusick strcat(buf, "|VALIASED"); 100639913Smckusick if (buf[0] != '\0') 100739913Smckusick printf(" flags (%s)", &buf[1]); 100865260Smckusick if (vp->v_data == NULL) { 100965260Smckusick printf("\n"); 101065260Smckusick } else { 101165260Smckusick printf("\n\t"); 101265260Smckusick VOP_PRINT(vp); 101365260Smckusick } 101439667Smckusick } 101541110Smarc 101649691Smckusick #ifdef DEBUG 101749691Smckusick /* 101849691Smckusick * List all of the locked vnodes in the system. 101949691Smckusick * Called when debugging the kernel. 102049691Smckusick */ 102149691Smckusick printlockedvnodes() 102249691Smckusick { 102349691Smckusick register struct mount *mp; 102449691Smckusick register struct vnode *vp; 102549691Smckusick 102649691Smckusick printf("Locked vnodes\n"); 102765260Smckusick for (mp = mountlist.tqh_first; mp != NULL; mp = mp->mnt_list.tqe_next) { 102865260Smckusick for (vp = mp->mnt_vnodelist.lh_first; 102965260Smckusick vp != NULL; 103065260Smckusick vp = vp->v_mntvnodes.le_next) 103149691Smckusick if (VOP_ISLOCKED(vp)) 103249691Smckusick vprint((char *)0, vp); 103365260Smckusick } 103449691Smckusick } 103549691Smckusick #endif 103649691Smckusick 103741110Smarc int kinfo_vdebug = 1; 103841110Smarc int kinfo_vgetfailed; 103941110Smarc #define KINFO_VNODESLOP 10 104041110Smarc /* 104157841Smckusick * Dump vnode list (via sysctl). 104241110Smarc * Copyout address of vnode followed by vnode. 104341110Smarc */ 104445118Smckusick /* ARGSUSED */ 104557841Smckusick sysctl_vnode(where, sizep) 104641110Smarc char *where; 104758465Sbostic size_t *sizep; 104841110Smarc { 104965260Smckusick register struct mount *mp, *nmp; 105041110Smarc struct vnode *vp; 105141110Smarc register char *bp = where, *savebp; 105253818Smckusick char *ewhere; 105341110Smarc int error; 105441110Smarc 105541110Smarc #define VPTRSZ sizeof (struct vnode *) 105641110Smarc #define VNODESZ sizeof (struct vnode) 105741110Smarc if (where == NULL) { 105857841Smckusick *sizep = (numvnodes + KINFO_VNODESLOP) * (VPTRSZ + VNODESZ); 105941110Smarc return (0); 106041110Smarc } 106157841Smckusick ewhere = where + *sizep; 106241110Smarc 106365260Smckusick for (mp = mountlist.tqh_first; mp != NULL; mp = nmp) { 106465260Smckusick nmp = mp->mnt_list.tqe_next; 106565260Smckusick if (vfs_busy(mp)) 106641300Smckusick continue; 106741110Smarc savebp = bp; 106841110Smarc again: 106965260Smckusick for (vp = mp->mnt_vnodelist.lh_first; 107065260Smckusick vp != NULL; 107165260Smckusick vp = vp->v_mntvnodes.le_next) { 107241422Smckusick /* 107341422Smckusick * Check that the vp is still associated with 107441422Smckusick * this filesystem. RACE: could have been 107541422Smckusick * recycled onto the same filesystem. 107641422Smckusick */ 107741421Smckusick if (vp->v_mount != mp) { 107841421Smckusick if (kinfo_vdebug) 107941421Smckusick printf("kinfo: vp changed\n"); 108041421Smckusick bp = savebp; 108141421Smckusick goto again; 108241421Smckusick } 108357841Smckusick if (bp + VPTRSZ + VNODESZ > ewhere) { 108457841Smckusick *sizep = bp - where; 108557841Smckusick return (ENOMEM); 108657841Smckusick } 108757841Smckusick if ((error = copyout((caddr_t)&vp, bp, VPTRSZ)) || 108857841Smckusick (error = copyout((caddr_t)vp, bp + VPTRSZ, VNODESZ))) 108941110Smarc return (error); 109041110Smarc bp += VPTRSZ + VNODESZ; 109141110Smarc } 109265260Smckusick vfs_unbusy(mp); 109365260Smckusick } 109441110Smarc 109557841Smckusick *sizep = bp - where; 109641110Smarc return (0); 109741110Smarc } 109865679Shibler 109965679Shibler /* 110065679Shibler * Check to see if a filesystem is mounted on a block device. 110165679Shibler */ 110265679Shibler int 110365679Shibler vfs_mountedon(vp) 110465679Shibler register struct vnode *vp; 110565679Shibler { 110665679Shibler register struct vnode *vq; 110765679Shibler 110865679Shibler if (vp->v_specflags & SI_MOUNTEDON) 110965679Shibler return (EBUSY); 111065679Shibler if (vp->v_flag & VALIASED) { 111165679Shibler for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 111265679Shibler if (vq->v_rdev != vp->v_rdev || 111365679Shibler vq->v_type != vp->v_type) 111465679Shibler continue; 111565679Shibler if (vq->v_specflags & SI_MOUNTEDON) 111665679Shibler return (EBUSY); 111765679Shibler } 111865679Shibler } 111965679Shibler return (0); 112065679Shibler } 112165679Shibler 112265679Shibler /* 112365679Shibler * Build hash lists of net addresses and hang them off the mount point. 112465679Shibler * Called by ufs_mount() to set up the lists of export addresses. 112565679Shibler */ 112665679Shibler static int 112765679Shibler vfs_hang_addrlist(mp, nep, argp) 112865679Shibler struct mount *mp; 112965679Shibler struct netexport *nep; 113065679Shibler struct export_args *argp; 113165679Shibler { 113265679Shibler register struct netcred *np; 113365679Shibler register struct radix_node_head *rnh; 113465679Shibler register int i; 113565679Shibler struct radix_node *rn; 113665679Shibler struct sockaddr *saddr, *smask = 0; 113765679Shibler struct domain *dom; 113865679Shibler int error; 113965679Shibler 114065679Shibler if (argp->ex_addrlen == 0) { 114165679Shibler if (mp->mnt_flag & MNT_DEFEXPORTED) 114265679Shibler return (EPERM); 114365679Shibler np = &nep->ne_defexported; 114465679Shibler np->netc_exflags = argp->ex_flags; 114565679Shibler np->netc_anon = argp->ex_anon; 114665679Shibler np->netc_anon.cr_ref = 1; 114765679Shibler mp->mnt_flag |= MNT_DEFEXPORTED; 114865679Shibler return (0); 114965679Shibler } 115065679Shibler i = sizeof(struct netcred) + argp->ex_addrlen + argp->ex_masklen; 115165679Shibler np = (struct netcred *)malloc(i, M_NETADDR, M_WAITOK); 115265679Shibler bzero((caddr_t)np, i); 115365679Shibler saddr = (struct sockaddr *)(np + 1); 115465679Shibler if (error = copyin(argp->ex_addr, (caddr_t)saddr, argp->ex_addrlen)) 115565679Shibler goto out; 115665679Shibler if (saddr->sa_len > argp->ex_addrlen) 115765679Shibler saddr->sa_len = argp->ex_addrlen; 115865679Shibler if (argp->ex_masklen) { 115965679Shibler smask = (struct sockaddr *)((caddr_t)saddr + argp->ex_addrlen); 116065679Shibler error = copyin(argp->ex_addr, (caddr_t)smask, argp->ex_masklen); 116165679Shibler if (error) 116265679Shibler goto out; 116365679Shibler if (smask->sa_len > argp->ex_masklen) 116465679Shibler smask->sa_len = argp->ex_masklen; 116565679Shibler } 116665679Shibler i = saddr->sa_family; 116765679Shibler if ((rnh = nep->ne_rtable[i]) == 0) { 116865679Shibler /* 116965679Shibler * Seems silly to initialize every AF when most are not 117065679Shibler * used, do so on demand here 117165679Shibler */ 117265679Shibler for (dom = domains; dom; dom = dom->dom_next) 117365679Shibler if (dom->dom_family == i && dom->dom_rtattach) { 117465679Shibler dom->dom_rtattach((void **)&nep->ne_rtable[i], 117565679Shibler dom->dom_rtoffset); 117665679Shibler break; 117765679Shibler } 117865679Shibler if ((rnh = nep->ne_rtable[i]) == 0) { 117965679Shibler error = ENOBUFS; 118065679Shibler goto out; 118165679Shibler } 118265679Shibler } 118365679Shibler rn = (*rnh->rnh_addaddr)((caddr_t)saddr, (caddr_t)smask, rnh, 118465679Shibler np->netc_rnodes); 118565679Shibler if (rn == 0 || np != (struct netcred *)rn) { /* already exists */ 118665679Shibler error = EPERM; 118765679Shibler goto out; 118865679Shibler } 118965679Shibler np->netc_exflags = argp->ex_flags; 119065679Shibler np->netc_anon = argp->ex_anon; 119165679Shibler np->netc_anon.cr_ref = 1; 119265679Shibler return (0); 119365679Shibler out: 119465679Shibler free(np, M_NETADDR); 119565679Shibler return (error); 119665679Shibler } 119765679Shibler 119865679Shibler /* ARGSUSED */ 119965679Shibler static int 120065679Shibler vfs_free_netcred(rn, w) 120165679Shibler struct radix_node *rn; 120265679Shibler caddr_t w; 120365679Shibler { 120465679Shibler register struct radix_node_head *rnh = (struct radix_node_head *)w; 120565679Shibler 120665679Shibler (*rnh->rnh_deladdr)(rn->rn_key, rn->rn_mask, rnh); 120765679Shibler free((caddr_t)rn, M_NETADDR); 120865679Shibler return (0); 120965679Shibler } 121065679Shibler 121165679Shibler /* 121265679Shibler * Free the net address hash lists that are hanging off the mount points. 121365679Shibler */ 121465679Shibler static void 121565679Shibler vfs_free_addrlist(nep) 121665679Shibler struct netexport *nep; 121765679Shibler { 121865679Shibler register int i; 121965679Shibler register struct radix_node_head *rnh; 122065679Shibler 122165679Shibler for (i = 0; i <= AF_MAX; i++) 122265679Shibler if (rnh = nep->ne_rtable[i]) { 122365679Shibler (*rnh->rnh_walktree)(rnh, vfs_free_netcred, 122465679Shibler (caddr_t)rnh); 122565679Shibler free((caddr_t)rnh, M_RTABLE); 122665679Shibler nep->ne_rtable[i] = 0; 122765679Shibler } 122865679Shibler } 122965679Shibler 123065679Shibler int 123165679Shibler vfs_export(mp, nep, argp) 123265679Shibler struct mount *mp; 123365679Shibler struct netexport *nep; 123465679Shibler struct export_args *argp; 123565679Shibler { 123665679Shibler int error; 123765679Shibler 123865679Shibler if (argp->ex_flags & MNT_DELEXPORT) { 123965679Shibler vfs_free_addrlist(nep); 124065679Shibler mp->mnt_flag &= ~(MNT_EXPORTED | MNT_DEFEXPORTED); 124165679Shibler } 124265679Shibler if (argp->ex_flags & MNT_EXPORTED) { 124365679Shibler if (error = vfs_hang_addrlist(mp, nep, argp)) 124465679Shibler return (error); 124565679Shibler mp->mnt_flag |= MNT_EXPORTED; 124665679Shibler } 124765679Shibler return (0); 124865679Shibler } 124965679Shibler 125065679Shibler struct netcred * 125165679Shibler vfs_export_lookup(mp, nep, nam) 125265679Shibler register struct mount *mp; 125365679Shibler struct netexport *nep; 125465679Shibler struct mbuf *nam; 125565679Shibler { 125665679Shibler register struct netcred *np; 125765679Shibler register struct radix_node_head *rnh; 125865679Shibler struct sockaddr *saddr; 125965679Shibler 126065679Shibler np = NULL; 126165679Shibler if (mp->mnt_flag & MNT_EXPORTED) { 126265679Shibler /* 126365679Shibler * Lookup in the export list first. 126465679Shibler */ 126565679Shibler if (nam != NULL) { 126665679Shibler saddr = mtod(nam, struct sockaddr *); 126765679Shibler rnh = nep->ne_rtable[saddr->sa_family]; 126865679Shibler if (rnh != NULL) { 126965679Shibler np = (struct netcred *) 127065679Shibler (*rnh->rnh_matchaddr)((caddr_t)saddr, 127165679Shibler rnh); 127265679Shibler if (np && np->netc_rnodes->rn_flags & RNF_ROOT) 127365679Shibler np = NULL; 127465679Shibler } 127565679Shibler } 127665679Shibler /* 127765679Shibler * If no address match, use the default if it exists. 127865679Shibler */ 127965679Shibler if (np == NULL && mp->mnt_flag & MNT_DEFEXPORTED) 128065679Shibler np = &nep->ne_defexported; 128165679Shibler } 128265679Shibler return (np); 128365679Shibler } 1284