137488Smckusick /* 263180Sbostic * Copyright (c) 1989, 1993 363180Sbostic * The Regents of the University of California. All rights reserved. 465771Sbostic * (c) UNIX System Laboratories, Inc. 565771Sbostic * All or some portions of this file are derived from material licensed 665771Sbostic * to the University of California by American Telephone and Telegraph 765771Sbostic * Co. or Unix System Laboratories, Inc. and are reproduced herein with 865771Sbostic * the permission of UNIX System Laboratories, Inc. 937488Smckusick * 1044458Sbostic * %sccs.include.redist.c% 1137488Smckusick * 12*66503Sbostic * @(#)vfs_subr.c 8.11 (Berkeley) 03/28/94 1337488Smckusick */ 1437488Smckusick 1537488Smckusick /* 1637488Smckusick * External virtual filesystem routines 1737488Smckusick */ 1837488Smckusick 1951460Sbostic #include <sys/param.h> 2053829Spendry #include <sys/systm.h> 2151460Sbostic #include <sys/proc.h> 2251460Sbostic #include <sys/mount.h> 2351460Sbostic #include <sys/time.h> 2451460Sbostic #include <sys/vnode.h> 2552415Smckusick #include <sys/stat.h> 2651460Sbostic #include <sys/namei.h> 2751460Sbostic #include <sys/ucred.h> 2851460Sbostic #include <sys/buf.h> 2951460Sbostic #include <sys/errno.h> 3051460Sbostic #include <sys/malloc.h> 3165679Shibler #include <sys/domain.h> 3265679Shibler #include <sys/mbuf.h> 3337488Smckusick 3460930Smckusick #include <vm/vm.h> 3560930Smckusick #include <sys/sysctl.h> 3660930Smckusick 3755050Spendry #include <miscfs/specfs/specdev.h> 3855050Spendry 3952415Smckusick enum vtype iftovt_tab[16] = { 4052415Smckusick VNON, VFIFO, VCHR, VNON, VDIR, VNON, VBLK, VNON, 4152415Smckusick VREG, VNON, VLNK, VNON, VSOCK, VNON, VNON, VBAD, 4252415Smckusick }; 4352415Smckusick int vttoif_tab[9] = { 4452415Smckusick 0, S_IFREG, S_IFDIR, S_IFBLK, S_IFCHR, S_IFLNK, 4552415Smckusick S_IFSOCK, S_IFIFO, S_IFMT, 4652415Smckusick }; 4752415Smckusick 4837488Smckusick /* 4956608Smckusick * Insq/Remq for the vnode usage lists. 5056608Smckusick */ 5165260Smckusick #define bufinsvn(bp, dp) LIST_INSERT_HEAD(dp, bp, b_vnbufs) 5265260Smckusick #define bufremvn(bp) { \ 5365260Smckusick LIST_REMOVE(bp, b_vnbufs); \ 5465260Smckusick (bp)->b_vnbufs.le_next = NOLIST; \ 5565260Smckusick } 5656608Smckusick 5765260Smckusick TAILQ_HEAD(freelst, vnode) vnode_free_list; /* vnode free list */ 5865260Smckusick struct mntlist mountlist; /* mounted filesystem list */ 5965260Smckusick 6056608Smckusick /* 6165260Smckusick * Initialize the vnode management data structures. 6237488Smckusick */ 6365260Smckusick vntblinit() 6437488Smckusick { 6537488Smckusick 6665260Smckusick TAILQ_INIT(&vnode_free_list); 6765260Smckusick TAILQ_INIT(&mountlist); 6837488Smckusick } 6937488Smckusick 7037488Smckusick /* 7137488Smckusick * Lock a filesystem. 7237488Smckusick * Used to prevent access to it while mounting and unmounting. 7337488Smckusick */ 7437488Smckusick vfs_lock(mp) 7537488Smckusick register struct mount *mp; 7637488Smckusick { 7737488Smckusick 7841400Smckusick while(mp->mnt_flag & MNT_MLOCK) { 7941400Smckusick mp->mnt_flag |= MNT_MWAIT; 8039045Smckusick sleep((caddr_t)mp, PVFS); 8139045Smckusick } 8241400Smckusick mp->mnt_flag |= MNT_MLOCK; 8337488Smckusick return (0); 8437488Smckusick } 8537488Smckusick 8637488Smckusick /* 8737488Smckusick * Unlock a locked filesystem. 8837488Smckusick * Panic if filesystem is not locked. 8937488Smckusick */ 9037488Smckusick void 9137488Smckusick vfs_unlock(mp) 9237488Smckusick register struct mount *mp; 9337488Smckusick { 9437488Smckusick 9541400Smckusick if ((mp->mnt_flag & MNT_MLOCK) == 0) 9641300Smckusick panic("vfs_unlock: not locked"); 9741400Smckusick mp->mnt_flag &= ~MNT_MLOCK; 9841400Smckusick if (mp->mnt_flag & MNT_MWAIT) { 9941400Smckusick mp->mnt_flag &= ~MNT_MWAIT; 10037488Smckusick wakeup((caddr_t)mp); 10137488Smckusick } 10237488Smckusick } 10337488Smckusick 10437488Smckusick /* 10541300Smckusick * Mark a mount point as busy. 10641300Smckusick * Used to synchronize access and to delay unmounting. 10741300Smckusick */ 10841300Smckusick vfs_busy(mp) 10941300Smckusick register struct mount *mp; 11041300Smckusick { 11141300Smckusick 11241400Smckusick while(mp->mnt_flag & MNT_MPBUSY) { 11341400Smckusick mp->mnt_flag |= MNT_MPWANT; 11441400Smckusick sleep((caddr_t)&mp->mnt_flag, PVFS); 11541300Smckusick } 11641419Smckusick if (mp->mnt_flag & MNT_UNMOUNT) 11741419Smckusick return (1); 11841400Smckusick mp->mnt_flag |= MNT_MPBUSY; 11941300Smckusick return (0); 12041300Smckusick } 12141300Smckusick 12241300Smckusick /* 12341300Smckusick * Free a busy filesystem. 12441300Smckusick * Panic if filesystem is not busy. 12541300Smckusick */ 12641300Smckusick vfs_unbusy(mp) 12741300Smckusick register struct mount *mp; 12841300Smckusick { 12941300Smckusick 13041400Smckusick if ((mp->mnt_flag & MNT_MPBUSY) == 0) 13141300Smckusick panic("vfs_unbusy: not busy"); 13241400Smckusick mp->mnt_flag &= ~MNT_MPBUSY; 13341400Smckusick if (mp->mnt_flag & MNT_MPWANT) { 13441400Smckusick mp->mnt_flag &= ~MNT_MPWANT; 13541400Smckusick wakeup((caddr_t)&mp->mnt_flag); 13641300Smckusick } 13741300Smckusick } 13841300Smckusick 13941300Smckusick /* 14037488Smckusick * Lookup a mount point by filesystem identifier. 14137488Smckusick */ 14237488Smckusick struct mount * 14337488Smckusick getvfs(fsid) 14437488Smckusick fsid_t *fsid; 14537488Smckusick { 14637488Smckusick register struct mount *mp; 14737488Smckusick 14865260Smckusick for (mp = mountlist.tqh_first; mp != NULL; mp = mp->mnt_list.tqe_next) { 14941400Smckusick if (mp->mnt_stat.f_fsid.val[0] == fsid->val[0] && 15065260Smckusick mp->mnt_stat.f_fsid.val[1] == fsid->val[1]) 15138288Smckusick return (mp); 15265260Smckusick } 15338288Smckusick return ((struct mount *)0); 15437488Smckusick } 15537488Smckusick 15637488Smckusick /* 15753829Spendry * Get a new unique fsid 15853829Spendry */ 15953829Spendry void 16053829Spendry getnewfsid(mp, mtype) 16153829Spendry struct mount *mp; 16253829Spendry int mtype; 16353829Spendry { 16453829Spendry static u_short xxxfs_mntid; 16553829Spendry 16653829Spendry fsid_t tfsid; 16753829Spendry 16865507Spendry mp->mnt_stat.f_fsid.val[0] = makedev(nblkdev + mtype, 0); 16953829Spendry mp->mnt_stat.f_fsid.val[1] = mtype; 17053829Spendry if (xxxfs_mntid == 0) 17153829Spendry ++xxxfs_mntid; 17265507Spendry tfsid.val[0] = makedev(nblkdev + mtype, xxxfs_mntid); 17353829Spendry tfsid.val[1] = mtype; 17465260Smckusick if (mountlist.tqh_first != NULL) { 17553936Spendry while (getvfs(&tfsid)) { 17653936Spendry tfsid.val[0]++; 17753936Spendry xxxfs_mntid++; 17853936Spendry } 17953829Spendry } 18053829Spendry mp->mnt_stat.f_fsid.val[0] = tfsid.val[0]; 18153829Spendry } 18253829Spendry 18353829Spendry /* 18437488Smckusick * Set vnode attributes to VNOVAL 18537488Smckusick */ 18637488Smckusick void vattr_null(vap) 18737488Smckusick register struct vattr *vap; 18837488Smckusick { 18937488Smckusick 19037488Smckusick vap->va_type = VNON; 19152005Smckusick vap->va_size = vap->va_bytes = VNOVAL; 19237488Smckusick vap->va_mode = vap->va_nlink = vap->va_uid = vap->va_gid = 19352005Smckusick vap->va_fsid = vap->va_fileid = 19452005Smckusick vap->va_blocksize = vap->va_rdev = 19554347Smckusick vap->va_atime.ts_sec = vap->va_atime.ts_nsec = 19654347Smckusick vap->va_mtime.ts_sec = vap->va_mtime.ts_nsec = 19754347Smckusick vap->va_ctime.ts_sec = vap->va_ctime.ts_nsec = 19838258Smckusick vap->va_flags = vap->va_gen = VNOVAL; 19958548Sbostic vap->va_vaflags = 0; 20037488Smckusick } 20138265Smckusick 20238265Smckusick /* 20339397Smckusick * Routines having to do with the management of the vnode table. 20439397Smckusick */ 20553547Sheideman extern int (**dead_vnodeop_p)(); 20639635Smckusick extern void vclean(); 20740883Smckusick long numvnodes; 20853493Sheideman extern struct vattr va_null; 20939397Smckusick 21039397Smckusick /* 21139397Smckusick * Return the next vnode from the free list. 21239397Smckusick */ 21339397Smckusick getnewvnode(tag, mp, vops, vpp) 21439397Smckusick enum vtagtype tag; 21539397Smckusick struct mount *mp; 21653495Sheideman int (**vops)(); 21739397Smckusick struct vnode **vpp; 21839397Smckusick { 21965511Smckusick register struct vnode *vp; 22057042Smargo int s; 22139397Smckusick 22265260Smckusick if ((vnode_free_list.tqh_first == NULL && 22365260Smckusick numvnodes < 2 * desiredvnodes) || 22454347Smckusick numvnodes < desiredvnodes) { 22545118Smckusick vp = (struct vnode *)malloc((u_long)sizeof *vp, 22645118Smckusick M_VNODE, M_WAITOK); 22740883Smckusick bzero((char *)vp, sizeof *vp); 22840883Smckusick numvnodes++; 22940883Smckusick } else { 23065260Smckusick if ((vp = vnode_free_list.tqh_first) == NULL) { 23140883Smckusick tablefull("vnode"); 23240883Smckusick *vpp = 0; 23340883Smckusick return (ENFILE); 23440883Smckusick } 23540883Smckusick if (vp->v_usecount) 23640883Smckusick panic("free vnode isn't"); 23765260Smckusick TAILQ_REMOVE(&vnode_free_list, vp, v_freelist); 23865505Smckusick /* see comment on why 0xdeadb is set at end of vgone (below) */ 23965505Smckusick vp->v_freelist.tqe_prev = (struct vnode **)0xdeadb; 24052190Smckusick vp->v_lease = NULL; 24140883Smckusick if (vp->v_type != VBAD) 24240883Smckusick vgone(vp); 24357042Smargo #ifdef DIAGNOSTIC 24452006Smckusick if (vp->v_data) 24552006Smckusick panic("cleaned vnode isn't"); 24657042Smargo s = splbio(); 24757042Smargo if (vp->v_numoutput) 24857042Smargo panic("Clean vnode has pending I/O's"); 24957042Smargo splx(s); 25057042Smargo #endif 25140883Smckusick vp->v_flag = 0; 25240883Smckusick vp->v_lastr = 0; 25365745Shibler vp->v_ralen = 0; 25465745Shibler vp->v_maxra = 0; 25557042Smargo vp->v_lastw = 0; 25657042Smargo vp->v_lasta = 0; 25757042Smargo vp->v_cstart = 0; 25857042Smargo vp->v_clen = 0; 25940883Smckusick vp->v_socket = 0; 26039397Smckusick } 26139512Smckusick vp->v_type = VNON; 26239397Smckusick cache_purge(vp); 26339397Smckusick vp->v_tag = tag; 26439433Smckusick vp->v_op = vops; 26539397Smckusick insmntque(vp, mp); 26639397Smckusick *vpp = vp; 26765505Smckusick vp->v_usecount = 1; 26865260Smckusick vp->v_data = 0; 26939397Smckusick return (0); 27039397Smckusick } 27165679Shibler 27239397Smckusick /* 27339397Smckusick * Move a vnode from one mount queue to another. 27439397Smckusick */ 27539397Smckusick insmntque(vp, mp) 27639397Smckusick register struct vnode *vp; 27739397Smckusick register struct mount *mp; 27839397Smckusick { 27939397Smckusick 28039397Smckusick /* 28139397Smckusick * Delete from old mount point vnode list, if on one. 28239397Smckusick */ 28365679Shibler if (vp->v_mount != NULL) 28465260Smckusick LIST_REMOVE(vp, v_mntvnodes); 28539397Smckusick /* 28639397Smckusick * Insert into list of vnodes for the new mount point, if available. 28739397Smckusick */ 28865260Smckusick if ((vp->v_mount = mp) == NULL) 28939397Smckusick return; 29065260Smckusick LIST_INSERT_HEAD(&mp->mnt_vnodelist, vp, v_mntvnodes); 29139397Smckusick } 29239397Smckusick 29339397Smckusick /* 29449232Smckusick * Update outstanding I/O count and do wakeup if requested. 29549232Smckusick */ 29649232Smckusick vwakeup(bp) 29749232Smckusick register struct buf *bp; 29849232Smckusick { 29949232Smckusick register struct vnode *vp; 30049232Smckusick 30157810Smckusick bp->b_flags &= ~B_WRITEINPROG; 30249232Smckusick if (vp = bp->b_vp) { 30349232Smckusick vp->v_numoutput--; 30457042Smargo if (vp->v_numoutput < 0) 30557042Smargo panic("vwakeup: neg numoutput"); 30649232Smckusick if ((vp->v_flag & VBWAIT) && vp->v_numoutput <= 0) { 30749232Smckusick if (vp->v_numoutput < 0) 30849232Smckusick panic("vwakeup: neg numoutput"); 30949232Smckusick vp->v_flag &= ~VBWAIT; 31049232Smckusick wakeup((caddr_t)&vp->v_numoutput); 31149232Smckusick } 31249232Smckusick } 31349232Smckusick } 31449232Smckusick 31549232Smckusick /* 31649232Smckusick * Flush out and invalidate all buffers associated with a vnode. 31749232Smckusick * Called with the underlying object locked. 31849232Smckusick */ 31954442Smckusick int 32057792Smckusick vinvalbuf(vp, flags, cred, p, slpflag, slptimeo) 32149232Smckusick register struct vnode *vp; 32256459Smargo int flags; 32354442Smckusick struct ucred *cred; 32454442Smckusick struct proc *p; 32557792Smckusick int slpflag, slptimeo; 32649232Smckusick { 32749232Smckusick register struct buf *bp; 32849232Smckusick struct buf *nbp, *blist; 32954442Smckusick int s, error; 33049232Smckusick 33156459Smargo if (flags & V_SAVE) { 33254442Smckusick if (error = VOP_FSYNC(vp, cred, MNT_WAIT, p)) 33354442Smckusick return (error); 33465260Smckusick if (vp->v_dirtyblkhd.lh_first != NULL) 33554442Smckusick panic("vinvalbuf: dirty bufs"); 33654442Smckusick } 33749232Smckusick for (;;) { 33865260Smckusick if ((blist = vp->v_cleanblkhd.lh_first) && flags & V_SAVEMETA) 33956459Smargo while (blist && blist->b_lblkno < 0) 34065260Smckusick blist = blist->b_vnbufs.le_next; 34165260Smckusick if (!blist && (blist = vp->v_dirtyblkhd.lh_first) && 34256608Smckusick (flags & V_SAVEMETA)) 34356459Smargo while (blist && blist->b_lblkno < 0) 34465260Smckusick blist = blist->b_vnbufs.le_next; 34556459Smargo if (!blist) 34649232Smckusick break; 34756459Smargo 34849232Smckusick for (bp = blist; bp; bp = nbp) { 34965260Smckusick nbp = bp->b_vnbufs.le_next; 35056459Smargo if (flags & V_SAVEMETA && bp->b_lblkno < 0) 35156459Smargo continue; 35249232Smckusick s = splbio(); 35349232Smckusick if (bp->b_flags & B_BUSY) { 35449232Smckusick bp->b_flags |= B_WANTED; 35557792Smckusick error = tsleep((caddr_t)bp, 35657792Smckusick slpflag | (PRIBIO + 1), "vinvalbuf", 35757792Smckusick slptimeo); 35849232Smckusick splx(s); 35957792Smckusick if (error) 36057792Smckusick return (error); 36149232Smckusick break; 36249232Smckusick } 36349232Smckusick bremfree(bp); 36449232Smckusick bp->b_flags |= B_BUSY; 36549232Smckusick splx(s); 36657792Smckusick /* 36757792Smckusick * XXX Since there are no node locks for NFS, I believe 36857792Smckusick * there is a slight chance that a delayed write will 36957792Smckusick * occur while sleeping just above, so check for it. 37057792Smckusick */ 37157792Smckusick if ((bp->b_flags & B_DELWRI) && (flags & V_SAVE)) { 37257792Smckusick (void) VOP_BWRITE(bp); 37357792Smckusick break; 37457792Smckusick } 37556459Smargo bp->b_flags |= B_INVAL; 37649232Smckusick brelse(bp); 37749232Smckusick } 37849232Smckusick } 37956608Smckusick if (!(flags & V_SAVEMETA) && 38065260Smckusick (vp->v_dirtyblkhd.lh_first || vp->v_cleanblkhd.lh_first)) 38149232Smckusick panic("vinvalbuf: flush failed"); 38254442Smckusick return (0); 38349232Smckusick } 38449232Smckusick 38549232Smckusick /* 38649232Smckusick * Associate a buffer with a vnode. 38749232Smckusick */ 38849232Smckusick bgetvp(vp, bp) 38949232Smckusick register struct vnode *vp; 39049232Smckusick register struct buf *bp; 39149232Smckusick { 39249232Smckusick 39349232Smckusick if (bp->b_vp) 39449232Smckusick panic("bgetvp: not free"); 39549232Smckusick VHOLD(vp); 39649232Smckusick bp->b_vp = vp; 39749232Smckusick if (vp->v_type == VBLK || vp->v_type == VCHR) 39849232Smckusick bp->b_dev = vp->v_rdev; 39949232Smckusick else 40049232Smckusick bp->b_dev = NODEV; 40149232Smckusick /* 40249232Smckusick * Insert onto list for new vnode. 40349232Smckusick */ 40456608Smckusick bufinsvn(bp, &vp->v_cleanblkhd); 40549232Smckusick } 40649232Smckusick 40749232Smckusick /* 40849232Smckusick * Disassociate a buffer from a vnode. 40949232Smckusick */ 41049232Smckusick brelvp(bp) 41149232Smckusick register struct buf *bp; 41249232Smckusick { 41349232Smckusick struct vnode *vp; 41449232Smckusick 41549232Smckusick if (bp->b_vp == (struct vnode *) 0) 41649232Smckusick panic("brelvp: NULL"); 41749232Smckusick /* 41849232Smckusick * Delete from old vnode list, if on one. 41949232Smckusick */ 42065260Smckusick if (bp->b_vnbufs.le_next != NOLIST) 42156608Smckusick bufremvn(bp); 42249232Smckusick vp = bp->b_vp; 42349232Smckusick bp->b_vp = (struct vnode *) 0; 42449232Smckusick HOLDRELE(vp); 42549232Smckusick } 42649232Smckusick 42749232Smckusick /* 42849232Smckusick * Reassign a buffer from one vnode to another. 42949232Smckusick * Used to assign file specific control information 43049232Smckusick * (indirect blocks) to the vnode to which they belong. 43149232Smckusick */ 43249232Smckusick reassignbuf(bp, newvp) 43349232Smckusick register struct buf *bp; 43449232Smckusick register struct vnode *newvp; 43549232Smckusick { 43665260Smckusick register struct buflists *listheadp; 43749232Smckusick 43852655Smckusick if (newvp == NULL) { 43952655Smckusick printf("reassignbuf: NULL"); 44052655Smckusick return; 44152655Smckusick } 44249232Smckusick /* 44349232Smckusick * Delete from old vnode list, if on one. 44449232Smckusick */ 44565260Smckusick if (bp->b_vnbufs.le_next != NOLIST) 44656608Smckusick bufremvn(bp); 44749232Smckusick /* 44849232Smckusick * If dirty, put on list of dirty buffers; 44949232Smckusick * otherwise insert onto list of clean buffers. 45049232Smckusick */ 45149232Smckusick if (bp->b_flags & B_DELWRI) 45249232Smckusick listheadp = &newvp->v_dirtyblkhd; 45349232Smckusick else 45449232Smckusick listheadp = &newvp->v_cleanblkhd; 45556608Smckusick bufinsvn(bp, listheadp); 45649232Smckusick } 45749232Smckusick 45849232Smckusick /* 45939433Smckusick * Create a vnode for a block device. 46039433Smckusick * Used for root filesystem, argdev, and swap areas. 46139433Smckusick * Also used for memory file system special devices. 46239397Smckusick */ 46339433Smckusick bdevvp(dev, vpp) 46439433Smckusick dev_t dev; 46539433Smckusick struct vnode **vpp; 46639433Smckusick { 46739433Smckusick register struct vnode *vp; 46839433Smckusick struct vnode *nvp; 46939433Smckusick int error; 47039433Smckusick 47146989Smckusick if (dev == NODEV) 47246989Smckusick return (0); 47353547Sheideman error = getnewvnode(VT_NON, (struct mount *)0, spec_vnodeop_p, &nvp); 47439433Smckusick if (error) { 47539433Smckusick *vpp = 0; 47639433Smckusick return (error); 47739433Smckusick } 47839433Smckusick vp = nvp; 47939433Smckusick vp->v_type = VBLK; 48039615Smckusick if (nvp = checkalias(vp, dev, (struct mount *)0)) { 48139433Smckusick vput(vp); 48239433Smckusick vp = nvp; 48339433Smckusick } 48439433Smckusick *vpp = vp; 48539433Smckusick return (0); 48639433Smckusick } 48739433Smckusick 48839433Smckusick /* 48939433Smckusick * Check to see if the new vnode represents a special device 49039433Smckusick * for which we already have a vnode (either because of 49139433Smckusick * bdevvp() or because of a different vnode representing 49239433Smckusick * the same block device). If such an alias exists, deallocate 49339509Smckusick * the existing contents and return the aliased vnode. The 49439433Smckusick * caller is responsible for filling it with its new contents. 49539433Smckusick */ 49639433Smckusick struct vnode * 49739615Smckusick checkalias(nvp, nvp_rdev, mp) 49839433Smckusick register struct vnode *nvp; 49939615Smckusick dev_t nvp_rdev; 50039433Smckusick struct mount *mp; 50139433Smckusick { 50239433Smckusick register struct vnode *vp; 50339615Smckusick struct vnode **vpp; 50439433Smckusick 50539433Smckusick if (nvp->v_type != VBLK && nvp->v_type != VCHR) 50641400Smckusick return (NULLVP); 50739615Smckusick 50839615Smckusick vpp = &speclisth[SPECHASH(nvp_rdev)]; 50939433Smckusick loop: 51039615Smckusick for (vp = *vpp; vp; vp = vp->v_specnext) { 51139615Smckusick if (nvp_rdev != vp->v_rdev || nvp->v_type != vp->v_type) 51239433Smckusick continue; 51339615Smckusick /* 51439615Smckusick * Alias, but not in use, so flush it out. 51539615Smckusick */ 51639809Smckusick if (vp->v_usecount == 0) { 51739615Smckusick vgone(vp); 51839615Smckusick goto loop; 51939615Smckusick } 52065260Smckusick if (vget(vp, 1)) 52139633Smckusick goto loop; 52239433Smckusick break; 52339433Smckusick } 52439615Smckusick if (vp == NULL || vp->v_tag != VT_NON) { 52539615Smckusick MALLOC(nvp->v_specinfo, struct specinfo *, 52639615Smckusick sizeof(struct specinfo), M_VNODE, M_WAITOK); 52739615Smckusick nvp->v_rdev = nvp_rdev; 52839809Smckusick nvp->v_hashchain = vpp; 52939615Smckusick nvp->v_specnext = *vpp; 53042152Smckusick nvp->v_specflags = 0; 53139615Smckusick *vpp = nvp; 53240640Smckusick if (vp != NULL) { 53340640Smckusick nvp->v_flag |= VALIASED; 53440640Smckusick vp->v_flag |= VALIASED; 53540640Smckusick vput(vp); 53640640Smckusick } 53741400Smckusick return (NULLVP); 53839433Smckusick } 53939484Smckusick VOP_UNLOCK(vp); 54039484Smckusick vclean(vp, 0); 54139433Smckusick vp->v_op = nvp->v_op; 54239433Smckusick vp->v_tag = nvp->v_tag; 54339433Smckusick nvp->v_type = VNON; 54439433Smckusick insmntque(vp, mp); 54539433Smckusick return (vp); 54639433Smckusick } 54739433Smckusick 54839433Smckusick /* 54939433Smckusick * Grab a particular vnode from the free list, increment its 55039433Smckusick * reference count and lock it. The vnode lock bit is set the 55139433Smckusick * vnode is being eliminated in vgone. The process is awakened 55239433Smckusick * when the transition is completed, and an error returned to 55339433Smckusick * indicate that the vnode is no longer usable (possibly having 55439433Smckusick * been changed to a new file system type). 55539433Smckusick */ 55665260Smckusick vget(vp, lockflag) 55739397Smckusick register struct vnode *vp; 55865260Smckusick int lockflag; 55939397Smckusick { 56039397Smckusick 56139433Smckusick if (vp->v_flag & VXLOCK) { 56239433Smckusick vp->v_flag |= VXWANT; 56339433Smckusick sleep((caddr_t)vp, PINOD); 56439433Smckusick return (1); 56539433Smckusick } 56666423Shibler if (vp->v_usecount == 0) { 56766423Shibler #ifdef DIAGNOSTIC 568*66503Sbostic if (vp->v_freelist.tqe_prev == (struct vnode **)0xdeadb) 56966423Shibler panic("vget: race with getnewvnode"); 57066423Shibler #endif 57165260Smckusick TAILQ_REMOVE(&vnode_free_list, vp, v_freelist); 57266423Shibler } 57359450Smckusick vp->v_usecount++; 57465260Smckusick if (lockflag) 57565260Smckusick VOP_LOCK(vp); 57639433Smckusick return (0); 57739397Smckusick } 57839397Smckusick 57939397Smckusick /* 58039397Smckusick * Vnode reference, just increment the count 58139397Smckusick */ 58239397Smckusick void vref(vp) 58339397Smckusick struct vnode *vp; 58439397Smckusick { 58539397Smckusick 58659450Smckusick if (vp->v_usecount <= 0) 58759450Smckusick panic("vref used where vget required"); 58839809Smckusick vp->v_usecount++; 58939397Smckusick } 59039397Smckusick 59139397Smckusick /* 59239397Smckusick * vput(), just unlock and vrele() 59339397Smckusick */ 59439397Smckusick void vput(vp) 59539397Smckusick register struct vnode *vp; 59639397Smckusick { 59752416Storek 59839397Smckusick VOP_UNLOCK(vp); 59939397Smckusick vrele(vp); 60039397Smckusick } 60139397Smckusick 60239397Smckusick /* 60339397Smckusick * Vnode release. 60439397Smckusick * If count drops to zero, call inactive routine and return to freelist. 60539397Smckusick */ 60639397Smckusick void vrele(vp) 60739397Smckusick register struct vnode *vp; 60839397Smckusick { 60939397Smckusick 61050109Smckusick #ifdef DIAGNOSTIC 61139397Smckusick if (vp == NULL) 61239433Smckusick panic("vrele: null vp"); 61350109Smckusick #endif 61439809Smckusick vp->v_usecount--; 61539809Smckusick if (vp->v_usecount > 0) 61639397Smckusick return; 61750109Smckusick #ifdef DIAGNOSTIC 61850109Smckusick if (vp->v_usecount != 0 || vp->v_writecount != 0) { 61950109Smckusick vprint("vrele: bad ref count", vp); 62050109Smckusick panic("vrele: ref cnt"); 62150109Smckusick } 62250109Smckusick #endif 62355468Smckusick /* 62455468Smckusick * insert at tail of LRU list 62555468Smckusick */ 62665260Smckusick TAILQ_INSERT_TAIL(&vnode_free_list, vp, v_freelist); 62754442Smckusick VOP_INACTIVE(vp); 62839397Smckusick } 62939433Smckusick 63039433Smckusick /* 63139809Smckusick * Page or buffer structure gets a reference. 63239809Smckusick */ 63353312Smckusick void vhold(vp) 63439809Smckusick register struct vnode *vp; 63539809Smckusick { 63639809Smckusick 63739809Smckusick vp->v_holdcnt++; 63839809Smckusick } 63939809Smckusick 64039809Smckusick /* 64139809Smckusick * Page or buffer structure frees a reference. 64239809Smckusick */ 64353312Smckusick void holdrele(vp) 64439809Smckusick register struct vnode *vp; 64539809Smckusick { 64639809Smckusick 64739809Smckusick if (vp->v_holdcnt <= 0) 64839809Smckusick panic("holdrele: holdcnt"); 64939809Smckusick vp->v_holdcnt--; 65039809Smckusick } 65139809Smckusick 65239809Smckusick /* 65339509Smckusick * Remove any vnodes in the vnode table belonging to mount point mp. 65439509Smckusick * 65539509Smckusick * If MNT_NOFORCE is specified, there should not be any active ones, 65639509Smckusick * return error if any are found (nb: this is a user error, not a 65739509Smckusick * system error). If MNT_FORCE is specified, detach any active vnodes 65839509Smckusick * that are found. 65939509Smckusick */ 66065679Shibler #ifdef DIAGNOSTIC 66160930Smckusick int busyprt = 0; /* print out busy vnodes */ 66260930Smckusick struct ctldebug debug1 = { "busyprt", &busyprt }; 66365679Shibler #endif 66439509Smckusick 66539509Smckusick vflush(mp, skipvp, flags) 66639509Smckusick struct mount *mp; 66739509Smckusick struct vnode *skipvp; 66839509Smckusick int flags; 66939509Smckusick { 67039509Smckusick register struct vnode *vp, *nvp; 67139509Smckusick int busy = 0; 67239509Smckusick 67341400Smckusick if ((mp->mnt_flag & MNT_MPBUSY) == 0) 67441300Smckusick panic("vflush: not busy"); 67541421Smckusick loop: 67665260Smckusick for (vp = mp->mnt_vnodelist.lh_first; vp; vp = nvp) { 67741421Smckusick if (vp->v_mount != mp) 67841421Smckusick goto loop; 67965260Smckusick nvp = vp->v_mntvnodes.le_next; 68039509Smckusick /* 68139509Smckusick * Skip over a selected vnode. 68239509Smckusick */ 68339509Smckusick if (vp == skipvp) 68439509Smckusick continue; 68539509Smckusick /* 68641300Smckusick * Skip over a vnodes marked VSYSTEM. 68741300Smckusick */ 68841300Smckusick if ((flags & SKIPSYSTEM) && (vp->v_flag & VSYSTEM)) 68941300Smckusick continue; 69041300Smckusick /* 69157040Smckusick * If WRITECLOSE is set, only flush out regular file 69257040Smckusick * vnodes open for writing. 69357040Smckusick */ 69457040Smckusick if ((flags & WRITECLOSE) && 69557040Smckusick (vp->v_writecount == 0 || vp->v_type != VREG)) 69657040Smckusick continue; 69757040Smckusick /* 69839809Smckusick * With v_usecount == 0, all we need to do is clear 69939509Smckusick * out the vnode data structures and we are done. 70039509Smckusick */ 70139809Smckusick if (vp->v_usecount == 0) { 70239509Smckusick vgone(vp); 70339509Smckusick continue; 70439509Smckusick } 70539509Smckusick /* 70657040Smckusick * If FORCECLOSE is set, forcibly close the vnode. 70739509Smckusick * For block or character devices, revert to an 70839509Smckusick * anonymous device. For all other files, just kill them. 70939509Smckusick */ 71041300Smckusick if (flags & FORCECLOSE) { 71139509Smckusick if (vp->v_type != VBLK && vp->v_type != VCHR) { 71239509Smckusick vgone(vp); 71339509Smckusick } else { 71439509Smckusick vclean(vp, 0); 71553547Sheideman vp->v_op = spec_vnodeop_p; 71639509Smckusick insmntque(vp, (struct mount *)0); 71739509Smckusick } 71839509Smckusick continue; 71939509Smckusick } 72065679Shibler #ifdef DIAGNOSTIC 72139509Smckusick if (busyprt) 72239667Smckusick vprint("vflush: busy vnode", vp); 72365679Shibler #endif 72439509Smckusick busy++; 72539509Smckusick } 72639509Smckusick if (busy) 72739509Smckusick return (EBUSY); 72839509Smckusick return (0); 72939509Smckusick } 73039509Smckusick 73139509Smckusick /* 73239433Smckusick * Disassociate the underlying file system from a vnode. 73339433Smckusick */ 73454347Smckusick void 73554347Smckusick vclean(vp, flags) 73639433Smckusick register struct vnode *vp; 73745118Smckusick int flags; 73839433Smckusick { 73939484Smckusick int active; 74039433Smckusick 74139484Smckusick /* 74239484Smckusick * Check to see if the vnode is in use. 74339667Smckusick * If so we have to reference it before we clean it out 74439667Smckusick * so that its count cannot fall to zero and generate a 74539667Smckusick * race against ourselves to recycle it. 74639484Smckusick */ 74739809Smckusick if (active = vp->v_usecount) 74839484Smckusick VREF(vp); 74939484Smckusick /* 75056805Smckusick * Even if the count is zero, the VOP_INACTIVE routine may still 75156805Smckusick * have the object locked while it cleans it out. The VOP_LOCK 75256805Smckusick * ensures that the VOP_INACTIVE routine is done with its work. 75356805Smckusick * For active vnodes, it ensures that no other activity can 75456805Smckusick * occur while the underlying object is being cleaned out. 75556805Smckusick */ 75656805Smckusick VOP_LOCK(vp); 75756805Smckusick /* 75839484Smckusick * Prevent the vnode from being recycled or 75939484Smckusick * brought into use while we clean it out. 76039484Smckusick */ 76139667Smckusick if (vp->v_flag & VXLOCK) 76239667Smckusick panic("vclean: deadlock"); 76339433Smckusick vp->v_flag |= VXLOCK; 76439433Smckusick /* 76556805Smckusick * Clean out any buffers associated with the vnode. 76639667Smckusick */ 76741300Smckusick if (flags & DOCLOSE) 76857792Smckusick vinvalbuf(vp, V_SAVE, NOCRED, NULL, 0, 0); 76939667Smckusick /* 77056805Smckusick * Any other processes trying to obtain this lock must first 77156805Smckusick * wait for VXLOCK to clear, then call the new lock operation. 77239433Smckusick */ 77356805Smckusick VOP_UNLOCK(vp); 77439433Smckusick /* 77556805Smckusick * If purging an active vnode, it must be closed and 77656805Smckusick * deactivated before being reclaimed. 77739433Smckusick */ 77839484Smckusick if (active) { 77956805Smckusick if (flags & DOCLOSE) 78056805Smckusick VOP_CLOSE(vp, IO_NDELAY, NOCRED, NULL); 78156805Smckusick VOP_INACTIVE(vp); 78239433Smckusick } 78339433Smckusick /* 78439433Smckusick * Reclaim the vnode. 78539433Smckusick */ 78656805Smckusick if (VOP_RECLAIM(vp)) 78739433Smckusick panic("vclean: cannot reclaim"); 78839484Smckusick if (active) 78939484Smckusick vrele(vp); 79053580Sheideman 79139433Smckusick /* 79256805Smckusick * Done with purge, notify sleepers of the grim news. 79339433Smckusick */ 79456805Smckusick vp->v_op = dead_vnodeop_p; 79556805Smckusick vp->v_tag = VT_NON; 79639433Smckusick vp->v_flag &= ~VXLOCK; 79739433Smckusick if (vp->v_flag & VXWANT) { 79839433Smckusick vp->v_flag &= ~VXWANT; 79939433Smckusick wakeup((caddr_t)vp); 80039433Smckusick } 80139433Smckusick } 80239433Smckusick 80339433Smckusick /* 80439633Smckusick * Eliminate all activity associated with the requested vnode 80539633Smckusick * and with all vnodes aliased to the requested vnode. 80639633Smckusick */ 80739633Smckusick void vgoneall(vp) 80839633Smckusick register struct vnode *vp; 80939633Smckusick { 81039809Smckusick register struct vnode *vq; 81139633Smckusick 81240665Smckusick if (vp->v_flag & VALIASED) { 81340665Smckusick /* 81440665Smckusick * If a vgone (or vclean) is already in progress, 81540665Smckusick * wait until it is done and return. 81640665Smckusick */ 81740665Smckusick if (vp->v_flag & VXLOCK) { 81840665Smckusick vp->v_flag |= VXWANT; 81940665Smckusick sleep((caddr_t)vp, PINOD); 82040665Smckusick return; 82139633Smckusick } 82240665Smckusick /* 82340665Smckusick * Ensure that vp will not be vgone'd while we 82440665Smckusick * are eliminating its aliases. 82540665Smckusick */ 82640665Smckusick vp->v_flag |= VXLOCK; 82740665Smckusick while (vp->v_flag & VALIASED) { 82840665Smckusick for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 82940665Smckusick if (vq->v_rdev != vp->v_rdev || 83040665Smckusick vq->v_type != vp->v_type || vp == vq) 83140665Smckusick continue; 83240665Smckusick vgone(vq); 83340665Smckusick break; 83440665Smckusick } 83540665Smckusick } 83640665Smckusick /* 83740665Smckusick * Remove the lock so that vgone below will 83840665Smckusick * really eliminate the vnode after which time 83940665Smckusick * vgone will awaken any sleepers. 84040665Smckusick */ 84140665Smckusick vp->v_flag &= ~VXLOCK; 84239633Smckusick } 84339633Smckusick vgone(vp); 84439633Smckusick } 84539633Smckusick 84639633Smckusick /* 84739433Smckusick * Eliminate all activity associated with a vnode 84839433Smckusick * in preparation for reuse. 84939433Smckusick */ 85039433Smckusick void vgone(vp) 85139433Smckusick register struct vnode *vp; 85239433Smckusick { 85339809Smckusick register struct vnode *vq; 85439615Smckusick struct vnode *vx; 85539433Smckusick 85639433Smckusick /* 85740548Smckusick * If a vgone (or vclean) is already in progress, 85840548Smckusick * wait until it is done and return. 85940548Smckusick */ 86040548Smckusick if (vp->v_flag & VXLOCK) { 86140548Smckusick vp->v_flag |= VXWANT; 86240548Smckusick sleep((caddr_t)vp, PINOD); 86340548Smckusick return; 86440548Smckusick } 86540548Smckusick /* 86639433Smckusick * Clean out the filesystem specific data. 86739433Smckusick */ 86841300Smckusick vclean(vp, DOCLOSE); 86939433Smckusick /* 87039433Smckusick * Delete from old mount point vnode list, if on one. 87139433Smckusick */ 87265260Smckusick if (vp->v_mount != NULL) { 87365260Smckusick LIST_REMOVE(vp, v_mntvnodes); 87452311Smckusick vp->v_mount = NULL; 87539433Smckusick } 87639433Smckusick /* 87739433Smckusick * If special device, remove it from special device alias list. 87839433Smckusick */ 87939433Smckusick if (vp->v_type == VBLK || vp->v_type == VCHR) { 88039809Smckusick if (*vp->v_hashchain == vp) { 88139809Smckusick *vp->v_hashchain = vp->v_specnext; 88239433Smckusick } else { 88339809Smckusick for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 88439615Smckusick if (vq->v_specnext != vp) 88539433Smckusick continue; 88639615Smckusick vq->v_specnext = vp->v_specnext; 88739433Smckusick break; 88839433Smckusick } 88939615Smckusick if (vq == NULL) 89039433Smckusick panic("missing bdev"); 89139433Smckusick } 89239615Smckusick if (vp->v_flag & VALIASED) { 89352416Storek vx = NULL; 89439809Smckusick for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 89540108Smckusick if (vq->v_rdev != vp->v_rdev || 89640108Smckusick vq->v_type != vp->v_type) 89739615Smckusick continue; 89852416Storek if (vx) 89952416Storek break; 90039615Smckusick vx = vq; 90139615Smckusick } 90252416Storek if (vx == NULL) 90339615Smckusick panic("missing alias"); 90452416Storek if (vq == NULL) 90539615Smckusick vx->v_flag &= ~VALIASED; 90639615Smckusick vp->v_flag &= ~VALIASED; 90739615Smckusick } 90839615Smckusick FREE(vp->v_specinfo, M_VNODE); 90939615Smckusick vp->v_specinfo = NULL; 91039433Smckusick } 91139433Smckusick /* 91256932Smckusick * If it is on the freelist and not already at the head, 91365505Smckusick * move it to the head of the list. The test of the back 91465505Smckusick * pointer and the reference count of zero is because 91565505Smckusick * it will be removed from the free list by getnewvnode, 91665505Smckusick * but will not have its reference count incremented until 91765505Smckusick * after calling vgone. If the reference count were 91865505Smckusick * incremented first, vgone would (incorrectly) try to 91965505Smckusick * close the previous instance of the underlying object. 92065505Smckusick * So, the back pointer is explicitly set to `0xdeadb' in 92165505Smckusick * getnewvnode after removing it from the freelist to ensure 92265505Smckusick * that we do not try to move it here. 92339433Smckusick */ 92465505Smckusick if (vp->v_usecount == 0 && 92565505Smckusick vp->v_freelist.tqe_prev != (struct vnode **)0xdeadb && 92665505Smckusick vnode_free_list.tqh_first != vp) { 92765260Smckusick TAILQ_REMOVE(&vnode_free_list, vp, v_freelist); 92865260Smckusick TAILQ_INSERT_HEAD(&vnode_free_list, vp, v_freelist); 92939433Smckusick } 93039484Smckusick vp->v_type = VBAD; 93139433Smckusick } 93239633Smckusick 93339633Smckusick /* 93439821Smckusick * Lookup a vnode by device number. 93539821Smckusick */ 93639821Smckusick vfinddev(dev, type, vpp) 93739821Smckusick dev_t dev; 93839821Smckusick enum vtype type; 93939821Smckusick struct vnode **vpp; 94039821Smckusick { 94139821Smckusick register struct vnode *vp; 94239821Smckusick 94339821Smckusick for (vp = speclisth[SPECHASH(dev)]; vp; vp = vp->v_specnext) { 94439821Smckusick if (dev != vp->v_rdev || type != vp->v_type) 94539821Smckusick continue; 94639821Smckusick *vpp = vp; 94759484Smckusick return (1); 94839821Smckusick } 94959484Smckusick return (0); 95039821Smckusick } 95139821Smckusick 95239821Smckusick /* 95339633Smckusick * Calculate the total number of references to a special device. 95439633Smckusick */ 95539633Smckusick vcount(vp) 95639633Smckusick register struct vnode *vp; 95739633Smckusick { 95839809Smckusick register struct vnode *vq; 95939633Smckusick int count; 96039633Smckusick 96139633Smckusick if ((vp->v_flag & VALIASED) == 0) 96239809Smckusick return (vp->v_usecount); 96339633Smckusick loop: 96439809Smckusick for (count = 0, vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 96540108Smckusick if (vq->v_rdev != vp->v_rdev || vq->v_type != vp->v_type) 96639633Smckusick continue; 96739633Smckusick /* 96839633Smckusick * Alias, but not in use, so flush it out. 96939633Smckusick */ 97039809Smckusick if (vq->v_usecount == 0) { 97139633Smckusick vgone(vq); 97239633Smckusick goto loop; 97339633Smckusick } 97439809Smckusick count += vq->v_usecount; 97539633Smckusick } 97639633Smckusick return (count); 97739633Smckusick } 97839667Smckusick 97939667Smckusick /* 98039667Smckusick * Print out a description of a vnode. 98139667Smckusick */ 98239667Smckusick static char *typename[] = 98340286Smckusick { "VNON", "VREG", "VDIR", "VBLK", "VCHR", "VLNK", "VSOCK", "VFIFO", "VBAD" }; 98439667Smckusick 98539667Smckusick vprint(label, vp) 98639667Smckusick char *label; 98739667Smckusick register struct vnode *vp; 98839667Smckusick { 98939913Smckusick char buf[64]; 99039667Smckusick 99139667Smckusick if (label != NULL) 99239667Smckusick printf("%s: ", label); 99350109Smckusick printf("type %s, usecount %d, writecount %d, refcount %d,", 99450109Smckusick typename[vp->v_type], vp->v_usecount, vp->v_writecount, 99550109Smckusick vp->v_holdcnt); 99639913Smckusick buf[0] = '\0'; 99739913Smckusick if (vp->v_flag & VROOT) 99839913Smckusick strcat(buf, "|VROOT"); 99939913Smckusick if (vp->v_flag & VTEXT) 100039913Smckusick strcat(buf, "|VTEXT"); 100141300Smckusick if (vp->v_flag & VSYSTEM) 100241300Smckusick strcat(buf, "|VSYSTEM"); 100341300Smckusick if (vp->v_flag & VXLOCK) 100441300Smckusick strcat(buf, "|VXLOCK"); 100541300Smckusick if (vp->v_flag & VXWANT) 100641300Smckusick strcat(buf, "|VXWANT"); 100741300Smckusick if (vp->v_flag & VBWAIT) 100841300Smckusick strcat(buf, "|VBWAIT"); 100939913Smckusick if (vp->v_flag & VALIASED) 101039913Smckusick strcat(buf, "|VALIASED"); 101139913Smckusick if (buf[0] != '\0') 101239913Smckusick printf(" flags (%s)", &buf[1]); 101365260Smckusick if (vp->v_data == NULL) { 101465260Smckusick printf("\n"); 101565260Smckusick } else { 101665260Smckusick printf("\n\t"); 101765260Smckusick VOP_PRINT(vp); 101865260Smckusick } 101939667Smckusick } 102041110Smarc 102149691Smckusick #ifdef DEBUG 102249691Smckusick /* 102349691Smckusick * List all of the locked vnodes in the system. 102449691Smckusick * Called when debugging the kernel. 102549691Smckusick */ 102649691Smckusick printlockedvnodes() 102749691Smckusick { 102849691Smckusick register struct mount *mp; 102949691Smckusick register struct vnode *vp; 103049691Smckusick 103149691Smckusick printf("Locked vnodes\n"); 103265260Smckusick for (mp = mountlist.tqh_first; mp != NULL; mp = mp->mnt_list.tqe_next) { 103365260Smckusick for (vp = mp->mnt_vnodelist.lh_first; 103465260Smckusick vp != NULL; 103565260Smckusick vp = vp->v_mntvnodes.le_next) 103649691Smckusick if (VOP_ISLOCKED(vp)) 103749691Smckusick vprint((char *)0, vp); 103865260Smckusick } 103949691Smckusick } 104049691Smckusick #endif 104149691Smckusick 104241110Smarc int kinfo_vdebug = 1; 104341110Smarc int kinfo_vgetfailed; 104441110Smarc #define KINFO_VNODESLOP 10 104541110Smarc /* 104657841Smckusick * Dump vnode list (via sysctl). 104741110Smarc * Copyout address of vnode followed by vnode. 104841110Smarc */ 104945118Smckusick /* ARGSUSED */ 105057841Smckusick sysctl_vnode(where, sizep) 105141110Smarc char *where; 105258465Sbostic size_t *sizep; 105341110Smarc { 105465260Smckusick register struct mount *mp, *nmp; 105541110Smarc struct vnode *vp; 105641110Smarc register char *bp = where, *savebp; 105753818Smckusick char *ewhere; 105841110Smarc int error; 105941110Smarc 106041110Smarc #define VPTRSZ sizeof (struct vnode *) 106141110Smarc #define VNODESZ sizeof (struct vnode) 106241110Smarc if (where == NULL) { 106357841Smckusick *sizep = (numvnodes + KINFO_VNODESLOP) * (VPTRSZ + VNODESZ); 106441110Smarc return (0); 106541110Smarc } 106657841Smckusick ewhere = where + *sizep; 106741110Smarc 106865260Smckusick for (mp = mountlist.tqh_first; mp != NULL; mp = nmp) { 106965260Smckusick nmp = mp->mnt_list.tqe_next; 107065260Smckusick if (vfs_busy(mp)) 107141300Smckusick continue; 107241110Smarc savebp = bp; 107341110Smarc again: 107465260Smckusick for (vp = mp->mnt_vnodelist.lh_first; 107565260Smckusick vp != NULL; 107665260Smckusick vp = vp->v_mntvnodes.le_next) { 107741422Smckusick /* 107841422Smckusick * Check that the vp is still associated with 107941422Smckusick * this filesystem. RACE: could have been 108041422Smckusick * recycled onto the same filesystem. 108141422Smckusick */ 108241421Smckusick if (vp->v_mount != mp) { 108341421Smckusick if (kinfo_vdebug) 108441421Smckusick printf("kinfo: vp changed\n"); 108541421Smckusick bp = savebp; 108641421Smckusick goto again; 108741421Smckusick } 108857841Smckusick if (bp + VPTRSZ + VNODESZ > ewhere) { 108957841Smckusick *sizep = bp - where; 109057841Smckusick return (ENOMEM); 109157841Smckusick } 109257841Smckusick if ((error = copyout((caddr_t)&vp, bp, VPTRSZ)) || 109357841Smckusick (error = copyout((caddr_t)vp, bp + VPTRSZ, VNODESZ))) 109441110Smarc return (error); 109541110Smarc bp += VPTRSZ + VNODESZ; 109641110Smarc } 109765260Smckusick vfs_unbusy(mp); 109865260Smckusick } 109941110Smarc 110057841Smckusick *sizep = bp - where; 110141110Smarc return (0); 110241110Smarc } 110365679Shibler 110465679Shibler /* 110565679Shibler * Check to see if a filesystem is mounted on a block device. 110665679Shibler */ 110765679Shibler int 110865679Shibler vfs_mountedon(vp) 110965679Shibler register struct vnode *vp; 111065679Shibler { 111165679Shibler register struct vnode *vq; 111265679Shibler 111365679Shibler if (vp->v_specflags & SI_MOUNTEDON) 111465679Shibler return (EBUSY); 111565679Shibler if (vp->v_flag & VALIASED) { 111665679Shibler for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 111765679Shibler if (vq->v_rdev != vp->v_rdev || 111865679Shibler vq->v_type != vp->v_type) 111965679Shibler continue; 112065679Shibler if (vq->v_specflags & SI_MOUNTEDON) 112165679Shibler return (EBUSY); 112265679Shibler } 112365679Shibler } 112465679Shibler return (0); 112565679Shibler } 112665679Shibler 112765679Shibler /* 112865679Shibler * Build hash lists of net addresses and hang them off the mount point. 112965679Shibler * Called by ufs_mount() to set up the lists of export addresses. 113065679Shibler */ 113165679Shibler static int 113265679Shibler vfs_hang_addrlist(mp, nep, argp) 113365679Shibler struct mount *mp; 113465679Shibler struct netexport *nep; 113565679Shibler struct export_args *argp; 113665679Shibler { 113765679Shibler register struct netcred *np; 113865679Shibler register struct radix_node_head *rnh; 113965679Shibler register int i; 114065679Shibler struct radix_node *rn; 114165679Shibler struct sockaddr *saddr, *smask = 0; 114265679Shibler struct domain *dom; 114365679Shibler int error; 114465679Shibler 114565679Shibler if (argp->ex_addrlen == 0) { 114665679Shibler if (mp->mnt_flag & MNT_DEFEXPORTED) 114765679Shibler return (EPERM); 114865679Shibler np = &nep->ne_defexported; 114965679Shibler np->netc_exflags = argp->ex_flags; 115065679Shibler np->netc_anon = argp->ex_anon; 115165679Shibler np->netc_anon.cr_ref = 1; 115265679Shibler mp->mnt_flag |= MNT_DEFEXPORTED; 115365679Shibler return (0); 115465679Shibler } 115565679Shibler i = sizeof(struct netcred) + argp->ex_addrlen + argp->ex_masklen; 115665679Shibler np = (struct netcred *)malloc(i, M_NETADDR, M_WAITOK); 115765679Shibler bzero((caddr_t)np, i); 115865679Shibler saddr = (struct sockaddr *)(np + 1); 115965679Shibler if (error = copyin(argp->ex_addr, (caddr_t)saddr, argp->ex_addrlen)) 116065679Shibler goto out; 116165679Shibler if (saddr->sa_len > argp->ex_addrlen) 116265679Shibler saddr->sa_len = argp->ex_addrlen; 116365679Shibler if (argp->ex_masklen) { 116465679Shibler smask = (struct sockaddr *)((caddr_t)saddr + argp->ex_addrlen); 116565679Shibler error = copyin(argp->ex_addr, (caddr_t)smask, argp->ex_masklen); 116665679Shibler if (error) 116765679Shibler goto out; 116865679Shibler if (smask->sa_len > argp->ex_masklen) 116965679Shibler smask->sa_len = argp->ex_masklen; 117065679Shibler } 117165679Shibler i = saddr->sa_family; 117265679Shibler if ((rnh = nep->ne_rtable[i]) == 0) { 117365679Shibler /* 117465679Shibler * Seems silly to initialize every AF when most are not 117565679Shibler * used, do so on demand here 117665679Shibler */ 117765679Shibler for (dom = domains; dom; dom = dom->dom_next) 117865679Shibler if (dom->dom_family == i && dom->dom_rtattach) { 117965679Shibler dom->dom_rtattach((void **)&nep->ne_rtable[i], 118065679Shibler dom->dom_rtoffset); 118165679Shibler break; 118265679Shibler } 118365679Shibler if ((rnh = nep->ne_rtable[i]) == 0) { 118465679Shibler error = ENOBUFS; 118565679Shibler goto out; 118665679Shibler } 118765679Shibler } 118865679Shibler rn = (*rnh->rnh_addaddr)((caddr_t)saddr, (caddr_t)smask, rnh, 118965679Shibler np->netc_rnodes); 119065679Shibler if (rn == 0 || np != (struct netcred *)rn) { /* already exists */ 119165679Shibler error = EPERM; 119265679Shibler goto out; 119365679Shibler } 119465679Shibler np->netc_exflags = argp->ex_flags; 119565679Shibler np->netc_anon = argp->ex_anon; 119665679Shibler np->netc_anon.cr_ref = 1; 119765679Shibler return (0); 119865679Shibler out: 119965679Shibler free(np, M_NETADDR); 120065679Shibler return (error); 120165679Shibler } 120265679Shibler 120365679Shibler /* ARGSUSED */ 120465679Shibler static int 120565679Shibler vfs_free_netcred(rn, w) 120665679Shibler struct radix_node *rn; 120765679Shibler caddr_t w; 120865679Shibler { 120965679Shibler register struct radix_node_head *rnh = (struct radix_node_head *)w; 121065679Shibler 121165679Shibler (*rnh->rnh_deladdr)(rn->rn_key, rn->rn_mask, rnh); 121265679Shibler free((caddr_t)rn, M_NETADDR); 121365679Shibler return (0); 121465679Shibler } 121565679Shibler 121665679Shibler /* 121765679Shibler * Free the net address hash lists that are hanging off the mount points. 121865679Shibler */ 121965679Shibler static void 122065679Shibler vfs_free_addrlist(nep) 122165679Shibler struct netexport *nep; 122265679Shibler { 122365679Shibler register int i; 122465679Shibler register struct radix_node_head *rnh; 122565679Shibler 122665679Shibler for (i = 0; i <= AF_MAX; i++) 122765679Shibler if (rnh = nep->ne_rtable[i]) { 122865679Shibler (*rnh->rnh_walktree)(rnh, vfs_free_netcred, 122965679Shibler (caddr_t)rnh); 123065679Shibler free((caddr_t)rnh, M_RTABLE); 123165679Shibler nep->ne_rtable[i] = 0; 123265679Shibler } 123365679Shibler } 123465679Shibler 123565679Shibler int 123665679Shibler vfs_export(mp, nep, argp) 123765679Shibler struct mount *mp; 123865679Shibler struct netexport *nep; 123965679Shibler struct export_args *argp; 124065679Shibler { 124165679Shibler int error; 124265679Shibler 124365679Shibler if (argp->ex_flags & MNT_DELEXPORT) { 124465679Shibler vfs_free_addrlist(nep); 124565679Shibler mp->mnt_flag &= ~(MNT_EXPORTED | MNT_DEFEXPORTED); 124665679Shibler } 124765679Shibler if (argp->ex_flags & MNT_EXPORTED) { 124865679Shibler if (error = vfs_hang_addrlist(mp, nep, argp)) 124965679Shibler return (error); 125065679Shibler mp->mnt_flag |= MNT_EXPORTED; 125165679Shibler } 125265679Shibler return (0); 125365679Shibler } 125465679Shibler 125565679Shibler struct netcred * 125665679Shibler vfs_export_lookup(mp, nep, nam) 125765679Shibler register struct mount *mp; 125865679Shibler struct netexport *nep; 125965679Shibler struct mbuf *nam; 126065679Shibler { 126165679Shibler register struct netcred *np; 126265679Shibler register struct radix_node_head *rnh; 126365679Shibler struct sockaddr *saddr; 126465679Shibler 126565679Shibler np = NULL; 126665679Shibler if (mp->mnt_flag & MNT_EXPORTED) { 126765679Shibler /* 126865679Shibler * Lookup in the export list first. 126965679Shibler */ 127065679Shibler if (nam != NULL) { 127165679Shibler saddr = mtod(nam, struct sockaddr *); 127265679Shibler rnh = nep->ne_rtable[saddr->sa_family]; 127365679Shibler if (rnh != NULL) { 127465679Shibler np = (struct netcred *) 127565679Shibler (*rnh->rnh_matchaddr)((caddr_t)saddr, 127665679Shibler rnh); 127765679Shibler if (np && np->netc_rnodes->rn_flags & RNF_ROOT) 127865679Shibler np = NULL; 127965679Shibler } 128065679Shibler } 128165679Shibler /* 128265679Shibler * If no address match, use the default if it exists. 128365679Shibler */ 128465679Shibler if (np == NULL && mp->mnt_flag & MNT_DEFEXPORTED) 128565679Shibler np = &nep->ne_defexported; 128665679Shibler } 128765679Shibler return (np); 128865679Shibler } 1289