137488Smckusick /* 263180Sbostic * Copyright (c) 1989, 1993 363180Sbostic * The Regents of the University of California. All rights reserved. 465771Sbostic * (c) UNIX System Laboratories, Inc. 565771Sbostic * All or some portions of this file are derived from material licensed 665771Sbostic * to the University of California by American Telephone and Telegraph 765771Sbostic * Co. or Unix System Laboratories, Inc. and are reproduced herein with 865771Sbostic * the permission of UNIX System Laboratories, Inc. 937488Smckusick * 1044458Sbostic * %sccs.include.redist.c% 1137488Smckusick * 12*68171Scgd * @(#)vfs_subr.c 8.14 (Berkeley) 01/09/95 1337488Smckusick */ 1437488Smckusick 1537488Smckusick /* 1637488Smckusick * External virtual filesystem routines 1737488Smckusick */ 1837488Smckusick 1951460Sbostic #include <sys/param.h> 2053829Spendry #include <sys/systm.h> 2151460Sbostic #include <sys/proc.h> 2251460Sbostic #include <sys/mount.h> 2351460Sbostic #include <sys/time.h> 2451460Sbostic #include <sys/vnode.h> 2552415Smckusick #include <sys/stat.h> 2651460Sbostic #include <sys/namei.h> 2751460Sbostic #include <sys/ucred.h> 2851460Sbostic #include <sys/buf.h> 2951460Sbostic #include <sys/errno.h> 3051460Sbostic #include <sys/malloc.h> 3165679Shibler #include <sys/domain.h> 3265679Shibler #include <sys/mbuf.h> 3337488Smckusick 3460930Smckusick #include <vm/vm.h> 3560930Smckusick #include <sys/sysctl.h> 3660930Smckusick 3755050Spendry #include <miscfs/specfs/specdev.h> 3855050Spendry 3952415Smckusick enum vtype iftovt_tab[16] = { 4052415Smckusick VNON, VFIFO, VCHR, VNON, VDIR, VNON, VBLK, VNON, 4152415Smckusick VREG, VNON, VLNK, VNON, VSOCK, VNON, VNON, VBAD, 4252415Smckusick }; 4352415Smckusick int vttoif_tab[9] = { 4452415Smckusick 0, S_IFREG, S_IFDIR, S_IFBLK, S_IFCHR, S_IFLNK, 4552415Smckusick S_IFSOCK, S_IFIFO, S_IFMT, 4652415Smckusick }; 4752415Smckusick 4837488Smckusick /* 4956608Smckusick * Insq/Remq for the vnode usage lists. 5056608Smckusick */ 5165260Smckusick #define bufinsvn(bp, dp) LIST_INSERT_HEAD(dp, bp, b_vnbufs) 5265260Smckusick #define bufremvn(bp) { \ 5365260Smckusick LIST_REMOVE(bp, b_vnbufs); \ 5465260Smckusick (bp)->b_vnbufs.le_next = NOLIST; \ 5565260Smckusick } 5656608Smckusick 5765260Smckusick TAILQ_HEAD(freelst, vnode) vnode_free_list; /* vnode free list */ 5865260Smckusick struct mntlist mountlist; /* mounted filesystem list */ 5965260Smckusick 6056608Smckusick /* 6165260Smckusick * Initialize the vnode management data structures. 6237488Smckusick */ 6365260Smckusick vntblinit() 6437488Smckusick { 6537488Smckusick 6665260Smckusick TAILQ_INIT(&vnode_free_list); 6765260Smckusick TAILQ_INIT(&mountlist); 6837488Smckusick } 6937488Smckusick 7037488Smckusick /* 7137488Smckusick * Lock a filesystem. 7237488Smckusick * Used to prevent access to it while mounting and unmounting. 7337488Smckusick */ 7437488Smckusick vfs_lock(mp) 7537488Smckusick register struct mount *mp; 7637488Smckusick { 7737488Smckusick 7841400Smckusick while(mp->mnt_flag & MNT_MLOCK) { 7941400Smckusick mp->mnt_flag |= MNT_MWAIT; 8039045Smckusick sleep((caddr_t)mp, PVFS); 8139045Smckusick } 8241400Smckusick mp->mnt_flag |= MNT_MLOCK; 8337488Smckusick return (0); 8437488Smckusick } 8537488Smckusick 8637488Smckusick /* 8737488Smckusick * Unlock a locked filesystem. 8837488Smckusick * Panic if filesystem is not locked. 8937488Smckusick */ 9037488Smckusick void 9137488Smckusick vfs_unlock(mp) 9237488Smckusick register struct mount *mp; 9337488Smckusick { 9437488Smckusick 9541400Smckusick if ((mp->mnt_flag & MNT_MLOCK) == 0) 9641300Smckusick panic("vfs_unlock: not locked"); 9741400Smckusick mp->mnt_flag &= ~MNT_MLOCK; 9841400Smckusick if (mp->mnt_flag & MNT_MWAIT) { 9941400Smckusick mp->mnt_flag &= ~MNT_MWAIT; 10037488Smckusick wakeup((caddr_t)mp); 10137488Smckusick } 10237488Smckusick } 10337488Smckusick 10437488Smckusick /* 10541300Smckusick * Mark a mount point as busy. 10641300Smckusick * Used to synchronize access and to delay unmounting. 10741300Smckusick */ 10841300Smckusick vfs_busy(mp) 10941300Smckusick register struct mount *mp; 11041300Smckusick { 11141300Smckusick 11241400Smckusick while(mp->mnt_flag & MNT_MPBUSY) { 11341400Smckusick mp->mnt_flag |= MNT_MPWANT; 11441400Smckusick sleep((caddr_t)&mp->mnt_flag, PVFS); 11541300Smckusick } 11641419Smckusick if (mp->mnt_flag & MNT_UNMOUNT) 11741419Smckusick return (1); 11841400Smckusick mp->mnt_flag |= MNT_MPBUSY; 11941300Smckusick return (0); 12041300Smckusick } 12141300Smckusick 12241300Smckusick /* 12341300Smckusick * Free a busy filesystem. 12441300Smckusick * Panic if filesystem is not busy. 12541300Smckusick */ 12641300Smckusick vfs_unbusy(mp) 12741300Smckusick register struct mount *mp; 12841300Smckusick { 12941300Smckusick 13041400Smckusick if ((mp->mnt_flag & MNT_MPBUSY) == 0) 13141300Smckusick panic("vfs_unbusy: not busy"); 13241400Smckusick mp->mnt_flag &= ~MNT_MPBUSY; 13341400Smckusick if (mp->mnt_flag & MNT_MPWANT) { 13441400Smckusick mp->mnt_flag &= ~MNT_MPWANT; 13541400Smckusick wakeup((caddr_t)&mp->mnt_flag); 13641300Smckusick } 13741300Smckusick } 13841300Smckusick 13941300Smckusick /* 14037488Smckusick * Lookup a mount point by filesystem identifier. 14137488Smckusick */ 14237488Smckusick struct mount * 14337488Smckusick getvfs(fsid) 14437488Smckusick fsid_t *fsid; 14537488Smckusick { 14637488Smckusick register struct mount *mp; 14737488Smckusick 14865260Smckusick for (mp = mountlist.tqh_first; mp != NULL; mp = mp->mnt_list.tqe_next) { 14941400Smckusick if (mp->mnt_stat.f_fsid.val[0] == fsid->val[0] && 15065260Smckusick mp->mnt_stat.f_fsid.val[1] == fsid->val[1]) 15138288Smckusick return (mp); 15265260Smckusick } 15338288Smckusick return ((struct mount *)0); 15437488Smckusick } 15537488Smckusick 15637488Smckusick /* 15753829Spendry * Get a new unique fsid 15853829Spendry */ 15953829Spendry void 16053829Spendry getnewfsid(mp, mtype) 16153829Spendry struct mount *mp; 16253829Spendry int mtype; 16353829Spendry { 16453829Spendry static u_short xxxfs_mntid; 16553829Spendry 16653829Spendry fsid_t tfsid; 16753829Spendry 16865507Spendry mp->mnt_stat.f_fsid.val[0] = makedev(nblkdev + mtype, 0); 16953829Spendry mp->mnt_stat.f_fsid.val[1] = mtype; 17053829Spendry if (xxxfs_mntid == 0) 17153829Spendry ++xxxfs_mntid; 17265507Spendry tfsid.val[0] = makedev(nblkdev + mtype, xxxfs_mntid); 17353829Spendry tfsid.val[1] = mtype; 17465260Smckusick if (mountlist.tqh_first != NULL) { 17553936Spendry while (getvfs(&tfsid)) { 17653936Spendry tfsid.val[0]++; 17753936Spendry xxxfs_mntid++; 17853936Spendry } 17953829Spendry } 18053829Spendry mp->mnt_stat.f_fsid.val[0] = tfsid.val[0]; 18153829Spendry } 18253829Spendry 18353829Spendry /* 18437488Smckusick * Set vnode attributes to VNOVAL 18537488Smckusick */ 18637488Smckusick void vattr_null(vap) 18737488Smckusick register struct vattr *vap; 18837488Smckusick { 18937488Smckusick 19037488Smckusick vap->va_type = VNON; 19152005Smckusick vap->va_size = vap->va_bytes = VNOVAL; 19237488Smckusick vap->va_mode = vap->va_nlink = vap->va_uid = vap->va_gid = 19352005Smckusick vap->va_fsid = vap->va_fileid = 19452005Smckusick vap->va_blocksize = vap->va_rdev = 19554347Smckusick vap->va_atime.ts_sec = vap->va_atime.ts_nsec = 19654347Smckusick vap->va_mtime.ts_sec = vap->va_mtime.ts_nsec = 19754347Smckusick vap->va_ctime.ts_sec = vap->va_ctime.ts_nsec = 19838258Smckusick vap->va_flags = vap->va_gen = VNOVAL; 19958548Sbostic vap->va_vaflags = 0; 20037488Smckusick } 20138265Smckusick 20238265Smckusick /* 20339397Smckusick * Routines having to do with the management of the vnode table. 20439397Smckusick */ 20553547Sheideman extern int (**dead_vnodeop_p)(); 20639635Smckusick extern void vclean(); 20740883Smckusick long numvnodes; 20853493Sheideman extern struct vattr va_null; 20939397Smckusick 21039397Smckusick /* 21139397Smckusick * Return the next vnode from the free list. 21239397Smckusick */ 21339397Smckusick getnewvnode(tag, mp, vops, vpp) 21439397Smckusick enum vtagtype tag; 21539397Smckusick struct mount *mp; 21653495Sheideman int (**vops)(); 21739397Smckusick struct vnode **vpp; 21839397Smckusick { 21965511Smckusick register struct vnode *vp; 22057042Smargo int s; 22139397Smckusick 22265260Smckusick if ((vnode_free_list.tqh_first == NULL && 22365260Smckusick numvnodes < 2 * desiredvnodes) || 22454347Smckusick numvnodes < desiredvnodes) { 22545118Smckusick vp = (struct vnode *)malloc((u_long)sizeof *vp, 22645118Smckusick M_VNODE, M_WAITOK); 22740883Smckusick bzero((char *)vp, sizeof *vp); 22840883Smckusick numvnodes++; 22940883Smckusick } else { 23065260Smckusick if ((vp = vnode_free_list.tqh_first) == NULL) { 23140883Smckusick tablefull("vnode"); 23240883Smckusick *vpp = 0; 23340883Smckusick return (ENFILE); 23440883Smckusick } 23540883Smckusick if (vp->v_usecount) 23640883Smckusick panic("free vnode isn't"); 23765260Smckusick TAILQ_REMOVE(&vnode_free_list, vp, v_freelist); 23865505Smckusick /* see comment on why 0xdeadb is set at end of vgone (below) */ 23965505Smckusick vp->v_freelist.tqe_prev = (struct vnode **)0xdeadb; 24052190Smckusick vp->v_lease = NULL; 24140883Smckusick if (vp->v_type != VBAD) 24240883Smckusick vgone(vp); 24357042Smargo #ifdef DIAGNOSTIC 24452006Smckusick if (vp->v_data) 24552006Smckusick panic("cleaned vnode isn't"); 24657042Smargo s = splbio(); 24757042Smargo if (vp->v_numoutput) 24857042Smargo panic("Clean vnode has pending I/O's"); 24957042Smargo splx(s); 25057042Smargo #endif 25140883Smckusick vp->v_flag = 0; 25240883Smckusick vp->v_lastr = 0; 25365745Shibler vp->v_ralen = 0; 25465745Shibler vp->v_maxra = 0; 25557042Smargo vp->v_lastw = 0; 25657042Smargo vp->v_lasta = 0; 25757042Smargo vp->v_cstart = 0; 25857042Smargo vp->v_clen = 0; 25940883Smckusick vp->v_socket = 0; 26039397Smckusick } 26139512Smckusick vp->v_type = VNON; 26239397Smckusick cache_purge(vp); 26339397Smckusick vp->v_tag = tag; 26439433Smckusick vp->v_op = vops; 26539397Smckusick insmntque(vp, mp); 26639397Smckusick *vpp = vp; 26765505Smckusick vp->v_usecount = 1; 26865260Smckusick vp->v_data = 0; 26939397Smckusick return (0); 27039397Smckusick } 27165679Shibler 27239397Smckusick /* 27339397Smckusick * Move a vnode from one mount queue to another. 27439397Smckusick */ 27539397Smckusick insmntque(vp, mp) 27639397Smckusick register struct vnode *vp; 27739397Smckusick register struct mount *mp; 27839397Smckusick { 27939397Smckusick 28039397Smckusick /* 28139397Smckusick * Delete from old mount point vnode list, if on one. 28239397Smckusick */ 28365679Shibler if (vp->v_mount != NULL) 28465260Smckusick LIST_REMOVE(vp, v_mntvnodes); 28539397Smckusick /* 28639397Smckusick * Insert into list of vnodes for the new mount point, if available. 28739397Smckusick */ 28865260Smckusick if ((vp->v_mount = mp) == NULL) 28939397Smckusick return; 29065260Smckusick LIST_INSERT_HEAD(&mp->mnt_vnodelist, vp, v_mntvnodes); 29139397Smckusick } 29239397Smckusick 29339397Smckusick /* 29449232Smckusick * Update outstanding I/O count and do wakeup if requested. 29549232Smckusick */ 29649232Smckusick vwakeup(bp) 29749232Smckusick register struct buf *bp; 29849232Smckusick { 29949232Smckusick register struct vnode *vp; 30049232Smckusick 30157810Smckusick bp->b_flags &= ~B_WRITEINPROG; 30249232Smckusick if (vp = bp->b_vp) { 30349232Smckusick vp->v_numoutput--; 30457042Smargo if (vp->v_numoutput < 0) 30557042Smargo panic("vwakeup: neg numoutput"); 30649232Smckusick if ((vp->v_flag & VBWAIT) && vp->v_numoutput <= 0) { 30749232Smckusick if (vp->v_numoutput < 0) 30849232Smckusick panic("vwakeup: neg numoutput"); 30949232Smckusick vp->v_flag &= ~VBWAIT; 31049232Smckusick wakeup((caddr_t)&vp->v_numoutput); 31149232Smckusick } 31249232Smckusick } 31349232Smckusick } 31449232Smckusick 31549232Smckusick /* 31649232Smckusick * Flush out and invalidate all buffers associated with a vnode. 31749232Smckusick * Called with the underlying object locked. 31849232Smckusick */ 31954442Smckusick int 32057792Smckusick vinvalbuf(vp, flags, cred, p, slpflag, slptimeo) 32149232Smckusick register struct vnode *vp; 32256459Smargo int flags; 32354442Smckusick struct ucred *cred; 32454442Smckusick struct proc *p; 32557792Smckusick int slpflag, slptimeo; 32649232Smckusick { 32749232Smckusick register struct buf *bp; 32849232Smckusick struct buf *nbp, *blist; 32954442Smckusick int s, error; 33049232Smckusick 33156459Smargo if (flags & V_SAVE) { 33254442Smckusick if (error = VOP_FSYNC(vp, cred, MNT_WAIT, p)) 33354442Smckusick return (error); 33465260Smckusick if (vp->v_dirtyblkhd.lh_first != NULL) 33554442Smckusick panic("vinvalbuf: dirty bufs"); 33654442Smckusick } 33749232Smckusick for (;;) { 33865260Smckusick if ((blist = vp->v_cleanblkhd.lh_first) && flags & V_SAVEMETA) 33956459Smargo while (blist && blist->b_lblkno < 0) 34065260Smckusick blist = blist->b_vnbufs.le_next; 34165260Smckusick if (!blist && (blist = vp->v_dirtyblkhd.lh_first) && 34256608Smckusick (flags & V_SAVEMETA)) 34356459Smargo while (blist && blist->b_lblkno < 0) 34465260Smckusick blist = blist->b_vnbufs.le_next; 34556459Smargo if (!blist) 34649232Smckusick break; 34756459Smargo 34849232Smckusick for (bp = blist; bp; bp = nbp) { 34965260Smckusick nbp = bp->b_vnbufs.le_next; 35056459Smargo if (flags & V_SAVEMETA && bp->b_lblkno < 0) 35156459Smargo continue; 35249232Smckusick s = splbio(); 35349232Smckusick if (bp->b_flags & B_BUSY) { 35449232Smckusick bp->b_flags |= B_WANTED; 35557792Smckusick error = tsleep((caddr_t)bp, 35657792Smckusick slpflag | (PRIBIO + 1), "vinvalbuf", 35757792Smckusick slptimeo); 35849232Smckusick splx(s); 35957792Smckusick if (error) 36057792Smckusick return (error); 36149232Smckusick break; 36249232Smckusick } 36349232Smckusick bremfree(bp); 36449232Smckusick bp->b_flags |= B_BUSY; 36549232Smckusick splx(s); 36657792Smckusick /* 36757792Smckusick * XXX Since there are no node locks for NFS, I believe 36857792Smckusick * there is a slight chance that a delayed write will 36957792Smckusick * occur while sleeping just above, so check for it. 37057792Smckusick */ 37157792Smckusick if ((bp->b_flags & B_DELWRI) && (flags & V_SAVE)) { 37257792Smckusick (void) VOP_BWRITE(bp); 37357792Smckusick break; 37457792Smckusick } 37556459Smargo bp->b_flags |= B_INVAL; 37649232Smckusick brelse(bp); 37749232Smckusick } 37849232Smckusick } 37956608Smckusick if (!(flags & V_SAVEMETA) && 38065260Smckusick (vp->v_dirtyblkhd.lh_first || vp->v_cleanblkhd.lh_first)) 38149232Smckusick panic("vinvalbuf: flush failed"); 38254442Smckusick return (0); 38349232Smckusick } 38449232Smckusick 38549232Smckusick /* 38649232Smckusick * Associate a buffer with a vnode. 38749232Smckusick */ 38849232Smckusick bgetvp(vp, bp) 38949232Smckusick register struct vnode *vp; 39049232Smckusick register struct buf *bp; 39149232Smckusick { 39249232Smckusick 39349232Smckusick if (bp->b_vp) 39449232Smckusick panic("bgetvp: not free"); 39549232Smckusick VHOLD(vp); 39649232Smckusick bp->b_vp = vp; 39749232Smckusick if (vp->v_type == VBLK || vp->v_type == VCHR) 39849232Smckusick bp->b_dev = vp->v_rdev; 39949232Smckusick else 40049232Smckusick bp->b_dev = NODEV; 40149232Smckusick /* 40249232Smckusick * Insert onto list for new vnode. 40349232Smckusick */ 40456608Smckusick bufinsvn(bp, &vp->v_cleanblkhd); 40549232Smckusick } 40649232Smckusick 40749232Smckusick /* 40849232Smckusick * Disassociate a buffer from a vnode. 40949232Smckusick */ 41049232Smckusick brelvp(bp) 41149232Smckusick register struct buf *bp; 41249232Smckusick { 41349232Smckusick struct vnode *vp; 41449232Smckusick 41549232Smckusick if (bp->b_vp == (struct vnode *) 0) 41649232Smckusick panic("brelvp: NULL"); 41749232Smckusick /* 41849232Smckusick * Delete from old vnode list, if on one. 41949232Smckusick */ 42065260Smckusick if (bp->b_vnbufs.le_next != NOLIST) 42156608Smckusick bufremvn(bp); 42249232Smckusick vp = bp->b_vp; 42349232Smckusick bp->b_vp = (struct vnode *) 0; 42449232Smckusick HOLDRELE(vp); 42549232Smckusick } 42649232Smckusick 42749232Smckusick /* 42849232Smckusick * Reassign a buffer from one vnode to another. 42949232Smckusick * Used to assign file specific control information 43049232Smckusick * (indirect blocks) to the vnode to which they belong. 43149232Smckusick */ 43249232Smckusick reassignbuf(bp, newvp) 43349232Smckusick register struct buf *bp; 43449232Smckusick register struct vnode *newvp; 43549232Smckusick { 43665260Smckusick register struct buflists *listheadp; 43749232Smckusick 43852655Smckusick if (newvp == NULL) { 43952655Smckusick printf("reassignbuf: NULL"); 44052655Smckusick return; 44152655Smckusick } 44249232Smckusick /* 44349232Smckusick * Delete from old vnode list, if on one. 44449232Smckusick */ 44565260Smckusick if (bp->b_vnbufs.le_next != NOLIST) 44656608Smckusick bufremvn(bp); 44749232Smckusick /* 44849232Smckusick * If dirty, put on list of dirty buffers; 44949232Smckusick * otherwise insert onto list of clean buffers. 45049232Smckusick */ 45149232Smckusick if (bp->b_flags & B_DELWRI) 45249232Smckusick listheadp = &newvp->v_dirtyblkhd; 45349232Smckusick else 45449232Smckusick listheadp = &newvp->v_cleanblkhd; 45556608Smckusick bufinsvn(bp, listheadp); 45649232Smckusick } 45749232Smckusick 45849232Smckusick /* 45939433Smckusick * Create a vnode for a block device. 46039433Smckusick * Used for root filesystem, argdev, and swap areas. 46139433Smckusick * Also used for memory file system special devices. 46239397Smckusick */ 46339433Smckusick bdevvp(dev, vpp) 46439433Smckusick dev_t dev; 46539433Smckusick struct vnode **vpp; 46639433Smckusick { 46739433Smckusick register struct vnode *vp; 46839433Smckusick struct vnode *nvp; 46939433Smckusick int error; 47039433Smckusick 47146989Smckusick if (dev == NODEV) 47246989Smckusick return (0); 47353547Sheideman error = getnewvnode(VT_NON, (struct mount *)0, spec_vnodeop_p, &nvp); 47439433Smckusick if (error) { 47539433Smckusick *vpp = 0; 47639433Smckusick return (error); 47739433Smckusick } 47839433Smckusick vp = nvp; 47939433Smckusick vp->v_type = VBLK; 48039615Smckusick if (nvp = checkalias(vp, dev, (struct mount *)0)) { 48139433Smckusick vput(vp); 48239433Smckusick vp = nvp; 48339433Smckusick } 48439433Smckusick *vpp = vp; 48539433Smckusick return (0); 48639433Smckusick } 48739433Smckusick 48839433Smckusick /* 48939433Smckusick * Check to see if the new vnode represents a special device 49039433Smckusick * for which we already have a vnode (either because of 49139433Smckusick * bdevvp() or because of a different vnode representing 49239433Smckusick * the same block device). If such an alias exists, deallocate 49339509Smckusick * the existing contents and return the aliased vnode. The 49439433Smckusick * caller is responsible for filling it with its new contents. 49539433Smckusick */ 49639433Smckusick struct vnode * 49739615Smckusick checkalias(nvp, nvp_rdev, mp) 49839433Smckusick register struct vnode *nvp; 49939615Smckusick dev_t nvp_rdev; 50039433Smckusick struct mount *mp; 50139433Smckusick { 50239433Smckusick register struct vnode *vp; 50339615Smckusick struct vnode **vpp; 50439433Smckusick 50539433Smckusick if (nvp->v_type != VBLK && nvp->v_type != VCHR) 50641400Smckusick return (NULLVP); 50739615Smckusick 50839615Smckusick vpp = &speclisth[SPECHASH(nvp_rdev)]; 50939433Smckusick loop: 51039615Smckusick for (vp = *vpp; vp; vp = vp->v_specnext) { 51139615Smckusick if (nvp_rdev != vp->v_rdev || nvp->v_type != vp->v_type) 51239433Smckusick continue; 51339615Smckusick /* 51439615Smckusick * Alias, but not in use, so flush it out. 51539615Smckusick */ 51639809Smckusick if (vp->v_usecount == 0) { 51739615Smckusick vgone(vp); 51839615Smckusick goto loop; 51939615Smckusick } 52065260Smckusick if (vget(vp, 1)) 52139633Smckusick goto loop; 52239433Smckusick break; 52339433Smckusick } 52439615Smckusick if (vp == NULL || vp->v_tag != VT_NON) { 52539615Smckusick MALLOC(nvp->v_specinfo, struct specinfo *, 52639615Smckusick sizeof(struct specinfo), M_VNODE, M_WAITOK); 52739615Smckusick nvp->v_rdev = nvp_rdev; 52839809Smckusick nvp->v_hashchain = vpp; 52939615Smckusick nvp->v_specnext = *vpp; 53042152Smckusick nvp->v_specflags = 0; 53139615Smckusick *vpp = nvp; 53240640Smckusick if (vp != NULL) { 53340640Smckusick nvp->v_flag |= VALIASED; 53440640Smckusick vp->v_flag |= VALIASED; 53540640Smckusick vput(vp); 53640640Smckusick } 53741400Smckusick return (NULLVP); 53839433Smckusick } 53939484Smckusick VOP_UNLOCK(vp); 54039484Smckusick vclean(vp, 0); 54139433Smckusick vp->v_op = nvp->v_op; 54239433Smckusick vp->v_tag = nvp->v_tag; 54339433Smckusick nvp->v_type = VNON; 54439433Smckusick insmntque(vp, mp); 54539433Smckusick return (vp); 54639433Smckusick } 54739433Smckusick 54839433Smckusick /* 54939433Smckusick * Grab a particular vnode from the free list, increment its 55039433Smckusick * reference count and lock it. The vnode lock bit is set the 55139433Smckusick * vnode is being eliminated in vgone. The process is awakened 55239433Smckusick * when the transition is completed, and an error returned to 55339433Smckusick * indicate that the vnode is no longer usable (possibly having 55439433Smckusick * been changed to a new file system type). 55539433Smckusick */ 55665260Smckusick vget(vp, lockflag) 55739397Smckusick register struct vnode *vp; 55865260Smckusick int lockflag; 55939397Smckusick { 56039397Smckusick 56166897Smckusick /* 56266897Smckusick * If the vnode is in the process of being cleaned out for 56366897Smckusick * another use, we wait for the cleaning to finish and then 56466897Smckusick * return failure. Cleaning is determined either by checking 56566897Smckusick * that the VXLOCK flag is set, or that the use count is 56666897Smckusick * zero with the back pointer set to show that it has been 56766897Smckusick * removed from the free list by getnewvnode. The VXLOCK 56866897Smckusick * flag may not have been set yet because vclean is blocked in 56966897Smckusick * the VOP_LOCK call waiting for the VOP_INACTIVE to complete. 57066897Smckusick */ 57166897Smckusick if ((vp->v_flag & VXLOCK) || 57266897Smckusick (vp->v_usecount == 0 && 57366897Smckusick vp->v_freelist.tqe_prev == (struct vnode **)0xdeadb)) { 57439433Smckusick vp->v_flag |= VXWANT; 57539433Smckusick sleep((caddr_t)vp, PINOD); 57639433Smckusick return (1); 57739433Smckusick } 57866897Smckusick if (vp->v_usecount == 0) 57965260Smckusick TAILQ_REMOVE(&vnode_free_list, vp, v_freelist); 58059450Smckusick vp->v_usecount++; 58165260Smckusick if (lockflag) 58265260Smckusick VOP_LOCK(vp); 58339433Smckusick return (0); 58439397Smckusick } 58539397Smckusick 58639397Smckusick /* 58739397Smckusick * Vnode reference, just increment the count 58839397Smckusick */ 58939397Smckusick void vref(vp) 59039397Smckusick struct vnode *vp; 59139397Smckusick { 59239397Smckusick 59359450Smckusick if (vp->v_usecount <= 0) 59459450Smckusick panic("vref used where vget required"); 59539809Smckusick vp->v_usecount++; 59639397Smckusick } 59739397Smckusick 59839397Smckusick /* 59939397Smckusick * vput(), just unlock and vrele() 60039397Smckusick */ 60139397Smckusick void vput(vp) 60239397Smckusick register struct vnode *vp; 60339397Smckusick { 60452416Storek 60539397Smckusick VOP_UNLOCK(vp); 60639397Smckusick vrele(vp); 60739397Smckusick } 60839397Smckusick 60939397Smckusick /* 61039397Smckusick * Vnode release. 61139397Smckusick * If count drops to zero, call inactive routine and return to freelist. 61239397Smckusick */ 61339397Smckusick void vrele(vp) 61439397Smckusick register struct vnode *vp; 61539397Smckusick { 61639397Smckusick 61750109Smckusick #ifdef DIAGNOSTIC 61839397Smckusick if (vp == NULL) 61939433Smckusick panic("vrele: null vp"); 62050109Smckusick #endif 62139809Smckusick vp->v_usecount--; 62239809Smckusick if (vp->v_usecount > 0) 62339397Smckusick return; 62450109Smckusick #ifdef DIAGNOSTIC 62550109Smckusick if (vp->v_usecount != 0 || vp->v_writecount != 0) { 62650109Smckusick vprint("vrele: bad ref count", vp); 62750109Smckusick panic("vrele: ref cnt"); 62850109Smckusick } 62950109Smckusick #endif 63055468Smckusick /* 63155468Smckusick * insert at tail of LRU list 63255468Smckusick */ 63365260Smckusick TAILQ_INSERT_TAIL(&vnode_free_list, vp, v_freelist); 63454442Smckusick VOP_INACTIVE(vp); 63539397Smckusick } 63639433Smckusick 63739433Smckusick /* 63839809Smckusick * Page or buffer structure gets a reference. 63939809Smckusick */ 64053312Smckusick void vhold(vp) 64139809Smckusick register struct vnode *vp; 64239809Smckusick { 64339809Smckusick 64439809Smckusick vp->v_holdcnt++; 64539809Smckusick } 64639809Smckusick 64739809Smckusick /* 64839809Smckusick * Page or buffer structure frees a reference. 64939809Smckusick */ 65053312Smckusick void holdrele(vp) 65139809Smckusick register struct vnode *vp; 65239809Smckusick { 65339809Smckusick 65439809Smckusick if (vp->v_holdcnt <= 0) 65539809Smckusick panic("holdrele: holdcnt"); 65639809Smckusick vp->v_holdcnt--; 65739809Smckusick } 65839809Smckusick 65939809Smckusick /* 66039509Smckusick * Remove any vnodes in the vnode table belonging to mount point mp. 66139509Smckusick * 66239509Smckusick * If MNT_NOFORCE is specified, there should not be any active ones, 66339509Smckusick * return error if any are found (nb: this is a user error, not a 66439509Smckusick * system error). If MNT_FORCE is specified, detach any active vnodes 66539509Smckusick * that are found. 66639509Smckusick */ 66765679Shibler #ifdef DIAGNOSTIC 66860930Smckusick int busyprt = 0; /* print out busy vnodes */ 66960930Smckusick struct ctldebug debug1 = { "busyprt", &busyprt }; 67065679Shibler #endif 67139509Smckusick 67239509Smckusick vflush(mp, skipvp, flags) 67339509Smckusick struct mount *mp; 67439509Smckusick struct vnode *skipvp; 67539509Smckusick int flags; 67639509Smckusick { 67739509Smckusick register struct vnode *vp, *nvp; 67839509Smckusick int busy = 0; 67939509Smckusick 68041400Smckusick if ((mp->mnt_flag & MNT_MPBUSY) == 0) 68141300Smckusick panic("vflush: not busy"); 68241421Smckusick loop: 68365260Smckusick for (vp = mp->mnt_vnodelist.lh_first; vp; vp = nvp) { 68441421Smckusick if (vp->v_mount != mp) 68541421Smckusick goto loop; 68665260Smckusick nvp = vp->v_mntvnodes.le_next; 68739509Smckusick /* 68839509Smckusick * Skip over a selected vnode. 68939509Smckusick */ 69039509Smckusick if (vp == skipvp) 69139509Smckusick continue; 69239509Smckusick /* 69341300Smckusick * Skip over a vnodes marked VSYSTEM. 69441300Smckusick */ 69541300Smckusick if ((flags & SKIPSYSTEM) && (vp->v_flag & VSYSTEM)) 69641300Smckusick continue; 69741300Smckusick /* 69857040Smckusick * If WRITECLOSE is set, only flush out regular file 69957040Smckusick * vnodes open for writing. 70057040Smckusick */ 70157040Smckusick if ((flags & WRITECLOSE) && 70257040Smckusick (vp->v_writecount == 0 || vp->v_type != VREG)) 70357040Smckusick continue; 70457040Smckusick /* 70539809Smckusick * With v_usecount == 0, all we need to do is clear 70639509Smckusick * out the vnode data structures and we are done. 70739509Smckusick */ 70839809Smckusick if (vp->v_usecount == 0) { 70939509Smckusick vgone(vp); 71039509Smckusick continue; 71139509Smckusick } 71239509Smckusick /* 71357040Smckusick * If FORCECLOSE is set, forcibly close the vnode. 71439509Smckusick * For block or character devices, revert to an 71539509Smckusick * anonymous device. For all other files, just kill them. 71639509Smckusick */ 71741300Smckusick if (flags & FORCECLOSE) { 71839509Smckusick if (vp->v_type != VBLK && vp->v_type != VCHR) { 71939509Smckusick vgone(vp); 72039509Smckusick } else { 72139509Smckusick vclean(vp, 0); 72253547Sheideman vp->v_op = spec_vnodeop_p; 72339509Smckusick insmntque(vp, (struct mount *)0); 72439509Smckusick } 72539509Smckusick continue; 72639509Smckusick } 72765679Shibler #ifdef DIAGNOSTIC 72839509Smckusick if (busyprt) 72939667Smckusick vprint("vflush: busy vnode", vp); 73065679Shibler #endif 73139509Smckusick busy++; 73239509Smckusick } 73339509Smckusick if (busy) 73439509Smckusick return (EBUSY); 73539509Smckusick return (0); 73639509Smckusick } 73739509Smckusick 73839509Smckusick /* 73939433Smckusick * Disassociate the underlying file system from a vnode. 74039433Smckusick */ 74154347Smckusick void 74254347Smckusick vclean(vp, flags) 74339433Smckusick register struct vnode *vp; 74445118Smckusick int flags; 74539433Smckusick { 74639484Smckusick int active; 74739433Smckusick 74839484Smckusick /* 74939484Smckusick * Check to see if the vnode is in use. 75039667Smckusick * If so we have to reference it before we clean it out 75139667Smckusick * so that its count cannot fall to zero and generate a 75239667Smckusick * race against ourselves to recycle it. 75339484Smckusick */ 75439809Smckusick if (active = vp->v_usecount) 75539484Smckusick VREF(vp); 75639484Smckusick /* 75756805Smckusick * Even if the count is zero, the VOP_INACTIVE routine may still 75856805Smckusick * have the object locked while it cleans it out. The VOP_LOCK 75956805Smckusick * ensures that the VOP_INACTIVE routine is done with its work. 76056805Smckusick * For active vnodes, it ensures that no other activity can 76156805Smckusick * occur while the underlying object is being cleaned out. 76256805Smckusick */ 76356805Smckusick VOP_LOCK(vp); 76456805Smckusick /* 76539484Smckusick * Prevent the vnode from being recycled or 76639484Smckusick * brought into use while we clean it out. 76739484Smckusick */ 76839667Smckusick if (vp->v_flag & VXLOCK) 76939667Smckusick panic("vclean: deadlock"); 77039433Smckusick vp->v_flag |= VXLOCK; 77139433Smckusick /* 77256805Smckusick * Clean out any buffers associated with the vnode. 77339667Smckusick */ 77441300Smckusick if (flags & DOCLOSE) 77557792Smckusick vinvalbuf(vp, V_SAVE, NOCRED, NULL, 0, 0); 77639667Smckusick /* 77756805Smckusick * Any other processes trying to obtain this lock must first 77856805Smckusick * wait for VXLOCK to clear, then call the new lock operation. 77939433Smckusick */ 78056805Smckusick VOP_UNLOCK(vp); 78139433Smckusick /* 78256805Smckusick * If purging an active vnode, it must be closed and 78356805Smckusick * deactivated before being reclaimed. 78439433Smckusick */ 78539484Smckusick if (active) { 78656805Smckusick if (flags & DOCLOSE) 78756805Smckusick VOP_CLOSE(vp, IO_NDELAY, NOCRED, NULL); 78856805Smckusick VOP_INACTIVE(vp); 78939433Smckusick } 79039433Smckusick /* 79139433Smckusick * Reclaim the vnode. 79239433Smckusick */ 79356805Smckusick if (VOP_RECLAIM(vp)) 79439433Smckusick panic("vclean: cannot reclaim"); 79539484Smckusick if (active) 79639484Smckusick vrele(vp); 79753580Sheideman 79839433Smckusick /* 79956805Smckusick * Done with purge, notify sleepers of the grim news. 80039433Smckusick */ 80156805Smckusick vp->v_op = dead_vnodeop_p; 80256805Smckusick vp->v_tag = VT_NON; 80339433Smckusick vp->v_flag &= ~VXLOCK; 80439433Smckusick if (vp->v_flag & VXWANT) { 80539433Smckusick vp->v_flag &= ~VXWANT; 80639433Smckusick wakeup((caddr_t)vp); 80739433Smckusick } 80839433Smckusick } 80939433Smckusick 81039433Smckusick /* 81139633Smckusick * Eliminate all activity associated with the requested vnode 81239633Smckusick * and with all vnodes aliased to the requested vnode. 81339633Smckusick */ 81439633Smckusick void vgoneall(vp) 81539633Smckusick register struct vnode *vp; 81639633Smckusick { 81739809Smckusick register struct vnode *vq; 81839633Smckusick 81940665Smckusick if (vp->v_flag & VALIASED) { 82040665Smckusick /* 82140665Smckusick * If a vgone (or vclean) is already in progress, 82240665Smckusick * wait until it is done and return. 82340665Smckusick */ 82440665Smckusick if (vp->v_flag & VXLOCK) { 82540665Smckusick vp->v_flag |= VXWANT; 82640665Smckusick sleep((caddr_t)vp, PINOD); 82740665Smckusick return; 82839633Smckusick } 82940665Smckusick /* 83040665Smckusick * Ensure that vp will not be vgone'd while we 83140665Smckusick * are eliminating its aliases. 83240665Smckusick */ 83340665Smckusick vp->v_flag |= VXLOCK; 83440665Smckusick while (vp->v_flag & VALIASED) { 83540665Smckusick for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 83640665Smckusick if (vq->v_rdev != vp->v_rdev || 83740665Smckusick vq->v_type != vp->v_type || vp == vq) 83840665Smckusick continue; 83940665Smckusick vgone(vq); 84040665Smckusick break; 84140665Smckusick } 84240665Smckusick } 84340665Smckusick /* 84440665Smckusick * Remove the lock so that vgone below will 84540665Smckusick * really eliminate the vnode after which time 84640665Smckusick * vgone will awaken any sleepers. 84740665Smckusick */ 84840665Smckusick vp->v_flag &= ~VXLOCK; 84939633Smckusick } 85039633Smckusick vgone(vp); 85139633Smckusick } 85239633Smckusick 85339633Smckusick /* 85439433Smckusick * Eliminate all activity associated with a vnode 85539433Smckusick * in preparation for reuse. 85639433Smckusick */ 85739433Smckusick void vgone(vp) 85839433Smckusick register struct vnode *vp; 85939433Smckusick { 86039809Smckusick register struct vnode *vq; 86139615Smckusick struct vnode *vx; 86239433Smckusick 86339433Smckusick /* 86440548Smckusick * If a vgone (or vclean) is already in progress, 86540548Smckusick * wait until it is done and return. 86640548Smckusick */ 86740548Smckusick if (vp->v_flag & VXLOCK) { 86840548Smckusick vp->v_flag |= VXWANT; 86940548Smckusick sleep((caddr_t)vp, PINOD); 87040548Smckusick return; 87140548Smckusick } 87240548Smckusick /* 87339433Smckusick * Clean out the filesystem specific data. 87439433Smckusick */ 87541300Smckusick vclean(vp, DOCLOSE); 87639433Smckusick /* 87739433Smckusick * Delete from old mount point vnode list, if on one. 87839433Smckusick */ 87965260Smckusick if (vp->v_mount != NULL) { 88065260Smckusick LIST_REMOVE(vp, v_mntvnodes); 88152311Smckusick vp->v_mount = NULL; 88239433Smckusick } 88339433Smckusick /* 88439433Smckusick * If special device, remove it from special device alias list. 88539433Smckusick */ 88639433Smckusick if (vp->v_type == VBLK || vp->v_type == VCHR) { 88739809Smckusick if (*vp->v_hashchain == vp) { 88839809Smckusick *vp->v_hashchain = vp->v_specnext; 88939433Smckusick } else { 89039809Smckusick for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 89139615Smckusick if (vq->v_specnext != vp) 89239433Smckusick continue; 89339615Smckusick vq->v_specnext = vp->v_specnext; 89439433Smckusick break; 89539433Smckusick } 89639615Smckusick if (vq == NULL) 89739433Smckusick panic("missing bdev"); 89839433Smckusick } 89939615Smckusick if (vp->v_flag & VALIASED) { 90052416Storek vx = NULL; 90139809Smckusick for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 90240108Smckusick if (vq->v_rdev != vp->v_rdev || 90340108Smckusick vq->v_type != vp->v_type) 90439615Smckusick continue; 90552416Storek if (vx) 90652416Storek break; 90739615Smckusick vx = vq; 90839615Smckusick } 90952416Storek if (vx == NULL) 91039615Smckusick panic("missing alias"); 91152416Storek if (vq == NULL) 91239615Smckusick vx->v_flag &= ~VALIASED; 91339615Smckusick vp->v_flag &= ~VALIASED; 91439615Smckusick } 91539615Smckusick FREE(vp->v_specinfo, M_VNODE); 91639615Smckusick vp->v_specinfo = NULL; 91739433Smckusick } 91839433Smckusick /* 91956932Smckusick * If it is on the freelist and not already at the head, 92065505Smckusick * move it to the head of the list. The test of the back 92165505Smckusick * pointer and the reference count of zero is because 92265505Smckusick * it will be removed from the free list by getnewvnode, 92365505Smckusick * but will not have its reference count incremented until 92465505Smckusick * after calling vgone. If the reference count were 92565505Smckusick * incremented first, vgone would (incorrectly) try to 92665505Smckusick * close the previous instance of the underlying object. 92765505Smckusick * So, the back pointer is explicitly set to `0xdeadb' in 92865505Smckusick * getnewvnode after removing it from the freelist to ensure 92965505Smckusick * that we do not try to move it here. 93039433Smckusick */ 93165505Smckusick if (vp->v_usecount == 0 && 93265505Smckusick vp->v_freelist.tqe_prev != (struct vnode **)0xdeadb && 93365505Smckusick vnode_free_list.tqh_first != vp) { 93465260Smckusick TAILQ_REMOVE(&vnode_free_list, vp, v_freelist); 93565260Smckusick TAILQ_INSERT_HEAD(&vnode_free_list, vp, v_freelist); 93639433Smckusick } 93739484Smckusick vp->v_type = VBAD; 93839433Smckusick } 93939633Smckusick 94039633Smckusick /* 94139821Smckusick * Lookup a vnode by device number. 94239821Smckusick */ 94339821Smckusick vfinddev(dev, type, vpp) 94439821Smckusick dev_t dev; 94539821Smckusick enum vtype type; 94639821Smckusick struct vnode **vpp; 94739821Smckusick { 94839821Smckusick register struct vnode *vp; 94939821Smckusick 95039821Smckusick for (vp = speclisth[SPECHASH(dev)]; vp; vp = vp->v_specnext) { 95139821Smckusick if (dev != vp->v_rdev || type != vp->v_type) 95239821Smckusick continue; 95339821Smckusick *vpp = vp; 95459484Smckusick return (1); 95539821Smckusick } 95659484Smckusick return (0); 95739821Smckusick } 95839821Smckusick 95939821Smckusick /* 96039633Smckusick * Calculate the total number of references to a special device. 96139633Smckusick */ 96239633Smckusick vcount(vp) 96339633Smckusick register struct vnode *vp; 96439633Smckusick { 96566742Smckusick register struct vnode *vq, *vnext; 96639633Smckusick int count; 96739633Smckusick 96866742Smckusick loop: 96939633Smckusick if ((vp->v_flag & VALIASED) == 0) 97039809Smckusick return (vp->v_usecount); 97166742Smckusick for (count = 0, vq = *vp->v_hashchain; vq; vq = vnext) { 97266742Smckusick vnext = vq->v_specnext; 97340108Smckusick if (vq->v_rdev != vp->v_rdev || vq->v_type != vp->v_type) 97439633Smckusick continue; 97539633Smckusick /* 97639633Smckusick * Alias, but not in use, so flush it out. 97739633Smckusick */ 97866742Smckusick if (vq->v_usecount == 0 && vq != vp) { 97939633Smckusick vgone(vq); 98039633Smckusick goto loop; 98139633Smckusick } 98239809Smckusick count += vq->v_usecount; 98339633Smckusick } 98439633Smckusick return (count); 98539633Smckusick } 98639667Smckusick 98739667Smckusick /* 98839667Smckusick * Print out a description of a vnode. 98939667Smckusick */ 99039667Smckusick static char *typename[] = 99140286Smckusick { "VNON", "VREG", "VDIR", "VBLK", "VCHR", "VLNK", "VSOCK", "VFIFO", "VBAD" }; 99239667Smckusick 993*68171Scgd void 99439667Smckusick vprint(label, vp) 99539667Smckusick char *label; 99639667Smckusick register struct vnode *vp; 99739667Smckusick { 99839913Smckusick char buf[64]; 99939667Smckusick 100039667Smckusick if (label != NULL) 100139667Smckusick printf("%s: ", label); 100250109Smckusick printf("type %s, usecount %d, writecount %d, refcount %d,", 100350109Smckusick typename[vp->v_type], vp->v_usecount, vp->v_writecount, 100450109Smckusick vp->v_holdcnt); 100539913Smckusick buf[0] = '\0'; 100639913Smckusick if (vp->v_flag & VROOT) 100739913Smckusick strcat(buf, "|VROOT"); 100839913Smckusick if (vp->v_flag & VTEXT) 100939913Smckusick strcat(buf, "|VTEXT"); 101041300Smckusick if (vp->v_flag & VSYSTEM) 101141300Smckusick strcat(buf, "|VSYSTEM"); 101241300Smckusick if (vp->v_flag & VXLOCK) 101341300Smckusick strcat(buf, "|VXLOCK"); 101441300Smckusick if (vp->v_flag & VXWANT) 101541300Smckusick strcat(buf, "|VXWANT"); 101641300Smckusick if (vp->v_flag & VBWAIT) 101741300Smckusick strcat(buf, "|VBWAIT"); 101839913Smckusick if (vp->v_flag & VALIASED) 101939913Smckusick strcat(buf, "|VALIASED"); 102039913Smckusick if (buf[0] != '\0') 102139913Smckusick printf(" flags (%s)", &buf[1]); 102265260Smckusick if (vp->v_data == NULL) { 102365260Smckusick printf("\n"); 102465260Smckusick } else { 102565260Smckusick printf("\n\t"); 102665260Smckusick VOP_PRINT(vp); 102765260Smckusick } 102839667Smckusick } 102941110Smarc 103049691Smckusick #ifdef DEBUG 103149691Smckusick /* 103249691Smckusick * List all of the locked vnodes in the system. 103349691Smckusick * Called when debugging the kernel. 103449691Smckusick */ 103549691Smckusick printlockedvnodes() 103649691Smckusick { 103749691Smckusick register struct mount *mp; 103849691Smckusick register struct vnode *vp; 103949691Smckusick 104049691Smckusick printf("Locked vnodes\n"); 104165260Smckusick for (mp = mountlist.tqh_first; mp != NULL; mp = mp->mnt_list.tqe_next) { 104265260Smckusick for (vp = mp->mnt_vnodelist.lh_first; 104365260Smckusick vp != NULL; 104465260Smckusick vp = vp->v_mntvnodes.le_next) 104549691Smckusick if (VOP_ISLOCKED(vp)) 104649691Smckusick vprint((char *)0, vp); 104765260Smckusick } 104849691Smckusick } 104949691Smckusick #endif 105049691Smckusick 105141110Smarc int kinfo_vdebug = 1; 105241110Smarc int kinfo_vgetfailed; 105341110Smarc #define KINFO_VNODESLOP 10 105441110Smarc /* 105557841Smckusick * Dump vnode list (via sysctl). 105641110Smarc * Copyout address of vnode followed by vnode. 105741110Smarc */ 105845118Smckusick /* ARGSUSED */ 105957841Smckusick sysctl_vnode(where, sizep) 106041110Smarc char *where; 106158465Sbostic size_t *sizep; 106241110Smarc { 106365260Smckusick register struct mount *mp, *nmp; 106441110Smarc struct vnode *vp; 106541110Smarc register char *bp = where, *savebp; 106653818Smckusick char *ewhere; 106741110Smarc int error; 106841110Smarc 106941110Smarc #define VPTRSZ sizeof (struct vnode *) 107041110Smarc #define VNODESZ sizeof (struct vnode) 107141110Smarc if (where == NULL) { 107257841Smckusick *sizep = (numvnodes + KINFO_VNODESLOP) * (VPTRSZ + VNODESZ); 107341110Smarc return (0); 107441110Smarc } 107557841Smckusick ewhere = where + *sizep; 107641110Smarc 107765260Smckusick for (mp = mountlist.tqh_first; mp != NULL; mp = nmp) { 107865260Smckusick nmp = mp->mnt_list.tqe_next; 107965260Smckusick if (vfs_busy(mp)) 108041300Smckusick continue; 108141110Smarc savebp = bp; 108241110Smarc again: 108365260Smckusick for (vp = mp->mnt_vnodelist.lh_first; 108465260Smckusick vp != NULL; 108565260Smckusick vp = vp->v_mntvnodes.le_next) { 108641422Smckusick /* 108741422Smckusick * Check that the vp is still associated with 108841422Smckusick * this filesystem. RACE: could have been 108941422Smckusick * recycled onto the same filesystem. 109041422Smckusick */ 109141421Smckusick if (vp->v_mount != mp) { 109241421Smckusick if (kinfo_vdebug) 109341421Smckusick printf("kinfo: vp changed\n"); 109441421Smckusick bp = savebp; 109541421Smckusick goto again; 109641421Smckusick } 109757841Smckusick if (bp + VPTRSZ + VNODESZ > ewhere) { 109857841Smckusick *sizep = bp - where; 109957841Smckusick return (ENOMEM); 110057841Smckusick } 110157841Smckusick if ((error = copyout((caddr_t)&vp, bp, VPTRSZ)) || 110257841Smckusick (error = copyout((caddr_t)vp, bp + VPTRSZ, VNODESZ))) 110341110Smarc return (error); 110441110Smarc bp += VPTRSZ + VNODESZ; 110541110Smarc } 110665260Smckusick vfs_unbusy(mp); 110765260Smckusick } 110841110Smarc 110957841Smckusick *sizep = bp - where; 111041110Smarc return (0); 111141110Smarc } 111265679Shibler 111365679Shibler /* 111465679Shibler * Check to see if a filesystem is mounted on a block device. 111565679Shibler */ 111665679Shibler int 111765679Shibler vfs_mountedon(vp) 111865679Shibler register struct vnode *vp; 111965679Shibler { 112065679Shibler register struct vnode *vq; 112165679Shibler 112265679Shibler if (vp->v_specflags & SI_MOUNTEDON) 112365679Shibler return (EBUSY); 112465679Shibler if (vp->v_flag & VALIASED) { 112565679Shibler for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 112665679Shibler if (vq->v_rdev != vp->v_rdev || 112765679Shibler vq->v_type != vp->v_type) 112865679Shibler continue; 112965679Shibler if (vq->v_specflags & SI_MOUNTEDON) 113065679Shibler return (EBUSY); 113165679Shibler } 113265679Shibler } 113365679Shibler return (0); 113465679Shibler } 113565679Shibler 113665679Shibler /* 113765679Shibler * Build hash lists of net addresses and hang them off the mount point. 113865679Shibler * Called by ufs_mount() to set up the lists of export addresses. 113965679Shibler */ 114065679Shibler static int 114165679Shibler vfs_hang_addrlist(mp, nep, argp) 114265679Shibler struct mount *mp; 114365679Shibler struct netexport *nep; 114465679Shibler struct export_args *argp; 114565679Shibler { 114665679Shibler register struct netcred *np; 114765679Shibler register struct radix_node_head *rnh; 114865679Shibler register int i; 114965679Shibler struct radix_node *rn; 115065679Shibler struct sockaddr *saddr, *smask = 0; 115165679Shibler struct domain *dom; 115265679Shibler int error; 115365679Shibler 115465679Shibler if (argp->ex_addrlen == 0) { 115565679Shibler if (mp->mnt_flag & MNT_DEFEXPORTED) 115665679Shibler return (EPERM); 115765679Shibler np = &nep->ne_defexported; 115865679Shibler np->netc_exflags = argp->ex_flags; 115965679Shibler np->netc_anon = argp->ex_anon; 116065679Shibler np->netc_anon.cr_ref = 1; 116165679Shibler mp->mnt_flag |= MNT_DEFEXPORTED; 116265679Shibler return (0); 116365679Shibler } 116465679Shibler i = sizeof(struct netcred) + argp->ex_addrlen + argp->ex_masklen; 116565679Shibler np = (struct netcred *)malloc(i, M_NETADDR, M_WAITOK); 116665679Shibler bzero((caddr_t)np, i); 116765679Shibler saddr = (struct sockaddr *)(np + 1); 116865679Shibler if (error = copyin(argp->ex_addr, (caddr_t)saddr, argp->ex_addrlen)) 116965679Shibler goto out; 117065679Shibler if (saddr->sa_len > argp->ex_addrlen) 117165679Shibler saddr->sa_len = argp->ex_addrlen; 117265679Shibler if (argp->ex_masklen) { 117365679Shibler smask = (struct sockaddr *)((caddr_t)saddr + argp->ex_addrlen); 117465679Shibler error = copyin(argp->ex_addr, (caddr_t)smask, argp->ex_masklen); 117565679Shibler if (error) 117665679Shibler goto out; 117765679Shibler if (smask->sa_len > argp->ex_masklen) 117865679Shibler smask->sa_len = argp->ex_masklen; 117965679Shibler } 118065679Shibler i = saddr->sa_family; 118165679Shibler if ((rnh = nep->ne_rtable[i]) == 0) { 118265679Shibler /* 118365679Shibler * Seems silly to initialize every AF when most are not 118465679Shibler * used, do so on demand here 118565679Shibler */ 118665679Shibler for (dom = domains; dom; dom = dom->dom_next) 118765679Shibler if (dom->dom_family == i && dom->dom_rtattach) { 118865679Shibler dom->dom_rtattach((void **)&nep->ne_rtable[i], 118965679Shibler dom->dom_rtoffset); 119065679Shibler break; 119165679Shibler } 119265679Shibler if ((rnh = nep->ne_rtable[i]) == 0) { 119365679Shibler error = ENOBUFS; 119465679Shibler goto out; 119565679Shibler } 119665679Shibler } 119765679Shibler rn = (*rnh->rnh_addaddr)((caddr_t)saddr, (caddr_t)smask, rnh, 119865679Shibler np->netc_rnodes); 119965679Shibler if (rn == 0 || np != (struct netcred *)rn) { /* already exists */ 120065679Shibler error = EPERM; 120165679Shibler goto out; 120265679Shibler } 120365679Shibler np->netc_exflags = argp->ex_flags; 120465679Shibler np->netc_anon = argp->ex_anon; 120565679Shibler np->netc_anon.cr_ref = 1; 120665679Shibler return (0); 120765679Shibler out: 120865679Shibler free(np, M_NETADDR); 120965679Shibler return (error); 121065679Shibler } 121165679Shibler 121265679Shibler /* ARGSUSED */ 121365679Shibler static int 121465679Shibler vfs_free_netcred(rn, w) 121565679Shibler struct radix_node *rn; 121665679Shibler caddr_t w; 121765679Shibler { 121865679Shibler register struct radix_node_head *rnh = (struct radix_node_head *)w; 121965679Shibler 122065679Shibler (*rnh->rnh_deladdr)(rn->rn_key, rn->rn_mask, rnh); 122165679Shibler free((caddr_t)rn, M_NETADDR); 122265679Shibler return (0); 122365679Shibler } 122465679Shibler 122565679Shibler /* 122665679Shibler * Free the net address hash lists that are hanging off the mount points. 122765679Shibler */ 122865679Shibler static void 122965679Shibler vfs_free_addrlist(nep) 123065679Shibler struct netexport *nep; 123165679Shibler { 123265679Shibler register int i; 123365679Shibler register struct radix_node_head *rnh; 123465679Shibler 123565679Shibler for (i = 0; i <= AF_MAX; i++) 123665679Shibler if (rnh = nep->ne_rtable[i]) { 123765679Shibler (*rnh->rnh_walktree)(rnh, vfs_free_netcred, 123865679Shibler (caddr_t)rnh); 123965679Shibler free((caddr_t)rnh, M_RTABLE); 124065679Shibler nep->ne_rtable[i] = 0; 124165679Shibler } 124265679Shibler } 124365679Shibler 124465679Shibler int 124565679Shibler vfs_export(mp, nep, argp) 124665679Shibler struct mount *mp; 124765679Shibler struct netexport *nep; 124865679Shibler struct export_args *argp; 124965679Shibler { 125065679Shibler int error; 125165679Shibler 125265679Shibler if (argp->ex_flags & MNT_DELEXPORT) { 125365679Shibler vfs_free_addrlist(nep); 125465679Shibler mp->mnt_flag &= ~(MNT_EXPORTED | MNT_DEFEXPORTED); 125565679Shibler } 125665679Shibler if (argp->ex_flags & MNT_EXPORTED) { 125765679Shibler if (error = vfs_hang_addrlist(mp, nep, argp)) 125865679Shibler return (error); 125965679Shibler mp->mnt_flag |= MNT_EXPORTED; 126065679Shibler } 126165679Shibler return (0); 126265679Shibler } 126365679Shibler 126465679Shibler struct netcred * 126565679Shibler vfs_export_lookup(mp, nep, nam) 126665679Shibler register struct mount *mp; 126765679Shibler struct netexport *nep; 126865679Shibler struct mbuf *nam; 126965679Shibler { 127065679Shibler register struct netcred *np; 127165679Shibler register struct radix_node_head *rnh; 127265679Shibler struct sockaddr *saddr; 127365679Shibler 127465679Shibler np = NULL; 127565679Shibler if (mp->mnt_flag & MNT_EXPORTED) { 127665679Shibler /* 127765679Shibler * Lookup in the export list first. 127865679Shibler */ 127965679Shibler if (nam != NULL) { 128065679Shibler saddr = mtod(nam, struct sockaddr *); 128165679Shibler rnh = nep->ne_rtable[saddr->sa_family]; 128265679Shibler if (rnh != NULL) { 128365679Shibler np = (struct netcred *) 128465679Shibler (*rnh->rnh_matchaddr)((caddr_t)saddr, 128565679Shibler rnh); 128665679Shibler if (np && np->netc_rnodes->rn_flags & RNF_ROOT) 128765679Shibler np = NULL; 128865679Shibler } 128965679Shibler } 129065679Shibler /* 129165679Shibler * If no address match, use the default if it exists. 129265679Shibler */ 129365679Shibler if (np == NULL && mp->mnt_flag & MNT_DEFEXPORTED) 129465679Shibler np = &nep->ne_defexported; 129565679Shibler } 129665679Shibler return (np); 129765679Shibler } 1298