137488Smckusick /* 237488Smckusick * Copyright (c) 1989 The Regents of the University of California. 337488Smckusick * All rights reserved. 437488Smckusick * 544458Sbostic * %sccs.include.redist.c% 637488Smckusick * 7*56805Smckusick * @(#)vfs_subr.c 7.88 (Berkeley) 11/14/92 837488Smckusick */ 937488Smckusick 1037488Smckusick /* 1137488Smckusick * External virtual filesystem routines 1237488Smckusick */ 1337488Smckusick 1451460Sbostic #include <sys/param.h> 1553829Spendry #include <sys/systm.h> 1651460Sbostic #include <sys/proc.h> 1751460Sbostic #include <sys/mount.h> 1851460Sbostic #include <sys/time.h> 1951460Sbostic #include <sys/vnode.h> 2052415Smckusick #include <sys/stat.h> 2151460Sbostic #include <sys/namei.h> 2251460Sbostic #include <sys/ucred.h> 2351460Sbostic #include <sys/buf.h> 2451460Sbostic #include <sys/errno.h> 2551460Sbostic #include <sys/malloc.h> 2637488Smckusick 2755050Spendry #include <miscfs/specfs/specdev.h> 2855050Spendry 2952415Smckusick enum vtype iftovt_tab[16] = { 3052415Smckusick VNON, VFIFO, VCHR, VNON, VDIR, VNON, VBLK, VNON, 3152415Smckusick VREG, VNON, VLNK, VNON, VSOCK, VNON, VNON, VBAD, 3252415Smckusick }; 3352415Smckusick int vttoif_tab[9] = { 3452415Smckusick 0, S_IFREG, S_IFDIR, S_IFBLK, S_IFCHR, S_IFLNK, 3552415Smckusick S_IFSOCK, S_IFIFO, S_IFMT, 3652415Smckusick }; 3752415Smckusick 3837488Smckusick /* 3956608Smckusick * Insq/Remq for the vnode usage lists. 4056608Smckusick */ 4156608Smckusick #define bufinsvn(bp, dp) list_enter_head(dp, bp, struct buf *, b_vnbufs) 4256608Smckusick #define bufremvn(bp) list_remove(bp, struct buf *, b_vnbufs) 4356608Smckusick 4456608Smckusick /* 4537488Smckusick * Remove a mount point from the list of mounted filesystems. 4637488Smckusick * Unmount of the root is illegal. 4737488Smckusick */ 4837488Smckusick void 4937488Smckusick vfs_remove(mp) 5037488Smckusick register struct mount *mp; 5137488Smckusick { 5237488Smckusick 5337488Smckusick if (mp == rootfs) 5437488Smckusick panic("vfs_remove: unmounting root"); 5541400Smckusick mp->mnt_prev->mnt_next = mp->mnt_next; 5641400Smckusick mp->mnt_next->mnt_prev = mp->mnt_prev; 5741400Smckusick mp->mnt_vnodecovered->v_mountedhere = (struct mount *)0; 5837488Smckusick vfs_unlock(mp); 5937488Smckusick } 6037488Smckusick 6137488Smckusick /* 6237488Smckusick * Lock a filesystem. 6337488Smckusick * Used to prevent access to it while mounting and unmounting. 6437488Smckusick */ 6537488Smckusick vfs_lock(mp) 6637488Smckusick register struct mount *mp; 6737488Smckusick { 6837488Smckusick 6941400Smckusick while(mp->mnt_flag & MNT_MLOCK) { 7041400Smckusick mp->mnt_flag |= MNT_MWAIT; 7139045Smckusick sleep((caddr_t)mp, PVFS); 7239045Smckusick } 7341400Smckusick mp->mnt_flag |= MNT_MLOCK; 7437488Smckusick return (0); 7537488Smckusick } 7637488Smckusick 7737488Smckusick /* 7837488Smckusick * Unlock a locked filesystem. 7937488Smckusick * Panic if filesystem is not locked. 8037488Smckusick */ 8137488Smckusick void 8237488Smckusick vfs_unlock(mp) 8337488Smckusick register struct mount *mp; 8437488Smckusick { 8537488Smckusick 8641400Smckusick if ((mp->mnt_flag & MNT_MLOCK) == 0) 8741300Smckusick panic("vfs_unlock: not locked"); 8841400Smckusick mp->mnt_flag &= ~MNT_MLOCK; 8941400Smckusick if (mp->mnt_flag & MNT_MWAIT) { 9041400Smckusick mp->mnt_flag &= ~MNT_MWAIT; 9137488Smckusick wakeup((caddr_t)mp); 9237488Smckusick } 9337488Smckusick } 9437488Smckusick 9537488Smckusick /* 9641300Smckusick * Mark a mount point as busy. 9741300Smckusick * Used to synchronize access and to delay unmounting. 9841300Smckusick */ 9941300Smckusick vfs_busy(mp) 10041300Smckusick register struct mount *mp; 10141300Smckusick { 10241300Smckusick 10341400Smckusick while(mp->mnt_flag & MNT_MPBUSY) { 10441400Smckusick mp->mnt_flag |= MNT_MPWANT; 10541400Smckusick sleep((caddr_t)&mp->mnt_flag, PVFS); 10641300Smckusick } 10741419Smckusick if (mp->mnt_flag & MNT_UNMOUNT) 10841419Smckusick return (1); 10941400Smckusick mp->mnt_flag |= MNT_MPBUSY; 11041300Smckusick return (0); 11141300Smckusick } 11241300Smckusick 11341300Smckusick /* 11441300Smckusick * Free a busy filesystem. 11541300Smckusick * Panic if filesystem is not busy. 11641300Smckusick */ 11741300Smckusick vfs_unbusy(mp) 11841300Smckusick register struct mount *mp; 11941300Smckusick { 12041300Smckusick 12141400Smckusick if ((mp->mnt_flag & MNT_MPBUSY) == 0) 12241300Smckusick panic("vfs_unbusy: not busy"); 12341400Smckusick mp->mnt_flag &= ~MNT_MPBUSY; 12441400Smckusick if (mp->mnt_flag & MNT_MPWANT) { 12541400Smckusick mp->mnt_flag &= ~MNT_MPWANT; 12641400Smckusick wakeup((caddr_t)&mp->mnt_flag); 12741300Smckusick } 12841300Smckusick } 12941300Smckusick 13041300Smckusick /* 13137488Smckusick * Lookup a mount point by filesystem identifier. 13237488Smckusick */ 13337488Smckusick struct mount * 13437488Smckusick getvfs(fsid) 13537488Smckusick fsid_t *fsid; 13637488Smckusick { 13737488Smckusick register struct mount *mp; 13837488Smckusick 13938288Smckusick mp = rootfs; 14038288Smckusick do { 14141400Smckusick if (mp->mnt_stat.f_fsid.val[0] == fsid->val[0] && 14241400Smckusick mp->mnt_stat.f_fsid.val[1] == fsid->val[1]) { 14338288Smckusick return (mp); 14437488Smckusick } 14541400Smckusick mp = mp->mnt_next; 14638288Smckusick } while (mp != rootfs); 14738288Smckusick return ((struct mount *)0); 14837488Smckusick } 14937488Smckusick 15037488Smckusick /* 15153829Spendry * Get a new unique fsid 15253829Spendry */ 15353829Spendry void 15453829Spendry getnewfsid(mp, mtype) 15553829Spendry struct mount *mp; 15653829Spendry int mtype; 15753829Spendry { 15853829Spendry static u_short xxxfs_mntid; 15953829Spendry 16053829Spendry fsid_t tfsid; 16153829Spendry 16253829Spendry mp->mnt_stat.f_fsid.val[0] = makedev(nblkdev + 11, 0); /* XXX */ 16353829Spendry mp->mnt_stat.f_fsid.val[1] = mtype; 16453829Spendry if (xxxfs_mntid == 0) 16553829Spendry ++xxxfs_mntid; 16653829Spendry tfsid.val[0] = makedev(nblkdev, xxxfs_mntid); 16753829Spendry tfsid.val[1] = mtype; 16853936Spendry if (rootfs) { 16953936Spendry while (getvfs(&tfsid)) { 17053936Spendry tfsid.val[0]++; 17153936Spendry xxxfs_mntid++; 17253936Spendry } 17353829Spendry } 17453829Spendry mp->mnt_stat.f_fsid.val[0] = tfsid.val[0]; 17553829Spendry } 17653829Spendry 17753829Spendry /* 17837488Smckusick * Set vnode attributes to VNOVAL 17937488Smckusick */ 18037488Smckusick void vattr_null(vap) 18137488Smckusick register struct vattr *vap; 18237488Smckusick { 18337488Smckusick 18437488Smckusick vap->va_type = VNON; 18552005Smckusick vap->va_size = vap->va_bytes = VNOVAL; 18637488Smckusick vap->va_mode = vap->va_nlink = vap->va_uid = vap->va_gid = 18752005Smckusick vap->va_fsid = vap->va_fileid = 18852005Smckusick vap->va_blocksize = vap->va_rdev = 18954347Smckusick vap->va_atime.ts_sec = vap->va_atime.ts_nsec = 19054347Smckusick vap->va_mtime.ts_sec = vap->va_mtime.ts_nsec = 19154347Smckusick vap->va_ctime.ts_sec = vap->va_ctime.ts_nsec = 19238258Smckusick vap->va_flags = vap->va_gen = VNOVAL; 19337488Smckusick } 19438265Smckusick 19538265Smckusick /* 19639397Smckusick * Routines having to do with the management of the vnode table. 19739397Smckusick */ 19855468Smckusick struct vnode *vfreeh, **vfreet = &vfreeh; 19953547Sheideman extern int (**dead_vnodeop_p)(); 20039635Smckusick extern void vclean(); 20140883Smckusick long numvnodes; 20253493Sheideman extern struct vattr va_null; 20339397Smckusick 20439397Smckusick /* 20539397Smckusick * Return the next vnode from the free list. 20639397Smckusick */ 20739397Smckusick getnewvnode(tag, mp, vops, vpp) 20839397Smckusick enum vtagtype tag; 20939397Smckusick struct mount *mp; 21053495Sheideman int (**vops)(); 21139397Smckusick struct vnode **vpp; 21239397Smckusick { 21339397Smckusick register struct vnode *vp, *vq; 21439397Smckusick 21554347Smckusick if ((vfreeh == NULL && numvnodes < 2 * desiredvnodes) || 21654347Smckusick numvnodes < desiredvnodes) { 21745118Smckusick vp = (struct vnode *)malloc((u_long)sizeof *vp, 21845118Smckusick M_VNODE, M_WAITOK); 21940883Smckusick bzero((char *)vp, sizeof *vp); 22040883Smckusick numvnodes++; 22140883Smckusick } else { 22240883Smckusick if ((vp = vfreeh) == NULL) { 22340883Smckusick tablefull("vnode"); 22440883Smckusick *vpp = 0; 22540883Smckusick return (ENFILE); 22640883Smckusick } 22740883Smckusick if (vp->v_usecount) 22840883Smckusick panic("free vnode isn't"); 22940883Smckusick if (vq = vp->v_freef) 23040883Smckusick vq->v_freeb = &vfreeh; 23140883Smckusick else 23240883Smckusick vfreet = &vfreeh; 23340883Smckusick vfreeh = vq; 23440883Smckusick vp->v_freef = NULL; 23540883Smckusick vp->v_freeb = NULL; 23652190Smckusick vp->v_lease = NULL; 23740883Smckusick if (vp->v_type != VBAD) 23840883Smckusick vgone(vp); 23952006Smckusick if (vp->v_data) 24052006Smckusick panic("cleaned vnode isn't"); 24140883Smckusick vp->v_flag = 0; 24240883Smckusick vp->v_lastr = 0; 24340883Smckusick vp->v_socket = 0; 24439397Smckusick } 24539512Smckusick vp->v_type = VNON; 24639397Smckusick cache_purge(vp); 24739397Smckusick vp->v_tag = tag; 24839433Smckusick vp->v_op = vops; 24939397Smckusick insmntque(vp, mp); 25039397Smckusick VREF(vp); 25139397Smckusick *vpp = vp; 25239397Smckusick return (0); 25339397Smckusick } 25439397Smckusick 25539397Smckusick /* 25639397Smckusick * Move a vnode from one mount queue to another. 25739397Smckusick */ 25839397Smckusick insmntque(vp, mp) 25939397Smckusick register struct vnode *vp; 26039397Smckusick register struct mount *mp; 26139397Smckusick { 26249973Smckusick register struct vnode *vq; 26339397Smckusick 26439397Smckusick /* 26539397Smckusick * Delete from old mount point vnode list, if on one. 26639397Smckusick */ 26739397Smckusick if (vp->v_mountb) { 26839397Smckusick if (vq = vp->v_mountf) 26939397Smckusick vq->v_mountb = vp->v_mountb; 27039397Smckusick *vp->v_mountb = vq; 27139397Smckusick } 27239397Smckusick /* 27339397Smckusick * Insert into list of vnodes for the new mount point, if available. 27439397Smckusick */ 27539621Smckusick vp->v_mount = mp; 27639397Smckusick if (mp == NULL) { 27739397Smckusick vp->v_mountf = NULL; 27839397Smckusick vp->v_mountb = NULL; 27939397Smckusick return; 28039397Smckusick } 28149973Smckusick if (vq = mp->mnt_mounth) 28249973Smckusick vq->v_mountb = &vp->v_mountf; 28349973Smckusick vp->v_mountf = vq; 28449973Smckusick vp->v_mountb = &mp->mnt_mounth; 28549973Smckusick mp->mnt_mounth = vp; 28639397Smckusick } 28739397Smckusick 28839397Smckusick /* 28949232Smckusick * Update outstanding I/O count and do wakeup if requested. 29049232Smckusick */ 29149232Smckusick vwakeup(bp) 29249232Smckusick register struct buf *bp; 29349232Smckusick { 29449232Smckusick register struct vnode *vp; 29549232Smckusick 29649232Smckusick bp->b_dirtyoff = bp->b_dirtyend = 0; 29749232Smckusick if (vp = bp->b_vp) { 29849232Smckusick vp->v_numoutput--; 29949232Smckusick if ((vp->v_flag & VBWAIT) && vp->v_numoutput <= 0) { 30049232Smckusick if (vp->v_numoutput < 0) 30149232Smckusick panic("vwakeup: neg numoutput"); 30249232Smckusick vp->v_flag &= ~VBWAIT; 30349232Smckusick wakeup((caddr_t)&vp->v_numoutput); 30449232Smckusick } 30549232Smckusick } 30649232Smckusick } 30749232Smckusick 30849232Smckusick /* 30949232Smckusick * Flush out and invalidate all buffers associated with a vnode. 31049232Smckusick * Called with the underlying object locked. 31149232Smckusick */ 31254442Smckusick int 31356459Smargo vinvalbuf(vp, flags, cred, p) 31449232Smckusick register struct vnode *vp; 31556459Smargo int flags; 31654442Smckusick struct ucred *cred; 31754442Smckusick struct proc *p; 31849232Smckusick { 31949232Smckusick register struct buf *bp; 32049232Smckusick struct buf *nbp, *blist; 32154442Smckusick int s, error; 32249232Smckusick 32356459Smargo if (flags & V_SAVE) { 32454442Smckusick if (error = VOP_FSYNC(vp, cred, MNT_WAIT, p)) 32554442Smckusick return (error); 32656608Smckusick if (vp->v_dirtyblkhd.le_next != NULL) 32754442Smckusick panic("vinvalbuf: dirty bufs"); 32854442Smckusick } 32949232Smckusick for (;;) { 33056608Smckusick if ((blist = vp->v_cleanblkhd.le_next) && flags & V_SAVEMETA) 33156459Smargo while (blist && blist->b_lblkno < 0) 33256608Smckusick blist = blist->b_vnbufs.qe_next; 33356608Smckusick if (!blist && (blist = vp->v_dirtyblkhd.le_next) && 33456608Smckusick (flags & V_SAVEMETA)) 33556459Smargo while (blist && blist->b_lblkno < 0) 33656608Smckusick blist = blist->b_vnbufs.qe_next; 33756459Smargo if (!blist) 33849232Smckusick break; 33956459Smargo 34049232Smckusick for (bp = blist; bp; bp = nbp) { 34156608Smckusick nbp = bp->b_vnbufs.qe_next; 34256459Smargo if (flags & V_SAVEMETA && bp->b_lblkno < 0) 34356459Smargo continue; 34449232Smckusick s = splbio(); 34549232Smckusick if (bp->b_flags & B_BUSY) { 34649232Smckusick bp->b_flags |= B_WANTED; 34749232Smckusick sleep((caddr_t)bp, PRIBIO + 1); 34849232Smckusick splx(s); 34949232Smckusick break; 35049232Smckusick } 35149232Smckusick bremfree(bp); 35249232Smckusick bp->b_flags |= B_BUSY; 35349232Smckusick splx(s); 35456459Smargo bp->b_flags |= B_INVAL; 35549232Smckusick brelse(bp); 35649232Smckusick } 35749232Smckusick } 35856608Smckusick if (!(flags & V_SAVEMETA) && 35956608Smckusick (vp->v_dirtyblkhd.le_next || vp->v_cleanblkhd.le_next)) 36049232Smckusick panic("vinvalbuf: flush failed"); 36154442Smckusick return (0); 36249232Smckusick } 36349232Smckusick 36449232Smckusick /* 36549232Smckusick * Associate a buffer with a vnode. 36649232Smckusick */ 36749232Smckusick bgetvp(vp, bp) 36849232Smckusick register struct vnode *vp; 36949232Smckusick register struct buf *bp; 37049232Smckusick { 37149973Smckusick register struct vnode *vq; 37249232Smckusick 37349232Smckusick if (bp->b_vp) 37449232Smckusick panic("bgetvp: not free"); 37549232Smckusick VHOLD(vp); 37649232Smckusick bp->b_vp = vp; 37749232Smckusick if (vp->v_type == VBLK || vp->v_type == VCHR) 37849232Smckusick bp->b_dev = vp->v_rdev; 37949232Smckusick else 38049232Smckusick bp->b_dev = NODEV; 38149232Smckusick /* 38249232Smckusick * Insert onto list for new vnode. 38349232Smckusick */ 38456608Smckusick bufinsvn(bp, &vp->v_cleanblkhd); 38549232Smckusick } 38649232Smckusick 38749232Smckusick /* 38849232Smckusick * Disassociate a buffer from a vnode. 38949232Smckusick */ 39049232Smckusick brelvp(bp) 39149232Smckusick register struct buf *bp; 39249232Smckusick { 39349232Smckusick struct vnode *vp; 39449232Smckusick 39549232Smckusick if (bp->b_vp == (struct vnode *) 0) 39649232Smckusick panic("brelvp: NULL"); 39749232Smckusick /* 39849232Smckusick * Delete from old vnode list, if on one. 39949232Smckusick */ 40056608Smckusick if (bp->b_vnbufs.qe_next != NOLIST) 40156608Smckusick bufremvn(bp); 40249232Smckusick vp = bp->b_vp; 40349232Smckusick bp->b_vp = (struct vnode *) 0; 40449232Smckusick HOLDRELE(vp); 40549232Smckusick } 40649232Smckusick 40749232Smckusick /* 40849232Smckusick * Reassign a buffer from one vnode to another. 40949232Smckusick * Used to assign file specific control information 41049232Smckusick * (indirect blocks) to the vnode to which they belong. 41149232Smckusick */ 41249232Smckusick reassignbuf(bp, newvp) 41349232Smckusick register struct buf *bp; 41449232Smckusick register struct vnode *newvp; 41549232Smckusick { 41656608Smckusick register struct list_entry *listheadp; 41749232Smckusick 41852655Smckusick if (newvp == NULL) { 41952655Smckusick printf("reassignbuf: NULL"); 42052655Smckusick return; 42152655Smckusick } 42249232Smckusick /* 42349232Smckusick * Delete from old vnode list, if on one. 42449232Smckusick */ 42556608Smckusick if (bp->b_vnbufs.qe_next != NOLIST) 42656608Smckusick bufremvn(bp); 42749232Smckusick /* 42849232Smckusick * If dirty, put on list of dirty buffers; 42949232Smckusick * otherwise insert onto list of clean buffers. 43049232Smckusick */ 43149232Smckusick if (bp->b_flags & B_DELWRI) 43249232Smckusick listheadp = &newvp->v_dirtyblkhd; 43349232Smckusick else 43449232Smckusick listheadp = &newvp->v_cleanblkhd; 43556608Smckusick bufinsvn(bp, listheadp); 43649232Smckusick } 43749232Smckusick 43849232Smckusick /* 43939433Smckusick * Create a vnode for a block device. 44039433Smckusick * Used for root filesystem, argdev, and swap areas. 44139433Smckusick * Also used for memory file system special devices. 44239397Smckusick */ 44339433Smckusick bdevvp(dev, vpp) 44439433Smckusick dev_t dev; 44539433Smckusick struct vnode **vpp; 44639433Smckusick { 44739433Smckusick register struct vnode *vp; 44839433Smckusick struct vnode *nvp; 44939433Smckusick int error; 45039433Smckusick 45146989Smckusick if (dev == NODEV) 45246989Smckusick return (0); 45353547Sheideman error = getnewvnode(VT_NON, (struct mount *)0, spec_vnodeop_p, &nvp); 45439433Smckusick if (error) { 45539433Smckusick *vpp = 0; 45639433Smckusick return (error); 45739433Smckusick } 45839433Smckusick vp = nvp; 45939433Smckusick vp->v_type = VBLK; 46039615Smckusick if (nvp = checkalias(vp, dev, (struct mount *)0)) { 46139433Smckusick vput(vp); 46239433Smckusick vp = nvp; 46339433Smckusick } 46439433Smckusick *vpp = vp; 46539433Smckusick return (0); 46639433Smckusick } 46739433Smckusick 46839433Smckusick /* 46939433Smckusick * Check to see if the new vnode represents a special device 47039433Smckusick * for which we already have a vnode (either because of 47139433Smckusick * bdevvp() or because of a different vnode representing 47239433Smckusick * the same block device). If such an alias exists, deallocate 47339509Smckusick * the existing contents and return the aliased vnode. The 47439433Smckusick * caller is responsible for filling it with its new contents. 47539433Smckusick */ 47639433Smckusick struct vnode * 47739615Smckusick checkalias(nvp, nvp_rdev, mp) 47839433Smckusick register struct vnode *nvp; 47939615Smckusick dev_t nvp_rdev; 48039433Smckusick struct mount *mp; 48139433Smckusick { 48239433Smckusick register struct vnode *vp; 48339615Smckusick struct vnode **vpp; 48439433Smckusick 48539433Smckusick if (nvp->v_type != VBLK && nvp->v_type != VCHR) 48641400Smckusick return (NULLVP); 48739615Smckusick 48839615Smckusick vpp = &speclisth[SPECHASH(nvp_rdev)]; 48939433Smckusick loop: 49039615Smckusick for (vp = *vpp; vp; vp = vp->v_specnext) { 49139615Smckusick if (nvp_rdev != vp->v_rdev || nvp->v_type != vp->v_type) 49239433Smckusick continue; 49339615Smckusick /* 49439615Smckusick * Alias, but not in use, so flush it out. 49539615Smckusick */ 49639809Smckusick if (vp->v_usecount == 0) { 49739615Smckusick vgone(vp); 49839615Smckusick goto loop; 49939615Smckusick } 50039633Smckusick if (vget(vp)) 50139633Smckusick goto loop; 50239433Smckusick break; 50339433Smckusick } 50439615Smckusick if (vp == NULL || vp->v_tag != VT_NON) { 50539615Smckusick MALLOC(nvp->v_specinfo, struct specinfo *, 50639615Smckusick sizeof(struct specinfo), M_VNODE, M_WAITOK); 50739615Smckusick nvp->v_rdev = nvp_rdev; 50839809Smckusick nvp->v_hashchain = vpp; 50939615Smckusick nvp->v_specnext = *vpp; 51042152Smckusick nvp->v_specflags = 0; 51139615Smckusick *vpp = nvp; 51240640Smckusick if (vp != NULL) { 51340640Smckusick nvp->v_flag |= VALIASED; 51440640Smckusick vp->v_flag |= VALIASED; 51540640Smckusick vput(vp); 51640640Smckusick } 51741400Smckusick return (NULLVP); 51839433Smckusick } 51939484Smckusick VOP_UNLOCK(vp); 52039484Smckusick vclean(vp, 0); 52139433Smckusick vp->v_op = nvp->v_op; 52239433Smckusick vp->v_tag = nvp->v_tag; 52339433Smckusick nvp->v_type = VNON; 52439433Smckusick insmntque(vp, mp); 52539433Smckusick return (vp); 52639433Smckusick } 52739433Smckusick 52839433Smckusick /* 52939433Smckusick * Grab a particular vnode from the free list, increment its 53039433Smckusick * reference count and lock it. The vnode lock bit is set the 53139433Smckusick * vnode is being eliminated in vgone. The process is awakened 53239433Smckusick * when the transition is completed, and an error returned to 53339433Smckusick * indicate that the vnode is no longer usable (possibly having 53439433Smckusick * been changed to a new file system type). 53539433Smckusick */ 53639397Smckusick vget(vp) 53739397Smckusick register struct vnode *vp; 53839397Smckusick { 53939397Smckusick register struct vnode *vq; 54039397Smckusick 54139433Smckusick if (vp->v_flag & VXLOCK) { 54239433Smckusick vp->v_flag |= VXWANT; 54339433Smckusick sleep((caddr_t)vp, PINOD); 54439433Smckusick return (1); 54539433Smckusick } 54639809Smckusick if (vp->v_usecount == 0) { 54739433Smckusick if (vq = vp->v_freef) 54839433Smckusick vq->v_freeb = vp->v_freeb; 54939433Smckusick else 55039433Smckusick vfreet = vp->v_freeb; 55139433Smckusick *vp->v_freeb = vq; 55239433Smckusick vp->v_freef = NULL; 55339433Smckusick vp->v_freeb = NULL; 55439433Smckusick } 55539397Smckusick VREF(vp); 55639433Smckusick VOP_LOCK(vp); 55739433Smckusick return (0); 55839397Smckusick } 55939397Smckusick 56039397Smckusick /* 56139397Smckusick * Vnode reference, just increment the count 56239397Smckusick */ 56339397Smckusick void vref(vp) 56439397Smckusick struct vnode *vp; 56539397Smckusick { 56639397Smckusick 56739809Smckusick vp->v_usecount++; 56839397Smckusick } 56939397Smckusick 57039397Smckusick /* 57139397Smckusick * vput(), just unlock and vrele() 57239397Smckusick */ 57339397Smckusick void vput(vp) 57439397Smckusick register struct vnode *vp; 57539397Smckusick { 57652416Storek 57739397Smckusick VOP_UNLOCK(vp); 57839397Smckusick vrele(vp); 57939397Smckusick } 58039397Smckusick 58139397Smckusick /* 58239397Smckusick * Vnode release. 58339397Smckusick * If count drops to zero, call inactive routine and return to freelist. 58439397Smckusick */ 58539397Smckusick void vrele(vp) 58639397Smckusick register struct vnode *vp; 58739397Smckusick { 58839397Smckusick 58950109Smckusick #ifdef DIAGNOSTIC 59039397Smckusick if (vp == NULL) 59139433Smckusick panic("vrele: null vp"); 59250109Smckusick #endif 59339809Smckusick vp->v_usecount--; 59439809Smckusick if (vp->v_usecount > 0) 59539397Smckusick return; 59650109Smckusick #ifdef DIAGNOSTIC 59750109Smckusick if (vp->v_usecount != 0 || vp->v_writecount != 0) { 59850109Smckusick vprint("vrele: bad ref count", vp); 59950109Smckusick panic("vrele: ref cnt"); 60050109Smckusick } 60150109Smckusick #endif 60255468Smckusick /* 60355468Smckusick * insert at tail of LRU list 60455468Smckusick */ 60555468Smckusick *vfreet = vp; 60655468Smckusick vp->v_freeb = vfreet; 60739433Smckusick vp->v_freef = NULL; 60839433Smckusick vfreet = &vp->v_freef; 60954442Smckusick VOP_INACTIVE(vp); 61039397Smckusick } 61139433Smckusick 61239433Smckusick /* 61339809Smckusick * Page or buffer structure gets a reference. 61439809Smckusick */ 61553312Smckusick void vhold(vp) 61639809Smckusick register struct vnode *vp; 61739809Smckusick { 61839809Smckusick 61939809Smckusick vp->v_holdcnt++; 62039809Smckusick } 62139809Smckusick 62239809Smckusick /* 62339809Smckusick * Page or buffer structure frees a reference. 62439809Smckusick */ 62553312Smckusick void holdrele(vp) 62639809Smckusick register struct vnode *vp; 62739809Smckusick { 62839809Smckusick 62939809Smckusick if (vp->v_holdcnt <= 0) 63039809Smckusick panic("holdrele: holdcnt"); 63139809Smckusick vp->v_holdcnt--; 63239809Smckusick } 63339809Smckusick 63439809Smckusick /* 63539509Smckusick * Remove any vnodes in the vnode table belonging to mount point mp. 63639509Smckusick * 63739509Smckusick * If MNT_NOFORCE is specified, there should not be any active ones, 63839509Smckusick * return error if any are found (nb: this is a user error, not a 63939509Smckusick * system error). If MNT_FORCE is specified, detach any active vnodes 64039509Smckusick * that are found. 64139509Smckusick */ 64239509Smckusick int busyprt = 0; /* patch to print out busy vnodes */ 64339509Smckusick 64439509Smckusick vflush(mp, skipvp, flags) 64539509Smckusick struct mount *mp; 64639509Smckusick struct vnode *skipvp; 64739509Smckusick int flags; 64839509Smckusick { 64939509Smckusick register struct vnode *vp, *nvp; 65039509Smckusick int busy = 0; 65139509Smckusick 65241400Smckusick if ((mp->mnt_flag & MNT_MPBUSY) == 0) 65341300Smckusick panic("vflush: not busy"); 65441421Smckusick loop: 65541400Smckusick for (vp = mp->mnt_mounth; vp; vp = nvp) { 65641421Smckusick if (vp->v_mount != mp) 65741421Smckusick goto loop; 65839509Smckusick nvp = vp->v_mountf; 65939509Smckusick /* 66039509Smckusick * Skip over a selected vnode. 66139509Smckusick */ 66239509Smckusick if (vp == skipvp) 66339509Smckusick continue; 66439509Smckusick /* 66541300Smckusick * Skip over a vnodes marked VSYSTEM. 66641300Smckusick */ 66741300Smckusick if ((flags & SKIPSYSTEM) && (vp->v_flag & VSYSTEM)) 66841300Smckusick continue; 66941300Smckusick /* 67039809Smckusick * With v_usecount == 0, all we need to do is clear 67139509Smckusick * out the vnode data structures and we are done. 67239509Smckusick */ 67339809Smckusick if (vp->v_usecount == 0) { 67439509Smckusick vgone(vp); 67539509Smckusick continue; 67639509Smckusick } 67739509Smckusick /* 67839509Smckusick * For block or character devices, revert to an 67939509Smckusick * anonymous device. For all other files, just kill them. 68039509Smckusick */ 68141300Smckusick if (flags & FORCECLOSE) { 68239509Smckusick if (vp->v_type != VBLK && vp->v_type != VCHR) { 68339509Smckusick vgone(vp); 68439509Smckusick } else { 68539509Smckusick vclean(vp, 0); 68653547Sheideman vp->v_op = spec_vnodeop_p; 68739509Smckusick insmntque(vp, (struct mount *)0); 68839509Smckusick } 68939509Smckusick continue; 69039509Smckusick } 69139509Smckusick if (busyprt) 69239667Smckusick vprint("vflush: busy vnode", vp); 69339509Smckusick busy++; 69439509Smckusick } 69539509Smckusick if (busy) 69639509Smckusick return (EBUSY); 69739509Smckusick return (0); 69839509Smckusick } 69939509Smckusick 70039509Smckusick /* 70139433Smckusick * Disassociate the underlying file system from a vnode. 70239433Smckusick */ 70354347Smckusick void 70454347Smckusick vclean(vp, flags) 70539433Smckusick register struct vnode *vp; 70645118Smckusick int flags; 70739433Smckusick { 70839484Smckusick int active; 70939433Smckusick 71039484Smckusick /* 71139484Smckusick * Check to see if the vnode is in use. 71239667Smckusick * If so we have to reference it before we clean it out 71339667Smckusick * so that its count cannot fall to zero and generate a 71439667Smckusick * race against ourselves to recycle it. 71539484Smckusick */ 71639809Smckusick if (active = vp->v_usecount) 71739484Smckusick VREF(vp); 71839484Smckusick /* 719*56805Smckusick * Even if the count is zero, the VOP_INACTIVE routine may still 720*56805Smckusick * have the object locked while it cleans it out. The VOP_LOCK 721*56805Smckusick * ensures that the VOP_INACTIVE routine is done with its work. 722*56805Smckusick * For active vnodes, it ensures that no other activity can 723*56805Smckusick * occur while the underlying object is being cleaned out. 724*56805Smckusick */ 725*56805Smckusick VOP_LOCK(vp); 726*56805Smckusick /* 72739484Smckusick * Prevent the vnode from being recycled or 72839484Smckusick * brought into use while we clean it out. 72939484Smckusick */ 73039667Smckusick if (vp->v_flag & VXLOCK) 73139667Smckusick panic("vclean: deadlock"); 73239433Smckusick vp->v_flag |= VXLOCK; 73339433Smckusick /* 734*56805Smckusick * Clean out any buffers associated with the vnode. 73539667Smckusick */ 73641300Smckusick if (flags & DOCLOSE) 73754442Smckusick vinvalbuf(vp, 1, NOCRED, NULL); 73839667Smckusick /* 739*56805Smckusick * Any other processes trying to obtain this lock must first 740*56805Smckusick * wait for VXLOCK to clear, then call the new lock operation. 74139433Smckusick */ 742*56805Smckusick VOP_UNLOCK(vp); 74339433Smckusick /* 744*56805Smckusick * If purging an active vnode, it must be closed and 745*56805Smckusick * deactivated before being reclaimed. 74639433Smckusick */ 74739484Smckusick if (active) { 748*56805Smckusick if (flags & DOCLOSE) 749*56805Smckusick VOP_CLOSE(vp, IO_NDELAY, NOCRED, NULL); 750*56805Smckusick VOP_INACTIVE(vp); 75139433Smckusick } 75239433Smckusick /* 75339433Smckusick * Reclaim the vnode. 75439433Smckusick */ 755*56805Smckusick if (VOP_RECLAIM(vp)) 75639433Smckusick panic("vclean: cannot reclaim"); 75739484Smckusick if (active) 75839484Smckusick vrele(vp); 75953580Sheideman 76039433Smckusick /* 761*56805Smckusick * Done with purge, notify sleepers of the grim news. 76239433Smckusick */ 763*56805Smckusick vp->v_op = dead_vnodeop_p; 764*56805Smckusick vp->v_tag = VT_NON; 76539433Smckusick vp->v_flag &= ~VXLOCK; 76639433Smckusick if (vp->v_flag & VXWANT) { 76739433Smckusick vp->v_flag &= ~VXWANT; 76839433Smckusick wakeup((caddr_t)vp); 76939433Smckusick } 77039433Smckusick } 77139433Smckusick 77239433Smckusick /* 77339633Smckusick * Eliminate all activity associated with the requested vnode 77439633Smckusick * and with all vnodes aliased to the requested vnode. 77539633Smckusick */ 77639633Smckusick void vgoneall(vp) 77739633Smckusick register struct vnode *vp; 77839633Smckusick { 77939809Smckusick register struct vnode *vq; 78039633Smckusick 78140665Smckusick if (vp->v_flag & VALIASED) { 78240665Smckusick /* 78340665Smckusick * If a vgone (or vclean) is already in progress, 78440665Smckusick * wait until it is done and return. 78540665Smckusick */ 78640665Smckusick if (vp->v_flag & VXLOCK) { 78740665Smckusick vp->v_flag |= VXWANT; 78840665Smckusick sleep((caddr_t)vp, PINOD); 78940665Smckusick return; 79039633Smckusick } 79140665Smckusick /* 79240665Smckusick * Ensure that vp will not be vgone'd while we 79340665Smckusick * are eliminating its aliases. 79440665Smckusick */ 79540665Smckusick vp->v_flag |= VXLOCK; 79640665Smckusick while (vp->v_flag & VALIASED) { 79740665Smckusick for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 79840665Smckusick if (vq->v_rdev != vp->v_rdev || 79940665Smckusick vq->v_type != vp->v_type || vp == vq) 80040665Smckusick continue; 80140665Smckusick vgone(vq); 80240665Smckusick break; 80340665Smckusick } 80440665Smckusick } 80540665Smckusick /* 80640665Smckusick * Remove the lock so that vgone below will 80740665Smckusick * really eliminate the vnode after which time 80840665Smckusick * vgone will awaken any sleepers. 80940665Smckusick */ 81040665Smckusick vp->v_flag &= ~VXLOCK; 81139633Smckusick } 81239633Smckusick vgone(vp); 81339633Smckusick } 81439633Smckusick 81539633Smckusick /* 81639433Smckusick * Eliminate all activity associated with a vnode 81739433Smckusick * in preparation for reuse. 81839433Smckusick */ 81939433Smckusick void vgone(vp) 82039433Smckusick register struct vnode *vp; 82139433Smckusick { 82239809Smckusick register struct vnode *vq; 82339615Smckusick struct vnode *vx; 82439433Smckusick 82539433Smckusick /* 82640548Smckusick * If a vgone (or vclean) is already in progress, 82740548Smckusick * wait until it is done and return. 82840548Smckusick */ 82940548Smckusick if (vp->v_flag & VXLOCK) { 83040548Smckusick vp->v_flag |= VXWANT; 83140548Smckusick sleep((caddr_t)vp, PINOD); 83240548Smckusick return; 83340548Smckusick } 83440548Smckusick /* 83539433Smckusick * Clean out the filesystem specific data. 83639433Smckusick */ 83741300Smckusick vclean(vp, DOCLOSE); 83839433Smckusick /* 83939433Smckusick * Delete from old mount point vnode list, if on one. 84039433Smckusick */ 84139433Smckusick if (vp->v_mountb) { 84239433Smckusick if (vq = vp->v_mountf) 84339433Smckusick vq->v_mountb = vp->v_mountb; 84439433Smckusick *vp->v_mountb = vq; 84539433Smckusick vp->v_mountf = NULL; 84639433Smckusick vp->v_mountb = NULL; 84752311Smckusick vp->v_mount = NULL; 84839433Smckusick } 84939433Smckusick /* 85039433Smckusick * If special device, remove it from special device alias list. 85139433Smckusick */ 85239433Smckusick if (vp->v_type == VBLK || vp->v_type == VCHR) { 85339809Smckusick if (*vp->v_hashchain == vp) { 85439809Smckusick *vp->v_hashchain = vp->v_specnext; 85539433Smckusick } else { 85639809Smckusick for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 85739615Smckusick if (vq->v_specnext != vp) 85839433Smckusick continue; 85939615Smckusick vq->v_specnext = vp->v_specnext; 86039433Smckusick break; 86139433Smckusick } 86239615Smckusick if (vq == NULL) 86339433Smckusick panic("missing bdev"); 86439433Smckusick } 86539615Smckusick if (vp->v_flag & VALIASED) { 86652416Storek vx = NULL; 86739809Smckusick for (vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 86840108Smckusick if (vq->v_rdev != vp->v_rdev || 86940108Smckusick vq->v_type != vp->v_type) 87039615Smckusick continue; 87152416Storek if (vx) 87252416Storek break; 87339615Smckusick vx = vq; 87439615Smckusick } 87552416Storek if (vx == NULL) 87639615Smckusick panic("missing alias"); 87752416Storek if (vq == NULL) 87839615Smckusick vx->v_flag &= ~VALIASED; 87939615Smckusick vp->v_flag &= ~VALIASED; 88039615Smckusick } 88139615Smckusick FREE(vp->v_specinfo, M_VNODE); 88239615Smckusick vp->v_specinfo = NULL; 88339433Smckusick } 88439433Smckusick /* 88539433Smckusick * If it is on the freelist, move it to the head of the list. 88639433Smckusick */ 88739433Smckusick if (vp->v_freeb) { 88839433Smckusick if (vq = vp->v_freef) 88939433Smckusick vq->v_freeb = vp->v_freeb; 89039433Smckusick else 89139433Smckusick vfreet = vp->v_freeb; 89239433Smckusick *vp->v_freeb = vq; 89339433Smckusick vp->v_freef = vfreeh; 89439433Smckusick vp->v_freeb = &vfreeh; 89539433Smckusick vfreeh->v_freeb = &vp->v_freef; 89639433Smckusick vfreeh = vp; 89739433Smckusick } 89839484Smckusick vp->v_type = VBAD; 89939433Smckusick } 90039633Smckusick 90139633Smckusick /* 90239821Smckusick * Lookup a vnode by device number. 90339821Smckusick */ 90439821Smckusick vfinddev(dev, type, vpp) 90539821Smckusick dev_t dev; 90639821Smckusick enum vtype type; 90739821Smckusick struct vnode **vpp; 90839821Smckusick { 90939821Smckusick register struct vnode *vp; 91039821Smckusick 91139821Smckusick for (vp = speclisth[SPECHASH(dev)]; vp; vp = vp->v_specnext) { 91239821Smckusick if (dev != vp->v_rdev || type != vp->v_type) 91339821Smckusick continue; 91439821Smckusick *vpp = vp; 91539821Smckusick return (0); 91639821Smckusick } 91739821Smckusick return (1); 91839821Smckusick } 91939821Smckusick 92039821Smckusick /* 92139633Smckusick * Calculate the total number of references to a special device. 92239633Smckusick */ 92339633Smckusick vcount(vp) 92439633Smckusick register struct vnode *vp; 92539633Smckusick { 92639809Smckusick register struct vnode *vq; 92739633Smckusick int count; 92839633Smckusick 92939633Smckusick if ((vp->v_flag & VALIASED) == 0) 93039809Smckusick return (vp->v_usecount); 93139633Smckusick loop: 93239809Smckusick for (count = 0, vq = *vp->v_hashchain; vq; vq = vq->v_specnext) { 93340108Smckusick if (vq->v_rdev != vp->v_rdev || vq->v_type != vp->v_type) 93439633Smckusick continue; 93539633Smckusick /* 93639633Smckusick * Alias, but not in use, so flush it out. 93739633Smckusick */ 93839809Smckusick if (vq->v_usecount == 0) { 93939633Smckusick vgone(vq); 94039633Smckusick goto loop; 94139633Smckusick } 94239809Smckusick count += vq->v_usecount; 94339633Smckusick } 94439633Smckusick return (count); 94539633Smckusick } 94639667Smckusick 94739667Smckusick /* 94839667Smckusick * Print out a description of a vnode. 94939667Smckusick */ 95039667Smckusick static char *typename[] = 95140286Smckusick { "VNON", "VREG", "VDIR", "VBLK", "VCHR", "VLNK", "VSOCK", "VFIFO", "VBAD" }; 95239667Smckusick 95339667Smckusick vprint(label, vp) 95439667Smckusick char *label; 95539667Smckusick register struct vnode *vp; 95639667Smckusick { 95739913Smckusick char buf[64]; 95839667Smckusick 95939667Smckusick if (label != NULL) 96039667Smckusick printf("%s: ", label); 96150109Smckusick printf("type %s, usecount %d, writecount %d, refcount %d,", 96250109Smckusick typename[vp->v_type], vp->v_usecount, vp->v_writecount, 96350109Smckusick vp->v_holdcnt); 96439913Smckusick buf[0] = '\0'; 96539913Smckusick if (vp->v_flag & VROOT) 96639913Smckusick strcat(buf, "|VROOT"); 96739913Smckusick if (vp->v_flag & VTEXT) 96839913Smckusick strcat(buf, "|VTEXT"); 96941300Smckusick if (vp->v_flag & VSYSTEM) 97041300Smckusick strcat(buf, "|VSYSTEM"); 97141300Smckusick if (vp->v_flag & VXLOCK) 97241300Smckusick strcat(buf, "|VXLOCK"); 97341300Smckusick if (vp->v_flag & VXWANT) 97441300Smckusick strcat(buf, "|VXWANT"); 97541300Smckusick if (vp->v_flag & VBWAIT) 97641300Smckusick strcat(buf, "|VBWAIT"); 97739913Smckusick if (vp->v_flag & VALIASED) 97839913Smckusick strcat(buf, "|VALIASED"); 97939913Smckusick if (buf[0] != '\0') 98039913Smckusick printf(" flags (%s)", &buf[1]); 98139913Smckusick printf("\n\t"); 98239667Smckusick VOP_PRINT(vp); 98339667Smckusick } 98441110Smarc 98549691Smckusick #ifdef DEBUG 98649691Smckusick /* 98749691Smckusick * List all of the locked vnodes in the system. 98849691Smckusick * Called when debugging the kernel. 98949691Smckusick */ 99049691Smckusick printlockedvnodes() 99149691Smckusick { 99249691Smckusick register struct mount *mp; 99349691Smckusick register struct vnode *vp; 99449691Smckusick 99549691Smckusick printf("Locked vnodes\n"); 99649691Smckusick mp = rootfs; 99749691Smckusick do { 99849691Smckusick for (vp = mp->mnt_mounth; vp; vp = vp->v_mountf) 99949691Smckusick if (VOP_ISLOCKED(vp)) 100049691Smckusick vprint((char *)0, vp); 100149691Smckusick mp = mp->mnt_next; 100249691Smckusick } while (mp != rootfs); 100349691Smckusick } 100449691Smckusick #endif 100549691Smckusick 100641110Smarc int kinfo_vdebug = 1; 100741110Smarc int kinfo_vgetfailed; 100841110Smarc #define KINFO_VNODESLOP 10 100941110Smarc /* 101041110Smarc * Dump vnode list (via kinfo). 101141110Smarc * Copyout address of vnode followed by vnode. 101241110Smarc */ 101345118Smckusick /* ARGSUSED */ 101441110Smarc kinfo_vnode(op, where, acopysize, arg, aneeded) 101545118Smckusick int op; 101641110Smarc char *where; 101745118Smckusick int *acopysize, arg, *aneeded; 101841110Smarc { 101941110Smarc register struct mount *mp = rootfs; 102041300Smckusick struct mount *omp; 102141110Smarc struct vnode *vp; 102241110Smarc register char *bp = where, *savebp; 102353818Smckusick char *ewhere; 102441110Smarc int error; 102541110Smarc 102641110Smarc #define VPTRSZ sizeof (struct vnode *) 102741110Smarc #define VNODESZ sizeof (struct vnode) 102841110Smarc if (where == NULL) { 102941110Smarc *aneeded = (numvnodes + KINFO_VNODESLOP) * (VPTRSZ + VNODESZ); 103041110Smarc return (0); 103141110Smarc } 103253818Smckusick ewhere = where + *acopysize; 103341110Smarc 103441110Smarc do { 103541300Smckusick if (vfs_busy(mp)) { 103641400Smckusick mp = mp->mnt_next; 103741300Smckusick continue; 103841300Smckusick } 103941110Smarc savebp = bp; 104041110Smarc again: 104141421Smckusick for (vp = mp->mnt_mounth; vp; vp = vp->v_mountf) { 104241422Smckusick /* 104341422Smckusick * Check that the vp is still associated with 104441422Smckusick * this filesystem. RACE: could have been 104541422Smckusick * recycled onto the same filesystem. 104641422Smckusick */ 104741421Smckusick if (vp->v_mount != mp) { 104841421Smckusick if (kinfo_vdebug) 104941421Smckusick printf("kinfo: vp changed\n"); 105041421Smckusick bp = savebp; 105141421Smckusick goto again; 105241421Smckusick } 105341110Smarc if ((bp + VPTRSZ + VNODESZ <= ewhere) && 105441110Smarc ((error = copyout((caddr_t)&vp, bp, VPTRSZ)) || 105541110Smarc (error = copyout((caddr_t)vp, bp + VPTRSZ, 105641422Smckusick VNODESZ)))) 105741110Smarc return (error); 105841110Smarc bp += VPTRSZ + VNODESZ; 105941110Smarc } 106041300Smckusick omp = mp; 106141400Smckusick mp = mp->mnt_next; 106241300Smckusick vfs_unbusy(omp); 106341110Smarc } while (mp != rootfs); 106441110Smarc 106541110Smarc *aneeded = bp - where; 106641110Smarc if (bp > ewhere) 106741110Smarc *acopysize = ewhere - where; 106841110Smarc else 106941110Smarc *acopysize = bp - where; 107041110Smarc return (0); 107141110Smarc } 1072