123398Smckusick /* 237731Smckusick * Copyright (c) 1982, 1986, 1989 Regents of the University of California. 337731Smckusick * All rights reserved. 423398Smckusick * 544460Sbostic * %sccs.include.redist.c% 637731Smckusick * 7*45744Smckusick * @(#)vfs_vnops.c 7.25 (Berkeley) 12/05/90 823398Smckusick */ 918Sbill 1017099Sbloom #include "param.h" 1117099Sbloom #include "systm.h" 1217099Sbloom #include "user.h" 1337731Smckusick #include "kernel.h" 1417099Sbloom #include "file.h" 1537731Smckusick #include "stat.h" 1637731Smckusick #include "buf.h" 1737731Smckusick #include "proc.h" 1837731Smckusick #include "uio.h" 1917099Sbloom #include "socket.h" 2017099Sbloom #include "socketvar.h" 2137731Smckusick #include "mount.h" 2237731Smckusick #include "vnode.h" 2337731Smckusick #include "ioctl.h" 2437731Smckusick #include "tty.h" 2518Sbill 2637731Smckusick int vn_read(), vn_write(), vn_ioctl(), vn_select(), vn_close(); 2737731Smckusick struct fileops vnops = 2837731Smckusick { vn_read, vn_write, vn_ioctl, vn_select, vn_close }; 2937520Smckusick 3018Sbill /* 3137731Smckusick * Common code for vnode open operations. 3237731Smckusick * Check permissions, and call the VOP_OPEN or VOP_CREATE routine. 3318Sbill */ 3437731Smckusick vn_open(ndp, fmode, cmode) 3537731Smckusick register struct nameidata *ndp; 3637731Smckusick int fmode, cmode; 3737731Smckusick { 3837731Smckusick register struct vnode *vp; 3937731Smckusick struct vattr vat; 4037731Smckusick struct vattr *vap = &vat; 4137731Smckusick int error; 4237731Smckusick 4337731Smckusick if (fmode & FCREAT) { 4437731Smckusick ndp->ni_nameiop = CREATE | LOCKPARENT | LOCKLEAF; 4537731Smckusick if ((fmode & FEXCL) == 0) 4637731Smckusick ndp->ni_nameiop |= FOLLOW; 4737731Smckusick if (error = namei(ndp)) 4837731Smckusick return (error); 4937731Smckusick if (ndp->ni_vp == NULL) { 5041362Smckusick VATTR_NULL(vap); 5137731Smckusick vap->va_type = VREG; 5237731Smckusick vap->va_mode = cmode; 5337731Smckusick if (error = VOP_CREATE(ndp, vap)) 5437731Smckusick return (error); 5537731Smckusick fmode &= ~FTRUNC; 5637731Smckusick vp = ndp->ni_vp; 5737731Smckusick } else { 5839761Smckusick if (ndp->ni_dvp == ndp->ni_vp) 5939761Smckusick vrele(ndp->ni_dvp); 6043343Smckusick else 6139761Smckusick vput(ndp->ni_dvp); 6239761Smckusick ndp->ni_dvp = NULL; 6337731Smckusick vp = ndp->ni_vp; 6437731Smckusick if (fmode & FEXCL) { 6537731Smckusick error = EEXIST; 6637731Smckusick goto bad; 6737731Smckusick } 6837731Smckusick fmode &= ~FCREAT; 6937731Smckusick } 7037731Smckusick } else { 7137731Smckusick ndp->ni_nameiop = LOOKUP | FOLLOW | LOCKLEAF; 7237731Smckusick if (error = namei(ndp)) 7337731Smckusick return (error); 7437731Smckusick vp = ndp->ni_vp; 7537731Smckusick } 7637731Smckusick if (vp->v_type == VSOCK) { 7737731Smckusick error = EOPNOTSUPP; 7837731Smckusick goto bad; 7937731Smckusick } 8037731Smckusick if ((fmode & FCREAT) == 0) { 8137731Smckusick if (fmode & FREAD) { 8238401Smckusick if (error = VOP_ACCESS(vp, VREAD, ndp->ni_cred)) 8337731Smckusick goto bad; 8437731Smckusick } 8537731Smckusick if (fmode & (FWRITE|FTRUNC)) { 8637731Smckusick if (vp->v_type == VDIR) { 8737731Smckusick error = EISDIR; 8837731Smckusick goto bad; 8937731Smckusick } 9038401Smckusick if ((error = vn_writechk(vp)) || 9138401Smckusick (error = VOP_ACCESS(vp, VWRITE, ndp->ni_cred))) 9238401Smckusick goto bad; 9337731Smckusick } 9437731Smckusick } 9537731Smckusick if (fmode & FTRUNC) { 9641362Smckusick VATTR_NULL(vap); 9737731Smckusick vap->va_size = 0; 9837731Smckusick if (error = VOP_SETATTR(vp, vap, ndp->ni_cred)) 9937731Smckusick goto bad; 10037731Smckusick } 10137731Smckusick VOP_UNLOCK(vp); 10238351Smckusick error = VOP_OPEN(vp, fmode, ndp->ni_cred); 10338351Smckusick if (error) 10438351Smckusick vrele(vp); 10538351Smckusick return (error); 10637731Smckusick 10737731Smckusick bad: 10837731Smckusick vput(vp); 10940707Skarels return (error); 11037731Smckusick } 11137731Smckusick 11237731Smckusick /* 11338401Smckusick * Check for write permissions on the specified vnode. 11438401Smckusick * The read-only status of the file system is checked. 11538401Smckusick * Also, prototype text segments cannot be written. 11637731Smckusick */ 11738401Smckusick vn_writechk(vp) 11837731Smckusick register struct vnode *vp; 11918Sbill { 12018Sbill 12138401Smckusick /* 12238401Smckusick * Disallow write attempts on read-only file systems; 12338401Smckusick * unless the file is a socket or a block or character 12438401Smckusick * device resident on the file system. 12538401Smckusick */ 12645060Smckusick if (vp->v_mount->mnt_flag & MNT_RDONLY) { 12745060Smckusick switch (vp->v_type) { 12845060Smckusick case VREG: case VDIR: case VLNK: 12945060Smckusick return (EROFS); 13045060Smckusick } 13145060Smckusick } 13238401Smckusick /* 13338401Smckusick * If there's shared text associated with 13438401Smckusick * the vnode, try to free it up once. If 13538401Smckusick * we fail, we can't allow writing. 13638401Smckusick */ 137*45744Smckusick if ((vp->v_flag & VTEXT) && !vnode_pager_uncache(vp)) 13838401Smckusick return (ETXTBSY); 13938401Smckusick return (0); 14037731Smckusick } 14137731Smckusick 14237731Smckusick /* 14337731Smckusick * Vnode version of rdwri() for calls on file systems. 14437731Smckusick */ 14537731Smckusick vn_rdwr(rw, vp, base, len, offset, segflg, ioflg, cred, aresid) 14637731Smckusick enum uio_rw rw; 14737731Smckusick struct vnode *vp; 14837731Smckusick caddr_t base; 14937731Smckusick int len; 15037731Smckusick off_t offset; 15137731Smckusick enum uio_seg segflg; 15237731Smckusick int ioflg; 15337731Smckusick struct ucred *cred; 15437731Smckusick int *aresid; 15537731Smckusick { 15637731Smckusick struct uio auio; 15737731Smckusick struct iovec aiov; 15837731Smckusick int error; 15937731Smckusick 16039590Smckusick if ((ioflg & IO_NODELOCKED) == 0) 16139590Smckusick VOP_LOCK(vp); 16237731Smckusick auio.uio_iov = &aiov; 16337731Smckusick auio.uio_iovcnt = 1; 16437731Smckusick aiov.iov_base = base; 16537731Smckusick aiov.iov_len = len; 16637731Smckusick auio.uio_resid = len; 16737731Smckusick auio.uio_offset = offset; 16837731Smckusick auio.uio_segflg = segflg; 16937731Smckusick auio.uio_rw = rw; 17037731Smckusick if (rw == UIO_READ) 17139590Smckusick error = VOP_READ(vp, &auio, ioflg, cred); 17237731Smckusick else 17339590Smckusick error = VOP_WRITE(vp, &auio, ioflg, cred); 17437731Smckusick if (aresid) 17537731Smckusick *aresid = auio.uio_resid; 17637731Smckusick else 17737731Smckusick if (auio.uio_resid && error == 0) 17837731Smckusick error = EIO; 17939590Smckusick if ((ioflg & IO_NODELOCKED) == 0) 18039590Smckusick VOP_UNLOCK(vp); 18137731Smckusick return (error); 18237731Smckusick } 18337731Smckusick 18437731Smckusick vn_read(fp, uio, cred) 18537731Smckusick struct file *fp; 18637731Smckusick struct uio *uio; 18737731Smckusick struct ucred *cred; 18837731Smckusick { 18939590Smckusick register struct vnode *vp = (struct vnode *)fp->f_data; 19039590Smckusick int count, error; 19137731Smckusick 19239590Smckusick VOP_LOCK(vp); 19339590Smckusick uio->uio_offset = fp->f_offset; 19439590Smckusick count = uio->uio_resid; 19539590Smckusick error = VOP_READ(vp, uio, (fp->f_flag & FNDELAY) ? IO_NDELAY : 0, cred); 19639590Smckusick fp->f_offset += count - uio->uio_resid; 19739590Smckusick VOP_UNLOCK(vp); 19839590Smckusick return (error); 19937731Smckusick } 20037731Smckusick 20137731Smckusick vn_write(fp, uio, cred) 20237731Smckusick struct file *fp; 20337731Smckusick struct uio *uio; 20437731Smckusick struct ucred *cred; 20537731Smckusick { 20637731Smckusick register struct vnode *vp = (struct vnode *)fp->f_data; 20739590Smckusick int count, error, ioflag = 0; 20837731Smckusick 20937731Smckusick if (vp->v_type == VREG && (fp->f_flag & FAPPEND)) 21037731Smckusick ioflag |= IO_APPEND; 21137731Smckusick if (fp->f_flag & FNDELAY) 21237731Smckusick ioflag |= IO_NDELAY; 21339590Smckusick VOP_LOCK(vp); 21439590Smckusick uio->uio_offset = fp->f_offset; 21539590Smckusick count = uio->uio_resid; 21639590Smckusick error = VOP_WRITE(vp, uio, ioflag, cred); 21739590Smckusick if (ioflag & IO_APPEND) 21839590Smckusick fp->f_offset = uio->uio_offset; 21939590Smckusick else 22039590Smckusick fp->f_offset += count - uio->uio_resid; 22139590Smckusick VOP_UNLOCK(vp); 22239590Smckusick return (error); 22337731Smckusick } 22437731Smckusick 22537731Smckusick /* 22637731Smckusick * Get stat info for a vnode. 22737731Smckusick */ 22837731Smckusick vn_stat(vp, sb) 22937731Smckusick struct vnode *vp; 23037731Smckusick register struct stat *sb; 23137731Smckusick { 23237731Smckusick struct vattr vattr; 23337731Smckusick register struct vattr *vap; 23437731Smckusick int error; 23537731Smckusick u_short mode; 23637731Smckusick 23737731Smckusick vap = &vattr; 23837731Smckusick error = VOP_GETATTR(vp, vap, u.u_cred); 23937731Smckusick if (error) 24037731Smckusick return (error); 24137731Smckusick /* 24237731Smckusick * Copy from vattr table 24337731Smckusick */ 24437731Smckusick sb->st_dev = vap->va_fsid; 24537731Smckusick sb->st_ino = vap->va_fileid; 24637731Smckusick mode = vap->va_mode; 24737731Smckusick switch (vp->v_type) { 24837731Smckusick case VREG: 24939382Smckusick mode |= S_IFREG; 25037731Smckusick break; 25137731Smckusick case VDIR: 25239382Smckusick mode |= S_IFDIR; 25337731Smckusick break; 25437731Smckusick case VBLK: 25539382Smckusick mode |= S_IFBLK; 25637731Smckusick break; 25737731Smckusick case VCHR: 25839382Smckusick mode |= S_IFCHR; 25937731Smckusick break; 26037731Smckusick case VLNK: 26139382Smckusick mode |= S_IFLNK; 26237731Smckusick break; 26337731Smckusick case VSOCK: 26439382Smckusick mode |= S_IFSOCK; 26537731Smckusick break; 26640284Smckusick case VFIFO: 26740284Smckusick mode |= S_IFIFO; 26840284Smckusick break; 26937731Smckusick default: 27037731Smckusick return (EBADF); 27137731Smckusick }; 27237731Smckusick sb->st_mode = mode; 27337731Smckusick sb->st_nlink = vap->va_nlink; 27437731Smckusick sb->st_uid = vap->va_uid; 27537731Smckusick sb->st_gid = vap->va_gid; 27637731Smckusick sb->st_rdev = vap->va_rdev; 27737731Smckusick sb->st_size = vap->va_size; 27837731Smckusick sb->st_atime = vap->va_atime.tv_sec; 27937731Smckusick sb->st_spare1 = 0; 28037731Smckusick sb->st_mtime = vap->va_mtime.tv_sec; 28137731Smckusick sb->st_spare2 = 0; 28237731Smckusick sb->st_ctime = vap->va_ctime.tv_sec; 28337731Smckusick sb->st_spare3 = 0; 28437731Smckusick sb->st_blksize = vap->va_blocksize; 28538257Smckusick sb->st_flags = vap->va_flags; 28638257Smckusick sb->st_gen = vap->va_gen; 28738769Smckusick sb->st_blocks = vap->va_bytes / S_BLKSIZE; 28837731Smckusick return (0); 28937731Smckusick } 29037731Smckusick 29137731Smckusick /* 29237731Smckusick * Vnode ioctl call 29337731Smckusick */ 29437731Smckusick vn_ioctl(fp, com, data) 29537731Smckusick struct file *fp; 29637731Smckusick int com; 29737731Smckusick caddr_t data; 29837731Smckusick { 29937731Smckusick register struct vnode *vp = ((struct vnode *)fp->f_data); 30037731Smckusick struct vattr vattr; 30137731Smckusick int error; 30237731Smckusick 30337731Smckusick switch (vp->v_type) { 30437731Smckusick 30537731Smckusick case VREG: 30637731Smckusick case VDIR: 30737731Smckusick if (com == FIONREAD) { 30837731Smckusick if (error = VOP_GETATTR(vp, &vattr, u.u_cred)) 30937731Smckusick return (error); 31037731Smckusick *(off_t *)data = vattr.va_size - fp->f_offset; 31137731Smckusick return (0); 31218Sbill } 31337731Smckusick if (com == FIONBIO || com == FIOASYNC) /* XXX */ 31437731Smckusick return (0); /* XXX */ 31537731Smckusick /* fall into ... */ 31637731Smckusick 31737731Smckusick default: 31837731Smckusick return (ENOTTY); 31937731Smckusick 32040284Smckusick case VFIFO: 32137731Smckusick case VCHR: 32237731Smckusick case VBLK: 32339564Smarc error = VOP_IOCTL(vp, com, data, fp->f_flag, u.u_cred); 32439564Smarc if (error == 0 && com == TIOCSCTTY) { 32539564Smarc u.u_procp->p_session->s_ttyvp = vp; 32639564Smarc VREF(vp); 32739564Smarc } 32839564Smarc return (error); 32918Sbill } 33037731Smckusick } 33137731Smckusick 33237731Smckusick /* 33337731Smckusick * Vnode select call 33437731Smckusick */ 33537731Smckusick vn_select(fp, which) 33637731Smckusick struct file *fp; 33737731Smckusick int which; 33837731Smckusick { 33940707Skarels return (VOP_SELECT(((struct vnode *)fp->f_data), which, fp->f_flag, 34040284Smckusick u.u_cred)); 34137731Smckusick } 34237731Smckusick 34337731Smckusick /* 34437731Smckusick * Vnode close call 34537731Smckusick */ 34637731Smckusick vn_close(fp) 34737731Smckusick register struct file *fp; 34837731Smckusick { 34937731Smckusick struct vnode *vp = ((struct vnode *)fp->f_data); 35037731Smckusick int error; 35137731Smckusick 35237731Smckusick if (fp->f_flag & (FSHLOCK|FEXLOCK)) 35337731Smckusick vn_unlock(fp, FSHLOCK|FEXLOCK); 35411162Ssam /* 35537731Smckusick * Must delete vnode reference from this file entry 35637731Smckusick * before VOP_CLOSE, so that only other references 35737731Smckusick * will prevent close. 35811162Ssam */ 35937731Smckusick fp->f_data = (caddr_t) 0; 36037731Smckusick error = VOP_CLOSE(vp, fp->f_flag, u.u_cred); 36137731Smckusick vrele(vp); 36237731Smckusick return (error); 36337731Smckusick } 36437731Smckusick 36537731Smckusick /* 36637731Smckusick * Place an advisory lock on a vnode. 36737731Smckusick * !! THIS IMPLIES THAT ALL STATEFUL FILE SERVERS WILL USE file table entries 36837731Smckusick */ 36937731Smckusick vn_lock(fp, cmd) 37037731Smckusick register struct file *fp; 37137731Smckusick int cmd; 37237731Smckusick { 37337731Smckusick register int priority = PLOCK; 37437731Smckusick register struct vnode *vp = (struct vnode *)fp->f_data; 37540707Skarels int error = 0; 37640707Skarels static char lockstr[] = "flock"; 37737731Smckusick 37837731Smckusick if ((cmd & LOCK_EX) == 0) 37937731Smckusick priority += 4; 38040707Skarels priority |= PCATCH; 38140707Skarels 38211162Ssam /* 38337731Smckusick * If there's a exclusive lock currently applied 38437731Smckusick * to the file, then we've gotta wait for the 38537731Smckusick * lock with everyone else. 38611162Ssam */ 38737731Smckusick again: 38837731Smckusick while (vp->v_flag & VEXLOCK) { 38937731Smckusick /* 39037731Smckusick * If we're holding an exclusive 39137731Smckusick * lock, then release it. 39237731Smckusick */ 39337731Smckusick if (fp->f_flag & FEXLOCK) { 39437731Smckusick vn_unlock(fp, FEXLOCK); 39537731Smckusick continue; 39637731Smckusick } 39737731Smckusick if (cmd & LOCK_NB) 39837731Smckusick return (EWOULDBLOCK); 39937731Smckusick vp->v_flag |= VLWAIT; 40040707Skarels if (error = tsleep((caddr_t)&vp->v_exlockc, priority, 40140707Skarels lockstr, 0)) 40240707Skarels return (error); 40318Sbill } 40445060Smckusick if (error == 0 && (cmd & LOCK_EX) && (vp->v_flag & VSHLOCK)) { 40537731Smckusick /* 40637731Smckusick * Must wait for any shared locks to finish 40737731Smckusick * before we try to apply a exclusive lock. 40837731Smckusick * 40937731Smckusick * If we're holding a shared 41037731Smckusick * lock, then release it. 41137731Smckusick */ 41237731Smckusick if (fp->f_flag & FSHLOCK) { 41337731Smckusick vn_unlock(fp, FSHLOCK); 41437731Smckusick goto again; 41537731Smckusick } 41637731Smckusick if (cmd & LOCK_NB) 41737731Smckusick return (EWOULDBLOCK); 41837731Smckusick vp->v_flag |= VLWAIT; 41940707Skarels if (error = tsleep((caddr_t)&vp->v_shlockc, PLOCK | PCATCH, 42045060Smckusick lockstr, 0)) 42140707Skarels return (error); 42237731Smckusick } 42337731Smckusick if (fp->f_flag & FEXLOCK) 42437731Smckusick panic("vn_lock"); 42537731Smckusick if (cmd & LOCK_EX) { 42637731Smckusick cmd &= ~LOCK_SH; 42737731Smckusick vp->v_exlockc++; 42837731Smckusick vp->v_flag |= VEXLOCK; 42937731Smckusick fp->f_flag |= FEXLOCK; 43037731Smckusick } 43137731Smckusick if ((cmd & LOCK_SH) && (fp->f_flag & FSHLOCK) == 0) { 43237731Smckusick vp->v_shlockc++; 43337731Smckusick vp->v_flag |= VSHLOCK; 43437731Smckusick fp->f_flag |= FSHLOCK; 43537731Smckusick } 43637731Smckusick return (0); 43718Sbill } 43818Sbill 43918Sbill /* 44037731Smckusick * Unlock a file. 44118Sbill */ 44237731Smckusick vn_unlock(fp, kind) 44337731Smckusick register struct file *fp; 44437731Smckusick int kind; 44518Sbill { 44637731Smckusick register struct vnode *vp = (struct vnode *)fp->f_data; 44737731Smckusick int flags; 44818Sbill 44937731Smckusick kind &= fp->f_flag; 45037731Smckusick if (vp == NULL || kind == 0) 45137731Smckusick return; 45237731Smckusick flags = vp->v_flag; 45337731Smckusick if (kind & FSHLOCK) { 45437731Smckusick if ((flags & VSHLOCK) == 0) 45537731Smckusick panic("vn_unlock: SHLOCK"); 45637731Smckusick if (--vp->v_shlockc == 0) { 45737731Smckusick vp->v_flag &= ~VSHLOCK; 45837731Smckusick if (flags & VLWAIT) 45937731Smckusick wakeup((caddr_t)&vp->v_shlockc); 46037731Smckusick } 46137731Smckusick fp->f_flag &= ~FSHLOCK; 46237552Smckusick } 46337731Smckusick if (kind & FEXLOCK) { 46437731Smckusick if ((flags & VEXLOCK) == 0) 46537731Smckusick panic("vn_unlock: EXLOCK"); 46637731Smckusick if (--vp->v_exlockc == 0) { 46737731Smckusick vp->v_flag &= ~(VEXLOCK|VLWAIT); 46837731Smckusick if (flags & VLWAIT) 46937731Smckusick wakeup((caddr_t)&vp->v_exlockc); 47037731Smckusick } 47137731Smckusick fp->f_flag &= ~FEXLOCK; 47237731Smckusick } 47318Sbill } 47418Sbill 47518Sbill /* 47637731Smckusick * vn_fhtovp() - convert a fh to a vnode ptr (optionally locked) 47737731Smckusick * - look up fsid in mount list (if not found ret error) 47837731Smckusick * - get vp by calling VFS_FHTOVP() macro 47937731Smckusick * - if lockflag lock it with VOP_LOCK() 48018Sbill */ 48137731Smckusick vn_fhtovp(fhp, lockflag, vpp) 48237731Smckusick fhandle_t *fhp; 48337731Smckusick int lockflag; 48437731Smckusick struct vnode **vpp; 48518Sbill { 48637731Smckusick register struct mount *mp; 48718Sbill 48837731Smckusick if ((mp = getvfs(&fhp->fh_fsid)) == NULL) 48937731Smckusick return (ESTALE); 49038146Smckusick if (VFS_FHTOVP(mp, &fhp->fh_fid, vpp)) 49138146Smckusick return (ESTALE); 49238146Smckusick if (!lockflag) 49338146Smckusick VOP_UNLOCK(*vpp); 49437731Smckusick return (0); 49537731Smckusick } 49637731Smckusick 49737731Smckusick /* 49837731Smckusick * Noop 49937731Smckusick */ 50037731Smckusick vfs_noop() 50137731Smckusick { 50237731Smckusick 50337731Smckusick return (ENXIO); 50437731Smckusick } 50537731Smckusick 50637731Smckusick /* 50737731Smckusick * Null op 50837731Smckusick */ 50937731Smckusick vfs_nullop() 51037731Smckusick { 51137731Smckusick 51237731Smckusick return (0); 51337731Smckusick } 514