123398Smckusick /* 237731Smckusick * Copyright (c) 1982, 1986, 1989 Regents of the University of California. 337731Smckusick * All rights reserved. 423398Smckusick * 544460Sbostic * %sccs.include.redist.c% 637731Smckusick * 7*45060Smckusick * @(#)vfs_vnops.c 7.24 (Berkeley) 08/22/90 823398Smckusick */ 918Sbill 1017099Sbloom #include "param.h" 1117099Sbloom #include "systm.h" 1217099Sbloom #include "user.h" 1337731Smckusick #include "kernel.h" 1417099Sbloom #include "file.h" 1537731Smckusick #include "stat.h" 1637731Smckusick #include "buf.h" 1737731Smckusick #include "proc.h" 1837731Smckusick #include "uio.h" 1917099Sbloom #include "socket.h" 2017099Sbloom #include "socketvar.h" 2137731Smckusick #include "mount.h" 2237731Smckusick #include "vnode.h" 2337731Smckusick #include "ioctl.h" 2437731Smckusick #include "tty.h" 2518Sbill 2637731Smckusick int vn_read(), vn_write(), vn_ioctl(), vn_select(), vn_close(); 2737731Smckusick struct fileops vnops = 2837731Smckusick { vn_read, vn_write, vn_ioctl, vn_select, vn_close }; 2937520Smckusick 3018Sbill /* 3137731Smckusick * Common code for vnode open operations. 3237731Smckusick * Check permissions, and call the VOP_OPEN or VOP_CREATE routine. 3318Sbill */ 3437731Smckusick vn_open(ndp, fmode, cmode) 3537731Smckusick register struct nameidata *ndp; 3637731Smckusick int fmode, cmode; 3737731Smckusick { 3837731Smckusick register struct vnode *vp; 3937731Smckusick struct vattr vat; 4037731Smckusick struct vattr *vap = &vat; 4137731Smckusick int error; 4237731Smckusick 4337731Smckusick if (fmode & FCREAT) { 4437731Smckusick ndp->ni_nameiop = CREATE | LOCKPARENT | LOCKLEAF; 4537731Smckusick if ((fmode & FEXCL) == 0) 4637731Smckusick ndp->ni_nameiop |= FOLLOW; 4737731Smckusick if (error = namei(ndp)) 4837731Smckusick return (error); 4937731Smckusick if (ndp->ni_vp == NULL) { 5041362Smckusick VATTR_NULL(vap); 5137731Smckusick vap->va_type = VREG; 5237731Smckusick vap->va_mode = cmode; 5337731Smckusick if (error = VOP_CREATE(ndp, vap)) 5437731Smckusick return (error); 5537731Smckusick fmode &= ~FTRUNC; 5637731Smckusick vp = ndp->ni_vp; 5737731Smckusick } else { 5839761Smckusick if (ndp->ni_dvp == ndp->ni_vp) 5939761Smckusick vrele(ndp->ni_dvp); 6043343Smckusick else 6139761Smckusick vput(ndp->ni_dvp); 6239761Smckusick ndp->ni_dvp = NULL; 6337731Smckusick vp = ndp->ni_vp; 6437731Smckusick if (fmode & FEXCL) { 6537731Smckusick error = EEXIST; 6637731Smckusick goto bad; 6737731Smckusick } 6837731Smckusick fmode &= ~FCREAT; 6937731Smckusick } 7037731Smckusick } else { 7137731Smckusick ndp->ni_nameiop = LOOKUP | FOLLOW | LOCKLEAF; 7237731Smckusick if (error = namei(ndp)) 7337731Smckusick return (error); 7437731Smckusick vp = ndp->ni_vp; 7537731Smckusick } 7637731Smckusick if (vp->v_type == VSOCK) { 7737731Smckusick error = EOPNOTSUPP; 7837731Smckusick goto bad; 7937731Smckusick } 8037731Smckusick if ((fmode & FCREAT) == 0) { 8137731Smckusick if (fmode & FREAD) { 8238401Smckusick if (error = VOP_ACCESS(vp, VREAD, ndp->ni_cred)) 8337731Smckusick goto bad; 8437731Smckusick } 8537731Smckusick if (fmode & (FWRITE|FTRUNC)) { 8637731Smckusick if (vp->v_type == VDIR) { 8737731Smckusick error = EISDIR; 8837731Smckusick goto bad; 8937731Smckusick } 9038401Smckusick if ((error = vn_writechk(vp)) || 9138401Smckusick (error = VOP_ACCESS(vp, VWRITE, ndp->ni_cred))) 9238401Smckusick goto bad; 9337731Smckusick } 9437731Smckusick } 9537731Smckusick if (fmode & FTRUNC) { 9641362Smckusick VATTR_NULL(vap); 9737731Smckusick vap->va_size = 0; 9837731Smckusick if (error = VOP_SETATTR(vp, vap, ndp->ni_cred)) 9937731Smckusick goto bad; 10037731Smckusick } 10137731Smckusick VOP_UNLOCK(vp); 10238351Smckusick error = VOP_OPEN(vp, fmode, ndp->ni_cred); 10338351Smckusick if (error) 10438351Smckusick vrele(vp); 10538351Smckusick return (error); 10637731Smckusick 10737731Smckusick bad: 10837731Smckusick vput(vp); 10940707Skarels return (error); 11037731Smckusick } 11137731Smckusick 11237731Smckusick /* 11338401Smckusick * Check for write permissions on the specified vnode. 11438401Smckusick * The read-only status of the file system is checked. 11538401Smckusick * Also, prototype text segments cannot be written. 11637731Smckusick */ 11738401Smckusick vn_writechk(vp) 11837731Smckusick register struct vnode *vp; 11918Sbill { 12018Sbill 12138401Smckusick /* 12238401Smckusick * Disallow write attempts on read-only file systems; 12338401Smckusick * unless the file is a socket or a block or character 12438401Smckusick * device resident on the file system. 12538401Smckusick */ 126*45060Smckusick if (vp->v_mount->mnt_flag & MNT_RDONLY) { 127*45060Smckusick switch (vp->v_type) { 128*45060Smckusick case VREG: case VDIR: case VLNK: 129*45060Smckusick return (EROFS); 130*45060Smckusick } 131*45060Smckusick } 13238401Smckusick /* 13338401Smckusick * If there's shared text associated with 13438401Smckusick * the vnode, try to free it up once. If 13538401Smckusick * we fail, we can't allow writing. 13638401Smckusick */ 13738401Smckusick if (vp->v_flag & VTEXT) 13838401Smckusick xrele(vp); 13938401Smckusick if (vp->v_flag & VTEXT) 14038401Smckusick return (ETXTBSY); 14138401Smckusick return (0); 14237731Smckusick } 14337731Smckusick 14437731Smckusick /* 14537731Smckusick * Vnode version of rdwri() for calls on file systems. 14637731Smckusick */ 14737731Smckusick vn_rdwr(rw, vp, base, len, offset, segflg, ioflg, cred, aresid) 14837731Smckusick enum uio_rw rw; 14937731Smckusick struct vnode *vp; 15037731Smckusick caddr_t base; 15137731Smckusick int len; 15237731Smckusick off_t offset; 15337731Smckusick enum uio_seg segflg; 15437731Smckusick int ioflg; 15537731Smckusick struct ucred *cred; 15637731Smckusick int *aresid; 15737731Smckusick { 15837731Smckusick struct uio auio; 15937731Smckusick struct iovec aiov; 16037731Smckusick int error; 16137731Smckusick 16239590Smckusick if ((ioflg & IO_NODELOCKED) == 0) 16339590Smckusick VOP_LOCK(vp); 16437731Smckusick auio.uio_iov = &aiov; 16537731Smckusick auio.uio_iovcnt = 1; 16637731Smckusick aiov.iov_base = base; 16737731Smckusick aiov.iov_len = len; 16837731Smckusick auio.uio_resid = len; 16937731Smckusick auio.uio_offset = offset; 17037731Smckusick auio.uio_segflg = segflg; 17137731Smckusick auio.uio_rw = rw; 17237731Smckusick if (rw == UIO_READ) 17339590Smckusick error = VOP_READ(vp, &auio, ioflg, cred); 17437731Smckusick else 17539590Smckusick error = VOP_WRITE(vp, &auio, ioflg, cred); 17637731Smckusick if (aresid) 17737731Smckusick *aresid = auio.uio_resid; 17837731Smckusick else 17937731Smckusick if (auio.uio_resid && error == 0) 18037731Smckusick error = EIO; 18139590Smckusick if ((ioflg & IO_NODELOCKED) == 0) 18239590Smckusick VOP_UNLOCK(vp); 18337731Smckusick return (error); 18437731Smckusick } 18537731Smckusick 18637731Smckusick vn_read(fp, uio, cred) 18737731Smckusick struct file *fp; 18837731Smckusick struct uio *uio; 18937731Smckusick struct ucred *cred; 19037731Smckusick { 19139590Smckusick register struct vnode *vp = (struct vnode *)fp->f_data; 19239590Smckusick int count, error; 19337731Smckusick 19439590Smckusick VOP_LOCK(vp); 19539590Smckusick uio->uio_offset = fp->f_offset; 19639590Smckusick count = uio->uio_resid; 19739590Smckusick error = VOP_READ(vp, uio, (fp->f_flag & FNDELAY) ? IO_NDELAY : 0, cred); 19839590Smckusick fp->f_offset += count - uio->uio_resid; 19939590Smckusick VOP_UNLOCK(vp); 20039590Smckusick return (error); 20137731Smckusick } 20237731Smckusick 20337731Smckusick vn_write(fp, uio, cred) 20437731Smckusick struct file *fp; 20537731Smckusick struct uio *uio; 20637731Smckusick struct ucred *cred; 20737731Smckusick { 20837731Smckusick register struct vnode *vp = (struct vnode *)fp->f_data; 20939590Smckusick int count, error, ioflag = 0; 21037731Smckusick 21137731Smckusick if (vp->v_type == VREG && (fp->f_flag & FAPPEND)) 21237731Smckusick ioflag |= IO_APPEND; 21337731Smckusick if (fp->f_flag & FNDELAY) 21437731Smckusick ioflag |= IO_NDELAY; 21539590Smckusick VOP_LOCK(vp); 21639590Smckusick uio->uio_offset = fp->f_offset; 21739590Smckusick count = uio->uio_resid; 21839590Smckusick error = VOP_WRITE(vp, uio, ioflag, cred); 21939590Smckusick if (ioflag & IO_APPEND) 22039590Smckusick fp->f_offset = uio->uio_offset; 22139590Smckusick else 22239590Smckusick fp->f_offset += count - uio->uio_resid; 22339590Smckusick VOP_UNLOCK(vp); 22439590Smckusick return (error); 22537731Smckusick } 22637731Smckusick 22737731Smckusick /* 22837731Smckusick * Get stat info for a vnode. 22937731Smckusick */ 23037731Smckusick vn_stat(vp, sb) 23137731Smckusick struct vnode *vp; 23237731Smckusick register struct stat *sb; 23337731Smckusick { 23437731Smckusick struct vattr vattr; 23537731Smckusick register struct vattr *vap; 23637731Smckusick int error; 23737731Smckusick u_short mode; 23837731Smckusick 23937731Smckusick vap = &vattr; 24037731Smckusick error = VOP_GETATTR(vp, vap, u.u_cred); 24137731Smckusick if (error) 24237731Smckusick return (error); 24337731Smckusick /* 24437731Smckusick * Copy from vattr table 24537731Smckusick */ 24637731Smckusick sb->st_dev = vap->va_fsid; 24737731Smckusick sb->st_ino = vap->va_fileid; 24837731Smckusick mode = vap->va_mode; 24937731Smckusick switch (vp->v_type) { 25037731Smckusick case VREG: 25139382Smckusick mode |= S_IFREG; 25237731Smckusick break; 25337731Smckusick case VDIR: 25439382Smckusick mode |= S_IFDIR; 25537731Smckusick break; 25637731Smckusick case VBLK: 25739382Smckusick mode |= S_IFBLK; 25837731Smckusick break; 25937731Smckusick case VCHR: 26039382Smckusick mode |= S_IFCHR; 26137731Smckusick break; 26237731Smckusick case VLNK: 26339382Smckusick mode |= S_IFLNK; 26437731Smckusick break; 26537731Smckusick case VSOCK: 26639382Smckusick mode |= S_IFSOCK; 26737731Smckusick break; 26840284Smckusick case VFIFO: 26940284Smckusick mode |= S_IFIFO; 27040284Smckusick break; 27137731Smckusick default: 27237731Smckusick return (EBADF); 27337731Smckusick }; 27437731Smckusick sb->st_mode = mode; 27537731Smckusick sb->st_nlink = vap->va_nlink; 27637731Smckusick sb->st_uid = vap->va_uid; 27737731Smckusick sb->st_gid = vap->va_gid; 27837731Smckusick sb->st_rdev = vap->va_rdev; 27937731Smckusick sb->st_size = vap->va_size; 28037731Smckusick sb->st_atime = vap->va_atime.tv_sec; 28137731Smckusick sb->st_spare1 = 0; 28237731Smckusick sb->st_mtime = vap->va_mtime.tv_sec; 28337731Smckusick sb->st_spare2 = 0; 28437731Smckusick sb->st_ctime = vap->va_ctime.tv_sec; 28537731Smckusick sb->st_spare3 = 0; 28637731Smckusick sb->st_blksize = vap->va_blocksize; 28738257Smckusick sb->st_flags = vap->va_flags; 28838257Smckusick sb->st_gen = vap->va_gen; 28938769Smckusick sb->st_blocks = vap->va_bytes / S_BLKSIZE; 29037731Smckusick return (0); 29137731Smckusick } 29237731Smckusick 29337731Smckusick /* 29437731Smckusick * Vnode ioctl call 29537731Smckusick */ 29637731Smckusick vn_ioctl(fp, com, data) 29737731Smckusick struct file *fp; 29837731Smckusick int com; 29937731Smckusick caddr_t data; 30037731Smckusick { 30137731Smckusick register struct vnode *vp = ((struct vnode *)fp->f_data); 30237731Smckusick struct vattr vattr; 30337731Smckusick int error; 30437731Smckusick 30537731Smckusick switch (vp->v_type) { 30637731Smckusick 30737731Smckusick case VREG: 30837731Smckusick case VDIR: 30937731Smckusick if (com == FIONREAD) { 31037731Smckusick if (error = VOP_GETATTR(vp, &vattr, u.u_cred)) 31137731Smckusick return (error); 31237731Smckusick *(off_t *)data = vattr.va_size - fp->f_offset; 31337731Smckusick return (0); 31418Sbill } 31537731Smckusick if (com == FIONBIO || com == FIOASYNC) /* XXX */ 31637731Smckusick return (0); /* XXX */ 31737731Smckusick /* fall into ... */ 31837731Smckusick 31937731Smckusick default: 32037731Smckusick return (ENOTTY); 32137731Smckusick 32240284Smckusick case VFIFO: 32337731Smckusick case VCHR: 32437731Smckusick case VBLK: 32539564Smarc error = VOP_IOCTL(vp, com, data, fp->f_flag, u.u_cred); 32639564Smarc if (error == 0 && com == TIOCSCTTY) { 32739564Smarc u.u_procp->p_session->s_ttyvp = vp; 32839564Smarc VREF(vp); 32939564Smarc } 33039564Smarc return (error); 33118Sbill } 33237731Smckusick } 33337731Smckusick 33437731Smckusick /* 33537731Smckusick * Vnode select call 33637731Smckusick */ 33737731Smckusick vn_select(fp, which) 33837731Smckusick struct file *fp; 33937731Smckusick int which; 34037731Smckusick { 34140707Skarels return (VOP_SELECT(((struct vnode *)fp->f_data), which, fp->f_flag, 34240284Smckusick u.u_cred)); 34337731Smckusick } 34437731Smckusick 34537731Smckusick /* 34637731Smckusick * Vnode close call 34737731Smckusick */ 34837731Smckusick vn_close(fp) 34937731Smckusick register struct file *fp; 35037731Smckusick { 35137731Smckusick struct vnode *vp = ((struct vnode *)fp->f_data); 35237731Smckusick int error; 35337731Smckusick 35437731Smckusick if (fp->f_flag & (FSHLOCK|FEXLOCK)) 35537731Smckusick vn_unlock(fp, FSHLOCK|FEXLOCK); 35611162Ssam /* 35737731Smckusick * Must delete vnode reference from this file entry 35837731Smckusick * before VOP_CLOSE, so that only other references 35937731Smckusick * will prevent close. 36011162Ssam */ 36137731Smckusick fp->f_data = (caddr_t) 0; 36237731Smckusick error = VOP_CLOSE(vp, fp->f_flag, u.u_cred); 36337731Smckusick vrele(vp); 36437731Smckusick return (error); 36537731Smckusick } 36637731Smckusick 36737731Smckusick /* 36837731Smckusick * Place an advisory lock on a vnode. 36937731Smckusick * !! THIS IMPLIES THAT ALL STATEFUL FILE SERVERS WILL USE file table entries 37037731Smckusick */ 37137731Smckusick vn_lock(fp, cmd) 37237731Smckusick register struct file *fp; 37337731Smckusick int cmd; 37437731Smckusick { 37537731Smckusick register int priority = PLOCK; 37637731Smckusick register struct vnode *vp = (struct vnode *)fp->f_data; 37740707Skarels int error = 0; 37840707Skarels static char lockstr[] = "flock"; 37937731Smckusick 38037731Smckusick if ((cmd & LOCK_EX) == 0) 38137731Smckusick priority += 4; 38240707Skarels priority |= PCATCH; 38340707Skarels 38411162Ssam /* 38537731Smckusick * If there's a exclusive lock currently applied 38637731Smckusick * to the file, then we've gotta wait for the 38737731Smckusick * lock with everyone else. 38811162Ssam */ 38937731Smckusick again: 39037731Smckusick while (vp->v_flag & VEXLOCK) { 39137731Smckusick /* 39237731Smckusick * If we're holding an exclusive 39337731Smckusick * lock, then release it. 39437731Smckusick */ 39537731Smckusick if (fp->f_flag & FEXLOCK) { 39637731Smckusick vn_unlock(fp, FEXLOCK); 39737731Smckusick continue; 39837731Smckusick } 39937731Smckusick if (cmd & LOCK_NB) 40037731Smckusick return (EWOULDBLOCK); 40137731Smckusick vp->v_flag |= VLWAIT; 40240707Skarels if (error = tsleep((caddr_t)&vp->v_exlockc, priority, 40340707Skarels lockstr, 0)) 40440707Skarels return (error); 40518Sbill } 406*45060Smckusick if (error == 0 && (cmd & LOCK_EX) && (vp->v_flag & VSHLOCK)) { 40737731Smckusick /* 40837731Smckusick * Must wait for any shared locks to finish 40937731Smckusick * before we try to apply a exclusive lock. 41037731Smckusick * 41137731Smckusick * If we're holding a shared 41237731Smckusick * lock, then release it. 41337731Smckusick */ 41437731Smckusick if (fp->f_flag & FSHLOCK) { 41537731Smckusick vn_unlock(fp, FSHLOCK); 41637731Smckusick goto again; 41737731Smckusick } 41837731Smckusick if (cmd & LOCK_NB) 41937731Smckusick return (EWOULDBLOCK); 42037731Smckusick vp->v_flag |= VLWAIT; 42140707Skarels if (error = tsleep((caddr_t)&vp->v_shlockc, PLOCK | PCATCH, 422*45060Smckusick lockstr, 0)) 42340707Skarels return (error); 42437731Smckusick } 42537731Smckusick if (fp->f_flag & FEXLOCK) 42637731Smckusick panic("vn_lock"); 42737731Smckusick if (cmd & LOCK_EX) { 42837731Smckusick cmd &= ~LOCK_SH; 42937731Smckusick vp->v_exlockc++; 43037731Smckusick vp->v_flag |= VEXLOCK; 43137731Smckusick fp->f_flag |= FEXLOCK; 43237731Smckusick } 43337731Smckusick if ((cmd & LOCK_SH) && (fp->f_flag & FSHLOCK) == 0) { 43437731Smckusick vp->v_shlockc++; 43537731Smckusick vp->v_flag |= VSHLOCK; 43637731Smckusick fp->f_flag |= FSHLOCK; 43737731Smckusick } 43837731Smckusick return (0); 43918Sbill } 44018Sbill 44118Sbill /* 44237731Smckusick * Unlock a file. 44318Sbill */ 44437731Smckusick vn_unlock(fp, kind) 44537731Smckusick register struct file *fp; 44637731Smckusick int kind; 44718Sbill { 44837731Smckusick register struct vnode *vp = (struct vnode *)fp->f_data; 44937731Smckusick int flags; 45018Sbill 45137731Smckusick kind &= fp->f_flag; 45237731Smckusick if (vp == NULL || kind == 0) 45337731Smckusick return; 45437731Smckusick flags = vp->v_flag; 45537731Smckusick if (kind & FSHLOCK) { 45637731Smckusick if ((flags & VSHLOCK) == 0) 45737731Smckusick panic("vn_unlock: SHLOCK"); 45837731Smckusick if (--vp->v_shlockc == 0) { 45937731Smckusick vp->v_flag &= ~VSHLOCK; 46037731Smckusick if (flags & VLWAIT) 46137731Smckusick wakeup((caddr_t)&vp->v_shlockc); 46237731Smckusick } 46337731Smckusick fp->f_flag &= ~FSHLOCK; 46437552Smckusick } 46537731Smckusick if (kind & FEXLOCK) { 46637731Smckusick if ((flags & VEXLOCK) == 0) 46737731Smckusick panic("vn_unlock: EXLOCK"); 46837731Smckusick if (--vp->v_exlockc == 0) { 46937731Smckusick vp->v_flag &= ~(VEXLOCK|VLWAIT); 47037731Smckusick if (flags & VLWAIT) 47137731Smckusick wakeup((caddr_t)&vp->v_exlockc); 47237731Smckusick } 47337731Smckusick fp->f_flag &= ~FEXLOCK; 47437731Smckusick } 47518Sbill } 47618Sbill 47718Sbill /* 47837731Smckusick * vn_fhtovp() - convert a fh to a vnode ptr (optionally locked) 47937731Smckusick * - look up fsid in mount list (if not found ret error) 48037731Smckusick * - get vp by calling VFS_FHTOVP() macro 48137731Smckusick * - if lockflag lock it with VOP_LOCK() 48218Sbill */ 48337731Smckusick vn_fhtovp(fhp, lockflag, vpp) 48437731Smckusick fhandle_t *fhp; 48537731Smckusick int lockflag; 48637731Smckusick struct vnode **vpp; 48718Sbill { 48837731Smckusick register struct mount *mp; 48918Sbill 49037731Smckusick if ((mp = getvfs(&fhp->fh_fsid)) == NULL) 49137731Smckusick return (ESTALE); 49238146Smckusick if (VFS_FHTOVP(mp, &fhp->fh_fid, vpp)) 49338146Smckusick return (ESTALE); 49438146Smckusick if (!lockflag) 49538146Smckusick VOP_UNLOCK(*vpp); 49637731Smckusick return (0); 49737731Smckusick } 49837731Smckusick 49937731Smckusick /* 50037731Smckusick * Noop 50137731Smckusick */ 50237731Smckusick vfs_noop() 50337731Smckusick { 50437731Smckusick 50537731Smckusick return (ENXIO); 50637731Smckusick } 50737731Smckusick 50837731Smckusick /* 50937731Smckusick * Null op 51037731Smckusick */ 51137731Smckusick vfs_nullop() 51237731Smckusick { 51337731Smckusick 51437731Smckusick return (0); 51537731Smckusick } 516