xref: /csrg-svn/sys/dev/vn.c (revision 52761)
141480Smckusick /*
241480Smckusick  * Copyright (c) 1988 University of Utah.
341480Smckusick  * Copyright (c) 1990 The Regents of the University of California.
441480Smckusick  * All rights reserved.
541480Smckusick  *
641480Smckusick  * This code is derived from software contributed to Berkeley by
741480Smckusick  * the Systems Programming Group of the University of Utah Computer
841480Smckusick  * Science Department.
941480Smckusick  *
1041480Smckusick  * %sccs.include.redist.c%
1141480Smckusick  *
1249299Shibler  * from: Utah $Hdr: vn.c 1.1 91/04/30$
1341480Smckusick  *
14*52761Shibler  *	@(#)vn.c	7.8 (Berkeley) 02/29/92
1541480Smckusick  */
1641480Smckusick 
1741480Smckusick /*
1849299Shibler  * Vnode disk driver.
1941480Smckusick  *
2049299Shibler  * Block/character interface to a vnode.  Allows one to treat a file
2149299Shibler  * as a disk (e.g. build a filesystem in it, mount it, etc.).
2241480Smckusick  *
2349299Shibler  * NOTE 1: This uses the VOP_BMAP/VOP_STRATEGY interface to the vnode
2449299Shibler  * instead of a simple VOP_RDWR.  We do this to avoid distorting the
2549299Shibler  * local buffer cache.
2649299Shibler  *
2749299Shibler  * NOTE 2: There is a security issue involved with this driver.
2841480Smckusick  * Once mounted all access to the contents of the "mapped" file via
2941480Smckusick  * the special file is controlled by the permissions on the special
3041480Smckusick  * file, the protection of the mapped file is ignored (effectively,
3141480Smckusick  * by using root credentials in all transactions).
3241480Smckusick  */
3349299Shibler #include "vn.h"
3449299Shibler #if NVN > 0
3541480Smckusick 
3645788Sbostic #include "sys/param.h"
3745788Sbostic #include "sys/systm.h"
3849299Shibler #include "sys/namei.h"
3949299Shibler #include "sys/proc.h"
4045788Sbostic #include "sys/errno.h"
4145788Sbostic #include "sys/dkstat.h"
4249299Shibler #include "sys/buf.h"
4349299Shibler #include "sys/malloc.h"
4445788Sbostic #include "sys/ioctl.h"
4549299Shibler #include "sys/mount.h"
4645788Sbostic #include "sys/vnode.h"
4749299Shibler #include "sys/specdev.h"
4845788Sbostic #include "sys/file.h"
4945788Sbostic #include "sys/uio.h"
5041480Smckusick 
5149299Shibler #include "vnioctl.h"
5241480Smckusick 
#ifdef DEBUG
/*
 * Debug tracing.  Each bit set in vndebug turns on one group of the
 * printf() calls scattered through the driver.
 */
int vndebug = 0x00;
#define VDB_FOLLOW	0x01	/* announce entry into driver routines */
#define VDB_INIT	0x02	/* report the result of VNIOCSET/VNIOCCLR */
#define VDB_IO		0x04	/* trace the individual transfer pieces */
#endif
5941480Smckusick 
6049299Shibler struct	buf vnbuf[NVN];
6149299Shibler struct	buf vntab[NVN];
6241480Smckusick 
6341480Smckusick #define b_cylin	b_resid
6441480Smckusick 
6549299Shibler #define	vnunit(x)	((minor(x) >> 3) & 0x7)	/* for consistency */
6641480Smckusick 
/*
 * Allocate / release the buf header that describes one piece of a split
 * request.  The allocation is made from M_DEVBUF with M_WAITOK.
 */
#define getvnbuf() \
	((struct buf *)malloc(sizeof(struct buf), M_DEVBUF, M_WAITOK))
#define putvnbuf(bp) \
	free((caddr_t)(bp), M_DEVBUF)
7141480Smckusick 
7249299Shibler struct vn_softc {
7341480Smckusick 	int		 sc_flags;	/* flags */
7449299Shibler 	size_t		 sc_size;	/* size of vn */
7541480Smckusick 	struct vnode	*sc_vp;		/* vnode */
7641480Smckusick 	struct ucred	*sc_cred;	/* credentials */
7741480Smckusick 	int		 sc_maxactive;	/* max # of active requests */
7849299Shibler } vn_softc[NVN];
7941480Smckusick 
/*
 * Bits kept in vn_softc.sc_flags.
 */
#define VNF_ALIVE	0x01	/* not referenced by the code in this file */
#define VNF_INITED	0x02	/* unit has a backing file (set by VNIOCSET) */
8341480Smckusick 
8449299Shibler int
8549299Shibler vnopen(dev, flags, mode, p)
8641480Smckusick 	dev_t dev;
8749299Shibler 	int flags, mode;
8849299Shibler 	struct proc *p;
8941480Smckusick {
9049299Shibler 	int unit = vnunit(dev);
9141480Smckusick 
9241480Smckusick #ifdef DEBUG
9349299Shibler 	if (vndebug & VDB_FOLLOW)
9449299Shibler 		printf("vnopen(%x, %x, %x, %x)\n", dev, flags, mode, p);
9541480Smckusick #endif
9649299Shibler 	if (unit >= NVN)
9741480Smckusick 		return(ENXIO);
9841480Smckusick 	return(0);
9941480Smckusick }
10041480Smckusick 
10141480Smckusick /*
10241480Smckusick  * Break the request into bsize pieces and submit using VOP_BMAP/VOP_STRATEGY.
10341480Smckusick  * Note that this driver can only be used for swapping over NFS on the hp
10441480Smckusick  * since nfs_strategy on the vax cannot handle u-areas and page tables.
10541480Smckusick  */
10649299Shibler vnstrategy(bp)
10741480Smckusick 	register struct buf *bp;
10841480Smckusick {
10949299Shibler 	int unit = vnunit(bp->b_dev);
11049299Shibler 	register struct vn_softc *vn = &vn_softc[unit];
11141480Smckusick 	register struct buf *nbp;
11241480Smckusick 	register int bn, bsize, resid;
11341480Smckusick 	register caddr_t addr;
11441480Smckusick 	int sz, flags;
11549299Shibler 	extern int vniodone();
11641480Smckusick 
11741480Smckusick #ifdef DEBUG
11849299Shibler 	if (vndebug & VDB_FOLLOW)
11949299Shibler 		printf("vnstrategy(%x): unit %d\n", bp, unit);
12041480Smckusick #endif
12149299Shibler 	if ((vn->sc_flags & VNF_INITED) == 0) {
12241480Smckusick 		bp->b_error = ENXIO;
12341480Smckusick 		bp->b_flags |= B_ERROR;
12449299Shibler 		biodone(bp);
12541480Smckusick 		return;
12641480Smckusick 	}
12741480Smckusick 	bn = bp->b_blkno;
12841480Smckusick 	sz = howmany(bp->b_bcount, DEV_BSIZE);
12941480Smckusick 	bp->b_resid = bp->b_bcount;
13049299Shibler 	if (bn < 0 || bn + sz > vn->sc_size) {
13149299Shibler 		if (bn != vn->sc_size) {
13241480Smckusick 			bp->b_error = EINVAL;
13341480Smckusick 			bp->b_flags |= B_ERROR;
13441480Smckusick 		}
13549299Shibler 		biodone(bp);
13641480Smckusick 		return;
13741480Smckusick 	}
13841480Smckusick 	bn = dbtob(bn);
13951945Smckusick 	bsize = vn->sc_vp->v_mount->mnt_stat.f_iosize;
14041480Smckusick 	addr = bp->b_un.b_addr;
14141480Smckusick 	flags = bp->b_flags | B_CALL;
14241480Smckusick 	for (resid = bp->b_resid; resid; resid -= sz) {
14341480Smckusick 		struct vnode *vp;
14441480Smckusick 		daddr_t nbn;
14541480Smckusick 		int off, s;
14641480Smckusick 
14749299Shibler 		nbp = getvnbuf();
14841480Smckusick 		off = bn % bsize;
14941480Smckusick 		sz = MIN(bsize - off, resid);
15049299Shibler 		(void) VOP_BMAP(vn->sc_vp, bn / bsize, &vp, &nbn);
15141480Smckusick #ifdef DEBUG
15249299Shibler 		if (vndebug & VDB_IO)
15349299Shibler 			printf("vnstrategy: vp %x/%x bn %x/%x\n",
15449299Shibler 			       vn->sc_vp, vp, bn, nbn);
15541480Smckusick #endif
15641480Smckusick 		nbp->b_flags = flags;
15741480Smckusick 		nbp->b_bcount = sz;
15841480Smckusick 		nbp->b_bufsize = bp->b_bufsize;
15941480Smckusick 		nbp->b_error = 0;
16049299Shibler 		if (vp->v_type == VBLK || vp->v_type == VCHR)
16149299Shibler 			nbp->b_dev = vp->v_rdev;
16249299Shibler 		else
16349299Shibler 			nbp->b_dev = NODEV;
16441480Smckusick 		nbp->b_un.b_addr = addr;
16541480Smckusick 		nbp->b_blkno = nbn + btodb(off);
16641480Smckusick 		nbp->b_proc = bp->b_proc;
16749299Shibler 		nbp->b_iodone = vniodone;
16841480Smckusick 		nbp->b_vp = vp;
16941480Smckusick 		nbp->b_pfcent = (int) bp;	/* XXX */
17041480Smckusick 		/*
17141480Smckusick 		 * Just sort by block number
17241480Smckusick 		 */
17341480Smckusick 		nbp->b_cylin = nbp->b_blkno;
17441480Smckusick 		s = splbio();
17549299Shibler 		disksort(&vntab[unit], nbp);
17649299Shibler 		if (vntab[unit].b_active < vn->sc_maxactive) {
17749299Shibler 			vntab[unit].b_active++;
17849299Shibler 			vnstart(unit);
17941480Smckusick 		}
18041480Smckusick 		splx(s);
18141480Smckusick 		bn += sz;
18241480Smckusick 		addr += sz;
18341480Smckusick 	}
18441480Smckusick }
18541480Smckusick 
18641480Smckusick /*
18741480Smckusick  * Feed requests sequentially.
18841480Smckusick  * We do it this way to keep from flooding NFS servers if we are connected
18941480Smckusick  * to an NFS file.  This places the burden on the client rather than the
19041480Smckusick  * server.
19141480Smckusick  */
19249299Shibler vnstart(unit)
19341480Smckusick {
19449299Shibler 	register struct vn_softc *vn = &vn_softc[unit];
19541480Smckusick 	register struct buf *bp;
19641480Smckusick 
19741480Smckusick 	/*
19841480Smckusick 	 * Dequeue now since lower level strategy routine might
19941480Smckusick 	 * queue using same links
20041480Smckusick 	 */
20149299Shibler 	bp = vntab[unit].b_actf;
20249299Shibler 	vntab[unit].b_actf = bp->b_actf;
20341480Smckusick #ifdef DEBUG
20449299Shibler 	if (vndebug & VDB_IO)
20549299Shibler 		printf("vnstart(%d): bp %x vp %x blkno %x addr %x cnt %x\n",
20641480Smckusick 		       unit, bp, bp->b_vp, bp->b_blkno, bp->b_un.b_addr,
20741480Smckusick 		       bp->b_bcount);
20841480Smckusick #endif
20941480Smckusick 	VOP_STRATEGY(bp);
21041480Smckusick }
21141480Smckusick 
21249299Shibler vniodone(bp)
21341480Smckusick 	register struct buf *bp;
21441480Smckusick {
21541480Smckusick 	register struct buf *pbp = (struct buf *)bp->b_pfcent;	/* XXX */
21649299Shibler 	register int unit = vnunit(pbp->b_dev);
21741480Smckusick 	int s;
21841480Smckusick 
21941480Smckusick 	s = splbio();
22041480Smckusick #ifdef DEBUG
22149299Shibler 	if (vndebug & VDB_IO)
22249299Shibler 		printf("vniodone(%d): bp %x vp %x blkno %x addr %x cnt %x\n",
22341480Smckusick 		       unit, bp, bp->b_vp, bp->b_blkno, bp->b_un.b_addr,
22441480Smckusick 		       bp->b_bcount);
22541480Smckusick #endif
22641480Smckusick 	if (bp->b_error) {
22741480Smckusick #ifdef DEBUG
22849299Shibler 		if (vndebug & VDB_IO)
22949299Shibler 			printf("vniodone: bp %x error %d\n", bp, bp->b_error);
23041480Smckusick #endif
23141480Smckusick 		pbp->b_flags |= B_ERROR;
23249299Shibler 		pbp->b_error = biowait(bp);
23341480Smckusick 	}
23441480Smckusick 	pbp->b_resid -= bp->b_bcount;
23549299Shibler 	putvnbuf(bp);
23641480Smckusick 	if (pbp->b_resid == 0) {
23741480Smckusick #ifdef DEBUG
23849299Shibler 		if (vndebug & VDB_IO)
23949299Shibler 			printf("vniodone: pbp %x iodone\n", pbp);
24041480Smckusick #endif
24149299Shibler 		biodone(pbp);
24241480Smckusick 	}
24349299Shibler 	if (vntab[unit].b_actf)
24449299Shibler 		vnstart(unit);
24541480Smckusick 	else
24649299Shibler 		vntab[unit].b_active--;
24741480Smckusick 	splx(s);
24841480Smckusick }
24941480Smckusick 
25049299Shibler vnread(dev, uio, flags, p)
25141480Smckusick 	dev_t dev;
25241480Smckusick 	struct uio *uio;
25349299Shibler 	int flags;
25449299Shibler 	struct proc *p;
25541480Smckusick {
25649299Shibler 	register int unit = vnunit(dev);
25741480Smckusick 
25841480Smckusick #ifdef DEBUG
25949299Shibler 	if (vndebug & VDB_FOLLOW)
26049299Shibler 		printf("vnread(%x, %x, %x, %x)\n", dev, uio, flags, p);
26141480Smckusick #endif
26249299Shibler 	return(physio(vnstrategy, &vnbuf[unit], dev, B_READ, minphys, uio));
26341480Smckusick }
26441480Smckusick 
26549299Shibler vnwrite(dev, uio, flags, p)
26641480Smckusick 	dev_t dev;
26741480Smckusick 	struct uio *uio;
26849299Shibler 	int flags;
26949299Shibler 	struct proc *p;
27041480Smckusick {
27149299Shibler 	register int unit = vnunit(dev);
27241480Smckusick 
27341480Smckusick #ifdef DEBUG
27449299Shibler 	if (vndebug & VDB_FOLLOW)
27549299Shibler 		printf("vnwrite(%x, %x, %x, %x)\n", dev, uio, flags, p);
27641480Smckusick #endif
27749299Shibler 	return(physio(vnstrategy, &vnbuf[unit], dev, B_WRITE, minphys, uio));
27841480Smckusick }
27941480Smckusick 
28041480Smckusick /* ARGSUSED */
28149299Shibler vnioctl(dev, cmd, data, flag, p)
28241480Smckusick 	dev_t dev;
28341480Smckusick 	u_long cmd;
28441480Smckusick 	caddr_t data;
28541480Smckusick 	int flag;
28649299Shibler 	struct proc *p;
28741480Smckusick {
28849299Shibler 	int unit = vnunit(dev);
28949299Shibler 	register struct vn_softc *vn;
29049299Shibler 	struct vn_ioctl *vio;
29141480Smckusick 	struct vattr vattr;
29249299Shibler 	struct nameidata nd;
29341480Smckusick 	int error;
29441480Smckusick 
29541480Smckusick #ifdef DEBUG
29649299Shibler 	if (vndebug & VDB_FOLLOW)
29749299Shibler 		printf("vnioctl(%x, %x, %x, %x, %x): unit %d\n",
29849299Shibler 		       dev, cmd, data, flag, p, unit);
29941480Smckusick #endif
30049299Shibler 	error = suser(p->p_ucred, &p->p_acflag);
30141480Smckusick 	if (error)
30241480Smckusick 		return (error);
30349299Shibler 	if (unit >= NVN)
30441480Smckusick 		return (ENXIO);
30541480Smckusick 
30649299Shibler 	vn = &vn_softc[unit];
30749299Shibler 	vio = (struct vn_ioctl *)data;
30841480Smckusick 	switch (cmd) {
30941480Smckusick 
31049299Shibler 	case VNIOCSET:
31149299Shibler 		if (vn->sc_flags & VNF_INITED)
31241480Smckusick 			return(EBUSY);
31341480Smckusick 		/*
31441480Smckusick 		 * Always open for read and write.
31541480Smckusick 		 * This is probably bogus, but it lets vn_open()
31641480Smckusick 		 * weed out directories, sockets, etc. so we don't
31741480Smckusick 		 * have to worry about them.
31841480Smckusick 		 */
319*52761Shibler 		NDINIT(&nd, LOOKUP, FOLLOW, UIO_USERSPACE, vio->vn_file, p);
320*52761Shibler 		if (error = vn_open(&nd, FREAD|FWRITE, 0))
32141480Smckusick 			return(error);
32250115Smckusick 		if (error = VOP_GETATTR(nd.ni_vp, &vattr, p->p_ucred, p)) {
32350115Smckusick 			VOP_UNLOCK(nd.ni_vp);
32450115Smckusick 			(void) vn_close(nd.ni_vp, FREAD|FWRITE, p->p_ucred, p);
32541480Smckusick 			return(error);
32641480Smckusick 		}
32750115Smckusick 		VOP_UNLOCK(nd.ni_vp);
32849299Shibler 		vn->sc_vp = nd.ni_vp;
32949299Shibler 		vn->sc_size = btodb(vattr.va_size);	/* note truncation */
33050115Smckusick 		if (error = vnsetcred(vn, p->p_ucred)) {
33150115Smckusick 			(void) vn_close(vn->sc_vp, FREAD|FWRITE, p->p_ucred, p);
33241480Smckusick 			return(error);
33341480Smckusick 		}
33449299Shibler 		vnthrottle(vn, vn->sc_vp);
33549299Shibler 		vio->vn_size = dbtob(vn->sc_size);
33649299Shibler 		vn->sc_flags |= VNF_INITED;
33741480Smckusick #ifdef DEBUG
33849299Shibler 		if (vndebug & VDB_INIT)
33949299Shibler 			printf("vnioctl: SET vp %x size %x\n",
34049299Shibler 			       vn->sc_vp, vn->sc_size);
34141480Smckusick #endif
34241480Smckusick 		break;
34341480Smckusick 
34449299Shibler 	case VNIOCCLR:
34549299Shibler 		if ((vn->sc_flags & VNF_INITED) == 0)
34641480Smckusick 			return(ENXIO);
34749299Shibler 		vnclear(vn);
34841480Smckusick #ifdef DEBUG
34949299Shibler 		if (vndebug & VDB_INIT)
35049299Shibler 			printf("vnioctl: CLRed\n");
35141480Smckusick #endif
35241480Smckusick 		break;
35341480Smckusick 
35441480Smckusick 	default:
35541480Smckusick 		return(ENXIO);
35641480Smckusick 	}
35741480Smckusick 	return(0);
35841480Smckusick }
35941480Smckusick 
36041480Smckusick /*
36141480Smckusick  * Duplicate the current processes' credentials.  Since we are called only
36241480Smckusick  * as the result of a SET ioctl and only root can do that, any future access
36341480Smckusick  * to this "disk" is essentially as root.  Note that credentials may change
36441480Smckusick  * if some other uid can write directly to the mapped file (NFS).
36541480Smckusick  */
36649299Shibler vnsetcred(vn, cred)
36749299Shibler 	register struct vn_softc *vn;
36849299Shibler 	struct ucred cred;
36941480Smckusick {
37041480Smckusick 	struct uio auio;
37141480Smckusick 	struct iovec aiov;
37241480Smckusick 	char tmpbuf[DEV_BSIZE];
37341480Smckusick 
37449299Shibler 	vn->sc_cred = crdup(cred);
37541480Smckusick 	/* XXX: Horrible kludge to establish credentials for NFS */
37641480Smckusick 	aiov.iov_base = tmpbuf;
37749299Shibler 	aiov.iov_len = MIN(DEV_BSIZE, dbtob(vn->sc_size));
37841480Smckusick 	auio.uio_iov = &aiov;
37941480Smckusick 	auio.uio_iovcnt = 1;
38041480Smckusick 	auio.uio_offset = 0;
38141480Smckusick 	auio.uio_rw = UIO_READ;
38241480Smckusick 	auio.uio_segflg = UIO_SYSSPACE;
38341480Smckusick 	auio.uio_resid = aiov.iov_len;
38449299Shibler 	return(VOP_READ(vn->sc_vp, &auio, 0, vn->sc_cred));
38541480Smckusick }
38641480Smckusick 
38741480Smckusick /*
38841480Smckusick  * Set maxactive based on FS type
38941480Smckusick  */
39049299Shibler vnthrottle(vn, vp)
39149299Shibler 	register struct vn_softc *vn;
39241480Smckusick 	struct vnode *vp;
39341480Smckusick {
39449299Shibler 	extern struct vnodeops ufs_vnodeops, nfsv2_vnodeops;
39541480Smckusick 
39649299Shibler 	if (vp->v_op == &nfsv2_vnodeops)
39749299Shibler 		vn->sc_maxactive = 2;
39841480Smckusick 	else
39949299Shibler 		vn->sc_maxactive = 8;
40041480Smckusick 
40149299Shibler 	if (vn->sc_maxactive < 1)
40249299Shibler 		vn->sc_maxactive = 1;
40341480Smckusick }
40441480Smckusick 
40549299Shibler vnshutdown()
40641480Smckusick {
40749299Shibler 	register struct vn_softc *vn;
40841480Smckusick 
40949299Shibler 	for (vn = &vn_softc[0]; vn < &vn_softc[NVN]; vn++)
41049299Shibler 		if (vn->sc_flags & VNF_INITED)
41149299Shibler 			vnclear(vn);
41241480Smckusick }
41341480Smckusick 
41449299Shibler vnclear(vn)
41549299Shibler 	register struct vn_softc *vn;
41641480Smckusick {
41749299Shibler 	register struct vnode *vp = vn->sc_vp;
41850115Smckusick 	struct proc *p = curproc;		/* XXX */
41941480Smckusick 
42041480Smckusick #ifdef DEBUG
42149299Shibler 	if (vndebug & VDB_FOLLOW)
42249299Shibler 		printf("vnclear(%x): vp %x\n", vp);
42341480Smckusick #endif
42449299Shibler 	vn->sc_flags &= ~VNF_INITED;
42541480Smckusick 	if (vp == (struct vnode *)0)
42649299Shibler 		panic("vnioctl: null vp");
42741480Smckusick #if 0
42841480Smckusick 	/* XXX - this doesn't work right now */
42949299Shibler 	(void) VOP_FSYNC(vp, 0, vn->sc_cred, MNT_WAIT, p);
43041480Smckusick #endif
43150115Smckusick 	(void) vn_close(vp, FREAD|FWRITE, vn->sc_cred, p);
43249299Shibler 	crfree(vn->sc_cred);
43349299Shibler 	vn->sc_vp = (struct vnode *)0;
43449299Shibler 	vn->sc_cred = (struct ucred *)0;
43549299Shibler 	vn->sc_size = 0;
43641480Smckusick }
43741480Smckusick 
43849299Shibler vnsize(dev)
43941480Smckusick 	dev_t dev;
44041480Smckusick {
44149299Shibler 	int unit = vnunit(dev);
44249299Shibler 	register struct vn_softc *vn = &vn_softc[unit];
44341480Smckusick 
44449299Shibler 	if (unit >= NVN || (vn->sc_flags & VNF_INITED) == 0)
44541480Smckusick 		return(-1);
44649299Shibler 	return(vn->sc_size);
44741480Smckusick }
44841480Smckusick 
44949299Shibler vndump(dev)
45041480Smckusick {
45141480Smckusick 	return(ENXIO);
45241480Smckusick }
45341480Smckusick #endif
454