xref: /csrg-svn/sys/kern/vfs_lookup.c (revision 38001)
123401Smckusick /*
237715Smckusick  * Copyright (c) 1982, 1986, 1989 Regents of the University of California.
337715Smckusick  * All rights reserved.
423401Smckusick  *
537715Smckusick  * Redistribution and use in source and binary forms are permitted
637715Smckusick  * provided that the above copyright notice and this paragraph are
737715Smckusick  * duplicated in all such forms and that any documentation,
837715Smckusick  * advertising materials, and other materials related to such
937715Smckusick  * distribution and use acknowledge that the software was developed
1037715Smckusick  * by the University of California, Berkeley.  The name of the
1137715Smckusick  * University may not be used to endorse or promote products derived
1237715Smckusick  * from this software without specific prior written permission.
1337715Smckusick  * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR
1437715Smckusick  * IMPLIED WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED
1537715Smckusick  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
1637715Smckusick  *
17*38001Smckusick  *	@(#)vfs_lookup.c	7.10 (Berkeley) 05/13/89
1823401Smckusick  */
1930Sbill 
2017100Sbloom #include "param.h"
2137715Smckusick #include "time.h"
2237715Smckusick #include "namei.h"
2337715Smckusick #include "vnode.h"
2417100Sbloom #include "mount.h"
2537715Smckusick #include "errno.h"
2631650Smckusick #include "malloc.h"
2737715Smckusick 
2837582Smarc #ifdef KTRACE
2937715Smckusick #include "user.h"
3037582Smarc #include "proc.h"
3137582Smarc #include "ktrace.h"
3237582Smarc #endif
3330Sbill 
3430Sbill /*
3527268Smckusick  * Convert a pathname into a pointer to a locked inode.
367534Sroot  * This is a very central and rather complicated routine.
3730Sbill  *
3837715Smckusick  * The flag argument is LOOKUP, CREATE, RENAME, or DELETE depending on
3937715Smckusick  * whether the name is to be looked up, created, renamed, or deleted.
4037715Smckusick  * When CREATE, RENAME, or DELETE is specified, information usable in
4137715Smckusick  * creating, renaming, or deleting a directory entry may be calculated.
4237715Smckusick  * If flag has LOCKPARENT or'ed into it and the target of the pathname
4337715Smckusick  * exists, namei returns both the target and its parent directory locked.
4437715Smckusick  * When creating or renaming and LOCKPARENT is specified, the target may not
4537715Smckusick  * be ".".  When deleting and LOCKPARENT is specified, the target may be ".".
469166Ssam  *
4716688Smckusick  * The FOLLOW flag is set when symbolic links are to be followed
489166Ssam  * when they occur at the end of the name translation process.
4927268Smckusick  * Symbolic links are always followed for all other pathname
5027268Smckusick  * components other than the last.
519166Ssam  *
5227268Smckusick  * The segflg defines whether the name is to be copied from user
5327268Smckusick  * space or kernel space.
5427268Smckusick  *
5515798Smckusick  * Overall outline of namei:
5615798Smckusick  *
577534Sroot  *	copy in name
587534Sroot  *	get starting directory
597534Sroot  * dirloop:
6016688Smckusick  *	copy next component of name to ndp->ni_dent
617534Sroot  *	handle degenerate case where name is null string
6237715Smckusick  *	if .. and on mounted filesys, find parent
6337715Smckusick  *	call lookup routine for next component name
6437715Smckusick  *	  directory vnode returned in ni_dvp, unlocked unless LOCKPARENT set
6537715Smckusick  *	  component vnode returned in ni_vp (if it exists), locked.
667534Sroot  *	if symbolic link, massage name in buffer and continue at dirloop
6737715Smckusick  *	if result inode is mounted on, find mounted on vnode
687534Sroot  *	if more components of name, do next level at dirloop
6937715Smckusick  *	return the answer in ni_vp as locked vnode;
7037715Smckusick  *	  if LOCKPARENT set, return locked parent in ni_dvp
719166Ssam  *
7237715Smckusick  * NOTE: (LOOKUP | LOCKPARENT) currently returns the parent vnode unlocked.
7330Sbill  */
7416688Smckusick namei(ndp)
7516688Smckusick 	register struct nameidata *ndp;
7630Sbill {
777534Sroot 	register char *cp;		/* pointer into pathname argument */
7837715Smckusick 	register struct vnode *dp = 0;	/* the directory we are searching */
7937715Smckusick 	register int i;		   	/* Temp counter */
8037715Smckusick 	struct vnode *tdp;		/* saved dp */
8137715Smckusick 	struct mount *mp;		/* mount table entry */
8218109Smckusick 	int docache;			/* == 0 do not cache last component */
8337715Smckusick 	int flag;			/* LOOKUP, CREATE, RENAME or DELETE */
8437715Smckusick 	int wantparent;			/* 1 => wantparent or lockparent flag */
85*38001Smckusick 	int lockparent;			/* 1 => lockparent flag */
8637715Smckusick 	int error = 0;
8730Sbill 
8837715Smckusick 	flag = ndp->ni_nameiop & OPFLAG;
8937715Smckusick 	wantparent = ndp->ni_nameiop & (LOCKPARENT|WANTPARENT);
90*38001Smckusick 	lockparent = ndp->ni_nameiop & LOCKPARENT;
9116688Smckusick 	docache = (ndp->ni_nameiop & NOCACHE) ^ NOCACHE;
9237715Smckusick 	if (flag == DELETE || wantparent)
9315798Smckusick 		docache = 0;
9430Sbill 	/*
957534Sroot 	 * Get a buffer for the name to be translated, and copy the
967534Sroot 	 * name into the buffer.
975972Swnj 	 */
9837715Smckusick 	MALLOC(ndp->ni_pnbuf, caddr_t, MAXPATHLEN, M_NAMEI, M_WAITOK);
9916688Smckusick 	if (ndp->ni_segflg == UIO_SYSSPACE)
10037715Smckusick 		error = copystr(ndp->ni_dirp, ndp->ni_pnbuf, MAXPATHLEN,
10137715Smckusick 		    &ndp->ni_pathlen);
10216688Smckusick 	else
10337715Smckusick 		error = copyinstr(ndp->ni_dirp, ndp->ni_pnbuf, MAXPATHLEN,
10437715Smckusick 		    &ndp->ni_pathlen);
10516688Smckusick 	if (error) {
10637715Smckusick 		free(ndp->ni_pnbuf, M_NAMEI);
10737715Smckusick 		return (error);
1085972Swnj 	}
10937715Smckusick 	ndp->ni_ptr = ndp->ni_pnbuf;
11037715Smckusick 	ndp->ni_loopcnt = 0;
11137715Smckusick 	dp = ndp->ni_cdir;
11237715Smckusick 	dp->v_count++;
11337582Smarc #ifdef KTRACE
11437582Smarc 	if (KTRPOINT(u.u_procp, KTR_NAMEI))
11537715Smckusick 		ktrnamei(u.u_procp->p_tracep, ndp->ni_pnbuf);
11637582Smarc #endif
1177534Sroot 
11837715Smckusick start:
1195972Swnj 	/*
1207534Sroot 	 * Get starting directory.
12137715Smckusick 	 * Done at start of translation and after symbolic link.
12230Sbill 	 */
12337715Smckusick 	if (*ndp->ni_ptr == '/') {
12437715Smckusick 		vrele(dp);
12537715Smckusick 		while (*ndp->ni_ptr == '/') {
12637715Smckusick 			ndp->ni_ptr++;
12737715Smckusick 			ndp->ni_pathlen--;
12837715Smckusick 		}
12937715Smckusick 		if ((dp = ndp->ni_rdir) == NULL)
13030Sbill 			dp = rootdir;
13137715Smckusick 		dp->v_count++;
13237715Smckusick 	}
13337715Smckusick 	VOP_LOCK(dp);
13418027Smckusick 	ndp->ni_endoff = 0;
1357534Sroot 
1367534Sroot 	/*
1377534Sroot 	 * We come to dirloop to search a new directory.
1387534Sroot 	 */
1396571Smckusic dirloop:
14030Sbill 	/*
14116688Smckusick 	 * Copy next component of name to ndp->ni_dent.
14237715Smckusick 	 * XXX kern_exec looks at d_name
14337715Smckusick 	 * ??? The ni_hash value may be useful for vfs_cache
14437715Smckusick 	 * XXX There must be the last component of the filename left
14537715Smckusick 	 * somewhere accessible via. ndp for NFS (and any other stateless file
14637715Smckusick 	 * systems) in case they are doing a CREATE. The "Towards a..." noted
14737715Smckusick 	 * that ni_ptr would be left pointing to the last component, but since
14837715Smckusick 	 * the ni_pnbuf gets free'd, that is not a good idea.
1497534Sroot 	 */
15037743Smckusick #ifdef notdef
15137743Smckusick 	for (cp = ndp->ni_ptr; *cp != 0 && *cp != '/'; cp++) {
15237743Smckusick 		if ((*cp & 0200) == 0)
15337743Smckusick 			continue;
15437743Smckusick 		if ((*cp&0377) == ('/'|0200) || flag != DELETE) {
15537743Smckusick 			error = EINVAL;
15637743Smckusick 			goto bad;
15737743Smckusick 		}
15837743Smckusick 	}
15937743Smckusick 	ndp->ni_namelen = cp - ndp->ni_ptr;
16037743Smckusick 	if (ndp->ni_namelen >= MAXNAMLEN) {
16137743Smckusick 		error = ENAMETOOLONG;
16237743Smckusick 		goto bad;
16337743Smckusick 	}
16437743Smckusick 	ndp->ni_pathlen -= ndp->ni_namelen;
16537743Smckusick #ifdef NAMEI_DIAGNOSTIC
16637743Smckusick 	{ char c = *cp;
16737743Smckusick 	*cp = '\0';
16837743Smckusick 	printf("{%s}: ", ndp->ni_ptr);
16937743Smckusick 	*cp = c; }
17037743Smckusick #endif
17137743Smckusick #else fornow
17237715Smckusick 	ndp->ni_hash = 0;
17337715Smckusick 	for (cp = ndp->ni_ptr, i = 0; *cp != 0 && *cp != '/'; cp++) {
1746571Smckusic 		if (i >= MAXNAMLEN) {
17537715Smckusick 			error = ENAMETOOLONG;
1767534Sroot 			goto bad;
1775972Swnj 		}
17821014Smckusick 		if (*cp & 0200)
17921014Smckusick 			if ((*cp&0377) == ('/'|0200) || flag != DELETE) {
18037715Smckusick 				error = EINVAL;
18121014Smckusick 				goto bad;
18221014Smckusick 			}
18316688Smckusick 		ndp->ni_dent.d_name[i++] = *cp;
18437715Smckusick 		ndp->ni_hash += (unsigned char)*cp * i;
1855972Swnj 	}
18637715Smckusick 	ndp->ni_namelen = i;
18716688Smckusick 	ndp->ni_dent.d_namlen = i;
18816688Smckusick 	ndp->ni_dent.d_name[i] = '\0';
18937715Smckusick 	ndp->ni_pathlen -= i;
19037715Smckusick #ifdef NAMEI_DIAGNOSTIC
19137715Smckusick 	printf("{%s}: ", ndp->ni_dent.d_name);
19237715Smckusick #endif
19337743Smckusick #endif fornow
19437715Smckusick 	ndp->ni_next = cp;
19537715Smckusick 	ndp->ni_makeentry = 1;
19618109Smckusick 	if (*cp == '\0' && docache == 0)
19737715Smckusick 		ndp->ni_makeentry = 0;
19837715Smckusick 	ndp->ni_isdotdot = (ndp->ni_namelen == 2 &&
19937715Smckusick 		ndp->ni_dent.d_name[1] == '.' && ndp->ni_dent.d_name[0] == '.');
2007534Sroot 
2017534Sroot 	/*
2027534Sroot 	 * Check for degenerate name (e.g. / or "")
2037534Sroot 	 * which is a way of talking about a directory,
2047534Sroot 	 * e.g. like "/." or ".".
2057534Sroot 	 */
20637715Smckusick 	if (ndp->ni_ptr[0] == '\0') {
20737715Smckusick 		if (flag != LOOKUP || wantparent) {
20837715Smckusick 			error = EISDIR;
2097534Sroot 			goto bad;
2105972Swnj 		}
21137715Smckusick 		free(ndp->ni_pnbuf, M_NAMEI);
21237715Smckusick 		if (!(ndp->ni_nameiop & LOCKLEAF))
21337715Smckusick 			VOP_UNLOCK(dp);
21437715Smckusick 		ndp->ni_vp = dp;
21537715Smckusick 		return (0);
2165972Swnj 	}
2177534Sroot 
2186571Smckusic 	/*
21937715Smckusick 	 * Handle "..": two special cases.
22037715Smckusick 	 * 1. If at root directory (e.g. after chroot)
22137715Smckusick 	 *    then ignore it so can't get out.
22237715Smckusick 	 * 2. If this vnode is the root of a mounted
22337715Smckusick 	 *    file system, then replace it with the
22437715Smckusick 	 *    vnode which was mounted on so we take the
22537715Smckusick 	 *    .. in the other file system.
22636547Smckusick 	 */
22737715Smckusick 	if (ndp->ni_isdotdot) {
22836547Smckusick 		for (;;) {
22937715Smckusick 			if (dp == ndp->ni_rdir || dp == rootdir) {
23037715Smckusick 				ndp->ni_dvp = dp;
23137715Smckusick 				dp->v_count++;
23237715Smckusick 				goto nextname;
23336547Smckusick 			}
23437715Smckusick 			if ((dp->v_flag & VROOT) == 0)
23536547Smckusick 				break;
23637715Smckusick 			tdp = dp;
23737715Smckusick 			dp = dp->v_mount->m_vnodecovered;
23837715Smckusick 			vput(tdp);
23937715Smckusick 			VOP_LOCK(dp);
24037715Smckusick 			dp->v_count++;
24136547Smckusick 		}
24236547Smckusick 	}
24336547Smckusick 
24436547Smckusick 	/*
24515798Smckusick 	 * We now have a segment name to search for, and a directory to search.
24615798Smckusick 	 */
24737715Smckusick 	if (error = VOP_LOOKUP(dp, ndp)) {
24837715Smckusick 		if (ndp->ni_vp != NULL)
24937715Smckusick 			panic("leaf should be empty");
25037582Smarc #ifdef NAMEI_DIAGNOSTIC
25137715Smckusick 		printf("not found\n");
25237582Smarc #endif
2535972Swnj 		/*
25437715Smckusick 		 * If creating and at end of pathname, then can consider
25537715Smckusick 		 * allowing file to be created.
2565972Swnj 		 */
25737715Smckusick 		if (ndp->ni_dvp->v_mount->m_flag & M_RDONLY)
25837715Smckusick 			error = EROFS;
25937742Smckusick 		if (flag == LOOKUP || flag == DELETE ||
26037742Smckusick 		    error != ENOENT || *cp != 0)
2617534Sroot 			goto bad;
2625972Swnj 		/*
26337715Smckusick 		 * We return with ni_vp NULL to indicate that the entry
26437715Smckusick 		 * doesn't currently exist, leaving a pointer to the
26537715Smckusick 		 * (possibly locked) directory inode in ndp->ni_dvp.
2665972Swnj 		 */
26737715Smckusick 		FREE(ndp->ni_pnbuf, M_NAMEI);
26837715Smckusick 		return (0);	/* should this be ENOENT? */
2697534Sroot 	}
27037582Smarc #ifdef NAMEI_DIAGNOSTIC
27137715Smckusick 	printf("found\n");
27237582Smarc #endif
2737534Sroot 
2747534Sroot 	/*
27537715Smckusick 	 * Check for symbolic link
2767534Sroot 	 */
27737715Smckusick 	dp = ndp->ni_vp;
27837715Smckusick 	if ((dp->v_type == VLNK) &&
27937715Smckusick 	    ((ndp->ni_nameiop & FOLLOW) || *ndp->ni_next == '/')) {
28037715Smckusick 		struct iovec aiov;
28137715Smckusick 		struct uio auio;
28237715Smckusick 		int linklen;
2837534Sroot 
28437715Smckusick 		if (++ndp->ni_loopcnt > MAXSYMLINKS) {
28537715Smckusick 			error = ELOOP;
28637715Smckusick 			goto bad2;
28737715Smckusick 		}
28837715Smckusick 		if (ndp->ni_pathlen == 1)
28937715Smckusick 			MALLOC(cp, char *, MAXPATHLEN, M_NAMEI, M_WAITOK);
2907534Sroot 		else
29137715Smckusick 			cp = ndp->ni_pnbuf;
29237715Smckusick 		aiov.iov_base = cp;
29337715Smckusick 		aiov.iov_len = MAXPATHLEN;
29437715Smckusick 		auio.uio_iov = &aiov;
29537715Smckusick 		auio.uio_iovcnt = 1;
29637715Smckusick 		auio.uio_offset = 0;
29737715Smckusick 		auio.uio_rw = UIO_READ;
29837715Smckusick 		auio.uio_segflg = UIO_SYSSPACE;
29937715Smckusick 		auio.uio_resid = MAXPATHLEN;
30037715Smckusick 		if (error = VOP_READLINK(dp, &auio, ndp->ni_cred)) {
30137715Smckusick 			if (ndp->ni_pathlen == 1)
30237715Smckusick 				free(cp, M_NAMEI);
30337715Smckusick 			goto bad2;
3049166Ssam 		}
30537715Smckusick 		linklen = MAXPATHLEN - auio.uio_resid;
30637715Smckusick 		if (linklen + ndp->ni_pathlen >= MAXPATHLEN) {
30737715Smckusick 			if (ndp->ni_pathlen == 1)
30837715Smckusick 				free(cp, M_NAMEI);
30937715Smckusick 			error = ENAMETOOLONG;
31012011Smckusick 			goto bad2;
31115798Smckusick 		}
31237715Smckusick 		if (ndp->ni_pathlen == 1) {
31337715Smckusick 			FREE(ndp->ni_pnbuf, M_NAMEI);
31437715Smckusick 			ndp->ni_pnbuf = cp;
315*38001Smckusick 			ndp->ni_pnbuf[linklen] = '\0';
31637715Smckusick 		} else
317*38001Smckusick 			bcopy(ndp->ni_next, cp + linklen, ndp->ni_pathlen);
31837715Smckusick 		ndp->ni_ptr = cp;
31937715Smckusick 		ndp->ni_pathlen += linklen;
32037715Smckusick 		vput(dp);
32137715Smckusick 		dp = ndp->ni_dvp;
322*38001Smckusick 		if (lockparent && *ndp->ni_next == '\0')
323*38001Smckusick 			VOP_UNLOCK(dp);
32437715Smckusick 		goto start;
32515798Smckusick 	}
32615798Smckusick 
3277534Sroot 	/*
32837715Smckusick 	 * Check to see if the vnode has been mounted on;
32937715Smckusick 	 * if so find the root of the mounted file system.
3307534Sroot 	 */
33137715Smckusick mntloop:
33237715Smckusick 	while (dp->v_type == VDIR && (mp = dp->v_mountedhere)) {
33337715Smckusick 		while(mp->m_flag & M_MLOCK) {
33437715Smckusick 			mp->m_flag |= M_MWAIT;
33537715Smckusick 			sleep((caddr_t)mp, PVFS);
33637715Smckusick 			goto mntloop;
33721014Smckusick 		}
33837715Smckusick 		error = VFS_ROOT(dp->v_mountedhere, &tdp);
33937715Smckusick 		if (error)
3407534Sroot 			goto bad2;
34137715Smckusick 		vput(dp);
34237715Smckusick 		ndp->ni_vp = dp = tdp;
34330Sbill 	}
3447534Sroot 
34537715Smckusick nextname:
34630Sbill 	/*
3477534Sroot 	 * Not a symbolic link.  If more pathname,
3487534Sroot 	 * continue at next component, else return.
34930Sbill 	 */
35037715Smckusick 	ndp->ni_ptr = ndp->ni_next;
35137715Smckusick 	if (*ndp->ni_ptr == '/') {
35237715Smckusick 		while (*ndp->ni_ptr == '/') {
35337715Smckusick 			ndp->ni_ptr++;
35437715Smckusick 			ndp->ni_pathlen--;
35537715Smckusick 		}
35637715Smckusick 		vrele(ndp->ni_dvp);
3577534Sroot 		goto dirloop;
35830Sbill 	}
3597534Sroot 	/*
36037715Smckusick 	 * Check for read-only file systems and executing texts
3617534Sroot 	 */
36237715Smckusick 	if (flag != LOOKUP && (error = vn_access(dp, VWRITE, ndp->ni_cred)))
36337715Smckusick 		goto bad2;
36437715Smckusick 	if (!wantparent)
36537715Smckusick 		vrele(ndp->ni_dvp);
36637715Smckusick 	if ((ndp->ni_nameiop & LOCKLEAF) == 0)
36737715Smckusick 		VOP_UNLOCK(dp);
36837715Smckusick 	FREE(ndp->ni_pnbuf, M_NAMEI);
36937715Smckusick 	return (0);
3707534Sroot 
37137715Smckusick bad2:
372*38001Smckusick 	if (lockparent && *ndp->ni_next == '\0')
373*38001Smckusick 		VOP_UNLOCK(ndp->ni_dvp);
37437715Smckusick 	vrele(ndp->ni_dvp);
37537715Smckusick bad:
37637715Smckusick 	vput(dp);
37737715Smckusick 	ndp->ni_vp = NULL;
37837715Smckusick 	FREE(ndp->ni_pnbuf, M_NAMEI);
37910849Ssam 	return (error);
3805972Swnj }
381