xref: /csrg-svn/sys/kern/vfs_lookup.c (revision 39758)
123401Smckusick /*
237715Smckusick  * Copyright (c) 1982, 1986, 1989 Regents of the University of California.
337715Smckusick  * All rights reserved.
423401Smckusick  *
537715Smckusick  * Redistribution and use in source and binary forms are permitted
637715Smckusick  * provided that the above copyright notice and this paragraph are
737715Smckusick  * duplicated in all such forms and that any documentation,
837715Smckusick  * advertising materials, and other materials related to such
937715Smckusick  * distribution and use acknowledge that the software was developed
1037715Smckusick  * by the University of California, Berkeley.  The name of the
1137715Smckusick  * University may not be used to endorse or promote products derived
1237715Smckusick  * from this software without specific prior written permission.
1337715Smckusick  * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR
1437715Smckusick  * IMPLIED WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED
1537715Smckusick  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
1637715Smckusick  *
17*39758Smckusick  *	@(#)vfs_lookup.c	7.19 (Berkeley) 12/20/89
1823401Smckusick  */
1930Sbill 
2017100Sbloom #include "param.h"
2137715Smckusick #include "time.h"
2237715Smckusick #include "namei.h"
2337715Smckusick #include "vnode.h"
2417100Sbloom #include "mount.h"
2537715Smckusick #include "errno.h"
2631650Smckusick #include "malloc.h"
2737715Smckusick 
2837582Smarc #ifdef KTRACE
2937715Smckusick #include "user.h"
3037582Smarc #include "proc.h"
3137582Smarc #include "ktrace.h"
3237582Smarc #endif
3330Sbill 
3430Sbill /*
3527268Smckusick  * Convert a pathname into a pointer to a vnode, returned in ndp->ni_vp.
367534Sroot  * This is a very central and rather complicated routine.
3730Sbill  *
3837715Smckusick  * The flag argument is LOOKUP, CREATE, RENAME, or DELETE depending on
3937715Smckusick  * whether the name is to be looked up, created, renamed, or deleted.
4037715Smckusick  * When CREATE, RENAME, or DELETE is specified, information usable in
4137715Smckusick  * creating, renaming, or deleting a directory entry may be calculated.
4237715Smckusick  * If flag has LOCKPARENT or'ed into it and the target of the pathname
4337715Smckusick  * exists, namei returns both the target and its parent directory locked.
4437715Smckusick  * When creating or renaming and LOCKPARENT is specified, the target may not
4537715Smckusick  * be ".".  When deleting and LOCKPARENT is specified, the target may be ".".
469166Ssam  *
4716688Smckusick  * The FOLLOW flag is set when symbolic links are to be followed
489166Ssam  * when they occur at the end of the name translation process.
4927268Smckusick  * Symbolic links are always followed for all pathname
5027268Smckusick  * components other than the last.
519166Ssam  *
5227268Smckusick  * The segflg defines whether the name is to be copied from user
5327268Smckusick  * space or kernel space.
5427268Smckusick  *
 * Return value: 0 on success, otherwise an errno value; on every error
 * return ndp->ni_vp is set to NULL.  On success the result vnode is
 * left locked only if LOCKLEAF is set in ni_nameiop.  If the operation
 * is neither LOOKUP nor DELETE and the lookup of the last component
 * fails with ENOENT, 0 is returned with ni_vp NULL and the parent
 * directory in ni_dvp so that the caller can create the entry.
 * The pathname buffer (ni_pnbuf) is released before every return.
 *
5515798Smckusick  * Overall outline of namei:
5615798Smckusick  *
577534Sroot  *	copy in name
587534Sroot  *	get starting directory
597534Sroot  * dirloop:
6016688Smckusick  *	copy next component of name to ndp->ni_dent
617534Sroot  *	handle degenerate case where name is null string
6237715Smckusick  *	if .. and on mounted filesys, find parent
6337715Smckusick  *	call lookup routine for next component name
6437715Smckusick  *	  directory vnode returned in ni_dvp, unlocked unless LOCKPARENT set
6537715Smckusick  *	  component vnode returned in ni_vp (if it exists), locked.
667534Sroot  *	if symbolic link, massage name in buffer and continue at dirloop
6737715Smckusick  *	if result vnode is mounted on, find mounted on vnode
687534Sroot  *	if more components of name, do next level at dirloop
6937715Smckusick  *	return the answer in ni_vp (locked if LOCKLEAF is set);
7037715Smckusick  *	  if LOCKPARENT set, return locked parent in ni_dvp
719166Ssam  *
7237715Smckusick  * NOTE: (LOOKUP | LOCKPARENT) currently returns the parent vnode unlocked.
7330Sbill  */
7416688Smckusick namei(ndp)
7516688Smckusick 	register struct nameidata *ndp;
7630Sbill {
777534Sroot 	register char *cp;		/* pointer into pathname argument */
7837715Smckusick 	register struct vnode *dp = 0;	/* the directory we are searching */
7937715Smckusick 	register int i;		   	/* Temp counter */
8037715Smckusick 	struct vnode *tdp;		/* saved dp */
8137715Smckusick 	struct mount *mp;		/* mount table entry */
8218109Smckusick 	int docache;			/* == 0 do not cache last component */
8337715Smckusick 	int flag;			/* LOOKUP, CREATE, RENAME or DELETE */
8437715Smckusick 	int wantparent;			/* nonzero => WANTPARENT or LOCKPARENT set */
8538001Smckusick 	int lockparent;			/* nonzero => LOCKPARENT set */
8637715Smckusick 	int error = 0;
8730Sbill 
	/*
	 * Split ni_nameiop into the operation (flag) and the modifier bits
	 * that are consulted repeatedly below.
	 */
88*39758Smckusick 	ndp->ni_dvp = NULL;
8937715Smckusick 	flag = ndp->ni_nameiop & OPFLAG;
9037715Smckusick 	wantparent = ndp->ni_nameiop & (LOCKPARENT|WANTPARENT);
9138001Smckusick 	lockparent = ndp->ni_nameiop & LOCKPARENT;
	/* docache is nonzero exactly when the NOCACHE bit is clear. */
9216688Smckusick 	docache = (ndp->ni_nameiop & NOCACHE) ^ NOCACHE;
	/* Deleting, or wanting the parent, also disables caching the last component. */
9337715Smckusick 	if (flag == DELETE || wantparent)
9415798Smckusick 		docache = 0;
9530Sbill 	/*
967534Sroot 	 * Get a buffer for the name to be translated, and copy the
977534Sroot 	 * name into the buffer.
	 * ni_segflg selects copystr (UIO_SYSSPACE) or copyinstr (otherwise);
	 * both store the copied length in ni_pathlen.
985972Swnj 	 */
9937715Smckusick 	MALLOC(ndp->ni_pnbuf, caddr_t, MAXPATHLEN, M_NAMEI, M_WAITOK);
10016688Smckusick 	if (ndp->ni_segflg == UIO_SYSSPACE)
10137715Smckusick 		error = copystr(ndp->ni_dirp, ndp->ni_pnbuf, MAXPATHLEN,
10237715Smckusick 		    &ndp->ni_pathlen);
10316688Smckusick 	else
10437715Smckusick 		error = copyinstr(ndp->ni_dirp, ndp->ni_pnbuf, MAXPATHLEN,
10537715Smckusick 		    &ndp->ni_pathlen);
	/* Copy failed: nothing is referenced or locked yet, so just free and return. */
10616688Smckusick 	if (error) {
10737715Smckusick 		free(ndp->ni_pnbuf, M_NAMEI);
10838003Smckusick 		ndp->ni_vp = NULL;
10937715Smckusick 		return (error);
1105972Swnj 	}
11137715Smckusick 	ndp->ni_ptr = ndp->ni_pnbuf;
11237715Smckusick 	ndp->ni_loopcnt = 0;
	/* Begin at the directory in ni_cdir, holding a reference on it. */
11337715Smckusick 	dp = ndp->ni_cdir;
11438347Smckusick 	VREF(dp);
11537582Smarc #ifdef KTRACE
11637582Smarc 	if (KTRPOINT(u.u_procp, KTR_NAMEI))
11737715Smckusick 		ktrnamei(u.u_procp->p_tracep, ndp->ni_pnbuf);
11837582Smarc #endif
1197534Sroot 
12037715Smckusick start:
1215972Swnj 	/*
1227534Sroot 	 * Get starting directory.
12337715Smckusick 	 * Done at start of translation and after symbolic link.
	 * For a name beginning with '/', the reference on the current dp is
	 * dropped, the leading slashes are skipped, and the search restarts
	 * from ni_rdir, or from rootdir when ni_rdir is NULL.
	 * In either case dp is locked before falling into dirloop.
12430Sbill 	 */
12537715Smckusick 	if (*ndp->ni_ptr == '/') {
12637715Smckusick 		vrele(dp);
12737715Smckusick 		while (*ndp->ni_ptr == '/') {
12837715Smckusick 			ndp->ni_ptr++;
12937715Smckusick 			ndp->ni_pathlen--;
13037715Smckusick 		}
13137715Smckusick 		if ((dp = ndp->ni_rdir) == NULL)
13230Sbill 			dp = rootdir;
13338347Smckusick 		VREF(dp);
13437715Smckusick 	}
13537715Smckusick 	VOP_LOCK(dp);
13618027Smckusick 	ndp->ni_endoff = 0;
1377534Sroot 
1387534Sroot 	/*
1397534Sroot 	 * We come to dirloop to search a new directory.
1407534Sroot 	 */
1416571Smckusic dirloop:
14230Sbill 	/*
14316688Smckusick 	 * Copy next component of name to ndp->ni_dent.
14437715Smckusick 	 * XXX kern_exec looks at d_name
14537715Smckusick 	 * ??? The ni_hash value may be useful for vfs_cache
14637715Smckusick 	 * XXX There must be the last component of the filename left
14737715Smckusick 	 * somewhere accessible via ndp for NFS (and any other stateless file
14837715Smckusick 	 * systems) in case they are doing a CREATE. The "Towards a..." noted
14937715Smckusick 	 * that ni_ptr would be left pointing to the last component, but since
15037715Smckusick 	 * the ni_pnbuf gets free'd, that is not a good idea.
	 *
	 * Two variants follow.  The "notdef" variant only measures the
	 * component in place; the #else variant, used when notdef is not
	 * defined, also copies it into ni_dent.d_name and computes ni_hash.
	 * Both reject a byte with the 0200 bit set with EINVAL unless the
	 * operation is DELETE, and always reject ('/'|0200).
1517534Sroot 	 */
15237743Smckusick #ifdef notdef
15337743Smckusick 	for (cp = ndp->ni_ptr; *cp != 0 && *cp != '/'; cp++) {
15437743Smckusick 		if ((*cp & 0200) == 0)
15537743Smckusick 			continue;
15637743Smckusick 		if ((*cp&0377) == ('/'|0200) || flag != DELETE) {
15737743Smckusick 			error = EINVAL;
15837743Smckusick 			goto bad;
15937743Smckusick 		}
16037743Smckusick 	}
16137743Smckusick 	ndp->ni_namelen = cp - ndp->ni_ptr;
16237743Smckusick 	if (ndp->ni_namelen >= MAXNAMLEN) {
16337743Smckusick 		error = ENAMETOOLONG;
16437743Smckusick 		goto bad;
16537743Smckusick 	}
16637743Smckusick 	ndp->ni_pathlen -= ndp->ni_namelen;
16737743Smckusick #ifdef NAMEI_DIAGNOSTIC
16837743Smckusick 	{ char c = *cp;
16937743Smckusick 	*cp = '\0';
17037743Smckusick 	printf("{%s}: ", ndp->ni_ptr);
17137743Smckusick 	*cp = c; }
17237743Smckusick #endif
17337743Smckusick #else fornow
17437715Smckusick 	ndp->ni_hash = 0;
17537715Smckusick 	for (cp = ndp->ni_ptr, i = 0; *cp != 0 && *cp != '/'; cp++) {
		/* Component longer than MAXNAMLEN bytes: give up. */
1766571Smckusic 		if (i >= MAXNAMLEN) {
17737715Smckusick 			error = ENAMETOOLONG;
1787534Sroot 			goto bad;
1795972Swnj 		}
18021014Smckusick 		if (*cp & 0200)
18121014Smckusick 			if ((*cp&0377) == ('/'|0200) || flag != DELETE) {
18237715Smckusick 				error = EINVAL;
18321014Smckusick 				goto bad;
18421014Smckusick 			}
18516688Smckusick 		ndp->ni_dent.d_name[i++] = *cp;
		/* i was already incremented: each byte is weighted by its 1-based position. */
18637715Smckusick 		ndp->ni_hash += (unsigned char)*cp * i;
1875972Swnj 	}
18837715Smckusick 	ndp->ni_namelen = i;
18916688Smckusick 	ndp->ni_dent.d_namlen = i;
19016688Smckusick 	ndp->ni_dent.d_name[i] = '\0';
19137715Smckusick 	ndp->ni_pathlen -= i;
19237715Smckusick #ifdef NAMEI_DIAGNOSTIC
19337715Smckusick 	printf("{%s}: ", ndp->ni_dent.d_name);
19437715Smckusick #endif
19537743Smckusick #endif fornow
	/*
	 * cp now points at the '/' or NUL that ended the component.
	 * ni_makeentry is cleared only for the last component when
	 * caching of the last component was disabled above.
	 */
19637715Smckusick 	ndp->ni_next = cp;
19737715Smckusick 	ndp->ni_makeentry = 1;
19818109Smckusick 	if (*cp == '\0' && docache == 0)
19937715Smckusick 		ndp->ni_makeentry = 0;
20037715Smckusick 	ndp->ni_isdotdot = (ndp->ni_namelen == 2 &&
20137715Smckusick 		ndp->ni_dent.d_name[1] == '.' && ndp->ni_dent.d_name[0] == '.');
2027534Sroot 
2037534Sroot 	/*
2047534Sroot 	 * Check for degenerate name (e.g. / or "")
2057534Sroot 	 * which is a way of talking about a directory,
2067534Sroot 	 * e.g. like "/." or ".".
	 * Only a plain LOOKUP without WANTPARENT/LOCKPARENT is allowed;
	 * anything else fails with EISDIR.  On success dp itself is the
	 * result, unlocked unless LOCKLEAF is set.
2077534Sroot 	 */
20837715Smckusick 	if (ndp->ni_ptr[0] == '\0') {
20937715Smckusick 		if (flag != LOOKUP || wantparent) {
21037715Smckusick 			error = EISDIR;
2117534Sroot 			goto bad;
2125972Swnj 		}
21337715Smckusick 		free(ndp->ni_pnbuf, M_NAMEI);
21437715Smckusick 		if (!(ndp->ni_nameiop & LOCKLEAF))
21537715Smckusick 			VOP_UNLOCK(dp);
21637715Smckusick 		ndp->ni_vp = dp;
21737715Smckusick 		return (0);
2185972Swnj 	}
2197534Sroot 
2206571Smckusic 	/*
22137715Smckusick 	 * Handle "..": two special cases.
22237715Smckusick 	 * 1. If at root directory (e.g. after chroot)
22337715Smckusick 	 *    then ignore it so can't get out.
22437715Smckusick 	 * 2. If this vnode is the root of a mounted
22537715Smckusick 	 *    file system, then replace it with the
22637715Smckusick 	 *    vnode which was mounted on so we take the
22737715Smckusick 	 *    .. in the other file system.
	 * The loop repeats case 2 until dp is no longer flagged VROOT,
	 * re-checking case 1 at every step.
22836547Smckusick 	 */
22937715Smckusick 	if (ndp->ni_isdotdot) {
23036547Smckusick 		for (;;) {
23137715Smckusick 			if (dp == ndp->ni_rdir || dp == rootdir) {
				/*
				 * ".." at the root yields the root itself: dp is
				 * recorded as both parent and result, and an
				 * additional reference is taken on it.
				 */
23237715Smckusick 				ndp->ni_dvp = dp;
23338390Smckusick 				ndp->ni_vp = dp;
23438347Smckusick 				VREF(dp);
23537715Smckusick 				goto nextname;
23636547Smckusick 			}
23737715Smckusick 			if ((dp->v_flag & VROOT) == 0)
23836547Smckusick 				break;
			/* Swap dp for the covered vnode: unlock+release old, ref+lock new. */
23937715Smckusick 			tdp = dp;
24037715Smckusick 			dp = dp->v_mount->m_vnodecovered;
24137715Smckusick 			vput(tdp);
24238390Smckusick 			VREF(dp);
24337715Smckusick 			VOP_LOCK(dp);
24436547Smckusick 		}
24536547Smckusick 	}
24636547Smckusick 
24736547Smckusick 	/*
24815798Smckusick 	 * We now have a segment name to search for, and a directory to search.
24915798Smckusick 	 */
25037715Smckusick 	if (error = VOP_LOOKUP(dp, ndp)) {
25137715Smckusick 		if (ndp->ni_vp != NULL)
25237715Smckusick 			panic("leaf should be empty");
25337582Smarc #ifdef NAMEI_DIAGNOSTIC
25437715Smckusick 		printf("not found\n");
25537582Smarc #endif
		/*
		 * The failure is fatal unless all of these hold: the operation
		 * is neither LOOKUP nor DELETE, the error is ENOENT, and this
		 * was the last component of the pathname.
		 */
25638581Smckusick 		if (flag == LOOKUP || flag == DELETE ||
25738581Smckusick 		    error != ENOENT || *cp != 0)
25838581Smckusick 			goto bad;
2595972Swnj 		/*
26037715Smckusick 		 * If creating and at end of pathname, then can consider
26137715Smckusick 		 * allowing file to be created.
		 * A parent directory on a read-only mount rules that out.
2625972Swnj 		 */
26338581Smckusick 		if (ndp->ni_dvp->v_mount->m_flag & M_RDONLY) {
26437715Smckusick 			error = EROFS;
2657534Sroot 			goto bad;
26638581Smckusick 		}
2675972Swnj 		/*
26837715Smckusick 		 * We return with ni_vp NULL to indicate that the entry
26937715Smckusick 		 * doesn't currently exist, leaving a pointer to the
27037715Smckusick 		 * (possibly locked) directory vnode in ndp->ni_dvp.
2715972Swnj 		 */
27237715Smckusick 		FREE(ndp->ni_pnbuf, M_NAMEI);
27337715Smckusick 		return (0);	/* should this be ENOENT? */
2747534Sroot 	}
27537582Smarc #ifdef NAMEI_DIAGNOSTIC
27637715Smckusick 	printf("found\n");
27737582Smarc #endif
2787534Sroot 
2797534Sroot 	/*
28037715Smckusick 	 * Check for symbolic link
	 * A link is expanded when FOLLOW is set or when more pathname
	 * follows it (the next character is '/').  At most MAXSYMLINKS
	 * expansions are allowed per call; beyond that the result is ELOOP.
	 *
	 * When ni_pathlen > 1 a fresh buffer receives the link text followed
	 * by the unparsed remainder of the name; otherwise the link text is
	 * read directly over ni_pnbuf.  (Presumably ni_pathlen counts the
	 * terminating NUL, so 1 means nothing but the terminator is left --
	 * confirm against copystr/copyinstr.)
	 *
	 * NOTE(review): the unbraced "if (...) MALLOC(...); else" below only
	 * parses if MALLOC expands to a single expression statement -- confirm
	 * against the MALLOC definition in malloc.h.
	 *
	 * NOTE(review): in the in-place case the link text overwrites
	 * ni_pnbuf, which ni_next points into; the test of *ndp->ni_next
	 * at bad2 may then be examining link text rather than the original
	 * pathname -- confirm whether that is intended.
2817534Sroot 	 */
28237715Smckusick 	dp = ndp->ni_vp;
28337715Smckusick 	if ((dp->v_type == VLNK) &&
28437715Smckusick 	    ((ndp->ni_nameiop & FOLLOW) || *ndp->ni_next == '/')) {
28537715Smckusick 		struct iovec aiov;
28637715Smckusick 		struct uio auio;
28737715Smckusick 		int linklen;
2887534Sroot 
28937715Smckusick 		if (++ndp->ni_loopcnt > MAXSYMLINKS) {
29037715Smckusick 			error = ELOOP;
29137715Smckusick 			goto bad2;
29237715Smckusick 		}
29338215Smckusick 		if (ndp->ni_pathlen > 1)
29437715Smckusick 			MALLOC(cp, char *, MAXPATHLEN, M_NAMEI, M_WAITOK);
2957534Sroot 		else
29637715Smckusick 			cp = ndp->ni_pnbuf;
		/* Describe a single MAXPATHLEN-byte kernel-space read into cp. */
29737715Smckusick 		aiov.iov_base = cp;
29837715Smckusick 		aiov.iov_len = MAXPATHLEN;
29937715Smckusick 		auio.uio_iov = &aiov;
30037715Smckusick 		auio.uio_iovcnt = 1;
30137715Smckusick 		auio.uio_offset = 0;
30237715Smckusick 		auio.uio_rw = UIO_READ;
30337715Smckusick 		auio.uio_segflg = UIO_SYSSPACE;
30437715Smckusick 		auio.uio_resid = MAXPATHLEN;
30537715Smckusick 		if (error = VOP_READLINK(dp, &auio, ndp->ni_cred)) {
			/* Free cp only if it is the separately allocated buffer. */
30638215Smckusick 			if (ndp->ni_pathlen > 1)
30737715Smckusick 				free(cp, M_NAMEI);
30837715Smckusick 			goto bad2;
3099166Ssam 		}
		/* Bytes actually read = requested size minus what is left over. */
31037715Smckusick 		linklen = MAXPATHLEN - auio.uio_resid;
		/* Link text plus remaining pathname must fit in one buffer. */
31137715Smckusick 		if (linklen + ndp->ni_pathlen >= MAXPATHLEN) {
31238215Smckusick 			if (ndp->ni_pathlen > 1)
31337715Smckusick 				free(cp, M_NAMEI);
31437715Smckusick 			error = ENAMETOOLONG;
31512011Smckusick 			goto bad2;
31615798Smckusick 		}
31738215Smckusick 		if (ndp->ni_pathlen > 1) {
			/* Append the unparsed remainder, then adopt cp as the name buffer. */
31838215Smckusick 			bcopy(ndp->ni_next, cp + linklen, ndp->ni_pathlen);
31937715Smckusick 			FREE(ndp->ni_pnbuf, M_NAMEI);
32037715Smckusick 			ndp->ni_pnbuf = cp;
32138215Smckusick 		} else
32238001Smckusick 			ndp->ni_pnbuf[linklen] = '\0';
32337715Smckusick 		ndp->ni_ptr = cp;
		/*
		 * Drop the link vnode and resume from its parent directory.
		 * If LOCKPARENT is set and the link was the last component,
		 * the parent is unlocked here; "start" locks dp again.
		 */
32437715Smckusick 		vput(dp);
32537715Smckusick 		dp = ndp->ni_dvp;
32638393Smckusick 		if (lockparent && ndp->ni_pathlen == 1)
32738001Smckusick 			VOP_UNLOCK(dp);
32838393Smckusick 		ndp->ni_pathlen += linklen;
32937715Smckusick 		goto start;
33015798Smckusick 	}
33115798Smckusick 
3327534Sroot 	/*
33337715Smckusick 	 * Check to see if the vnode has been mounted on;
33437715Smckusick 	 * if so find the root of the mounted file system.
	 * While the mount has M_MLOCK set, M_MWAIT is set and we sleep on
	 * the mount structure, then re-examine dp from mntloop.
	 * The outer loop repeats for as long as the vnode obtained from
	 * VFS_ROOT is itself a directory that is mounted on.
3357534Sroot 	 */
33637715Smckusick mntloop:
33737715Smckusick 	while (dp->v_type == VDIR && (mp = dp->v_mountedhere)) {
33837715Smckusick 		while(mp->m_flag & M_MLOCK) {
33937715Smckusick 			mp->m_flag |= M_MWAIT;
34037715Smckusick 			sleep((caddr_t)mp, PVFS);
34137715Smckusick 			goto mntloop;
34221014Smckusick 		}
34337715Smckusick 		error = VFS_ROOT(dp->v_mountedhere, &tdp);
34437715Smckusick 		if (error)
3457534Sroot 			goto bad2;
		/* Replace the covered vnode with the root returned by VFS_ROOT. */
34637715Smckusick 		vput(dp);
34737715Smckusick 		ndp->ni_vp = dp = tdp;
34830Sbill 	}
3497534Sroot 
35037715Smckusick nextname:
35130Sbill 	/*
3527534Sroot 	 * Not a symbolic link.  If more pathname,
3537534Sroot 	 * continue at next component, else return.
	 * When continuing, runs of '/' are skipped and the reference on
	 * the directory just searched (ni_dvp) is dropped.
35430Sbill 	 */
35537715Smckusick 	ndp->ni_ptr = ndp->ni_next;
35637715Smckusick 	if (*ndp->ni_ptr == '/') {
35737715Smckusick 		while (*ndp->ni_ptr == '/') {
35837715Smckusick 			ndp->ni_ptr++;
35937715Smckusick 			ndp->ni_pathlen--;
36037715Smckusick 		}
36137715Smckusick 		vrele(ndp->ni_dvp);
3627534Sroot 		goto dirloop;
36330Sbill 	}
3647534Sroot 	/*
36538400Smckusick 	 * Check for read-only file systems.
3667534Sroot 	 */
36738400Smckusick 	if (flag == DELETE || flag == RENAME) {
36838267Smckusick 		/*
36938400Smckusick 		 * Disallow directory write attempts on read-only
37038400Smckusick 		 * file systems.
		 * The target's mount is always checked; the parent's mount
		 * is checked only when the caller asked for the parent.
37138267Smckusick 		 */
37238400Smckusick 		if ((dp->v_mount->m_flag & M_RDONLY) ||
37338400Smckusick 		    (wantparent && (ndp->ni_dvp->v_mount->m_flag & M_RDONLY))) {
37438267Smckusick 			error = EROFS;
37538267Smckusick 			goto bad2;
37638267Smckusick 		}
37738267Smckusick 	}
	/*
	 * Success: drop the parent reference unless the caller wants the
	 * parent, unlock the result unless LOCKLEAF is set, and free the
	 * name buffer.
	 */
37837715Smckusick 	if (!wantparent)
37937715Smckusick 		vrele(ndp->ni_dvp);
38037715Smckusick 	if ((ndp->ni_nameiop & LOCKLEAF) == 0)
38137715Smckusick 		VOP_UNLOCK(dp);
38237715Smckusick 	FREE(ndp->ni_pnbuf, M_NAMEI);
38337715Smckusick 	return (0);
3847534Sroot 
	/*
	 * Error exits.  bad2 is used once ni_dvp holds a parent reference:
	 * the parent is unlocked if LOCKPARENT is set and ni_next points at
	 * a NUL, its reference is dropped, and control falls into bad.
	 * bad unlocks and releases dp, clears ni_vp and frees the name
	 * buffer before returning the error.
	 */
38537715Smckusick bad2:
38638001Smckusick 	if (lockparent && *ndp->ni_next == '\0')
38738001Smckusick 		VOP_UNLOCK(ndp->ni_dvp);
38837715Smckusick 	vrele(ndp->ni_dvp);
38937715Smckusick bad:
39037715Smckusick 	vput(dp);
39137715Smckusick 	ndp->ni_vp = NULL;
39237715Smckusick 	FREE(ndp->ni_pnbuf, M_NAMEI);
39310849Ssam 	return (error);
3945972Swnj }
395