xref: /netbsd-src/sys/fs/msdosfs/msdosfs_lookup.c (revision 6a493d6bc668897c91594964a732d38505b70cbb)
1 /*	$NetBSD: msdosfs_lookup.c,v 1.30 2013/12/24 16:51:24 mlelstv Exp $	*/
2 
3 /*-
4  * Copyright (C) 1994, 1995, 1997 Wolfgang Solfrank.
5  * Copyright (C) 1994, 1995, 1997 TooLs GmbH.
6  * All rights reserved.
7  * Original code by Paul Popelka (paulp@uts.amdahl.com) (see below).
8  *
9  * Redistribution and use in source and binary forms, with or without
10  * modification, are permitted provided that the following conditions
11  * are met:
12  * 1. Redistributions of source code must retain the above copyright
13  *    notice, this list of conditions and the following disclaimer.
14  * 2. Redistributions in binary form must reproduce the above copyright
15  *    notice, this list of conditions and the following disclaimer in the
16  *    documentation and/or other materials provided with the distribution.
17  * 3. All advertising materials mentioning features or use of this software
18  *    must display the following acknowledgement:
19  *	This product includes software developed by TooLs GmbH.
20  * 4. The name of TooLs GmbH may not be used to endorse or promote products
21  *    derived from this software without specific prior written permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY TOOLS GMBH ``AS IS'' AND ANY EXPRESS OR
24  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
25  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
26  * IN NO EVENT SHALL TOOLS GMBH BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
27  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
28  * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
29  * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
30  * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
31  * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
32  * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
33  */
34 /*
35  * Written by Paul Popelka (paulp@uts.amdahl.com)
36  *
37  * You can do anything you want with this software, just don't say you wrote
38  * it, and don't remove this notice.
39  *
40  * This software is provided "as is".
41  *
42  * The author supplies this software to be publicly redistributed on the
43  * understanding that the author is not responsible for the correct
44  * functioning of this software in any circumstances and is not liable for
45  * any damages caused by this software.
46  *
47  * October 1992
48  */
49 
50 #if HAVE_NBTOOL_CONFIG_H
51 #include "nbtool_config.h"
52 #endif
53 
54 #include <sys/cdefs.h>
55 __KERNEL_RCSID(0, "$NetBSD: msdosfs_lookup.c,v 1.30 2013/12/24 16:51:24 mlelstv Exp $");
56 
57 #include <sys/param.h>
58 
59 #ifdef _KERNEL
60 #include <sys/systm.h>
61 #include <sys/mount.h>
62 #include <sys/kauth.h>
63 #include <sys/namei.h>
64 #include <sys/dirent.h>
65 #include <sys/buf.h>
66 #include <sys/vnode.h>
67 #else
68 #include <ffs/buf.h>
69 #endif /* _KERNEL */
70 
71 #include <fs/msdosfs/bpb.h>
72 #include <fs/msdosfs/direntry.h>
73 #include <fs/msdosfs/denode.h>
74 #include <fs/msdosfs/msdosfsmount.h>
75 #include <fs/msdosfs/fat.h>
76 
77 
78 #ifdef _KERNEL
79 /*
80  * When we search a directory the blocks containing directory entries are
81  * read and examined.  The directory entries contain information that would
82  * normally be in the inode of a unix filesystem.  This means that some of
83  * a directory's contents may also be in memory resident denodes (sort of
84  * an inode).  This can cause problems if we are searching while some other
85  * process is modifying a directory.  To prevent one process from accessing
86  * incompletely modified directory information we depend upon being the
87  * sole owner of a directory block.  bread/brelse provide this service.
88  * This being the case, when a process modifies a directory it must first
89  * acquire the disk block that contains the directory entry to be modified.
90  * Then update the disk block and the denode, and then write the disk block
91  * out to disk.  This way disk blocks containing directory entries and in
92  * memory denode's will be in synch.
    *
    * msdosfs_lookup() searches the directory a_dvp for the component
    * described by a_cnp and, on success, stores the resulting vnode in
    * *a_vpp (which is set to NULL on entry).
    *
    * Returns:
    *	0		the entry was found (or the name cache had it).
    *	EJUSTRETURN	the entry was not found, but this is the last
    *			component of a CREATE or RENAME; de_fndoffset and
    *			de_fndcnt of the directory's denode then describe
    *			where the new entry (and its Win95 slots) may go.
    *	ENOENT		the entry was not found otherwise.
    *	EROFS, EINVAL, EISDIR, or the error reported by VOP_ACCESS(),
    *	pcbmap(), bread() or deget() in the remaining cases.
93  */
94 int
95 msdosfs_lookup(void *v)
96 {
97 	struct vop_lookup_args /* {
98 		struct vnode *a_dvp;
99 		struct vnode **a_vpp;
100 		struct componentname *a_cnp;
101 	} */ *ap = v;
102 	struct vnode *vdp = ap->a_dvp;
103 	struct vnode **vpp = ap->a_vpp;
104 	struct componentname *cnp = ap->a_cnp;
105 	daddr_t bn;
106 	int error;
107 	int slotcount;
108 	int slotoffset = 0;
109 	int frcn;
110 	u_long cluster;
111 	int blkoff;
112 	int diroff;
113 	int blsize;
114 	int isadir;		/* ~0 if found direntry is a directory	 */
115 	u_long scn;		/* starting cluster number		 */
116 	struct vnode *pdp;
117 	struct denode *dp;
118 	struct denode *tdp;
119 	struct msdosfsmount *pmp;
120 	struct buf *bp = 0;
121 	struct direntry *dep;
122 	u_char dosfilename[12];
123 	int flags;
124 	int nameiop = cnp->cn_nameiop;
125 	int wincnt = 1;
126 	int chksum = -1, chksum_ok;
127 	int olddos = 1;
128 
129 	flags = cnp->cn_flags;
130 
131 #ifdef MSDOSFS_DEBUG
132 	printf("msdosfs_lookup(): looking for %.*s\n",
133 		(int)cnp->cn_namelen, cnp->cn_nameptr);
134 #endif
135 	dp = VTODE(vdp);
136 	pmp = dp->de_pmp;
137 	*vpp = NULL;
138 #ifdef MSDOSFS_DEBUG
139 	printf("msdosfs_lookup(): vdp %p, dp %p, Attr %02x\n",
140 	    vdp, dp, dp->de_Attributes);
141 #endif
142 
143 	/*
144 	 * Check accessibility of directory.
145 	 */
146 	if ((error = VOP_ACCESS(vdp, VEXEC, cnp->cn_cred)) != 0)
147 		return (error);
148 
149 	if ((flags & ISLASTCN) && (vdp->v_mount->mnt_flag & MNT_RDONLY) &&
150 	    (cnp->cn_nameiop == DELETE || cnp->cn_nameiop == RENAME))
151 		return (EROFS);
152 
153 	/*
154 	 * We now have a segment name to search for, and a directory to search.
155 	 *
156 	 * Before tediously performing a linear scan of the directory,
157 	 * check the name cache to see if the directory/name pair
158 	 * we are looking for is known already.
159 	 */
160 	if (cache_lookup(vdp, cnp->cn_nameptr, cnp->cn_namelen,
161 			 cnp->cn_nameiop, cnp->cn_flags, NULL, vpp)) {
162 		return *vpp == NULLVP ? ENOENT: 0;
163 	}
164 
165 	/*
166 	 * If they are going after the . or .. entry in the root directory,
167 	 * they won't find it.  DOS filesystems don't have them in the root
168 	 * directory.  So, we fake it. deget() is in on this scam too.
169 	 */
170 	if ((vdp->v_vflag & VV_ROOT) && cnp->cn_nameptr[0] == '.' &&
171 	    (cnp->cn_namelen == 1 ||
172 		(cnp->cn_namelen == 2 && cnp->cn_nameptr[1] == '.'))) {
173 		isadir = ATTR_DIRECTORY;
174 		scn = MSDOSFSROOT;
175 #ifdef MSDOSFS_DEBUG
176 		printf("msdosfs_lookup(): looking for . or .. in root directory\n");
177 #endif
178 		cluster = MSDOSFSROOT;
179 		blkoff = MSDOSFSROOT_OFS;
180 		goto foundroot;
181 	}
182 
    	/*
    	 * Convert the name to DOS 8.3 form.  A return of 0 rejects the
    	 * name; 2 and 3 additionally size the Win95 long-name slots, and
    	 * 3 also disables matching by plain 8.3 comparison (olddos = 0).
    	 */
183 	switch (unix2dosfn((const u_char *)cnp->cn_nameptr, dosfilename,
184 	    cnp->cn_namelen, 0)) {
185 	case 0:
186 		return (EINVAL);
187 	case 1:
188 		break;
189 	case 2:
190 		wincnt = winSlotCnt((const u_char *)cnp->cn_nameptr,
191 		    cnp->cn_namelen) + 1;
192 		break;
193 	case 3:
194 		olddos = 0;
195 		wincnt = winSlotCnt((const u_char *)cnp->cn_nameptr,
196 		    cnp->cn_namelen) + 1;
197 		break;
198 	}
199 	if (pmp->pm_flags & MSDOSFSMNT_SHORTNAME)
200 		wincnt = 1;
201 
202 	/*
203 	 * Suppress search for slots unless creating
204 	 * file and at end of pathname, in which case
205 	 * we watch for a place to put the new file in
206 	 * case it doesn't already exist.
    	 *
    	 * slotcount == wincnt means "not collecting free slots";
    	 * resetting it to 0 makes the scan below count consecutive
    	 * free slots until wincnt of them have been seen.
207 	 */
208 	slotcount = wincnt;
209 	if ((nameiop == CREATE || nameiop == RENAME) &&
210 	    (flags & ISLASTCN))
211 		slotcount = 0;
212 
213 #ifdef MSDOSFS_DEBUG
214 	printf("msdosfs_lookup(): dos filename: %s\n", dosfilename);
215 #endif
216 	/*
217 	 * Search the directory pointed at by vdp for the name pointed at
218 	 * by cnp->cn_nameptr.
219 	 */
220 	tdp = NULL;
221 	/*
222 	 * The outer loop ranges over the clusters that make up the
223 	 * directory.  Note that the root directory is different from all
224 	 * other directories.  It has a fixed number of blocks that are not
225 	 * part of the pool of allocatable clusters.  So, we treat it a
226 	 * little differently. The root directory starts at "cluster" 0.
227 	 */
228 	diroff = 0;
229 	for (frcn = 0; diroff < dp->de_FileSize; frcn++) {
230 		if ((error = pcbmap(dp, frcn, &bn, &cluster, &blsize)) != 0) {
231 			if (error == E2BIG)
232 				break;
233 			return (error);
234 		}
235 		error = bread(pmp->pm_devvp, de_bn2kb(pmp, bn), blsize, NOCRED,
236 		    0, &bp);
237 		if (error) {
238 			return (error);
239 		}
240 		for (blkoff = 0; blkoff < blsize;
241 		     blkoff += sizeof(struct direntry),
242 		     diroff += sizeof(struct direntry)) {
243 			dep = (struct direntry *)((char *)bp->b_data + blkoff);
244 			/*
245 			 * If the slot is empty and we are still looking
246 			 * for an empty then remember this one.  If the
247 			 * slot is not empty then check to see if it
248 			 * matches what we are looking for.  If the slot
249 			 * has never been filled with anything, then the
250 			 * remainder of the directory has never been used,
251 			 * so there is no point in searching it.
252 			 */
253 			if (dep->deName[0] == SLOT_EMPTY ||
254 			    dep->deName[0] == SLOT_DELETED) {
255 				/*
256 				 * Drop memory of previous long matches
257 				 */
258 				chksum = -1;
259 
260 				if (slotcount < wincnt) {
261 					slotcount++;
262 					slotoffset = diroff;
263 				}
264 				if (dep->deName[0] == SLOT_EMPTY) {
265 					brelse(bp, 0);
266 					goto notfound;
267 				}
268 			} else {
269 				/*
270 				 * If there wasn't enough space for our
271 				 * winentries, forget about the empty space
272 				 */
273 				if (slotcount < wincnt)
274 					slotcount = 0;
275 
276 				/*
277 				 * Check for Win95 long filename entry
278 				 */
279 				if (dep->deAttributes == ATTR_WIN95) {
280 					if (pmp->pm_flags & MSDOSFSMNT_SHORTNAME)
281 						continue;
282 
283 					chksum = winChkName((const u_char *)cnp->cn_nameptr,
284 							    cnp->cn_namelen,
285 							    (struct winentry *)dep,
286 							    chksum);
287 					continue;
288 				}
289 
290 				/*
291 				 * Ignore volume labels (anywhere, not just
292 				 * the root directory).
293 				 */
294 				if (dep->deAttributes & ATTR_VOLUME) {
295 					chksum = -1;
296 					continue;
297 				}
298 
299 				/*
300 				 * Check for a checksum or name match
    				 *
    				 * chksum is whatever winChkName() produced
    				 * for the preceding Win95 entries (or -1 if
    				 * it was reset).  Without a checksum match,
    				 * only a plain 8.3 name (olddos) may match,
    				 * by comparing name and extension directly.
301 				 */
302 				chksum_ok = (chksum == winChksum(dep->deName));
303 				if (!chksum_ok && (
304 					!olddos ||
305 					memcmp(&dosfilename[0],dep->deName,8) ||
306 					memcmp(&dosfilename[8],dep->deExtension,3))) {
307 					chksum = -1;
308 					continue;
309 				}
310 #ifdef MSDOSFS_DEBUG
311 				printf("msdosfs_lookup(): match blkoff %d, diroff %d\n",
312 				    blkoff, diroff);
313 #endif
314 				/*
315 				 * Remember where this directory
316 				 * entry came from for whoever did
317 				 * this lookup.
318 				 */
319 				dp->de_fndoffset = diroff;
320 				if (chksum_ok && nameiop == RENAME) {
321 					/*
322 					 * Target had correct long name
323 					 * directory entries, reuse them
324 					 * as needed.
325 					 */
326 					dp->de_fndcnt = wincnt - 1;
327 				} else {
328 					/*
329 					 * Long name directory entries
330 					 * not present or corrupt, can only
331 					 * reuse dos directory entry.
332 					 */
333 					dp->de_fndcnt = 0;
334 				}
335 
336 				goto found;
337 			}
338 		}	/* for (blkoff = 0; .... */
339 		/*
340 		 * Release the buffer holding the directory cluster just
341 		 * searched.
342 		 */
343 		brelse(bp, 0);
344 	}	/* for (frcn = 0; ; frcn++) */
345 
346 notfound:
347 	/*
348 	 * We hold no disk buffers at this point.
349 	 */
350 
351 	/*
352 	 * If we get here we didn't find the entry we were looking for. But
353 	 * that's ok if we are creating or renaming and are at the end of
354 	 * the pathname and the directory hasn't been removed.
355 	 */
356 #ifdef MSDOSFS_DEBUG
357 	printf("msdosfs_lookup(): op %d, refcnt %ld, slotcount %d, slotoffset %d\n",
358 	    nameiop, dp->de_refcnt, slotcount, slotoffset);
359 #endif
360 	if ((nameiop == CREATE || nameiop == RENAME) &&
361 	    (flags & ISLASTCN) && dp->de_refcnt != 0) {
362 		/*
363 		 * Access for write is interpreted as allowing
364 		 * creation of files in the directory.
365 		 */
366 		error = VOP_ACCESS(vdp, VWRITE, cnp->cn_cred);
367 		if (error)
368 			return (error);
369 
370 		/*
371 		 * Fixup the slot description to point to the place where
372 		 * we might put the new DOS direntry (putting the Win95
373 		 * long name entries before that)
    		 *
    		 * With no free slot remembered, start at diroff, i.e.
    		 * where the scan stopped.  If fewer than wincnt slots
    		 * were collected, push slotoffset forward by the number
    		 * of slots still missing.
374 		 */
375 		if (!slotcount) {
376 			slotcount = 1;
377 			slotoffset = diroff;
378 		}
379 		if (wincnt > slotcount) {
380 			slotoffset +=
381 				sizeof(struct direntry) * (wincnt - slotcount);
382 		}
383 
384 		/*
385 		 * Return an indication of where the new directory
386 		 * entry should be put.
387 		 */
388 		dp->de_fndoffset = slotoffset;
389 		dp->de_fndcnt = wincnt - 1;
390 
391 		/*
392 		 * We return with the directory locked, so that
393 		 * the parameters we set up above will still be
394 		 * valid if we actually decide to do a direnter().
395 		 * We return ni_vp == NULL to indicate that the entry
396 		 * does not currently exist; we leave a pointer to
397 		 * the (locked) directory inode in ndp->ni_dvp.
398 		 *
399 		 * NB - if the directory is unlocked, then this
400 		 * information cannot be used.
401 		 */
402 		return (EJUSTRETURN);
403 	}
404 
405 #if 0
406 	/*
407 	 * Insert name into cache (as non-existent) if appropriate.
408 	 *
409 	 * XXX Negative caching is broken for msdosfs because the name
410 	 * cache doesn't understand peculiarities such as case insensitivity
411 	 * and 8.3 filenames.  Hence, it may not invalidate all negative
412 	 * entries if a file with this name is later created.
413 	 * e.g. creating a file 'foo' won't invalidate a negative entry
414 	 * for 'FOO'.
415 	 */
416 	if (nameiop != CREATE)
417 		cache_enter(vdp, *vpp, cnp->cn_nameptr, cnp->cn_namelen,
418 			    cnp->cn_flags);
419 #endif
420 
421 	return (ENOENT);
422 
423 found:
424 	/*
425 	 * NOTE:  We still have the buffer with matched directory entry at
426 	 * this point.
427 	 */
428 	isadir = dep->deAttributes & ATTR_DIRECTORY;
429 	scn = getushort(dep->deStartCluster);
430 	if (FAT32(pmp)) {
431 		scn |= getushort(dep->deHighClust) << 16;
432 		if (scn == pmp->pm_rootdirblk) {
433 			/*
434 			 * There should actually be 0 here.
435 			 * Just ignore the error.
436 			 */
437 			scn = MSDOSFSROOT;
438 		}
439 	}
440 
    	/*
    	 * Pick the (cluster, blkoff) pair handed to deget() below.  A
    	 * directory is identified by its own start cluster; any other
    	 * entry by the cluster it was found in, where an entry found in
    	 * the fixed root directory uses its offset from the start of the
    	 * directory (diroff) rather than the offset within the block
    	 * just read.
    	 */
441 	if (isadir) {
442 		cluster = scn;
443 		if (cluster == MSDOSFSROOT)
444 			blkoff = MSDOSFSROOT_OFS;
445 		else
446 			blkoff = 0;
447 	} else if (cluster == MSDOSFSROOT)
448 		blkoff = diroff;
449 
450 	/*
451 	 * Now release buf to allow deget to read the entry again.
452 	 * Reserving it here and giving it to deget could result
453 	 * in a deadlock.
454 	 */
455 	brelse(bp, 0);
456 
457 foundroot:
458 	/*
459 	 * If we entered at foundroot, then we are looking for the . or ..
460 	 * entry of the filesystems root directory.  isadir and scn were
461 	 * setup before jumping here.  And, bp is already null.
462 	 */
463 	if (FAT32(pmp) && scn == MSDOSFSROOT)
464 		scn = pmp->pm_rootdirblk;
465 
466 	/*
467 	 * If deleting, and at end of pathname, return
468 	 * parameters which can be used to remove file.
469 	 * Lock the inode, being careful with ".".
470 	 */
471 	if (nameiop == DELETE && (flags & ISLASTCN)) {
472 		/*
473 		 * Don't allow deleting the root.
474 		 */
475 		if (blkoff == MSDOSFSROOT_OFS)
476 			return EINVAL;
477 
478 		/*
479 		 * Write access to directory required to delete files.
480 		 */
481 		error = VOP_ACCESS(vdp, VWRITE, cnp->cn_cred);
482 		if (error)
483 			return (error);
484 
485 		/*
486 		 * Return pointer to current entry in dp->i_offset.
487 		 * Save directory inode pointer in ndp->ni_dvp for dirremove().
488 		 */
489 		if (dp->de_StartCluster == scn && isadir) {	/* "." */
490 			vref(vdp);
491 			*vpp = vdp;
492 			return (0);
493 		}
494 		if ((error = deget(pmp, cluster, blkoff, &tdp)) != 0)
495 			return (error);
496 		*vpp = DETOV(tdp);
497 		return (0);
498 	}
499 
500 	/*
501 	 * If rewriting (RENAME), return the inode and the
502 	 * information required to rewrite the present directory
503 	 * Must get inode of directory entry to verify it's a
504 	 * regular file, or empty directory.
505 	 */
506 	if (nameiop == RENAME && (flags & ISLASTCN)) {
507 
508 		if (vdp->v_mount->mnt_flag & MNT_RDONLY)
509 			return (EROFS);
510 
511 		if (blkoff == MSDOSFSROOT_OFS)
512 			return EINVAL;
513 
514 		error = VOP_ACCESS(vdp, VWRITE, cnp->cn_cred);
515 		if (error)
516 			return (error);
517 
518 		/*
519 		 * Careful about locking second inode.
520 		 * This can only occur if the target is ".".
521 		 */
522 		if (dp->de_StartCluster == scn && isadir)
523 			return (EISDIR);
524 
525 		if ((error = deget(pmp, cluster, blkoff, &tdp)) != 0)
526 			return (error);
527 		*vpp = DETOV(tdp);
528 		return (0);
529 	}
530 
531 	/*
532 	 * Step through the translation in the name.  We do not `vput' the
533 	 * directory because we may need it again if a symbolic link
534 	 * is relative to the current directory.  Instead we save it
535 	 * unlocked as "pdp".  We must get the target inode before unlocking
536 	 * the directory to insure that the inode will not be removed
537 	 * before we get it.  We prevent deadlock by always fetching
538 	 * inodes from the root, moving down the directory tree. Thus
539 	 * when following backward pointers ".." we must unlock the
540 	 * parent directory before getting the requested directory.
541 	 * There is a potential race condition here if both the current
542 	 * and parent directories are removed before the VFS_VGET for the
543 	 * inode associated with ".." returns.  We hope that this occurs
544 	 * infrequently since we cannot avoid this race condition without
545 	 * implementing a sophisticated deadlock detection algorithm.
546 	 * Note also that this simple deadlock detection scheme will not
547 	 * work if the file system has any hard links other than ".."
548 	 * that point backwards in the directory structure.
549 	 */
550 	pdp = vdp;
551 	if (flags & ISDOTDOT) {
552 		VOP_UNLOCK(pdp);	/* race to get the inode */
553 		error = deget(pmp, cluster, blkoff, &tdp);
554 		vn_lock(pdp, LK_EXCLUSIVE | LK_RETRY);
555 		if (error) {
556 			return error;
557 		}
558 		*vpp = DETOV(tdp);
559 	} else if (dp->de_StartCluster == scn && isadir) {
560 		vref(vdp);	/* we want ourself, ie "." */
561 		*vpp = vdp;
562 	} else {
563 		if ((error = deget(pmp, cluster, blkoff, &tdp)) != 0)
564 			return (error);
565 		*vpp = DETOV(tdp);
566 	}
567 
568 	/*
569 	 * Insert name into cache if appropriate.
570 	 */
571 	cache_enter(vdp, *vpp, cnp->cn_nameptr, cnp->cn_namelen, cnp->cn_flags);
572 
573 	return 0;
574 }
575 #endif /* _KERNEL */
576 
577 /*
    * Write a new directory entry (and its Win95 long-name slots, if any)
    * into directory ddep at the position recorded in ddep->de_fndoffset /
    * ddep->de_fndcnt, extending the directory first when that position lies
    * at or beyond its current size.
    *
578  * dep  - directory entry to copy into the directory
579  * ddep - directory to add to
580  * depp - return the address of the denode for the created directory entry
581  *	  if depp != 0
582  * cnp  - componentname needed for Win95 long filenames
    *
    * Returns 0 on success (or the result of deget() when depp != 0),
    * otherwise the error that stopped the operation.  When a failure
    * happens after slots have been written, the rollback path marks slots
    * as deleted before returning that original error.
583  */
584 int
585 createde(struct denode *dep, struct denode *ddep, struct denode **depp, struct componentname *cnp)
586 {
587 	int error, rberror;
588 	u_long dirclust, clusoffset;
589 	u_long fndoffset, havecnt = 0, wcnt = 1, i;
590 	struct direntry *ndep;
591 	struct msdosfsmount *pmp = ddep->de_pmp;
592 	struct buf *bp;
593 	daddr_t bn;
594 	int blsize;
595 #ifdef _KERNEL
596 	int async = ddep->de_pmp->pm_mountp->mnt_flag & MNT_ASYNC;
597 #else
598 #define async 0
599 #endif
600 
601 #ifdef MSDOSFS_DEBUG
602 	printf("createde(dep %p, ddep %p, depp %p, cnp %p)\n",
603 	    dep, ddep, depp, cnp);
604 #endif
605 
606 	/*
607 	 * If no space left in the directory then allocate another cluster
608 	 * and chain it onto the end of the file.  There is one exception
609 	 * to this.  That is, if the root directory has no more space it
610 	 * can NOT be expanded.  extendfile() checks for and fails attempts
611 	 * to extend the root directory.  We just return an error in that
612 	 * case.
613 	 */
614 	if (ddep->de_fndoffset >= ddep->de_FileSize) {
615 		u_long needlen = ddep->de_fndoffset + sizeof(struct direntry)
616 		    - ddep->de_FileSize;
617 		dirclust = de_clcount(pmp, needlen);
618 		if ((error = extendfile(ddep, dirclust, 0, 0, DE_CLEAR)) != 0) {
619 			(void)detrunc(ddep, ddep->de_FileSize, 0, NOCRED);
620 			goto err_norollback;
621 		}
622 
623 		/*
624 		 * Update the size of the directory
625 		 */
626 		ddep->de_FileSize += de_cn2off(pmp, dirclust);
627 	}
628 
629 	/*
630 	 * We just read in the cluster with space.  Copy the new directory
631 	 * entry in.  Then write it to disk. NOTE:  DOS directories
632 	 * do not get smaller as clusters are emptied.
633 	 */
634 	error = pcbmap(ddep, de_cluster(pmp, ddep->de_fndoffset),
635 		       &bn, &dirclust, &blsize);
636 	if (error)
637 		goto err_norollback;
    	/*
    	 * Outside the root directory the offset is reduced to an offset
    	 * within the cluster; for the root it is left as is.
    	 */
638 	clusoffset = ddep->de_fndoffset;
639 	if (dirclust != MSDOSFSROOT)
640 		clusoffset &= pmp->pm_crbomask;
641 	if ((error = bread(pmp->pm_devvp, de_bn2kb(pmp, bn), blsize, NOCRED,
642 	    B_MODIFY, &bp)) != 0) {
643 		goto err_norollback;
644 	}
645 	ndep = bptoep(pmp, bp, clusoffset);
646 
647 	DE_EXTERNALIZE(ndep, dep);
648 
649 	/*
650 	 * Now write the Win95 long name
    	 *
    	 * The long-name slots are written at successively lower offsets,
    	 * starting just below the DOS entry.  Whenever the current offset
    	 * sits on a cluster boundary, the current buffer is written out
    	 * and the block holding the previous slot is read in.
651 	 */
652 	if (ddep->de_fndcnt > 0) {
653 		u_int8_t chksum = winChksum(ndep->deName);
654 		const u_char *un = (const u_char *)cnp->cn_nameptr;
655 		int unlen = cnp->cn_namelen;
656 		u_long xhavecnt;
657 
658 		fndoffset = ddep->de_fndoffset;
659 		xhavecnt = ddep->de_fndcnt + 1;
660 
661 		for(; wcnt < xhavecnt; wcnt++) {
662 			if ((fndoffset & pmp->pm_crbomask) == 0) {
663 				/* we should never get here if ddep is root
664 				 * directory */
665 
666 				if (async)
667 					(void) bdwrite(bp);
668 				else if ((error = bwrite(bp)) != 0)
669 					goto rollback;
670 
671 				fndoffset -= sizeof(struct direntry);
672 				error = pcbmap(ddep,
673 					       de_cluster(pmp, fndoffset),
674 					       &bn, 0, &blsize);
675 				if (error)
676 					goto rollback;
677 
678 				error = bread(pmp->pm_devvp, de_bn2kb(pmp, bn),
679 				    blsize, NOCRED, B_MODIFY, &bp);
680 				if (error) {
681 					goto rollback;
682 				}
683 				ndep = bptoep(pmp, bp,
684 						fndoffset & pmp->pm_crbomask);
685 			} else {
686 				ndep--;
687 				fndoffset -= sizeof(struct direntry);
688 			}
689 			if (!unix2winfn(un, unlen, (struct winentry *)ndep,
690 						wcnt, chksum))
691 				break;
692 		}
693 	}
694 
695 	if (async)
696 		bdwrite(bp);
697 	else if ((error = bwrite(bp)) != 0)
698 		goto rollback;
699 
700 	/*
701 	 * If they want us to return with the denode gotten.
    	 *
    	 * A directory is looked up by its own start cluster (with the
    	 * FAT32 root mapped to MSDOSFSROOT / MSDOSFSROOT_OFS); anything
    	 * else by the cluster and offset of the entry just written.
702 	 */
703 	if (depp) {
704 		u_long diroffset = clusoffset;
705 		if (dep->de_Attributes & ATTR_DIRECTORY) {
706 			dirclust = dep->de_StartCluster;
707 			if (FAT32(pmp) && dirclust == pmp->pm_rootdirblk)
708 				dirclust = MSDOSFSROOT;
709 			if (dirclust == MSDOSFSROOT)
710 				diroffset = MSDOSFSROOT_OFS;
711 			else
712 				diroffset = 0;
713 		}
714 		return deget(pmp, dirclust, diroffset, depp);
715 	}
716 
717 	return 0;
718 
719     rollback:
720 	/*
721 	 * Mark all slots modified so far as deleted. Note that we
722 	 * can't just call removede(), since directory is not in
723 	 * consistent state.
    	 *
    	 * Errors hit while rolling back are kept in rberror so that the
    	 * error which triggered the rollback is the one returned.
724 	 */
725 	fndoffset = ddep->de_fndoffset;
726 	rberror = pcbmap(ddep, de_cluster(pmp, fndoffset),
727 	       &bn, NULL, &blsize);
728 	if (rberror)
729 		goto err_norollback;
730 	if ((rberror = bread(pmp->pm_devvp, de_bn2kb(pmp, bn), blsize, NOCRED,
731 	    B_MODIFY, &bp)) != 0) {
732 		goto err_norollback;
733 	}
734 	ndep = bptoep(pmp, bp, clusoffset);
735 
736 	havecnt = ddep->de_fndcnt + 1;
737 	for(i = wcnt; i <= havecnt; i++) {
738 		/* mark entry as deleted */
739 		ndep->deName[0] = SLOT_DELETED;
740 
741 		if ((fndoffset & pmp->pm_crbomask) == 0) {
742 			/* we should never get here if ddep is root
743 			 * directory */
744 
745 			if (async)
746 				bdwrite(bp);
747 			else if ((rberror = bwrite(bp)) != 0)
748 				goto err_norollback;
749 
750 			fndoffset -= sizeof(struct direntry);
751 			rberror = pcbmap(ddep,
752 				       de_cluster(pmp, fndoffset),
753 				       &bn, 0, &blsize);
754 			if (rberror)
755 				goto err_norollback;
756 
757 			rberror = bread(pmp->pm_devvp, de_bn2kb(pmp, bn),
758 			    blsize, NOCRED, B_MODIFY, &bp);
759 			if (rberror) {
760 				goto err_norollback;
761 			}
762 			ndep = bptoep(pmp, bp, fndoffset);
763 		} else {
764 			ndep--;
765 			fndoffset -= sizeof(struct direntry);
766 		}
767 	}
768 
769 	/* ignore any further error */
770 	if (async)
771 		(void) bdwrite(bp);
772 	else
773 		(void) bwrite(bp);
774 
775     err_norollback:
776 	return error;
777 }
778 
779 /*
780  * Be sure a directory is empty except for "." and "..". Return 1 if empty,
781  * return 0 if not empty or error.
782  */
783 int
784 dosdirempty(struct denode *dep)
785 {
786 	int blsize;
787 	int error;
788 	u_long cn;
789 	daddr_t bn;
790 	struct buf *bp;
791 	struct msdosfsmount *pmp = dep->de_pmp;
792 	struct direntry *dentp;
793 
794 	/*
795 	 * Since the filesize field in directory entries for a directory is
796 	 * zero, we just have to feel our way through the directory until
797 	 * we hit end of file.
798 	 */
799 	for (cn = 0;; cn++) {
800 		if ((error = pcbmap(dep, cn, &bn, 0, &blsize)) != 0) {
801 			if (error == E2BIG)
802 				return (1);	/* it's empty */
803 			return (0);
804 		}
805 		error = bread(pmp->pm_devvp, de_bn2kb(pmp, bn), blsize, NOCRED,
806 		    0, &bp);
807 		if (error) {
808 			return (0);
809 		}
810 		for (dentp = (struct direntry *)bp->b_data;
811 		     (char *)dentp < (char *)bp->b_data + blsize;
812 		     dentp++) {
813 			if (dentp->deName[0] != SLOT_DELETED &&
814 			    (dentp->deAttributes & ATTR_VOLUME) == 0) {
815 				/*
816 				 * In dos directories an entry whose name
817 				 * starts with SLOT_EMPTY (0) starts the
818 				 * beginning of the unused part of the
819 				 * directory, so we can just return that it
820 				 * is empty.
821 				 */
822 				if (dentp->deName[0] == SLOT_EMPTY) {
823 					brelse(bp, 0);
824 					return (1);
825 				}
826 				/*
827 				 * Any names other than "." and ".." in a
828 				 * directory mean it is not empty.
829 				 */
830 				if (memcmp(dentp->deName, ".          ", 11) &&
831 				    memcmp(dentp->deName, "..         ", 11)) {
832 					brelse(bp, 0);
833 #ifdef MSDOSFS_DEBUG
834 					printf("dosdirempty(): found %.11s, %d, %d\n",
835 					    dentp->deName, dentp->deName[0],
836 						dentp->deName[1]);
837 #endif
838 					return (0);	/* not empty */
839 				}
840 			}
841 		}
842 		brelse(bp, 0);
843 	}
844 	/* NOTREACHED */
845 }
846 
847 /*
848  * Check to see if the directory described by target is in some
849  * subdirectory of source.  This prevents something like the following from
850  * succeeding and leaving a bunch or files and directories orphaned. mv
851  * /a/b/c /a/b/c/d/e/f Where c and f are directories.
852  *
853  * source - the inode for /a/b/c
854  * target - the inode for /a/b/c/d/e/f
855  *
856  * Returns 0 if target is NOT a subdirectory of source.
857  * Otherwise returns a non-zero error number.
858  * The target inode is always unlocked on return.
859  */
860 int
861 doscheckpath(struct denode *source, struct denode *target)
862 {
863 	u_long scn;
864 	struct msdosfsmount *pmp;
865 	struct direntry *ep;
866 	struct denode *dep;
867 	struct buf *bp = NULL;
868 	int error = 0;
869 
870 	dep = target;
871 	if ((target->de_Attributes & ATTR_DIRECTORY) == 0 ||
872 	    (source->de_Attributes & ATTR_DIRECTORY) == 0) {
873 		error = ENOTDIR;
874 		goto out;
875 	}
876 	if (dep->de_StartCluster == source->de_StartCluster) {
877 		error = EEXIST;
878 		goto out;
879 	}
880 	if (dep->de_StartCluster == MSDOSFSROOT)
881 		goto out;
882 	pmp = dep->de_pmp;
883 #ifdef	DIAGNOSTIC
884 	if (pmp != source->de_pmp)
885 		panic("doscheckpath: source and target on different filesystems");
886 #endif
887 	if (FAT32(pmp) && dep->de_StartCluster == pmp->pm_rootdirblk)
888 		goto out;
889 
890 	for (;;) {
891 		if ((dep->de_Attributes & ATTR_DIRECTORY) == 0) {
892 			error = ENOTDIR;
893 			break;
894 		}
895 		scn = dep->de_StartCluster;
896 		error = bread(pmp->pm_devvp, de_bn2kb(pmp, cntobn(pmp, scn)),
897 			      pmp->pm_bpcluster, NOCRED, 0, &bp);
898 		if (error)
899 			break;
900 
901 		ep = (struct direntry *) bp->b_data + 1;
902 		if ((ep->deAttributes & ATTR_DIRECTORY) == 0 ||
903 		    memcmp(ep->deName, "..         ", 11) != 0) {
904 			error = ENOTDIR;
905 			break;
906 		}
907 		scn = getushort(ep->deStartCluster);
908 		if (FAT32(pmp))
909 			scn |= getushort(ep->deHighClust) << 16;
910 
911 		if (scn == source->de_StartCluster) {
912 			error = EINVAL;
913 			break;
914 		}
915 		if (scn == MSDOSFSROOT)
916 			break;
917 		if (FAT32(pmp) && scn == pmp->pm_rootdirblk) {
918 			/*
919 			 * scn should be 0 in this case,
920 			 * but we silently ignore the error.
921 			 */
922 			break;
923 		}
924 
925 		vput(DETOV(dep));
926 		brelse(bp, 0);
927 		bp = NULL;
928 		/* NOTE: deget() clears dep on error */
929 		if ((error = deget(pmp, scn, 0, &dep)) != 0)
930 			break;
931 	}
932 out:
933 	if (bp)
934 		brelse(bp, 0);
935 	if (error == ENOTDIR)
936 		printf("doscheckpath(): .. not a directory?\n");
937 	if (dep != NULL)
938 		vput(DETOV(dep));
939 	return (error);
940 }
941 
942 /*
943  * Read in the disk block containing the directory entry (dirclu, dirofs)
944  * and return the address of the buf header, and the address of the
945  * directory entry within the block.
946  */
947 int
948 readep(struct msdosfsmount *pmp, u_long dirclust, u_long diroffset, struct buf **bpp, struct direntry **epp)
949 {
950 	int error;
951 	daddr_t bn;
952 	int blsize;
953 
954 	blsize = pmp->pm_bpcluster;
955 	if (dirclust == MSDOSFSROOT
956 	    && de_blk(pmp, diroffset + blsize) > pmp->pm_rootdirsize)
957 		blsize = de_bn2off(pmp, pmp->pm_rootdirsize) & pmp->pm_crbomask;
958 	bn = detobn(pmp, dirclust, diroffset);
959 	if ((error = bread(pmp->pm_devvp, de_bn2kb(pmp, bn), blsize, NOCRED,
960 	    0, bpp)) != 0) {
961 		*bpp = NULL;
962 		return (error);
963 	}
964 	if (epp)
965 		*epp = bptoep(pmp, *bpp, diroffset);
966 	return (0);
967 }
968 
969 /*
970  * Read in the disk block containing the directory entry dep came from and
971  * return the address of the buf header, and the address of the directory
972  * entry within the block.
973  */
974 int
975 readde(struct denode *dep, struct buf **bpp, struct direntry **epp)
976 {
977 	return (readep(dep->de_pmp, dep->de_dirclust, dep->de_diroffset,
978 			bpp, epp));
979 }
980 
981 /*
982  * Remove a directory entry. At this point the file represented by the
983  * directory entry to be removed is still full length until no one has it
984  * open.  When the file is no longer being used msdosfs_inactive() is called
985  * and will truncate the file to 0 length.  When the vnode containing the
986  * denode is needed for some other purpose by VFS it will call
987  * msdosfs_reclaim() which will remove the denode from the denode cache.
     *
     * The entry at pdep->de_fndoffset is marked SLOT_DELETED.  Unless the
     * mount has MSDOSFSMNT_NOWIN95 set, the run of ATTR_WIN95 entries
     * directly in front of it is marked SLOT_DELETED as well; the run is
     * followed backwards across boundaries where (offset & pm_crbomask) is
     * zero, down to offset 0.  dep->de_refcnt is decremented before any
     * I/O is attempted.
     *
     * Returns 0 on success, otherwise the error from pcbmap(), bread() or
     * bwrite().
988  */
989 int
990 removede(struct denode *pdep, struct denode *dep)
991 	/* pdep:	 directory where the entry is removed */
992 	/* dep:	 file to be removed */
993 {
994 	int error;
995 	struct direntry *ep;
996 	struct buf *bp;
997 	daddr_t bn;
998 	int blsize;
999 	struct msdosfsmount *pmp = pdep->de_pmp;
1000 	u_long offset = pdep->de_fndoffset;
     	/*
     	 * In the kernel, async reflects the MNT_ASYNC mount flag and selects
     	 * bdwrite() over bwrite() below.  Outside the kernel it is the
     	 * constant 0, so bwrite() is always used.
     	 */
1001 #ifdef _KERNEL
1002 	int async = pdep->de_pmp->pm_mountp->mnt_flag & MNT_ASYNC;
1003 #else
1004 #define async 0
1005 #endif
1006 
1007 #ifdef MSDOSFS_DEBUG
1008 	printf("removede(): filename %s, dep %p, offset %08lx\n",
1009 	    dep->de_Name, dep, offset);
1010 #endif
1011 
1012 	dep->de_refcnt--;
     	/*
     	 * Pre-increment so that the decrement at the top of the loop lands
     	 * on de_fndoffset for the first pass and on the entry just before
     	 * the current block for every later pass.
     	 */
1013 	offset += sizeof(struct direntry);
1014 	do {
1015 		offset -= sizeof(struct direntry);
1016 		error = pcbmap(pdep, de_cluster(pmp, offset), &bn, 0, &blsize);
1017 		if (error)
1018 			return error;
1019 		error = bread(pmp->pm_devvp, de_bn2kb(pmp, bn), blsize, NOCRED,
1020 		    B_MODIFY, &bp);
     		/*
     		 * NOTE(review): bp is not released on this path; presumably
     		 * bread() leaves nothing to release on failure -- confirm.
     		 */
1021 		if (error) {
1022 			return error;
1023 		}
1024 		ep = bptoep(pmp, bp, offset);
1025 		/*
1026 		 * Check whether, if we came here the second time, i.e.
1027 		 * when underflowing into the previous block, the last
1028 		 * entry in this block is a longfilename entry, too.
      		 * If it is not, nothing in this block is modified: release
      		 * the buffer and stop.  On the first pass offset equals
      		 * de_fndoffset, so this test never fires.
1029 		 */
1030 		if (ep->deAttributes != ATTR_WIN95
1031 		    && offset != pdep->de_fndoffset) {
1032 			brelse(bp, 0);
1033 			break;
1034 		}
     		/* Same pre-increment trick as above, for the inner loop. */
1035 		offset += sizeof(struct direntry);
1036 		while (1) {
1037 			/*
1038 			 * We are a bit aggressive here in that we delete any Win95
1039 			 * entries preceding this entry, not just the ones we "own".
1040 			 * Since these presumably aren't valid anyway,
1041 			 * there should be no harm.
      			 *
      			 * The statement below marks the entry ep points at
      			 * and then steps ep back to the preceding entry.  The
      			 * tests are ordered so that the stepped-back ep is
      			 * only dereferenced when (offset & pm_crbomask) is
      			 * non-zero, i.e. when the entry just marked was not
      			 * at a boundary of the mask.
1042 			 */
1043 			offset -= sizeof(struct direntry);
1044 			ep--->deName[0] = SLOT_DELETED;
1045 			if ((pmp->pm_flags & MSDOSFSMNT_NOWIN95)
1046 			    || !(offset & pmp->pm_crbomask)
1047 			    || ep->deAttributes != ATTR_WIN95)
1048 				break;
1049 		}
     		/* Write the modified block back; only bwrite() reports an error. */
1050 		if (async)
1051 			bdwrite(bp);
1052 		else if ((error = bwrite(bp)) != 0)
1053 			return error;
     	/*
     	 * Go round again only if Win95 handling is enabled and the inner
     	 * loop stopped on a pm_crbomask boundary other than offset 0; the
     	 * run may then continue in the preceding block.
     	 */
1054 	} while (!(pmp->pm_flags & MSDOSFSMNT_NOWIN95)
1055 	    && !(offset & pmp->pm_crbomask)
1056 	    && offset);
1057 	return 0;
1058 }
1059 
1060 /*
1061  * Create a unique DOS name in dvp
      *
      * Candidate names are produced by unix2dosfn() from the component name
      * in cnp, using generation numbers 1, 2, 3, ...  For each candidate
      * the directory dep is scanned; the first candidate that matches no
      * scanned entry is accepted.
      *
      * dep:	directory to search
      * cnp:	component name; cn_nameptr and cn_namelen are used
      * cp:	buffer handed to unix2dosfn() and compared (11 bytes) against
      *		each entry's deName; presumably receives the generated
      *		name -- confirm against unix2dosfn()
      *
      * Returns 0 when the candidate currently in cp was not found, EINVAL
      * when unix2dosfn() fails for generation 1, EEXIST when it fails for a
      * later generation, or the error from pcbmap() (other than E2BIG) or
      * bread().
1062  */
1063 int
1064 uniqdosname(struct denode *dep, struct componentname *cnp, u_char *cp)
1065 {
1066 	struct msdosfsmount *pmp = dep->de_pmp;
1067 	struct direntry *dentp;
1068 	int gen;
1069 	int blsize;
1070 	u_long cn;
1071 	daddr_t bn;
1072 	struct buf *bp;
1073 	int error;
1074 
1075 	for (gen = 1;; gen++) {
1076 		/*
1077 		 * Generate DOS name with generation number
1078 		 */
1079 		if (!unix2dosfn((const u_char *)cnp->cn_nameptr, cp,
1080 		    cnp->cn_namelen, gen))
1081 			return gen == 1 ? EINVAL : EEXIST;
1082 
1083 		/*
1084 		 * Now look for a dir entry with this exact name
      		 *
      		 * cn is the index handed to pcbmap() (presumably the
      		 * directory-relative cluster number).  A match sets error
      		 * to EEXIST, which ends this loop without returning and
      		 * lets the outer loop try the next generation number.
1085 		 */
1086 		for (cn = error = 0; !error; cn++) {
1087 			if ((error = pcbmap(dep, cn, &bn, 0, &blsize)) != 0) {
1088 				if (error == E2BIG)	/* EOF reached and not found */
1089 					return 0;
1090 				return error;
1091 			}
1092 			error = bread(pmp->pm_devvp, de_bn2kb(pmp, bn), blsize,
1093 			    NOCRED, 0, &bp);
      			/*
      			 * NOTE(review): bp is not released on this path;
      			 * presumably bread() leaves nothing to release on
      			 * failure -- confirm.
      			 */
1094 			if (error) {
1095 				return error;
1096 			}
      			/* Walk every directory entry in the blsize bytes just read. */
1097 			for (dentp = (struct direntry *)bp->b_data;
1098 			     (char *)dentp < (char *)bp->b_data + blsize;
1099 			     dentp++) {
1100 				if (dentp->deName[0] == SLOT_EMPTY) {
1101 					/*
1102 					 * Last used entry and not found
1103 					 */
1104 					brelse(bp, 0);
1105 					return 0;
1106 				}
1107 				/*
1108 				 * Ignore volume labels and Win95 entries
      				 * (any entry with the ATTR_VOLUME bit set is
      				 * skipped; presumably ATTR_WIN95 includes
      				 * that bit -- confirm)
1109 				 */
1110 				if (dentp->deAttributes & ATTR_VOLUME)
1111 					continue;
1112 				if (!memcmp(dentp->deName, cp, 11)) {
1113 					error = EEXIST;
1114 					break;
1115 				}
1116 			}
1117 			brelse(bp, 0);
1118 		}
1119 	}
1120 }
1121 
1122 /*
1123  * Find any Win'95 long filename entry in directory dep
      *
      * Returns 1 as soon as an entry whose deAttributes equals ATTR_WIN95
      * is seen.  Otherwise returns 1 if the scan ended without seeing any
      * entry that is neither empty nor deleted, and 0 if at least one such
      * entry was seen.  The scan ends at the first SLOT_EMPTY entry, or
      * when pcbmap() or bread() returns non-zero.
1124  */
1125 int
1126 findwin95(struct denode *dep)
1127 {
1128 	struct msdosfsmount *pmp = dep->de_pmp;
1129 	struct direntry *dentp;
1130 	int blsize, win95;
1131 	u_long cn;
1132 	daddr_t bn;
1133 	struct buf *bp;
1134 
      	/* Stays 1 until a live entry that is not a Win'95 entry is seen. */
1135 	win95 = 1;
1136 	/*
1137 	 * Read through the directory looking for Win'95 entries
1138 	 * XXX Note: Error currently handled just as EOF
1139 	 */
1140 	for (cn = 0;; cn++) {
1141 		if (pcbmap(dep, cn, &bn, 0, &blsize))
1142 			return win95;
1143 		if (bread(pmp->pm_devvp, de_bn2kb(pmp, bn), blsize, NOCRED,
1144 		    0, &bp)) {
1145 			return win95;
1146 		}
      		/* Walk every directory entry in the blsize bytes just read. */
1147 		for (dentp = (struct direntry *)bp->b_data;
1148 		     (char *)dentp < (char *)bp->b_data + blsize;
1149 		     dentp++) {
1150 			if (dentp->deName[0] == SLOT_EMPTY) {
1151 				/*
1152 				 * Last used entry and not found
1153 				 */
1154 				brelse(bp, 0);
1155 				return win95;
1156 			}
1157 			if (dentp->deName[0] == SLOT_DELETED) {
1158 				/*
1159 				 * Ignore deleted files
1160 				 * Note: might be an indication of Win'95
1161 				 * anyway	XXX
1162 				 */
1163 				continue;
1164 			}
1165 			if (dentp->deAttributes == ATTR_WIN95) {
1166 				brelse(bp, 0);
1167 				return 1;
1168 			}
      			/* A live entry that is not a Win'95 entry. */
1169 			win95 = 0;
1170 		}
1171 		brelse(bp, 0);
1172 	}
1173 }
1174