xref: /titanic_50/usr/src/uts/common/fs/udfs/udf_dir.c (revision 53089ab7c84db6fb76c16ca50076c147cda11757)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 /*
22  * Copyright (c) 1998, 2010, Oracle and/or its affiliates. All rights reserved.
23  */
24 
25 #include <sys/types.h>
26 #include <sys/t_lock.h>
27 #include <sys/param.h>
28 #include <sys/time.h>
29 #include <sys/systm.h>
30 #include <sys/sysmacros.h>
31 #include <sys/resource.h>
32 #include <sys/signal.h>
33 #include <sys/cred.h>
34 #include <sys/user.h>
35 #include <sys/buf.h>
36 #include <sys/vfs.h>
37 #include <sys/stat.h>
38 #include <sys/vnode.h>
39 #include <sys/mode.h>
40 #include <sys/proc.h>
41 #include <sys/disp.h>
42 #include <sys/file.h>
43 #include <sys/fcntl.h>
44 #include <sys/flock.h>
45 #include <sys/kmem.h>
46 #include <sys/uio.h>
47 #include <sys/dnlc.h>
48 #include <sys/conf.h>
49 #include <sys/errno.h>
50 #include <sys/mman.h>
51 #include <sys/fbuf.h>
52 #include <sys/pathname.h>
53 #include <sys/debug.h>
54 #include <sys/vmsystm.h>
55 #include <sys/cmn_err.h>
56 #include <sys/dirent.h>
57 #include <sys/errno.h>
58 #include <sys/modctl.h>
59 #include <sys/statvfs.h>
60 #include <sys/mount.h>
61 #include <sys/sunddi.h>
62 #include <sys/bootconf.h>
63 #include <sys/policy.h>
64 
65 #include <vm/hat.h>
66 #include <vm/page.h>
67 #include <vm/pvn.h>
68 #include <vm/as.h>
69 #include <vm/seg.h>
70 #include <vm/seg_map.h>
71 #include <vm/seg_kmem.h>
72 #include <vm/seg_vn.h>
73 #include <vm/rm.h>
74 #include <vm/page.h>
75 #include <sys/swap.h>
76 
77 
78 #include <fs/fs_subr.h>
79 
80 
81 #include <sys/fs/udf_volume.h>
82 #include <sys/fs/udf_inode.h>
83 
84 
/*
 * Describes a position inside a directory: either the entry a scan
 * located, or the place where a new entry may be written.  It is filled
 * in by ud_dircheckforname() and handed on to the routines that add,
 * rename or delete the entry.
 */
struct slot {
	/*
	 * Outcome of the scan.  In the code visible in this file NONE is
	 * the initial state, FOUND marks a reusable (deleted) entry and
	 * EXIST marks a live entry with the requested name.
	 */
	enum {
		NONE,
		COMPACT,
		FOUND,
		EXIST
	} status;

	/* directory offset of the area described by this slot */
	off_t offset;

	/* number of bytes available at "offset" */
	int size;

	/* directory buffer in which the slot lives */
	struct fbuf *fbp;

	/* the slot itself (a file identifier inside the buffer) */
	struct file_id *ep;

	/* last useful location found during the search */
	off_t endoff;
};
93 
94 
95 int32_t ud_dircheckforname(struct ud_inode *, char *, int,
96 		struct slot *, struct ud_inode **, uint8_t *, struct cred *);
97 int32_t ud_dirempty(struct ud_inode *, uint64_t, struct cred *);
98 int32_t str2cmp(char *, int32_t, char *, int32_t, char *, int32_t);
99 int32_t ud_dircheckpath(int32_t, struct ud_inode *, struct cred *);
100 int32_t ud_dirmakeinode(struct ud_inode *, struct ud_inode **,
101 	struct vattr *, enum de_op, struct cred *);
102 int32_t ud_diraddentry(struct ud_inode *, char *,
103 	enum de_op, int, struct slot *, struct ud_inode *,
104 	struct ud_inode *, struct cred *);
105 int32_t ud_dirmakedirect(struct ud_inode *, struct ud_inode *, struct cred *);
106 int32_t ud_dirrename(struct ud_inode *, struct ud_inode *,
107 	struct ud_inode *, struct ud_inode *, char *, uint8_t *,
108 	struct slot *, struct cred *);
109 int32_t ud_dirprepareentry(struct ud_inode *,
110 	struct slot *, uint8_t *, struct cred *);
111 int32_t ud_dirfixdotdot(struct ud_inode *, struct ud_inode *,
112 		struct ud_inode *);
113 int32_t ud_write_fid(struct ud_inode *, struct slot *, uint8_t *);
114 
115 int
116 ud_dirlook(struct ud_inode *dip,
117 	char *namep, struct ud_inode **ipp, struct cred *cr, int32_t skipdnlc)
118 {
119 	struct udf_vfs *udf_vfsp;
120 	int32_t error = 0, namelen, adhoc_search;
121 	u_offset_t offset, adhoc_offset, dirsize, end;
122 	struct vnode *dvp, *vp;
123 	struct fbuf *fbp;
124 	struct file_id *fid;
125 	uint8_t *fname, dummy[3];
126 	int32_t id_len, doingchk;
127 	uint32_t old_loc;
128 	uint16_t old_prn;
129 
130 	uint8_t *dname;
131 	uint8_t *buf = NULL;
132 
133 	ud_printf("ud_dirlook\n");
134 
135 	udf_vfsp = dip->i_udf;
136 
137 restart:
138 	doingchk = 0;
139 	old_prn = 0xFFFF;
140 	old_loc = 0;
141 	dvp = ITOV(dip);
142 	/*
143 	 * Check accessibility of directory.
144 	 */
145 	if (dip->i_type != VDIR) {
146 		return (ENOTDIR);
147 	}
148 	if (error = ud_iaccess(dip, IEXEC, cr, 1)) {
149 		return (error);
150 	}
151 
152 	/*
153 	 * Null component name is synonym for directory being searched.
154 	 */
155 	if (*namep == '\0') {
156 		VN_HOLD(dvp);
157 		*ipp = dip;
158 		return (0);
159 	}
160 	namelen = strlen(namep);
161 	if ((namelen == 1) &&
162 	    (namep[0] == '.') && (namep[1] == '\0')) {
163 		/* Current directory */
164 		VN_HOLD(dvp);
165 		*ipp = dip;
166 		dnlc_enter(dvp, namep, ITOV(*ipp));
167 		return (0);
168 	}
169 
170 	if ((!skipdnlc) && (vp = dnlc_lookup(dvp, namep))) {
171 		/* vp is already held from dnlc_lookup */
172 
173 		*ipp = VTOI(vp);
174 		return (0);
175 	}
176 
177 	dname = kmem_zalloc(1024, KM_SLEEP);
178 	buf = kmem_zalloc(udf_vfsp->udf_lbsize, KM_SLEEP);
179 
180 	/*
181 	 * Read lock the inode we are searching.  You will notice that we
182 	 * didn't hold the read lock while searching the dnlc.  This means
183 	 * that the entry could now be in the dnlc.  This doesn't cause any
184 	 * problems because dnlc_enter won't add an entry if it is already
185 	 * there.
186 	 */
187 	rw_enter(&dip->i_rwlock, RW_READER);
188 
189 	/*
190 	 * Take care to look at dip->i_diroff only once, as it
191 	 * may be changing due to other threads/cpus.
192 	 */
193 
194 recheck:
195 	offset = dip->i_diroff;
196 	end = dirsize = dip->i_size;
197 
198 	if (offset > dirsize) {
199 		offset = 0;
200 	}
201 	adhoc_offset = offset;
202 	adhoc_search = (offset == 0) ? 1 : 2;
203 
204 	fbp = NULL;
205 
206 	while (adhoc_search--) {
207 		while (offset < end) {
208 			error = ud_get_next_fid(dip, &fbp,
209 			    offset, &fid, &fname, buf);
210 			if (error != 0) {
211 				break;
212 			}
213 			if ((fid->fid_flags & FID_DELETED) == 0) {
214 				if (fid->fid_flags & FID_PARENT) {
215 					id_len = 2;
216 					fname = dummy;
217 					dummy[0] = '.';
218 					dummy[1] = '.';
219 					dummy[2] = '\0';
220 				} else {
221 					if ((error = ud_uncompress(
222 					    fid->fid_idlen, &id_len,
223 					    fname, dname)) != 0) {
224 						break;
225 					}
226 					fname = (uint8_t *)dname;
227 					fname[id_len] = '\0';
228 				}
229 				if ((namelen == id_len) &&
230 				    (strncmp(namep, (caddr_t)fname,
231 				    namelen) == 0)) {
232 					uint32_t loc;
233 					uint16_t prn;
234 
235 
236 					loc = SWAP_32(fid->fid_icb.lad_ext_loc);
237 					prn = SWAP_16(fid->fid_icb.lad_ext_prn);
238 					dip->i_diroff = offset + FID_LEN(fid);
239 
240 					if (doingchk) {
241 						if ((loc == old_loc) &&
242 						    (prn == old_prn)) {
243 							goto checkok;
244 						} else {
245 							if (fbp != NULL) {
246 								fbrelse(fbp,
247 								    S_READ);
248 								fbp = NULL;
249 							}
250 							VN_RELE(ITOV(*ipp));
251 							rw_exit(&dip->i_rwlock);
252 							goto restart;
253 						}
254 						/* NOTREACHED */
255 					}
256 
257 					if (namelen == 2 &&
258 					    fname[0] == '.' &&
259 					    fname[1] == '.') {
260 
261 						struct timespec32 omtime;
262 
263 						omtime = dip->i_mtime;
264 						rw_exit(&dip->i_rwlock);
265 
266 						error = ud_iget(dip->i_vfs, prn,
267 						    loc, ipp, NULL, cr);
268 
269 						rw_enter(&dip->i_rwlock,
270 						    RW_READER);
271 
272 						if (error) {
273 							goto done;
274 						}
275 
276 						if ((omtime.tv_sec !=
277 						    dip->i_mtime.tv_sec) ||
278 						    (omtime.tv_nsec !=
279 						    dip->i_mtime.tv_nsec)) {
280 
281 							doingchk = 1;
282 							old_prn = prn;
283 							old_loc = loc;
284 							dip->i_diroff = 0;
285 							if (fbp != NULL) {
286 								fbrelse(fbp,
287 								    S_READ);
288 								fbp = NULL;
289 							}
290 							goto recheck;
291 						}
292 					} else {
293 
294 						error = ud_iget(dip->i_vfs, prn,
295 						    loc, ipp, NULL, cr);
296 					}
297 checkok:
298 					if (error == 0) {
299 						dnlc_enter(dvp, namep,
300 						    ITOV(*ipp));
301 					}
302 					goto done;
303 				}
304 			}
305 			offset += FID_LEN(fid);
306 		}
307 		if (fbp != NULL) {
308 			fbrelse(fbp, S_READ);
309 			fbp = NULL;
310 		}
311 		end = adhoc_offset;
312 		offset = 0;
313 	}
314 	error = ENOENT;
315 done:
316 	kmem_free(buf, udf_vfsp->udf_lbsize);
317 	kmem_free(dname, 1024);
318 	if (fbp != NULL) {
319 		fbrelse(fbp, S_READ);
320 	}
321 	rw_exit(&dip->i_rwlock);
322 	return (error);
323 }
324 
/*
 * Enter the name "namep" in the directory "tdp".  What is entered
 * depends on "op":
 *
 *	DE_CREATE, DE_MKDIR	a new inode is made from "vap" and entered
 *	DE_LINK			the existing inode "sip" is entered
 *	DE_RENAME		"sip" (currently in directory "sdp") is
 *				entered, replacing an existing target
 *				through ud_dirrename() if there is one
 *
 * The caller must hold tdp->i_rwlock as writer.  "ipp", when not NULL,
 * receives the resulting inode; for DE_CREATE/DE_MKDIR on a name that
 * already exists it receives the existing inode and EEXIST is returned.
 * "ctp" is only passed through to the vnevent calls made for a rename.
 *
 * Returns 0 or an errno value.  Among the values produced here are
 * EACCES (name contains '/'), EINVAL (empty name, rename to "." or
 * "..", rename of a directory onto itself), EEXIST, ENOENT, EMLINK and
 * ENOTDIR; errors of the helpers called are passed through.
 */
int
ud_direnter(
	struct ud_inode *tdp,
	char *namep,
	enum de_op op,
	struct ud_inode *sdp,
	struct ud_inode *sip,
	struct vattr *vap,
	struct ud_inode **ipp,
	struct cred *cr,
	caller_context_t *ctp)
{
	struct udf_vfs *udf_vfsp;
	struct ud_inode *tip;
	struct slot slot;
	int32_t namlen, err;
	char *s;

	uint8_t *buf = NULL;

	ud_printf("ud_direnter\n");

	udf_vfsp = tdp->i_udf;
	/* don't allow '/' characters in pathname component */
	for (s = namep, namlen = 0; *s; s++, namlen++) {
		if (*s == '/') {
			return (EACCES);
		}
	}

	if (namlen == 0) {
		cmn_err(CE_WARN, "name length == 0 in ud_direnter");
		return (EINVAL);
	}

	ASSERT(RW_WRITE_HELD(&tdp->i_rwlock));
	/*
	 * If name is "." or ".." then if this is a create look it up
	 * and return EEXIST.  Rename or link TO "." or ".." is forbidden.
	 */
	if (namep[0] == '.' &&
	    (namlen == 1 || (namlen == 2 && namep[1] == '.'))) {
		if (op == DE_RENAME) {
			return (EINVAL);	/* *SIGH* should be ENOTEMPTY */
		}
		if (ipp) {
			/*
			 * ud_dirlook will acquire the i_rwlock
			 */
			rw_exit(&tdp->i_rwlock);
			if (err = ud_dirlook(tdp, namep, ipp, cr, 0)) {
				/* re-take the lock the caller expects held */
				rw_enter(&tdp->i_rwlock, RW_WRITER);
				return (err);
			}
			rw_enter(&tdp->i_rwlock, RW_WRITER);
		}
		return (EEXIST);
	}

	/* start with an empty slot description and no target inode */
	tip = NULL;
	slot.status = NONE;
	slot.offset = 0;
	slot.size = 0;
	slot.fbp = NULL;
	slot.ep = NULL;
	slot.endoff = 0;

	/*
	 * For link and rename lock the source entry and check the link count
	 * to see if it has been removed while it was unlocked.  If not, we
	 * increment the link count and force the inode to disk to make sure
	 * that it is there before any directory entry that points to it.
	 */
	if (op == DE_LINK || op == DE_RENAME) {
		rw_enter(&sip->i_contents, RW_WRITER);
		if (sip->i_nlink == 0) {
			rw_exit(&sip->i_contents);
			return (ENOENT);
		}
		if (sip->i_nlink == MAXLINK) {
			rw_exit(&sip->i_contents);
			return (EMLINK);
		}

		sip->i_nlink++;
		mutex_enter(&sip->i_tlock);
		sip->i_flag |= ICHG;
		mutex_exit(&sip->i_tlock);
		ud_iupdat(sip, 1);
		rw_exit(&sip->i_contents);
	}
	/*
	 * From here on every failure leaves through "out" or "out2" so
	 * that the link count bumped above is taken back.
	 */
	/*
	 * If target directory has not been removed, then we can consider
	 * allowing file to be created.
	 */
	if (tdp->i_nlink == 0) {
		err = ENOENT;
		goto out2;
	}
	/*
	 * Check accessibility of directory.
	 */
	if (tdp->i_type != VDIR) {
		err = ENOTDIR;
		goto out2;
	}
	/*
	 * Execute access is required to search the directory.
	 */
	if (err = ud_iaccess(tdp, IEXEC, cr, 1)) {
		goto out2;
	}
	/*
	 * If this is a rename of a directory and the parent is
	 * different (".." must be changed), then the source
	 * directory must not be in the directory hierarchy
	 * above the target, as this would orphan everything
	 * below the source directory.  Also the user must have
	 * write permission in the source so as to be able to
	 * change "..".
	 */
	if (op == DE_RENAME) {
		if (sip == tdp) {
			err = EINVAL;
			goto out2;
		}
		rw_enter(&sip->i_contents, RW_READER);
		if ((sip->i_type == VDIR) && (sdp != tdp)) {
			uint32_t blkno;

			if ((err = ud_iaccess(sip, IWRITE, cr, 0))) {
				rw_exit(&sip->i_contents);
				goto out2;
			}
			/* sample the block number, then drop the lock */
			blkno = sip->i_icb_lbano;
			rw_exit(&sip->i_contents);
			if ((err = ud_dircheckpath(blkno, tdp, cr))) {
				goto out2;
			}
		} else {
			rw_exit(&sip->i_contents);
		}
	}

	/*
	 * Search for the entry. Return VN_HELD tip if found.
	 */
	buf = kmem_zalloc(udf_vfsp->udf_lbsize, KM_SLEEP);
	rw_enter(&tdp->i_contents, RW_WRITER);
	if (err = ud_dircheckforname(tdp,
	    namep, namlen, &slot, &tip, buf, cr)) {
		goto out;
	}
	if (tip) {
		/* the name already exists in the target directory */
		switch (op) {
			case DE_CREATE :
			case DE_MKDIR :
				if (ipp) {
					/* hand the held inode to the caller */
					*ipp = tip;
					err = EEXIST;
				} else {
					VN_RELE(ITOV(tip));
				}
				break;
			case DE_RENAME :
				err = ud_dirrename(sdp, sip, tdp, tip,
				    namep, buf, &slot, cr);
				/*
				 * We used to VN_RELE() here, but this
				 * was moved down so that we could send
				 * a vnevent after the locks were dropped.
				 */
				break;
			case DE_LINK :
				/*
				 * Can't link to an existing file.
				 */
				VN_RELE(ITOV(tip));
				err = EEXIST;
				break;
		}
	} else {
		/*
		 * The entry does not exist. Check write permission in
		 * directory to see if entry can be created.
		 */
		if (err = ud_iaccess(tdp, IWRITE, cr, 0)) {
			goto out;
		}
		if ((op == DE_CREATE) || (op == DE_MKDIR)) {
			/*
			 * Make new inode and directory entry as required.
			 */
			if (err = ud_dirmakeinode(tdp, &sip, vap, op, cr))
				goto out;
		}
		if (err = ud_diraddentry(tdp, namep, op,
		    namlen, &slot, sip, sdp, cr)) {
			if ((op == DE_CREATE) || (op == DE_MKDIR)) {
				/*
				 * Unmake the inode we just made.
				 */
				rw_enter(&sip->i_contents, RW_WRITER);
				if (sip->i_type == VDIR) {
					tdp->i_nlink--;
				}
				sip->i_nlink = 0;
				mutex_enter(&sip->i_tlock);
				sip->i_flag |= ICHG;
				mutex_exit(&sip->i_tlock);
				rw_exit(&sip->i_contents);
				VN_RELE(ITOV(sip));
				sip = NULL;
			}
		} else if (ipp) {
			*ipp = sip;
		} else if ((op == DE_CREATE) || (op == DE_MKDIR)) {
			/* nobody wants the new inode: drop our hold */
			VN_RELE(ITOV(sip));
		}
	}
out:
	/* reached with tdp->i_contents held as writer */
	if (buf != NULL) {
		kmem_free(buf, udf_vfsp->udf_lbsize);
	}
	if (slot.fbp) {
		fbrelse(slot.fbp, S_OTHER);
	}
	rw_exit(&tdp->i_contents);

	if (op == DE_RENAME) {
		/*
		 * If it's all good, send events after locks are dropped
		 * but before vnodes are released.
		 */
		if (err == 0) {
			if (tip) {
				vnevent_rename_dest(ITOV(tip), ITOV(tdp),
				    namep, ctp);
			}

			if (sdp != tdp) {
				vnevent_rename_dest_dir(ITOV(tdp), ctp);
			}
		}

		/*
		 * The following VN_RELE() was moved from the
		 * DE_RENAME case above
		 */
		if (tip) {
			VN_RELE(ITOV(tip));
		}
	}

out2:
	/* reached directly only before tdp->i_contents was taken */
	if (err && ((op == DE_LINK) || (op == DE_RENAME))) {
		/*
		 * Undo bumped link count.
		 */
		rw_enter(&sip->i_contents, RW_WRITER);
		sip->i_nlink--;
		rw_exit(&sip->i_contents);

		mutex_enter(&sip->i_tlock);
		sip->i_flag |= ICHG;
		mutex_exit(&sip->i_tlock);
	}
	return (err);
}
594 
595 /*
596  * Locking i_contents in this
597  * function seems to be really weird
598  */
599 int
600 ud_dirremove(
601 	struct ud_inode *dp,
602 	char *namep,
603 	struct ud_inode *oip,
604 	struct vnode *cdir,
605 	enum dr_op op,
606 	struct cred *cr,
607 	caller_context_t *ctp)
608 {
609 	struct udf_vfs *udf_vfsp;
610 	int32_t namelen, err = 0;
611 	struct slot slot;
612 	struct ud_inode *ip;
613 	mode_t mode;
614 	struct file_id *fid;
615 	uint8_t *buf = NULL;
616 	uint32_t tbno;
617 
618 	ud_printf("ud_dirremove\n");
619 
620 	ASSERT(RW_WRITE_HELD(&dp->i_rwlock));
621 
622 	udf_vfsp = dp->i_udf;
623 	namelen = (int)strlen(namep);
624 	if (namelen == 0) {
625 		cmn_err(CE_WARN, "name length == 0 in ud_dirremove");
626 		return (EINVAL);
627 	}
628 
629 	/*
630 	 * return err when removing . and ..
631 	 */
632 	if (namep[0] == '.') {
633 		if (namelen == 1) {
634 			return (EINVAL);
635 		} else if (namelen == 2 && namep[1] == '.') {
636 			return (EEXIST);	/* SIGH should be ENOTEMPTY */
637 		}
638 	}
639 
640 	ASSERT(RW_WRITE_HELD(&dp->i_rwlock));
641 
642 	/*
643 	 * Check accessibility of directory.
644 	 */
645 	if (dp->i_type != VDIR) {
646 		return (ENOTDIR);
647 	}
648 
649 	ip = NULL;
650 	slot.status = FOUND;	/* don't need to look for empty slot */
651 	slot.offset = 0;
652 	slot.size = 0;
653 	slot.fbp = NULL;
654 	slot.ep = NULL;
655 	slot.endoff = 0;
656 	/*
657 	 * Execute access is required to search the directory.
658 	 * Access for write is interpreted as allowing
659 	 * deletion of files in the directory.
660 	 */
661 	if (err = ud_iaccess(dp, IEXEC|IWRITE, cr, 1)) {
662 		return (err);
663 	}
664 
665 	buf = (uint8_t *)kmem_zalloc(udf_vfsp->udf_lbsize, KM_SLEEP);
666 
667 	rw_enter(&dp->i_contents, RW_WRITER);
668 
669 	if (err = ud_dircheckforname(dp, namep, namelen, &slot, &ip,
670 	    buf, cr)) {
671 		goto out_novfs;
672 	}
673 	if (ip == NULL) {
674 		err = ENOENT;
675 		goto out_novfs;
676 	}
677 	if (oip && oip != ip) {
678 		err = ENOENT;
679 		goto out_novfs;
680 	}
681 
682 	if ((mode = ip->i_type) == VDIR) {
683 		/*
684 		 * vn_vfswlock() prevents races between mount and rmdir.
685 		 */
686 		if (vn_vfswlock(ITOV(ip))) {
687 			err = EBUSY;
688 			goto out_novfs;
689 		}
690 		if (vn_mountedvfs(ITOV(ip)) != NULL && op != DR_RENAME) {
691 			err = EBUSY;
692 			goto out;
693 		}
694 		/*
695 		 * If we are removing a directory, get a lock on it.
696 		 * If the directory is empty, it will stay empty until
697 		 * we can remove it.
698 		 */
699 		rw_enter(&ip->i_rwlock, RW_READER);
700 	}
701 	/* We must be holding i_contents */
702 	rw_enter(&ip->i_contents, RW_READER);
703 
704 	if (err = ud_sticky_remove_access(dp, ip, cr)) {
705 		rw_exit(&ip->i_contents);
706 		if (mode == VDIR) {
707 			rw_exit(&ip->i_rwlock);
708 		}
709 		goto out;
710 	}
711 	if (op == DR_RMDIR) {
712 		/*
713 		 * For rmdir(2), some special checks are required.
714 		 * (a) Don't remove any alias of the parent (e.g. ".").
715 		 * (b) Don't remove the current directory.
716 		 * (c) Make sure the entry is (still) a directory.
717 		 * (d) Make sure the directory is empty.
718 		 */
719 
720 		if (dp == ip || ITOV(ip) == cdir) {
721 			err = EINVAL;
722 		} else if (ip->i_type != VDIR) {
723 			err = ENOTDIR;
724 		} else if ((ip->i_nlink != 1) ||
725 		    (!ud_dirempty(ip, dp->i_uniqid, cr))) {
726 			/*
727 			 * Directories do not have an
728 			 * entry for "." so only one link
729 			 * will be there
730 			 */
731 			err = EEXIST;	/* SIGH should be ENOTEMPTY */
732 		}
733 		if (err) {
734 			rw_exit(&ip->i_contents);
735 			if (mode == VDIR) {
736 				rw_exit(&ip->i_rwlock);
737 			}
738 			goto out;
739 		}
740 	} else if (op == DR_REMOVE)  {
741 		/*
742 		 * unlink(2) requires a different check: allow only
743 		 * privileged processes to unlink a directory.
744 		 */
745 		struct vnode *vp = ITOV(ip);
746 
747 		if (vp->v_type == VDIR &&
748 		    secpolicy_fs_linkdir(cr, vp->v_vfsp)) {
749 			err = EPERM;
750 			rw_exit(&ip->i_contents);
751 			rw_exit(&ip->i_rwlock);
752 			goto out;
753 		}
754 	}
755 	rw_exit(&ip->i_contents);
756 
757 	/*
758 	 * Remove the cache'd entry, if any.
759 	 */
760 	dnlc_remove(ITOV(dp), namep);
761 
762 	/*
763 	 * We can collapse all the directory
764 	 * entries that are deleted into one big entry
765 	 * but the better way is to
766 	 * defer it till next directory entry
767 	 * creation. where we can do this
768 	 * in a more efficient way
769 	 */
770 	fid = slot.ep;
771 
772 	/*
773 	 * If this is the last entry
774 	 * just truncate the file instead
775 	 * of marking it deleted
776 	 */
777 	if ((slot.offset + FID_LEN(fid)) == dp->i_size) {
778 		fbrelse(slot.fbp, S_OTHER);
779 		if ((err = ud_itrunc(dp, slot.offset, 0, cr)) != 0) {
780 			goto out;
781 		}
782 	} else {
783 		fid->fid_flags |= FID_DELETED;
784 
785 		if ((err = ud_ip_off2bno(dp, slot.offset, &tbno)) != 0) {
786 			goto out;
787 		}
788 
789 		ud_make_tag(dp->i_udf, &fid->fid_tag,
790 		    UD_FILE_ID_DESC, tbno, FID_LEN(fid));
791 
792 		err = ud_write_fid(dp, &slot, buf);
793 	}
794 
795 	slot.fbp = NULL;
796 
797 	/*
798 	 * If we were removing a directory, it is 'gone' now so we can
799 	 * unlock it.
800 	 */
801 	if (mode == VDIR) {
802 		rw_exit(&ip->i_rwlock);
803 	}
804 
805 	mutex_enter(&dp->i_tlock);
806 	dp->i_flag |= IUPD|ICHG;
807 	mutex_exit(&dp->i_tlock);
808 	mutex_enter(&ip->i_tlock);
809 	ip->i_flag |= ICHG;
810 	mutex_exit(&ip->i_tlock);
811 
812 	if (err != 0) {
813 		goto out;
814 	}
815 
816 	rw_enter(&ip->i_contents, RW_WRITER);
817 
818 	/*
819 	 * Now dispose of the inode.
820 	 */
821 	if (ip->i_nlink > 0) {
822 		if ((op == DR_RMDIR) && (ip->i_type == VDIR)) {
823 			/*
824 			 * Decrement by 1 because there is no "."
825 			 * Clear the inode, but there may be other hard
826 			 * links so don't free the inode.
827 			 * Decrement the dp linkcount because we're
828 			 * trashing the ".." entry.
829 			 */
830 			ip->i_nlink --;
831 			dp->i_nlink--;
832 			dnlc_remove(ITOV(ip), ".");
833 			dnlc_remove(ITOV(ip), "..");
834 /*
835  *			(void) ud_itrunc(ip, 0, 0, cr);
836  */
837 		} else {
838 			ip->i_nlink--;
839 		}
840 	}
841 	ITIMES_NOLOCK(dp);
842 	ITIMES_NOLOCK(ip);
843 	rw_exit(&ip->i_contents);
844 out:
845 	if (mode == VDIR) {
846 		vn_vfsunlock(ITOV(ip));
847 	}
848 out_novfs:
849 	ASSERT(RW_WRITE_HELD(&dp->i_contents));
850 
851 	if (slot.fbp != NULL) {
852 		fbrelse(slot.fbp, S_OTHER);
853 	}
854 	rw_exit(&dp->i_contents);
855 
856 	if (ip) {
857 		/*
858 		 * If no errors, send any events after locks are dropped,
859 		 * but before the VN_RELE().
860 		 */
861 		if (err == 0) {
862 			if (op == DR_REMOVE) {
863 				vnevent_remove(ITOV(ip), ITOV(dp), namep, ctp);
864 			} else if (op == DR_RMDIR) {
865 				vnevent_rmdir(ITOV(ip), ITOV(dp), namep, ctp);
866 			}
867 		}
868 		VN_RELE(ITOV(ip));
869 	}
870 
871 	kmem_free(buf, udf_vfsp->udf_lbsize);
872 	return (err);
873 }
874 
875 int
876 ud_dircheckforname(struct ud_inode *tdp,
877 	char *namep, int32_t namelen, struct slot *slotp,
878 	struct ud_inode **ipp, uint8_t *buf, struct cred *cr)
879 {
880 	struct udf_vfs *udf_vfsp;
881 	uint32_t dirsize, offset;
882 	struct fbuf *fbp;
883 	struct file_id *fid;
884 	int32_t sz, error = 0, sz_req, matched = 0;
885 	uint8_t *nm;
886 
887 	uint8_t *dname;
888 	int32_t id_len;
889 
890 	ud_printf("ud_dircheckforname\n");
891 
892 	ASSERT(RW_WRITE_HELD(&tdp->i_rwlock));
893 	fbp = NULL;
894 
895 	dname = (uint8_t *)kmem_zalloc(1024, KM_SLEEP);
896 
897 	udf_vfsp = tdp->i_udf;
898 
899 	offset = 0;
900 	dirsize = tdp->i_size;
901 
902 	if (slotp->status != FOUND) {
903 		int32_t temp;
904 
905 		temp = 1024; /* set to size of dname allocated above */
906 		if ((error = ud_compress(namelen, &temp,
907 		    (uint8_t *)namep, dname)) != 0) {
908 			goto end;
909 		}
910 		sz_req = F_LEN + temp;
911 		sz_req  = (sz_req + 3) & ~3;
912 	}
913 
914 	while (offset < dirsize) {
915 		if ((error = ud_get_next_fid(tdp, &fbp,
916 		    offset, &fid, &nm, buf)) != 0) {
917 			break;
918 		}
919 		if ((error = ud_uncompress(fid->fid_idlen,
920 		    &id_len, nm, dname)) != 0) {
921 			break;
922 		}
923 		if ((fid->fid_flags & FID_DELETED) == 0) {
924 			/* Check for name match */
925 			if (((namelen == id_len) &&
926 			    (strncmp(namep, (caddr_t)dname, namelen) == 0)) ||
927 			    ((fid->fid_flags & FID_PARENT) &&
928 			    (namep[0] == '.' &&
929 			    (namelen == 1 ||
930 			    (namelen == 2 && namep[1] == '.'))))) {
931 
932 				tdp->i_diroff = offset;
933 				if ((fid->fid_flags & FID_PARENT) &&
934 				    (namelen == 1) && (namep[0] == '.')) {
935 					struct vnode *vp = ITOV(tdp);
936 
937 					*ipp = tdp;
938 					VN_HOLD(vp);
939 				} else {
940 					uint16_t prn;
941 					uint32_t loc;
942 
943 					prn = SWAP_16(fid->fid_icb.lad_ext_prn);
944 					loc = SWAP_32(fid->fid_icb.lad_ext_loc);
945 					if ((error = ud_iget(tdp->i_vfs, prn,
946 					    loc, ipp, NULL, cr)) != 0) {
947 
948 						fbrelse(fbp, S_OTHER);
949 						goto end;
950 					}
951 				}
952 				slotp->status = EXIST;
953 				slotp->offset = offset;
954 				slotp->size = FID_LEN(fid);
955 				slotp->fbp = fbp;
956 				slotp->ep = fid;
957 				slotp->endoff = 0;
958 				goto end;
959 			}
960 		} else {
961 			/*
962 			 * see if we need to find an
963 			 * empty slot and the current slot
964 			 * matches
965 			 */
966 			if ((slotp->status != FOUND) || (matched == 0)) {
967 				sz = FID_LEN(fid);
968 				if (sz == sz_req) {
969 					slotp->status = FOUND;
970 					slotp->offset = offset;
971 					slotp->size = sz;
972 				}
973 				if (matched == 0) {
974 					if ((namelen == id_len) &&
975 					    (strncmp(namep, (caddr_t)dname,
976 					    namelen) == 0)) {
977 						matched = 1;
978 						slotp->status = FOUND;
979 						slotp->offset = offset;
980 						slotp->size = sz;
981 					}
982 				}
983 			}
984 		}
985 		offset += FID_LEN(fid);
986 	}
987 	if (fbp) {
988 		fbrelse(fbp, S_OTHER);
989 	}
990 	if (slotp->status == NONE) {
991 		/*
992 		 * We didn't find a slot; the new directory entry should be put
993 		 * at the end of the directory.  Return an indication of where
994 		 * this is, and set "endoff" to zero; since we're going to have
995 		 * to extend the directory, we're certainly not going to
996 		 * trucate it.
997 		 */
998 		slotp->offset = dirsize;
999 		if (tdp->i_desc_type == ICB_FLAG_ONE_AD) {
1000 			slotp->size = tdp->i_max_emb - tdp->i_size;
1001 		} else {
1002 			slotp->size = udf_vfsp->udf_lbsize -
1003 			    slotp->offset & udf_vfsp->udf_lbmask;
1004 		}
1005 		slotp->endoff = 0;
1006 	}
1007 
1008 	*ipp = NULL;
1009 end:
1010 	kmem_free((caddr_t)dname, 1024);
1011 	return (error);
1012 }
1013 
1014 /*
1015  * Return 1 if the dir has all files
1016  * deleted except the parent
1017  * else return 0
1018  */
1019 /* ARGSUSED */
1020 int
1021 ud_dirempty(struct ud_inode *ip, uint64_t ino, struct cred *cr)
1022 {
1023 	offset_t off;
1024 	int32_t empty = 1, error, count, entry_len, rcount;
1025 	struct file_id *fid;
1026 	caddr_t addr;
1027 	uint32_t tbno;
1028 	int32_t	desc_len;
1029 
1030 	ud_printf("ud_dirempty\n");
1031 
1032 	ASSERT(RW_LOCK_HELD(&ip->i_contents));
1033 
1034 	if (ip->i_size == 0) {
1035 		return (empty);
1036 	}
1037 
1038 	desc_len = 1024;
1039 	addr = kmem_zalloc(desc_len, KM_SLEEP);
1040 	fid = (struct file_id *)addr;
1041 
1042 	for (off = 0; off < ip->i_size; off += entry_len) {
1043 
1044 		/*
1045 		 * First read fid
1046 		 * and verify checksum
1047 		 */
1048 
1049 		rcount = sizeof (struct file_id);
1050 		error = ud_rdwri(UIO_READ, FREAD, ip, addr, rcount, off,
1051 		    UIO_SYSSPACE, &count, cr);
1052 		if ((error != 0) || (count != 0)) {
1053 			empty = 0;
1054 			break;
1055 		}
1056 
1057 		if ((error = ud_ip_off2bno(ip, off, &tbno)) != 0) {
1058 			empty = 0;
1059 			break;
1060 		}
1061 
1062 		/*
1063 		 * We verify the tag id and also the FID_LEN.
1064 		 * FID_LEN should be <= desc_len.
1065 		 */
1066 		if (ud_verify_tag_and_desc(&fid->fid_tag,
1067 		    UD_FILE_ID_DESC,
1068 		    tbno, 0, desc_len) != 0) {
1069 		/* Corrupted directory */
1070 			empty = 0;
1071 			break;
1072 		}
1073 
1074 		/*
1075 		 * Read the fid + iulen + len
1076 		 * Now verify both checksum andCRC
1077 		 */
1078 
1079 		rcount = FID_LEN(fid);
1080 		error = ud_rdwri(UIO_READ, FREAD, ip, addr, rcount, off,
1081 		    UIO_SYSSPACE, &count, cr);
1082 		if ((error != 0) || (count != 0)) {
1083 			empty = 0;
1084 			break;
1085 		}
1086 		/*
1087 		 * Now that the entire decsriptor is read we verify the
1088 		 * crc.
1089 		 */
1090 		if (ud_verify_tag_and_desc(&fid->fid_tag,
1091 		    UD_FILE_ID_DESC,
1092 		    tbno,
1093 		    1, rcount) != 0) {
1094 			/* Corrupted directory */
1095 			empty = 0;
1096 			break;
1097 		}
1098 
1099 		/*
1100 		 * Is the file deleted
1101 		 */
1102 
1103 		if ((fid->fid_flags & FID_DELETED) == 0) {
1104 			if ((fid->fid_flags & FID_PARENT) == 0) {
1105 				empty = 0;
1106 				break;
1107 			}
1108 		}
1109 		entry_len = FID_LEN(fid);
1110 	}
1111 
1112 	kmem_free(addr, 1024);
1113 
1114 	return (empty);
1115 }
1116 
1117 
1118 int
1119 ud_dircheckpath(int32_t blkno,
1120 	struct ud_inode *target, struct cred *cr)
1121 {
1122 	int32_t err = 0;
1123 	struct vfs *vfsp;
1124 	struct udf_vfs *udf_vfsp;
1125 	struct fbuf *fbp;
1126 	struct file_id *fid;
1127 	struct ud_inode *ip, *tip;
1128 	uint16_t prn;
1129 	uint32_t lbno, dummy, tbno;
1130 	daddr_t parent_icb_loc;
1131 
1132 	ud_printf("ud_dircheckpath\n");
1133 
1134 	udf_vfsp = target->i_udf;
1135 	ip = target;
1136 
1137 	ASSERT(udf_vfsp != NULL);
1138 	ASSERT(MUTEX_HELD(&target->i_udf->udf_rename_lck));
1139 	ASSERT(RW_WRITE_HELD(&ip->i_rwlock));
1140 
1141 	if (ip->i_icb_lbano == blkno) {
1142 		err = EINVAL;
1143 		goto out;
1144 	}
1145 	if (ip->i_icb_lbano == udf_vfsp->udf_root_blkno) {
1146 		goto out;
1147 	}
1148 
1149 	/*
1150 	 * Search back through the directory tree, using the PARENT entries
1151 	 * Fail any attempt to move a directory into an ancestor directory.
1152 	 */
1153 	for (;;) {
1154 		if ((err = fbread(ITOV(ip), 0,
1155 		    udf_vfsp->udf_lbsize, S_READ, &fbp)) != 0) {
1156 			break;
1157 		}
1158 
1159 		if ((err = ud_ip_off2bno(ip, 0, &tbno)) != 0) {
1160 			break;
1161 		}
1162 		fid = (struct file_id *)fbp->fb_addr;
1163 		/* IS this a valid file_identifier */
1164 		if (ud_verify_tag_and_desc(&fid->fid_tag,
1165 		    UD_FILE_ID_DESC,
1166 		    tbno,
1167 		    1, udf_vfsp->udf_lbsize) != 0) {
1168 			break;
1169 		}
1170 		if ((fid->fid_flags & FID_DELETED) != 0) {
1171 			break;
1172 		}
1173 		if ((fid->fid_flags & FID_PARENT) == 0) {
1174 			/*
1175 			 * This cannot happen unless
1176 			 * something is grossly wrong
1177 			 * First entry has to be parent
1178 			 */
1179 			break;
1180 		}
1181 		prn = SWAP_16(fid->fid_icb.lad_ext_prn);
1182 		lbno = SWAP_32(fid->fid_icb.lad_ext_loc);
1183 		parent_icb_loc =
1184 		    ud_xlate_to_daddr(udf_vfsp, prn, lbno, 1, &dummy);
1185 		ASSERT(dummy == 1);
1186 		if (parent_icb_loc == blkno) {
1187 			err = EINVAL;
1188 			break;
1189 		}
1190 		vfsp = ip->i_vfs;
1191 		udf_vfsp = ip->i_udf;
1192 		if (parent_icb_loc == udf_vfsp->udf_root_blkno) {
1193 			break;
1194 		}
1195 		if (fbp != NULL) {
1196 			fbrelse(fbp, S_OTHER);
1197 			fbp = NULL;
1198 		}
1199 		if (ip != target) {
1200 			rw_exit(&ip->i_rwlock);
1201 			VN_RELE(ITOV(ip));
1202 		}
1203 
1204 		/*
1205 		 * Race to get the inode.
1206 		 */
1207 		if (err = ud_iget(vfsp, prn, lbno, &tip, NULL, cr)) {
1208 			ip = NULL;
1209 			break;
1210 		}
1211 		ip = tip;
1212 		rw_enter(&ip->i_rwlock, RW_READER);
1213 	}
1214 	if (fbp) {
1215 		fbrelse(fbp, S_OTHER);
1216 	}
1217 out:
1218 	if (ip) {
1219 		if (ip != target) {
1220 			rw_exit(&ip->i_rwlock);
1221 			VN_RELE(ITOV(ip));
1222 		}
1223 	}
1224 	return (err);
1225 }
1226 
1227 int
1228 ud_dirmakeinode(struct ud_inode *tdp, struct ud_inode **ipp,
1229 	struct vattr *vap, enum de_op op, struct cred *cr)
1230 {
1231 	struct ud_inode *ip;
1232 	int32_t error;
1233 
1234 	ASSERT(vap != NULL);
1235 	ASSERT(op == DE_CREATE || op == DE_MKDIR);
1236 	ASSERT((vap->va_mask & (AT_TYPE|AT_MODE)) == (AT_TYPE|AT_MODE));
1237 	ASSERT(RW_WRITE_HELD(&tdp->i_rwlock));
1238 
1239 	/*
1240 	 * Allocate a new inode.
1241 	 */
1242 	if ((error = ud_ialloc(tdp, &ip, vap, cr)) != 0) {
1243 		return (error);
1244 	}
1245 
1246 	ASSERT(ip != NULL);
1247 
1248 	rw_enter(&ip->i_contents, RW_WRITER);
1249 
1250 	if (op == DE_MKDIR) {
1251 		error = ud_dirmakedirect(ip, tdp, cr);
1252 	}
1253 
1254 	ip->i_flag |= IACC|IUPD|ICHG;
1255 	/*
1256 	 * Clear IACC and/or IUPD if the caller specified the atime and/or
1257 	 * mtime fields.  They were set from the passed in attributes in
1258 	 * ud_ialloc().
1259 	 */
1260 	if (vap->va_mask & AT_ATIME)
1261 		ip->i_flag &= ~IACC;
1262 	if (vap->va_mask & AT_MTIME)
1263 		ip->i_flag &= ~IUPD;
1264 	/*
1265 	 * push inode before it's name appears in a directory
1266 	 */
1267 	ud_iupdat(ip, 1);
1268 	*ipp = ip;
1269 	rw_exit(&ip->i_contents);
1270 	return (error);
1271 }
1272 
1273 /*
1274  * Enter the file sip in the directory tdp with name namep.
1275  */
1276 int
1277 ud_diraddentry(struct ud_inode *tdp, char *namep,
1278 	enum de_op op, int32_t namelen, struct slot *slotp,
1279 	struct ud_inode *sip, struct ud_inode *sdp, struct cred *cr)
1280 {
1281 	struct udf_vfs *udf_vfsp;
1282 	int32_t error, temp;
1283 	struct file_id *fid;
1284 	uint8_t *buf = NULL;
1285 
1286 	ASSERT(RW_WRITE_HELD(&tdp->i_rwlock));
1287 
1288 	ud_printf("ud_diraddentry\n");
1289 
1290 	udf_vfsp = sip->i_udf;
1291 
1292 	/*
1293 	 * Check inode to be linked to see if it is in the
1294 	 * same filesystem.
1295 	 */
1296 	if (ITOV(tdp)->v_vfsp != ITOV(sip)->v_vfsp) {
1297 		error = EXDEV;
1298 		goto bad;
1299 	}
1300 
1301 	if ((op == DE_RENAME) && (sip->i_type == VDIR)) {
1302 		if ((error = ud_dirfixdotdot(sip, sdp, tdp)) != 0) {
1303 			goto bad;
1304 		}
1305 	}
1306 
1307 	buf = (uint8_t *)kmem_zalloc(udf_vfsp->udf_lbsize, KM_SLEEP);
1308 
1309 	/*
1310 	 * Fill in entry data.
1311 	 */
1312 	fid = (struct file_id *)buf;
1313 	fid->fid_ver = SWAP_16(1);
1314 	if (sip->i_type == VDIR) {
1315 		fid->fid_flags = FID_DIR;
1316 	} else {
1317 		fid->fid_flags = 0;
1318 	}
1319 	fid->fid_iulen = 0;
1320 
1321 	fid->fid_icb.lad_ext_len = SWAP_32(sip->i_udf->udf_lbsize);
1322 	fid->fid_icb.lad_ext_loc = SWAP_32(sip->i_icb_block);
1323 	fid->fid_icb.lad_ext_prn = SWAP_16(sip->i_icb_prn);
1324 	fid->fid_iulen = 0;
1325 
1326 	temp = MIN(udf_vfsp->udf_lbsize - F_LEN, MAXNAMELEN);
1327 	if ((error = ud_compress(namelen, &temp,
1328 	    (uint8_t *)namep, fid->fid_spec)) == 0) {
1329 		fid->fid_idlen = (uint8_t)temp;
1330 		error = ud_dirprepareentry(tdp, slotp, buf, cr);
1331 	}
1332 
1333 	kmem_free(buf, udf_vfsp->udf_lbsize);
1334 
1335 bad:
1336 	return (error);
1337 }
1338 
1339 /*
1340  * Write a prototype directory into the empty inode ip, whose parent is dp.
1341  */
1342 /* ARGSUSED2 */
1343 int
1344 ud_dirmakedirect(struct ud_inode *ip,
1345 	struct ud_inode *dp, struct cred *cr)
1346 {
1347 	int32_t err;
1348 	uint32_t blkno, size, parent_len, tbno;
1349 	struct fbuf *fbp;
1350 	struct file_id *fid;
1351 	struct icb_ext *iext;
1352 
1353 	ud_printf("ud_dirmakedirect\n");
1354 
1355 	ASSERT(RW_WRITE_HELD(&ip->i_contents));
1356 	ASSERT(RW_WRITE_HELD(&dp->i_rwlock));
1357 
1358 	parent_len = sizeof (struct file_id);
1359 
1360 	if ((ip->i_desc_type != ICB_FLAG_ONE_AD) ||
1361 	    (parent_len > ip->i_max_emb)) {
1362 		ASSERT(ip->i_ext);
1363 		/*
1364 		 * Allocate space for the directory we're creating.
1365 		 */
1366 		if ((err = ud_alloc_space(ip->i_vfs, ip->i_icb_prn,
1367 		    0, 1, &blkno, &size, 0, 0)) != 0) {
1368 			return (err);
1369 		}
1370 		/*
1371 		 * init with the size of
1372 		 * directory with just the
1373 		 * parent
1374 		 */
1375 		ip->i_size = sizeof (struct file_id);
1376 		ip->i_flag |= IUPD|ICHG|IATTCHG;
1377 		iext = ip->i_ext;
1378 		iext->ib_prn = ip->i_icb_prn;
1379 		iext->ib_block = blkno;
1380 		iext->ib_count = ip->i_size;
1381 		iext->ib_offset = 0;
1382 		ip->i_ext_used = 1;
1383 	} else {
1384 		ip->i_size = sizeof (struct file_id);
1385 		ip->i_flag |= IUPD|ICHG|IATTCHG;
1386 	}
1387 
1388 	ITIMES_NOLOCK(ip);
1389 
1390 	/*
1391 	 * Update the dp link count and write out the change.
1392 	 * This reflects the ".." entry we'll soon write.
1393 	 */
1394 	if (dp->i_nlink == MAXLINK) {
1395 		return (EMLINK);
1396 	}
1397 	dp->i_nlink++;
1398 	dp->i_flag |= ICHG;
1399 	ud_iupdat(dp, 1);
1400 
1401 	/*
1402 	 * Initialize directory with ".."
1403 	 * Since the parent directory is locked, we don't have to
1404 	 * worry about anything changing when we drop the write
1405 	 * lock on (ip).
1406 	 */
1407 	rw_exit(&ip->i_contents);
1408 	if ((err = fbread(ITOV(ip), (offset_t)0,
1409 	    ip->i_udf->udf_lbsize, S_WRITE, &fbp)) != 0) {
1410 		rw_enter(&ip->i_contents, RW_WRITER);
1411 		return (err);
1412 	}
1413 
1414 	bzero(fbp->fb_addr, ip->i_udf->udf_lbsize);
1415 
1416 	fid = (struct file_id *)fbp->fb_addr;
1417 	fid->fid_ver = SWAP_16(1);
1418 	fid->fid_flags = FID_DIR | FID_PARENT;
1419 	fid->fid_icb.lad_ext_len = SWAP_32(dp->i_udf->udf_lbsize);
1420 	fid->fid_icb.lad_ext_loc = SWAP_32(dp->i_icb_block);
1421 	fid->fid_icb.lad_ext_prn = SWAP_16(dp->i_icb_prn);
1422 
1423 	/*
1424 	 * fid_idlen, fid_iulen and fid_spec are zero
1425 	 * due to bzero above
1426 	 */
1427 
1428 	if ((err = ud_ip_off2bno(ip, 0, &tbno)) == 0) {
1429 		ud_make_tag(ip->i_udf, &fid->fid_tag,
1430 		    UD_FILE_ID_DESC, tbno, FID_LEN(fid));
1431 	}
1432 
1433 	err = ud_fbwrite(fbp, ip);
1434 	rw_enter(&ip->i_contents, RW_WRITER);
1435 
1436 	return (err);
1437 }
1438 
1439 int
1440 ud_dirrename(struct ud_inode *sdp, struct ud_inode *sip,
1441 	struct ud_inode *tdp, struct ud_inode *tip, char *namep,
1442 	uint8_t *buf, struct slot *slotp, struct cred *cr)
1443 {
1444 	int32_t error = 0, doingdirectory;
1445 	struct file_id *fid;
1446 
1447 	ud_printf("ud_dirrename\n");
1448 	ASSERT(sdp->i_udf != NULL);
1449 	ASSERT(MUTEX_HELD(&sdp->i_udf->udf_rename_lck));
1450 	ASSERT(RW_WRITE_HELD(&tdp->i_rwlock));
1451 	ASSERT(RW_WRITE_HELD(&tdp->i_contents));
1452 	ASSERT(buf);
1453 	ASSERT(slotp->ep);
1454 
1455 	fid = slotp->ep;
1456 
1457 	/*
1458 	 * Short circuit rename of something to itself.
1459 	 */
1460 	if (sip->i_icb_lbano == tip->i_icb_lbano) {
1461 		return (ESAME);		/* special KLUDGE error code */
1462 	}
1463 	/*
1464 	 * Everything is protected under the vfs_rename_lock so the ordering
1465 	 * of i_contents locks doesn't matter here.
1466 	 */
1467 	rw_enter(&sip->i_contents, RW_READER);
1468 	rw_enter(&tip->i_contents, RW_READER);
1469 
1470 	/*
1471 	 * Check that everything is on the same filesystem.
1472 	 */
1473 	if ((ITOV(tip)->v_vfsp != ITOV(tdp)->v_vfsp) ||
1474 	    (ITOV(tip)->v_vfsp != ITOV(sip)->v_vfsp)) {
1475 		error = EXDEV;		/* XXX archaic */
1476 		goto out;
1477 	}
1478 
1479 	/*
1480 	 * Must have write permission to rewrite target entry.
1481 	 */
1482 	if ((error = ud_iaccess(tdp, IWRITE, cr, 0)) != 0 ||
1483 	    (error = ud_sticky_remove_access(tdp, tip, cr)) != 0)
1484 		goto out;
1485 
1486 	/*
1487 	 * Ensure source and target are compatible (both directories
1488 	 * or both not directories).  If target is a directory it must
1489 	 * be empty and have no links to it; in addition it must not
1490 	 * be a mount point, and both the source and target must be
1491 	 * writable.
1492 	 */
1493 	doingdirectory = (sip->i_type == VDIR);
1494 	if (tip->i_type == VDIR) {
1495 		if (!doingdirectory) {
1496 			error = EISDIR;
1497 			goto out;
1498 		}
1499 		/*
1500 		 * vn_vfswlock will prevent mounts from using the directory
1501 		 * until we are done.
1502 		 */
1503 		if (vn_vfswlock(ITOV(tip))) {
1504 			error = EBUSY;
1505 			goto out;
1506 		}
1507 		if (vn_mountedvfs(ITOV(tip)) != NULL) {
1508 			vn_vfsunlock(ITOV(tip));
1509 			error = EBUSY;
1510 			goto out;
1511 		}
1512 		if (!ud_dirempty(tip, tdp->i_uniqid, cr) || tip->i_nlink > 2) {
1513 			vn_vfsunlock(ITOV(tip));
1514 			error = EEXIST;	/* SIGH should be ENOTEMPTY */
1515 			goto out;
1516 		}
1517 	} else if (doingdirectory) {
1518 		error = ENOTDIR;
1519 		goto out;
1520 	}
1521 
1522 	/*
1523 	 * Rewrite the inode pointer for target name entry
1524 	 * from the target inode (ip) to the source inode (sip).
1525 	 * This prevents the target entry from disappearing
1526 	 * during a crash. Mark the directory inode to reflect the changes.
1527 	 */
1528 	dnlc_remove(ITOV(tdp), namep);
1529 	fid->fid_icb.lad_ext_prn = SWAP_16(sip->i_icb_prn);
1530 	fid->fid_icb.lad_ext_loc = SWAP_32(sip->i_icb_block);
1531 	dnlc_enter(ITOV(tdp), namep, ITOV(sip));
1532 
1533 	ud_make_tag(tdp->i_udf, &fid->fid_tag, UD_FILE_ID_DESC,
1534 	    SWAP_32(fid->fid_tag.tag_loc), FID_LEN(fid));
1535 
1536 	error = ud_write_fid(tdp, slotp, buf);
1537 
1538 	if (error) {
1539 		if (doingdirectory) {
1540 			vn_vfsunlock(ITOV(tip));
1541 		}
1542 		goto out;
1543 	}
1544 
1545 	/*
1546 	 * Upgrade to write lock on tip
1547 	 */
1548 	rw_exit(&tip->i_contents);
1549 	rw_enter(&tip->i_contents, RW_WRITER);
1550 
1551 	mutex_enter(&tdp->i_tlock);
1552 	tdp->i_flag |= IUPD|ICHG;
1553 	mutex_exit(&tdp->i_tlock);
1554 	/*
1555 	 * Decrement the link count of the target inode.
1556 	 * Fix the ".." entry in sip to point to dp.
1557 	 * This is done after the new entry is on the disk.
1558 	 */
1559 	tip->i_nlink--;
1560 	mutex_enter(&tip->i_tlock);
1561 	tip->i_flag |= ICHG;
1562 	mutex_exit(&tip->i_tlock);
1563 
1564 	if (doingdirectory) {
1565 		/*
1566 		 * The entry for tip no longer exists so I can unlock the
1567 		 * vfslock.
1568 		 */
1569 		vn_vfsunlock(ITOV(tip));
1570 		/*
1571 		 * Decrement target link count once more if it was a directory.
1572 		 */
1573 		if (tip->i_nlink != 0) {
1574 			cmn_err(CE_WARN,
1575 			"ud_direnter: target directory link count != 0");
1576 			rw_exit(&tip->i_contents);
1577 			rw_exit(&sip->i_contents);
1578 			return (EINVAL);
1579 		}
1580 		/*
1581 		 * Renaming a directory with the parent different
1582 		 * requires that ".." be rewritten.  The window is
1583 		 * still there for ".." to be inconsistent, but this
1584 		 * is unavoidable, and a lot shorter than when it was
1585 		 * done in a user process.  We decrement the link
1586 		 * count in the new parent as appropriate to reflect
1587 		 * the just-removed target.  If the parent is the
1588 		 * same, this is appropriate since the original
1589 		 * directory is going away.  If the new parent is
1590 		 * different, dirfixdotdot() will bump the link count
1591 		 * back.
1592 		 */
1593 		tdp->i_nlink--;
1594 		mutex_enter(&tdp->i_tlock);
1595 		tdp->i_flag |= ICHG;
1596 		mutex_exit(&tdp->i_tlock);
1597 		ITIMES_NOLOCK(tdp);
1598 		if (sdp != tdp) {
1599 			rw_exit(&tip->i_contents);
1600 			rw_exit(&sip->i_contents);
1601 			error = ud_dirfixdotdot(sip, sdp, tdp);
1602 			return (error);
1603 		}
1604 	}
1605 
1606 out:
1607 	rw_exit(&tip->i_contents);
1608 	rw_exit(&sip->i_contents);
1609 	return (error);
1610 }
1611 
1612 
1613 /*
1614  * 1. When we find a slot that belonged to a file which was deleted
1615  *      and is in the middle of the directory
1616  * 2. There is not empty slot available. The new entry
1617  *      will be at the end of the directory and fits in the same block.
1618  * 3. There is no empty slot available. The new
1619  *      entry will not fit the left over directory
1620  *      so we need to allocate a new block. If
1621  *      we cannot allocate a proximity block we need
1622  *      to allocate a new icb, and data block.
1623  */
1624 int
1625 ud_dirprepareentry(struct ud_inode *dp,
1626 	struct slot *slotp, uint8_t *buf, struct cred *cr)
1627 {
1628 	struct fbuf *fbp;
1629 	uint16_t old_dtype;
1630 	int32_t error = 0;
1631 	uint32_t entrysize, count, offset, tbno, old_size, off;
1632 	struct file_id *fid;
1633 	int32_t lbsize, lbmask, mask;
1634 
1635 	ASSERT(RW_WRITE_HELD(&dp->i_rwlock));
1636 
1637 	ASSERT((slotp->status == NONE) || (slotp->status == FOUND));
1638 
1639 	ud_printf("ud_dirprepareentry\n");
1640 	lbsize = dp->i_udf->udf_lbsize;
1641 	lbmask = dp->i_udf->udf_lbmask;
1642 	mask = ~lbmask;
1643 
1644 	fid = (struct file_id *)buf;
1645 	entrysize = FID_LEN(fid);
1646 
1647 	/*
1648 	 * If we didn't find a slot, then indicate that the
1649 	 * new slot belongs at the end of the directory.
1650 	 * If we found a slot, then the new entry can be
1651 	 * put at slotp->offset.
1652 	 */
1653 	if (slotp->status == NONE) {
1654 		/*
1655 		 * We did not find a slot, the next
1656 		 * entry will be in the end of the directory
1657 		 * see if we can fit the new entry inside
1658 		 * the old block. If not allocate a new block.
1659 		 */
1660 		if (entrysize > slotp->size) {
1661 			/*
1662 			 * extend the directory
1663 			 * size by one new block
1664 			 */
1665 			old_dtype = dp->i_desc_type;
1666 			old_size = (uint32_t)dp->i_size;
1667 			error = ud_bmap_write(dp, slotp->offset,
1668 			    blkoff(dp->i_udf, slotp->offset) + entrysize,
1669 			    0, cr);
1670 			if (error != 0) {
1671 				return (error);
1672 			}
1673 			if (old_dtype != dp->i_desc_type) {
1674 				/*
1675 				 * oops we changed the astrat
1676 				 * of the file, we have to
1677 				 * recaliculate tags
1678 				 * fortunately we donot have more
1679 				 * than one lbsize to handle here
1680 				 */
1681 				if ((error = ud_ip_off2bno(dp,
1682 				    0, &tbno)) != 0) {
1683 					return (error);
1684 				}
1685 				if ((error = fbread(ITOV(dp), 0,
1686 				    dp->i_udf->udf_lbsize,
1687 				    S_WRITE, &fbp)) != 0) {
1688 					return (error);
1689 				}
1690 				off = 0;
1691 				while (off < old_size) {
1692 					struct file_id *tfid;
1693 
1694 					tfid = (struct file_id *)
1695 					    (fbp->fb_addr + off);
1696 
1697 					ud_make_tag(dp->i_udf, &tfid->fid_tag,
1698 					    UD_FILE_ID_DESC, tbno,
1699 					    FID_LEN(tfid));
1700 
1701 					off += FID_LEN(tfid);
1702 				}
1703 				if (error = ud_fbwrite(fbp, dp)) {
1704 					return (error);
1705 				}
1706 			}
1707 		} else {
1708 			/* Extend the directory size */
1709 			if (dp->i_desc_type != ICB_FLAG_ONE_AD) {
1710 				ASSERT(dp->i_ext);
1711 				dp->i_ext[dp->i_ext_used - 1].ib_count +=
1712 				    entrysize;
1713 			}
1714 		}
1715 		dp->i_size += entrysize;
1716 		dp->i_flag |= IUPD|ICHG|IATTCHG;
1717 		ITIMES_NOLOCK(dp);
1718 	} else if (slotp->status != FOUND) {
1719 		cmn_err(CE_WARN, "status is not NONE/FOUND");
1720 		return (EINVAL);
1721 	}
1722 
1723 	if ((error = ud_ip_off2bno(dp, slotp->offset, &tbno)) != 0) {
1724 		return (error);
1725 	}
1726 	ud_make_tag(dp->i_udf, &fid->fid_tag, UD_FILE_ID_DESC,
1727 	    tbno, FID_LEN(fid));
1728 
1729 	/*
1730 	 * fbread cannot cross a
1731 	 * MAXBSIZE boundary so handle it here
1732 	 */
1733 	offset = slotp->offset;
1734 	if ((error = fbread(ITOV(dp), offset & mask, lbsize,
1735 	    S_WRITE, &fbp)) != 0) {
1736 		return (error);
1737 	}
1738 	if ((offset & mask) != ((offset + entrysize) & mask)) {
1739 		count = entrysize - ((offset + entrysize) & lbmask);
1740 	} else {
1741 		count = entrysize;
1742 	}
1743 	bcopy((caddr_t)buf, fbp->fb_addr + (offset & lbmask), count);
1744 
1745 	if (error = ud_fbwrite(fbp, dp)) {
1746 		return (error);
1747 	}
1748 
1749 	if (entrysize > count) {
1750 		if ((error = fbread(ITOV(dp), (offset + entrysize) & mask,
1751 		    lbsize, S_WRITE, &fbp)) != 0) {
1752 			return (error);
1753 		}
1754 		bcopy((caddr_t)(buf + count), fbp->fb_addr, entrysize - count);
1755 		if (error = ud_fbwrite(fbp, dp)) {
1756 			return (error);
1757 		}
1758 	}
1759 
1760 	dp->i_flag |= IUPD|ICHG|IATTCHG;
1761 	ITIMES_NOLOCK(dp);
1762 	return (error);
1763 }
1764 
1765 
1766 /*
1767  * Fix the FID_PARENT entry of the child directory so that it points
1768  * to the new parent directory instead of the old one.  Routine
1769  * assumes that dp is a directory and that all the inodes are on
1770  * the same file system.
1771  */
1772 int
1773 ud_dirfixdotdot(struct ud_inode *dp,
1774 	struct ud_inode *opdp, struct ud_inode *npdp)
1775 {
1776 	int32_t err = 0;
1777 	struct fbuf *fbp;
1778 	struct file_id *fid;
1779 	uint32_t loc, dummy, tbno;
1780 
1781 	ud_printf("ud_dirfixdotdot\n");
1782 
1783 	ASSERT(opdp->i_type == VDIR);
1784 	ASSERT(npdp->i_type == VDIR);
1785 
1786 	ASSERT(RW_WRITE_HELD(&npdp->i_rwlock));
1787 
1788 	err = fbread(ITOV(dp), (offset_t)0,
1789 	    dp->i_udf->udf_lbsize, S_WRITE, &fbp);
1790 
1791 	if (err || dp->i_nlink == 0 ||
1792 	    dp->i_size < sizeof (struct file_id)) {
1793 		goto bad;
1794 	}
1795 
1796 	if ((err = ud_ip_off2bno(dp, 0, &tbno)) != 0) {
1797 		goto bad;
1798 	}
1799 
1800 	fid = (struct file_id *)fbp->fb_addr;
1801 	if ((ud_verify_tag_and_desc(&fid->fid_tag, UD_FILE_ID_DESC,
1802 	    tbno,
1803 	    1, dp->i_udf->udf_lbsize) != 0) ||
1804 	    ((fid->fid_flags & (FID_DIR | FID_PARENT)) !=
1805 	    (FID_DIR | FID_PARENT))) {
1806 		err = ENOTDIR;
1807 		goto bad;
1808 	}
1809 
1810 	loc = ud_xlate_to_daddr(dp->i_udf,
1811 	    SWAP_16(fid->fid_icb.lad_ext_prn),
1812 	    SWAP_32(fid->fid_icb.lad_ext_loc), 1, &dummy);
1813 	ASSERT(dummy == 1);
1814 	if (loc == npdp->i_icb_lbano) {
1815 		goto bad;
1816 	}
1817 
1818 	/*
1819 	 * Increment the link count in the new parent inode and force it out.
1820 	 */
1821 	if (npdp->i_nlink == MAXLINK) {
1822 		err = EMLINK;
1823 		goto bad;
1824 	}
1825 
1826 	npdp->i_nlink++;
1827 	mutex_enter(&npdp->i_tlock);
1828 	npdp->i_flag |= ICHG;
1829 	mutex_exit(&npdp->i_tlock);
1830 	ud_iupdat(npdp, 1);
1831 
1832 	/*
1833 	 * Rewrite the child FID_PARENT entry and force it out.
1834 	 */
1835 	dnlc_remove(ITOV(dp), "..");
1836 	fid->fid_icb.lad_ext_loc = SWAP_32(npdp->i_icb_block);
1837 	fid->fid_icb.lad_ext_prn = SWAP_16(npdp->i_icb_prn);
1838 	ud_make_tag(npdp->i_udf, &fid->fid_tag,
1839 	    UD_FILE_ID_DESC, tbno, FID_LEN(fid));
1840 	dnlc_enter(ITOV(dp), "..", ITOV(npdp));
1841 
1842 	err = ud_fbwrite(fbp, dp);
1843 	fbp = NULL;
1844 	if (err != 0) {
1845 		goto bad;
1846 	}
1847 
1848 	/*
1849 	 * Decrement the link count of the old parent inode and force
1850 	 * it out.  If opdp is NULL, then this is a new directory link;
1851 	 * it has no parent, so we need not do anything.
1852 	 */
1853 	if (opdp != NULL) {
1854 		rw_enter(&opdp->i_contents, RW_WRITER);
1855 		if (opdp->i_nlink != 0) {
1856 			opdp->i_nlink--;
1857 			mutex_enter(&opdp->i_tlock);
1858 			opdp->i_flag |= ICHG;
1859 			mutex_exit(&opdp->i_tlock);
1860 			ud_iupdat(opdp, 1);
1861 		}
1862 		rw_exit(&opdp->i_contents);
1863 	}
1864 	return (0);
1865 
1866 bad:
1867 	if (fbp) {
1868 		fbrelse(fbp, S_OTHER);
1869 	}
1870 	return (err);
1871 }
1872 
1873 int32_t
1874 ud_write_fid(struct ud_inode *dp, struct slot *slot, uint8_t *buf)
1875 {
1876 	struct udf_vfs *udf_vfsp;
1877 	struct fbuf *lfbp;
1878 	struct file_id *fid;
1879 	int32_t error = 0;
1880 	uint32_t lbsize, lbmask, count, old_count;
1881 
1882 
1883 	ASSERT(slot->fbp);
1884 	ASSERT(slot->ep);
1885 
1886 	udf_vfsp = dp->i_udf;
1887 	fid = slot->ep;
1888 	lbsize = dp->i_udf->udf_lbsize;
1889 	lbmask = dp->i_udf->udf_lbmask;
1890 
1891 	if (((uint8_t *)fid >= buf) &&
1892 	    ((uint8_t *)fid < &buf[udf_vfsp->udf_lbsize])) {
1893 
1894 		if ((error = fbread(ITOV(dp),
1895 		    (offset_t)(slot->offset & ~lbmask),
1896 		    lbsize, S_WRITE, &lfbp)) != 0) {
1897 			goto out;
1898 		}
1899 
1900 
1901 		/*
1902 		 * We do not need to write the
1903 		 * file name. So check if the entry
1904 		 * does not cross a block boundary
1905 		 * and write only required portions
1906 		 */
1907 		if (((slot->offset & lbmask) +
1908 			sizeof (struct file_id)) > lbsize) {
1909 
1910 			if ((slot->offset & lbmask) != 0) {
1911 				old_count = lbsize -
1912 					(slot->offset & lbmask);
1913 				count = (slot->offset +
1914 					sizeof (struct file_id)) &
1915 					lbmask;
1916 			} else {
1917 				old_count = 0;
1918 				count = sizeof (struct file_id);
1919 			}
1920 
1921 			bcopy(buf, lfbp->fb_addr +
1922 				(slot->offset & lbmask), old_count);
1923 			bcopy(buf + old_count,
1924 				slot->fbp->fb_addr, count);
1925 
1926 			error = ud_fbwrite(lfbp, dp);
1927 
1928 			error = ud_fbwrite(slot->fbp, dp);
1929 		} else {
1930 			bcopy(buf, lfbp->fb_addr +
1931 				(slot->offset & lbmask),
1932 				sizeof (struct file_id));
1933 
1934 			error = ud_fbwrite(lfbp, dp);
1935 
1936 			fbrelse(slot->fbp, S_OTHER);
1937 		}
1938 	} else {
1939 		if ((error = ud_fbwrite(slot->fbp, dp)) != 0) {
1940 			fid->fid_flags &= ~FID_DELETED;
1941 			ud_make_tag(dp->i_udf, &fid->fid_tag, UD_FILE_ID_DESC,
1942 			    SWAP_32(fid->fid_tag.tag_loc), FID_LEN(fid));
1943 		}
1944 	}
1945 	slot->fbp = NULL;
1946 
1947 out:
1948 	return (error);
1949 }
1950