xref: /freebsd/sys/kern/kern_conf.c (revision 6b2c1e49da284f28ec7b52f7c031474087e37104)
1 /*-
2  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3  *
4  * Copyright (c) 1999-2002 Poul-Henning Kamp
5  * All rights reserved.
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  * 1. Redistributions of source code must retain the above copyright
11  *    notice, this list of conditions and the following disclaimer.
12  * 2. Redistributions in binary form must reproduce the above copyright
13  *    notice, this list of conditions and the following disclaimer in the
14  *    documentation and/or other materials provided with the distribution.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
17  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
18  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
19  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
20  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
21  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
22  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
23  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
24  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26  * SUCH DAMAGE.
27  */
28 
29 #include <sys/cdefs.h>
30 __FBSDID("$FreeBSD$");
31 
32 #include <sys/param.h>
33 #include <sys/kernel.h>
34 #include <sys/systm.h>
35 #include <sys/bus.h>
36 #include <sys/bio.h>
37 #include <sys/lock.h>
38 #include <sys/mutex.h>
39 #include <sys/module.h>
40 #include <sys/malloc.h>
41 #include <sys/conf.h>
42 #include <sys/vnode.h>
43 #include <sys/queue.h>
44 #include <sys/poll.h>
45 #include <sys/sx.h>
46 #include <sys/ctype.h>
47 #include <sys/ucred.h>
48 #include <sys/taskqueue.h>
49 #include <machine/stdarg.h>
50 
51 #include <fs/devfs/devfs_int.h>
52 #include <vm/vm.h>
53 
54 static MALLOC_DEFINE(M_DEVT, "cdev", "cdev storage");
55 
56 struct mtx devmtx;
57 static void destroy_devl(struct cdev *dev);
58 static int destroy_dev_sched_cbl(struct cdev *dev,
59     void (*cb)(void *), void *arg);
60 static void destroy_dev_tq(void *ctx, int pending);
61 static int make_dev_credv(int flags, struct cdev **dres, struct cdevsw *devsw,
62     int unit, struct ucred *cr, uid_t uid, gid_t gid, int mode, const char *fmt,
63     va_list ap);
64 
65 static struct cdev_priv_list cdevp_free_list =
66     TAILQ_HEAD_INITIALIZER(cdevp_free_list);
67 static SLIST_HEAD(free_cdevsw, cdevsw) cdevsw_gt_post_list =
68     SLIST_HEAD_INITIALIZER(cdevsw_gt_post_list);
69 
70 void
71 dev_lock(void)
72 {
73 
74 	mtx_lock(&devmtx);
75 }
76 
77 /*
78  * Free all the memory collected while the cdev mutex was
79  * locked. Since devmtx is after the system map mutex, free() cannot
80  * be called immediately and is postponed until cdev mutex can be
81  * dropped.
82  */
83 static void
84 dev_unlock_and_free(void)
85 {
86 	struct cdev_priv_list cdp_free;
87 	struct free_cdevsw csw_free;
88 	struct cdev_priv *cdp;
89 	struct cdevsw *csw;
90 
91 	mtx_assert(&devmtx, MA_OWNED);
92 
93 	/*
94 	 * Make the local copy of the list heads while the dev_mtx is
95 	 * held. Free it later.
96 	 */
97 	TAILQ_INIT(&cdp_free);
98 	TAILQ_CONCAT(&cdp_free, &cdevp_free_list, cdp_list);
99 	csw_free = cdevsw_gt_post_list;
100 	SLIST_INIT(&cdevsw_gt_post_list);
101 
102 	mtx_unlock(&devmtx);
103 
104 	while ((cdp = TAILQ_FIRST(&cdp_free)) != NULL) {
105 		TAILQ_REMOVE(&cdp_free, cdp, cdp_list);
106 		devfs_free(&cdp->cdp_c);
107 	}
108 	while ((csw = SLIST_FIRST(&csw_free)) != NULL) {
109 		SLIST_REMOVE_HEAD(&csw_free, d_postfree_list);
110 		free(csw, M_DEVT);
111 	}
112 }
113 
114 static void
115 dev_free_devlocked(struct cdev *cdev)
116 {
117 	struct cdev_priv *cdp;
118 
119 	mtx_assert(&devmtx, MA_OWNED);
120 	cdp = cdev2priv(cdev);
121 	KASSERT((cdp->cdp_flags & CDP_UNREF_DTR) == 0,
122 	    ("destroy_dev() was not called after delist_dev(%p)", cdev));
123 	TAILQ_INSERT_HEAD(&cdevp_free_list, cdp, cdp_list);
124 }
125 
126 static void
127 cdevsw_free_devlocked(struct cdevsw *csw)
128 {
129 
130 	mtx_assert(&devmtx, MA_OWNED);
131 	SLIST_INSERT_HEAD(&cdevsw_gt_post_list, csw, d_postfree_list);
132 }
133 
134 void
135 dev_unlock(void)
136 {
137 
138 	mtx_unlock(&devmtx);
139 }
140 
141 void
142 dev_ref(struct cdev *dev)
143 {
144 
145 	mtx_assert(&devmtx, MA_NOTOWNED);
146 	mtx_lock(&devmtx);
147 	dev->si_refcount++;
148 	mtx_unlock(&devmtx);
149 }
150 
151 void
152 dev_refl(struct cdev *dev)
153 {
154 
155 	mtx_assert(&devmtx, MA_OWNED);
156 	dev->si_refcount++;
157 }
158 
159 void
160 dev_rel(struct cdev *dev)
161 {
162 	int flag = 0;
163 
164 	mtx_assert(&devmtx, MA_NOTOWNED);
165 	dev_lock();
166 	dev->si_refcount--;
167 	KASSERT(dev->si_refcount >= 0,
168 	    ("dev_rel(%s) gave negative count", devtoname(dev)));
169 	if (dev->si_devsw == NULL && dev->si_refcount == 0) {
170 		LIST_REMOVE(dev, si_list);
171 		flag = 1;
172 	}
173 	dev_unlock();
174 	if (flag)
175 		devfs_free(dev);
176 }
177 
178 struct cdevsw *
179 dev_refthread(struct cdev *dev, int *ref)
180 {
181 	struct cdevsw *csw;
182 	struct cdev_priv *cdp;
183 
184 	mtx_assert(&devmtx, MA_NOTOWNED);
185 	if ((dev->si_flags & SI_ETERNAL) != 0) {
186 		*ref = 0;
187 		return (dev->si_devsw);
188 	}
189 	dev_lock();
190 	csw = dev->si_devsw;
191 	if (csw != NULL) {
192 		cdp = cdev2priv(dev);
193 		if ((cdp->cdp_flags & CDP_SCHED_DTR) == 0)
194 			atomic_add_long(&dev->si_threadcount, 1);
195 		else
196 			csw = NULL;
197 	}
198 	dev_unlock();
199 	if (csw != NULL)
200 		*ref = 1;
201 	return (csw);
202 }
203 
204 struct cdevsw *
205 devvn_refthread(struct vnode *vp, struct cdev **devp, int *ref)
206 {
207 	struct cdevsw *csw;
208 	struct cdev_priv *cdp;
209 	struct cdev *dev;
210 
211 	mtx_assert(&devmtx, MA_NOTOWNED);
212 	if ((vp->v_vflag & VV_ETERNALDEV) != 0) {
213 		dev = vp->v_rdev;
214 		if (dev == NULL)
215 			return (NULL);
216 		KASSERT((dev->si_flags & SI_ETERNAL) != 0,
217 		    ("Not eternal cdev"));
218 		*ref = 0;
219 		csw = dev->si_devsw;
220 		KASSERT(csw != NULL, ("Eternal cdev is destroyed"));
221 		*devp = dev;
222 		return (csw);
223 	}
224 
225 	csw = NULL;
226 	dev_lock();
227 	dev = vp->v_rdev;
228 	if (dev == NULL) {
229 		dev_unlock();
230 		return (NULL);
231 	}
232 	cdp = cdev2priv(dev);
233 	if ((cdp->cdp_flags & CDP_SCHED_DTR) == 0) {
234 		csw = dev->si_devsw;
235 		if (csw != NULL)
236 			atomic_add_long(&dev->si_threadcount, 1);
237 	}
238 	dev_unlock();
239 	if (csw != NULL) {
240 		*devp = dev;
241 		*ref = 1;
242 	}
243 	return (csw);
244 }
245 
246 void
247 dev_relthread(struct cdev *dev, int ref)
248 {
249 
250 	mtx_assert(&devmtx, MA_NOTOWNED);
251 	if (!ref)
252 		return;
253 	KASSERT(dev->si_threadcount > 0,
254 	    ("%s threadcount is wrong", dev->si_name));
255 	atomic_subtract_rel_long(&dev->si_threadcount, 1);
256 }
257 
/*
 * Stub that does nothing and reports success (0).
 */
int
nullop(void)
{

	return (0);
}
264 
/*
 * Stub that always fails with EOPNOTSUPP.
 */
int
eopnotsupp(void)
{

	return (EOPNOTSUPP);
}
271 
/*
 * Stub that always fails with ENXIO.
 */
static int
enxio(void)
{

	return (ENXIO);
}
277 
/*
 * Stub that always fails with ENODEV.
 */
static int
enodev(void)
{

	return (ENODEV);
}
283 
284 /* Define a dead_cdevsw for use when devices leave unexpectedly. */
285 
286 #define dead_open	(d_open_t *)enxio
287 #define dead_close	(d_close_t *)enxio
288 #define dead_read	(d_read_t *)enxio
289 #define dead_write	(d_write_t *)enxio
290 #define dead_ioctl	(d_ioctl_t *)enxio
291 #define dead_poll	(d_poll_t *)enodev
292 #define dead_mmap	(d_mmap_t *)enodev
293 
294 static void
295 dead_strategy(struct bio *bp)
296 {
297 
298 	biofinish(bp, NULL, ENXIO);
299 }
300 
301 #define dead_dump	(dumper_t *)enxio
302 #define dead_kqfilter	(d_kqfilter_t *)enxio
303 #define dead_mmap_single (d_mmap_single_t *)enodev
304 
305 static struct cdevsw dead_cdevsw = {
306 	.d_version =	D_VERSION,
307 	.d_open =	dead_open,
308 	.d_close =	dead_close,
309 	.d_read =	dead_read,
310 	.d_write =	dead_write,
311 	.d_ioctl =	dead_ioctl,
312 	.d_poll =	dead_poll,
313 	.d_mmap =	dead_mmap,
314 	.d_strategy =	dead_strategy,
315 	.d_name =	"dead",
316 	.d_dump =	dead_dump,
317 	.d_kqfilter =	dead_kqfilter,
318 	.d_mmap_single = dead_mmap_single
319 };
320 
321 /* Default methods if driver does not specify method */
322 
323 #define null_open	(d_open_t *)nullop
324 #define null_close	(d_close_t *)nullop
325 #define no_read		(d_read_t *)enodev
326 #define no_write	(d_write_t *)enodev
327 #define no_ioctl	(d_ioctl_t *)enodev
328 #define no_mmap		(d_mmap_t *)enodev
329 #define no_kqfilter	(d_kqfilter_t *)enodev
330 #define no_mmap_single	(d_mmap_single_t *)enodev
331 
332 static void
333 no_strategy(struct bio *bp)
334 {
335 
336 	biofinish(bp, NULL, ENODEV);
337 }
338 
339 static int
340 no_poll(struct cdev *dev __unused, int events, struct thread *td __unused)
341 {
342 
343 	return (poll_no_poll(events));
344 }
345 
346 #define no_dump		(dumper_t *)enodev
347 
348 static int
349 giant_open(struct cdev *dev, int oflags, int devtype, struct thread *td)
350 {
351 	struct cdevsw *dsw;
352 	int ref, retval;
353 
354 	dsw = dev_refthread(dev, &ref);
355 	if (dsw == NULL)
356 		return (ENXIO);
357 	mtx_lock(&Giant);
358 	retval = dsw->d_gianttrick->d_open(dev, oflags, devtype, td);
359 	mtx_unlock(&Giant);
360 	dev_relthread(dev, ref);
361 	return (retval);
362 }
363 
364 static int
365 giant_fdopen(struct cdev *dev, int oflags, struct thread *td, struct file *fp)
366 {
367 	struct cdevsw *dsw;
368 	int ref, retval;
369 
370 	dsw = dev_refthread(dev, &ref);
371 	if (dsw == NULL)
372 		return (ENXIO);
373 	mtx_lock(&Giant);
374 	retval = dsw->d_gianttrick->d_fdopen(dev, oflags, td, fp);
375 	mtx_unlock(&Giant);
376 	dev_relthread(dev, ref);
377 	return (retval);
378 }
379 
380 static int
381 giant_close(struct cdev *dev, int fflag, int devtype, struct thread *td)
382 {
383 	struct cdevsw *dsw;
384 	int ref, retval;
385 
386 	dsw = dev_refthread(dev, &ref);
387 	if (dsw == NULL)
388 		return (ENXIO);
389 	mtx_lock(&Giant);
390 	retval = dsw->d_gianttrick->d_close(dev, fflag, devtype, td);
391 	mtx_unlock(&Giant);
392 	dev_relthread(dev, ref);
393 	return (retval);
394 }
395 
396 static void
397 giant_strategy(struct bio *bp)
398 {
399 	struct cdevsw *dsw;
400 	struct cdev *dev;
401 	int ref;
402 
403 	dev = bp->bio_dev;
404 	dsw = dev_refthread(dev, &ref);
405 	if (dsw == NULL) {
406 		biofinish(bp, NULL, ENXIO);
407 		return;
408 	}
409 	mtx_lock(&Giant);
410 	dsw->d_gianttrick->d_strategy(bp);
411 	mtx_unlock(&Giant);
412 	dev_relthread(dev, ref);
413 }
414 
415 static int
416 giant_ioctl(struct cdev *dev, u_long cmd, caddr_t data, int fflag, struct thread *td)
417 {
418 	struct cdevsw *dsw;
419 	int ref, retval;
420 
421 	dsw = dev_refthread(dev, &ref);
422 	if (dsw == NULL)
423 		return (ENXIO);
424 	mtx_lock(&Giant);
425 	retval = dsw->d_gianttrick->d_ioctl(dev, cmd, data, fflag, td);
426 	mtx_unlock(&Giant);
427 	dev_relthread(dev, ref);
428 	return (retval);
429 }
430 
431 static int
432 giant_read(struct cdev *dev, struct uio *uio, int ioflag)
433 {
434 	struct cdevsw *dsw;
435 	int ref, retval;
436 
437 	dsw = dev_refthread(dev, &ref);
438 	if (dsw == NULL)
439 		return (ENXIO);
440 	mtx_lock(&Giant);
441 	retval = dsw->d_gianttrick->d_read(dev, uio, ioflag);
442 	mtx_unlock(&Giant);
443 	dev_relthread(dev, ref);
444 	return (retval);
445 }
446 
447 static int
448 giant_write(struct cdev *dev, struct uio *uio, int ioflag)
449 {
450 	struct cdevsw *dsw;
451 	int ref, retval;
452 
453 	dsw = dev_refthread(dev, &ref);
454 	if (dsw == NULL)
455 		return (ENXIO);
456 	mtx_lock(&Giant);
457 	retval = dsw->d_gianttrick->d_write(dev, uio, ioflag);
458 	mtx_unlock(&Giant);
459 	dev_relthread(dev, ref);
460 	return (retval);
461 }
462 
463 static int
464 giant_poll(struct cdev *dev, int events, struct thread *td)
465 {
466 	struct cdevsw *dsw;
467 	int ref, retval;
468 
469 	dsw = dev_refthread(dev, &ref);
470 	if (dsw == NULL)
471 		return (ENXIO);
472 	mtx_lock(&Giant);
473 	retval = dsw->d_gianttrick->d_poll(dev, events, td);
474 	mtx_unlock(&Giant);
475 	dev_relthread(dev, ref);
476 	return (retval);
477 }
478 
479 static int
480 giant_kqfilter(struct cdev *dev, struct knote *kn)
481 {
482 	struct cdevsw *dsw;
483 	int ref, retval;
484 
485 	dsw = dev_refthread(dev, &ref);
486 	if (dsw == NULL)
487 		return (ENXIO);
488 	mtx_lock(&Giant);
489 	retval = dsw->d_gianttrick->d_kqfilter(dev, kn);
490 	mtx_unlock(&Giant);
491 	dev_relthread(dev, ref);
492 	return (retval);
493 }
494 
495 static int
496 giant_mmap(struct cdev *dev, vm_ooffset_t offset, vm_paddr_t *paddr, int nprot,
497     vm_memattr_t *memattr)
498 {
499 	struct cdevsw *dsw;
500 	int ref, retval;
501 
502 	dsw = dev_refthread(dev, &ref);
503 	if (dsw == NULL)
504 		return (ENXIO);
505 	mtx_lock(&Giant);
506 	retval = dsw->d_gianttrick->d_mmap(dev, offset, paddr, nprot,
507 	    memattr);
508 	mtx_unlock(&Giant);
509 	dev_relthread(dev, ref);
510 	return (retval);
511 }
512 
513 static int
514 giant_mmap_single(struct cdev *dev, vm_ooffset_t *offset, vm_size_t size,
515     vm_object_t *object, int nprot)
516 {
517 	struct cdevsw *dsw;
518 	int ref, retval;
519 
520 	dsw = dev_refthread(dev, &ref);
521 	if (dsw == NULL)
522 		return (ENXIO);
523 	mtx_lock(&Giant);
524 	retval = dsw->d_gianttrick->d_mmap_single(dev, offset, size, object,
525 	    nprot);
526 	mtx_unlock(&Giant);
527 	dev_relthread(dev, ref);
528 	return (retval);
529 }
530 
531 static void
532 notify(struct cdev *dev, const char *ev, int flags)
533 {
534 	static const char prefix[] = "cdev=";
535 	char *data;
536 	int namelen, mflags;
537 
538 	if (cold)
539 		return;
540 	mflags = (flags & MAKEDEV_NOWAIT) ? M_NOWAIT : M_WAITOK;
541 	namelen = strlen(dev->si_name);
542 	data = malloc(namelen + sizeof(prefix), M_TEMP, mflags);
543 	if (data == NULL)
544 		return;
545 	memcpy(data, prefix, sizeof(prefix) - 1);
546 	memcpy(data + sizeof(prefix) - 1, dev->si_name, namelen + 1);
547 	devctl_notify_f("DEVFS", "CDEV", ev, data, mflags);
548 	free(data, M_TEMP);
549 }
550 
/*
 * Announce creation of a cdev ("CREATE" event).  'flags' are the
 * MAKEDEV_* flags of the creating call and are passed through to
 * notify().
 */
static void
notify_create(struct cdev *dev, int flags)
{

	notify(dev, "CREATE", flags);
}
557 
558 static void
559 notify_destroy(struct cdev *dev)
560 {
561 
562 	notify(dev, "DESTROY", MAKEDEV_WAITOK);
563 }
564 
565 static struct cdev *
566 newdev(struct make_dev_args *args, struct cdev *si)
567 {
568 	struct cdev *si2;
569 	struct cdevsw *csw;
570 
571 	mtx_assert(&devmtx, MA_OWNED);
572 	csw = args->mda_devsw;
573 	si2 = NULL;
574 	if (csw->d_flags & D_NEEDMINOR) {
575 		/* We may want to return an existing device */
576 		LIST_FOREACH(si2, &csw->d_devs, si_list) {
577 			if (dev2unit(si2) == args->mda_unit) {
578 				dev_free_devlocked(si);
579 				si = si2;
580 				break;
581 			}
582 		}
583 
584 		/*
585 		 * If we're returning an existing device, we should make sure
586 		 * it isn't already initialized.  This would have been caught
587 		 * in consumers anyways, but it's good to catch such a case
588 		 * early.  We still need to complete initialization of the
589 		 * device, and we'll use whatever make_dev_args were passed in
590 		 * to do so.
591 		 */
592 		KASSERT(si2 == NULL || (si2->si_flags & SI_NAMED) == 0,
593 		    ("make_dev() by driver %s on pre-existing device (min=%x, name=%s)",
594 		    args->mda_devsw->d_name, dev2unit(si2), devtoname(si2)));
595 	}
596 	si->si_drv0 = args->mda_unit;
597 	si->si_drv1 = args->mda_si_drv1;
598 	si->si_drv2 = args->mda_si_drv2;
599 	/* Only push to csw->d_devs if it's not a cloned device. */
600 	if (si2 == NULL) {
601 		si->si_devsw = csw;
602 		LIST_INSERT_HEAD(&csw->d_devs, si, si_list);
603 	} else {
604 		KASSERT(si->si_devsw == csw,
605 		    ("%s: inconsistent devsw between clone_create() and make_dev()",
606 		    __func__));
607 	}
608 	return (si);
609 }
610 
611 static void
612 fini_cdevsw(struct cdevsw *devsw)
613 {
614 	struct cdevsw *gt;
615 
616 	if (devsw->d_gianttrick != NULL) {
617 		gt = devsw->d_gianttrick;
618 		memcpy(devsw, gt, sizeof *devsw);
619 		cdevsw_free_devlocked(gt);
620 		devsw->d_gianttrick = NULL;
621 	}
622 	devsw->d_flags &= ~D_INIT;
623 }
624 
625 static int
626 prep_cdevsw(struct cdevsw *devsw, int flags)
627 {
628 	struct cdevsw *dsw2;
629 
630 	mtx_assert(&devmtx, MA_OWNED);
631 	if (devsw->d_flags & D_INIT)
632 		return (0);
633 	if (devsw->d_flags & D_NEEDGIANT) {
634 		dev_unlock();
635 		dsw2 = malloc(sizeof *dsw2, M_DEVT,
636 		     (flags & MAKEDEV_NOWAIT) ? M_NOWAIT : M_WAITOK);
637 		dev_lock();
638 		if (dsw2 == NULL && !(devsw->d_flags & D_INIT))
639 			return (ENOMEM);
640 	} else
641 		dsw2 = NULL;
642 	if (devsw->d_flags & D_INIT) {
643 		if (dsw2 != NULL)
644 			cdevsw_free_devlocked(dsw2);
645 		return (0);
646 	}
647 
648 	if (devsw->d_version != D_VERSION_04) {
649 		printf(
650 		    "WARNING: Device driver \"%s\" has wrong version %s\n",
651 		    devsw->d_name == NULL ? "???" : devsw->d_name,
652 		    "and is disabled.  Recompile KLD module.");
653 		devsw->d_open = dead_open;
654 		devsw->d_close = dead_close;
655 		devsw->d_read = dead_read;
656 		devsw->d_write = dead_write;
657 		devsw->d_ioctl = dead_ioctl;
658 		devsw->d_poll = dead_poll;
659 		devsw->d_mmap = dead_mmap;
660 		devsw->d_mmap_single = dead_mmap_single;
661 		devsw->d_strategy = dead_strategy;
662 		devsw->d_dump = dead_dump;
663 		devsw->d_kqfilter = dead_kqfilter;
664 	}
665 
666 	if (devsw->d_flags & D_NEEDGIANT) {
667 		printf("WARNING: Device \"%s\" is Giant locked and may be "
668 		    "deleted before FreeBSD 13.0.\n",
669 		    devsw->d_name == NULL ? "???" : devsw->d_name);
670 		if (devsw->d_gianttrick == NULL) {
671 			memcpy(dsw2, devsw, sizeof *dsw2);
672 			devsw->d_gianttrick = dsw2;
673 			dsw2 = NULL;
674 		}
675 	}
676 
677 #define FIXUP(member, noop, giant) 				\
678 	do {							\
679 		if (devsw->member == NULL) {			\
680 			devsw->member = noop;			\
681 		} else if (devsw->d_flags & D_NEEDGIANT)	\
682 			devsw->member = giant;			\
683 		}						\
684 	while (0)
685 
686 	FIXUP(d_open,		null_open,	giant_open);
687 	FIXUP(d_fdopen,		NULL,		giant_fdopen);
688 	FIXUP(d_close,		null_close,	giant_close);
689 	FIXUP(d_read,		no_read,	giant_read);
690 	FIXUP(d_write,		no_write,	giant_write);
691 	FIXUP(d_ioctl,		no_ioctl,	giant_ioctl);
692 	FIXUP(d_poll,		no_poll,	giant_poll);
693 	FIXUP(d_mmap,		no_mmap,	giant_mmap);
694 	FIXUP(d_strategy,	no_strategy,	giant_strategy);
695 	FIXUP(d_kqfilter,	no_kqfilter,	giant_kqfilter);
696 	FIXUP(d_mmap_single,	no_mmap_single,	giant_mmap_single);
697 
698 	if (devsw->d_dump == NULL)	devsw->d_dump = no_dump;
699 
700 	LIST_INIT(&devsw->d_devs);
701 
702 	devsw->d_flags |= D_INIT;
703 
704 	if (dsw2 != NULL)
705 		cdevsw_free_devlocked(dsw2);
706 	return (0);
707 }
708 
709 static int
710 prep_devname(struct cdev *dev, const char *fmt, va_list ap)
711 {
712 	int len;
713 	char *from, *q, *s, *to;
714 
715 	mtx_assert(&devmtx, MA_OWNED);
716 
717 	len = vsnrprintf(dev->si_name, sizeof(dev->si_name), 32, fmt, ap);
718 	if (len > sizeof(dev->si_name) - 1)
719 		return (ENAMETOOLONG);
720 
721 	/* Strip leading slashes. */
722 	for (from = dev->si_name; *from == '/'; from++)
723 		;
724 
725 	for (to = dev->si_name; *from != '\0'; from++, to++) {
726 		/*
727 		 * Spaces and double quotation marks cause
728 		 * problems for the devctl(4) protocol.
729 		 * Reject names containing those characters.
730 		 */
731 		if (isspace(*from) || *from == '"')
732 			return (EINVAL);
733 		/* Treat multiple sequential slashes as single. */
734 		while (from[0] == '/' && from[1] == '/')
735 			from++;
736 		/* Trailing slash is considered invalid. */
737 		if (from[0] == '/' && from[1] == '\0')
738 			return (EINVAL);
739 		*to = *from;
740 	}
741 	*to = '\0';
742 
743 	if (dev->si_name[0] == '\0')
744 		return (EINVAL);
745 
746 	/* Disallow "." and ".." components. */
747 	for (s = dev->si_name;;) {
748 		for (q = s; *q != '/' && *q != '\0'; q++)
749 			;
750 		if (q - s == 1 && s[0] == '.')
751 			return (EINVAL);
752 		if (q - s == 2 && s[0] == '.' && s[1] == '.')
753 			return (EINVAL);
754 		if (*q != '/')
755 			break;
756 		s = q + 1;
757 	}
758 
759 	if (devfs_dev_exists(dev->si_name) != 0)
760 		return (EEXIST);
761 
762 	return (0);
763 }
764 
765 void
766 make_dev_args_init_impl(struct make_dev_args *args, size_t sz)
767 {
768 
769 	bzero(args, sz);
770 	args->mda_size = sz;
771 }
772 
773 static int
774 make_dev_sv(struct make_dev_args *args1, struct cdev **dres,
775     const char *fmt, va_list ap)
776 {
777 	struct cdev *dev, *dev_new;
778 	struct make_dev_args args;
779 	int res;
780 
781 	bzero(&args, sizeof(args));
782 	if (sizeof(args) < args1->mda_size)
783 		return (EINVAL);
784 	bcopy(args1, &args, args1->mda_size);
785 	KASSERT((args.mda_flags & MAKEDEV_WAITOK) == 0 ||
786 	    (args.mda_flags & MAKEDEV_NOWAIT) == 0,
787 	    ("make_dev_sv: both WAITOK and NOWAIT specified"));
788 	dev_new = devfs_alloc(args.mda_flags);
789 	if (dev_new == NULL)
790 		return (ENOMEM);
791 	dev_lock();
792 	res = prep_cdevsw(args.mda_devsw, args.mda_flags);
793 	if (res != 0) {
794 		dev_unlock();
795 		devfs_free(dev_new);
796 		return (res);
797 	}
798 	dev = newdev(&args, dev_new);
799 	if ((dev->si_flags & SI_NAMED) == 0) {
800 		res = prep_devname(dev, fmt, ap);
801 		if (res != 0) {
802 			if ((args.mda_flags & MAKEDEV_CHECKNAME) == 0) {
803 				panic(
804 			"make_dev_sv: bad si_name (error=%d, si_name=%s)",
805 				    res, dev->si_name);
806 			}
807 			if (dev == dev_new) {
808 				LIST_REMOVE(dev, si_list);
809 				dev_unlock();
810 				devfs_free(dev);
811 			} else
812 				dev_unlock();
813 			return (res);
814 		}
815 	}
816 	if ((args.mda_flags & MAKEDEV_REF) != 0)
817 		dev_refl(dev);
818 	if ((args.mda_flags & MAKEDEV_ETERNAL) != 0)
819 		dev->si_flags |= SI_ETERNAL;
820 	KASSERT(!(dev->si_flags & SI_NAMED),
821 	    ("make_dev() by driver %s on pre-existing device (min=%x, name=%s)",
822 	    args.mda_devsw->d_name, dev2unit(dev), devtoname(dev)));
823 	dev->si_flags |= SI_NAMED;
824 	if (args.mda_cr != NULL)
825 		dev->si_cred = crhold(args.mda_cr);
826 	dev->si_uid = args.mda_uid;
827 	dev->si_gid = args.mda_gid;
828 	dev->si_mode = args.mda_mode;
829 
830 	devfs_create(dev);
831 	clean_unrhdrl(devfs_inos);
832 	dev_unlock_and_free();
833 
834 	notify_create(dev, args.mda_flags);
835 
836 	*dres = dev;
837 	return (0);
838 }
839 
/*
 * Create a cdev described by 'args', with a printf-style name.  Variadic
 * front end to make_dev_sv(); returns its result and stores the cdev in
 * *dres on success.
 */
int
make_dev_s(struct make_dev_args *args, struct cdev **dres,
    const char *fmt, ...)
{
	va_list ap;
	int error;

	va_start(ap, fmt);
	error = make_dev_sv(args, dres, fmt, ap);
	va_end(ap);

	return (error);
}
852 
853 static int
854 make_dev_credv(int flags, struct cdev **dres, struct cdevsw *devsw, int unit,
855     struct ucred *cr, uid_t uid, gid_t gid, int mode, const char *fmt,
856     va_list ap)
857 {
858 	struct make_dev_args args;
859 
860 	make_dev_args_init(&args);
861 	args.mda_flags = flags;
862 	args.mda_devsw = devsw;
863 	args.mda_cr = cr;
864 	args.mda_uid = uid;
865 	args.mda_gid = gid;
866 	args.mda_mode = mode;
867 	args.mda_unit = unit;
868 	return (make_dev_sv(&args, dres, fmt, ap));
869 }
870 
871 struct cdev *
872 make_dev(struct cdevsw *devsw, int unit, uid_t uid, gid_t gid, int mode,
873     const char *fmt, ...)
874 {
875 	struct cdev *dev;
876 	va_list ap;
877 	int res __unused;
878 
879 	va_start(ap, fmt);
880 	res = make_dev_credv(0, &dev, devsw, unit, NULL, uid, gid, mode, fmt,
881 		      ap);
882 	va_end(ap);
883 	KASSERT(res == 0 && dev != NULL,
884 	    ("make_dev: failed make_dev_credv (error=%d)", res));
885 	return (dev);
886 }
887 
888 struct cdev *
889 make_dev_cred(struct cdevsw *devsw, int unit, struct ucred *cr, uid_t uid,
890     gid_t gid, int mode, const char *fmt, ...)
891 {
892 	struct cdev *dev;
893 	va_list ap;
894 	int res __unused;
895 
896 	va_start(ap, fmt);
897 	res = make_dev_credv(0, &dev, devsw, unit, cr, uid, gid, mode, fmt, ap);
898 	va_end(ap);
899 
900 	KASSERT(res == 0 && dev != NULL,
901 	    ("make_dev_cred: failed make_dev_credv (error=%d)", res));
902 	return (dev);
903 }
904 
905 struct cdev *
906 make_dev_credf(int flags, struct cdevsw *devsw, int unit, struct ucred *cr,
907     uid_t uid, gid_t gid, int mode, const char *fmt, ...)
908 {
909 	struct cdev *dev;
910 	va_list ap;
911 	int res;
912 
913 	va_start(ap, fmt);
914 	res = make_dev_credv(flags, &dev, devsw, unit, cr, uid, gid, mode,
915 	    fmt, ap);
916 	va_end(ap);
917 
918 	KASSERT(((flags & MAKEDEV_NOWAIT) != 0 && res == ENOMEM) ||
919 	    ((flags & MAKEDEV_CHECKNAME) != 0 && res != ENOMEM) || res == 0,
920 	    ("make_dev_credf: failed make_dev_credv (error=%d)", res));
921 	return (res == 0 ? dev : NULL);
922 }
923 
924 int
925 make_dev_p(int flags, struct cdev **cdev, struct cdevsw *devsw,
926     struct ucred *cr, uid_t uid, gid_t gid, int mode, const char *fmt, ...)
927 {
928 	va_list ap;
929 	int res;
930 
931 	va_start(ap, fmt);
932 	res = make_dev_credv(flags, cdev, devsw, 0, cr, uid, gid, mode,
933 	    fmt, ap);
934 	va_end(ap);
935 
936 	KASSERT(((flags & MAKEDEV_NOWAIT) != 0 && res == ENOMEM) ||
937 	    ((flags & MAKEDEV_CHECKNAME) != 0 && res != ENOMEM) || res == 0,
938 	    ("make_dev_p: failed make_dev_credv (error=%d)", res));
939 	return (res);
940 }
941 
942 static void
943 dev_dependsl(struct cdev *pdev, struct cdev *cdev)
944 {
945 
946 	cdev->si_parent = pdev;
947 	cdev->si_flags |= SI_CHILD;
948 	LIST_INSERT_HEAD(&pdev->si_children, cdev, si_siblings);
949 }
950 
951 
/*
 * Make 'cdev' a child of 'pdev'.  Takes devmtx around dev_dependsl().
 */
void
dev_depends(struct cdev *pdev, struct cdev *cdev)
{

	dev_lock();
	dev_dependsl(pdev, cdev);
	dev_unlock();
}
960 
961 static int
962 make_dev_alias_v(int flags, struct cdev **cdev, struct cdev *pdev,
963     const char *fmt, va_list ap)
964 {
965 	struct cdev *dev;
966 	int error;
967 
968 	KASSERT(pdev != NULL, ("make_dev_alias_v: pdev is NULL"));
969 	KASSERT((flags & MAKEDEV_WAITOK) == 0 || (flags & MAKEDEV_NOWAIT) == 0,
970 	    ("make_dev_alias_v: both WAITOK and NOWAIT specified"));
971 	KASSERT((flags & ~(MAKEDEV_WAITOK | MAKEDEV_NOWAIT |
972 	    MAKEDEV_CHECKNAME)) == 0,
973 	    ("make_dev_alias_v: invalid flags specified (flags=%02x)", flags));
974 
975 	dev = devfs_alloc(flags);
976 	if (dev == NULL)
977 		return (ENOMEM);
978 	dev_lock();
979 	dev->si_flags |= SI_ALIAS;
980 	error = prep_devname(dev, fmt, ap);
981 	if (error != 0) {
982 		if ((flags & MAKEDEV_CHECKNAME) == 0) {
983 			panic("make_dev_alias_v: bad si_name "
984 			    "(error=%d, si_name=%s)", error, dev->si_name);
985 		}
986 		dev_unlock();
987 		devfs_free(dev);
988 		return (error);
989 	}
990 	dev->si_flags |= SI_NAMED;
991 	devfs_create(dev);
992 	dev_dependsl(pdev, dev);
993 	clean_unrhdrl(devfs_inos);
994 	dev_unlock();
995 
996 	notify_create(dev, flags);
997 	*cdev = dev;
998 
999 	return (0);
1000 }
1001 
1002 struct cdev *
1003 make_dev_alias(struct cdev *pdev, const char *fmt, ...)
1004 {
1005 	struct cdev *dev;
1006 	va_list ap;
1007 	int res __unused;
1008 
1009 	va_start(ap, fmt);
1010 	res = make_dev_alias_v(MAKEDEV_WAITOK, &dev, pdev, fmt, ap);
1011 	va_end(ap);
1012 
1013 	KASSERT(res == 0 && dev != NULL,
1014 	    ("make_dev_alias: failed make_dev_alias_v (error=%d)", res));
1015 	return (dev);
1016 }
1017 
/*
 * Create an alias for 'pdev', returning an errno value and storing the
 * alias through 'cdev'.  Variadic front end to make_dev_alias_v().
 */
int
make_dev_alias_p(int flags, struct cdev **cdev, struct cdev *pdev,
    const char *fmt, ...)
{
	va_list ap;
	int error;

	va_start(ap, fmt);
	error = make_dev_alias_v(flags, cdev, pdev, fmt, ap);
	va_end(ap);

	return (error);
}
1030 
1031 int
1032 make_dev_physpath_alias(int flags, struct cdev **cdev, struct cdev *pdev,
1033     struct cdev *old_alias, const char *physpath)
1034 {
1035 	char *devfspath;
1036 	int physpath_len;
1037 	int max_parentpath_len;
1038 	int parentpath_len;
1039 	int devfspathbuf_len;
1040 	int mflags;
1041 	int ret;
1042 
1043 	*cdev = NULL;
1044 	devfspath = NULL;
1045 	physpath_len = strlen(physpath);
1046 	ret = EINVAL;
1047 	if (physpath_len == 0)
1048 		goto out;
1049 
1050 	if (strncmp("id1,", physpath, 4) == 0) {
1051 		physpath += 4;
1052 		physpath_len -= 4;
1053 		if (physpath_len == 0)
1054 			goto out;
1055 	}
1056 
1057 	max_parentpath_len = SPECNAMELEN - physpath_len - /*/*/1;
1058 	parentpath_len = strlen(pdev->si_name);
1059 	if (max_parentpath_len < parentpath_len) {
1060 		if (bootverbose)
1061 			printf("WARNING: Unable to alias %s "
1062 			    "to %s/%s - path too long\n",
1063 			    pdev->si_name, physpath, pdev->si_name);
1064 		ret = ENAMETOOLONG;
1065 		goto out;
1066 	}
1067 
1068 	mflags = (flags & MAKEDEV_NOWAIT) ? M_NOWAIT : M_WAITOK;
1069 	devfspathbuf_len = physpath_len + /*/*/1 + parentpath_len + /*NUL*/1;
1070 	devfspath = malloc(devfspathbuf_len, M_DEVBUF, mflags);
1071 	if (devfspath == NULL) {
1072 		ret = ENOMEM;
1073 		goto out;
1074 	}
1075 
1076 	sprintf(devfspath, "%s/%s", physpath, pdev->si_name);
1077 	if (old_alias != NULL && strcmp(old_alias->si_name, devfspath) == 0) {
1078 		/* Retain the existing alias. */
1079 		*cdev = old_alias;
1080 		old_alias = NULL;
1081 		ret = 0;
1082 	} else {
1083 		ret = make_dev_alias_p(flags, cdev, pdev, "%s", devfspath);
1084 	}
1085 out:
1086 	if (old_alias != NULL)
1087 		destroy_dev(old_alias);
1088 	if (devfspath != NULL)
1089 		free(devfspath, M_DEVBUF);
1090 	return (ret);
1091 }
1092 
1093 static void
1094 destroy_devl(struct cdev *dev)
1095 {
1096 	struct cdevsw *csw;
1097 	struct cdev_privdata *p;
1098 	struct cdev_priv *cdp;
1099 
1100 	mtx_assert(&devmtx, MA_OWNED);
1101 	KASSERT(dev->si_flags & SI_NAMED,
1102 	    ("WARNING: Driver mistake: destroy_dev on %d\n", dev2unit(dev)));
1103 	KASSERT((dev->si_flags & SI_ETERNAL) == 0,
1104 	    ("WARNING: Driver mistake: destroy_dev on eternal %d\n",
1105 	     dev2unit(dev)));
1106 
1107 	cdp = cdev2priv(dev);
1108 	if ((cdp->cdp_flags & CDP_UNREF_DTR) == 0) {
1109 		/*
1110 		 * Avoid race with dev_rel(), e.g. from the populate
1111 		 * loop.  If CDP_UNREF_DTR flag is set, the reference
1112 		 * to be dropped at the end of destroy_devl() was
1113 		 * already taken by delist_dev_locked().
1114 		 */
1115 		dev_refl(dev);
1116 
1117 		devfs_destroy(dev);
1118 	}
1119 
1120 	/* Remove name marking */
1121 	dev->si_flags &= ~SI_NAMED;
1122 
1123 	/* If we are a child, remove us from the parents list */
1124 	if (dev->si_flags & SI_CHILD) {
1125 		LIST_REMOVE(dev, si_siblings);
1126 		dev->si_flags &= ~SI_CHILD;
1127 	}
1128 
1129 	/* Kill our children */
1130 	while (!LIST_EMPTY(&dev->si_children))
1131 		destroy_devl(LIST_FIRST(&dev->si_children));
1132 
1133 	/* Remove from clone list */
1134 	if (dev->si_flags & SI_CLONELIST) {
1135 		LIST_REMOVE(dev, si_clone);
1136 		dev->si_flags &= ~SI_CLONELIST;
1137 	}
1138 
1139 	csw = dev->si_devsw;
1140 	dev->si_devsw = NULL;	/* already NULL for SI_ALIAS */
1141 	while (csw != NULL && csw->d_purge != NULL && dev->si_threadcount) {
1142 		csw->d_purge(dev);
1143 		msleep(csw, &devmtx, PRIBIO, "devprg", hz/10);
1144 		if (dev->si_threadcount)
1145 			printf("Still %lu threads in %s\n",
1146 			    dev->si_threadcount, devtoname(dev));
1147 	}
1148 	while (dev->si_threadcount != 0) {
1149 		/* Use unique dummy wait ident */
1150 		msleep(&csw, &devmtx, PRIBIO, "devdrn", hz / 10);
1151 	}
1152 
1153 	dev_unlock();
1154 	if ((cdp->cdp_flags & CDP_UNREF_DTR) == 0) {
1155 		/* avoid out of order notify events */
1156 		notify_destroy(dev);
1157 	}
1158 	mtx_lock(&cdevpriv_mtx);
1159 	while ((p = LIST_FIRST(&cdp->cdp_fdpriv)) != NULL) {
1160 		devfs_destroy_cdevpriv(p);
1161 		mtx_lock(&cdevpriv_mtx);
1162 	}
1163 	mtx_unlock(&cdevpriv_mtx);
1164 	dev_lock();
1165 
1166 	dev->si_drv1 = 0;
1167 	dev->si_drv2 = 0;
1168 	bzero(&dev->__si_u, sizeof(dev->__si_u));
1169 
1170 	if (!(dev->si_flags & SI_ALIAS)) {
1171 		/* Remove from cdevsw list */
1172 		LIST_REMOVE(dev, si_list);
1173 
1174 		/* If cdevsw has no more struct cdev *'s, clean it */
1175 		if (LIST_EMPTY(&csw->d_devs)) {
1176 			fini_cdevsw(csw);
1177 			wakeup(&csw->d_devs);
1178 		}
1179 	}
1180 	dev->si_flags &= ~SI_ALIAS;
1181 	cdp->cdp_flags &= ~CDP_UNREF_DTR;
1182 	dev->si_refcount--;
1183 
1184 	if (dev->si_refcount > 0)
1185 		LIST_INSERT_HEAD(&dead_cdevsw.d_devs, dev, si_list);
1186 	else
1187 		dev_free_devlocked(dev);
1188 }
1189 
/*
 * Delist a character device, and recursively its children, with devmtx
 * held.
 *
 * CDP_UNREF_DTR marks a device that has already been through here, so a
 * repeated call returns immediately.  Otherwise the flag is set, a
 * reference is taken with dev_refl(), devfs_destroy() is called for the
 * device, the children are processed the same way and finally a destroy
 * notification is issued.
 *
 * devmtx must be owned on entry and is owned again on return, but it is
 * released around the notify_destroy() call.
 */
static void
delist_dev_locked(struct cdev *dev)
{
	struct cdev_priv *cdp;
	struct cdev *child;

	mtx_assert(&devmtx, MA_OWNED);
	cdp = cdev2priv(dev);
	/* Already delisted earlier; nothing left to do. */
	if ((cdp->cdp_flags & CDP_UNREF_DTR) != 0)
		return;
	cdp->cdp_flags |= CDP_UNREF_DTR;
	/*
	 * With CDP_UNREF_DTR set, destroy_devl() skips its own dev_refl()
	 * and devfs_destroy() calls, so both are done here instead.
	 */
	dev_refl(dev);
	devfs_destroy(dev);
	/*
	 * NOTE(review): each recursive call releases devmtx around its own
	 * notify_destroy(); confirm that si_children cannot change while
	 * this list walk is in progress.
	 */
	LIST_FOREACH(child, &dev->si_children, si_siblings)
		delist_dev_locked(child);
	dev_unlock();
	/* ensure the destroy event is queued in order */
	notify_destroy(dev);
	dev_lock();
}
1210 
/*
 * Delist a character device and its children from the directory listing
 * and create a destroy event, without waiting for all character device
 * references to go away.  destroy_dev() must be called at some later
 * point to complete the destruction of the character device.  Once this
 * function has returned, the character device name can be re-used
 * immediately.
 *
 * This is the unlocked entry point: it acquires devmtx, calls
 * delist_dev_locked() and releases devmtx again.
 */
void
delist_dev(struct cdev *dev)
{

	WITNESS_WARN(WARN_GIANTOK | WARN_SLEEPOK, NULL, "delist_dev");
	dev_lock();
	delist_dev_locked(dev);
	dev_unlock();
}
1228 
/*
 * Destroy a character device.
 *
 * Unlocked entry point: acquires devmtx, runs destroy_devl() on the
 * device and then leaves through dev_unlock_and_free().  destroy_devl()
 * sleeps while threads are still inside the device, so the caller must
 * be in a context where sleeping is permitted.
 */
void
destroy_dev(struct cdev *dev)
{

	WITNESS_WARN(WARN_GIANTOK | WARN_SLEEPOK, NULL, "destroy_dev");
	dev_lock();
	destroy_devl(dev);
	dev_unlock_and_free();
}
1238 
/*
 * Return the name of a character device.
 *
 * The result is dev->si_name itself; no copy is made and no lock is
 * taken here.
 */
const char *
devtoname(struct cdev *dev)
{

	return (dev->si_name);
}
1245 
/*
 * Match "name" against "stem" immediately followed by a decimal unit
 * number.
 *
 * Returns 0, leaving *unit and *namep untouched, when
 *   - name does not begin with stem,
 *   - stem is not directly followed by a digit,
 *   - the number has a superfluous leading zero ("foo01"), or
 *   - the number is larger than 0xffffff.
 *
 * Otherwise the number is stored in *unit and, if namep is not NULL,
 * *namep is pointed at the first character after the number.  The return
 * value is then 1 if the number ends the string and 2 if more characters
 * follow it.
 */
int
dev_stdclone(char *name, char **namep, const char *stem, int *unit)
{
	int u, i;

	i = strlen(stem);
	/*
	 * strncmp() stops at the terminating NUL of name, so a name that is
	 * shorter than stem is never read past its end.
	 */
	if (strncmp(stem, name, i) != 0)
		return (0);
	if (!isdigit(name[i]))
		return (0);
	if (name[i] == '0' && isdigit(name[i+1]))
		return (0);
	u = 0;
	while (isdigit(name[i])) {
		u *= 10;
		u += name[i++] - '0';
		/*
		 * Check the limit after every digit.  u never exceeds
		 * 0xffffff on entry to an iteration, so the multiply and
		 * add above cannot overflow an int, however many digits
		 * the caller supplies.
		 */
		if (u > 0xffffff)
			return (0);
	}
	*unit = u;
	if (namep)
		*namep = &name[i];
	if (name[i])
		return (2);
	return (1);
}
1272 
1273 /*
1274  * Helper functions for cloning device drivers.
1275  *
1276  * The objective here is to make it unnecessary for the device drivers to
1277  * use rman or similar to manage their unit number space.  Due to the way
1278  * we do "on-demand" devices, using rman or other "private" methods
1279  * will be very tricky to lock down properly once we lock down this file.
1280  *
 * Instead we give the drivers these routines, which put the struct cdev *'s
 * that are to be managed on their own list and give the driver the ability
 * to ask for the first free unit number or a given specified unit number.
1284  *
1285  * In addition these routines support paired devices (pty, nmdm and similar)
1286  * by respecting a number of "flag" bits in the minor number.
1287  *
1288  */
1289 
/*
 * Per-driver clone list: the head of a list of struct cdev's that are
 * linked together through their si_clone entries.
 */
struct clonedevs {
	LIST_HEAD(,cdev)	head;	/* devices managed by the clone routines */
};
1293 
1294 void
1295 clone_setup(struct clonedevs **cdp)
1296 {
1297 
1298 	*cdp = malloc(sizeof **cdp, M_DEVBUF, M_WAITOK | M_ZERO);
1299 	LIST_INIT(&(*cdp)->head);
1300 }
1301 
/*
 * Find the clone device for a unit number on the list *cdp, or create a
 * new one and insert it into the list.
 *
 *   cdp    clone list; must already have been set up (asserted).
 *   csw    cdevsw for the new device; must have D_NEEDMINOR set.
 *   up     in:  the requested unit, or -1 to use the lowest free unit.
 *          out: the unit that was used, written only when a new device
 *               is created.
 *   dp     out: the already existing device, written only when one
 *               matches.  Not written when a new device is created.
 *   extra  bits OR'ed into the unit number; must not overlap
 *          CLONE_UNITMASK.
 *
 * Returns 0 if a matching device already existed and 1 if a new device
 * was created.
 */
int
clone_create(struct clonedevs **cdp, struct cdevsw *csw, int *up,
    struct cdev **dp, int extra)
{
	struct clonedevs *cd;
	struct cdev *dev, *ndev, *dl, *de;
	struct make_dev_args args;
	int unit, low, u;

	KASSERT(*cdp != NULL,
	    ("clone_setup() not called in driver \"%s\"", csw->d_name));
	KASSERT(!(extra & CLONE_UNITMASK),
	    ("Illegal extra bits (0x%x) in clone_create", extra));
	KASSERT(*up <= CLONE_UNITMASK,
	    ("Too high unit (0x%x) in clone_create", *up));
	KASSERT(csw->d_flags & D_NEEDMINOR,
	    ("clone_create() on cdevsw without minor numbers"));


	/*
	 * Search the list for several things in one pass:
	 *   A preexisting match, which is returned immediately.
	 *   The lowest free unit number if we were passed -1, and the
	 *   place in the list where that new element should be inserted.
	 *   The place to insert a specified unit number, which may be the
	 *   end of the list.
	 *
	 * The search stops at the first entry with a larger unit number,
	 * so it relies on the list being ordered by unit number; the
	 * insertion further down preserves that order.
	 */
	unit = *up;
	/*
	 * The candidate cdev is allocated before devmtx is taken,
	 * presumably because a MAKEDEV_WAITOK allocation may sleep.
	 */
	ndev = devfs_alloc(MAKEDEV_WAITOK);
	dev_lock();
	prep_cdevsw(csw, MAKEDEV_WAITOK);
	low = extra;		/* lowest candidate not yet seen in use */
	de = dl = NULL;		/* de: insert after, dl: insert before */
	cd = *cdp;
	LIST_FOREACH(dev, &cd->head, si_clone) {
		KASSERT(dev->si_flags & SI_CLONELIST,
		    ("Dev %p(%s) should be on clonelist", dev, dev->si_name));
		u = dev2unit(dev);
		if (u == (unit | extra)) {
			/* Existing device: hand it back, drop the spare. */
			*dp = dev;
			dev_unlock();
			devfs_free(ndev);
			return (0);
		}
		if (unit == -1 && u == low) {
			/* Candidate is taken; try the next number. */
			low++;
			de = dev;
			continue;
		} else if (u < (unit | extra)) {
			de = dev;
			continue;
		} else if (u > (unit | extra)) {
			/*
			 * First entry past the insertion point.  With
			 * unit == -1, (unit | extra) is -1, so any entry
			 * with a non-negative unit other than "low" ends
			 * the search here.
			 */
			dl = dev;
			break;
		}
	}
	if (unit == -1)
		unit = low & CLONE_UNITMASK;
	make_dev_args_init(&args);
	args.mda_unit = unit | extra;
	args.mda_devsw = csw;
	dev = newdev(&args, ndev);
	/*
	 * Diagnostic dump of the list before panicking; this tests the
	 * same condition as the KASSERT that follows, but is compiled in
	 * regardless of whether assertions are enabled.
	 */
	if (dev->si_flags & SI_CLONELIST) {
		printf("dev %p (%s) is on clonelist\n", dev, dev->si_name);
		printf("unit=%d, low=%d, extra=0x%x\n", unit, low, extra);
		LIST_FOREACH(dev, &cd->head, si_clone) {
			printf("\t%p %s\n", dev, dev->si_name);
		}
		panic("foo");
	}
	KASSERT(!(dev->si_flags & SI_CLONELIST),
	    ("Dev %p(%s) should not be on clonelist", dev, dev->si_name));
	/* Link the new device in at the position found by the search. */
	if (dl != NULL)
		LIST_INSERT_BEFORE(dl, dev, si_clone);
	else if (de != NULL)
		LIST_INSERT_AFTER(de, dev, si_clone);
	else
		LIST_INSERT_HEAD(&cd->head, dev, si_clone);
	dev->si_flags |= SI_CLONELIST;
	*up = unit;
	dev_unlock_and_free();
	return (1);
}
1385 
1386 /*
1387  * Kill everything still on the list.  The driver should already have
1388  * disposed of any softc hung of the struct cdev *'s at this time.
1389  */
1390 void
1391 clone_cleanup(struct clonedevs **cdp)
1392 {
1393 	struct cdev *dev;
1394 	struct cdev_priv *cp;
1395 	struct clonedevs *cd;
1396 
1397 	cd = *cdp;
1398 	if (cd == NULL)
1399 		return;
1400 	dev_lock();
1401 	while (!LIST_EMPTY(&cd->head)) {
1402 		dev = LIST_FIRST(&cd->head);
1403 		LIST_REMOVE(dev, si_clone);
1404 		KASSERT(dev->si_flags & SI_CLONELIST,
1405 		    ("Dev %p(%s) should be on clonelist", dev, dev->si_name));
1406 		dev->si_flags &= ~SI_CLONELIST;
1407 		cp = cdev2priv(dev);
1408 		if (!(cp->cdp_flags & CDP_SCHED_DTR)) {
1409 			cp->cdp_flags |= CDP_SCHED_DTR;
1410 			KASSERT(dev->si_flags & SI_NAMED,
1411 				("Driver has goofed in cloning underways udev %jx unit %x",
1412 				(uintmax_t)dev2udev(dev), dev2unit(dev)));
1413 			destroy_devl(dev);
1414 		}
1415 	}
1416 	dev_unlock_and_free();
1417 	free(cd, M_DEVBUF);
1418 	*cdp = NULL;
1419 }
1420 
/*
 * Queue of devices waiting for deferred destruction.  Entries are added
 * by destroy_dev_sched_cbl() and consumed by destroy_dev_tq(); the queue
 * is manipulated with devmtx held.
 */
static TAILQ_HEAD(, cdev_priv) dev_ddtr =
	TAILQ_HEAD_INITIALIZER(dev_ddtr);
/* Task that runs destroy_dev_tq() to drain the queue above. */
static struct task dev_dtr_task = TASK_INITIALIZER(0, destroy_dev_tq, NULL);
1424 
1425 static void
1426 destroy_dev_tq(void *ctx, int pending)
1427 {
1428 	struct cdev_priv *cp;
1429 	struct cdev *dev;
1430 	void (*cb)(void *);
1431 	void *cb_arg;
1432 
1433 	dev_lock();
1434 	while (!TAILQ_EMPTY(&dev_ddtr)) {
1435 		cp = TAILQ_FIRST(&dev_ddtr);
1436 		dev = &cp->cdp_c;
1437 		KASSERT(cp->cdp_flags & CDP_SCHED_DTR,
1438 		    ("cdev %p in dev_destroy_tq without CDP_SCHED_DTR", cp));
1439 		TAILQ_REMOVE(&dev_ddtr, cp, cdp_dtr_list);
1440 		cb = cp->cdp_dtr_cb;
1441 		cb_arg = cp->cdp_dtr_cb_arg;
1442 		destroy_devl(dev);
1443 		dev_unlock_and_free();
1444 		dev_rel(dev);
1445 		if (cb != NULL)
1446 			cb(cb_arg);
1447 		dev_lock();
1448 	}
1449 	dev_unlock();
1450 }
1451 
1452 /*
1453  * devmtx shall be locked on entry. devmtx will be unlocked after
1454  * function return.
1455  */
1456 static int
1457 destroy_dev_sched_cbl(struct cdev *dev, void (*cb)(void *), void *arg)
1458 {
1459 	struct cdev_priv *cp;
1460 
1461 	mtx_assert(&devmtx, MA_OWNED);
1462 	cp = cdev2priv(dev);
1463 	if (cp->cdp_flags & CDP_SCHED_DTR) {
1464 		dev_unlock();
1465 		return (0);
1466 	}
1467 	dev_refl(dev);
1468 	cp->cdp_flags |= CDP_SCHED_DTR;
1469 	cp->cdp_dtr_cb = cb;
1470 	cp->cdp_dtr_cb_arg = arg;
1471 	TAILQ_INSERT_TAIL(&dev_ddtr, cp, cdp_dtr_list);
1472 	dev_unlock();
1473 	taskqueue_enqueue(taskqueue_swi_giant, &dev_dtr_task);
1474 	return (1);
1475 }
1476 
/*
 * Schedule the deferred destruction of a device and have cb(arg) called
 * once the destruction has been carried out.  Returns 1 if the
 * destruction was scheduled by this call and 0 if it was already
 * scheduled.
 */
int
destroy_dev_sched_cb(struct cdev *dev, void (*cb)(void *), void *arg)
{
	int scheduled;

	dev_lock();
	/* destroy_dev_sched_cbl() releases devmtx before it returns. */
	scheduled = destroy_dev_sched_cbl(dev, cb, arg);
	return (scheduled);
}
1484 
1485 int
1486 destroy_dev_sched(struct cdev *dev)
1487 {
1488 
1489 	return (destroy_dev_sched_cb(dev, NULL, NULL));
1490 }
1491 
1492 void
1493 destroy_dev_drain(struct cdevsw *csw)
1494 {
1495 
1496 	dev_lock();
1497 	while (!LIST_EMPTY(&csw->d_devs)) {
1498 		msleep(&csw->d_devs, &devmtx, PRIBIO, "devscd", hz/10);
1499 	}
1500 	dev_unlock();
1501 }
1502 
/*
 * Acquire clone_drain_lock exclusively and release it again right away.
 *
 * Nothing is done while the lock is held; the call merely does not
 * return until the exclusive lock could be obtained.
 * NOTE(review): presumably clone event handlers run under this lock, so
 * returning means that those in progress have finished -- confirm against
 * the users of clone_drain_lock.
 */
void
drain_dev_clone_events(void)
{

	sx_xlock(&clone_drain_lock);
	sx_xunlock(&clone_drain_lock);
}
1510 
1511 #include "opt_ddb.h"
1512 #ifdef DDB
1513 #include <sys/kernel.h>
1514 
1515 #include <ddb/ddb.h>
1516 
1517 DB_SHOW_COMMAND(cdev, db_show_cdev)
1518 {
1519 	struct cdev_priv *cdp;
1520 	struct cdev *dev;
1521 	u_int flags;
1522 	char buf[512];
1523 
1524 	if (!have_addr) {
1525 		TAILQ_FOREACH(cdp, &cdevp_list, cdp_list) {
1526 			dev = &cdp->cdp_c;
1527 			db_printf("%s %p\n", dev->si_name, dev);
1528 			if (db_pager_quit)
1529 				break;
1530 		}
1531 		return;
1532 	}
1533 
1534 	dev = (struct cdev *)addr;
1535 	cdp = cdev2priv(dev);
1536 	db_printf("dev %s ref %d use %ld thr %ld inuse %u fdpriv %p\n",
1537 	    dev->si_name, dev->si_refcount, dev->si_usecount,
1538 	    dev->si_threadcount, cdp->cdp_inuse, cdp->cdp_fdpriv.lh_first);
1539 	db_printf("devsw %p si_drv0 %d si_drv1 %p si_drv2 %p\n",
1540 	    dev->si_devsw, dev->si_drv0, dev->si_drv1, dev->si_drv2);
1541 	flags = dev->si_flags;
1542 #define	SI_FLAG(flag)	do {						\
1543 	if (flags & (flag)) {						\
1544 		if (buf[0] != '\0')					\
1545 			strlcat(buf, ", ", sizeof(buf));		\
1546 		strlcat(buf, (#flag) + 3, sizeof(buf));			\
1547 		flags &= ~(flag);					\
1548 	}								\
1549 } while (0)
1550 	buf[0] = '\0';
1551 	SI_FLAG(SI_ETERNAL);
1552 	SI_FLAG(SI_ALIAS);
1553 	SI_FLAG(SI_NAMED);
1554 	SI_FLAG(SI_CHILD);
1555 	SI_FLAG(SI_DUMPDEV);
1556 	SI_FLAG(SI_CLONELIST);
1557 	db_printf("si_flags %s\n", buf);
1558 
1559 	flags = cdp->cdp_flags;
1560 #define	CDP_FLAG(flag)	do {						\
1561 	if (flags & (flag)) {						\
1562 		if (buf[0] != '\0')					\
1563 			strlcat(buf, ", ", sizeof(buf));		\
1564 		strlcat(buf, (#flag) + 4, sizeof(buf));			\
1565 		flags &= ~(flag);					\
1566 	}								\
1567 } while (0)
1568 	buf[0] = '\0';
1569 	CDP_FLAG(CDP_ACTIVE);
1570 	CDP_FLAG(CDP_SCHED_DTR);
1571 	db_printf("cdp_flags %s\n", buf);
1572 }
1573 #endif
1574