xref: /freebsd/sys/geom/geom_dev.c (revision 69c9999d0ca45b210e75706ab4952ad5a33ce6ec)
1 /*-
2  * Copyright (c) 2002 Poul-Henning Kamp
3  * Copyright (c) 2002 Networks Associates Technology, Inc.
4  * All rights reserved.
5  *
6  * This software was developed for the FreeBSD Project by Poul-Henning Kamp
7  * and NAI Labs, the Security Research Division of Network Associates, Inc.
8  * under DARPA/SPAWAR contract N66001-01-C-8035 ("CBOSS"), as part of the
9  * DARPA CHATS research program.
10  *
11  * Redistribution and use in source and binary forms, with or without
12  * modification, are permitted provided that the following conditions
13  * are met:
14  * 1. Redistributions of source code must retain the above copyright
15  *    notice, this list of conditions and the following disclaimer.
16  * 2. Redistributions in binary form must reproduce the above copyright
17  *    notice, this list of conditions and the following disclaimer in the
18  *    documentation and/or other materials provided with the distribution.
19  * 3. The names of the authors may not be used to endorse or promote
20  *    products derived from this software without specific prior written
21  *    permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
24  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
27  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33  * SUCH DAMAGE.
34  *
35  * $FreeBSD$
36  */
37 
38 #include <sys/param.h>
39 #include <sys/stdint.h>
40 #include <sys/systm.h>
41 #include <sys/malloc.h>
42 #include <sys/kernel.h>
43 #include <sys/conf.h>
44 #include <sys/bio.h>
45 #include <sys/lock.h>
46 #include <sys/mutex.h>
47 #include <sys/errno.h>
48 #include <sys/time.h>
49 #include <sys/disk.h>
50 #include <sys/fcntl.h>
51 #include <geom/geom.h>
52 #include <geom/geom_int.h>
53 #include <machine/limits.h>
54 
/* Character-device major number placed in the "maj" slot of g_dev_cdevsw. */
#define CDEV_MAJOR	4
56 
/*
 * Forward declarations of the device entry points implemented in this
 * file; they are installed in g_dev_cdevsw.
 */
static d_open_t		g_dev_open;
static d_close_t	g_dev_close;
static d_strategy_t	g_dev_strategy;
static d_ioctl_t	g_dev_ioctl;
static d_psize_t	g_dev_psize;
62 
/*
 * Device switch handed to make_dev() in g_dev_taste().  open, close,
 * ioctl, strategy and psize are implemented in this file; read and write
 * use physread/physwrite; the poll, mmap, dump and kqfilter slots are set
 * to nopoll, nommap, nodump and nokqfilter.
 */
static struct cdevsw g_dev_cdevsw = {
	/* open */      g_dev_open,
	/* close */     g_dev_close,
	/* read */      physread,
	/* write */     physwrite,
	/* ioctl */     g_dev_ioctl,
	/* poll */      nopoll,
	/* mmap */      nommap,
	/* strategy */  g_dev_strategy,
	/* name */      "g_dev",
	/* maj */       CDEV_MAJOR,
	/* dump */      nodump,
	/* psize */     g_dev_psize,
	/* flags */     D_DISK | D_CANFREE | D_TRACKCLOSE,
	/* kqfilter */	nokqfilter
};
79 
/*
 * Forward declarations of the GEOM methods implemented in this file:
 * g_dev_taste goes into g_dev_class, g_dev_orphan is installed on each
 * geom created by g_dev_taste().
 */
static g_taste_t g_dev_taste;
static g_orphan_t g_dev_orphan;
82 
/*
 * Class descriptor for the "DEV" class, with g_dev_taste as its taste
 * method.
 * NOTE(review): the meaning of the NULL slot depends on the layout of
 * struct g_class, which is declared elsewhere -- confirm before changing.
 */
static struct g_class g_dev_class	= {
	"DEV",
	g_dev_taste,
	NULL,
	G_CLASS_INITIALIZER
};
89 
90 int
91 g_dev_print(void)
92 {
93 	struct g_geom *gp;
94 
95 	if (LIST_EMPTY(&g_dev_class.geom))
96 		return (0);
97 	printf("List of GEOM disk devices:\n  ");
98 	LIST_FOREACH(gp, &g_dev_class.geom, geom)
99 		printf(" %s", gp->name);
100 	printf("\n");
101 	return (1);
102 }
103 
104 /*
105  * XXX: This is disgusting and wrong in every way imaginable:  The only reason
106  * XXX: we have a clone function is because of the root-mount hack we currently
107  * XXX: employ.  An improvment would be to unregister this cloner once we know
108  * XXX: we no longer need it.  Ideally, root-fs would be mounted through DEVFS
109  * XXX: eliminating the need for this hack.
110  */
111 static void
112 g_dev_clone(void *arg __unused, char *name, int namelen __unused, dev_t *dev)
113 {
114 	struct g_geom *gp;
115 
116 	if (*dev != NODEV)
117 		return;
118 
119 	g_waitidle();
120 
121 	/* g_topology_lock(); */
122 	LIST_FOREACH(gp, &g_dev_class.geom, geom) {
123 		if (strcmp(gp->name, name))
124 			continue;
125 		*dev = gp->softc;
126 		g_trace(G_T_TOPOLOGY, "g_dev_clone(%s) = %p", name, *dev);
127 		return;
128 	}
129 	/* g_topology_unlock(); */
130 	return;
131 }
132 
133 static void
134 g_dev_register_cloner(void *foo __unused)
135 {
136 	static int once;
137 
138 	/* XXX: why would this happen more than once ?? */
139 	if (!once) {
140 		EVENTHANDLER_REGISTER(dev_clone, g_dev_clone, 0, 1000);
141 		once++;
142 	}
143 }
144 
/*
 * Have g_dev_register_cloner(NULL) invoked through SYSINIT at
 * SI_SUB_DRIVERS / SI_ORDER_MIDDLE.
 */
SYSINIT(geomdev,SI_SUB_DRIVERS,SI_ORDER_MIDDLE,g_dev_register_cloner,NULL);
146 
147 static struct g_geom *
148 g_dev_taste(struct g_class *mp, struct g_provider *pp, int insist __unused)
149 {
150 	struct g_geom *gp;
151 	struct g_consumer *cp;
152 	static int unit;
153 	int error;
154 	dev_t dev;
155 
156 	g_trace(G_T_TOPOLOGY, "dev_taste(%s,%s)", mp->name, pp->name);
157 	g_topology_assert();
158 	LIST_FOREACH(cp, &pp->consumers, consumers)
159 		if (cp->geom->class == mp)
160 			return (NULL);
161 	gp = g_new_geomf(mp, pp->name);
162 	gp->orphan = g_dev_orphan;
163 	cp = g_new_consumer(gp);
164 	error = g_attach(cp, pp);
165 	KASSERT(error == 0,
166 	    ("g_dev_taste(%s) failed to g_attach, err=%d", pp->name, error));
167 	/*
168 	 * XXX: I'm not 100% sure we can call make_dev(9) without Giant
169 	 * yet.  Once we can, we don't need to drop topology here either.
170 	 */
171 	g_topology_unlock();
172 	mtx_lock(&Giant);
173 	dev = make_dev(&g_dev_cdevsw, unit2minor(unit++),
174 	    UID_ROOT, GID_OPERATOR, 0640, gp->name);
175 	mtx_unlock(&Giant);
176 	g_topology_lock();
177 
178 	gp->softc = dev;
179 	dev->si_drv1 = gp;
180 	dev->si_drv2 = cp;
181 	return (gp);
182 }
183 
184 static int
185 g_dev_open(dev_t dev, int flags, int fmt, struct thread *td)
186 {
187 	struct g_geom *gp;
188 	struct g_consumer *cp;
189 	int error, r, w, e;
190 
191 	gp = dev->si_drv1;
192 	cp = dev->si_drv2;
193 	if (gp == NULL || cp == NULL)
194 		return(ENXIO);
195 	g_trace(G_T_ACCESS, "g_dev_open(%s, %d, %d, %p)",
196 	    gp->name, flags, fmt, td);
197 	DROP_GIANT();
198 	g_topology_lock();
199 	g_silence();
200 	r = flags & FREAD ? 1 : 0;
201 	w = flags & FWRITE ? 1 : 0;
202 #ifdef notyet
203 	e = flags & O_EXCL ? 1 : 0;
204 #else
205 	e = 0;
206 #endif
207 	error = g_access_rel(cp, r, w, e);
208 	g_topology_unlock();
209 	PICKUP_GIANT();
210 	g_waitidle();
211 	dev->si_bsize_phys = cp->provider->sectorsize;
212 	return(error);
213 }
214 
215 static int
216 g_dev_close(dev_t dev, int flags, int fmt, struct thread *td)
217 {
218 	struct g_geom *gp;
219 	struct g_consumer *cp;
220 	int error, r, w, e;
221 
222 	gp = dev->si_drv1;
223 	cp = dev->si_drv2;
224 	if (gp == NULL || cp == NULL)
225 		return(ENXIO);
226 	g_trace(G_T_ACCESS, "g_dev_close(%s, %d, %d, %p)",
227 	    gp->name, flags, fmt, td);
228 	DROP_GIANT();
229 	g_topology_lock();
230 	g_silence();
231 	r = flags & FREAD ? -1 : 0;
232 	w = flags & FWRITE ? -1 : 0;
233 #ifdef notyet
234 	e = flags & O_EXCL ? -1 : 0;
235 #else
236 	e = 0;
237 #endif
238 	error = g_access_rel(cp, r, w, e);
239 	g_topology_unlock();
240 	PICKUP_GIANT();
241 	g_waitidle();
242 	return (error);
243 }
244 
245 static int
246 g_dev_ioctl(dev_t dev, u_long cmd, caddr_t data, int fflag, struct thread *td)
247 {
248 	struct g_geom *gp, *gp2;
249 	struct g_consumer *cp;
250 	struct g_provider *pp2;
251 	struct g_kerneldump kd;
252 	int i, error;
253 	u_int u;
254 	struct g_ioctl *gio;
255 
256 	gp = dev->si_drv1;
257 	cp = dev->si_drv2;
258 	pp2 = cp->provider;
259 	gp2 = pp2->geom;
260 	gio = NULL;
261 
262 	error = 0;
263 	DROP_GIANT();
264 
265 	i = IOCPARM_LEN(cmd);
266 	switch (cmd) {
267 	case DIOCGSECTORSIZE:
268 		*(u_int *)data = cp->provider->sectorsize;
269 		if (*(u_int *)data == 0)
270 			error = ENOENT;
271 		break;
272 	case DIOCGMEDIASIZE:
273 		*(off_t *)data = cp->provider->mediasize;
274 		if (*(off_t *)data == 0)
275 			error = ENOENT;
276 		break;
277 	case DIOCGFWSECTORS:
278 		error = g_io_getattr("GEOM::fwsectors", cp, &i, data);
279 		if (error == 0 && *(u_int *)data == 0)
280 			error = ENOENT;
281 		break;
282 	case DIOCGFWHEADS:
283 		error = g_io_getattr("GEOM::fwheads", cp, &i, data);
284 		if (error == 0 && *(u_int *)data == 0)
285 			error = ENOENT;
286 		break;
287 	case DIOCGFRONTSTUFF:
288 		error = g_io_getattr("GEOM::frontstuff", cp, &i, data);
289 		break;
290 	case DIOCSKERNELDUMP:
291 		u = *((u_int *)data);
292 		if (!u) {
293 			set_dumper(NULL);
294 			error = 0;
295 			break;
296 		}
297 		kd.offset = 0;
298 		kd.length = OFF_MAX;
299 		i = sizeof kd;
300 		error = g_io_getattr("GEOM::kerneldump", cp, &i, &kd);
301 		if (!error)
302 			dev->si_flags |= SI_DUMPDEV;
303 		break;
304 
305 	default:
306 		gio = g_malloc(sizeof *gio, M_WAITOK | M_ZERO);
307 		gio->cmd = cmd;
308 		gio->data = data;
309 		gio->fflag = fflag;
310 		gio->td = td;
311 		i = sizeof *gio;
312 		if (cmd & IOC_IN)
313 			error = g_io_setattr("GEOM::ioctl", cp, i, gio);
314 		else
315 			error = g_io_getattr("GEOM::ioctl", cp, &i, gio);
316 		break;
317 	}
318 
319 	PICKUP_GIANT();
320 	if (error == EDIRIOCTL) {
321 		KASSERT(gio != NULL, ("NULL gio but EDIRIOCTL"));
322 		KASSERT(gio->func != NULL, ("NULL function but EDIRIOCTL"));
323 		error = (gio->func)(gio->dev, cmd, data, fflag, td);
324 	}
325 	if (gio != NULL)
326 		g_free(gio);
327 	g_waitidle();
328 	if (error == ENOIOCTL) {
329 		if (g_debugflags & G_T_TOPOLOGY) {
330 			i = IOCGROUP(cmd);
331 			printf("IOCTL(0x%lx) \"%s\"", cmd, gp->name);
332 			if (i > ' ' && i <= '~')
333 				printf(" '%c'", (int)IOCGROUP(cmd));
334 			else
335 				printf(" 0x%lx", IOCGROUP(cmd));
336 			printf("/%ld ", cmd & 0xff);
337 			if (cmd & IOC_IN)
338 				printf("I");
339 			if (cmd & IOC_OUT)
340 				printf("O");
341 			printf("(%ld) = ENOIOCTL\n", IOCPARM_LEN(cmd));
342 		}
343 		error = ENOTTY;
344 	}
345 	return (error);
346 }
347 
348 static int
349 g_dev_psize(dev_t dev)
350 {
351 	struct g_consumer *cp;
352 	off_t mediasize;
353 
354 	cp = dev->si_drv2;
355 
356 	mediasize = cp->provider->mediasize;
357 	return (mediasize >> DEV_BSHIFT);
358 }
359 
360 static void
361 g_dev_done(struct bio *bp2)
362 {
363 	struct bio *bp;
364 
365 	bp = bp2->bio_linkage;
366 	bp->bio_error = bp2->bio_error;
367 	if (bp->bio_error != 0) {
368 		g_trace(G_T_BIO, "g_dev_done(%p) had error %d",
369 		    bp2, bp->bio_error);
370 		bp->bio_flags |= BIO_ERROR;
371 	} else {
372 		g_trace(G_T_BIO, "g_dev_done(%p/%p) resid %ld completed %jd",
373 		    bp2, bp, bp->bio_resid, (intmax_t)bp2->bio_completed);
374 	}
375 	bp->bio_resid = bp->bio_bcount - bp2->bio_completed;
376 	g_destroy_bio(bp2);
377 	mtx_lock(&Giant);
378 	biodone(bp);
379 	mtx_unlock(&Giant);
380 }
381 
382 static void
383 g_dev_strategy(struct bio *bp)
384 {
385 	struct g_geom *gp;
386 	struct g_consumer *cp;
387 	struct bio *bp2;
388 	dev_t dev;
389 
390 	KASSERT(bp->bio_cmd == BIO_READ ||
391 	        bp->bio_cmd == BIO_WRITE ||
392 	        bp->bio_cmd == BIO_DELETE,
393 		("Wrong bio_cmd bio=%p cmd=%d", bp, bp->bio_cmd));
394 	dev = bp->bio_dev;
395 	gp = dev->si_drv1;
396 	cp = dev->si_drv2;
397 	bp2 = g_clone_bio(bp);
398 	KASSERT(bp2 != NULL, ("XXX: ENOMEM in a bad place"));
399 	bp2->bio_offset = (off_t)bp->bio_blkno << DEV_BSHIFT;
400 	KASSERT(bp2->bio_offset >= 0,
401 	    ("Negative bio_offset (%jd) on bio %p",
402 	    (intmax_t)bp2->bio_offset, bp));
403 	bp2->bio_length = (off_t)bp->bio_bcount;
404 	bp2->bio_done = g_dev_done;
405 	g_trace(G_T_BIO,
406 	    "g_dev_strategy(%p/%p) offset %jd length %jd data %p cmd %d",
407 	    bp, bp2, (intmax_t)bp->bio_offset, (intmax_t)bp2->bio_length,
408 	    bp2->bio_data, bp2->bio_cmd);
409 	g_io_request(bp2, cp);
410 }
411 
412 /*
413  * g_dev_orphan()
414  *
415  * Called from below when the provider orphaned us.  It is our responsibility
416  * to get the access counts back to zero, until we do so the stack below will
417  * not unravel.  We must clear the kernel-dump settings, if this is the
418  * current dumpdev.  We call destroy_dev(9) to send our dev_t the way of
419  * punched cards and if we have non-zero access counts, we call down with
420  * them negated before we detattch and selfdestruct.
421  */
422 
423 static void
424 g_dev_orphan(struct g_consumer *cp)
425 {
426 	struct g_geom *gp;
427 	dev_t dev;
428 
429 	gp = cp->geom;
430 	g_trace(G_T_TOPOLOGY, "g_dev_orphan(%p(%s))", cp, gp->name);
431 	g_topology_assert();
432 	if (cp->biocount > 0)
433 		return;
434 	dev = gp->softc;
435 	if (dev->si_flags & SI_DUMPDEV)
436 		set_dumper(NULL);
437 	/* XXX: we may need Giant for now */
438 	destroy_dev(dev);
439 	if (cp->acr > 0 || cp->acw > 0 || cp->ace > 0)
440 		g_access_rel(cp, -cp->acr, -cp->acw, -cp->ace);
441 	g_detach(cp);
442 	g_destroy_consumer(cp);
443 	g_destroy_geom(gp);
444 }
445 
/*
 * Hand g_dev_class to the DECLARE_GEOM_CLASS machinery under the name
 * g_dev.
 * NOTE(review): presumably this is what makes GEOM call g_dev_taste() --
 * confirm against the macro definition in geom.h.
 */
DECLARE_GEOM_CLASS(g_dev_class, g_dev);
447