xref: /freebsd/sys/geom/vinum/geom_vinum.c (revision 7d99ab9fd0cc2c1ce2ecef0ed6d0672c2a50b0cb)
1 /*-
2  *  Copyright (c) 2004, 2007 Lukas Ertl
3  *  Copyright (c) 2007, 2009 Ulf Lilleengen
4  *  All rights reserved.
5  *
6  * Redistribution and use in source and binary forms, with or without
7  * modification, are permitted provided that the following conditions
8  * are met:
9  * 1. Redistributions of source code must retain the above copyright
10  *    notice, this list of conditions and the following disclaimer.
11  * 2. Redistributions in binary form must reproduce the above copyright
12  *    notice, this list of conditions and the following disclaimer in the
13  *    documentation and/or other materials provided with the distribution.
14  *
15  * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS ``AS IS'' AND
16  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18  * ARE DISCLAIMED.  IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
19  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
21  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25  * SUCH DAMAGE.
26  *
27  */
28 
29 #include <sys/cdefs.h>
30 __FBSDID("$FreeBSD$");
31 
32 #include <sys/param.h>
33 #include <sys/bio.h>
34 #include <sys/kernel.h>
35 #include <sys/kthread.h>
36 #include <sys/lock.h>
37 #include <sys/malloc.h>
38 #include <sys/module.h>
39 #include <sys/mutex.h>
40 #include <sys/sbuf.h>
41 #include <sys/sysctl.h>
42 #include <sys/systm.h>
43 
44 #include <geom/geom.h>
45 #include <geom/vinum/geom_vinum_var.h>
46 #include <geom/vinum/geom_vinum.h>
47 #include <geom/vinum/geom_vinum_raid5.h>
48 
/* Make the kern.geom sysctl node visible so a child can be hung off it. */
SYSCTL_DECL(_kern_geom);
/* kern.geom.vinum: container node for the GEOM_VINUM sysctls below. */
static SYSCTL_NODE(_kern_geom, OID_AUTO, vinum, CTLFLAG_RW, 0,
    "GEOM_VINUM stuff");
/*
 * Debug level.  Initialised to 0 and exported both as the
 * kern.geom.vinum.debug tunable and as a read-write sysctl.
 */
u_int g_vinum_debug = 0;
TUNABLE_INT("kern.geom.vinum.debug", &g_vinum_debug);
SYSCTL_UINT(_kern_geom_vinum, OID_AUTO, debug, CTLFLAG_RW, &g_vinum_debug, 0,
    "Debug level");

/* Forward declarations of the control-request handlers defined below. */
static int	gv_create(struct g_geom *, struct gctl_req *);
static void	gv_attach(struct gv_softc *, struct gctl_req *);
static void	gv_detach(struct gv_softc *, struct gctl_req *);
static void	gv_parityop(struct gv_softc *, struct gctl_req *);
61 
62 
63 static void
64 gv_orphan(struct g_consumer *cp)
65 {
66 	struct g_geom *gp;
67 	struct gv_softc *sc;
68 	struct gv_drive *d;
69 
70 	g_topology_assert();
71 
72 	KASSERT(cp != NULL, ("gv_orphan: null cp"));
73 	gp = cp->geom;
74 	KASSERT(gp != NULL, ("gv_orphan: null gp"));
75 	sc = gp->softc;
76 	KASSERT(sc != NULL, ("gv_orphan: null sc"));
77 	d = cp->private;
78 	KASSERT(d != NULL, ("gv_orphan: null d"));
79 
80 	g_trace(G_T_TOPOLOGY, "gv_orphan(%s)", gp->name);
81 
82 	gv_post_event(sc, GV_EVENT_DRIVE_LOST, d, NULL, 0, 0);
83 }
84 
85 void
86 gv_start(struct bio *bp)
87 {
88 	struct g_geom *gp;
89 	struct gv_softc *sc;
90 
91 	gp = bp->bio_to->geom;
92 	sc = gp->softc;
93 
94 	switch (bp->bio_cmd) {
95 	case BIO_READ:
96 	case BIO_WRITE:
97 	case BIO_DELETE:
98 		break;
99 	case BIO_GETATTR:
100 	default:
101 		g_io_deliver(bp, EOPNOTSUPP);
102 		return;
103 	}
104 	mtx_lock(&sc->bqueue_mtx);
105 	bioq_disksort(sc->bqueue_down, bp);
106 	wakeup(sc);
107 	mtx_unlock(&sc->bqueue_mtx);
108 }
109 
110 void
111 gv_done(struct bio *bp)
112 {
113 	struct g_geom *gp;
114 	struct gv_softc *sc;
115 
116 	KASSERT(bp != NULL, ("NULL bp"));
117 
118 	gp = bp->bio_from->geom;
119 	sc = gp->softc;
120 
121 	mtx_lock(&sc->bqueue_mtx);
122 	bioq_disksort(sc->bqueue_up, bp);
123 	wakeup(sc);
124 	mtx_unlock(&sc->bqueue_mtx);
125 }
126 
127 int
128 gv_access(struct g_provider *pp, int dr, int dw, int de)
129 {
130 	struct g_geom *gp;
131 	struct gv_softc *sc;
132 	struct gv_drive *d, *d2;
133 	int error;
134 
135 	gp = pp->geom;
136 	sc = gp->softc;
137 	/*
138 	 * We want to modify the read count with the write count in case we have
139 	 * plexes in a RAID-5 organization.
140 	 */
141 	dr += dw;
142 
143 	LIST_FOREACH(d, &sc->drives, drive) {
144 		if (d->consumer == NULL)
145 			continue;
146 		error = g_access(d->consumer, dr, dw, de);
147 		if (error) {
148 			LIST_FOREACH(d2, &sc->drives, drive) {
149 				if (d == d2)
150 					break;
151 				g_access(d2->consumer, -dr, -dw, -de);
152 			}
153 			G_VINUM_DEBUG(0, "g_access '%s' failed: %d", d->name,
154 			    error);
155 			return (error);
156 		}
157 	}
158 	return (0);
159 }
160 
161 static void
162 gv_init(struct g_class *mp)
163 {
164 	struct g_geom *gp;
165 	struct gv_softc *sc;
166 
167 	g_trace(G_T_TOPOLOGY, "gv_init(%p)", mp);
168 
169 	gp = g_new_geomf(mp, "VINUM");
170 	gp->spoiled = gv_orphan;
171 	gp->orphan = gv_orphan;
172 	gp->access = gv_access;
173 	gp->start = gv_start;
174 	gp->softc = g_malloc(sizeof(struct gv_softc), M_WAITOK | M_ZERO);
175 	sc = gp->softc;
176 	sc->geom = gp;
177 	sc->bqueue_down = g_malloc(sizeof(struct bio_queue_head),
178 	    M_WAITOK | M_ZERO);
179 	sc->bqueue_up = g_malloc(sizeof(struct bio_queue_head),
180 	    M_WAITOK | M_ZERO);
181 	bioq_init(sc->bqueue_down);
182 	bioq_init(sc->bqueue_up);
183 	LIST_INIT(&sc->drives);
184 	LIST_INIT(&sc->subdisks);
185 	LIST_INIT(&sc->plexes);
186 	LIST_INIT(&sc->volumes);
187 	TAILQ_INIT(&sc->equeue);
188 	mtx_init(&sc->config_mtx, "gv_config", NULL, MTX_DEF);
189 	mtx_init(&sc->equeue_mtx, "gv_equeue", NULL, MTX_DEF);
190 	mtx_init(&sc->bqueue_mtx, "gv_bqueue", NULL, MTX_DEF);
191 	kproc_create(gv_worker, sc, &sc->worker, 0, 0, "gv_worker");
192 }
193 
194 static int
195 gv_unload(struct gctl_req *req, struct g_class *mp, struct g_geom *gp)
196 {
197 	struct gv_softc *sc;
198 
199 	g_trace(G_T_TOPOLOGY, "gv_unload(%p)", mp);
200 
201 	g_topology_assert();
202 	sc = gp->softc;
203 
204 	if (sc != NULL) {
205 		gv_worker_exit(sc);
206 		gp->softc = NULL;
207 		g_wither_geom(gp, ENXIO);
208 	}
209 
210 	return (0);
211 }
212 
213 /* Handle userland request of attaching object. */
214 static void
215 gv_attach(struct gv_softc *sc, struct gctl_req *req)
216 {
217 	struct gv_volume *v;
218 	struct gv_plex *p;
219 	struct gv_sd *s;
220 	off_t *offset;
221 	int *rename, type_child, type_parent;
222 	char *child, *parent;
223 
224 	child = gctl_get_param(req, "child", NULL);
225 	if (child == NULL) {
226 		gctl_error(req, "no child given");
227 		return;
228 	}
229 	parent = gctl_get_param(req, "parent", NULL);
230 	if (parent == NULL) {
231 		gctl_error(req, "no parent given");
232 		return;
233 	}
234 	offset = gctl_get_paraml(req, "offset", sizeof(*offset));
235 	if (offset == NULL) {
236 		gctl_error(req, "no offset given");
237 		return;
238 	}
239 	rename = gctl_get_paraml(req, "rename", sizeof(*rename));
240 	if (rename == NULL) {
241 		gctl_error(req, "no rename flag given");
242 		return;
243 	}
244 
245 	type_child = gv_object_type(sc, child);
246 	type_parent = gv_object_type(sc, parent);
247 
248 	switch (type_child) {
249 	case GV_TYPE_PLEX:
250 		if (type_parent != GV_TYPE_VOL) {
251 			gctl_error(req, "no such volume to attach to");
252 			return;
253 		}
254 		v = gv_find_vol(sc, parent);
255 		p = gv_find_plex(sc, child);
256 		gv_post_event(sc, GV_EVENT_ATTACH_PLEX, p, v, *offset, *rename);
257 		break;
258 	case GV_TYPE_SD:
259 		if (type_parent != GV_TYPE_PLEX) {
260 			gctl_error(req, "no such plex to attach to");
261 			return;
262 		}
263 		p = gv_find_plex(sc, parent);
264 		s = gv_find_sd(sc, child);
265 		gv_post_event(sc, GV_EVENT_ATTACH_SD, s, p, *offset, *rename);
266 		break;
267 	default:
268 		gctl_error(req, "invalid child type");
269 		break;
270 	}
271 }
272 
273 /* Handle userland request of detaching object. */
274 static void
275 gv_detach(struct gv_softc *sc, struct gctl_req *req)
276 {
277 	struct gv_plex *p;
278 	struct gv_sd *s;
279 	int *flags, type;
280 	char *object;
281 
282 	object = gctl_get_param(req, "object", NULL);
283 	if (object == NULL) {
284 		gctl_error(req, "no argument given");
285 		return;
286 	}
287 
288 	flags = gctl_get_paraml(req, "flags", sizeof(*flags));
289 	type = gv_object_type(sc, object);
290 	switch (type) {
291 	case GV_TYPE_PLEX:
292 		p = gv_find_plex(sc, object);
293 		gv_post_event(sc, GV_EVENT_DETACH_PLEX, p, NULL, *flags, 0);
294 		break;
295 	case GV_TYPE_SD:
296 		s = gv_find_sd(sc, object);
297 		gv_post_event(sc, GV_EVENT_DETACH_SD, s, NULL, *flags, 0);
298 		break;
299 	default:
300 		gctl_error(req, "invalid object type");
301 		break;
302 	}
303 }
304 
305 /* Handle userland requests for creating new objects. */
306 static int
307 gv_create(struct g_geom *gp, struct gctl_req *req)
308 {
309 	struct gv_softc *sc;
310 	struct gv_drive *d, *d2;
311 	struct gv_plex *p, *p2;
312 	struct gv_sd *s, *s2;
313 	struct gv_volume *v, *v2;
314 	struct g_provider *pp;
315 	int error, i, *drives, *flags, *plexes, *subdisks, *volumes;
316 	char buf[20];
317 
318 	g_topology_assert();
319 
320 	sc = gp->softc;
321 
322 	/* Find out how many of each object have been passed in. */
323 	volumes = gctl_get_paraml(req, "volumes", sizeof(*volumes));
324 	plexes = gctl_get_paraml(req, "plexes", sizeof(*plexes));
325 	subdisks = gctl_get_paraml(req, "subdisks", sizeof(*subdisks));
326 	drives = gctl_get_paraml(req, "drives", sizeof(*drives));
327 	if (volumes == NULL || plexes == NULL || subdisks == NULL ||
328 	    drives == NULL) {
329 		gctl_error(req, "number of objects not given");
330 		return (-1);
331 	}
332 	flags = gctl_get_paraml(req, "flags", sizeof(*flags));
333 	if (flags == NULL) {
334 		gctl_error(req, "flags not given");
335 		return (-1);
336 	}
337 
338 	/* First, handle drive definitions ... */
339 	for (i = 0; i < *drives; i++) {
340 		snprintf(buf, sizeof(buf), "drive%d", i);
341 		d2 = gctl_get_paraml(req, buf, sizeof(*d2));
342 		if (d2 == NULL) {
343 			gctl_error(req, "no drive definition given");
344 			return (-1);
345 		}
346 		/*
347 		 * Make sure that the device specified in the drive config is
348 		 * an active GEOM provider.
349 		 */
350 		pp = g_provider_by_name(d2->device);
351 		if (pp == NULL) {
352 			gctl_error(req, "%s: device not found", d2->device);
353 			goto error;
354 		}
355 		if (gv_find_drive(sc, d2->name) != NULL) {
356 			/* Ignore error. */
357 			if (*flags & GV_FLAG_F)
358 				continue;
359 			gctl_error(req, "drive '%s' already exists", d2->name);
360 			goto error;
361 		}
362 		if (gv_find_drive_device(sc, d2->device) != NULL) {
363 			gctl_error(req, "device '%s' already configured in "
364 			    "gvinum", d2->device);
365 			goto error;
366 		}
367 
368 
369 		d = g_malloc(sizeof(*d), M_WAITOK | M_ZERO);
370 		bcopy(d2, d, sizeof(*d));
371 
372 		gv_post_event(sc, GV_EVENT_CREATE_DRIVE, d, NULL, 0, 0);
373 	}
374 
375 	/* ... then volume definitions ... */
376 	for (i = 0; i < *volumes; i++) {
377 		error = 0;
378 		snprintf(buf, sizeof(buf), "volume%d", i);
379 		v2 = gctl_get_paraml(req, buf, sizeof(*v2));
380 		if (v2 == NULL) {
381 			gctl_error(req, "no volume definition given");
382 			return (-1);
383 		}
384 		if (gv_find_vol(sc, v2->name) != NULL) {
385 			/* Ignore error. */
386 			if (*flags & GV_FLAG_F)
387 				continue;
388 			gctl_error(req, "volume '%s' already exists", v2->name);
389 			goto error;
390 		}
391 
392 		v = g_malloc(sizeof(*v), M_WAITOK | M_ZERO);
393 		bcopy(v2, v, sizeof(*v));
394 
395 		gv_post_event(sc, GV_EVENT_CREATE_VOLUME, v, NULL, 0, 0);
396 	}
397 
398 	/* ... then plex definitions ... */
399 	for (i = 0; i < *plexes; i++) {
400 		error = 0;
401 		snprintf(buf, sizeof(buf), "plex%d", i);
402 		p2 = gctl_get_paraml(req, buf, sizeof(*p2));
403 		if (p2 == NULL) {
404 			gctl_error(req, "no plex definition given");
405 			return (-1);
406 		}
407 		if (gv_find_plex(sc, p2->name) != NULL) {
408 			/* Ignore error. */
409 			if (*flags & GV_FLAG_F)
410 				continue;
411 			gctl_error(req, "plex '%s' already exists", p2->name);
412 			goto error;
413 		}
414 
415 		p = g_malloc(sizeof(*p), M_WAITOK | M_ZERO);
416 		bcopy(p2, p, sizeof(*p));
417 
418 		gv_post_event(sc, GV_EVENT_CREATE_PLEX, p, NULL, 0, 0);
419 	}
420 
421 	/* ... and, finally, subdisk definitions. */
422 	for (i = 0; i < *subdisks; i++) {
423 		error = 0;
424 		snprintf(buf, sizeof(buf), "sd%d", i);
425 		s2 = gctl_get_paraml(req, buf, sizeof(*s2));
426 		if (s2 == NULL) {
427 			gctl_error(req, "no subdisk definition given");
428 			return (-1);
429 		}
430 		if (gv_find_sd(sc, s2->name) != NULL) {
431 			/* Ignore error. */
432 			if (*flags & GV_FLAG_F)
433 				continue;
434 			gctl_error(req, "sd '%s' already exists", s2->name);
435 			goto error;
436 		}
437 
438 		s = g_malloc(sizeof(*s), M_WAITOK | M_ZERO);
439 		bcopy(s2, s, sizeof(*s));
440 
441 		gv_post_event(sc, GV_EVENT_CREATE_SD, s, NULL, 0, 0);
442 	}
443 
444 error:
445 	gv_post_event(sc, GV_EVENT_SETUP_OBJECTS, sc, NULL, 0, 0);
446 	gv_post_event(sc, GV_EVENT_SAVE_CONFIG, sc, NULL, 0, 0);
447 
448 	return (0);
449 }
450 
451 static void
452 gv_config(struct gctl_req *req, struct g_class *mp, char const *verb)
453 {
454 	struct g_geom *gp;
455 	struct gv_softc *sc;
456 	struct sbuf *sb;
457 	char *comment;
458 
459 	g_topology_assert();
460 
461 	gp = LIST_FIRST(&mp->geom);
462 	sc = gp->softc;
463 
464 	if (!strcmp(verb, "attach")) {
465 		gv_attach(sc, req);
466 
467 	} else if (!strcmp(verb, "concat")) {
468 		gv_concat(gp, req);
469 
470 	} else if (!strcmp(verb, "detach")) {
471 		gv_detach(sc, req);
472 
473 	} else if (!strcmp(verb, "list")) {
474 		gv_list(gp, req);
475 
476 	/* Save our configuration back to disk. */
477 	} else if (!strcmp(verb, "saveconfig")) {
478 		gv_post_event(sc, GV_EVENT_SAVE_CONFIG, sc, NULL, 0, 0);
479 
480 	/* Return configuration in string form. */
481 	} else if (!strcmp(verb, "getconfig")) {
482 		comment = gctl_get_param(req, "comment", NULL);
483 		if (comment == NULL) {
484 			gctl_error(req, "no comment parameter given");
485 			return;
486 		}
487 		sb = sbuf_new(NULL, NULL, GV_CFG_LEN, SBUF_FIXEDLEN);
488 		gv_format_config(sc, sb, 0, comment);
489 		sbuf_finish(sb);
490 		gctl_set_param(req, "config", sbuf_data(sb), sbuf_len(sb) + 1);
491 		sbuf_delete(sb);
492 
493 	} else if (!strcmp(verb, "create")) {
494 		gv_create(gp, req);
495 
496 	} else if (!strcmp(verb, "mirror")) {
497 		gv_mirror(gp, req);
498 
499 	} else if (!strcmp(verb, "move")) {
500 		gv_move(gp, req);
501 
502 	} else if (!strcmp(verb, "raid5")) {
503 		gv_raid5(gp, req);
504 
505 	} else if (!strcmp(verb, "rebuildparity") ||
506 	    !strcmp(verb, "checkparity")) {
507 		gv_parityop(sc, req);
508 
509 	} else if (!strcmp(verb, "remove")) {
510 		gv_remove(gp, req);
511 
512 	} else if (!strcmp(verb, "rename")) {
513 		gv_rename(gp, req);
514 
515 	} else if (!strcmp(verb, "resetconfig")) {
516 		gv_post_event(sc, GV_EVENT_RESET_CONFIG, sc, NULL, 0, 0);
517 
518 	} else if (!strcmp(verb, "start")) {
519 		gv_start_obj(gp, req);
520 
521 	} else if (!strcmp(verb, "stripe")) {
522 		gv_stripe(gp, req);
523 
524 	} else if (!strcmp(verb, "setstate")) {
525 		gv_setstate(gp, req);
526 	} else
527 		gctl_error(req, "Unknown verb parameter");
528 }
529 
530 static void
531 gv_parityop(struct gv_softc *sc, struct gctl_req *req)
532 {
533 	struct gv_plex *p;
534 	int *flags, *rebuild, type;
535 	char *plex;
536 
537 	plex = gctl_get_param(req, "plex", NULL);
538 	if (plex == NULL) {
539 		gctl_error(req, "no plex given");
540 		return;
541 	}
542 
543 	flags = gctl_get_paraml(req, "flags", sizeof(*flags));
544 	if (flags == NULL) {
545 		gctl_error(req, "no flags given");
546 		return;
547 	}
548 
549 	rebuild = gctl_get_paraml(req, "rebuild", sizeof(*rebuild));
550 	if (rebuild == NULL) {
551 		gctl_error(req, "no operation given");
552 		return;
553 	}
554 
555 	type = gv_object_type(sc, plex);
556 	if (type != GV_TYPE_PLEX) {
557 		gctl_error(req, "'%s' is not a plex", plex);
558 		return;
559 	}
560 	p = gv_find_plex(sc, plex);
561 
562 	if (p->state != GV_PLEX_UP) {
563 		gctl_error(req, "plex %s is not completely accessible",
564 		    p->name);
565 		return;
566 	}
567 
568 	if (p->org != GV_PLEX_RAID5) {
569 		gctl_error(req, "plex %s is not a RAID5 plex", p->name);
570 		return;
571 	}
572 
573 	/* Put it in the event queue. */
574 	/* XXX: The state of the plex might have changed when this event is
575 	 * picked up ... We should perhaps check this afterwards. */
576 	if (*rebuild)
577 		gv_post_event(sc, GV_EVENT_PARITY_REBUILD, p, NULL, 0, 0);
578 	else
579 		gv_post_event(sc, GV_EVENT_PARITY_CHECK, p, NULL, 0, 0);
580 }
581 
582 
583 static struct g_geom *
584 gv_taste(struct g_class *mp, struct g_provider *pp, int flags __unused)
585 {
586 	struct g_geom *gp;
587 	struct g_consumer *cp;
588 	struct gv_softc *sc;
589 	struct gv_hdr vhdr;
590 	int error;
591 
592  	g_topology_assert();
593 	g_trace(G_T_TOPOLOGY, "gv_taste(%s, %s)", mp->name, pp->name);
594 
595 	gp = LIST_FIRST(&mp->geom);
596 	if (gp == NULL) {
597 		G_VINUM_DEBUG(0, "error: tasting, but not initialized?");
598 		return (NULL);
599 	}
600 	sc = gp->softc;
601 
602 	cp = g_new_consumer(gp);
603 	if (g_attach(cp, pp) != 0) {
604 		g_destroy_consumer(cp);
605 		return (NULL);
606 	}
607 	if (g_access(cp, 1, 0, 0) != 0) {
608 		g_detach(cp);
609 		g_destroy_consumer(cp);
610 		return (NULL);
611 	}
612 	g_topology_unlock();
613 
614 	error = gv_read_header(cp, &vhdr);
615 
616 	g_topology_lock();
617 	g_access(cp, -1, 0, 0);
618 	g_detach(cp);
619 	g_destroy_consumer(cp);
620 
621 	/* Check if what we've been given is a valid vinum drive. */
622 	if (!error)
623 		gv_post_event(sc, GV_EVENT_DRIVE_TASTED, pp, NULL, 0, 0);
624 
625 	return (NULL);
626 }
627 
628 void
629 gv_worker(void *arg)
630 {
631 	struct g_provider *pp;
632 	struct gv_softc *sc;
633 	struct gv_event *ev;
634 	struct gv_volume *v;
635 	struct gv_plex *p;
636 	struct gv_sd *s;
637 	struct gv_drive *d;
638 	struct bio *bp;
639 	int newstate, flags, err, rename;
640 	char *newname;
641 	off_t offset;
642 
643 	sc = arg;
644 	KASSERT(sc != NULL, ("NULL sc"));
645 	for (;;) {
646 		/* Look at the events first... */
647 		ev = gv_get_event(sc);
648 		if (ev != NULL) {
649 			gv_remove_event(sc, ev);
650 
651 			switch (ev->type) {
652 			case GV_EVENT_DRIVE_TASTED:
653 				G_VINUM_DEBUG(2, "event 'drive tasted'");
654 				pp = ev->arg1;
655 				gv_drive_tasted(sc, pp);
656 				break;
657 
658 			case GV_EVENT_DRIVE_LOST:
659 				G_VINUM_DEBUG(2, "event 'drive lost'");
660 				d = ev->arg1;
661 				gv_drive_lost(sc, d);
662 				break;
663 
664 			case GV_EVENT_CREATE_DRIVE:
665 				G_VINUM_DEBUG(2, "event 'create drive'");
666 				d = ev->arg1;
667 				gv_create_drive(sc, d);
668 				break;
669 
670 			case GV_EVENT_CREATE_VOLUME:
671 				G_VINUM_DEBUG(2, "event 'create volume'");
672 				v = ev->arg1;
673 				gv_create_volume(sc, v);
674 				break;
675 
676 			case GV_EVENT_CREATE_PLEX:
677 				G_VINUM_DEBUG(2, "event 'create plex'");
678 				p = ev->arg1;
679 				gv_create_plex(sc, p);
680 				break;
681 
682 			case GV_EVENT_CREATE_SD:
683 				G_VINUM_DEBUG(2, "event 'create sd'");
684 				s = ev->arg1;
685 				gv_create_sd(sc, s);
686 				break;
687 
688 			case GV_EVENT_RM_DRIVE:
689 				G_VINUM_DEBUG(2, "event 'remove drive'");
690 				d = ev->arg1;
691 				flags = ev->arg3;
692 				gv_rm_drive(sc, d, flags);
693 				/*gv_setup_objects(sc);*/
694 				break;
695 
696 			case GV_EVENT_RM_VOLUME:
697 				G_VINUM_DEBUG(2, "event 'remove volume'");
698 				v = ev->arg1;
699 				gv_rm_vol(sc, v);
700 				/*gv_setup_objects(sc);*/
701 				break;
702 
703 			case GV_EVENT_RM_PLEX:
704 				G_VINUM_DEBUG(2, "event 'remove plex'");
705 				p = ev->arg1;
706 				gv_rm_plex(sc, p);
707 				/*gv_setup_objects(sc);*/
708 				break;
709 
710 			case GV_EVENT_RM_SD:
711 				G_VINUM_DEBUG(2, "event 'remove sd'");
712 				s = ev->arg1;
713 				gv_rm_sd(sc, s);
714 				/*gv_setup_objects(sc);*/
715 				break;
716 
717 			case GV_EVENT_SAVE_CONFIG:
718 				G_VINUM_DEBUG(2, "event 'save config'");
719 				gv_save_config(sc);
720 				break;
721 
722 			case GV_EVENT_SET_SD_STATE:
723 				G_VINUM_DEBUG(2, "event 'setstate sd'");
724 				s = ev->arg1;
725 				newstate = ev->arg3;
726 				flags = ev->arg4;
727 				err = gv_set_sd_state(s, newstate, flags);
728 				if (err)
729 					G_VINUM_DEBUG(0, "error setting subdisk"
730 					    " state: error code %d", err);
731 				break;
732 
733 			case GV_EVENT_SET_DRIVE_STATE:
734 				G_VINUM_DEBUG(2, "event 'setstate drive'");
735 				d = ev->arg1;
736 				newstate = ev->arg3;
737 				flags = ev->arg4;
738 				err = gv_set_drive_state(d, newstate, flags);
739 				if (err)
740 					G_VINUM_DEBUG(0, "error setting drive "
741 					    "state: error code %d", err);
742 				break;
743 
744 			case GV_EVENT_SET_VOL_STATE:
745 				G_VINUM_DEBUG(2, "event 'setstate volume'");
746 				v = ev->arg1;
747 				newstate = ev->arg3;
748 				flags = ev->arg4;
749 				err = gv_set_vol_state(v, newstate, flags);
750 				if (err)
751 					G_VINUM_DEBUG(0, "error setting volume "
752 					    "state: error code %d", err);
753 				break;
754 
755 			case GV_EVENT_SET_PLEX_STATE:
756 				G_VINUM_DEBUG(2, "event 'setstate plex'");
757 				p = ev->arg1;
758 				newstate = ev->arg3;
759 				flags = ev->arg4;
760 				err = gv_set_plex_state(p, newstate, flags);
761 				if (err)
762 					G_VINUM_DEBUG(0, "error setting plex "
763 					    "state: error code %d", err);
764 				break;
765 
766 			case GV_EVENT_SETUP_OBJECTS:
767 				G_VINUM_DEBUG(2, "event 'setup objects'");
768 				gv_setup_objects(sc);
769 				break;
770 
771 			case GV_EVENT_RESET_CONFIG:
772 				G_VINUM_DEBUG(2, "event 'resetconfig'");
773 				err = gv_resetconfig(sc);
774 				if (err)
775 					G_VINUM_DEBUG(0, "error resetting "
776 					    "config: error code %d", err);
777 				break;
778 
779 			case GV_EVENT_PARITY_REBUILD:
780 				/*
781 				 * Start the rebuild. The gv_plex_done will
782 				 * handle issuing of the remaining rebuild bio's
783 				 * until it's finished.
784 				 */
785 				G_VINUM_DEBUG(2, "event 'rebuild'");
786 				p = ev->arg1;
787 				if (p->state != GV_PLEX_UP) {
788 					G_VINUM_DEBUG(0, "plex %s is not "
789 					    "completely accessible", p->name);
790 					break;
791 				}
792 				if (p->flags & GV_PLEX_SYNCING ||
793 				    p->flags & GV_PLEX_REBUILDING ||
794 				    p->flags & GV_PLEX_GROWING) {
795 					G_VINUM_DEBUG(0, "plex %s is busy with "
796 					    "syncing or parity build", p->name);
797 					break;
798 				}
799 				p->synced = 0;
800 				p->flags |= GV_PLEX_REBUILDING;
801 				g_topology_assert_not();
802 				g_topology_lock();
803 				err = gv_access(p->vol_sc->provider, 1, 1, 0);
804 				if (err) {
805 					G_VINUM_DEBUG(0, "unable to access "
806 					    "provider");
807 					break;
808 				}
809 				g_topology_unlock();
810 				gv_parity_request(p, GV_BIO_CHECK |
811 				    GV_BIO_PARITY, 0);
812 				break;
813 
814 			case GV_EVENT_PARITY_CHECK:
815 				/* Start parity check. */
816 				G_VINUM_DEBUG(2, "event 'check'");
817 				p = ev->arg1;
818 				if (p->state != GV_PLEX_UP) {
819 					G_VINUM_DEBUG(0, "plex %s is not "
820 					    "completely accessible", p->name);
821 					break;
822 				}
823 				if (p->flags & GV_PLEX_SYNCING ||
824 				    p->flags & GV_PLEX_REBUILDING ||
825 				    p->flags & GV_PLEX_GROWING) {
826 					G_VINUM_DEBUG(0, "plex %s is busy with "
827 					    "syncing or parity build", p->name);
828 					break;
829 				}
830 				p->synced = 0;
831 				g_topology_assert_not();
832 				g_topology_lock();
833 				err = gv_access(p->vol_sc->provider, 1, 1, 0);
834 				if (err) {
835 					G_VINUM_DEBUG(0, "unable to access "
836 					    "provider");
837 					break;
838 				}
839 				g_topology_unlock();
840 				gv_parity_request(p, GV_BIO_CHECK, 0);
841 				break;
842 
843 			case GV_EVENT_START_PLEX:
844 				G_VINUM_DEBUG(2, "event 'start' plex");
845 				p = ev->arg1;
846 				gv_start_plex(p);
847 				break;
848 
849 			case GV_EVENT_START_VOLUME:
850 				G_VINUM_DEBUG(2, "event 'start' volume");
851 				v = ev->arg1;
852 				gv_start_vol(v);
853 				break;
854 
855 			case GV_EVENT_ATTACH_PLEX:
856 				G_VINUM_DEBUG(2, "event 'attach' plex");
857 				p = ev->arg1;
858 				v = ev->arg2;
859 				rename = ev->arg4;
860 				err = gv_attach_plex(p, v, rename);
861 				if (err)
862 					G_VINUM_DEBUG(0, "error attaching %s to"
863 					    " %s: error code %d", p->name,
864 					    v->name, err);
865 				break;
866 
867 			case GV_EVENT_ATTACH_SD:
868 				G_VINUM_DEBUG(2, "event 'attach' sd");
869 				s = ev->arg1;
870 				p = ev->arg2;
871 				offset = ev->arg3;
872 				rename = ev->arg4;
873 				err = gv_attach_sd(s, p, offset, rename);
874 				if (err)
875 					G_VINUM_DEBUG(0, "error attaching %s to"
876 					    " %s: error code %d", s->name,
877 					    p->name, err);
878 				break;
879 
880 			case GV_EVENT_DETACH_PLEX:
881 				G_VINUM_DEBUG(2, "event 'detach' plex");
882 				p = ev->arg1;
883 				flags = ev->arg3;
884 				err = gv_detach_plex(p, flags);
885 				if (err)
886 					G_VINUM_DEBUG(0, "error detaching %s: "
887 					    "error code %d", p->name, err);
888 				break;
889 
890 			case GV_EVENT_DETACH_SD:
891 				G_VINUM_DEBUG(2, "event 'detach' sd");
892 				s = ev->arg1;
893 				flags = ev->arg3;
894 				err = gv_detach_sd(s, flags);
895 				if (err)
896 					G_VINUM_DEBUG(0, "error detaching %s: "
897 					    "error code %d", s->name, err);
898 				break;
899 
900 			case GV_EVENT_RENAME_VOL:
901 				G_VINUM_DEBUG(2, "event 'rename' volume");
902 				v = ev->arg1;
903 				newname = ev->arg2;
904 				flags = ev->arg3;
905 				err = gv_rename_vol(sc, v, newname, flags);
906 				if (err)
907 					G_VINUM_DEBUG(0, "error renaming %s to "
908 					    "%s: error code %d", v->name,
909 					    newname, err);
910 				g_free(newname);
911 				/* Destroy and recreate the provider if we can. */
912 				if (gv_provider_is_open(v->provider)) {
913 					G_VINUM_DEBUG(0, "unable to rename "
914 					    "provider to %s: provider in use",
915 					    v->name);
916 					break;
917 				}
918 				g_topology_lock();
919 				g_wither_provider(v->provider, ENOENT);
920 				g_topology_unlock();
921 				v->provider = NULL;
922 				gv_post_event(sc, GV_EVENT_SETUP_OBJECTS, sc,
923 				    NULL, 0, 0);
924 				break;
925 
926 			case GV_EVENT_RENAME_PLEX:
927 				G_VINUM_DEBUG(2, "event 'rename' plex");
928 				p = ev->arg1;
929 				newname = ev->arg2;
930 				flags = ev->arg3;
931 				err = gv_rename_plex(sc, p, newname, flags);
932 				if (err)
933 					G_VINUM_DEBUG(0, "error renaming %s to "
934 					    "%s: error code %d", p->name,
935 					    newname, err);
936 				g_free(newname);
937 				break;
938 
939 			case GV_EVENT_RENAME_SD:
940 				G_VINUM_DEBUG(2, "event 'rename' sd");
941 				s = ev->arg1;
942 				newname = ev->arg2;
943 				flags = ev->arg3;
944 				err = gv_rename_sd(sc, s, newname, flags);
945 				if (err)
946 					G_VINUM_DEBUG(0, "error renaming %s to "
947 					    "%s: error code %d", s->name,
948 					    newname, err);
949 				g_free(newname);
950 				break;
951 
952 			case GV_EVENT_RENAME_DRIVE:
953 				G_VINUM_DEBUG(2, "event 'rename' drive");
954 				d = ev->arg1;
955 				newname = ev->arg2;
956 				flags = ev->arg3;
957 				err = gv_rename_drive(sc, d, newname, flags);
958 				if (err)
959 					G_VINUM_DEBUG(0, "error renaming %s to "
960 					    "%s: error code %d", d->name,
961 					    newname, err);
962 				g_free(newname);
963 				break;
964 
965 			case GV_EVENT_MOVE_SD:
966 				G_VINUM_DEBUG(2, "event 'move' sd");
967 				s = ev->arg1;
968 				d = ev->arg2;
969 				flags = ev->arg3;
970 				err = gv_move_sd(sc, s, d, flags);
971 				if (err)
972 					G_VINUM_DEBUG(0, "error moving %s to "
973 					    "%s: error code %d", s->name,
974 					    d->name, err);
975 				break;
976 
977 			case GV_EVENT_THREAD_EXIT:
978 				G_VINUM_DEBUG(2, "event 'thread exit'");
979 				g_free(ev);
980 				mtx_lock(&sc->equeue_mtx);
981 				mtx_lock(&sc->bqueue_mtx);
982 				gv_cleanup(sc);
983 				mtx_destroy(&sc->bqueue_mtx);
984 				mtx_destroy(&sc->equeue_mtx);
985 				g_free(sc->bqueue_down);
986 				g_free(sc->bqueue_up);
987 				g_free(sc);
988 				kproc_exit(0);
989 				/* NOTREACHED */
990 
991 			default:
992 				G_VINUM_DEBUG(1, "unknown event %d", ev->type);
993 			}
994 
995 			g_free(ev);
996 			continue;
997 		}
998 
999 		/* ... then do I/O processing. */
1000 		mtx_lock(&sc->bqueue_mtx);
1001 		/* First do new requests. */
1002 		bp = bioq_takefirst(sc->bqueue_down);
1003 		if (bp != NULL) {
1004 			mtx_unlock(&sc->bqueue_mtx);
1005 			/* A bio that interfered with another bio. */
1006 			if (bp->bio_pflags & GV_BIO_ONHOLD) {
1007 				s = bp->bio_caller1;
1008 				p = s->plex_sc;
1009 				/* Is it still locked out? */
1010 				if (gv_stripe_active(p, bp)) {
1011 					/* Park the bio on the waiting queue. */
1012 					bioq_disksort(p->wqueue, bp);
1013 				} else {
1014 					bp->bio_pflags &= ~GV_BIO_ONHOLD;
1015 					g_io_request(bp, s->drive_sc->consumer);
1016 				}
1017 			/* A special request requireing special handling. */
1018 			} else if (bp->bio_pflags & GV_BIO_INTERNAL) {
1019 				p = bp->bio_caller1;
1020 				gv_plex_start(p, bp);
1021 			} else {
1022 				gv_volume_start(sc, bp);
1023 			}
1024 			mtx_lock(&sc->bqueue_mtx);
1025 		}
1026 		/* Then do completed requests. */
1027 		bp = bioq_takefirst(sc->bqueue_up);
1028 		if (bp == NULL) {
1029 			msleep(sc, &sc->bqueue_mtx, PRIBIO, "-", hz/10);
1030 			mtx_unlock(&sc->bqueue_mtx);
1031 			continue;
1032 		}
1033 		mtx_unlock(&sc->bqueue_mtx);
1034 		gv_bio_done(sc, bp);
1035 	}
1036 }
1037 
/* Name under which the class is known to GEOM. */
#define	VINUM_CLASS_NAME "VINUM"

/*
 * GEOM class descriptor for vinum: ties the class name and version to the
 * init, taste, control-request and geom-destruction handlers defined in
 * this file.
 */
static struct g_class g_vinum_class	= {
	.name = VINUM_CLASS_NAME,
	.version = G_VERSION,
	.init = gv_init,
	.taste = gv_taste,
	.ctlreq = gv_config,
	.destroy_geom = gv_unload,
};

/* Declare the class to GEOM under the module name g_vinum. */
DECLARE_GEOM_CLASS(g_vinum_class, g_vinum);
1050