1/*-
2 * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3 *
4 *  Copyright (c) 2004, 2007 Lukas Ertl
5 *  Copyright (c) 2007, 2009 Ulf Lilleengen
6 *  All rights reserved.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 *    notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 *    notice, this list of conditions and the following disclaimer in the
15 *    documentation and/or other materials provided with the distribution.
16 *
17 * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS ``AS IS'' AND
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20 * ARE DISCLAIMED.  IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27 * SUCH DAMAGE.
28 *
29 */
30
31#include <sys/cdefs.h>
32__FBSDID("$FreeBSD$");
33
34#include <sys/param.h>
35#include <sys/bio.h>
36#include <sys/kernel.h>
37#include <sys/kthread.h>
38#include <sys/lock.h>
39#include <sys/malloc.h>
40#include <sys/module.h>
41#include <sys/mutex.h>
42#include <sys/sbuf.h>
43#include <sys/sysctl.h>
44#include <sys/systm.h>
45
46#include <geom/geom.h>
47#include <geom/vinum/geom_vinum_var.h>
48#include <geom/vinum/geom_vinum.h>
49#include <geom/vinum/geom_vinum_raid5.h>
50
51SYSCTL_DECL(_kern_geom);
52static SYSCTL_NODE(_kern_geom, OID_AUTO, vinum, CTLFLAG_RW, 0,
53    "GEOM_VINUM stuff");
54u_int g_vinum_debug = 0;
55SYSCTL_UINT(_kern_geom_vinum, OID_AUTO, debug, CTLFLAG_RWTUN, &g_vinum_debug, 0,
56    "Debug level");
57
/* Forward declarations of the file-local request handlers. */
static int	gv_create(struct g_geom *gp, struct gctl_req *req);
static void	gv_attach(struct gv_softc *sc, struct gctl_req *req);
static void	gv_detach(struct gv_softc *sc, struct gctl_req *req);
static void	gv_parityop(struct gv_softc *sc, struct gctl_req *req);
62
63
64static void
65gv_orphan(struct g_consumer *cp)
66{
67	struct g_geom *gp;
68	struct gv_softc *sc;
69	struct gv_drive *d;
70
71	g_topology_assert();
72
73	KASSERT(cp != NULL, ("gv_orphan: null cp"));
74	gp = cp->geom;
75	KASSERT(gp != NULL, ("gv_orphan: null gp"));
76	sc = gp->softc;
77	KASSERT(sc != NULL, ("gv_orphan: null sc"));
78	d = cp->private;
79	KASSERT(d != NULL, ("gv_orphan: null d"));
80
81	g_trace(G_T_TOPOLOGY, "gv_orphan(%s)", gp->name);
82
83	gv_post_event(sc, GV_EVENT_DRIVE_LOST, d, NULL, 0, 0);
84}
85
86void
87gv_start(struct bio *bp)
88{
89	struct g_geom *gp;
90	struct gv_softc *sc;
91
92	gp = bp->bio_to->geom;
93	sc = gp->softc;
94
95	switch (bp->bio_cmd) {
96	case BIO_READ:
97	case BIO_WRITE:
98	case BIO_DELETE:
99		break;
100	case BIO_GETATTR:
101	default:
102		g_io_deliver(bp, EOPNOTSUPP);
103		return;
104	}
105	mtx_lock(&sc->bqueue_mtx);
106	bioq_disksort(sc->bqueue_down, bp);
107	wakeup(sc);
108	mtx_unlock(&sc->bqueue_mtx);
109}
110
111void
112gv_done(struct bio *bp)
113{
114	struct g_geom *gp;
115	struct gv_softc *sc;
116
117	KASSERT(bp != NULL, ("NULL bp"));
118
119	gp = bp->bio_from->geom;
120	sc = gp->softc;
121
122	mtx_lock(&sc->bqueue_mtx);
123	bioq_disksort(sc->bqueue_up, bp);
124	wakeup(sc);
125	mtx_unlock(&sc->bqueue_mtx);
126}
127
128int
129gv_access(struct g_provider *pp, int dr, int dw, int de)
130{
131	struct g_geom *gp;
132	struct gv_softc *sc;
133	struct gv_drive *d, *d2;
134	int error;
135
136	gp = pp->geom;
137	sc = gp->softc;
138	/*
139	 * We want to modify the read count with the write count in case we have
140	 * plexes in a RAID-5 organization.
141	 */
142	dr += dw;
143
144	LIST_FOREACH(d, &sc->drives, drive) {
145		if (d->consumer == NULL)
146			continue;
147		error = g_access(d->consumer, dr, dw, de);
148		if (error) {
149			LIST_FOREACH(d2, &sc->drives, drive) {
150				if (d == d2)
151					break;
152				g_access(d2->consumer, -dr, -dw, -de);
153			}
154			G_VINUM_DEBUG(0, "g_access '%s' failed: %d", d->name,
155			    error);
156			return (error);
157		}
158	}
159	return (0);
160}
161
162static void
163gv_init(struct g_class *mp)
164{
165	struct g_geom *gp;
166	struct gv_softc *sc;
167
168	g_trace(G_T_TOPOLOGY, "gv_init(%p)", mp);
169
170	gp = g_new_geomf(mp, "VINUM");
171	gp->spoiled = gv_orphan;
172	gp->orphan = gv_orphan;
173	gp->access = gv_access;
174	gp->start = gv_start;
175	gp->softc = g_malloc(sizeof(struct gv_softc), M_WAITOK | M_ZERO);
176	sc = gp->softc;
177	sc->geom = gp;
178	sc->bqueue_down = g_malloc(sizeof(struct bio_queue_head),
179	    M_WAITOK | M_ZERO);
180	sc->bqueue_up = g_malloc(sizeof(struct bio_queue_head),
181	    M_WAITOK | M_ZERO);
182	bioq_init(sc->bqueue_down);
183	bioq_init(sc->bqueue_up);
184	LIST_INIT(&sc->drives);
185	LIST_INIT(&sc->subdisks);
186	LIST_INIT(&sc->plexes);
187	LIST_INIT(&sc->volumes);
188	TAILQ_INIT(&sc->equeue);
189	mtx_init(&sc->config_mtx, "gv_config", NULL, MTX_DEF);
190	mtx_init(&sc->equeue_mtx, "gv_equeue", NULL, MTX_DEF);
191	mtx_init(&sc->bqueue_mtx, "gv_bqueue", NULL, MTX_DEF);
192	kproc_create(gv_worker, sc, &sc->worker, 0, 0, "gv_worker");
193}
194
195static int
196gv_unload(struct gctl_req *req, struct g_class *mp, struct g_geom *gp)
197{
198	struct gv_softc *sc;
199
200	g_trace(G_T_TOPOLOGY, "gv_unload(%p)", mp);
201
202	g_topology_assert();
203	sc = gp->softc;
204
205	if (sc != NULL) {
206		gv_worker_exit(sc);
207		gp->softc = NULL;
208		g_wither_geom(gp, ENXIO);
209	}
210
211	return (0);
212}
213
214/* Handle userland request of attaching object. */
215static void
216gv_attach(struct gv_softc *sc, struct gctl_req *req)
217{
218	struct gv_volume *v;
219	struct gv_plex *p;
220	struct gv_sd *s;
221	off_t *offset;
222	int *rename, type_child, type_parent;
223	char *child, *parent;
224
225	child = gctl_get_param(req, "child", NULL);
226	if (child == NULL) {
227		gctl_error(req, "no child given");
228		return;
229	}
230	parent = gctl_get_param(req, "parent", NULL);
231	if (parent == NULL) {
232		gctl_error(req, "no parent given");
233		return;
234	}
235	offset = gctl_get_paraml(req, "offset", sizeof(*offset));
236	if (offset == NULL) {
237		gctl_error(req, "no offset given");
238		return;
239	}
240	rename = gctl_get_paraml(req, "rename", sizeof(*rename));
241	if (rename == NULL) {
242		gctl_error(req, "no rename flag given");
243		return;
244	}
245
246	type_child = gv_object_type(sc, child);
247	type_parent = gv_object_type(sc, parent);
248
249	switch (type_child) {
250	case GV_TYPE_PLEX:
251		if (type_parent != GV_TYPE_VOL) {
252			gctl_error(req, "no such volume to attach to");
253			return;
254		}
255		v = gv_find_vol(sc, parent);
256		p = gv_find_plex(sc, child);
257		gv_post_event(sc, GV_EVENT_ATTACH_PLEX, p, v, *offset, *rename);
258		break;
259	case GV_TYPE_SD:
260		if (type_parent != GV_TYPE_PLEX) {
261			gctl_error(req, "no such plex to attach to");
262			return;
263		}
264		p = gv_find_plex(sc, parent);
265		s = gv_find_sd(sc, child);
266		gv_post_event(sc, GV_EVENT_ATTACH_SD, s, p, *offset, *rename);
267		break;
268	default:
269		gctl_error(req, "invalid child type");
270		break;
271	}
272}
273
274/* Handle userland request of detaching object. */
275static void
276gv_detach(struct gv_softc *sc, struct gctl_req *req)
277{
278	struct gv_plex *p;
279	struct gv_sd *s;
280	int *flags, type;
281	char *object;
282
283	object = gctl_get_param(req, "object", NULL);
284	if (object == NULL) {
285		gctl_error(req, "no argument given");
286		return;
287	}
288
289	flags = gctl_get_paraml(req, "flags", sizeof(*flags));
290	type = gv_object_type(sc, object);
291	switch (type) {
292	case GV_TYPE_PLEX:
293		p = gv_find_plex(sc, object);
294		gv_post_event(sc, GV_EVENT_DETACH_PLEX, p, NULL, *flags, 0);
295		break;
296	case GV_TYPE_SD:
297		s = gv_find_sd(sc, object);
298		gv_post_event(sc, GV_EVENT_DETACH_SD, s, NULL, *flags, 0);
299		break;
300	default:
301		gctl_error(req, "invalid object type");
302		break;
303	}
304}
305
306/* Handle userland requests for creating new objects. */
307static int
308gv_create(struct g_geom *gp, struct gctl_req *req)
309{
310	struct gv_softc *sc;
311	struct gv_drive *d, *d2;
312	struct gv_plex *p, *p2;
313	struct gv_sd *s, *s2;
314	struct gv_volume *v, *v2;
315	struct g_provider *pp;
316	int error, i, *drives, *flags, *plexes, *subdisks, *volumes;
317	char buf[20];
318
319	g_topology_assert();
320
321	sc = gp->softc;
322
323	/* Find out how many of each object have been passed in. */
324	volumes = gctl_get_paraml(req, "volumes", sizeof(*volumes));
325	plexes = gctl_get_paraml(req, "plexes", sizeof(*plexes));
326	subdisks = gctl_get_paraml(req, "subdisks", sizeof(*subdisks));
327	drives = gctl_get_paraml(req, "drives", sizeof(*drives));
328	if (volumes == NULL || plexes == NULL || subdisks == NULL ||
329	    drives == NULL) {
330		gctl_error(req, "number of objects not given");
331		return (-1);
332	}
333	flags = gctl_get_paraml(req, "flags", sizeof(*flags));
334	if (flags == NULL) {
335		gctl_error(req, "flags not given");
336		return (-1);
337	}
338
339	/* First, handle drive definitions ... */
340	for (i = 0; i < *drives; i++) {
341		snprintf(buf, sizeof(buf), "drive%d", i);
342		d2 = gctl_get_paraml(req, buf, sizeof(*d2));
343		if (d2 == NULL) {
344			gctl_error(req, "no drive definition given");
345			return (-1);
346		}
347		/*
348		 * Make sure that the device specified in the drive config is
349		 * an active GEOM provider.
350		 */
351		pp = g_provider_by_name(d2->device);
352		if (pp == NULL) {
353			gctl_error(req, "%s: device not found", d2->device);
354			goto error;
355		}
356		if (gv_find_drive(sc, d2->name) != NULL) {
357			/* Ignore error. */
358			if (*flags & GV_FLAG_F)
359				continue;
360			gctl_error(req, "drive '%s' already exists", d2->name);
361			goto error;
362		}
363		if (gv_find_drive_device(sc, d2->device) != NULL) {
364			gctl_error(req, "device '%s' already configured in "
365			    "gvinum", d2->device);
366			goto error;
367		}
368
369
370		d = g_malloc(sizeof(*d), M_WAITOK | M_ZERO);
371		bcopy(d2, d, sizeof(*d));
372
373		gv_post_event(sc, GV_EVENT_CREATE_DRIVE, d, NULL, 0, 0);
374	}
375
376	/* ... then volume definitions ... */
377	for (i = 0; i < *volumes; i++) {
378		error = 0;
379		snprintf(buf, sizeof(buf), "volume%d", i);
380		v2 = gctl_get_paraml(req, buf, sizeof(*v2));
381		if (v2 == NULL) {
382			gctl_error(req, "no volume definition given");
383			return (-1);
384		}
385		if (gv_find_vol(sc, v2->name) != NULL) {
386			/* Ignore error. */
387			if (*flags & GV_FLAG_F)
388				continue;
389			gctl_error(req, "volume '%s' already exists", v2->name);
390			goto error;
391		}
392
393		v = g_malloc(sizeof(*v), M_WAITOK | M_ZERO);
394		bcopy(v2, v, sizeof(*v));
395
396		gv_post_event(sc, GV_EVENT_CREATE_VOLUME, v, NULL, 0, 0);
397	}
398
399	/* ... then plex definitions ... */
400	for (i = 0; i < *plexes; i++) {
401		error = 0;
402		snprintf(buf, sizeof(buf), "plex%d", i);
403		p2 = gctl_get_paraml(req, buf, sizeof(*p2));
404		if (p2 == NULL) {
405			gctl_error(req, "no plex definition given");
406			return (-1);
407		}
408		if (gv_find_plex(sc, p2->name) != NULL) {
409			/* Ignore error. */
410			if (*flags & GV_FLAG_F)
411				continue;
412			gctl_error(req, "plex '%s' already exists", p2->name);
413			goto error;
414		}
415
416		p = g_malloc(sizeof(*p), M_WAITOK | M_ZERO);
417		bcopy(p2, p, sizeof(*p));
418
419		gv_post_event(sc, GV_EVENT_CREATE_PLEX, p, NULL, 0, 0);
420	}
421
422	/* ... and, finally, subdisk definitions. */
423	for (i = 0; i < *subdisks; i++) {
424		error = 0;
425		snprintf(buf, sizeof(buf), "sd%d", i);
426		s2 = gctl_get_paraml(req, buf, sizeof(*s2));
427		if (s2 == NULL) {
428			gctl_error(req, "no subdisk definition given");
429			return (-1);
430		}
431		if (gv_find_sd(sc, s2->name) != NULL) {
432			/* Ignore error. */
433			if (*flags & GV_FLAG_F)
434				continue;
435			gctl_error(req, "sd '%s' already exists", s2->name);
436			goto error;
437		}
438
439		s = g_malloc(sizeof(*s), M_WAITOK | M_ZERO);
440		bcopy(s2, s, sizeof(*s));
441
442		gv_post_event(sc, GV_EVENT_CREATE_SD, s, NULL, 0, 0);
443	}
444
445error:
446	gv_post_event(sc, GV_EVENT_SETUP_OBJECTS, sc, NULL, 0, 0);
447	gv_post_event(sc, GV_EVENT_SAVE_CONFIG, sc, NULL, 0, 0);
448
449	return (0);
450}
451
452static void
453gv_config(struct gctl_req *req, struct g_class *mp, char const *verb)
454{
455	struct g_geom *gp;
456	struct gv_softc *sc;
457	struct sbuf *sb;
458	char *comment;
459
460	g_topology_assert();
461
462	gp = LIST_FIRST(&mp->geom);
463	sc = gp->softc;
464
465	if (!strcmp(verb, "attach")) {
466		gv_attach(sc, req);
467
468	} else if (!strcmp(verb, "concat")) {
469		gv_concat(gp, req);
470
471	} else if (!strcmp(verb, "detach")) {
472		gv_detach(sc, req);
473
474	} else if (!strcmp(verb, "list")) {
475		gv_list(gp, req);
476
477	/* Save our configuration back to disk. */
478	} else if (!strcmp(verb, "saveconfig")) {
479		gv_post_event(sc, GV_EVENT_SAVE_CONFIG, sc, NULL, 0, 0);
480
481	/* Return configuration in string form. */
482	} else if (!strcmp(verb, "getconfig")) {
483		comment = gctl_get_param(req, "comment", NULL);
484		if (comment == NULL) {
485			gctl_error(req, "no comment parameter given");
486			return;
487		}
488		sb = sbuf_new(NULL, NULL, GV_CFG_LEN, SBUF_FIXEDLEN);
489		gv_format_config(sc, sb, 0, comment);
490		sbuf_finish(sb);
491		gctl_set_param(req, "config", sbuf_data(sb), sbuf_len(sb) + 1);
492		sbuf_delete(sb);
493
494	} else if (!strcmp(verb, "create")) {
495		gv_create(gp, req);
496
497	} else if (!strcmp(verb, "mirror")) {
498		gv_mirror(gp, req);
499
500	} else if (!strcmp(verb, "move")) {
501		gv_move(gp, req);
502
503	} else if (!strcmp(verb, "raid5")) {
504		gv_raid5(gp, req);
505
506	} else if (!strcmp(verb, "rebuildparity") ||
507	    !strcmp(verb, "checkparity")) {
508		gv_parityop(sc, req);
509
510	} else if (!strcmp(verb, "remove")) {
511		gv_remove(gp, req);
512
513	} else if (!strcmp(verb, "rename")) {
514		gv_rename(gp, req);
515
516	} else if (!strcmp(verb, "resetconfig")) {
517		gv_post_event(sc, GV_EVENT_RESET_CONFIG, sc, NULL, 0, 0);
518
519	} else if (!strcmp(verb, "start")) {
520		gv_start_obj(gp, req);
521
522	} else if (!strcmp(verb, "stripe")) {
523		gv_stripe(gp, req);
524
525	} else if (!strcmp(verb, "setstate")) {
526		gv_setstate(gp, req);
527	} else
528		gctl_error(req, "Unknown verb parameter");
529}
530
531static void
532gv_parityop(struct gv_softc *sc, struct gctl_req *req)
533{
534	struct gv_plex *p;
535	int *flags, *rebuild, type;
536	char *plex;
537
538	plex = gctl_get_param(req, "plex", NULL);
539	if (plex == NULL) {
540		gctl_error(req, "no plex given");
541		return;
542	}
543
544	flags = gctl_get_paraml(req, "flags", sizeof(*flags));
545	if (flags == NULL) {
546		gctl_error(req, "no flags given");
547		return;
548	}
549
550	rebuild = gctl_get_paraml(req, "rebuild", sizeof(*rebuild));
551	if (rebuild == NULL) {
552		gctl_error(req, "no operation given");
553		return;
554	}
555
556	type = gv_object_type(sc, plex);
557	if (type != GV_TYPE_PLEX) {
558		gctl_error(req, "'%s' is not a plex", plex);
559		return;
560	}
561	p = gv_find_plex(sc, plex);
562
563	if (p->state != GV_PLEX_UP) {
564		gctl_error(req, "plex %s is not completely accessible",
565		    p->name);
566		return;
567	}
568
569	if (p->org != GV_PLEX_RAID5) {
570		gctl_error(req, "plex %s is not a RAID5 plex", p->name);
571		return;
572	}
573
574	/* Put it in the event queue. */
575	/* XXX: The state of the plex might have changed when this event is
576	 * picked up ... We should perhaps check this afterwards. */
577	if (*rebuild)
578		gv_post_event(sc, GV_EVENT_PARITY_REBUILD, p, NULL, 0, 0);
579	else
580		gv_post_event(sc, GV_EVENT_PARITY_CHECK, p, NULL, 0, 0);
581}
582
583
584static struct g_geom *
585gv_taste(struct g_class *mp, struct g_provider *pp, int flags __unused)
586{
587	struct g_geom *gp;
588	struct g_consumer *cp;
589	struct gv_softc *sc;
590	struct gv_hdr vhdr;
591	int error;
592
593 	g_topology_assert();
594	g_trace(G_T_TOPOLOGY, "gv_taste(%s, %s)", mp->name, pp->name);
595
596	gp = LIST_FIRST(&mp->geom);
597	if (gp == NULL) {
598		G_VINUM_DEBUG(0, "error: tasting, but not initialized?");
599		return (NULL);
600	}
601	sc = gp->softc;
602
603	cp = g_new_consumer(gp);
604	if (g_attach(cp, pp) != 0) {
605		g_destroy_consumer(cp);
606		return (NULL);
607	}
608	if (g_access(cp, 1, 0, 0) != 0) {
609		g_detach(cp);
610		g_destroy_consumer(cp);
611		return (NULL);
612	}
613	g_topology_unlock();
614
615	error = gv_read_header(cp, &vhdr);
616
617	g_topology_lock();
618	g_access(cp, -1, 0, 0);
619	g_detach(cp);
620	g_destroy_consumer(cp);
621
622	/* Check if what we've been given is a valid vinum drive. */
623	if (!error)
624		gv_post_event(sc, GV_EVENT_DRIVE_TASTED, pp, NULL, 0, 0);
625
626	return (NULL);
627}
628
629void
630gv_worker(void *arg)
631{
632	struct g_provider *pp;
633	struct gv_softc *sc;
634	struct gv_event *ev;
635	struct gv_volume *v;
636	struct gv_plex *p;
637	struct gv_sd *s;
638	struct gv_drive *d;
639	struct bio *bp;
640	int newstate, flags, err, rename;
641	char *newname;
642	off_t offset;
643
644	sc = arg;
645	KASSERT(sc != NULL, ("NULL sc"));
646	for (;;) {
647		/* Look at the events first... */
648		ev = gv_get_event(sc);
649		if (ev != NULL) {
650			gv_remove_event(sc, ev);
651
652			switch (ev->type) {
653			case GV_EVENT_DRIVE_TASTED:
654				G_VINUM_DEBUG(2, "event 'drive tasted'");
655				pp = ev->arg1;
656				gv_drive_tasted(sc, pp);
657				break;
658
659			case GV_EVENT_DRIVE_LOST:
660				G_VINUM_DEBUG(2, "event 'drive lost'");
661				d = ev->arg1;
662				gv_drive_lost(sc, d);
663				break;
664
665			case GV_EVENT_CREATE_DRIVE:
666				G_VINUM_DEBUG(2, "event 'create drive'");
667				d = ev->arg1;
668				gv_create_drive(sc, d);
669				break;
670
671			case GV_EVENT_CREATE_VOLUME:
672				G_VINUM_DEBUG(2, "event 'create volume'");
673				v = ev->arg1;
674				gv_create_volume(sc, v);
675				break;
676
677			case GV_EVENT_CREATE_PLEX:
678				G_VINUM_DEBUG(2, "event 'create plex'");
679				p = ev->arg1;
680				gv_create_plex(sc, p);
681				break;
682
683			case GV_EVENT_CREATE_SD:
684				G_VINUM_DEBUG(2, "event 'create sd'");
685				s = ev->arg1;
686				gv_create_sd(sc, s);
687				break;
688
689			case GV_EVENT_RM_DRIVE:
690				G_VINUM_DEBUG(2, "event 'remove drive'");
691				d = ev->arg1;
692				flags = ev->arg3;
693				gv_rm_drive(sc, d, flags);
694				/*gv_setup_objects(sc);*/
695				break;
696
697			case GV_EVENT_RM_VOLUME:
698				G_VINUM_DEBUG(2, "event 'remove volume'");
699				v = ev->arg1;
700				gv_rm_vol(sc, v);
701				/*gv_setup_objects(sc);*/
702				break;
703
704			case GV_EVENT_RM_PLEX:
705				G_VINUM_DEBUG(2, "event 'remove plex'");
706				p = ev->arg1;
707				gv_rm_plex(sc, p);
708				/*gv_setup_objects(sc);*/
709				break;
710
711			case GV_EVENT_RM_SD:
712				G_VINUM_DEBUG(2, "event 'remove sd'");
713				s = ev->arg1;
714				gv_rm_sd(sc, s);
715				/*gv_setup_objects(sc);*/
716				break;
717
718			case GV_EVENT_SAVE_CONFIG:
719				G_VINUM_DEBUG(2, "event 'save config'");
720				gv_save_config(sc);
721				break;
722
723			case GV_EVENT_SET_SD_STATE:
724				G_VINUM_DEBUG(2, "event 'setstate sd'");
725				s = ev->arg1;
726				newstate = ev->arg3;
727				flags = ev->arg4;
728				err = gv_set_sd_state(s, newstate, flags);
729				if (err)
730					G_VINUM_DEBUG(0, "error setting subdisk"
731					    " state: error code %d", err);
732				break;
733
734			case GV_EVENT_SET_DRIVE_STATE:
735				G_VINUM_DEBUG(2, "event 'setstate drive'");
736				d = ev->arg1;
737				newstate = ev->arg3;
738				flags = ev->arg4;
739				err = gv_set_drive_state(d, newstate, flags);
740				if (err)
741					G_VINUM_DEBUG(0, "error setting drive "
742					    "state: error code %d", err);
743				break;
744
745			case GV_EVENT_SET_VOL_STATE:
746				G_VINUM_DEBUG(2, "event 'setstate volume'");
747				v = ev->arg1;
748				newstate = ev->arg3;
749				flags = ev->arg4;
750				err = gv_set_vol_state(v, newstate, flags);
751				if (err)
752					G_VINUM_DEBUG(0, "error setting volume "
753					    "state: error code %d", err);
754				break;
755
756			case GV_EVENT_SET_PLEX_STATE:
757				G_VINUM_DEBUG(2, "event 'setstate plex'");
758				p = ev->arg1;
759				newstate = ev->arg3;
760				flags = ev->arg4;
761				err = gv_set_plex_state(p, newstate, flags);
762				if (err)
763					G_VINUM_DEBUG(0, "error setting plex "
764					    "state: error code %d", err);
765				break;
766
767			case GV_EVENT_SETUP_OBJECTS:
768				G_VINUM_DEBUG(2, "event 'setup objects'");
769				gv_setup_objects(sc);
770				break;
771
772			case GV_EVENT_RESET_CONFIG:
773				G_VINUM_DEBUG(2, "event 'resetconfig'");
774				err = gv_resetconfig(sc);
775				if (err)
776					G_VINUM_DEBUG(0, "error resetting "
777					    "config: error code %d", err);
778				break;
779
780			case GV_EVENT_PARITY_REBUILD:
781				/*
782				 * Start the rebuild. The gv_plex_done will
783				 * handle issuing of the remaining rebuild bio's
784				 * until it's finished.
785				 */
786				G_VINUM_DEBUG(2, "event 'rebuild'");
787				p = ev->arg1;
788				if (p->state != GV_PLEX_UP) {
789					G_VINUM_DEBUG(0, "plex %s is not "
790					    "completely accessible", p->name);
791					break;
792				}
793				if (p->flags & GV_PLEX_SYNCING ||
794				    p->flags & GV_PLEX_REBUILDING ||
795				    p->flags & GV_PLEX_GROWING) {
796					G_VINUM_DEBUG(0, "plex %s is busy with "
797					    "syncing or parity build", p->name);
798					break;
799				}
800				p->synced = 0;
801				p->flags |= GV_PLEX_REBUILDING;
802				g_topology_assert_not();
803				g_topology_lock();
804				err = gv_access(p->vol_sc->provider, 1, 1, 0);
805				if (err) {
806					G_VINUM_DEBUG(0, "unable to access "
807					    "provider");
808					break;
809				}
810				g_topology_unlock();
811				gv_parity_request(p, GV_BIO_CHECK |
812				    GV_BIO_PARITY, 0);
813				break;
814
815			case GV_EVENT_PARITY_CHECK:
816				/* Start parity check. */
817				G_VINUM_DEBUG(2, "event 'check'");
818				p = ev->arg1;
819				if (p->state != GV_PLEX_UP) {
820					G_VINUM_DEBUG(0, "plex %s is not "
821					    "completely accessible", p->name);
822					break;
823				}
824				if (p->flags & GV_PLEX_SYNCING ||
825				    p->flags & GV_PLEX_REBUILDING ||
826				    p->flags & GV_PLEX_GROWING) {
827					G_VINUM_DEBUG(0, "plex %s is busy with "
828					    "syncing or parity build", p->name);
829					break;
830				}
831				p->synced = 0;
832				g_topology_assert_not();
833				g_topology_lock();
834				err = gv_access(p->vol_sc->provider, 1, 1, 0);
835				if (err) {
836					G_VINUM_DEBUG(0, "unable to access "
837					    "provider");
838					break;
839				}
840				g_topology_unlock();
841				gv_parity_request(p, GV_BIO_CHECK, 0);
842				break;
843
844			case GV_EVENT_START_PLEX:
845				G_VINUM_DEBUG(2, "event 'start' plex");
846				p = ev->arg1;
847				gv_start_plex(p);
848				break;
849
850			case GV_EVENT_START_VOLUME:
851				G_VINUM_DEBUG(2, "event 'start' volume");
852				v = ev->arg1;
853				gv_start_vol(v);
854				break;
855
856			case GV_EVENT_ATTACH_PLEX:
857				G_VINUM_DEBUG(2, "event 'attach' plex");
858				p = ev->arg1;
859				v = ev->arg2;
860				rename = ev->arg4;
861				err = gv_attach_plex(p, v, rename);
862				if (err)
863					G_VINUM_DEBUG(0, "error attaching %s to"
864					    " %s: error code %d", p->name,
865					    v->name, err);
866				break;
867
868			case GV_EVENT_ATTACH_SD:
869				G_VINUM_DEBUG(2, "event 'attach' sd");
870				s = ev->arg1;
871				p = ev->arg2;
872				offset = ev->arg3;
873				rename = ev->arg4;
874				err = gv_attach_sd(s, p, offset, rename);
875				if (err)
876					G_VINUM_DEBUG(0, "error attaching %s to"
877					    " %s: error code %d", s->name,
878					    p->name, err);
879				break;
880
881			case GV_EVENT_DETACH_PLEX:
882				G_VINUM_DEBUG(2, "event 'detach' plex");
883				p = ev->arg1;
884				flags = ev->arg3;
885				err = gv_detach_plex(p, flags);
886				if (err)
887					G_VINUM_DEBUG(0, "error detaching %s: "
888					    "error code %d", p->name, err);
889				break;
890
891			case GV_EVENT_DETACH_SD:
892				G_VINUM_DEBUG(2, "event 'detach' sd");
893				s = ev->arg1;
894				flags = ev->arg3;
895				err = gv_detach_sd(s, flags);
896				if (err)
897					G_VINUM_DEBUG(0, "error detaching %s: "
898					    "error code %d", s->name, err);
899				break;
900
901			case GV_EVENT_RENAME_VOL:
902				G_VINUM_DEBUG(2, "event 'rename' volume");
903				v = ev->arg1;
904				newname = ev->arg2;
905				flags = ev->arg3;
906				err = gv_rename_vol(sc, v, newname, flags);
907				if (err)
908					G_VINUM_DEBUG(0, "error renaming %s to "
909					    "%s: error code %d", v->name,
910					    newname, err);
911				g_free(newname);
912				/* Destroy and recreate the provider if we can. */
913				if (gv_provider_is_open(v->provider)) {
914					G_VINUM_DEBUG(0, "unable to rename "
915					    "provider to %s: provider in use",
916					    v->name);
917					break;
918				}
919				g_topology_lock();
920				g_wither_provider(v->provider, ENOENT);
921				g_topology_unlock();
922				v->provider = NULL;
923				gv_post_event(sc, GV_EVENT_SETUP_OBJECTS, sc,
924				    NULL, 0, 0);
925				break;
926
927			case GV_EVENT_RENAME_PLEX:
928				G_VINUM_DEBUG(2, "event 'rename' plex");
929				p = ev->arg1;
930				newname = ev->arg2;
931				flags = ev->arg3;
932				err = gv_rename_plex(sc, p, newname, flags);
933				if (err)
934					G_VINUM_DEBUG(0, "error renaming %s to "
935					    "%s: error code %d", p->name,
936					    newname, err);
937				g_free(newname);
938				break;
939
940			case GV_EVENT_RENAME_SD:
941				G_VINUM_DEBUG(2, "event 'rename' sd");
942				s = ev->arg1;
943				newname = ev->arg2;
944				flags = ev->arg3;
945				err = gv_rename_sd(sc, s, newname, flags);
946				if (err)
947					G_VINUM_DEBUG(0, "error renaming %s to "
948					    "%s: error code %d", s->name,
949					    newname, err);
950				g_free(newname);
951				break;
952
953			case GV_EVENT_RENAME_DRIVE:
954				G_VINUM_DEBUG(2, "event 'rename' drive");
955				d = ev->arg1;
956				newname = ev->arg2;
957				flags = ev->arg3;
958				err = gv_rename_drive(sc, d, newname, flags);
959				if (err)
960					G_VINUM_DEBUG(0, "error renaming %s to "
961					    "%s: error code %d", d->name,
962					    newname, err);
963				g_free(newname);
964				break;
965
966			case GV_EVENT_MOVE_SD:
967				G_VINUM_DEBUG(2, "event 'move' sd");
968				s = ev->arg1;
969				d = ev->arg2;
970				flags = ev->arg3;
971				err = gv_move_sd(sc, s, d, flags);
972				if (err)
973					G_VINUM_DEBUG(0, "error moving %s to "
974					    "%s: error code %d", s->name,
975					    d->name, err);
976				break;
977
978			case GV_EVENT_THREAD_EXIT:
979				G_VINUM_DEBUG(2, "event 'thread exit'");
980				g_free(ev);
981				mtx_lock(&sc->equeue_mtx);
982				mtx_lock(&sc->bqueue_mtx);
983				gv_cleanup(sc);
984				mtx_destroy(&sc->bqueue_mtx);
985				mtx_destroy(&sc->equeue_mtx);
986				g_free(sc->bqueue_down);
987				g_free(sc->bqueue_up);
988				g_free(sc);
989				kproc_exit(0);
990				/* NOTREACHED */
991
992			default:
993				G_VINUM_DEBUG(1, "unknown event %d", ev->type);
994			}
995
996			g_free(ev);
997			continue;
998		}
999
1000		/* ... then do I/O processing. */
1001		mtx_lock(&sc->bqueue_mtx);
1002		/* First do new requests. */
1003		bp = bioq_takefirst(sc->bqueue_down);
1004		if (bp != NULL) {
1005			mtx_unlock(&sc->bqueue_mtx);
1006			/* A bio that interfered with another bio. */
1007			if (bp->bio_pflags & GV_BIO_ONHOLD) {
1008				s = bp->bio_caller1;
1009				p = s->plex_sc;
1010				/* Is it still locked out? */
1011				if (gv_stripe_active(p, bp)) {
1012					/* Park the bio on the waiting queue. */
1013					bioq_disksort(p->wqueue, bp);
1014				} else {
1015					bp->bio_pflags &= ~GV_BIO_ONHOLD;
1016					g_io_request(bp, s->drive_sc->consumer);
1017				}
1018			/* A special request requireing special handling. */
1019			} else if (bp->bio_pflags & GV_BIO_INTERNAL) {
1020				p = bp->bio_caller1;
1021				gv_plex_start(p, bp);
1022			} else {
1023				gv_volume_start(sc, bp);
1024			}
1025			mtx_lock(&sc->bqueue_mtx);
1026		}
1027		/* Then do completed requests. */
1028		bp = bioq_takefirst(sc->bqueue_up);
1029		if (bp == NULL) {
1030			msleep(sc, &sc->bqueue_mtx, PRIBIO, "-", hz/10);
1031			mtx_unlock(&sc->bqueue_mtx);
1032			continue;
1033		}
1034		mtx_unlock(&sc->bqueue_mtx);
1035		gv_bio_done(sc, bp);
1036	}
1037}
1038
1039#define	VINUM_CLASS_NAME "VINUM"
1040
1041static struct g_class g_vinum_class	= {
1042	.name = VINUM_CLASS_NAME,
1043	.version = G_VERSION,
1044	.init = gv_init,
1045	.taste = gv_taste,
1046	.ctlreq = gv_config,
1047	.destroy_geom = gv_unload,
1048};
1049
1050DECLARE_GEOM_CLASS(g_vinum_class, g_vinum);
1051MODULE_VERSION(geom_vinum, 0);
1052