1/*-
2 *  Copyright (c) 2004, 2007 Lukas Ertl
3 *  Copyright (c) 2007, 2009 Ulf Lilleengen
4 *  All rights reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions
8 * are met:
9 * 1. Redistributions of source code must retain the above copyright
10 *    notice, this list of conditions and the following disclaimer.
11 * 2. Redistributions in binary form must reproduce the above copyright
12 *    notice, this list of conditions and the following disclaimer in the
13 *    documentation and/or other materials provided with the distribution.
14 *
15 * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS ``AS IS'' AND
16 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18 * ARE DISCLAIMED.  IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
19 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
21 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25 * SUCH DAMAGE.
26 *
27 */
28
29#include <sys/cdefs.h>
30__FBSDID("$FreeBSD$");
31
32#include <sys/param.h>
33#include <sys/bio.h>
34#include <sys/kernel.h>
35#include <sys/kthread.h>
36#include <sys/lock.h>
37#include <sys/malloc.h>
38#include <sys/module.h>
39#include <sys/mutex.h>
40#include <sys/sbuf.h>
41#include <sys/sysctl.h>
42#include <sys/systm.h>
43
44#include <geom/geom.h>
45#include <geom/vinum/geom_vinum_var.h>
46#include <geom/vinum/geom_vinum.h>
47#include <geom/vinum/geom_vinum_raid5.h>
48
49SYSCTL_DECL(_kern_geom);
50static SYSCTL_NODE(_kern_geom, OID_AUTO, vinum, CTLFLAG_RW, 0,
51    "GEOM_VINUM stuff");
52u_int g_vinum_debug = 0;
53TUNABLE_INT("kern.geom.vinum.debug", &g_vinum_debug);
54SYSCTL_UINT(_kern_geom_vinum, OID_AUTO, debug, CTLFLAG_RW, &g_vinum_debug, 0,
55    "Debug level");
56
57static int	gv_create(struct g_geom *, struct gctl_req *);
58static void	gv_attach(struct gv_softc *, struct gctl_req *);
59static void	gv_detach(struct gv_softc *, struct gctl_req *);
60static void	gv_parityop(struct gv_softc *, struct gctl_req *);
61
62
63static void
64gv_orphan(struct g_consumer *cp)
65{
66	struct g_geom *gp;
67	struct gv_softc *sc;
68	struct gv_drive *d;
69
70	g_topology_assert();
71
72	KASSERT(cp != NULL, ("gv_orphan: null cp"));
73	gp = cp->geom;
74	KASSERT(gp != NULL, ("gv_orphan: null gp"));
75	sc = gp->softc;
76	KASSERT(sc != NULL, ("gv_orphan: null sc"));
77	d = cp->private;
78	KASSERT(d != NULL, ("gv_orphan: null d"));
79
80	g_trace(G_T_TOPOLOGY, "gv_orphan(%s)", gp->name);
81
82	gv_post_event(sc, GV_EVENT_DRIVE_LOST, d, NULL, 0, 0);
83}
84
85void
86gv_start(struct bio *bp)
87{
88	struct g_geom *gp;
89	struct gv_softc *sc;
90
91	gp = bp->bio_to->geom;
92	sc = gp->softc;
93
94	switch (bp->bio_cmd) {
95	case BIO_READ:
96	case BIO_WRITE:
97	case BIO_DELETE:
98		break;
99	case BIO_GETATTR:
100	default:
101		g_io_deliver(bp, EOPNOTSUPP);
102		return;
103	}
104	mtx_lock(&sc->bqueue_mtx);
105	bioq_disksort(sc->bqueue_down, bp);
106	wakeup(sc);
107	mtx_unlock(&sc->bqueue_mtx);
108}
109
110void
111gv_done(struct bio *bp)
112{
113	struct g_geom *gp;
114	struct gv_softc *sc;
115
116	KASSERT(bp != NULL, ("NULL bp"));
117
118	gp = bp->bio_from->geom;
119	sc = gp->softc;
120
121	mtx_lock(&sc->bqueue_mtx);
122	bioq_disksort(sc->bqueue_up, bp);
123	wakeup(sc);
124	mtx_unlock(&sc->bqueue_mtx);
125}
126
127int
128gv_access(struct g_provider *pp, int dr, int dw, int de)
129{
130	struct g_geom *gp;
131	struct gv_softc *sc;
132	struct gv_drive *d, *d2;
133	int error;
134
135	gp = pp->geom;
136	sc = gp->softc;
137	/*
138	 * We want to modify the read count with the write count in case we have
139	 * plexes in a RAID-5 organization.
140	 */
141	dr += dw;
142
143	LIST_FOREACH(d, &sc->drives, drive) {
144		if (d->consumer == NULL)
145			continue;
146		error = g_access(d->consumer, dr, dw, de);
147		if (error) {
148			LIST_FOREACH(d2, &sc->drives, drive) {
149				if (d == d2)
150					break;
151				g_access(d2->consumer, -dr, -dw, -de);
152			}
153			G_VINUM_DEBUG(0, "g_access '%s' failed: %d", d->name,
154			    error);
155			return (error);
156		}
157	}
158	return (0);
159}
160
161static void
162gv_init(struct g_class *mp)
163{
164	struct g_geom *gp;
165	struct gv_softc *sc;
166
167	g_trace(G_T_TOPOLOGY, "gv_init(%p)", mp);
168
169	gp = g_new_geomf(mp, "VINUM");
170	gp->spoiled = gv_orphan;
171	gp->orphan = gv_orphan;
172	gp->access = gv_access;
173	gp->start = gv_start;
174	gp->softc = g_malloc(sizeof(struct gv_softc), M_WAITOK | M_ZERO);
175	sc = gp->softc;
176	sc->geom = gp;
177	sc->bqueue_down = g_malloc(sizeof(struct bio_queue_head),
178	    M_WAITOK | M_ZERO);
179	sc->bqueue_up = g_malloc(sizeof(struct bio_queue_head),
180	    M_WAITOK | M_ZERO);
181	bioq_init(sc->bqueue_down);
182	bioq_init(sc->bqueue_up);
183	LIST_INIT(&sc->drives);
184	LIST_INIT(&sc->subdisks);
185	LIST_INIT(&sc->plexes);
186	LIST_INIT(&sc->volumes);
187	TAILQ_INIT(&sc->equeue);
188	mtx_init(&sc->config_mtx, "gv_config", NULL, MTX_DEF);
189	mtx_init(&sc->equeue_mtx, "gv_equeue", NULL, MTX_DEF);
190	mtx_init(&sc->bqueue_mtx, "gv_bqueue", NULL, MTX_DEF);
191	kproc_create(gv_worker, sc, &sc->worker, 0, 0, "gv_worker");
192}
193
194static int
195gv_unload(struct gctl_req *req, struct g_class *mp, struct g_geom *gp)
196{
197	struct gv_softc *sc;
198
199	g_trace(G_T_TOPOLOGY, "gv_unload(%p)", mp);
200
201	g_topology_assert();
202	sc = gp->softc;
203
204	if (sc != NULL) {
205		gv_worker_exit(sc);
206		gp->softc = NULL;
207		g_wither_geom(gp, ENXIO);
208	}
209
210	return (0);
211}
212
213/* Handle userland request of attaching object. */
214static void
215gv_attach(struct gv_softc *sc, struct gctl_req *req)
216{
217	struct gv_volume *v;
218	struct gv_plex *p;
219	struct gv_sd *s;
220	off_t *offset;
221	int *rename, type_child, type_parent;
222	char *child, *parent;
223
224	child = gctl_get_param(req, "child", NULL);
225	if (child == NULL) {
226		gctl_error(req, "no child given");
227		return;
228	}
229	parent = gctl_get_param(req, "parent", NULL);
230	if (parent == NULL) {
231		gctl_error(req, "no parent given");
232		return;
233	}
234	offset = gctl_get_paraml(req, "offset", sizeof(*offset));
235	if (offset == NULL) {
236		gctl_error(req, "no offset given");
237		return;
238	}
239	rename = gctl_get_paraml(req, "rename", sizeof(*rename));
240	if (rename == NULL) {
241		gctl_error(req, "no rename flag given");
242		return;
243	}
244
245	type_child = gv_object_type(sc, child);
246	type_parent = gv_object_type(sc, parent);
247
248	switch (type_child) {
249	case GV_TYPE_PLEX:
250		if (type_parent != GV_TYPE_VOL) {
251			gctl_error(req, "no such volume to attach to");
252			return;
253		}
254		v = gv_find_vol(sc, parent);
255		p = gv_find_plex(sc, child);
256		gv_post_event(sc, GV_EVENT_ATTACH_PLEX, p, v, *offset, *rename);
257		break;
258	case GV_TYPE_SD:
259		if (type_parent != GV_TYPE_PLEX) {
260			gctl_error(req, "no such plex to attach to");
261			return;
262		}
263		p = gv_find_plex(sc, parent);
264		s = gv_find_sd(sc, child);
265		gv_post_event(sc, GV_EVENT_ATTACH_SD, s, p, *offset, *rename);
266		break;
267	default:
268		gctl_error(req, "invalid child type");
269		break;
270	}
271}
272
273/* Handle userland request of detaching object. */
274static void
275gv_detach(struct gv_softc *sc, struct gctl_req *req)
276{
277	struct gv_plex *p;
278	struct gv_sd *s;
279	int *flags, type;
280	char *object;
281
282	object = gctl_get_param(req, "object", NULL);
283	if (object == NULL) {
284		gctl_error(req, "no argument given");
285		return;
286	}
287
288	flags = gctl_get_paraml(req, "flags", sizeof(*flags));
289	type = gv_object_type(sc, object);
290	switch (type) {
291	case GV_TYPE_PLEX:
292		p = gv_find_plex(sc, object);
293		gv_post_event(sc, GV_EVENT_DETACH_PLEX, p, NULL, *flags, 0);
294		break;
295	case GV_TYPE_SD:
296		s = gv_find_sd(sc, object);
297		gv_post_event(sc, GV_EVENT_DETACH_SD, s, NULL, *flags, 0);
298		break;
299	default:
300		gctl_error(req, "invalid object type");
301		break;
302	}
303}
304
305/* Handle userland requests for creating new objects. */
306static int
307gv_create(struct g_geom *gp, struct gctl_req *req)
308{
309	struct gv_softc *sc;
310	struct gv_drive *d, *d2;
311	struct gv_plex *p, *p2;
312	struct gv_sd *s, *s2;
313	struct gv_volume *v, *v2;
314	struct g_provider *pp;
315	int error, i, *drives, *flags, *plexes, *subdisks, *volumes;
316	char buf[20];
317
318	g_topology_assert();
319
320	sc = gp->softc;
321
322	/* Find out how many of each object have been passed in. */
323	volumes = gctl_get_paraml(req, "volumes", sizeof(*volumes));
324	plexes = gctl_get_paraml(req, "plexes", sizeof(*plexes));
325	subdisks = gctl_get_paraml(req, "subdisks", sizeof(*subdisks));
326	drives = gctl_get_paraml(req, "drives", sizeof(*drives));
327	if (volumes == NULL || plexes == NULL || subdisks == NULL ||
328	    drives == NULL) {
329		gctl_error(req, "number of objects not given");
330		return (-1);
331	}
332	flags = gctl_get_paraml(req, "flags", sizeof(*flags));
333	if (flags == NULL) {
334		gctl_error(req, "flags not given");
335		return (-1);
336	}
337
338	/* First, handle drive definitions ... */
339	for (i = 0; i < *drives; i++) {
340		snprintf(buf, sizeof(buf), "drive%d", i);
341		d2 = gctl_get_paraml(req, buf, sizeof(*d2));
342		if (d2 == NULL) {
343			gctl_error(req, "no drive definition given");
344			return (-1);
345		}
346		/*
347		 * Make sure that the device specified in the drive config is
348		 * an active GEOM provider.
349		 */
350		pp = g_provider_by_name(d2->device);
351		if (pp == NULL) {
352			gctl_error(req, "%s: device not found", d2->device);
353			goto error;
354		}
355		if (gv_find_drive(sc, d2->name) != NULL) {
356			/* Ignore error. */
357			if (*flags & GV_FLAG_F)
358				continue;
359			gctl_error(req, "drive '%s' already exists", d2->name);
360			goto error;
361		}
362		if (gv_find_drive_device(sc, d2->device) != NULL) {
363			gctl_error(req, "device '%s' already configured in "
364			    "gvinum", d2->device);
365			goto error;
366		}
367
368
369		d = g_malloc(sizeof(*d), M_WAITOK | M_ZERO);
370		bcopy(d2, d, sizeof(*d));
371
372		gv_post_event(sc, GV_EVENT_CREATE_DRIVE, d, NULL, 0, 0);
373	}
374
375	/* ... then volume definitions ... */
376	for (i = 0; i < *volumes; i++) {
377		error = 0;
378		snprintf(buf, sizeof(buf), "volume%d", i);
379		v2 = gctl_get_paraml(req, buf, sizeof(*v2));
380		if (v2 == NULL) {
381			gctl_error(req, "no volume definition given");
382			return (-1);
383		}
384		if (gv_find_vol(sc, v2->name) != NULL) {
385			/* Ignore error. */
386			if (*flags & GV_FLAG_F)
387				continue;
388			gctl_error(req, "volume '%s' already exists", v2->name);
389			goto error;
390		}
391
392		v = g_malloc(sizeof(*v), M_WAITOK | M_ZERO);
393		bcopy(v2, v, sizeof(*v));
394
395		gv_post_event(sc, GV_EVENT_CREATE_VOLUME, v, NULL, 0, 0);
396	}
397
398	/* ... then plex definitions ... */
399	for (i = 0; i < *plexes; i++) {
400		error = 0;
401		snprintf(buf, sizeof(buf), "plex%d", i);
402		p2 = gctl_get_paraml(req, buf, sizeof(*p2));
403		if (p2 == NULL) {
404			gctl_error(req, "no plex definition given");
405			return (-1);
406		}
407		if (gv_find_plex(sc, p2->name) != NULL) {
408			/* Ignore error. */
409			if (*flags & GV_FLAG_F)
410				continue;
411			gctl_error(req, "plex '%s' already exists", p2->name);
412			goto error;
413		}
414
415		p = g_malloc(sizeof(*p), M_WAITOK | M_ZERO);
416		bcopy(p2, p, sizeof(*p));
417
418		gv_post_event(sc, GV_EVENT_CREATE_PLEX, p, NULL, 0, 0);
419	}
420
421	/* ... and, finally, subdisk definitions. */
422	for (i = 0; i < *subdisks; i++) {
423		error = 0;
424		snprintf(buf, sizeof(buf), "sd%d", i);
425		s2 = gctl_get_paraml(req, buf, sizeof(*s2));
426		if (s2 == NULL) {
427			gctl_error(req, "no subdisk definition given");
428			return (-1);
429		}
430		if (gv_find_sd(sc, s2->name) != NULL) {
431			/* Ignore error. */
432			if (*flags & GV_FLAG_F)
433				continue;
434			gctl_error(req, "sd '%s' already exists", s2->name);
435			goto error;
436		}
437
438		s = g_malloc(sizeof(*s), M_WAITOK | M_ZERO);
439		bcopy(s2, s, sizeof(*s));
440
441		gv_post_event(sc, GV_EVENT_CREATE_SD, s, NULL, 0, 0);
442	}
443
444error:
445	gv_post_event(sc, GV_EVENT_SETUP_OBJECTS, sc, NULL, 0, 0);
446	gv_post_event(sc, GV_EVENT_SAVE_CONFIG, sc, NULL, 0, 0);
447
448	return (0);
449}
450
451static void
452gv_config(struct gctl_req *req, struct g_class *mp, char const *verb)
453{
454	struct g_geom *gp;
455	struct gv_softc *sc;
456	struct sbuf *sb;
457	char *comment;
458
459	g_topology_assert();
460
461	gp = LIST_FIRST(&mp->geom);
462	sc = gp->softc;
463
464	if (!strcmp(verb, "attach")) {
465		gv_attach(sc, req);
466
467	} else if (!strcmp(verb, "concat")) {
468		gv_concat(gp, req);
469
470	} else if (!strcmp(verb, "detach")) {
471		gv_detach(sc, req);
472
473	} else if (!strcmp(verb, "list")) {
474		gv_list(gp, req);
475
476	/* Save our configuration back to disk. */
477	} else if (!strcmp(verb, "saveconfig")) {
478		gv_post_event(sc, GV_EVENT_SAVE_CONFIG, sc, NULL, 0, 0);
479
480	/* Return configuration in string form. */
481	} else if (!strcmp(verb, "getconfig")) {
482		comment = gctl_get_param(req, "comment", NULL);
483		if (comment == NULL) {
484			gctl_error(req, "no comment parameter given");
485			return;
486		}
487		sb = sbuf_new(NULL, NULL, GV_CFG_LEN, SBUF_FIXEDLEN);
488		gv_format_config(sc, sb, 0, comment);
489		sbuf_finish(sb);
490		gctl_set_param(req, "config", sbuf_data(sb), sbuf_len(sb) + 1);
491		sbuf_delete(sb);
492
493	} else if (!strcmp(verb, "create")) {
494		gv_create(gp, req);
495
496	} else if (!strcmp(verb, "mirror")) {
497		gv_mirror(gp, req);
498
499	} else if (!strcmp(verb, "move")) {
500		gv_move(gp, req);
501
502	} else if (!strcmp(verb, "raid5")) {
503		gv_raid5(gp, req);
504
505	} else if (!strcmp(verb, "rebuildparity") ||
506	    !strcmp(verb, "checkparity")) {
507		gv_parityop(sc, req);
508
509	} else if (!strcmp(verb, "remove")) {
510		gv_remove(gp, req);
511
512	} else if (!strcmp(verb, "rename")) {
513		gv_rename(gp, req);
514
515	} else if (!strcmp(verb, "resetconfig")) {
516		gv_post_event(sc, GV_EVENT_RESET_CONFIG, sc, NULL, 0, 0);
517
518	} else if (!strcmp(verb, "start")) {
519		gv_start_obj(gp, req);
520
521	} else if (!strcmp(verb, "stripe")) {
522		gv_stripe(gp, req);
523
524	} else if (!strcmp(verb, "setstate")) {
525		gv_setstate(gp, req);
526	} else
527		gctl_error(req, "Unknown verb parameter");
528}
529
530static void
531gv_parityop(struct gv_softc *sc, struct gctl_req *req)
532{
533	struct gv_plex *p;
534	int *flags, *rebuild, type;
535	char *plex;
536
537	plex = gctl_get_param(req, "plex", NULL);
538	if (plex == NULL) {
539		gctl_error(req, "no plex given");
540		return;
541	}
542
543	flags = gctl_get_paraml(req, "flags", sizeof(*flags));
544	if (flags == NULL) {
545		gctl_error(req, "no flags given");
546		return;
547	}
548
549	rebuild = gctl_get_paraml(req, "rebuild", sizeof(*rebuild));
550	if (rebuild == NULL) {
551		gctl_error(req, "no operation given");
552		return;
553	}
554
555	type = gv_object_type(sc, plex);
556	if (type != GV_TYPE_PLEX) {
557		gctl_error(req, "'%s' is not a plex", plex);
558		return;
559	}
560	p = gv_find_plex(sc, plex);
561
562	if (p->state != GV_PLEX_UP) {
563		gctl_error(req, "plex %s is not completely accessible",
564		    p->name);
565		return;
566	}
567
568	if (p->org != GV_PLEX_RAID5) {
569		gctl_error(req, "plex %s is not a RAID5 plex", p->name);
570		return;
571	}
572
573	/* Put it in the event queue. */
574	/* XXX: The state of the plex might have changed when this event is
575	 * picked up ... We should perhaps check this afterwards. */
576	if (*rebuild)
577		gv_post_event(sc, GV_EVENT_PARITY_REBUILD, p, NULL, 0, 0);
578	else
579		gv_post_event(sc, GV_EVENT_PARITY_CHECK, p, NULL, 0, 0);
580}
581
582
583static struct g_geom *
584gv_taste(struct g_class *mp, struct g_provider *pp, int flags __unused)
585{
586	struct g_geom *gp;
587	struct g_consumer *cp;
588	struct gv_softc *sc;
589	struct gv_hdr vhdr;
590	int error;
591
592 	g_topology_assert();
593	g_trace(G_T_TOPOLOGY, "gv_taste(%s, %s)", mp->name, pp->name);
594
595	gp = LIST_FIRST(&mp->geom);
596	if (gp == NULL) {
597		G_VINUM_DEBUG(0, "error: tasting, but not initialized?");
598		return (NULL);
599	}
600	sc = gp->softc;
601
602	cp = g_new_consumer(gp);
603	if (g_attach(cp, pp) != 0) {
604		g_destroy_consumer(cp);
605		return (NULL);
606	}
607	if (g_access(cp, 1, 0, 0) != 0) {
608		g_detach(cp);
609		g_destroy_consumer(cp);
610		return (NULL);
611	}
612	g_topology_unlock();
613
614	error = gv_read_header(cp, &vhdr);
615
616	g_topology_lock();
617	g_access(cp, -1, 0, 0);
618	g_detach(cp);
619	g_destroy_consumer(cp);
620
621	/* Check if what we've been given is a valid vinum drive. */
622	if (!error)
623		gv_post_event(sc, GV_EVENT_DRIVE_TASTED, pp, NULL, 0, 0);
624
625	return (NULL);
626}
627
628void
629gv_worker(void *arg)
630{
631	struct g_provider *pp;
632	struct gv_softc *sc;
633	struct gv_event *ev;
634	struct gv_volume *v;
635	struct gv_plex *p;
636	struct gv_sd *s;
637	struct gv_drive *d;
638	struct bio *bp;
639	int newstate, flags, err, rename;
640	char *newname;
641	off_t offset;
642
643	sc = arg;
644	KASSERT(sc != NULL, ("NULL sc"));
645	for (;;) {
646		/* Look at the events first... */
647		ev = gv_get_event(sc);
648		if (ev != NULL) {
649			gv_remove_event(sc, ev);
650
651			switch (ev->type) {
652			case GV_EVENT_DRIVE_TASTED:
653				G_VINUM_DEBUG(2, "event 'drive tasted'");
654				pp = ev->arg1;
655				gv_drive_tasted(sc, pp);
656				break;
657
658			case GV_EVENT_DRIVE_LOST:
659				G_VINUM_DEBUG(2, "event 'drive lost'");
660				d = ev->arg1;
661				gv_drive_lost(sc, d);
662				break;
663
664			case GV_EVENT_CREATE_DRIVE:
665				G_VINUM_DEBUG(2, "event 'create drive'");
666				d = ev->arg1;
667				gv_create_drive(sc, d);
668				break;
669
670			case GV_EVENT_CREATE_VOLUME:
671				G_VINUM_DEBUG(2, "event 'create volume'");
672				v = ev->arg1;
673				gv_create_volume(sc, v);
674				break;
675
676			case GV_EVENT_CREATE_PLEX:
677				G_VINUM_DEBUG(2, "event 'create plex'");
678				p = ev->arg1;
679				gv_create_plex(sc, p);
680				break;
681
682			case GV_EVENT_CREATE_SD:
683				G_VINUM_DEBUG(2, "event 'create sd'");
684				s = ev->arg1;
685				gv_create_sd(sc, s);
686				break;
687
688			case GV_EVENT_RM_DRIVE:
689				G_VINUM_DEBUG(2, "event 'remove drive'");
690				d = ev->arg1;
691				flags = ev->arg3;
692				gv_rm_drive(sc, d, flags);
693				/*gv_setup_objects(sc);*/
694				break;
695
696			case GV_EVENT_RM_VOLUME:
697				G_VINUM_DEBUG(2, "event 'remove volume'");
698				v = ev->arg1;
699				gv_rm_vol(sc, v);
700				/*gv_setup_objects(sc);*/
701				break;
702
703			case GV_EVENT_RM_PLEX:
704				G_VINUM_DEBUG(2, "event 'remove plex'");
705				p = ev->arg1;
706				gv_rm_plex(sc, p);
707				/*gv_setup_objects(sc);*/
708				break;
709
710			case GV_EVENT_RM_SD:
711				G_VINUM_DEBUG(2, "event 'remove sd'");
712				s = ev->arg1;
713				gv_rm_sd(sc, s);
714				/*gv_setup_objects(sc);*/
715				break;
716
717			case GV_EVENT_SAVE_CONFIG:
718				G_VINUM_DEBUG(2, "event 'save config'");
719				gv_save_config(sc);
720				break;
721
722			case GV_EVENT_SET_SD_STATE:
723				G_VINUM_DEBUG(2, "event 'setstate sd'");
724				s = ev->arg1;
725				newstate = ev->arg3;
726				flags = ev->arg4;
727				err = gv_set_sd_state(s, newstate, flags);
728				if (err)
729					G_VINUM_DEBUG(0, "error setting subdisk"
730					    " state: error code %d", err);
731				break;
732
733			case GV_EVENT_SET_DRIVE_STATE:
734				G_VINUM_DEBUG(2, "event 'setstate drive'");
735				d = ev->arg1;
736				newstate = ev->arg3;
737				flags = ev->arg4;
738				err = gv_set_drive_state(d, newstate, flags);
739				if (err)
740					G_VINUM_DEBUG(0, "error setting drive "
741					    "state: error code %d", err);
742				break;
743
744			case GV_EVENT_SET_VOL_STATE:
745				G_VINUM_DEBUG(2, "event 'setstate volume'");
746				v = ev->arg1;
747				newstate = ev->arg3;
748				flags = ev->arg4;
749				err = gv_set_vol_state(v, newstate, flags);
750				if (err)
751					G_VINUM_DEBUG(0, "error setting volume "
752					    "state: error code %d", err);
753				break;
754
755			case GV_EVENT_SET_PLEX_STATE:
756				G_VINUM_DEBUG(2, "event 'setstate plex'");
757				p = ev->arg1;
758				newstate = ev->arg3;
759				flags = ev->arg4;
760				err = gv_set_plex_state(p, newstate, flags);
761				if (err)
762					G_VINUM_DEBUG(0, "error setting plex "
763					    "state: error code %d", err);
764				break;
765
766			case GV_EVENT_SETUP_OBJECTS:
767				G_VINUM_DEBUG(2, "event 'setup objects'");
768				gv_setup_objects(sc);
769				break;
770
771			case GV_EVENT_RESET_CONFIG:
772				G_VINUM_DEBUG(2, "event 'resetconfig'");
773				err = gv_resetconfig(sc);
774				if (err)
775					G_VINUM_DEBUG(0, "error resetting "
776					    "config: error code %d", err);
777				break;
778
779			case GV_EVENT_PARITY_REBUILD:
780				/*
781				 * Start the rebuild. The gv_plex_done will
782				 * handle issuing of the remaining rebuild bio's
783				 * until it's finished.
784				 */
785				G_VINUM_DEBUG(2, "event 'rebuild'");
786				p = ev->arg1;
787				if (p->state != GV_PLEX_UP) {
788					G_VINUM_DEBUG(0, "plex %s is not "
789					    "completely accessible", p->name);
790					break;
791				}
792				if (p->flags & GV_PLEX_SYNCING ||
793				    p->flags & GV_PLEX_REBUILDING ||
794				    p->flags & GV_PLEX_GROWING) {
795					G_VINUM_DEBUG(0, "plex %s is busy with "
796					    "syncing or parity build", p->name);
797					break;
798				}
799				p->synced = 0;
800				p->flags |= GV_PLEX_REBUILDING;
801				g_topology_assert_not();
802				g_topology_lock();
803				err = gv_access(p->vol_sc->provider, 1, 1, 0);
804				if (err) {
805					G_VINUM_DEBUG(0, "unable to access "
806					    "provider");
807					break;
808				}
809				g_topology_unlock();
810				gv_parity_request(p, GV_BIO_CHECK |
811				    GV_BIO_PARITY, 0);
812				break;
813
814			case GV_EVENT_PARITY_CHECK:
815				/* Start parity check. */
816				G_VINUM_DEBUG(2, "event 'check'");
817				p = ev->arg1;
818				if (p->state != GV_PLEX_UP) {
819					G_VINUM_DEBUG(0, "plex %s is not "
820					    "completely accessible", p->name);
821					break;
822				}
823				if (p->flags & GV_PLEX_SYNCING ||
824				    p->flags & GV_PLEX_REBUILDING ||
825				    p->flags & GV_PLEX_GROWING) {
826					G_VINUM_DEBUG(0, "plex %s is busy with "
827					    "syncing or parity build", p->name);
828					break;
829				}
830				p->synced = 0;
831				g_topology_assert_not();
832				g_topology_lock();
833				err = gv_access(p->vol_sc->provider, 1, 1, 0);
834				if (err) {
835					G_VINUM_DEBUG(0, "unable to access "
836					    "provider");
837					break;
838				}
839				g_topology_unlock();
840				gv_parity_request(p, GV_BIO_CHECK, 0);
841				break;
842
843			case GV_EVENT_START_PLEX:
844				G_VINUM_DEBUG(2, "event 'start' plex");
845				p = ev->arg1;
846				gv_start_plex(p);
847				break;
848
849			case GV_EVENT_START_VOLUME:
850				G_VINUM_DEBUG(2, "event 'start' volume");
851				v = ev->arg1;
852				gv_start_vol(v);
853				break;
854
855			case GV_EVENT_ATTACH_PLEX:
856				G_VINUM_DEBUG(2, "event 'attach' plex");
857				p = ev->arg1;
858				v = ev->arg2;
859				rename = ev->arg4;
860				err = gv_attach_plex(p, v, rename);
861				if (err)
862					G_VINUM_DEBUG(0, "error attaching %s to"
863					    " %s: error code %d", p->name,
864					    v->name, err);
865				break;
866
867			case GV_EVENT_ATTACH_SD:
868				G_VINUM_DEBUG(2, "event 'attach' sd");
869				s = ev->arg1;
870				p = ev->arg2;
871				offset = ev->arg3;
872				rename = ev->arg4;
873				err = gv_attach_sd(s, p, offset, rename);
874				if (err)
875					G_VINUM_DEBUG(0, "error attaching %s to"
876					    " %s: error code %d", s->name,
877					    p->name, err);
878				break;
879
880			case GV_EVENT_DETACH_PLEX:
881				G_VINUM_DEBUG(2, "event 'detach' plex");
882				p = ev->arg1;
883				flags = ev->arg3;
884				err = gv_detach_plex(p, flags);
885				if (err)
886					G_VINUM_DEBUG(0, "error detaching %s: "
887					    "error code %d", p->name, err);
888				break;
889
890			case GV_EVENT_DETACH_SD:
891				G_VINUM_DEBUG(2, "event 'detach' sd");
892				s = ev->arg1;
893				flags = ev->arg3;
894				err = gv_detach_sd(s, flags);
895				if (err)
896					G_VINUM_DEBUG(0, "error detaching %s: "
897					    "error code %d", s->name, err);
898				break;
899
900			case GV_EVENT_RENAME_VOL:
901				G_VINUM_DEBUG(2, "event 'rename' volume");
902				v = ev->arg1;
903				newname = ev->arg2;
904				flags = ev->arg3;
905				err = gv_rename_vol(sc, v, newname, flags);
906				if (err)
907					G_VINUM_DEBUG(0, "error renaming %s to "
908					    "%s: error code %d", v->name,
909					    newname, err);
910				g_free(newname);
911				/* Destroy and recreate the provider if we can. */
912				if (gv_provider_is_open(v->provider)) {
913					G_VINUM_DEBUG(0, "unable to rename "
914					    "provider to %s: provider in use",
915					    v->name);
916					break;
917				}
918				g_topology_lock();
919				g_wither_provider(v->provider, ENOENT);
920				g_topology_unlock();
921				v->provider = NULL;
922				gv_post_event(sc, GV_EVENT_SETUP_OBJECTS, sc,
923				    NULL, 0, 0);
924				break;
925
926			case GV_EVENT_RENAME_PLEX:
927				G_VINUM_DEBUG(2, "event 'rename' plex");
928				p = ev->arg1;
929				newname = ev->arg2;
930				flags = ev->arg3;
931				err = gv_rename_plex(sc, p, newname, flags);
932				if (err)
933					G_VINUM_DEBUG(0, "error renaming %s to "
934					    "%s: error code %d", p->name,
935					    newname, err);
936				g_free(newname);
937				break;
938
939			case GV_EVENT_RENAME_SD:
940				G_VINUM_DEBUG(2, "event 'rename' sd");
941				s = ev->arg1;
942				newname = ev->arg2;
943				flags = ev->arg3;
944				err = gv_rename_sd(sc, s, newname, flags);
945				if (err)
946					G_VINUM_DEBUG(0, "error renaming %s to "
947					    "%s: error code %d", s->name,
948					    newname, err);
949				g_free(newname);
950				break;
951
952			case GV_EVENT_RENAME_DRIVE:
953				G_VINUM_DEBUG(2, "event 'rename' drive");
954				d = ev->arg1;
955				newname = ev->arg2;
956				flags = ev->arg3;
957				err = gv_rename_drive(sc, d, newname, flags);
958				if (err)
959					G_VINUM_DEBUG(0, "error renaming %s to "
960					    "%s: error code %d", d->name,
961					    newname, err);
962				g_free(newname);
963				break;
964
965			case GV_EVENT_MOVE_SD:
966				G_VINUM_DEBUG(2, "event 'move' sd");
967				s = ev->arg1;
968				d = ev->arg2;
969				flags = ev->arg3;
970				err = gv_move_sd(sc, s, d, flags);
971				if (err)
972					G_VINUM_DEBUG(0, "error moving %s to "
973					    "%s: error code %d", s->name,
974					    d->name, err);
975				break;
976
977			case GV_EVENT_THREAD_EXIT:
978				G_VINUM_DEBUG(2, "event 'thread exit'");
979				g_free(ev);
980				mtx_lock(&sc->equeue_mtx);
981				mtx_lock(&sc->bqueue_mtx);
982				gv_cleanup(sc);
983				mtx_destroy(&sc->bqueue_mtx);
984				mtx_destroy(&sc->equeue_mtx);
985				g_free(sc->bqueue_down);
986				g_free(sc->bqueue_up);
987				g_free(sc);
988				kproc_exit(0);
989				/* NOTREACHED */
990
991			default:
992				G_VINUM_DEBUG(1, "unknown event %d", ev->type);
993			}
994
995			g_free(ev);
996			continue;
997		}
998
999		/* ... then do I/O processing. */
1000		mtx_lock(&sc->bqueue_mtx);
1001		/* First do new requests. */
1002		bp = bioq_takefirst(sc->bqueue_down);
1003		if (bp != NULL) {
1004			mtx_unlock(&sc->bqueue_mtx);
1005			/* A bio that interfered with another bio. */
1006			if (bp->bio_pflags & GV_BIO_ONHOLD) {
1007				s = bp->bio_caller1;
1008				p = s->plex_sc;
1009				/* Is it still locked out? */
1010				if (gv_stripe_active(p, bp)) {
1011					/* Park the bio on the waiting queue. */
1012					bioq_disksort(p->wqueue, bp);
1013				} else {
1014					bp->bio_pflags &= ~GV_BIO_ONHOLD;
1015					g_io_request(bp, s->drive_sc->consumer);
1016				}
1017			/* A special request requireing special handling. */
1018			} else if (bp->bio_pflags & GV_BIO_INTERNAL) {
1019				p = bp->bio_caller1;
1020				gv_plex_start(p, bp);
1021			} else {
1022				gv_volume_start(sc, bp);
1023			}
1024			mtx_lock(&sc->bqueue_mtx);
1025		}
1026		/* Then do completed requests. */
1027		bp = bioq_takefirst(sc->bqueue_up);
1028		if (bp == NULL) {
1029			msleep(sc, &sc->bqueue_mtx, PRIBIO, "-", hz/10);
1030			mtx_unlock(&sc->bqueue_mtx);
1031			continue;
1032		}
1033		mtx_unlock(&sc->bqueue_mtx);
1034		gv_bio_done(sc, bp);
1035	}
1036}
1037
1038#define	VINUM_CLASS_NAME "VINUM"
1039
1040static struct g_class g_vinum_class	= {
1041	.name = VINUM_CLASS_NAME,
1042	.version = G_VERSION,
1043	.init = gv_init,
1044	.taste = gv_taste,
1045	.ctlreq = gv_config,
1046	.destroy_geom = gv_unload,
1047};
1048
1049DECLARE_GEOM_CLASS(g_vinum_class, g_vinum);
1050