]> CyberLeo.Net >> Repos - FreeBSD/releng/9.2.git/blob - sys/geom/vinum/geom_vinum.c
- Copy stable/9 to releng/9.2 as part of the 9.2-RELEASE cycle.
[FreeBSD/releng/9.2.git] / sys / geom / vinum / geom_vinum.c
1 /*-
2  *  Copyright (c) 2004, 2007 Lukas Ertl
3  *  Copyright (c) 2007, 2009 Ulf Lilleengen
4  *  All rights reserved.
5  * 
6  * Redistribution and use in source and binary forms, with or without
7  * modification, are permitted provided that the following conditions
8  * are met:
9  * 1. Redistributions of source code must retain the above copyright
10  *    notice, this list of conditions and the following disclaimer.
11  * 2. Redistributions in binary form must reproduce the above copyright
12  *    notice, this list of conditions and the following disclaimer in the
13  *    documentation and/or other materials provided with the distribution.
14  * 
15  * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS ``AS IS'' AND
16  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18  * ARE DISCLAIMED.  IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE
19  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
21  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25  * SUCH DAMAGE.
26  *
27  */
28
29 #include <sys/cdefs.h>
30 __FBSDID("$FreeBSD$");
31
32 #include <sys/param.h>
33 #include <sys/bio.h>
34 #include <sys/kernel.h>
35 #include <sys/kthread.h>
36 #include <sys/lock.h>
37 #include <sys/malloc.h>
38 #include <sys/module.h>
39 #include <sys/mutex.h>
40 #include <sys/sbuf.h>
41 #include <sys/sysctl.h>
42 #include <sys/systm.h>
43
44 #include <geom/geom.h>
45 #include <geom/vinum/geom_vinum_var.h>
46 #include <geom/vinum/geom_vinum.h>
47 #include <geom/vinum/geom_vinum_raid5.h>
48
/* Bring the parent kern.geom sysctl node into scope for the entries below. */
SYSCTL_DECL(_kern_geom);
/* kern.geom.vinum: container node for the gvinum sysctl entries. */
static SYSCTL_NODE(_kern_geom, OID_AUTO, vinum, CTLFLAG_RW, 0,
    "GEOM_VINUM stuff");
/*
 * Debug level consulted by G_VINUM_DEBUG().  It is registered under the
 * name kern.geom.vinum.debug both as a tunable and as a read/write sysctl.
 */
u_int g_vinum_debug = 0;
TUNABLE_INT("kern.geom.vinum.debug", &g_vinum_debug);
SYSCTL_UINT(_kern_geom_vinum, OID_AUTO, debug, CTLFLAG_RW, &g_vinum_debug, 0,
    "Debug level");

/* Forward declarations of the request handlers defined later in this file. */
static int      gv_create(struct g_geom *, struct gctl_req *);
static void     gv_attach(struct gv_softc *, struct gctl_req *);
static void     gv_detach(struct gv_softc *, struct gctl_req *);
static void     gv_parityop(struct gv_softc *, struct gctl_req *);
61
62
63 static void
64 gv_orphan(struct g_consumer *cp)
65 {
66         struct g_geom *gp;
67         struct gv_softc *sc;
68         struct gv_drive *d;
69         
70         g_topology_assert();
71
72         KASSERT(cp != NULL, ("gv_orphan: null cp"));
73         gp = cp->geom;
74         KASSERT(gp != NULL, ("gv_orphan: null gp"));
75         sc = gp->softc;
76         KASSERT(sc != NULL, ("gv_orphan: null sc"));
77         d = cp->private;
78         KASSERT(d != NULL, ("gv_orphan: null d"));
79
80         g_trace(G_T_TOPOLOGY, "gv_orphan(%s)", gp->name);
81
82         gv_post_event(sc, GV_EVENT_DRIVE_LOST, d, NULL, 0, 0);
83 }
84
85 void
86 gv_start(struct bio *bp)
87 {
88         struct g_geom *gp;
89         struct gv_softc *sc;
90         
91         gp = bp->bio_to->geom;
92         sc = gp->softc;
93
94         switch (bp->bio_cmd) {
95         case BIO_READ:
96         case BIO_WRITE:
97         case BIO_DELETE:
98                 break;
99         case BIO_GETATTR:
100         default:
101                 g_io_deliver(bp, EOPNOTSUPP);
102                 return;
103         }
104         mtx_lock(&sc->bqueue_mtx);
105         bioq_disksort(sc->bqueue_down, bp);
106         wakeup(sc);
107         mtx_unlock(&sc->bqueue_mtx);
108 }
109
110 void
111 gv_done(struct bio *bp)
112 {
113         struct g_geom *gp;
114         struct gv_softc *sc;
115         
116         KASSERT(bp != NULL, ("NULL bp"));
117
118         gp = bp->bio_from->geom;
119         sc = gp->softc;
120
121         mtx_lock(&sc->bqueue_mtx);
122         bioq_disksort(sc->bqueue_up, bp);
123         wakeup(sc);
124         mtx_unlock(&sc->bqueue_mtx);
125 }
126
127 int
128 gv_access(struct g_provider *pp, int dr, int dw, int de)
129 {
130         struct g_geom *gp;
131         struct gv_softc *sc;
132         struct gv_drive *d, *d2;
133         int error;
134         
135         gp = pp->geom;
136         sc = gp->softc;
137         /*
138          * We want to modify the read count with the write count in case we have
139          * plexes in a RAID-5 organization.
140          */
141         dr += dw;
142
143         LIST_FOREACH(d, &sc->drives, drive) {
144                 if (d->consumer == NULL)
145                         continue;
146                 error = g_access(d->consumer, dr, dw, de);
147                 if (error) {
148                         LIST_FOREACH(d2, &sc->drives, drive) {
149                                 if (d == d2)
150                                         break;
151                                 g_access(d2->consumer, -dr, -dw, -de);
152                         }
153                         G_VINUM_DEBUG(0, "g_access '%s' failed: %d", d->name,
154                             error);
155                         return (error);
156                 }
157         }
158         return (0);
159 }
160
161 static void
162 gv_init(struct g_class *mp)
163 {
164         struct g_geom *gp;
165         struct gv_softc *sc;
166
167         g_trace(G_T_TOPOLOGY, "gv_init(%p)", mp);
168
169         gp = g_new_geomf(mp, "VINUM");
170         gp->spoiled = gv_orphan;
171         gp->orphan = gv_orphan;
172         gp->access = gv_access;
173         gp->start = gv_start;
174         gp->softc = g_malloc(sizeof(struct gv_softc), M_WAITOK | M_ZERO);
175         sc = gp->softc;
176         sc->geom = gp;
177         sc->bqueue_down = g_malloc(sizeof(struct bio_queue_head),
178             M_WAITOK | M_ZERO);
179         sc->bqueue_up = g_malloc(sizeof(struct bio_queue_head),
180             M_WAITOK | M_ZERO);
181         bioq_init(sc->bqueue_down);
182         bioq_init(sc->bqueue_up);
183         LIST_INIT(&sc->drives);
184         LIST_INIT(&sc->subdisks);
185         LIST_INIT(&sc->plexes);
186         LIST_INIT(&sc->volumes);
187         TAILQ_INIT(&sc->equeue);
188         mtx_init(&sc->config_mtx, "gv_config", NULL, MTX_DEF);
189         mtx_init(&sc->equeue_mtx, "gv_equeue", NULL, MTX_DEF);
190         mtx_init(&sc->bqueue_mtx, "gv_bqueue", NULL, MTX_DEF);
191         kproc_create(gv_worker, sc, &sc->worker, 0, 0, "gv_worker");
192 }
193
194 static int
195 gv_unload(struct gctl_req *req, struct g_class *mp, struct g_geom *gp)
196 {
197         struct gv_softc *sc;
198
199         g_trace(G_T_TOPOLOGY, "gv_unload(%p)", mp);
200
201         g_topology_assert();
202         sc = gp->softc;
203
204         if (sc != NULL) {
205                 gv_worker_exit(sc);
206                 gp->softc = NULL;
207                 g_wither_geom(gp, ENXIO);
208         }
209
210         return (0);
211 }
212
213 /* Handle userland request of attaching object. */
214 static void
215 gv_attach(struct gv_softc *sc, struct gctl_req *req)
216 {
217         struct gv_volume *v;
218         struct gv_plex *p;
219         struct gv_sd *s;
220         off_t *offset;
221         int *rename, type_child, type_parent;
222         char *child, *parent;
223
224         child = gctl_get_param(req, "child", NULL);
225         if (child == NULL) {
226                 gctl_error(req, "no child given");
227                 return;
228         }
229         parent = gctl_get_param(req, "parent", NULL);
230         if (parent == NULL) {
231                 gctl_error(req, "no parent given");
232                 return;
233         }
234         offset = gctl_get_paraml(req, "offset", sizeof(*offset));
235         if (offset == NULL) {
236                 gctl_error(req, "no offset given");
237                 return;
238         }
239         rename = gctl_get_paraml(req, "rename", sizeof(*rename));
240         if (rename == NULL) {
241                 gctl_error(req, "no rename flag given");
242                 return;
243         }
244
245         type_child = gv_object_type(sc, child);
246         type_parent = gv_object_type(sc, parent);
247
248         switch (type_child) {
249         case GV_TYPE_PLEX:
250                 if (type_parent != GV_TYPE_VOL) {
251                         gctl_error(req, "no such volume to attach to");
252                         return;
253                 }
254                 v = gv_find_vol(sc, parent);
255                 p = gv_find_plex(sc, child);
256                 gv_post_event(sc, GV_EVENT_ATTACH_PLEX, p, v, *offset, *rename);
257                 break;
258         case GV_TYPE_SD:
259                 if (type_parent != GV_TYPE_PLEX) {
260                         gctl_error(req, "no such plex to attach to");
261                         return;
262                 }
263                 p = gv_find_plex(sc, parent);
264                 s = gv_find_sd(sc, child);
265                 gv_post_event(sc, GV_EVENT_ATTACH_SD, s, p, *offset, *rename);
266                 break;
267         default:
268                 gctl_error(req, "invalid child type");
269                 break;
270         }
271 }
272
273 /* Handle userland request of detaching object. */
274 static void
275 gv_detach(struct gv_softc *sc, struct gctl_req *req)
276 {
277         struct gv_plex *p;
278         struct gv_sd *s;
279         int *flags, type;
280         char *object;
281
282         object = gctl_get_param(req, "object", NULL);
283         if (object == NULL) {
284                 gctl_error(req, "no argument given");
285                 return;
286         }
287
288         flags = gctl_get_paraml(req, "flags", sizeof(*flags));
289         type = gv_object_type(sc, object);
290         switch (type) {
291         case GV_TYPE_PLEX:
292                 p = gv_find_plex(sc, object);
293                 gv_post_event(sc, GV_EVENT_DETACH_PLEX, p, NULL, *flags, 0);
294                 break;
295         case GV_TYPE_SD:
296                 s = gv_find_sd(sc, object);
297                 gv_post_event(sc, GV_EVENT_DETACH_SD, s, NULL, *flags, 0);
298                 break;
299         default:
300                 gctl_error(req, "invalid object type");
301                 break;
302         }
303 }
304
305 /* Handle userland requests for creating new objects. */
306 static int
307 gv_create(struct g_geom *gp, struct gctl_req *req)
308 {
309         struct gv_softc *sc;
310         struct gv_drive *d, *d2;
311         struct gv_plex *p, *p2;
312         struct gv_sd *s, *s2;
313         struct gv_volume *v, *v2;
314         struct g_provider *pp;
315         int error, i, *drives, *flags, *plexes, *subdisks, *volumes;
316         char buf[20];
317
318         g_topology_assert();
319
320         sc = gp->softc;
321
322         /* Find out how many of each object have been passed in. */
323         volumes = gctl_get_paraml(req, "volumes", sizeof(*volumes));
324         plexes = gctl_get_paraml(req, "plexes", sizeof(*plexes));
325         subdisks = gctl_get_paraml(req, "subdisks", sizeof(*subdisks));
326         drives = gctl_get_paraml(req, "drives", sizeof(*drives));
327         if (volumes == NULL || plexes == NULL || subdisks == NULL ||
328             drives == NULL) {
329                 gctl_error(req, "number of objects not given");
330                 return (-1);
331         }
332         flags = gctl_get_paraml(req, "flags", sizeof(*flags));
333         if (flags == NULL) {
334                 gctl_error(req, "flags not given");
335                 return (-1);
336         }
337
338         /* First, handle drive definitions ... */
339         for (i = 0; i < *drives; i++) {
340                 snprintf(buf, sizeof(buf), "drive%d", i);
341                 d2 = gctl_get_paraml(req, buf, sizeof(*d2));
342                 if (d2 == NULL) {
343                         gctl_error(req, "no drive definition given");
344                         return (-1);
345                 }
346                 /*
347                  * Make sure that the device specified in the drive config is
348                  * an active GEOM provider.
349                  */
350                 pp = g_provider_by_name(d2->device);
351                 if (pp == NULL) {
352                         gctl_error(req, "%s: device not found", d2->device);
353                         goto error;
354                 }
355                 if (gv_find_drive(sc, d2->name) != NULL) {
356                         /* Ignore error. */
357                         if (*flags & GV_FLAG_F)
358                                 continue;
359                         gctl_error(req, "drive '%s' already exists", d2->name);
360                         goto error;
361                 }
362                 if (gv_find_drive_device(sc, d2->device) != NULL) {
363                         gctl_error(req, "device '%s' already configured in "
364                             "gvinum", d2->device);
365                         goto error;
366                 }
367
368
369                 d = g_malloc(sizeof(*d), M_WAITOK | M_ZERO);
370                 bcopy(d2, d, sizeof(*d));
371
372                 gv_post_event(sc, GV_EVENT_CREATE_DRIVE, d, NULL, 0, 0);
373         }
374
375         /* ... then volume definitions ... */
376         for (i = 0; i < *volumes; i++) {
377                 error = 0;
378                 snprintf(buf, sizeof(buf), "volume%d", i);
379                 v2 = gctl_get_paraml(req, buf, sizeof(*v2));
380                 if (v2 == NULL) {
381                         gctl_error(req, "no volume definition given");
382                         return (-1);
383                 }
384                 if (gv_find_vol(sc, v2->name) != NULL) {
385                         /* Ignore error. */
386                         if (*flags & GV_FLAG_F)
387                                 continue;
388                         gctl_error(req, "volume '%s' already exists", v2->name);
389                         goto error;
390                 }
391
392                 v = g_malloc(sizeof(*v), M_WAITOK | M_ZERO);
393                 bcopy(v2, v, sizeof(*v));
394
395                 gv_post_event(sc, GV_EVENT_CREATE_VOLUME, v, NULL, 0, 0);
396         }
397
398         /* ... then plex definitions ... */
399         for (i = 0; i < *plexes; i++) {
400                 error = 0;
401                 snprintf(buf, sizeof(buf), "plex%d", i);
402                 p2 = gctl_get_paraml(req, buf, sizeof(*p2));
403                 if (p2 == NULL) {
404                         gctl_error(req, "no plex definition given");
405                         return (-1);
406                 }
407                 if (gv_find_plex(sc, p2->name) != NULL) {
408                         /* Ignore error. */
409                         if (*flags & GV_FLAG_F)
410                                 continue;
411                         gctl_error(req, "plex '%s' already exists", p2->name);
412                         goto error;
413                 }
414
415                 p = g_malloc(sizeof(*p), M_WAITOK | M_ZERO);
416                 bcopy(p2, p, sizeof(*p));
417
418                 gv_post_event(sc, GV_EVENT_CREATE_PLEX, p, NULL, 0, 0);
419         }
420
421         /* ... and, finally, subdisk definitions. */
422         for (i = 0; i < *subdisks; i++) {
423                 error = 0;
424                 snprintf(buf, sizeof(buf), "sd%d", i);
425                 s2 = gctl_get_paraml(req, buf, sizeof(*s2));
426                 if (s2 == NULL) {
427                         gctl_error(req, "no subdisk definition given");
428                         return (-1);
429                 }
430                 if (gv_find_sd(sc, s2->name) != NULL) {
431                         /* Ignore error. */
432                         if (*flags & GV_FLAG_F)
433                                 continue;
434                         gctl_error(req, "sd '%s' already exists", s2->name);
435                         goto error;
436                 }
437
438                 s = g_malloc(sizeof(*s), M_WAITOK | M_ZERO);
439                 bcopy(s2, s, sizeof(*s));
440
441                 gv_post_event(sc, GV_EVENT_CREATE_SD, s, NULL, 0, 0);
442         }
443
444 error:
445         gv_post_event(sc, GV_EVENT_SETUP_OBJECTS, sc, NULL, 0, 0);
446         gv_post_event(sc, GV_EVENT_SAVE_CONFIG, sc, NULL, 0, 0);
447
448         return (0);
449 }
450
451 static void
452 gv_config(struct gctl_req *req, struct g_class *mp, char const *verb)
453 {
454         struct g_geom *gp;
455         struct gv_softc *sc;
456         struct sbuf *sb;
457         char *comment;
458
459         g_topology_assert();
460
461         gp = LIST_FIRST(&mp->geom);
462         sc = gp->softc;
463
464         if (!strcmp(verb, "attach")) {
465                 gv_attach(sc, req);
466
467         } else if (!strcmp(verb, "concat")) {
468                 gv_concat(gp, req);
469
470         } else if (!strcmp(verb, "detach")) {
471                 gv_detach(sc, req);
472
473         } else if (!strcmp(verb, "list")) {
474                 gv_list(gp, req);
475
476         /* Save our configuration back to disk. */
477         } else if (!strcmp(verb, "saveconfig")) {
478                 gv_post_event(sc, GV_EVENT_SAVE_CONFIG, sc, NULL, 0, 0);
479
480         /* Return configuration in string form. */
481         } else if (!strcmp(verb, "getconfig")) {
482                 comment = gctl_get_param(req, "comment", NULL);
483                 if (comment == NULL) {
484                         gctl_error(req, "no comment parameter given");
485                         return;
486                 }
487                 sb = sbuf_new(NULL, NULL, GV_CFG_LEN, SBUF_FIXEDLEN);
488                 gv_format_config(sc, sb, 0, comment);
489                 sbuf_finish(sb);
490                 gctl_set_param(req, "config", sbuf_data(sb), sbuf_len(sb) + 1);
491                 sbuf_delete(sb);
492
493         } else if (!strcmp(verb, "create")) {
494                 gv_create(gp, req);
495
496         } else if (!strcmp(verb, "mirror")) {
497                 gv_mirror(gp, req);
498
499         } else if (!strcmp(verb, "move")) {
500                 gv_move(gp, req);
501
502         } else if (!strcmp(verb, "raid5")) {
503                 gv_raid5(gp, req);
504
505         } else if (!strcmp(verb, "rebuildparity") ||
506             !strcmp(verb, "checkparity")) {
507                 gv_parityop(sc, req);
508
509         } else if (!strcmp(verb, "remove")) {
510                 gv_remove(gp, req);
511
512         } else if (!strcmp(verb, "rename")) {
513                 gv_rename(gp, req);
514         
515         } else if (!strcmp(verb, "resetconfig")) {
516                 gv_post_event(sc, GV_EVENT_RESET_CONFIG, sc, NULL, 0, 0);
517
518         } else if (!strcmp(verb, "start")) {
519                 gv_start_obj(gp, req);
520
521         } else if (!strcmp(verb, "stripe")) {
522                 gv_stripe(gp, req);
523
524         } else if (!strcmp(verb, "setstate")) {
525                 gv_setstate(gp, req);
526         } else
527                 gctl_error(req, "Unknown verb parameter");
528 }
529
530 static void
531 gv_parityop(struct gv_softc *sc, struct gctl_req *req)
532 {
533         struct gv_plex *p;
534         int *flags, *rebuild, type;
535         char *plex;
536
537         plex = gctl_get_param(req, "plex", NULL);
538         if (plex == NULL) {
539                 gctl_error(req, "no plex given");
540                 return;
541         }
542
543         flags = gctl_get_paraml(req, "flags", sizeof(*flags));
544         if (flags == NULL) {
545                 gctl_error(req, "no flags given");
546                 return;
547         }
548
549         rebuild = gctl_get_paraml(req, "rebuild", sizeof(*rebuild));
550         if (rebuild == NULL) {
551                 gctl_error(req, "no operation given");
552                 return;
553         }
554
555         type = gv_object_type(sc, plex);
556         if (type != GV_TYPE_PLEX) {
557                 gctl_error(req, "'%s' is not a plex", plex);
558                 return;
559         }
560         p = gv_find_plex(sc, plex);
561
562         if (p->state != GV_PLEX_UP) {
563                 gctl_error(req, "plex %s is not completely accessible",
564                     p->name);
565                 return;
566         }
567
568         if (p->org != GV_PLEX_RAID5) {
569                 gctl_error(req, "plex %s is not a RAID5 plex", p->name);
570                 return;
571         }
572
573         /* Put it in the event queue. */
574         /* XXX: The state of the plex might have changed when this event is
575          * picked up ... We should perhaps check this afterwards. */
576         if (*rebuild)
577                 gv_post_event(sc, GV_EVENT_PARITY_REBUILD, p, NULL, 0, 0);
578         else
579                 gv_post_event(sc, GV_EVENT_PARITY_CHECK, p, NULL, 0, 0);
580 }
581
582
583 static struct g_geom *
584 gv_taste(struct g_class *mp, struct g_provider *pp, int flags __unused)
585 {
586         struct g_geom *gp;
587         struct g_consumer *cp;
588         struct gv_softc *sc;
589         struct gv_hdr vhdr;
590         int error;
591
592         g_topology_assert();
593         g_trace(G_T_TOPOLOGY, "gv_taste(%s, %s)", mp->name, pp->name);
594
595         gp = LIST_FIRST(&mp->geom);
596         if (gp == NULL) {
597                 G_VINUM_DEBUG(0, "error: tasting, but not initialized?");
598                 return (NULL);
599         }
600         sc = gp->softc;
601
602         cp = g_new_consumer(gp);
603         if (g_attach(cp, pp) != 0) {
604                 g_destroy_consumer(cp);
605                 return (NULL);
606         }
607         if (g_access(cp, 1, 0, 0) != 0) {
608                 g_detach(cp);
609                 g_destroy_consumer(cp);
610                 return (NULL);
611         }
612         g_topology_unlock();
613
614         error = gv_read_header(cp, &vhdr);
615
616         g_topology_lock();
617         g_access(cp, -1, 0, 0);
618         g_detach(cp);
619         g_destroy_consumer(cp);
620
621         /* Check if what we've been given is a valid vinum drive. */
622         if (!error)
623                 gv_post_event(sc, GV_EVENT_DRIVE_TASTED, pp, NULL, 0, 0);
624
625         return (NULL);
626 }
627
628 void
629 gv_worker(void *arg)
630 {
631         struct g_provider *pp;
632         struct gv_softc *sc;
633         struct gv_event *ev;
634         struct gv_volume *v;
635         struct gv_plex *p;
636         struct gv_sd *s;
637         struct gv_drive *d;
638         struct bio *bp;
639         int newstate, flags, err, rename;
640         char *newname;
641         off_t offset;
642
643         sc = arg;
644         KASSERT(sc != NULL, ("NULL sc"));
645         for (;;) {
646                 /* Look at the events first... */
647                 ev = gv_get_event(sc);
648                 if (ev != NULL) {
649                         gv_remove_event(sc, ev);
650
651                         switch (ev->type) {
652                         case GV_EVENT_DRIVE_TASTED:
653                                 G_VINUM_DEBUG(2, "event 'drive tasted'");
654                                 pp = ev->arg1;
655                                 gv_drive_tasted(sc, pp);
656                                 break;
657
658                         case GV_EVENT_DRIVE_LOST:
659                                 G_VINUM_DEBUG(2, "event 'drive lost'");
660                                 d = ev->arg1;
661                                 gv_drive_lost(sc, d);
662                                 break;
663
664                         case GV_EVENT_CREATE_DRIVE:
665                                 G_VINUM_DEBUG(2, "event 'create drive'");
666                                 d = ev->arg1;
667                                 gv_create_drive(sc, d);
668                                 break;
669
670                         case GV_EVENT_CREATE_VOLUME:
671                                 G_VINUM_DEBUG(2, "event 'create volume'");
672                                 v = ev->arg1;
673                                 gv_create_volume(sc, v);
674                                 break;
675
676                         case GV_EVENT_CREATE_PLEX:
677                                 G_VINUM_DEBUG(2, "event 'create plex'");
678                                 p = ev->arg1;
679                                 gv_create_plex(sc, p);
680                                 break;
681
682                         case GV_EVENT_CREATE_SD:
683                                 G_VINUM_DEBUG(2, "event 'create sd'");
684                                 s = ev->arg1;
685                                 gv_create_sd(sc, s);
686                                 break;
687
688                         case GV_EVENT_RM_DRIVE:
689                                 G_VINUM_DEBUG(2, "event 'remove drive'");
690                                 d = ev->arg1;
691                                 flags = ev->arg3;
692                                 gv_rm_drive(sc, d, flags);
693                                 /*gv_setup_objects(sc);*/
694                                 break;
695
696                         case GV_EVENT_RM_VOLUME:
697                                 G_VINUM_DEBUG(2, "event 'remove volume'");
698                                 v = ev->arg1;
699                                 gv_rm_vol(sc, v);
700                                 /*gv_setup_objects(sc);*/
701                                 break;
702
703                         case GV_EVENT_RM_PLEX:
704                                 G_VINUM_DEBUG(2, "event 'remove plex'");
705                                 p = ev->arg1;
706                                 gv_rm_plex(sc, p);
707                                 /*gv_setup_objects(sc);*/
708                                 break;
709
710                         case GV_EVENT_RM_SD:
711                                 G_VINUM_DEBUG(2, "event 'remove sd'");
712                                 s = ev->arg1;
713                                 gv_rm_sd(sc, s);
714                                 /*gv_setup_objects(sc);*/
715                                 break;
716
717                         case GV_EVENT_SAVE_CONFIG:
718                                 G_VINUM_DEBUG(2, "event 'save config'");
719                                 gv_save_config(sc);
720                                 break;
721
722                         case GV_EVENT_SET_SD_STATE:
723                                 G_VINUM_DEBUG(2, "event 'setstate sd'");
724                                 s = ev->arg1;
725                                 newstate = ev->arg3;
726                                 flags = ev->arg4;
727                                 err = gv_set_sd_state(s, newstate, flags);
728                                 if (err)
729                                         G_VINUM_DEBUG(0, "error setting subdisk"
730                                             " state: error code %d", err);
731                                 break;
732
733                         case GV_EVENT_SET_DRIVE_STATE:
734                                 G_VINUM_DEBUG(2, "event 'setstate drive'");
735                                 d = ev->arg1;
736                                 newstate = ev->arg3;
737                                 flags = ev->arg4;
738                                 err = gv_set_drive_state(d, newstate, flags);
739                                 if (err)
740                                         G_VINUM_DEBUG(0, "error setting drive "
741                                             "state: error code %d", err);
742                                 break;
743
744                         case GV_EVENT_SET_VOL_STATE:
745                                 G_VINUM_DEBUG(2, "event 'setstate volume'");
746                                 v = ev->arg1;
747                                 newstate = ev->arg3;
748                                 flags = ev->arg4;
749                                 err = gv_set_vol_state(v, newstate, flags);
750                                 if (err)
751                                         G_VINUM_DEBUG(0, "error setting volume "
752                                             "state: error code %d", err);
753                                 break;
754
755                         case GV_EVENT_SET_PLEX_STATE:
756                                 G_VINUM_DEBUG(2, "event 'setstate plex'");
757                                 p = ev->arg1;
758                                 newstate = ev->arg3;
759                                 flags = ev->arg4;
760                                 err = gv_set_plex_state(p, newstate, flags);
761                                 if (err)
762                                         G_VINUM_DEBUG(0, "error setting plex "
763                                             "state: error code %d", err);
764                                 break;
765
766                         case GV_EVENT_SETUP_OBJECTS:
767                                 G_VINUM_DEBUG(2, "event 'setup objects'");
768                                 gv_setup_objects(sc);
769                                 break;
770
771                         case GV_EVENT_RESET_CONFIG:
772                                 G_VINUM_DEBUG(2, "event 'resetconfig'");
773                                 err = gv_resetconfig(sc);
774                                 if (err)
775                                         G_VINUM_DEBUG(0, "error resetting "
776                                             "config: error code %d", err);
777                                 break;
778
779                         case GV_EVENT_PARITY_REBUILD:
780                                 /*
781                                  * Start the rebuild. The gv_plex_done will
782                                  * handle issuing of the remaining rebuild bio's
783                                  * until it's finished. 
784                                  */
785                                 G_VINUM_DEBUG(2, "event 'rebuild'");
786                                 p = ev->arg1;
787                                 if (p->state != GV_PLEX_UP) {
788                                         G_VINUM_DEBUG(0, "plex %s is not "
789                                             "completely accessible", p->name);
790                                         break;
791                                 }
792                                 if (p->flags & GV_PLEX_SYNCING ||
793                                     p->flags & GV_PLEX_REBUILDING ||
794                                     p->flags & GV_PLEX_GROWING) {
795                                         G_VINUM_DEBUG(0, "plex %s is busy with "
796                                             "syncing or parity build", p->name);
797                                         break;
798                                 }
799                                 p->synced = 0;
800                                 p->flags |= GV_PLEX_REBUILDING;
801                                 g_topology_assert_not();
802                                 g_topology_lock();
803                                 err = gv_access(p->vol_sc->provider, 1, 1, 0);
804                                 if (err) {
805                                         G_VINUM_DEBUG(0, "unable to access "
806                                             "provider");
807                                         break;
808                                 }
809                                 g_topology_unlock();
810                                 gv_parity_request(p, GV_BIO_CHECK |
811                                     GV_BIO_PARITY, 0);
812                                 break;
813
814                         case GV_EVENT_PARITY_CHECK:
815                                 /* Start parity check. */
816                                 G_VINUM_DEBUG(2, "event 'check'");
817                                 p = ev->arg1;
818                                 if (p->state != GV_PLEX_UP) {
819                                         G_VINUM_DEBUG(0, "plex %s is not "
820                                             "completely accessible", p->name);
821                                         break;
822                                 }
823                                 if (p->flags & GV_PLEX_SYNCING ||
824                                     p->flags & GV_PLEX_REBUILDING ||
825                                     p->flags & GV_PLEX_GROWING) {
826                                         G_VINUM_DEBUG(0, "plex %s is busy with "
827                                             "syncing or parity build", p->name);
828                                         break;
829                                 }
830                                 p->synced = 0;
831                                 g_topology_assert_not();
832                                 g_topology_lock();
833                                 err = gv_access(p->vol_sc->provider, 1, 1, 0);
834                                 if (err) {
835                                         G_VINUM_DEBUG(0, "unable to access "
836                                             "provider");
837                                         break;
838                                 }
839                                 g_topology_unlock();
840                                 gv_parity_request(p, GV_BIO_CHECK, 0);
841                                 break;
842
843                         case GV_EVENT_START_PLEX:
844                                 G_VINUM_DEBUG(2, "event 'start' plex");
845                                 p = ev->arg1;
846                                 gv_start_plex(p);
847                                 break;
848
849                         case GV_EVENT_START_VOLUME:
850                                 G_VINUM_DEBUG(2, "event 'start' volume");
851                                 v = ev->arg1;
852                                 gv_start_vol(v);
853                                 break;
854
855                         case GV_EVENT_ATTACH_PLEX:
856                                 G_VINUM_DEBUG(2, "event 'attach' plex");
857                                 p = ev->arg1;
858                                 v = ev->arg2;
859                                 rename = ev->arg4;
860                                 err = gv_attach_plex(p, v, rename);
861                                 if (err)
862                                         G_VINUM_DEBUG(0, "error attaching %s to"
863                                             " %s: error code %d", p->name,
864                                             v->name, err);
865                                 break;
866
867                         case GV_EVENT_ATTACH_SD:
868                                 G_VINUM_DEBUG(2, "event 'attach' sd");
869                                 s = ev->arg1;
870                                 p = ev->arg2;
871                                 offset = ev->arg3;
872                                 rename = ev->arg4;
873                                 err = gv_attach_sd(s, p, offset, rename);
874                                 if (err)
875                                         G_VINUM_DEBUG(0, "error attaching %s to"
876                                             " %s: error code %d", s->name,
877                                             p->name, err);
878                                 break;
879
880                         case GV_EVENT_DETACH_PLEX:
881                                 G_VINUM_DEBUG(2, "event 'detach' plex");
882                                 p = ev->arg1;
883                                 flags = ev->arg3;
884                                 err = gv_detach_plex(p, flags);
885                                 if (err)
886                                         G_VINUM_DEBUG(0, "error detaching %s: "
887                                             "error code %d", p->name, err);
888                                 break;
889
890                         case GV_EVENT_DETACH_SD:
891                                 G_VINUM_DEBUG(2, "event 'detach' sd");
892                                 s = ev->arg1;
893                                 flags = ev->arg3;
894                                 err = gv_detach_sd(s, flags);
895                                 if (err)
896                                         G_VINUM_DEBUG(0, "error detaching %s: "
897                                             "error code %d", s->name, err);
898                                 break;
899
900                         case GV_EVENT_RENAME_VOL:
901                                 G_VINUM_DEBUG(2, "event 'rename' volume");
902                                 v = ev->arg1;
903                                 newname = ev->arg2;
904                                 flags = ev->arg3;
905                                 err = gv_rename_vol(sc, v, newname, flags);
906                                 if (err)
907                                         G_VINUM_DEBUG(0, "error renaming %s to "
908                                             "%s: error code %d", v->name,
909                                             newname, err);
910                                 g_free(newname);
911                                 /* Destroy and recreate the provider if we can. */
912                                 if (gv_provider_is_open(v->provider)) {
913                                         G_VINUM_DEBUG(0, "unable to rename "
914                                             "provider to %s: provider in use",
915                                             v->name);
916                                         break;
917                                 }
918                                 g_topology_lock();
919                                 g_wither_provider(v->provider, ENOENT);
920                                 g_topology_unlock();
921                                 v->provider = NULL;
922                                 gv_post_event(sc, GV_EVENT_SETUP_OBJECTS, sc,
923                                     NULL, 0, 0);
924                                 break;
925
926                         case GV_EVENT_RENAME_PLEX:
927                                 G_VINUM_DEBUG(2, "event 'rename' plex");
928                                 p = ev->arg1;
929                                 newname = ev->arg2;
930                                 flags = ev->arg3;
931                                 err = gv_rename_plex(sc, p, newname, flags);
932                                 if (err)
933                                         G_VINUM_DEBUG(0, "error renaming %s to "
934                                             "%s: error code %d", p->name,
935                                             newname, err);
936                                 g_free(newname);
937                                 break;
938
939                         case GV_EVENT_RENAME_SD:
940                                 G_VINUM_DEBUG(2, "event 'rename' sd");
941                                 s = ev->arg1;
942                                 newname = ev->arg2;
943                                 flags = ev->arg3;
944                                 err = gv_rename_sd(sc, s, newname, flags);
945                                 if (err)
946                                         G_VINUM_DEBUG(0, "error renaming %s to "
947                                             "%s: error code %d", s->name,
948                                             newname, err);
949                                 g_free(newname);
950                                 break;
951
952                         case GV_EVENT_RENAME_DRIVE:
953                                 G_VINUM_DEBUG(2, "event 'rename' drive");
954                                 d = ev->arg1;
955                                 newname = ev->arg2;
956                                 flags = ev->arg3;
957                                 err = gv_rename_drive(sc, d, newname, flags);
958                                 if (err)
959                                         G_VINUM_DEBUG(0, "error renaming %s to "
960                                             "%s: error code %d", d->name,
961                                             newname, err);
962                                 g_free(newname);
963                                 break;
964
965                         case GV_EVENT_MOVE_SD:
966                                 G_VINUM_DEBUG(2, "event 'move' sd");
967                                 s = ev->arg1;
968                                 d = ev->arg2;
969                                 flags = ev->arg3;
970                                 err = gv_move_sd(sc, s, d, flags);
971                                 if (err)
972                                         G_VINUM_DEBUG(0, "error moving %s to "
973                                             "%s: error code %d", s->name,
974                                             d->name, err);
975                                 break;
976
977                         case GV_EVENT_THREAD_EXIT:
978                                 G_VINUM_DEBUG(2, "event 'thread exit'");
979                                 g_free(ev);
980                                 mtx_lock(&sc->equeue_mtx);
981                                 mtx_lock(&sc->bqueue_mtx);
982                                 gv_cleanup(sc);
983                                 mtx_destroy(&sc->bqueue_mtx);
984                                 mtx_destroy(&sc->equeue_mtx);
985                                 g_free(sc->bqueue_down);
986                                 g_free(sc->bqueue_up);
987                                 g_free(sc);
988                                 kproc_exit(0);
989                                 /* NOTREACHED */
990
991                         default:
992                                 G_VINUM_DEBUG(1, "unknown event %d", ev->type);
993                         }
994
995                         g_free(ev);
996                         continue;
997                 }
998
999                 /* ... then do I/O processing. */
1000                 mtx_lock(&sc->bqueue_mtx);
1001                 /* First do new requests. */
1002                 bp = bioq_takefirst(sc->bqueue_down);
1003                 if (bp != NULL) {
1004                         mtx_unlock(&sc->bqueue_mtx);
1005                         /* A bio that interfered with another bio. */
1006                         if (bp->bio_pflags & GV_BIO_ONHOLD) {
1007                                 s = bp->bio_caller1;
1008                                 p = s->plex_sc;
1009                                 /* Is it still locked out? */
1010                                 if (gv_stripe_active(p, bp)) {
1011                                         /* Park the bio on the waiting queue. */
1012                                         bioq_disksort(p->wqueue, bp);
1013                                 } else {
1014                                         bp->bio_pflags &= ~GV_BIO_ONHOLD;
1015                                         g_io_request(bp, s->drive_sc->consumer);
1016                                 }
1017                         /* A special request requiring special handling. */
1018                         } else if (bp->bio_pflags & GV_BIO_INTERNAL) {
1019                                 p = bp->bio_caller1;
1020                                 gv_plex_start(p, bp);
1021                         } else {
1022                                 gv_volume_start(sc, bp);
1023                         }
1024                         mtx_lock(&sc->bqueue_mtx);
1025                 }
1026                 /* Then do completed requests. */
1027                 bp = bioq_takefirst(sc->bqueue_up);
1028                 if (bp == NULL) {
1029                         msleep(sc, &sc->bqueue_mtx, PRIBIO, "-", hz/10);
1030                         mtx_unlock(&sc->bqueue_mtx);
1031                         continue;
1032                 }
1033                 mtx_unlock(&sc->bqueue_mtx);
1034                 gv_bio_done(sc, bp);
1035         }
1036 }
1037
/* Class name string; used below as the .name member of g_vinum_class. */
1038 #define VINUM_CLASS_NAME "VINUM"
1039
/*
 * GEOM class descriptor for vinum.  It carries the class name and the
 * G_VERSION constant, and installs gv_init, gv_taste, gv_config and
 * gv_unload as the class's init, taste, ctlreq and destroy_geom methods
 * respectively.  Members not listed here are left zero-initialized.
 */
1040 static struct g_class g_vinum_class     = {
1041         .name = VINUM_CLASS_NAME,
1042         .version = G_VERSION,
1043         .init = gv_init,
1044         .taste = gv_taste,
1045         .ctlreq = gv_config,
1046         .destroy_geom = gv_unload,
1047 };
1048
/* Hand the descriptor to the GEOM framework under the identifier g_vinum. */
1049 DECLARE_GEOM_CLASS(g_vinum_class, g_vinum);