]> CyberLeo.Net >> Repos - FreeBSD/FreeBSD.git/blob - sys/geom/gate/g_gate.c
Dtrace: improve handling of library paths.
[FreeBSD/FreeBSD.git] / sys / geom / gate / g_gate.c
1 /*-
2  * Copyright (c) 2004-2006 Pawel Jakub Dawidek <pjd@FreeBSD.org>
3  * Copyright (c) 2009-2010 The FreeBSD Foundation
4  * All rights reserved.
5  *
6  * Portions of this software were developed by Pawel Jakub Dawidek
7  * under sponsorship from the FreeBSD Foundation.
8  *
9  * Redistribution and use in source and binary forms, with or without
10  * modification, are permitted provided that the following conditions
11  * are met:
12  * 1. Redistributions of source code must retain the above copyright
13  *    notice, this list of conditions and the following disclaimer.
14  * 2. Redistributions in binary form must reproduce the above copyright
15  *    notice, this list of conditions and the following disclaimer in the
16  *    documentation and/or other materials provided with the distribution.
17  *
18  * THIS SOFTWARE IS PROVIDED BY THE AUTHORS AND CONTRIBUTORS ``AS IS'' AND
19  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE LIABLE
22  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
23  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
24  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
25  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
26  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
27  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
28  * SUCH DAMAGE.
29  */
30
31 #include <sys/cdefs.h>
32 __FBSDID("$FreeBSD$");
33
34 #include <sys/param.h>
35 #include <sys/systm.h>
36 #include <sys/bio.h>
37 #include <sys/conf.h>
38 #include <sys/kernel.h>
39 #include <sys/kthread.h>
40 #include <sys/fcntl.h>
41 #include <sys/linker.h>
42 #include <sys/lock.h>
43 #include <sys/malloc.h>
44 #include <sys/mutex.h>
45 #include <sys/proc.h>
46 #include <sys/limits.h>
47 #include <sys/queue.h>
48 #include <sys/sbuf.h>
49 #include <sys/sysctl.h>
50 #include <sys/signalvar.h>
51 #include <sys/time.h>
52 #include <machine/atomic.h>
53
54 #include <geom/geom.h>
55 #include <geom/gate/g_gate.h>
56
/* Feature entry for this module, described as "GEOM Gate module". */
57 FEATURE(geom_gate, "GEOM Gate module");
58
/* Malloc type used for this driver's allocations, e.g. the per-device softc. */
59 static MALLOC_DEFINE(M_GATE, "gg_data", "GEOM Gate Data");
60
/* Sysctl node "gate" declared under the _kern_geom parent. */
61 SYSCTL_DECL(_kern_geom);
62 static SYSCTL_NODE(_kern_geom, OID_AUTO, gate, CTLFLAG_RW, 0,
63     "GEOM_GATE configuration");
/* Debug level; exposed as tunable and read-write sysctl kern.geom.gate.debug. */
64 static int g_gate_debug = 0;
65 TUNABLE_INT("kern.geom.gate.debug", &g_gate_debug);
66 SYSCTL_INT(_kern_geom_gate, OID_AUTO, debug, CTLFLAG_RW, &g_gate_debug, 0,
67     "Debug level");
/*
 * Upper bound on unit numbers: unit lookup and allocation only consider
 * g_gate_units[0 .. g_gate_maxunits - 1].  Exposed as a tunable and as a
 * CTLFLAG_RDTUN sysctl.
 * NOTE(review): TUNABLE_INT is handed the address of a u_int here - confirm
 * that is intended.
 */
68 static u_int g_gate_maxunits = 256;
69 TUNABLE_INT("kern.geom.gate.maxunits", &g_gate_maxunits);
70 SYSCTL_UINT(_kern_geom_gate, OID_AUTO, maxunits, CTLFLAG_RDTUN,
71     &g_gate_maxunits, 0, "Maximum number of ggate devices");
72
/* GEOM class under which every ggate geom is created (see g_gate_create()). */
73 struct g_class g_gate_class = {
74         .name = G_GATE_CLASS_NAME,
75         .version = G_VERSION,
76 };
77
/*
 * Character-device switch whose only handler is the ioctl entry point.
 * NOTE(review): status_dev is presumably the device node created from this
 * cdevsw; it is not assigned in the code visible here - confirm.
 */
78 static struct cdev *status_dev;
79 static d_ioctl_t g_gate_ioctl;
80 static struct cdevsw g_gate_cdevsw = {
81         .d_version =    D_VERSION,
82         .d_ioctl =      g_gate_ioctl,
83         .d_name =       G_GATE_CTL_NAME
84 };
85
86
/*
 * Table of existing devices indexed by unit number (NULL means the slot is
 * free), the number of occupied slots, and the mutex under which the table,
 * the counter and each softc's sc_ref are modified.
 */
87 static struct g_gate_softc **g_gate_units;
88 static u_int g_gate_nunits;
89 static struct mtx g_gate_units_lock;
90
91 static int
92 g_gate_destroy(struct g_gate_softc *sc, boolean_t force)
93 {
94         struct g_provider *pp;
95         struct g_consumer *cp;
96         struct g_geom *gp;
97         struct bio *bp;
98
99         g_topology_assert();
100         mtx_assert(&g_gate_units_lock, MA_OWNED);
101         pp = sc->sc_provider;
102         if (!force && (pp->acr != 0 || pp->acw != 0 || pp->ace != 0)) {
103                 mtx_unlock(&g_gate_units_lock);
104                 return (EBUSY);
105         }
106         mtx_unlock(&g_gate_units_lock);
107         mtx_lock(&sc->sc_queue_mtx);
108         if ((sc->sc_flags & G_GATE_FLAG_DESTROY) == 0)
109                 sc->sc_flags |= G_GATE_FLAG_DESTROY;
110         wakeup(sc);
111         mtx_unlock(&sc->sc_queue_mtx);
112         gp = pp->geom;
113         pp->flags |= G_PF_WITHER;
114         g_orphan_provider(pp, ENXIO);
115         callout_drain(&sc->sc_callout);
116         mtx_lock(&sc->sc_queue_mtx);
117         while ((bp = bioq_first(&sc->sc_inqueue)) != NULL) {
118                 bioq_remove(&sc->sc_inqueue, bp);
119                 sc->sc_queue_count--;
120                 G_GATE_LOGREQ(1, bp, "Request canceled.");
121                 g_io_deliver(bp, ENXIO);
122         }
123         while ((bp = bioq_first(&sc->sc_outqueue)) != NULL) {
124                 bioq_remove(&sc->sc_outqueue, bp);
125                 sc->sc_queue_count--;
126                 G_GATE_LOGREQ(1, bp, "Request canceled.");
127                 g_io_deliver(bp, ENXIO);
128         }
129         mtx_unlock(&sc->sc_queue_mtx);
130         g_topology_unlock();
131         mtx_lock(&g_gate_units_lock);
132         /* One reference is ours. */
133         sc->sc_ref--;
134         while (sc->sc_ref > 0)
135                 msleep(&sc->sc_ref, &g_gate_units_lock, 0, "gg:destroy", 0);
136         g_gate_units[sc->sc_unit] = NULL;
137         KASSERT(g_gate_nunits > 0, ("negative g_gate_nunits?"));
138         g_gate_nunits--;
139         mtx_unlock(&g_gate_units_lock);
140         mtx_destroy(&sc->sc_queue_mtx);
141         g_topology_lock();
142         if ((cp = sc->sc_readcons) != NULL) {
143                 sc->sc_readcons = NULL;
144                 (void)g_access(cp, -1, 0, 0);
145                 g_detach(cp);
146                 g_destroy_consumer(cp);
147         }
148         G_GATE_DEBUG(1, "Device %s destroyed.", gp->name);
149         gp->softc = NULL;
150         g_wither_geom(gp, ENXIO);
151         sc->sc_provider = NULL;
152         free(sc, M_GATE);
153         return (0);
154 }
155
156 static int
157 g_gate_access(struct g_provider *pp, int dr, int dw, int de)
158 {
159         struct g_gate_softc *sc;
160
161         if (dr <= 0 && dw <= 0 && de <= 0)
162                 return (0);
163         sc = pp->geom->softc;
164         if (sc == NULL || (sc->sc_flags & G_GATE_FLAG_DESTROY) != 0)
165                 return (ENXIO);
166         /* XXX: Hack to allow read-only mounts. */
167 #if 0
168         if ((sc->sc_flags & G_GATE_FLAG_READONLY) != 0 && dw > 0)
169                 return (EPERM);
170 #endif
171         if ((sc->sc_flags & G_GATE_FLAG_WRITEONLY) != 0 && dr > 0)
172                 return (EPERM);
173         return (0);
174 }
175
176 static void
177 g_gate_queue_io(struct bio *bp)
178 {
179         struct g_gate_softc *sc;
180
181         sc = bp->bio_to->geom->softc;
182         if (sc == NULL || (sc->sc_flags & G_GATE_FLAG_DESTROY) != 0) {
183                 g_io_deliver(bp, ENXIO);
184                 return;
185         }
186
187         mtx_lock(&sc->sc_queue_mtx);
188
189         if (sc->sc_queue_size > 0 && sc->sc_queue_count > sc->sc_queue_size) {
190                 mtx_unlock(&sc->sc_queue_mtx);
191                 G_GATE_LOGREQ(1, bp, "Queue full, request canceled.");
192                 g_io_deliver(bp, ENOMEM);
193                 return;
194         }
195
196         bp->bio_driver1 = (void *)sc->sc_seq;
197         sc->sc_seq++;
198         sc->sc_queue_count++;
199
200         bioq_insert_tail(&sc->sc_inqueue, bp);
201         wakeup(sc);
202
203         mtx_unlock(&sc->sc_queue_mtx);
204 }
205
206 static void
207 g_gate_done(struct bio *cbp)
208 {
209         struct bio *pbp;
210
211         pbp = cbp->bio_parent;
212         if (cbp->bio_error == 0) {
213                 pbp->bio_completed = cbp->bio_completed;
214                 g_destroy_bio(cbp);
215                 pbp->bio_inbed++;
216                 g_io_deliver(pbp, 0);
217         } else {
218                 /* If direct read failed, pass it through userland daemon. */
219                 g_destroy_bio(cbp);
220                 pbp->bio_children--;
221                 g_gate_queue_io(pbp);
222         }
223 }
224
225 static void
226 g_gate_start(struct bio *pbp)
227 {
228         struct g_gate_softc *sc;
229
230         sc = pbp->bio_to->geom->softc;
231         if (sc == NULL || (sc->sc_flags & G_GATE_FLAG_DESTROY) != 0) {
232                 g_io_deliver(pbp, ENXIO);
233                 return;
234         }
235         G_GATE_LOGREQ(2, pbp, "Request received.");
236         switch (pbp->bio_cmd) {
237         case BIO_READ:
238                 if (sc->sc_readcons != NULL) {
239                         struct bio *cbp;
240
241                         cbp = g_clone_bio(pbp);
242                         if (cbp == NULL) {
243                                 g_io_deliver(pbp, ENOMEM);
244                                 return;
245                         }
246                         cbp->bio_done = g_gate_done;
247                         cbp->bio_offset = pbp->bio_offset + sc->sc_readoffset;
248                         cbp->bio_data = pbp->bio_data;
249                         cbp->bio_length = pbp->bio_length;
250                         cbp->bio_to = sc->sc_readcons->provider;
251                         g_io_request(cbp, sc->sc_readcons);
252                         return;
253                 }
254                 break;
255         case BIO_DELETE:
256         case BIO_WRITE:
257         case BIO_FLUSH:
258                 /* XXX: Hack to allow read-only mounts. */
259                 if ((sc->sc_flags & G_GATE_FLAG_READONLY) != 0) {
260                         g_io_deliver(pbp, EPERM);
261                         return;
262                 }
263                 break;
264         case BIO_GETATTR:
265         default:
266                 G_GATE_LOGREQ(2, pbp, "Ignoring request.");
267                 g_io_deliver(pbp, EOPNOTSUPP);
268                 return;
269         }
270
271         g_gate_queue_io(pbp);
272 }
273
274 static struct g_gate_softc *
275 g_gate_hold(int unit, const char *name)
276 {
277         struct g_gate_softc *sc = NULL;
278
279         mtx_lock(&g_gate_units_lock);
280         if (unit >= 0 && unit < g_gate_maxunits)
281                 sc = g_gate_units[unit];
282         else if (unit == G_GATE_NAME_GIVEN) {
283                 KASSERT(name != NULL, ("name is NULL"));
284                 for (unit = 0; unit < g_gate_maxunits; unit++) {
285                         if (g_gate_units[unit] == NULL)
286                                 continue;
287                         if (strcmp(name,
288                             g_gate_units[unit]->sc_provider->name) != 0) {
289                                 continue;
290                         }
291                         sc = g_gate_units[unit];
292                         break;
293                 }
294         }
295         if (sc != NULL)
296                 sc->sc_ref++;
297         mtx_unlock(&g_gate_units_lock);
298         return (sc);
299 }
300
301 static void
302 g_gate_release(struct g_gate_softc *sc)
303 {
304
305         g_topology_assert_not();
306         mtx_lock(&g_gate_units_lock);
307         sc->sc_ref--;
308         KASSERT(sc->sc_ref >= 0, ("Negative sc_ref for %s.", sc->sc_name));
309         if (sc->sc_ref == 0 && (sc->sc_flags & G_GATE_FLAG_DESTROY) != 0)
310                 wakeup(&sc->sc_ref);
311         mtx_unlock(&g_gate_units_lock);
312 }
313
314 static int
315 g_gate_getunit(int unit, int *errorp)
316 {
317
318         mtx_assert(&g_gate_units_lock, MA_OWNED);
319         if (unit >= 0) {
320                 if (unit >= g_gate_maxunits)
321                         *errorp = EINVAL;
322                 else if (g_gate_units[unit] == NULL)
323                         return (unit);
324                 else
325                         *errorp = EEXIST;
326         } else {
327                 for (unit = 0; unit < g_gate_maxunits; unit++) {
328                         if (g_gate_units[unit] == NULL)
329                                 return (unit);
330                 }
331                 *errorp = ENFILE;
332         }
333         return (-1);
334 }
335
336 static void
337 g_gate_guard(void *arg)
338 {
339         struct g_gate_softc *sc;
340         struct bintime curtime;
341         struct bio *bp, *bp2;
342
343         sc = arg;
344         binuptime(&curtime);
345         g_gate_hold(sc->sc_unit, NULL);
346         mtx_lock(&sc->sc_queue_mtx);
347         TAILQ_FOREACH_SAFE(bp, &sc->sc_inqueue.queue, bio_queue, bp2) {
348                 if (curtime.sec - bp->bio_t0.sec < 5)
349                         continue;
350                 bioq_remove(&sc->sc_inqueue, bp);
351                 sc->sc_queue_count--;
352                 G_GATE_LOGREQ(1, bp, "Request timeout.");
353                 g_io_deliver(bp, EIO);
354         }
355         TAILQ_FOREACH_SAFE(bp, &sc->sc_outqueue.queue, bio_queue, bp2) {
356                 if (curtime.sec - bp->bio_t0.sec < 5)
357                         continue;
358                 bioq_remove(&sc->sc_outqueue, bp);
359                 sc->sc_queue_count--;
360                 G_GATE_LOGREQ(1, bp, "Request timeout.");
361                 g_io_deliver(bp, EIO);
362         }
363         mtx_unlock(&sc->sc_queue_mtx);
364         if ((sc->sc_flags & G_GATE_FLAG_DESTROY) == 0) {
365                 callout_reset(&sc->sc_callout, sc->sc_timeout * hz,
366                     g_gate_guard, sc);
367         }
368         g_gate_release(sc);
369 }
370
371 static void
372 g_gate_orphan(struct g_consumer *cp)
373 {
374         struct g_gate_softc *sc;
375         struct g_geom *gp;
376
377         g_topology_assert();
378         gp = cp->geom;
379         sc = gp->softc;
380         if (sc == NULL)
381                 return;
382         KASSERT(cp == sc->sc_readcons, ("cp=%p sc_readcons=%p", cp,
383             sc->sc_readcons));
384         sc->sc_readcons = NULL;
385         G_GATE_DEBUG(1, "Destroying read consumer on provider %s orphan.",
386             cp->provider->name);
387         (void)g_access(cp, -1, 0, 0);
388         g_detach(cp);
389         g_destroy_consumer(cp);
390 }
391
392 static void
393 g_gate_dumpconf(struct sbuf *sb, const char *indent, struct g_geom *gp,
394     struct g_consumer *cp, struct g_provider *pp)
395 {
396         struct g_gate_softc *sc;
397
398         sc = gp->softc;
399         if (sc == NULL || pp != NULL || cp != NULL)
400                 return;
401         g_gate_hold(sc->sc_unit, NULL);
402         if ((sc->sc_flags & G_GATE_FLAG_READONLY) != 0) {
403                 sbuf_printf(sb, "%s<access>%s</access>\n", indent, "read-only");
404         } else if ((sc->sc_flags & G_GATE_FLAG_WRITEONLY) != 0) {
405                 sbuf_printf(sb, "%s<access>%s</access>\n", indent,
406                     "write-only");
407         } else {
408                 sbuf_printf(sb, "%s<access>%s</access>\n", indent,
409                     "read-write");
410         }
411         if (sc->sc_readcons != NULL) {
412                 sbuf_printf(sb, "%s<read_offset>%jd</read_offset>\n",
413                     indent, (intmax_t)sc->sc_readoffset);
414                 sbuf_printf(sb, "%s<read_provider>%s</read_provider>\n",
415                     indent, sc->sc_readcons->provider->name);
416         }
417         sbuf_printf(sb, "%s<timeout>%u</timeout>\n", indent, sc->sc_timeout);
418         sbuf_printf(sb, "%s<info>%s</info>\n", indent, sc->sc_info);
419         sbuf_printf(sb, "%s<queue_count>%u</queue_count>\n", indent,
420             sc->sc_queue_count);
421         sbuf_printf(sb, "%s<queue_size>%u</queue_size>\n", indent,
422             sc->sc_queue_size);
423         sbuf_printf(sb, "%s<ref>%u</ref>\n", indent, sc->sc_ref);
424         sbuf_printf(sb, "%s<unit>%d</unit>\n", indent, sc->sc_unit);
425         g_topology_unlock();
426         g_gate_release(sc);
427         g_topology_lock();
428 }
429
430 static int
431 g_gate_create(struct g_gate_ctl_create *ggio)
432 {
433         struct g_gate_softc *sc;
434         struct g_geom *gp;
435         struct g_provider *pp, *ropp;
436         struct g_consumer *cp;
437         char name[NAME_MAX];
438         int error = 0, unit;
439
440         if (ggio->gctl_mediasize <= 0) {
441                 G_GATE_DEBUG(1, "Invalid media size.");
442                 return (EINVAL);
443         }
444         if (ggio->gctl_sectorsize <= 0) {
445                 G_GATE_DEBUG(1, "Invalid sector size.");
446                 return (EINVAL);
447         }
448         if (!powerof2(ggio->gctl_sectorsize)) {
449                 G_GATE_DEBUG(1, "Invalid sector size.");
450                 return (EINVAL);
451         }
452         if ((ggio->gctl_mediasize % ggio->gctl_sectorsize) != 0) {
453                 G_GATE_DEBUG(1, "Invalid media size.");
454                 return (EINVAL);
455         }
456         if ((ggio->gctl_flags & G_GATE_FLAG_READONLY) != 0 &&
457             (ggio->gctl_flags & G_GATE_FLAG_WRITEONLY) != 0) {
458                 G_GATE_DEBUG(1, "Invalid flags.");
459                 return (EINVAL);
460         }
461         if (ggio->gctl_unit != G_GATE_UNIT_AUTO &&
462             ggio->gctl_unit != G_GATE_NAME_GIVEN &&
463             ggio->gctl_unit < 0) {
464                 G_GATE_DEBUG(1, "Invalid unit number.");
465                 return (EINVAL);
466         }
467         if (ggio->gctl_unit == G_GATE_NAME_GIVEN &&
468             ggio->gctl_name[0] == '\0') {
469                 G_GATE_DEBUG(1, "No device name.");
470                 return (EINVAL);
471         }
472
473         g_topology_lock();
474
475         if (ggio->gctl_readprov[0] == '\0') {
476                 ropp = NULL;
477         } else {
478                 ropp = g_provider_by_name(ggio->gctl_readprov);
479                 if (ropp == NULL) {
480                         g_topology_unlock();
481                         G_GATE_DEBUG(1, "Provider %s doesn't exist.",
482                             ggio->gctl_readprov);
483                         return (EINVAL);
484                 }
485                 if ((ggio->gctl_readoffset % ggio->gctl_sectorsize) != 0) {
486                         g_topology_unlock();
487                         G_GATE_DEBUG(1, "Invalid read offset.");
488                         return (EINVAL);
489                 }
490                 if (ggio->gctl_mediasize + ggio->gctl_readoffset >
491                     ropp->mediasize) {
492                         g_topology_unlock();
493                         G_GATE_DEBUG(1, "Invalid read offset or media size.");
494                         return (EINVAL);
495                 }
496         }
497
498         sc = malloc(sizeof(*sc), M_GATE, M_WAITOK | M_ZERO);
499         sc->sc_flags = (ggio->gctl_flags & G_GATE_USERFLAGS);
500         strlcpy(sc->sc_info, ggio->gctl_info, sizeof(sc->sc_info));
501         sc->sc_seq = 1;
502         bioq_init(&sc->sc_inqueue);
503         bioq_init(&sc->sc_outqueue);
504         mtx_init(&sc->sc_queue_mtx, "gg:queue", NULL, MTX_DEF);
505         sc->sc_queue_count = 0;
506         sc->sc_queue_size = ggio->gctl_maxcount;
507         if (sc->sc_queue_size > G_GATE_MAX_QUEUE_SIZE)
508                 sc->sc_queue_size = G_GATE_MAX_QUEUE_SIZE;
509         sc->sc_timeout = ggio->gctl_timeout;
510         callout_init(&sc->sc_callout, CALLOUT_MPSAFE);
511
512         gp = g_new_geomf(&g_gate_class, "%s", name);
513         gp->start = g_gate_start;
514         gp->access = g_gate_access;
515         gp->orphan = g_gate_orphan;
516         gp->dumpconf = g_gate_dumpconf;
517         gp->softc = sc;
518
519         if (ropp != NULL) {
520                 cp = g_new_consumer(gp);
521                 error = g_attach(cp, ropp);
522                 if (error != 0) {
523                         G_GATE_DEBUG(1, "Unable to attach to %s.", ropp->name);
524                 } else {
525                         error = g_access(cp, 1, 0, 0);
526                         if (error != 0) {
527                                 G_GATE_DEBUG(1, "Unable to access %s.",
528                                     ropp->name);
529                                 g_detach(cp);
530                         }
531                 }
532                 if (error != 0) {
533                         g_destroy_consumer(cp);
534                         g_destroy_geom(gp);
535                         g_topology_unlock();
536                         mtx_destroy(&sc->sc_queue_mtx);
537                         free(sc, M_GATE);
538                         return (error);
539                 }
540                 sc->sc_readcons = cp;
541                 sc->sc_readoffset = ggio->gctl_readoffset;
542         }
543
544         mtx_lock(&g_gate_units_lock);
545         sc->sc_unit = g_gate_getunit(ggio->gctl_unit, &error);
546         if (sc->sc_unit < 0) {
547                 mtx_unlock(&g_gate_units_lock);
548                 if (sc->sc_readcons != NULL) {
549                         (void)g_access(sc->sc_readcons, -1, 0, 0);
550                         g_detach(sc->sc_readcons);
551                         g_destroy_consumer(sc->sc_readcons);
552                 }
553                 g_destroy_geom(gp);
554                 g_topology_unlock();
555                 mtx_destroy(&sc->sc_queue_mtx);
556                 free(sc, M_GATE);
557                 return (error);
558         }
559         if (ggio->gctl_unit == G_GATE_NAME_GIVEN)
560                 snprintf(name, sizeof(name), "%s", ggio->gctl_name);
561         else {
562                 snprintf(name, sizeof(name), "%s%d", G_GATE_PROVIDER_NAME,
563                     sc->sc_unit);
564         }
565         /* Check for name collision. */
566         for (unit = 0; unit < g_gate_maxunits; unit++) {
567                 if (g_gate_units[unit] == NULL)
568                         continue;
569                 if (strcmp(name, g_gate_units[unit]->sc_name) != 0)
570                         continue;
571                 mtx_unlock(&g_gate_units_lock);
572                 if (sc->sc_readcons != NULL) {
573                         (void)g_access(sc->sc_readcons, -1, 0, 0);
574                         g_detach(sc->sc_readcons);
575                         g_destroy_consumer(sc->sc_readcons);
576                 }
577                 g_destroy_geom(gp);
578                 g_topology_unlock();
579                 mtx_destroy(&sc->sc_queue_mtx);
580                 free(sc, M_GATE);
581                 return (EEXIST);
582         }
583         sc->sc_name = name;
584         g_gate_units[sc->sc_unit] = sc;
585         g_gate_nunits++;
586         mtx_unlock(&g_gate_units_lock);
587
588         ggio->gctl_unit = sc->sc_unit;
589
590         pp = g_new_providerf(gp, "%s", name);
591         pp->mediasize = ggio->gctl_mediasize;
592         pp->sectorsize = ggio->gctl_sectorsize;
593         sc->sc_provider = pp;
594         g_error_provider(pp, 0);
595
596         g_topology_unlock();
597         mtx_lock(&g_gate_units_lock);
598         sc->sc_name = sc->sc_provider->name;
599         mtx_unlock(&g_gate_units_lock);
600         G_GATE_DEBUG(1, "Device %s created.", gp->name);
601
602         if (sc->sc_timeout > 0) {
603                 callout_reset(&sc->sc_callout, sc->sc_timeout * hz,
604                     g_gate_guard, sc);
605         }
606         return (0);
607 }
608
609 static int
610 g_gate_modify(struct g_gate_softc *sc, struct g_gate_ctl_modify *ggio)
611 {
612         struct g_provider *pp;
613         struct g_consumer *cp;
614         int error;
615
616         if ((ggio->gctl_modify & GG_MODIFY_MEDIASIZE) != 0) {
617                 if (ggio->gctl_mediasize <= 0) {
618                         G_GATE_DEBUG(1, "Invalid media size.");
619                         return (EINVAL);
620                 }
621                 pp = sc->sc_provider;
622                 if ((ggio->gctl_mediasize % pp->sectorsize) != 0) {
623                         G_GATE_DEBUG(1, "Invalid media size.");
624                         return (EINVAL);
625                 }
626                 /* TODO */
627                 return (EOPNOTSUPP);
628         }
629
630         if ((ggio->gctl_modify & GG_MODIFY_INFO) != 0)
631                 (void)strlcpy(sc->sc_info, ggio->gctl_info, sizeof(sc->sc_info));
632
633         cp = NULL;
634
635         if ((ggio->gctl_modify & GG_MODIFY_READPROV) != 0) {
636                 g_topology_lock();
637                 if (sc->sc_readcons != NULL) {
638                         cp = sc->sc_readcons;
639                         sc->sc_readcons = NULL;
640                         (void)g_access(cp, -1, 0, 0);
641                         g_detach(cp);
642                         g_destroy_consumer(cp);
643                 }
644                 if (ggio->gctl_readprov[0] != '\0') {
645                         pp = g_provider_by_name(ggio->gctl_readprov);
646                         if (pp == NULL) {
647                                 g_topology_unlock();
648                                 G_GATE_DEBUG(1, "Provider %s doesn't exist.",
649                                     ggio->gctl_readprov);
650                                 return (EINVAL);
651                         }
652                         cp = g_new_consumer(sc->sc_provider->geom);
653                         error = g_attach(cp, pp);
654                         if (error != 0) {
655                                 G_GATE_DEBUG(1, "Unable to attach to %s.",
656                                     pp->name);
657                         } else {
658                                 error = g_access(cp, 1, 0, 0);
659                                 if (error != 0) {
660                                         G_GATE_DEBUG(1, "Unable to access %s.",
661                                             pp->name);
662                                         g_detach(cp);
663                                 }
664                         }
665                         if (error != 0) {
666                                 g_destroy_consumer(cp);
667                                 g_topology_unlock();
668                                 return (error);
669                         }
670                 }
671         } else {
672                 cp = sc->sc_readcons;
673         }
674
675         if ((ggio->gctl_modify & GG_MODIFY_READOFFSET) != 0) {
676                 if (cp == NULL) {
677                         G_GATE_DEBUG(1, "No read provider.");
678                         return (EINVAL);
679                 }
680                 pp = sc->sc_provider;
681                 if ((ggio->gctl_readoffset % pp->sectorsize) != 0) {
682                         G_GATE_DEBUG(1, "Invalid read offset.");
683                         return (EINVAL);
684                 }
685                 if (pp->mediasize + ggio->gctl_readoffset >
686                     cp->provider->mediasize) {
687                         G_GATE_DEBUG(1, "Invalid read offset or media size.");
688                         return (EINVAL);
689                 }
690                 sc->sc_readoffset = ggio->gctl_readoffset;
691         }
692
693         if ((ggio->gctl_modify & GG_MODIFY_READPROV) != 0) {
694                 sc->sc_readcons = cp;
695                 g_topology_unlock();
696         }
697
698         return (0);
699 }
700
/*
 * Make the enclosing function return EINVAL (after printing a diagnostic)
 * when the request's gctl_version differs from G_GATE_VERSION.  'ggio' may
 * be any expression yielding a pointer to a structure with a gctl_version
 * member; it is evaluated more than once.
 */
#define	G_GATE_CHECK_VERSION(ggio)	do {				\
	if ((ggio)->gctl_version != G_GATE_VERSION) {			\
		printf("Version mismatch %d != %d.\n",			\
		    (ggio)->gctl_version, G_GATE_VERSION);		\
		return (EINVAL);					\
	}								\
} while (0)
708 static int
709 g_gate_ioctl(struct cdev *dev, u_long cmd, caddr_t addr, int flags, struct thread *td)
710 {
711         struct g_gate_softc *sc;
712         struct bio *bp;
713         int error = 0;
714
715         G_GATE_DEBUG(4, "ioctl(%s, %lx, %p, %x, %p)", devtoname(dev), cmd, addr,
716             flags, td);
717
718         switch (cmd) {
719         case G_GATE_CMD_CREATE:
720             {
721                 struct g_gate_ctl_create *ggio = (void *)addr;
722
723                 G_GATE_CHECK_VERSION(ggio);
724                 error = g_gate_create(ggio);
725                 /*
726                  * Reset TDP_GEOM flag.
727                  * There are pending events for sure, because we just created
728                  * new provider and other classes want to taste it, but we
729                  * cannot answer on I/O requests until we're here.
730                  */
731                 td->td_pflags &= ~TDP_GEOM;
732                 return (error);
733             }
734         case G_GATE_CMD_MODIFY:
735             {
736                 struct g_gate_ctl_modify *ggio = (void *)addr;
737
738                 G_GATE_CHECK_VERSION(ggio);
739                 sc = g_gate_hold(ggio->gctl_unit, NULL);
740                 if (sc == NULL)
741                         return (ENXIO);
742                 error = g_gate_modify(sc, ggio);
743                 g_gate_release(sc);
744                 return (error);
745             }
746         case G_GATE_CMD_DESTROY:
747             {
748                 struct g_gate_ctl_destroy *ggio = (void *)addr;
749
750                 G_GATE_CHECK_VERSION(ggio);
751                 sc = g_gate_hold(ggio->gctl_unit, ggio->gctl_name);
752                 if (sc == NULL)
753                         return (ENXIO);
754                 g_topology_lock();
755                 mtx_lock(&g_gate_units_lock);
756                 error = g_gate_destroy(sc, ggio->gctl_force);
757                 g_topology_unlock();
758                 if (error != 0)
759                         g_gate_release(sc);
760                 return (error);
761             }
762         case G_GATE_CMD_CANCEL:
763             {
764                 struct g_gate_ctl_cancel *ggio = (void *)addr;
765                 struct bio *tbp, *lbp;
766
767                 G_GATE_CHECK_VERSION(ggio);
768                 sc = g_gate_hold(ggio->gctl_unit, ggio->gctl_name);
769                 if (sc == NULL)
770                         return (ENXIO);
771                 lbp = NULL;
772                 mtx_lock(&sc->sc_queue_mtx);
773                 TAILQ_FOREACH_SAFE(bp, &sc->sc_outqueue.queue, bio_queue, tbp) {
774                         if (ggio->gctl_seq == 0 ||
775                             ggio->gctl_seq == (uintptr_t)bp->bio_driver1) {
776                                 G_GATE_LOGREQ(1, bp, "Request canceled.");
777                                 bioq_remove(&sc->sc_outqueue, bp);
778                                 /*
779                                  * Be sure to put requests back onto incoming
780                                  * queue in the proper order.
781                                  */
782                                 if (lbp == NULL)
783                                         bioq_insert_head(&sc->sc_inqueue, bp);
784                                 else {
785                                         TAILQ_INSERT_AFTER(&sc->sc_inqueue.queue,
786                                             lbp, bp, bio_queue);
787                                 }
788                                 lbp = bp;
789                                 /*
790                                  * If only one request was canceled, leave now.
791                                  */
792                                 if (ggio->gctl_seq != 0)
793                                         break;
794                         }
795                 }
796                 if (ggio->gctl_unit == G_GATE_NAME_GIVEN)
797                         ggio->gctl_unit = sc->sc_unit;
798                 mtx_unlock(&sc->sc_queue_mtx);
799                 g_gate_release(sc);
800                 return (error);
801             }
802         case G_GATE_CMD_START:
803             {
804                 struct g_gate_ctl_io *ggio = (void *)addr;
805
806                 G_GATE_CHECK_VERSION(ggio);
807                 sc = g_gate_hold(ggio->gctl_unit, NULL);
808                 if (sc == NULL)
809                         return (ENXIO);
810                 error = 0;
811                 for (;;) {
812                         mtx_lock(&sc->sc_queue_mtx);
813                         bp = bioq_first(&sc->sc_inqueue);
814                         if (bp != NULL)
815                                 break;
816                         if ((sc->sc_flags & G_GATE_FLAG_DESTROY) != 0) {
817                                 ggio->gctl_error = ECANCELED;
818                                 mtx_unlock(&sc->sc_queue_mtx);
819                                 goto start_end;
820                         }
821                         if (msleep(sc, &sc->sc_queue_mtx,
822                             PPAUSE | PDROP | PCATCH, "ggwait", 0) != 0) {
823                                 ggio->gctl_error = ECANCELED;
824                                 goto start_end;
825                         }
826                 }
827                 ggio->gctl_cmd = bp->bio_cmd;
828                 if ((bp->bio_cmd == BIO_DELETE || bp->bio_cmd == BIO_WRITE) &&
829                     bp->bio_length > ggio->gctl_length) {
830                         mtx_unlock(&sc->sc_queue_mtx);
831                         ggio->gctl_length = bp->bio_length;
832                         ggio->gctl_error = ENOMEM;
833                         goto start_end;
834                 }
835                 bioq_remove(&sc->sc_inqueue, bp);
836                 bioq_insert_tail(&sc->sc_outqueue, bp);
837                 mtx_unlock(&sc->sc_queue_mtx);
838
839                 ggio->gctl_seq = (uintptr_t)bp->bio_driver1;
840                 ggio->gctl_offset = bp->bio_offset;
841                 ggio->gctl_length = bp->bio_length;
842
843                 switch (bp->bio_cmd) {
844                 case BIO_READ:
845                 case BIO_DELETE:
846                 case BIO_FLUSH:
847                         break;
848                 case BIO_WRITE:
849                         error = copyout(bp->bio_data, ggio->gctl_data,
850                             bp->bio_length);
851                         if (error != 0) {
852                                 mtx_lock(&sc->sc_queue_mtx);
853                                 bioq_remove(&sc->sc_outqueue, bp);
854                                 bioq_insert_head(&sc->sc_inqueue, bp);
855                                 mtx_unlock(&sc->sc_queue_mtx);
856                                 goto start_end;
857                         }
858                         break;
859                 }
860 start_end:
861                 g_gate_release(sc);
862                 return (error);
863             }
864         case G_GATE_CMD_DONE:
865             {
866                 struct g_gate_ctl_io *ggio = (void *)addr;
867
868                 G_GATE_CHECK_VERSION(ggio);
869                 sc = g_gate_hold(ggio->gctl_unit, NULL);
870                 if (sc == NULL)
871                         return (ENOENT);
872                 error = 0;
873                 mtx_lock(&sc->sc_queue_mtx);
874                 TAILQ_FOREACH(bp, &sc->sc_outqueue.queue, bio_queue) {
875                         if (ggio->gctl_seq == (uintptr_t)bp->bio_driver1)
876                                 break;
877                 }
878                 if (bp != NULL) {
879                         bioq_remove(&sc->sc_outqueue, bp);
880                         sc->sc_queue_count--;
881                 }
882                 mtx_unlock(&sc->sc_queue_mtx);
883                 if (bp == NULL) {
884                         /*
885                          * Request was probably canceled.
886                          */
887                         goto done_end;
888                 }
889                 if (ggio->gctl_error == EAGAIN) {
890                         bp->bio_error = 0;
891                         G_GATE_LOGREQ(1, bp, "Request desisted.");
892                         mtx_lock(&sc->sc_queue_mtx);
893                         sc->sc_queue_count++;
894                         bioq_insert_head(&sc->sc_inqueue, bp);
895                         wakeup(sc);
896                         mtx_unlock(&sc->sc_queue_mtx);
897                 } else {
898                         bp->bio_error = ggio->gctl_error;
899                         if (bp->bio_error == 0) {
900                                 bp->bio_completed = bp->bio_length;
901                                 switch (bp->bio_cmd) {
902                                 case BIO_READ:
903                                         error = copyin(ggio->gctl_data,
904                                             bp->bio_data, bp->bio_length);
905                                         if (error != 0)
906                                                 bp->bio_error = error;
907                                         break;
908                                 case BIO_DELETE:
909                                 case BIO_WRITE:
910                                 case BIO_FLUSH:
911                                         break;
912                                 }
913                         }
914                         G_GATE_LOGREQ(2, bp, "Request done.");
915                         g_io_deliver(bp, bp->bio_error);
916                 }
917 done_end:
918                 g_gate_release(sc);
919                 return (error);
920             }
921         }
922         return (ENOIOCTL);
923 }
924
925 static void
926 g_gate_device(void)
927 {
928
929         status_dev = make_dev(&g_gate_cdevsw, 0x0, UID_ROOT, GID_WHEEL, 0600,
930             G_GATE_CTL_NAME);
931 }
932
933 static int
934 g_gate_modevent(module_t mod, int type, void *data)
935 {
936         int error = 0;
937
938         switch (type) {
939         case MOD_LOAD:
940                 mtx_init(&g_gate_units_lock, "gg_units_lock", NULL, MTX_DEF);
941                 g_gate_units = malloc(g_gate_maxunits * sizeof(g_gate_units[0]),
942                     M_GATE, M_WAITOK | M_ZERO);
943                 g_gate_nunits = 0;
944                 g_gate_device();
945                 break;
946         case MOD_UNLOAD:
947                 mtx_lock(&g_gate_units_lock);
948                 if (g_gate_nunits > 0) {
949                         mtx_unlock(&g_gate_units_lock);
950                         error = EBUSY;
951                         break;
952                 }
953                 mtx_unlock(&g_gate_units_lock);
954                 mtx_destroy(&g_gate_units_lock);
955                 if (status_dev != 0)
956                         destroy_dev(status_dev);
957                 free(g_gate_units, M_GATE);
958                 break;
959         default:
960                 return (EOPNOTSUPP);
961                 break;
962         }
963
964         return (error);
965 }
966 static moduledata_t g_gate_module = {
967         G_GATE_MOD_NAME,
968         g_gate_modevent,
969         NULL
970 };
971 DECLARE_MODULE(geom_gate, g_gate_module, SI_SUB_DRIVERS, SI_ORDER_MIDDLE);
972 DECLARE_GEOM_CLASS(g_gate_class, g_gate);