/*	$NetBSD: svc.c,v 1.21 2000/07/06 03:10:35 christos Exp $	*/

/*-
 * Copyright (c) 2009, Sun Microsystems, Inc.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 * - Redistributions of source code must retain the above copyright notice,
 *   this list of conditions and the following disclaimer.
 * - Redistributions in binary form must reproduce the above copyright notice,
 *   this list of conditions and the following disclaimer in the documentation
 *   and/or other materials provided with the distribution.
 * - Neither the name of Sun Microsystems, Inc. nor the names of its
 *   contributors may be used to endorse or promote products derived
 *   from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

#if defined(LIBC_SCCS) && !defined(lint)
static char *sccsid2 = "@(#)svc.c 1.44 88/02/08 Copyr 1984 Sun Micro";
static char *sccsid = "@(#)svc.c	2.4 88/08/11 4.0 RPCSRC";
#endif
#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");

/*
 * svc.c, Server-side remote procedure call interface.
 *
 * There are two sets of procedures here.  The xprt routines are
 * for handling transport handles.  The svc routines handle the
 * list of service routines.
 *
 * Copyright (C) 1984, Sun Microsystems, Inc.
 */
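
/*
 * As a quick orientation (an illustrative sketch, not code from this
 * file): a kernel RPC service built on these routines typically creates
 * a pool, registers a program/version pair with a dispatch function on
 * each transport (obtained from a transport backend such as
 * svc_vc_create()), and then donates threads to the pool via svc_run().
 * The names MYSVC_PROG, MYSVC_VERS and mysvc_dispatch below are
 * hypothetical.
 *
 *	SVCPOOL *pool;
 *
 *	pool = svcpool_create("mysvc", NULL);
 *	pool->sp_minthreads = 4;
 *	pool->sp_maxthreads = 64;
 *	svc_reg(xprt, MYSVC_PROG, MYSVC_VERS, mysvc_dispatch, nconf);
 *	svc_run(pool);			(blocks until svc_exit(pool))
 *	svcpool_destroy(pool);
 */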

#include <sys/param.h>
#include <sys/lock.h>
#include <sys/kernel.h>
#include <sys/kthread.h>
#include <sys/malloc.h>
#include <sys/mbuf.h>
#include <sys/mutex.h>
#include <sys/proc.h>
#include <sys/queue.h>
#include <sys/socketvar.h>
#include <sys/systm.h>
#include <sys/smp.h>
#include <sys/sx.h>
#include <sys/ucred.h>

#include <rpc/rpc.h>
#include <rpc/rpcb_clnt.h>
#include <rpc/replay.h>

#include <rpc/rpc_com.h>

#define SVC_VERSQUIET 0x0001		/* keep quiet about vers mismatch */
#define version_keepquiet(xp) (SVC_EXT(xp)->xp_flags & SVC_VERSQUIET)

static struct svc_callout *svc_find(SVCPOOL *pool, rpcprog_t, rpcvers_t,
    char *);
static void svc_new_thread(SVCGROUP *grp);
static void xprt_unregister_locked(SVCXPRT *xprt);
static void svc_change_space_used(SVCPOOL *pool, long delta);
static bool_t svc_request_space_available(SVCPOOL *pool);

/* ***************  SVCXPRT related stuff **************** */

static int svcpool_minthread_sysctl(SYSCTL_HANDLER_ARGS);
static int svcpool_maxthread_sysctl(SYSCTL_HANDLER_ARGS);
static int svcpool_threads_sysctl(SYSCTL_HANDLER_ARGS);

SVCPOOL*
svcpool_create(const char *name, struct sysctl_oid_list *sysctl_base)
{
	SVCPOOL *pool;
	SVCGROUP *grp;
	int g;

	pool = malloc(sizeof(SVCPOOL), M_RPC, M_WAITOK|M_ZERO);

	mtx_init(&pool->sp_lock, "sp_lock", NULL, MTX_DEF);
	pool->sp_name = name;
	pool->sp_state = SVCPOOL_INIT;
	pool->sp_proc = NULL;
	TAILQ_INIT(&pool->sp_callouts);
	TAILQ_INIT(&pool->sp_lcallouts);
	pool->sp_minthreads = 1;
	pool->sp_maxthreads = 1;
	pool->sp_groupcount = 1;
	for (g = 0; g < SVC_MAXGROUPS; g++) {
		grp = &pool->sp_groups[g];
		mtx_init(&grp->sg_lock, "sg_lock", NULL, MTX_DEF);
		grp->sg_pool = pool;
		grp->sg_state = SVCPOOL_ACTIVE;
		TAILQ_INIT(&grp->sg_xlist);
		TAILQ_INIT(&grp->sg_active);
		LIST_INIT(&grp->sg_idlethreads);
		grp->sg_minthreads = 1;
		grp->sg_maxthreads = 1;
	}

	/*
	 * Don't use more than a quarter of mbuf clusters.  Nota bene:
	 * nmbclusters is an int, but nmbclusters*MCLBYTES may overflow
	 * on LP64 architectures, so cast to u_long to avoid undefined
	 * behavior.  (ILP32 architectures cannot have nmbclusters
	 * large enough to overflow for other reasons.)
	 */
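	/*
	 * For instance (illustrative numbers): with MCLBYTES = 2048 and
	 * nmbclusters = 1048576, the int product would be 2^31 and
	 * overflow; computed as u_long it is 2147483648, giving an
	 * sp_space_high of 512MB.
	 */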
	pool->sp_space_high = (u_long)nmbclusters * MCLBYTES / 4;
	pool->sp_space_low = (pool->sp_space_high / 3) * 2;

	sysctl_ctx_init(&pool->sp_sysctl);
	if (sysctl_base) {
		SYSCTL_ADD_PROC(&pool->sp_sysctl, sysctl_base, OID_AUTO,
		    "minthreads", CTLTYPE_INT | CTLFLAG_RW,
		    pool, 0, svcpool_minthread_sysctl, "I",
		    "Minimal number of threads");
		SYSCTL_ADD_PROC(&pool->sp_sysctl, sysctl_base, OID_AUTO,
		    "maxthreads", CTLTYPE_INT | CTLFLAG_RW,
		    pool, 0, svcpool_maxthread_sysctl, "I",
		    "Maximal number of threads");
		SYSCTL_ADD_PROC(&pool->sp_sysctl, sysctl_base, OID_AUTO,
		    "threads", CTLTYPE_INT | CTLFLAG_RD,
		    pool, 0, svcpool_threads_sysctl, "I",
		    "Current number of threads");
		SYSCTL_ADD_INT(&pool->sp_sysctl, sysctl_base, OID_AUTO,
		    "groups", CTLFLAG_RD, &pool->sp_groupcount, 0,
		    "Number of thread groups");

		SYSCTL_ADD_ULONG(&pool->sp_sysctl, sysctl_base, OID_AUTO,
		    "request_space_used", CTLFLAG_RD,
		    &pool->sp_space_used,
		    "Space in parsed but not handled requests.");

		SYSCTL_ADD_ULONG(&pool->sp_sysctl, sysctl_base, OID_AUTO,
		    "request_space_used_highest", CTLFLAG_RD,
		    &pool->sp_space_used_highest,
		    "Highest space used since reboot.");

		SYSCTL_ADD_ULONG(&pool->sp_sysctl, sysctl_base, OID_AUTO,
		    "request_space_high", CTLFLAG_RW,
		    &pool->sp_space_high,
		    "Maximum space in parsed but not handled requests.");

		SYSCTL_ADD_ULONG(&pool->sp_sysctl, sysctl_base, OID_AUTO,
		    "request_space_low", CTLFLAG_RW,
		    &pool->sp_space_low,
		    "Low water mark for request space.");

		SYSCTL_ADD_INT(&pool->sp_sysctl, sysctl_base, OID_AUTO,
		    "request_space_throttled", CTLFLAG_RD,
		    &pool->sp_space_throttled, 0,
		    "Whether nfs requests are currently throttled");

		SYSCTL_ADD_INT(&pool->sp_sysctl, sysctl_base, OID_AUTO,
		    "request_space_throttle_count", CTLFLAG_RD,
		    &pool->sp_space_throttle_count, 0,
		    "Count of times throttling based on request space has occurred");
	}

	return pool;
}

void
svcpool_destroy(SVCPOOL *pool)
{
	SVCGROUP *grp;
	SVCXPRT *xprt, *nxprt;
	struct svc_callout *s;
	struct svc_loss_callout *sl;
	struct svcxprt_list cleanup;
	int g;

	TAILQ_INIT(&cleanup);

	for (g = 0; g < SVC_MAXGROUPS; g++) {
		grp = &pool->sp_groups[g];
		mtx_lock(&grp->sg_lock);
		while ((xprt = TAILQ_FIRST(&grp->sg_xlist)) != NULL) {
			xprt_unregister_locked(xprt);
			TAILQ_INSERT_TAIL(&cleanup, xprt, xp_link);
		}
		mtx_unlock(&grp->sg_lock);
	}
	TAILQ_FOREACH_SAFE(xprt, &cleanup, xp_link, nxprt) {
		SVC_RELEASE(xprt);
	}

	mtx_lock(&pool->sp_lock);
	while ((s = TAILQ_FIRST(&pool->sp_callouts)) != NULL) {
		mtx_unlock(&pool->sp_lock);
		svc_unreg(pool, s->sc_prog, s->sc_vers);
		mtx_lock(&pool->sp_lock);
	}
	while ((sl = TAILQ_FIRST(&pool->sp_lcallouts)) != NULL) {
		mtx_unlock(&pool->sp_lock);
		svc_loss_unreg(pool, sl->slc_dispatch);
		mtx_lock(&pool->sp_lock);
	}
	mtx_unlock(&pool->sp_lock);

	for (g = 0; g < SVC_MAXGROUPS; g++) {
		grp = &pool->sp_groups[g];
		mtx_destroy(&grp->sg_lock);
	}
	mtx_destroy(&pool->sp_lock);

	if (pool->sp_rcache)
		replay_freecache(pool->sp_rcache);

	sysctl_ctx_free(&pool->sp_sysctl);
	free(pool, M_RPC);
}

/*
 * Sysctl handler to get the present thread count on a pool
 */
static int
svcpool_threads_sysctl(SYSCTL_HANDLER_ARGS)
{
	SVCPOOL *pool;
	int threads, error, g;

	pool = oidp->oid_arg1;
	threads = 0;
	mtx_lock(&pool->sp_lock);
	for (g = 0; g < pool->sp_groupcount; g++)
		threads += pool->sp_groups[g].sg_threadcount;
	mtx_unlock(&pool->sp_lock);
	error = sysctl_handle_int(oidp, &threads, 0, req);
	return (error);
}

/*
 * Sysctl handler to set the minimum thread count on a pool
 */
static int
svcpool_minthread_sysctl(SYSCTL_HANDLER_ARGS)
{
	SVCPOOL *pool;
	int newminthreads, error, g;

	pool = oidp->oid_arg1;
	newminthreads = pool->sp_minthreads;
	error = sysctl_handle_int(oidp, &newminthreads, 0, req);
	if (error == 0 && newminthreads != pool->sp_minthreads) {
		if (newminthreads > pool->sp_maxthreads)
			return (EINVAL);
		mtx_lock(&pool->sp_lock);
		pool->sp_minthreads = newminthreads;
		for (g = 0; g < pool->sp_groupcount; g++) {
			pool->sp_groups[g].sg_minthreads = max(1,
			    pool->sp_minthreads / pool->sp_groupcount);
		}
		mtx_unlock(&pool->sp_lock);
	}
	return (error);
}

/*
 * Sysctl handler to set the maximum thread count on a pool
 */
static int
svcpool_maxthread_sysctl(SYSCTL_HANDLER_ARGS)
{
	SVCPOOL *pool;
	int newmaxthreads, error, g;

	pool = oidp->oid_arg1;
	newmaxthreads = pool->sp_maxthreads;
	error = sysctl_handle_int(oidp, &newmaxthreads, 0, req);
	if (error == 0 && newmaxthreads != pool->sp_maxthreads) {
		if (newmaxthreads < pool->sp_minthreads)
			return (EINVAL);
		mtx_lock(&pool->sp_lock);
		pool->sp_maxthreads = newmaxthreads;
		for (g = 0; g < pool->sp_groupcount; g++) {
			pool->sp_groups[g].sg_maxthreads = max(1,
			    pool->sp_maxthreads / pool->sp_groupcount);
		}
		mtx_unlock(&pool->sp_lock);
	}
	return (error);
}

/*
 * Activate a transport handle.
 */
void
xprt_register(SVCXPRT *xprt)
{
	SVCPOOL *pool = xprt->xp_pool;
	SVCGROUP *grp;
	int g;

	SVC_ACQUIRE(xprt);
	g = atomic_fetchadd_int(&pool->sp_nextgroup, 1) % pool->sp_groupcount;
	xprt->xp_group = grp = &pool->sp_groups[g];
	mtx_lock(&grp->sg_lock);
	xprt->xp_registered = TRUE;
	xprt->xp_active = FALSE;
	TAILQ_INSERT_TAIL(&grp->sg_xlist, xprt, xp_link);
	mtx_unlock(&grp->sg_lock);
}

/*
 * De-activate a transport handle. Note: the locked version doesn't
 * release the transport - caller must do that after dropping the pool
 * lock.
 */
static void
xprt_unregister_locked(SVCXPRT *xprt)
{
	SVCGROUP *grp = xprt->xp_group;

	mtx_assert(&grp->sg_lock, MA_OWNED);
	KASSERT(xprt->xp_registered == TRUE,
	    ("xprt_unregister_locked: not registered"));
	xprt_inactive_locked(xprt);
	TAILQ_REMOVE(&grp->sg_xlist, xprt, xp_link);
	xprt->xp_registered = FALSE;
}

void
xprt_unregister(SVCXPRT *xprt)
{
	SVCGROUP *grp = xprt->xp_group;

	mtx_lock(&grp->sg_lock);
	if (xprt->xp_registered == FALSE) {
		/* Already unregistered by another thread */
		mtx_unlock(&grp->sg_lock);
		return;
	}
	xprt_unregister_locked(xprt);
	mtx_unlock(&grp->sg_lock);

	SVC_RELEASE(xprt);
}

/*
 * Attempt to assign a service thread to this transport.
 */
static int
xprt_assignthread(SVCXPRT *xprt)
{
	SVCGROUP *grp = xprt->xp_group;
	SVCTHREAD *st;

	mtx_assert(&grp->sg_lock, MA_OWNED);
	st = LIST_FIRST(&grp->sg_idlethreads);
	if (st) {
		LIST_REMOVE(st, st_ilink);
		SVC_ACQUIRE(xprt);
		xprt->xp_thread = st;
		st->st_xprt = xprt;
		cv_signal(&st->st_cond);
		return (TRUE);
	} else {
		/*
		 * See if we can create a new thread. The
		 * actual thread creation happens in
		 * svc_run_internal because our locking state
		 * is poorly defined (we are typically called
		 * from a socket upcall). Don't create more
		 * than one thread per second.
		 */
		if (grp->sg_state == SVCPOOL_ACTIVE
		    && grp->sg_lastcreatetime < time_uptime
		    && grp->sg_threadcount < grp->sg_maxthreads) {
			grp->sg_state = SVCPOOL_THREADWANTED;
		}
	}
	return (FALSE);
}

void
xprt_active(SVCXPRT *xprt)
{
	SVCGROUP *grp = xprt->xp_group;

	mtx_lock(&grp->sg_lock);

	if (!xprt->xp_registered) {
		/*
		 * Race with xprt_unregister - we lose.
		 */
		mtx_unlock(&grp->sg_lock);
		return;
	}

	if (!xprt->xp_active) {
		xprt->xp_active = TRUE;
		if (xprt->xp_thread == NULL) {
			if (!svc_request_space_available(xprt->xp_pool) ||
			    !xprt_assignthread(xprt))
				TAILQ_INSERT_TAIL(&grp->sg_active, xprt,
				    xp_alink);
		}
	}

	mtx_unlock(&grp->sg_lock);
}

void
xprt_inactive_locked(SVCXPRT *xprt)
{
	SVCGROUP *grp = xprt->xp_group;

	mtx_assert(&grp->sg_lock, MA_OWNED);
	if (xprt->xp_active) {
		if (xprt->xp_thread == NULL)
			TAILQ_REMOVE(&grp->sg_active, xprt, xp_alink);
		xprt->xp_active = FALSE;
	}
}

void
xprt_inactive(SVCXPRT *xprt)
{
	SVCGROUP *grp = xprt->xp_group;

	mtx_lock(&grp->sg_lock);
	xprt_inactive_locked(xprt);
	mtx_unlock(&grp->sg_lock);
}

/*
 * Variant of xprt_inactive() for use only when sure that the port is
 * assigned to a thread. For example, within receive handlers.
 */
void
xprt_inactive_self(SVCXPRT *xprt)
{

	KASSERT(xprt->xp_thread != NULL,
	    ("xprt_inactive_self(%p) with NULL xp_thread", xprt));
	xprt->xp_active = FALSE;
}

/*
 * Add a service program to the callout list.
 * The dispatch routine will be called when an RPC request for this
 * program number comes in.
 */
bool_t
svc_reg(SVCXPRT *xprt, const rpcprog_t prog, const rpcvers_t vers,
    void (*dispatch)(struct svc_req *, SVCXPRT *),
    const struct netconfig *nconf)
{
	SVCPOOL *pool = xprt->xp_pool;
	struct svc_callout *s;
	char *netid = NULL;
	int flag = 0;

/* VARIABLES PROTECTED BY svc_lock: s, svc_head */

	if (xprt->xp_netid) {
		netid = strdup(xprt->xp_netid, M_RPC);
		flag = 1;
	} else if (nconf && nconf->nc_netid) {
		netid = strdup(nconf->nc_netid, M_RPC);
		flag = 1;
	} /* must have been created with svc_raw_create */
	if ((netid == NULL) && (flag == 1)) {
		return (FALSE);
	}

	mtx_lock(&pool->sp_lock);
	if ((s = svc_find(pool, prog, vers, netid)) != NULL) {
		if (netid)
			free(netid, M_RPC);
		if (s->sc_dispatch == dispatch)
			goto rpcb_it; /* he is registering another xprt */
		mtx_unlock(&pool->sp_lock);
		return (FALSE);
	}
	s = malloc(sizeof (struct svc_callout), M_RPC, M_NOWAIT);
	if (s == NULL) {
		if (netid)
			free(netid, M_RPC);
		mtx_unlock(&pool->sp_lock);
		return (FALSE);
	}

	s->sc_prog = prog;
	s->sc_vers = vers;
	s->sc_dispatch = dispatch;
	s->sc_netid = netid;
	TAILQ_INSERT_TAIL(&pool->sp_callouts, s, sc_link);

	if ((xprt->xp_netid == NULL) && (flag == 1) && netid)
		((SVCXPRT *) xprt)->xp_netid = strdup(netid, M_RPC);

rpcb_it:
	mtx_unlock(&pool->sp_lock);
	/* now register the information with the local binder service */
	if (nconf) {
		bool_t dummy;
		struct netconfig tnc;
		struct netbuf nb;
		tnc = *nconf;
		nb.buf = &xprt->xp_ltaddr;
		nb.len = xprt->xp_ltaddr.ss_len;
		dummy = rpcb_set(prog, vers, &tnc, &nb);
		return (dummy);
	}
	return (TRUE);
}
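
/*
 * Illustrative registration sketch (not code from this file): a service
 * registers each program/version pair it serves on every transport it
 * creates.  MYSVC_PROG and MYSVC_VERS are hypothetical constants.
 *
 *	if (!svc_reg(xprt, MYSVC_PROG, MYSVC_VERS, mysvc_dispatch, nconf))
 *		printf("mysvc: cannot register (%u, %u)\n",
 *		    (unsigned)MYSVC_PROG, (unsigned)MYSVC_VERS);
 *
 * Passing a NULL netconfig skips the rpcb_set() registration with the
 * local binder at the end of svc_reg().
 */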

/*
 * Remove a service program from the callout list.
 */
void
svc_unreg(SVCPOOL *pool, const rpcprog_t prog, const rpcvers_t vers)
{
	struct svc_callout *s;

	/* unregister the information anyway */
	(void) rpcb_unset(prog, vers, NULL);
	mtx_lock(&pool->sp_lock);
	while ((s = svc_find(pool, prog, vers, NULL)) != NULL) {
		TAILQ_REMOVE(&pool->sp_callouts, s, sc_link);
		if (s->sc_netid)
			mem_free(s->sc_netid, strlen(s->sc_netid) + 1);
		mem_free(s, sizeof (struct svc_callout));
	}
	mtx_unlock(&pool->sp_lock);
}

/*
 * Add a service connection loss program to the callout list.
 * The dispatch routine will be called when some transport in this
 * pool dies.
 */
bool_t
svc_loss_reg(SVCXPRT *xprt, void (*dispatch)(SVCXPRT *))
{
	SVCPOOL *pool = xprt->xp_pool;
	struct svc_loss_callout *s;

	mtx_lock(&pool->sp_lock);
	TAILQ_FOREACH(s, &pool->sp_lcallouts, slc_link) {
		if (s->slc_dispatch == dispatch)
			break;
	}
	if (s != NULL) {
		mtx_unlock(&pool->sp_lock);
		return (TRUE);
	}
	s = malloc(sizeof (struct svc_loss_callout), M_RPC, M_NOWAIT);
	if (s == NULL) {
		mtx_unlock(&pool->sp_lock);
		return (FALSE);
	}
	s->slc_dispatch = dispatch;
	TAILQ_INSERT_TAIL(&pool->sp_lcallouts, s, slc_link);
	mtx_unlock(&pool->sp_lock);
	return (TRUE);
}
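
/*
 * Illustrative sketch (not code from this file): a connection-oriented
 * service can learn about dead transports by registering a loss
 * callout; mysvc_lost is a hypothetical handler.
 *
 *	static void
 *	mysvc_lost(SVCXPRT *xprt)
 *	{
 *		... tear down per-connection state tied to xprt ...
 *	}
 *
 *	svc_loss_reg(xprt, mysvc_lost);
 *
 * The handlers run from svc_getreq() when SVC_STAT() reports XPRT_DIED.
 */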

/*
 * Remove a service connection loss program from the callout list.
 */
void
svc_loss_unreg(SVCPOOL *pool, void (*dispatch)(SVCXPRT *))
{
	struct svc_loss_callout *s;

	mtx_lock(&pool->sp_lock);
	TAILQ_FOREACH(s, &pool->sp_lcallouts, slc_link) {
		if (s->slc_dispatch == dispatch) {
			TAILQ_REMOVE(&pool->sp_lcallouts, s, slc_link);
			free(s, M_RPC);
			break;
		}
	}
	mtx_unlock(&pool->sp_lock);
}

/* ********************** CALLOUT list related stuff ************* */

/*
 * Search the callout list for a program number, return the callout
 * struct.
 */
static struct svc_callout *
svc_find(SVCPOOL *pool, rpcprog_t prog, rpcvers_t vers, char *netid)
{
	struct svc_callout *s;

	mtx_assert(&pool->sp_lock, MA_OWNED);
	TAILQ_FOREACH(s, &pool->sp_callouts, sc_link) {
		if (s->sc_prog == prog && s->sc_vers == vers
		    && (netid == NULL || s->sc_netid == NULL ||
			strcmp(netid, s->sc_netid) == 0))
			break;
	}

	return (s);
}

/* ******************* REPLY GENERATION ROUTINES  ************ */

static bool_t
svc_sendreply_common(struct svc_req *rqstp, struct rpc_msg *rply,
    struct mbuf *body)
{
	SVCXPRT *xprt = rqstp->rq_xprt;
	bool_t ok;

	if (rqstp->rq_args) {
		m_freem(rqstp->rq_args);
		rqstp->rq_args = NULL;
	}

	if (xprt->xp_pool->sp_rcache)
		replay_setreply(xprt->xp_pool->sp_rcache,
		    rply, svc_getrpccaller(rqstp), body);

	if (!SVCAUTH_WRAP(&rqstp->rq_auth, &body))
		return (FALSE);

	ok = SVC_REPLY(xprt, rply, rqstp->rq_addr, body, &rqstp->rq_reply_seq);
	if (rqstp->rq_addr) {
		free(rqstp->rq_addr, M_SONAME);
		rqstp->rq_addr = NULL;
	}

	return (ok);
}

/*
 * Send a reply to an rpc request
 */
bool_t
svc_sendreply(struct svc_req *rqstp, xdrproc_t xdr_results, void * xdr_location)
{
	struct rpc_msg rply;
	struct mbuf *m;
	XDR xdrs;
	bool_t ok;

	rply.rm_xid = rqstp->rq_xid;
	rply.rm_direction = REPLY;
	rply.rm_reply.rp_stat = MSG_ACCEPTED;
	rply.acpted_rply.ar_verf = rqstp->rq_verf;
	rply.acpted_rply.ar_stat = SUCCESS;
	rply.acpted_rply.ar_results.where = NULL;
	rply.acpted_rply.ar_results.proc = (xdrproc_t) xdr_void;

	m = m_getcl(M_WAITOK, MT_DATA, 0);
	xdrmbuf_create(&xdrs, m, XDR_ENCODE);
	ok = xdr_results(&xdrs, xdr_location);
	XDR_DESTROY(&xdrs);

	if (ok) {
		return (svc_sendreply_common(rqstp, &rply, m));
	} else {
		m_freem(m);
		return (FALSE);
	}
}
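
/*
 * Illustrative dispatch sketch (not code from this file): a routine
 * registered via svc_reg() owns the request and must finish by calling
 * svc_freereq().  The procedure number, argument/result types, XDR
 * routines and handler below are all hypothetical.
 *
 *	static void
 *	mysvc_dispatch(struct svc_req *rqstp, SVCXPRT *xprt)
 *	{
 *		struct mysvc_args args;
 *		struct mysvc_res res;
 *
 *		switch (rqstp->rq_proc) {
 *		case MYSVCPROC_DOIT:
 *			if (!svc_getargs(rqstp, (xdrproc_t)xdr_mysvc_args,
 *			    &args)) {
 *				svcerr_decode(rqstp);
 *				break;
 *			}
 *			mysvc_doit(&args, &res);
 *			svc_sendreply(rqstp, (xdrproc_t)xdr_mysvc_res, &res);
 *			svc_freeargs(rqstp, (xdrproc_t)xdr_mysvc_args, &args);
 *			break;
 *		default:
 *			svcerr_noproc(rqstp);
 *			break;
 *		}
 *		svc_freereq(rqstp);
 *	}
 */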

bool_t
svc_sendreply_mbuf(struct svc_req *rqstp, struct mbuf *m)
{
	struct rpc_msg rply;

	rply.rm_xid = rqstp->rq_xid;
	rply.rm_direction = REPLY;
	rply.rm_reply.rp_stat = MSG_ACCEPTED;
	rply.acpted_rply.ar_verf = rqstp->rq_verf;
	rply.acpted_rply.ar_stat = SUCCESS;
	rply.acpted_rply.ar_results.where = NULL;
	rply.acpted_rply.ar_results.proc = (xdrproc_t) xdr_void;

	return (svc_sendreply_common(rqstp, &rply, m));
}

/*
 * No procedure error reply
 */
void
svcerr_noproc(struct svc_req *rqstp)
{
	SVCXPRT *xprt = rqstp->rq_xprt;
	struct rpc_msg rply;

	rply.rm_xid = rqstp->rq_xid;
	rply.rm_direction = REPLY;
	rply.rm_reply.rp_stat = MSG_ACCEPTED;
	rply.acpted_rply.ar_verf = rqstp->rq_verf;
	rply.acpted_rply.ar_stat = PROC_UNAVAIL;

	if (xprt->xp_pool->sp_rcache)
		replay_setreply(xprt->xp_pool->sp_rcache,
		    &rply, svc_getrpccaller(rqstp), NULL);

	svc_sendreply_common(rqstp, &rply, NULL);
}

/*
 * Can't decode args error reply
 */
void
svcerr_decode(struct svc_req *rqstp)
{
	SVCXPRT *xprt = rqstp->rq_xprt;
	struct rpc_msg rply;

	rply.rm_xid = rqstp->rq_xid;
	rply.rm_direction = REPLY;
	rply.rm_reply.rp_stat = MSG_ACCEPTED;
	rply.acpted_rply.ar_verf = rqstp->rq_verf;
	rply.acpted_rply.ar_stat = GARBAGE_ARGS;

	if (xprt->xp_pool->sp_rcache)
		replay_setreply(xprt->xp_pool->sp_rcache,
		    &rply, (struct sockaddr *) &xprt->xp_rtaddr, NULL);

	svc_sendreply_common(rqstp, &rply, NULL);
}

/*
 * Some system error
 */
void
svcerr_systemerr(struct svc_req *rqstp)
{
	SVCXPRT *xprt = rqstp->rq_xprt;
	struct rpc_msg rply;

	rply.rm_xid = rqstp->rq_xid;
	rply.rm_direction = REPLY;
	rply.rm_reply.rp_stat = MSG_ACCEPTED;
	rply.acpted_rply.ar_verf = rqstp->rq_verf;
	rply.acpted_rply.ar_stat = SYSTEM_ERR;

	if (xprt->xp_pool->sp_rcache)
		replay_setreply(xprt->xp_pool->sp_rcache,
		    &rply, svc_getrpccaller(rqstp), NULL);

	svc_sendreply_common(rqstp, &rply, NULL);
}

/*
 * Authentication error reply
 */
void
svcerr_auth(struct svc_req *rqstp, enum auth_stat why)
{
	SVCXPRT *xprt = rqstp->rq_xprt;
	struct rpc_msg rply;

	rply.rm_xid = rqstp->rq_xid;
	rply.rm_direction = REPLY;
	rply.rm_reply.rp_stat = MSG_DENIED;
	rply.rjcted_rply.rj_stat = AUTH_ERROR;
	rply.rjcted_rply.rj_why = why;

	if (xprt->xp_pool->sp_rcache)
		replay_setreply(xprt->xp_pool->sp_rcache,
		    &rply, svc_getrpccaller(rqstp), NULL);

	svc_sendreply_common(rqstp, &rply, NULL);
}

/*
 * Auth too weak error reply
 */
void
svcerr_weakauth(struct svc_req *rqstp)
{

	svcerr_auth(rqstp, AUTH_TOOWEAK);
}

/*
 * Program unavailable error reply
 */
void
svcerr_noprog(struct svc_req *rqstp)
{
	SVCXPRT *xprt = rqstp->rq_xprt;
	struct rpc_msg rply;

	rply.rm_xid = rqstp->rq_xid;
	rply.rm_direction = REPLY;
	rply.rm_reply.rp_stat = MSG_ACCEPTED;
	rply.acpted_rply.ar_verf = rqstp->rq_verf;
	rply.acpted_rply.ar_stat = PROG_UNAVAIL;

	if (xprt->xp_pool->sp_rcache)
		replay_setreply(xprt->xp_pool->sp_rcache,
		    &rply, svc_getrpccaller(rqstp), NULL);

	svc_sendreply_common(rqstp, &rply, NULL);
}

/*
 * Program version mismatch error reply
 */
void
svcerr_progvers(struct svc_req *rqstp, rpcvers_t low_vers, rpcvers_t high_vers)
{
	SVCXPRT *xprt = rqstp->rq_xprt;
	struct rpc_msg rply;

	rply.rm_xid = rqstp->rq_xid;
	rply.rm_direction = REPLY;
	rply.rm_reply.rp_stat = MSG_ACCEPTED;
	rply.acpted_rply.ar_verf = rqstp->rq_verf;
	rply.acpted_rply.ar_stat = PROG_MISMATCH;
	rply.acpted_rply.ar_vers.low = (uint32_t)low_vers;
	rply.acpted_rply.ar_vers.high = (uint32_t)high_vers;

	if (xprt->xp_pool->sp_rcache)
		replay_setreply(xprt->xp_pool->sp_rcache,
		    &rply, svc_getrpccaller(rqstp), NULL);

	svc_sendreply_common(rqstp, &rply, NULL);
}

/*
 * Allocate a new server transport structure. All fields are
 * initialized to zero and xp_p3 is initialized to point at an
 * extension structure to hold various flags and authentication
 * parameters.
 */
SVCXPRT *
svc_xprt_alloc(void)
{
	SVCXPRT *xprt;
	SVCXPRT_EXT *ext;

	xprt = mem_alloc(sizeof(SVCXPRT));
	memset(xprt, 0, sizeof(SVCXPRT));
	ext = mem_alloc(sizeof(SVCXPRT_EXT));
	memset(ext, 0, sizeof(SVCXPRT_EXT));
	xprt->xp_p3 = ext;
	refcount_init(&xprt->xp_refs, 1);

	return (xprt);
}

/*
 * Free a server transport structure.
 */
void
svc_xprt_free(SVCXPRT *xprt)
{

	mem_free(xprt->xp_p3, sizeof(SVCXPRT_EXT));
	mem_free(xprt, sizeof(SVCXPRT));
}
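
/*
 * The extension structure hung off xp_p3 is reached through the
 * SVC_EXT() macro, as in the version_keepquiet() macro near the top of
 * this file.  For instance (illustrative sketch), a transport creator
 * that wants version-mismatch replies suppressed could set:
 *
 *	SVC_EXT(xprt)->xp_flags |= SVC_VERSQUIET;
 */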

/* ******************* SERVER INPUT STUFF ******************* */

/*
 * Read RPC requests from a transport and queue them to be
 * executed. We handle authentication and replay cache replies here.
 * Actually dispatching the RPC is deferred till svc_executereq.
 */
static enum xprt_stat
svc_getreq(SVCXPRT *xprt, struct svc_req **rqstp_ret)
{
	SVCPOOL *pool = xprt->xp_pool;
	struct svc_req *r;
	struct rpc_msg msg;
	struct mbuf *args;
	struct svc_loss_callout *s;
	enum xprt_stat stat;

	/* now receive msgs from xprt (support batch calls) */
	r = malloc(sizeof(*r), M_RPC, M_WAITOK|M_ZERO);

	msg.rm_call.cb_cred.oa_base = r->rq_credarea;
	msg.rm_call.cb_verf.oa_base = &r->rq_credarea[MAX_AUTH_BYTES];
	r->rq_clntcred = &r->rq_credarea[2*MAX_AUTH_BYTES];
	if (SVC_RECV(xprt, &msg, &r->rq_addr, &args)) {
		enum auth_stat why;

		/*
		 * Handle replays and authenticate before queuing the
		 * request to be executed.
		 */
		SVC_ACQUIRE(xprt);
		r->rq_xprt = xprt;
		if (pool->sp_rcache) {
			struct rpc_msg repmsg;
			struct mbuf *repbody;
			enum replay_state rs;
			rs = replay_find(pool->sp_rcache, &msg,
			    svc_getrpccaller(r), &repmsg, &repbody);
			switch (rs) {
			case RS_NEW:
				break;
			case RS_DONE:
				SVC_REPLY(xprt, &repmsg, r->rq_addr,
				    repbody, &r->rq_reply_seq);
				if (r->rq_addr) {
					free(r->rq_addr, M_SONAME);
					r->rq_addr = NULL;
				}
				m_freem(args);
				goto call_done;

			default:
				m_freem(args);
				goto call_done;
			}
		}

		r->rq_xid = msg.rm_xid;
		r->rq_prog = msg.rm_call.cb_prog;
		r->rq_vers = msg.rm_call.cb_vers;
		r->rq_proc = msg.rm_call.cb_proc;
		r->rq_size = sizeof(*r) + m_length(args, NULL);
		r->rq_args = args;
		if ((why = _authenticate(r, &msg)) != AUTH_OK) {
			/*
			 * RPCSEC_GSS uses this return code
			 * for requests that form part of its
			 * context establishment protocol and
			 * should not be dispatched to the
			 * application.
			 */
			if (why != RPCSEC_GSS_NODISPATCH)
				svcerr_auth(r, why);
			goto call_done;
		}

		if (!SVCAUTH_UNWRAP(&r->rq_auth, &r->rq_args)) {
			svcerr_decode(r);
			goto call_done;
		}

		/*
		 * Everything checks out, return request to caller.
		 */
		*rqstp_ret = r;
		r = NULL;
	}
call_done:
	if (r) {
		svc_freereq(r);
		r = NULL;
	}
	if ((stat = SVC_STAT(xprt)) == XPRT_DIED) {
		TAILQ_FOREACH(s, &pool->sp_lcallouts, slc_link)
			(*s->slc_dispatch)(xprt);
		xprt_unregister(xprt);
	}

	return (stat);
}

static void
svc_executereq(struct svc_req *rqstp)
{
	SVCXPRT *xprt = rqstp->rq_xprt;
	SVCPOOL *pool = xprt->xp_pool;
	int prog_found;
	rpcvers_t low_vers;
	rpcvers_t high_vers;
	struct svc_callout *s;

	/* now match message with a registered service */
	prog_found = FALSE;
	low_vers = (rpcvers_t) -1L;
	high_vers = (rpcvers_t) 0L;
	TAILQ_FOREACH(s, &pool->sp_callouts, sc_link) {
		if (s->sc_prog == rqstp->rq_prog) {
			if (s->sc_vers == rqstp->rq_vers) {
				/*
				 * We hand ownership of r to the
				 * dispatch method - they must call
				 * svc_freereq.
				 */
				(*s->sc_dispatch)(rqstp, xprt);
				return;
			}  /* found correct version */
			prog_found = TRUE;
			if (s->sc_vers < low_vers)
				low_vers = s->sc_vers;
			if (s->sc_vers > high_vers)
				high_vers = s->sc_vers;
		}   /* found correct program */
	}

	/*
	 * if we got here, the program or version
	 * is not served ...
	 */
	if (prog_found)
		svcerr_progvers(rqstp, low_vers, high_vers);
	else
		svcerr_noprog(rqstp);

	svc_freereq(rqstp);
}

static void
svc_checkidle(SVCGROUP *grp)
{
	SVCXPRT *xprt, *nxprt;
	time_t timo;
	struct svcxprt_list cleanup;

	TAILQ_INIT(&cleanup);
	TAILQ_FOREACH_SAFE(xprt, &grp->sg_xlist, xp_link, nxprt) {
		/*
		 * Only some transports have idle timers. Don't time
		 * something out which is just waking up.
		 */
		if (!xprt->xp_idletimeout || xprt->xp_thread)
			continue;

		timo = xprt->xp_lastactive + xprt->xp_idletimeout;
		if (time_uptime > timo) {
			xprt_unregister_locked(xprt);
			TAILQ_INSERT_TAIL(&cleanup, xprt, xp_link);
		}
	}

	mtx_unlock(&grp->sg_lock);
	TAILQ_FOREACH_SAFE(xprt, &cleanup, xp_link, nxprt) {
		SVC_RELEASE(xprt);
	}
	mtx_lock(&grp->sg_lock);
}

static void
svc_assign_waiting_sockets(SVCPOOL *pool)
{
	SVCGROUP *grp;
	SVCXPRT *xprt;
	int g;

	for (g = 0; g < pool->sp_groupcount; g++) {
		grp = &pool->sp_groups[g];
		mtx_lock(&grp->sg_lock);
		while ((xprt = TAILQ_FIRST(&grp->sg_active)) != NULL) {
			if (xprt_assignthread(xprt))
				TAILQ_REMOVE(&grp->sg_active, xprt, xp_alink);
			else
				break;
		}
		mtx_unlock(&grp->sg_lock);
	}
}

static void
svc_change_space_used(SVCPOOL *pool, long delta)
{
	unsigned long value;

	value = atomic_fetchadd_long(&pool->sp_space_used, delta) + delta;
	if (delta > 0) {
		if (value >= pool->sp_space_high && !pool->sp_space_throttled) {
			pool->sp_space_throttled = TRUE;
			pool->sp_space_throttle_count++;
		}
		if (value > pool->sp_space_used_highest)
			pool->sp_space_used_highest = value;
	} else {
		if (value < pool->sp_space_low && pool->sp_space_throttled) {
			pool->sp_space_throttled = FALSE;
			svc_assign_waiting_sockets(pool);
		}
	}
}

static bool_t
svc_request_space_available(SVCPOOL *pool)
{

	if (pool->sp_space_throttled)
		return (FALSE);
	return (TRUE);
}
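
/*
 * Worked example of the hysteresis above (illustrative numbers): with
 * sp_space_high = 512MB from svcpool_create(), sp_space_low is 2/3 of
 * that, about 341MB.  New requests stop being accepted once queued
 * request space reaches 512MB and resume only after it drains below
 * 341MB, so the pool does not oscillate around a single threshold.
 */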

static void
svc_run_internal(SVCGROUP *grp, bool_t ismaster)
{
	SVCPOOL *pool = grp->sg_pool;
	SVCTHREAD *st, *stpref;
	SVCXPRT *xprt;
	enum xprt_stat stat;
	struct svc_req *rqstp;
	struct proc *p;
	long sz;
	int error;

	st = mem_alloc(sizeof(*st));
	mtx_init(&st->st_lock, "st_lock", NULL, MTX_DEF);
	st->st_pool = pool;
	st->st_xprt = NULL;
	STAILQ_INIT(&st->st_reqs);
	cv_init(&st->st_cond, "rpcsvc");

	mtx_lock(&grp->sg_lock);

	/*
	 * If we are a new thread which was spawned to cope with
	 * increased load, set the state back to SVCPOOL_ACTIVE.
	 */
	if (grp->sg_state == SVCPOOL_THREADSTARTING)
		grp->sg_state = SVCPOOL_ACTIVE;

	while (grp->sg_state != SVCPOOL_CLOSING) {
		/*
		 * Create new thread if requested.
		 */
		if (grp->sg_state == SVCPOOL_THREADWANTED) {
			grp->sg_state = SVCPOOL_THREADSTARTING;
			grp->sg_lastcreatetime = time_uptime;
			mtx_unlock(&grp->sg_lock);
			svc_new_thread(grp);
			mtx_lock(&grp->sg_lock);
			continue;
		}

		/*
		 * Check for idle transports once per second.
		 */
		if (time_uptime > grp->sg_lastidlecheck) {
			grp->sg_lastidlecheck = time_uptime;
			svc_checkidle(grp);
		}

		xprt = st->st_xprt;
		if (!xprt) {
			/*
			 * Enforce maxthreads count.
			 */
			if (grp->sg_threadcount > grp->sg_maxthreads)
				break;

			/*
			 * Before sleeping, see if we can find an
			 * active transport which isn't being serviced
			 * by a thread.
			 */
			if (svc_request_space_available(pool) &&
			    (xprt = TAILQ_FIRST(&grp->sg_active)) != NULL) {
				TAILQ_REMOVE(&grp->sg_active, xprt, xp_alink);
				SVC_ACQUIRE(xprt);
				xprt->xp_thread = st;
				st->st_xprt = xprt;
				continue;
			}

			LIST_INSERT_HEAD(&grp->sg_idlethreads, st, st_ilink);
			if (ismaster || (!ismaster &&
			    grp->sg_threadcount > grp->sg_minthreads))
				error = cv_timedwait_sig(&st->st_cond,
				    &grp->sg_lock, 5 * hz);
			else
				error = cv_wait_sig(&st->st_cond,
				    &grp->sg_lock);
			if (st->st_xprt == NULL)
				LIST_REMOVE(st, st_ilink);

			/*
			 * Reduce worker thread count when idle.
			 */
			if (error == EWOULDBLOCK) {
				if (!ismaster
				    && (grp->sg_threadcount
					> grp->sg_minthreads)
					&& !st->st_xprt)
					break;
			} else if (error != 0) {
				KASSERT(error == EINTR || error == ERESTART,
				    ("non-signal error %d", error));
				mtx_unlock(&grp->sg_lock);
				p = curproc;
				PROC_LOCK(p);
				if (P_SHOULDSTOP(p) ||
				    (p->p_flag & P_TOTAL_STOP) != 0) {
					thread_suspend_check(0);
					PROC_UNLOCK(p);
					mtx_lock(&grp->sg_lock);
				} else {
					PROC_UNLOCK(p);
					svc_exit(pool);
					mtx_lock(&grp->sg_lock);
					break;
				}
			}
			continue;
		}
		mtx_unlock(&grp->sg_lock);

		/*
		 * Drain the transport socket and queue up any RPCs.
		 */
		xprt->xp_lastactive = time_uptime;
		do {
			if (!svc_request_space_available(pool))
				break;
			rqstp = NULL;
			stat = svc_getreq(xprt, &rqstp);
			if (rqstp) {
				svc_change_space_used(pool, rqstp->rq_size);
				/*
				 * See if the application has a preference
				 * for some other thread.
				 */
				if (pool->sp_assign) {
					stpref = pool->sp_assign(st, rqstp);
					rqstp->rq_thread = stpref;
					STAILQ_INSERT_TAIL(&stpref->st_reqs,
					    rqstp, rq_link);
					mtx_unlock(&stpref->st_lock);
					if (stpref != st)
						rqstp = NULL;
				} else {
					rqstp->rq_thread = st;
					STAILQ_INSERT_TAIL(&st->st_reqs,
					    rqstp, rq_link);
				}
			}
		} while (rqstp == NULL && stat == XPRT_MOREREQS
		    && grp->sg_state != SVCPOOL_CLOSING);

		/*
		 * Move this transport to the end of the active list to
		 * ensure fairness when multiple transports are active.
		 * If this was the last queued request, svc_getreq will end
		 * up calling xprt_inactive to remove from the active list.
		 */
		mtx_lock(&grp->sg_lock);
		xprt->xp_thread = NULL;
		st->st_xprt = NULL;
		if (xprt->xp_active) {
			if (!svc_request_space_available(pool) ||
			    !xprt_assignthread(xprt))
				TAILQ_INSERT_TAIL(&grp->sg_active,
				    xprt, xp_alink);
		}
		mtx_unlock(&grp->sg_lock);
		SVC_RELEASE(xprt);

		/*
		 * Execute what we have queued.
		 */
		mtx_lock(&st->st_lock);
		while ((rqstp = STAILQ_FIRST(&st->st_reqs)) != NULL) {
			STAILQ_REMOVE_HEAD(&st->st_reqs, rq_link);
			mtx_unlock(&st->st_lock);
			sz = (long)rqstp->rq_size;
			svc_executereq(rqstp);
			svc_change_space_used(pool, -sz);
			mtx_lock(&st->st_lock);
		}
		mtx_unlock(&st->st_lock);
		mtx_lock(&grp->sg_lock);
	}

	if (st->st_xprt) {
		xprt = st->st_xprt;
		st->st_xprt = NULL;
		SVC_RELEASE(xprt);
	}
	KASSERT(STAILQ_EMPTY(&st->st_reqs), ("stray reqs on exit"));
	mtx_destroy(&st->st_lock);
	cv_destroy(&st->st_cond);
	mem_free(st, sizeof(*st));

	grp->sg_threadcount--;
	if (!ismaster)
		wakeup(grp);
	mtx_unlock(&grp->sg_lock);
}

static void
svc_thread_start(void *arg)
{

	svc_run_internal((SVCGROUP *) arg, FALSE);
	kthread_exit();
}

static void
svc_new_thread(SVCGROUP *grp)
{
	SVCPOOL *pool = grp->sg_pool;
	struct thread *td;

	mtx_lock(&grp->sg_lock);
	grp->sg_threadcount++;
	mtx_unlock(&grp->sg_lock);
	kthread_add(svc_thread_start, grp, pool->sp_proc, &td, 0, 0,
	    "%s: service", pool->sp_name);
}

void
svc_run(SVCPOOL *pool)
{
	int g, i;
	struct proc *p;
	struct thread *td;
	SVCGROUP *grp;

	p = curproc;
	td = curthread;
	snprintf(td->td_name, sizeof(td->td_name),
	    "%s: master", pool->sp_name);
	pool->sp_state = SVCPOOL_ACTIVE;
	pool->sp_proc = p;

	/* Choose group count based on number of threads and CPUs. */
	pool->sp_groupcount = max(1, min(SVC_MAXGROUPS,
	    min(pool->sp_maxthreads / 2, mp_ncpus) / 6));
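	/*
	 * For example (illustrative numbers): with sp_maxthreads = 64 on
	 * a 16-CPU machine this gives min(SVC_MAXGROUPS, min(32, 16) / 6)
	 * = 2 groups, and the max() keeps at least one group on smaller
	 * configurations.
	 */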
	for (g = 0; g < pool->sp_groupcount; g++) {
		grp = &pool->sp_groups[g];
		grp->sg_minthreads = max(1,
		    pool->sp_minthreads / pool->sp_groupcount);
		grp->sg_maxthreads = max(1,
		    pool->sp_maxthreads / pool->sp_groupcount);
		grp->sg_lastcreatetime = time_uptime;
	}

	/* Starting threads */
	pool->sp_groups[0].sg_threadcount++;
	for (g = 0; g < pool->sp_groupcount; g++) {
		grp = &pool->sp_groups[g];
		for (i = ((g == 0) ? 1 : 0); i < grp->sg_minthreads; i++)
			svc_new_thread(grp);
	}
	svc_run_internal(&pool->sp_groups[0], TRUE);

	/* Waiting for threads to stop. */
	for (g = 0; g < pool->sp_groupcount; g++) {
		grp = &pool->sp_groups[g];
		mtx_lock(&grp->sg_lock);
		while (grp->sg_threadcount > 0)
			msleep(grp, &grp->sg_lock, 0, "svcexit", 0);
		mtx_unlock(&grp->sg_lock);
	}
}

void
svc_exit(SVCPOOL *pool)
{
	SVCGROUP *grp;
	SVCTHREAD *st;
	int g;

	pool->sp_state = SVCPOOL_CLOSING;
	for (g = 0; g < pool->sp_groupcount; g++) {
		grp = &pool->sp_groups[g];
		mtx_lock(&grp->sg_lock);
		if (grp->sg_state != SVCPOOL_CLOSING) {
			grp->sg_state = SVCPOOL_CLOSING;
			LIST_FOREACH(st, &grp->sg_idlethreads, st_ilink)
				cv_signal(&st->st_cond);
		}
		mtx_unlock(&grp->sg_lock);
	}
}

bool_t
svc_getargs(struct svc_req *rqstp, xdrproc_t xargs, void *args)
{
	struct mbuf *m;
	XDR xdrs;
	bool_t stat;

	m = rqstp->rq_args;
	rqstp->rq_args = NULL;

	xdrmbuf_create(&xdrs, m, XDR_DECODE);
	stat = xargs(&xdrs, args);
	XDR_DESTROY(&xdrs);

	return (stat);
}

bool_t
svc_freeargs(struct svc_req *rqstp, xdrproc_t xargs, void *args)
{
	XDR xdrs;

	if (rqstp->rq_addr) {
		free(rqstp->rq_addr, M_SONAME);
		rqstp->rq_addr = NULL;
	}

	xdrs.x_op = XDR_FREE;
	return (xargs(&xdrs, args));
}

void
svc_freereq(struct svc_req *rqstp)
{
	SVCTHREAD *st;
	SVCPOOL *pool;

	st = rqstp->rq_thread;
	if (st) {
		pool = st->st_pool;
		if (pool->sp_done)
			pool->sp_done(st, rqstp);
	}

	if (rqstp->rq_auth.svc_ah_ops)
		SVCAUTH_RELEASE(&rqstp->rq_auth);

	if (rqstp->rq_xprt) {
		SVC_RELEASE(rqstp->rq_xprt);
	}

	if (rqstp->rq_addr)
		free(rqstp->rq_addr, M_SONAME);

	if (rqstp->rq_args)
		m_freem(rqstp->rq_args);

	free(rqstp, M_RPC);
}