1 /* $NetBSD: svc.c,v 1.21 2000/07/06 03:10:35 christos Exp $ */
4 * Copyright (c) 2009, Sun Microsystems, Inc.
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions are met:
9 * - Redistributions of source code must retain the above copyright notice,
10 * this list of conditions and the following disclaimer.
11 * - Redistributions in binary form must reproduce the above copyright notice,
12 * this list of conditions and the following disclaimer in the documentation
13 * and/or other materials provided with the distribution.
14 * - Neither the name of Sun Microsystems, Inc. nor the names of its
15 * contributors may be used to endorse or promote products derived
16 * from this software without specific prior written permission.
18 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
19 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
22 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
23 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
24 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
25 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
26 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
27 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
28 * POSSIBILITY OF SUCH DAMAGE.
31 #if defined(LIBC_SCCS) && !defined(lint)
32 static char *sccsid2 = "@(#)svc.c 1.44 88/02/08 Copyr 1984 Sun Micro";
33 static char *sccsid = "@(#)svc.c 2.4 88/08/11 4.0 RPCSRC";
35 #include <sys/cdefs.h>
36 __FBSDID("$FreeBSD$");
39 * svc.c, Server-side remote procedure call interface.
41 * There are two sets of procedures here. The xprt routines are
42 * for handling transport handles. The svc routines handle the
43 * list of service routines.
45 * Copyright (C) 1984, Sun Microsystems, Inc.
48 #include <sys/param.h>
50 #include <sys/kernel.h>
51 #include <sys/kthread.h>
52 #include <sys/malloc.h>
54 #include <sys/mutex.h>
56 #include <sys/queue.h>
57 #include <sys/socketvar.h>
58 #include <sys/systm.h>
61 #include <sys/ucred.h>
64 #include <rpc/rpcb_clnt.h>
65 #include <rpc/replay.h>
67 #include <rpc/rpc_com.h>
69 #define SVC_VERSQUIET 0x0001 /* keep quiet about vers mismatch */
70 #define version_keepquiet(xp) (SVC_EXT(xp)->xp_flags & SVC_VERSQUIET)
72 static struct svc_callout *svc_find(SVCPOOL *pool, rpcprog_t, rpcvers_t,
74 static void svc_new_thread(SVCGROUP *grp);
75 static void xprt_unregister_locked(SVCXPRT *xprt);
76 static void svc_change_space_used(SVCPOOL *pool, int delta);
77 static bool_t svc_request_space_available(SVCPOOL *pool);
79 /* *************** SVCXPRT related stuff **************** */
81 static int svcpool_minthread_sysctl(SYSCTL_HANDLER_ARGS);
82 static int svcpool_maxthread_sysctl(SYSCTL_HANDLER_ARGS);
83 static int svcpool_threads_sysctl(SYSCTL_HANDLER_ARGS);
86 svcpool_create(const char *name, struct sysctl_oid_list *sysctl_base)
92 pool = malloc(sizeof(SVCPOOL), M_RPC, M_WAITOK|M_ZERO);
94 mtx_init(&pool->sp_lock, "sp_lock", NULL, MTX_DEF);
96 pool->sp_state = SVCPOOL_INIT;
98 TAILQ_INIT(&pool->sp_callouts);
99 TAILQ_INIT(&pool->sp_lcallouts);
100 pool->sp_minthreads = 1;
101 pool->sp_maxthreads = 1;
102 pool->sp_groupcount = 1;
103 for (g = 0; g < SVC_MAXGROUPS; g++) {
104 grp = &pool->sp_groups[g];
105 mtx_init(&grp->sg_lock, "sg_lock", NULL, MTX_DEF);
107 grp->sg_state = SVCPOOL_ACTIVE;
108 TAILQ_INIT(&grp->sg_xlist);
109 TAILQ_INIT(&grp->sg_active);
110 LIST_INIT(&grp->sg_idlethreads);
111 grp->sg_minthreads = 1;
112 grp->sg_maxthreads = 1;
116 * Don't use more than a quarter of mbuf clusters or more than
117 * 45 MB for buffering requests.
119 pool->sp_space_high = nmbclusters * MCLBYTES / 4;
120 if (pool->sp_space_high > 45 << 20)
121 pool->sp_space_high = 45 << 20;
122 pool->sp_space_low = 2 * pool->sp_space_high / 3;
124 sysctl_ctx_init(&pool->sp_sysctl);
126 SYSCTL_ADD_PROC(&pool->sp_sysctl, sysctl_base, OID_AUTO,
127 "minthreads", CTLTYPE_INT | CTLFLAG_RW,
128 pool, 0, svcpool_minthread_sysctl, "I",
129 "Minimal number of threads");
130 SYSCTL_ADD_PROC(&pool->sp_sysctl, sysctl_base, OID_AUTO,
131 "maxthreads", CTLTYPE_INT | CTLFLAG_RW,
132 pool, 0, svcpool_maxthread_sysctl, "I",
133 "Maximal number of threads");
134 SYSCTL_ADD_PROC(&pool->sp_sysctl, sysctl_base, OID_AUTO,
135 "threads", CTLTYPE_INT | CTLFLAG_RD,
136 pool, 0, svcpool_threads_sysctl, "I",
137 "Current number of threads");
138 SYSCTL_ADD_INT(&pool->sp_sysctl, sysctl_base, OID_AUTO,
139 "groups", CTLFLAG_RD, &pool->sp_groupcount, 0,
140 "Number of thread groups");
142 SYSCTL_ADD_UINT(&pool->sp_sysctl, sysctl_base, OID_AUTO,
143 "request_space_used", CTLFLAG_RD,
144 &pool->sp_space_used, 0,
145 "Space in parsed but not handled requests.");
147 SYSCTL_ADD_UINT(&pool->sp_sysctl, sysctl_base, OID_AUTO,
148 "request_space_used_highest", CTLFLAG_RD,
149 &pool->sp_space_used_highest, 0,
150 "Highest space used since reboot.");
152 SYSCTL_ADD_UINT(&pool->sp_sysctl, sysctl_base, OID_AUTO,
153 "request_space_high", CTLFLAG_RW,
154 &pool->sp_space_high, 0,
155 "Maximum space in parsed but not handled requests.");
157 SYSCTL_ADD_UINT(&pool->sp_sysctl, sysctl_base, OID_AUTO,
158 "request_space_low", CTLFLAG_RW,
159 &pool->sp_space_low, 0,
160 "Low water mark for request space.");
162 SYSCTL_ADD_INT(&pool->sp_sysctl, sysctl_base, OID_AUTO,
163 "request_space_throttled", CTLFLAG_RD,
164 &pool->sp_space_throttled, 0,
165 "Whether nfs requests are currently throttled");
167 SYSCTL_ADD_INT(&pool->sp_sysctl, sysctl_base, OID_AUTO,
168 "request_space_throttle_count", CTLFLAG_RD,
169 &pool->sp_space_throttle_count, 0,
170 "Count of times throttling based on request space has occurred");
177 svcpool_destroy(SVCPOOL *pool)
180 SVCXPRT *xprt, *nxprt;
181 struct svc_callout *s;
182 struct svc_loss_callout *sl;
183 struct svcxprt_list cleanup;
186 TAILQ_INIT(&cleanup);
188 for (g = 0; g < SVC_MAXGROUPS; g++) {
189 grp = &pool->sp_groups[g];
190 mtx_lock(&grp->sg_lock);
191 while ((xprt = TAILQ_FIRST(&grp->sg_xlist)) != NULL) {
192 xprt_unregister_locked(xprt);
193 TAILQ_INSERT_TAIL(&cleanup, xprt, xp_link);
195 mtx_unlock(&grp->sg_lock);
197 TAILQ_FOREACH_SAFE(xprt, &cleanup, xp_link, nxprt) {
201 mtx_lock(&pool->sp_lock);
202 while ((s = TAILQ_FIRST(&pool->sp_callouts)) != NULL) {
203 mtx_unlock(&pool->sp_lock);
204 svc_unreg(pool, s->sc_prog, s->sc_vers);
205 mtx_lock(&pool->sp_lock);
207 while ((sl = TAILQ_FIRST(&pool->sp_lcallouts)) != NULL) {
208 mtx_unlock(&pool->sp_lock);
209 svc_loss_unreg(pool, sl->slc_dispatch);
210 mtx_lock(&pool->sp_lock);
212 mtx_unlock(&pool->sp_lock);
214 for (g = 0; g < SVC_MAXGROUPS; g++) {
215 grp = &pool->sp_groups[g];
216 mtx_destroy(&grp->sg_lock);
218 mtx_destroy(&pool->sp_lock);
221 replay_freecache(pool->sp_rcache);
223 sysctl_ctx_free(&pool->sp_sysctl);
228 * Sysctl handler to get the present thread count on a pool
231 svcpool_threads_sysctl(SYSCTL_HANDLER_ARGS)
234 int threads, error, g;
236 pool = oidp->oid_arg1;
238 mtx_lock(&pool->sp_lock);
239 for (g = 0; g < pool->sp_groupcount; g++)
240 threads += pool->sp_groups[g].sg_threadcount;
241 mtx_unlock(&pool->sp_lock);
242 error = sysctl_handle_int(oidp, &threads, 0, req);
247 * Sysctl handler to set the minimum thread count on a pool
250 svcpool_minthread_sysctl(SYSCTL_HANDLER_ARGS)
253 int newminthreads, error, g;
255 pool = oidp->oid_arg1;
256 newminthreads = pool->sp_minthreads;
257 error = sysctl_handle_int(oidp, &newminthreads, 0, req);
258 if (error == 0 && newminthreads != pool->sp_minthreads) {
259 if (newminthreads > pool->sp_maxthreads)
261 mtx_lock(&pool->sp_lock);
262 pool->sp_minthreads = newminthreads;
263 for (g = 0; g < pool->sp_groupcount; g++) {
264 pool->sp_groups[g].sg_minthreads = max(1,
265 pool->sp_minthreads / pool->sp_groupcount);
267 mtx_unlock(&pool->sp_lock);
273 * Sysctl handler to set the maximum thread count on a pool
276 svcpool_maxthread_sysctl(SYSCTL_HANDLER_ARGS)
279 int newmaxthreads, error, g;
281 pool = oidp->oid_arg1;
282 newmaxthreads = pool->sp_maxthreads;
283 error = sysctl_handle_int(oidp, &newmaxthreads, 0, req);
284 if (error == 0 && newmaxthreads != pool->sp_maxthreads) {
285 if (newmaxthreads < pool->sp_minthreads)
287 mtx_lock(&pool->sp_lock);
288 pool->sp_maxthreads = newmaxthreads;
289 for (g = 0; g < pool->sp_groupcount; g++) {
290 pool->sp_groups[g].sg_maxthreads = max(1,
291 pool->sp_maxthreads / pool->sp_groupcount);
293 mtx_unlock(&pool->sp_lock);
299 * Activate a transport handle.
302 xprt_register(SVCXPRT *xprt)
304 SVCPOOL *pool = xprt->xp_pool;
309 g = atomic_fetchadd_int(&pool->sp_nextgroup, 1) % pool->sp_groupcount;
310 xprt->xp_group = grp = &pool->sp_groups[g];
311 mtx_lock(&grp->sg_lock);
312 xprt->xp_registered = TRUE;
313 xprt->xp_active = FALSE;
314 TAILQ_INSERT_TAIL(&grp->sg_xlist, xprt, xp_link);
315 mtx_unlock(&grp->sg_lock);
319 * De-activate a transport handle. Note: the locked version doesn't
320 * release the transport - caller must do that after dropping the group
324 xprt_unregister_locked(SVCXPRT *xprt)
326 SVCGROUP *grp = xprt->xp_group;
328 mtx_assert(&grp->sg_lock, MA_OWNED);
329 KASSERT(xprt->xp_registered == TRUE,
330 ("xprt_unregister_locked: not registered"));
331 xprt_inactive_locked(xprt);
332 TAILQ_REMOVE(&grp->sg_xlist, xprt, xp_link);
333 xprt->xp_registered = FALSE;
337 xprt_unregister(SVCXPRT *xprt)
339 SVCGROUP *grp = xprt->xp_group;
341 mtx_lock(&grp->sg_lock);
342 if (xprt->xp_registered == FALSE) {
343 /* Already unregistered by another thread */
344 mtx_unlock(&grp->sg_lock);
347 xprt_unregister_locked(xprt);
348 mtx_unlock(&grp->sg_lock);
354 * Attempt to assign a service thread to this transport.
357 xprt_assignthread(SVCXPRT *xprt)
359 SVCGROUP *grp = xprt->xp_group;
362 mtx_assert(&grp->sg_lock, MA_OWNED);
363 st = LIST_FIRST(&grp->sg_idlethreads);
365 LIST_REMOVE(st, st_ilink);
367 xprt->xp_thread = st;
369 cv_signal(&st->st_cond);
373 * See if we can create a new thread. The
374 * actual thread creation happens in
375 * svc_run_internal because our locking state
376 * is poorly defined (we are typically called
377 * from a socket upcall). Don't create more
378 * than one thread per second.
380 if (grp->sg_state == SVCPOOL_ACTIVE
381 && grp->sg_lastcreatetime < time_uptime
382 && grp->sg_threadcount < grp->sg_maxthreads) {
383 grp->sg_state = SVCPOOL_THREADWANTED;
390 xprt_active(SVCXPRT *xprt)
392 SVCGROUP *grp = xprt->xp_group;
394 mtx_lock(&grp->sg_lock);
396 if (!xprt->xp_registered) {
398 * Race with xprt_unregister - we lose.
400 mtx_unlock(&grp->sg_lock);
404 if (!xprt->xp_active) {
405 xprt->xp_active = TRUE;
406 if (xprt->xp_thread == NULL) {
407 if (!svc_request_space_available(xprt->xp_pool) ||
408 !xprt_assignthread(xprt))
409 TAILQ_INSERT_TAIL(&grp->sg_active, xprt,
414 mtx_unlock(&grp->sg_lock);
418 xprt_inactive_locked(SVCXPRT *xprt)
420 SVCGROUP *grp = xprt->xp_group;
422 mtx_assert(&grp->sg_lock, MA_OWNED);
423 if (xprt->xp_active) {
424 if (xprt->xp_thread == NULL)
425 TAILQ_REMOVE(&grp->sg_active, xprt, xp_alink);
426 xprt->xp_active = FALSE;
431 xprt_inactive(SVCXPRT *xprt)
433 SVCGROUP *grp = xprt->xp_group;
435 mtx_lock(&grp->sg_lock);
436 xprt_inactive_locked(xprt);
437 mtx_unlock(&grp->sg_lock);
441 * Variant of xprt_inactive() for use only when sure that the port is
442 * assigned to a thread. For example, within receive handlers.
445 xprt_inactive_self(SVCXPRT *xprt)
448 KASSERT(xprt->xp_thread != NULL,
449 ("xprt_inactive_self(%p) with NULL xp_thread", xprt));
450 xprt->xp_active = FALSE;
454 * Add a service program to the callout list.
455 * The dispatch routine will be called when a rpc request for this
456 * program number comes in.
459 svc_reg(SVCXPRT *xprt, const rpcprog_t prog, const rpcvers_t vers,
460 void (*dispatch)(struct svc_req *, SVCXPRT *),
461 const struct netconfig *nconf)
463 SVCPOOL *pool = xprt->xp_pool;
464 struct svc_callout *s;
468 /* VARIABLES PROTECTED BY svc_lock: s, svc_head */
470 if (xprt->xp_netid) {
471 netid = strdup(xprt->xp_netid, M_RPC);
473 } else if (nconf && nconf->nc_netid) {
474 netid = strdup(nconf->nc_netid, M_RPC);
476 } /* must have been created with svc_raw_create */
477 if ((netid == NULL) && (flag == 1)) {
481 mtx_lock(&pool->sp_lock);
482 if ((s = svc_find(pool, prog, vers, netid)) != NULL) {
485 if (s->sc_dispatch == dispatch)
486 goto rpcb_it; /* he is registering another xptr */
487 mtx_unlock(&pool->sp_lock);
490 s = malloc(sizeof (struct svc_callout), M_RPC, M_NOWAIT);
494 mtx_unlock(&pool->sp_lock);
500 s->sc_dispatch = dispatch;
502 TAILQ_INSERT_TAIL(&pool->sp_callouts, s, sc_link);
504 if ((xprt->xp_netid == NULL) && (flag == 1) && netid)
505 ((SVCXPRT *) xprt)->xp_netid = strdup(netid, M_RPC);
508 mtx_unlock(&pool->sp_lock);
509 /* now register the information with the local binder service */
512 struct netconfig tnc;
515 nb.buf = &xprt->xp_ltaddr;
516 nb.len = xprt->xp_ltaddr.ss_len;
517 dummy = rpcb_set(prog, vers, &tnc, &nb);
524 * Remove a service program from the callout list.
527 svc_unreg(SVCPOOL *pool, const rpcprog_t prog, const rpcvers_t vers)
529 struct svc_callout *s;
531 /* unregister the information anyway */
532 (void) rpcb_unset(prog, vers, NULL);
533 mtx_lock(&pool->sp_lock);
534 while ((s = svc_find(pool, prog, vers, NULL)) != NULL) {
535 TAILQ_REMOVE(&pool->sp_callouts, s, sc_link);
537 mem_free(s->sc_netid, sizeof (s->sc_netid) + 1);
538 mem_free(s, sizeof (struct svc_callout));
540 mtx_unlock(&pool->sp_lock);
544 * Add a service connection loss program to the callout list.
545 * The dispatch routine will be called when some port in this pool dies.
548 svc_loss_reg(SVCXPRT *xprt, void (*dispatch)(SVCXPRT *))
550 SVCPOOL *pool = xprt->xp_pool;
551 struct svc_loss_callout *s;
553 mtx_lock(&pool->sp_lock);
554 TAILQ_FOREACH(s, &pool->sp_lcallouts, slc_link) {
555 if (s->slc_dispatch == dispatch)
559 mtx_unlock(&pool->sp_lock);
562 s = malloc(sizeof (struct svc_callout), M_RPC, M_NOWAIT);
564 mtx_unlock(&pool->sp_lock);
567 s->slc_dispatch = dispatch;
568 TAILQ_INSERT_TAIL(&pool->sp_lcallouts, s, slc_link);
569 mtx_unlock(&pool->sp_lock);
574 * Remove a service connection loss program from the callout list.
577 svc_loss_unreg(SVCPOOL *pool, void (*dispatch)(SVCXPRT *))
579 struct svc_loss_callout *s;
581 mtx_lock(&pool->sp_lock);
582 TAILQ_FOREACH(s, &pool->sp_lcallouts, slc_link) {
583 if (s->slc_dispatch == dispatch) {
584 TAILQ_REMOVE(&pool->sp_lcallouts, s, slc_link);
589 mtx_unlock(&pool->sp_lock);
592 /* ********************** CALLOUT list related stuff ************* */
595 * Search the callout list for a program number, return the callout
598 static struct svc_callout *
599 svc_find(SVCPOOL *pool, rpcprog_t prog, rpcvers_t vers, char *netid)
601 struct svc_callout *s;
603 mtx_assert(&pool->sp_lock, MA_OWNED);
604 TAILQ_FOREACH(s, &pool->sp_callouts, sc_link) {
605 if (s->sc_prog == prog && s->sc_vers == vers
606 && (netid == NULL || s->sc_netid == NULL ||
607 strcmp(netid, s->sc_netid) == 0))
614 /* ******************* REPLY GENERATION ROUTINES ************ */
617 svc_sendreply_common(struct svc_req *rqstp, struct rpc_msg *rply,
620 SVCXPRT *xprt = rqstp->rq_xprt;
623 if (rqstp->rq_args) {
624 m_freem(rqstp->rq_args);
625 rqstp->rq_args = NULL;
628 if (xprt->xp_pool->sp_rcache)
629 replay_setreply(xprt->xp_pool->sp_rcache,
630 rply, svc_getrpccaller(rqstp), body);
632 if (!SVCAUTH_WRAP(&rqstp->rq_auth, &body))
635 ok = SVC_REPLY(xprt, rply, rqstp->rq_addr, body, &rqstp->rq_reply_seq);
636 if (rqstp->rq_addr) {
637 free(rqstp->rq_addr, M_SONAME);
638 rqstp->rq_addr = NULL;
645 * Send a reply to an rpc request
648 svc_sendreply(struct svc_req *rqstp, xdrproc_t xdr_results, void * xdr_location)
655 rply.rm_xid = rqstp->rq_xid;
656 rply.rm_direction = REPLY;
657 rply.rm_reply.rp_stat = MSG_ACCEPTED;
658 rply.acpted_rply.ar_verf = rqstp->rq_verf;
659 rply.acpted_rply.ar_stat = SUCCESS;
660 rply.acpted_rply.ar_results.where = NULL;
661 rply.acpted_rply.ar_results.proc = (xdrproc_t) xdr_void;
663 m = m_getcl(M_WAITOK, MT_DATA, 0);
664 xdrmbuf_create(&xdrs, m, XDR_ENCODE);
665 ok = xdr_results(&xdrs, xdr_location);
669 return (svc_sendreply_common(rqstp, &rply, m));
677 svc_sendreply_mbuf(struct svc_req *rqstp, struct mbuf *m)
681 rply.rm_xid = rqstp->rq_xid;
682 rply.rm_direction = REPLY;
683 rply.rm_reply.rp_stat = MSG_ACCEPTED;
684 rply.acpted_rply.ar_verf = rqstp->rq_verf;
685 rply.acpted_rply.ar_stat = SUCCESS;
686 rply.acpted_rply.ar_results.where = NULL;
687 rply.acpted_rply.ar_results.proc = (xdrproc_t) xdr_void;
689 return (svc_sendreply_common(rqstp, &rply, m));
693 * No procedure error reply
696 svcerr_noproc(struct svc_req *rqstp)
698 SVCXPRT *xprt = rqstp->rq_xprt;
701 rply.rm_xid = rqstp->rq_xid;
702 rply.rm_direction = REPLY;
703 rply.rm_reply.rp_stat = MSG_ACCEPTED;
704 rply.acpted_rply.ar_verf = rqstp->rq_verf;
705 rply.acpted_rply.ar_stat = PROC_UNAVAIL;
707 if (xprt->xp_pool->sp_rcache)
708 replay_setreply(xprt->xp_pool->sp_rcache,
709 &rply, svc_getrpccaller(rqstp), NULL);
711 svc_sendreply_common(rqstp, &rply, NULL);
715 * Can't decode args error reply
718 svcerr_decode(struct svc_req *rqstp)
720 SVCXPRT *xprt = rqstp->rq_xprt;
723 rply.rm_xid = rqstp->rq_xid;
724 rply.rm_direction = REPLY;
725 rply.rm_reply.rp_stat = MSG_ACCEPTED;
726 rply.acpted_rply.ar_verf = rqstp->rq_verf;
727 rply.acpted_rply.ar_stat = GARBAGE_ARGS;
729 if (xprt->xp_pool->sp_rcache)
730 replay_setreply(xprt->xp_pool->sp_rcache,
731 &rply, (struct sockaddr *) &xprt->xp_rtaddr, NULL);
733 svc_sendreply_common(rqstp, &rply, NULL);
740 svcerr_systemerr(struct svc_req *rqstp)
742 SVCXPRT *xprt = rqstp->rq_xprt;
745 rply.rm_xid = rqstp->rq_xid;
746 rply.rm_direction = REPLY;
747 rply.rm_reply.rp_stat = MSG_ACCEPTED;
748 rply.acpted_rply.ar_verf = rqstp->rq_verf;
749 rply.acpted_rply.ar_stat = SYSTEM_ERR;
751 if (xprt->xp_pool->sp_rcache)
752 replay_setreply(xprt->xp_pool->sp_rcache,
753 &rply, svc_getrpccaller(rqstp), NULL);
755 svc_sendreply_common(rqstp, &rply, NULL);
759 * Authentication error reply
762 svcerr_auth(struct svc_req *rqstp, enum auth_stat why)
764 SVCXPRT *xprt = rqstp->rq_xprt;
767 rply.rm_xid = rqstp->rq_xid;
768 rply.rm_direction = REPLY;
769 rply.rm_reply.rp_stat = MSG_DENIED;
770 rply.rjcted_rply.rj_stat = AUTH_ERROR;
771 rply.rjcted_rply.rj_why = why;
773 if (xprt->xp_pool->sp_rcache)
774 replay_setreply(xprt->xp_pool->sp_rcache,
775 &rply, svc_getrpccaller(rqstp), NULL);
777 svc_sendreply_common(rqstp, &rply, NULL);
781 * Auth too weak error reply
784 svcerr_weakauth(struct svc_req *rqstp)
787 svcerr_auth(rqstp, AUTH_TOOWEAK);
791 * Program unavailable error reply
794 svcerr_noprog(struct svc_req *rqstp)
796 SVCXPRT *xprt = rqstp->rq_xprt;
799 rply.rm_xid = rqstp->rq_xid;
800 rply.rm_direction = REPLY;
801 rply.rm_reply.rp_stat = MSG_ACCEPTED;
802 rply.acpted_rply.ar_verf = rqstp->rq_verf;
803 rply.acpted_rply.ar_stat = PROG_UNAVAIL;
805 if (xprt->xp_pool->sp_rcache)
806 replay_setreply(xprt->xp_pool->sp_rcache,
807 &rply, svc_getrpccaller(rqstp), NULL);
809 svc_sendreply_common(rqstp, &rply, NULL);
813 * Program version mismatch error reply
816 svcerr_progvers(struct svc_req *rqstp, rpcvers_t low_vers, rpcvers_t high_vers)
818 SVCXPRT *xprt = rqstp->rq_xprt;
821 rply.rm_xid = rqstp->rq_xid;
822 rply.rm_direction = REPLY;
823 rply.rm_reply.rp_stat = MSG_ACCEPTED;
824 rply.acpted_rply.ar_verf = rqstp->rq_verf;
825 rply.acpted_rply.ar_stat = PROG_MISMATCH;
826 rply.acpted_rply.ar_vers.low = (uint32_t)low_vers;
827 rply.acpted_rply.ar_vers.high = (uint32_t)high_vers;
829 if (xprt->xp_pool->sp_rcache)
830 replay_setreply(xprt->xp_pool->sp_rcache,
831 &rply, svc_getrpccaller(rqstp), NULL);
833 svc_sendreply_common(rqstp, &rply, NULL);
837 * Allocate a new server transport structure. All fields are
838 * initialized to zero and xp_p3 is initialized to point at an
839 * extension structure to hold various flags and authentication
848 xprt = mem_alloc(sizeof(SVCXPRT));
849 memset(xprt, 0, sizeof(SVCXPRT));
850 ext = mem_alloc(sizeof(SVCXPRT_EXT));
851 memset(ext, 0, sizeof(SVCXPRT_EXT));
853 refcount_init(&xprt->xp_refs, 1);
859 * Free a server transport structure.
866 mem_free(xprt->xp_p3, sizeof(SVCXPRT_EXT));
867 mem_free(xprt, sizeof(SVCXPRT));
870 /* ******************* SERVER INPUT STUFF ******************* */
873 * Read RPC requests from a transport and queue them to be
874 * executed. We handle authentication and replay cache replies here.
875 * Actually dispatching the RPC is deferred till svc_executereq.
877 static enum xprt_stat
878 svc_getreq(SVCXPRT *xprt, struct svc_req **rqstp_ret)
880 SVCPOOL *pool = xprt->xp_pool;
884 struct svc_loss_callout *s;
887 /* now receive msgs from xprt (support batch calls) */
888 r = malloc(sizeof(*r), M_RPC, M_WAITOK|M_ZERO);
890 msg.rm_call.cb_cred.oa_base = r->rq_credarea;
891 msg.rm_call.cb_verf.oa_base = &r->rq_credarea[MAX_AUTH_BYTES];
892 r->rq_clntcred = &r->rq_credarea[2*MAX_AUTH_BYTES];
893 if (SVC_RECV(xprt, &msg, &r->rq_addr, &args)) {
897 * Handle replays and authenticate before queuing the
898 * request to be executed.
902 if (pool->sp_rcache) {
903 struct rpc_msg repmsg;
904 struct mbuf *repbody;
905 enum replay_state rs;
906 rs = replay_find(pool->sp_rcache, &msg,
907 svc_getrpccaller(r), &repmsg, &repbody);
912 SVC_REPLY(xprt, &repmsg, r->rq_addr,
913 repbody, &r->rq_reply_seq);
915 free(r->rq_addr, M_SONAME);
927 r->rq_xid = msg.rm_xid;
928 r->rq_prog = msg.rm_call.cb_prog;
929 r->rq_vers = msg.rm_call.cb_vers;
930 r->rq_proc = msg.rm_call.cb_proc;
931 r->rq_size = sizeof(*r) + m_length(args, NULL);
933 if ((why = _authenticate(r, &msg)) != AUTH_OK) {
935 * RPCSEC_GSS uses this return code
936 * for requests that form part of its
937 * context establishment protocol and
938 * should not be dispatched to the
941 if (why != RPCSEC_GSS_NODISPATCH)
946 if (!SVCAUTH_UNWRAP(&r->rq_auth, &r->rq_args)) {
952 * Everything checks out, return request to caller.
962 if ((stat = SVC_STAT(xprt)) == XPRT_DIED) {
963 TAILQ_FOREACH(s, &pool->sp_lcallouts, slc_link)
964 (*s->slc_dispatch)(xprt);
965 xprt_unregister(xprt);
972 svc_executereq(struct svc_req *rqstp)
974 SVCXPRT *xprt = rqstp->rq_xprt;
975 SVCPOOL *pool = xprt->xp_pool;
979 struct svc_callout *s;
981 /* now match message with a registered service*/
983 low_vers = (rpcvers_t) -1L;
984 high_vers = (rpcvers_t) 0L;
985 TAILQ_FOREACH(s, &pool->sp_callouts, sc_link) {
986 if (s->sc_prog == rqstp->rq_prog) {
987 if (s->sc_vers == rqstp->rq_vers) {
989 * We hand ownership of r to the
990 * dispatch method - they must call
993 (*s->sc_dispatch)(rqstp, xprt);
995 } /* found correct version */
997 if (s->sc_vers < low_vers)
998 low_vers = s->sc_vers;
999 if (s->sc_vers > high_vers)
1000 high_vers = s->sc_vers;
1001 } /* found correct program */
1005 * if we got here, the program or version
1009 svcerr_progvers(rqstp, low_vers, high_vers);
1011 svcerr_noprog(rqstp);
1017 svc_checkidle(SVCGROUP *grp)
1019 SVCXPRT *xprt, *nxprt;
1021 struct svcxprt_list cleanup;
1023 TAILQ_INIT(&cleanup);
1024 TAILQ_FOREACH_SAFE(xprt, &grp->sg_xlist, xp_link, nxprt) {
1026 * Only some transports have idle timers. Don't time
1027 * something out which is just waking up.
1029 if (!xprt->xp_idletimeout || xprt->xp_thread)
1032 timo = xprt->xp_lastactive + xprt->xp_idletimeout;
1033 if (time_uptime > timo) {
1034 xprt_unregister_locked(xprt);
1035 TAILQ_INSERT_TAIL(&cleanup, xprt, xp_link);
1039 mtx_unlock(&grp->sg_lock);
1040 TAILQ_FOREACH_SAFE(xprt, &cleanup, xp_link, nxprt) {
1043 mtx_lock(&grp->sg_lock);
1047 svc_assign_waiting_sockets(SVCPOOL *pool)
1053 for (g = 0; g < pool->sp_groupcount; g++) {
1054 grp = &pool->sp_groups[g];
1055 mtx_lock(&grp->sg_lock);
1056 while ((xprt = TAILQ_FIRST(&grp->sg_active)) != NULL) {
1057 if (xprt_assignthread(xprt))
1058 TAILQ_REMOVE(&grp->sg_active, xprt, xp_alink);
1062 mtx_unlock(&grp->sg_lock);
1067 svc_change_space_used(SVCPOOL *pool, int delta)
1071 value = atomic_fetchadd_int(&pool->sp_space_used, delta) + delta;
1073 if (value >= pool->sp_space_high && !pool->sp_space_throttled) {
1074 pool->sp_space_throttled = TRUE;
1075 pool->sp_space_throttle_count++;
1077 if (value > pool->sp_space_used_highest)
1078 pool->sp_space_used_highest = value;
1080 if (value < pool->sp_space_low && pool->sp_space_throttled) {
1081 pool->sp_space_throttled = FALSE;
1082 svc_assign_waiting_sockets(pool);
1088 svc_request_space_available(SVCPOOL *pool)
1091 if (pool->sp_space_throttled)
1097 svc_run_internal(SVCGROUP *grp, bool_t ismaster)
1099 SVCPOOL *pool = grp->sg_pool;
1100 SVCTHREAD *st, *stpref;
1102 enum xprt_stat stat;
1103 struct svc_req *rqstp;
1108 st = mem_alloc(sizeof(*st));
1109 mtx_init(&st->st_lock, "st_lock", NULL, MTX_DEF);
1112 STAILQ_INIT(&st->st_reqs);
1113 cv_init(&st->st_cond, "rpcsvc");
1115 mtx_lock(&grp->sg_lock);
1118 * If we are a new thread which was spawned to cope with
1119 * increased load, set the state back to SVCPOOL_ACTIVE.
1121 if (grp->sg_state == SVCPOOL_THREADSTARTING)
1122 grp->sg_state = SVCPOOL_ACTIVE;
1124 while (grp->sg_state != SVCPOOL_CLOSING) {
1126 * Create new thread if requested.
1128 if (grp->sg_state == SVCPOOL_THREADWANTED) {
1129 grp->sg_state = SVCPOOL_THREADSTARTING;
1130 grp->sg_lastcreatetime = time_uptime;
1131 mtx_unlock(&grp->sg_lock);
1132 svc_new_thread(grp);
1133 mtx_lock(&grp->sg_lock);
1138 * Check for idle transports once per second.
1140 if (time_uptime > grp->sg_lastidlecheck) {
1141 grp->sg_lastidlecheck = time_uptime;
1148 * Enforce maxthreads count.
1150 if (grp->sg_threadcount > grp->sg_maxthreads)
1154 * Before sleeping, see if we can find an
1155 * active transport which isn't being serviced
1158 if (svc_request_space_available(pool) &&
1159 (xprt = TAILQ_FIRST(&grp->sg_active)) != NULL) {
1160 TAILQ_REMOVE(&grp->sg_active, xprt, xp_alink);
1162 xprt->xp_thread = st;
1167 LIST_INSERT_HEAD(&grp->sg_idlethreads, st, st_ilink);
1168 if (ismaster || (!ismaster &&
1169 grp->sg_threadcount > grp->sg_minthreads))
1170 error = cv_timedwait_sig(&st->st_cond,
1171 &grp->sg_lock, 5 * hz);
1173 error = cv_wait_sig(&st->st_cond,
1175 if (st->st_xprt == NULL)
1176 LIST_REMOVE(st, st_ilink);
1179 * Reduce worker thread count when idle.
1181 if (error == EWOULDBLOCK) {
1183 && (grp->sg_threadcount
1184 > grp->sg_minthreads)
1187 } else if (error != 0) {
1188 KASSERT(error == EINTR || error == ERESTART,
1189 ("non-signal error %d", error));
1190 mtx_unlock(&grp->sg_lock);
1193 if (P_SHOULDSTOP(p) ||
1194 (p->p_flag & P_TOTAL_STOP) != 0) {
1195 thread_suspend_check(0);
1197 mtx_lock(&grp->sg_lock);
1201 mtx_lock(&grp->sg_lock);
1207 mtx_unlock(&grp->sg_lock);
1210 * Drain the transport socket and queue up any RPCs.
1212 xprt->xp_lastactive = time_uptime;
1214 if (!svc_request_space_available(pool))
1217 stat = svc_getreq(xprt, &rqstp);
1219 svc_change_space_used(pool, rqstp->rq_size);
1221 * See if the application has a preference
1222 * for some other thread.
1224 if (pool->sp_assign) {
1225 stpref = pool->sp_assign(st, rqstp);
1226 rqstp->rq_thread = stpref;
1227 STAILQ_INSERT_TAIL(&stpref->st_reqs,
1229 mtx_unlock(&stpref->st_lock);
1233 rqstp->rq_thread = st;
1234 STAILQ_INSERT_TAIL(&st->st_reqs,
1238 } while (rqstp == NULL && stat == XPRT_MOREREQS
1239 && grp->sg_state != SVCPOOL_CLOSING);
1242 * Move this transport to the end of the active list to
1243 * ensure fairness when multiple transports are active.
1244 * If this was the last queued request, svc_getreq will end
1245 * up calling xprt_inactive to remove from the active list.
1247 mtx_lock(&grp->sg_lock);
1248 xprt->xp_thread = NULL;
1250 if (xprt->xp_active) {
1251 if (!svc_request_space_available(pool) ||
1252 !xprt_assignthread(xprt))
1253 TAILQ_INSERT_TAIL(&grp->sg_active,
1256 mtx_unlock(&grp->sg_lock);
1260 * Execute what we have queued.
1263 mtx_lock(&st->st_lock);
1264 while ((rqstp = STAILQ_FIRST(&st->st_reqs)) != NULL) {
1265 STAILQ_REMOVE_HEAD(&st->st_reqs, rq_link);
1266 mtx_unlock(&st->st_lock);
1267 sz += rqstp->rq_size;
1268 svc_executereq(rqstp);
1269 mtx_lock(&st->st_lock);
1271 mtx_unlock(&st->st_lock);
1272 svc_change_space_used(pool, -sz);
1273 mtx_lock(&grp->sg_lock);
1281 KASSERT(STAILQ_EMPTY(&st->st_reqs), ("stray reqs on exit"));
1282 mtx_destroy(&st->st_lock);
1283 cv_destroy(&st->st_cond);
1284 mem_free(st, sizeof(*st));
1286 grp->sg_threadcount--;
1289 mtx_unlock(&grp->sg_lock);
1293 svc_thread_start(void *arg)
1296 svc_run_internal((SVCGROUP *) arg, FALSE);
1301 svc_new_thread(SVCGROUP *grp)
1303 SVCPOOL *pool = grp->sg_pool;
1306 grp->sg_threadcount++;
1307 kthread_add(svc_thread_start, grp, pool->sp_proc, &td, 0, 0,
1308 "%s: service", pool->sp_name);
1312 svc_run(SVCPOOL *pool)
1321 snprintf(td->td_name, sizeof(td->td_name),
1322 "%s: master", pool->sp_name);
1323 pool->sp_state = SVCPOOL_ACTIVE;
1326 /* Choose group count based on number of threads and CPUs. */
1327 pool->sp_groupcount = max(1, min(SVC_MAXGROUPS,
1328 min(pool->sp_maxthreads / 2, mp_ncpus) / 6));
1329 for (g = 0; g < pool->sp_groupcount; g++) {
1330 grp = &pool->sp_groups[g];
1331 grp->sg_minthreads = max(1,
1332 pool->sp_minthreads / pool->sp_groupcount);
1333 grp->sg_maxthreads = max(1,
1334 pool->sp_maxthreads / pool->sp_groupcount);
1335 grp->sg_lastcreatetime = time_uptime;
1338 /* Starting threads */
1339 for (g = 0; g < pool->sp_groupcount; g++) {
1340 grp = &pool->sp_groups[g];
1341 for (i = ((g == 0) ? 1 : 0); i < grp->sg_minthreads; i++)
1342 svc_new_thread(grp);
1344 pool->sp_groups[0].sg_threadcount++;
1345 svc_run_internal(&pool->sp_groups[0], TRUE);
1347 /* Waiting for threads to stop. */
1348 for (g = 0; g < pool->sp_groupcount; g++) {
1349 grp = &pool->sp_groups[g];
1350 mtx_lock(&grp->sg_lock);
1351 while (grp->sg_threadcount > 0)
1352 msleep(grp, &grp->sg_lock, 0, "svcexit", 0);
1353 mtx_unlock(&grp->sg_lock);
1358 svc_exit(SVCPOOL *pool)
1364 pool->sp_state = SVCPOOL_CLOSING;
1365 for (g = 0; g < pool->sp_groupcount; g++) {
1366 grp = &pool->sp_groups[g];
1367 mtx_lock(&grp->sg_lock);
1368 if (grp->sg_state != SVCPOOL_CLOSING) {
1369 grp->sg_state = SVCPOOL_CLOSING;
1370 LIST_FOREACH(st, &grp->sg_idlethreads, st_ilink)
1371 cv_signal(&st->st_cond);
1373 mtx_unlock(&grp->sg_lock);
1378 svc_getargs(struct svc_req *rqstp, xdrproc_t xargs, void *args)
1385 rqstp->rq_args = NULL;
1387 xdrmbuf_create(&xdrs, m, XDR_DECODE);
1388 stat = xargs(&xdrs, args);
1395 svc_freeargs(struct svc_req *rqstp, xdrproc_t xargs, void *args)
1399 if (rqstp->rq_addr) {
1400 free(rqstp->rq_addr, M_SONAME);
1401 rqstp->rq_addr = NULL;
1404 xdrs.x_op = XDR_FREE;
1405 return (xargs(&xdrs, args));
1409 svc_freereq(struct svc_req *rqstp)
1414 st = rqstp->rq_thread;
1418 pool->sp_done(st, rqstp);
1421 if (rqstp->rq_auth.svc_ah_ops)
1422 SVCAUTH_RELEASE(&rqstp->rq_auth);
1424 if (rqstp->rq_xprt) {
1425 SVC_RELEASE(rqstp->rq_xprt);
1429 free(rqstp->rq_addr, M_SONAME);
1432 m_freem(rqstp->rq_args);