]> CyberLeo.Net >> Repos - FreeBSD/FreeBSD.git/blob - sys/nfsserver/nfs_syscalls.c
This commit was generated by cvs2svn to compensate for changes in r165071,
[FreeBSD/FreeBSD.git] / sys / nfsserver / nfs_syscalls.c
1 /*-
2  * Copyright (c) 1989, 1993
3  *      The Regents of the University of California.  All rights reserved.
4  *
5  * This code is derived from software contributed to Berkeley by
6  * Rick Macklem at The University of Guelph.
7  *
8  * Redistribution and use in source and binary forms, with or without
9  * modification, are permitted provided that the following conditions
10  * are met:
11  * 1. Redistributions of source code must retain the above copyright
12  *    notice, this list of conditions and the following disclaimer.
13  * 2. Redistributions in binary form must reproduce the above copyright
14  *    notice, this list of conditions and the following disclaimer in the
15  *    documentation and/or other materials provided with the distribution.
16  * 4. Neither the name of the University nor the names of its contributors
17  *    may be used to endorse or promote products derived from this software
18  *    without specific prior written permission.
19  *
20  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
21  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
24  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30  * SUCH DAMAGE.
31  *
32  *      @(#)nfs_syscalls.c      8.5 (Berkeley) 3/30/95
33  */
34
35 #include <sys/cdefs.h>
36 __FBSDID("$FreeBSD$");
37
38 #include "opt_inet6.h"
39 #include "opt_mac.h"
40
41 #include <sys/param.h>
42 #include <sys/systm.h>
43 #include <sys/sysproto.h>
44 #include <sys/kernel.h>
45 #include <sys/sysctl.h>
46 #include <sys/file.h>
47 #include <sys/filedesc.h>
48 #include <sys/vnode.h>
49 #include <sys/malloc.h>
50 #include <sys/mount.h>
51 #include <sys/priv.h>
52 #include <sys/proc.h>
53 #include <sys/bio.h>
54 #include <sys/buf.h>
55 #include <sys/mbuf.h>
56 #include <sys/socket.h>
57 #include <sys/socketvar.h>
58 #include <sys/domain.h>
59 #include <sys/protosw.h>
60 #include <sys/namei.h>
61 #include <sys/fcntl.h>
62 #include <sys/lockf.h>
63
64 #include <netinet/in.h>
65 #include <netinet/tcp.h>
66 #ifdef INET6
67 #include <net/if.h>
68 #include <netinet6/in6_var.h>
69 #endif
70 #include <nfs/xdr_subs.h>
71 #include <nfs/rpcv2.h>
72 #include <nfs/nfsproto.h>
73 #include <nfsserver/nfs.h>
74 #include <nfsserver/nfsm_subs.h>
75 #include <nfsserver/nfsrvcache.h>
76
77 #include <security/mac/mac_framework.h>
78
79 static MALLOC_DEFINE(M_NFSSVC, "nfsserver_srvsock", "Nfs server structure");
80
81 MALLOC_DEFINE(M_NFSRVDESC, "nfsserver_srvdesc", "NFS server socket descriptor");
82 MALLOC_DEFINE(M_NFSD, "nfsserver_daemon", "Nfs server daemon structure");
83
84
85 #define TRUE    1
86 #define FALSE   0
87
88 SYSCTL_DECL(_vfs_nfsrv);
89
90 int             nfsd_waiting = 0;
91 int             nfsrv_numnfsd = 0;
92 static int      notstarted = 1;
93
94 static int      nfs_privport = 0;
95 SYSCTL_INT(_vfs_nfsrv, NFS_NFSPRIVPORT, nfs_privport, CTLFLAG_RW,
96             &nfs_privport, 0, "");
97 SYSCTL_INT(_vfs_nfsrv, OID_AUTO, gatherdelay, CTLFLAG_RW,
98             &nfsrvw_procrastinate, 0, "");
99 SYSCTL_INT(_vfs_nfsrv, OID_AUTO, gatherdelay_v3, CTLFLAG_RW,
100             &nfsrvw_procrastinate_v3, 0, "");
101
102 static int      nfssvc_addsock(struct file *, struct sockaddr *,
103                     struct thread *);
104 static void     nfsrv_zapsock(struct nfssvc_sock *slp);
105 static int      nfssvc_nfsd(struct thread *);
106
107 /*
108  * NFS server system calls
109  */
110
111 /*
112  * Nfs server pseudo system call for the nfsd's
113  * Based on the flag value it either:
114  * - adds a socket to the selection list
115  * - remains in the kernel as an nfsd
116  * - remains in the kernel as an nfsiod
117  * For INET6 we suppose that nfsd provides only IN6P_IPV6_V6ONLY sockets
118  * and that mountd provides
119  *  - sockaddr with no IPv4-mapped addresses
120  *  - mask for both INET and INET6 families if there is IPv4-mapped overlap
121  */
122 #ifndef _SYS_SYSPROTO_H_
123 struct nfssvc_args {
124         int flag;
125         caddr_t argp;
126 };
127 #endif
128 /*
129  * MPSAFE
130  */
131 int
132 nfssvc(struct thread *td, struct nfssvc_args *uap)
133 {
134         struct file *fp;
135         struct sockaddr *nam;
136         struct nfsd_args nfsdarg;
137         int error;
138
139         KASSERT(!mtx_owned(&Giant), ("nfssvc(): called with Giant"));
140
141 #ifdef MAC
142         error = mac_check_system_nfsd(td->td_ucred);
143         if (error)
144                 return (error);
145 #endif
146         error = priv_check(td, PRIV_NFSD);
147         if (error)
148                 return (error);
149         NET_LOCK_GIANT();
150         NFSD_LOCK();
151         while (nfssvc_sockhead_flag & SLP_INIT) {
152                  nfssvc_sockhead_flag |= SLP_WANTINIT;
153                 (void) msleep(&nfssvc_sockhead, &nfsd_mtx, PSOCK,
154                     "nfsd init", 0);
155         }
156         NFSD_UNLOCK();
157         if (uap->flag & NFSSVC_ADDSOCK) {
158                 error = copyin(uap->argp, (caddr_t)&nfsdarg, sizeof(nfsdarg));
159                 if (error)
160                         goto done2;
161                 if ((error = fget(td, nfsdarg.sock, &fp)) != 0)
162                         goto done2;
163                 if (fp->f_type != DTYPE_SOCKET) {
164                         fdrop(fp, td);
165                         goto done2;
166                 }
167                 /*
168                  * Get the client address for connected sockets.
169                  */
170                 if (nfsdarg.name == NULL || nfsdarg.namelen == 0)
171                         nam = NULL;
172                 else {
173                         error = getsockaddr(&nam, nfsdarg.name,
174                                             nfsdarg.namelen);
175                         if (error) {
176                                 fdrop(fp, td);
177                                 goto done2;
178                         }
179                 }
180                 error = nfssvc_addsock(fp, nam, td);
181                 fdrop(fp, td);
182         } else if (uap->flag & NFSSVC_NFSD) {
183                 error = nfssvc_nfsd(td);
184         } else {
185                 error = ENXIO;
186         }
187         if (error == EINTR || error == ERESTART)
188                 error = 0;
189 done2:
190         NET_UNLOCK_GIANT();
191         return (error);
192 }
193
194 /*
195  * Adds a socket to the list for servicing by nfsds.
196  */
197 static int
198 nfssvc_addsock(struct file *fp, struct sockaddr *mynam, struct thread *td)
199 {
200         int siz;
201         struct nfssvc_sock *slp;
202         struct socket *so;
203         int error, s;
204
205         NET_ASSERT_GIANT();
206
207         so = fp->f_data;
208 #if 0
209         /*
210          * XXXRW: If this code is ever enabled, there's a race when running
211          * MPSAFE.
212          */
213         tslp = NULL;
214         /*
215          * Add it to the list, as required.
216          */
217         if (so->so_proto->pr_protocol == IPPROTO_UDP) {
218                 tslp = nfs_udpsock;
219                 if (tslp->ns_flag & SLP_VALID) {
220                         if (mynam != NULL)
221                                 FREE(mynam, M_SONAME);
222                         return (EPERM);
223                 }
224         }
225 #endif
226         if (so->so_type == SOCK_STREAM)
227                 siz = NFS_MAXPACKET + sizeof (u_long);
228         else
229                 siz = NFS_MAXPACKET;
230         error = soreserve(so, siz, siz);
231         if (error) {
232                 if (mynam != NULL)
233                         FREE(mynam, M_SONAME);
234                 return (error);
235         }
236
237         /*
238          * Set protocol specific options { for now TCP only } and
239          * reserve some space. For datagram sockets, this can get called
240          * repeatedly for the same socket, but that isn't harmful.
241          */
242         if (so->so_type == SOCK_STREAM) {
243                 struct sockopt sopt;
244                 int val;
245
246                 bzero(&sopt, sizeof sopt);
247                 sopt.sopt_dir = SOPT_SET;
248                 sopt.sopt_level = SOL_SOCKET;
249                 sopt.sopt_name = SO_KEEPALIVE;
250                 sopt.sopt_val = &val;
251                 sopt.sopt_valsize = sizeof val;
252                 val = 1;
253                 sosetopt(so, &sopt);
254         }
255         if (so->so_proto->pr_protocol == IPPROTO_TCP) {
256                 struct sockopt sopt;
257                 int val;
258
259                 bzero(&sopt, sizeof sopt);
260                 sopt.sopt_dir = SOPT_SET;
261                 sopt.sopt_level = IPPROTO_TCP;
262                 sopt.sopt_name = TCP_NODELAY;
263                 sopt.sopt_val = &val;
264                 sopt.sopt_valsize = sizeof val;
265                 val = 1;
266                 sosetopt(so, &sopt);
267         }
268         SOCKBUF_LOCK(&so->so_rcv);
269         so->so_rcv.sb_flags &= ~SB_NOINTR;
270         so->so_rcv.sb_timeo = 0;
271         SOCKBUF_UNLOCK(&so->so_rcv);
272         SOCKBUF_LOCK(&so->so_snd);
273         so->so_snd.sb_flags &= ~SB_NOINTR;
274         so->so_snd.sb_timeo = 0;
275         SOCKBUF_UNLOCK(&so->so_snd);
276
277         slp = (struct nfssvc_sock *)
278                 malloc(sizeof (struct nfssvc_sock), M_NFSSVC,
279                 M_WAITOK | M_ZERO);
280         STAILQ_INIT(&slp->ns_rec);
281         NFSD_LOCK();
282         TAILQ_INSERT_TAIL(&nfssvc_sockhead, slp, ns_chain);
283
284         slp->ns_so = so;
285         slp->ns_nam = mynam;
286         fhold(fp);
287         slp->ns_fp = fp;
288         /*
289          * XXXRW: Socket locking here?
290          */
291         s = splnet();
292         so->so_upcallarg = (caddr_t)slp;
293         so->so_upcall = nfsrv_rcv;
294         SOCKBUF_LOCK(&so->so_rcv);
295         so->so_rcv.sb_flags |= SB_UPCALL;
296         SOCKBUF_UNLOCK(&so->so_rcv);
297         slp->ns_flag = (SLP_VALID | SLP_NEEDQ);
298         nfsrv_wakenfsd(slp);
299         splx(s);
300         NFSD_UNLOCK();
301         return (0);
302 }
303
304 /*
305  * Called by nfssvc() for nfsds. Just loops around servicing rpc requests
306  * until it is killed by a signal.
 *
 * Allocates a struct nfsd for the calling thread, links it onto nfsd_head
 * and bumps nfsrv_numnfsd.  Each pass of the main loop then waits for a
 * socket (nfsd_slp) to be assigned or for NFSD_CHECKSLP to be raised,
 * fetches a request with nfsrv_dorec(), handles it according to the
 * nfsrv_getcache() result and sends any reply with nfsrv_send().
 *
 * The loop is left through "done" when the msleep() wait returns an error
 * or when nfsrv_send() returns EINTR/ERESTART.  The nfsd is then unlinked
 * and freed, and nfsrv_init(TRUE) is called if it was the last one.
 * Returns the error that ended the loop (nfssvc() turns EINTR/ERESTART
 * into 0).
 *
 * As visible here, nfsd_mtx is taken once before the loop and is dropped
 * only around nfsrv_rcv(), around reply preparation and around
 * nfsrv_send(); it is released for good just before returning.
307  */
308 static int
309 nfssvc_nfsd(struct thread *td)
310 {
311         int siz;
312         struct nfssvc_sock *slp;
313         struct nfsd *nfsd;
314         struct nfsrv_descript *nd = NULL;
315         struct mbuf *m, *mreq;
316         int error = 0, cacherep, s, sotype, writes_todo;
317         int procrastinate;
318         u_quad_t cur_usec;
319
320         NET_ASSERT_GIANT();
321
322 #ifndef nolint
323         cacherep = RC_DOIT;
324         writes_todo = 0;
325 #endif
            /* Per-thread nfsd state; allocated before nfsd_mtx is taken. */
326         nfsd = (struct nfsd *)
327                 malloc(sizeof (struct nfsd), M_NFSD, M_WAITOK | M_ZERO);
328         s = splnet();
329         NFSD_LOCK();
330
331         nfsd->nfsd_td = td;
332         TAILQ_INSERT_TAIL(&nfsd_head, nfsd, nfsd_chain);
333         nfsrv_numnfsd++;
334
335         /*
336          * Loop getting rpc requests until SIGKILL.
337          */
338         for (;;) {
339                 if ((nfsd->nfsd_flag & NFSD_REQINPROG) == 0) {
                            /*
                             * Idle: sleep until a socket is handed to this
                             * nfsd or NFSD_CHECKSLP is set.  A non-zero
                             * msleep() return (PCATCH is set) ends this nfsd.
                             */
340                         while (nfsd->nfsd_slp == NULL &&
341                             (nfsd_head_flag & NFSD_CHECKSLP) == 0) {
342                                 nfsd->nfsd_flag |= NFSD_WAITING;
343                                 nfsd_waiting++;
344                                 error = msleep(nfsd, &nfsd_mtx,
345                                     PSOCK | PCATCH, "-", 0);
346                                 nfsd_waiting--;
347                                 if (error)
348                                         goto done;
349                         }
                            /*
                             * Nothing assigned: claim the first socket that
                             * is both SLP_VALID and SLP_DOREC, taking a
                             * reference on it.  If none is found, clear
                             * NFSD_CHECKSLP.
                             */
350                         if (nfsd->nfsd_slp == NULL &&
351                             (nfsd_head_flag & NFSD_CHECKSLP) != 0) {
352                                 TAILQ_FOREACH(slp, &nfssvc_sockhead, ns_chain) {
353                                     if ((slp->ns_flag & (SLP_VALID | SLP_DOREC))
354                                         == (SLP_VALID | SLP_DOREC)) {
355                                             slp->ns_flag &= ~SLP_DOREC;
356                                             slp->ns_sref++;
357                                             nfsd->nfsd_slp = slp;
358                                             break;
359                                     }
360                                 }
361                                 if (slp == NULL)
362                                         nfsd_head_flag &= ~NFSD_CHECKSLP;
363                         }
364                         if ((slp = nfsd->nfsd_slp) == NULL)
365                                 continue;
366                         if (slp->ns_flag & SLP_VALID) {
367                                 if (slp->ns_flag & SLP_DISCONN)
368                                         nfsrv_zapsock(slp);
369                                 else if (slp->ns_flag & SLP_NEEDQ) {
                                            /*
                                             * Call nfsrv_rcv() with the socket
                                             * send lock held and nfsd_mtx
                                             * dropped.
                                             */
370                                         slp->ns_flag &= ~SLP_NEEDQ;
371                                         (void) nfs_slplock(slp, 1);
372                                         NFSD_UNLOCK();
373                                         nfsrv_rcv(slp->ns_so, (caddr_t)slp,
374                                                 M_TRYWAIT);
375                                         NFSD_LOCK();
376                                         nfs_slpunlock(slp);
377                                 }
378                                 error = nfsrv_dorec(slp, nfsd, &nd);
379                                 cur_usec = nfs_curusec();
                                    /*
                                     * nfsrv_dorec() failed, but the first
                                     * entry on ns_tq has nd_time <= now:
                                     * clear the error and take the
                                     * writes_todo path instead.
                                     */
380                                 if (error && LIST_FIRST(&slp->ns_tq) &&
381                                     LIST_FIRST(&slp->ns_tq)->nd_time <= cur_usec) {
382                                         error = 0;
383                                         cacherep = RC_DOIT;
384                                         writes_todo = 1;
385                                 } else
386                                         writes_todo = 0;
387                                 nfsd->nfsd_flag |= NFSD_REQINPROG;
388                         }
389                 } else {
                            /* A request fetched at the end of the last pass. */
390                         error = 0;
391                         slp = nfsd->nfsd_slp;
392                 }
                    /*
                     * Nothing to do on this socket, or it is no longer valid:
                     * discard any descriptor, drop our socket reference and
                     * go back to waiting.
                     */
393                 if (error || (slp->ns_flag & SLP_VALID) == 0) {
394                         if (nd) {
395                                 if (nd->nd_cr != NULL)
396                                         crfree(nd->nd_cr);
397                                 free((caddr_t)nd, M_NFSRVDESC);
398                                 nd = NULL;
399                         }
400                         nfsd->nfsd_slp = NULL;
401                         nfsd->nfsd_flag &= ~NFSD_REQINPROG;
402                         nfsrv_slpderef(slp);
403                         continue;
404                 }
405                 splx(s);
406                 sotype = slp->ns_so->so_type;
407                 if (nd) {
408                     getmicrotime(&nd->nd_starttime);
                        /* Prefer the per-request address over the socket's. */
409                     if (nd->nd_nam2)
410                         nd->nd_nam = nd->nd_nam2;
411                     else
412                         nd->nd_nam = slp->ns_nam;
413
414                     /*
415                      * Consult nfsrv_getcache(); its result (cacherep)
                         * selects the RC_DOIT, RC_REPLY or RC_DROPIT handling
                         * in the switch below.  The privileged-port check that
                         * follows may override it with RC_DOIT.
416                      */
417                     cacherep = nfsrv_getcache(nd, &mreq);
418
419                     if (nfs_privport) {
420                         /* Check if source port is privileged */
421                         u_short port;
422                         struct sockaddr *nam = nd->nd_nam;
423                         struct sockaddr_in *sin;
424
425                         sin = (struct sockaddr_in *)nam;
426                         /*
427                          * INET/INET6 - same code:
428                          *    sin_port and sin6_port are at same offset
429                          */
430                         port = ntohs(sin->sin_port);
                            /*
                             * Any procedure other than NFSPROC_NULL arriving
                             * from a port >= IPPORT_RESERVED is rewritten to
                             * NFSPROC_NOOP with an AUTH_TOOWEAK status, and
                             * the event is logged.
                             */
431                         if (port >= IPPORT_RESERVED &&
432                             nd->nd_procnum != NFSPROC_NULL) {
433 #if defined(INET6) && defined(KLD_MODULE)
434         /* do not use ip6_sprintf: the nfs module should work without INET6 */
435         char b6[INET6_ADDRSTRLEN];
436 #define ip6_sprintf(a) \
437          (sprintf(b6, "%x:%x:%x:%x:%x:%x:%x:%x", \
438                   (a)->s6_addr16[0], (a)->s6_addr16[1], \
439                   (a)->s6_addr16[2], (a)->s6_addr16[3], \
440                   (a)->s6_addr16[4], (a)->s6_addr16[5], \
441                   (a)->s6_addr16[6], (a)->s6_addr16[7]), \
442           b6)
443 #endif
444                             nd->nd_procnum = NFSPROC_NOOP;
445                             nd->nd_repstat = (NFSERR_AUTHERR | AUTH_TOOWEAK);
446                             cacherep = RC_DOIT;
447                             printf("NFS request from unprivileged port (%s:%d)\n",
448 #ifdef INET6
449                                    sin->sin_family == AF_INET6 ?
450                                         ip6_sprintf(&satosin6(sin)->sin6_addr) :
451 #undef ip6_sprintf
452 #endif
453                                    inet_ntoa(sin->sin_addr), port);
454                         }
455                     }
456
457                 }
458
459                 /*
460                  * Loop to get all the write rpc replies that have been
461                  * gathered together.
462                  */
463                 do {
464                     switch (cacherep) {
465                     case RC_DOIT:
466                         if (nd && (nd->nd_flag & ND_NFSV3))
467                             procrastinate = nfsrvw_procrastinate_v3;
468                         else
469                             procrastinate = nfsrvw_procrastinate;
                            /*
                             * NOTE(review): nd is dereferenced below whenever
                             * writes_todo is 0, although the test above allows
                             * for nd == NULL; presumably nd can only be NULL
                             * when writes_todo is set -- confirm.
                             */
470                         if (writes_todo || (!(nd->nd_flag & ND_NFSV3) &&
471                             nd->nd_procnum == NFSPROC_WRITE &&
472                             procrastinate > 0 && !notstarted))
473                             error = nfsrv_writegather(&nd, slp,
474                                 nfsd->nfsd_td, &mreq);
475                         else
476                             error = (*(nfsrv3_procs[nd->nd_procnum]))(nd,
477                                 slp, nfsd->nfsd_td, &mreq);
                            /* No reply mbuf was produced: nothing to send. */
478                         if (mreq == NULL)
479                                 break;
480                         if (error != 0 && error != NFSERR_RETVOID) {
481                                 nfsrvstats.srv_errs++;
482                                 nfsrv_updatecache(nd, FALSE, mreq);
483                                 if (nd->nd_nam2)
484                                         FREE(nd->nd_nam2, M_SONAME);
485                                 break;
486                         }
487                         nfsrvstats.srvrpccnt[nd->nd_procnum]++;
488                         nfsrv_updatecache(nd, TRUE, mreq);
489                         nd->nd_mrep = NULL;
490                         /* FALLTHROUGH */
491                     case RC_REPLY:
                            /* Reply preparation runs without nfsd_mtx. */
492                         NFSD_UNLOCK();
493                         siz = m_length(mreq, NULL);
494                         if (siz <= 0 || siz > NFS_MAXPACKET) {
495                                 printf("mbuf siz=%d\n",siz);
496                                 panic("Bad nfs svc reply");
497                         }
498                         m = mreq;
499                         m->m_pkthdr.len = siz;
500                         m->m_pkthdr.rcvif = NULL;
501                         /*
502                          * For stream protocols, prepend a Sun RPC
503                          * Record Mark.
504                          */
505                         if (sotype == SOCK_STREAM) {
506                                 M_PREPEND(m, NFSX_UNSIGNED, M_TRYWAIT);
507                                 *mtod(m, u_int32_t *) = htonl(0x80000000 | siz);
508                         }
509                         NFSD_LOCK();
                            /*
                             * Take the socket send lock for protocols with
                             * PR_CONNREQUIRED; it is released after the send.
                             */
510                         if (slp->ns_so->so_proto->pr_flags & PR_CONNREQUIRED)
511                                 (void) nfs_slplock(slp, 1);
512                         if (slp->ns_flag & SLP_VALID) {
513                             NFSD_UNLOCK();
514                             error = nfsrv_send(slp->ns_so, nd->nd_nam2, m);
515                             NFSD_LOCK();
516                         } else {
                                /* Socket went away: treat as EPIPE, free reply. */
517                             error = EPIPE;
518                             m_freem(m);
519                         }
520                         if (nd->nd_nam2)
521                                 FREE(nd->nd_nam2, M_SONAME);
522                         if (nd->nd_mrep)
523                                 m_freem(nd->nd_mrep);
524                         if (error == EPIPE)
525                                 nfsrv_zapsock(slp);
526                         if (slp->ns_so->so_proto->pr_flags & PR_CONNREQUIRED)
527                                 nfs_slpunlock(slp);
                            /*
                             * An interrupted send ends this nfsd: release the
                             * descriptor and the socket reference, then leave.
                             */
528                         if (error == EINTR || error == ERESTART) {
529                                 if (nd->nd_cr != NULL)
530                                         crfree(nd->nd_cr);
531                                 free((caddr_t)nd, M_NFSRVDESC);
532                                 nfsrv_slpderef(slp);
533                                 s = splnet();
534                                 goto done;
535                         }
536                         break;
537                     case RC_DROPIT:
                            /* Drop the request without replying. */
538                         m_freem(nd->nd_mrep);
539                         if (nd->nd_nam2)
540                                 FREE(nd->nd_nam2, M_SONAME);
541                         break;
542                     };
                        /* Done with this request descriptor, if any remains. */
543                     if (nd) {
544                         if (nd->nd_cr != NULL)
545                                 crfree(nd->nd_cr);
546                         FREE((caddr_t)nd, M_NFSRVDESC);
547                         nd = NULL;
548                     }
549
550                     /*
551                      * Check to see if there are outstanding writes that
552                      * need to be serviced.
553                      */
554                     cur_usec = nfs_curusec();
555                     s = splsoftclock();
556                     if (LIST_FIRST(&slp->ns_tq) &&
557                         LIST_FIRST(&slp->ns_tq)->nd_time <= cur_usec) {
558                         cacherep = RC_DOIT;
559                         writes_todo = 1;
560                     } else
561                         writes_todo = 0;
562                     splx(s);
563                 } while (writes_todo);
564                 s = splnet();
                    /*
                     * Try to fetch the next request from the same socket.  On
                     * failure, release the socket; otherwise NFSD_REQINPROG
                     * stays set and the next pass handles nd directly.
                     */
565                 if (nfsrv_dorec(slp, nfsd, &nd)) {
566                         nfsd->nfsd_flag &= ~NFSD_REQINPROG;
567                         nfsd->nfsd_slp = NULL;
568                         nfsrv_slpderef(slp);
569                 }
570                 KASSERT(!(debug_mpsafenet == 0 && !mtx_owned(&Giant)),
571                     ("nfssvc_nfsd(): debug.mpsafenet=0 && !Giant"));
572                 KASSERT(!(debug_mpsafenet == 1 && mtx_owned(&Giant)),
573                     ("nfssvc_nfsd(): debug.mpsafenet=1 && Giant"));
574         }
575 done:
            /* Reached with nfsd_mtx held: unlink and free this nfsd. */
576         KASSERT(!(debug_mpsafenet == 0 && !mtx_owned(&Giant)),
577             ("nfssvc_nfsd(): debug.mpsafenet=0 && !Giant"));
578         KASSERT(!(debug_mpsafenet == 1 && mtx_owned(&Giant)),
579             ("nfssvc_nfsd(): debug.mpsafenet=1 && Giant"));
580         TAILQ_REMOVE(&nfsd_head, nfsd, nfsd_chain);
581         splx(s);
582         free((caddr_t)nfsd, M_NFSD);
583         if (--nfsrv_numnfsd == 0)
584                 nfsrv_init(TRUE);       /* Reinitialize everything */
585         NFSD_UNLOCK();
586         return (error);
587 }
588
589 /*
590  * Shut down a socket associated with an nfssvc_sock structure.
591  * Should be called with the send lock set, if required.
592  * The trick here is to increment the sref at the start, so that the nfsds
593  * will stop using it and clear ns_flag at the end so that it will not be
594  * reassigned during cleanup.
595  */
596 static void
597 nfsrv_zapsock(struct nfssvc_sock *slp)
598 {
599         struct nfsrv_descript *nwp, *nnwp;
600         struct socket *so;
601         struct file *fp;
602         struct nfsrv_rec *rec;
603         int s;
604
605         NET_ASSERT_GIANT();
606         NFSD_LOCK_ASSERT();
607
608         /*
609          * XXXRW: By clearing all flags, other threads/etc should ignore
610          * this slp and we can safely release nfsd_mtx so we can clean
611          * up the slp safely.
612          */
613         slp->ns_flag &= ~SLP_ALLFLAGS;
614         fp = slp->ns_fp;
615         if (fp) {
616                 NFSD_UNLOCK();
617                 slp->ns_fp = NULL;
618                 so = slp->ns_so;
619                 SOCKBUF_LOCK(&so->so_rcv);
620                 so->so_rcv.sb_flags &= ~SB_UPCALL;
621                 SOCKBUF_UNLOCK(&so->so_rcv);
622                 so->so_upcall = NULL;
623                 so->so_upcallarg = NULL;
624                 soshutdown(so, SHUT_RDWR);
625                 closef(fp, NULL);
626                 NFSD_LOCK();
627                 if (slp->ns_nam)
628                         FREE(slp->ns_nam, M_SONAME);
629                 m_freem(slp->ns_raw);
630                 while ((rec = STAILQ_FIRST(&slp->ns_rec)) != NULL) {
631                         STAILQ_REMOVE_HEAD(&slp->ns_rec, nr_link);
632                         if (rec->nr_address)
633                                 FREE(rec->nr_address, M_SONAME);
634                         m_freem(rec->nr_packet);
635                         free(rec, M_NFSRVDESC);
636                 }
637                 s = splsoftclock();
638                 for (nwp = LIST_FIRST(&slp->ns_tq); nwp; nwp = nnwp) {
639                         nnwp = LIST_NEXT(nwp, nd_tq);
640                         LIST_REMOVE(nwp, nd_tq);
641                         if (nwp->nd_cr != NULL)
642                                 crfree(nwp->nd_cr);
643                         free((caddr_t)nwp, M_NFSRVDESC);
644                 }
645                 LIST_INIT(&slp->ns_tq);
646                 splx(s);
647         }
648 }
649
650 /*
651  * Derefence a server socket structure. If it has no more references and
652  * is no longer valid, you can throw it away.
653  */
654 void
655 nfsrv_slpderef(struct nfssvc_sock *slp)
656 {
657
658         NFSD_LOCK_ASSERT();
659
660         if (--(slp->ns_sref) == 0 && (slp->ns_flag & SLP_VALID) == 0) {
661                 TAILQ_REMOVE(&nfssvc_sockhead, slp, ns_chain);
662                 free((caddr_t)slp, M_NFSSVC);
663         }
664 }
665
666 /*
667  * Lock a socket against others.
668  *
669  * XXXRW: Wait argument is always 1 in the caller.  Replace with a real
670  * sleep lock?
671  */
672 int
673 nfs_slplock(struct nfssvc_sock *slp, int wait)
674 {
675         int *statep = &slp->ns_solock;
676
677         NFSD_LOCK_ASSERT();
678
679         if (!wait && (*statep & NFSRV_SNDLOCK))
680                 return(0);      /* already locked, fail */
681         while (*statep & NFSRV_SNDLOCK) {
682                 *statep |= NFSRV_WANTSND;
683                 (void) msleep(statep, &nfsd_mtx, PZERO - 1, "nfsslplck", 0);
684         }
685         *statep |= NFSRV_SNDLOCK;
686         return (1);
687 }
688
689 /*
690  * Unlock the stream socket for others.
691  */
692 void
693 nfs_slpunlock(struct nfssvc_sock *slp)
694 {
695         int *statep = &slp->ns_solock;
696
697         NFSD_LOCK_ASSERT();
698
699         if ((*statep & NFSRV_SNDLOCK) == 0)
700                 panic("nfs slpunlock");
701         *statep &= ~NFSRV_SNDLOCK;
702         if (*statep & NFSRV_WANTSND) {
703                 *statep &= ~NFSRV_WANTSND;
704                 wakeup(statep);
705         }
706 }
707
708 /*
709  * Initialize the data structures for the server.
710  * Handshake with any new nfsds starting up to avoid any chance of
711  * corruption.
712  */
713 void
714 nfsrv_init(int terminating)
715 {
716         struct nfssvc_sock *slp, *nslp;
717
718         NET_ASSERT_GIANT();
719         NFSD_LOCK_ASSERT();
720
721         if (nfssvc_sockhead_flag & SLP_INIT)
722                 panic("nfsd init");
723         nfssvc_sockhead_flag |= SLP_INIT;
724         if (terminating) {
725                 TAILQ_FOREACH_SAFE(slp, &nfssvc_sockhead, ns_chain, nslp) {
726                         if (slp->ns_flag & SLP_VALID)
727                                 nfsrv_zapsock(slp);
728                         TAILQ_REMOVE(&nfssvc_sockhead, slp, ns_chain);
729                         free((caddr_t)slp, M_NFSSVC);
730                 }
731                 nfsrv_cleancache();     /* And clear out server cache */
732         } else
733                 nfs_pub.np_valid = 0;
734
735         TAILQ_INIT(&nfssvc_sockhead);
736         nfssvc_sockhead_flag &= ~SLP_INIT;
737         if (nfssvc_sockhead_flag & SLP_WANTINIT) {
738                 nfssvc_sockhead_flag &= ~SLP_WANTINIT;
739                 wakeup(&nfssvc_sockhead);
740         }
741
742         TAILQ_INIT(&nfsd_head);
743         nfsd_head_flag &= ~NFSD_CHECKSLP;
744
745 #if 0
746         nfs_udpsock = (struct nfssvc_sock *)
747             malloc(sizeof (struct nfssvc_sock), M_NFSSVC, M_WAITOK | M_ZERO);
748         STAILQ_INIT(&nfs_udpsock->ns_rec);
749         TAILQ_INSERT_HEAD(&nfssvc_sockhead, nfs_udpsock, ns_chain);
750
751         nfs_cltpsock = (struct nfssvc_sock *)
752             malloc(sizeof (struct nfssvc_sock), M_NFSSVC, M_WAITOK | M_ZERO);
753         STAILQ_INIT(&nfs_cltpsock->ns_rec);
754         TAILQ_INSERT_TAIL(&nfssvc_sockhead, nfs_cltpsock, ns_chain);
755 #endif
756 }