2 * Copyright (c) 1989, 1993, 1995
3 * The Regents of the University of California. All rights reserved.
5 * This code is derived from software contributed to Berkeley by
6 * Rick Macklem at The University of Guelph.
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 * 4. Neither the name of the University nor the names of its contributors
17 * may be used to endorse or promote products derived from this software
18 * without specific prior written permission.
20 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
21 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
24 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32 * from nfs_vfsops.c 8.12 (Berkeley) 5/20/95
35 #include <sys/cdefs.h>
36 __FBSDID("$FreeBSD$");
39 #include "opt_bootp.h"
40 #include "opt_nfsroot.h"
42 #include <sys/param.h>
43 #include <sys/systm.h>
44 #include <sys/kernel.h>
47 #include <sys/clock.h>
49 #include <sys/limits.h>
51 #include <sys/malloc.h>
53 #include <sys/module.h>
54 #include <sys/mount.h>
56 #include <sys/socket.h>
57 #include <sys/socketvar.h>
58 #include <sys/sockio.h>
59 #include <sys/sysctl.h>
60 #include <sys/vnode.h>
61 #include <sys/signalvar.h>
64 #include <vm/vm_extern.h>
68 #include <net/route.h>
69 #include <netinet/in.h>
71 #include <fs/nfs/nfsport.h>
72 #include <fs/nfsclient/nfsnode.h>
73 #include <fs/nfsclient/nfsmount.h>
74 #include <fs/nfsclient/nfs.h>
75 #include <nfs/nfsdiskless.h>
77 FEATURE(nfscl, "NFSv4 client");
79 extern int nfscl_ticks;
80 extern struct timeval nfsboottime;
81 extern struct nfsstats newnfsstats;
82 extern int nfsrv_useacl;
84 MALLOC_DEFINE(M_NEWNFSREQ, "newnfsclient_req", "New NFS request header");
85 MALLOC_DEFINE(M_NEWNFSMNT, "newnfsmnt", "New NFS mount struct");
87 SYSCTL_DECL(_vfs_nfs);
88 static int nfs_ip_paranoia = 1;
89 SYSCTL_INT(_vfs_nfs, OID_AUTO, nfs_ip_paranoia, CTLFLAG_RW,
90 &nfs_ip_paranoia, 0, "");
91 static int nfs_tprintf_initial_delay = NFS_TPRINTF_INITIAL_DELAY;
92 SYSCTL_INT(_vfs_nfs, NFS_TPRINTF_INITIAL_DELAY,
93 downdelayinitial, CTLFLAG_RW, &nfs_tprintf_initial_delay, 0, "");
94 /* how long between console messages "nfs server foo not responding" */
95 static int nfs_tprintf_delay = NFS_TPRINTF_DELAY;
96 SYSCTL_INT(_vfs_nfs, NFS_TPRINTF_DELAY,
97 downdelayinterval, CTLFLAG_RW, &nfs_tprintf_delay, 0, "");
99 static int nfs_mountroot(struct mount *);
100 static void nfs_sec_name(char *, int *);
101 static void nfs_decode_args(struct mount *mp, struct nfsmount *nmp,
102 struct nfs_args *argp, const char *, struct ucred *,
104 static int mountnfs(struct nfs_args *, struct mount *,
105 struct sockaddr *, char *, u_char *, int, u_char *, int,
106 u_char *, int, struct vnode **, struct ucred *,
107 struct thread *, int);
108 static void nfs_getnlminfo(struct vnode *, uint8_t *, size_t *,
109 struct sockaddr_storage *, int *, off_t *,
111 static vfs_mount_t nfs_mount;
112 static vfs_cmount_t nfs_cmount;
113 static vfs_unmount_t nfs_unmount;
114 static vfs_root_t nfs_root;
115 static vfs_statfs_t nfs_statfs;
116 static vfs_sync_t nfs_sync;
117 static vfs_sysctl_t nfs_sysctl;
120 * nfs vfs operations.
122 static struct vfsops nfs_vfsops = {
123 .vfs_init = ncl_init,
124 .vfs_mount = nfs_mount,
125 .vfs_cmount = nfs_cmount,
126 .vfs_root = nfs_root,
127 .vfs_statfs = nfs_statfs,
128 .vfs_sync = nfs_sync,
129 .vfs_uninit = ncl_uninit,
130 .vfs_unmount = nfs_unmount,
131 .vfs_sysctl = nfs_sysctl,
133 VFS_SET(nfs_vfsops, nfs, VFCF_NETWORK);
135 /* So that loader and kldload(2) can find us, wherever we are.. */
136 MODULE_VERSION(nfs, 1);
137 MODULE_DEPEND(nfs, nfscommon, 1, 1, 1);
138 MODULE_DEPEND(nfs, krpc, 1, 1, 1);
139 MODULE_DEPEND(nfs, nfssvc, 1, 1, 1);
140 MODULE_DEPEND(nfs, nfslock, 1, 1, 1);
143 * This structure is now defined in sys/nfs/nfs_diskless.c so that it
144 * can be shared by both NFS clients. It is declared here so that it
145 * will be defined for kernels built without NFS_ROOT, although it
146 * isn't used in that case.
148 #if !defined(NFS_ROOT) && !defined(NFSCLIENT)
149 struct nfs_diskless nfs_diskless = { { { 0 } } };
150 struct nfsv3_diskless nfsv3_diskless = { { { 0 } } };
151 int nfs_diskless_valid = 0;
154 SYSCTL_INT(_vfs_nfs, OID_AUTO, diskless_valid, CTLFLAG_RD,
155 &nfs_diskless_valid, 0,
156 "Has the diskless struct been filled correctly");
158 SYSCTL_STRING(_vfs_nfs, OID_AUTO, diskless_rootpath, CTLFLAG_RD,
159 nfsv3_diskless.root_hostnam, 0, "Path to nfs root");
161 SYSCTL_OPAQUE(_vfs_nfs, OID_AUTO, diskless_rootaddr, CTLFLAG_RD,
162 &nfsv3_diskless.root_saddr, sizeof(nfsv3_diskless.root_saddr),
163 "%Ssockaddr_in", "Diskless root nfs address");
166 void newnfsargs_ntoh(struct nfs_args *);
167 static int nfs_mountdiskless(char *,
168 struct sockaddr_in *, struct nfs_args *,
169 struct thread *, struct vnode **, struct mount *);
170 static void nfs_convert_diskless(void);
171 static void nfs_convert_oargs(struct nfs_args *args,
172 struct onfs_args *oargs);
175 newnfs_iosize(struct nfsmount *nmp)
179 /* First, set the upper limit for iosize */
180 if (nmp->nm_flag & NFSMNT_NFSV4) {
181 maxio = NFS_MAXBSIZE;
182 } else if (nmp->nm_flag & NFSMNT_NFSV3) {
183 if (nmp->nm_sotype == SOCK_DGRAM)
184 maxio = NFS_MAXDGRAMDATA;
186 maxio = NFS_MAXBSIZE;
188 maxio = NFS_V2MAXDATA;
190 if (nmp->nm_rsize > maxio || nmp->nm_rsize == 0)
191 nmp->nm_rsize = maxio;
192 if (nmp->nm_rsize > MAXBSIZE)
193 nmp->nm_rsize = MAXBSIZE;
194 if (nmp->nm_readdirsize > maxio || nmp->nm_readdirsize == 0)
195 nmp->nm_readdirsize = maxio;
196 if (nmp->nm_readdirsize > nmp->nm_rsize)
197 nmp->nm_readdirsize = nmp->nm_rsize;
198 if (nmp->nm_wsize > maxio || nmp->nm_wsize == 0)
199 nmp->nm_wsize = maxio;
200 if (nmp->nm_wsize > MAXBSIZE)
201 nmp->nm_wsize = MAXBSIZE;
204 * Calculate the size used for io buffers. Use the larger
205 * of the two sizes to minimise nfs requests but make sure
206 * that it is at least one VM page to avoid wasting buffer
209 iosize = imax(nmp->nm_rsize, nmp->nm_wsize);
210 iosize = imax(iosize, PAGE_SIZE);
211 nmp->nm_mountp->mnt_stat.f_iosize = iosize;
216 nfs_convert_oargs(struct nfs_args *args, struct onfs_args *oargs)
219 args->version = NFS_ARGSVERSION;
220 args->addr = oargs->addr;
221 args->addrlen = oargs->addrlen;
222 args->sotype = oargs->sotype;
223 args->proto = oargs->proto;
224 args->fh = oargs->fh;
225 args->fhsize = oargs->fhsize;
226 args->flags = oargs->flags;
227 args->wsize = oargs->wsize;
228 args->rsize = oargs->rsize;
229 args->readdirsize = oargs->readdirsize;
230 args->timeo = oargs->timeo;
231 args->retrans = oargs->retrans;
232 args->readahead = oargs->readahead;
233 args->hostname = oargs->hostname;
237 nfs_convert_diskless(void)
240 bcopy(&nfs_diskless.myif, &nfsv3_diskless.myif,
241 sizeof(struct ifaliasreq));
242 bcopy(&nfs_diskless.mygateway, &nfsv3_diskless.mygateway,
243 sizeof(struct sockaddr_in));
244 nfs_convert_oargs(&nfsv3_diskless.root_args,&nfs_diskless.root_args);
245 if (nfsv3_diskless.root_args.flags & NFSMNT_NFSV3) {
246 nfsv3_diskless.root_fhsize = NFSX_MYFH;
247 bcopy(nfs_diskless.root_fh, nfsv3_diskless.root_fh, NFSX_MYFH);
249 nfsv3_diskless.root_fhsize = NFSX_V2FH;
250 bcopy(nfs_diskless.root_fh, nfsv3_diskless.root_fh, NFSX_V2FH);
252 bcopy(&nfs_diskless.root_saddr,&nfsv3_diskless.root_saddr,
253 sizeof(struct sockaddr_in));
254 bcopy(nfs_diskless.root_hostnam, nfsv3_diskless.root_hostnam, MNAMELEN);
255 nfsv3_diskless.root_time = nfs_diskless.root_time;
256 bcopy(nfs_diskless.my_hostnam, nfsv3_diskless.my_hostnam,
258 nfs_diskless_valid = 3;
265 nfs_statfs(struct mount *mp, struct statfs *sbp)
269 struct nfsmount *nmp = VFSTONFS(mp);
270 struct nfsvattr nfsva;
273 int error = 0, attrflag, gotfsinfo = 0, ret;
278 error = vfs_busy(mp, MBF_NOWAIT);
281 error = ncl_nget(mp, nmp->nm_fh, nmp->nm_fhsize, &np, LK_EXCLUSIVE);
287 mtx_lock(&nmp->nm_mtx);
288 if (NFSHASNFSV3(nmp) && !NFSHASGOTFSINFO(nmp)) {
289 mtx_unlock(&nmp->nm_mtx);
290 error = nfsrpc_fsinfo(vp, &fs, td->td_ucred, td, &nfsva,
295 mtx_unlock(&nmp->nm_mtx);
297 error = nfsrpc_statfs(vp, &sb, &fs, td->td_ucred, td, &nfsva,
300 ret = nfsrpc_getattrnovp(nmp, nmp->nm_fh, nmp->nm_fhsize, 1,
301 td->td_ucred, td, &nfsva, NULL);
304 * Just set default values to get things going.
306 NFSBZERO((caddr_t)&nfsva, sizeof (struct nfsvattr));
307 nfsva.na_vattr.va_type = VDIR;
308 nfsva.na_vattr.va_mode = 0777;
309 nfsva.na_vattr.va_nlink = 100;
310 nfsva.na_vattr.va_uid = (uid_t)0;
311 nfsva.na_vattr.va_gid = (gid_t)0;
312 nfsva.na_vattr.va_fileid = 2;
313 nfsva.na_vattr.va_gen = 1;
314 nfsva.na_vattr.va_blocksize = NFS_FABLKSIZE;
315 nfsva.na_vattr.va_size = 512 * 1024;
318 (void) nfscl_loadattrcache(&vp, &nfsva, NULL, NULL, 0, 1);
320 mtx_lock(&nmp->nm_mtx);
321 if (gotfsinfo || (nmp->nm_flag & NFSMNT_NFSV4))
322 nfscl_loadfsinfo(nmp, &fs);
323 nfscl_loadsbinfo(nmp, &sb, sbp);
324 sbp->f_iosize = newnfs_iosize(nmp);
325 mtx_unlock(&nmp->nm_mtx);
326 if (sbp != &mp->mnt_stat) {
327 bcopy(mp->mnt_stat.f_mntonname, sbp->f_mntonname, MNAMELEN);
328 bcopy(mp->mnt_stat.f_mntfromname, sbp->f_mntfromname, MNAMELEN);
330 strncpy(&sbp->f_fstypename[0], mp->mnt_vfc->vfc_name, MFSNAMELEN);
331 } else if (NFS_ISV4(vp)) {
332 error = nfscl_maperr(td, error, (uid_t)0, (gid_t)0);
340 * nfs version 3 fsinfo rpc call
343 ncl_fsinfo(struct nfsmount *nmp, struct vnode *vp, struct ucred *cred,
347 struct nfsvattr nfsva;
350 error = nfsrpc_fsinfo(vp, &fs, cred, td, &nfsva, &attrflag, NULL);
353 (void) nfscl_loadattrcache(&vp, &nfsva, NULL, NULL, 0,
355 mtx_lock(&nmp->nm_mtx);
356 nfscl_loadfsinfo(nmp, &fs);
357 mtx_unlock(&nmp->nm_mtx);
363 * Mount a remote root fs via. nfs. This depends on the info in the
364 * nfs_diskless structure that has been filled in properly by some primary
366 * It goes something like this:
367 * - do enough of "ifconfig" by calling ifioctl() so that the system
368 * can talk to the server
369 * - If nfs_diskless.mygateway is filled in, use that address as
371 * - build the rootfs mount point and call mountnfs() to do the rest.
373 * It is assumed to be safe to read, modify, and write the nfsv3_diskless
374 * structure, as well as other global NFS client variables here, as
375 * nfs_mountroot() will be called once in the boot before any other NFS
376 * client activity occurs.
379 nfs_mountroot(struct mount *mp)
381 struct thread *td = curthread;
382 struct nfsv3_diskless *nd = &nfsv3_diskless;
391 #if defined(BOOTP_NFSROOT) && defined(BOOTP)
392 bootpc_init(); /* use bootp to get nfs_diskless filled in */
393 #elif defined(NFS_ROOT)
394 nfs_setup_diskless();
397 if (nfs_diskless_valid == 0)
399 if (nfs_diskless_valid == 1)
400 nfs_convert_diskless();
403 * XXX splnet, so networks will receive...
408 * Do enough of ifconfig(8) so that the critical net interface can
409 * talk to the server.
411 error = socreate(nd->myif.ifra_addr.sa_family, &so, nd->root_args.sotype, 0,
414 panic("nfs_mountroot: socreate(%04x): %d",
415 nd->myif.ifra_addr.sa_family, error);
417 #if 0 /* XXX Bad idea */
419 * We might not have been told the right interface, so we pass
420 * over the first ten interfaces of the same kind, until we get
421 * one of them configured.
424 for (i = strlen(nd->myif.ifra_name) - 1;
425 nd->myif.ifra_name[i] >= '0' &&
426 nd->myif.ifra_name[i] <= '9';
427 nd->myif.ifra_name[i] ++) {
428 error = ifioctl(so, SIOCAIFADDR, (caddr_t)&nd->myif, td);
433 error = ifioctl(so, SIOCAIFADDR, (caddr_t)&nd->myif, td);
435 panic("nfs_mountroot: SIOCAIFADDR: %d", error);
436 if ((cp = getenv("boot.netif.mtu")) != NULL) {
437 ir.ifr_mtu = strtol(cp, NULL, 10);
438 bcopy(nd->myif.ifra_name, ir.ifr_name, IFNAMSIZ);
440 error = ifioctl(so, SIOCSIFMTU, (caddr_t)&ir, td);
442 printf("nfs_mountroot: SIOCSIFMTU: %d", error);
447 * If the gateway field is filled in, set it as the default route.
448 * Note that pxeboot will set a default route of 0 if the route
449 * is not set by the DHCP server. Check also for a value of 0
450 * to avoid panicking inappropriately in that situation.
452 if (nd->mygateway.sin_len != 0 &&
453 nd->mygateway.sin_addr.s_addr != 0) {
454 struct sockaddr_in mask, sin;
456 bzero((caddr_t)&mask, sizeof(mask));
458 sin.sin_family = AF_INET;
459 sin.sin_len = sizeof(sin);
460 /* XXX MRT use table 0 for this sort of thing */
461 CURVNET_SET(TD_TO_VNET(td));
462 error = rtrequest(RTM_ADD, (struct sockaddr *)&sin,
463 (struct sockaddr *)&nd->mygateway,
464 (struct sockaddr *)&mask,
465 RTF_UP | RTF_GATEWAY, NULL);
468 panic("nfs_mountroot: RTM_ADD: %d", error);
472 * Create the rootfs mount point.
474 nd->root_args.fh = nd->root_fh;
475 nd->root_args.fhsize = nd->root_fhsize;
476 l = ntohl(nd->root_saddr.sin_addr.s_addr);
477 snprintf(buf, sizeof(buf), "%ld.%ld.%ld.%ld:%s",
478 (l >> 24) & 0xff, (l >> 16) & 0xff,
479 (l >> 8) & 0xff, (l >> 0) & 0xff, nd->root_hostnam);
480 printf("NFS ROOT: %s\n", buf);
481 nd->root_args.hostname = buf;
482 if ((error = nfs_mountdiskless(buf,
483 &nd->root_saddr, &nd->root_args, td, &vp, mp)) != 0) {
488 * This is not really an nfs issue, but it is much easier to
489 * set hostname here and then let the "/etc/rc.xxx" files
490 * mount the right /var based upon its preset value.
492 mtx_lock(&prison0.pr_mtx);
493 strlcpy(prison0.pr_hostname, nd->my_hostnam,
494 sizeof(prison0.pr_hostname));
495 mtx_unlock(&prison0.pr_mtx);
496 inittodr(ntohl(nd->root_time));
501 * Internal version of mount system call for diskless setup.
504 nfs_mountdiskless(char *path,
505 struct sockaddr_in *sin, struct nfs_args *args, struct thread *td,
506 struct vnode **vpp, struct mount *mp)
508 struct sockaddr *nam;
513 * Find the directory path in "path", which also has the server's
514 * name/ip address in it.
516 dirpath = strchr(path, ':');
518 dirlen = strlen(++dirpath);
521 nam = sodupsockaddr((struct sockaddr *)sin, M_WAITOK);
522 if ((error = mountnfs(args, mp, nam, path, NULL, 0, dirpath, dirlen,
523 NULL, 0, vpp, td->td_ucred, td, NFS_DEFAULT_NEGNAMETIMEO)) != 0) {
524 printf("nfs_mountroot: mount %s on /: %d\n", path, error);
531 nfs_sec_name(char *sec, int *flagsp)
533 if (!strcmp(sec, "krb5"))
534 *flagsp |= NFSMNT_KERB;
535 else if (!strcmp(sec, "krb5i"))
536 *flagsp |= (NFSMNT_KERB | NFSMNT_INTEGRITY);
537 else if (!strcmp(sec, "krb5p"))
538 *flagsp |= (NFSMNT_KERB | NFSMNT_PRIVACY);
542 nfs_decode_args(struct mount *mp, struct nfsmount *nmp, struct nfs_args *argp,
543 const char *hostname, struct ucred *cred, struct thread *td)
552 * Set read-only flag if requested; otherwise, clear it if this is
553 * an update. If this is not an update, then either the read-only
554 * flag is already clear, or this is a root mount and it was set
555 * intentionally at some previous point.
557 if (vfs_getopt(mp->mnt_optnew, "ro", NULL, NULL) == 0) {
559 mp->mnt_flag |= MNT_RDONLY;
561 } else if (mp->mnt_flag & MNT_UPDATE) {
563 mp->mnt_flag &= ~MNT_RDONLY;
568 * Silently clear NFSMNT_NOCONN if it's a TCP mount, it makes
569 * no sense in that context. Also, set up appropriate retransmit
570 * and soft timeout behavior.
572 if (argp->sotype == SOCK_STREAM) {
573 nmp->nm_flag &= ~NFSMNT_NOCONN;
574 nmp->nm_timeo = NFS_MAXTIMEO;
575 if ((argp->flags & NFSMNT_NFSV4) != 0)
576 nmp->nm_retry = INT_MAX;
578 nmp->nm_retry = NFS_RETRANS_TCP;
581 /* Also clear RDIRPLUS if NFSv2, it crashes some servers */
582 if ((argp->flags & (NFSMNT_NFSV3 | NFSMNT_NFSV4)) == 0) {
583 argp->flags &= ~NFSMNT_RDIRPLUS;
584 nmp->nm_flag &= ~NFSMNT_RDIRPLUS;
587 /* Clear NFSMNT_RESVPORT for NFSv4, since it is not required. */
588 if ((argp->flags & NFSMNT_NFSV4) != 0) {
589 argp->flags &= ~NFSMNT_RESVPORT;
590 nmp->nm_flag &= ~NFSMNT_RESVPORT;
593 /* Re-bind if rsrvd port requested and wasn't on one */
594 adjsock = !(nmp->nm_flag & NFSMNT_RESVPORT)
595 && (argp->flags & NFSMNT_RESVPORT);
596 /* Also re-bind if we're switching to/from a connected UDP socket */
597 adjsock |= ((nmp->nm_flag & NFSMNT_NOCONN) !=
598 (argp->flags & NFSMNT_NOCONN));
600 /* Update flags atomically. Don't change the lock bits. */
601 nmp->nm_flag = argp->flags | nmp->nm_flag;
604 if ((argp->flags & NFSMNT_TIMEO) && argp->timeo > 0) {
605 nmp->nm_timeo = (argp->timeo * NFS_HZ + 5) / 10;
606 if (nmp->nm_timeo < NFS_MINTIMEO)
607 nmp->nm_timeo = NFS_MINTIMEO;
608 else if (nmp->nm_timeo > NFS_MAXTIMEO)
609 nmp->nm_timeo = NFS_MAXTIMEO;
612 if ((argp->flags & NFSMNT_RETRANS) && argp->retrans > 1) {
613 nmp->nm_retry = argp->retrans;
614 if (nmp->nm_retry > NFS_MAXREXMIT)
615 nmp->nm_retry = NFS_MAXREXMIT;
618 if ((argp->flags & NFSMNT_WSIZE) && argp->wsize > 0) {
619 nmp->nm_wsize = argp->wsize;
620 /* Round down to multiple of blocksize */
621 nmp->nm_wsize &= ~(NFS_FABLKSIZE - 1);
622 if (nmp->nm_wsize <= 0)
623 nmp->nm_wsize = NFS_FABLKSIZE;
626 if ((argp->flags & NFSMNT_RSIZE) && argp->rsize > 0) {
627 nmp->nm_rsize = argp->rsize;
628 /* Round down to multiple of blocksize */
629 nmp->nm_rsize &= ~(NFS_FABLKSIZE - 1);
630 if (nmp->nm_rsize <= 0)
631 nmp->nm_rsize = NFS_FABLKSIZE;
634 if ((argp->flags & NFSMNT_READDIRSIZE) && argp->readdirsize > 0) {
635 nmp->nm_readdirsize = argp->readdirsize;
638 if ((argp->flags & NFSMNT_ACREGMIN) && argp->acregmin >= 0)
639 nmp->nm_acregmin = argp->acregmin;
641 nmp->nm_acregmin = NFS_MINATTRTIMO;
642 if ((argp->flags & NFSMNT_ACREGMAX) && argp->acregmax >= 0)
643 nmp->nm_acregmax = argp->acregmax;
645 nmp->nm_acregmax = NFS_MAXATTRTIMO;
646 if ((argp->flags & NFSMNT_ACDIRMIN) && argp->acdirmin >= 0)
647 nmp->nm_acdirmin = argp->acdirmin;
649 nmp->nm_acdirmin = NFS_MINDIRATTRTIMO;
650 if ((argp->flags & NFSMNT_ACDIRMAX) && argp->acdirmax >= 0)
651 nmp->nm_acdirmax = argp->acdirmax;
653 nmp->nm_acdirmax = NFS_MAXDIRATTRTIMO;
654 if (nmp->nm_acdirmin > nmp->nm_acdirmax)
655 nmp->nm_acdirmin = nmp->nm_acdirmax;
656 if (nmp->nm_acregmin > nmp->nm_acregmax)
657 nmp->nm_acregmin = nmp->nm_acregmax;
659 if ((argp->flags & NFSMNT_READAHEAD) && argp->readahead >= 0) {
660 if (argp->readahead <= NFS_MAXRAHEAD)
661 nmp->nm_readahead = argp->readahead;
663 nmp->nm_readahead = NFS_MAXRAHEAD;
665 if ((argp->flags & NFSMNT_WCOMMITSIZE) && argp->wcommitsize >= 0) {
666 if (argp->wcommitsize < nmp->nm_wsize)
667 nmp->nm_wcommitsize = nmp->nm_wsize;
669 nmp->nm_wcommitsize = argp->wcommitsize;
672 adjsock |= ((nmp->nm_sotype != argp->sotype) ||
673 (nmp->nm_soproto != argp->proto));
675 if (nmp->nm_client != NULL && adjsock) {
676 int haslock = 0, error = 0;
678 if (nmp->nm_sotype == SOCK_STREAM) {
679 error = newnfs_sndlock(&nmp->nm_sockreq.nr_lock);
684 newnfs_disconnect(&nmp->nm_sockreq);
686 newnfs_sndunlock(&nmp->nm_sockreq.nr_lock);
687 nmp->nm_sotype = argp->sotype;
688 nmp->nm_soproto = argp->proto;
689 if (nmp->nm_sotype == SOCK_DGRAM)
690 while (newnfs_connect(nmp, &nmp->nm_sockreq,
692 printf("newnfs_args: retrying connect\n");
693 (void) nfs_catnap(PSOCK, 0, "newnfscon");
697 nmp->nm_sotype = argp->sotype;
698 nmp->nm_soproto = argp->proto;
701 if (hostname != NULL) {
702 strlcpy(nmp->nm_hostname, hostname,
703 sizeof(nmp->nm_hostname));
704 p = strchr(nmp->nm_hostname, ':');
710 static const char *nfs_opts[] = { "from", "nfs_args",
711 "noatime", "noexec", "suiddir", "nosuid", "nosymfollow", "union",
712 "noclusterr", "noclusterw", "multilabel", "acls", "force", "update",
713 "async", "noconn", "nolockd", "conn", "lockd", "intr", "rdirplus",
714 "readdirsize", "soft", "hard", "mntudp", "tcp", "udp", "wsize", "rsize",
715 "retrans", "acregmin", "acregmax", "acdirmin", "acdirmax", "resvport",
716 "readahead", "hostname", "timeout", "addr", "fh", "nfsv3", "sec",
717 "principal", "nfsv4", "gssname", "allgssname", "dirpath",
718 "negnametimeo", "nocto",
725 * It seems a bit dumb to copyinstr() the host and path here and then
726 * bcopy() them in mountnfs(), but I wanted to detect errors before
727 * doing the sockargs() call because sockargs() allocates an mbuf and
728 * an error after that means that I have to release the mbuf.
732 nfs_mount(struct mount *mp)
734 struct nfs_args args = {
735 .version = NFS_ARGSVERSION,
737 .addrlen = sizeof (struct sockaddr_in),
738 .sotype = SOCK_STREAM,
742 .flags = NFSMNT_RESVPORT,
745 .readdirsize = NFS_READDIRSIZE,
747 .retrans = NFS_RETRANS,
748 .readahead = NFS_DEFRAHEAD,
749 .wcommitsize = 0, /* was: NQ_DEFLEASE */
751 .acregmin = NFS_MINATTRTIMO,
752 .acregmax = NFS_MAXATTRTIMO,
753 .acdirmin = NFS_MINDIRATTRTIMO,
754 .acdirmax = NFS_MAXDIRATTRTIMO,
756 int error = 0, ret, len;
757 struct sockaddr *nam = NULL;
761 u_char nfh[NFSX_FHMAX], krbname[100], dirpath[100], srvkrbname[100];
762 char *opt, *name, *secname;
763 int negnametimeo = NFS_DEFAULT_NEGNAMETIMEO;
764 int dirlen, has_nfs_args_opt, krbnamelen, srvkrbnamelen;
767 has_nfs_args_opt = 0;
768 if (vfs_filteropt(mp->mnt_optnew, nfs_opts)) {
774 if ((mp->mnt_flag & (MNT_ROOTFS | MNT_UPDATE)) == MNT_ROOTFS) {
775 error = nfs_mountroot(mp);
782 * The old mount_nfs program passed the struct nfs_args
783 * from userspace to kernel. The new mount_nfs program
784 * passes string options via nmount() from userspace to kernel
785 * and we populate the struct nfs_args in the kernel.
787 if (vfs_getopt(mp->mnt_optnew, "nfs_args", NULL, NULL) == 0) {
788 error = vfs_copyopt(mp->mnt_optnew, "nfs_args", &args,
793 if (args.version != NFS_ARGSVERSION) {
794 error = EPROGMISMATCH;
797 has_nfs_args_opt = 1;
800 /* Handle the new style options. */
801 if (vfs_getopt(mp->mnt_optnew, "noconn", NULL, NULL) == 0)
802 args.flags |= NFSMNT_NOCONN;
803 if (vfs_getopt(mp->mnt_optnew, "conn", NULL, NULL) == 0)
804 args.flags |= NFSMNT_NOCONN;
805 if (vfs_getopt(mp->mnt_optnew, "nolockd", NULL, NULL) == 0)
806 args.flags |= NFSMNT_NOLOCKD;
807 if (vfs_getopt(mp->mnt_optnew, "lockd", NULL, NULL) == 0)
808 args.flags &= ~NFSMNT_NOLOCKD;
809 if (vfs_getopt(mp->mnt_optnew, "intr", NULL, NULL) == 0)
810 args.flags |= NFSMNT_INT;
811 if (vfs_getopt(mp->mnt_optnew, "rdirplus", NULL, NULL) == 0)
812 args.flags |= NFSMNT_RDIRPLUS;
813 if (vfs_getopt(mp->mnt_optnew, "resvport", NULL, NULL) == 0)
814 args.flags |= NFSMNT_RESVPORT;
815 if (vfs_getopt(mp->mnt_optnew, "noresvport", NULL, NULL) == 0)
816 args.flags &= ~NFSMNT_RESVPORT;
817 if (vfs_getopt(mp->mnt_optnew, "soft", NULL, NULL) == 0)
818 args.flags |= NFSMNT_SOFT;
819 if (vfs_getopt(mp->mnt_optnew, "hard", NULL, NULL) == 0)
820 args.flags &= ~NFSMNT_SOFT;
821 if (vfs_getopt(mp->mnt_optnew, "mntudp", NULL, NULL) == 0)
822 args.sotype = SOCK_DGRAM;
823 if (vfs_getopt(mp->mnt_optnew, "udp", NULL, NULL) == 0)
824 args.sotype = SOCK_DGRAM;
825 if (vfs_getopt(mp->mnt_optnew, "tcp", NULL, NULL) == 0)
826 args.sotype = SOCK_STREAM;
827 if (vfs_getopt(mp->mnt_optnew, "nfsv3", NULL, NULL) == 0)
828 args.flags |= NFSMNT_NFSV3;
829 if (vfs_getopt(mp->mnt_optnew, "nfsv4", NULL, NULL) == 0) {
830 args.flags |= NFSMNT_NFSV4;
831 args.sotype = SOCK_STREAM;
833 if (vfs_getopt(mp->mnt_optnew, "allgssname", NULL, NULL) == 0)
834 args.flags |= NFSMNT_ALLGSSNAME;
835 if (vfs_getopt(mp->mnt_optnew, "nocto", NULL, NULL) == 0)
836 args.flags |= NFSMNT_NOCTO;
837 if (vfs_getopt(mp->mnt_optnew, "readdirsize", (void **)&opt, NULL) == 0) {
839 vfs_mount_error(mp, "illegal readdirsize");
843 ret = sscanf(opt, "%d", &args.readdirsize);
844 if (ret != 1 || args.readdirsize <= 0) {
845 vfs_mount_error(mp, "illegal readdirsize: %s",
850 args.flags |= NFSMNT_READDIRSIZE;
852 if (vfs_getopt(mp->mnt_optnew, "readahead", (void **)&opt, NULL) == 0) {
854 vfs_mount_error(mp, "illegal readahead");
858 ret = sscanf(opt, "%d", &args.readahead);
859 if (ret != 1 || args.readahead <= 0) {
860 vfs_mount_error(mp, "illegal readahead: %s",
865 args.flags |= NFSMNT_READAHEAD;
867 if (vfs_getopt(mp->mnt_optnew, "wsize", (void **)&opt, NULL) == 0) {
869 vfs_mount_error(mp, "illegal wsize");
873 ret = sscanf(opt, "%d", &args.wsize);
874 if (ret != 1 || args.wsize <= 0) {
875 vfs_mount_error(mp, "illegal wsize: %s",
880 args.flags |= NFSMNT_WSIZE;
882 if (vfs_getopt(mp->mnt_optnew, "rsize", (void **)&opt, NULL) == 0) {
884 vfs_mount_error(mp, "illegal rsize");
888 ret = sscanf(opt, "%d", &args.rsize);
889 if (ret != 1 || args.rsize <= 0) {
890 vfs_mount_error(mp, "illegal wsize: %s",
895 args.flags |= NFSMNT_RSIZE;
897 if (vfs_getopt(mp->mnt_optnew, "retrans", (void **)&opt, NULL) == 0) {
899 vfs_mount_error(mp, "illegal retrans");
903 ret = sscanf(opt, "%d", &args.retrans);
904 if (ret != 1 || args.retrans <= 0) {
905 vfs_mount_error(mp, "illegal retrans: %s",
910 args.flags |= NFSMNT_RETRANS;
912 if (vfs_getopt(mp->mnt_optnew, "acregmin", (void **)&opt, NULL) == 0) {
913 ret = sscanf(opt, "%d", &args.acregmin);
914 if (ret != 1 || args.acregmin < 0) {
915 vfs_mount_error(mp, "illegal acregmin: %s",
920 args.flags |= NFSMNT_ACREGMIN;
922 if (vfs_getopt(mp->mnt_optnew, "acregmax", (void **)&opt, NULL) == 0) {
923 ret = sscanf(opt, "%d", &args.acregmax);
924 if (ret != 1 || args.acregmax < 0) {
925 vfs_mount_error(mp, "illegal acregmax: %s",
930 args.flags |= NFSMNT_ACREGMAX;
932 if (vfs_getopt(mp->mnt_optnew, "acdirmin", (void **)&opt, NULL) == 0) {
933 ret = sscanf(opt, "%d", &args.acdirmin);
934 if (ret != 1 || args.acdirmin < 0) {
935 vfs_mount_error(mp, "illegal acdirmin: %s",
940 args.flags |= NFSMNT_ACDIRMIN;
942 if (vfs_getopt(mp->mnt_optnew, "acdirmax", (void **)&opt, NULL) == 0) {
943 ret = sscanf(opt, "%d", &args.acdirmax);
944 if (ret != 1 || args.acdirmax < 0) {
945 vfs_mount_error(mp, "illegal acdirmax: %s",
950 args.flags |= NFSMNT_ACDIRMAX;
952 if (vfs_getopt(mp->mnt_optnew, "timeout", (void **)&opt, NULL) == 0) {
953 ret = sscanf(opt, "%d", &args.timeo);
954 if (ret != 1 || args.timeo <= 0) {
955 vfs_mount_error(mp, "illegal timeout: %s",
960 args.flags |= NFSMNT_TIMEO;
962 if (vfs_getopt(mp->mnt_optnew, "negnametimeo", (void **)&opt, NULL)
964 ret = sscanf(opt, "%d", &negnametimeo);
965 if (ret != 1 || negnametimeo < 0) {
966 vfs_mount_error(mp, "illegal negnametimeo: %s",
972 if (vfs_getopt(mp->mnt_optnew, "sec",
973 (void **) &secname, NULL) == 0)
974 nfs_sec_name(secname, &args.flags);
976 if (mp->mnt_flag & MNT_UPDATE) {
977 struct nfsmount *nmp = VFSTONFS(mp);
984 * When doing an update, we can't change version,
985 * security, switch lockd strategies or change cookie
988 args.flags = (args.flags &
994 NFSMNT_NOLOCKD /*|NFSMNT_XLATECOOKIE*/)) |
1001 NFSMNT_NOLOCKD /*|NFSMNT_XLATECOOKIE*/));
1002 nfs_decode_args(mp, nmp, &args, NULL, td->td_ucred, td);
1007 * Make the nfs_ip_paranoia sysctl serve as the default connection
1008 * or no-connection mode for those protocols that support
1009 * no-connection mode (the flag will be cleared later for protocols
1010 * that do not support no-connection mode). This will allow a client
1011 * to receive replies from a different IP then the request was
1012 * sent to. Note: default value for nfs_ip_paranoia is 1 (paranoid),
1015 if (nfs_ip_paranoia == 0)
1016 args.flags |= NFSMNT_NOCONN;
1018 if (has_nfs_args_opt != 0) {
1020 * In the 'nfs_args' case, the pointers in the args
1021 * structure are in userland - we copy them in here.
1023 if (args.fhsize < 0 || args.fhsize > NFSX_V3FHMAX) {
1024 vfs_mount_error(mp, "Bad file handle");
1028 error = copyin((caddr_t)args.fh, (caddr_t)nfh,
1032 error = copyinstr(args.hostname, hst, MNAMELEN - 1, &hstlen);
1035 bzero(&hst[hstlen], MNAMELEN - hstlen);
1036 args.hostname = hst;
1037 /* sockargs() call must be after above copyin() calls */
1038 error = getsockaddr(&nam, (caddr_t)args.addr,
1043 if (vfs_getopt(mp->mnt_optnew, "fh", (void **)&args.fh,
1044 &args.fhsize) == 0) {
1045 if (args.fhsize < 0 || args.fhsize > NFSX_FHMAX) {
1046 vfs_mount_error(mp, "Bad file handle");
1050 bcopy(args.fh, nfh, args.fhsize);
1054 (void) vfs_getopt(mp->mnt_optnew, "hostname",
1055 (void **)&args.hostname, &len);
1056 if (args.hostname == NULL) {
1057 vfs_mount_error(mp, "Invalid hostname");
1061 bcopy(args.hostname, hst, MNAMELEN);
1062 hst[MNAMELEN - 1] = '\0';
1065 if (vfs_getopt(mp->mnt_optnew, "principal", (void **)&name, NULL) == 0)
1066 strlcpy(srvkrbname, name, sizeof (srvkrbname));
1068 snprintf(srvkrbname, sizeof (srvkrbname), "nfs@%s", hst);
1069 srvkrbnamelen = strlen(srvkrbname);
1071 if (vfs_getopt(mp->mnt_optnew, "gssname", (void **)&name, NULL) == 0)
1072 strlcpy(krbname, name, sizeof (krbname));
1075 krbnamelen = strlen(krbname);
1077 if (vfs_getopt(mp->mnt_optnew, "dirpath", (void **)&name, NULL) == 0)
1078 strlcpy(dirpath, name, sizeof (dirpath));
1081 dirlen = strlen(dirpath);
1083 if (has_nfs_args_opt == 0) {
1084 if (vfs_getopt(mp->mnt_optnew, "addr",
1085 (void **)&args.addr, &args.addrlen) == 0) {
1086 if (args.addrlen > SOCK_MAXADDRLEN) {
1087 error = ENAMETOOLONG;
1090 nam = malloc(args.addrlen, M_SONAME, M_WAITOK);
1091 bcopy(args.addr, nam, args.addrlen);
1092 nam->sa_len = args.addrlen;
1094 vfs_mount_error(mp, "No server address");
1101 error = mountnfs(&args, mp, nam, hst, krbname, krbnamelen, dirpath,
1102 dirlen, srvkrbname, srvkrbnamelen, &vp, td->td_ucred, td,
1107 mp->mnt_kern_flag |= (MNTK_MPSAFE|MNTK_LOOKUP_SHARED);
1118 * It seems a bit dumb to copyinstr() the host and path here and then
1119 * bcopy() them in mountnfs(), but I wanted to detect errors before
1120 * doing the sockargs() call because sockargs() allocates an mbuf and
1121 * an error after that means that I have to release the mbuf.
1125 nfs_cmount(struct mntarg *ma, void *data, int flags)
1128 struct nfs_args args;
1130 error = copyin(data, &args, sizeof (struct nfs_args));
1134 ma = mount_arg(ma, "nfs_args", &args, sizeof args);
1136 error = kernel_mount(ma, flags);
1141 * Common code for mount and mountroot
1144 mountnfs(struct nfs_args *argp, struct mount *mp, struct sockaddr *nam,
1145 char *hst, u_char *krbname, int krbnamelen, u_char *dirpath, int dirlen,
1146 u_char *srvkrbname, int srvkrbnamelen, struct vnode **vpp,
1147 struct ucred *cred, struct thread *td, int negnametimeo)
1149 struct nfsmount *nmp;
1151 int error, trycnt, ret;
1152 struct nfsvattr nfsva;
1153 static u_int64_t clval = 0;
1155 if (mp->mnt_flag & MNT_UPDATE) {
1157 printf("%s: MNT_UPDATE is no longer handled here\n", __func__);
1158 FREE(nam, M_SONAME);
1161 MALLOC(nmp, struct nfsmount *, sizeof (struct nfsmount) +
1162 krbnamelen + dirlen + srvkrbnamelen + 2,
1163 M_NEWNFSMNT, M_WAITOK | M_ZERO);
1164 TAILQ_INIT(&nmp->nm_bufq);
1166 clval = (u_int64_t)nfsboottime.tv_sec;
1167 nmp->nm_clval = clval++;
1168 nmp->nm_krbnamelen = krbnamelen;
1169 nmp->nm_dirpathlen = dirlen;
1170 nmp->nm_srvkrbnamelen = srvkrbnamelen;
1171 if (td->td_ucred->cr_uid != (uid_t)0) {
1173 * nm_uid is used to get KerberosV credentials for
1174 * the nfsv4 state handling operations if there is
1175 * no host based principal set. Use the uid of
1176 * this user if not root, since they are doing the
1177 * mount. I don't think setting this for root will
1178 * work, since root normally does not have user
1179 * credentials in a credentials cache.
1181 nmp->nm_uid = td->td_ucred->cr_uid;
1184 * Just set to -1, so it won't be used.
1186 nmp->nm_uid = (uid_t)-1;
1189 /* Copy and null terminate all the names */
1190 if (nmp->nm_krbnamelen > 0) {
1191 bcopy(krbname, nmp->nm_krbname, nmp->nm_krbnamelen);
1192 nmp->nm_name[nmp->nm_krbnamelen] = '\0';
1194 if (nmp->nm_dirpathlen > 0) {
1195 bcopy(dirpath, NFSMNT_DIRPATH(nmp),
1196 nmp->nm_dirpathlen);
1197 nmp->nm_name[nmp->nm_krbnamelen + nmp->nm_dirpathlen
1200 if (nmp->nm_srvkrbnamelen > 0) {
1201 bcopy(srvkrbname, NFSMNT_SRVKRBNAME(nmp),
1202 nmp->nm_srvkrbnamelen);
1203 nmp->nm_name[nmp->nm_krbnamelen + nmp->nm_dirpathlen
1204 + nmp->nm_srvkrbnamelen + 2] = '\0';
1206 nmp->nm_sockreq.nr_cred = crhold(cred);
1207 mtx_init(&nmp->nm_sockreq.nr_mtx, "nfssock", NULL, MTX_DEF);
1209 nmp->nm_getinfo = nfs_getnlminfo;
1210 nmp->nm_vinvalbuf = ncl_vinvalbuf;
1213 nmp->nm_mountp = mp;
1214 mtx_init(&nmp->nm_mtx, "NFSmount lock", NULL, MTX_DEF | MTX_DUPOK);
1215 nmp->nm_negnametimeo = negnametimeo;
1217 nfs_decode_args(mp, nmp, argp, hst, cred, td);
1220 * V2 can only handle 32 bit filesizes. A 4GB-1 limit may be too
1221 * high, depending on whether we end up with negative offsets in
1222 * the client or server somewhere. 2GB-1 may be safer.
1224 * For V3, ncl_fsinfo will adjust this as necessary. Assume maximum
1225 * that we can handle until we find out otherwise.
1226 * XXX Our "safe" limit on the client is what we can store in our
1227 * buffer cache using signed(!) block numbers.
1229 if ((argp->flags & (NFSMNT_NFSV3 | NFSMNT_NFSV4)) == 0)
1230 nmp->nm_maxfilesize = 0xffffffffLL;
1232 nmp->nm_maxfilesize = OFF_MAX;
1234 nmp->nm_timeo = NFS_TIMEO;
1235 nmp->nm_retry = NFS_RETRANS;
1236 if ((argp->flags & (NFSMNT_NFSV3 | NFSMNT_NFSV4)) == 0) {
1237 nmp->nm_wsize = NFS_WSIZE;
1238 nmp->nm_rsize = NFS_RSIZE;
1239 nmp->nm_readdirsize = NFS_READDIRSIZE;
1241 nmp->nm_wcommitsize = hibufspace / (desiredvnodes / 1000);
1242 nmp->nm_numgrps = NFS_MAXGRPS;
1243 nmp->nm_readahead = NFS_DEFRAHEAD;
1244 nmp->nm_tprintf_delay = nfs_tprintf_delay;
1245 if (nmp->nm_tprintf_delay < 0)
1246 nmp->nm_tprintf_delay = 0;
1247 nmp->nm_tprintf_initial_delay = nfs_tprintf_initial_delay;
1248 if (nmp->nm_tprintf_initial_delay < 0)
1249 nmp->nm_tprintf_initial_delay = 0;
1250 nmp->nm_fhsize = argp->fhsize;
1251 if (nmp->nm_fhsize > 0)
1252 bcopy((caddr_t)argp->fh, (caddr_t)nmp->nm_fh, argp->fhsize);
1253 bcopy(hst, mp->mnt_stat.f_mntfromname, MNAMELEN);
1255 /* Set up the sockets and per-host congestion */
1256 nmp->nm_sotype = argp->sotype;
1257 nmp->nm_soproto = argp->proto;
1258 nmp->nm_sockreq.nr_prog = NFS_PROG;
1259 if ((argp->flags & NFSMNT_NFSV4))
1260 nmp->nm_sockreq.nr_vers = NFS_VER4;
1261 else if ((argp->flags & NFSMNT_NFSV3))
1262 nmp->nm_sockreq.nr_vers = NFS_VER3;
1264 nmp->nm_sockreq.nr_vers = NFS_VER2;
1267 if ((error = newnfs_connect(nmp, &nmp->nm_sockreq, cred, td, 0)))
1271 * A reference count is needed on the nfsnode representing the
1272 * remote root. If this object is not persistent, then backward
1273 * traversals of the mount point (i.e. "..") will not work if
1274 * the nfsnode gets flushed out of the cache. Ufs does not have
1275 * this problem, because one can identify root inodes by their
1276 * number == ROOTINO (2).
1278 if (nmp->nm_fhsize == 0 && (nmp->nm_flag & NFSMNT_NFSV4) &&
1279 nmp->nm_dirpathlen > 0) {
1281 * If the fhsize on the mount point == 0 for V4, the mount
1282 * path needs to be looked up.
1286 error = nfsrpc_getdirpath(nmp, NFSMNT_DIRPATH(nmp),
1289 (void) nfs_catnap(PZERO, error, "nfsgetdirp");
1290 } while (error && --trycnt > 0);
1292 error = nfscl_maperr(td, error, (uid_t)0, (gid_t)0);
1296 if (nmp->nm_fhsize > 0) {
1298 * Set f_iosize to NFS_DIRBLKSIZ so that bo_bsize gets set
1299 * non-zero for the root vnode. f_iosize will be set correctly
1300 * by nfs_statfs() before any I/O occurs.
1302 mp->mnt_stat.f_iosize = NFS_DIRBLKSIZ;
1303 error = ncl_nget(mp, nmp->nm_fh, nmp->nm_fhsize, &np,
1310 * Get file attributes and transfer parameters for the
1311 * mountpoint. This has the side effect of filling in
1312 * (*vpp)->v_type with the correct value.
1314 ret = nfsrpc_getattrnovp(nmp, nmp->nm_fh, nmp->nm_fhsize, 1,
1315 cred, td, &nfsva, NULL);
1318 * Just set default values to get things going.
1320 NFSBZERO((caddr_t)&nfsva, sizeof (struct nfsvattr));
1321 nfsva.na_vattr.va_type = VDIR;
1322 nfsva.na_vattr.va_mode = 0777;
1323 nfsva.na_vattr.va_nlink = 100;
1324 nfsva.na_vattr.va_uid = (uid_t)0;
1325 nfsva.na_vattr.va_gid = (gid_t)0;
1326 nfsva.na_vattr.va_fileid = 2;
1327 nfsva.na_vattr.va_gen = 1;
1328 nfsva.na_vattr.va_blocksize = NFS_FABLKSIZE;
1329 nfsva.na_vattr.va_size = 512 * 1024;
1331 (void) nfscl_loadattrcache(vpp, &nfsva, NULL, NULL, 0, 1);
1332 if (argp->flags & NFSMNT_NFSV3)
1333 ncl_fsinfo(nmp, *vpp, cred, td);
1335 /* Mark if the mount point supports NFSv4 ACLs. */
1336 if ((argp->flags & NFSMNT_NFSV4) != 0 && nfsrv_useacl != 0 &&
1338 NFSISSET_ATTRBIT(&nfsva.na_suppattr, NFSATTRBIT_ACL)) {
1340 mp->mnt_flag |= MNT_NFS4ACLS;
1345 * Lose the lock but keep the ref.
1347 NFSVOPUNLOCK(*vpp, 0);
1353 newnfs_disconnect(&nmp->nm_sockreq);
1354 crfree(nmp->nm_sockreq.nr_cred);
1355 mtx_destroy(&nmp->nm_sockreq.nr_mtx);
1356 mtx_destroy(&nmp->nm_mtx);
1357 FREE(nmp, M_NEWNFSMNT);
1358 FREE(nam, M_SONAME);
1363 * unmount system call
1366 nfs_unmount(struct mount *mp, int mntflags)
1369 struct nfsmount *nmp;
1370 int error, flags = 0, trycnt = 0;
1374 if (mntflags & MNT_FORCE)
1375 flags |= FORCECLOSE;
1378 * Goes something like this..
1379 * - Call vflush() to clear out vnodes for this filesystem
1380 * - Close the socket
1381 * - Free up the data structures
1383 /* In the forced case, cancel any outstanding requests. */
1384 if (mntflags & MNT_FORCE) {
1385 error = newnfs_nmcancelreqs(nmp);
1388 /* For a forced close, get rid of the renew thread now */
1389 nfscl_umount(nmp, td);
1391 /* We hold 1 extra ref on the root vnode; see comment in mountnfs(). */
1393 error = vflush(mp, 1, flags, td);
1394 if ((mntflags & MNT_FORCE) && error != 0 && ++trycnt < 30)
1395 (void) nfs_catnap(PSOCK, error, "newndm");
1396 } while ((mntflags & MNT_FORCE) && error != 0 && trycnt < 30);
1401 * We are now committed to the unmount.
1403 if ((mntflags & MNT_FORCE) == 0)
1404 nfscl_umount(nmp, td);
1405 newnfs_disconnect(&nmp->nm_sockreq);
1406 crfree(nmp->nm_sockreq.nr_cred);
1407 FREE(nmp->nm_nam, M_SONAME);
1409 mtx_destroy(&nmp->nm_sockreq.nr_mtx);
1410 mtx_destroy(&nmp->nm_mtx);
1411 FREE(nmp, M_NEWNFSMNT);
1417 * Return root of a filesystem
1420 nfs_root(struct mount *mp, int flags, struct vnode **vpp)
1423 struct nfsmount *nmp;
1428 error = ncl_nget(mp, nmp->nm_fh, nmp->nm_fhsize, &np, flags);
1433 * Get transfer parameters and attributes for root vnode once.
1435 mtx_lock(&nmp->nm_mtx);
1436 if (NFSHASNFSV3(nmp) && !NFSHASGOTFSINFO(nmp)) {
1437 mtx_unlock(&nmp->nm_mtx);
1438 ncl_fsinfo(nmp, vp, curthread->td_ucred, curthread);
1440 mtx_unlock(&nmp->nm_mtx);
1441 if (vp->v_type == VNON)
1443 vp->v_vflag |= VV_ROOT;
1449 * Flush out the buffer cache
1453 nfs_sync(struct mount *mp, int waitfor)
1455 struct vnode *vp, *mvp;
1457 int error, allerror = 0;
1463 * If a forced dismount is in progress, return from here so that
1464 * the umount(2) syscall doesn't get stuck in VFS_SYNC() before
1465 * calling VFS_UNMOUNT().
1467 if ((mp->mnt_kern_flag & MNTK_UNMOUNTF) != 0) {
1473 * Force stale buffer cache information to be flushed.
1476 MNT_VNODE_FOREACH(vp, mp, mvp) {
1479 /* XXX Racy bv_cnt check. */
1480 if (NFSVOPISLOCKED(vp) || vp->v_bufobj.bo_dirty.bv_cnt == 0 ||
1481 waitfor == MNT_LAZY) {
1486 if (vget(vp, LK_EXCLUSIVE | LK_INTERLOCK, td)) {
1488 MNT_VNODE_FOREACH_ABORT_ILOCKED(mp, mvp);
1491 error = VOP_FSYNC(vp, waitfor, td);
1494 NFSVOPUNLOCK(vp, 0);
1504 nfs_sysctl(struct mount *mp, fsctlop_t op, struct sysctl_req *req)
1506 struct nfsmount *nmp = VFSTONFS(mp);
1510 bzero(&vq, sizeof(vq));
1513 case VFS_CTL_NOLOCKS:
1514 val = (nmp->nm_flag & NFSMNT_NOLOCKS) ? 1 : 0;
1515 if (req->oldptr != NULL) {
1516 error = SYSCTL_OUT(req, &val, sizeof(val));
1520 if (req->newptr != NULL) {
1521 error = SYSCTL_IN(req, &val, sizeof(val));
1525 nmp->nm_flag |= NFSMNT_NOLOCKS;
1527 nmp->nm_flag &= ~NFSMNT_NOLOCKS;
1532 mtx_lock(&nmp->nm_mtx);
1533 if (nmp->nm_state & NFSSTA_TIMEO)
1534 vq.vq_flags |= VQ_NOTRESP;
1535 mtx_unlock(&nmp->nm_mtx);
1537 if (!(nmp->nm_flag & NFSMNT_NOLOCKS) &&
1538 (nmp->nm_state & NFSSTA_LOCKTIMEO))
1539 vq.vq_flags |= VQ_NOTRESPLOCK;
1541 error = SYSCTL_OUT(req, &vq, sizeof(vq));
1544 if (req->oldptr != NULL) {
1545 error = SYSCTL_OUT(req, &nmp->nm_tprintf_initial_delay,
1546 sizeof(nmp->nm_tprintf_initial_delay));
1550 if (req->newptr != NULL) {
1551 error = vfs_suser(mp, req->td);
1554 error = SYSCTL_IN(req, &nmp->nm_tprintf_initial_delay,
1555 sizeof(nmp->nm_tprintf_initial_delay));
1558 if (nmp->nm_tprintf_initial_delay < 0)
1559 nmp->nm_tprintf_initial_delay = 0;
1569 * Extract the information needed by the nlm from the nfs vnode.
1572 nfs_getnlminfo(struct vnode *vp, uint8_t *fhp, size_t *fhlenp,
1573 struct sockaddr_storage *sp, int *is_v3p, off_t *sizep,
1574 struct timeval *timeop)
1576 struct nfsmount *nmp;
1577 struct nfsnode *np = VTONFS(vp);
1579 nmp = VFSTONFS(vp->v_mount);
1581 *fhlenp = (size_t)np->n_fhp->nfh_len;
1583 bcopy(np->n_fhp->nfh_fh, fhp, np->n_fhp->nfh_len);
1585 bcopy(nmp->nm_nam, sp, min(nmp->nm_nam->sa_len, sizeof(*sp)));
1587 *is_v3p = NFS_ISV3(vp);
1589 *sizep = np->n_size;
1590 if (timeop != NULL) {
1591 timeop->tv_sec = nmp->nm_timeo / NFS_HZ;
1592 timeop->tv_usec = (nmp->nm_timeo % NFS_HZ) * (1000000 / NFS_HZ);